71 int regexScan(regex_t *regex,
char *regexStr, FILE *scanFilePtr,
char *fileName)
85 while (fgets(textBuff, 1024, scanFilePtr) != NULL)
88 retCode = regexec(regex, textBuff, 1, rm, 0);
91 sprintf(msgBuff,
"%s: regex found at line %d at position %d. -> %.*s \n",
92 fileName, lineCount, rm[0].rm_so+1, rm[0].rm_eo-rm[0].rm_so, textBuff + rm[0].rm_so);
99 else if (retCode == REG_NOMATCH)
105 regerror(retCode, regex, msgBuff,
sizeof(msgBuff));
106 fprintf(stderr,
"Out of memory? - regex match failure: %s\n", msgBuff);
115 sprintf(msgBuff,
"%s: %s not found\n", fileName, regexStr);
139 sprintf(sqlSelect,
"SELECT pfile_sha1, pfile_md5, pfile_size, ufile_name FROM pfile, uploadtree WHERE pfile_fk = pfile_pk and pfile_pk = '%s'", pfileNum);
140 result = PQexec(
pgConn, sqlSelect);
145 if (PQntuples(result) == 0)
150 fprintf(stderr,
"Database does not contain pfile_pk: %s\n", pfileNum);
153 else if (PQntuples(result) != 1)
158 fprintf(stderr,
"Database contains multiple pfile_pk: %s\n", pfileNum);
163 sprintf(pfileRepoName,
"%s.%s.%s", PQgetvalue(result, 0, 0), PQgetvalue(result, 0, 1), PQgetvalue(result, 0, 2));
165 sprintf(pfileRealName,
"%s", PQgetvalue(result, 0, 3));
184 PGresult *result, *pfileResult;
186 int fileCount, i, retCode;
188 char fileRealName[1000];
189 char fileRepoName[1000];
196 sprintf(sqlSelect,
"SELECT upload_pk, upload_mode, upload_filename from upload where upload_pk = '%s'", uploadNum);
197 result = PQexec(
pgConn, sqlSelect);
202 if (PQntuples(result) == 0)
204 fprintf(stderr,
"No uploads appear to be available here!\n");
211 if ((atoi(PQgetvalue(result, 0, 1)) & 96) != 96)
213 fprintf(stderr,
"Upload %s was not successfully processed after upload!\n", uploadNum);
219 sprintf(sqlSelect,
"SELECT uploadtree.pfile_fk, ufile_name from uploadtree, upload" 220 " where upload_fk = upload_pk and uploadtree.pfile_fk <> 0 and ufile_mode = 32768 and upload_pk = '%s'", uploadNum);
221 result = PQexec(
pgConn, sqlSelect);
225 fileCount = PQntuples(result);
229 retCode = regcomp(®ex, regexStr, REG_ICASE+REG_EXTENDED);
232 fprintf(stderr,
"regex %s failed to compile\n", regexStr);
237 for (i=0; i<fileCount; i++)
240 sprintf(sqlSelect,
"SELECT pfile_sha1, pfile_md5, pfile_size, ufile_name" 241 " FROM pfile, uploadtree WHERE pfile_fk = pfile_pk and pfile_pk = '%s'", PQgetvalue(result, i, 0));
242 pfileResult = PQexec(
pgConn, sqlSelect);
247 if (PQntuples(pfileResult) == 1)
252 if (
pfileNumToNames(PQgetvalue(result, i, 0), fileRepoName, fileRealName) != 0)
254 fprintf(stderr,
"ERROR: Unable to locate pfile_pk '%s'\n", PQgetvalue(result, i, 0));
262 fprintf(stderr,
"ERROR: Unable to open '%s/%s'\n",
"files", fileRepoName);
267 regexScan(®ex, regexStr, scanFilePtr, fileRealName);
271 fprintf(stderr,
"WARNING: File: %s - Located %d instances of pfile_pk %s ! Size = %s bytes!\n",
272 PQgetvalue(result, i, 1), PQntuples(pfileResult), PQgetvalue(result, i, 0), PQgetvalue(pfileResult, i, 2));
286 printf(
"Usage: %s [options] [id [id ...]]\n",Name);
287 printf(
" -i :: initialize the database, then exit.\n");
288 printf(
" -c SYSCONFDIR :: FOSSology configuration directory.\n");
289 printf(
" -h :: show available command line options.\n");
290 printf(
" -v :: increase agent logging verbosity.\n");
291 printf(
" -r :: regex expression to load from command line.\n");
292 printf(
" filename :: filename to process with regex.\n");
296 int main (
int argc,
char *argv[])
304 bool regexSet =
false;
311 int scannedCount = 0;
318 char agent_rev[myBUFSIZ];
328 sprintf(agent_rev,
"%s.%s", VERSION, COMMIT_HASH);
330 fprintf(stdout,
"regexscan reports version info as '%s.%s'.\n", VERSION, COMMIT_HASH);
334 while((c = getopt(argc,argv,
"chir:v")) != -1)
344 sprintf(regexStr,
"%s", optarg);
362 fprintf (stderr,
"No regex value has been requested!\n");
369 nonoptargs = argc - optind;
380 printf(
"UploadPK is: %ld\n", UploadPK);
381 sprintf(uploadNum,
"%ld", UploadPK);
383 if (scannedCount == 0)
385 fprintf(stderr,
"Failed to successfully scan: upload - %s!\n", uploadNum);
392 sprintf(fileName,
"%s", argv[optind]);
394 scanFilePtr = fopen(fileName,
"r");
397 fprintf(stderr,
"ERROR: Unable to open '%s'\n", fileName);
403 retCode = regcomp(®ex, regexStr, REG_ICASE+REG_EXTENDED);
406 fprintf(stderr,
"regex %s failed to compile\n", regexStr);
412 retCode =
regexScan(®ex, (
char *)regexStr, scanFilePtr, (
char *)fileName);
416 fprintf(stderr,
"Failed to successfully scan: %s!\n", fileName);
int fo_checkPQresult(PGconn *pgConn, PGresult *result, char *sql, char *FileID, int LineNumb)
Check the result status of a postgres SELECT.
void Usage(char *Name)
Usage description for this regexscan agent.
Store the results of a regex match.
char * fo_scheduler_current()
Get the last read string from the scheduler.
PGconn * pgConn
Database connection.
void fo_scheduler_disconnect(int retcode)
Disconnect the scheduler connection.
void fo_scheduler_connect(int *argc, char **argv, PGconn **db_conn)
Establish a connection between an agent and the scheduler.
FILE * fo_RepFread(char *Type, char *Filename)
Perform an fopen for reading only.
int agent_verbose
Common verbose flags for the agents, this is used so that the scheduler can change the verbose level ...
int fo_scheduler_userID()
Gets the id of the user that created the job that the agent is running.
The main FOSSology C library.
char * fo_scheduler_next()
Get the next data to process from the scheduler.
int pfileNumToNames(char *pfileNum, char *pfileRepoName, char *pfileRealName)
Creates filenames from pfile_pk value.
int regexScan(regex_t *regex, char *regexStr, FILE *scanFilePtr, char *fileName)
Scan a file for a regex - regular expression. the regex is compiled in this function for performanc...
char * fo_sysconfig(const char *sectionname, const char *variablename)
gets a system configuration variable from the configuration data.
int regexScanUpload(char *uploadNum, char *regexStr)
Scan an Upload for a regex - regular expression. gets a list of files in an upload and calls regexS...