Changeset: df9f9c031311 for MonetDB URL: http://dev.monetdb.org/hg/MonetDB?cmd=changeset;node=df9f9c031311 Modified Files: monetdb5/extras/rdf/rdfschema.c Branch: rdf Log Message:
change delimiter in sample data, split into two files (instances + candidates) diffs (162 lines): diff --git a/monetdb5/extras/rdf/rdfschema.c b/monetdb5/extras/rdf/rdfschema.c --- a/monetdb5/extras/rdf/rdfschema.c +++ b/monetdb5/extras/rdf/rdfschema.c @@ -6196,7 +6196,7 @@ static str printFullSampleData(CSSampleExtend *csSampleEx, int num, BAT *mbat, PropStat *propStat, CSset *freqCSset){ int i,j, k; - FILE *fout, *foutsol, *fouttb, *foutis; + FILE *fout, *foutrand, *foutsol, *fouttb, *foutis; char filename[100], filename4[100], filename2[100], filename3[100]; int ret; @@ -6254,13 +6254,15 @@ str printFullSampleData(CSSampleExtend * fout = fopen(filename,"wt"); foutsol = fopen(filename4,"wt"); + foutrand = fopen("sampleDataFullRandom.txt","wt"); fouttb = fopen(filename2,"wt"); foutis = fopen(filename3,"wt"); for (i = 0; i < num; i++){ sample = csSampleEx[i]; freqCS = freqCSset->items[sample.freqIdx]; - fprintf(fout,"Table %d\n", i); + fprintf(fout,"Table %d, %d tuples\n", i, freqCS.support); + fprintf(foutrand,"Table %d, %d tuples\n", i, freqCS.support); fprintf(foutsol, "Table %d\n", i); for (j = 0; j < (int)sample.candidateCount; j++){ //fprintf(fout," " BUNFMT,sample.candidates[j]); @@ -6272,12 +6274,12 @@ str printFullSampleData(CSSampleExtend * getStringName(sample.candidates[j], &canStr, mapi, mbat, 1); #if USE_SHORT_NAMES getPropNameShort(&canStrShort, canStr); - if (j+1 == (int)sample.candidateCount) fprintf(fout, "%s", canStrShort); - else fprintf(fout, "%s;", canStrShort); + if (j+1 == (int)sample.candidateCount) fprintf(foutrand, "%s", canStrShort); + else fprintf(foutrand, "%s|", canStrShort); GDKfree(canStrShort); #else - if (j+1 == (int)sample.candidateCount) fprintf(fout, "%s", canStr); - else fprintf(fout, "%s;", canStr); + if (j+1 == (int)sample.candidateCount) fprintf(foutrand, "%s", canStr); + else fprintf(foutrand, "%s|", canStr); #endif GDKfree(canStr); @@ -6292,18 +6294,18 @@ str printFullSampleData(CSSampleExtend * #if USE_SHORT_NAMES getPropNameShort(&canStrShort, canStr); if (j+1 == (int)sample.candidateCount) fprintf(foutsol, "%s (%s)", canStrShort, canStr); - else fprintf(foutsol, "%s (%s);", canStrShort, canStr); + else fprintf(foutsol, "%s (%s)|", canStrShort, canStr); GDKfree(canStrShort); #else if (j+1 == (int)sample.candidateCount) fprintf(foutsol, "%s", canStr); - else fprintf(foutsol, "%s;", canStr); + else fprintf(foutsol, "%s|", canStr); #endif GDKfree(canStr); } } - fprintf(fout, "\n"); + fprintf(foutrand, "\n"); fprintf(foutsol, "\n"); // print origin of candidates for solutions file @@ -6335,9 +6337,6 @@ str printFullSampleData(CSSampleExtend * else fprintf(fouttb,"CREATE TABLE tbSample%d \n (\n", i); - //Number of tuples - fprintf(fout, "%d\n", freqCS.support); - // Compute property order (descending by support) and number of properties that are printed found = 0; numPropsInSampleTable = (sample.numProp>(1+NUM_PROP_SUPPORT_SAMPLE+NUM_PROP_TFIDF_SAMPLE))?(1+NUM_PROP_SUPPORT_SAMPLE+NUM_PROP_TFIDF_SAMPLE):sample.numProp; @@ -6426,7 +6425,7 @@ str printFullSampleData(CSSampleExtend * takeOid(sample.lstProp[index], &propStr); #if USE_SHORT_NAMES getPropNameShort(&propStrShort, propStr); - fprintf(fout,";%s", propStrShort); + fprintf(fout,"|%s", propStrShort); pch = strstr (propStrShort,"-"); if (pch != NULL) *pch = '\0'; //Remove - characters from prop //WEBCRAWL specific problem @@ -6507,14 +6506,14 @@ str printFullSampleData(CSSampleExtend * } else{ if (sample.lstIsMVCol[j] == 1){ // - fprintf(fout,";<"BUNFMT">",*objOid); + fprintf(fout,"|<"BUNFMT">",*objOid); } else{ str objStrShort = NULL; takeOid(*objOid, &objStr); getPropNameShort(&objStrShort, objStr); - fprintf(fout,";<%s>", objStrShort); + fprintf(fout,"|<%s>", objStrShort); fprintf(foutis,"|<%s>", objStrShort); GDKfree(objStrShort); GDKfree(objStr); @@ -6526,11 +6525,11 @@ str printFullSampleData(CSSampleExtend * else if (tmpBat->ttype == TYPE_flt){ objFlt = (float *) BUNtail(tmpi, k); if (*objFlt == flt_nil){ - fprintf(fout,";NULL"); + fprintf(fout,"|NULL"); fprintf(foutis,"|NULL"); } else{ - fprintf(fout,";%f", *objFlt); + fprintf(fout,"|%f", *objFlt); fprintf(foutis,"|%f", *objFlt); } @@ -6538,11 +6537,11 @@ str printFullSampleData(CSSampleExtend * else if (tmpBat->ttype == TYPE_int){ objInt = (int *) BUNtail(tmpi, k); if (*objInt == int_nil){ - fprintf(fout,";NULL"); + fprintf(fout,"|NULL"); fprintf(foutis,"|NULL"); } else{ - fprintf(fout,";%d", *objInt); + fprintf(fout,"|%d", *objInt); fprintf(foutis,"|%d", *objInt); } @@ -6551,11 +6550,11 @@ str printFullSampleData(CSSampleExtend * objStr = NULL; objStr = BUNtail(tmpi, k); if (strcmp(objStr, str_nil) == 0){ - fprintf(fout,";NULL"); + fprintf(fout,"|NULL"); fprintf(foutis,"|NULL"); } else{ - fprintf(fout,";%s", objStr); + fprintf(fout,"|%s", objStr); fprintf(foutis,"| %s", objStr); } } @@ -6572,6 +6571,7 @@ str printFullSampleData(CSSampleExtend * fprintf(fout, "\n"); fprintf(foutsol, "\n"); + fprintf(foutrand, "\n"); fprintf(foutis, "\" > tmp.txt \n \n"); if (sample.name != BUN_NONE){ @@ -6608,6 +6608,7 @@ str printFullSampleData(CSSampleExtend * fclose(fout); fclose(foutsol); + fclose(foutrand); fclose(fouttb); fclose(foutis); _______________________________________________ checkin-list mailing list checkin-list@monetdb.org https://www.monetdb.org/mailman/listinfo/checkin-list