You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
fprintf(stderr, "Warning: there are %d poor quality (length < 10000) genome assemblies in the total %d genome assemblied.\n", badNumber, totalNumber);
316
+
fprintf(stderr, "Warning: there are %d poor quality (length < %ld) genome assemblies in the total %d genome assemblied.\n", badNumber, minLen, totalNumber);
317
317
}
318
318
cerr << "\t===the totalSize is: " << totalSize << endl;
319
319
cerr << "\t===the maxSize is: " << maxSize << endl;
@@ -520,7 +520,7 @@ bool sketchSequences(string inputFile, int kmerSize, int sketchSize, string sket
520
520
return true;
521
521
}
522
522
523
-
bool sketchFiles(string inputFile, int kmerSize, int sketchSize, string sketchFunc, bool isContainment, int containCompress, vector<SketchInfo>& sketches, int threads){
523
+
bool sketchFiles(string inputFile, uint64_t minLen, int kmerSize, int sketchSize, string sketchFunc, bool isContainment, int containCompress, vector<SketchInfo>& sketches, int threads){
524
524
fprintf(stderr, "input fileList, sketch by file\n");
525
525
fstream fs(inputFile);
526
526
if(!fs){
@@ -691,7 +691,7 @@ bool sketchFiles(string inputFile, int kmerSize, int sketchSize, string sketchFu
691
691
tmpSketchInfo.fileName = fileList[i];
692
692
tmpSketchInfo.totalSeqLength = totalLength;
693
693
tmpSketchInfo.fileSeqs = curFileSeqs;
694
-
if(totalLength >= 10000)//filter the poor quality genome assemblies whose length less than 10k bp(fastANI paper)
694
+
if(totalLength >= minLen)//filter the poor quality genome assemblies whose length less than minLen(fastANI paper)
bool sketchSequences(string inputFile, int kmerSize, int sketchSize, string sketchFunc, bool isContainment, int containCompress, vector<SketchInfo>& sketches, int threads);
41
-
bool sketchFiles(string inputFile, int kmerSize, int sketchSize, string sketchFunc, bool isContainment, int containCompress, vector<SketchInfo>& sketches, int threads);
41
+
bool sketchFiles(string inputFile, uint64_t minLen, int kmerSize, int sketchSize, string sketchFunc, bool isContainment, int containCompress, vector<SketchInfo>& sketches, int threads);
fprintf(stdout, " -m <int>\t: set the filter minimum genome length (minLen), genome with total length less the minLen will be ignore, for both clust-mst and clust-greedy\n");
50
51
fprintf(stdout, " -k <int>\t: set kmer size, automatically calculate the kmer size without -k option, for both clust-mst and clust-greedy\n");
51
52
fprintf(stdout, " -s <int>\t: set sketch size, default 1000, for both clust-mst and clust-greedy\n");
52
53
fprintf(stdout, " -c <int>\t: set sampling ratio to compute viriable sketchSize, sketchSize = genomeSize/samplingRatio, only support with MinHash sketch function of clust-greedy\n");
0 commit comments