Patch the build of the Single Copy reference DB to produce a single BLAST database covering both the Large and Small Single Copy regions


Former-commit-id: 9bad3443085b2b6b066c7f33f3eaf2e49b5e8992
Former-commit-id: 15ce54a189d9def4b824c149f0ba5ba036794567
This commit is contained in:
2015-10-07 12:29:48 -03:00
parent cbc32a6326
commit b75035064c
10 changed files with 75 additions and 71 deletions
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
+65 -63
View File
@@ -1,63 +1,65 @@
2015-10-07 11:25:33 [OA INFO ] 89006 -- Selecting Viridiplantae genebank entries... 2015-10-07 12:22:15 [OA INFO ] 90184 -- Selecting Viridiplantae genebank entries...
2015-10-07 11:25:42 [OA INFO ] 89006 -- --> 695 entries selected 2015-10-07 12:22:24 [OA INFO ] 90184 -- --> 695 entries selected
2015-10-07 11:25:42 [OA INFO ] 89006 -- Done 2015-10-07 12:22:24 [OA INFO ] 90184 -- Done
2015-10-07 11:25:42 [OA INFO ] 89006 -- Extracting Long Single Copies (LSC)... 2015-10-07 12:22:24 [OA INFO ] 90184 -- Extracting Long Single Copies (LSC)...
2015-10-07 11:26:36 [OA INFO ] 89006 -- --> 64 retreived sequences 2015-10-07 12:23:17 [OA INFO ] 90184 -- --> 64 retreived sequences
2015-10-07 11:26:36 [OA INFO ] 89006 -- Done 2015-10-07 12:23:17 [OA INFO ] 90184 -- Done
2015-10-07 11:26:36 [OA INFO ] 89006 -- Building LSC coorientation graph... 2015-10-07 12:23:17 [OA INFO ] 90184 -- Building LSC coorientation graph...
2015-10-07 11:26:36 [OA INFO ] 89127 -- Build temporary blast DB... 2015-10-07 12:23:17 [OA INFO ] 90306 -- Build temporary blast DB...
2015-10-07 11:26:36 [OA INFO ] 89127 -- Done 2015-10-07 12:23:18 [OA INFO ] 90306 -- Done
2015-10-07 11:26:36 [OA INFO ] 89127 -- Running Blast... 2015-10-07 12:23:18 [OA INFO ] 90306 -- Running Blast...
2015-10-07 11:27:47 [OA INFO ] 89127 -- Done 2015-10-07 12:24:29 [OA INFO ] 90306 -- Done
2015-10-07 11:27:47 [OA INFO ] 89006 -- --> 6 connected componants 2015-10-07 12:24:29 [OA INFO ] 90184 -- --> 6 connected componants
2015-10-07 11:27:47 [OA INFO ] 89006 -- Done 2015-10-07 12:24:29 [OA INFO ] 90184 -- Done
2015-10-07 11:27:47 [OA INFO ] 89006 -- Indexing LCS... 2015-10-07 12:24:29 [OA INFO ] 90184 -- Indexing LCS...
2015-10-07 11:27:47 [OA INFO ] 89006 -- Done 2015-10-07 12:24:30 [OA INFO ] 90184 -- Done
2015-10-07 11:27:47 [OA INFO ] 89006 -- Extracting main connected components for LCS... 2015-10-07 12:24:30 [OA INFO ] 90184 -- Extracting main connected components for LCS...
2015-10-07 11:27:48 [OA INFO ] 89006 -- --> 40 sequences 2015-10-07 12:24:30 [OA INFO ] 90184 -- --> 40 sequences
2015-10-07 11:27:48 [OA INFO ] 89006 -- Done 2015-10-07 12:24:30 [OA INFO ] 90184 -- Done
2015-10-07 11:27:48 [OA INFO ] 89006 -- Extracting second connected components for LCS... 2015-10-07 12:24:30 [OA INFO ] 90184 -- Extracting second connected components for LCS...
2015-10-07 11:27:48 [OA INFO ] 89006 -- --> 5 sequences 2015-10-07 12:24:30 [OA INFO ] 90184 -- --> 5 sequences
2015-10-07 11:27:48 [OA INFO ] 89006 -- Done 2015-10-07 12:24:30 [OA INFO ] 90184 -- Done
2015-10-07 11:27:48 [OA INFO ] 89006 -- merging both connected components for LCS... 2015-10-07 12:24:30 [OA INFO ] 90184 -- merging both connected components for LCS...
2015-10-07 11:27:48 [OA INFO ] 89006 -- --> 45 sequences in total 2015-10-07 12:24:30 [OA INFO ] 90184 -- --> 45 sequences in total
2015-10-07 11:27:48 [OA INFO ] 89006 -- Done 2015-10-07 12:24:30 [OA INFO ] 90184 -- Done
2015-10-07 11:27:48 [OA INFO ] 89006 -- Checking LCS homogeneity... 2015-10-07 12:24:30 [OA INFO ] 90184 -- Checking LCS homogeneity...
2015-10-07 11:27:48 [OA INFO ] 89258 -- Build temporary blast DB... 2015-10-07 12:24:30 [OA INFO ] 90439 -- Build temporary blast DB...
2015-10-07 11:27:48 [OA INFO ] 89258 -- Done 2015-10-07 12:24:30 [OA INFO ] 90439 -- Done
2015-10-07 11:27:48 [OA INFO ] 89258 -- Running Blast... 2015-10-07 12:24:30 [OA INFO ] 90439 -- Running Blast...
2015-10-07 11:28:50 [OA INFO ] 89258 -- Done 2015-10-07 12:25:35 [OA INFO ] 90439 -- Done
2015-10-07 11:28:50 [OA INFO ] 89006 -- --> 1 connected componants 2015-10-07 12:25:35 [OA INFO ] 90184 -- --> 1 connected componants
2015-10-07 11:28:50 [OA INFO ] 89006 -- Done 2015-10-07 12:25:35 [OA INFO ] 90184 -- Done
2015-10-07 11:28:50 [OA INFO ] 89006 -- Installing LCS reference databases... 2015-10-07 12:25:35 [OA INFO ] 90184 -- Installing LCS reference databases...
2015-10-07 11:28:50 [OA INFO ] 89006 -- Done 2015-10-07 12:25:35 [OA INFO ] 90184 -- Done
2015-10-07 11:28:50 [OA INFO ] 89006 -- Extracting Short Single Copies (SSC)... 2015-10-07 12:25:35 [OA INFO ] 90184 -- Extracting Short Single Copies (SSC)...
2015-10-07 11:29:42 [OA INFO ] 89006 -- --> 76 retreived sequences 2015-10-07 12:26:28 [OA INFO ] 90184 -- --> 76 retreived sequences
2015-10-07 11:29:42 [OA INFO ] 89006 -- Done 2015-10-07 12:26:28 [OA INFO ] 90184 -- Done
2015-10-07 11:29:42 [OA INFO ] 89006 -- Building SSC coorientation graph... 2015-10-07 12:26:28 [OA INFO ] 90184 -- Building SSC coorientation graph...
2015-10-07 11:29:42 [OA INFO ] 89336 -- Build temporary blast DB... 2015-10-07 12:26:28 [OA INFO ] 90517 -- Build temporary blast DB...
2015-10-07 11:29:42 [OA INFO ] 89336 -- Done 2015-10-07 12:26:28 [OA INFO ] 90517 -- Done
2015-10-07 11:29:42 [OA INFO ] 89336 -- Running Blast... 2015-10-07 12:26:28 [OA INFO ] 90517 -- Running Blast...
2015-10-07 11:30:03 [OA INFO ] 89336 -- Done 2015-10-07 12:26:49 [OA INFO ] 90517 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- --> 1 connected componants 2015-10-07 12:26:49 [OA INFO ] 90184 -- --> 1 connected componants
2015-10-07 11:30:03 [OA INFO ] 89006 -- Done 2015-10-07 12:26:49 [OA INFO ] 90184 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- Indexing SSC... 2015-10-07 12:26:49 [OA INFO ] 90184 -- Indexing SSC...
2015-10-07 11:30:03 [OA INFO ] 89006 -- Done 2015-10-07 12:26:49 [OA INFO ] 90184 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- Extracting main connected components for SSC... 2015-10-07 12:26:49 [OA INFO ] 90184 -- Extracting main connected components for SSC...
2015-10-07 11:30:03 [OA INFO ] 89006 -- --> 72 sequences 2015-10-07 12:26:49 [OA INFO ] 90184 -- --> 72 sequences
2015-10-07 11:30:03 [OA INFO ] 89006 -- Done 2015-10-07 12:26:49 [OA INFO ] 90184 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- Extracting second connected components for SSC... 2015-10-07 12:26:49 [OA INFO ] 90184 -- Extracting second connected components for SSC...
2015-10-07 11:30:03 [OA INFO ] 89006 -- --> 0 sequences 2015-10-07 12:26:49 [OA INFO ] 90184 -- --> 0 sequences
2015-10-07 11:30:03 [OA INFO ] 89006 -- Done 2015-10-07 12:26:49 [OA INFO ] 90184 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- merging both connected components for SSC... 2015-10-07 12:26:49 [OA INFO ] 90184 -- merging both connected components for SSC...
2015-10-07 11:30:03 [OA INFO ] 89006 -- --> 72 sequences in total 2015-10-07 12:26:49 [OA INFO ] 90184 -- --> 72 sequences in total
2015-10-07 11:30:03 [OA INFO ] 89006 -- Done 2015-10-07 12:26:49 [OA INFO ] 90184 -- Done
2015-10-07 11:30:03 [OA INFO ] 89006 -- Checking SSC homogeneity... 2015-10-07 12:26:49 [OA INFO ] 90184 -- Checking SSC homogeneity...
2015-10-07 11:30:03 [OA INFO ] 89497 -- Build temporary blast DB... 2015-10-07 12:26:49 [OA INFO ] 90675 -- Build temporary blast DB...
2015-10-07 11:30:03 [OA INFO ] 89497 -- Done 2015-10-07 12:26:49 [OA INFO ] 90675 -- Done
2015-10-07 11:30:03 [OA INFO ] 89497 -- Running Blast... 2015-10-07 12:26:49 [OA INFO ] 90675 -- Running Blast...
2015-10-07 11:30:23 [OA INFO ] 89497 -- Done 2015-10-07 12:27:10 [OA INFO ] 90675 -- Done
2015-10-07 11:30:23 [OA INFO ] 89006 -- --> 1 connected componants 2015-10-07 12:27:10 [OA INFO ] 90184 -- --> 1 connected componants
2015-10-07 11:30:23 [OA INFO ] 89006 -- Done 2015-10-07 12:27:10 [OA INFO ] 90184 -- Done
2015-10-07 11:30:23 [OA INFO ] 89006 -- Installing SSC reference databases... 2015-10-07 12:27:10 [OA INFO ] 90184 -- Installing SSC reference databases...
2015-10-07 11:30:23 [OA INFO ] 89006 -- Done 2015-10-07 12:27:10 [OA INFO ] 90184 -- Done
2015-10-07 12:27:10 [OA INFO ] 90184 -- Installing blast version of the SC_RefDB reference databases...
2015-10-07 12:27:10 [OA INFO ] 90184 -- Done
+10 -8
View File
@@ -89,9 +89,6 @@ pushTmpDir ORG.buildSCDB
cp LSC.direct.fasta "${IR_DATA_DIR}/LSC_RefDB.fasta" cp LSC.direct.fasta "${IR_DATA_DIR}/LSC_RefDB.fasta"
cp LSC_RefDB.tgf "${IR_DATA_DIR}/LSC_RefDB.tgf" cp LSC_RefDB.tgf "${IR_DATA_DIR}/LSC_RefDB.tgf"
makeblastdb -in "${IR_DATA_DIR}/LSC_RefDB.fasta" \
-dbtype nucl \
-out "${IR_DATA_DIR}/LSC_RefDB" >& /dev/null
loginfo "Done" loginfo "Done"
# #
@@ -163,12 +160,17 @@ pushTmpDir ORG.buildSCDB
loginfo "Installing SSC reference databases..." loginfo "Installing SSC reference databases..."
cp SSC.direct.fasta "${IR_DATA_DIR}/SSC_RefDB.fasta" cp SSC.direct.fasta "${IR_DATA_DIR}/SSC_RefDB.fasta"
cp SSC_RefDB.tgf "${IR_DATA_DIR}/SSC_RefDB.tgf" cp SSC_RefDB.tgf "${IR_DATA_DIR}/SSC_RefDB.tgf"
makeblastdb -in "${IR_DATA_DIR}/SSC_RefDB.fasta" \
-dbtype nucl \
-out "${IR_DATA_DIR}/SSC_RefDB" >& /dev/null
loginfo "Done" loginfo "Done"
loginfo "Installing blast version of the SC_RefDB reference databases..."
cat "${IR_DATA_DIR}/LSC_RefDB.fasta" \
"${IR_DATA_DIR}/SSC_RefDB.fasta" > SC_RefDB.fasta
makeblastdb -in SC_RefDB.fasta \
-dbtype nucl \
-out "${IR_DATA_DIR}/SC_RefDB" >& /dev/null
loginfo "Done"
popTmpDir popTmpDir