835f3ad66aac1927fa501bad9511e56f62d706c4 hiram Tue Apr 27 14:36:26 2021 -0700 lastz chainNet run per user request refs #27388 diff --git src/hg/makeDb/doc/susScr11/lastzRuns.txt src/hg/makeDb/doc/susScr11/lastzRuns.txt new file mode 100644 index 0000000..8a7c9f4 --- /dev/null +++ src/hg/makeDb/doc/susScr11/lastzRuns.txt @@ -0,0 +1,102 @@ +############################################################################## +# LASTZ pig GCA_002844635.1 (DONE - 2021-04-20 - Hiram) + mkdir /hive/data/genomes/susScr11/bed/lastzGCA_002844635.1.2021-04-20 + cd /hive/data/genomes/susScr11/bed/lastzGCA_002844635.1.2021-04-20 + + printf '# GCA_002844635.1 vs hg38 +BLASTZ=/cluster/bin/penn/lastz-distrib-1.04.03/bin/lastz +BLASTZ_T=2 +BLASTZ_O=400 +BLASTZ_E=30 +BLASTZ_M=254 +# default BLASTZ_Q score matrix: +# A C G T +# A 91 -114 -31 -123 +# C -114 100 -125 -31 +# G -31 -125 100 -114 +# T -123 -31 -114 91 + +# TARGET: Human Hg38 +SEQ1_DIR=/hive/data/genomes/hg38/hg38.2bit +SEQ1_LEN=/hive/data/genomes/hg38/chrom.sizes +SEQ1_CHUNK=20000000 +SEQ1_LAP=10000 + +# QUERY: pig GCA_002844635.1 +SEQ2_DIR=/hive/data/genomes/asmHubs/GCF/002/742/125/GCA_002844635.1/GCA_002844635.1.2bit +SEQ2_LEN=/hive/data/genomes/asmHubs/GCF/002/742/125/GCA_002844635.1/GCA_002844635.1.chrom.sizes.txt +SEQ2_CHUNK=20000000 +SEQ2_LAP=0 +SEQ2_LIMIT=100 + +BASE=/hive/data/genomes/hg38/bed/lastzGCA_002844635.1.2021-04-20 +TMPDIR=/dev/shm +' > DEF + +export targetDb="hg38" +export asmId="GCA_002844635.1" +export gcPath="GCA/002/844/635" +cd /hive/data/genomes/$targetDb/bed/lastz${asmId}.2021-04-20 +time (doBlastzChainNet.pl -trackHub -noDbNameCheck -verbose=2 `pwd`/DEF \ + -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \ + -syntenicNet -chainMinScore=3000 -chainLinearGap=medium) > do.log 2>&1 +cat fb.${targetDb}.chain.${asmId}Link.txt +cat fb.${targetDb}.chainSyn.${asmId}Link.txt + +grep -w real do.log | sed -e 's/^/ # /;' + # real 318m24.582s + +sed -e 's/^/ # /;' fb.$targetDb.chain.${asmId}Link.txt 
+ # 2431952924 bases of 2501912388 (97.204%) in intersection +sed -e 's/^/ # /;' fb.$targetDb.chainSyn.${asmId}Link.txt + # 2409981908 bases of 2501912388 (96.326%) in intersection + +time (doRecipBest.pl -trackHub -load -workhorse=hgwdev -buildDir=`pwd` \ +-query2Bit="/hive/data/genomes/asmHubs/$gcPath/${asmId}/${asmId}.2bit" \ +-querySizes="/hive/data/genomes/asmHubs/$gcPath/${asmId}/${asmId}.chrom.sizes.txt" \ +$targetDb ${asmId}) >> rbest.log 2>&1 +grep -w real rbest.log | sed -e 's/^/ # /;' + # real 93m2.731s + +sed -e 's/^/ # /;' fb.$targetDb.chainRBest.$asmId.txt + # 2381230203 bases of 2501912388 (95.176%) in intersection + +## Overall time for the above: +# real 411m27.346s + +### the swap to the assembly hub +export target="susScr11" +export Target="SusScr11" +export query="GCA_002844635.1" +export asmId="GCA_002844635.1_USMARCv1.0" +export gcPath="GCA/002/844/635" + +mkdir -p /hive/data/genomes/asmHubs/refseqBuild/$gcPath/$asmId/trackData/blastz.$target.swap +cd /hive/data/genomes/asmHubs/refseqBuild/$gcPath/$asmId/trackData/blastz.$target.swap + +time (doBlastzChainNet.pl -trackHub -noDbNameCheck -verbose=2 -swapDir=`pwd` \ + /hive/data/genomes/${target}/bed/lastz.${query}/DEF -syntenicNet \ + -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \ + -swap -chainMinScore=3000 -chainLinearGap=medium) >> swap.log 2>&1 +grep -w real swap.log | sed -e 's/^/ # /;' + # real 90m38.556s + +sed -e 's/^/ # /;' fb.${query}.chain.${Target}Link.txt + # 2543057365 bases of 2755438182 (92.292%) in intersection +sed -e 's/^/ # /;' fb.${query}.chainSyn.${Target}Link.txt + # 2514166037 bases of 2755438182 (91.244%) in intersection + +time (doRecipBest.pl -trackHub -load -workhorse=hgwdev -buildDir=`pwd` \ +-target2Bit="/hive/data/genomes/asmHubs/$gcPath/${query}/${query}.2bit" \ +-targetSizes="/hive/data/genomes/asmHubs/$gcPath/${query}/${query}.chrom.sizes.txt" \ +$query $target) >> rbest.log 2>&1 +grep -w real rbest.log | sed -e 's/^/ # /;' + # real 86m43.960s + 
+sed -e 's/^/ # /;' fb.${query}.chainRBest.${Target}.txt + # 2388751543 bases of 2755438182 (86.692%) in intersection + +# Complete run time for the entire swap operation: + # real 285m1.340s + +##############################################################################