6997c15d6e5bba74c31803ae79cd1be779688f7a
gperez2
  Sun Aug 13 14:28:50 2023 -0700
crab-eating macaque (GCA_011100615.1) vs. macFas5, lastz/chain/net run for user, refs #31769

diff --git src/hg/makeDb/doc/macFas5/lastzRuns.txt src/hg/makeDb/doc/macFas5/lastzRuns.txt
index 64dcc24..ec63cb0 100644
--- src/hg/makeDb/doc/macFas5/lastzRuns.txt
+++ src/hg/makeDb/doc/macFas5/lastzRuns.txt
@@ -1,252 +1,347 @@
 # for emacs: -*- mode: sh; -*-
 
 #########################################################################
 # LASTZ Crab-eating macaque/macFas5 Green monkey/chlSab1 -
 #              (DONE - 2014-05-15 - Hiram)
     mkdir /hive/data/genomes/macFas5/bed/lastzChlSab1.2014-05-15
     cd /hive/data/genomes/macFas5/bed/lastzChlSab1.2014-05-15
 
     cat << '_EOF_' > DEF
 # Crab-eating macaque vs. Green monkey
 # parameters used are from the human-chimp tuning from long ago
 
 BLASTZ=/cluster/bin/penn/lastz-distrib-1.03.52/bin/lastz
 BLASTZ_M=245
 BLASTZ_O=600
 BLASTZ_E=150
 
 BLASTZ_T=2
 BLASTZ_Y=15000
 BLASTZ_K=4500
 BLASTZ_Q=/scratch/data/blastz/human_chimp.v2.q
 #     A    C    G    T
 #     90 -330 -236 -356
 #   -330  100 -318 -236
 #   -236 -318  100 -330
 #   -356 -236 -330   90
 
 # TARGET: Crab-eating macaque
 SEQ1_DIR=/hive/data/genomes/macFas5/macFas5.2bit
 SEQ1_LEN=/hive/data/genomes/macFas5/chrom.sizes
 SEQ1_CHUNK=20000000
 SEQ1_LAP=10000
 SEQ1_LIMIT=50
 
 # QUERY: Green monkey chlSab1
 SEQ2_DIR=/hive/data/genomes/chlSab1/chlSab1.2bit
 SEQ2_LEN=/hive/data/genomes/chlSab1/chrom.sizes
 SEQ2_CHUNK=10000000
 SEQ2_LAP=0
 SEQ2_LIMIT=200
 
 BASE=/hive/data/genomes/macFas5/bed/lastzChlSab1.2014-05-15
 TMPDIR=/dev/shm
 '_EOF_'
     # << happy emacs
 
     time (doBlastzChainNet.pl -verbose=2 `pwd`/DEF \
      -chainMinScore=5000 -chainLinearGap=medium \
         -workhorse=hgwdev -smallClusterHub=ku -bigClusterHub=ku \
              -syntenicNet) > do.log 2>&1
     # real    595m54.836s
 
     cat fb.macFas5.chainChlSab1Link.txt 
     # 2602112483 bases of 2803866698 (92.804%) in intersection
 
     time (doRecipBest.pl -buildDir=`pwd` macFas5 chlSab1) > rbest.log 2>&1 &
     # real    73m55.625s
 
     # and for the swap:
     mkdir /hive/data/genomes/chlSab1/bed/blastz.macFas5.swap
     cd /hive/data/genomes/chlSab1/bed/blastz.macFas5.swap
 
     time (doBlastzChainNet.pl -verbose=2 \
       /hive/data/genomes/macFas5/bed/lastzChlSab1.2014-05-15/DEF \
      -chainMinScore=5000 -chainLinearGap=medium \
         -workhorse=hgwdev -smallClusterHub=ku -bigClusterHub=ku \
              -swap -syntenicNet) > do.log 2>&1
     # was running - Wed Jan 21 09:38:12 PST 2015 (since completed; see timing below)
     #  real    117m56.319s
 
     cat fb.chlSab1.chainMacFas5Link.txt 
     # 2665801248 bases of 2725905606 (97.795%) in intersection
 
     time (doRecipBest.pl -buildDir=`pwd` chlSab1 macFas5) > rbest.log 2>&1
     # real    79m30.931s
 
 #########################################################################
 # LASTZ Crab-eating macaque/macFas5 Baboon/papHam1 -
 #              (DONE - 2014-05-15 - Hiram)
     mkdir /hive/data/genomes/macFas5/bed/lastzPapHam1.2014-05-15
     cd /hive/data/genomes/macFas5/bed/lastzPapHam1.2014-05-15
 
     cat << '_EOF_' > DEF
 # Crab-eating macaque vs. Baboon
 # parameters used are from the human-chimp tuning from long ago
 
 BLASTZ=/cluster/bin/penn/lastz-distrib-1.03.52/bin/lastz
 BLASTZ_M=245
 BLASTZ_O=600
 BLASTZ_E=150
 
 BLASTZ_T=2
 BLASTZ_Y=15000
 BLASTZ_K=4500
 BLASTZ_Q=/scratch/data/blastz/human_chimp.v2.q
 #     A    C    G    T
 #     90 -330 -236 -356
 #   -330  100 -318 -236
 #   -236 -318  100 -330
 #   -356 -236 -330   90
 
 # TARGET: Crab-eating macaque
 SEQ1_DIR=/hive/data/genomes/macFas5/macFas5.2bit
 SEQ1_LEN=/hive/data/genomes/macFas5/chrom.sizes
 SEQ1_CHUNK=20000000
 SEQ1_LAP=10000
 SEQ1_LIMIT=50
 
 # QUERY: Baboon papHam1
 SEQ2_DIR=/hive/data/genomes/papHam1/papHam1.2bit
 SEQ2_LEN=/hive/data/genomes/papHam1/chrom.sizes
 SEQ2_CHUNK=10000000
 SEQ2_LAP=0
 SEQ2_LIMIT=1500
 
 BASE=/hive/data/genomes/macFas5/bed/lastzPapHam1.2014-05-15
 TMPDIR=/dev/shm
 '_EOF_'
     # << happy emacs
 
     time (doBlastzChainNet.pl -verbose=2 `pwd`/DEF \
      -chainMinScore=5000 -chainLinearGap=medium \
         -workhorse=hgwdev -smallClusterHub=ku -bigClusterHub=ku \
              -syntenicNet) > do.log 2>&1
     # real    525m11.457s
     # real    73m16.304s
 
     cat fb.macFas5.chainPapHam1Link.txt 
     # 2486618688 bases of 2803866698 (88.685%) in intersection
 
     time (doRecipBest.pl -buildDir=`pwd` macFas5 papHam1) > rbest.log 2>&1 &
     # real    109m2.057s
 
     # and for the swap:   (DONE - 2015-01-26 - Hiram)
     mkdir /hive/data/genomes/papHam1/bed/blastz.macFas5.swap
     cd /hive/data/genomes/papHam1/bed/blastz.macFas5.swap
 
     time (doBlastzChainNet.pl -verbose=2 \
       /hive/data/genomes/macFas5/bed/lastzPapHam1.2014-05-15/DEF \
      -chainMinScore=5000 -chainLinearGap=medium \
         -workhorse=hgwdev -smallClusterHub=ku -bigClusterHub=ku \
              -swap -syntenicNet) > do.log 2>&1
     #  real    619m9.663s
 
     cat fb.papHam1.chainMacFas5Link.txt 
     # 2522131870 bases of 2741849051 (91.987%) in intersection
 
     time (doRecipBest.pl -buildDir=`pwd` papHam1 macFas5) > rbest.log 2>&1
     # real    244m37.728s
 
 ##############################################################################
 # LASTZ Crab-eating macaque MacFas5 vs. Rhesus RheMac2
 #	(DONE - 2021-10-12 - hiram)
 
     cd /cluster/home/hiram/kent/src/hg/makeDb/doc/macFas5
 
     time (~/kent/src/hg/utils/automation/pairLastz.sh macFas5 rheMac2 \
       primate primate) > macFas5.rheMac2.log 2>&1 &
     #	real	366m28.349s
     #	user	0m1.422s
     #	sys	0m1.082s
 
     # the following make doc is in that log file, copied here:
 
     mkdir /hive/data/genomes/macFas5/bed/lastzRheMac2.2021-10-12
     cd /hive/data/genomes/macFas5/bed/lastzRheMac2.2021-10-12
 
     printf '# Rhesus RheMac2 vs. Crab-eating macaque MacFas5
 BLASTZ=/cluster/bin/penn/lastz-distrib-1.04.03/bin/lastz
 BLASTZ_T=2
 BLASTZ_O=600
 BLASTZ_E=150
 BLASTZ_M=254
 BLASTZ_K=4500
 BLASTZ_Y=15000
 BLASTZ_Q=/hive/data/staging/data/blastz/human_chimp.v2.q
 #       A     C     G     T
 # A    90  -330  -236  -356
 # C  -330   100  -318  -236
 # G  -236  -318   100  -330
 # T  -356  -236  -330    90
 
 # TARGET: Crab-eating macaque MacFas5
 SEQ1_DIR=/hive/data/genomes/macFas5/macFas5.2bit
 SEQ1_LEN=/hive/data/genomes/macFas5/chrom.sizes
 SEQ1_CHUNK=20000000
 SEQ1_LAP=10000
 SEQ1_LIMIT=40
 
 # QUERY: Rhesus RheMac2
 SEQ2_DIR=/hive/data/genomes/rheMac2/rheMac2.2bit
 SEQ2_LEN=/hive/data/genomes/rheMac2/chrom.sizes
 SEQ2_CHUNK=20000000
 SEQ2_LAP=0
 SEQ2_LIMIT=100
 
 BASE=/hive/data/genomes/macFas5/bed/lastzRheMac2.2021-10-12
 TMPDIR=/dev/shm
 
 ' > DEF
 
     time (~/kent/src/hg/utils/automation/doBlastzChainNet.pl  -verbose=2 `pwd`/DEF -syntenicNet \
         -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \
         -chainMinScore=5000 -chainLinearGap=medium) > do.log 2>&1
     grep -w real do.log | sed -e 's/^/    # /;'
     # real	158m45.932s
 
     sed -e 's/^/    # /;' fb.macFas5.chainRheMac2Link.txt
     # 2614119665 bases of 2803866698 (93.233%) in intersection
     sed -e 's/^/    # /;' fb.macFas5.chainSynRheMac2Link.txt
     # 2604737022 bases of 2803866698 (92.898%) in intersection
 
     time (~/kent/src/hg/utils/automation/doRecipBest.pl  -load -workhorse=hgwdev -buildDir=`pwd` \
        \
        \
         macFas5 rheMac2) > rbest.log 2>&1
 
     grep -w real rbest.log | sed -e 's/^/    # /;'
     # real	77m6.953s
 
     sed -e 's/^/    # /;' fb.macFas5.chainRBest.RheMac2.txt
     # 2596696673 bases of 2803866698 (92.611%) in intersection
 
     ### and for the swap
 
     cd /hive/data/genomes/rheMac2/bed/blastz.macFas5.swap
 
    time (~/kent/src/hg/utils/automation/doBlastzChainNet.pl  -swap -verbose=2 \
     /hive/data/genomes/macFas5/bed/lastzRheMac2.2021-10-12/DEF -swapDir=`pwd` \
   -syntenicNet -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \
     -chainMinScore=5000 -chainLinearGap=medium) > swap.log 2>&1
 
     grep -w real swap.log | sed -e 's/^/    # /;'
     # real	76m2.171s
 
     sed -e 's/^/    # /;' fb.rheMac2.chainMacFas5Link.txt
     # 2600572513 bases of 2646704109 (98.257%) in intersection
     sed -e 's/^/    # /;' fb.rheMac2.chainSynMacFas5Link.txt
     # 2595637716 bases of 2646704109 (98.071%) in intersection
     time (~/kent/src/hg/utils/automation/doRecipBest.pl  -load -workhorse=hgwdev -buildDir=`pwd` \
     \
     \
    rheMac2 macFas5) > rbest.log 2>&1
 
     grep -w real rbest.log | sed -e 's/^/    # /;'
     # real	54m32.803s
 
     sed -e 's/^/    # /;' fb.rheMac2.chainRBest.MacFas5.txt
     # 2596730835 bases of 2646704109 (98.112%) in intersection
 
 
 ##############################################################################
+# LASTZ crab-eating macaque GCA_011100615.1 vs. Crab-eating macaque MacFas5
+#    (DONE - 2023-07-19 - Gerardo)
+
+    mkdir /hive/data/genomes/asmHubs/allBuild/GCA/011/100/615/GCA_011100615.1_Macaca_fascicularis_6.0/trackData/lastzMacFas5.2023-07-19
+    cd /hive/data/genomes/asmHubs/allBuild/GCA/011/100/615/GCA_011100615.1_Macaca_fascicularis_6.0/trackData/lastzMacFas5.2023-07-19
+
+    printf '# Crab-eating macaque MacFas5 vs. crab-eating macaque GCA_011100615.1
+BLASTZ=/cluster/bin/penn/lastz-distrib-1.04.03/bin/lastz
+BLASTZ_T=2
+BLASTZ_O=600
+BLASTZ_E=150
+BLASTZ_M=254
+BLASTZ_K=4500
+BLASTZ_Y=15000
+BLASTZ_Q=/hive/data/staging/data/blastz/human_chimp.v2.q
+#       A     C     G     T
+# A    90  -330  -236  -356
+# C  -330   100  -318  -236
+# G  -236  -318   100  -330
+# T  -356  -236  -330    90
+
+# TARGET: crab-eating macaque 2020-03-10 GCA_011100615.1_Macaca_fascicularis_6.0
+SEQ1_DIR=/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.2bit
+SEQ1_LEN=/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.chrom.sizes.txt
+SEQ1_CHUNK=20000000
+SEQ1_LAP=10000
+SEQ1_LIMIT=40
+
+# QUERY: Crab-eating macaque  macFas5
+SEQ2_DIR=/hive/data/genomes/macFas5/macFas5.2bit
+SEQ2_LEN=/hive/data/genomes/macFas5/chrom.sizes
+SEQ2_CHUNK=20000000
+SEQ2_LAP=0
+SEQ2_LIMIT=100
+
+BASE=/hive/data/genomes/asmHubs/allBuild/GCA/011/100/615/GCA_011100615.1_Macaca_fascicularis_6.0/trackData/lastzMacFas5.2023-07-19
+TMPDIR=/dev/shm
+
+' > DEF
+
+    time (~/kent/src/hg/utils/automation/doBlastzChainNet.pl -trackHub -noDbNameCheck -verbose=2 `pwd`/DEF -syntenicNet \
+      -tAsmId GCA_011100615.1_Macaca_fascicularis_6.0  -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \
+        -chainMinScore=5000 -chainLinearGap=medium) > do.log 2>&1
+    grep -w real do.log | sed -e 's/^/    # /;'
+    # real	115m11.046s
+
+    sed -e 's/^/    # /;' fb.GCA_011100615.1.chainMacFas5Link.txt
+    # 2761984914 bases of 2906138557 (95.040%) in intersection
+    sed -e 's/^/    # /;' fb.GCA_011100615.1.chainSynMacFas5Link.txt
+    # 2731406308 bases of 2906138557 (93.987%) in intersection
+
+    time (~/kent/src/hg/utils/automation/doRecipBest.pl -trackHub -load -workhorse=hgwdev -buildDir=`pwd` \
+      -target2Bit="/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.2bit" \
+-targetSizes="/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.chrom.sizes.txt" \
+       \
+        GCA_011100615.1 macFas5) > rbest.log 2>&1
+
+    grep -w real rbest.log | sed -e 's/^/    # /;'
+    # real	75m47.657s
+
+    sed -e 's/^/    # /;' fb.GCA_011100615.1.chainRBest.MacFas5.txt
+    # 2678569575 bases of 2906138557 (92.169%) in intersection
+
+    ### and for the swap
+
+    cd /hive/data/genomes/macFas5/bed/blastz.GCA_011100615.1.swap
+
+   time (~/kent/src/hg/utils/automation/doBlastzChainNet.pl -trackHub -noDbNameCheck -swap -verbose=2 \
+  -tAsmId GCA_011100615.1_Macaca_fascicularis_6.0  /hive/data/genomes/asmHubs/allBuild/GCA/011/100/615/GCA_011100615.1_Macaca_fascicularis_6.0/trackData/lastzMacFas5.2023-07-19/DEF -swapDir=`pwd` \
+  -syntenicNet -workhorse=hgwdev -smallClusterHub=hgwdev -bigClusterHub=ku \
+    -chainMinScore=5000 -chainLinearGap=medium) > swap.log 2>&1
+
+    grep -w real swap.log | sed -e 's/^/    # /;'
+    # real	90m44.045s
+
+    sed -e 's/^/    # /;' fb.macFas5.chainGCA_011100615.1Link.txt
+    # 2690649811 bases of 2946843737 (91.306%) in intersection
+    sed -e 's/^/    # /;' fb.macFas5.chainSynGCA_011100615.1Link.txt
+    # 2679307687 bases of 2946843737 (90.921%) in intersection
+    time (~/kent/src/hg/utils/automation/doRecipBest.pl -trackHub -load -workhorse=hgwdev -buildDir=`pwd` \
+   -query2bit="/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.2bit" \
+-querySizes="/hive/data/genomes/asmHubs/GCA/011/100/615/GCA_011100615.1/GCA_011100615.1.chrom.sizes.txt" \
+    \
+   macFas5 GCA_011100615.1) > rbest.log 2>&1
+
+    grep -w real rbest.log | sed -e 's/^/    # /;'
+    # real	72m23.439s
+
+    sed -e 's/^/    # /;' fb.macFas5.chainRBest.GCA_011100615.1.txt
+    # 2680072146 bases of 2946843737 (90.947%) in intersection
+
+    #	real	354m14.218s
+    #	user	0m3.158s
+    #	sys	0m3.325s
+##############################################################################