src/hg/makeDb/doc/bosTau4.txt 1.23
1.23 2010/04/01 17:33:10 hiram
never got susScr1 to work; finished with susScr2 lastz instead
Index: src/hg/makeDb/doc/bosTau4.txt
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/makeDb/doc/bosTau4.txt,v
retrieving revision 1.22
retrieving revision 1.23
diff -b -B -U 4 -r1.22 -r1.23
--- src/hg/makeDb/doc/bosTau4.txt 25 Jan 2010 19:16:14 -0000 1.22
+++ src/hg/makeDb/doc/bosTau4.txt 1 Apr 2010 17:33:10 -0000 1.23
@@ -1828,12 +1828,12 @@
md5sum bosTau4ToBosTauMd3.over.chain.gz >> md5sum.txt
popd
#########################################################################
-# susScr1 Pig BLASTZ/CHAIN/NET (WORKING - 2010-01-21 - Hiram)
+# susScr1 Pig BLASTZ/CHAIN/NET (DONE - 2010-01-25 - Hiram)
screen # use a screen to manage this multi-day job
- mkdir /hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-21
- cd /hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-21
+ mkdir /hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-25
+ cd /hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-25
cat << '_EOF_' > DEF
# Pig vs. Cow
BLASTZ_M=50
@@ -1850,21 +1850,26 @@
SEQ2_LEN=/scratch/data/susScr1/chrom.sizes
SEQ2_CHUNK=10000000
SEQ2_LAP=0
-BASE=/hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-21
+BASE=/hive/data/genomes/bosTau4/bed/lastzSusScr1.2010-01-25
TMPDIR=/scratch/tmp
'_EOF_'
# << this line keeps emacs coloring happy
time nice -n +19 doBlastzChainNet.pl -verbose=2 \
`pwd`/DEF \
-noLoadChainSplit -syntenicNet \
- -workhorse=hgwdev -smallClusterHub=memk -bigClusterHub=pk \
+ -workhorse=hgwdev -smallClusterHub=memk -bigClusterHub=swarm \
-chainMinScore=3000 -chainLinearGap=medium > do.log 2>&1 &
+ # real 2377m21.473s
+ # never did get this to work. With susScr2 as target and bosTau4 as query
+ # the run did finish, but with immense chain pileups
+ # failed second time too
+ # XXX - re-running as 01-25 (was 01-21) Mon Jan 25 11:29:32 PST 2010
# real 3811m31.428s
# failed
-XXX - running Thu Jan 21 14:49:43 PST 2010
+ # XXX - running Thu Jan 21 14:49:43 PST 2010
time nice -n +19 $HOME/kent/src/hg/utils/automation/doBlastzChainNet.pl \
`pwd`/DEF -verbose=2 \
-bigClusterHub=memk -chainMinScore=3000 -chainLinearGap=medium \
@@ -1888,4 +1893,52 @@
cat fb.bosTau4.chainRn4Link.txt
# 664253901 bases of 2731830700 (24.315%) in intersection
#########################################################################
+# lastz swap Pig SusScr2 (DONE - 2010-03-31 - Hiram)
+ # the primary lastz run on susScr2
+ cd /hive/data/genomes/susScr2/bed/lastzBosTau4.2010-03-27
+ cat fb.susScr2.chainBosTau4Link.txt
+ # 1478903080 bases of 2231298548 (66.280%) in intersection
+
+ # and the swap
+ mkdir /hive/data/genomes/bosTau4/bed/blastz.susScr2.swap
+ cd /hive/data/genomes/bosTau4/bed/blastz.susScr2.swap
+ time nice -n +19 doBlastzChainNet.pl -verbose=2 \
+ /hive/data/genomes/susScr2/bed/lastzBosTau4.2010-03-27/DEF \
+ -swap -noLoadChainSplit -syntenicNet \
+ -workhorse=hgwdev -smallClusterHub=encodek -bigClusterHub=pk \
+ -chainMinScore=3000 -chainLinearGap=medium > swap.log 2>&1 &
+ # most interesting: this failed on the first step, chainSwap,
+ # but the failure didn't make it stop; it continued and produced
+ # zero results to the end. Running manually:
+ cd /hive/data/genomes/bosTau4/bed/blastz.susScr2.swap/axtChain
+export sizeG=188743680
+ulimit -d $sizeG
+ulimit -v $sizeG
+
+chainSwap /hive/data/genomes/susScr2/bed/lastzBosTau4.2010-03-27/axtChain/susScr2.bosTau4.all.chain.gz stdout \
+| nice chainSort stdin stdout | nice gzip -c > bosTau4.susScr2.all.chain.gz
+
+ # it also runs out of memory in the lift over file creation:
+ export sizeG=188743680
+ ulimit -d $sizeG
+ ulimit -v $sizeG
+
+ netChainSubset -verbose=0 noClass.net bosTau4.susScr2.all.chain.gz stdout \
+ | chainStitchId stdin stdout | gzip -c > bosTau4.susScr2.over.chain.gz
+
+ # and netChains.csh is finished manually with this added:
+# memory limit 160 Gb
+limit datasize 163840m
+limit vmemoryuse 163840m
+
+ # manually run the loadUp.csh with this added:
+# memory limit 160 Gb
+limit datasize 163840m
+limit vmemoryuse 163840m
+ # real 498m5.861s
+
+ cat fb.bosTau4.chainSusScr2Link.txt
+ # 1383557633 bases of 2731830700 (50.646%) in intersection
+
+#########################################################################