54452ec022a6073410955c04e110a1784f71fb57 angie Wed Nov 13 17:37:34 2019 -0800 dbSnp153: add new ucscNote otherMapErr for mappings with the same rs# as a mapping w/inconsistent SPDI in BadCoords/Map Err subtrack. refs #23283 diff --git src/hg/utils/automation/doBigDbSnp.pl src/hg/utils/automation/doBigDbSnp.pl index f3d1e5d..311f80a 100755 --- src/hg/utils/automation/doBigDbSnp.pl +++ src/hg/utils/automation/doBigDbSnp.pl @@ -503,37 +503,44 @@ ); $bossScript->execute() }; } # doFixHg19ChrM ######################################################################### # * step: check [workhorse] sub doCheck { my $runDir = $buildDir; my $whatItDoes = "It runs checkBigDbSnp on merged bigDbSnp files."; my $bossScript = newBash HgRemoteScript("$runDir/doCheck.sh", $workhorse, $runDir, $whatItDoes); + foreach my $db (@dbList) { + $bossScript->add(<<_EOF_ +cut -f 4 $db.$outRoot.badCoords.bed | sort -u > $db.badCoords.ids.txt +_EOF_ + ); + } $bossScript->add(<<_EOF_ pids="" _EOF_ ); foreach my $db (@dbList) { $bossScript->add(<<_EOF_ -time checkBigDbSnp $db.$outRoot.bigDbSnp $HgAutomate::clusterData/$db/$db.2bit $db.$outRoot.checked.bigDbSnp & +time checkBigDbSnp -mapErrIds=$db.badCoords.ids.txt \\ + $db.$outRoot.bigDbSnp $HgAutomate::clusterData/$db/$db.2bit $db.$outRoot.checked.bigDbSnp & echo \$! pids+=" \$!" _EOF_ ); } $bossScript->add(<<_EOF_ for pid in \$pids; do if wait \$pid; then echo pid \$pid done else echo pid \$pid FAILED exit 1 fi done _EOF_ @@ -575,30 +582,31 @@ system("chmod a+x $makeSubsetsScript") == 0 || die "Unable to chmod $makeSubsetsScript"; my $whatItDoes = "It runs bedToBigBed on merged & checked bigDbSnp files and makes ". "Mult, Common and ClinVar subsets."; my $bossScript = newBash HgRemoteScript("$runDir/doBigBed.sh", $workhorse, $runDir, $whatItDoes); $bossScript->add(<<_EOF_ pids="" _EOF_ ); foreach my $db (@dbList) { $bossScript->add(<<_EOF_ time bedToBigBed -tab -as=\$HOME/kent/src/hg/lib/bigDbSnp.as -type=bed4+ -extraIndex=name \\ $db.$outRoot.checked.bigDbSnp /hive/data/genomes/$db/chrom.sizes $db.$outRoot.bb & +pids+=" \$!" time bedToBigBed -tab -type=bed4 -extraIndex=name \\ $db.$outRoot.badCoords.bed /hive/data/genomes/$db/chrom.sizes $db.${outRoot}BadCoords.bb & pids+=" \$!" $makeSubsetsScript $db & pids+=" \$!" _EOF_ ); } $bossScript->add(<<_EOF_ for pid in \$pids; do if wait \$pid; then echo pid \$pid done else echo pid \$pid FAILED exit 1