675293a87172d440c9c78b1c1bdc54610bc35a77 braney Tue May 7 14:14:26 2024 -0700 changes to HPRC rearrangements track in response to SAB refs #33484 diff --git src/hg/makeDb/doc/hg38/hprcInDel.txt src/hg/makeDb/doc/hg38/hprcInDel.txt index f57fad4..5452755 100644 --- src/hg/makeDb/doc/hg38/hprcInDel.txt +++ src/hg/makeDb/doc/hg38/hprcInDel.txt @@ -8,29 +8,29 @@ rm -rf topLevel mkdir topLevel for i in ../chain/*.chain; do f=`basename $i .chain`;echo netChainSubset ../net/$f.net $i topLevel/$f.chain -type=top; done > subset.jobs para make subset.jobs rm -rf indels mkdir indels for chain in topLevel/*.chain; do name=`basename $chain | sed 's?.*chainHprc??' | sed 's/\.chain//'` echo chainInDel $chain $name indels/$name.txt done > indel.jobs para make indel.jobs sort -S 50G -k1,1 -k2,2n -k3,3n -k5,5n indels/* > sortIndels.bed -awk '{if (($3 > $2) && ($5 == 0)) print}' sortIndels.bed | chainArrangeCollect -exact arrHumDel stdin stdout | awk '{$11=$3-$2;print $0,$5"-"$3 - $2"bp" }' > $deletions.bed -bedToBigBed $deletions.bed /cluster/data/hg38/chrom.sizes $deletions.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+3 +tawk '{if (($3 > $2) && ($5 == 0)) print}' sortIndels.bed | chainArrangeCollect -exact arrHumDel stdin stdout | tawk '{$11=$3-$2;print $0,$5":"$3 - $2"bp", "# genomes in HPRC with ins: "$5"
Size of ins: "$3 - $2"bp"}' > $deletions.bed +bedToBigBed -tab $deletions.bed /cluster/data/hg38/chrom.sizes $deletions.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+4 rm -f /gbdb/hg38/hprcArr$VERSION/$deletions.bb ln -s `pwd`/$deletions.bb /gbdb/hg38/hprcArr$VERSION -awk '{if ($3 == $2) print}' sortIndels.bed | chainArrangeCollect -exact arrHumIns stdin stdout | awk '{print $0,$5"-"$11"bp" }' >$inserts.bed -bedToBigBed $inserts.bed /cluster/data/hg38/chrom.sizes $inserts.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+3 +tawk '{if ($3 == $2) print}' sortIndels.bed | chainArrangeCollect -exact arrHumIns stdin stdout | tawk '{print $0,$5":"$11"bp","# genomes in HPRC with del: "$5"
Size of del: "$11"bp" }' >$inserts.bed +bedToBigBed -tab $inserts.bed /cluster/data/hg38/chrom.sizes $inserts.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+4 rm -f /gbdb/hg38/hprcArr$VERSION/$inserts.bb ln -s `pwd`/$inserts.bb /gbdb/hg38/hprcArr$VERSION -awk '{if (($3 > $2) && ($5 != 0)) print}' sortIndels.bed | chainArrangeCollect -exact arrHumOth stdin stdout | awk '{print $0,$5"-"$11"bp-"$3-$2"bp" }' >$double.bed -bedToBigBed $double.bed /cluster/data/hg38/chrom.sizes $double.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+3 +tawk '{if (($3 > $2) && ($5 != 0)) print}' sortIndels.bed | chainArrangeCollect -exact arrHumOth stdin stdout | tawk '{print $0,$5":"$11"bp-"$3-$2"bp","# genomes in HPRC with ins: "$5"
Size of ins: "$3-$2"bp
Size of del: "$11"bp" }' >$double.bed +bedToBigBed -tab $double.bed /cluster/data/hg38/chrom.sizes $double.bb -as=$HOME/kent/src/hg/lib/chainArrange.as -type=bed9+4 rm -f /gbdb/hg38/hprcArr$VERSION/$double.bb ln -s `pwd`/$double.bb /gbdb/hg38/hprcArr$VERSION