fc930b43fb71b4d45cbe2ad449837434dc6f21fa chmalee Tue Sep 29 09:42:45 2020 -0700 Get geneReviews build script to use updated hg38 gencodeAnnotV35 tables to look for genes diff --git src/hg/utils/otto/geneReviews/buildGeneReviews.sh src/hg/utils/otto/geneReviews/buildGeneReviews.sh index 0801051..6112a99 100755 --- src/hg/utils/otto/geneReviews/buildGeneReviews.sh +++ src/hg/utils/otto/geneReviews/buildGeneReviews.sh @@ -12,36 +12,46 @@ # Load the internal working table geneReviewsGrshortTitleNBKid to # hg38/19/18 hgsql $1 -e 'drop table if exists geneReviewsGrshortTitleNBKidNew' hgsql $1 -e 'create table geneReviewsGrshortTitleNBKidNew select * from geneReviewsGrshortTitleNBKid limit 0' hgsql $1 -e \ 'load data local infile "geneReviewsGrshortTitleNBKid.tab" into table geneReviewsGrshortTitleNBKidNew' # for each refGen in grRefGene.lst, create a non-overlapping bed row. if [ -e "geneReviews.tab" ] then rm geneReviews.tab fi cat grRefGene.lst | while read G do + if [ "$1" = "hg38" ] + then + hgsql $1 -N -e \ + "SELECT e.chrom,e.txStart,e.txEnd,e.name2 \ + FROM gencodeAnnotV35 e where e.name2 ='${G}' \ + ORDER BY e.chrom,e.txStart;" > temp.in + bedRemoveOverlap temp.in temp.out + cat temp.out >> geneReviews.tab + else hgsql $1 -N -e \ "SELECT e.chrom,e.txStart,e.txEnd,j.geneSymbol \ FROM knownGene e, kgXref j WHERE e.name = j.kgID AND \ j.geneSymbol ='${G}' ORDER BY e.chrom,e.txStart;" > temp.in bedRemoveOverlap temp.in temp.out cat temp.out >> geneReviews.tab + fi done rm temp.* # load the collapsed bed4 file to database hgsql $1 -e 'drop table if exists geneReviewsNew' hgLoadBed $1 geneReviewsNew geneReviews.tab # Create and load geneReviewsDetail table hgsql $1 -N -e \ "SELECT s.geneSymbol, s.grShort, t.NBKid, t.grTitle \ FROM geneReviewsGrshortNBKidNew s, geneReviewsGrshortTitleNBKidNew t \ WHERE s.grShort = t.grShort ORDER BY s.geneSymbol;" > geneReviewsDetail.tab hgsql $1 -e 'drop table if exists geneReviewsDetailNew' hgsql $1 -e 'create table geneReviewsDetailNew select * from geneReviewsDetail limit 0'