4389d5f48220ed09aff243f8ff13b064e7dc7e0b braney Wed Feb 22 17:32:10 2012 -0800 moving various pieces of code to build the omim table into one place #6943 diff --git src/utils/omim/buildOmimTracks.csh src/utils/omim/buildOmimTracks.csh index 6142f69..5c4a34c 100755 --- src/utils/omim/buildOmimTracks.csh +++ src/utils/omim/buildOmimTracks.csh @@ -1,167 +1,167 @@ #!/bin/tcsh # BUILD $1 OMIM RELATED TRACKS cat genemap|sed -e 's/|/\t/g' > genemap.tab hgLoadSqlTab -warn $1 omimGeneMap ~/kent/src/hg/lib/omimGeneMap.sql genemap.tab # Load mim2gene table fgrep -v "gene/phenotype" mim2gene.txt > j.tmp.1 fgrep "gene/phenotype" mim2gene.txt > j.tmp.2 cut -f 2 j.tmp.2|sed -e 's/\//\t/' >j.tmp cut -f 1 j.tmp.2 >j.1 cut -f 1 j.tmp >j.g cut -f 2 j.tmp >j.p cut -f 3-5 j.tmp.2 >j.345 paste j.1 j.g j.345 >jj.g paste j.1 j.p j.345 >jj.p cat j.tmp.1 jj.g jj.p >mim2gene.updated.txt rm j.* jj.* cut -f 1 mim2gene.updated.txt >j1 cut -f 2 mim2gene.updated.txt >j2 cut -f 3 mim2gene.updated.txt >j3 paste j1 j3 j2 >mim2gene.tab hgsql $1 -e 'drop table mim2gene' hgsql $1 < ~/kent/src/hg/lib/mim2gene.sql hgsql $1 -e 'load data local infile "mim2gene.tab" into table mim2gene ignore 1 lines' hgsql $1 -e 'drop table omim2gene' hgsql $1 < ~/kent/src/hg/lib/omim2gene.sql hgsql $1 -e 'load data local infile "mim2gene.updated.txt" into table omim2gene ignore 1 lines' # build omimGeneSymbol table doOmimGeneSymbols $1 j.out cat j.out |sort -u >omimGeneSymbol.tab hgLoadSqlTab -warn $1 omimGeneSymbol ~/kent/src/hg/lib/omimGeneSymbol.sql omimGeneSymbol.tab -perl ./script1.pl --gene-map-file=genemap >omimPhenotype.tab +perl ./parseGeneMap.pl --gene-map-file=genemap >omimPhenotype.tab hgLoadSqlTab -warn $1 omimPhenotype ~/kent/src/hg/lib/omimPhenotype.sql omimPhenotype.tab hgsql $1 -e 'update omimPhenotype set omimPhenoMapKey = -1 where omimPhenoMapKey=0' hgsql $1 -e 'update omimPhenotype set phenotypeId = -1 where phenotypeId=0' doOmimGene2 $1 j.tmp cat j.tmp |sort -u > omimGene2.tab hgLoadBed $1 omimGene2 omimGene2.tab rm j.tmp ############################################################## # build the omimAvSnp track mkdir -p av cd av # get the mimAV.txt data file from OMIM cp ../mimAV.txt . -p cut -f 1 mimAV.txt >j1 cut -f 2 mimAV.txt >j2 cut -f 3 mimAV.txt >j3 cut -f 4 mimAV.txt >j4 cut -f 5 mimAV.txt >j5 cat j1 |sed -e 's/\./\t/' >j1.2 cat j4 |sed -e 's/,/\t/' >j4-2 cut -f 1 j4-2 >j4.1 cut -f 2 j4-2 >j4.2 paste j1 j1.2 j3 j4 j4.1 j4.2 j5 j2 >omimAv.tab hgsql $1 -e 'drop table omimAv' hgsql $1 < ~/src/hg/lib/omimAv.sql hgsql $1 -e 'load data local infile "omimAv.tab" into table omimAv ignore 1 lines' hgsql $1 -e 'update omimAv set repl2 = rtrim(ltrim(repl2))' doOmimAv $1 omimAvRepl.tab j.err hgsql $1 -e "drop table omimAvRepl" hgsql $1 < ~/kent/src/hg/lib/omimAvRepl.sql hgsql $1 -e 'load data local infile "omimAvRepl.tab" into table omimAvRepl' rm j1.2 j1 j2 j3 j4 j4-2 j4.1 j4.2 j5 if ($1 == "hg18") then hgsql $1 -N -e 'select chrom, chromStart, chromEnd, avId from omimAvRepl r, snp130 s where s.name = dbSnpId order by avId' |sort -u > omimAvSnp.tab else hgsql $1 -N -e 'select chrom, chromStart, chromEnd, avId from omimAvRepl r, snp132 s where s.name = dbSnpId order by avId' |sort -u > omimAvSnp.tab endif hgLoadBed -allowStartEqualEnd $1 omimAvSnp omimAvSnp.tab cd .. ############################################################## echo build omimLocation ... mkdir -p location cd location doOmimLocation $1 omimLocation.bed j.err hgLoadBed $1 omimLocation omimLocation.bed # Remove all gene entries in omimGene2 from omimLocation table hgsql $1 -N -e \ 'delete from omimLocation where name in (select name from omimGene2) ' # Per OMIM request, delete all the gray entries in omimLocation table. mkdir -p cleanUpOmimLocation cd cleanUpOmimLocation echo cleaning omimLocation ... hgsql $1 -N -e \ 'select distinct name from omimLocation' |sort -u >j.all hgsql $1 -N -e \ 'select distinct name from omimLocation, omimPhenotype where name=omimId and omimPhenoMapKey=1' >j.1 hgsql $1 -N -e \ 'select distinct name from omimLocation, omimPhenotype where name=omimId and omimPhenoMapKey=2' >j.2 hgsql $1 -N -e \ 'select distinct name from omimLocation, omimPhenotype where name=omimId and omimPhenoMapKey=3' >j.3 hgsql $1 -N -e \ 'select distinct name from omimLocation, omimPhenotype where name=omimId and omimPhenoMapKey=4' >j.4 cat j.1 j.2 j.3 j.4 |sort -u >j.1234 diff j.all j.1234 |grep "<" |sed -e "s/</do1 ${1}/" >doall #cat doall cat << '_EOF_' > do1 hgsql $1 -e "delete from omimLocation where name='${2}'" '_EOF_' #sleep 3 #echo after sleep chmod +x do1 chmod +x doall ./doall ############################################################## # remember to check in new mim2gene.sql