src/hg/makeDb/doc/hg18.txt 1.422
1.422 2010/06/02 23:00:02 angie
Updated gwasCatalog.
Index: src/hg/makeDb/doc/hg18.txt
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/makeDb/doc/hg18.txt,v
retrieving revision 1.421
retrieving revision 1.422
diff -b -B -U 4 -r1.421 -r1.422
--- src/hg/makeDb/doc/hg18.txt 1 Jun 2010 17:56:24 -0000 1.421
+++ src/hg/makeDb/doc/hg18.txt 2 Jun 2010 23:00:02 -0000 1.422
@@ -29606,9 +29606,10 @@
# load the table
hgLoadBed -allowStartEqualEnd hg18 snpArrayIlluminaHumanOmni1_Quad snpArrayIlluminaHumanOmni1_Quad.tab -tab -sqlTable=snpArrayIlluminaHumanOmni1_Quad.sql
#############################################################################
-# NHGRI GWAS CATALOG (DONE 5/12/10)
+# NHGRI GWAS CATALOG (DONE 6/2/10)
+# Updated 5/12/10
# Updated 4/1/10
# Updated 3/1/10
# Originally done 1/19/10
# Area of possible future improvement: for SNPs that can't be mapped via our SNP track,
@@ -29618,10 +29619,11 @@
# Done once, don't need to redo:
cut -f 1-4 ../snp130/snp130.bed \
| sort -k4,4 \
> snp130Coords.bed
- mkdir /hive/data/genomes/hg18/bed/gwasCatalog/100512
- cd /hive/data/genomes/hg18/bed/gwasCatalog/100512
+ set today = `date +%y%m%d`
+ mkdir /hive/data/genomes/hg18/bed/gwasCatalog/$today
+ cd /hive/data/genomes/hg18/bed/gwasCatalog/$today
wget http://www.genome.gov/admin/gwascatalog.txt
# Column headers:
# 1 Date Added to Catalog
# 2 PubMedID
@@ -29677,19 +29679,20 @@
| sort -k1,1 -k2n,2n \
> gwasCatalog.bed
hgLoadBed hg18 gwasCatalog gwasCatalog.bed \
-tab -sqlTable=$HOME/kent/src/hg/lib/gwasCatalog.sql -notItemRgb -allowStartEqualEnd
-#Loaded 3461 elements of size 22
+#Loaded 3545 elements of size 22
# For David: find examples of risk alleles for which dbSNP observed
# alleles are complementary (A/T or C/G) -- how do we know what strand the
# risk allele is on?? -- asking corresp. author Teri Manolio.
- hgsql hg18 -e 'select snp.name,gc.riskAllele,snp.strand,snp.refNcbi,snp.observed \
+ hgsql hg18 -NBe 'select snp.name,gc.riskAllele,snp.strand,snp.refNcbi,snp.observed \
from gwasCatalog as gc, snp130 as snp \
where gc.riskAllele rlike "^rs[0-9]+-[ACGT]" and \
gc.name = snp.name and snp.observed in ("C/G", "A/T") \
- order by gc.name limit 20;'
- # count(*) = 170
+ order by gc.name;' > ambigStrand.txt
+ wc -l ambigStrand.txt
+#174 ambigStrand.txt
#############################################################################
# CRG MAPABILITY (2010-01-19 - 2010-01-28, hartera, DONE)