src/hg/makeDb/doc/hg19.txt 1.70
1.70 2010/01/05 03:04:20 hartera
Changed data for Burge RNA-seq track to BED format. Moved Exoniphy trackDb entry to human level trackDb.ra file.
Index: src/hg/makeDb/doc/hg19.txt
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/makeDb/doc/hg19.txt,v
retrieving revision 1.69
retrieving revision 1.70
diff -b -B -U 4 -r1.69 -r1.70
--- src/hg/makeDb/doc/hg19.txt 28 Dec 2009 19:38:30 -0000 1.69
+++ src/hg/makeDb/doc/hg19.txt 5 Jan 2010 03:04:20 -0000 1.70
@@ -7272,10 +7272,12 @@
# BURGE LAB DATA MAPPED WITH GEMMAPPER. PROVIDED BY THOMAS DERRIEN FROM RODERIC
# GUIGO'S LAB AT CRG. (E-MAIL: thomas.derrien@crg.es). Data received on
# 09/14/09.
# (hartera, 2009-09-28, DONE)
-# 2009-12-14. Set cdsStart = cdsEnd = 0. Moved track data directory to
+# 2009-12-14, hartera. Set cdsStart = cdsEnd = 0. Moved track data directory to
# /hive/data/genomes/hg18/bed.
+# 2010-01-04, hartera. Change the data to BED format and re-loaded tables. BED
+# is more appropriate for this data type.
mkdir /hive/groups/gencode/browser/hg19/burgeRnaSeqGemMapperAlign
cd /hive/groups/gencode/browser/hg19/burgeRnaSeqGemMapperAlign
@@ -7350,8 +7352,31 @@
# Then move data to directory in hg19 genome bed directory
cd /hive/data/genomes/hg19/bed
mv /hive/groups/gencode/browser/hg19/burgeRnaSeqGemMapperAlign ./
+ # 2010-01-04 Change the data to BED format. For genePred format,
+ # there is always a track configuration added for colouring tracks by
+ # genomic codons which does not make sense for this data. Also, BED is
+ # more appropriate for this data type.
+ cd /hive/data/genomes/hg19/bed/burgeRnaSeqGemMapperAlign
+ # Convert gff to genePred and then genePred to BED, drop old table and
+ # then load database with BED format data. Need to fix the cdStart and
+ # cdsEnd fields to be 0.
+ foreach f (`ls burgeRnaSeqGemMapperAlign*.gff`)
+ echo $f >> bed.log
+ set g=$f:r
+ echo $g
+ ldHgGene -exon=read -nobin -out=${g}.gp hg19 $g $f >>& bed.log
+ awk 'BEGIN {FS="\t"} {OFS="\t"} {print $1,$2,$3,$4,$5,0,0,$8,$9,$10}' \
+ ${g}.gp > ${g}Fixed.gp
+ genePredToBed ${g}Fixed.gp > ${g}.bed
+ echo "Dropping table $g"
+ hgsql -e "drop table ${g};" hg19
+ hgLoadBed hg19 $g ${g}.bed >>& bed.log
+ end
+ # Changed track type in trackDb/human/trackDb.ra to bed 12 and
+ # then did make alpha in trackDb directory.
+
##########################################################################
# BUILD ALLEN BRAIN TRACK (DONE 09/30/09 kent)
# Make the working directory
@@ -8239,10 +8264,12 @@
hgsql hg19 < ~/src/hg/lib/geneNetworkId.sql
hgsql hg19 -e \
'load data local infile "GN_human_RefSeq.txt" into table geneNetworkId'
-######################################################################## EXONIPHY (2009-12-28, hartera, DONE)
-
+########################################################################
+# EXONIPHY (2009-12-28, hartera, DONE)
+# 2010-01-05, hartera. Moved trackDb entry for exoniphy up to human directory
+# level as it is the same for all assemblies.
# New predictions for hg19 run by Melissa Hubisz
# (mjhubisz at gmail.com) for hg19 and sent by
# Adam Siepel (acs4 at cornell.edu) on 2009-12-18
mkdir -p /hive/data/genomes/hg19/bed/exoniphy.2009-12-18
@@ -8256,4 +8283,9 @@
ldHgGene -genePredExt -gtf hg19 exoniphy exoniphy.gff
# Read 620689 transcripts in 647299 lines in 1 files
# 620689 groups 24 seqs 1 sources 4 feature types
# 186601 gene predictions
+ # Added a copy of the hg18 track description to trackDb/human/hg19 and
+ # updated it and added a trackDb entry to the trackDb.ra there.
+ # 2010-01-04. Moved exoniphy trackDb entry up to the human level
+ # trackDb.ra since the entry is the same for hg16-19. Removed the entry in
+ # trackDb.ra in each of those assembly directories.