src/hg/makeDb/doc/hg18.txt 1.399
1.399 2010/02/18 20:28:39 hartera
Added a Signal track for the Burge RNA-seq data. Updated trackDb entry for this track to include views.
Index: src/hg/makeDb/doc/hg18.txt
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/makeDb/doc/hg18.txt,v
retrieving revision 1.398
retrieving revision 1.399
diff -b -B -U 4 -r1.398 -r1.399
--- src/hg/makeDb/doc/hg18.txt 18 Feb 2010 18:53:24 -0000 1.398
+++ src/hg/makeDb/doc/hg18.txt 18 Feb 2010 20:28:39 -0000 1.399
@@ -28929,8 +28929,13 @@
# 2009-12-14, hartera. Set cdsStart = cdsEnd = 0. Moved track data directory to
# /hive/data/genomes/hg18/bed.
# 2010-01-04, hartera. Change the data to BED format and re-loaded tables. BED
# is more appropriate for this data type.
+# The data is too dense in places (feedback from QA) so it would be more
+# appropriate to have a Signal track as for the ENCODE RNA-seq data tracks.
+# 2010-02-09, hartera. Create bedGraph Signal subtracks for each tissue/cell
+# using reads/per million mapped reads as the data value.
+# 2010-02-17, hartera. Updated trackDb.ra entry to include views.
mkdir /hive/groups/gencode/browser/hg18/burgeRnaSeqGemMapperAlign
cd /hive/groups/gencode/browser/hg18/burgeRnaSeqGemMapperAlign
@@ -29026,8 +29031,32 @@
end
# Changed track type in trackDb/human/trackDb.ra to bed 12 and
# then did make alpha in trackDb directory.
+ # 2010-02-09. Add a Signal track so it is easier to view the data in
+ # regions where there is a high density of reads.
+ cd /hive/data/genomes/hg18/bed/burgeRnaSeqGemMapperAlign
+ # Use bedItemOverlapCount to get counts of overlapping items for each base.
+ # Need to sort the bed files and then get the number of reads mapped for
+ # that tissue. Divide the counts by the number of million mapped reads to
+ # get reads per million mapped reads as the data value.
+ foreach f (`ls *.bed`)
+ echo $f
+ set g=$f:r
+ sort $f | bedItemOverlapCount hg18 stdin > ${f}.count
+ set size=`hgsql -Ne "select count(distinct name) from ${g};" hg18`
+ awk -v size=${size} 'BEGIN {OFS="\t"} {print $1,$2,$3,($4 / (size/1000000));}' ${f}.count > ${g}.bedGraph
+ end
+ # Load the bedGraph tables into the database as Raw Signal tracks.
+ foreach f (`ls *.bedGraph`)
+ echo $f
+ set g=$f:r
+ hgLoadBed -bedGraph=4 hg18 ${g}AllRawSignal $f >>& load.log
+ end
+ # 2010-02-17
+ # trackDb.ra entry in trackDb/human was updated to include views for the
+ # Raw Signal and Alignment subtracks.
+
############################################################################
# TRANSMAP vertebrate.2009-09-13 build (2009-09-20 markd)
vertebrate-wide transMap alignments were built Tracks are created and loaded
@@ -29341,8 +29370,9 @@
end
# Added a trackDb entry for this subtrack of the ENCODE Mapability
# track in kent/src/hg/makeDb/trackDb/human/hg18/trackDb.wgEncode.ra
# use bigWigInfo to check min and max values.
+
#####################################################################
# tRNAs track (2010-01-12, Fan DONE)
#
ssh hgwdev