a7d5080da217a1cc9ab8006cc34ccac66b4dbcff markd Sun Jan 16 14:54:57 2022 -0800 import of GENCODE 39lift37' diff --git src/hg/makeDb/doc/hg19.gencode.txt src/hg/makeDb/doc/hg19.gencode.txt index 9ca2aeb..a38ce53 100644 --- src/hg/makeDb/doc/hg19.gencode.txt +++ src/hg/makeDb/doc/hg19.gencode.txt @@ -924,15 +924,61 @@ These are missing from data/release_39lift37/gencode.v39lift37.metadata.Transcript_source.gz data/release_39lift37/gencode.v39lift37.metadata.Gene_source.gz this is the weird cases of SPRV3 which has now has a transcript past the PAR echo -e 'ENST00000302805.2\tensembl_havana_transcript_homo_sapiens' >> tables/wgEncodeGencodeTranscriptSourceV39lift37.tab echo -e 'ENSG00000168939.6\tensembl_havana_transcript_homo_sapiens' >> tables/wgEncodeGencodeGeneSourceV39lift37.tab rm loaded/wgEncodeGencode*Support* (time nice make -j 10 -f ~/kent/src/hg/makeDb/outside/gencode/gencodeLoad.mk) >&build.4.out& # commit all jkmake alpha DBS=hg19 ############################################################################## +2022-01-16: import of UCSC GENCODE group processing of GENCODE V39lift37 (markd) + # final release + + # edit hg/makeDb/outside/gencode/gencodeLoad.mk to set release and ensembl versions + + # download, build and load tables + mkdir -p /hive/data/genomes/hg19/bed/gencodeV39lift37/hgcImport + pushd /hive/data/genomes/hg19/bed/gencodeV39lift37/hgcImport + + (time nice make -j 10 -f ~/kent/src/hg/makeDb/outside/gencode/gencodeLoad.mk) >&build.1.out& + + # compare tables from previous release to see if number changed makes + # sense. Results are in gencode-cmp.tsv + # generate trackDb and joiner blurb + pushd ~/kent/src/hg/makeDb/trackDb + ../../makeDb/outside/gencode/bin/gencodeGenerateTrackDbs hg19 39lift37 105 'Oct 2021' + + # Update human/hg19/wgEncodeGencodeSuper.html and update 'Release Notes' + # to describe new release. 
+ + # edit human/hg19/trackDb.gencode.ra to add new .ra file include + jkmake DBS=hg19 + + # edit all.joiner to add ~/tmp/gencodeV39lift37.joiner + # verify with: + pushd /hive/data/genomes/hg19/bed/gencodeV39lift37/hgcImport + make -f ~/kent/src/hg/makeDb/outside/gencode/gencodeLoad.mk joinerCheck + + # generates joiner errors + The gene/transcript pair is missing from metadata: + ENSG00000168939.6 / ENST00000302805.2 / SPRY3 + These are missing from + data/release_39lift37/gencode.v39lift37.metadata.Transcript_source.gz + data/release_39lift37/gencode.v39lift37.metadata.Gene_source.gz + + this is the weird case of SPRY3, which now has a transcript past the PAR + + echo -e 'ENST00000302805.2\tensembl_havana_transcript_homo_sapiens' >> tables/wgEncodeGencodeTranscriptSourceV39lift37.tab + echo -e 'ENSG00000168939.6\tensembl_havana_transcript_homo_sapiens' >> tables/wgEncodeGencodeGeneSourceV39lift37.tab + rm loaded/wgEncodeGencode*Support* + (time nice make -j 10 -f ~/kent/src/hg/makeDb/outside/gencode/gencodeLoad.mk) >&build.4.out& + + # commit all + jkmake alpha DBS=hg19 + +##############################################################################