976e5f5a2582e99913f82839e86efccdca88d814 angie Fri Mar 22 13:12:51 2013 -0700 Adding information from the Database of Non-Synonymous Functional Prediction (dbNSFP, https://sites.google.com/site/jpopgen/dbNSFP, http://dbnsfp.houstonbioinformatics.org/dbNSFPzip/dbNSFP2.0.readme.txt). dbNSFP2.0 contains precomputed predictions from a variety of tools of the effects of all possible missense variants on protein-coding Gencode rel 9 (Ens 64) transcripts. For example, it contains scores and predictions from SIFT, PolyPhen2 and similar tools (MutationTaster, MutationAssessor, LRT), as well as GERP scores at CDS positions and associated domain information from InterPro and IDs from UniProt. Each subset is extracted into a bigBed or bigWig file so that users of the Variant Annotation Integrator will be able to apply one or more of these prediction methods to their variants. refs #6152 diff --git src/hg/lib/dbNsfpSeqChange.as src/hg/lib/dbNsfpSeqChange.as new file mode 100644 index 0000000..5aa456d --- /dev/null +++ src/hg/lib/dbNsfpSeqChange.as @@ -0,0 +1,21 @@ +table dbNsfpSeqChange +"Coding sequence missense changes annotated by dbNSFP (http://dbnsfp.houstonbioinformatics.org/)" + ( + string chrom; "Reference sequence chromosome or scaffold" + uint chromStart; "Start position in chromosome" + uint chromEnd; "End position in chromosome" + enum('A','C','G','T') refAl; "Allele found in reference assembly" + lstring ensTxId; "Ensembl transcript ID(s); can be comma-sep'd list of overlapping transcripts" + lstring ensGeneId; "Ensembl gene ID(s); usually single, but can be comma-sep'd list parallel to ensTxId" + enum('+','-') strand; "Strand of Ensembl transcript(s)" + string refCodon; "Codon from reference assembly; can be list????" + string codonPos; "Position of change in codon (1, 2 or 3); can be list" + char[1] refAa; "Amino acid for refCodon or '.' 
(in which case we can recompute)" + string aaPos; "Offset of changed amino acid (1-based); can be list" + enum('A','C','G','T') altAl1; "alternate allele #1" + char[1] altAa1; "Amino acid for codon with altAl1 substituted at codonPos" + enum('A','C','G','T','.') altAl2; "alternate allele #2" + char[1] altAa2; "Amino acid for codon with altAl2 substituted at codonPos" + enum('A','C','G','T','.') altAl3; "alternate allele #3" + char[1] altAa3; "Amino acid for codon with altAl3 substituted at codonPos" + )