976e5f5a2582e99913f82839e86efccdca88d814
angie
  Fri Mar 22 13:12:51 2013 -0700
Adding information from the Database of Non-Synonymous Functional Prediction (dbNSFP, https://sites.google.com/site/jpopgen/dbNSFP,
http://dbnsfp.houstonbioinformatics.org/dbNSFPzip/dbNSFP2.0.readme.txt).
dbNSFP2.0 contains precomputed predictions from a variety of tools of the
effects of all possible missense variants on protein-coding Gencode rel 9
(Ens 64) transcripts.  For example, it contains scores and predictions
from SIFT, PolyPhen2 and similar tools (MutationTaster, MutationAssessor,
LRT), as well as GERP scores at CDS positions and associated domain
information from InterPro and IDs from UniProt.  Each subset is
extracted into a bigBed or bigWig file so that users of the Variant
Annotation Integrator will be able to apply one or more of these
prediction methods to their variants.
refs #6152

diff --git src/hg/lib/dbNsfpSeqChange.as src/hg/lib/dbNsfpSeqChange.as
new file mode 100644
index 0000000..5aa456d
--- /dev/null
+++ src/hg/lib/dbNsfpSeqChange.as
@@ -0,0 +1,21 @@
+table dbNsfpSeqChange
+"Coding sequence missense changes annotated by dbNSFP (http://dbnsfp.houstonbioinformatics.org/)"
+    (
+    string chrom;      "Reference sequence chromosome or scaffold"
+    uint   chromStart; "Start position in chromosome"
+    uint   chromEnd;   "End position in chromosome"
+    enum('A','C','G','T') refAl;   "Allele found in reference assembly"
+    lstring ensTxId;   "Ensembl transcript ID(s); can be comma-sep'd list of overlapping transcripts"
+    lstring ensGeneId; "Ensembl gene ID(s); usually single, but can be comma-sep'd list parallel to ensTxId"
+    enum('+','-') strand; "Strand of Ensembl transcript(s)"
+    string refCodon;   "Codon from reference assembly; may be a list like codonPos (unconfirmed)"
+    string codonPos;   "Position of change in codon (1, 2 or 3); can be list"
+    char[1] refAa;     "Amino acid for refCodon or '.' (in which case we can recompute)"
+    string aaPos;      "Offset of changed amino acid (1-based); can be list"
+    enum('A','C','G','T') altAl1;       "alternate allele #1"
+    char[1] altAa1;                     "Amino acid for codon with altAl1 substituted at codonPos"
+    enum('A','C','G','T','.') altAl2;   "alternate allele #2"
+    char[1] altAa2;                     "Amino acid for codon with altAl2 substituted at codonPos"
+    enum('A','C','G','T','.') altAl3;   "alternate allele #3"
+    char[1] altAa3;                     "Amino acid for codon with altAl3 substituted at codonPos"
+    )