src/hg/hgTracks/bamTrack.c 1.11

1.11 2009/10/16 00:34:31 angie
Added enhanced coloring options (user-requested) to hgTrackUi and implemented 3 out of 5 in hgTracks.
Index: src/hg/hgTracks/bamTrack.c
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/hgTracks/bamTrack.c,v
retrieving revision 1.10
retrieving revision 1.11
diff -b -B -U 1000000 -r1.10 -r1.11
--- src/hg/hgTracks/bamTrack.c	8 Oct 2009 06:38:23 -0000	1.10
+++ src/hg/hgTracks/bamTrack.c	16 Oct 2009 00:34:31 -0000	1.11
@@ -1,294 +1,461 @@
 /* bamTrack -- handlers for alignments in BAM format (produced by MAQ,
  * BWA and some other short-read alignment tools). */
 
 #ifdef USE_BAM
 
 #include "common.h"
 #include "hCommon.h"
 #include "hash.h"
 #include "linefile.h"
 #include "jksql.h"
 #include "hdb.h"
 #include "hgTracks.h"
+#include "cds.h"
 #include "bamFile.h"
 
 static char const rcsid[] = "$Id$";
 
 struct bamTrackData
     {
     struct track *tg;
     struct hash *pairHash;
     int minAliQual;
+    char *colorMode;
+    char *grayMode;
+    boolean grayUnpaired;
+    char *userTag;
     };
 
 struct simpleFeature *sfFromNumericCigar(const bam1_t *bam, int *retLength)
 /* Translate BAM's numeric CIGAR encoding into a list of simpleFeatures, 
  * and tally up length on reference sequence while we're at it. */
 {
 const bam1_core_t *core = &bam->core;
 struct simpleFeature *sf, *sfList = NULL;
 int tLength=0, tPos = core->pos, qPos = 0;
 unsigned int *cigar = bam1_cigar(bam);
 int i;
 for (i = 0;  i < core->n_cigar;  i++)
     {
     char op;
     int n = bamUnpackCigarElement(cigar[i], &op);
     switch (op)
 	{
 	case 'M': // match or mismatch (gapless aligned block)
 	    AllocVar(sf);
 	    sf->start = tPos;
 	    sf->qStart = qPos;
 	    tPos = sf->end = tPos + n;
 	    qPos = sf->qEnd = qPos + n;
 	    slAddHead(&sfList, sf);
 	    tLength += n;
 	    break;
 	case 'I': // inserted in query
 	case 'S': // skipped query bases at beginning or end ("soft clipping")
 	    qPos += n;
 	    break;
 	case 'D': // deleted from query
 	case 'N': // long deletion from query (intron as opposed to small del)
 	    tPos += n;
 	    tLength += n;
 	    break;
 	case 'H': // skipped query bases not stored in record's query sequence ("hard clipping")
 	case 'P': // P="silent deletion from padded reference sequence" -- ignore these.
 	    break;
 	default:
 	    errAbort("sfFromNumericCigar: unrecognized CIGAR op %c -- update me", op);
 	}
     }
 if (retLength != NULL)
     *retLength = tLength;
 return sfList;
 }
 
 struct linkedFeatures *bamToLf(const bam1_t *bam, void *data)
 /* Translate a BAM record into a linkedFeatures item. */
 {
+struct bamTrackData *btd = (struct bamTrackData *)data;
 const bam1_core_t *core = &bam->core;
 struct linkedFeatures *lf;
 AllocVar(lf);
 lf->score = core->qual;
 safef(lf->name, sizeof(lf->name), bam1_qname(bam));
 lf->orientation = (core->flag & BAM_FREVERSE) ? -1 : 1;
 int length;
 lf->components = sfFromNumericCigar(bam, &length);
 lf->start = lf->tallStart = core->pos;
 lf->end = lf->tallEnd = core->pos + length;
 lf->extra = bamGetQuerySequence(bam);
-lf->grayIx = maxShade;
+if (sameString(btd->colorMode, BAM_COLOR_MODE_GRAY) &&
+    sameString(btd->grayMode, BAM_GRAY_MODE_ALI_QUAL))
+    {
+    // hardcode transform coefficients for now; if user demand, make into tdb/cart vars.
+    int min = 0, max = 99;
+    int minShade = 2;
+    int ix = minShade + (maxShade - minShade) * ((double)(core->qual - min) / (double)(max-min));
+    if (ix > maxShade)
+	ix = maxShade;
+    if (ix < minShade)
+	ix = minShade;
+    lf->grayIx = ix;
+    }
+else
+    lf->grayIx = maxShade;
 return lf;
 }
 
 boolean passesFilters(const bam1_t *bam, struct bamTrackData *btd)
 /* Return TRUE if bam passes hgTrackUi-set filters. */
 {
 if (bam == NULL)
     return FALSE;
 const bam1_core_t *core = &bam->core;
 // Always reject unmapped items -- nowhere to draw them.
 if (core->flag & BAM_FUNMAP)
     return FALSE;
 if (core->qual < btd->minAliQual)
     return FALSE;
 return TRUE;
 }
 
 int addBam(const bam1_t *bam, void *data)
 /* bam_fetch() calls this on each bam alignment retrieved.  Translate each bam 
  * into a linkedFeatures item, and add it to tg->items. */
 {
 struct bamTrackData *btd = (struct bamTrackData *)data;
 if (!passesFilters(bam, btd))
     return 0;
 struct linkedFeatures *lf = bamToLf(bam, data);
 struct track *tg = btd->tg;
 slAddHead(&(tg->items), lf);
 return 0;
 }
 
 static struct linkedFeatures *lfStub(int startEnd, int orientation)
 /* Make a linkedFeatures for a zero-length item (so that an arrow will be drawn
  * toward the given coord. */
 {
 struct linkedFeatures *lf;
 AllocVar(lf);
 safef(lf->name, sizeof(lf->name), "stub");
 lf->orientation = orientation;
 struct simpleFeature *sf;
 AllocVar(sf);
 sf->start = sf->end = lf->start = lf->end = lf->tallStart = lf->tallEnd = startEnd;
 lf->components = sf;
 lf->extra = cloneString("");
 lf->grayIx = maxShade;
 return lf;
 }
 
 static struct linkedFeaturesSeries *lfsFromLf(struct linkedFeatures *lf)
 /* Make a linkedFeaturesSeries from one or two linkedFeatures elements. */
 {
 struct linkedFeaturesSeries *lfs;
 AllocVar(lfs);
 lfs->name = cloneString(lf->name);
 lfs->grayIx = lf->grayIx;
 if (lf->next != NULL)
     slSort(&lf, linkedFeaturesCmpStart);
 lfs->orientation = 0;
 lfs->start = lf->start;
 lfs->end = lf->next ? lf->next->end : lf->end;
 lfs->features = lf;
 return lfs;
 }
 
 int addBamPaired(const bam1_t *bam, void *data)
 /* bam_fetch() calls this on each bam alignment retrieved.  Translate each bam 
  * into a linkedFeaturesSeries item, and either store it until we find its mate
  * or add it to tg->items. */
 {
 const bam1_core_t *core = &bam->core;
 struct bamTrackData *btd = (struct bamTrackData *)data;
 if (! passesFilters(bam, btd))
     return 0;
 struct linkedFeatures *lf = bamToLf(bam, data);
 struct track *tg = btd->tg;
 if (! (core->flag & BAM_FPAIRED))
     {
     slAddHead(&(tg->items), lfsFromLf(lf));
     }
 else
     {
     struct linkedFeatures *lfMate = (struct linkedFeatures *)hashFindVal(btd->pairHash, lf->name);
     if (lfMate == NULL)
 	{
 	if (core->flag & BAM_FPROPER_PAIR)
 	    {
 	    // If we know that this is properly paired, but don't have the mate,
 	    // make a bogus item off the edge of the window so that if we don't
 	    // encounter its mate later, we can at least draw an arrow off the
 	    // edge of the window.
 	    struct linkedFeatures *stub;
 	    if (core->mpos < 0)
 		{
 		int offscreen = (lf->orientation > 0) ? winEnd + 10 : winStart - 10;
 		if (offscreen < 0) offscreen = 0;
 		stub = lfStub(offscreen, -lf->orientation);
 		}
 	    else
 		{
 		stub = lfStub(core->mpos, -lf->orientation);
 		}
 	    lf->next = stub;
 	    }
-	else
+	else if (btd->grayUnpaired)
 	    // not properly paired: make it a lighter shade.
-	    lf->grayIx -= 2;
+	    lf->grayIx -= 3;
 	hashAdd(btd->pairHash, lf->name, lf);
 	}
     else
 	{
 	lfMate->next = lf;
 	slAddHead(&(tg->items), lfsFromLf(lfMate));
 	hashRemove(btd->pairHash, lf->name);
 	}
     }
 return 0;
 }
 
 #define MAX_ITEMS_FOR_MAPBOX 1500
 static void dontMapItem(struct track *tg, struct hvGfx *hvg, void *item,
 			char *itemName, char *mapItemName, int start, int end,
 			int x, int y, int width, int height)
 /* When there are many many items, drawing hgc links can really slow us down. */
 {
 }
 
+static int linkedFeaturesCmpOri(const void *va, const void *vb)
+/* Help sort linkedFeatures by strand, then by starting pos. */
+{
+const struct linkedFeatures *a = *((struct linkedFeatures **)va);
+const struct linkedFeatures *b = *((struct linkedFeatures **)vb);
+int ret = a->orientation - b->orientation;
+if (ret == 0)
+    ret = a->start - b->start;
+return ret;
+}
+
 void bamLoadItemsCore(struct track *tg, boolean isPaired)
 /* Load BAM data into tg->items item list, unless zoomed out so far
  * that the data would just end up in dense mode and be super-slow. */
 {
 char *seqNameForBam = chromName;
 char *stripPrefix = trackDbSetting(tg->tdb, "stripPrefix");
 if (stripPrefix && startsWith(stripPrefix, chromName))
     seqNameForBam = chromName + strlen(stripPrefix);
 char posForBam[512];
 safef(posForBam, sizeof(posForBam), "%s:%d-%d", seqNameForBam, winStart, winEnd);
 
 struct hash *pairHash = isPaired ? hashNew(18) : NULL;
-char cartVarName[512];
-safef(cartVarName, sizeof(cartVarName), "%s_minAliQual", tg->tdb->tableName);
-int minAliQual = cartUsualInt(cart, cartVarName, 0);
-struct bamTrackData btd = {tg, pairHash, minAliQual};
+char cartVarName[1024];
+safef(cartVarName, sizeof(cartVarName), "%s_" BAM_MIN_ALI_QUAL, tg->tdb->tableName);
+int minAliQual = cartUsualInt(cart, cartVarName,
+	       atoi(trackDbSettingOrDefault(tg->tdb, BAM_MIN_ALI_QUAL, BAM_MIN_ALI_QUAL_DEFAULT)));
+safef(cartVarName, sizeof(cartVarName), "%s_" BAM_COLOR_MODE, tg->tdb->tableName);
+char *colorMode = cartUsualString(cart, cartVarName,
+		         trackDbSettingOrDefault(tg->tdb, BAM_COLOR_MODE, BAM_COLOR_MODE_DEFAULT));
+safef(cartVarName, sizeof(cartVarName), "%s_" BAM_GRAY_MODE, tg->tdb->tableName);
+char *grayMode = cartUsualString(cart, cartVarName,
+		         trackDbSettingOrDefault(tg->tdb, BAM_GRAY_MODE, BAM_GRAY_MODE_DEFAULT));
+boolean grayUnpaired = (sameString(colorMode, BAM_COLOR_MODE_GRAY) &&
+			sameString(grayMode, BAM_GRAY_MODE_UNPAIRED));
+safef(cartVarName, sizeof(cartVarName), "%s_" BAM_COLOR_TAG, tg->tdb->tableName);
+char *userTag = cartUsualString(cart, cartVarName,
+		         trackDbSettingOrDefault(tg->tdb, BAM_COLOR_TAG, BAM_COLOR_TAG_DEFAULT));
+struct bamTrackData btd = {tg, pairHash, minAliQual, colorMode, grayMode, grayUnpaired, userTag};
 char *fileName;
 if (tg->customPt)
     {
     fileName = trackDbSetting(tg->tdb, "bigDataUrl");
     if (fileName == NULL)
 	errAbort("bamLoadItemsCore: can't find bigDataUrl for custom track %s", tg->mapName);
     }
 else
     fileName = bamFileNameFromTable(database, tg->mapName, seqNameForBam);
 bamFetch(fileName, posForBam, (isPaired ? addBamPaired : addBam), &btd);
 if (isPaired)
     {
     struct hashEl *hel;
     struct hashCookie cookie = hashFirst(pairHash);
     int count = 0;
     while ((hel = hashNext(&cookie)) != NULL)
 	{
 	struct linkedFeatures *lf = hel->val;
 	slAddHead(&(tg->items), lfsFromLf(lf));
 	count++;
 	}
     }
 if (tg->visibility != tvDense)
     {
     slReverse(&(tg->items));
-    slSort(&(tg->items), isPaired ? linkedFeaturesSeriesCmp : linkedFeaturesCmpStart);
+    if (isPaired)
+	slSort(&(tg->items), linkedFeaturesSeriesCmp);
+    else if (sameString(colorMode, BAM_COLOR_MODE_STRAND))
+	slSort(&(tg->items), linkedFeaturesCmpOri);
+    else
+	slSort(&(tg->items), linkedFeaturesCmpStart);
     if (slCount(tg->items) > MAX_ITEMS_FOR_MAPBOX)
 	tg->mapItem = dontMapItem;
     }
 }
 
 void bamLoadItems(struct track *tg)
 /* Load single-ended-only BAM data into tg->items item list, unless zoomed out so far
  * that the data would just end up in dense mode and be super-slow. */
 {
 bamLoadItemsCore(tg, FALSE);
 }
 
 void bamPairedLoadItems(struct track *tg)
 /* Load possibly paired BAM data into tg->items item list, unless zoomed out so far
  * that the data would just end up in dense mode and be super-slow. */
 {
 bamLoadItemsCore(tg, TRUE);
 }
 
+void bamDrawAt(struct track *tg, void *item,
+	struct hvGfx *hvg, int xOff, int y, double scale,
+	MgFont *font, Color color, enum trackVisibility vis)
+/* Draw a single bam linkedFeatures item.  Borrows a lot from linkedFeaturesDrawAt,
+ * but cuts a lot of unneeded features (like coding region) and adds a couple
+ * additional sources of color. */
+{
+struct linkedFeatures *lf = item;
+struct simpleFeature *sf;
+int heightPer = tg->heightPer;
+int x1 = round((double)((int)lf->start-winStart)*scale) + xOff;
+int x2 = round((double)((int)lf->end-winStart)*scale) + xOff;
+int w = x2-x1;
+int midY = y + (heightPer>>1);
+char *exonArrowsDense = trackDbSetting(tg->tdb, "exonArrowsDense");
+boolean exonArrowsEvenWhenDense = (exonArrowsDense != NULL &&
+				   !sameWord(exonArrowsDense, "off"));
+boolean exonArrows = (tg->exonArrows &&
+		      (vis != tvDense || exonArrowsEvenWhenDense));
+struct dnaSeq *mrnaSeq = NULL;
+enum baseColorDrawOpt drawOpt = baseColorDrawOff;
+boolean indelShowDoubleInsert, indelShowQueryInsert, indelShowPolyA;
+struct psl *psl = NULL;
+if (vis != tvDense)
+    {
+    drawOpt = baseColorDrawSetup(hvg, tg, lf, &mrnaSeq, &psl);
+    if (drawOpt > baseColorDrawOff)
+	exonArrows = FALSE;
+    }
+
+char cartVarName[1024];
+safef(cartVarName, sizeof(cartVarName), "%s_" BAM_COLOR_MODE, tg->tdb->tableName);
+char *colorMode = cartUsualString(cart, cartVarName,
+		         trackDbSettingOrDefault(tg->tdb, BAM_COLOR_MODE, BAM_COLOR_MODE_DEFAULT));
+static Color darkBlueColor = 0;
+static Color darkRedColor = 0;
+if (darkRedColor == 0)
+    {
+    darkRedColor = hvGfxFindColorIx(hvg, 100,0,0);
+    darkBlueColor = hvGfxFindColorIx(hvg, 0,0,100);
+    }
+if (sameString(colorMode, BAM_COLOR_MODE_STRAND))
+    color = (lf->orientation < 0) ? darkRedColor : darkBlueColor;
+else if (lf->filterColor > 0)
+    color = lf->filterColor;
+else if (tg->colorShades)
+    color = tg->colorShades[lf->grayIx];
+
+
+indelEnabled(cart, tg->tdb, basesPerPixel, &indelShowDoubleInsert, &indelShowQueryInsert,
+	     &indelShowPolyA);
+if (!indelShowDoubleInsert)
+    innerLine(hvg, x1, midY, w, color);
+for (sf = lf->components; sf != NULL; sf = sf->next)
+    {
+    int s = sf->start,  e = sf->end;
+    baseColorDrawItem(tg, lf, sf->grayIx, hvg, xOff, y, scale, font, s, e, heightPer,
+		      zoomedToCodonLevel, mrnaSeq, sf, psl, drawOpt, MAXPIXELS, winStart, color);
+    if (tg->exonArrowsAlways ||
+	(exonArrows &&
+	 (sf->start <= winStart || sf->start == lf->start) &&
+	 (sf->end >= winEnd || sf->end == lf->end)))
+	{
+	Color barbColor = hvGfxContrastingColor(hvg, color);
+	x1 = round((double)((int)s-winStart)*scale) + xOff;
+	x2 = round((double)((int)e-winStart)*scale) + xOff;
+	w = x2-x1;
+	clippedBarbs(hvg, x1+1, midY, x2-x1-2, tl.barbHeight, tl.barbSpacing, lf->orientation,
+		     barbColor, TRUE);
+	}
+    }
+if (indelShowDoubleInsert)
+    {
+    int intronGap = 0;
+    if (vis != tvDense)
+	intronGap = atoi(trackDbSettingOrDefault(tg->tdb, "intronGap", "0"));
+    lfDrawSpecialGaps(lf, intronGap, TRUE, 0, tg, hvg, xOff, y, scale, color, color, vis);
+    }
+if (vis != tvDense)
+    {
+    /* If highlighting differences between aligned sequence and genome when
+     * zoomed way out, this must be done in a separate pass after exons are
+     * drawn so that exons sharing the pixel don't overdraw differences. */
+    if (indelShowQueryInsert || indelShowPolyA)
+	baseColorOverdrawQInsert(tg, lf, hvg, xOff, y, scale, heightPer, mrnaSeq, psl, winStart,
+				 drawOpt, indelShowQueryInsert, indelShowPolyA);
+    baseColorOverdrawDiff(tg, lf, hvg, xOff, y, scale, heightPer, mrnaSeq, psl, winStart, drawOpt);
+    baseColorDrawCleanup(lf, &mrnaSeq, &psl);
+    }
+}
+
+void bamPairedDrawAt(struct track *tg, void *item, struct hvGfx *hvg, int xOff, int y,
+		     double scale, MgFont *font, Color color, enum trackVisibility vis)
+/* Draw a bam linked features series item at position. (like linkedFeaturesSeriesDrawAt,
+ * but calls bamDrawAt instead of linkedFeaturesDrawAt) */
+{
+struct linkedFeaturesSeries *lfs = item;
+struct linkedFeatures *lf;
+int midY = y + (tg->heightPer>>1);
+int prevEnd = lfs->start;
+
+if ((lf = lfs->features) == NULL)
+    return;
+for (lf = lfs->features; lf != NULL; lf = lf->next)
+    {
+
+    int x1 = round((double)((int)prevEnd-winStart)*scale) + xOff;
+    int x2 = round((double)((int)lf->start-winStart)*scale) + xOff;
+    int w = x2-x1;
+    if (w > 0)
+	hvGfxLine(hvg, x1, midY, x2, midY, color);
+    bamDrawAt(tg, lf, hvg, xOff, y, scale, font, color, vis);
+    prevEnd = lf->end;
+    }
+}
+
+
 void bamMethods(struct track *track)
 /* Methods for BAM alignment files. */
 {
 track->canPack = TRUE;
 char varName[1024];
-safef(varName, sizeof(varName), "%s_pairEndsByName", track->mapName);
+safef(varName, sizeof(varName), "%s_" BAM_PAIR_ENDS_BY_NAME, track->mapName);
 boolean isPaired = cartUsualBoolean(cart, varName,
-				    (trackDbSetting(track->tdb, "pairEndsByName") != NULL));
+				    (trackDbSetting(track->tdb, BAM_PAIR_ENDS_BY_NAME) != NULL));
 if (isPaired)
     {
     linkedFeaturesSeriesMethods(track);
     track->loadItems = bamPairedLoadItems;
+    track->drawItemAt = bamPairedDrawAt;
     }
 else
     {
     linkedFeaturesMethods(track);
     track->loadItems = bamLoadItems;
+    track->drawItemAt = bamDrawAt;
     }
 track->labelNextItemButtonable = track->nextItemButtonable = FALSE;
 track->labelNextPrevItem = NULL;
 track->nextPrevItem = NULL;
 track->colorShades = shadesOfGray;
 }
 
 #endif /* USE_BAM */