800586745616553f76c9c435f0a4fb89db39c976
hiram
  Thu Jan 24 11:07:58 2019 -0800
checking bbi file stats needs errCatch refs #18869

diff --git src/hg/hubApi/hubApi.c src/hg/hubApi/hubApi.c
index 73f3610..80704fc 100644
--- src/hg/hubApi/hubApi.c
+++ src/hg/hubApi/hubApi.c
@@ -1,135 +1,298 @@
 /* hubApi - access mechanism to hub data resources. */
 #include "common.h"
 #include "linefile.h"
 #include "hash.h"
 #include "options.h"
 #include "jksql.h"
 #include "htmshell.h"
 #include "web.h"
 #include "cheapcgi.h"
 #include "cart.h"
 #include "hui.h"
 #include "udc.h"
 #include "knetUdc.h"
 #include "genbank.h"
 #include "trackHub.h"
 #include "hgConfig.h"
 #include "hCommon.h"
 #include "hPrint.h"
+#include "bigWig.h"
+#include "hubConnect.h"
+#include "obscure.h"
 
 /* Global Variables */
 struct cart *cart;             /* CGI and other variables */
 struct hash *oldVars = NULL;
+static struct hash *trackCounter = NULL;
+static long totalTracks = 0;
+static boolean measureTiming = FALSE;	/* set by CGI parameters */
+static boolean allTrackSettings = FALSE;	/* checkbox setting */
+
+static void trackSettings(struct trackDb *tdb)
+/* process the settingsHash for a track */
+{
+hPrintf("    <ul>\n");
+struct hashEl *hel;
+struct hashCookie hc = hashFirst(tdb->settingsHash);
+while ((hel = hashNext(&hc)) != NULL)
+    {
+    hPrintf("    <li>%s : %s</li>\n", hel->name, (char *)hel->val);
+    }
+hPrintf("    </ul>\n");
+}
+
+static void bbiBriefMeasure(char *type, char *bigDataUrl, long *chromCount, long *itemCount)
+/* check a bigDataUrl to find chrom count and item count */
+{
+*chromCount = 0;
+*itemCount = 0;
+if (startsWithWord("bigBed", type))
+    {
+    struct bbiFile *bbi = bigBedFileOpen(bigDataUrl);
+    struct bbiChromInfo *chromList = bbiChromList(bbi);
+    *chromCount = slCount(chromList);
+    *itemCount = bigBedItemCount(bbi);
+    bbiFileClose(&bbi);
+    }
+else if (startsWithWord("bigWig", type))
+    {
+    struct bbiFile *bwf = bigWigFileOpen(bigDataUrl);
+    struct bbiChromInfo *chromList = bbiChromList(bwf);
+    struct bbiSummaryElement sum = bbiTotalSummary(bwf);
+    *chromCount = slCount(chromList);
+    *itemCount = sum.validCount;
+    bbiFileClose(&bwf);
+    }
+}
 
 static void trackList(struct trackDb *tdb)
+/* process the track list to show all tracks */
 {
 if (tdb)
     {
+    struct hash *countTracks = hashNew(0);
     hPrintf("    <ul>\n");
     struct trackDb *track = tdb;
     for ( ; track; track = track->next )
 	{
-	    hPrintf("    <li>%s</li>\n", track->track);
+        char *bigDataUrl = hashFindVal(track->settingsHash, "bigDataUrl");
+      char *compositeTrack = hashFindVal(track->settingsHash, "compositeTrack");
+        boolean compositeOn = sameOk("on", compositeTrack) ? TRUE : FALSE;
+        boolean depthSearch = cartUsualBoolean(cart, "depthSearch", FALSE);
+        if (compositeOn)
+           hashIncInt(countTracks, "composite container");
+        else
+           hashIncInt(countTracks, track->type);
+        if (depthSearch && bigDataUrl)
+	    {
+	    long chromCount = 0;
+	    long itemCount = 0;
+	    bbiBriefMeasure(track->type, bigDataUrl, &chromCount, &itemCount);
+	    if (startsWithWord("bigBed", track->type))
+	    	hPrintf("    <li>%s : %s : %ld chroms : %ld item count</li>\n", track->track, track->type, chromCount, itemCount);
+	    else if (startsWithWord("bigWig", track->type))
+	    	hPrintf("    <li>%s : %s : %ld chroms : %ld bases covered</li>\n", track->track, track->type, chromCount, itemCount);
+	    else
+	    	hPrintf("    <li>%s : %s : %ld chroms : %ld count</li>\n", track->track, track->type, chromCount, itemCount);
+	    }
+        else
+	    {
+	    if (compositeOn)
+		hPrintf("    <li>%s : %s : composite track container</li>\n", track->track, track->type);
+	    else if (! depthSearch)
+		hPrintf("    <li>%s : %s : %s</li>\n", track->track, track->type, bigDataUrl);
+            else
+		hPrintf("    <li>%s : %s</li>\n", track->track, track->type);
+	    }
+        if (allTrackSettings)
+            trackSettings(track); /* show all settings */
+	}
+    hPrintf("    <li>%d different track types</li>\n", countTracks->elCount);
+    if (countTracks->elCount)
+	{
+        hPrintf("        <ul>\n");
+        struct hashEl *hel;
+        struct hashCookie hc = hashFirst(countTracks);
+        while ((hel = hashNext(&hc)) != NULL)
+	    {
+            int prevCount = ptToInt(hashFindVal(trackCounter, hel->name));
+	    totalTracks += ptToInt(hel->val);
+	    hashReplace(trackCounter, hel->name, intToPt(prevCount + ptToInt(hel->val)));
+	    hPrintf("        <li>%d - %s</li>\n", ptToInt(hel->val), hel->name);
+	    }
+        hPrintf("        </ul>\n");
 	}
     hPrintf("    </ul>\n");
     }
 }
 
 static void assemblySettings(struct trackHubGenome *thg)
+/* display all the assembly 'settingsHash' */
 {
 hPrintf("    <ul>\n");
 struct hashEl *hel;
 struct hashCookie hc = hashFirst(thg->settingsHash);
 while ((hel = hashNext(&hc)) != NULL)
     {
     hPrintf("    <li>%s : %s</li>\n", hel->name, (char *)hel->val);
-    if (sameWord("trackDb", hel->name))
+    if (sameWord("trackDb", hel->name))	/* examine the trackDb structure */
 	{
         struct trackDb *tdb = trackHubTracksForGenome(thg->trackHub, thg);
 	trackList(tdb);
         }
     }
 hPrintf("    </ul>\n");
 }
 
 static void genomeList (struct trackHub *hubTop)
+/* follow the pointers from the trackHub to trackHubGenome and around
+ * in a circle from one to the other to find all hub resources
+ */
 {
 struct trackHubGenome *thg = hubTop->genomeList;
 
 hPrintf("<h4>genome sequences (and tracks) present in this track hub</h4>\n");
 hPrintf("<ul>\n");
+long lastTime = clock1000();
 for ( ; thg; thg = thg->next )
     {
+    if (thg->organism)
+	{
 	hPrintf("<li>%s - %s - %s</li>\n", thg->organism, thg->name, thg->description);
+	}
+    else
+	{	/* can there be a description when organism is empty ? */
+	hPrintf("<li>%s</li>\n", thg->name);
+	}
     if (thg->settingsHash)
 	assemblySettings(thg);
+    if (measureTiming)
+	{
+	long thisTime = clock1000();
+	hPrintf("<em>processing time %s: %ld millis</em><br>\n", thg->name, thisTime - lastTime);
+	}
+    }
+if (trackCounter->elCount)
+    {
+    hPrintf("    <li>%ld total tracks counted, %d different types:</li>\n", totalTracks, trackCounter->elCount);
+    hPrintf("    <ul>\n");
+    struct hashEl *hel;
+    struct hashCookie hc = hashFirst(trackCounter);
+    while ((hel = hashNext(&hc)) != NULL)
+	{
+	hPrintf("    <li>%d - %s - total</li>\n", ptToInt(hel->val), hel->name);
+	}
+    hPrintf("    </ul>\n");
     }
 hPrintf("</ul>\n");
 }
 
+static void displayPublicHubs()
+/* show URLs to all public hubs */
+{
+hPrintf("<h3>public hub URLs from hgwdev-gi</h3>\n");
+hPrintf("<ul>\n");
+struct sqlConnection *conn = hConnectCentral();
+// Build a query to find all public hub URL's
+struct dyString *query = sqlDyStringCreate("select hubUrl from %s",
+                                           hubPublicTableName());
+struct sqlResult *sr = sqlGetResult(conn, query->string);
+char **row;
+while ((row = sqlNextRow(sr)) != NULL)
+{
+    hPrintf("<li>%s</li>\n", row[0]);
+}
+
+hPrintf("</ul>\n");
+}
+
 void doMiddle(struct cart *theCart)
 /* Set up globals and make web page */
 {
 cart = theCart;
+measureTiming = hPrintStatus() && isNotEmpty(cartOptionalString(cart, "measureTiming"));
+measureTiming = TRUE;
 char *database = NULL;
 char *genome = NULL;
 char *url = "https://genome-test.gi.ucsc.edu/~hiram/hubs/Plants/hub.txt";
 getDbAndGenome(cart, &database, &genome, oldVars);
 initGenbankTableNames(database);
 
 char *docRoot = cfgOptionDefault("browser.documentRoot", DOCUMENT_ROOT);
-// fprintf(stderr, "# DBG: docRoot: '%s'\n", docRoot);
 
 int timeout = cartUsualInt(cart, "udcTimeout", 300);
 if (udcCacheTimeout() < timeout)
     udcSetCacheTimeout(timeout);
 knetUdcInstall();
 
 char *pathInfo = getenv("PATH_INFO");
 
 if ((NULL == pathInfo) || strlen(pathInfo) < 1) {
    pathInfo = cloneString("noPathInfo");
 }
-// fprintf(stderr, "# DBG: pathInfo: '%s'\n", pathInfo);
 
 cartWebStart(cart, database, "access mechanism to hub data resources");
 
-
 char *urlInput = cartUsualString(cart, "urlHub", url);
+long lastTime = clock1000();
 struct trackHub *hub = trackHubOpen(urlInput, "");
+if (measureTiming)
+    {
+    long thisTime = clock1000();
+    hPrintf("<em>hub open time: %ld millis</em><br>\n", thisTime - lastTime);
+    }
+
+
 hPrintf("<form action='%s' name='hubApiUrl' id='hubApiUrl' method='GET'\n\n", "../cgi-bin/hubApi");
 hPrintf("<br>Enter hub URL:&nbsp;");
 hPrintf("<input type='text' name='urlHub' id='urlHub' size='60' value='%s'>\n", urlInput);
 hWrites("&nbsp;");
-// hPrintf("<em>after box</em>");
 hButton("goApi", "go");
+boolean depthSearch = cartUsualBoolean(cart, "depthSearch", FALSE);
+hPrintf("<br>\n&nbsp;&nbsp;");
+hCheckBox("depthSearch", cartUsualBoolean(cart, "depthSearch", FALSE));
+hPrintf("&nbsp;perform full bbi file measurement : %s<br>\n", depthSearch ? "TRUE" : "FALSE");
+hPrintf("\n&nbsp;&nbsp;");
+allTrackSettings = cartUsualBoolean(cart, "allTrackSettings", FALSE);
+hCheckBox("allTrackSettings", allTrackSettings);
+hPrintf("&nbsp;display all track settings for each track : %s<br>\n", allTrackSettings ? "TRUE" : "FALSE");
+
 hPrintf("<br>\n</form>\n");
 
 hPrintf("<p>URL: %s<br>\n", urlInput);
 hPrintf("name: %s<br>\n", hub->shortLabel);
 hPrintf("description: %s<br>\n", hub->longLabel);
 hPrintf("default db: '%s'<br>\n", isEmpty(hub->defaultDb) ? "(none available)" : hub->defaultDb);
 printf("pathInfo:'%s'<br>\ndocRoot:'%s'<br>\n", pathInfo, docRoot);
 
 if (hub->genomeList)
     genomeList(hub);
 
 hPrintf("<h2>cart dump</h2>");
 hPrintf("<pre>\n");
 cartDump(cart);
 hPrintf("</pre>\n");
 hPrintf("</p>\n");
+
+displayPublicHubs();
+
 cartWebEnd();
 }
 
 /* Null terminated list of CGI Variables we don't want to save
  * permanently. */
 char *excludeVars[] = {"Submit", "submit", NULL,};
 
 int main(int argc, char *argv[])
 /* Process command line. */
 {
+long enteredMainTime = clock1000();
 cgiSpoof(&argc, argv);
+measureTiming = TRUE;
+verboseTimeInit();
+trackCounter = hashNew(0);
 cartEmptyShell(doMiddle, hUserCookie(), excludeVars, oldVars);
+if (measureTiming)
+    hPrintf("<em>Overall total time: %ld millis</em><br>\n", clock1000() - enteredMainTime);
 return 0;
 }