ba87d8471c9c78f15412ccad2aaba9b46d1af38e
hiram
  Tue Jul 2 16:14:47 2024 -0700
eliminte the dependency upon specific genArk genome names, use the genark table for questions about existence, refs #32596

diff --git src/hg/inc/genark.h src/hg/inc/genark.h
index a5d85a8..25876f7 100644
--- src/hg/inc/genark.h
+++ src/hg/inc/genark.h
@@ -84,31 +84,43 @@
 /* Print out genark as a line in a tab-separated file. */
 
 #define genarkCommaOut(el,f) genarkOutput(el,f,',',',');
 /* Print out genark as a comma separated list including final comma. */
 
 void genarkJsonOutput(struct genark *el, FILE *f);
 /* Print out genark in JSON format. */
 
 /* -------------------------------- End autoSql Generated Code -------------------------------- */
 
 char *genarkUrl(char *accession);
 /* Return the URL to the genark assembly with this accession if present,
  * otherwise return NULL
  * */
 
-char *genArkHubTxt(char *gcX);
-/* given a GC[AF]_012345678.9 name, return hub.txt URL */
+char *genArkPath(char *genome);
+/* given a GenArk hub genome name, e.g. GCA_021951015.1 return the path:
+ *               GCA/021/951/015
+ * prefix that with desired server URL: https://hgdownload.soe.ucsc.edu/hubs/
+ *   if desired.  Or suffix add /hub.txt to get the hub.txt URL
+ *   The path returned does not depend upon this GCx_ naming scheme,
+ *   it simply uses the hub URL as returned from genarkUrl(genome) and
+ *   returns the middle part without the https://... prefix
+ */
 
 char *genarkTableName();
 /* return the genark table name from the environment, 
  * or hg.conf, or use the default.  Cache the result */
 
 /* temporary function while the genark table is in transistion with
  * new coluns being added, July 2024.  Allows compatibility with existing
  * genark table.
  */
 int genArkColumnCount();
 /* return number of columns in genark table */
 
+boolean isGenArk(char *genome);
+/* given a genome name, see if it is in the genark table to determine
+ *  yes/no this is a genark genome assembly
+ */
+
 #endif /* GENARK_H */