ca23d9f5054fc863beb18d7ef4919b550b2f8d9c
chmalee
  Mon Jun 1 10:45:37 2026 -0700
Allow dot in genome names in hubspace uploads, refs #37665

diff --git src/hg/hgHubConnect/hooks/pre-finish.c src/hg/hgHubConnect/hooks/pre-finish.c
index 1a5ade8b314..ca5ba1323a8 100644
--- src/hg/hgHubConnect/hooks/pre-finish.c
+++ src/hg/hgHubConnect/hooks/pre-finish.c
@@ -1,274 +1,276 @@
 /* pre-finish  - tus daemon pre-finish hook program. Reads
  * a JSON encoded request to finsh an upload from a tus
  * client and moves a downloaded file to a specific user
  * directory. */
 #include "common.h"
 #include "linefile.h"
 #include "hash.h"
 #include "options.h"
 #include "wikiLink.h"
 #include "customTrack.h"
 #include "userdata.h"
 #include "jsonQuery.h"
 #include "jsHelper.h"
 #include "errCatch.h"
 #include "obscure.h"
 #include "hooklib.h"
 #include "jksql.h"
 #include "hdb.h"
 #include "hubSpace.h"
 #include "hubSpaceKeys.h"
 #include "md5.h"
 #include "cheapcgi.h"
 
 void usage()
 /* Explain usage and exit. */
 {
 errAbort(
   "pre-finish - tus daemon pre-finish hook program\n"
   "usage:\n"
   "   pre-finish < input\n"
   );
 }
 
 /* Command line validation table. */
 static struct optionSpec options[] = {
    {NULL, 0},
 };
 
 int preFinish()
 /* pre-finish hook for tus daemon. Read JSON encoded hook request from
  * stdin and write a JSON encoded hook to stdout. Writing to stderr
  * will be redirected to the tusd log and not seen by the user, so for
  * errors that the user needs to see, they need to be in the JSON response */
 {
 // TODO: create response object and do all error catching through that
 char *reqId = getenv("TUS_ID");
 // always return an exit status to the daemon and print to stdout, as
 // stdout gets sent by the daemon back to the client
 int exitStatus = 0;
 struct jsonElement *response = makeDefaultResponse();
 if (!(reqId))
     {
     rejectUpload(response, "not a TUS request");
     exitStatus = 1;
     }
 else
     {
     char *tusFile = NULL, *tusInfo = NULL;
     struct errCatch *errCatch = errCatchNew(0);
     if (errCatchStart(errCatch))
         {
         // the variables for the row entry for this file, some can be NULL
         char *userName = NULL;
         char *dataDir = NULL, *userDataDir = NULL;
         char *fileName = NULL;
         long long fileSize = 0;
         char *fileType = NULL;
         char *db = NULL;
         char *reqLm = NULL;
         time_t lastModified = 0;
         boolean isHubToolsUpload = FALSE;
         char *parentDir = NULL, *encodedParentDir = NULL;
 
         struct lineFile *lf = lineFileStdin(FALSE);
         char *request = lineFileReadAll(lf);
         struct jsonElement *req = jsonParse(request);
         fprintf(stderr, "Hook request:\n");
         jsonPrintToFile(req, NULL, stderr, 0);
         char *reqCookie= jsonQueryString(req, "", "Event.HTTPRequest.Header.Cookie[0]", NULL);
         if (reqCookie)
             {
             setenv("HTTP_COOKIE", reqCookie, 0);
             }
         fprintf(stderr, "reqCookie='%s'\n", reqCookie);
         userName = getUserName();
         if (!userName)
             {
             // maybe an apiKey was provided, use that instead to look up the userName
             char *apiKey = jsonQueryString(req, "", "Event.Upload.MetaData.apiKey", NULL);
             userName = hubSpaceUserNameForApiKey(NULL, apiKey);
             if (!userName)
                 errAbort("You are not logged in. Please navigate to My Data -> My Sessions and log in or create an account.");
             }
         fprintf(stderr, "userName='%s'\n", userName);
         // NOTE: All Upload.MetaData values are strings
         // Check multiple possible metadata keys for filename (Uppy sends 'filename' and 'name' by default,
         // our JS code also sets 'fileName' - try all to handle resumed uploads with old metadata)
         char *rawFileName = jsonQueryString(req, "", "Event.Upload.MetaData.fileName", NULL);
         if (!rawFileName)
             rawFileName = jsonQueryString(req, "", "Event.Upload.MetaData.filename", NULL);
         if (!rawFileName)
             rawFileName = jsonQueryString(req, "", "Event.Upload.MetaData.name", NULL);
         fileName = rawFileName ? cgiEncodeFull(rawFileName) : NULL;
         fileSize = jsonQueryInt(req, "",  "Event.Upload.Size", 0, NULL);
         fileType = jsonQueryString(req, "", "Event.Upload.MetaData.fileType", NULL);
         db = jsonQueryString(req, "", "Event.Upload.MetaData.genome", NULL);
         // Blocks newline injection into the synthesized hub.txt.
+        // The allowed character class must match sanitizeGenomeName() in
+        // src/hg/js/hgMyData.js.
         if (db && db[0])
             {
             char *p;
             for (p = db; *p; p++)
-                if (!(isalnum((unsigned char)*p) || *p == '_' || *p == '-'))
-                    errAbort("Invalid genome name '%s': only letters, digits, '_' and '-' are allowed", db);
+                if (!(isalnum((unsigned char)*p) || *p == '_' || *p == '-' || *p == '.'))
+                    errAbort("Invalid genome name '%s': only letters, digits, '.', '_' and '-' are allowed", db);
             }
         reqLm = jsonQueryString(req, "", "Event.Upload.MetaData.lastModified", NULL);
         if (reqLm)
             lastModified = sqlLongLong(reqLm) / 1000; // yes Javascript dates are in millis
         else
             lastModified = time(NULL); // fallback to current time if not provided
         parentDir = jsonQueryString(req, "", "Event.Upload.MetaData.parentDir", NULL);
         fprintf(stderr, "parentDir = '%s'\n", parentDir ? parentDir : "(null)");
         // strip out plain leading '.' and '/' components
         // middle '.' components are dealt with later
         if (parentDir && (startsWith("./", parentDir) || startsWith("/", parentDir)))
             parentDir = skipBeyondDelimit(parentDir, '/');
         tusFile = jsonQueryString(req, "", "Event.Upload.Storage.Path", NULL);
         tusInfo = jsonQueryString(req, "", "Event.Upload.Storage.InfoPath", NULL);
         if (fileName == NULL)
             {
             errAbort("No filename found in upload metadata (checked fileName, filename, and name)");
             }
         else if (tusFile == NULL)
             {
             errAbort("No Event.Path setting");
             }
         else
             {
             userDataDir = dataDir = getDataDir(userName);
             // if parentDir provided we are throwing the files in there
             if (parentDir)
                 {
                 encodedParentDir = encodePath(parentDir);
                 if (!endsWith(encodedParentDir, "/"))
                     encodedParentDir = catTwoStrings(encodedParentDir, "/");
                 dataDir = catTwoStrings(dataDir, encodedParentDir);
                 }
             // the directory may not exist yet
             int oldUmask = 00;
             if (!isDirectory(dataDir))
                 {
                 fprintf(stderr, "making directory '%s'\n", dataDir);
                 // the directory needs to be 777, so ignore umask for now
                 oldUmask = umask(0);
                 makeDirsOnPath(dataDir);
                 // restore umask
                 umask(oldUmask);
                 }
             mustRemove(tusInfo);
             }
 
         // we've passed all the checks so we can write a new or updated row
         // to the mysql table and return to the client that we were successful
         if (exitStatus == 0)
             {
             // create a hub for this upload, which can be edited later
             struct hubSpace *row = NULL;
             AllocVar(row);
             row->userName = userName;
             row->fileName = fileName;
             row->fileSize = fileSize;
             row->fileType = fileType;
             row->creationTime = NULL; // automatically handled by mysql
             row->lastModified = sqlUnixTimeToDate(&lastModified, TRUE);
             row->db = db;
             // resolve any symlinks in the path, because tusd sets the path as
             // the command line specified dataDir + pre-create's ChangeFileInfo
             // this was leading to a bug where the uploaded file had the symlinked
             // path, but the containing hub.txt and directory row had the realpath,
             // which was causing confusion in the UI code
             char *canonicalPath = realpath(tusFile, NULL);
             if (canonicalPath != NULL)
                 row->location = canonicalPath;
             else
                 {
                 // all upload data should have been received and thus the realpath
                 // should not fail, but just in case, put something valid here
                 row->location = tusFile;
                 }
             row->md5sum = md5HexForFile(row->location);
             row->parentDir = encodedParentDir ? encodedParentDir : "";
             // Derive hubType server-side; never trust the client's hubType.
             // A 2bit always promotes its hub to assembly. Otherwise inherit
             // the existing hub's type, defaulting to trackHub.
             char *parentDirForCheck = encodedParentDir ? hubNameFromPath(encodedParentDir) : "";
             if (sameOk(fileType, "2bit"))
                 row->hubType = "assemblyHub";
             else
                 {
                 char *existingType = existingHubTypeForDir(userName, parentDirForCheck);
                 row->hubType = existingType ? existingType : "trackHub";
                 }
             char *batchHasHubTxtStr = jsonQueryString(req, "", "Event.Upload.MetaData.batchHasHubTxt", NULL);
             boolean batchHasHubTxt = sameOk(batchHasHubTxtStr, "true");
             boolean userOwnNamedHubTxt = userHasOwnNamedHubTxtInDir(userName, parentDirForCheck);
             boolean userAuth = batchHasHubTxt || userOwnNamedHubTxt;
             boolean isHubTxt = sameOk(fileType, "hub.txt");
             boolean isTwoBit = sameOk(fileType, "2bit");
 
             // Serialize hub.txt read-modify-write across parallel pre-finish
             // processes for the same hub. flock is held for the entire
             // decision + action so writeHubText's fileExists check and the
             // upgrade's read-rewrite are atomic with respect to siblings.
             // Without a parentDir there is no hub to protect.
             int hubLockFd = encodedParentDir ? lockHubDir(dataDir) : -1;
             if (!isHubToolsUpload && !isHubTxt)
                 {
                 if (!userAuth)
                     {
                     if (isTwoBit)
                         {
                         if (!literalHubTxtExistsOnDisk(parentDirForCheck, userDataDir))
                             createNewTempHubForUpload(reqId, row, userDataDir, encodedParentDir);
                         upgradeExistingHubToAssembly(row, userDataDir, encodedParentDir);
                         }
                     else
                         createNewTempHubForUpload(reqId, row, userDataDir, encodedParentDir);
                     }
                 else if (isTwoBit)
                     {
                     // user's hub.txt is authoritative; just flip rows to assemblyHub.
                     upgradeExistingHubToAssembly(row, userDataDir, encodedParentDir);
                     }
                 }
             unlockHubDir(hubLockFd);
             // first make the parentDir rows
             makeParentDirRows(row->userName, sqlDateToUnixTime(row->lastModified), row->db, row->parentDir, userDataDir, row->hubType);
             row->parentDir = encodedParentDir ? hubNameFromPath(encodedParentDir) : "";
             addHubSpaceRowForFile(row);
             fprintf(stderr, "added hubSpace row for file '%s'\n", fileName);
             fflush(stderr);
             }
         }
     if (errCatch->gotError)
         {
         // App-level reject: exit 0 + RejectUpload=true is the tusd protocol for
         // forwarding HTTPResponse verbatim. Non-zero gets wrapped.
         rejectUpload(response, errCatch->message->string);
         // must remove the tusd temp files so if the users tries again after a temp error
         // the upload will work
         if (tusFile)
             {
             mustRemove(tusFile);
             mustRemove(tusInfo);
             }
         // TODO: if the first mysql request in createNewTempHubForUpload() works but then
         // either of makeParentDirRows() or addHubSpaceRowForFile() fails, we need to also
         // drop any rows we may have added because the upload didn't full go through
         exitStatus = 0;
         }
     errCatchEnd(errCatch);
     }
 // always print a response no matter what
 jsonPrintToFile(response, NULL, stdout, 0);
 return exitStatus;
 }
 
 int main(int argc, char *argv[])
 /* Process command line. */
 {
 optionInit(&argc, argv, options);
 if (argc != 1)
     usage();
 return preFinish();
 }