325f711f30c884459738f065f3415ce2914ec828
braney
  Wed Aug 13 16:18:51 2025 -0700
Get hgConvert and hgLiftOver to use GenArk assemblies that are not in
the UCSC taxId list.

diff --git src/hg/makeDb/doc/genarkOrg.txt src/hg/makeDb/doc/genarkOrg.txt
index 49af77240df..56c6073e73a 100644
--- src/hg/makeDb/doc/genarkOrg.txt
+++ src/hg/makeDb/doc/genarkOrg.txt
@@ -15,18 +15,18 @@
 grep "genbank common" names.dmp | tawk '{print $1, $3}' | sort > taxIdCommon.txt
 
 # mapping of genark accessions to NCBI Common names
 join -t $'\t' taxIdCommon.txt taxIdGC.txt | tawk '{print $3,$2}' | sort > gcToCommon.txt
 
 # get list of scientific names from NCBI taxonomy database
 grep "scientific" names.dmp | tawk '{print $1, $3}' | sort > taxIdScientific.txt
 
 # mapping of genark accessions to NCBI Scientific names
 join -t $'\t' taxIdScientific.txt taxIdGC.txt | tawk '{print $3,$2}' | sort > gcToSci.txt
 
 # get list of all GCs to make "other" file
 cut -f 2 taxIdGC.txt | sort > gc.txt
 tawk '{print $1, "Other"}' gc.txt > gcToOther.txt
 
-cat gcToUCSCOrg.txt gcToCommon.txt gcToSci.txt gcToOther.txt  | tawk '{if (!seen[$1]) print; seen[$1]=1}' | sort >  genarkOrg.txt
+cat gcToUCSCOrg.txt gcToCommon.txt gcToSci.txt gcToOther.txt  | tawk '{if (!seen[$1]) { $2 = toupper(substr($2,1,1)) tolower(substr($2,2));  print}; seen[$1]=1}' | sort >  genarkOrg.txt
 
 # load as genarkOrg table..