0bc6be88baf4061ca10c6f207331ec04e36c17f1
hiram
  Fri Feb 2 11:34:37 2024 -0800
better name for this table refs #23589

diff --git src/hg/lib/asmSummary.as src/hg/lib/asmSummary.as
new file mode 100644
index 0000000..4e5b7b2
--- /dev/null
+++ src/hg/lib/asmSummary.as
@@ -0,0 +1,41 @@
+table asmSummary
+"NCBI assembly_summary data, see: https://ftp.ncbi.nlm.nih.gov/genomes/ASSEMBLY_REPORTS/README_assembly_summary.txt"
+    (
+    string assemblyAccession;	"www.ncbi.nlm.nih.gov/assembly/?term=xxx"
+    string bioproject;	"www.ncbi.nlm.nih.gov/bioproject/?term=xxx"
+    string biosample;	"www.ncbi.nlm.nih.gov/biosample/?term=xxx"
+    string wgsMaster;	"www.ncbi.nlm.nih.gov/nuccore/xxx"
+    string refseqCategory;	"representative or reference"
+    uint taxId;	"www.ncbi.nlm.nih.gov/taxonomy/?term=xxx"
+    uint speciesTaxid;	"www.ncbi.nlm.nih.gov/taxonomy/?term=xxx"
+    string organismName;	"binomial scientific name"
+    string infraspecificName;	"strain/cultivar/ecotype/breed"
+    string isolate;	"source of sample"
+    string versionStatus;	"latest/suppressed/replaced"
+    string assemblyLevel;	"Contig/Scaffold/Complete Genome/Chromosome"
+    string releaseType;	"Major/Minor/Patch"
+    string genomeRep;	"Full/Partial"
+    string seqRelDate;	"date YYYY/MM/DD sequence released to INSDC"
+    string asmName;	"submitter supplied name"
+    string asmSubmitter;	"institution submitting assembly"
+    string gbrsPairedAsm;	"GenBank<->RefSeq GCA/GCF relationship"
+    string pairedAsmComp;	"identical/different for GCA<->GCF relationship"
+    string ftpPath;	"ftp.ncbi.nlm.nih.gov/genomes/all/GCx/012/345/678/asmId"
+    string excludedFromRefseq;	"noted reason for exclusion from RefSeq"
+    string relationToTypeMaterial;	"note of assembly relation to sample"
+    string assemblyType;	"haploid/diploid/haploid-with-alt-loci/alternate-pseudohaplotype"
+    string phyloGroup;	"bacteria/viral/archaea/fungi/metagenomes/invertebrate/other/vertebrate_other/plant/vertebrate_mammalian/protozoa"
+    bigint genomeSize;	"total length of all top-level sequences in the primary assembly"
+    bigint genomeSizeUngapped;	"genome length not counting gaps (gap == 10 or more Ns)"
+    float gcPercent;	"GC percent"
+    ushort repliconCount;	"total number of chromosomes, organelle genomes and plasmids"
+    uint scaffoldCount;	"number of scaffolds: placed, unlocalzes, unplace, alternate loci and patch"
+    uint contigCount;	"number of conts in the primary assembly"
+    string annotationProvider;	"the group that provied the annotation on the assembly"
+    string annotationName;	"the name of the annotation"
+    string annotationDate;	"annotation date YYYY/MM/DD"
+    string totalGeneCount;	"total gene count in annotation"
+    uint proteinCodingGeneCount;	"protein coding gene count in annotation"
+    string nonCodingGeneCount;	"non coding gene count in annotation"
+    string pubmedId;	"comma separated list of PubMed ID(s)"
+    )