4ba0a7d92cc93673915bb6f24ae81435ea179ce3 hiram Wed Jan 31 17:02:58 2024 -0800 beginning to add a searchable table of genome meta data refs #23589;
diff --git src/hg/lib/genomeData.sql src/hg/lib/genomeData.sql
new file mode 100644
index 0000000..fb2ec78
--- /dev/null
+++ src/hg/lib/genomeData.sql
@@ -0,0 +1,47 @@
+# This schema was first produced by the autoSql program, together with its
+# companion sources genomeData.c and genomeData.h. It defines the database
+# form of a record that can be moved between RAM and storage in a largely
+# automatic fashion.
+
+# NCBI assembly_summary data, one row per assemblyAccession; field meanings presumably follow NCBI's README (TODO confirm).
+CREATE TABLE genomeData (
+    assemblyAccession       VARCHAR(255) NOT NULL,       # assembly accession; required, serves as the primary key
+    bioproject              VARCHAR(255),                # bioproject; may be NULL
+    biosample               VARCHAR(255),                # biosample; may be NULL
+    wgsMaster               VARCHAR(255),                # WGS master; may be NULL
+    refseqCategory          VARCHAR(255),                # RefSeq category; may be NULL
+    taxId                   INT UNSIGNED NOT NULL,       # tax id as an unsigned integer; required
+    speciesTaxid            INT UNSIGNED NOT NULL,       # species-level tax id as an unsigned integer; required
+    organismName            VARCHAR(255) NOT NULL,       # organism name; required
+    infraspecificName       VARCHAR(255),                # infraspecific name; may be NULL
+    isolate                 VARCHAR(255),                # isolate; may be NULL
+    versionStatus           VARCHAR(255) NOT NULL,       # version status; required
+    assemblyLevel           VARCHAR(255) NOT NULL,       # assembly level; required
+    releaseType             VARCHAR(255) NOT NULL,       # release type; required
+    genomeRep               VARCHAR(255) NOT NULL,       # genome rep -- presumably "genome representation", TODO confirm; required
+    seqRelDate              VARCHAR(255) NOT NULL,       # sequence release date, held as text rather than a DATE; required
+    asmName                 VARCHAR(255) NOT NULL,       # assembly name; required
+    asmSubmitter            VARCHAR(255),                # assembly submitter; may be NULL
+    gbrsPairedAsm           VARCHAR(255),                # paired assembly -- presumably the GenBank/RefSeq counterpart, TODO confirm; may be NULL
+    pairedAsmComp           VARCHAR(255),                # paired assembly comparison -- exact values not defined here; may be NULL
+    ftpPath                 VARCHAR(255),                # FTP path; may be NULL
+    excludedFromRefseq      VARCHAR(255),                # excluded-from-RefSeq text; may be NULL
+    relationToTypeMaterial  VARCHAR(255),                # relation to type material; may be NULL
+    assemblyType            TINYINT UNSIGNED NOT NULL,   # assembly type as a small unsigned code; code meanings are not defined in this file
+    phyloGroup              VARCHAR(255) NOT NULL,       # phylo group label; required
+    genomeSize              BIGINT NOT NULL,             # genome size (units not stated here, presumably bases); required
+    genomeSizeUngapped      BIGINT NOT NULL,             # ungapped genome size, same units as genomeSize presumably; required
+    gcPercent               FLOAT NOT NULL,              # GC percent as a float; required
+    repliconCount           SMALLINT UNSIGNED NOT NULL,  # replicon count; required
+    scaffoldCount           INT UNSIGNED NOT NULL,       # scaffold count; required
+    contigCount             INT UNSIGNED NOT NULL,       # contig count; required
+    annotationProvider      VARCHAR(255) NOT NULL,       # annotation provider; required
+    annotationName          VARCHAR(255) NOT NULL,       # annotation name; required
+    annotationDate          VARCHAR(255) NOT NULL,       # annotation date, held as text rather than a DATE; required
+    totalGeneCount          VARCHAR(255),                # total gene count, held as text (unlike proteinCodingGeneCount); may be NULL
+    proteinCodingGeneCount  INT UNSIGNED,                # protein-coding gene count as an unsigned integer; may be NULL
+    nonCodingGeneCount      VARCHAR(255),                # non-coding gene count, held as text; may be NULL
+    pubmedId                VARCHAR(255),                # PubMed id, held as text; may be NULL
+    # Indices: each assembly accession appears at most once
+    PRIMARY KEY (assemblyAccession)
+);