986c4ede954e44904eb314772fb2cf83a48d307c max Wed May 6 06:24:47 2026 -0700 varFreqs: lift GenomeAsia (gasp + gaspIndel) GRCh37 -> hg38 Both subtracks were served at /gbdb/hg38/ but the upstream callset is GRCh37 (caught in QA, see #36642 note 2026-05-04). Lifted with CrossMap using hg19ToHg38.over.chain.gz; recipe matches tishkoff180 / mxbFreq. gasp (SNVs): 66,236,516 -> 66,222,771 (99.98%; 6,240 unmapped + 7,505 alt/random) gaspIndel: 4,415,156 -> 4,410,871 (99.90%; 3,332 unmapped + 953 alt/random) New driver script: scripts/varFreqs/gaspLift.sh. gaspIndel bigDataUrl renamed from All.indels.annot.cont_withmaf.vcf.gz to ga100k.indels.vcf.gz (old name was a verbatim copy of the upstream download name). varFreqsAll combined bigBed regenerated to fold in the corrected coordinates (36.5 GB, 1,166,451,644 items, 125 fields). refs #36642 Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com> diff --git src/hg/makeDb/trackDb/human/varFreqs.ra src/hg/makeDb/trackDb/human/varFreqs.ra index 339c35c94f8..dc64555b103 100644 --- src/hg/makeDb/trackDb/human/varFreqs.ra +++ src/hg/makeDb/trackDb/human/varFreqs.ra @@ -11,31 +11,31 @@ longLabel Variant Frequencies: All Databases Combined with Consequence Annotations type bigBed 9 + parent varFreqs on bigDataUrl /gbdb/$D/varFreqs/varFreqsAll.bb visibility pack itemRgb on maxWindowToDraw 5000000 priority 0.1 #mouseOver $aaChange $dnaChange # Variant type and consequence filters filterValues.varType SNV|SNV,INS|Insertion,DEL|Deletion,MNV|MNV filterLabel.varType Variant Type filterValues.consequence missense|Missense,synonymous|Synonymous,stop_gained|Stop Gained,frameshift|Frameshift,splice_donor|Splice Donor,splice_acceptor|Splice Acceptor,intron|Intron,.|Intergenic filterLabel.consequence Consequence # Source database filter - filterValues.sources AllOfUs|AllOfUs,SPARK|SPARK WES,SFARI_WGS|SFARI WGS,GenomeAsia|GenomeAsia SNVs,GenomeAsiaIndel|GenomeAsia Indels,KOVA|KOVA Korea,ToMMo|ToMMo Japan,IndiGen|IndiGenomes India,FinnGen|FinnGen Finland,Saudi|Saudi,SweGen|SweGen Sweden,TOPMed|TOPMed,ABraOM|ABraOM Brazil,ALFA|ALFA,MGRB|MGRB Australia,HRC|HRC,MexBB|Mexico Biobank,SGDP|SGDP,HGDP1kG|gnomAD HGDP+1kG,GREGoR|GREGoR,SCHEMA|SCHEMA,GA4K|GA4K PacBio LR,CoLoRSdb|CoLoRSdb PacBio LR,SVatalog|SVatalog 101 10XG SR + filterValues.sources AllOfUs|AllOfUs,SPARK|SPARK WES,SFARI_WGS|SFARI WGS,GenomeAsia|GenomeAsia SNVs,GenomeAsiaIndel|GenomeAsia Indels,KOVA|KOVA Korea,ToMMo|ToMMo Japan,IndiGen|IndiGenomes India,FinnGen|FinnGen Finland,Saudi|Saudi,SweGen|SweGen Sweden,TOPMed|TOPMed,ABraOM|ABraOM Brazil,ALFA|ALFA,MGRB|MGRB Australia,HRC|HRC,MexBB|Mexico Biobank,SGDP|SGDP,HGDP1kG|gnomAD HGDP+1kG,GREGoR|GREGoR,SCHEMA|SCHEMA,GA4K|GA4K PacBio LR,CoLoRSdb|CoLoRSdb PacBio LR,SVatalog|SVatalog 101 10XG SR,Tishkoff180|Tishkoff 180 African WGS filterType.sources multipleListOr filterLabel.sources Source Database # Length filters filterByRange.refLen on filterLabel.refLen Reference Length filterByRange.altLen on filterLabel.altLen Alternate Length filterByRange.varLen on filterLabel.varLen Length Change # Max AF filter filterByRange.maxAF on filterLabel.maxAF Max Allele Frequency filterLimits.maxAF 0:1 # Total AC filter filterByRange.totalAC on @@ -77,30 +77,32 @@ filterLabel.MexBBAF Mexico Biobank AF filterByRange.SGDPAF on filterLabel.SGDPAF SGDP AF filterByRange.HGDP1kGAF on filterLabel.HGDP1kGAF gnomAD HGDP+1kG AF (4k cohort) filterByRange.GREGoRAF on filterLabel.GREGoRAF GREGoR AF filterByRange.SCHEMAAF on filterLabel.SCHEMAAF SCHEMA AF filterByRange.GA4KAF on filterLabel.GA4KAF GA4K PacBio LR AF filterByRange.CoLoRSdbAF on filterLabel.CoLoRSdbAF CoLoRSdb PacBio LR AF filterByRange.SVatalogAF on filterLabel.SVatalogAF SVatalog 101 10XG SR AF + filterByRange.Tishkoff180AF on + filterLabel.Tishkoff180AF Tishkoff 180 African WGS AF # Per-database AC filters filterByRange.AllOfUsAC on filterLabel.AllOfUsAC AllOfUs AC filterByRange.SPARKAC on filterLabel.SPARKAC SPARK WES AC filterByRange.SFARI_WGSAC on filterLabel.SFARI_WGSAC SFARI WGS AC filterByRange.GenomeAsiaAC on filterLabel.GenomeAsiaAC GenomeAsia SNVs AC filterByRange.GenomeAsiaIndelAC on filterLabel.GenomeAsiaIndelAC GenomeAsia Indels AC filterByRange.KOVAAC on filterLabel.KOVAAC KOVA Korea AC filterByRange.ToMMoAC on filterLabel.ToMMoAC ToMMo Japan AC @@ -126,30 +128,32 @@ filterLabel.MexBBAC Mexico Biobank AC filterByRange.SGDPAC on filterLabel.SGDPAC SGDP AC filterByRange.HGDP1kGAC on filterLabel.HGDP1kGAC gnomAD HGDP+1kG AC (4k cohort) filterByRange.GREGoRAC on filterLabel.GREGoRAC GREGoR AC filterByRange.SCHEMAAC on filterLabel.SCHEMAAC SCHEMA AC filterByRange.GA4KAC on filterLabel.GA4KAC GA4K PacBio LR AC filterByRange.CoLoRSdbAC on filterLabel.CoLoRSdbAC CoLoRSdb PacBio LR AC filterByRange.SVatalogAC on filterLabel.SVatalogAC SVatalog 101 10XG SR AC + filterByRange.Tishkoff180AC on + filterLabel.Tishkoff180AC Tishkoff 180 African WGS AC # Population-specific AF filters # AllOfUs local-ancestry populations # NB: these are local-ancestry-stratified frequencies (per-position, per-haplotype-class), # NOT the AllOfUs paper's global Rye ancestry categories. See varFreqs.html for details. filterByRange.AllOfUsAF_AFR on filterLabel.AllOfUsAF_AFR AllOfUs African AF (local ancestry) filterByRange.AllOfUsAF_AMR on filterLabel.AllOfUsAF_AMR AllOfUs Indigenous American AF (local ancestry) filterByRange.AllOfUsAF_EAS on filterLabel.AllOfUsAF_EAS AllOfUs East Asian AF (local ancestry) filterByRange.AllOfUsAF_EUR on filterLabel.AllOfUsAF_EUR AllOfUs European AF (local ancestry) filterByRange.AllOfUsAF_OCE on filterLabel.AllOfUsAF_OCE AllOfUs Oceanian AF (local ancestry) filterByRange.AllOfUsAF_SAS on @@ -367,40 +371,40 @@ type vcfTabix parent varFreqs on bigDataUrl /gbdb/$D/varFreqs/mgrb/MGRB.phase3.GRCh38.norm.vcf.gz dataVersion Phase 3 visibility dense # no downloads as per Matt Hobbs email Jan 28 2026 tableBrowser off track gasp shortLabel GenomeAsia 1.7k SNVs longLabel Variant Frequencies: GenomeAsia Pilot - Substitutions type vcfTabix parent varFreqs on bigDataUrl /gbdb/$D/varFreqs/ga100k/ga100k.subst.vcf.gz visibility dense - dataVersion Pilot 2019 (GRCh37 - to be lifted) + dataVersion Pilot 2019 (GRCh37 lifted to hg38 with CrossMap) track gaspIndel shortLabel GenomeAsia 1.7k Indels longLabel Variant Frequencies: GenomeAsia Pilot - Indels type vcfTabix parent varFreqs on - bigDataUrl /gbdb/$D/varFreqs/ga100k/All.indels.annot.cont_withmaf.vcf.gz + bigDataUrl /gbdb/$D/varFreqs/ga100k/ga100k.indels.vcf.gz visibility dense - dataVersion Pilot 2019 (GRCh37 - to be lifted) + dataVersion Pilot 2019 (GRCh37 lifted to hg38 with CrossMap) html gasp track abraom shortLabel Brazil ABraOM 1k WGS longLabel Variant Frequencies: ABraOM Brazil - 1,171 unrelated individuals type vcfTabix parent varFreqs on bigDataUrl /gbdb/$D/varFreqs/abraom/abraom.vcf.gz visibility dense dataVersion SABE-WGS-1171 Sep 2020 track indigenomes shortLabel India IndiGenomes 1k WGS longLabel Variant Frequencies: IndiGenomes India - 1,029 samples type vcfTabix