5ca30cc929e4339791f5e9886caadc4e7922df56 hiram Mon May 17 12:51:02 2021 -0700 shorten the version string and extract the version number correctly refs #27575 diff --git src/hg/utils/automation/doNcbiRefSeq.pl src/hg/utils/automation/doNcbiRefSeq.pl index 2f93677..f74e1db 100755 --- src/hg/utils/automation/doNcbiRefSeq.pl +++ src/hg/utils/automation/doNcbiRefSeq.pl @@ -329,31 +329,31 @@ my $dbTwoBit = "$HgAutomate::clusterData/$db/$db.2bit"; $dbTwoBit = $target2bit if (-s "$target2bit"); $bossScript->add(<<_EOF_ # establish all variables to use here export asmId=$asmId export downloadDir=$downloadDir export ncbiGffGz=\$downloadDir/\${asmId}_genomic.gff.gz export db=$db export gff3ToRefLink=$gff3ToRefLink export gbffToCds=$gbffToCds export dateStamp=`date "+%F"` -export annotationRelease=`zcat \$ncbiGffGz | head -100 | grep ^#.annotation-source | sed -e 's/.*annotation-source //'` +export annotationRelease=`zcat \$ncbiGffGz | head -100 | grep ^#.annotation-source | sed -e 's/.*annotation-source //; s/ Updated Annotation Release//;'` if [ "\$annotationRelease" == "" ]; then export annotationRelease=\$asmId fi export versionDate=`ls -L --full-time \$ncbiGffGz | awk '{print \$6;}'` echo "\$annotationRelease (\$versionDate)" > ncbiRefSeqVersion.txt # this produces the genePred in NCBI coordinates # 8/23/17: gff3ToGenePred quits over illegal attribute SO_type... make it legal (so_type): if [ -s ../../../download/\${asmId}.remove.dups.list ]; then zcat \$ncbiGffGz | grep -v -f ../../../download/\${asmId}.remove.dups.list \\ | sed -re 's/([;\\t])SO_type=/\\1so_type=/;' \\ | gff3ToGenePred $warnOnly -refseqHacks -attrsOut=\$asmId.attrs.txt \\ -unprocessedRootsOut=\$asmId.unprocessedRoots.txt stdin \$asmId.gp else zcat \$ncbiGffGz \\ @@ -562,30 +562,31 @@ my $bossScript = newBash HgRemoteScript("$runDir/doLoad.bash", $dbHost, $runDir, $whatItDoes); my $gbdbDir = "$HgAutomate::gbdb/\$db/ncbiRefSeq"; my $dbTwoBit = "$HgAutomate::clusterData/$db/$db.2bit"; $dbTwoBit = $target2bit if (-s "$target2bit"); my $genePredCheckDb = "genePredCheck -db=\$db"; if (! $dbExists) { $genePredCheckDb = "genePredCheck"; } my $verString = `cat $buildDir/process/ncbiRefSeqVersion.txt`; chomp $verString; $verString =~ s/.*elease //; + $verString =~ s/^[^0-9]*//; $verString =~ s/ .*//; $bossScript->add(<<_EOF_ # establish all variables to use here export db="$db" export asmId="$asmId" export verString="$verString" _EOF_ ); if (! $dbExists) { $bossScript->add(<<_EOF_ export target2bit=$dbTwoBit