src/hg/encode/encodeValidate/doEncodeValidate.pl 1.149
1.149 2009/02/13 18:28:08 mikep
Assume the last column is optional, because it is missing from some data.
Index: src/hg/encode/encodeValidate/doEncodeValidate.pl
===================================================================
RCS file: /projects/compbio/cvsroot/kent/src/hg/encode/encodeValidate/doEncodeValidate.pl,v
retrieving revision 1.148
retrieving revision 1.149
diff -b -B -U 4 -r1.148 -r1.149
--- src/hg/encode/encodeValidate/doEncodeValidate.pl 13 Feb 2009 18:21:58 -0000 1.148
+++ src/hg/encode/encodeValidate/doEncodeValidate.pl 13 Feb 2009 18:28:08 -0000 1.149
@@ -912,8 +912,9 @@
}
sub validateBowtie
# Unknown format (for download) from Wold lab.
+# Assume last column is optional
# Sample lines:-
# HWI-EAS229_75_30DY0AAXX:7:1:0:1545/1 + chr1 5983615 NCGTCCATCTCACATCGTCAGGAAAGGGGGAAGCACTGGATGGCTGTGGCCTCACAGGCAGGGAGAGTGGGGTCC IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII 0 0:G>N
# HWI-EAS229_75_30DY0AAXX:7:1:0:1591/1 - uc002fcb.1|22|70699936 45 CTATTTCCACCAAGCAGCCAAGCTCAAGGGAATCGGGGAGTACGTGAACATCCGCACAGGGATGCCCTGCCACTN IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII 0 0:T>N]
# HWI-EAS229_75_30DY0AAXX:7:1:0:1766/1 - chr18 72954304 GCAGCCACCAGAAGCGGGAAGAGGTGAAGACAGAGCCTCCTGCAGAGCTCCCACTCTGCCAACGCCTTGACTTTN IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII 0 0:G>N,59:T>G
@@ -927,9 +928,9 @@
chomp;
$lineNumber++;
next if m/^#/; # allow comment lines, consistent with lineFile and hgLoadBed
die "Failed bowtie validation, file '$file'; line $lineNumber: line=[$_]\n"
- unless $_ =~ m/^([A-Za-z0-9:>_,\.\|\/-]+)\t([+-])\t([A-Za-z0-9:>_,\.\|\/-]+)\t(\d+)\t(\w+)\t(\w+)\t(\d+)\t([A-Za-z0-9:>_,\.\|\/-]+)$/;
+ unless $_ =~ m/^([A-Za-z0-9:>_,\.\|\/-]+)\t([+-])\t([A-Za-z0-9:>_,\.\|\/-]+)\t(\d+)\t(\w+)\t(\w+)\t(\d+)\t([A-Za-z0-9:>_,\.\|\/-]+)?$/;
last if($opt_quick && $lineNumber >= $quickCount);
}
$fh->close();
HgAutomate::verbose(2, "File \'$file\' passed $type validation\n");