34dc2bb14c176fb8f788df267fdb3fd4c8f461b4
braney
Fri Feb 17 07:00:46 2023 -0800
fix some encoding issues and an errant printf on the TOGO hgc page.
diff --git src/hg/hgc/togaClick.c src/hg/hgc/togaClick.c
index 5608e5c..00a4c8c 100644
--- src/hg/hgc/togaClick.c
+++ src/hg/hgc/togaClick.c
@@ -327,42 +327,42 @@
printf("We define the following variables:\n
\n");
printf("
c: number of reference bases in the intersection between chain blocks and coding exons of the gene under consideration.
\n");
printf("
C: number of reference bases in the intersection between chain blocks and coding exons of all genes.
\n");
printf("
a: number of reference bases in the intersection between chain blocks and coding exons and introns of the gene under consideration.
\n");
printf("
A: number of reference bases in the intersection between chain blocks and coding exons and introns of all genes and the intersection\n");
printf("between chain blocks and intergenic regions (excludes UTRs).
\n");
printf("
f: number of reference bases in chain blocks overlapping the 10 kb flanks of the gene under consideration.\n");
printf("Alignment blocks overlapping exons of another gene that is located in these 10 kb flanks are ignored.
\n");
printf("
i: number of reference bases in the intersection between chain blocks and introns of the gene under consideration.
\n");
printf("
CDS (coding sequence): length of the coding region of the gene under consideration.
\n");
printf("
I: sum of all intron lengths of the gene under consideration.
\n");
printf("
\n");
printf("Using these variables, TOGA computes the following features:\n");
printf("
\n");
-printf("
“global CDS fraction” as C / A. Chains with a high value have alignments that largely overlap coding exons,");
+printf("
"global CDS fraction" as C / A. Chains with a high value have alignments that largely overlap coding exons,");
printf("which is a hallmark of paralogous or processed pseudogene chains. In contrast, chains with a low value also align many ");
printf("intronic and intergenic regions, which is a hallmark of orthologous chains.
\n");
-printf("
“local CDS fraction” as c / a. Orthologous chains tend to have a lower value, as intronic ");
+printf("
"local CDS fraction" as c / a. Orthologous chains tend to have a lower value, as intronic ");
printf("regions partially align. This feature is not computed for single-exon genes.
\n");
-printf("
“local intron fraction” as i / I. Orthologous chains tend to have a higher value.");
+printf("
"local intron fraction" as i / I. Orthologous chains tend to have a higher value.");
printf("This feature is not computed for single-exon genes.
\n");
-printf("
“flank fraction” as f / 20,000. Orthologous chains tend to have higher values,");
+printf("
"flank fraction" as f / 20,000. Orthologous chains tend to have higher values,");
printf("as flanking intergenic regions partially align. This feature is important to detect orthologous loci of single-exon genes.
\n");
-printf("
“synteny” as log10 of the number of genes, whose coding exons overlap by at least one base aligning");
+printf("
"synteny" as log10 of the number of genes, whose coding exons overlap by at least one base aligning");
printf("blocks of this chain. Orthologous chains tend to cover several genes located in a conserved order, resulting in higher synteny values.
\n");
-printf("
“local CDS coverage” as c / CDS, which is only used for single-exon genes.
\n");
+printf("
"local CDS coverage" as c / CDS, which is only used for single-exon genes.
\n");
printf("
\n");
printf("\n\n \n");
htmlHorizontalLine();
// show inact mut plot
printf("
Visualization of inactivating mutations on exon-intron structure
\n");
printf("%s \n", info->svg_line);
printf(" Exons shown in grey are missing (often overlap assembly gaps).\nExons shown in");
printf(" red or blue are deleted or do not align at all.\nRed indicates that the exon deletion ");
printf("shifts the reading frame, while blue indicates that exon deletion(s) are framepreserving. \n");
// GLP features
printf("Show features used for transcript classification\n");
@@ -419,31 +419,30 @@
printf("\n \n");
// show exons data
htmlHorizontalLine();
printf("
\n \n");
// TODO: check whether I need this
-printf("%s", hgTracksPathAndSettings());
hPrintf("");
hPrintf("");
hPrintf("");
printTrackHtml(tdb); // and do I need this?
}
void doHillerLabTOGAGene(char *database, struct trackDb *tdb, char *item, char *table_name)
/* Put up TOGA Gene track info. */
{
//int start = cartInt(cart, "o");
char headerTitle[512];
char suffix[512];
@@ -516,42 +515,42 @@
printf("We define the following variables:\n
\n");
printf("
c: number of reference bases in the intersection between chain blocks and coding exons of the gene under consideration.
\n");
printf("
C: number of reference bases in the intersection between chain blocks and coding exons of all genes.
\n");
printf("
a: number of reference bases in the intersection between chain blocks and coding exons and introns of the gene under consideration.
\n");
printf("
A: number of reference bases in the intersection between chain blocks and coding exons and introns of all genes and the intersection\n");
printf("between chain blocks and intergenic regions (excludes UTRs).
\n");
printf("
f: number of reference bases in chain blocks overlapping the 10 kb flanks of the gene under consideration.\n");
printf("Alignment blocks overlapping exons of another gene that is located in these 10 kb flanks are ignored.
\n");
printf("
i: number of reference bases in the intersection between chain blocks and introns of the gene under consideration.
\n");
printf("
CDS (coding sequence): length of the coding region of the gene under consideration.
\n");
printf("
I: sum of all intron lengths of the gene under consideration.
\n");
printf("
\n");
printf("Using these variables, TOGA computes the following features:\n");
printf("
\n");
- printf("
“global CDS fraction” as C / A. Chains with a high value have alignments that largely overlap coding exons,");
+ printf("
"global CDS fraction" as C / A. Chains with a high value have alignments that largely overlap coding exons,");
printf("which is a hallmark of paralogous or processed pseudogene chains. In contrast, chains with a low value also align many ");
printf("intronic and intergenic regions, which is a hallmark of orthologous chains.
\n");
- printf("
“local CDS fraction” as c / a. Orthologous chains tend to have a lower value, as intronic ");
+ printf("
"local CDS fraction" as c / a. Orthologous chains tend to have a lower value, as intronic ");
printf("regions partially align. This feature is not computed for single-exon genes.
\n");
- printf("
“local intron fraction” as i / I. Orthologous chains tend to have a higher value.");
+ printf("
"local intron fraction" as i / I. Orthologous chains tend to have a higher value.");
printf("This feature is not computed for single-exon genes.
\n");
- printf("
“flank fraction” as f / 20,000. Orthologous chains tend to have higher values,");
+ printf("
"flank fraction" as f / 20,000. Orthologous chains tend to have higher values,");
printf("as flanking intergenic regions partially align. This feature is important to detect orthologous loci of single-exon genes.
\n");
- printf("
“synteny” as log10 of the number of genes, whose coding exons overlap by at least one base aligning");
+ printf("
"synteny" as log10 of the number of genes, whose coding exons overlap by at least one base aligning");
printf("blocks of this chain. Orthologous chains tend to cover several genes located in a conserved order, resulting in higher synteny values.
\n");
- printf("
“local CDS coverage” as c / CDS, which is only used for single-exon genes.
\n");
+ printf("
"local CDS coverage" as c / CDS, which is only used for single-exon genes.
\n");
printf("
\n");
printf("\n\n \n");
htmlHorizontalLine();
// show inact mut plot
printf("
Visualization of inactivating mutations on exon-intron structure
\n");
printf("%s \n", info->svg_line);
printf(" Exons shown in grey are missing (often overlap assembly gaps).\nExons shown in");
printf(" red or blue are deleted or do not align at all.\nRed indicates that the exon deletion ");
printf("shifts the reading frame, while blue indicates that exon deletion(s) are framepreserving. \n");
// GLP features
printf("Show features used for transcript classification\n");