diff --git a/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.test.ts b/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.test.ts index 9dbfec41..f2cb5f24 100644 --- a/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.test.ts +++ b/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.test.ts @@ -4,6 +4,7 @@ import gff from '@gmod/gff' import { assert, use } from 'chai' import chaiExclude from 'chai-exclude' +import { readFileSync } from 'node:fs' import { gff3ToAnnotationFeature } from './gff3ToAnnotationFeature' import { AnnotationFeatureSnapshot } from '@apollo-annotation/mst' @@ -106,15 +107,66 @@ function compareFeatures( ) } -describe('gff3ToAnnotationFeature', () => { - for (const testCase of testCases) { - const [description, featureLine, convertedFeature] = testCase - it(`converts ${description}`, () => { - const gff3Feature = gff.parseStringSync(featureLine, { - parseSequences: false, - }) - const feature = gff3ToAnnotationFeature(gff3Feature[0]) - compareFeatures(convertedFeature, feature) - }) +function readSingleFeatureFile(fn: string): GFF3Feature { + const lines = readFileSync(fn).toString().split('\n') + const feature: string[] = [] + for (const line of lines) { + if (!line.startsWith('#')) { + feature.push(line) + } } + const inGff = gff.parseStringSync(feature.join('\n')) as GFF3Feature[] + if (inGff.length != 1) { + throw new Error(`Exactly 1 feature expected in file ${fn}`) + } + return inGff[0] +} + +function readAnnotationFeatureSnapshot(fn: string): AnnotationFeatureSnapshot { + const lines = readFileSync(fn).toString() + return JSON.parse(lines) as AnnotationFeatureSnapshot +} + +describe('gff3ToAnnotationFeature examples', () => { + it('Convert one CDS', () => { + const actual = gff3ToAnnotationFeature( + readSingleFeatureFile('test_data/one_cds.gff3'), + ) + const expected = readAnnotationFeatureSnapshot('test_data/one_cds.json') + compareFeatures(actual, expected) + }) + it('Convert two CDSs', () => { + const actual = gff3ToAnnotationFeature( + readSingleFeatureFile('test_data/two_cds.gff3'), + ) + const expected = readAnnotationFeatureSnapshot('test_data/two_cds.json') + compareFeatures(actual, expected) + }) + it('Convert example 1', () => { + const actual = gff3ToAnnotationFeature( + readSingleFeatureFile('test_data/example01.gff3'), + ) + const expected = readAnnotationFeatureSnapshot('test_data/example01.json') + compareFeatures(actual, expected) + }) + it('Convert example 2', () => { + const actual = gff3ToAnnotationFeature( + readSingleFeatureFile('test_data/example02.gff3'), + ) + const expected = readAnnotationFeatureSnapshot('test_data/example02.json') + compareFeatures(actual, expected) + }) }) + +// describe('gff3ToAnnotationFeature', () => { +// for (const testCase of testCases) { +// const [description, featureLine, convertedFeature] = testCase +// it(`converts ${description}`, () => { +// const gff3Feature = gff.parseStringSync(featureLine, { +// parseSequences: false, +// }) +// const feature = gff3ToAnnotationFeature(gff3Feature[0]) +// compareFeatures(convertedFeature, feature) +// }) +// } +// }) diff --git a/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.ts b/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.ts index add25725..afddf059 100644 --- a/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.ts +++ b/packages/apollo-shared/src/GFF3/gff3ToAnnotationFeature.ts @@ -112,7 +112,6 @@ function convertFeatureAttributes( convertedAttributes.gff_source = [source] } if (attributesCollections.length > 0) { - // const newAttributes: Record = {} for (const attributesCollection of attributesCollections) { for (const [key, val] of Object.entries(attributesCollection)) { if (!val || key === 'Parent') { @@ -121,7 +120,7 @@ function convertFeatureAttributes( const newKey = isGFFReservedAttribute(key) ? gffToInternal[key] : key const existingVal = convertedAttributes[newKey] if (existingVal) { - const valSet = new Set(...existingVal, ...val) + const valSet = new Set([...existingVal, ...val]) convertedAttributes[newKey] = [...valSet] } else { convertedAttributes[newKey] = val diff --git a/packages/apollo-shared/test_data/example01.gff3 b/packages/apollo-shared/test_data/example01.gff3 new file mode 100644 index 00000000..bdedf2aa --- /dev/null +++ b/packages/apollo-shared/test_data/example01.gff3 @@ -0,0 +1,26 @@ +##gff-version 3 +##sequence-region chr1 1000 9000 +#example01 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN +chr1 . TF_binding_site 1000 1012 . + . ID=tfbs10001;Parent=gene10001 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001,mRNA10002 +chr1 . exon 1300 1500 . + . ID=exon10002;Parent=mRNA10003 +chr1 . exon 3000 3902 . + . ID=exon10003;Parent=mRNA10001,mRNA10003 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001,mRNA10002,mRNA10003 +chr1 . exon 7000 9000 . + . ID=exon10005;Parent=mRNA10001,mRNA10002,mRNA10003 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 diff --git a/packages/apollo-shared/test_data/example01.json b/packages/apollo-shared/test_data/example01.json new file mode 100644 index 00000000..3027490a --- /dev/null +++ b/packages/apollo-shared/test_data/example01.json @@ -0,0 +1,236 @@ +{ + "_id": "66d7151100dcdf7dda49178d", + "refSeq": "chr1", + "type": "gene", + "min": 999, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda49177a": { + "_id": "66d7151100dcdf7dda49177a", + "refSeq": "chr1", + "type": "TF_binding_site", + "min": 999, + "max": 1012, + "strand": 1, + "attributes": { + "gff_id": ["tfbs10001"] + } + }, + "66d7151100dcdf7dda491780": { + "_id": "66d7151100dcdf7dda491780", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda49177b": { + "_id": "66d7151100dcdf7dda49177b", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"] + } + }, + "66d7151100dcdf7dda49177c": { + "_id": "66d7151100dcdf7dda49177c", + "refSeq": "chr1", + "type": "exon", + "min": 2999, + "max": 3902, + "strand": 1, + "attributes": { + "gff_id": ["exon10003"] + } + }, + "66d7151100dcdf7dda49177d": { + "_id": "66d7151100dcdf7dda49177d", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda49177e": { + "_id": "66d7151100dcdf7dda49177e", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda49177f": { + "_id": "66d7151100dcdf7dda49177f", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10001"], + "gff_name": ["edenprotein.1"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10001"], + "gff_name": ["EDEN.1"] + } + }, + "66d7151100dcdf7dda491785": { + "_id": "66d7151100dcdf7dda491785", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda491781": { + "_id": "66d7151100dcdf7dda491781", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"] + } + }, + "66d7151100dcdf7dda491782": { + "_id": "66d7151100dcdf7dda491782", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda491783": { + "_id": "66d7151100dcdf7dda491783", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda491784": { + "_id": "66d7151100dcdf7dda491784", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10002"], + "gff_name": ["edenprotein.2"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10002"], + "gff_name": ["EDEN.2"] + } + }, + "66d7151100dcdf7dda49178c": { + "_id": "66d7151100dcdf7dda49178c", + "refSeq": "chr1", + "type": "mRNA", + "min": 1299, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda491786": { + "_id": "66d7151100dcdf7dda491786", + "refSeq": "chr1", + "type": "exon", + "min": 1299, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10002"] + } + }, + "66d7151100dcdf7dda491787": { + "_id": "66d7151100dcdf7dda491787", + "refSeq": "chr1", + "type": "exon", + "min": 2999, + "max": 3902, + "strand": 1, + "attributes": { + "gff_id": ["exon10003"] + } + }, + "66d7151100dcdf7dda491788": { + "_id": "66d7151100dcdf7dda491788", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda491789": { + "_id": "66d7151100dcdf7dda491789", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda49178a": { + "_id": "66d7151100dcdf7dda49178a", + "refSeq": "chr1", + "type": "CDS", + "min": 3300, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10003"], + "gff_name": ["edenprotein.3"] + } + }, + "66d7151100dcdf7dda49178b": { + "_id": "66d7151100dcdf7dda49178b", + "refSeq": "chr1", + "type": "CDS", + "min": 3390, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10004"], + "gff_name": ["edenprotein.4"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10003"], + "gff_name": ["EDEN.3"] + } + } + }, + "attributes": { + "gff_id": ["gene10001"], + "gff_name": ["EDEN"] + } +} diff --git a/packages/apollo-shared/test_data/example02.gff3 b/packages/apollo-shared/test_data/example02.gff3 new file mode 100644 index 00000000..34eb3a6b --- /dev/null +++ b/packages/apollo-shared/test_data/example02.gff3 @@ -0,0 +1,31 @@ +##gff-version 3 +##sequence-region chr1 1000 9000 +# example 2 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001 +chr1 . exon 1050 1500 . + . ID=exon10002;Parent=mRNA10002 +chr1 . exon 1300 1500 . + . ID=exon10003;Parent=mRNA10003 +chr1 . exon 3000 3902 . + . ID=exon10004;Parent=mRNA10001 +chr1 . exon 3000 3902 . + . ID=exon10005;Parent=mRNA10003 +chr1 . exon 5000 5500 . + . ID=exon10006;Parent=mRNA10001 +chr1 . exon 5000 5500 . + . ID=exon10007;Parent=mRNA10002 +chr1 . exon 5000 5500 . + . ID=exon10008;Parent=mRNA10003 +chr1 . exon 7000 9000 . + . ID=exon10009;Parent=mRNA10001 +chr1 . exon 7000 9000 . + . ID=exon20010;Parent=mRNA10002 +chr1 . exon 7000 9000 . + . ID=exon20011;Parent=mRNA10003 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 diff --git a/packages/apollo-shared/test_data/example02.json b/packages/apollo-shared/test_data/example02.json new file mode 100644 index 00000000..26bfe71b --- /dev/null +++ b/packages/apollo-shared/test_data/example02.json @@ -0,0 +1,225 @@ +{ + "_id": "66d7151100dcdf7dda49178d", + "refSeq": "chr1", + "type": "gene", + "min": 999, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda491780": { + "_id": "66d7151100dcdf7dda491780", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda49177b": { + "_id": "66d7151100dcdf7dda49177b", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"] + } + }, + "66d7151100dcdf7dda49177c": { + "_id": "66d7151100dcdf7dda49177c", + "refSeq": "chr1", + "type": "exon", + "min": 2999, + "max": 3902, + "strand": 1, + "attributes": { + "gff_id": ["exon10003"] + } + }, + "66d7151100dcdf7dda49177d": { + "_id": "66d7151100dcdf7dda49177d", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda49177e": { + "_id": "66d7151100dcdf7dda49177e", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda49177f": { + "_id": "66d7151100dcdf7dda49177f", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10001"], + "gff_name": ["edenprotein.1"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10001"], + "gff_name": ["EDEN.1"] + } + }, + "66d7151100dcdf7dda491785": { + "_id": "66d7151100dcdf7dda491785", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda491781": { + "_id": "66d7151100dcdf7dda491781", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"] + } + }, + "66d7151100dcdf7dda491782": { + "_id": "66d7151100dcdf7dda491782", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda491783": { + "_id": "66d7151100dcdf7dda491783", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda491784": { + "_id": "66d7151100dcdf7dda491784", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10002"], + "gff_name": ["edenprotein.2"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10002"], + "gff_name": ["EDEN.2"] + } + }, + "66d7151100dcdf7dda49178c": { + "_id": "66d7151100dcdf7dda49178c", + "refSeq": "chr1", + "type": "mRNA", + "min": 1299, + "max": 9000, + "strand": 1, + "children": { + "66d7151100dcdf7dda491786": { + "_id": "66d7151100dcdf7dda491786", + "refSeq": "chr1", + "type": "exon", + "min": 1299, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10002"] + } + }, + "66d7151100dcdf7dda491787": { + "_id": "66d7151100dcdf7dda491787", + "refSeq": "chr1", + "type": "exon", + "min": 2999, + "max": 3902, + "strand": 1, + "attributes": { + "gff_id": ["exon10003"] + } + }, + "66d7151100dcdf7dda491788": { + "_id": "66d7151100dcdf7dda491788", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"] + } + }, + "66d7151100dcdf7dda491789": { + "_id": "66d7151100dcdf7dda491789", + "refSeq": "chr1", + "type": "exon", + "min": 6999, + "max": 9000, + "strand": 1, + "attributes": { + "gff_id": ["exon10005"] + } + }, + "66d7151100dcdf7dda49178a": { + "_id": "66d7151100dcdf7dda49178a", + "refSeq": "chr1", + "type": "CDS", + "min": 3300, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10003"], + "gff_name": ["edenprotein.3"] + } + }, + "66d7151100dcdf7dda49178b": { + "_id": "66d7151100dcdf7dda49178b", + "refSeq": "chr1", + "type": "CDS", + "min": 3390, + "max": 7600, + "strand": 1, + "attributes": { + "gff_id": ["cds10004"], + "gff_name": ["edenprotein.4"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10003"], + "gff_name": ["EDEN.3"] + } + } + }, + "attributes": { + "gff_id": ["gene10001"], + "gff_name": ["EDEN"] + } +} diff --git a/packages/apollo-shared/test_data/example03.gff3 b/packages/apollo-shared/test_data/example03.gff3 new file mode 100644 index 00000000..9705469a --- /dev/null +++ b/packages/apollo-shared/test_data/example03.gff3 @@ -0,0 +1,35 @@ +##gff-version 3 +# example 3 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2;testid=t005 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3;testid=t006 +chr1 . mRNA 1300 9000 . + . ID=mRNA10004;Parent=gene10001;Name=EDEN.3;testid=t007 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001;testid=t008 +chr1 . exon 1050 1500 . + . ID=exon10002;Parent=mRNA10002;testid=t009 +chr1 . exon 1300 1500 . + . ID=exon10003;Parent=mRNA10003;testid=t010 +chr1 . exon 3000 3902 . + . ID=exon10004;Parent=mRNA10001;testid=t011 +chr1 . exon 3000 3902 . + . ID=exon10005;Parent=mRNA10003;testid=t012 +chr1 . exon 5000 5500 . + . ID=exon10006;Parent=mRNA10001;testid=t013 +chr1 . exon 5000 5500 . + . ID=exon10007;Parent=mRNA10002;testid=t014 +chr1 . exon 5000 5500 . + . ID=exon10008;Parent=mRNA10003;testid=t015 +chr1 . exon 7000 9000 . + . ID=exon10009;Parent=mRNA10001;testid=t016 +chr1 . exon 7000 9000 . + . ID=exon10010;Parent=mRNA10002;testid=t017 +chr1 . exon 7000 9000 . + . ID=exon10011;Parent=mRNA10003;testid=t018 +chr1 . exon 1300 1500 . + . ID=exon10012;Parent=mRNA10004;testid=t019 +chr1 . exon 3000 3902 . + . ID=exon10013;Parent=mRNA10004;testid=t020 +chr1 . exon 5000 5500 . + . ID=exon10014;Parent=mRNA10004;testid=t021 +chr1 . exon 7000 9000 . + . ID=exon10015;Parent=mRNA10004;testid=t022 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t023 +chr1 . CDS 3000 3902 . + 0 ID=cds10002;Parent=mRNA10001;Name=edenprotein.1;testid=t024 +chr1 . CDS 5000 5500 . + 0 ID=cds10003;Parent=mRNA10001;Name=edenprotein.1;testid=t025 +chr1 . CDS 7000 7600 . + 0 ID=cds10004;Parent=mRNA10001;Name=edenprotein.1;testid=t026 +chr1 . CDS 1201 1500 . + 0 ID=cds10005;Parent=mRNA10002;Name=edenprotein.2;testid=t027 +chr1 . CDS 5000 5500 . + 0 ID=cds10006;Parent=mRNA10002;Name=edenprotein.2;testid=t028 +chr1 . CDS 7000 7600 . + 0 ID=cds10007;Parent=mRNA10002;Name=edenprotein.2;testid=t029 +chr1 . CDS 3301 3902 . + 0 ID=cds10008;Parent=mRNA10003;Name=edenprotein.3;testid=t030 +chr1 . CDS 5000 5500 . + 1 ID=cds10009;Parent=mRNA10003;Name=edenprotein.3;testid=t031 +chr1 . CDS 7000 7600 . + 1 ID=cds10010;Parent=mRNA10003;Name=edenprotein.3;testid=t032 +chr1 . CDS 3391 3902 . + 0 ID=cds10011;Parent=mRNA10004;Name=edenprotein.4;testid=t033 +chr1 . CDS 5000 5500 . + 1 ID=cds10012;Parent=mRNA10004;Name=edenprotein.4;testid=t034 +chr1 . CDS 7000 7600 . + 1 ID=cds10013;Parent=mRNA10004;Name=edenprotein.4;testid=t035 diff --git a/packages/apollo-shared/test_data/example04.gff3 b/packages/apollo-shared/test_data/example04.gff3 new file mode 100644 index 00000000..ca6982e5 --- /dev/null +++ b/packages/apollo-shared/test_data/example04.gff3 @@ -0,0 +1,30 @@ +##gff-version 3 +# example 4 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2;testid=t005 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3;testid=t006 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001,mRNA10002;testid=t007 +chr1 . exon 1300 1500 . + . ID=exon10002;Parent=mRNA10003;testid=t008 +chr1 . exon 3000 3902 . + . ID=exon10003;Parent=mRNA10001,mRNA10003;testid=t009 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t010 +chr1 . exon 7000 9000 . + . ID=exon10005;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t011 +chr1 . five_prime_UTR 1050 1200 . + . ID=five_prime_UTR10001;Parent=mRNA10001,mRNA10002;testid=t012 +chr1 . five_prime_UTR 1300 1500 . + . ID=five_prime_UTR10002;Parent=mRNA10003;testid=t013 +chr1 . five_prime_UTR 3000 3300 . + . ID=five_prime_UTR10003;Parent=mRNA10003;testid=t014 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t015 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t016 +chr1 . three_prime_UTR 7601 9000 . + . ID=three_prime_UTR10001;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t017 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t018 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t019 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t020 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t021 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t022 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t023 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t024 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t025 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t026 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t027 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t028 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t029 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t030 diff --git a/packages/apollo-shared/test_data/example05.gff3 b/packages/apollo-shared/test_data/example05.gff3 new file mode 100644 index 00000000..70031fe0 --- /dev/null +++ b/packages/apollo-shared/test_data/example05.gff3 @@ -0,0 +1,30 @@ +##gff-version 3 +# example 5 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2;testid=t005 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3;testid=t006 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001,mRNA10002;testid=t007 +chr1 . exon 1300 1500 . + . ID=exon10002;Parent=mRNA10003;testid=t008 +chr1 . exon 3000 3902 . + . ID=exon10003;Parent=mRNA10001,mRNA10003;testid=t009 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t010 +chr1 . exon 7000 9000 . + . ID=exon10005;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t011 +chr1 . five_prime_UTR 1050 1200 . + . ID=five_prime_UTR10001;Parent=mRNA10001,mRNA10002;testid=t012 +chr1 . five_prime_UTR 1300 1500 . + . ID=five_prime_UTR10002;Parent=mRNA10003;testid=t013 +chr1 . five_prime_UTR 3000 3300 . + . ID=five_prime_UTR10003;Parent=mRNA10003;testid=t014 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t015 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t016 +chr1 . three_prime_UTR 7601 9000 . + . ID=three_prime_UTR10001;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t017 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t018 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t019 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t020 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t021 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t022 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t023 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t024 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t025 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t026 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t027 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t028 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t029 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t030 diff --git a/packages/apollo-shared/test_data/example06.gff3 b/packages/apollo-shared/test_data/example06.gff3 new file mode 100644 index 00000000..a762a093 --- /dev/null +++ b/packages/apollo-shared/test_data/example06.gff3 @@ -0,0 +1,30 @@ +##gff-version 3 +# example 6 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2;testid=t005 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3;testid=t006 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001,mRNA10002;testid=t007 +chr1 . exon 1300 1500 . + . ID=exon10002;Parent=mRNA10003;testid=t008 +chr1 . exon 3000 3902 . + . ID=exon10003;Parent=mRNA10001,mRNA10003;testid=t009 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t010 +chr1 . exon 7000 9000 . + . ID=exon10005;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t011 +chr1 . five_prime_UTR 1050 1200 . + . ID=five_prime_UTR10001;Parent=mRNA10001,mRNA10002;testid=t012 +chr1 . five_prime_UTR 1300 1500 . + . ID=five_prime_UTR10002;Parent=mRNA10003;testid=t013 +chr1 . five_prime_UTR 3000 3300 . + . ID=five_prime_UTR10003;Parent=mRNA10003;testid=t014 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t015 +chr1 . five_prime_UTR 3000 3390 . + . ID=five_prime_UTR10004;Parent=mRNA10003;testid=t016 +chr1 . three_prime_UTR 7601 9000 . + . ID=three_prime_UTR10001;Parent=mRNA10001,mRNA10002,mRNA10003;testid=t017 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t018 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t019 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t020 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t021 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t022 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t023 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t024 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t025 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t026 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t027 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t028 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t029 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t030 diff --git a/packages/apollo-shared/test_data/example07.gff3 b/packages/apollo-shared/test_data/example07.gff3 new file mode 100644 index 00000000..c1bb5fca --- /dev/null +++ b/packages/apollo-shared/test_data/example07.gff3 @@ -0,0 +1,30 @@ +##gff-version 3 +# example 2 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2;testid=t005 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3;testid=t006 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001;testid=t007 +chr1 . exon 1050 1500 . + . ID=exon10002;Parent=mRNA10002;testid=t008 +chr1 . exon 1300 1500 . + . ID=exon10003;Parent=mRNA10003;testid=t009 +chr1 . exon 3000 3902 . + . ID=exon10004;Parent=mRNA10001;testid=t010 +chr1 . exon 3000 3902 . + . ID=exon10005;Parent=mRNA10003;testid=t011 +chr1 . exon 5000 5500 . + . ID=exon10006;Parent=mRNA10001;testid=t012 +chr1 . exon 5000 5500 . + . ID=exon10007;Parent=mRNA10002;testid=t013 +chr1 . exon 5000 5500 . + . ID=exon10008;Parent=mRNA10003;testid=t014 +chr1 . exon 7000 9000 . + . ID=exon10009;Parent=mRNA10001;testid=t015 +chr1 . exon 7000 9000 . + . ID=exon20010;Parent=mRNA10002;testid=t016 +chr1 . exon 7000 9000 . + . ID=exon20011;Parent=mRNA10003;testid=t017 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t018 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t019 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t020 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t021 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t022 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t023 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2;testid=t024 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t025 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t026 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3;testid=t027 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t028 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t029 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4;testid=t030 diff --git a/packages/apollo-shared/test_data/gene_mrna.gff3 b/packages/apollo-shared/test_data/gene_mrna.gff3 new file mode 100644 index 00000000..55efcbad --- /dev/null +++ b/packages/apollo-shared/test_data/gene_mrna.gff3 @@ -0,0 +1,4 @@ +##gff-version 3 +##sequence-region ctgA 1000 2000 +ctgA example gene 1000 2000 . . . ID=gene01;Name=geneA;Alias=hga +ctgA example mRNA 1000 2000 . . . Parent=gene01;Name=mrnaA;Alias=hga diff --git a/packages/apollo-shared/test_data/gene_representations.gff3 b/packages/apollo-shared/test_data/gene_representations.gff3 new file mode 100644 index 00000000..6f7c0596 --- /dev/null +++ b/packages/apollo-shared/test_data/gene_representations.gff3 @@ -0,0 +1,1844 @@ +##gff-version 3 +# example 1 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN +chr1 . TF_binding_site 1000 1012 . + . ID=tfbs10001;Parent=gene10001 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1 +chr1 . mRNA 1050 9000 . + . ID=mRNA10002;Parent=gene10001;Name=EDEN.2 +chr1 . mRNA 1300 9000 . + . ID=mRNA10003;Parent=gene10001;Name=EDEN.3 +chr1 . exon 1300 1500 . + . ID=exon10001;Parent=mRNA10003 +chr1 . exon 1050 1500 . + . ID=exon10002;Parent=mRNA10001,mRNA10002 +chr1 . exon 3000 3902 . + . ID=exon10003;Parent=mRNA10001,mRNA10003 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001,mRNA10002,mRNA10003 +chr1 . exon 7000 9000 . + . ID=exon10005;Parent=mRNA10001,mRNA10002,mRNA10003 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 3000 3902 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 5000 5500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 7000 7600 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1 +chr1 . CDS 1201 1500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 5000 5500 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 7000 7600 . + 0 ID=cds10002;Parent=mRNA10002;Name=edenprotein.2 +chr1 . CDS 3301 3902 . + 0 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 5000 5500 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 7000 7600 . + 1 ID=cds10003;Parent=mRNA10003;Name=edenprotein.3 +chr1 . CDS 3391 3902 . + 0 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 5000 5500 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +chr1 . CDS 7000 7600 . + 1 ID=cds10004;Parent=mRNA10003;Name=edenprotein.4 +# example 2 +chr1 . gene 11000 19000 . + . ID=gene20001;Name=EDEN +chr1 . mRNA 11050 19000 . + . ID=mRNA20001;Parent=gene20001;Name=EDEN.1 +chr1 . mRNA 11050 19000 . + . ID=mRNA20002;Parent=gene20001;Name=EDEN.2 +chr1 . mRNA 11300 19000 . + . ID=mRNA20003;Parent=gene20001;Name=EDEN.3 +chr1 . exon 11050 11500 . + . ID=exon20001;Parent=mRNA20001 +chr1 . exon 11050 11500 . + . ID=exon20002;Parent=mRNA20002 +chr1 . exon 11300 11500 . + . ID=exon20003;Parent=mRNA20003 +chr1 . exon 13000 13902 . + . ID=exon20004;Parent=mRNA20001 +chr1 . exon 13000 13902 . + . ID=exon20005;Parent=mRNA20003 +chr1 . exon 15000 15500 . + . ID=exon20006;Parent=mRNA20001 +chr1 . exon 15000 15500 . + . ID=exon20007;Parent=mRNA20002 +chr1 . exon 15000 15500 . + . ID=exon20008;Parent=mRNA20003 +chr1 . exon 17000 19000 . + . ID=exon20009;Parent=mRNA20001 +chr1 . exon 17000 19000 . + . ID=exon20010;Parent=mRNA20002 +chr1 . exon 17000 19000 . + . ID=exon20011;Parent=mRNA20003 +chr1 . CDS 11201 11500 . + 0 ID=cds20001;Parent=mRNA20001;Name=edenprotein.1 +chr1 . CDS 13000 13902 . + 0 ID=cds20001;Parent=mRNA20001;Name=edenprotein.1 +chr1 . CDS 15000 15500 . + 0 ID=cds20001;Parent=mRNA20001;Name=edenprotein.1 +chr1 . CDS 17000 17600 . + 0 ID=cds20001;Parent=mRNA20001;Name=edenprotein.1 +chr1 . CDS 11201 11500 . + 0 ID=cds20002;Parent=mRNA20002;Name=edenprotein.2 +chr1 . CDS 15000 15500 . + 0 ID=cds20002;Parent=mRNA20002;Name=edenprotein.2 +chr1 . CDS 17000 17600 . + 0 ID=cds20002;Parent=mRNA20002;Name=edenprotein.2 +chr1 . CDS 13301 13902 . + 0 ID=cds20003;Parent=mRNA20003;Name=edenprotein.3 +chr1 . CDS 15000 15500 . + 1 ID=cds20003;Parent=mRNA20003;Name=edenprotein.3 +chr1 . CDS 17000 17600 . + 1 ID=cds20003;Parent=mRNA20003;Name=edenprotein.3 +chr1 . CDS 13391 13902 . + 0 ID=cds20004;Parent=mRNA20003;Name=edenprotein.4 +chr1 . CDS 15000 15500 . + 1 ID=cds20004;Parent=mRNA20003;Name=edenprotein.4 +chr1 . CDS 17000 17600 . + 1 ID=cds20004;Parent=mRNA20003;Name=edenprotein.4 +# example 3 +chr1 . gene 21000 29000 . + . ID=gene30001;Name=EDEN +chr1 . mRNA 21050 29000 . + . ID=mRNA30001;Parent=gene30001;Name=EDEN.1 +chr1 . mRNA 21050 29000 . + . ID=mRNA30002;Parent=gene30001;Name=EDEN.2 +chr1 . mRNA 21300 29000 . + . ID=mRNA30003;Parent=gene30001;Name=EDEN.3 +chr1 . mRNA 21300 29000 . + . ID=mRNA30004;Parent=gene30001;Name=EDEN.3 +chr1 . exon 21050 21500 . + . ID=exon30001;Parent=mRNA30001 +chr1 . exon 21050 21500 . + . ID=exon30002;Parent=mRNA30002 +chr1 . exon 21300 21500 . + . ID=exon30003;Parent=mRNA30003 +chr1 . exon 23000 23902 . + . ID=exon30004;Parent=mRNA30001 +chr1 . exon 23000 23902 . + . ID=exon30005;Parent=mRNA30003 +chr1 . exon 25000 25500 . + . ID=exon30006;Parent=mRNA30001 +chr1 . exon 25000 25500 . + . ID=exon30007;Parent=mRNA30002 +chr1 . exon 25000 25500 . + . ID=exon30008;Parent=mRNA30003 +chr1 . exon 27000 29000 . + . ID=exon30009;Parent=mRNA30001 +chr1 . exon 27000 29000 . + . ID=exon30010;Parent=mRNA30002 +chr1 . exon 27000 29000 . + . ID=exon30011;Parent=mRNA30003 +chr1 . exon 21300 21500 . + . ID=exon30012;Parent=mRNA30004 +chr1 . exon 23000 23902 . + . ID=exon30013;Parent=mRNA30004 +chr1 . exon 25000 25500 . + . ID=exon30014;Parent=mRNA30004 +chr1 . exon 27000 29000 . + . ID=exon30015;Parent=mRNA30004 +chr1 . CDS 21201 21500 . + 0 ID=cds30001;Parent=mRNA30001;Name=edenprotein.1 +chr1 . CDS 23000 23902 . + 0 ID=cds30002;Parent=mRNA30001;Name=edenprotein.1 +chr1 . CDS 25000 25500 . + 0 ID=cds30003;Parent=mRNA30001;Name=edenprotein.1 +chr1 . CDS 27000 27600 . + 0 ID=cds30004;Parent=mRNA30001;Name=edenprotein.1 +chr1 . CDS 21201 21500 . + 0 ID=cds30005;Parent=mRNA30002;Name=edenprotein.2 +chr1 . CDS 25000 25500 . + 0 ID=cds30006;Parent=mRNA30002;Name=edenprotein.2 +chr1 . CDS 27000 27600 . + 0 ID=cds30007;Parent=mRNA30002;Name=edenprotein.2 +chr1 . CDS 23301 23902 . + 0 ID=cds30008;Parent=mRNA30003;Name=edenprotein.3 +chr1 . CDS 25000 25500 . + 1 ID=cds30009;Parent=mRNA30003;Name=edenprotein.3 +chr1 . CDS 27000 27600 . + 1 ID=cds30010;Parent=mRNA30003;Name=edenprotein.3 +chr1 . CDS 23391 23902 . + 0 ID=cds30011;Parent=mRNA30004;Name=edenprotein.4 +chr1 . CDS 25000 25500 . + 1 ID=cds30012;Parent=mRNA30004;Name=edenprotein.4 +chr1 . CDS 27000 27600 . + 1 ID=cds30013;Parent=mRNA30004;Name=edenprotein.4 +# example 4 +chr1 . gene 31000 39000 . + . ID=gene40001;Name=EDEN +chr1 . mRNA 31050 39000 . + . ID=mRNA40001;Parent=gene40001;Name=EDEN.1 +chr1 . mRNA 31050 39000 . + . ID=mRNA40002;Parent=gene40001;Name=EDEN.2 +chr1 . mRNA 31300 39000 . + . ID=mRNA40003;Parent=gene40001;Name=EDEN.3 +chr1 . exon 31050 31500 . + . ID=exon40001;Parent=mRNA40001,mRNA40002 +chr1 . exon 31300 31500 . + . ID=exon40002;Parent=mRNA40003 +chr1 . exon 33000 33902 . + . ID=exon40003;Parent=mRNA40001,mRNA40003 +chr1 . exon 35000 35500 . + . ID=exon40004;Parent=mRNA40001,mRNA40002,mRNA40003 +chr1 . exon 37000 39000 . + . ID=exon40005;Parent=mRNA40001,mRNA40002,mRNA40003 +chr1 . five_prime_UTR 31050 31200 . + . ID=five_prime_UTR40001;Parent=mRNA40001,mRNA40002 +chr1 . five_prime_UTR 31300 31500 . + . ID=five_prime_UTR40002;Parent=mRNA40003 +chr1 . five_prime_UTR 33000 33300 . + . ID=five_prime_UTR40003;Parent=mRNA40003 +chr1 . five_prime_UTR 33000 33390 . + . ID=five_prime_UTR40004;Parent=mRNA40003 +chr1 . five_prime_UTR 33000 33390 . + . ID=five_prime_UTR40004;Parent=mRNA40003 +chr1 . three_prime_UTR 37601 39000 . + . ID=three_prime_UTR40001;Parent=mRNA40001,mRNA40002,mRNA40003 +chr1 . CDS 31201 31500 . + 0 ID=cds40001;Parent=mRNA40001;Name=edenprotein.1 +chr1 . CDS 33000 33902 . + 0 ID=cds40001;Parent=mRNA40001;Name=edenprotein.1 +chr1 . CDS 35000 35500 . + 0 ID=cds40001;Parent=mRNA40001;Name=edenprotein.1 +chr1 . CDS 37000 37600 . + 0 ID=cds40001;Parent=mRNA40001;Name=edenprotein.1 +chr1 . CDS 31201 31500 . + 0 ID=cds40002;Parent=mRNA40002;Name=edenprotein.2 +chr1 . CDS 35000 35500 . + 0 ID=cds40002;Parent=mRNA40002;Name=edenprotein.2 +chr1 . CDS 37000 37600 . + 0 ID=cds40002;Parent=mRNA40002;Name=edenprotein.2 +chr1 . CDS 33301 33902 . + 0 ID=cds40003;Parent=mRNA40003;Name=edenprotein.3 +chr1 . CDS 35000 35500 . + 1 ID=cds40003;Parent=mRNA40003;Name=edenprotein.3 +chr1 . CDS 37000 37600 . + 1 ID=cds40003;Parent=mRNA40003;Name=edenprotein.3 +chr1 . CDS 33391 33902 . + 0 ID=cds40004;Parent=mRNA40003;Name=edenprotein.4 +chr1 . CDS 35000 35500 . + 1 ID=cds40004;Parent=mRNA40003;Name=edenprotein.4 +chr1 . CDS 37000 37600 . + 1 ID=cds40004;Parent=mRNA40003;Name=edenprotein.4 +# example 5 +chr1 . gene 41000 49000 . + . ID=gene50001;Name=EDEN +chr1 . mRNA 41050 49000 . + . ID=mRNA50001;Parent=gene50001;Name=EDEN.1 +chr1 . mRNA 41050 49000 . + . ID=mRNA50002;Parent=gene50001;Name=EDEN.2 +chr1 . mRNA 41300 49000 . + . ID=mRNA50003;Parent=gene50001;Name=EDEN.3 +chr1 . exon 41050 41500 . + . ID=exon50001;Parent=mRNA50001,mRNA50002 +chr1 . exon 41300 41500 . + . ID=exon50002;Parent=mRNA50003 +chr1 . exon 43000 43902 . + . ID=exon50003;Parent=mRNA50001,mRNA50003 +chr1 . exon 45000 45500 . + . ID=exon50004;Parent=mRNA50001,mRNA50002,mRNA50003 +chr1 . exon 47000 49000 . + . ID=exon50005;Parent=mRNA50001,mRNA50002,mRNA50003 +chr1 . five_prime_UTR 41050 41200 . + . ID=five_prime_UTR50001;Parent=mRNA50001,mRNA50002 +chr1 . five_prime_UTR 41300 41500 . + . ID=five_prime_UTR50002;Parent=mRNA50003 +chr1 . five_prime_UTR 43000 43300 . + . ID=five_prime_UTR50003;Parent=mRNA50003 +chr1 . five_prime_UTR 43000 43390 . + . ID=five_prime_UTR50004;Parent=mRNA50003 +chr1 . five_prime_UTR 43000 43390 . + . ID=five_prime_UTR50004;Parent=mRNA50003 +chr1 . three_prime_UTR 47601 49000 . + . ID=three_prime_UTR50001;Parent=mRNA50001,mRNA50002,mRNA50003 +chr1 . CDS 41201 41500 . + 0 ID=cds50001;Parent=mRNA50001;Name=edenprotein.1 +chr1 . CDS 43000 43902 . + 0 ID=cds50001;Parent=mRNA50001;Name=edenprotein.1 +chr1 . CDS 45000 45500 . + 0 ID=cds50001;Parent=mRNA50001;Name=edenprotein.1 +chr1 . CDS 47000 47600 . + 0 ID=cds50001;Parent=mRNA50001;Name=edenprotein.1 +chr1 . CDS 41201 41500 . + 0 ID=cds50002;Parent=mRNA50002;Name=edenprotein.2 +chr1 . CDS 45000 45500 . + 0 ID=cds50002;Parent=mRNA50002;Name=edenprotein.2 +chr1 . CDS 47000 47600 . + 0 ID=cds50002;Parent=mRNA50002;Name=edenprotein.2 +chr1 . CDS 43301 43902 . + 0 ID=cds50003;Parent=mRNA50003;Name=edenprotein.3 +chr1 . CDS 45000 45500 . + 1 ID=cds50003;Parent=mRNA50003;Name=edenprotein.3 +chr1 . CDS 47000 47600 . + 1 ID=cds50003;Parent=mRNA50003;Name=edenprotein.3 +chr1 . CDS 43391 43902 . + 0 ID=cds50004;Parent=mRNA50003;Name=edenprotein.4 +chr1 . CDS 45000 45500 . + 1 ID=cds50004;Parent=mRNA50003;Name=edenprotein.4 +chr1 . CDS 47000 47600 . + 1 ID=cds50004;Parent=mRNA50003;Name=edenprotein.4 +# example 6 +chr1 . gene 51000 59000 . + . ID=gene60001;Name=EDEN +chr1 . mRNA 51050 59000 . + . ID=mRNA60001;Parent=gene60001;Name=EDEN.1 +chr1 . mRNA 51050 59000 . + . ID=mRNA60002;Parent=gene60001;Name=EDEN.2 +chr1 . mRNA 51300 59000 . + . ID=mRNA60003;Parent=gene60001;Name=EDEN.3 +chr1 . exon 51050 51500 . + . ID=exon60001;Parent=mRNA60001,mRNA60002 +chr1 . exon 51300 51500 . + . ID=exon60002;Parent=mRNA60003 +chr1 . exon 53000 53902 . + . ID=exon60003;Parent=mRNA60001,mRNA60003 +chr1 . exon 55000 55500 . + . ID=exon60004;Parent=mRNA60001,mRNA60002,mRNA60003 +chr1 . exon 57000 59000 . + . ID=exon60005;Parent=mRNA60001,mRNA60002,mRNA60003 +chr1 . five_prime_UTR 51050 51200 . + . ID=five_prime_UTR60001;Parent=mRNA60001,mRNA60002 +chr1 . five_prime_UTR 51300 51500 . + . ID=five_prime_UTR60002;Parent=mRNA60003 +chr1 . five_prime_UTR 53000 53300 . + . ID=five_prime_UTR60003;Parent=mRNA60003 +chr1 . five_prime_UTR 53000 53390 . + . ID=five_prime_UTR60004;Parent=mRNA60003 +chr1 . five_prime_UTR 53000 53390 . + . ID=five_prime_UTR60004;Parent=mRNA60003 +chr1 . three_prime_UTR 57601 59000 . + . ID=three_prime_UTR60001;Parent=mRNA60001,mRNA60002,mRNA60003 +chr1 . CDS 51201 51500 . + 0 ID=cds60001;Parent=mRNA60001;Name=edenprotein.1 +chr1 . CDS 53000 53902 . + 0 ID=cds60001;Parent=mRNA60001;Name=edenprotein.1 +chr1 . CDS 55000 55500 . + 0 ID=cds60001;Parent=mRNA60001;Name=edenprotein.1 +chr1 . CDS 57000 57600 . + 0 ID=cds60001;Parent=mRNA60001;Name=edenprotein.1 +chr1 . CDS 51201 51500 . + 0 ID=cds60002;Parent=mRNA60002;Name=edenprotein.2 +chr1 . CDS 55000 55500 . + 0 ID=cds60002;Parent=mRNA60002;Name=edenprotein.2 +chr1 . CDS 57000 57600 . + 0 ID=cds60002;Parent=mRNA60002;Name=edenprotein.2 +chr1 . CDS 53301 53902 . + 0 ID=cds60003;Parent=mRNA60003;Name=edenprotein.3 +chr1 . CDS 55000 55500 . + 1 ID=cds60003;Parent=mRNA60003;Name=edenprotein.3 +chr1 . CDS 57000 57600 . + 1 ID=cds60003;Parent=mRNA60003;Name=edenprotein.3 +chr1 . CDS 53391 53902 . + 0 ID=cds60004;Parent=mRNA60003;Name=edenprotein.4 +chr1 . CDS 55000 55500 . + 1 ID=cds60004;Parent=mRNA60003;Name=edenprotein.4 +chr1 . CDS 57000 57600 . + 1 ID=cds60004;Parent=mRNA60003;Name=edenprotein.4 +##FASTA +>chr1 +cattgttgcggagttgaacaACGGCATTAGGAACACTTCCGTCTCtcacttttatacgat +tatgattggttctttagccttggtttagattggtagtagtagcggcgctaatgctacctg +aattgagaactcgagcgggggctaggcaaattctgattcagcctgacttctcttggaacc +ctgcccataaatcaaagggttagtgcggccaaaacgttggacaacggtattagaagacca +acctgaccaccaaaccgtcaattaaccggtatcttctcggaaacggcggttctctcctag +atagcgatctgtggtctcaccatgcaatttaaacaggtgagtaaagattgctacaaatac +gagactagctgtcaccagatgctgttcatctgttggctccttggtcgctccgttgtaccc +aggctactttgaaagagcgcagaatacttagacggtatcgatcatggtagcatagcattc +tgataacatgtatggagttcgaacatccgtctggggccggacggtccgtttgaggttggt +tgatctgggtgatagtcagcaagatagacgttagataacaaattaaaggattttacctta +gattgcgactagtacaacggtacatcggtgattcgcgctctactagatcacgctatgggt +accataaacaaacggtggaccttctcaagctggttgacgcctcagcaacataggcttcct +cctccacgcatctcagcataaaaggcttataaactgcttctttgtgccagagcaactcaa +ttaagcccttggtaccgtgggcacgcattctgtcacggtgaccaactgttcatcctgaat +cgccgaatgggactatttggtacaggaatcaagcggatggcactactgcagcttatttac +gacggtattcttaaagtttttaagacaatgtatttcatgggtagttcggtttgttttatt +gctacacaggctcttgtagacgacctacttagcactacggccgagcgcaataacccccgg +aaagcacttgctactgggaggcgggtttatccatcggcaataggggttatcagtactacc +aagaagattgtgaagatattaacagcattgaaaaaagttcggactgggcatgaaacgtgt +gtcagagttagagtccttgagggactgaatgggtttgtcccaggcccaagcttgaggtgg +atgtcacctcgggtactgcctctattacagaggtatcttaatggcgcatccagccttgtg +gctgggtctacgtacgcgtgggcaccatacgtatgttggcaggaaaggtcaatcatgctt +gtttcctcgtcgcagaaacgttcacactattggctcgcgggatcgaacgggcctgattat +ttttccagctcctgcgttcctatcacgccaactgtcgctaataaaatgttatatagagat +aacccattgctatgcaaggatggagaaaccgcttcacaacaccctagaattacttcagca +ctaacatctaagataccgggaaaaccgtaggtgccacttggttttgagggcaatgcctct +tgcactggcgattcgtggagtaaccttgctaccgatttccaccttttctaggtatgatta +catgcgatcgccattgtcagtcgtcgtacgaaatccaggaaggaattcgaatacatgacc +gaaagctatggcatcataagcgtggctctttactaaggacacgtgtagtcggctgatttc +gcgcagaacttcgctcaccggacagtgactgctgtccgaacttgggggcagcgtagattc +tagctagagaccgcagcgaaaatgccactcgctaggtggctatggacgtccagctatagg +cccccacattcgtatgtatactccggtaattgagtctacctttcgaaagatcaaagttca +caaaccttctctcacgttaacatagatgctcgcacatagctagtccggtgataaagcggc +cgtgcatgcgagtatttagcgcacggaacagatattaggctgcgaaataccctcatatgc +tacagcgcaggtaacagacggttgatctccccgtagaattccctcaaggccggatcgttc +tcatgagtagcctttgtctgacatttcctctcaatagattgcagactcctgtgtcgtggg +aaaacttcgcggaatcgctgtcgttacataaatctaaacagtgcagtccaagctatttac +taccacgtatcataatgaacatctctttgtgaaatacgccggtacgccgagagatcgccc +acattgcgtgtcaccaagacccagtgtctattgggcgcgctggttatagtatgcggaggc +acccgatgtgctgctaatcactacaaactcgacaccaagaggcgaccgcgtgcgggaggg +ctagaacgcgagagccacgtcaacgtggtggtaccgctcctgatgatacgagcactgtgc +tggcaccgctgccctatgtccagctaacaggtgtcacataatatcgcatctatagttgag +tatcttatcgctagcgttacttgtgagttctcgggtagaatcgtcgtagcattctagtcc +ttagcgtaagcaacgatatcgccgatattataggggcaataggtctcacccaccacgggt +gtatatttaacgccctaagtagttaacggagactattaaacaattatgcacgtgaaagat +tagggtactgcacacgtgtcacgttgacgatgtaaacaccataaaggttgttctgtgatg +cgatgcccatacctgcggtgcaacgtcctaaacttatgcggatcaccttctaattcagcc +gacgttgagaacgccagctatactctgtgagtacaaggtgaaagccccagatcaaaatat +tggagtcttgtccgtagctcttgggtggagagtgtgaccacgtttatcccttaatactga +gactcttctcgttccacgccccggacattcgcgatacagcctagtttgataggtggctac +aagggctctatccgaatagcacaaaactcagtcctagtgcgtataggtcgtgctctgcgg +ttatacgctccacagaagaaagtacccactgcagtttgtcggtgggacttagcaaaacct +gtaaccaaaaccgcacatggactctgttttggtggcgtggagtgtgcccgccgcctttat +gctgggtcaaaatactatatgatttgttgtggtcgggcgcgacattggctcttatggttt +ataactattattcggtgcacagaaccgacttatgccccgattttgcacctcccgagagaa +atggtactagtcattgtctcggggttttacaactcaaggataatctgccagcggtacccc +gaaaaatcccatcccgaacggctggtacctatgctggagaccgaaatggagccagtgcta +tgcaaaccctcgctctttctatttggcccgaccagctgcgagagtcattcgacatacatt +gcgatggctggttcatctctctgcttcggattccgatcctgctgcctatggccacaacac +gaaagagatcttggatacgtcctcaccatagtccaacggacaaatatggaggtgtacgcg +cacggatacgagtacgacgggccgcccaatgctggtccttcgtgttatactgtttacttg +cctccggtaagagtgtacagcttgtacccacgcggtggaggaccttacgcgtcgtccgca +ggtgtggagatttcgctacctgttgcattggggcctcgccttacgtttttttcgacggag +gcccgacccgccaggccagaccctcatcattgggatttttactgccttggacggcagatt +ctgatgctggtaacgcgcttggcacacaccctggtcgtaattacgtactatcacctctat +tttaccaggggcgggccccgcctcaacgatcggtagtctcgttagaacagttgcttatac +tccgttagcactcacaactcggagaatgagcttacacagtccgtaatagtctccacagct +tcccctggaaggttcgtacaggggccctggggtctaatgtgctaccgcctaacttcgtta +gtgtaaggtctcgtgtgcacctccaataacgctgcatttttgtatagaactcctttatag +gcctgactcttcggaacagcccactaattgacgtgcacgatgctgcatatacccttctca +atgacgcataccggtgactaaatcctgtggctggttgacactttgcataacccaccacga +aaacgcggtttgcacgtggttggaagcgagtaccggttaagggaagttacgtaaacccaa +catagtgagcgatgcttaaaacactgcatgcgaacaacgaccggaacgagagcctaatag +aaccaaatggataggtggttacgaaatccgcgcacaagtgtcgtgccactctcgtaaaga +atgattgcttgcttatctatgagaaacctaataggcacgcacgtgtcgccagggaaaaac +caccatccgacaagacgctgaaaatcgagatagatgcagcccgcgcgtactttaagcacg +atagccatcttgagcgcgacgattcagcttacggagattacttctcaaagcggacacctc +gacgctgaagctctctatcgatgcacttgcatgtccatctacggcttgagcgaaccatgc +ttaacgcttggatgacgttgttagtcggattcgatcgtaccatactgtcctatccatcat +aacttcccgaattaaaactcattttctaccctcatttgtttcattggcgcatatgagcgc +cccatgggcgctgatcgacacaggcttgtagcgcacggctcgtcttgcagtagataacca +tagtctttacgtcgcatatattaatatatcctcagacttccactgcggtattttggatcg +tggcgtctgggacagtcacactctttaacgggagcgcgttcaatgtctgagtccatccgt +gcagttcggtgcgattttattcttccctgcatcttccggattccttcttcttgtcggaga +attcgccgctcgatcaaactcatcattggtacttattgaccgtttcatgctattacaccg +gtacactgatgataacgctgcggttttatcccccccaatacgcgcacacacgcttctttc +ggtgcgtcctgtcgtacccctattgcgcatcatggcactccagccgagcaatgctttgga +caggtgtaaccaagctggatctagcgtgggttcgacacagctcggttcgtataaccacac +gcatgaactgcgagtgcctcgccccagcgccgctgtctacttgctgtttagaggaagaag +caacagcttgcacccaatccgcatatctgcatataggtggccgttcctccgtggcgcgcc +gctacgttgtagcgcacggatcaaaagcgctgtgttactatacactggttcggagacggt +tcatgacgagcgcgctatatgtcggcatctgcgccccatgagcggccgctgtccggcggc +acgaataatatagtgcaagaaaaaccgaagactacggttatatatgatggaacggccctc +acagcattctaacaggtttgacaaacttaataaatgatgggccgcgcctgctgtgaatcc +cggacggtttggccggaaatacctaggcagtctttggaaaagcttttcctagatcaccat +atcgttgtcagtggccaaggtttcgttaactctcggcgtacccagtatcggcgcaatagg +cctttgatcaacccttggaagattagtcgatcgtaacttcctacatcccggtgaaaggct +ttaattctaagtcttcgccacaaacgcttcaggagcgtcgagttctatcactttcgaggt +actgccacttactatacaccggtacacttgttaagcaagtgtttgcggatgtggttaaat +tttgatggcagatttctgggtgttttagctatagctgtatcctcgaggtcgtcgtttaac +cgctcctgttgctagatcatatgtatcgttgttcgagacgctagtagtcgctcctaccga +atcttacaggttcgatctctgctcggcttttgccgcgggccggtgcttgtgctataatta +taatgataagggcagtggccgcacaactgcagattactgacacttgagtgagaactaagc +cttgaagcatagtgttgaatgttgtagaaaagtatactgtgacaaaaacagggcctggtg +tcaagtgtcctcagtgatctggatatcatcacgccttgttagcaggatttacccgcatag +taatggccggactttatattgccctgctgcgctagctagtactgcgggggctctcttccc +cctattgatattccgggcagaatgcgcgggtagtcagcattcatgtcaggcttctatcaa +cgtctcattcacccttggagtgtgacctacgtgttagaggcaatgtagcccgagagcccg +ttcaaagacaaactcccgaattaaacagacaccggttatgggagtgtgagtagtgacttc +cgaccagtgtttggtttcagcctgtcggttaacctcgcagggctaggagaatgagctgct +agtaggtgattaccgaagtctccccagaaagggaacagtcttatagagtagagaatgtca +aatagcgttattgagttctgtctactgcactaccaagagcatgcccaccagagatgcgtc +gcagtcgtagcgtagacgtcgtaatgacccaggtggcgttcggcctattcgcgtcggacg +cgcgcgctactacaacgaagggttctgaaagtgcatgttcacactgaaattctaagtgtt +agtaaacaaacgcgtgtattccagggtcgtgtgtgacattatggctgtctgcgcccctca +atgatcatcaagacgttcaattgtatgttaacgtagatatcaggtttagttatccgtata +ctttttacgccgcgcgcttggaacagattctcctaacagccctcgcggtttcaaaaagaa +ccaaagtctataccatccttgttcccaattctgcctggttgcggagaaaagaccgcctcc +atacgtacccgactcggtattggtaagtggggaagcagtcgaacgcatatttcttggtta +tatcacaggccacgttctatatcggaagtggccggattacgatttgacgttctatccccg +agagcgcattcttgtttgttactactaccacgcgggcgcttcttattcccagaccagagg +gaatgtgcggaagctttttccacagattggcggaactccagcgtgcttagtgcaggcgga +gaacgtccgttcagtggtgcgtgctttatttttcaatctgacccgacctgcgctcaaggg +ttgcaagttgttgtgcgcccgagtaataggcgactcgtcgcaatgggtctggtacattgc +attttcatcggtacggcgcttcataaagtgcggcaaatttctcaccccagtactcatgtt +tatagggtatcaggacccgaagcttctctgttccaaagaaatgtactgtttggctcccct +gtccatattggaggtagatcacttgtggattatgcaatgaatgaatgaaagtttggtgct +ccccaccggggcgctctcaaagagagtgagctaaatttgaacatttaaattgctattcca +acccggagtcctgaccggaacagtaatgaaacttcaaccatgccggacagactagaagaa +gggaaagttgcttgtatatgggagtaaaaatgatgttggtgccgtaatggtgccggaagt +gactatagagcatgtcgtgacgcaccggtaggcagtgctataatcgtatgtccttcaggc +gccgccggacctacgaagctgaaattagacaccggcacactagccccgtcagcgacggtg +cgcggccgctgccctgcagcgaatggggctaacacgcataaaacgcccgcataaccactc +gagctacgggaattcactcaggctgttgcttcgacgtgtagtctcattacataatcataa +tacctccaagaccaacggctgctcatgactctcttaccttgttagggacatttcggcact +agggaagagctgaggactttgaaaacgtcgataaaaccatcgcgggaactagctgcgtta +gaactccatattttacgggtcgcaagcttgaggtcctgtcccggcagctgcaagtgctac +ggcaggaggggatctacctaacgtgcagtaacgagcccctgcccgtaatgaggcgtactc +gtctctaatcgtcagtaagttactatgtccgaggacgcctctacgagttgaactctggct +aggcccacctgtccgcgccctgctcgggtaccccatctgcttatccaacttcacctcgcc +ttacggaatctctggttgccagtcatccgatggtcattaagcagcgtggtacatcgtagc +caatacttcagggcgccagccatattcccagccaagcggctgcataattacagcgcctgg +cacgactaatcgatcccacaagcctggtagatgacccttagccctaaagcgccctctgac +ctatctgcacgtgatacttgattatttgtaatgagcggacagggtagatgactaatatac +agggtcgtctaggtttgcacaatgcagacatcatccgcgcaaggcccggacggctgtact +cacacagctagctccatctccctcagcagcactaagattcccacgtgaccagggcgacgg +gcctcagccaaacgtatccttgatatctacttaagtcaaggttgactccgaaccctatgg +gtcggtgccgttaacagggagtctatatctcggcgttccattgcttgtttcaaactcctg +ctataaggtgaaagcgctggagggcatagtttatgcccaaagttgcgcgtagatccgtcg +ggatatgtgctataataaggactgctcgaggtaggcggtaacggctcccgccttcagtag +gcgcggaactcgaatcggagttacaggacttgaccgagtcatatccaagtttatgttacc +cgatcggatccggatgctcgtatctgcgacgaggtcggaagacggacgaaatacgattca +accgcgcgaaccattagcatctaacctttagcctcaatgggtgttaacgtggtgggctca +ctcggcgtactctttgtgcaactattccgtatgaacaacagtcaagttgcgacatgatgc +tcttacgtgattcccacagtttcccacctcaggatgctttctttagctaaacccaatagt +tatggcggcaccttcagactcccacgaggacggctatgacgttgctaaaccattcgccgc +caaaggctagcgctaacgagttctgtgagtttgttccgggccagatctccaggatggtcg +caacaacgcagtaccggttttatactggtgaccctctacctgttattaagttacagcgtt +gtcctacgtacatggtcgtgagtactcgcgtagtcaaacgccaggactagcagcgagaat +tattgtcgcgatacttactacaatacttacccgatattgacgtgcagggttgaaagagat +ggacagttgaatatctattttgacggaatcctcaaaactccctccacctcaggtaacggc +cctgtccgggaccgcattcttgcatatattggttcccagagcgtatctaagttagtctct +tgaccgttcaccgactctagggcgactcgttatcgccctccgaaacgatgctttcgttac +ctcaatgatgacaggctgtaacgtaagtgatcccaatctcactcgtgccttgtccaccgt +tccgtgaagacgaagcaatacgcggaatacgtggcttcgtaatattttgacgatatgggg +ctgggacgctcaagacttccatgacaaacaaagtgaagagcaactgcatccctcatcatg +atcactattaccagagtagcgatggataacgctaatttggtcagggcagctatcgcatcc +cgcaggtgtaggcggagactttttcttttgttgcgagttgacaggtaatctcacggtata +agcacggttatttacgcaagcgacgtccctgggagaatccgcccacgtaggaccccataa +tccataaatactgcggtcgaaaccttcatatcgtgacagaaccgctttctagggatgcgg +tccccgcattcagagttctactttggccagcgtgagacttaacaactccacttacgcggt +acattgaagtcgttcagtccagtgtgacctgtgtaccgaataacgtgtagaccagcgcgt +ctacgacttagcgcggctccactccaaagcaccttttgggactttccaacgagcctgttg +gccgttaagcggtatttcacaaatagatcaccctagtgtcggtaaccgactaccctattg +ggatcatcgtgagctcgaaacactagaggcggaccaacggatgacatttgattcggctct +acagagcttgtcgccagagaaaaactgtggcaatctacgctcgcggggaattgactttag +cggcccctagacaggtgtgggacactagtctagattcacgtcctacacgacataacagca +ccttcctggccagcccagaaatagtacctggacgacatccagccttccgacgccataatg +tgagccgtagcgcccacgacgatcaacgaggagaaatttacaaaggctgtgtgaatgcta +cgtcgtctaccattgctcatcgaaacgaacgcaacgcacagcatacaacgtttaccatgc +cggagcgggatcctcaagtacagaaaacagaggtctaaacatgatccgaacaaatcggta +ggtttacacagctacctcgtccattggcgtactgcatcgatcgtgcttactacggtcatg +ccggcccgcgatgcacgtacgaaggaataccctgtctgcccccgcgcgagttacgctgtc +tcgcacataccgagcactgtcgttcgaagctaaactatgagcccagccgagctccttatg +gccgcaacgctggtgcggccagctgataaattccacagtacacgatcctcgtgtaagatc +tcgggcatagtaagtcatttcacatggttaggagagatagaatacatggttctggtagct +caaccaggatttgtggaacccttggcccttggtgagtgctacaataaaattctccgtatg +ggacaaccaaagggtgctggatgtgacttcccggcccaggttagatgtccatatcattca +tacattgcccgaccgacccaatgcctaaatcagaggcgccttagctagttcttgtagtgt +gccacgtccggccacgcagacacgaccctcggcgagtgatcaccattaccggattggcat +cgaagtctttttctgggaagttagccagtttggtgtgcggtgcttagaatcttattccca +gtcaaacgcccctgggacgaattgctaaccctagttgccacgccggaaccatcttcggga +gagtagacaaatccgagttagatatgttagcgtcttcgtgagtctgaaatgtatcacttc +accgcagaatacgcgaatgtctgtttgccctggactgacggaattggcttaaaagccgac +tagagcattttggtacggttcctatccgcgatgtaattacctatctaggttatcgctaga +cgaatagcgagtacagtgtagcaggccctttgttagcaagttgctctaaacagttgtcaa +aacgtaggcacaatagtgcgattcttctaaatccgggaagctcatggcgctgggcagaaa +tatcacatacgggaataatcaacctccattttggttcgttttactcgatgagtgcccctt +gcttgagacgagcgttctgagttgatggcatgtcgaaaggtttacgcggtgagtagagca +ctttacccctacagatcggaatcctcgaggaggacagttggaacttcacattaacctttg +ttcgattgcatgaaggttgtgttctgggagtaggctcccaaggtagcggttcatgctggg +ggcagccctaagtttgtattatgtgagtttgcgtctgaaactacatttagcatgaggaac +gtaagctttctggagggatcttctaaagccaggtatcgcccgctacgatgccggagccgg +tggttcacagctacctgtgctcaaaggcttaaggctaatcatagcaacagtgcgaaagga +cgtctttcagatttcgaaaggtgctgacacaacaagggtcagggcggtcctacccttctg +attccctacctggttttttagcaagggtcaaggctaggcttatactcccgaacgctttaa +acactatcccacccctgacggggggaagttgcgcgttaagtataagaataagatttaaca +gtacactttaggttcctcttccgcgagccgtcatacagcaccgagcgccgttgaaacgcg +attaacgcgtattgtcgtgcgaaaaaaaaacgctcgccagcatattggagtgtcgacttg +aaatattgaacaacaccgcatatcaaggacgaatagtagggcttcactacctccacctga +cggccctaggacttatactcgaaaaagaccttccatcacgatgtcccttaccggcgagag +ggctatatacgcatgaatagcagatcttgccgtcgctgagtgtcacccagggttgctcca +gaaaggagatagggcggagagccatcgacagcagctctcgtctaggtggtagcagctaag +gagtcgtgtcgtcgcgccgagttggaacattatcgatgtacatcaatgcagtaatgatgc +tgatagactcgggagtttcctcaaacccagagttacgagaagacgcaggtctatcagtta +gaaggagtcagtattggcctttgaaagatcttatgctcatgcccaatcgtagttaaacgc +gaatcgggaaggccaatctggcggttttgacccccggactcttaagacgtccaatgtggc +tagacataagtaacgaattactctataccgaggggcgggaaccggccaatttattacgag +agcacgagagccttgtagcggccagcacactatcctcgagtccctctatcctgagacgta +gatatacatatacgcctagagagaatagccgtctaggcttccgtcgccctctccgtcgtt +cgcgtgaaccgtaagtcttccgcattcccttcctcaagcgcgttggtgtgagagtggtat +tgaggcccagtcttataacgcatatacttgtgcactctattacttaccatgggaaccaat +ggcactctcgaatcatgctcacagctgagcaacggtgctgctcaccaattacatatgagt +cgtggtttagcgttggagcggaagatgaatttccatctgttcgcgcgcatcactaaccaa +tatacggttatcccagcgctatctagttctgaccgggttggtagcgaacccttttgcaag +ccggcttagtggatgtgaagtgggagtgataacttaagccgccacgttcgggggggactc +gtttatattggtgctggaatacgaacggcgtgattcgtagtcgccctaatcgggcgcgac +aacacatgtagtactgtcgaggcggtttaaacccacagtaggtactctatcagcagaatt +atgctagaagtttcacaacaactttccgcatgaggctcagcggcagcgtcgcactcccaa +tggccagtgccggtagcgatgtttggtggaattagttccttcggaatacgaaccggattt +aaagagcctcggagaacctaaacgaatccgtacgcatcttgcccaaggtgctgagccttg +tcgcctttctcagttccacctacattaatgcaatgcgttcgaagctctgaccgcaaacag +gaatcaagttcagacagagtgcaagagtttcgcaataattgggaacgacccacttgatat +aggtgcttttagagatgtgtgtacgaccgtccttcgagcatacctacgggttacaattgc +tccggtaagtcaaggcacatagaaaacatagccaactgagagtgtatacaagattacctc +atgtagactgaaatacacacatcgctttaagctctcaaccgatgtagaacagattttggg +cggcgttgacagcgtgcccgctcaccggtttgctcccttctcaccaaataaccatgagac +gactttggtgactggactgccagatgacgggctacaaccgttttggttccgaattcgctc +taactcaactaacatcatactatatgcgccaggatattctcgcggttggacccccctgcc +aattcgggttaaaaccactccccccatgtagggagctgccgcaattacaatatcgacgat +cccagatggacgctcacaaaatatcagtcctttcacgatccgctcatatagacggatgaa +gggactgaggctgttagatagtgacgtcgagcatggcgtagacgagcgcaaccgggtcga +ggcccgcattaccgtgacacccagttgaaaggatttacactgcttcattcgatatttacc +actttgtatgaggagctcaacctaagtcaacacggaccatcatacaggtcgccagtaatg +agaaggctgctgtgccatggagaagcgctgctacagcacacaacgaacatcttgcaatgt +gaaggagggtgctcttttgggatgagcctacggggatgtgtatccctgccctgtaggcag +ttgggacttagcgcgactatctagataactaaggcgccagccgcggctgtttgccgaagt +cgtgctgatgctgtacaacgaagggcgagcgtgttaacatgctacacgttgacctagact +agtccaagtctgaaagtcccaatttaggtcgggtagtacagtcctcggttccagtcccat +gttgtgccgacaaggacaagcgatcatcaaatcgactgaaattgaatcagctacctcaga +ccacattcagctctcggtaacatgggaggcttgtggttgcaccgtaaaagggggatagcc +catccatcctgtaaacctacaatcgcgcgtagcttaatacgctcacattagacattcgat +cgagagacctggtttcaagagccttcccttttgctttagtgggccaaatcgcaaccctgc +tcccctcccttacgccttatacacttcagtgcaaattcatgcgttcagcgaacaactgga +cttctgttgtacgtagtccacgggggcttattcattatagaaagccccctactgtcaccg +ttatatggttcacacatgagctgatcacctagagagtcgtcatgcacattcgcctaacaa +ggacatatgagtaaccgggaggggatatcttcgatttgcagcaccaatcgacgttgtact +ggtctattgtcggttaggtccgattatccgaccggcaatgaggcaagcccatctattcag +gaaacttaggcagttccctgtgctggcccgacgtcgatgagttaagtctatacaggccgg +ccgcgagtagttaacgagaccaacatagaactatcatactagccggcaatgatcaatagg +gtcttagtgccactgtccttcgagccctcgcctaatttagcgcgaccggtttcctattgg +cctgtggggttgcgggcgcgtccgctttaagaatggtccttaacacctacccggagatcc +attgcatagcacactctccccattagcctagacacgtcgtcgcccgtcgactttggctgg +aatttaatcgccggggatatcgaactttcacgccctttaacgacgaggaaacctaccgtc +gcctggctggtaaatgggtgccttacggggactcacgatgctgtgaaccgcccgccagtc +tctggggctcccaaaatccaggttggaattacggacctccgccggtactacgcattacgg +ggtggaaagtcctaagataggtgaatgaaagggcttcgctaaaccagtaagtcattaaca +ggacatcggcgtcacgtctcgcgggtttacacggcgcacaaatcctattcccatgataaa +caccttatgccaatccacatccctcgctgcctaataaaattgtcacacctgcgctactga +ctaacgtttacgcaatgagagatgaattccgacacccacgcttgttgcaagcacagccgt +atgggttctcgggtaaggtaacacgaggcacactccggcgcggccacttcggcccctccc +tgacgatgaccctcattggtcaagcatcagtcgaatgattcgtaacaaggagcaaccgac +tcagtagagagggtgaatctcacgcgctagcctgaggaccgcctaagtgcttgctgtgcg +tcgcggcagtcgcgaggtgcgggctaaagtaaataattactggtcttacctaattaaagt +tggtggttagggacaacgttaccactaccagggtgcgcccctgaattcgggtatcggact +atccagggcgccttttgcggccttaaatacctttttaatcacgctggagctagaaggcca +tcgggatagacggggttctaggtactcgaaaaaacaggcctaataactttattgcgcttg +gactaacctatgtacaacacgttgtagcatactatggaatgttactgacctacacggata +gcatttgttcgggagcgtcattgacctcccagaccctatgccgatctgcaccattcagtg +accatccacaagtctctaggtttagccaaaggtgacaggtcaagcacttgcgcatgtcca +ctagtcgattatgcaacgtctctgaacagttagcacttatctcccgccgtgtgactcacg +cagtgaacttacctatagcatacgcctactattgaatgttcgttgttctaacacagcgct +aatacctcactggcagaggtgcgcacgctcctagtatgggagggagtcaggtcagagtgt +atgagactgatttttattcccgataggggttcagtgaaatcgacctctcaaaagagaggc +gcagaattcgctgataagctctgctacgatcgctaaggcacgataagcagggcggtgaag +gttggagcaagataatatcacccggacgcgggtcctgtcgcaacgagcggccgtgagacc +tggtgcgcaccgtgtctcgatcggccgaatatcggaacccactgcgtgactcaaatgata +tttttgctatctgtgggggatttatgtcccggtagaactctgcttctagcagaggataaa +ctttacaaggacggcgaatatggtgtcagagcgccctaatgatcccgtgctattccgcgg +gccaccggccgttaatggacttcgggttagaaggatgggttattcatcttccacagaaac +gcccagccgcaatcgtgggtttactcgaccgcggttatctgcctacttagctgcattcct +aaaacaggattaaaaaggccgcgagggttgcgaacctatggttgagaacagagtcataga +gtcagatgcgcagggacggcacggatccacatggcagttaactaatattaataccccctt +agcctcgtatatgggcgtgtgcagtcttgtccactcgcggacgcgtatccgagcgattct +gtcttccaacgctattcgttaccactttggcacctctttgctaagcaggatgagaacatc +tcactcactacgagccttgactttcagcacgcggtacgagggcactgggcttctcgtcct +ttgctagatgtaggtgccttcccgccctcatgacgatgtcacgtctatcggtttattaag +gtcggggaccattacgagattaccccgcgaccttcgtccaaatgggatcacggcaacgtt +ccacgaggggcgcgttgcctgagccactcgggtatccccttccgatatccgcagaagtct +agctaggagcaccgccaagcattacccgattaagcaaagcctactcatcgcatacacggt +tcttggggtttgcgtcagatagcaacttccggcggcagtagagatgatattttatccgat +tgagcttgcccagcgcaccctcgggccccgtggctcttctcttaaatgtgccctgcacga +tgttagcggttcctactcctccccgagccctatgggtggacagactcgccctctgaggct +gcgtgttcaactggttccaagtccggcgcctgtggatctacgacgcgaccagcaacatta +taccaatgtctaggcttagctcgaaaactagtaagccttagaactagggtcgtagcttct +tctaaatgaagggcagcgtcatagccatccacgttagcgcttactcaatcgcctgtcggc +tgtcatgttaccgctgccgtaagttcgtgaacataaaatacaacacattttaggtttaac +aaggattgtttaccgccacgtactggtgccggtagtgaaacgaaaaacctcagcatcggg +aggaggagaacggaatccctaccaatcttatctctacttaaagaacaaagcgcgcggtac +atggcgcagacgagaatgaatccccgaacgggccgagttagactcctcaacctgtcgaaa +agttgcgatccgctagatcgtagagtacggacttaaaaaagaaaagaaggtctctacccg +agcggtgagcccaaccagttccaggttgctgccggattcttccacacggcggtgccatat +ggacgaccccgtactttgggcattctaggctacctactgcgaacgcctcgcgttcatgcg +caaagttttctctagataggcgcgctttggtaagcatagtaataggttcttcagcgtcta +aagcccgcccattaggcctggcgactctgctttagtggtaaagagatagcatcgatgtac +atcgatggagagagtattttcacgaaagtgcgcgccgtacactatttatcggcatgcgcg +ctaaactggagggtctaataaccagatcacgcaacgaggtcccatgtacggttcgcattg +cgaaagtatgggatactagaggttttatcgggcctcgcttgaggtctgtctgggactggc +gcacatcgctcgtcgcccagtcgatagcggggtgattaaataagaaatatgttagtgccc +ggatttggaaccaaccagtcccggtagcggtacaaaaagcctttcctgctagttctatgc +ttaaagcgtactcctgttacaatccgtaggcaacctgaagaggcaacctggttttccttt +atttcgactttgtttgccatttccaatgtgatactgtgcggcgaccttaatgctttttgg +taaaaccataccgagatccagcgcacgcgacattcagaccggtcccggtttggcggtcaa +cctcgtactctgcactgttcagctagaggggtctcctatcccgaggtaccggtcgtctaa +cgggtggttacaggggctggtcctactctaccaacagttaaggagggcaacaagttcgat +ggggcatcgtataacttgaatgccattggacaaataataattgctccacgtcccaaacct +caactgaccttgtacgcataggtgccacctgcacgcaaccgagctcgttcaagtgtcctt +cttagctggcgccgagtgaacctgcatctgagagtctacccaacgatctagtatcataat +gtctgtagccagcgactatgacacttagagagccgcctaagaaagtgtttgcggctcctg +ccccggtgcgcttgttcggtgggaggtcgttatatagaaccatggggatataatgaatgg +taacatatctgccacgttgacaagccgctattatgaattcagggttggatactattatgg +cccttcacggtcacttgtaggacggccccaaacaggattagtaaagtcggtggtctaagt +gtaagcgataggcaaactgcggttattcgcgtagaccgcttgatgatgtaaaataacagt +tttcatgtctttgcaattaccgcgtgtagtctgaggacttaaggccccttctcggatagt +gaaatagttcaggtccggctgttgacaggtgtcctgaccggaacgctttacagctcctga +ggagcgtagcgccctacgtccttcctgatccagccgcacccatagctagtaaacaagttg +actgcgagacacaaagtcaagggcctgggcaagcgcgggccggactgcttgtcgaatatt +gaagcgtactcgatccagatctgcgccattgagttaaaaggactatacgcctgtctccag +ccgattgcagaaaggacagatcctaatagaagaactggggctccattctctcaccgacac +cctcctattcctatcccactggccccattgctggtaacccaaacctctcacgacgattca +gcgctgcgattaaagagtggagtaaggttaaaatcggttggggcgagtagtgtttgatgc +aagatccattgattatcgccagtgggatggcggcaaaggtaccatacctcgagcttattt +gggtgcctcactcctcggggaaccatatagacttgcacttggcaaaatatggtcgggttc +aaccgaccttttatgcctggaccctctgctgagggcctcttgatcaaaatgcttgcgttg +cttataagttgccgcttgatgtccaggattattattccagcgtggaacgggaaatgatag +cttatctgttactcagggcgcctgaattagggttgccattacataaaggaacgacaaggt +gagcactgggagggcgcattcttataaccgggcatatgcgcggaacaccagcgttggatg +gcctacctccgcggaggtcggggtcgaaggcccccgtttcctggaacaataacactgtcc +cacttggtttgtaaagaacctccactcgtcatgacacggcctagcggtgttatcggcgac +gataatcatgggtctttacaagtgaatcaggcttaccaggcggaccaggaggaaacactc +cacgagtgagacctggatccggggggatggcatacatcccatacgctcactcagcatgca +cgttcctagcacatgctggaatcttgcaagctggacagagtgtattgtggcccttgagct +atacttctaacgccagatccatgtttgcaaacatagctccagtggcctattcgacggttt +agcctctgcaccatgttatggctcttataggtgttgggtcgacagtgggtgactagacgt +aaagagagtatgccgtggttgaaccgagacctaaaaagctcaagatcacgacggatatct +ttaacggataccagcaatcggctaagaccagtgtctactactcgtgatcggcaccggccg +cccgttatctggtgtagtagtcagccccgcatcacccgtgcctatgcgagccttgactct +atcagtctaagagcacacgtttagacctgagccaagcgtaggtcactatcgagtcaacct +taaccctagttgattaatgctcttgacgtgtatgattacaccgaccgcgaataaactctc +acgcgcgtgacggtttcctcgctagaagaagccatatactgtacacactgctgtgaccga +caagacttacctttggtttacgtacaggtggacagttgtttctcccctcgggtcgatagc +gtttggtcgtgattccaataagtgccagatgtcggaacaacatgtttccataaagacgcg +tgacatgatatggtttgctatgaagccactacgaaaatgccagtgcttctctttatattt +tgcagatgtggaagaagtgcatccattatagtccttttacgtacctggattctccgccag +cactgccactactttcttactatccgttggggggggacgctcaacagagcgcggactcag +gaatcagataacgaccggaacggggcatatgcccagcattcgttgttgtaaagcgattga +gtttgggctgctaaggggccggcagttcgttccgggatacccgcaaaatttatgcctttg +tccggtgattctaggtttagctcgatccacgaatacgacaatacaaggtttgcctcctct +ttcgtctatcacgcaagcttagagttgctaaaatttcgtagtccgtgcgttaaagctccc +tacatttctaagctgtacgacaccacactatcttgcaacaagagtcactctatttctcat +atccgaatgaatatcgtcctgtacacgggtggcaatctcggcaagatggccgagatgtgt +agcactgtcacgttcaaaagctcaaacttctgcccactgccagccctaacagaatctgga +gacatcataccagcgctgtcccatgtggcggagagttgcttcaatagaacgctatcaccg +tgggatcacatacgtcactactccgtgtgacactatttattattcctttacctccaatac +gcccgtccttgcatcgcattttgtagtaagacatcagacgacgttactgccacggaacca +taaaacgtgctgagcccacgtaaacgtcctatcggtgaggtccgctcatcgtacgactct +gaaatttggaaactaccagtttgttggcggtgaatatccaacctgtcggcatacacgctc +acgcgtatggttggtacatgcgaaaaactacccaagcaccgggcgcgcgagacactatga +gtttagtgatgatttacggagcacgttttttgaactcaacagaccgattgaatccttcaa +acagggttactcgttcgtgacaaccgattacagcattctgaacgtggtacgtgcacatag +cttggagagttgcgcgaatctctttcgtaccgtattctacctgatcgctagctttccggg +gtaacgacatcggcaatgatgagtagcagccagtatccatactggacaggtactccatat +aaaactcccgcttcaacacgcgagatttgaaccgcacagtgattgtgctgagtcctagtc +accatcccgatcttgtacacgggtaggggtgtaacgtgggcagatgatgcttacccttcc +gctggcttgtaaaggtgccccgcttcacttgatgagctgcgtcgacaagaccacccaacc +cgagccacgtggttccgacgactcaatgatttccagtatggtccaatcgagcaccttcca +ctcatgaaatttgagcactgttggggatcgagtatgtgttttgcagtgggtctgtagcat +ggaaagatgtaccctaacccggctctggcattatcaacggtggattgggtggttaaacag +cttcccttcggagacttaatggactaaaacgaatgaatcagacgccgagaacgagaactc +accatctggcccaggagccatatttttgattggtaaatcgctcgcatagtgcccgatacg +atgcgtacttgagcgtaaacggcgcagcctctaatcataggtgattgctaagtctacggt +catccccagtggctgacgaggaattaaagacctatttccgtacttgttgcgcgccttcaa +ttatccagcgtataccccgatggctactgctacatgtctaaagtgactagccagaaaaac +ctaaccctcgcccacgaggccttgatcatctcaatcatagagtaatgttcattgaattgc +acggctcttggtgtgcacattgagacaatttctaaaccgacaagtttaatggccgagctc +ctcctgcgtccagctggaccttcatgcaggcatgaaggtccatatatattgtcctcccat +agcccgccgaccgggtctgactcaactgtgttttcgctatcccaggctagcacttctatt +ctttgttacgtccagtcatagtgttactatagggtaattttagtcatagtagacggccgc +tttttcgtatggcccgagaccgtccaccggctacccaattaagtcacatccggatcttgg +gtctagatattcctatcgaaaatagtctcgccgcctcactgcgtagttcagggggcgtca +cacttgttcgcggcttttcctcatgggatctttacccgatggttgatgcaataaatgtct +acaccggactggcgtgtccgagacgactttatacacgtgtgacgagtagatcagatcgta +cgaatggtctgtctcacctatcccagtgggaggatggaaaacactcctgcctaccgggtc +gaattatttacgcgtgttacaatatgtaatttagaaaaagggattgctggtcgatgcgtc +tccaagggattttttatctaaaagcatccttttgggtgtactctgatcgcacgtcgcaga +cagcagtgggttttgacgcagtccgtaggcccacagactcgtttgttgtttattaatccc +aggggagcgttgaagccacacctattctgtagctgtttgaaaggtagctagcccggatat +tactcaaggtgactcccttcagaatcacacgtcgctggagtcgccacagggtggcatata +cgagtgatagagcaccttactttcgaggtagcggtacattagtgcaacgatgaacccact +atagtcttagtgatttcatgttttacttacgcgaaaacgtggggttttgtcaacacgtat +acgttgaatgcacatgcctcatcctaaactgatgcactgccacaagtctgaaagagcgac +agtctgcaacatagcggaaggttacgcccaagccagtggtgatcccccataagcttggag +ggactccccttagcgttggatgtctttgccccagcggcctcggtgtacgggttctccacc +ccactatggtttggaactatgaagaggtacggcaacctacccgaggcaccaaatcgtgaa +cctacgcctatatatacggatagcagggtatccattcttaccatgagctcgtaaaccact +ccgctgaattcgatgggctttggcgcacatcaccgtttctatcacagatctgtcaacgga +atctaacgctatttactcggcgcacacagatcggaaaacccaactgtggcgcgggacgga +ctccaggaatcgttacgcgttatcaccttcggctaagtcttgacgacattagagctatat +ggtattaatagtagctgtacatcaaatgataaaattatctgaattataagtgatagcgcc +cacataatgacacacacgttttagatagttagtagacgctcgagactttgcgagcaagaa +tggactgttaaccttaggggcgggttcccgcttacaaaagctgattcgctcctagagatc +tataagcgaagttcaacccctaattaccattgcataagaccgggagaacctgtgacacct +gttcccatgggattagcgaaggattgttgacttattgccgagtgacctagtattgattaa +aaatgcgacgtgaagtaaccaggccttcgatgggcgtctccgaatgggccagtaacaacc +atatacaaactacaagttaaacccgaaaccgtggctaccatgctcatctagtcgggttcc +cgatggaacattccacggtgagcggccttggatgtcggaccaccatttggcaggacaacc +gtcacgattcgcaacagcggttaaagcaagatggacgccaataatgatattcgaaagtgg +ggttaaaactggccgccgcttgatcggtcctacttagtagcgtctcagatgctagaacca +ttccgagtgcaatgtgtgctagcaacagtggaatcggtctataacggtttcatgatccct +tctccggccatccattgagaacgattctacattaatctgttaagcgaccgccaatcactg +attagctccagaaaacctaagattaccgtatataagaatcaacctgctaaagtaggaagg +cgcaggttgccgatgaacagatcaagttcatacaggagctcttaatccaccgtacccaag +acctagtcaagcgggatgtcgttaacaactttgtacagacatttgggagcattgcaccac +agactccaatgaataacgcatccgctaggaccggatatagactgaagaaagtatagtcag +ctgcctcctaaaggaggcagtagtaggagccaacctaacgtcgtggatacgcattactcg +gtagcgtggtaaacacacgaacccgatctcagaattttagcggcgagaagttccataaat +catatttctacttcgtgctccggcttcatctgatggtggtcattattctccatatgcatc +cagtagagcttgcgcttcacgcaaagttccaggatgctcacatatgtccatacggcgcta +ctacatttactcgaacacttggaagcccgccgtcgggtgtatgactagcctttgactgag +actcagcctcgcaattgtatgtaactagcgtatcccggcaaagtttataggtccatatta +acaacagatgggagtagagcagcagcttttattcggactggcacctcatcgctttcgctg +tctgcgggatcaccggtctctcttgaacgtgttagagcctgagggatctgagggcacaca +cggcacttgtatccggaaaacctatgtatagagcctcggttgccagtactagttcgtggt +ccatagcgcctgaggggattaaacgcctccggaaacacgcgagttgttcttgtgcacgta +aaaatcacttgatgttatcgtgttcggccccagtcgctgtctcacttcaaaccagcgccg +tatccattctatgcaattacgattatacttttgacccgatctacgaatcagttacccatg +aatgcgacctgcgataacatacagtgcgacctccagtcctgttcgattaaatcgacagag +ggtcccgaacgcatccaagcggcttgggtcccgctggcaccgctgggaagtaggtagaga +cgtattgaaggaagcgtgtacagattggtgattacggtgctcttataggaccagactcgg +gcgattctacggggtcgtccacactatggacccgagcatcgaatcagtatgtcaatctga +agggactaatcggggagacgctggactccgtcaggagtgaccagaagcagggatgcaaag +acatcccggacgtggatagactacaaatcggacactcagatacatacctctagaaaatac +tattccccgtttctattccgttccgcggccttttacgtttagcttggagcaaactatata +gccgaggagggtactacaacgcgacgcacttatatcccaatgaaagaataaaagctggta +agacaacgctagccactctacctgtgttgcactcgcgatattagggagacaggttacaat +cagctgacacatgactagctgacccggagcactcaattctgcccatcggggatctgatca +aattcgtcgtcgcattggacggcttccctgcgtagcgaaggaatggttaccgtacgcctc +ccaacacacggcggtcaaaatagtcttcagcaacagtaacacaaatctcttcctagtact +cttggtacacggccctagagttaattgtgtgcccccccatactctctacatgtgataaca +gcgacccactaggttgccaaacagagtcggaagtcctatcgagtccagggcgctgtaggg +cctacagactctccgatgtcctgtgttcttcgtaattgcaatattttcgggacccttctg +ctgttgtcagattcagtctgttccatcttctggaaatgttgaggaactcgaaaacgctaa +ctccctgatatttgtggccttacatcaaccgtcctcaggtgaagcccaatgctaaaggag +tgaaccagacgtgcaggaagaagctgttgaccctttaaagctctagttcttgtcaggtgt +tccgactcgctggcgagagtatgatccagtaagcggcggacctgcgaccacatgatgagg +tccctacaaaatcctatgctccctgcgaattacaactcacagagaacagcctaggctttc +ttagttattgatgcacattctactgacgaacgcagcattcgaactaaaccattggtaatg +taattgtgacacgtgggaatctatttaaagctgcaagaactccaccacgtgttcatccac +atcggtctctgtggaatggtccaggaccgtcccaatagggggaattgcgagacccaacta +atcgagtgattgaacatgggagcaattcccgaatagaaacttgcaacgcgcagtactacg +acgatggtagcaataacgacgcgctacttcagctcatgggtctaaattagggcgaacgat +tgcacctaatctgctggcttctctagattgtagatccacagggccaattaacagtgcaaa +gaatagcgtcatatgattagtttgaaaataatatacatgaaaatcgagcacccgcatcaa +taagctacgagagtctttggagagtgccaatacacctagcacatgctgtgcttatgttat +gaaaattcatacttgactaacgttagccaccagccgatggcgctgtcacaacgaccctgg +gttaccgtttagttctctaagaagggtcactctaccagcggggttaaatataccggccga +ctgtctcgagagtgggttgagataactcaatttggatcagcattaagtctagagcgattc +tcgcggagcgatctatgcgcactgacttactcttggaatgtcactcgcggcttacatgcc +tccttgttccgcggattgaatattttatgcggtagtcatgactttaatcgtttctacaga +aaagaccgtttgaaatggcagaggaaacaaccctgctggatcctccctaagtcacatccg +gacggacagattctacttaacctccaataaattgagaaaaatgcaaaaggatgccaatac +ctatagtacattttacgtttcccgtgtggttcgtgccaacccctggacggtggatgtccc +cggtgggtttttggaccgggcgaaattattggccaacccggaaacccaccgagagcctaa +gacgtgcatgatagttataagtttaatgggagccttaattgcaaccgatgggggcgggta +tttgtctcctacaccgacactatggttgttatttgcggcttcactcaactacaatctggt +ctgtagagagtaaccccgtattatcttcccttgcgccctgggtgcgttagcggaagtatg +gggattaaggggcgtgaacaatgcttctaagagcccggcgctaacggacggtgtcacaga +gtgtctaggcagagtccccactgtggaatacgcatgcgtagcgaaccgcgcgagtcagta +ggaacacattgggagcgattgttcctcctatcagccggcctagcaagcatgacgtcaaac +cttagtgagcagcccaagaaataacgctcggactgcaacagatctaagcgggaaatatat +cgatagcgaggaagccgagaggactaagcagagagacgaagaggtgagccggagtgattt +agccccagatggcaggtatagcttccgttcacaacgaattgaacagaaagtccggcgccc +ctggaatttcgaaacgtcaccaggttggccgtaaggttggtaactcaacaccctaagact +agcggtcttgcgtcatgcaagcggggcgtgtagcctgcacagacataatacggtagggag +gttaggcgtggggcgacacagtaagatctgatgaatccatgtacgttgcctccccgtcgt +acgcagttgatacttcgcatcatacttagcagaaagcatcatcgcgacctctcgtacaat +ggcaaaaaggagggcttcgtgcacggggtagagtcttccgcactctaatgaatcaacagt +cgaggttcatggccacaaatgtaacgacgcgatatgactcgttatgtctaggtcccactg +cggatctccttagaagcgaattgtataaatctcatagccccccccttagcaagtggtacg +tagcccacacgatttacgcagagtggggtaagacctcccccacgacttggggaacgcgcg +ctcaccggatagctactgccactgtagagccactagcgcatagtgtatccatagtgatgt +acgtagccaagcggggagtccttgtcttatgactagcgccatggggctatcaactgagaa +cggatgcacaaacggtccggccattcgcacagtccgccggtcactaatgaccggtctgca +tggggctgcaacgatcgcccaaggattggaaattgttaataagagtccagtggacaattt +agtaacgcgacgcgcatctctccccgcctaacaaggctcatttttagcttgacggcgcgt +ctcacgttgccgggctcagctcgagctcacgtgccgcgcggggttacctcaggtttgagg +aatgtgtcttgaacggttcgtaccggcttagcgtcgggtgctcctcagggttcccagcaa +cattcttaccgcaatccaatactgagggcgctaccaatctaacgtatcactgacccagta +aaactcggtattacgggggcgatatatgtgcttgcctcaacatagaactaccgccttgac +gttagaacgttaagttagagcacctgcccatctggattgcggcgataaaatcgattattg +tcacctggatgaggaatatggcggacaaacgatcgtgtggacctgcgccgcaaccgtggg +atgccgcagcagaatatctacagagcgtttgcaggagggccacgcggtatccacgtaagt +tcgcgcaatagcagcatcatctcgttcggggttgctgctctcagactgtcgatacgtccg +aataccagcaacccctcgaggctttgtaatatttacggagtcctaagggatttggtgccc +caagtatagttttgccgaagggggggcacagtgccgtgactacgattgggctattgggca +acccgaccccgtgcgcacacgtttgatctcagacagagggcaaaaagacgaagccacgag +ctcttcgaaatcaatctacatctatgctgggataagttctggtccacacctagatccgag +aatggaccgtggataacgagcaccgttacctttgaggcggcagcacttttaacaccgtaa +aagtaactctatagttgtcagcctttaaagattgcgttcccaatacggtacgcaccgtct +actaccgtcaacacaccgtagcttaggtccccccgcggcagcgcttccatcgtggagggc +tgtcccccatcctccgtagaactgcgtttaccggtctggggagactccctaaagaaacac +cacaggtgaggtggacgggaatcaagttaacgcattcacgtaattcactcctgttcactt +acataagagaagttctggttcgcgccttaagtgccatccatgaggcatacgatgcgatgg +ggaccacgcctgtagactagagaaacaccatcaagttgataaggagtgaaaattagtata +ggtctggcccgctcgtctgttgatagggcctttaaatgtaataggcctccgctctgaacg +agtccgtacttatctgttggatagtaagaacacggttctcagtccgcaaggtagtatatg +actacgcgtcgatggacctaaagatacgtttggcatcgtcctgagcagcttatgaaaatt +gctgcgcgtttcaggtggaagaatctgtgttattagtgcggggacggtagtttcgtaggg +aattatgggtagtacagatctatggacgggaggtgactgtcagcagactgtgcgcaggcg +ctggtggtataatcgctgggaccacgtactggcaagacgcatgcagcctggtgacatcca +caccgccctcgctcagataggacggacgtgcggcaataccctatctggctcctggacacg +gaaaaacagcagtttaaaaaaaagtgggttttgtgcattatcactttgtccgttcgacag +tttattgcacctcccagcatgctagtaaccccttgctctgatttgagatttattatcgta +acacggagtcgacgtgaagtttgatctgcggagaataggccgagaagcccctacgtaccc +tatgattcccgccatgtgcggtgtaaaattaaccactacttatggatttcatccaaatta +actgacgcattatatatacctcgagtgtgtaagccggccctcgcggtaccaaatttcggg +ctgcatacctagaagtgtatgtcatctaaacctaaggatcgggtagtgacgtgtaactaa +cacgtgggacaatgtctgtcctgagctacgtcttaagaagtatttagtcctacgtactca +ggcatcgatactccccgatgttgggtgcagtggggcgtccgggcggctaagatagtccag +ccactccttatgtgaatttatcaaaccgggaagaccagtgcataggccacgacctacgta +gcacctccgtacaaccttgctccagggcacgtctaaatgtcgtactgggttcggactcca +tgcctggcgactagcctggcggtccacatattttacaaatccgagacaacaaagcacttc +caaagtcgcgtggaccttaaggaaggcaacacaggggacatttagccactctaaagaccc +gcatactccagggcatacacgtaacgcgttctcttcactacggagtccgcgagcgaacga +ctaagggcgagggccgtagatctccttctcgtaaatataatcaaggttgccagcgcttat +cggtgccaccgatccgaagagcgtaaggacgttacagtgtaggatacatggtttgcgccc +gtccatacataatcgaccatcaaatcgaaagcgcgtatgcagtacctcgtactgcccaaa +ggacagagcgcattacgtcaccccgagcgtagcttaccatgttaagaccgtgctcatggt +ttccacccgtaagatgagcacagattgcttgctctaggtaacatagtaataagagaacat +tcatagacgttggaccacggttgaaagaccgcctcttaactactgaaaaacaatatttgt +ccttagtaaccaagatacattaatcaatcctccgctaatgaagttggtaggcaagccttc +agtagcgtaccgtggatttgtgtttactgcatttacaccgcggctgggtacgaagcggtg +tcgggcacgcacacgcgttcgatactgtaggtttcgttggggttgcttgttgccgctaac +gttcgggtcgcttacttctgcaggcttgattactgagttcattcgatcggttcccaactt +cggactattgcgccatcatcaatgtgggaaatcatttttaggaatacacctcgtacatgc +atatgaagtctgcgtgcaacagactttccatgatgcgagctgggcttcccgtcctgcggg +atgcaattggcccagtgcgcgaaggctgggctgattacggacatatctgctgtcctgaca +atcgatggtgtagagcgtaacaatcattccaatttttcgacacgggccagggctttaggc +cactacgcacctgggttaacactcggcgacccgcctaacactgggtggacattcccgagt +tataacgacacctcattttcaacaaccacaaaaaggcataggcaaccgaactaacctttt +gtttagttacttctggtatgttcatagtgtagggcaggtgatcggttaaacgcttgtacg +gaccccattctgtagcgcttttctgaacgataacactacgttgggagatacttgttgcgc +agtcgtgggttaaaagcgagccgacgataaactgcaataaggaaagcggacctgtcacct +cccgcgggtaaatctactcgctcgtttagaggccgtaaagcgacataacggtgtccagta +caagcccaactggtttagagaattcttctcctactacattcaccgtccgtatttcggcgc +gccctacggtattcgtggtgttctgagcatacatgggatggactatcacccctgcgcgta +aggactagcagttgtaagtcacgttaaggttgcgtaggcaactgttggagtgcgtccata +cttttcagcaccccgaatttgtacgcccaagttgtatcgtcgtgctgggacgagactcag +cctttaccctaagcgtttaggaaagcgatgttttaccgcagacgcatatgagagaacgtt +gcaagatcgatctttctcgcgcacgttctgtagctagacctgcagctaatctaactgccg +aactgttaggatgttttctctcctagacgcagggaccagttgtaagtaagggtttctcat +cgctaggctagggtgatggtaggtgataccaatggagcggcgcgttaaaagggttgtaat +ctcggtgatatgtgcaccatagattgttccgttattttccttggtcatttagatacgaga +taggggcgccccagtgccacgaggtccatcttatgctgttgcgtagctagagccctacaa +ctttctaagtaaaacctccatcgagtgcgcttggagaatttcatgtaccgtggcggtacc +ttacttgatgccgcgacccctatctaattaaagaccgcttcccgatgggcgaccttaatc +ttgctgcagtccaagttaacttcctctacgcccgatgacaaatttagccggagtaagttg +ttaacctagcctaatttgtaccgaattttgggttgtgagaagaccatttctacccgacga +tcatgggttcctctcaactatacctagtgtcggttaatgatttatggcaaacaatccccc +aatgtagcacccatatgggcgcaattatgtgaacttcaacactaactattggtttagtta +gtgatatttagcgcaaataagaggcatgggctgcgaaaagattgtgtttccgcaatgcta +gggaacctgacggcatacccgagatgatagttaggtgagcccgaatcatgcttgattaac +gtaacgtctatcactacccgtgggcttttgcgattgcgatgcgttactcaaggcatactc +aatggggctggtaataccgatatgggcctgtgtcttagcagcgacgtgtcgataatcgaa +gtacaatacgccagtctacgttagggctttgctaacacatcacccacagttgaagcatca +cgcacagccctcattaggttgtcgtcaacctggaactcctagcaggctgggcagtatggc +atccttcacgaacaatcttaagagacgcacttgacacaggttgcgacagtcaggatgggg +agcttctgaaaatctctacataaggtggcctcgtgatatcgtattaactcggagagcggt +tggactaatgagtgagtccaatcagtgatcggtttttaatgccgggaccacggcttgcgg +ctgcgcgatctatttccctcgcgttacacaaggggtaggcataagcaacaagcccaaaaa +aatcctcacgcaggcgtcaggtacagactttttccctcagcaacgcaaggtacacgtgta +gtcgaatgtggtcataaccagcagctgtcttgcgcaagggcggtgctacacgcatgtttc +actccacagtgacatgatgcccgctcttcggttgttctatgcagcgcgctggtcgcacct +taagcccagttcaatccatgcaattcaccgttgcagcactagatcatataccgcatactt +cgtcagagcacaaccagatcacttacaacgaccgcaagctaagcatccctatcgtgcgta +tgtgtcgaggcgcaagtactatggtcggatgaggaggtgtgccctcaggacacacagtat +cgctcctcattcgacgacgcaagtcgtctagttctatgataggcgaagtgagtactgcgg +atcactacgcccaagacttggagtgacgacgccggctactagcgatggcagttcagaatg +gtgccttccaagggacactcggtcctaatcaggcacacgcgtctcaaagccactactcat +tcatgagctcgctggcgtggcagtggtcttatgcggctagcgaccagaatttctactagc +cttaggcgtacaagcgttgggcaggtcgcgagtaacctctacactctatcatggaccaca +cccatccatgttttaaacacagaggtcttaagaatagcgatggtacggttgagaacgtgg +gagttttttgctctacagcaagcacgttgcagtgaggagagctttaatcctaaatcataa +gtgatactggtgccgagcatctttcggacgaatatgaagacccaacgctaatgtgcctgt +tcgtcggcacattctcttgggacacccgctacccacatgtatgtgaattgggcccgtctt +gattgtgtcgtagatgccaacggttcaatcagccccgacgacgagaagcatttctacgtc +tccagccttgcaacggtttctagagtcttgctgttcgtaaattgaagaatctactgtgca +gactttatcgacccacgatacgctaatccgagcgcgactcggtctcggaaaattatccga +gggagctcgttcaatgcggcggaggctctgagtgaagtttaaggctgagatagtcacacg +cattcgggtccctacaccttgtttcgaatgtccaacgcgaactctgggcaacatcgcgag +actttgaaagatgagggggctgtgacagggcctttgtaataggggtactttaagggcggc +acaatgtgatacctatgtattcctatggtctgggtcagttatttaaattgaccggacaag +aatctgactcgtagactgctgtatagatcacgattagagtttggcaatggttctgaaagt +gatcatgtctaacgtaccggatgacactagtaataactgcagcagcgtgacgatgtaggg +gacttactctgtttacgggtctcgtctgccataaacatcctgctccggcagcggtcaaag +acgtcctattatcgcactcgggcagaaactccagtcatggtgaggcacaccaacagtgtg +gggtcggttcgtggttaccaagccaccatttttcggcccaaactcatcttgaatagtcgt +cctcattcatttgatcgatcgtcattacaaggttcataaatgcccagcgccgcgtctccg +gccagatggaagagctacgtgcaggcggtaagcaattgacgctatagccctatatacgta +tgtgggactcaaggcgacatgctataccgactggtatcgaggcgaacgacaattgctatg +ggtcatcacctcatatttagattcagcccctggtggcgtcgctttgaccaactagttaag +gttgaggagttcgctctcaaacctgataacgagctaggccatgtaccaaccttggctgtg +caccgacgagctgaaggaccgagctgctaggaggtcgcagtatcgattgctctttcagcc +ttctaaaggtgcgacagaaacttgaacctctcggtactctaacactaggggtacgagtgg +ataactcgattacattagtcctggtacaaaagtcctccttccgggcgccttaagctgctt +taaagctatgtccgcttacgagaaaggggcgcacggtccgatctacttacagactgtcaa +aacggtgtagtcggaatgggctcgaacgacgctaatagatacacgcgcattggcatggta +cttcaccaatactatatctttaaagaagggcggcgagcctatttacccacttcgattagg +ggataacacaggtgattgagttttctggaaccgtcatctaatagccgaagcagtccacat +tacagtccattgcatttaaccactaggaatcgcgccaatcttgcgcttatgttgtttagg +aggggccacgctagatcttgcctatcctgagttatatgagggacgatcctacatgtatcc +tcaaagttcgcgctcatccttagattctaggagatggattactaagtgtgtgtccatagt +ttaacgcaacacataatgttcgtgtcgtgatgcgtatccttggtcccgacctactactct +agacctatacgatagcgttcaaagctccaccatcgatgcaacgtggtcgtaccagtactt +atgaaaccttttttcgcagttcgaaccgcctggaaagaagcatacgcaatatcgtgtgat +cagcacgcagggtatcagttaaagagcccaagacttagtctatcgagcagaagaccgatt +agggtatacaccatgtcagaatcgcctccagactagtggctgatatcgtacgttacacga +ggtcgctcttgtcgagtgctcgaacgatctatcccctagatcacgcgtcccagtcggagt +atcccgcctcggatcgaaatgacggctaaaaggtgtaatcacgcgcgtaattcctgcaag +ctctctgagttctgctcgctggttcgaatgagcctgcaggcagtacctacaattcctgct +cggaggacctgttgcgagggatgcccccatacactgctgagggtaagtagctgaagtata +aaggcggcaatcttctgacaaacacccttcttccccttggttaaccagacaagctggatt +tatcacccctcccggggacactgccctgttttatatcgcggacttgcatcagtcgcagta +gtccgcgtagatgtggggacccctcccaccttacatggcaacgcgtgatggagtagtatc +tcgcgtcagtgagcgagttcgcatatttgtagggcgtcataacaaatgtaaatgctagta +agtgaaagatgtcaacatgcgggctcggttttgcgctccaggtatatcctgcatctgatg +aacttttcaatgaccgtgtctggcgcagggctgtcgttttgcaggaggggatgcccagcg +catctcgagaatcatcggctaatcaacgcgaaaaagttaatcttctatcagtcagcgggc +tataactccttgaccaacagaggatcgcaggtatttgtactgtggagaaacaatcgtaag +atggccggccatgaggcaaggattgtaatataccggggtggttatcgaagaagtaaagta +aggcctaccttctggggagcaatggggttctcagacgctaactcttcgttcacctacaac +acgattggacttagagagggacctacggacccgaaattcacataggggggttccccgata +agccaaggcaggatagagtctgaatccatggacttccatcaaacccctgtggtggttccg +ttcaagtcagggagtatcacgactcacttactgagtcacgtcctcaatatgactgaagtc +gataagacgaaggcttaatttacggaacccccgtttagtaatcaagaaacgcattggcgc +gggtctaacgtaagctcttcacaccgccgtctacgaaccagttcccggcgttgcatggtg +atcgccgggttcccttggagggagtaccttgtgccctgcccgtatggtcgttcctaaata +gcgaccaagtattagttgactgttgcgacttaaaatccaacccataagcatatatcgtgc +acccagggactggagggcctcagccccttctttcgaaacttaaaccgtcttcttatgggt +gaaatgtaagtttctacgtctggaataaacggttcgggccaccatgaagcgtctcgtgtg +atagagattcgcaatgagtctgggaagtagaatcacaccaagttagaaaaattctccaac +tcagctaccgcgacccatccgttggggtaacgcaagggtattagccgctcagaggccaaa +gattagagaaacgcgacgcctgcggctgtcttgtgactactccgaccatgccgtcagctg +gagaccctacggtgggtagttgggtagagcgccgatagctaattctcgagtggaactgcg +gaatgtgtcatatgaggtagcgatattgggctatcacaagtacgtgagcctgtgaaaacg +gacgactcactagcaagtaagcacggccctggcgtggcggcggtacgcgtacaaacctcc +actgcttggggaataaggtgcgaacaccgtgatccattgaggcgtggaggcatagggccg +gagtgttcccgtaccaattacgagctaagaccgcctgtccagccctggtgattacgtagt +aagctcggtacaagcctgtaattagcttccgggtggcggacattcgttcatattgccagt +cacggcagaggccgcgctagctaggccagccccgatgaaacacgtgctagttttctatcg +tgcctaaggatcgatggctatcgcggcattgttaacttatcaagcagccgaatcggcgat +agtggacacaacatgaacacgctaagctctgagtgccagactctaccgcggcgaatccta +ggccctgctggggctcccccacagagcagtaatggtcttctgcggccgcgtgcattcaat +ccgcgctggtcaatgcgttccatcgtgccttaagcggggcagtgtgataagacaattttg +ggggtttcatggagatatcttcagaaacctcgcgaggtgcgtttagataccacacgcgcg +gcggtcttttcacacaattcagtccgcggccggtaacctaactttgcttatcaatacata +atcctcccaaatgtacggtttcgaaggagatacctctcccctgttagactctaggttttg +cagtgctacctagagatcacaccagcattaaaccaaggtatcagcatcgtaacatgggga +ggcacgcgcttggcggtaagtacccgccacgattactctgtttcatagcgccaacgcccg +tatagtgtgcttttaacgtcctcagaaatcaccgactgatcagtatggcgacatcggagg +gaggttggcgaaatgttgcttttatagatcgttaaaacctatcgttggcgcgtatcgcct +ccatagaacttcttactcacctagtctgatcccgggactggtcgaaatggagacgacgta +gcttgagatctggatcgatcgactgatatcacacttaaatatgatcagattttactacgg +tcgatctccatatatctatcccagcacttgatacctcctgtccagccgactgcttggacc +ctagcacgcgatattagagggcgcgttgtagctcaaagtaaccagtgggacgacccgagt +gaggttaccgctggcacgtaagggtgacatgactcccccagaaacactgaatttgtctag +cagtacatcataatctgagaacatttagcgaagacgagaacaagctgtctcaatggacgt +aggacgagaggaatgtgacggttataatacgcgacctctatgtgtctattaaatccctac +gggccgtagcgagcaagctcgggatctttagtagcggatcgggtcttctacatggcgcac +caggtttgatatttcgagctagagttgctctaaagaaacgctcttgcttgggaaagtgac +ctggggtacgacgaagacacgggcctggttgcataccgtctcaccttcattcatcgagcg +cgatagcgtagcattatccagcacgggaggcacctggcatgggcgtgaaatacaatccga +agagcagcatgaaaaaaaaatgagcggtcgtgacccgagggtgcgtccctccgaacgttg +ttcgttgccaaggtaagggacccacgccaagcatggttagggaagcgtgaccgacacaac +atagaggacaatctcaatatgccttctgggtatcacctgggtgtgtagcagtgctactgt +tacaagtcgcgccatctgcgacgtcgttcgtccctattccctcctaaaggccccgactct +gaaaaaacctacaatcctagacacgttgtggcccagcacaacgcgtctgctatacagcaa +gtcattcgtcgaatggggcaacacgtataagaaggccgtgattccaagggcacatggcgg +gtctctcaatgatctacgacgtgacgcaaacggggaaaggctggaccgttgtccggtagg +cgatccatcataaaaggcgtctggttctgtggttattgtgtacacgtttgaaatatctga +ctgtagaacgatggaggtctctacgtagctctgcacgattccctcgggctcacgttcatg +gcaaggcgacatcacatgaacagggttgggtaacagccatctctgaagcattcccccagc +tcgcacggctcctttacccgctactacgtcatgcactggctagagacccaccaactattg +tgcaagtaaagaccataaaattttggagctgtagcgaaagcgagttgctgcgatggttag +accaacattgggtcaaactattctaatccggctaggctcattaagcatcgcagattgccg +atactaatgctaacgagcgatgaatgggcctcttcgagacgcgtccgtacctgcgaatat +caaccatgaaccctaatctggaaagtttgatgccgctgtgatagccactcctgtgtcgcg +acggcaacgtaatgtacgtgcttggtttgagctctaaacataccttcgttagagttggtc +agaggaggatattgtcatagcgctacaaccagcgccaaaggatagctccgtggctggtcg +gacgcgctagaatctaggcagaacacgtgcggcttcttgcactctgacgctcacgcattg +gactttggcggtcatctggttctcataagtccgaatcacagtagataaagatccgcgtga +taagatatgcctacgtacttaagtagcaccctctgttcttggcgatcctatcattgcggg +ttctatacatatgttgatccaaccatcggccgccgggccgtcgtaggatctaatggccaa +cacatcaatcaaatcactcgcgaggacgcggaggtcccgtccataggtgtgtatgttggt +acgcagcacctaatctggtctggtcaagcaactggcttgttccagtatataatctcagat +agactgccctgaaagtagacaatgataaatatgtaagagcggggaaatcccatcgtcgac +tgtgttgcggacgattagcttgcaaagagaggtgtgagcggctgtcttaaattatggact +cctcgcttccgtcgaacgtctgactagagaatctcttggaggtacacacgaacgtaggtt +cctcacagtatgtggcatggacaccggacaggtcacttgtatttatccattgaacgtgat +atagtgtgtcgagtcgttatacaatacatactccaagcgtactccctttgggtaacgggt +ttgggtacatattaccatggtgtggaccgatttgtaaccctataagcgttccgggtactt +taccatcgcggatgcgatcgcggatctacctatgtcagcgacatactgcccgtccaaaag +tgattcagtatgtgttaatcagcgtattgcatcatcagtcattgagagtggaccgttctc +gaagagcaagattcctgaccctttccactgggccatccagtacacccaattatatgcaga +cgaaaagctccatacatatataatacctcttcacaccgtgtgcagagaccaacttgatcg +atattgtactcactcgtacggaataattagaagggcccgactgtcgagaccgttagcatt +tgcattatcgcggtgagcgtatagaaacaattataggctttgctgcgatcgcagtgtctg +ggacagagtctcctagacctagatcagcttaaaacaatgattgtaggtaatgtgcgttgc +cgtcgggccacacctttcagttcggttacaccgactcagaattatcttctatcgggaccc +tcaaactgataatggggtcaaatggtggtggtcccgtctttctgcagtgctttgtgagca +gaatagctctcgagcgctccagtacgcctgagtatggctgcgcccaccaattggcgccgt +taatgcgtggcgacacaagagaaccagtccacataagttatgcccttaagaagatcaccg +ggtttgcgccatcctgattcaggtaacggacgtccgtgtacacgaaccatactaatgagt +tctacatcgctccaacgcgtcttgaaccctatcgacaattacaaatgcaaagtattagtt +gggtcagtgcgtagcttatccaagggctgcagtaagtcgtccccatgacagacggacggc +ataagggccaaaaattccgccgcattagctgttaataatgccatccagaaccggacagtc +tcgatatataacttacggctgcgaactggcccttatgaattacatccacgtgctagttaa +caggacggatcgcccggactaattgccgatcggccgtcccattctccgtacgatgtactg +aacccaggcgtgtgaatgggtatgtcaacgtttacccatcgaccctgcctatagacctga +gtttcattccagttgagcgtagaatgggatgagcagctttgcttgaggtgcgatattcgg +gagacctggtcagcaggattgatggttttatagtgctggattccctgctgaaattctctc +ttctgccgcatgtgaagaaggccttgcttcccttccacatgattgtaagatttcctaagg +cctcccagctgcgtggaactgtgagtcaattaaacctctttcctttataaattacccagt +ctcaggtatttccttatcgtggtatgagaacggattaatacagttgtgtaagccagctcc +ttataataaatctctctccctctctctgcctctcatctatgtatgtatgtatctgtcatc +tatctcctataagttgtttcttttgagaactctgactaacatagacattaaataaacaat +ttgtatactgaataattatataactactgcttgggggtgtggttgtgttgtgtggtgagg +gggtgtagaaatgtctaggggttgatctagcctaacaccttccagatgaccctaggttct +ggcctttccccaaagagtcctggtctactcagtcatctcccacaatttggccatcttctt +gggtgctcaggacaataaatgacccagccagatcctctagagtcgacctgcaggcatgca +agcttggcgtaatcatggtcatagctgtttgctgtgtgaaattgttatgcgctcacattg +cacacaacatacgagccggaagcatacagtgtagagcctggggtggcgtatgagtgagct +aactcacattaatttgcgtttgcgctcactgccgcttttcagtcggggaaactgtcgtga +cagctgcatttaatgatcggtcatcgcgcggggagatgcggttttgcgtattgtgccgca +ggtggttatttctctcaacagtgagacgggcacagctgattgccctcaccggctgggctg +agagagttgcagcaagcgtacacgcggggtttgcccagcagggcgaaattcctgttgtga +tgtggattccgaatcgggcaaatgccctataaatcaaagcatagtccgagatagggtttg +agtgtgttcagttttgggacagaggtcactataaagaacgttgactgcacgtcaagggcg +agaaacgtcatcaggcgattgcactacgtgacatcaccaatcagttttttgggtcaggtg +cgtgagacttatcggaactaaaggagcccgttttagcttcggggaaacgcgaagtgtcgg +aagaaggaaaacgaagagcgggtatcgcggaatgtacgtgctgagcgaaaccaacgcgcg +ttacggtcaagcgtgtatgtgttttggaggtaagtttccctgataaagcggaacaggggc +tatgtgtttacgggggtcgcatggagtacaagggggcaggacaagatttgcgcgacatgg +ttttttttaaattgcgggagatggttggctgtcccgatgagattagaacctgcttttgtt +ttagtttcggttcggtcagttcggactttggattggttttgttgggtatttaagaagggt +gtttgtgggatgtttttttttgggtcgagcatcactggactatgtgtgtcctgcgtatcg +tggcggggcctcgaacttagaggtaggacgattccgatgcaacaaccttatgctttactc +caagcgatggtgaggcaaccttgtacagaagtgcaaccgccattgtggctgggtcggccc +aaggaacggatattctcctgggtactgacaacccaggtctactgggttctatcgacggta +cagtcaagcctcgagtttactgtctcccacttaagtccgctctgggcattaatgagtctg +tggggtatcaagggtcacccaacgaagtagctagtcccgttgtacatttcgcgcgttacc +tagggagcacggtgagctacgagggtgtagctgcacacagcacggtatataggaacgcaa +acatagtagtatgtccctatgcataacagggagaagtgactctccgacggtcatttatcc +cagactctcctcgctccctactaattgttctatatacaatcggagtaaattggtacctct +ctgacaacataggggggttgaagtttatgccacgcagtctgttacacttttgccggggaa +ttgtgtagaccatgactcaaggtggtggtgcgagttactctactatctactgcttctcat +tacacatctcttggcttacaggccccagttatcagttacgaggctgccttaagagaaggc +caacattcatgatcagatccccgcacacgggatgatagtctgagatctgccggacgctcg +tctgctacaagtgtgggttgagcatagggtaagcctaagggctcgtaatggtacttcgcg +atgtttattcgatatgagctacaaggtataacgttgccttcaccatttcggctcacgact +cttacctcgcctcaccgctagacaccctgaccaaccgttagggtactgacaaccgatcag +gcgactcctaaaggacctctcagcctcccagacatgaggtccgctcgcatgctgttcagc +gagtccatatcaggaacagcaacgagacaaggcgagagcaacactagacttggagacata +ccaccacatctgtttactcttgattcaggaagacctgtggtaactgggcgacgcgtgcgt +ttatccgtcttccaatctccacagaatctgctccgtcagagggatgtatgactaacgcac +tgattttttgttcagtaaccgggcgcggattacggggcgtattccaggggtacattcaac +gggaccccaaggaaaagttcggggtatttaaggaggcggtccaactctcggacttattgg +gcgacgtaatgataagcacacctctgctcatacagtgcacgaagaccggcattgttcaaa +cacagccgtccattccgcgactattgtcctgtgtacaggtgcctcgggtcccaaatccag +cttatacccaaaactctcccggacttttttcgtccttgcaggaggaaaggacctgactcc +acgtttattaggggatcgttgggcccggacaatcgtgtattcaacataataaatgggttc +tagtttaaagccggaggtgacggtggattatggactagaggtaaacatttccggcgtagg +tcagaaagaatatagaccctaaatttacgcaaaacgtgcacacgattgtaggtggagtcg +tattaggaactcagggcgggtggaacgagtgtgttttaggcttaccatgaaccgtcgcgc +ggaaaatgatgacagaatggacggtgcttttttgcggggccaacaaaactcgcttatgtt +cgccattggatgtaagtaccgctatactacgcagcgaccccttacgacattgttgatttc +caatgctttcatggaggtttgtgagcggtcgctaggaatcttcctccagcgagtagccag +ctggccactagttagcaaccagagttcatatgagctccagtaacacgaaggtacataagg +aacgcaagcaagttcgggactacatagaacttggggtgcgtctaagccggggatcttaat +agacaagaggccatcgtatgggtcaaatttcatgtttcgtcagatgccctatccgtggac +acctaaatcaagcatcatatcctaatgctatttgctctcgctttggtatgattcatatgc +agccctgtccgtaaaatgacgggccagaggatacctgtcactacctatttcagattacca +ctgttcgaaaccttgctctgaaatcgatcttcgtagagtgttcgttaatcgccgcgtgaa +ttatataatcccccaaggagtacccttcgtcggtgcagtctacgtaactttcccaggtta +gcccccatctaatcgacgtacgtgagggggctacgggagatcgcacaagccgaagcattt +ctgctctgtttcgttacaactggaatcctcatcacgcagcgctaccggatgccatcccta +gtcatccccgcgagtttaaccagtcgagatggctcgaaccgtgtttcgaaggctggctat +tgaaccagttataaagcaggggcgactgtccgtcggacttcgatataaactatcacaaat +ttggcataagtatatacagccaagaaggctcagataggcacacgcacccaaatagtgacc +gcctacgttcaggttgcccggcaacgaagcgcgcttgctccattaatccactatcagagg +taacgaccctctttcaccgtagctgcccccatgtcggggcaacagtttcccaccgataac +gtgttctgtctagtacgtgaaacggattggctaacccctgtcagcctaattagatgacat +cctcgtacctctagagaaggtgaggagaccgctggaacataagtaaacagtttaccaaac +aatgatcatacatataacagaaaggagagatgcccggtggggtcgaagatacagctgtgg +ttgatatctgcaacggccaggctgtcatgaagatcacgcgcacgaagctatttatgaaag +atacccatgccggggcggcagcggtacctagtcctaaataccgacacgtagcaacgcgtc +ccctgaggcccaccctagtcaagggaacttaaaatatacgctgactttgtctaccaatca +tcttcgattaacaccggcatactaagtctaccctggacccagcaatgagaaaaacttttc +cgaatgatcattgtgagtttacagagattaggaacaccaaaaaaatttacgtacgtccgg +ttacccctgtgtgacccttggccacaaaccgtaaggtgcagcatgggcgttgagtccagg +gtttgtgacaccagacatgaataccctgtggcgggttgttagcatgttattcggatccga +tttcagagggtccgttgataccgggcagtacaagacaccccacaccactgaggtggtacg +tccgccagtctgctccctacgttatgcaaaattccttccccggcgttcttgcctgtacta +ctcctaaagggccgtgaaatccgacgttgctgctccgtctcgggacacccacacaacagc +tacggaaaatcgtgaggatgcacaagggtcttgcattgttgatctatacagctcttcgca +cggtgtgctactgttttccacaatgggcaaggggcgtgtaggtcttatgtaggagtaccc +cgtgatctggctataccttgctatctattccaccaaaatagccggggtcttatagtttta +ttccggatctatcaagtgacaagtccatggggtaaacggtaagtttcgtacgctgggcgg +tgatccccgcttataaacgagcaaaccgccaaagcaaccattgccgggcttccagctagt +aaatgttgggtgtcaatcgtgcatgtgactacttacccacaaagggacgcttgaagcgcc +tgaactcgtcacgtcatgcctagctcccggttgaaacacgaagacgcgtgaacctatctt +tgcttactattcgcctcctttaagaggcttcttgatgtggctctgcgacatggacagtag +tagttgtacctgggtatgttagtgaaattacaagtacctcaaaaacgaattacgtgtata +cattgttgcggagttgaacaACGGCATTAGGAACACTTCCGTCTCtcacttttatacgat +tatgattggttctttagccttggtttagattggtagtagtagcggcgctaatgctacctg +aattgagaactcgagcgggggctaggcaaattctgattcagcctgacttctcttggaacc +ctgcccataaatcaaagggttagtgcggccaaaacgttggacaacggtattagaagacca +acctgaccaccaaaccgtcaattaaccggtatcttctcggaaacggcggttctctcctag +atagcgatctgtggtctcaccatgcaatttaaacaggtgagtaaagattgctacaaatac +gagactagctgtcaccagatgctgttcatctgttggctccttggtcgctccgttgtaccc +aggctactttgaaagagcgcagaatacttagacggtatcgatcatggtagcatagcattc +tgataacatgtatggagttcgaacatccgtctggggccggacggtccgtttgaggttggt +tgatctgggtgatagtcagcaagatagacgttagataacaaattaaaggattttacctta +gattgcgactagtacaacggtacatcggtgattcgcgctctactagatcacgctatgggt +accataaacaaacggtggaccttctcaagctggttgacgcctcagcaacataggcttcct +cctccacgcatctcagcataaaaggcttataaactgcttctttgtgccagagcaactcaa +ttaagcccttggtaccgtgggcacgcattctgtcacggtgaccaactgttcatcctgaat +cgccgaatgggactatttggtacaggaatcaagcggatggcactactgcagcttatttac +gacggtattcttaaagtttttaagacaatgtatttcatgggtagttcggtttgttttatt +gctacacaggctcttgtagacgacctacttagcactacggccgagcgcaataacccccgg +aaagcacttgctactgggaggcgggtttatccatcggcaataggggttatcagtactacc +aagaagattgtgaagatattaacagcattgaaaaaagttcggactgggcatgaaacgtgt +gtcagagttagagtccttgagggactgaatgggtttgtcccaggcccaagcttgaggtgg +atgtcacctcgggtactgcctctattacagaggtatcttaatggcgcatccagccttgtg +gctgggtctacgtacgcgtgggcaccatacgtatgttggcaggaaaggtcaatcatgctt +gtttcctcgtcgcagaaacgttcacactattggctcgcgggatcgaacgggcctgattat +ttttccagctcctgcgttcctatcacgccaactgtcgctaataaaatgttatatagagat +aacccattgctatgcaaggatggagaaaccgcttcacaacaccctagaattacttcagca +ctaacatctaagataccgggaaaaccgtaggtgccacttggttttgagggcaatgcctct +tgcactggcgattcgtggagtaaccttgctaccgatttccaccttttctaggtatgatta +catgcgatcgccattgtcagtcgtcgtacgaaatccaggaaggaattcgaatacatgacc +gaaagctatggcatcataagcgtggctctttactaaggacacgtgtagtcggctgatttc +gcgcagaacttcgctcaccggacagtgactgctgtccgaacttgggggcagcgtagattc +tagctagagaccgcagcgaaaatgccactcgctaggtggctatggacgtccagctatagg +cccccacattcgtatgtatactccggtaattgagtctacctttcgaaagatcaaagttca +caaaccttctctcacgttaacatagatgctcgcacatagctagtccggtgataaagcggc +cgtgcatgcgagtatttagcgcacggaacagatattaggctgcgaaataccctcatatgc +tacagcgcaggtaacagacggttgatctccccgtagaattccctcaaggccggatcgttc +tcatgagtagcctttgtctgacatttcctctcaatagattgcagactcctgtgtcgtggg +aaaacttcgcggaatcgctgtcgttacataaatctaaacagtgcagtccaagctatttac +taccacgtatcataatgaacatctctttgtgaaatacgccggtacgccgagagatcgccc +acattgcgtgtcaccaagacccagtgtctattgggcgcgctggttatagtatgcggaggc +acccgatgtgctgctaatcactacaaactcgacaccaagaggcgaccgcgtgcgggaggg +ctagaacgcgagagccacgtcaacgtggtggtaccgctcctgatgatacgagcactgtgc +tggcaccgctgccctatgtccagctaacaggtgtcacataatatcgcatctatagttgag +tatcttatcgctagcgttacttgtgagttctcgggtagaatcgtcgtagcattctagtcc +ttagcgtaagcaacgatatcgccgatattataggggcaataggtctcacccaccacgggt +gtatatttaacgccctaagtagttaacggagactattaaacaattatgcacgtgaaagat +tagggtactgcacacgtgtcacgttgacgatgtaaacaccataaaggttgttctgtgatg +cgatgcccatacctgcggtgcaacgtcctaaacttatgcggatcaccttctaattcagcc +gacgttgagaacgccagctatactctgtgagtacaaggtgaaagccccagatcaaaatat +tggagtcttgtccgtagctcttgggtggagagtgtgaccacgtttatcccttaatactga +gactcttctcgttccacgccccggacattcgcgatacagcctagtttgataggtggctac +aagggctctatccgaatagcacaaaactcagtcctagtgcgtataggtcgtgctctgcgg +ttatacgctccacagaagaaagtacccactgcagtttgtcggtgggacttagcaaaacct +gtaaccaaaaccgcacatggactctgttttggtggcgtggagtgtgcccgccgcctttat +gctgggtcaaaatactatatgatttgttgtggtcgggcgcgacattggctcttatggttt +ataactattattcggtgcacagaaccgacttatgccccgattttgcacctcccgagagaa +atggtactagtcattgtctcggggttttacaactcaaggataatctgccagcggtacccc +gaaaaatcccatcccgaacggctggtacctatgctggagaccgaaatggagccagtgcta +tgcaaaccctcgctctttctatttggcccgaccagctgcgagagtcattcgacatacatt +gcgatggctggttcatctctctgcttcggattccgatcctgctgcctatggccacaacac +gaaagagatcttggatacgtcctcaccatagtccaacggacaaatatggaggtgtacgcg +cacggatacgagtacgacgggccgcccaatgctggtccttcgtgttatactgtttacttg +cctccggtaagagtgtacagcttgtacccacgcggtggaggaccttacgcgtcgtccgca +ggtgtggagatttcgctacctgttgcattggggcctcgccttacgtttttttcgacggag +gcccgacccgccaggccagaccctcatcattgggatttttactgccttggacggcagatt +ctgatgctggtaacgcgcttggcacacaccctggtcgtaattacgtactatcacctctat +tttaccaggggcgggccccgcctcaacgatcggtagtctcgttagaacagttgcttatac +tccgttagcactcacaactcggagaatgagcttacacagtccgtaatagtctccacagct +tcccctggaaggttcgtacaggggccctggggtctaatgtgctaccgcctaacttcgtta +gtgtaaggtctcgtgtgcacctccaataacgctgcatttttgtatagaactcctttatag +gcctgactcttcggaacagcccactaattgacgtgcacgatgctgcatatacccttctca +atgacgcataccggtgactaaatcctgtggctggttgacactttgcataacccaccacga +aaacgcggtttgcacgtggttggaagcgagtaccggttaagggaagttacgtaaacccaa +catagtgagcgatgcttaaaacactgcatgcgaacaacgaccggaacgagagcctaatag +aaccaaatggataggtggttacgaaatccgcgcacaagtgtcgtgccactctcgtaaaga +atgattgcttgcttatctatgagaaacctaataggcacgcacgtgtcgccagggaaaaac +caccatccgacaagacgctgaaaatcgagatagatgcagcccgcgcgtactttaagcacg +atagccatcttgagcgcgacgattcagcttacggagattacttctcaaagcggacacctc +gacgctgaagctctctatcgatgcacttgcatgtccatctacggcttgagcgaaccatgc +ttaacgcttggatgacgttgttagtcggattcgatcgtaccatactgtcctatccatcat +aacttcccgaattaaaactcattttctaccctcatttgtttcattggcgcatatgagcgc +cccatgggcgctgatcgacacaggcttgtagcgcacggctcgtcttgcagtagataacca +tagtctttacgtcgcatatattaatatatcctcagacttccactgcggtattttggatcg +tggcgtctgggacagtcacactctttaacgggagcgcgttcaatgtctgagtccatccgt +gcagttcggtgcgattttattcttccctgcatcttccggattccttcttcttgtcggaga +attcgccgctcgatcaaactcatcattggtacttattgaccgtttcatgctattacaccg +gtacactgatgataacgctgcggttttatcccccccaatacgcgcacacacgcttctttc +ggtgcgtcctgtcgtacccctattgcgcatcatggcactccagccgagcaatgctttgga +caggtgtaaccaagctggatctagcgtgggttcgacacagctcggttcgtataaccacac +gcatgaactgcgagtgcctcgccccagcgccgctgtctacttgctgtttagaggaagaag +caacagcttgcacccaatccgcatatctgcatataggtggccgttcctccgtggcgcgcc +gctacgttgtagcgcacggatcaaaagcgctgtgttactatacactggttcggagacggt +tcatgacgagcgcgctatatgtcggcatctgcgccccatgagcggccgctgtccggcggc +acgaataatatagtgcaagaaaaaccgaagactacggttatatatgatggaacggccctc +acagcattctaacaggtttgacaaacttaataaatgatgggccgcgcctgctgtgaatcc +cggacggtttggccggaaatacctaggcagtctttggaaaagcttttcctagatcaccat +atcgttgtcagtggccaaggtttcgttaactctcggcgtacccagtatcggcgcaatagg +cctttgatcaacccttggaagattagtcgatcgtaacttcctacatcccggtgaaaggct +ttaattctaagtcttcgccacaaacgcttcaggagcgtcgagttctatcactttcgaggt +actgccacttactatacaccggtacacttgttaagcaagtgtttgcggatgtggttaaat +tttgatggcagatttctgggtgttttagctatagctgtatcctcgaggtcgtcgtttaac +cgctcctgttgctagatcatatgtatcgttgttcgagacgctagtagtcgctcctaccga +atcttacaggttcgatctctgctcggcttttgccgcgggccggtgcttgtgctataatta +taatgataagggcagtggccgcacaactgcagattactgacacttgagtgagaactaagc +cttgaagcatagtgttgaatgttgtagaaaagtatactgtgacaaaaacagggcctggtg +tcaagtgtcctcagtgatctggatatcatcacgccttgttagcaggatttacccgcatag +taatggccggactttatattgccctgctgcgctagctagtactgcgggggctctcttccc +cctattgatattccgggcagaatgcgcgggtagtcagcattcatgtcaggcttctatcaa +cgtctcattcacccttggagtgtgacctacgtgttagaggcaatgtagcccgagagcccg +ttcaaagacaaactcccgaattaaacagacaccggttatgggagtgtgagtagtgacttc +cgaccagtgtttggtttcagcctgtcggttaacctcgcagggctaggagaatgagctgct +agtaggtgattaccgaagtctccccagaaagggaacagtcttatagagtagagaatgtca +aatagcgttattgagttctgtctactgcactaccaagagcatgcccaccagagatgcgtc +gcagtcgtagcgtagacgtcgtaatgacccaggtggcgttcggcctattcgcgtcggacg +cgcgcgctactacaacgaagggttctgaaagtgcatgttcacactgaaattctaagtgtt +agtaaacaaacgcgtgtattccagggtcgtgtgtgacattatggctgtctgcgcccctca +atgatcatcaagacgttcaattgtatgttaacgtagatatcaggtttagttatccgtata +ctttttacgccgcgcgcttggaacagattctcctaacagccctcgcggtttcaaaaagaa +ccaaagtctataccatccttgttcccaattctgcctggttgcggagaaaagaccgcctcc +atacgtacccgactcggtattggtaagtggggaagcagtcgaacgcatatttcttggtta +tatcacaggccacgttctatatcggaagtggccggattacgatttgacgttctatccccg +agagcgcattcttgtttgttactactaccacgcgggcgcttcttattcccagaccagagg +gaatgtgcggaagctttttccacagattggcggaactccagcgtgcttagtgcaggcgga +gaacgtccgttcagtggtgcgtgctttatttttcaatctgacccgacctgcgctcaaggg +ttgcaagttgttgtgcgcccgagtaataggcgactcgtcgcaatgggtctggtacattgc +attttcatcggtacggcgcttcataaagtgcggcaaatttctcaccccagtactcatgtt +tatagggtatcaggacccgaagcttctctgttccaaagaaatgtactgtttggctcccct +gtccatattggaggtagatcacttgtggattatgcaatgaatgaatgaaagtttggtgct +ccccaccggggcgctctcaaagagagtgagctaaatttgaacatttaaattgctattcca +acccggagtcctgaccggaacagtaatgaaacttcaaccatgccggacagactagaagaa +gggaaagttgcttgtatatgggagtaaaaatgatgttggtgccgtaatggtgccggaagt +gactatagagcatgtcgtgacgcaccggtaggcagtgctataatcgtatgtccttcaggc +gccgccggacctacgaagctgaaattagacaccggcacactagccccgtcagcgacggtg +cgcggccgctgccctgcagcgaatggggctaacacgcataaaacgcccgcataaccactc +gagctacgggaattcactcaggctgttgcttcgacgtgtagtctcattacataatcataa +tacctccaagaccaacggctgctcatgactctcttaccttgttagggacatttcggcact +agggaagagctgaggactttgaaaacgtcgataaaaccatcgcgggaactagctgcgtta +gaactccatattttacgggtcgcaagcttgaggtcctgtcccggcagctgcaagtgctac +ggcaggaggggatctacctaacgtgcagtaacgagcccctgcccgtaatgaggcgtactc +gtctctaatcgtcagtaagttactatgtccgaggacgcctctacgagttgaactctggct +aggcccacctgtccgcgccctgctcgggtaccccatctgcttatccaacttcacctcgcc +ttacggaatctctggttgccagtcatccgatggtcattaagcagcgtggtacatcgtagc +caatacttcagggcgccagccatattcccagccaagcggctgcataattacagcgcctgg +cacgactaatcgatcccacaagcctggtagatgacccttagccctaaagcgccctctgac +ctatctgcacgtgatacttgattatttgtaatgagcggacagggtagatgactaatatac +agggtcgtctaggtttgcacaatgcagacatcatccgcgcaaggcccggacggctgtact +cacacagctagctccatctccctcagcagcactaagattcccacgtgaccagggcgacgg +gcctcagccaaacgtatccttgatatctacttaagtcaaggttgactccgaaccctatgg +gtcggtgccgttaacagggagtctatatctcggcgttccattgcttgtttcaaactcctg +ctataaggtgaaagcgctggagggcatagtttatgcccaaagttgcgcgtagatccgtcg +ggatatgtgctataataaggactgctcgaggtaggcggtaacggctcccgccttcagtag +gcgcggaactcgaatcggagttacaggacttgaccgagtcatatccaagtttatgttacc +cgatcggatccggatgctcgtatctgcgacgaggtcggaagacggacgaaatacgattca +accgcgcgaaccattagcatctaacctttagcctcaatgggtgttaacgtggtgggctca +ctcggcgtactctttgtgcaactattccgtatgaacaacagtcaagttgcgacatgatgc +tcttacgtgattcccacagtttcccacctcaggatgctttctttagctaaacccaatagt +tatggcggcaccttcagactcccacgaggacggctatgacgttgctaaaccattcgccgc +caaaggctagcgctaacgagttctgtgagtttgttccgggccagatctccaggatggtcg +caacaacgcagtaccggttttatactggtgaccctctacctgttattaagttacagcgtt +gtcctacgtacatggtcgtgagtactcgcgtagtcaaacgccaggactagcagcgagaat +tattgtcgcgatacttactacaatacttacccgatattgacgtgcagggttgaaagagat +ggacagttgaatatctattttgacggaatcctcaaaactccctccacctcaggtaacggc +cctgtccgggaccgcattcttgcatatattggttcccagagcgtatctaagttagtctct +tgaccgttcaccgactctagggcgactcgttatcgccctccgaaacgatgctttcgttac +ctcaatgatgacaggctgtaacgtaagtgatcccaatctcactcgtgccttgtccaccgt +tccgtgaagacgaagcaatacgcggaatacgtggcttcgtaatattttgacgatatgggg +ctgggacgctcaagacttccatgacaaacaaagtgaagagcaactgcatccctcatcatg +atcactattaccagagtagcgatggataacgctaatttggtcagggcagctatcgcatcc +cgcaggtgtaggcggagactttttcttttgttgcgagttgacaggtaatctcacggtata +agcacggttatttacgcaagcgacgtccctgggagaatccgcccacgtaggaccccataa +tccataaatactgcggtcgaaaccttcatatcgtgacagaaccgctttctagggatgcgg +tccccgcattcagagttctactttggccagcgtgagacttaacaactccacttacgcggt +acattgaagtcgttcagtccagtgtgacctgtgtaccgaataacgtgtagaccagcgcgt +ctacgacttagcgcggctccactccaaagcaccttttgggactttccaacgagcctgttg +gccgttaagcggtatttcacaaatagatcaccctagtgtcggtaaccgactaccctattg +ggatcatcgtgagctcgaaacactagaggcggaccaacggatgacatttgattcggctct +acagagcttgtcgccagagaaaaactgtggcaatctacgctcgcggggaattgactttag +cggcccctagacaggtgtgggacactagtctagattcacgtcctacacgacataacagca +ccttcctggccagcccagaaatagtacctggacgacatccagccttccgacgccataatg +tgagccgtagcgcccacgacgatcaacgaggagaaatttacaaaggctgtgtgaatgcta +cgtcgtctaccattgctcatcgaaacgaacgcaacgcacagcatacaacgtttaccatgc +cggagcgggatcctcaagtacagaaaacagaggtctaaacatgatccgaacaaatcggta +ggtttacacagctacctcgtccattggcgtactgcatcgatcgtgcttactacggtcatg +ccggcccgcgatgcacgtacgaaggaataccctgtctgcccccgcgcgagttacgctgtc +tcgcacataccgagcactgtcgttcgaagctaaactatgagcccagccgagctccttatg +gccgcaacgctggtgcggccagctgataaattccacagtacacgatcctcgtgtaagatc +tcgggcatagtaagtcatttcacatggttaggagagatagaatacatggttctggtagct +caaccaggatttgtggaacccttggcccttggtgagtgctacaataaaattctccgtatg +ggacaaccaaagggtgctggatgtgacttcccggcccaggttagatgtccatatcattca +tacattgcccgaccgacccaatgcctaaatcagaggcgccttagctagttcttgtagtgt +gccacgtccggccacgcagacacgaccctcggcgagtgatcaccattaccggattggcat +cgaagtctttttctgggaagttagccagtttggtgtgcggtgcttagaatcttattccca +gtcaaacgcccctgggacgaattgctaaccctagttgccacgccggaaccatcttcggga +gagtagacaaatccgagttagatatgttagcgtcttcgtgagtctgaaatgtatcacttc +accgcagaatacgcgaatgtctgtttgccctggactgacggaattggcttaaaagccgac +tagagcattttggtacggttcctatccgcgatgtaattacctatctaggttatcgctaga +cgaatagcgagtacagtgtagcaggccctttgttagcaagttgctctaaacagttgtcaa +aacgtaggcacaatagtgcgattcttctaaatccgggaagctcatggcgctgggcagaaa +tatcacatacgggaataatcaacctccattttggttcgttttactcgatgagtgcccctt +gcttgagacgagcgttctgagttgatggcatgtcgaaaggtttacgcggtgagtagagca +ctttacccctacagatcggaatcctcgaggaggacagttggaacttcacattaacctttg +ttcgattgcatgaaggttgtgttctgggagtaggctcccaaggtagcggttcatgctggg +ggcagccctaagtttgtattatgtgagtttgcgtctgaaactacatttagcatgaggaac +gtaagctttctggagggatcttctaaagccaggtatcgcccgctacgatgccggagccgg +tggttcacagctacctgtgctcaaaggcttaaggctaatcatagcaacagtgcgaaagga +cgtctttcagatttcgaaaggtgctgacacaacaagggtcagggcggtcctacccttctg +attccctacctggttttttagcaagggtcaaggctaggcttatactcccgaacgctttaa +acactatcccacccctgacggggggaagttgcgcgttaagtataagaataagatttaaca +gtacactttaggttcctcttccgcgagccgtcatacagcaccgagcgccgttgaaacgcg +attaacgcgtattgtcgtgcgaaaaaaaaacgctcgccagcatattggagtgtcgacttg +aaatattgaacaacaccgcatatcaaggacgaatagtagggcttcactacctccacctga +cggccctaggacttatactcgaaaaagaccttccatcacgatgtcccttaccggcgagag +ggctatatacgcatgaatagcagatcttgccgtcgctgagtgtcacccagggttgctcca +gaaaggagatagggcggagagccatcgacagcagctctcgtctaggtggtagcagctaag +gagtcgtgtcgtcgcgccgagttggaacattatcgatgtacatcaatgcagtaatgatgc +tgatagactcgggagtttcctcaaacccagagttacgagaagacgcaggtctatcagtta +gaaggagtcagtattggcctttgaaagatcttatgctcatgcccaatcgtagttaaacgc +gaatcgggaaggccaatctggcggttttgacccccggactcttaagacgtccaatgtggc +tagacataagtaacgaattactctataccgaggggcgggaaccggccaatttattacgag +agcacgagagccttgtagcggccagcacactatcctcgagtccctctatcctgagacgta +gatatacatatacgcctagagagaatagccgtctaggcttccgtcgccctctccgtcgtt +cgcgtgaaccgtaagtcttccgcattcccttcctcaagcgcgttggtgtgagagtggtat +tgaggcccagtcttataacgcatatacttgtgcactctattacttaccatgggaaccaat +ggcactctcgaatcatgctcacagctgagcaacggtgctgctcaccaattacatatgagt +cgtggtttagcgttggagcggaagatgaatttccatctgttcgcgcgcatcactaaccaa +tatacggttatcccagcgctatctagttctgaccgggttggtagcgaacccttttgcaag +ccggcttagtggatgtgaagtgggagtgataacttaagccgccacgttcgggggggactc +gtttatattggtgctggaatacgaacggcgtgattcgtagtcgccctaatcgggcgcgac +aacacatgtagtactgtcgaggcggtttaaacccacagtaggtactctatcagcagaatt +atgctagaagtttcacaacaactttccgcatgaggctcagcggcagcgtcgcactcccaa +tggccagtgccggtagcgatgtttggtggaattagttccttcggaatacgaaccggattt +aaagagcctcggagaacctaaacgaatccgtacgcatcttgcccaaggtgctgagccttg +tcgcctttctcagttccacctacattaatgcaatgcgttcgaagctctgaccgcaaacag +gaatcaagttcagacagagtgcaagagtttcgcaataattgggaacgacccacttgatat +aggtgcttttagagatgtgtgtacgaccgtccttcgagcatacctacgggttacaattgc +tccggtaagtcaaggcacatagaaaacatagccaactgagagtgtatacaagattacctc +atgtagactgaaatacacacatcgctttaagctctcaaccgatgtagaacagattttggg +cggcgttgacagcgtgcccgctcaccggtttgctcccttctcaccaaataaccatgagac +gactttggtgactggactgccagatgacgggctacaaccgttttggttccgaattcgctc +taactcaactaacatcatactatatgcgccaggatattctcgcggttggacccccctgcc +aattcgggttaaaaccactccccccatgtagggagctgccgcaattacaatatcgacgat +cccagatggacgctcacaaaatatcagtcctttcacgatccgctcatatagacggatgaa +gggactgaggctgttagatagtgacgtcgagcatggcgtagacgagcgcaaccgggtcga +ggcccgcattaccgtgacacccagttgaaaggatttacactgcttcattcgatatttacc +actttgtatgaggagctcaacctaagtcaacacggaccatcatacaggtcgccagtaatg +agaaggctgctgtgccatggagaagcgctgctacagcacacaacgaacatcttgcaatgt +gaaggagggtgctcttttgggatgagcctacggggatgtgtatccctgccctgtaggcag +ttgggacttagcgcgactatctagataactaaggcgccagccgcggctgtttgccgaagt +cgtgctgatgctgtacaacgaagggcgagcgtgttaacatgctacacgttgacctagact +agtccaagtctgaaagtcccaatttaggtcgggtagtacagtcctcggttccagtcccat +gttgtgccgacaaggacaagcgatcatcaaatcgactgaaattgaatcagctacctcaga +ccacattcagctctcggtaacatgggaggcttgtggttgcaccgtaaaagggggatagcc +catccatcctgtaaacctacaatcgcgcgtagcttaatacgctcacattagacattcgat +cgagagacctggtttcaagagccttcccttttgctttagtgggccaaatcgcaaccctgc +tcccctcccttacgccttatacacttcagtgcaaattcatgcgttcagcgaacaactgga +cttctgttgtacgtagtccacgggggcttattcattatagaaagccccctactgtcaccg +ttatatggttcacacatgagctgatcacctagagagtcgtcatgcacattcgcctaacaa +ggacatatgagtaaccgggaggggatatcttcgatttgcagcaccaatcgacgttgtact +ggtctattgtcggttaggtccgattatccgaccggcaatgaggcaagcccatctattcag +gaaacttaggcagttccctgtgctggcccgacgtcgatgagttaagtctatacaggccgg +ccgcgagtagttaacgagaccaacatagaactatcatactagccggcaatgatcaatagg +gtcttagtgccactgtccttcgagccctcgcctaatttagcgcgaccggtttcctattgg +cctgtggggttgcgggcgcgtccgctttaagaatggtccttaacacctacccggagatcc +attgcatagcacactctccccattagcctagacacgtcgtcgcccgtcgactttggctgg +aatttaatcgccggggatatcgaactttcacgccctttaacgacgaggaaacctaccgtc +gcctggctggtaaatgggtgccttacggggactcacgatgctgtgaaccgcccgccagtc +tctggggctcccaaaatccaggttggaattacggacctccgccggtactacgcattacgg +ggtggaaagtcctaagataggtgaatgaaagggcttcgctaaaccagtaagtcattaaca +ggacatcggcgtcacgtctcgcgggtttacacggcgcacaaatcctattcccatgataaa +caccttatgccaatccacatccctcgctgcctaataaaattgtcacacctgcgctactga +ctaacgtttacgcaatgagagatgaattccgacacccacgcttgttgcaagcacagccgt +atgggttctcgggtaaggtaacacgaggcacactccggcgcggccacttcggcccctccc +tgacgatgaccctcattggtcaagcatcagtcgaatgattcgtaacaaggagcaaccgac +tcagtagagagggtgaatctcacgcgctagcctgaggaccgcctaagtgcttgctgtgcg +tcgcggcagtcgcgaggtgcgggctaaagtaaataattactggtcttacctaattaaagt +tggtggttagggacaacgttaccactaccagggtgcgcccctgaattcgggtatcggact +atccagggcgccttttgcggccttaaatacctttttaatcacgctggagctagaaggcca +tcgggatagacggggttctaggtactcgaaaaaacaggcctaataactttattgcgcttg +gactaacctatgtacaacacgttgtagcatactatggaatgttactgacctacacggata +gcatttgttcgggagcgtcattgacctcccagaccctatgccgatctgcaccattcagtg +accatccacaagtctctaggtttagccaaaggtgacaggtcaagcacttgcgcatgtcca +ctagtcgattatgcaacgtctctgaacagttagcacttatctcccgccgtgtgactcacg +cagtgaacttacctatagcatacgcctactattgaatgttcgttgttctaacacagcgct +aatacctcactggcagaggtgcgcacgctcctagtatgggagggagtcaggtcagagtgt +atgagactgatttttattcccgataggggttcagtgaaatcgacctctcaaaagagaggc +gcagaattcgctgataagctctgctacgatcgctaaggcacgataagcagggcggtgaag +gttggagcaagataatatcacccggacgcgggtcctgtcgcaacgagcggccgtgagacc +tggtgcgcaccgtgtctcgatcggccgaatatcggaacccactgcgtgactcaaatgata +tttttgctatctgtgggggatttatgtcccggtagaactctgcttctagcagaggataaa +ctttacaaggacggcgaatatggtgtcagagcgccctaatgatcccgtgctattccgcgg +gccaccggccgttaatggacttcgggttagaaggatgggttattcatcttccacagaaac +gcccagccgcaatcgtgggtttactcgaccgcggttatctgcctacttagctgcattcct +aaaacaggattaaaaaggccgcgagggttgcgaacctatggttgagaacagagtcataga +gtcagatgcgcagggacggcacggatccacatggcagttaactaatattaataccccctt +agcctcgtatatgggcgtgtgcagtcttgtccactcgcggacgcgtatccgagcgattct +gtcttccaacgctattcgttaccactttggcacctctttgctaagcaggatgagaacatc +tcactcactacgagccttgactttcagcacgcggtacgagggcactgggcttctcgtcct +ttgctagatgtaggtgccttcccgccctcatgacgatgtcacgtctatcggtttattaag +gtcggggaccattacgagattaccccgcgaccttcgtccaaatgggatcacggcaacgtt +ccacgaggggcgcgttgcctgagccactcgggtatccccttccgatatccgcagaagtct +agctaggagcaccgccaagcattacccgattaagcaaagcctactcatcgcatacacggt +tcttggggtttgcgtcagatagcaacttccggcggcagtagagatgatattttatccgat +tgagcttgcccagcgcaccctcgggccccgtggctcttctcttaaatgtgccctgcacga +tgttagcggttcctactcctccccgagccctatgggtggacagactcgccctctgaggct +gcgtgttcaactggttccaagtccggcgcctgtggatctacgacgcgaccagcaacatta +taccaatgtctaggcttagctcgaaaactagtaagccttagaactagggtcgtagcttct +tctaaatgaagggcagcgtcatagccatccacgttagcgcttactcaatcgcctgtcggc +tgtcatgttaccgctgccgtaagttcgtgaacataaaatacaacacattttaggtttaac +aaggattgtttaccgccacgtactggtgccggtagtgaaacgaaaaacctcagcatcggg +aggaggagaacggaatccctaccaatcttatctctacttaaagaacaaagcgcgcggtac +atggcgcagacgagaatgaatccccgaacgggccgagttagactcctcaacctgtcgaaa +agttgcgatccgctagatcgtagagtacggacttaaaaaagaaaagaaggtctctacccg +agcggtgagcccaaccagttccaggttgctgccggattcttccacacggcggtgccatat +ggacgaccccgtactttgggcattctaggctacctactgcgaacgcctcgcgttcatgcg +caaagttttctctagataggcgcgctttggtaagcatagtaataggttcttcagcgtcta +aagcccgcccattaggcctggcgactctgctttagtggtaaagagatagcatcgatgtac +atcgatggagagagtattttcacgaaagtgcgcgccgtacactatttatcggcatgcgcg +ctaaactggagggtctaataaccagatcacgcaacgaggtcccatgtacggttcgcattg +cgaaagtatgggatactagaggttttatcgggcctcgcttgaggtctgtctgggactggc +gcacatcgctcgtcgcccagtcgatagcggggtgattaaataagaaatatgttagtgccc +ggatttggaaccaaccagtcccggtagcggtacaaaaagcctttcctgctagttctatgc +ttaaagcgtactcctgttacaatccgtaggcaacctgaagaggcaacctggttttccttt +atttcgactttgtttgccatttccaatgtgatactgtgcggcgaccttaatgctttttgg +taaaaccataccgagatccagcgcacgcgacattcagaccggtcccggtttggcggtcaa +cctcgtactctgcactgttcagctagaggggtctcctatcccgaggtaccggtcgtctaa +cgggtggttacaggggctggtcctactctaccaacagttaaggagggcaacaagttcgat +ggggcatcgtataacttgaatgccattggacaaataataattgctccacgtcccaaacct +caactgaccttgtacgcataggtgccacctgcacgcaaccgagctcgttcaagtgtcctt +cttagctggcgccgagtgaacctgcatctgagagtctacccaacgatctagtatcataat +gtctgtagccagcgactatgacacttagagagccgcctaagaaagtgtttgcggctcctg +ccccggtgcgcttgttcggtgggaggtcgttatatagaaccatggggatataatgaatgg +taacatatctgccacgttgacaagccgctattatgaattcagggttggatactattatgg +cccttcacggtcacttgtaggacggccccaaacaggattagtaaagtcggtggtctaagt +gtaagcgataggcaaactgcggttattcgcgtagaccgcttgatgatgtaaaataacagt +tttcatgtctttgcaattaccgcgtgtagtctgaggacttaaggccccttctcggatagt +gaaatagttcaggtccggctgttgacaggtgtcctgaccggaacgctttacagctcctga +ggagcgtagcgccctacgtccttcctgatccagccgcacccatagctagtaaacaagttg +actgcgagacacaaagtcaagggcctgggcaagcgcgggccggactgcttgtcgaatatt +gaagcgtactcgatccagatctgcgccattgagttaaaaggactatacgcctgtctccag +ccgattgcagaaaggacagatcctaatagaagaactggggctccattctctcaccgacac +cctcctattcctatcccactggccccattgctggtaacccaaacctctcacgacgattca +gcgctgcgattaaagagtggagtaaggttaaaatcggttggggcgagtagtgtttgatgc +aagatccattgattatcgccagtgggatggcggcaaaggtaccatacctcgagcttattt +gggtgcctcactcctcggggaaccatatagacttgcacttggcaaaatatggtcgggttc +aaccgaccttttatgcctggaccctctgctgagggcctcttgatcaaaatgcttgcgttg +cttataagttgccgcttgatgtccaggattattattccagcgtggaacgggaaatgatag +cttatctgttactcagggcgcctgaattagggttgccattacataaaggaacgacaaggt +gagcactgggagggcgcattcttataaccgggcatatgcgcggaacaccagcgttggatg +gcctacctccgcggaggtcggggtcgaaggcccccgtttcctggaacaataacactgtcc +cacttggtttgtaaagaacctccactcgtcatgacacggcctagcggtgttatcggcgac +gataatcatgggtctttacaagtgaatcaggcttaccaggcggaccaggaggaaacactc +cacgagtgagacctggatccggggggatggcatacatcccatacgctcactcagcatgca +cgttcctagcacatgctggaatcttgcaagctggacagagtgtattgtggcccttgagct +atacttctaacgccagatccatgtttgcaaacatagctccagtggcctattcgacggttt +agcctctgcaccatgttatggctcttataggtgttgggtcgacagtgggtgactagacgt +aaagagagtatgccgtggttgaaccgagacctaaaaagctcaagatcacgacggatatct +ttaacggataccagcaatcggctaagaccagtgtctactactcgtgatcggcaccggccg +cccgttatctggtgtagtagtcagccccgcatcacccgtgcctatgcgagccttgactct +atcagtctaagagcacacgtttagacctgagccaagcgtaggtcactatcgagtcaacct +taaccctagttgattaatgctcttgacgtgtatgattacaccgaccgcgaataaactctc +acgcgcgtgacggtttcctcgctagaagaagccatatactgtacacactgctgtgaccga +caagacttacctttggtttacgtacaggtggacagttgtttctcccctcgggtcgatagc +gtttggtcgtgattccaataagtgccagatgtcggaacaacatgtttccataaagacgcg +tgacatgatatggtttgctatgaagccactacgaaaatgccagtgcttctctttatattt +tgcagatgtggaagaagtgcatccattatagtccttttacgtacctggattctccgccag +cactgccactactttcttactatccgttggggggggacgctcaacagagcgcggactcag +gaatcagataacgaccggaacggggcatatgcccagcattcgttgttgtaaagcgattga +gtttgggctgctaaggggccggcagttcgttccgggatacccgcaaaatttatgcctttg +tccggtgattctaggtttagctcgatccacgaatacgacaatacaaggtttgcctcctct +ttcgtctatcacgcaagcttagagttgctaaaatttcgtagtccgtgcgttaaagctccc +tacatttctaagctgtacgacaccacactatcttgcaacaagagtcactctatttctcat +atccgaatgaatatcgtcctgtacacgggtggcaatctcggcaagatggccgagatgtgt +agcactgtcacgttcaaaagctcaaacttctgcccactgccagccctaacagaatctgga +gacatcataccagcgctgtcccatgtggcggagagttgcttcaatagaacgctatcaccg +tgggatcacatacgtcactactccgtgtgacactatttattattcctttacctccaatac +gcccgtccttgcatcgcattttgtagtaagacatcagacgacgttactgccacggaacca +taaaacgtgctgagcccacgtaaacgtcctatcggtgaggtccgctcatcgtacgactct +gaaatttggaaactaccagtttgttggcggtgaatatccaacctgtcggcatacacgctc +acgcgtatggttggtacatgcgaaaaactacccaagcaccgggcgcgcgagacactatga +gtttagtgatgatttacggagcacgttttttgaactcaacagaccgattgaatccttcaa +acagggttactcgttcgtgacaaccgattacagcattctgaacgtggtacgtgcacatag +cttggagagttgcgcgaatctctttcgtaccgtattctacctgatcgctagctttccggg +gtaacgacatcggcaatgatgagtagcagccagtatccatactggacaggtactccatat +aaaactcccgcttcaacacgcgagatttgaaccgcacagtgattgtgctgagtcctagtc +accatcccgatcttgtacacgggtaggggtgtaacgtgggcagatgatgcttacccttcc +gctggcttgtaaaggtgccccgcttcacttgatgagctgcgtcgacaagaccacccaacc +cgagccacgtggttccgacgactcaatgatttccagtatggtccaatcgagcaccttcca +ctcatgaaatttgagcactgttggggatcgagtatgtgttttgcagtgggtctgtagcat +ggaaagatgtaccctaacccggctctggcattatcaacggtggattgggtggttaaacag +cttcccttcggagacttaatggactaaaacgaatgaatcagacgccgagaacgagaactc +accatctggcccaggagccatatttttgattggtaaatcgctcgcatagtgcccgatacg +atgcgtacttgagcgtaaacggcgcagcctctaatcataggtgattgctaagtctacggt +catccccagtggctgacgaggaattaaagacctatttccgtacttgttgcgcgccttcaa +ttatccagcgtataccccgatggctactgctacatgtctaaagtgactagccagaaaaac +ctaaccctcgcccacgaggccttgatcatctcaatcatagagtaatgttcattgaattgc +acggctcttggtgtgcacattgagacaatttctaaaccgacaagtttaatggccgagctc +ctcctgcgtccagctggaccttcatgcaggcatgaaggtccatatatattgtcctcccat +agcccgccgaccgggtctgactcaactgtgttttcgctatcccaggctagcacttctatt +ctttgttacgtccagtcatagtgttactatagggtaattttagtcatagtagacggccgc +tttttcgtatggcccgagaccgtccaccggctacccaattaagtcacatccggatcttgg +gtctagatattcctatcgaaaatagtctcgccgcctcactgcgtagttcagggggcgtca +cacttgttcgcggcttttcctcatgggatctttacccgatggttgatgcaataaatgtct +acaccggactggcgtgtccgagacgactttatacacgtgtgacgagtagatcagatcgta +cgaatggtctgtctcacctatcccagtgggaggatggaaaacactcctgcctaccgggtc +gaattatttacgcgtgttacaatatgtaatttagaaaaagggattgctggtcgatgcgtc +tccaagggattttttatctaaaagcatccttttgggtgtactctgatcgcacgtcgcaga +cagcagtgggttttgacgcagtccgtaggcccacagactcgtttgttgtttattaatccc +aggggagcgttgaagccacacctattctgtagctgtttgaaaggtagctagcccggatat +tactcaaggtgactcccttcagaatcacacgtcgctggagtcgccacagggtggcatata +cgagtgatagagcaccttactttcgaggtagcggtacattagtgcaacgatgaacccact +atagtcttagtgatttcatgttttacttacgcgaaaacgtggggttttgtcaacacgtat +acgttgaatgcacatgcctcatcctaaactgatgcactgccacaagtctgaaagagcgac +agtctgcaacatagcggaaggttacgcccaagccagtggtgatcccccataagcttggag +ggactccccttagcgttggatgtctttgccccagcggcctcggtgtacgggttctccacc +ccactatggtttggaactatgaagaggtacggcaacctacccgaggcaccaaatcgtgaa +cctacgcctatatatacggatagcagggtatccattcttaccatgagctcgtaaaccact +ccgctgaattcgatgggctttggcgcacatcaccgtttctatcacagatctgtcaacgga +atctaacgctatttactcggcgcacacagatcggaaaacccaactgtggcgcgggacgga +ctccaggaatcgttacgcgttatcaccttcggctaagtcttgacgacattagagctatat +ggtattaatagtagctgtacatcaaatgataaaattatctgaattataagtgatagcgcc +cacataatgacacacacgttttagatagttagtagacgctcgagactttgcgagcaagaa +tggactgttaaccttaggggcgggttcccgcttacaaaagctgattcgctcctagagatc +tataagcgaagttcaacccctaattaccattgcataagaccgggagaacctgtgacacct +gttcccatgggattagcgaaggattgttgacttattgccgagtgacctagtattgattaa +aaatgcgacgtgaagtaaccaggccttcgatgggcgtctccgaatgggccagtaacaacc +atatacaaactacaagttaaacccgaaaccgtggctaccatgctcatctagtcgggttcc +cgatggaacattccacggtgagcggccttggatgtcggaccaccatttggcaggacaacc +gtcacgattcgcaacagcggttaaagcaagatggacgccaataatgatattcgaaagtgg +ggttaaaactggccgccgcttgatcggtcctacttagtagcgtctcagatgctagaacca +ttccgagtgcaatgtgtgctagcaacagtggaatcggtctataacggtttcatgatccct +tctccggccatccattgagaacgattctacattaatctgttaagcgaccgccaatcactg +attagctccagaaaacctaagattaccgtatataagaatcaacctgctaaagtaggaagg +cgcaggttgccgatgaacagatcaagttcatacaggagctcttaatccaccgtacccaag +acctagtcaagcgggatgtcgttaacaactttgtacagacatttgggagcattgcaccac +agactccaatgaataacgcatccgctaggaccggatatagactgaagaaagtatagtcag +ctgcctcctaaaggaggcagtagtaggagccaacctaacgtcgtggatacgcattactcg +gtagcgtggtaaacacacgaacccgatctcagaattttagcggcgagaagttccataaat +catatttctacttcgtgctccggcttcatctgatggtggtcattattctccatatgcatc +cagtagagcttgcgcttcacgcaaagttccaggatgctcacatatgtccatacggcgcta +ctacatttactcgaacacttggaagcccgccgtcgggtgtatgactagcctttgactgag +actcagcctcgcaattgtatgtaactagcgtatcccggcaaagtttataggtccatatta +acaacagatgggagtagagcagcagcttttattcggactggcacctcatcgctttcgctg +tctgcgggatcaccggtctctcttgaacgtgttagagcctgagggatctgagggcacaca +cggcacttgtatccggaaaacctatgtatagagcctcggttgccagtactagttcgtggt +ccatagcgcctgaggggattaaacgcctccggaaacacgcgagttgttcttgtgcacgta +aaaatcacttgatgttatcgtgttcggccccagtcgctgtctcacttcaaaccagcgccg +tatccattctatgcaattacgattatacttttgacccgatctacgaatcagttacccatg +aatgcgacctgcgataacatacagtgcgacctccagtcctgttcgattaaatcgacagag +ggtcccgaacgcatccaagcggcttgggtcccgctggcaccgctgggaagtaggtagaga +cgtattgaaggaagcgtgtacagattggtgattacggtgctcttataggaccagactcgg +gcgattctacggggtcgtccacactatggacccgagcatcgaatcagtatgtcaatctga +agggactaatcggggagacgctggactccgtcaggagtgaccagaagcagggatgcaaag +acatcccggacgtggatagactacaaatcggacactcagatacatacctctagaaaatac +tattccccgtttctattccgttccgcggccttttacgtttagcttggagcaaactatata +gccgaggagggtactacaacgcgacgcacttatatcccaatgaaagaataaaagctggta +agacaacgctagccactctacctgtgttgcactcgcgatattagggagacaggttacaat +cagctgacacatgactagctgacccggagcactcaattctgcccatcggggatctgatca +aattcgtcgtcgcattggacggcttccctgcgtagcgaaggaatggttaccgtacgcctc +ccaacacacggcggtcaaaatagtcttcagcaacagtaacacaaatctcttcctagtact +cttggtacacggccctagagttaattgtgtgcccccccatactctctacatgtgataaca +gcgacccactaggttgccaaacagagtcggaagtcctatcgagtccagggcgctgtaggg +cctacagactctccgatgtcctgtgttcttcgtaattgcaatattttcgggacccttctg +ctgttgtcagattcagtctgttccatcttctggaaatgttgaggaactcgaaaacgctaa +ctccctgatatttgtggccttacatcaaccgtcctcaggtgaagcccaatgctaaaggag +tgaaccagacgtgcaggaagaagctgttgaccctttaaagctctagttcttgtcaggtgt +tccgactcgctggcgagagtatgatccagtaagcggcggacctgcgaccacatgatgagg +tccctacaaaatcctatgctccctgcgaattacaactcacagagaacagcctaggctttc +ttagttattgatgcacattctactgacgaacgcagcattcgaactaaaccattggtaatg +taattgtgacacgtgggaatctatttaaagctgcaagaactccaccacgtgttcatccac +atcggtctctgtggaatggtccaggaccgtcccaatagggggaattgcgagacccaacta +atcgagtgattgaacatgggagcaattcccgaatagaaacttgcaacgcgcagtactacg +acgatggtagcaataacgacgcgctacttcagctcatgggtctaaattagggcgaacgat +tgcacctaatctgctggcttctctagattgtagatccacagggccaattaacagtgcaaa +gaatagcgtcatatgattagtttgaaaataatatacatgaaaatcgagcacccgcatcaa +taagctacgagagtctttggagagtgccaatacacctagcacatgctgtgcttatgttat +gaaaattcatacttgactaacgttagccaccagccgatggcgctgtcacaacgaccctgg +gttaccgtttagttctctaagaagggtcactctaccagcggggttaaatataccggccga +ctgtctcgagagtgggttgagataactcaatttggatcagcattaagtctagagcgattc +tcgcggagcgatctatgcgcactgacttactcttggaatgtcactcgcggcttacatgcc +tccttgttccgcggattgaatattttatgcggtagtcatgactttaatcgtttctacaga +aaagaccgtttgaaatggcagaggaaacaaccctgctggatcctccctaagtcacatccg +gacggacagattctacttaacctccaataaattgagaaaaatgcaaaaggatgccaatac +ctatagtacattttacgtttcccgtgtggttcgtgccaacccctggacggtggatgtccc +cggtgggtttttggaccgggcgaaattattggccaacccggaaacccaccgagagcctaa +gacgtgcatgatagttataagtttaatgggagccttaattgcaaccgatgggggcgggta +tttgtctcctacaccgacactatggttgttatttgcggcttcactcaactacaatctggt +ctgtagagagtaaccccgtattatcttcccttgcgccctgggtgcgttagcggaagtatg +gggattaaggggcgtgaacaatgcttctaagagcccggcgctaacggacggtgtcacaga +gtgtctaggcagagtccccactgtggaatacgcatgcgtagcgaaccgcgcgagtcagta +ggaacacattgggagcgattgttcctcctatcagccggcctagcaagcatgacgtcaaac +cttagtgagcagcccaagaaataacgctcggactgcaacagatctaagcgggaaatatat +cgatagcgaggaagccgagaggactaagcagagagacgaagaggtgagccggagtgattt +agccccagatggcaggtatagcttccgttcacaacgaattgaacagaaagtccggcgccc +ctggaatttcgaaacgtcaccaggttggccgtaaggttggtaactcaacaccctaagact +agcggtcttgcgtcatgcaagcggggcgtgtagcctgcacagacataatacggtagggag +gttaggcgtggggcgacacagtaagatctgatgaatccatgtacgttgcctccccgtcgt +acgcagttgatacttcgcatcatacttagcagaaagcatcatcgcgacctctcgtacaat +ggcaaaaaggagggcttcgtgcacggggtagagtcttccgcactctaatgaatcaacagt +cgaggttcatggccacaaatgtaacgacgcgatatgactcgttatgtctaggtcccactg +cggatctccttagaagcgaattgtataaatctcatagccccccccttagcaagtggtacg +tagcccacacgatttacgcagagtggggtaagacctcccccacgacttggggaacgcgcg +ctcaccggatagctactgccactgtagagccactagcgcatagtgtatccatagtgatgt +acgtagccaagcggggagtccttgtcttatgactagcgccatggggctatcaactgagaa +cggatgcacaaacggtccggccattcgcacagtccgccggtcactaatgaccggtctgca +tggggctgcaacgatcgcccaaggattggaaattgttaataagagtccagtggacaattt +agtaacgcgacgcgcatctctccccgcctaacaaggctcatttttagcttgacggcgcgt +ctcacgttgccgggctcagctcgagctcacgtgccgcgcggggttacctcaggtttgagg +aatgtgtcttgaacggttcgtaccggcttagcgtcgggtgctcctcagggttcccagcaa +cattcttaccgcaatccaatactgagggcgctaccaatctaacgtatcactgacccagta +aaactcggtattacgggggcgatatatgtgcttgcctcaacatagaactaccgccttgac +gttagaacgttaagttagagcacctgcccatctggattgcggcgataaaatcgattattg +tcacctggatgaggaatatggcggacaaacgatcgtgtggacctgcgccgcaaccgtggg +atgccgcagcagaatatctacagagcgtttgcaggagggccacgcggtatccacgtaagt +tcgcgcaatagcagcatcatctcgttcggggttgctgctctcagactgtcgatacgtccg +aataccagcaacccctcgaggctttgtaatatttacggagtcctaagggatttggtgccc +caagtatagttttgccgaagggggggcacagtgccgtgactacgattgggctattgggca +acccgaccccgtgcgcacacgtttgatctcagacagagggcaaaaagacgaagccacgag +ctcttcgaaatcaatctacatctatgctgggataagttctggtccacacctagatccgag +aatggaccgtggataacgagcaccgttacctttgaggcggcagcacttttaacaccgtaa +aagtaactctatagttgtcagcctttaaagattgcgttcccaatacggtacgcaccgtct +actaccgtcaacacaccgtagcttaggtccccccgcggcagcgcttccatcgtggagggc +tgtcccccatcctccgtagaactgcgtttaccggtctggggagactccctaaagaaacac +cacaggtgaggtggacgggaatcaagttaacgcattcacgtaattcactcctgttcactt +acataagagaagttctggttcgcgccttaagtgccatccatgaggcatacgatgcgatgg +ggaccacgcctgtagactagagaaacaccatcaagttgataaggagtgaaaattagtata +ggtctggcccgctcgtctgttgatagggcctttaaatgtaataggcctccgctctgaacg +agtccgtacttatctgttggatagtaagaacacggttctcagtccgcaaggtagtatatg +actacgcgtcgatggacctaaagatacgtttggcatcgtcctgagcagcttatgaaaatt +gctgcgcgtttcaggtggaagaatctgtgttattagtgcggggacggtagtttcgtaggg +aattatgggtagtacagatctatggacgggaggtgactgtcagcagactgtgcgcaggcg +ctggtggtataatcgctgggaccacgtactggcaagacgcatgcagcctggtgacatcca +caccgccctcgctcagataggacggacgtgcggcaataccctatctggctcctggacacg +gaaaaacagcagtttaaaaaaaagtgggttttgtgcattatcactttgtccgttcgacag +tttattgcacctcccagcatgctagtaaccccttgctctgatttgagatttattatcgta +acacggagtcgacgtgaagtttgatctgcggagaataggccgagaagcccctacgtaccc +tatgattcccgccatgtgcggtgtaaaattaaccactacttatggatttcatccaaatta +actgacgcattatatatacctcgagtgtgtaagccggccctcgcggtaccaaatttcggg +ctgcatacctagaagtgtatgtcatctaaacctaaggatcgggtagtgacgtgtaactaa +cacgtgggacaatgtctgtcctgagctacgtcttaagaagtatttagtcctacgtactca +ggcatcgatactccccgatgttgggtgcagtggggcgtccgggcggctaagatagtccag +ccactccttatgtgaatttatcaaaccgggaagaccagtgcataggccacgacctacgta +gcacctccgtacaaccttgctccagggcacgtctaaatgtcgtactgggttcggactcca +tgcctggcgactagcctggcggtccacatattttacaaatccgagacaacaaagcacttc +caaagtcgcgtggaccttaaggaaggcaacacaggggacatttagccactctaaagaccc +gcatactccagggcatacacgtaacgcgttctcttcactacggagtccgcgagcgaacga +ctaagggcgagggccgtagatctccttctcgtaaatataatcaaggttgccagcgcttat +cggtgccaccgatccgaagagcgtaaggacgttacagtgtaggatacatggtttgcgccc +gtccatacataatcgaccatcaaatcgaaagcgcgtatgcagtacctcgtactgcccaaa +ggacagagcgcattacgtcaccccgagcgtagcttaccatgttaagaccgtgctcatggt +ttccacccgtaagatgagcacagattgcttgctctaggtaacatagtaataagagaacat +tcatagacgttggaccacggttgaaagaccgcctcttaactactgaaaaacaatatttgt +ccttagtaaccaagatacattaatcaatcctccgctaatgaagttggtaggcaagccttc +agtagcgtaccgtggatttgtgtttactgcatttacaccgcggctgggtacgaagcggtg +tcgggcacgcacacgcgttcgatactgtaggtttcgttggggttgcttgttgccgctaac +gttcgggtcgcttacttctgcaggcttgattactgagttcattcgatcggttcccaactt +cggactattgcgccatcatcaatgtgggaaatcatttttaggaatacacctcgtacatgc +atatgaagtctgcgtgcaacagactttccatgatgcgagctgggcttcccgtcctgcggg +atgcaattggcccagtgcgcgaaggctgggctgattacggacatatctgctgtcctgaca +atcgatggtgtagagcgtaacaatcattccaatttttcgacacgggccagggctttaggc +cactacgcacctgggttaacactcggcgacccgcctaacactgggtggacattcccgagt +tataacgacacctcattttcaacaaccacaaaaaggcataggcaaccgaactaacctttt +gtttagttacttctggtatgttcatagtgtagggcaggtgatcggttaaacgcttgtacg +gaccccattctgtagcgcttttctgaacgataacactacgttgggagatacttgttgcgc +agtcgtgggttaaaagcgagccgacgataaactgcaataaggaaagcggacctgtcacct +cccgcgggtaaatctactcgctcgtttagaggccgtaaagcgacataacggtgtccagta +caagcccaactggtttagagaattcttctcctactacattcaccgtccgtatttcggcgc +gccctacggtattcgtggtgttctgagcatacatgggatggactatcacccctgcgcgta +aggactagcagttgtaagtcacgttaaggttgcgtaggcaactgttggagtgcgtccata +cttttcagcaccccgaatttgtacgcccaagttgtatcgtcgtgctgggacgagactcag +cctttaccctaagcgtttaggaaagcgatgttttaccgcagacgcatatgagagaacgtt +gcaagatcgatctttctcgcgcacgttctgtagctagacctgcagctaatctaactgccg +aactgttaggatgttttctctcctagacgcagggaccagttgtaagtaagggtttctcat +cgctaggctagggtgatggtaggtgataccaatggagcggcgcgttaaaagggttgtaat +ctcggtgatatgtgcaccatagattgttccgttattttccttggtcatttagatacgaga +taggggcgccccagtgccacgaggtccatcttatgctgttgcgtagctagagccctacaa +ctttctaagtaaaacctccatcgagtgcgcttggagaatttcatgtaccgtggcggtacc +ttacttgatgccgcgacccctatctaattaaagaccgcttcccgatgggcgaccttaatc +ttgctgcagtccaagttaacttcctctacgcccgatgacaaatttagccggagtaagttg +ttaacctagcctaatttgtaccgaattttgggttgtgagaagaccatttctacccgacga +tcatgggttcctctcaactatacctagtgtcggttaatgatttatggcaaacaatccccc +aatgtagcacccatatgggcgcaattatgtgaacttcaacactaactattggtttagtta +gtgatatttagcgcaaataagaggcatgggctgcgaaaagattgtgtttccgcaatgcta +gggaacctgacggcatacccgagatgatagttaggtgagcccgaatcatgcttgattaac +gtaacgtctatcactacccgtgggcttttgcgattgcgatgcgttactcaaggcatactc +aatggggctggtaataccgatatgggcctgtgtcttagcagcgacgtgtcgataatcgaa +gtacaatacgccagtctacgttagggctttgctaacacatcacccacagttgaagcatca +cgcacagccctcattaggttgtcgtcaacctggaactcctagcaggctgggcagtatggc +atccttcacgaacaatcttaagagacgcacttgacacaggttgcgacagtcaggatgggg +agcttctgaaaatctctacataaggtggcctcgtgatatcgtattaactcggagagcggt +tggactaatgagtgagtccaatcagtgatcggtttttaatgccgggaccacggcttgcgg +ctgcgcgatctatttccctcgcgttacacaaggggtaggcataagcaacaagcccaaaaa +aatcctcacgcaggcgtcaggtacagactttttccctcagcaacgcaaggtacacgtgta +gtcgaatgtggtcataaccagcagctgtcttgcgcaagggcggtgctacacgcatgtttc +actccacagtgacatgatgcccgctcttcggttgttctatgcagcgcgctggtcgcacct +taagcccagttcaatccatgcaattcaccgttgcagcactagatcatataccgcatactt +cgtcagagcacaaccagatcacttacaacgaccgcaagctaagcatccctatcgtgcgta +tgtgtcgaggcgcaagtactatggtcggatgaggaggtgtgccctcaggacacacagtat +cgctcctcattcgacgacgcaagtcgtctagttctatgataggcgaagtgagtactgcgg +atcactacgcccaagacttggagtgacgacgccggctactagcgatggcagttcagaatg +gtgccttccaagggacactcggtcctaatcaggcacacgcgtctcaaagccactactcat +tcatgagctcgctggcgtggcagtggtcttatgcggctagcgaccagaatttctactagc +cttaggcgtacaagcgttgggcaggtcgcgagtaacctctacactctatcatggaccaca +cccatccatgttttaaacacagaggtcttaagaatagcgatggtacggttgagaacgtgg +gagttttttgctctacagcaagcacgttgcagtgaggagagctttaatcctaaatcataa +gtgatactggtgccgagcatctttcggacgaatatgaagacccaacgctaatgtgcctgt +tcgtcggcacattctcttgggacacccgctacccacatgtatgtgaattgggcccgtctt +gattgtgtcgtagatgccaacggttcaatcagccccgacgacgagaagcatttctacgtc +tccagccttgcaacggtttctagagtcttgctgttcgtaaattgaagaatctactgtgca +gactttatcgacccacgatacgctaatccgagcgcgactcggtctcggaaaattatccga +gggagctcgttcaatgcggcggaggctctgagtgaagtttaaggctgagatagtcacacg +cattcgggtccctacaccttgtttcgaatgtccaacgcgaactctgggcaacatcgcgag +actttgaaagatgagggggctgtgacagggcctttgtaataggggtactttaagggcggc +acaatgtgatacctatgtattcctatggtctgggtcagttatttaaattgaccggacaag +aatctgactcgtagactgctgtatagatcacgattagagtttggcaatggttctgaaagt +gatcatgtctaacgtaccggatgacactagtaataactgcagcagcgtgacgatgtaggg +gacttactctgtttacgggtctcgtctgccataaacatcctgctccggcagcggtcaaag +acgtcctattatcgcactcgggcagaaactccagtcatggtgaggcacaccaacagtgtg +gggtcggttcgtggttaccaagccaccatttttcggcccaaactcatcttgaatagtcgt +cctcattcatttgatcgatcgtcattacaaggttcataaatgcccagcgccgcgtctccg +gccagatggaagagctacgtgcaggcggtaagcaattgacgctatagccctatatacgta +tgtgggactcaaggcgacatgctataccgactggtatcgaggcgaacgacaattgctatg +ggtcatcacctcatatttagattcagcccctggtggcgtcgctttgaccaactagttaag +gttgaggagttcgctctcaaacctgataacgagctaggccatgtaccaaccttggctgtg +caccgacgagctgaaggaccgagctgctaggaggtcgcagtatcgattgctctttcagcc +ttctaaaggtgcgacagaaacttgaacctctcggtactctaacactaggggtacgagtgg +ataactcgattacattagtcctggtacaaaagtcctccttccgggcgccttaagctgctt +taaagctatgtccgcttacgagaaaggggcgcacggtccgatctacttacagactgtcaa +aacggtgtagtcggaatgggctcgaacgacgctaatagatacacgcgcattggcatggta +cttcaccaatactatatctttaaagaagggcggcgagcctatttacccacttcgattagg +ggataacacaggtgattgagttttctggaaccgtcatctaatagccgaagcagtccacat +tacagtccattgcatttaaccactaggaatcgcgccaatcttgcgcttatgttgtttagg +aggggccacgctagatcttgcctatcctgagttatatgagggacgatcctacatgtatcc +tcaaagttcgcgctcatccttagattctaggagatggattactaagtgtgtgtccatagt +ttaacgcaacacataatgttcgtgtcgtgatgcgtatccttggtcccgacctactactct +agacctatacgatagcgttcaaagctccaccatcgatgcaacgtggtcgtaccagtactt +atgaaaccttttttcgcagttcgaaccgcctggaaagaagcatacgcaatatcgtgtgat +cagcacgcagggtatcagttaaagagcccaagacttagtctatcgagcagaagaccgatt +agggtatacaccatgtcagaatcgcctccagactagtggctgatatcgtacgttacacga +ggtcgctcttgtcgagtgctcgaacgatctatcccctagatcacgcgtcccagtcggagt +atcccgcctcggatcgaaatgacggctaaaaggtgtaatcacgcgcgtaattcctgcaag +ctctctgagttctgctcgctggttcgaatgagcctgcaggcagtacctacaattcctgct +cggaggacctgttgcgagggatgcccccatacactgctgagggtaagtagctgaagtata +aaggcggcaatcttctgacaaacacccttcttccccttggttaaccagacaagctggatt +tatcacccctcccggggacactgccctgttttatatcgcggacttgcatcagtcgcagta +gtccgcgtagatgtggggacccctcccaccttacatggcaacgcgtgatggagtagtatc +tcgcgtcagtgagcgagttcgcatatttgtagggcgtcataacaaatgtaaatgctagta +agtgaaagatgtcaacatgcgggctcggttttgcgctccaggtatatcctgcatctgatg +aacttttcaatgaccgtgtctggcgcagggctgtcgttttgcaggaggggatgcccagcg +catctcgagaatcatcggctaatcaacgcgaaaaagttaatcttctatcagtcagcgggc +tataactccttgaccaacagaggatcgcaggtatttgtactgtggagaaacaatcgtaag +atggccggccatgaggcaaggattgtaatataccggggtggttatcgaagaagtaaagta +aggcctaccttctggggagcaatggggttctcagacgctaactcttcgttcacctacaac +acgattggacttagagagggacctacggacccgaaattcacataggggggttccccgata +agccaaggcaggatagagtctgaatccatggacttccatcaaacccctgtggtggttccg +ttcaagtcagggagtatcacgactcacttactgagtcacgtcctcaatatgactgaagtc +gataagacgaaggcttaatttacggaacccccgtttagtaatcaagaaacgcattggcgc +gggtctaacgtaagctcttcacaccgccgtctacgaaccagttcccggcgttgcatggtg +atcgccgggttcccttggagggagtaccttgtgccctgcccgtatggtcgttcctaaata +gcgaccaagtattagttgactgttgcgacttaaaatccaacccataagcatatatcgtgc +acccagggactggagggcctcagccccttctttcgaaacttaaaccgtcttcttatgggt +gaaatgtaagtttctacgtctggaataaacggttcgggccaccatgaagcgtctcgtgtg +atagagattcgcaatgagtctgggaagtagaatcacaccaagttagaaaaattctccaac +tcagctaccgcgacccatccgttggggtaacgcaagggtattagccgctcagaggccaaa +gattagagaaacgcgacgcctgcggctgtcttgtgactactccgaccatgccgtcagctg +gagaccctacggtgggtagttgggtagagcgccgatagctaattctcgagtggaactgcg +gaatgtgtcatatgaggtagcgatattgggctatcacaagtacgtgagcctgtgaaaacg +gacgactcactagcaagtaagcacggccctggcgtggcggcggtacgcgtacaaacctcc +actgcttggggaataaggtgcgaacaccgtgatccattgaggcgtggaggcatagggccg +gagtgttcccgtaccaattacgagctaagaccgcctgtccagccctggtgattacgtagt +aagctcggtacaagcctgtaattagcttccgggtggcggacattcgttcatattgccagt +cacggcagaggccgcgctagctaggccagccccgatgaaacacgtgctagttttctatcg +tgcctaaggatcgatggctatcgcggcattgttaacttatcaagcagccgaatcggcgat +agtggacacaacatgaacacgctaagctctgagtgccagactctaccgcggcgaatccta +ggccctgctggggctcccccacagagcagtaatggtcttctgcggccgcgtgcattcaat +ccgcgctggtcaatgcgttccatcgtgccttaagcggggcagtgtgataagacaattttg +ggggtttcatggagatatcttcagaaacctcgcgaggtgcgtttagataccacacgcgcg +gcggtcttttcacacaattcagtccgcggccggtaacctaactttgcttatcaatacata +atcctcccaaatgtacggtttcgaaggagatacctctcccctgttagactctaggttttg +cagtgctacctagagatcacaccagcattaaaccaaggtatcagcatcgtaacatgggga +ggcacgcgcttggcggtaagtacccgccacgattactctgtttcatagcgccaacgcccg +tatagtgtgcttttaacgtcctcagaaatcaccgactgatcagtatggcgacatcggagg +gaggttggcgaaatgttgcttttatagatcgttaaaacctatcgttggcgcgtatcgcct +ccatagaacttcttactcacctagtctgatcccgggactggtcgaaatggagacgacgta +gcttgagatctggatcgatcgactgatatcacacttaaatatgatcagattttactacgg +tcgatctccatatatctatcccagcacttgatacctcctgtccagccgactgcttggacc +ctagcacgcgatattagagggcgcgttgtagctcaaagtaaccagtgggacgacccgagt +gaggttaccgctggcacgtaagggtgacatgactcccccagaaacactgaatttgtctag +cagtacatcataatctgagaacatttagcgaagacgagaacaagctgtctcaatggacgt +aggacgagaggaatgtgacggttataatacgcgacctctatgtgtctattaaatccctac +gggccgtagcgagcaagctcgggatctttagtagcggatcgggtcttctacatggcgcac +caggtttgatatttcgagctagagttgctctaaagaaacgctcttgcttgggaaagtgac +ctggggtacgacgaagacacgggcctggttgcataccgtctcaccttcattcatcgagcg +cgatagcgtagcattatccagcacgggaggcacctggcatgggcgtgaaatacaatccga +agagcagcatgaaaaaaaaatgagcggtcgtgacccgagggtgcgtccctccgaacgttg +ttcgttgccaaggtaagggacccacgccaagcatggttagggaagcgtgaccgacacaac +atagaggacaatctcaatatgccttctgggtatcacctgggtgtgtagcagtgctactgt +tacaagtcgcgccatctgcgacgtcgttcgtccctattccctcctaaaggccccgactct +gaaaaaacctacaatcctagacacgttgtggcccagcacaacgcgtctgctatacagcaa +gtcattcgtcgaatggggcaacacgtataagaaggccgtgattccaagggcacatggcgg +gtctctcaatgatctacgacgtgacgcaaacggggaaaggctggaccgttgtccggtagg +cgatccatcataaaaggcgtctggttctgtggttattgtgtacacgtttgaaatatctga +ctgtagaacgatggaggtctctacgtagctctgcacgattccctcgggctcacgttcatg +gcaaggcgacatcacatgaacagggttgggtaacagccatctctgaagcattcccccagc +tcgcacggctcctttacccgctactacgtcatgcactggctagagacccaccaactattg +tgcaagtaaagaccataaaattttggagctgtagcgaaagcgagttgctgcgatggttag +accaacattgggtcaaactattctaatccggctaggctcattaagcatcgcagattgccg +atactaatgctaacgagcgatgaatgggcctcttcgagacgcgtccgtacctgcgaatat +caaccatgaaccctaatctggaaagtttgatgccgctgtgatagccactcctgtgtcgcg +acggcaacgtaatgtacgtgcttggtttgagctctaaacataccttcgttagagttggtc +agaggaggatattgtcatagcgctacaaccagcgccaaaggatagctccgtggctggtcg +gacgcgctagaatctaggcagaacacgtgcggcttcttgcactctgacgctcacgcattg +gactttggcggtcatctggttctcataagtccgaatcacagtagataaagatccgcgtga +taagatatgcctacgtacttaagtagcaccctctgttcttggcgatcctatcattgcggg +ttctatacatatgttgatccaaccatcggccgccgggccgtcgtaggatctaatggccaa +cacatcaatcaaatcactcgcgaggacgcggaggtcccgtccataggtgtgtatgttggt +acgcagcacctaatctggtctggtcaagcaactggcttgttccagtatataatctcagat +agactgccctgaaagtagacaatgataaatatgtaagagcggggaaatcccatcgtcgac +tgtgttgcggacgattagcttgcaaagagaggtgtgagcggctgtcttaaattatggact +cctcgcttccgtcgaacgtctgactagagaatctcttggaggtacacacgaacgtaggtt +cctcacagtatgtggcatggacaccggacaggtcacttgtatttatccattgaacgtgat +atagtgtgtcgagtcgttatacaatacatactccaagcgtactccctttgggtaacgggt +ttgggtacatattaccatggtgtggaccgatttgtaaccctataagcgttccgggtactt +taccatcgcggatgcgatcgcggatctacctatgtcagcgacatactgcccgtccaaaag +tgattcagtatgtgttaatcagcgtattgcatcatcagtcattgagagtggaccgttctc +gaagagcaagattcctgaccctttccactgggccatccagtacacccaattatatgcaga +cgaaaagctccatacatatataatacctcttcacaccgtgtgcagagaccaacttgatcg +atattgtactcactcgtacggaataattagaagggcccgactgtcgagaccgttagcatt +tgcattatcgcggtgagcgtatagaaacaattataggctttgctgcgatcgcagtgtctg +ggacagagtctcctagacctagatcagcttaaaacaatgattgtaggtaatgtgcgttgc +cgtcgggccacacctttcagttcggttacaccgactcagaattatcttctatcgggaccc +tcaaactgataatggggtcaaatggtggtggtcccgtctttctgcagtgctttgtgagca +gaatagctctcgagcgctccagtacgcctgagtatggctgcgcccaccaattggcgccgt +taatgcgtggcgacacaagagaaccagtccacataagttatgcccttaagaagatcaccg +ggtttgcgccatcctgattcaggtaacggacgtccgtgtacacgaaccatactaatgagt +tctacatcgctccaacgcgtcttgaaccctatcgacaattacaaatgcaaagtattagtt +gggtcagtgcgtagcttatccaagggctgcagtaagtcgtccccatgacagacggacggc +ataagggccaaaaattccgccgcattagctgttaataatgccatccagaaccggacagtc +tcgatatataacttacggctgcgaactggcccttatgaattacatccacgtgctagttaa +caggacggatcgcccggactaattgccgatcggccgtcccattctccgtacgatgtactg +aacccaggcgtgtgaatgggtatgtcaacgtttacccatcgaccctgcctatagacctga +gtttcattccagttgagcgtagaatgggatgagcagctttgcttgaggtgcgatattcgg +gagacctggtcagcaggattgatggttttatagtgctggattccctgctgaaattctctc +ttctgccgcatgtgaagaaggccttgcttcccttccacatgattgtaagatttcctaagg +cctcccagctgcgtggaactgtgagtcaattaaacctctttcctttataaattacccagt +ctcaggtatttccttatcgtggtatgagaacggattaatacagttgtgtaagccagctcc +ttataataaatctctctccctctctctgcctctcatctatgtatgtatgtatctgtcatc +tatctcctataagttgtttcttttgagaactctgactaacatagacattaaataaacaat +ttgtatactgaataattatataactactgcttgggggtgtggttgtgttgtgtggtgagg +gggtgtagaaatgtctaggggttgatctagcctaacaccttccagatgaccctaggttct +ggcctttccccaaagagtcctggtctactcagtcatctcccacaatttggccatcttctt +gggtgctcaggacaataaatgacccagccagatcctctagagtcgacctgcaggcatgca +agcttggcgtaatcatggtcatagctgtttgctgtgtgaaattgttatgcgctcacattg +cacacaacatacgagccggaagcatacagtgtagagcctggggtggcgtatgagtgagct +aactcacattaatttgcgtttgcgctcactgccgcttttcagtcggggaaactgtcgtga +cagctgcatttaatgatcggtcatcgcgcggggagatgcggttttgcgtattgtgccgca +ggtggttatttctctcaacagtgagacgggcacagctgattgccctcaccggctgggctg +agagagttgcagcaagcgtacacgcggggtttgcccagcagggcgaaattcctgttgtga +tgtggattccgaatcgggcaaatgccctataaatcaaagcatagtccgagatagggtttg +agtgtgttcagttttgggacagaggtcactataaagaacgttgactgcacgtcaagggcg +agaaacgtcatcaggcgattgcactacgtgacatcaccaatcagttttttgggtcaggtg +cgtgagacttatcggaactaaaggagcccgttttagcttcggggaaacgcgaagtgtcgg +aagaaggaaaacgaagagcgggtatcgcggaatgtacgtgctgagcgaaaccaacgcgcg +ttacggtcaagcgtgtatgtgttttggaggtaagtttccctgataaagcggaacaggggc +tatgtgtttacgggggtcgcatggagtacaagggggcaggacaagatttgcgcgacatgg +ttttttttaaattgcgggagatggttggctgtcccgatgagattagaacctgcttttgtt +ttagtttcggttcggtcagttcggactttggattggttttgttgggtatttaagaagggt +gtttgtgggatgtttttttttgggtcgagcatcactggactatgtgtgtcctgcgtatcg +tggcggggcctcgaacttagaggtaggacgattccgatgcaacaaccttatgctttactc +caagcgatggtgaggcaaccttgtacagaagtgcaaccgccattgtggctgggtcggccc +aaggaacggatattctcctgggtactgacaacccaggtctactgggttctatcgacggta +cagtcaagcctcgagtttactgtctcccacttaagtccgctctgggcattaatgagtctg +tggggtatcaagggtcacccaacgaagtagctagtcccgttgtacatttcgcgcgttacc +tagggagcacggtgagctacgagggtgtagctgcacacagcacggtatataggaacgcaa +acatagtagtatgtccctatgcataacagggagaagtgactctccgacggtcatttatcc +cagactctcctcgctccctactaattgttctatatacaatcggagtaaattggtacctct +ctgacaacataggggggttgaagtttatgccacgcagtctgttacacttttgccggggaa +ttgtgtagaccatgactcaaggtggtggtgcgagttactctactatctactgcttctcat +tacacatctcttggcttacaggccccagttatcagttacgaggctgccttaagagaaggc +caacattcatgatcagatccccgcacacgggatgatagtctgagatctgccggacgctcg +tctgctacaagtgtgggttgagcatagggtaagcctaagggctcgtaatggtacttcgcg +atgtttattcgatatgagctacaaggtataacgttgccttcaccatttcggctcacgact +cttacctcgcctcaccgctagacaccctgaccaaccgttagggtactgacaaccgatcag +gcgactcctaaaggacctctcagcctcccagacatgaggtccgctcgcatgctgttcagc +gagtccatatcaggaacagcaacgagacaaggcgagagcaacactagacttggagacata +ccaccacatctgtttactcttgattcaggaagacctgtggtaactgggcgacgcgtgcgt +ttatccgtcttccaatctccacagaatctgctccgtcagagggatgtatgactaacgcac +tgattttttgttcagtaaccgggcgcggattacggggcgtattccaggggtacattcaac +gggaccccaaggaaaagttcggggtatttaaggaggcggtccaactctcggacttattgg +gcgacgtaatgataagcacacctctgctcatacagtgcacgaagaccggcattgttcaaa +cacagccgtccattccgcgactattgtcctgtgtacaggtgcctcgggtcccaaatccag +cttatacccaaaactctcccggacttttttcgtccttgcaggaggaaaggacctgactcc +acgtttattaggggatcgttgggcccggacaatcgtgtattcaacataataaatgggttc +tagtttaaagccggaggtgacggtggattatggactagaggtaaacatttccggcgtagg +tcagaaagaatatagaccctaaatttacgcaaaacgtgcacacgattgtaggtggagtcg +tattaggaactcagggcgggtggaacgagtgtgttttaggcttaccatgaaccgtcgcgc +ggaaaatgatgacagaatggacggtgcttttttgcggggccaacaaaactcgcttatgtt +cgccattggatgtaagtaccgctatactacgcagcgaccccttacgacattgttgatttc +caatgctttcatggaggtttgtgagcggtcgctaggaatcttcctccagcgagtagccag +ctggccactagttagcaaccagagttcatatgagctccagtaacacgaaggtacataagg +aacgcaagcaagttcgggactacatagaacttggggtgcgtctaagccggggatcttaat +agacaagaggccatcgtatgggtcaaatttcatgtttcgtcagatgccctatccgtggac +acctaaatcaagcatcatatcctaatgctatttgctctcgctttggtatgattcatatgc +agccctgtccgtaaaatgacgggccagaggatacctgtcactacctatttcagattacca +ctgttcgaaaccttgctctgaaatcgatcttcgtagagtgttcgttaatcgccgcgtgaa +ttatataatcccccaaggagtacccttcgtcggtgcagtctacgtaactttcccaggtta +gcccccatctaatcgacgtacgtgagggggctacgggagatcgcacaagccgaagcattt +ctgctctgtttcgttacaactggaatcctcatcacgcagcgctaccggatgccatcccta +gtcatccccgcgagtttaaccagtcgagatggctcgaaccgtgtttcgaaggctggctat +tgaaccagttataaagcaggggcgactgtccgtcggacttcgatataaactatcacaaat +ttggcataagtatatacagccaagaaggctcagataggcacacgcacccaaatagtgacc +gcctacgttcaggttgcccggcaacgaagcgcgcttgctccattaatccactatcagagg +taacgaccctctttcaccgtagctgcccccatgtcggggcaacagtttcccaccgataac +gtgttctgtctagtacgtgaaacggattggctaacccctgtcagcctaattagatgacat +cctcgtacctctagagaaggtgaggagaccgctggaacataagtaaacagtttaccaaac +aatgatcatacatataacagaaaggagagatgcccggtggggtcgaagatacagctgtgg +ttgatatctgcaacggccaggctgtcatgaagatcacgcgcacgaagctatttatgaaag +atacccatgccggggcggcagcggtacctagtcctaaataccgacacgtagcaacgcgtc +ccctgaggcccaccctagtcaagggaacttaaaatatacgctgactttgtctaccaatca +tcttcgattaacaccggcatactaagtctaccctggacccagcaatgagaaaaacttttc +cgaatgatcattgtgagtttacagagattaggaacaccaaaaaaatttacgtacgtccgg +ttacccctgtgtgacccttggccacaaaccgtaaggtgcagcatgggcgttgagtccagg +gtttgtgacaccagacatgaataccctgtggcgggttgttagcatgttattcggatccga +tttcagagggtccgttgataccgggcagtacaagacaccccacaccactgaggtggtacg +tccgccagtctgctccctacgttatgcaaaattccttccccggcgttcttgcctgtacta +ctcctaaagggccgtgaaatccgacgttgctgctccgtctcgggacacccacacaacagc +tacggaaaatcgtgaggatgcacaagggtcttgcattgttgatctatacagctcttcgca +cggtgtgctactgttttccacaatgggcaaggggcgtgtaggtcttatgtaggagtaccc +cgtgatctggctataccttgctatctattccaccaaaatagccggggtcttatagtttta +ttccggatctatcaagtgacaagtccatggggtaaacggtaagtttcgtacgctgggcgg +tgatccccgcttataaacgagcaaaccgccaaagcaaccattgccgggcttccagctagt +aaatgttgggtgtcaatcgtgcatgtgactacttacccacaaagggacgcttgaagcgcc +tgaactcgtcacgtcatgcctagctcccggttgaaacacgaagacgcgtgaacctatctt +tgcttactattcgcctcctttaagaggcttcttgatgtggctctgcgacatggacagtag +tagttgtacctgggtatgttagtgaaattacaagtacctcaaaaacgaattacgtgtata +gagattatgtcactccgtcac diff --git a/packages/apollo-shared/test_data/one_cds.gff3 b/packages/apollo-shared/test_data/one_cds.gff3 new file mode 100644 index 00000000..81626f6e --- /dev/null +++ b/packages/apollo-shared/test_data/one_cds.gff3 @@ -0,0 +1,9 @@ +##gff-version 3 +##sequence-region chr1 1000 9000 +#example01 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004,t001,t004 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001;testid=t007 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001;testid=t010 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t012,t013,t014 +chr1 . CDS 5000 5000 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t015,t014 diff --git a/packages/apollo-shared/test_data/one_cds.json b/packages/apollo-shared/test_data/one_cds.json new file mode 100644 index 00000000..185f5579 --- /dev/null +++ b/packages/apollo-shared/test_data/one_cds.json @@ -0,0 +1,67 @@ +{ + "_id": "66d70e4ccc30b55b65e5f619", + "refSeq": "chr1", + "type": "gene", + "min": 999, + "max": 9000, + "strand": 1, + "children": { + "66d70e4ccc30b55b65e5f618": { + "_id": "66d70e4ccc30b55b65e5f618", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d70e4ccc30b55b65e5f615": { + "_id": "66d70e4ccc30b55b65e5f615", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"], + "testid": ["t007"] + } + }, + "66d70e4ccc30b55b65e5f616": { + "_id": "66d70e4ccc30b55b65e5f616", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"], + "testid": ["t010"] + } + }, + "66d70e4ccc30b55b65e5f617": { + "_id": "66d70e4ccc30b55b65e5f617", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 5000, + "strand": 1, + "attributes": { + "gff_id": ["cds10001"], + "gff_name": ["edenprotein.1"], + "testid": ["t012", "t013", "t014", "t015"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10001"], + "gff_name": ["EDEN.1"], + "testid": ["t004", "t001", "t004"] + } + } + }, + "attributes": { + "gff_id": ["gene10001"], + "gff_name": ["EDEN"], + "testid": ["t003"] + } +} diff --git a/packages/apollo-shared/test_data/two_cds.gff3 b/packages/apollo-shared/test_data/two_cds.gff3 new file mode 100644 index 00000000..fd58a8a3 --- /dev/null +++ b/packages/apollo-shared/test_data/two_cds.gff3 @@ -0,0 +1,9 @@ +##gff-version 3 +##sequence-region chr1 1000 9000 +#example01 +chr1 . gene 1000 9000 . + . ID=gene10001;Name=EDEN;testid=t003 +chr1 . mRNA 1050 9000 . + . ID=mRNA10001;Parent=gene10001;Name=EDEN.1;testid=t004,t001,t004 +chr1 . exon 1050 1500 . + . ID=exon10001;Parent=mRNA10001;testid=t007 +chr1 . exon 5000 5500 . + . ID=exon10004;Parent=mRNA10001;testid=t010 +chr1 . CDS 1201 1500 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t012,t013,t014 +chr1 . CDS 5000 5000 . + 0 ID=cds10001;Parent=mRNA10001;Name=edenprotein.1;testid=t014 diff --git a/packages/apollo-shared/test_data/two_cds.json b/packages/apollo-shared/test_data/two_cds.json new file mode 100644 index 00000000..6500195a --- /dev/null +++ b/packages/apollo-shared/test_data/two_cds.json @@ -0,0 +1,67 @@ +{ + "_id": "66d70f3b9c7a7460925687a3", + "refSeq": "chr1", + "type": "gene", + "min": 999, + "max": 9000, + "strand": 1, + "children": { + "66d70f3b9c7a7460925687a2": { + "_id": "66d70f3b9c7a7460925687a2", + "refSeq": "chr1", + "type": "mRNA", + "min": 1049, + "max": 9000, + "strand": 1, + "children": { + "66d70f3b9c7a74609256879f": { + "_id": "66d70f3b9c7a74609256879f", + "refSeq": "chr1", + "type": "exon", + "min": 1049, + "max": 1500, + "strand": 1, + "attributes": { + "gff_id": ["exon10001"], + "testid": ["t007"] + } + }, + "66d70f3b9c7a7460925687a0": { + "_id": "66d70f3b9c7a7460925687a0", + "refSeq": "chr1", + "type": "exon", + "min": 4999, + "max": 5500, + "strand": 1, + "attributes": { + "gff_id": ["exon10004"], + "testid": ["t010"] + } + }, + "66d70f3b9c7a7460925687a1": { + "_id": "66d70f3b9c7a7460925687a1", + "refSeq": "chr1", + "type": "CDS", + "min": 1200, + "max": 5000, + "strand": 1, + "attributes": { + "gff_id": ["cds10001"], + "gff_name": ["edenprotein.1"], + "testid": ["t012", "t013", "t014"] + } + } + }, + "attributes": { + "gff_id": ["mRNA10001"], + "gff_name": ["EDEN.1"], + "testid": ["t004", "t001", "t004"] + } + } + }, + "attributes": { + "gff_id": ["gene10001"], + "gff_name": ["EDEN"], + "testid": ["t003"] + } +}