From 3b0328ea8507668b0db2b8269d872e8a4369df6d Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Tue, 18 Jun 2024 15:49:20 +0200 Subject: [PATCH 01/25] Add bowtie2 and minimap2 modules --- modules.json | 20 + modules/nf-core/bowtie2/align/environment.yml | 9 + modules/nf-core/bowtie2/align/main.nf | 117 ++++ modules/nf-core/bowtie2/align/meta.yml | 95 +++ .../bowtie2/align/tests/cram_crai.config | 5 + .../bowtie2/align/tests/large_index.config | 5 + .../nf-core/bowtie2/align/tests/main.nf.test | 623 ++++++++++++++++++ .../bowtie2/align/tests/main.nf.test.snap | 311 +++++++++ .../nf-core/bowtie2/align/tests/sam.config | 5 + .../nf-core/bowtie2/align/tests/sam2.config | 5 + modules/nf-core/bowtie2/align/tests/tags.yml | 2 + modules/nf-core/bowtie2/build/environment.yml | 7 + modules/nf-core/bowtie2/build/main.nf | 42 ++ modules/nf-core/bowtie2/build/meta.yml | 46 ++ .../nf-core/bowtie2/build/tests/main.nf.test | 31 + .../bowtie2/build/tests/main.nf.test.snap | 45 ++ modules/nf-core/bowtie2/build/tests/tags.yml | 2 + .../nf-core/minimap2/align/environment.yml | 11 + modules/nf-core/minimap2/align/main.nf | 67 ++ modules/nf-core/minimap2/align/meta.yml | 84 +++ .../nf-core/minimap2/align/tests/main.nf.test | 244 +++++++ .../minimap2/align/tests/main.nf.test.snap | 208 ++++++ modules/nf-core/minimap2/align/tests/tags.yml | 2 + .../nf-core/minimap2/index/environment.yml | 7 + modules/nf-core/minimap2/index/main.nf | 44 ++ modules/nf-core/minimap2/index/meta.yml | 43 ++ .../nf-core/minimap2/index/tests/main.nf.test | 32 + .../minimap2/index/tests/main.nf.test.snap | 68 ++ modules/nf-core/minimap2/index/tests/tags.yml | 2 + nextflow_schema.json | 5 +- viral_pathogen_List.csv | 268 ++++++++ 31 files changed, 2453 insertions(+), 2 deletions(-) create mode 100644 modules/nf-core/bowtie2/align/environment.yml create mode 100644 modules/nf-core/bowtie2/align/main.nf create mode 100644 modules/nf-core/bowtie2/align/meta.yml create mode 100644 modules/nf-core/bowtie2/align/tests/cram_crai.config create mode 100644 modules/nf-core/bowtie2/align/tests/large_index.config create mode 100644 modules/nf-core/bowtie2/align/tests/main.nf.test create mode 100644 modules/nf-core/bowtie2/align/tests/main.nf.test.snap create mode 100644 modules/nf-core/bowtie2/align/tests/sam.config create mode 100644 modules/nf-core/bowtie2/align/tests/sam2.config create mode 100644 modules/nf-core/bowtie2/align/tests/tags.yml create mode 100644 modules/nf-core/bowtie2/build/environment.yml create mode 100644 modules/nf-core/bowtie2/build/main.nf create mode 100644 modules/nf-core/bowtie2/build/meta.yml create mode 100644 modules/nf-core/bowtie2/build/tests/main.nf.test create mode 100644 modules/nf-core/bowtie2/build/tests/main.nf.test.snap create mode 100644 modules/nf-core/bowtie2/build/tests/tags.yml create mode 100644 modules/nf-core/minimap2/align/environment.yml create mode 100644 modules/nf-core/minimap2/align/main.nf create mode 100644 modules/nf-core/minimap2/align/meta.yml create mode 100644 modules/nf-core/minimap2/align/tests/main.nf.test create mode 100644 modules/nf-core/minimap2/align/tests/main.nf.test.snap create mode 100644 modules/nf-core/minimap2/align/tests/tags.yml create mode 100644 modules/nf-core/minimap2/index/environment.yml create mode 100644 modules/nf-core/minimap2/index/main.nf create mode 100644 modules/nf-core/minimap2/index/meta.yml create mode 100644 modules/nf-core/minimap2/index/tests/main.nf.test create mode 100644 modules/nf-core/minimap2/index/tests/main.nf.test.snap create mode 100644 modules/nf-core/minimap2/index/tests/tags.yml create mode 100644 viral_pathogen_List.csv diff --git a/modules.json b/modules.json index d45b766..93a1f1a 100644 --- a/modules.json +++ b/modules.json @@ -5,6 +5,16 @@ "https://github.com/nf-core/modules.git": { "modules": { "nf-core": { + "bowtie2/align": { + "branch": "master", + "git_sha": "e4bad511789f16d0df39ee306b2cd50418365048", + "installed_by": ["modules"] + }, + "bowtie2/build": { + "branch": "master", + "git_sha": "1fea64f5132a813ec97c1c6d3a74e0aee7142b6d", + "installed_by": ["modules"] + }, "fastqc": { "branch": "master", "git_sha": "285a50500f9e02578d90b3ce6382ea3c30216acd", @@ -15,6 +25,16 @@ "git_sha": "77decb880af3f0ea6d22b2383c3f1ed86aac4aa2", "installed_by": ["modules"] }, + "minimap2/align": { + "branch": "master", + "git_sha": "e83b347b3e674de6bb1bb7bdf9b2674768c8e0fe", + "installed_by": ["modules"] + }, + "minimap2/index": { + "branch": "master", + "git_sha": "72e277acfd9e61a9f1368eafb4a9e83f5bcaa9f5", + "installed_by": ["modules"] + }, "multiqc": { "branch": "master", "git_sha": "b7ebe95761cd389603f9cc0e0dc384c0f663815a", diff --git a/modules/nf-core/bowtie2/align/environment.yml b/modules/nf-core/bowtie2/align/environment.yml new file mode 100644 index 0000000..d279635 --- /dev/null +++ b/modules/nf-core/bowtie2/align/environment.yml @@ -0,0 +1,9 @@ +name: bowtie2_align +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::bowtie2=2.5.2 + - bioconda::samtools=1.18 + - conda-forge::pigz=2.6 diff --git a/modules/nf-core/bowtie2/align/main.nf b/modules/nf-core/bowtie2/align/main.nf new file mode 100644 index 0000000..809525a --- /dev/null +++ b/modules/nf-core/bowtie2/align/main.nf @@ -0,0 +1,117 @@ +process BOWTIE2_ALIGN { + tag "$meta.id" + label 'process_high' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/mulled-v2-ac74a7f02cebcfcc07d8e8d1d750af9c83b4d45a:f70b31a2db15c023d641c32f433fb02cd04df5a6-0' : + 'biocontainers/mulled-v2-ac74a7f02cebcfcc07d8e8d1d750af9c83b4d45a:f70b31a2db15c023d641c32f433fb02cd04df5a6-0' }" + + input: + tuple val(meta) , path(reads) + tuple val(meta2), path(index) + tuple val(meta3), path(fasta) + val save_unaligned + val sort_bam + + output: + tuple val(meta), path("*.sam") , emit: sam , optional:true + tuple val(meta), path("*.bam") , emit: bam , optional:true + tuple val(meta), path("*.cram") , emit: cram , optional:true + tuple val(meta), path("*.csi") , emit: csi , optional:true + tuple val(meta), path("*.crai") , emit: crai , optional:true + tuple val(meta), path("*.log") , emit: log + tuple val(meta), path("*fastq.gz") , emit: fastq , optional:true + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: "" + def args2 = task.ext.args2 ?: "" + def prefix = task.ext.prefix ?: "${meta.id}" + + def unaligned = "" + def reads_args = "" + if (meta.single_end) { + unaligned = save_unaligned ? "--un-gz ${prefix}.unmapped.fastq.gz" : "" + reads_args = "-U ${reads}" + } else { + unaligned = save_unaligned ? "--un-conc-gz ${prefix}.unmapped.fastq.gz" : "" + reads_args = "-1 ${reads[0]} -2 ${reads[1]}" + } + + def samtools_command = sort_bam ? 'sort' : 'view' + def extension_pattern = /(--output-fmt|-O)+\s+(\S+)/ + def extension_matcher = (args2 =~ extension_pattern) + def extension = extension_matcher.getCount() > 0 ? extension_matcher[0][2].toLowerCase() : "bam" + def reference = fasta && extension=="cram" ? "--reference ${fasta}" : "" + if (!fasta && extension=="cram") error "Fasta reference is required for CRAM output" + + """ + INDEX=`find -L ./ -name "*.rev.1.bt2" | sed "s/\\.rev.1.bt2\$//"` + [ -z "\$INDEX" ] && INDEX=`find -L ./ -name "*.rev.1.bt2l" | sed "s/\\.rev.1.bt2l\$//"` + [ -z "\$INDEX" ] && echo "Bowtie2 index files not found" 1>&2 && exit 1 + + bowtie2 \\ + -x \$INDEX \\ + $reads_args \\ + --threads $task.cpus \\ + $unaligned \\ + $args \\ + 2> >(tee ${prefix}.bowtie2.log >&2) \\ + | samtools $samtools_command $args2 --threads $task.cpus ${reference} -o ${prefix}.${extension} - + + if [ -f ${prefix}.unmapped.fastq.1.gz ]; then + mv ${prefix}.unmapped.fastq.1.gz ${prefix}.unmapped_1.fastq.gz + fi + + if [ -f ${prefix}.unmapped.fastq.2.gz ]; then + mv ${prefix}.unmapped.fastq.2.gz ${prefix}.unmapped_2.fastq.gz + fi + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + bowtie2: \$(echo \$(bowtie2 --version 2>&1) | sed 's/^.*bowtie2-align-s version //; s/ .*\$//') + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + pigz: \$( pigz --version 2>&1 | sed 's/pigz //g' ) + END_VERSIONS + """ + + stub: + def args2 = task.ext.args2 ?: "" + def prefix = task.ext.prefix ?: "${meta.id}" + def extension_pattern = /(--output-fmt|-O)+\s+(\S+)/ + def extension = (args2 ==~ extension_pattern) ? (args2 =~ extension_pattern)[0][2].toLowerCase() : "bam" + def create_unmapped = "" + if (meta.single_end) { + create_unmapped = save_unaligned ? "touch ${prefix}.unmapped.fastq.gz" : "" + } else { + create_unmapped = save_unaligned ? "touch ${prefix}.unmapped_1.fastq.gz && touch ${prefix}.unmapped_2.fastq.gz" : "" + } + def reference = fasta && extension=="cram" ? "--reference ${fasta}" : "" + if (!fasta && extension=="cram") error "Fasta reference is required for CRAM output" + + def create_index = "" + if (extension == "cram") { + create_index = "touch ${prefix}.crai" + } else if (extension == "bam") { + create_index = "touch ${prefix}.csi" + } + + """ + touch ${prefix}.${extension} + ${create_index} + touch ${prefix}.bowtie2.log + ${create_unmapped} + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + bowtie2: \$(echo \$(bowtie2 --version 2>&1) | sed 's/^.*bowtie2-align-s version //; s/ .*\$//') + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + pigz: \$( pigz --version 2>&1 | sed 's/pigz //g' ) + END_VERSIONS + """ + +} diff --git a/modules/nf-core/bowtie2/align/meta.yml b/modules/nf-core/bowtie2/align/meta.yml new file mode 100644 index 0000000..38610e0 --- /dev/null +++ b/modules/nf-core/bowtie2/align/meta.yml @@ -0,0 +1,95 @@ +name: bowtie2_align +description: Align reads to a reference genome using bowtie2 +keywords: + - align + - map + - fasta + - fastq + - genome + - reference +tools: + - bowtie2: + description: | + Bowtie 2 is an ultrafast and memory-efficient tool for aligning + sequencing reads to long reference sequences. + homepage: http://bowtie-bio.sourceforge.net/bowtie2/index.shtml + documentation: http://bowtie-bio.sourceforge.net/bowtie2/manual.shtml + doi: 10.1038/nmeth.1923 + licence: ["GPL-3.0-or-later"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - reads: + type: file + description: | + List of input FastQ files of size 1 and 2 for single-end and paired-end data, + respectively. + - meta2: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'test', single_end:false ] + - index: + type: file + description: Bowtie2 genome index files + pattern: "*.ebwt" + - meta3: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'test', single_end:false ] + - fasta: + type: file + description: Bowtie2 genome fasta file + pattern: "*.fasta" + - save_unaligned: + type: boolean + description: | + Save reads that do not map to the reference (true) or discard them (false) + (default: false) + - sort_bam: + type: boolean + description: use samtools sort (true) or samtools view (false) + pattern: "true or false" +output: + - sam: + type: file + description: Output SAM file containing read alignments + pattern: "*.sam" + - bam: + type: file + description: Output BAM file containing read alignments + pattern: "*.bam" + - cram: + type: file + description: Output CRAM file containing read alignments + pattern: "*.cram" + - csi: + type: file + description: Output SAM/BAM index for large inputs + pattern: "*.csi" + - crai: + type: file + description: Output CRAM index + pattern: "*.crai" + - log: + type: file + description: Aligment log + pattern: "*.log" + - fastq: + type: file + description: Unaligned FastQ files + pattern: "*.fastq.gz" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@joseespinosa" + - "@drpatelh" +maintainers: + - "@joseespinosa" + - "@drpatelh" diff --git a/modules/nf-core/bowtie2/align/tests/cram_crai.config b/modules/nf-core/bowtie2/align/tests/cram_crai.config new file mode 100644 index 0000000..03f1d5e --- /dev/null +++ b/modules/nf-core/bowtie2/align/tests/cram_crai.config @@ -0,0 +1,5 @@ +process { + withName: BOWTIE2_ALIGN { + ext.args2 = '--output-fmt cram --write-index' + } +} diff --git a/modules/nf-core/bowtie2/align/tests/large_index.config b/modules/nf-core/bowtie2/align/tests/large_index.config new file mode 100644 index 0000000..fdc1c59 --- /dev/null +++ b/modules/nf-core/bowtie2/align/tests/large_index.config @@ -0,0 +1,5 @@ +process { + withName: BOWTIE2_BUILD { + ext.args = '--large-index' + } +} \ No newline at end of file diff --git a/modules/nf-core/bowtie2/align/tests/main.nf.test b/modules/nf-core/bowtie2/align/tests/main.nf.test new file mode 100644 index 0000000..03aeaf9 --- /dev/null +++ b/modules/nf-core/bowtie2/align/tests/main.nf.test @@ -0,0 +1,623 @@ +nextflow_process { + + name "Test Process BOWTIE2_ALIGN" + script "../main.nf" + process "BOWTIE2_ALIGN" + tag "modules" + tag "modules_nfcore" + tag "bowtie2" + tag "bowtie2/build" + tag "bowtie2/align" + + test("sarscov2 - fastq, index, fasta, false, false - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, index, fasta, false, false - sam") { + + config "./sam.config" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.sam[0][1]).readLines()[0..4], + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, index, fasta, false, false - sam2") { + + config "./sam2.config" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.sam[0][1]).readLines()[0..4], + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, index, fasta, false, true - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], index, fasta, false, false - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], index, fasta, false, true - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, large_index, fasta, false, false - bam") { + + config "./large_index.config" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], large_index, fasta, false, false - bam") { + + config "./large_index.config" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], index, fasta, true, false - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, index, fasta, true, false - bam") { + + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.log, + process.out.fastq, + process.out.versions + ).match() } + + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], index, fasta, true, true - cram") { + + config "./cram_crai.config" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = true //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.cram[0][1]).name, + file(process.out.crai[0][1]).name + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], index, fasta, false, false - stub") { + + options "-stub" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), + file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true) + ] + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + file(process.out.csi[0][1]).name, + file(process.out.log[0][1]).name, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, index, fasta, true, false - stub") { + + options "-stub" + setup { + run("BOWTIE2_BUILD") { + script "../../build/main.nf" + process { + """ + input[0] = [ + [ id:'test'], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + } + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) + ] + input[1] = BOWTIE2_BUILD.out.index + input[2] = [[ id:'test'], file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)] + input[3] = false //save_unaligned + input[4] = false //sort + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + file(process.out.csi[0][1]).name, + file(process.out.log[0][1]).name, + process.out.fastq, + process.out.versions + ).match() } + ) + } + + } + +} diff --git a/modules/nf-core/bowtie2/align/tests/main.nf.test.snap b/modules/nf-core/bowtie2/align/tests/main.nf.test.snap new file mode 100644 index 0000000..028e7da --- /dev/null +++ b/modules/nf-core/bowtie2/align/tests/main.nf.test.snap @@ -0,0 +1,311 @@ +{ + "sarscov2 - [fastq1, fastq2], large_index, fasta, false, false - bam": { + "content": [ + "test.bam", + [ + [ + { + "id": "test", + "single_end": false + }, + "test.bowtie2.log:md5,bd89ce1b28c93bf822bae391ffcedd19" + ] + ], + [ + + ], + [ + "versions.yml:md5,01d18ab035146ea790e9a0f70adb758f" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-03-18T13:19:25.337323" + }, + "sarscov2 - fastq, index, fasta, false, false - sam2": { + "content": [ + [ + "ERR5069949.2151832\t16\tMT192765.1\t17453\t42\t150M\t*\t0\t0\tACGCACATTGCTAACTAAGGGCACACTAGAACCAGAATATTTCAATTCAGTGTGTAGACTTATGAAAACTATAGGTCCAGACATGTTCCTCGGAACTTGTCGGCGTTGTCCTGCTGAAATTGTTGACACTGTGAGTGCTTTGGTTTATGA\tAAAA versions.yml + "${task.process}": + bowtie2: \$(echo \$(bowtie2 --version 2>&1) | sed 's/^.*bowtie2-align-s version //; s/ .*\$//') + END_VERSIONS + """ + + stub: + """ + mkdir bowtie2 + touch bowtie2/${fasta.baseName}.{1..4}.bt2 + touch bowtie2/${fasta.baseName}.rev.{1,2}.bt2 + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + bowtie2: \$(echo \$(bowtie2 --version 2>&1) | sed 's/^.*bowtie2-align-s version //; s/ .*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/bowtie2/build/meta.yml b/modules/nf-core/bowtie2/build/meta.yml new file mode 100644 index 0000000..2d68799 --- /dev/null +++ b/modules/nf-core/bowtie2/build/meta.yml @@ -0,0 +1,46 @@ +name: bowtie2_build +description: Builds bowtie index for reference genome +keywords: + - build + - index + - fasta + - genome + - reference +tools: + - bowtie2: + description: | + Bowtie 2 is an ultrafast and memory-efficient tool for aligning + sequencing reads to long reference sequences. + homepage: http://bowtie-bio.sourceforge.net/bowtie2/index.shtml + documentation: http://bowtie-bio.sourceforge.net/bowtie2/manual.shtml + doi: 10.1038/nmeth.1923 + licence: ["GPL-3.0-or-later"] +input: + - meta: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'test', single_end:false ] + - fasta: + type: file + description: Input genome fasta file +output: + - meta: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'test', single_end:false ] + - index: + type: file + description: Bowtie2 genome index files + pattern: "*.bt2" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@joseespinosa" + - "@drpatelh" +maintainers: + - "@joseespinosa" + - "@drpatelh" diff --git a/modules/nf-core/bowtie2/build/tests/main.nf.test b/modules/nf-core/bowtie2/build/tests/main.nf.test new file mode 100644 index 0000000..1637602 --- /dev/null +++ b/modules/nf-core/bowtie2/build/tests/main.nf.test @@ -0,0 +1,31 @@ +nextflow_process { + + name "Test Process BOWTIE2_BUILD" + script "modules/nf-core/bowtie2/build/main.nf" + process "BOWTIE2_BUILD" + tag "modules" + tag "modules_nfcore" + tag "bowtie2" + tag "bowtie2/build" + + test("Should run without failures") { + + when { + process { + """ + input[0] = [ + [ id:'test' ], + file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) + ] + """ + } + } + + then { + assert process.success + assert snapshot(process.out).match() + } + + } + +} diff --git a/modules/nf-core/bowtie2/build/tests/main.nf.test.snap b/modules/nf-core/bowtie2/build/tests/main.nf.test.snap new file mode 100644 index 0000000..6875e02 --- /dev/null +++ b/modules/nf-core/bowtie2/build/tests/main.nf.test.snap @@ -0,0 +1,45 @@ +{ + "Should run without failures": { + "content": [ + { + "0": [ + [ + { + "id": "test" + }, + [ + "genome.1.bt2:md5,cbe3d0bbea55bc57c99b4bfa25b5fbdf", + "genome.2.bt2:md5,47b153cd1319abc88dda532462651fcf", + "genome.3.bt2:md5,4ed93abba181d8dfab2e303e33114777", + "genome.4.bt2:md5,c25be5f8b0378abf7a58c8a880b87626", + "genome.rev.1.bt2:md5,52be6950579598a990570fbcf5372184", + "genome.rev.2.bt2:md5,e3b4ef343dea4dd571642010a7d09597" + ] + ] + ], + "1": [ + "versions.yml:md5,1df11e9b82891527271c889c880d3974" + ], + "index": [ + [ + { + "id": "test" + }, + [ + "genome.1.bt2:md5,cbe3d0bbea55bc57c99b4bfa25b5fbdf", + "genome.2.bt2:md5,47b153cd1319abc88dda532462651fcf", + "genome.3.bt2:md5,4ed93abba181d8dfab2e303e33114777", + "genome.4.bt2:md5,c25be5f8b0378abf7a58c8a880b87626", + "genome.rev.1.bt2:md5,52be6950579598a990570fbcf5372184", + "genome.rev.2.bt2:md5,e3b4ef343dea4dd571642010a7d09597" + ] + ] + ], + "versions": [ + "versions.yml:md5,1df11e9b82891527271c889c880d3974" + ] + } + ], + "timestamp": "2023-11-23T11:51:01.107681997" + } +} \ No newline at end of file diff --git a/modules/nf-core/bowtie2/build/tests/tags.yml b/modules/nf-core/bowtie2/build/tests/tags.yml new file mode 100644 index 0000000..81aa61d --- /dev/null +++ b/modules/nf-core/bowtie2/build/tests/tags.yml @@ -0,0 +1,2 @@ +bowtie2/build: + - modules/nf-core/bowtie2/build/** diff --git a/modules/nf-core/minimap2/align/environment.yml b/modules/nf-core/minimap2/align/environment.yml new file mode 100644 index 0000000..41e8fe9 --- /dev/null +++ b/modules/nf-core/minimap2/align/environment.yml @@ -0,0 +1,11 @@ +name: minimap2_align + +channels: + - conda-forge + - bioconda + - defaults + +dependencies: + - bioconda::htslib=1.20 + - bioconda::minimap2=2.28 + - bioconda::samtools=1.20 diff --git a/modules/nf-core/minimap2/align/main.nf b/modules/nf-core/minimap2/align/main.nf new file mode 100644 index 0000000..66745ef --- /dev/null +++ b/modules/nf-core/minimap2/align/main.nf @@ -0,0 +1,67 @@ +process MINIMAP2_ALIGN { + tag "$meta.id" + label 'process_high' + + // Note: the versions here need to match the versions used in the mulled container below and minimap2/index + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/mulled-v2-66534bcbb7031a148b13e2ad42583020b9cd25c4:3161f532a5ea6f1dec9be5667c9efc2afdac6104-0' : + 'biocontainers/mulled-v2-66534bcbb7031a148b13e2ad42583020b9cd25c4:3161f532a5ea6f1dec9be5667c9efc2afdac6104-0' }" + + input: + tuple val(meta), path(reads) + tuple val(meta2), path(reference) + val bam_format + val bam_index_extension + val cigar_paf_format + val cigar_bam + + output: + tuple val(meta), path("*.paf") , optional: true, emit: paf + tuple val(meta), path("*.bam") , optional: true, emit: bam + tuple val(meta), path("*.bam.${bam_index_extension}"), optional: true, emit: index + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + def args2 = task.ext.args2 ?: '' + def prefix = task.ext.prefix ?: "${meta.id}" + def bam_index = bam_index_extension ? "${prefix}.bam##idx##${prefix}.bam.${bam_index_extension} --write-index" : "${prefix}.bam" + def bam_output = bam_format ? "-a | samtools sort -@ ${task.cpus-1} -o ${bam_index} ${args2}" : "-o ${prefix}.paf" + def cigar_paf = cigar_paf_format && !bam_format ? "-c" : '' + def set_cigar_bam = cigar_bam && bam_format ? "-L" : '' + """ + minimap2 \\ + $args \\ + -t $task.cpus \\ + ${reference ?: reads} \\ + $reads \\ + $cigar_paf \\ + $set_cigar_bam \\ + $bam_output + + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + minimap2: \$(minimap2 --version 2>&1) + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + def prefix = task.ext.prefix ?: "${meta.id}" + def output_file = bam_format ? "${prefix}.bam" : "${prefix}.paf" + def bam_index = bam_index_extension ? "touch ${prefix}.bam.${bam_index_extension}" : "" + """ + touch $output_file + ${bam_index} + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + minimap2: \$(minimap2 --version 2>&1) + END_VERSIONS + """ +} diff --git a/modules/nf-core/minimap2/align/meta.yml b/modules/nf-core/minimap2/align/meta.yml new file mode 100644 index 0000000..8996f88 --- /dev/null +++ b/modules/nf-core/minimap2/align/meta.yml @@ -0,0 +1,84 @@ +name: minimap2_align +description: A versatile pairwise aligner for genomic and spliced nucleotide sequences +keywords: + - align + - fasta + - fastq + - genome + - paf + - reference +tools: + - minimap2: + description: | + A versatile pairwise aligner for genomic and spliced nucleotide sequences. + homepage: https://github.com/lh3/minimap2 + documentation: https://github.com/lh3/minimap2#uguide + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - reads: + type: file + description: | + List of input FASTA or FASTQ files of size 1 and 2 for single-end + and paired-end data, respectively. + - meta2: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'test_ref'] + - reference: + type: file + description: | + Reference database in FASTA format. + - bam_format: + type: boolean + description: Specify that output should be in BAM format + - bam_index_extension: + type: string + description: BAM alignment index extension (e.g. "bai") + - cigar_paf_format: + type: boolean + description: Specify that output CIGAR should be in PAF format + - cigar_bam: + type: boolean + description: | + Write CIGAR with >65535 ops at the CG tag. This is recommended when + doing XYZ (https://github.com/lh3/minimap2#working-with-65535-cigar-operations) +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - paf: + type: file + description: Alignment in PAF format + pattern: "*.paf" + - bam: + type: file + description: Alignment in BAM format + pattern: "*.bam" + - index: + type: file + description: BAM alignment index + pattern: "*.bam.*" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@heuermh" + - "@sofstam" + - "@sateeshperi" + - "@jfy133" + - "@fellen31" +maintainers: + - "@heuermh" + - "@sofstam" + - "@sateeshperi" + - "@jfy133" + - "@fellen31" diff --git a/modules/nf-core/minimap2/align/tests/main.nf.test b/modules/nf-core/minimap2/align/tests/main.nf.test new file mode 100644 index 0000000..c93f436 --- /dev/null +++ b/modules/nf-core/minimap2/align/tests/main.nf.test @@ -0,0 +1,244 @@ +nextflow_process { + + name "Test Process MINIMAP2_ALIGN" + script "../main.nf" + process "MINIMAP2_ALIGN" + + tag "modules" + tag "modules_nfcore" + tag "minimap2" + tag "minimap2/align" + + test("sarscov2 - fastq, fasta, true, [], false, false") { + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = true + input[3] = [] + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, fasta, true, 'bai', false, false") { + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = true + input[3] = 'bai' + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + file(process.out.index[0][1]).name, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - [fastq1, fastq2], fasta, true, false, false") { + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:false ], // meta map + [ + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_2.fastq.gz', checkIfExists: true) + ] + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = true + input[3] = [] + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, [], true, false, false") { + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true), + ] + input[1] = [ + [ id:'test_ref' ], // meta map + [] + ] + input[2] = true + input[3] = [] + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot( + file(process.out.bam[0][1]).name, + process.out.versions + ).match() } + ) + } + + } + + test("sarscov2 - fastq, fasta, true, [], false, false - stub") { + + options "-stub" + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = true + input[3] = [] + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot(process.out).match() } + ) + } + + } + + test("sarscov2 - fastq, fasta, true, 'bai', false, false - stub") { + + options "-stub" + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = true + input[3] = 'bai' + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot(process.out).match() } + ) + } + + } + + test("sarscov2 - fastq, fasta, false, [], false, false - stub") { + + options "-stub" + + when { + process { + """ + input[0] = [ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) + ] + input[1] = [ + [ id:'test_ref' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + input[2] = false + input[3] = [] + input[4] = false + input[5] = false + """ + } + } + + then { + assertAll( + { assert process.success }, + { assert snapshot(process.out).match() } + ) + } + + } + +} \ No newline at end of file diff --git a/modules/nf-core/minimap2/align/tests/main.nf.test.snap b/modules/nf-core/minimap2/align/tests/main.nf.test.snap new file mode 100644 index 0000000..ecb3e4e --- /dev/null +++ b/modules/nf-core/minimap2/align/tests/main.nf.test.snap @@ -0,0 +1,208 @@ +{ + "sarscov2 - fastq, fasta, true, 'bai', false, false - stub": { + "content": [ + { + "0": [ + + ], + "1": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ], + "bam": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "index": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "paf": [ + + ], + "versions": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T11:29:44.669021368" + }, + "sarscov2 - fastq, fasta, false, [], false, false - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": true + }, + "test.paf:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + + ], + "2": [ + + ], + "3": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ], + "bam": [ + + ], + "index": [ + + ], + "paf": [ + [ + { + "id": "test", + "single_end": true + }, + "test.paf:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T11:15:52.738781039" + }, + "sarscov2 - fastq, fasta, true, [], false, false - stub": { + "content": [ + { + "0": [ + + ], + "1": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + + ], + "3": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ], + "bam": [ + [ + { + "id": "test", + "single_end": true + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "index": [ + + ], + "paf": [ + + ], + "versions": [ + "versions.yml:md5,98b8f5f36aa54b82210094f0b0d11938" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T11:15:23.033808223" + }, + "sarscov2 - [fastq1, fastq2], fasta, true, false, false": { + "content": [ + "test.bam", + [ + "versions.yml:md5,3548eeba9066efbf8d78ea99f8d813fd" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T12:21:31.582849048" + }, + "sarscov2 - fastq, fasta, true, [], false, false": { + "content": [ + "test.bam", + [ + "versions.yml:md5,3548eeba9066efbf8d78ea99f8d813fd" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T12:29:11.968586416" + }, + "sarscov2 - fastq, fasta, true, 'bai', false, false": { + "content": [ + "test.bam", + "test.bam.bai", + [ + "versions.yml:md5,3548eeba9066efbf8d78ea99f8d813fd" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T12:21:20.362186362" + }, + "sarscov2 - fastq, [], true, false, false": { + "content": [ + "test.bam", + [ + "versions.yml:md5,3548eeba9066efbf8d78ea99f8d813fd" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-06-03T12:21:37.233709954" + } +} \ No newline at end of file diff --git a/modules/nf-core/minimap2/align/tests/tags.yml b/modules/nf-core/minimap2/align/tests/tags.yml new file mode 100644 index 0000000..39dba37 --- /dev/null +++ b/modules/nf-core/minimap2/align/tests/tags.yml @@ -0,0 +1,2 @@ +minimap2/align: + - "modules/nf-core/minimap2/align/**" diff --git a/modules/nf-core/minimap2/index/environment.yml b/modules/nf-core/minimap2/index/environment.yml new file mode 100644 index 0000000..8a912a1 --- /dev/null +++ b/modules/nf-core/minimap2/index/environment.yml @@ -0,0 +1,7 @@ +name: minimap2_index +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::minimap2=2.28 diff --git a/modules/nf-core/minimap2/index/main.nf b/modules/nf-core/minimap2/index/main.nf new file mode 100644 index 0000000..3832021 --- /dev/null +++ b/modules/nf-core/minimap2/index/main.nf @@ -0,0 +1,44 @@ +process MINIMAP2_INDEX { + label 'process_low' + + // Note: the versions here need to match the versions used in minimap2/align + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/minimap2:2.28--he4a0461_0' : + 'biocontainers/minimap2:2.28--he4a0461_0' }" + + input: + tuple val(meta), path(fasta) + + output: + tuple val(meta), path("*.mmi"), emit: index + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + """ + minimap2 \\ + -t $task.cpus \\ + -d ${fasta.baseName}.mmi \\ + $args \\ + $fasta + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + minimap2: \$(minimap2 --version 2>&1) + END_VERSIONS + """ + + stub: + """ + touch ${fasta.baseName}.mmi + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + minimap2: \$(minimap2 --version 2>&1) + END_VERSIONS + """ +} diff --git a/modules/nf-core/minimap2/index/meta.yml b/modules/nf-core/minimap2/index/meta.yml new file mode 100644 index 0000000..1d29e3f --- /dev/null +++ b/modules/nf-core/minimap2/index/meta.yml @@ -0,0 +1,43 @@ +name: minimap2_index +description: Provides fasta index required by minimap2 alignment. +keywords: + - index + - fasta + - reference +tools: + - minimap2: + description: | + A versatile pairwise aligner for genomic and spliced nucleotide sequences. + homepage: https://github.com/lh3/minimap2 + documentation: https://github.com/lh3/minimap2#uguide + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - fasta: + type: file + description: | + Reference database in FASTA format. +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - index: + type: file + description: Minimap2 fasta index. + pattern: "*.mmi" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@yuukiiwa" + - "@drpatelh" +maintainers: + - "@yuukiiwa" + - "@drpatelh" diff --git a/modules/nf-core/minimap2/index/tests/main.nf.test b/modules/nf-core/minimap2/index/tests/main.nf.test new file mode 100644 index 0000000..97840ff --- /dev/null +++ b/modules/nf-core/minimap2/index/tests/main.nf.test @@ -0,0 +1,32 @@ +nextflow_process { + + name "Test Process MINIMAP2_INDEX" + script "../main.nf" + process "MINIMAP2_INDEX" + + tag "modules" + tag "modules_nfcore" + tag "minimap2" + tag "minimap2/index" + + test("minimap2 index") { + + when { + process { + """ + input[0] = [ + [ id:'test' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ] + """ + } + } + + then { + assert process.success + assert snapshot(process.out).match() + } + + } + +} \ No newline at end of file diff --git a/modules/nf-core/minimap2/index/tests/main.nf.test.snap b/modules/nf-core/minimap2/index/tests/main.nf.test.snap new file mode 100644 index 0000000..0b09882 --- /dev/null +++ b/modules/nf-core/minimap2/index/tests/main.nf.test.snap @@ -0,0 +1,68 @@ +{ + "Should run without failures": { + "content": [ + { + "0": [ + [ + { + "id": "test_ref" + }, + "genome.mmi:md5,72e450f12dc691e763c697463bdb1571" + ] + ], + "1": [ + "versions.yml:md5,0fced0ee8015e7f50b82566e3db8f7b0" + ], + "index": [ + [ + { + "id": "test_ref" + }, + "genome.mmi:md5,72e450f12dc691e763c697463bdb1571" + ] + ], + "versions": [ + "versions.yml:md5,0fced0ee8015e7f50b82566e3db8f7b0" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-03-18T11:46:30.000058092" + }, + "minimap2 index": { + "content": [ + { + "0": [ + [ + { + "id": "test" + }, + "genome.mmi:md5,72e450f12dc691e763c697463bdb1571" + ] + ], + "1": [ + "versions.yml:md5,2f8340380c6741e9261a284262a90bde" + ], + "index": [ + [ + { + "id": "test" + }, + "genome.mmi:md5,72e450f12dc691e763c697463bdb1571" + ] + ], + "versions": [ + "versions.yml:md5,2f8340380c6741e9261a284262a90bde" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-04-05T10:58:29.828187662" + } +} \ No newline at end of file diff --git a/modules/nf-core/minimap2/index/tests/tags.yml b/modules/nf-core/minimap2/index/tests/tags.yml new file mode 100644 index 0000000..e5ef8e1 --- /dev/null +++ b/modules/nf-core/minimap2/index/tests/tags.yml @@ -0,0 +1,2 @@ +minimap2/index: + - modules/nf-core/minimap2/index/** diff --git a/nextflow_schema.json b/nextflow_schema.json index dd51229..e1507e0 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -25,7 +25,7 @@ }, "taxid": { "type": "string", - "description": "The taxonomy ID of the species identified in classification results." + "description": "The taxonomy ID of the species identified in classification results. A list of taxids separated by spaces." }, "viral_pathogen_genome": { "type": "string", @@ -323,7 +323,8 @@ }, "fastq_output": { "type": "boolean", - "description": "Turn on saving extracted kraken2 reads in fastq format." + "description": "Turn on saving extracted kraken2 reads in fastq format.", + "default": true } } } diff --git a/viral_pathogen_List.csv b/viral_pathogen_List.csv new file mode 100644 index 0000000..7209ff7 --- /dev/null +++ b/viral_pathogen_List.csv @@ -0,0 +1,268 @@ +Organism_Name,Species,Genus,Family,Taxid +Human mastadenovirus A,Human mastadenovirus A,Mastadenovirus,Adenoviridae,129875 +Human mastadenovirus B,Human mastadenovirus B,Mastadenovirus,Adenoviridae,108098 +Human mastadenovirus C,Human mastadenovirus C,Mastadenovirus,Adenoviridae,129951 +Human mastadenovirus D,Human mastadenovirus D,Mastadenovirus,Adenoviridae,130310 +Human mastadenovirus F,Human mastadenovirus F,Mastadenovirus,Adenoviridae,130309 +Anelloviridae sp.,Anelloviridae sp.,,Anelloviridae,2055263 +Gyrovirus 4,Gyrovirus homsa3,Gyrovirus,Anelloviridae,1214955 +Gyrovirus GyV3,Gyrovirus homsa1,Gyrovirus,Anelloviridae,1163715 +Gyrovirus Tu243,Gyrovirus homsa4,Gyrovirus,Anelloviridae,1415627 +Gyrovirus Tu789,Gyrovirus homsa2,Gyrovirus,Anelloviridae,1415628 +Small anellovirus 1,Small anellovirus,,Anelloviridae,289366 +Small anellovirus 2,Small anellovirus,,Anelloviridae,289367 +Torque teno midi virus 1,Gammatorquevirus homidi1,Gammatorquevirus,Anelloviridae,687379 +Torque teno midi virus 10,Gammatorquevirus homidi10,Gammatorquevirus,Anelloviridae,2065051 +Torque teno midi virus 11,Gammatorquevirus homidi11,Gammatorquevirus,Anelloviridae,2065052 +Torque teno midi virus 12,Gammatorquevirus homidi12,Gammatorquevirus,Anelloviridae,2065053 +Torque teno midi virus 13,Gammatorquevirus homidi13,Gammatorquevirus,Anelloviridae,2065054 +Torque teno midi virus 14,Gammatorquevirus homidi14,Gammatorquevirus,Anelloviridae,2065055 +Torque teno midi virus 2,Gammatorquevirus homidi2,Gammatorquevirus,Anelloviridae,687380 +Torque teno midi virus 3,Gammatorquevirus homidi3,Gammatorquevirus,Anelloviridae,2065044 +Torque teno midi virus 4,Gammatorquevirus homidi4,Gammatorquevirus,Anelloviridae,2065045 +Torque teno midi virus 5,Gammatorquevirus homidi5,Gammatorquevirus,Anelloviridae,2065046 +Torque teno midi virus 6,Gammatorquevirus homidi6,Gammatorquevirus,Anelloviridae,2065047 +Torque teno midi virus 7,Gammatorquevirus homidi7,Gammatorquevirus,Anelloviridae,2065048 +Torque teno midi virus 8,Gammatorquevirus homidi8,Gammatorquevirus,Anelloviridae,2065049 +Torque teno midi virus 9,Gammatorquevirus homidi9,Gammatorquevirus,Anelloviridae,2065050 +Torque teno mini virus 1,Betatorquevirus homini1,Betatorquevirus,Anelloviridae,687369 +Torque teno mini virus 10,Betatorquevirus homini10,Betatorquevirus,Anelloviridae,2065036 +Torque teno mini virus 11,Betatorquevirus homini11,Betatorquevirus,Anelloviridae,2065037 +Torque teno mini virus 12,Betatorquevirus homini12,Betatorquevirus,Anelloviridae,2065038 +Torque teno mini virus 18,Betatorquevirus homini18,Betatorquevirus,Anelloviridae,1859149 +Torque teno mini virus 5,Betatorquevirus homini5,Betatorquevirus,Anelloviridae,687373 +Torque teno mini virus 6,Betatorquevirus homini6,Betatorquevirus,Anelloviridae,687374 +Torque teno mini virus 8,Betatorquevirus homini8,Betatorquevirus,Anelloviridae,687376 +Torque teno mini virus ALA22,Betatorquevirus homini27,Betatorquevirus,Anelloviridae,1535290 +Torque teno mini virus ALH8,Betatorquevirus homini16,Betatorquevirus,Anelloviridae,1535291 +Torque teno mini virus SHA,Betatorquevirus homini26,Betatorquevirus,Anelloviridae,2057931 +Torque teno virus,Torque teno virus,,Anelloviridae,68887 +Torque teno virus 9,Alphatorquevirus homin9,Alphatorquevirus,Anelloviridae,687348 +TTV-like mini virus,TTV-like mini virus,Betatorquevirus,Anelloviridae,93678 +Mammarenavirus chapareense,Mammarenavirus chapareense,Mammarenavirus,Arenaviridae,3052302 +Mammarenavirus lujoense,Mammarenavirus lujoense,Mammarenavirus,Arenaviridae,3052314 +Astrovirus MLB2,Astrovirus MLB2,,Astroviridae,683172 +Astrovirus MLB3,Astrovirus MLB3,,Astroviridae,1247114 +Astrovirus VA1,Mamastrovirus 9,Mamastrovirus,Astroviridae,645687 +Astrovirus VA3,Astrovirus VA3,,Astroviridae,683174 +Astrovirus VA4,Astrovirus VA4,,Astroviridae,1247113 +Bastrovirus 7,Bastrovirus BAS-1,,Astroviridae,1803394 +HMO Astrovirus A,HMO Astrovirus A,Mamastrovirus,Astroviridae,682382 +Human astrovirus BF34,Burkina Faso astrovirus,Mamastrovirus,Astroviridae,1518575 +Norovirus GI,Norwalk virus,Norovirus,Caliciviridae,122928 +Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866,Norwalk virus,Norovirus,Caliciviridae,1529909 +Norovirus GII,Norwalk virus,Norovirus,Caliciviridae,122929 +Norovirus GII.17,Norwalk virus,Norovirus,Caliciviridae,552592 +Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299,Norwalk virus,Norovirus,Caliciviridae,1529918 +Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS,Norwalk virus,Norovirus,Caliciviridae,1529924 +Norovirus GIV,Norwalk virus,Norovirus,Caliciviridae,262897 +Sapovirus Hu/GI/Sapporo/MT-2010/1982,Sapporo virus,Sapovirus,Caliciviridae,758863 +Cyclovirus NG12,Cyclovirus mmadu,Cyclovirus,Circoviridae,742922 +Cyclovirus NG14,Cyclovirus mutum,Cyclovirus,Circoviridae,742923 +Cyclovirus PK5006,Cyclovirus insaan,Cyclovirus,Circoviridae,742915 +Cyclovirus PK5034,Cyclovirus homa,Cyclovirus,Circoviridae,742916 +Cyclovirus PK5222,Cyclovirus manukha,Cyclovirus,Circoviridae,742917 +Cyclovirus PK5510,Cyclovirus maanav,Cyclovirus,Circoviridae,742918 +Cyclovirus SL-108277,Cyclovirus manitan,Cyclovirus,Circoviridae,1520935 +Cyclovirus TN25,Cyclovirus bashri,Cyclovirus,Circoviridae,742924 +Cyclovirus VN,Cyclovirus nhanloai,Cyclovirus,Circoviridae,1348500 +Human associated cyclovirus 10,Cyclovirus humana,Cyclovirus,Circoviridae,2038728 +Human circovirus VS6600022,Human circovirus VS6600022,Circovirus,Circoviridae,1525173 +Human cyclovirus VS5700009,Cyclovirus munthu,Cyclovirus,Circoviridae,1345637 +Human fecal virus Jorvi2,Human fecal virus Jorvi2,,Circoviridae,2017081 +Human fecal virus Jorvi3,Human fecal virus Jorvi3,,Circoviridae,2017082 +Human fecal virus Jorvi4,Human fecal virus Jorvi4,,Circoviridae,2017083 +Human PoSCV5-like circular virus,Human PoSCV5-like circular virus,,Circoviridae,1965018 +Human stool-associated circular virus NG13,Circovirus eniyan,Circovirus,Circoviridae,743300 +Indian encephalitis associated cyclovirus,Cyclovirus manusyan,Cyclovirus,Circoviridae,1755290 +Betacoronavirus England 1,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1263720 +Human coronavirus HKU1,Human coronavirus HKU1,Betacoronavirus,Coronaviridae,290028 +Middle East respiratory syndrome-related coronavirus,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1335626 +SARS coronavirus Tor2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,227984 +Severe acute respiratory syndrome coronavirus 2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,2697049 +Bundibugyo ebolavirus,Orthoebolavirus bundibugyoense,Orthoebolavirus,Filoviridae,565995 +Orthomarburgvirus marburgense,Orthomarburgvirus marburgense,Orthomarburgvirus,Filoviridae,3052505 +Sudan ebolavirus,Orthoebolavirus sudanense,Orthoebolavirus,Filoviridae,186540 +Tai Forest ebolavirus,Orthoebolavirus taiense,Orthoebolavirus,Filoviridae,186541 +Hepacivirus platyrrhini,Hepacivirus platyrrhini,Hepacivirus,Flaviviridae,3052236 +Hepatitis C virus genotype 3,Hepacivirus hominis,Hepacivirus,Flaviviridae,356114 +Hepatitis C virus genotype 4,Hepacivirus hominis,Hepacivirus,Flaviviridae,33745 +Hepatitis C virus genotype 5,Hepacivirus hominis,Hepacivirus,Flaviviridae,33746 +Hepatitis C virus genotype 7,Hepacivirus hominis,Hepacivirus,Flaviviridae,1544901 +Human hepegivirus,Pegivirus columbiaense,Pegivirus,Flaviviridae,1704090 +Human pegivirus 2,Pegivirus columbiaense,Pegivirus,Flaviviridae,1729141 +Zika virus,Orthoflavivirus zikaense,Orthoflavivirus,Flaviviridae,64320 +Gemycircularvirus C1c,Gemykibivirus humas3,Gemykibivirus,Genomoviridae,1673681 +Gemycircularvirus HV-GcV1,Gemycircularvirus HV-GcV1,Gemycircularvirus,Genomoviridae,1862824 +Gemycircularvirus HV-GcV2,Gemykibivirus humas5,Gemykibivirus,Genomoviridae,1862825 +Gemycircularvirus sp.,Gemycircularvirus sp.,Gemycircularvirus,Genomoviridae,1983771 +Human associated gemyvongvirus 1,Gemyvongvirus humas1,Gemyvongvirus,Genomoviridae,1985415 +Human gemycircularvirus GeTz1,Gemykibivirus humas4,Gemykibivirus,Genomoviridae,1792832 +Human genital-associated circular DNA virus-1,Gemygorvirus sewopo1,Gemygorvirus,Genomoviridae,1488574 +Orthohantavirus sinnombreense,Orthohantavirus sinnombreense,Orthohantavirus,Hantaviridae,3052499 +Rubella virus,Rubivirus rubellae,Rubivirus,Matonaviridae,11041 +Beiji nairovirus,Beiji nairovirus,Orthonairovirus,Nairoviridae,2304647 +Songling virus,Songling virus,Orthonairovirus,Nairoviridae,2795181 +Yezo virus,Yezo virus,Orthonairovirus,Nairoviridae,2825847 +Human alphaherpesvirus 2,Simplexvirus humanalpha2,Simplexvirus,Orthoherpesviridae,10310 +Human alphaherpesvirus 3,Varicellovirus humanalpha3,Varicellovirus,Orthoherpesviridae,10335 +Human betaherpesvirus 5,Cytomegalovirus humanbeta5,Cytomegalovirus,Orthoherpesviridae,10359 +Human betaherpesvirus 6A,Roseolovirus humanbeta6a,Roseolovirus,Orthoherpesviridae,32603 +Human betaherpesvirus 6B,Roseolovirus humanbeta6b,Roseolovirus,Orthoherpesviridae,32604 +Human betaherpesvirus 7,Roseolovirus humanbeta7,Roseolovirus,Orthoherpesviridae,10372 +human gammaherpesvirus 4,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,10376 +Human gammaherpesvirus 8,Rhadinovirus humangamma8,Rhadinovirus,Orthoherpesviridae,37296 +Human herpesvirus 4 type 2,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,12509 +Influenza A virus (A/California/07/2009(H1N1)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,641809 +Influenza A virus (A/New York/392/2004(H3N2)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,335341 +Influenza A virus (A/Shanghai/02/2013(H7N9)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,1332244 +Gammapapillomavirus sp.,Gammapapillomavirus sp.,Gammapapillomavirus,Papillomaviridae,2049444 +Human papillomavirus,Human papillomavirus,,Papillomaviridae,10566 +Human papillomavirus 116,Gammapapillomavirus 9,Gammapapillomavirus,Papillomaviridae,915428 +Human papillomavirus 121,Gammapapillomavirus 10,Gammapapillomavirus,Papillomaviridae,915429 +Human papillomavirus 126,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1055684 +Human papillomavirus 127,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,746832 +Human papillomavirus 132,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,909331 +Human papillomavirus 134,Gammapapillomavirus 7,Gammapapillomavirus,Papillomaviridae,909333 +Human papillomavirus 135,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1070408 +Human papillomavirus 136,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070409 +Human papillomavirus 140,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070413 +Human papillomavirus 154,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1195796 +human papillomavirus 166,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315259 +Human papillomavirus 167,Gammapapillomavirus 21,Gammapapillomavirus,Papillomaviridae,1420545 +Human papillomavirus 172,Gammapapillomavirus 22,Gammapapillomavirus,Papillomaviridae,1434987 +Human papillomavirus 175,Gammapapillomavirus 23,Gammapapillomavirus,Papillomaviridae,1434782 +Human papillomavirus 178,Gammapapillomavirus 24,Gammapapillomavirus,Papillomaviridae,1478160 +Human papillomavirus 179,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1472342 +Human papillomavirus 184,Gammapapillomavirus 25,Gammapapillomavirus,Papillomaviridae,1472343 +Human papillomavirus 187,Gammapapillomavirus 26,Gammapapillomavirus,Papillomaviridae,1851130 +Human papillomavirus 201,Gammapapillomavirus 27,Gammapapillomavirus,Papillomaviridae,1682340 +Human papillomavirus 204,Mupapillomavirus 3,Mupapillomavirus,Papillomaviridae,1650736 +Human papillomavirus KC5,Human papillomavirus KC5,Gammapapillomavirus,Papillomaviridae,1647924 +Human papillomavirus type 161,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315264 +Human papillomavirus type 85,Human papillomavirus type 85,,Papillomaviridae,652810 +Sosuga virus,Pararubulavirus sosugaense,Pararubulavirus,Paramyxoviridae,1452514 +Bocaparvovirus primate1,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,3052040 +Bufavirus-3,Bufavirus-3,,Parvoviridae,1391667 +Cutavirus,Protoparvovirus primate3,Protoparvovirus,Parvoviridae,1867125 +Human bocavirus 2c PK,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511882 +Human bocavirus 3,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,638313 +Human bocavirus 4 NI,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511883 +Human erythrovirus V9,Human erythrovirus V9,Erythroparvovirus,Parvoviridae,72197 +Human parvovirus 4 G1,Tetraparvovirus primate1,Tetraparvovirus,Parvoviridae,1511919 +Parvovirus NIH-CQV,Parvovirus NIH-CQV,,Parvoviridae,1341019 +Orthobunyavirus bwambaense,Orthobunyavirus bwambaense,Orthobunyavirus,Peribunyaviridae,3052384 +Catu virus,Orthobunyavirus catuense,Orthobunyavirus,Peribunyaviridae,1678225 +Fort Sherman virus,Orthobunyavirus shermanense,Orthobunyavirus,Peribunyaviridae,273345 +Guaroa virus,Orthobunyavirus guaroaense,Orthobunyavirus,Peribunyaviridae,80941 +Ilesha virus,Orthobunyavirus ileshaense,Orthobunyavirus,Peribunyaviridae,273341 +Madrid virus,Orthobunyavirus madridense,Orthobunyavirus,Peribunyaviridae,348013 +Alenquer virus,Phlebovirus alenquerense,Phlebovirus,Phenuiviridae,629726 +Chandiru virus,Phlebovirus candiruense,Phlebovirus,Phenuiviridae,629725 +Cocle virus,Phlebovirus cocleense,Phlebovirus,Phenuiviridae,1649829 +Dar es Salaam virus TZ-189,Tanzavirus daressalaamense,Tanzavirus,Phenuiviridae,2576944 +Echarate virus,Phlebovirus echarateense,Phlebovirus,Phenuiviridae,1000646 +Heartland virus,Bandavirus heartlandense,Bandavirus,Phenuiviridae,1216928 +Maldonado virus,Phlebovirus maldonadoense,Phlebovirus,Phenuiviridae,1004889 +Punta Toro virus,Phlebovirus toroense,Phlebovirus,Phenuiviridae,11587 +Sandfly fever Turkey virus,Phlebovirus siciliaense,Phlebovirus,Phenuiviridae,688699 +Severe fever with thrombocytopenia virus,Bandavirus dabieense,Bandavirus,Phenuiviridae,1003835 +SFTS virus HB29,Bandavirus dabieense,Bandavirus,Phenuiviridae,992212 +aichivirus A1,Aichivirus A,Kobuvirus,Picornaviridae,1313215 +Cosavirus A,Cosavirus A,Cosavirus,Picornaviridae,1330491 +Cosavirus D,Cosavirus D,Cosavirus,Picornaviridae,2003650 +Cosavirus E,Cosavirus E,Cosavirus,Picornaviridae,2003651 +Cosavirus F,Cosavirus F,Cosavirus,Picornaviridae,2003652 +Cosavirus JMY-2014,Cosavirus JMY-2014,Cosavirus,Picornaviridae,1582094 +Coxsackievirus B3,Enterovirus B,Enterovirus,Picornaviridae,12072 +enterovirus A114,Enterovirus A,Enterovirus,Picornaviridae,2760809 +Human cosavirus,Human cosavirus,Cosavirus,Picornaviridae,1233383 +Human cosavirus B,Cosavirus B,Cosavirus,Picornaviridae,586420 +rosavirus A2,Rosavirus A,Rosavirus,Picornaviridae,1511807 +Salivirus A,Salivirus A,Salivirus,Picornaviridae,1330524 +Salivirus FHB,Salivirus FHB,Salivirus,Picornaviridae,1547495 +Salivirus NG-J1,Salivirus A,Salivirus,Picornaviridae,651733 +Human polyomavirus 6,Deltapolyomavirus sextihominis,Deltapolyomavirus,Polyomaviridae,746830 +Human polyomavirus 7,Deltapolyomavirus septihominis,Deltapolyomavirus,Polyomaviridae,746831 +Human polyomavirus 9,Alphapolyomavirus nonihominis,Alphapolyomavirus,Polyomaviridae,943908 +LI polyomavirus,Alphapolyomavirus quardecihominis,Alphapolyomavirus,Polyomaviridae,1965344 +Merkel cell polyomavirus,Alphapolyomavirus quintihominis,Alphapolyomavirus,Polyomaviridae,493803 +MW polyomavirus,Deltapolyomavirus decihominis,Deltapolyomavirus,Polyomaviridae,1203539 +New Jersey polyomavirus-2013,Alphapolyomavirus terdecihominis,Alphapolyomavirus,Polyomaviridae,1497391 +STL polyomavirus,Deltapolyomavirus undecihominis,Deltapolyomavirus,Polyomaviridae,1277649 +Trichodysplasia spinulosa-associated polyomavirus,Alphapolyomavirus octihominis,Alphapolyomavirus,Polyomaviridae,862909 +Akhmeta virus,Akhmeta virus,Orthopoxvirus,Poxviridae,2200830 +Monkeypox virus,Monkeypox virus,Orthopoxvirus,Poxviridae,10244 +NY_014 poxvirus,NY_014 poxvirus,Centapoxvirus,Poxviridae,2025360 +Human lung-associated vientovirus FB,Vientovirus,Torbevirus,Redondoviridae,2571082 +Central cimpanzee simian foamy virus,Central cimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170194 +Eastern chimpanzee simian foamy virus,Eastern chimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170195 +Guenon simian foamy virus,Guenon simian foamy virus,Simiispumavirus,Retroviridae,2170197 +Human endogenous retrovirus K113,Human endogenous retrovirus K,,Retroviridae,166122 +Human immunodeficiency virus 1,Human immunodeficiency virus 1,Lentivirus,Retroviridae,11676 +Human immunodeficiency virus 2,Human immunodeficiency virus 2,Lentivirus,Retroviridae,11709 +Human T-lymphotropic virus 4,Human T-lymphotropic virus 4,Deltaretrovirus,Retroviridae,318279 +Tibrovirus congo,Tibrovirus congo,Tibrovirus,Rhabdoviridae,1987017 +Chandipura virus,Vesiculovirus chandipura,Vesiculovirus,Rhabdoviridae,11272 +Lyssavirus duvenhage,Lyssavirus duvenhage,Lyssavirus,Rhabdoviridae,38767 +Ekpoma virus 1,Tibrovirus alphaekpoma,Tibrovirus,Rhabdoviridae,1987020 +Ekpoma virus 2,Tibrovirus betaekpoma,Tibrovirus,Rhabdoviridae,1987021 +European bat lyssavirus 2,Lyssavirus helsinki,Lyssavirus,Rhabdoviridae,57483 +Le Dantec virus,Ledantevirus ledantec,Ledantevirus,Rhabdoviridae,318848 +Mundri virus,Mundri virus,,Rhabdoviridae,2913478 +Lebombo virus,Lebombo virus,Orbivirus,Sedoreoviridae,40057 +Orungo virus,Orungo virus,Orbivirus,Sedoreoviridae,40058 +Human associated huchismacovirus 1,Human associated huchismacovirus 1,Huchismacovirus,Smacoviridae,2169934 +Human associated huchismacovirus 2,Human associated huchismacovirus 2,Huchismacovirus,Smacoviridae,2169935 +Human associated huchismacovirus 3,Human associated huchismacovirus 3,Huchismacovirus,Smacoviridae,2169936 +Human associated porprismacovirus,Inpeasmacovirus humas1,Inpeasmacovirus,Smacoviridae,2530494 +Human associated porprismacovirus 3,Porprismacovirus humas4,Porprismacovirus,Smacoviridae,2496633 +Human feces smacovirus 2,Porprismacovirus humas1,Porprismacovirus,Smacoviridae,1820158 +Human feces smacovirus 3,Porprismacovirus humas3,Porprismacovirus,Smacoviridae,1820159 +Human smacovirus 1,Human smacovirus 1,Huchismacovirus,Smacoviridae,1595998 +Mammalian orthoreovirus 3 Dearing,Mammalian orthoreovirus,Orthoreovirus,Spinareoviridae,10886 +Ross River virus,Ross River virus,Alphavirus,Togaviridae,11029 +Circo-like virus-Brazil hs1,Circo-like virus-Brazil,,,1346815 +Hudisavirus sp.,Hudisavirus sp.,,,2021738 +West Nile virus strain NY-99,West Nile virus,Flavivirus,Flaviviridae,1968826 +BK polyomavirus MM,BK polyomavirus,Betapolyomavirus,Polyomaviridae,1417981 +Banana virus X,Banna virus,Bannavirus,Reoviridae,307671 +Bombali virus,Ebolavirus,Ebolavirus,Filoviridae,2010960 +Bourbon virus,Bourbon virus,Thogotovirus,Orthomyxoviridae,1618189 +Dhori virus (strain Indian/1313/61),Dhori virus,Thogotovirus,Orthomyxoviridae,11319 +Encephalomyocarditis virus,Encephalomyocarditis virus,Cardiovirus,Picornaviridae,12104 +Eyach virus,Eyach virus,Coltivirus,Reoviridae,62352 +Henipavirus hendraense,Hendra virus,Henipavirus,Paramyxoviridae,3052223 +Henipavirus nipahense,Nipah virus,Henipavirus,Paramyxoviridae,3052225 +Hepatitis B virus,Hepatitis B virus,Orthohepadnavirus,Hepadnaviridae,10407 +Hepatitis delta virus,Hepatitis delta virus,Deltavirus,Deltaflexiviridae,12475 +Hepatovirus A,Hepatitis A virus,Hepatovirus,Picornaviridae,12092 +Human foamy virus,Human foamy virus,Spumavirus,Retroviridae,11641 +human metapneumovirus,Human metapneumovirus,Metapneumovirus,Paramyxoviridae,162145 +Human orthorubulavirus 2,Human orthorubulavirus 2,Orthorubulavirus,Paramyxoviridae,2560525 +Human papillomavirus,Human papillomavirus,Papillomavirus,Papillomaviridae,10566 +Betapolyomavirus tertihominis,KI Polyomavirus,Betapolyomavirus,Polyomaviridae,1891764 +Human respirovirus 1,Human Respirovirus 1,Respirovirus,Paramyxoviridae,12730 +Human respirovirus 3,Human Respirovirus 3,Respirovirus,Paramyxoviridae,11216 +Human torovirus,Human torovirus,Torovirus,Toroviridae,67605 +Influenza B virus (B/Lee/1940),Influenza B virus,Betainfluenzavirus,Orthomyxoviridae,518987 +Influenza C virus (C/Ann Arbor/1/50),Influenza C virus,Gammainfluenzavirus,Orthomyxoviridae,11553 +Japanese encephalitis virus,Japanese encephalitis virus,Flavivirus,Flaviviridae,11072 +Measles morbillivirus,Morbillivirus,Morbillivirus,Paramyxoviridae,11234 +Merkel cell polyomavirus,Merkel cell polyomavirus,Orthopolyomavirus,Polyomaviridae,493803 +Molluscum contagiosum virus subtype 1,Molluscum contagiosum virus,Molluscipoxvirus,Poxviridae,10280 +Mumps orthorubulaviru,Mumps virus,Orthorubulavirus,Paramyxoviridae,2560602 +Murray Valley encephalitis virus,Murray valley encephalitis virus,Flavivirus,Flaviviridae,11079 +Orf virus,Orf virus,Parapoxvirus,Poxviridae,10258 +Orthomarburgvirus marburgense,Lake Victoria marburgvirus,Marburgvirus,Filoviridae,3052505 +Rotavirus A,Rotavirus A,Rotavirus,Reoviridae,28875 +Rotavirus C,Rotavirus C,Rotavirus,Reoviridae,36427 +St. Louis encephalitis virus,Saint Louis encephalitis virus,Flavivirus,Flaviviridae,11080 +Thogotovirus,Thogotovirus,Thogotovirus,Orthomyxoviridae,35323 +Tick-borne encephalitis virus,Tick-borne encephalitis virus,Flavivirus,Flaviviridae,11084 +Torque teno virus 6,Torque teno virus,Anellovirus,Anelloviridae,687345 +WU Polyomavirus,WU polyomavirus,Betapolyomavirus,Polyomaviridae,440266 +Yaba monkey tumor virus,Yaba monkey tumor virus,Yatapoxvirus,Poxviridae,38804 +Yaba-like disease virus,Yaba-like disease virus,Yatapoxvirus,Poxviridae,132475 +Zika virus,Zika virus,Flavivirus,Flaviviridae,64320 +dengue virus type 1,Dengue virus,Flavivirus,Flaviviridae,11053 \ No newline at end of file From 182fa6a3e0a06e32b0c5dce2088217dbf694fc2c Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Tue, 18 Jun 2024 16:22:12 +0200 Subject: [PATCH 02/25] ignore prettier check for viral_pathogen_List --- .nf-core.yml | 1 + viral_pathogen_List.csv | 536 ++++++++++++++++++++-------------------- 2 files changed, 269 insertions(+), 268 deletions(-) diff --git a/.nf-core.yml b/.nf-core.yml index ed5f0f0..633a8ff 100644 --- a/.nf-core.yml +++ b/.nf-core.yml @@ -15,6 +15,7 @@ lint: - assets/email_template.html - assets/email_template.txt - docs/README.md + - viral_pathogen_List.csv multiqc_config: - report_comment diff --git a/viral_pathogen_List.csv b/viral_pathogen_List.csv index 7209ff7..0f6b85d 100644 --- a/viral_pathogen_List.csv +++ b/viral_pathogen_List.csv @@ -1,268 +1,268 @@ -Organism_Name,Species,Genus,Family,Taxid -Human mastadenovirus A,Human mastadenovirus A,Mastadenovirus,Adenoviridae,129875 -Human mastadenovirus B,Human mastadenovirus B,Mastadenovirus,Adenoviridae,108098 -Human mastadenovirus C,Human mastadenovirus C,Mastadenovirus,Adenoviridae,129951 -Human mastadenovirus D,Human mastadenovirus D,Mastadenovirus,Adenoviridae,130310 -Human mastadenovirus F,Human mastadenovirus F,Mastadenovirus,Adenoviridae,130309 -Anelloviridae sp.,Anelloviridae sp.,,Anelloviridae,2055263 -Gyrovirus 4,Gyrovirus homsa3,Gyrovirus,Anelloviridae,1214955 -Gyrovirus GyV3,Gyrovirus homsa1,Gyrovirus,Anelloviridae,1163715 -Gyrovirus Tu243,Gyrovirus homsa4,Gyrovirus,Anelloviridae,1415627 -Gyrovirus Tu789,Gyrovirus homsa2,Gyrovirus,Anelloviridae,1415628 -Small anellovirus 1,Small anellovirus,,Anelloviridae,289366 -Small anellovirus 2,Small anellovirus,,Anelloviridae,289367 -Torque teno midi virus 1,Gammatorquevirus homidi1,Gammatorquevirus,Anelloviridae,687379 -Torque teno midi virus 10,Gammatorquevirus homidi10,Gammatorquevirus,Anelloviridae,2065051 -Torque teno midi virus 11,Gammatorquevirus homidi11,Gammatorquevirus,Anelloviridae,2065052 -Torque teno midi virus 12,Gammatorquevirus homidi12,Gammatorquevirus,Anelloviridae,2065053 -Torque teno midi virus 13,Gammatorquevirus homidi13,Gammatorquevirus,Anelloviridae,2065054 -Torque teno midi virus 14,Gammatorquevirus homidi14,Gammatorquevirus,Anelloviridae,2065055 -Torque teno midi virus 2,Gammatorquevirus homidi2,Gammatorquevirus,Anelloviridae,687380 -Torque teno midi virus 3,Gammatorquevirus homidi3,Gammatorquevirus,Anelloviridae,2065044 -Torque teno midi virus 4,Gammatorquevirus homidi4,Gammatorquevirus,Anelloviridae,2065045 -Torque teno midi virus 5,Gammatorquevirus homidi5,Gammatorquevirus,Anelloviridae,2065046 -Torque teno midi virus 6,Gammatorquevirus homidi6,Gammatorquevirus,Anelloviridae,2065047 -Torque teno midi virus 7,Gammatorquevirus homidi7,Gammatorquevirus,Anelloviridae,2065048 -Torque teno midi virus 8,Gammatorquevirus homidi8,Gammatorquevirus,Anelloviridae,2065049 -Torque teno midi virus 9,Gammatorquevirus homidi9,Gammatorquevirus,Anelloviridae,2065050 -Torque teno mini virus 1,Betatorquevirus homini1,Betatorquevirus,Anelloviridae,687369 -Torque teno mini virus 10,Betatorquevirus homini10,Betatorquevirus,Anelloviridae,2065036 -Torque teno mini virus 11,Betatorquevirus homini11,Betatorquevirus,Anelloviridae,2065037 -Torque teno mini virus 12,Betatorquevirus homini12,Betatorquevirus,Anelloviridae,2065038 -Torque teno mini virus 18,Betatorquevirus homini18,Betatorquevirus,Anelloviridae,1859149 -Torque teno mini virus 5,Betatorquevirus homini5,Betatorquevirus,Anelloviridae,687373 -Torque teno mini virus 6,Betatorquevirus homini6,Betatorquevirus,Anelloviridae,687374 -Torque teno mini virus 8,Betatorquevirus homini8,Betatorquevirus,Anelloviridae,687376 -Torque teno mini virus ALA22,Betatorquevirus homini27,Betatorquevirus,Anelloviridae,1535290 -Torque teno mini virus ALH8,Betatorquevirus homini16,Betatorquevirus,Anelloviridae,1535291 -Torque teno mini virus SHA,Betatorquevirus homini26,Betatorquevirus,Anelloviridae,2057931 -Torque teno virus,Torque teno virus,,Anelloviridae,68887 -Torque teno virus 9,Alphatorquevirus homin9,Alphatorquevirus,Anelloviridae,687348 -TTV-like mini virus,TTV-like mini virus,Betatorquevirus,Anelloviridae,93678 -Mammarenavirus chapareense,Mammarenavirus chapareense,Mammarenavirus,Arenaviridae,3052302 -Mammarenavirus lujoense,Mammarenavirus lujoense,Mammarenavirus,Arenaviridae,3052314 -Astrovirus MLB2,Astrovirus MLB2,,Astroviridae,683172 -Astrovirus MLB3,Astrovirus MLB3,,Astroviridae,1247114 -Astrovirus VA1,Mamastrovirus 9,Mamastrovirus,Astroviridae,645687 -Astrovirus VA3,Astrovirus VA3,,Astroviridae,683174 -Astrovirus VA4,Astrovirus VA4,,Astroviridae,1247113 -Bastrovirus 7,Bastrovirus BAS-1,,Astroviridae,1803394 -HMO Astrovirus A,HMO Astrovirus A,Mamastrovirus,Astroviridae,682382 -Human astrovirus BF34,Burkina Faso astrovirus,Mamastrovirus,Astroviridae,1518575 -Norovirus GI,Norwalk virus,Norovirus,Caliciviridae,122928 -Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866,Norwalk virus,Norovirus,Caliciviridae,1529909 -Norovirus GII,Norwalk virus,Norovirus,Caliciviridae,122929 -Norovirus GII.17,Norwalk virus,Norovirus,Caliciviridae,552592 -Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299,Norwalk virus,Norovirus,Caliciviridae,1529918 -Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS,Norwalk virus,Norovirus,Caliciviridae,1529924 -Norovirus GIV,Norwalk virus,Norovirus,Caliciviridae,262897 -Sapovirus Hu/GI/Sapporo/MT-2010/1982,Sapporo virus,Sapovirus,Caliciviridae,758863 -Cyclovirus NG12,Cyclovirus mmadu,Cyclovirus,Circoviridae,742922 -Cyclovirus NG14,Cyclovirus mutum,Cyclovirus,Circoviridae,742923 -Cyclovirus PK5006,Cyclovirus insaan,Cyclovirus,Circoviridae,742915 -Cyclovirus PK5034,Cyclovirus homa,Cyclovirus,Circoviridae,742916 -Cyclovirus PK5222,Cyclovirus manukha,Cyclovirus,Circoviridae,742917 -Cyclovirus PK5510,Cyclovirus maanav,Cyclovirus,Circoviridae,742918 -Cyclovirus SL-108277,Cyclovirus manitan,Cyclovirus,Circoviridae,1520935 -Cyclovirus TN25,Cyclovirus bashri,Cyclovirus,Circoviridae,742924 -Cyclovirus VN,Cyclovirus nhanloai,Cyclovirus,Circoviridae,1348500 -Human associated cyclovirus 10,Cyclovirus humana,Cyclovirus,Circoviridae,2038728 -Human circovirus VS6600022,Human circovirus VS6600022,Circovirus,Circoviridae,1525173 -Human cyclovirus VS5700009,Cyclovirus munthu,Cyclovirus,Circoviridae,1345637 -Human fecal virus Jorvi2,Human fecal virus Jorvi2,,Circoviridae,2017081 -Human fecal virus Jorvi3,Human fecal virus Jorvi3,,Circoviridae,2017082 -Human fecal virus Jorvi4,Human fecal virus Jorvi4,,Circoviridae,2017083 -Human PoSCV5-like circular virus,Human PoSCV5-like circular virus,,Circoviridae,1965018 -Human stool-associated circular virus NG13,Circovirus eniyan,Circovirus,Circoviridae,743300 -Indian encephalitis associated cyclovirus,Cyclovirus manusyan,Cyclovirus,Circoviridae,1755290 -Betacoronavirus England 1,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1263720 -Human coronavirus HKU1,Human coronavirus HKU1,Betacoronavirus,Coronaviridae,290028 -Middle East respiratory syndrome-related coronavirus,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1335626 -SARS coronavirus Tor2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,227984 -Severe acute respiratory syndrome coronavirus 2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,2697049 -Bundibugyo ebolavirus,Orthoebolavirus bundibugyoense,Orthoebolavirus,Filoviridae,565995 -Orthomarburgvirus marburgense,Orthomarburgvirus marburgense,Orthomarburgvirus,Filoviridae,3052505 -Sudan ebolavirus,Orthoebolavirus sudanense,Orthoebolavirus,Filoviridae,186540 -Tai Forest ebolavirus,Orthoebolavirus taiense,Orthoebolavirus,Filoviridae,186541 -Hepacivirus platyrrhini,Hepacivirus platyrrhini,Hepacivirus,Flaviviridae,3052236 -Hepatitis C virus genotype 3,Hepacivirus hominis,Hepacivirus,Flaviviridae,356114 -Hepatitis C virus genotype 4,Hepacivirus hominis,Hepacivirus,Flaviviridae,33745 -Hepatitis C virus genotype 5,Hepacivirus hominis,Hepacivirus,Flaviviridae,33746 -Hepatitis C virus genotype 7,Hepacivirus hominis,Hepacivirus,Flaviviridae,1544901 -Human hepegivirus,Pegivirus columbiaense,Pegivirus,Flaviviridae,1704090 -Human pegivirus 2,Pegivirus columbiaense,Pegivirus,Flaviviridae,1729141 -Zika virus,Orthoflavivirus zikaense,Orthoflavivirus,Flaviviridae,64320 -Gemycircularvirus C1c,Gemykibivirus humas3,Gemykibivirus,Genomoviridae,1673681 -Gemycircularvirus HV-GcV1,Gemycircularvirus HV-GcV1,Gemycircularvirus,Genomoviridae,1862824 -Gemycircularvirus HV-GcV2,Gemykibivirus humas5,Gemykibivirus,Genomoviridae,1862825 -Gemycircularvirus sp.,Gemycircularvirus sp.,Gemycircularvirus,Genomoviridae,1983771 -Human associated gemyvongvirus 1,Gemyvongvirus humas1,Gemyvongvirus,Genomoviridae,1985415 -Human gemycircularvirus GeTz1,Gemykibivirus humas4,Gemykibivirus,Genomoviridae,1792832 -Human genital-associated circular DNA virus-1,Gemygorvirus sewopo1,Gemygorvirus,Genomoviridae,1488574 -Orthohantavirus sinnombreense,Orthohantavirus sinnombreense,Orthohantavirus,Hantaviridae,3052499 -Rubella virus,Rubivirus rubellae,Rubivirus,Matonaviridae,11041 -Beiji nairovirus,Beiji nairovirus,Orthonairovirus,Nairoviridae,2304647 -Songling virus,Songling virus,Orthonairovirus,Nairoviridae,2795181 -Yezo virus,Yezo virus,Orthonairovirus,Nairoviridae,2825847 -Human alphaherpesvirus 2,Simplexvirus humanalpha2,Simplexvirus,Orthoherpesviridae,10310 -Human alphaherpesvirus 3,Varicellovirus humanalpha3,Varicellovirus,Orthoherpesviridae,10335 -Human betaherpesvirus 5,Cytomegalovirus humanbeta5,Cytomegalovirus,Orthoherpesviridae,10359 -Human betaherpesvirus 6A,Roseolovirus humanbeta6a,Roseolovirus,Orthoherpesviridae,32603 -Human betaherpesvirus 6B,Roseolovirus humanbeta6b,Roseolovirus,Orthoherpesviridae,32604 -Human betaherpesvirus 7,Roseolovirus humanbeta7,Roseolovirus,Orthoherpesviridae,10372 -human gammaherpesvirus 4,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,10376 -Human gammaherpesvirus 8,Rhadinovirus humangamma8,Rhadinovirus,Orthoherpesviridae,37296 -Human herpesvirus 4 type 2,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,12509 -Influenza A virus (A/California/07/2009(H1N1)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,641809 -Influenza A virus (A/New York/392/2004(H3N2)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,335341 -Influenza A virus (A/Shanghai/02/2013(H7N9)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,1332244 -Gammapapillomavirus sp.,Gammapapillomavirus sp.,Gammapapillomavirus,Papillomaviridae,2049444 -Human papillomavirus,Human papillomavirus,,Papillomaviridae,10566 -Human papillomavirus 116,Gammapapillomavirus 9,Gammapapillomavirus,Papillomaviridae,915428 -Human papillomavirus 121,Gammapapillomavirus 10,Gammapapillomavirus,Papillomaviridae,915429 -Human papillomavirus 126,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1055684 -Human papillomavirus 127,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,746832 -Human papillomavirus 132,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,909331 -Human papillomavirus 134,Gammapapillomavirus 7,Gammapapillomavirus,Papillomaviridae,909333 -Human papillomavirus 135,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1070408 -Human papillomavirus 136,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070409 -Human papillomavirus 140,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070413 -Human papillomavirus 154,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1195796 -human papillomavirus 166,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315259 -Human papillomavirus 167,Gammapapillomavirus 21,Gammapapillomavirus,Papillomaviridae,1420545 -Human papillomavirus 172,Gammapapillomavirus 22,Gammapapillomavirus,Papillomaviridae,1434987 -Human papillomavirus 175,Gammapapillomavirus 23,Gammapapillomavirus,Papillomaviridae,1434782 -Human papillomavirus 178,Gammapapillomavirus 24,Gammapapillomavirus,Papillomaviridae,1478160 -Human papillomavirus 179,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1472342 -Human papillomavirus 184,Gammapapillomavirus 25,Gammapapillomavirus,Papillomaviridae,1472343 -Human papillomavirus 187,Gammapapillomavirus 26,Gammapapillomavirus,Papillomaviridae,1851130 -Human papillomavirus 201,Gammapapillomavirus 27,Gammapapillomavirus,Papillomaviridae,1682340 -Human papillomavirus 204,Mupapillomavirus 3,Mupapillomavirus,Papillomaviridae,1650736 -Human papillomavirus KC5,Human papillomavirus KC5,Gammapapillomavirus,Papillomaviridae,1647924 -Human papillomavirus type 161,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315264 -Human papillomavirus type 85,Human papillomavirus type 85,,Papillomaviridae,652810 -Sosuga virus,Pararubulavirus sosugaense,Pararubulavirus,Paramyxoviridae,1452514 -Bocaparvovirus primate1,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,3052040 -Bufavirus-3,Bufavirus-3,,Parvoviridae,1391667 -Cutavirus,Protoparvovirus primate3,Protoparvovirus,Parvoviridae,1867125 -Human bocavirus 2c PK,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511882 -Human bocavirus 3,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,638313 -Human bocavirus 4 NI,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511883 -Human erythrovirus V9,Human erythrovirus V9,Erythroparvovirus,Parvoviridae,72197 -Human parvovirus 4 G1,Tetraparvovirus primate1,Tetraparvovirus,Parvoviridae,1511919 -Parvovirus NIH-CQV,Parvovirus NIH-CQV,,Parvoviridae,1341019 -Orthobunyavirus bwambaense,Orthobunyavirus bwambaense,Orthobunyavirus,Peribunyaviridae,3052384 -Catu virus,Orthobunyavirus catuense,Orthobunyavirus,Peribunyaviridae,1678225 -Fort Sherman virus,Orthobunyavirus shermanense,Orthobunyavirus,Peribunyaviridae,273345 -Guaroa virus,Orthobunyavirus guaroaense,Orthobunyavirus,Peribunyaviridae,80941 -Ilesha virus,Orthobunyavirus ileshaense,Orthobunyavirus,Peribunyaviridae,273341 -Madrid virus,Orthobunyavirus madridense,Orthobunyavirus,Peribunyaviridae,348013 -Alenquer virus,Phlebovirus alenquerense,Phlebovirus,Phenuiviridae,629726 -Chandiru virus,Phlebovirus candiruense,Phlebovirus,Phenuiviridae,629725 -Cocle virus,Phlebovirus cocleense,Phlebovirus,Phenuiviridae,1649829 -Dar es Salaam virus TZ-189,Tanzavirus daressalaamense,Tanzavirus,Phenuiviridae,2576944 -Echarate virus,Phlebovirus echarateense,Phlebovirus,Phenuiviridae,1000646 -Heartland virus,Bandavirus heartlandense,Bandavirus,Phenuiviridae,1216928 -Maldonado virus,Phlebovirus maldonadoense,Phlebovirus,Phenuiviridae,1004889 -Punta Toro virus,Phlebovirus toroense,Phlebovirus,Phenuiviridae,11587 -Sandfly fever Turkey virus,Phlebovirus siciliaense,Phlebovirus,Phenuiviridae,688699 -Severe fever with thrombocytopenia virus,Bandavirus dabieense,Bandavirus,Phenuiviridae,1003835 -SFTS virus HB29,Bandavirus dabieense,Bandavirus,Phenuiviridae,992212 -aichivirus A1,Aichivirus A,Kobuvirus,Picornaviridae,1313215 -Cosavirus A,Cosavirus A,Cosavirus,Picornaviridae,1330491 -Cosavirus D,Cosavirus D,Cosavirus,Picornaviridae,2003650 -Cosavirus E,Cosavirus E,Cosavirus,Picornaviridae,2003651 -Cosavirus F,Cosavirus F,Cosavirus,Picornaviridae,2003652 -Cosavirus JMY-2014,Cosavirus JMY-2014,Cosavirus,Picornaviridae,1582094 -Coxsackievirus B3,Enterovirus B,Enterovirus,Picornaviridae,12072 -enterovirus A114,Enterovirus A,Enterovirus,Picornaviridae,2760809 -Human cosavirus,Human cosavirus,Cosavirus,Picornaviridae,1233383 -Human cosavirus B,Cosavirus B,Cosavirus,Picornaviridae,586420 -rosavirus A2,Rosavirus A,Rosavirus,Picornaviridae,1511807 -Salivirus A,Salivirus A,Salivirus,Picornaviridae,1330524 -Salivirus FHB,Salivirus FHB,Salivirus,Picornaviridae,1547495 -Salivirus NG-J1,Salivirus A,Salivirus,Picornaviridae,651733 -Human polyomavirus 6,Deltapolyomavirus sextihominis,Deltapolyomavirus,Polyomaviridae,746830 -Human polyomavirus 7,Deltapolyomavirus septihominis,Deltapolyomavirus,Polyomaviridae,746831 -Human polyomavirus 9,Alphapolyomavirus nonihominis,Alphapolyomavirus,Polyomaviridae,943908 -LI polyomavirus,Alphapolyomavirus quardecihominis,Alphapolyomavirus,Polyomaviridae,1965344 -Merkel cell polyomavirus,Alphapolyomavirus quintihominis,Alphapolyomavirus,Polyomaviridae,493803 -MW polyomavirus,Deltapolyomavirus decihominis,Deltapolyomavirus,Polyomaviridae,1203539 -New Jersey polyomavirus-2013,Alphapolyomavirus terdecihominis,Alphapolyomavirus,Polyomaviridae,1497391 -STL polyomavirus,Deltapolyomavirus undecihominis,Deltapolyomavirus,Polyomaviridae,1277649 -Trichodysplasia spinulosa-associated polyomavirus,Alphapolyomavirus octihominis,Alphapolyomavirus,Polyomaviridae,862909 -Akhmeta virus,Akhmeta virus,Orthopoxvirus,Poxviridae,2200830 -Monkeypox virus,Monkeypox virus,Orthopoxvirus,Poxviridae,10244 -NY_014 poxvirus,NY_014 poxvirus,Centapoxvirus,Poxviridae,2025360 -Human lung-associated vientovirus FB,Vientovirus,Torbevirus,Redondoviridae,2571082 -Central cimpanzee simian foamy virus,Central cimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170194 -Eastern chimpanzee simian foamy virus,Eastern chimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170195 -Guenon simian foamy virus,Guenon simian foamy virus,Simiispumavirus,Retroviridae,2170197 -Human endogenous retrovirus K113,Human endogenous retrovirus K,,Retroviridae,166122 -Human immunodeficiency virus 1,Human immunodeficiency virus 1,Lentivirus,Retroviridae,11676 -Human immunodeficiency virus 2,Human immunodeficiency virus 2,Lentivirus,Retroviridae,11709 -Human T-lymphotropic virus 4,Human T-lymphotropic virus 4,Deltaretrovirus,Retroviridae,318279 -Tibrovirus congo,Tibrovirus congo,Tibrovirus,Rhabdoviridae,1987017 -Chandipura virus,Vesiculovirus chandipura,Vesiculovirus,Rhabdoviridae,11272 -Lyssavirus duvenhage,Lyssavirus duvenhage,Lyssavirus,Rhabdoviridae,38767 -Ekpoma virus 1,Tibrovirus alphaekpoma,Tibrovirus,Rhabdoviridae,1987020 -Ekpoma virus 2,Tibrovirus betaekpoma,Tibrovirus,Rhabdoviridae,1987021 -European bat lyssavirus 2,Lyssavirus helsinki,Lyssavirus,Rhabdoviridae,57483 -Le Dantec virus,Ledantevirus ledantec,Ledantevirus,Rhabdoviridae,318848 -Mundri virus,Mundri virus,,Rhabdoviridae,2913478 -Lebombo virus,Lebombo virus,Orbivirus,Sedoreoviridae,40057 -Orungo virus,Orungo virus,Orbivirus,Sedoreoviridae,40058 -Human associated huchismacovirus 1,Human associated huchismacovirus 1,Huchismacovirus,Smacoviridae,2169934 -Human associated huchismacovirus 2,Human associated huchismacovirus 2,Huchismacovirus,Smacoviridae,2169935 -Human associated huchismacovirus 3,Human associated huchismacovirus 3,Huchismacovirus,Smacoviridae,2169936 -Human associated porprismacovirus,Inpeasmacovirus humas1,Inpeasmacovirus,Smacoviridae,2530494 -Human associated porprismacovirus 3,Porprismacovirus humas4,Porprismacovirus,Smacoviridae,2496633 -Human feces smacovirus 2,Porprismacovirus humas1,Porprismacovirus,Smacoviridae,1820158 -Human feces smacovirus 3,Porprismacovirus humas3,Porprismacovirus,Smacoviridae,1820159 -Human smacovirus 1,Human smacovirus 1,Huchismacovirus,Smacoviridae,1595998 -Mammalian orthoreovirus 3 Dearing,Mammalian orthoreovirus,Orthoreovirus,Spinareoviridae,10886 -Ross River virus,Ross River virus,Alphavirus,Togaviridae,11029 -Circo-like virus-Brazil hs1,Circo-like virus-Brazil,,,1346815 -Hudisavirus sp.,Hudisavirus sp.,,,2021738 -West Nile virus strain NY-99,West Nile virus,Flavivirus,Flaviviridae,1968826 -BK polyomavirus MM,BK polyomavirus,Betapolyomavirus,Polyomaviridae,1417981 -Banana virus X,Banna virus,Bannavirus,Reoviridae,307671 -Bombali virus,Ebolavirus,Ebolavirus,Filoviridae,2010960 -Bourbon virus,Bourbon virus,Thogotovirus,Orthomyxoviridae,1618189 -Dhori virus (strain Indian/1313/61),Dhori virus,Thogotovirus,Orthomyxoviridae,11319 -Encephalomyocarditis virus,Encephalomyocarditis virus,Cardiovirus,Picornaviridae,12104 -Eyach virus,Eyach virus,Coltivirus,Reoviridae,62352 -Henipavirus hendraense,Hendra virus,Henipavirus,Paramyxoviridae,3052223 -Henipavirus nipahense,Nipah virus,Henipavirus,Paramyxoviridae,3052225 -Hepatitis B virus,Hepatitis B virus,Orthohepadnavirus,Hepadnaviridae,10407 -Hepatitis delta virus,Hepatitis delta virus,Deltavirus,Deltaflexiviridae,12475 -Hepatovirus A,Hepatitis A virus,Hepatovirus,Picornaviridae,12092 -Human foamy virus,Human foamy virus,Spumavirus,Retroviridae,11641 -human metapneumovirus,Human metapneumovirus,Metapneumovirus,Paramyxoviridae,162145 -Human orthorubulavirus 2,Human orthorubulavirus 2,Orthorubulavirus,Paramyxoviridae,2560525 -Human papillomavirus,Human papillomavirus,Papillomavirus,Papillomaviridae,10566 -Betapolyomavirus tertihominis,KI Polyomavirus,Betapolyomavirus,Polyomaviridae,1891764 -Human respirovirus 1,Human Respirovirus 1,Respirovirus,Paramyxoviridae,12730 -Human respirovirus 3,Human Respirovirus 3,Respirovirus,Paramyxoviridae,11216 -Human torovirus,Human torovirus,Torovirus,Toroviridae,67605 -Influenza B virus (B/Lee/1940),Influenza B virus,Betainfluenzavirus,Orthomyxoviridae,518987 -Influenza C virus (C/Ann Arbor/1/50),Influenza C virus,Gammainfluenzavirus,Orthomyxoviridae,11553 -Japanese encephalitis virus,Japanese encephalitis virus,Flavivirus,Flaviviridae,11072 -Measles morbillivirus,Morbillivirus,Morbillivirus,Paramyxoviridae,11234 -Merkel cell polyomavirus,Merkel cell polyomavirus,Orthopolyomavirus,Polyomaviridae,493803 -Molluscum contagiosum virus subtype 1,Molluscum contagiosum virus,Molluscipoxvirus,Poxviridae,10280 -Mumps orthorubulaviru,Mumps virus,Orthorubulavirus,Paramyxoviridae,2560602 -Murray Valley encephalitis virus,Murray valley encephalitis virus,Flavivirus,Flaviviridae,11079 -Orf virus,Orf virus,Parapoxvirus,Poxviridae,10258 -Orthomarburgvirus marburgense,Lake Victoria marburgvirus,Marburgvirus,Filoviridae,3052505 -Rotavirus A,Rotavirus A,Rotavirus,Reoviridae,28875 -Rotavirus C,Rotavirus C,Rotavirus,Reoviridae,36427 -St. Louis encephalitis virus,Saint Louis encephalitis virus,Flavivirus,Flaviviridae,11080 -Thogotovirus,Thogotovirus,Thogotovirus,Orthomyxoviridae,35323 -Tick-borne encephalitis virus,Tick-borne encephalitis virus,Flavivirus,Flaviviridae,11084 -Torque teno virus 6,Torque teno virus,Anellovirus,Anelloviridae,687345 -WU Polyomavirus,WU polyomavirus,Betapolyomavirus,Polyomaviridae,440266 -Yaba monkey tumor virus,Yaba monkey tumor virus,Yatapoxvirus,Poxviridae,38804 -Yaba-like disease virus,Yaba-like disease virus,Yatapoxvirus,Poxviridae,132475 -Zika virus,Zika virus,Flavivirus,Flaviviridae,64320 -dengue virus type 1,Dengue virus,Flavivirus,Flaviviridae,11053 \ No newline at end of file +Organism_Name,Species,Genus,Family,Taxid +Human mastadenovirus A,Human mastadenovirus A,Mastadenovirus,Adenoviridae,129875 +Human mastadenovirus B,Human mastadenovirus B,Mastadenovirus,Adenoviridae,108098 +Human mastadenovirus C,Human mastadenovirus C,Mastadenovirus,Adenoviridae,129951 +Human mastadenovirus D,Human mastadenovirus D,Mastadenovirus,Adenoviridae,130310 +Human mastadenovirus F,Human mastadenovirus F,Mastadenovirus,Adenoviridae,130309 +Anelloviridae sp.,Anelloviridae sp.,,Anelloviridae,2055263 +Gyrovirus 4,Gyrovirus homsa3,Gyrovirus,Anelloviridae,1214955 +Gyrovirus GyV3,Gyrovirus homsa1,Gyrovirus,Anelloviridae,1163715 +Gyrovirus Tu243,Gyrovirus homsa4,Gyrovirus,Anelloviridae,1415627 +Gyrovirus Tu789,Gyrovirus homsa2,Gyrovirus,Anelloviridae,1415628 +Small anellovirus 1,Small anellovirus,,Anelloviridae,289366 +Small anellovirus 2,Small anellovirus,,Anelloviridae,289367 +Torque teno midi virus 1,Gammatorquevirus homidi1,Gammatorquevirus,Anelloviridae,687379 +Torque teno midi virus 10,Gammatorquevirus homidi10,Gammatorquevirus,Anelloviridae,2065051 +Torque teno midi virus 11,Gammatorquevirus homidi11,Gammatorquevirus,Anelloviridae,2065052 +Torque teno midi virus 12,Gammatorquevirus homidi12,Gammatorquevirus,Anelloviridae,2065053 +Torque teno midi virus 13,Gammatorquevirus homidi13,Gammatorquevirus,Anelloviridae,2065054 +Torque teno midi virus 14,Gammatorquevirus homidi14,Gammatorquevirus,Anelloviridae,2065055 +Torque teno midi virus 2,Gammatorquevirus homidi2,Gammatorquevirus,Anelloviridae,687380 +Torque teno midi virus 3,Gammatorquevirus homidi3,Gammatorquevirus,Anelloviridae,2065044 +Torque teno midi virus 4,Gammatorquevirus homidi4,Gammatorquevirus,Anelloviridae,2065045 +Torque teno midi virus 5,Gammatorquevirus homidi5,Gammatorquevirus,Anelloviridae,2065046 +Torque teno midi virus 6,Gammatorquevirus homidi6,Gammatorquevirus,Anelloviridae,2065047 +Torque teno midi virus 7,Gammatorquevirus homidi7,Gammatorquevirus,Anelloviridae,2065048 +Torque teno midi virus 8,Gammatorquevirus homidi8,Gammatorquevirus,Anelloviridae,2065049 +Torque teno midi virus 9,Gammatorquevirus homidi9,Gammatorquevirus,Anelloviridae,2065050 +Torque teno mini virus 1,Betatorquevirus homini1,Betatorquevirus,Anelloviridae,687369 +Torque teno mini virus 10,Betatorquevirus homini10,Betatorquevirus,Anelloviridae,2065036 +Torque teno mini virus 11,Betatorquevirus homini11,Betatorquevirus,Anelloviridae,2065037 +Torque teno mini virus 12,Betatorquevirus homini12,Betatorquevirus,Anelloviridae,2065038 +Torque teno mini virus 18,Betatorquevirus homini18,Betatorquevirus,Anelloviridae,1859149 +Torque teno mini virus 5,Betatorquevirus homini5,Betatorquevirus,Anelloviridae,687373 +Torque teno mini virus 6,Betatorquevirus homini6,Betatorquevirus,Anelloviridae,687374 +Torque teno mini virus 8,Betatorquevirus homini8,Betatorquevirus,Anelloviridae,687376 +Torque teno mini virus ALA22,Betatorquevirus homini27,Betatorquevirus,Anelloviridae,1535290 +Torque teno mini virus ALH8,Betatorquevirus homini16,Betatorquevirus,Anelloviridae,1535291 +Torque teno mini virus SHA,Betatorquevirus homini26,Betatorquevirus,Anelloviridae,2057931 +Torque teno virus,Torque teno virus,,Anelloviridae,68887 +Torque teno virus 9,Alphatorquevirus homin9,Alphatorquevirus,Anelloviridae,687348 +TTV-like mini virus,TTV-like mini virus,Betatorquevirus,Anelloviridae,93678 +Mammarenavirus chapareense,Mammarenavirus chapareense,Mammarenavirus,Arenaviridae,3052302 +Mammarenavirus lujoense,Mammarenavirus lujoense,Mammarenavirus,Arenaviridae,3052314 +Astrovirus MLB2,Astrovirus MLB2,,Astroviridae,683172 +Astrovirus MLB3,Astrovirus MLB3,,Astroviridae,1247114 +Astrovirus VA1,Mamastrovirus 9,Mamastrovirus,Astroviridae,645687 +Astrovirus VA3,Astrovirus VA3,,Astroviridae,683174 +Astrovirus VA4,Astrovirus VA4,,Astroviridae,1247113 +Bastrovirus 7,Bastrovirus BAS-1,,Astroviridae,1803394 +HMO Astrovirus A,HMO Astrovirus A,Mamastrovirus,Astroviridae,682382 +Human astrovirus BF34,Burkina Faso astrovirus,Mamastrovirus,Astroviridae,1518575 +Norovirus GI,Norwalk virus,Norovirus,Caliciviridae,122928 +Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866,Norwalk virus,Norovirus,Caliciviridae,1529909 +Norovirus GII,Norwalk virus,Norovirus,Caliciviridae,122929 +Norovirus GII.17,Norwalk virus,Norovirus,Caliciviridae,552592 +Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299,Norwalk virus,Norovirus,Caliciviridae,1529918 +Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS,Norwalk virus,Norovirus,Caliciviridae,1529924 +Norovirus GIV,Norwalk virus,Norovirus,Caliciviridae,262897 +Sapovirus Hu/GI/Sapporo/MT-2010/1982,Sapporo virus,Sapovirus,Caliciviridae,758863 +Cyclovirus NG12,Cyclovirus mmadu,Cyclovirus,Circoviridae,742922 +Cyclovirus NG14,Cyclovirus mutum,Cyclovirus,Circoviridae,742923 +Cyclovirus PK5006,Cyclovirus insaan,Cyclovirus,Circoviridae,742915 +Cyclovirus PK5034,Cyclovirus homa,Cyclovirus,Circoviridae,742916 +Cyclovirus PK5222,Cyclovirus manukha,Cyclovirus,Circoviridae,742917 +Cyclovirus PK5510,Cyclovirus maanav,Cyclovirus,Circoviridae,742918 +Cyclovirus SL-108277,Cyclovirus manitan,Cyclovirus,Circoviridae,1520935 +Cyclovirus TN25,Cyclovirus bashri,Cyclovirus,Circoviridae,742924 +Cyclovirus VN,Cyclovirus nhanloai,Cyclovirus,Circoviridae,1348500 +Human associated cyclovirus 10,Cyclovirus humana,Cyclovirus,Circoviridae,2038728 +Human circovirus VS6600022,Human circovirus VS6600022,Circovirus,Circoviridae,1525173 +Human cyclovirus VS5700009,Cyclovirus munthu,Cyclovirus,Circoviridae,1345637 +Human fecal virus Jorvi2,Human fecal virus Jorvi2,,Circoviridae,2017081 +Human fecal virus Jorvi3,Human fecal virus Jorvi3,,Circoviridae,2017082 +Human fecal virus Jorvi4,Human fecal virus Jorvi4,,Circoviridae,2017083 +Human PoSCV5-like circular virus,Human PoSCV5-like circular virus,,Circoviridae,1965018 +Human stool-associated circular virus NG13,Circovirus eniyan,Circovirus,Circoviridae,743300 +Indian encephalitis associated cyclovirus,Cyclovirus manusyan,Cyclovirus,Circoviridae,1755290 +Betacoronavirus England 1,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1263720 +Human coronavirus HKU1,Human coronavirus HKU1,Betacoronavirus,Coronaviridae,290028 +Middle East respiratory syndrome-related coronavirus,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1335626 +SARS coronavirus Tor2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,227984 +Severe acute respiratory syndrome coronavirus 2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,2697049 +Bundibugyo ebolavirus,Orthoebolavirus bundibugyoense,Orthoebolavirus,Filoviridae,565995 +Orthomarburgvirus marburgense,Orthomarburgvirus marburgense,Orthomarburgvirus,Filoviridae,3052505 +Sudan ebolavirus,Orthoebolavirus sudanense,Orthoebolavirus,Filoviridae,186540 +Tai Forest ebolavirus,Orthoebolavirus taiense,Orthoebolavirus,Filoviridae,186541 +Hepacivirus platyrrhini,Hepacivirus platyrrhini,Hepacivirus,Flaviviridae,3052236 +Hepatitis C virus genotype 3,Hepacivirus hominis,Hepacivirus,Flaviviridae,356114 +Hepatitis C virus genotype 4,Hepacivirus hominis,Hepacivirus,Flaviviridae,33745 +Hepatitis C virus genotype 5,Hepacivirus hominis,Hepacivirus,Flaviviridae,33746 +Hepatitis C virus genotype 7,Hepacivirus hominis,Hepacivirus,Flaviviridae,1544901 +Human hepegivirus,Pegivirus columbiaense,Pegivirus,Flaviviridae,1704090 +Human pegivirus 2,Pegivirus columbiaense,Pegivirus,Flaviviridae,1729141 +Zika virus,Orthoflavivirus zikaense,Orthoflavivirus,Flaviviridae,64320 +Gemycircularvirus C1c,Gemykibivirus humas3,Gemykibivirus,Genomoviridae,1673681 +Gemycircularvirus HV-GcV1,Gemycircularvirus HV-GcV1,Gemycircularvirus,Genomoviridae,1862824 +Gemycircularvirus HV-GcV2,Gemykibivirus humas5,Gemykibivirus,Genomoviridae,1862825 +Gemycircularvirus sp.,Gemycircularvirus sp.,Gemycircularvirus,Genomoviridae,1983771 +Human associated gemyvongvirus 1,Gemyvongvirus humas1,Gemyvongvirus,Genomoviridae,1985415 +Human gemycircularvirus GeTz1,Gemykibivirus humas4,Gemykibivirus,Genomoviridae,1792832 +Human genital-associated circular DNA virus-1,Gemygorvirus sewopo1,Gemygorvirus,Genomoviridae,1488574 +Orthohantavirus sinnombreense,Orthohantavirus sinnombreense,Orthohantavirus,Hantaviridae,3052499 +Rubella virus,Rubivirus rubellae,Rubivirus,Matonaviridae,11041 +Beiji nairovirus,Beiji nairovirus,Orthonairovirus,Nairoviridae,2304647 +Songling virus,Songling virus,Orthonairovirus,Nairoviridae,2795181 +Yezo virus,Yezo virus,Orthonairovirus,Nairoviridae,2825847 +Human alphaherpesvirus 2,Simplexvirus humanalpha2,Simplexvirus,Orthoherpesviridae,10310 +Human alphaherpesvirus 3,Varicellovirus humanalpha3,Varicellovirus,Orthoherpesviridae,10335 +Human betaherpesvirus 5,Cytomegalovirus humanbeta5,Cytomegalovirus,Orthoherpesviridae,10359 +Human betaherpesvirus 6A,Roseolovirus humanbeta6a,Roseolovirus,Orthoherpesviridae,32603 +Human betaherpesvirus 6B,Roseolovirus humanbeta6b,Roseolovirus,Orthoherpesviridae,32604 +Human betaherpesvirus 7,Roseolovirus humanbeta7,Roseolovirus,Orthoherpesviridae,10372 +human gammaherpesvirus 4,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,10376 +Human gammaherpesvirus 8,Rhadinovirus humangamma8,Rhadinovirus,Orthoherpesviridae,37296 +Human herpesvirus 4 type 2,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,12509 +Influenza A virus (A/California/07/2009(H1N1)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,641809 +Influenza A virus (A/New York/392/2004(H3N2)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,335341 +Influenza A virus (A/Shanghai/02/2013(H7N9)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,1332244 +Gammapapillomavirus sp.,Gammapapillomavirus sp.,Gammapapillomavirus,Papillomaviridae,2049444 +Human papillomavirus,Human papillomavirus,,Papillomaviridae,10566 +Human papillomavirus 116,Gammapapillomavirus 9,Gammapapillomavirus,Papillomaviridae,915428 +Human papillomavirus 121,Gammapapillomavirus 10,Gammapapillomavirus,Papillomaviridae,915429 +Human papillomavirus 126,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1055684 +Human papillomavirus 127,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,746832 +Human papillomavirus 132,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,909331 +Human papillomavirus 134,Gammapapillomavirus 7,Gammapapillomavirus,Papillomaviridae,909333 +Human papillomavirus 135,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1070408 +Human papillomavirus 136,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070409 +Human papillomavirus 140,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070413 +Human papillomavirus 154,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1195796 +human papillomavirus 166,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315259 +Human papillomavirus 167,Gammapapillomavirus 21,Gammapapillomavirus,Papillomaviridae,1420545 +Human papillomavirus 172,Gammapapillomavirus 22,Gammapapillomavirus,Papillomaviridae,1434987 +Human papillomavirus 175,Gammapapillomavirus 23,Gammapapillomavirus,Papillomaviridae,1434782 +Human papillomavirus 178,Gammapapillomavirus 24,Gammapapillomavirus,Papillomaviridae,1478160 +Human papillomavirus 179,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1472342 +Human papillomavirus 184,Gammapapillomavirus 25,Gammapapillomavirus,Papillomaviridae,1472343 +Human papillomavirus 187,Gammapapillomavirus 26,Gammapapillomavirus,Papillomaviridae,1851130 +Human papillomavirus 201,Gammapapillomavirus 27,Gammapapillomavirus,Papillomaviridae,1682340 +Human papillomavirus 204,Mupapillomavirus 3,Mupapillomavirus,Papillomaviridae,1650736 +Human papillomavirus KC5,Human papillomavirus KC5,Gammapapillomavirus,Papillomaviridae,1647924 +Human papillomavirus type 161,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315264 +Human papillomavirus type 85,Human papillomavirus type 85,,Papillomaviridae,652810 +Sosuga virus,Pararubulavirus sosugaense,Pararubulavirus,Paramyxoviridae,1452514 +Bocaparvovirus primate1,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,3052040 +Bufavirus-3,Bufavirus-3,,Parvoviridae,1391667 +Cutavirus,Protoparvovirus primate3,Protoparvovirus,Parvoviridae,1867125 +Human bocavirus 2c PK,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511882 +Human bocavirus 3,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,638313 +Human bocavirus 4 NI,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511883 +Human erythrovirus V9,Human erythrovirus V9,Erythroparvovirus,Parvoviridae,72197 +Human parvovirus 4 G1,Tetraparvovirus primate1,Tetraparvovirus,Parvoviridae,1511919 +Parvovirus NIH-CQV,Parvovirus NIH-CQV,,Parvoviridae,1341019 +Orthobunyavirus bwambaense,Orthobunyavirus bwambaense,Orthobunyavirus,Peribunyaviridae,3052384 +Catu virus,Orthobunyavirus catuense,Orthobunyavirus,Peribunyaviridae,1678225 +Fort Sherman virus,Orthobunyavirus shermanense,Orthobunyavirus,Peribunyaviridae,273345 +Guaroa virus,Orthobunyavirus guaroaense,Orthobunyavirus,Peribunyaviridae,80941 +Ilesha virus,Orthobunyavirus ileshaense,Orthobunyavirus,Peribunyaviridae,273341 +Madrid virus,Orthobunyavirus madridense,Orthobunyavirus,Peribunyaviridae,348013 +Alenquer virus,Phlebovirus alenquerense,Phlebovirus,Phenuiviridae,629726 +Chandiru virus,Phlebovirus candiruense,Phlebovirus,Phenuiviridae,629725 +Cocle virus,Phlebovirus cocleense,Phlebovirus,Phenuiviridae,1649829 +Dar es Salaam virus TZ-189,Tanzavirus daressalaamense,Tanzavirus,Phenuiviridae,2576944 +Echarate virus,Phlebovirus echarateense,Phlebovirus,Phenuiviridae,1000646 +Heartland virus,Bandavirus heartlandense,Bandavirus,Phenuiviridae,1216928 +Maldonado virus,Phlebovirus maldonadoense,Phlebovirus,Phenuiviridae,1004889 +Punta Toro virus,Phlebovirus toroense,Phlebovirus,Phenuiviridae,11587 +Sandfly fever Turkey virus,Phlebovirus siciliaense,Phlebovirus,Phenuiviridae,688699 +Severe fever with thrombocytopenia virus,Bandavirus dabieense,Bandavirus,Phenuiviridae,1003835 +SFTS virus HB29,Bandavirus dabieense,Bandavirus,Phenuiviridae,992212 +aichivirus A1,Aichivirus A,Kobuvirus,Picornaviridae,1313215 +Cosavirus A,Cosavirus A,Cosavirus,Picornaviridae,1330491 +Cosavirus D,Cosavirus D,Cosavirus,Picornaviridae,2003650 +Cosavirus E,Cosavirus E,Cosavirus,Picornaviridae,2003651 +Cosavirus F,Cosavirus F,Cosavirus,Picornaviridae,2003652 +Cosavirus JMY-2014,Cosavirus JMY-2014,Cosavirus,Picornaviridae,1582094 +Coxsackievirus B3,Enterovirus B,Enterovirus,Picornaviridae,12072 +enterovirus A114,Enterovirus A,Enterovirus,Picornaviridae,2760809 +Human cosavirus,Human cosavirus,Cosavirus,Picornaviridae,1233383 +Human cosavirus B,Cosavirus B,Cosavirus,Picornaviridae,586420 +rosavirus A2,Rosavirus A,Rosavirus,Picornaviridae,1511807 +Salivirus A,Salivirus A,Salivirus,Picornaviridae,1330524 +Salivirus FHB,Salivirus FHB,Salivirus,Picornaviridae,1547495 +Salivirus NG-J1,Salivirus A,Salivirus,Picornaviridae,651733 +Human polyomavirus 6,Deltapolyomavirus sextihominis,Deltapolyomavirus,Polyomaviridae,746830 +Human polyomavirus 7,Deltapolyomavirus septihominis,Deltapolyomavirus,Polyomaviridae,746831 +Human polyomavirus 9,Alphapolyomavirus nonihominis,Alphapolyomavirus,Polyomaviridae,943908 +LI polyomavirus,Alphapolyomavirus quardecihominis,Alphapolyomavirus,Polyomaviridae,1965344 +Merkel cell polyomavirus,Alphapolyomavirus quintihominis,Alphapolyomavirus,Polyomaviridae,493803 +MW polyomavirus,Deltapolyomavirus decihominis,Deltapolyomavirus,Polyomaviridae,1203539 +New Jersey polyomavirus-2013,Alphapolyomavirus terdecihominis,Alphapolyomavirus,Polyomaviridae,1497391 +STL polyomavirus,Deltapolyomavirus undecihominis,Deltapolyomavirus,Polyomaviridae,1277649 +Trichodysplasia spinulosa-associated polyomavirus,Alphapolyomavirus octihominis,Alphapolyomavirus,Polyomaviridae,862909 +Akhmeta virus,Akhmeta virus,Orthopoxvirus,Poxviridae,2200830 +Monkeypox virus,Monkeypox virus,Orthopoxvirus,Poxviridae,10244 +NY_014 poxvirus,NY_014 poxvirus,Centapoxvirus,Poxviridae,2025360 +Human lung-associated vientovirus FB,Vientovirus,Torbevirus,Redondoviridae,2571082 +Central cimpanzee simian foamy virus,Central cimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170194 +Eastern chimpanzee simian foamy virus,Eastern chimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170195 +Guenon simian foamy virus,Guenon simian foamy virus,Simiispumavirus,Retroviridae,2170197 +Human endogenous retrovirus K113,Human endogenous retrovirus K,,Retroviridae,166122 +Human immunodeficiency virus 1,Human immunodeficiency virus 1,Lentivirus,Retroviridae,11676 +Human immunodeficiency virus 2,Human immunodeficiency virus 2,Lentivirus,Retroviridae,11709 +Human T-lymphotropic virus 4,Human T-lymphotropic virus 4,Deltaretrovirus,Retroviridae,318279 +Tibrovirus congo,Tibrovirus congo,Tibrovirus,Rhabdoviridae,1987017 +Chandipura virus,Vesiculovirus chandipura,Vesiculovirus,Rhabdoviridae,11272 +Lyssavirus duvenhage,Lyssavirus duvenhage,Lyssavirus,Rhabdoviridae,38767 +Ekpoma virus 1,Tibrovirus alphaekpoma,Tibrovirus,Rhabdoviridae,1987020 +Ekpoma virus 2,Tibrovirus betaekpoma,Tibrovirus,Rhabdoviridae,1987021 +European bat lyssavirus 2,Lyssavirus helsinki,Lyssavirus,Rhabdoviridae,57483 +Le Dantec virus,Ledantevirus ledantec,Ledantevirus,Rhabdoviridae,318848 +Mundri virus,Mundri virus,,Rhabdoviridae,2913478 +Lebombo virus,Lebombo virus,Orbivirus,Sedoreoviridae,40057 +Orungo virus,Orungo virus,Orbivirus,Sedoreoviridae,40058 +Human associated huchismacovirus 1,Human associated huchismacovirus 1,Huchismacovirus,Smacoviridae,2169934 +Human associated huchismacovirus 2,Human associated huchismacovirus 2,Huchismacovirus,Smacoviridae,2169935 +Human associated huchismacovirus 3,Human associated huchismacovirus 3,Huchismacovirus,Smacoviridae,2169936 +Human associated porprismacovirus,Inpeasmacovirus humas1,Inpeasmacovirus,Smacoviridae,2530494 +Human associated porprismacovirus 3,Porprismacovirus humas4,Porprismacovirus,Smacoviridae,2496633 +Human feces smacovirus 2,Porprismacovirus humas1,Porprismacovirus,Smacoviridae,1820158 +Human feces smacovirus 3,Porprismacovirus humas3,Porprismacovirus,Smacoviridae,1820159 +Human smacovirus 1,Human smacovirus 1,Huchismacovirus,Smacoviridae,1595998 +Mammalian orthoreovirus 3 Dearing,Mammalian orthoreovirus,Orthoreovirus,Spinareoviridae,10886 +Ross River virus,Ross River virus,Alphavirus,Togaviridae,11029 +Circo-like virus-Brazil hs1,Circo-like virus-Brazil,,,1346815 +Hudisavirus sp.,Hudisavirus sp.,,,2021738 +West Nile virus strain NY-99,West Nile virus,Flavivirus,Flaviviridae,1968826 +BK polyomavirus MM,BK polyomavirus,Betapolyomavirus,Polyomaviridae,1417981 +Banana virus X,Banna virus,Bannavirus,Reoviridae,307671 +Bombali virus,Ebolavirus,Ebolavirus,Filoviridae,2010960 +Bourbon virus,Bourbon virus,Thogotovirus,Orthomyxoviridae,1618189 +Dhori virus (strain Indian/1313/61),Dhori virus,Thogotovirus,Orthomyxoviridae,11319 +Encephalomyocarditis virus,Encephalomyocarditis virus,Cardiovirus,Picornaviridae,12104 +Eyach virus,Eyach virus,Coltivirus,Reoviridae,62352 +Henipavirus hendraense,Hendra virus,Henipavirus,Paramyxoviridae,3052223 +Henipavirus nipahense,Nipah virus,Henipavirus,Paramyxoviridae,3052225 +Hepatitis B virus,Hepatitis B virus,Orthohepadnavirus,Hepadnaviridae,10407 +Hepatitis delta virus,Hepatitis delta virus,Deltavirus,Deltaflexiviridae,12475 +Hepatovirus A,Hepatitis A virus,Hepatovirus,Picornaviridae,12092 +Human foamy virus,Human foamy virus,Spumavirus,Retroviridae,11641 +human metapneumovirus,Human metapneumovirus,Metapneumovirus,Paramyxoviridae,162145 +Human orthorubulavirus 2,Human orthorubulavirus 2,Orthorubulavirus,Paramyxoviridae,2560525 +Human papillomavirus,Human papillomavirus,Papillomavirus,Papillomaviridae,10566 +Betapolyomavirus tertihominis,KI Polyomavirus,Betapolyomavirus,Polyomaviridae,1891764 +Human respirovirus 1,Human Respirovirus 1,Respirovirus,Paramyxoviridae,12730 +Human respirovirus 3,Human Respirovirus 3,Respirovirus,Paramyxoviridae,11216 +Human torovirus,Human torovirus,Torovirus,Toroviridae,67605 +Influenza B virus (B/Lee/1940),Influenza B virus,Betainfluenzavirus,Orthomyxoviridae,518987 +Influenza C virus (C/Ann Arbor/1/50),Influenza C virus,Gammainfluenzavirus,Orthomyxoviridae,11553 +Japanese encephalitis virus,Japanese encephalitis virus,Flavivirus,Flaviviridae,11072 +Measles morbillivirus,Morbillivirus,Morbillivirus,Paramyxoviridae,11234 +Merkel cell polyomavirus,Merkel cell polyomavirus,Orthopolyomavirus,Polyomaviridae,493803 +Molluscum contagiosum virus subtype 1,Molluscum contagiosum virus,Molluscipoxvirus,Poxviridae,10280 +Mumps orthorubulaviru,Mumps virus,Orthorubulavirus,Paramyxoviridae,2560602 +Murray Valley encephalitis virus,Murray valley encephalitis virus,Flavivirus,Flaviviridae,11079 +Orf virus,Orf virus,Parapoxvirus,Poxviridae,10258 +Orthomarburgvirus marburgense,Lake Victoria marburgvirus,Marburgvirus,Filoviridae,3052505 +Rotavirus A,Rotavirus A,Rotavirus,Reoviridae,28875 +Rotavirus C,Rotavirus C,Rotavirus,Reoviridae,36427 +St. Louis encephalitis virus,Saint Louis encephalitis virus,Flavivirus,Flaviviridae,11080 +Thogotovirus,Thogotovirus,Thogotovirus,Orthomyxoviridae,35323 +Tick-borne encephalitis virus,Tick-borne encephalitis virus,Flavivirus,Flaviviridae,11084 +Torque teno virus 6,Torque teno virus,Anellovirus,Anelloviridae,687345 +WU Polyomavirus,WU polyomavirus,Betapolyomavirus,Polyomaviridae,440266 +Yaba monkey tumor virus,Yaba monkey tumor virus,Yatapoxvirus,Poxviridae,38804 +Yaba-like disease virus,Yaba-like disease virus,Yatapoxvirus,Poxviridae,132475 +Zika virus,Zika virus,Flavivirus,Flaviviridae,64320 +dengue virus type 1,Dengue virus,Flavivirus,Flaviviridae,11053 From 70fa4630e5416dee5a1d8838b1eb4dd75a90faf9 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:02:09 +0200 Subject: [PATCH 03/25] update the pathogen list --- viral_pathogen_List.csv | 565 +++++++++++++++++++++------------------- 1 file changed, 297 insertions(+), 268 deletions(-) diff --git a/viral_pathogen_List.csv b/viral_pathogen_List.csv index 0f6b85d..940bbbe 100644 --- a/viral_pathogen_List.csv +++ b/viral_pathogen_List.csv @@ -1,268 +1,297 @@ -Organism_Name,Species,Genus,Family,Taxid -Human mastadenovirus A,Human mastadenovirus A,Mastadenovirus,Adenoviridae,129875 -Human mastadenovirus B,Human mastadenovirus B,Mastadenovirus,Adenoviridae,108098 -Human mastadenovirus C,Human mastadenovirus C,Mastadenovirus,Adenoviridae,129951 -Human mastadenovirus D,Human mastadenovirus D,Mastadenovirus,Adenoviridae,130310 -Human mastadenovirus F,Human mastadenovirus F,Mastadenovirus,Adenoviridae,130309 -Anelloviridae sp.,Anelloviridae sp.,,Anelloviridae,2055263 -Gyrovirus 4,Gyrovirus homsa3,Gyrovirus,Anelloviridae,1214955 -Gyrovirus GyV3,Gyrovirus homsa1,Gyrovirus,Anelloviridae,1163715 -Gyrovirus Tu243,Gyrovirus homsa4,Gyrovirus,Anelloviridae,1415627 -Gyrovirus Tu789,Gyrovirus homsa2,Gyrovirus,Anelloviridae,1415628 -Small anellovirus 1,Small anellovirus,,Anelloviridae,289366 -Small anellovirus 2,Small anellovirus,,Anelloviridae,289367 -Torque teno midi virus 1,Gammatorquevirus homidi1,Gammatorquevirus,Anelloviridae,687379 -Torque teno midi virus 10,Gammatorquevirus homidi10,Gammatorquevirus,Anelloviridae,2065051 -Torque teno midi virus 11,Gammatorquevirus homidi11,Gammatorquevirus,Anelloviridae,2065052 -Torque teno midi virus 12,Gammatorquevirus homidi12,Gammatorquevirus,Anelloviridae,2065053 -Torque teno midi virus 13,Gammatorquevirus homidi13,Gammatorquevirus,Anelloviridae,2065054 -Torque teno midi virus 14,Gammatorquevirus homidi14,Gammatorquevirus,Anelloviridae,2065055 -Torque teno midi virus 2,Gammatorquevirus homidi2,Gammatorquevirus,Anelloviridae,687380 -Torque teno midi virus 3,Gammatorquevirus homidi3,Gammatorquevirus,Anelloviridae,2065044 -Torque teno midi virus 4,Gammatorquevirus homidi4,Gammatorquevirus,Anelloviridae,2065045 -Torque teno midi virus 5,Gammatorquevirus homidi5,Gammatorquevirus,Anelloviridae,2065046 -Torque teno midi virus 6,Gammatorquevirus homidi6,Gammatorquevirus,Anelloviridae,2065047 -Torque teno midi virus 7,Gammatorquevirus homidi7,Gammatorquevirus,Anelloviridae,2065048 -Torque teno midi virus 8,Gammatorquevirus homidi8,Gammatorquevirus,Anelloviridae,2065049 -Torque teno midi virus 9,Gammatorquevirus homidi9,Gammatorquevirus,Anelloviridae,2065050 -Torque teno mini virus 1,Betatorquevirus homini1,Betatorquevirus,Anelloviridae,687369 -Torque teno mini virus 10,Betatorquevirus homini10,Betatorquevirus,Anelloviridae,2065036 -Torque teno mini virus 11,Betatorquevirus homini11,Betatorquevirus,Anelloviridae,2065037 -Torque teno mini virus 12,Betatorquevirus homini12,Betatorquevirus,Anelloviridae,2065038 -Torque teno mini virus 18,Betatorquevirus homini18,Betatorquevirus,Anelloviridae,1859149 -Torque teno mini virus 5,Betatorquevirus homini5,Betatorquevirus,Anelloviridae,687373 -Torque teno mini virus 6,Betatorquevirus homini6,Betatorquevirus,Anelloviridae,687374 -Torque teno mini virus 8,Betatorquevirus homini8,Betatorquevirus,Anelloviridae,687376 -Torque teno mini virus ALA22,Betatorquevirus homini27,Betatorquevirus,Anelloviridae,1535290 -Torque teno mini virus ALH8,Betatorquevirus homini16,Betatorquevirus,Anelloviridae,1535291 -Torque teno mini virus SHA,Betatorquevirus homini26,Betatorquevirus,Anelloviridae,2057931 -Torque teno virus,Torque teno virus,,Anelloviridae,68887 -Torque teno virus 9,Alphatorquevirus homin9,Alphatorquevirus,Anelloviridae,687348 -TTV-like mini virus,TTV-like mini virus,Betatorquevirus,Anelloviridae,93678 -Mammarenavirus chapareense,Mammarenavirus chapareense,Mammarenavirus,Arenaviridae,3052302 -Mammarenavirus lujoense,Mammarenavirus lujoense,Mammarenavirus,Arenaviridae,3052314 -Astrovirus MLB2,Astrovirus MLB2,,Astroviridae,683172 -Astrovirus MLB3,Astrovirus MLB3,,Astroviridae,1247114 -Astrovirus VA1,Mamastrovirus 9,Mamastrovirus,Astroviridae,645687 -Astrovirus VA3,Astrovirus VA3,,Astroviridae,683174 -Astrovirus VA4,Astrovirus VA4,,Astroviridae,1247113 -Bastrovirus 7,Bastrovirus BAS-1,,Astroviridae,1803394 -HMO Astrovirus A,HMO Astrovirus A,Mamastrovirus,Astroviridae,682382 -Human astrovirus BF34,Burkina Faso astrovirus,Mamastrovirus,Astroviridae,1518575 -Norovirus GI,Norwalk virus,Norovirus,Caliciviridae,122928 -Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866,Norwalk virus,Norovirus,Caliciviridae,1529909 -Norovirus GII,Norwalk virus,Norovirus,Caliciviridae,122929 -Norovirus GII.17,Norwalk virus,Norovirus,Caliciviridae,552592 -Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299,Norwalk virus,Norovirus,Caliciviridae,1529918 -Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS,Norwalk virus,Norovirus,Caliciviridae,1529924 -Norovirus GIV,Norwalk virus,Norovirus,Caliciviridae,262897 -Sapovirus Hu/GI/Sapporo/MT-2010/1982,Sapporo virus,Sapovirus,Caliciviridae,758863 -Cyclovirus NG12,Cyclovirus mmadu,Cyclovirus,Circoviridae,742922 -Cyclovirus NG14,Cyclovirus mutum,Cyclovirus,Circoviridae,742923 -Cyclovirus PK5006,Cyclovirus insaan,Cyclovirus,Circoviridae,742915 -Cyclovirus PK5034,Cyclovirus homa,Cyclovirus,Circoviridae,742916 -Cyclovirus PK5222,Cyclovirus manukha,Cyclovirus,Circoviridae,742917 -Cyclovirus PK5510,Cyclovirus maanav,Cyclovirus,Circoviridae,742918 -Cyclovirus SL-108277,Cyclovirus manitan,Cyclovirus,Circoviridae,1520935 -Cyclovirus TN25,Cyclovirus bashri,Cyclovirus,Circoviridae,742924 -Cyclovirus VN,Cyclovirus nhanloai,Cyclovirus,Circoviridae,1348500 -Human associated cyclovirus 10,Cyclovirus humana,Cyclovirus,Circoviridae,2038728 -Human circovirus VS6600022,Human circovirus VS6600022,Circovirus,Circoviridae,1525173 -Human cyclovirus VS5700009,Cyclovirus munthu,Cyclovirus,Circoviridae,1345637 -Human fecal virus Jorvi2,Human fecal virus Jorvi2,,Circoviridae,2017081 -Human fecal virus Jorvi3,Human fecal virus Jorvi3,,Circoviridae,2017082 -Human fecal virus Jorvi4,Human fecal virus Jorvi4,,Circoviridae,2017083 -Human PoSCV5-like circular virus,Human PoSCV5-like circular virus,,Circoviridae,1965018 -Human stool-associated circular virus NG13,Circovirus eniyan,Circovirus,Circoviridae,743300 -Indian encephalitis associated cyclovirus,Cyclovirus manusyan,Cyclovirus,Circoviridae,1755290 -Betacoronavirus England 1,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1263720 -Human coronavirus HKU1,Human coronavirus HKU1,Betacoronavirus,Coronaviridae,290028 -Middle East respiratory syndrome-related coronavirus,Middle East respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,1335626 -SARS coronavirus Tor2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,227984 -Severe acute respiratory syndrome coronavirus 2,Severe acute respiratory syndrome-related coronavirus,Betacoronavirus,Coronaviridae,2697049 -Bundibugyo ebolavirus,Orthoebolavirus bundibugyoense,Orthoebolavirus,Filoviridae,565995 -Orthomarburgvirus marburgense,Orthomarburgvirus marburgense,Orthomarburgvirus,Filoviridae,3052505 -Sudan ebolavirus,Orthoebolavirus sudanense,Orthoebolavirus,Filoviridae,186540 -Tai Forest ebolavirus,Orthoebolavirus taiense,Orthoebolavirus,Filoviridae,186541 -Hepacivirus platyrrhini,Hepacivirus platyrrhini,Hepacivirus,Flaviviridae,3052236 -Hepatitis C virus genotype 3,Hepacivirus hominis,Hepacivirus,Flaviviridae,356114 -Hepatitis C virus genotype 4,Hepacivirus hominis,Hepacivirus,Flaviviridae,33745 -Hepatitis C virus genotype 5,Hepacivirus hominis,Hepacivirus,Flaviviridae,33746 -Hepatitis C virus genotype 7,Hepacivirus hominis,Hepacivirus,Flaviviridae,1544901 -Human hepegivirus,Pegivirus columbiaense,Pegivirus,Flaviviridae,1704090 -Human pegivirus 2,Pegivirus columbiaense,Pegivirus,Flaviviridae,1729141 -Zika virus,Orthoflavivirus zikaense,Orthoflavivirus,Flaviviridae,64320 -Gemycircularvirus C1c,Gemykibivirus humas3,Gemykibivirus,Genomoviridae,1673681 -Gemycircularvirus HV-GcV1,Gemycircularvirus HV-GcV1,Gemycircularvirus,Genomoviridae,1862824 -Gemycircularvirus HV-GcV2,Gemykibivirus humas5,Gemykibivirus,Genomoviridae,1862825 -Gemycircularvirus sp.,Gemycircularvirus sp.,Gemycircularvirus,Genomoviridae,1983771 -Human associated gemyvongvirus 1,Gemyvongvirus humas1,Gemyvongvirus,Genomoviridae,1985415 -Human gemycircularvirus GeTz1,Gemykibivirus humas4,Gemykibivirus,Genomoviridae,1792832 -Human genital-associated circular DNA virus-1,Gemygorvirus sewopo1,Gemygorvirus,Genomoviridae,1488574 -Orthohantavirus sinnombreense,Orthohantavirus sinnombreense,Orthohantavirus,Hantaviridae,3052499 -Rubella virus,Rubivirus rubellae,Rubivirus,Matonaviridae,11041 -Beiji nairovirus,Beiji nairovirus,Orthonairovirus,Nairoviridae,2304647 -Songling virus,Songling virus,Orthonairovirus,Nairoviridae,2795181 -Yezo virus,Yezo virus,Orthonairovirus,Nairoviridae,2825847 -Human alphaherpesvirus 2,Simplexvirus humanalpha2,Simplexvirus,Orthoherpesviridae,10310 -Human alphaherpesvirus 3,Varicellovirus humanalpha3,Varicellovirus,Orthoherpesviridae,10335 -Human betaherpesvirus 5,Cytomegalovirus humanbeta5,Cytomegalovirus,Orthoherpesviridae,10359 -Human betaherpesvirus 6A,Roseolovirus humanbeta6a,Roseolovirus,Orthoherpesviridae,32603 -Human betaherpesvirus 6B,Roseolovirus humanbeta6b,Roseolovirus,Orthoherpesviridae,32604 -Human betaherpesvirus 7,Roseolovirus humanbeta7,Roseolovirus,Orthoherpesviridae,10372 -human gammaherpesvirus 4,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,10376 -Human gammaherpesvirus 8,Rhadinovirus humangamma8,Rhadinovirus,Orthoherpesviridae,37296 -Human herpesvirus 4 type 2,Lymphocryptovirus humangamma4,Lymphocryptovirus,Orthoherpesviridae,12509 -Influenza A virus (A/California/07/2009(H1N1)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,641809 -Influenza A virus (A/New York/392/2004(H3N2)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,335341 -Influenza A virus (A/Shanghai/02/2013(H7N9)),Alphainfluenzavirus influenzae,Alphainfluenzavirus,Orthomyxoviridae,1332244 -Gammapapillomavirus sp.,Gammapapillomavirus sp.,Gammapapillomavirus,Papillomaviridae,2049444 -Human papillomavirus,Human papillomavirus,,Papillomaviridae,10566 -Human papillomavirus 116,Gammapapillomavirus 9,Gammapapillomavirus,Papillomaviridae,915428 -Human papillomavirus 121,Gammapapillomavirus 10,Gammapapillomavirus,Papillomaviridae,915429 -Human papillomavirus 126,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1055684 -Human papillomavirus 127,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,746832 -Human papillomavirus 132,Gammapapillomavirus 12,Gammapapillomavirus,Papillomaviridae,909331 -Human papillomavirus 134,Gammapapillomavirus 7,Gammapapillomavirus,Papillomaviridae,909333 -Human papillomavirus 135,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1070408 -Human papillomavirus 136,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070409 -Human papillomavirus 140,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1070413 -Human papillomavirus 154,Gammapapillomavirus 11,Gammapapillomavirus,Papillomaviridae,1195796 -human papillomavirus 166,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315259 -Human papillomavirus 167,Gammapapillomavirus 21,Gammapapillomavirus,Papillomaviridae,1420545 -Human papillomavirus 172,Gammapapillomavirus 22,Gammapapillomavirus,Papillomaviridae,1434987 -Human papillomavirus 175,Gammapapillomavirus 23,Gammapapillomavirus,Papillomaviridae,1434782 -Human papillomavirus 178,Gammapapillomavirus 24,Gammapapillomavirus,Papillomaviridae,1478160 -Human papillomavirus 179,Gammapapillomavirus 15,Gammapapillomavirus,Papillomaviridae,1472342 -Human papillomavirus 184,Gammapapillomavirus 25,Gammapapillomavirus,Papillomaviridae,1472343 -Human papillomavirus 187,Gammapapillomavirus 26,Gammapapillomavirus,Papillomaviridae,1851130 -Human papillomavirus 201,Gammapapillomavirus 27,Gammapapillomavirus,Papillomaviridae,1682340 -Human papillomavirus 204,Mupapillomavirus 3,Mupapillomavirus,Papillomaviridae,1650736 -Human papillomavirus KC5,Human papillomavirus KC5,Gammapapillomavirus,Papillomaviridae,1647924 -Human papillomavirus type 161,Gammapapillomavirus 19,Gammapapillomavirus,Papillomaviridae,1315264 -Human papillomavirus type 85,Human papillomavirus type 85,,Papillomaviridae,652810 -Sosuga virus,Pararubulavirus sosugaense,Pararubulavirus,Paramyxoviridae,1452514 -Bocaparvovirus primate1,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,3052040 -Bufavirus-3,Bufavirus-3,,Parvoviridae,1391667 -Cutavirus,Protoparvovirus primate3,Protoparvovirus,Parvoviridae,1867125 -Human bocavirus 2c PK,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511882 -Human bocavirus 3,Bocaparvovirus primate1,Bocaparvovirus,Parvoviridae,638313 -Human bocavirus 4 NI,Bocaparvovirus primate2,Bocaparvovirus,Parvoviridae,1511883 -Human erythrovirus V9,Human erythrovirus V9,Erythroparvovirus,Parvoviridae,72197 -Human parvovirus 4 G1,Tetraparvovirus primate1,Tetraparvovirus,Parvoviridae,1511919 -Parvovirus NIH-CQV,Parvovirus NIH-CQV,,Parvoviridae,1341019 -Orthobunyavirus bwambaense,Orthobunyavirus bwambaense,Orthobunyavirus,Peribunyaviridae,3052384 -Catu virus,Orthobunyavirus catuense,Orthobunyavirus,Peribunyaviridae,1678225 -Fort Sherman virus,Orthobunyavirus shermanense,Orthobunyavirus,Peribunyaviridae,273345 -Guaroa virus,Orthobunyavirus guaroaense,Orthobunyavirus,Peribunyaviridae,80941 -Ilesha virus,Orthobunyavirus ileshaense,Orthobunyavirus,Peribunyaviridae,273341 -Madrid virus,Orthobunyavirus madridense,Orthobunyavirus,Peribunyaviridae,348013 -Alenquer virus,Phlebovirus alenquerense,Phlebovirus,Phenuiviridae,629726 -Chandiru virus,Phlebovirus candiruense,Phlebovirus,Phenuiviridae,629725 -Cocle virus,Phlebovirus cocleense,Phlebovirus,Phenuiviridae,1649829 -Dar es Salaam virus TZ-189,Tanzavirus daressalaamense,Tanzavirus,Phenuiviridae,2576944 -Echarate virus,Phlebovirus echarateense,Phlebovirus,Phenuiviridae,1000646 -Heartland virus,Bandavirus heartlandense,Bandavirus,Phenuiviridae,1216928 -Maldonado virus,Phlebovirus maldonadoense,Phlebovirus,Phenuiviridae,1004889 -Punta Toro virus,Phlebovirus toroense,Phlebovirus,Phenuiviridae,11587 -Sandfly fever Turkey virus,Phlebovirus siciliaense,Phlebovirus,Phenuiviridae,688699 -Severe fever with thrombocytopenia virus,Bandavirus dabieense,Bandavirus,Phenuiviridae,1003835 -SFTS virus HB29,Bandavirus dabieense,Bandavirus,Phenuiviridae,992212 -aichivirus A1,Aichivirus A,Kobuvirus,Picornaviridae,1313215 -Cosavirus A,Cosavirus A,Cosavirus,Picornaviridae,1330491 -Cosavirus D,Cosavirus D,Cosavirus,Picornaviridae,2003650 -Cosavirus E,Cosavirus E,Cosavirus,Picornaviridae,2003651 -Cosavirus F,Cosavirus F,Cosavirus,Picornaviridae,2003652 -Cosavirus JMY-2014,Cosavirus JMY-2014,Cosavirus,Picornaviridae,1582094 -Coxsackievirus B3,Enterovirus B,Enterovirus,Picornaviridae,12072 -enterovirus A114,Enterovirus A,Enterovirus,Picornaviridae,2760809 -Human cosavirus,Human cosavirus,Cosavirus,Picornaviridae,1233383 -Human cosavirus B,Cosavirus B,Cosavirus,Picornaviridae,586420 -rosavirus A2,Rosavirus A,Rosavirus,Picornaviridae,1511807 -Salivirus A,Salivirus A,Salivirus,Picornaviridae,1330524 -Salivirus FHB,Salivirus FHB,Salivirus,Picornaviridae,1547495 -Salivirus NG-J1,Salivirus A,Salivirus,Picornaviridae,651733 -Human polyomavirus 6,Deltapolyomavirus sextihominis,Deltapolyomavirus,Polyomaviridae,746830 -Human polyomavirus 7,Deltapolyomavirus septihominis,Deltapolyomavirus,Polyomaviridae,746831 -Human polyomavirus 9,Alphapolyomavirus nonihominis,Alphapolyomavirus,Polyomaviridae,943908 -LI polyomavirus,Alphapolyomavirus quardecihominis,Alphapolyomavirus,Polyomaviridae,1965344 -Merkel cell polyomavirus,Alphapolyomavirus quintihominis,Alphapolyomavirus,Polyomaviridae,493803 -MW polyomavirus,Deltapolyomavirus decihominis,Deltapolyomavirus,Polyomaviridae,1203539 -New Jersey polyomavirus-2013,Alphapolyomavirus terdecihominis,Alphapolyomavirus,Polyomaviridae,1497391 -STL polyomavirus,Deltapolyomavirus undecihominis,Deltapolyomavirus,Polyomaviridae,1277649 -Trichodysplasia spinulosa-associated polyomavirus,Alphapolyomavirus octihominis,Alphapolyomavirus,Polyomaviridae,862909 -Akhmeta virus,Akhmeta virus,Orthopoxvirus,Poxviridae,2200830 -Monkeypox virus,Monkeypox virus,Orthopoxvirus,Poxviridae,10244 -NY_014 poxvirus,NY_014 poxvirus,Centapoxvirus,Poxviridae,2025360 -Human lung-associated vientovirus FB,Vientovirus,Torbevirus,Redondoviridae,2571082 -Central cimpanzee simian foamy virus,Central cimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170194 -Eastern chimpanzee simian foamy virus,Eastern chimpanzee simian foamy virus,Simiispumavirus,Retroviridae,2170195 -Guenon simian foamy virus,Guenon simian foamy virus,Simiispumavirus,Retroviridae,2170197 -Human endogenous retrovirus K113,Human endogenous retrovirus K,,Retroviridae,166122 -Human immunodeficiency virus 1,Human immunodeficiency virus 1,Lentivirus,Retroviridae,11676 -Human immunodeficiency virus 2,Human immunodeficiency virus 2,Lentivirus,Retroviridae,11709 -Human T-lymphotropic virus 4,Human T-lymphotropic virus 4,Deltaretrovirus,Retroviridae,318279 -Tibrovirus congo,Tibrovirus congo,Tibrovirus,Rhabdoviridae,1987017 -Chandipura virus,Vesiculovirus chandipura,Vesiculovirus,Rhabdoviridae,11272 -Lyssavirus duvenhage,Lyssavirus duvenhage,Lyssavirus,Rhabdoviridae,38767 -Ekpoma virus 1,Tibrovirus alphaekpoma,Tibrovirus,Rhabdoviridae,1987020 -Ekpoma virus 2,Tibrovirus betaekpoma,Tibrovirus,Rhabdoviridae,1987021 -European bat lyssavirus 2,Lyssavirus helsinki,Lyssavirus,Rhabdoviridae,57483 -Le Dantec virus,Ledantevirus ledantec,Ledantevirus,Rhabdoviridae,318848 -Mundri virus,Mundri virus,,Rhabdoviridae,2913478 -Lebombo virus,Lebombo virus,Orbivirus,Sedoreoviridae,40057 -Orungo virus,Orungo virus,Orbivirus,Sedoreoviridae,40058 -Human associated huchismacovirus 1,Human associated huchismacovirus 1,Huchismacovirus,Smacoviridae,2169934 -Human associated huchismacovirus 2,Human associated huchismacovirus 2,Huchismacovirus,Smacoviridae,2169935 -Human associated huchismacovirus 3,Human associated huchismacovirus 3,Huchismacovirus,Smacoviridae,2169936 -Human associated porprismacovirus,Inpeasmacovirus humas1,Inpeasmacovirus,Smacoviridae,2530494 -Human associated porprismacovirus 3,Porprismacovirus humas4,Porprismacovirus,Smacoviridae,2496633 -Human feces smacovirus 2,Porprismacovirus humas1,Porprismacovirus,Smacoviridae,1820158 -Human feces smacovirus 3,Porprismacovirus humas3,Porprismacovirus,Smacoviridae,1820159 -Human smacovirus 1,Human smacovirus 1,Huchismacovirus,Smacoviridae,1595998 -Mammalian orthoreovirus 3 Dearing,Mammalian orthoreovirus,Orthoreovirus,Spinareoviridae,10886 -Ross River virus,Ross River virus,Alphavirus,Togaviridae,11029 -Circo-like virus-Brazil hs1,Circo-like virus-Brazil,,,1346815 -Hudisavirus sp.,Hudisavirus sp.,,,2021738 -West Nile virus strain NY-99,West Nile virus,Flavivirus,Flaviviridae,1968826 -BK polyomavirus MM,BK polyomavirus,Betapolyomavirus,Polyomaviridae,1417981 -Banana virus X,Banna virus,Bannavirus,Reoviridae,307671 -Bombali virus,Ebolavirus,Ebolavirus,Filoviridae,2010960 -Bourbon virus,Bourbon virus,Thogotovirus,Orthomyxoviridae,1618189 -Dhori virus (strain Indian/1313/61),Dhori virus,Thogotovirus,Orthomyxoviridae,11319 -Encephalomyocarditis virus,Encephalomyocarditis virus,Cardiovirus,Picornaviridae,12104 -Eyach virus,Eyach virus,Coltivirus,Reoviridae,62352 -Henipavirus hendraense,Hendra virus,Henipavirus,Paramyxoviridae,3052223 -Henipavirus nipahense,Nipah virus,Henipavirus,Paramyxoviridae,3052225 -Hepatitis B virus,Hepatitis B virus,Orthohepadnavirus,Hepadnaviridae,10407 -Hepatitis delta virus,Hepatitis delta virus,Deltavirus,Deltaflexiviridae,12475 -Hepatovirus A,Hepatitis A virus,Hepatovirus,Picornaviridae,12092 -Human foamy virus,Human foamy virus,Spumavirus,Retroviridae,11641 -human metapneumovirus,Human metapneumovirus,Metapneumovirus,Paramyxoviridae,162145 -Human orthorubulavirus 2,Human orthorubulavirus 2,Orthorubulavirus,Paramyxoviridae,2560525 -Human papillomavirus,Human papillomavirus,Papillomavirus,Papillomaviridae,10566 -Betapolyomavirus tertihominis,KI Polyomavirus,Betapolyomavirus,Polyomaviridae,1891764 -Human respirovirus 1,Human Respirovirus 1,Respirovirus,Paramyxoviridae,12730 -Human respirovirus 3,Human Respirovirus 3,Respirovirus,Paramyxoviridae,11216 -Human torovirus,Human torovirus,Torovirus,Toroviridae,67605 -Influenza B virus (B/Lee/1940),Influenza B virus,Betainfluenzavirus,Orthomyxoviridae,518987 -Influenza C virus (C/Ann Arbor/1/50),Influenza C virus,Gammainfluenzavirus,Orthomyxoviridae,11553 -Japanese encephalitis virus,Japanese encephalitis virus,Flavivirus,Flaviviridae,11072 -Measles morbillivirus,Morbillivirus,Morbillivirus,Paramyxoviridae,11234 -Merkel cell polyomavirus,Merkel cell polyomavirus,Orthopolyomavirus,Polyomaviridae,493803 -Molluscum contagiosum virus subtype 1,Molluscum contagiosum virus,Molluscipoxvirus,Poxviridae,10280 -Mumps orthorubulaviru,Mumps virus,Orthorubulavirus,Paramyxoviridae,2560602 -Murray Valley encephalitis virus,Murray valley encephalitis virus,Flavivirus,Flaviviridae,11079 -Orf virus,Orf virus,Parapoxvirus,Poxviridae,10258 -Orthomarburgvirus marburgense,Lake Victoria marburgvirus,Marburgvirus,Filoviridae,3052505 -Rotavirus A,Rotavirus A,Rotavirus,Reoviridae,28875 -Rotavirus C,Rotavirus C,Rotavirus,Reoviridae,36427 -St. Louis encephalitis virus,Saint Louis encephalitis virus,Flavivirus,Flaviviridae,11080 -Thogotovirus,Thogotovirus,Thogotovirus,Orthomyxoviridae,35323 -Tick-borne encephalitis virus,Tick-borne encephalitis virus,Flavivirus,Flaviviridae,11084 -Torque teno virus 6,Torque teno virus,Anellovirus,Anelloviridae,687345 -WU Polyomavirus,WU polyomavirus,Betapolyomavirus,Polyomaviridae,440266 -Yaba monkey tumor virus,Yaba monkey tumor virus,Yatapoxvirus,Poxviridae,38804 -Yaba-like disease virus,Yaba-like disease virus,Yatapoxvirus,Poxviridae,132475 -Zika virus,Zika virus,Flavivirus,Flaviviridae,64320 -dengue virus type 1,Dengue virus,Flavivirus,Flaviviridae,11053 +Organism_Name;Species;Genus;Family;Taxid;Notes +Human mastadenovirus A;Human mastadenovirus A;Mastadenovirus;Adenoviridae;129875; +Human mastadenovirus B;Human mastadenovirus B;Mastadenovirus;Adenoviridae;108098; +Human mastadenovirus C;Human mastadenovirus C;Mastadenovirus;Adenoviridae;129951; +Human mastadenovirus D;Human mastadenovirus D;Mastadenovirus;Adenoviridae;130310; +Human mastadenovirus E;Human mastadenovirus E;Mastadenovirus;Adenoviridae;130308; +human adenovirus 52;Human mastadenovirus G;Mastadenovirus;Adenoviridae;332179; +Human mastadenovirus F;Human mastadenovirus F;Mastadenovirus;Adenoviridae;130309; +Lyssavirus rabies;Rabies virus ;Lyssavirus;Alpharhabdovirinae;11292; +Anelloviridae sp.;Anelloviridae sp.;;Anelloviridae;2055263; +Gyrovirus 4;Gyrovirus homsa3;Gyrovirus;Anelloviridae;1214955; +Gyrovirus GyV3;Gyrovirus homsa1;Gyrovirus;Anelloviridae;1163715; +Gyrovirus Tu243;Gyrovirus homsa4;Gyrovirus;Anelloviridae;1415627; +Gyrovirus Tu789;Gyrovirus homsa2;Gyrovirus;Anelloviridae;1415628; +Small anellovirus 1;Small anellovirus;;Anelloviridae;289366; +Small anellovirus 2;Small anellovirus;;Anelloviridae;289367; +Torque teno midi virus 1;Gammatorquevirus homidi1;Gammatorquevirus;Anelloviridae;687379; +Torque teno midi virus 10;Gammatorquevirus homidi10;Gammatorquevirus;Anelloviridae;2065051; +Torque teno midi virus 11;Gammatorquevirus homidi11;Gammatorquevirus;Anelloviridae;2065052; +Torque teno midi virus 12;Gammatorquevirus homidi12;Gammatorquevirus;Anelloviridae;2065053; +Torque teno midi virus 13;Gammatorquevirus homidi13;Gammatorquevirus;Anelloviridae;2065054; +Torque teno midi virus 14;Gammatorquevirus homidi14;Gammatorquevirus;Anelloviridae;2065055; +Torque teno midi virus 2;Gammatorquevirus homidi2;Gammatorquevirus;Anelloviridae;687380; +Torque teno midi virus 3;Gammatorquevirus homidi3;Gammatorquevirus;Anelloviridae;2065044; +Torque teno midi virus 4;Gammatorquevirus homidi4;Gammatorquevirus;Anelloviridae;2065045; +Torque teno midi virus 5;Gammatorquevirus homidi5;Gammatorquevirus;Anelloviridae;2065046; +Torque teno midi virus 6;Gammatorquevirus homidi6;Gammatorquevirus;Anelloviridae;2065047; +Torque teno midi virus 7;Gammatorquevirus homidi7;Gammatorquevirus;Anelloviridae;2065048; +Torque teno midi virus 8;Gammatorquevirus homidi8;Gammatorquevirus;Anelloviridae;2065049; +Torque teno midi virus 9;Gammatorquevirus homidi9;Gammatorquevirus;Anelloviridae;2065050; +Torque teno mini virus 1;Betatorquevirus homini1;Betatorquevirus;Anelloviridae;687369; +Torque teno mini virus 10;Betatorquevirus homini10;Betatorquevirus;Anelloviridae;2065036; +Torque teno mini virus 11;Betatorquevirus homini11;Betatorquevirus;Anelloviridae;2065037; +Torque teno mini virus 12;Betatorquevirus homini12;Betatorquevirus;Anelloviridae;2065038; +Torque teno mini virus 18;Betatorquevirus homini18;Betatorquevirus;Anelloviridae;1859149; +Torque teno mini virus 5;Betatorquevirus homini5;Betatorquevirus;Anelloviridae;687373; +Torque teno mini virus 6;Betatorquevirus homini6;Betatorquevirus;Anelloviridae;687374; +Torque teno mini virus 8;Betatorquevirus homini8;Betatorquevirus;Anelloviridae;687376; +Torque teno mini virus ALA22;Betatorquevirus homini27;Betatorquevirus;Anelloviridae;1535290; +Torque teno mini virus ALH8;Betatorquevirus homini16;Betatorquevirus;Anelloviridae;1535291; +Torque teno mini virus SHA;Betatorquevirus homini26;Betatorquevirus;Anelloviridae;2057931; +Torque teno virus;Torque teno virus;;Anelloviridae;68887; +Torque teno virus 9;Alphatorquevirus homin9;Alphatorquevirus;Anelloviridae;687348; +TTV-like mini virus;TTV-like mini virus;Betatorquevirus;Anelloviridae;93678; +Torque teno virus 6;Torque teno virus;Anellovirus;Anelloviridae;687345; +Mammarenavirus chapareense;Mammarenavirus chapareense;Mammarenavirus;Arenaviridae;3052302; +Mammarenavirus lujoense;Mammarenavirus lujoense;Mammarenavirus;Arenaviridae;3052314; +Mammarenavirus juninense;Mammarenavirus juninense;Mammarenavirus;Arenaviridae;2169991; +Mammarenavirus lassaense;Mammarenavirus lassaense ;Mammarenavirus;Arenaviridae;3052310; +Mammarenavirus choriomeningitidis;Mammarenavirus choriomeningitidis;Mammarenavirus;Arenaviridae;3052303; +Mammarenavirus machupoense;Mammarenavirus machupoense;Mammarenavirus;Arenaviridae;3052317; +Sabia virus;Mammarenavirus brazilense;Mammarenavirus;Arenaviridae;2907957; +Mammarenavirus whitewaterense;Mammarenavirus whitewaterense;Mammarenavirus;Arenaviridae;3052331; +Astrovirus MLB2;Astrovirus MLB2;;Astroviridae;683172; +Astrovirus MLB3;Astrovirus MLB3;;Astroviridae;1247114; +Astrovirus VA1;Mamastrovirus 9;Mamastrovirus;Astroviridae;645687; +Astrovirus VA3;Astrovirus VA3;;Astroviridae;683174; +Astrovirus VA4;Astrovirus VA4;;Astroviridae;1247113; +Bastrovirus 7;Bastrovirus BAS-1;;Astroviridae;1803394; +HMO Astrovirus A;HMO Astrovirus A;Mamastrovirus;Astroviridae;682382; +Human astrovirus BF34;Burkina Faso astrovirus;Mamastrovirus;Astroviridae;1518575; +Borna disease virus 1;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714621; +Borna disease virus 2;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714622; +Norovirus GI;Norwalk virus;Norovirus;Caliciviridae;122928; +Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866;Norwalk virus;Norovirus;Caliciviridae;1529909; +Norovirus GII;Norwalk virus;Norovirus;Caliciviridae;122929; +Norovirus GII.17;Norwalk virus;Norovirus;Caliciviridae;552592; +Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299;Norwalk virus;Norovirus;Caliciviridae;1529918; +Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS;Norwalk virus;Norovirus;Caliciviridae;1529924; +Norovirus GIV;Norwalk virus;Norovirus;Caliciviridae;262897; +Sapovirus Hu/GI/Sapporo/MT-2010/1982;Sapporo virus;Sapovirus;Caliciviridae;758863; +Cyclovirus NG12;Cyclovirus mmadu;Cyclovirus;Circoviridae;742922; +Cyclovirus NG14;Cyclovirus mutum;Cyclovirus;Circoviridae;742923; +Cyclovirus PK5006;Cyclovirus insaan;Cyclovirus;Circoviridae;742915; +Cyclovirus PK5034;Cyclovirus homa;Cyclovirus;Circoviridae;742916; +Cyclovirus PK5222;Cyclovirus manukha;Cyclovirus;Circoviridae;742917; +Cyclovirus PK5510;Cyclovirus maanav;Cyclovirus;Circoviridae;742918; +Cyclovirus SL-108277;Cyclovirus manitan;Cyclovirus;Circoviridae;1520935; +Cyclovirus TN25;Cyclovirus bashri;Cyclovirus;Circoviridae;742924; +Cyclovirus VN;Cyclovirus nhanloai;Cyclovirus;Circoviridae;1348500; +Human associated cyclovirus 10;Cyclovirus humana;Cyclovirus;Circoviridae;2038728; +Human circovirus VS6600022;Human circovirus VS6600022;Circovirus;Circoviridae;1525173; +Human cyclovirus VS5700009;Cyclovirus munthu;Cyclovirus;Circoviridae;1345637; +Human fecal virus Jorvi2;Human fecal virus Jorvi2;;Circoviridae;2017081; +Human fecal virus Jorvi3;Human fecal virus Jorvi3;;Circoviridae;2017082; +Human fecal virus Jorvi4;Human fecal virus Jorvi4;;Circoviridae;2017083; +Human PoSCV5-like circular virus;Human PoSCV5-like circular virus;;Circoviridae;1965018; +Human stool-associated circular virus NG13;Circovirus eniyan;Circovirus;Circoviridae;743300; +Indian encephalitis associated cyclovirus;Cyclovirus manusyan;Cyclovirus;Circoviridae;1755290; +Betacoronavirus England 1;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1263720; +Human coronavirus HKU1;Human coronavirus HKU1;Betacoronavirus;Coronaviridae;290028; +Middle East respiratory syndrome-related coronavirus;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1335626; +SARS coronavirus Tor2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;227984; +Severe acute respiratory syndrome coronavirus 2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;2697049; +Hepatitis delta virus;Hepatitis delta virus;Deltavirus;Deltaflexiviridae;12475; +Bundibugyo ebolavirus;Orthoebolavirus bundibugyoense;Orthoebolavirus;Filoviridae;565995; +Orthomarburgvirus marburgense;Orthomarburgvirus marburgense;Orthomarburgvirus;Filoviridae;3052505; +Sudan ebolavirus;Orthoebolavirus sudanense;Orthoebolavirus;Filoviridae;186540; +Tai Forest ebolavirus;Orthoebolavirus taiense;Orthoebolavirus;Filoviridae;186541; +Bombali virus;Ebolavirus;Ebolavirus;Filoviridae;2010960; +Orthomarburgvirus marburgense;Lake Victoria marburgvirus;Marburgvirus;Filoviridae;3052505; +Hepacivirus platyrrhini;Hepacivirus platyrrhini;Hepacivirus;Flaviviridae;3052236; +Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; +Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; +Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; +Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; +Human hepegivirus;Pegivirus columbiaense;Pegivirus;Flaviviridae;1704090; +Human pegivirus 2;Pegivirus columbiaense;Pegivirus;Flaviviridae;1729141; +Zika virus;Orthoflavivirus zikaense;Orthoflavivirus;Flaviviridae;64320; +West Nile virus strain NY-99;West Nile virus;Flavivirus;Flaviviridae;1968826; +Japanese encephalitis virus;Japanese encephalitis virus;Flavivirus;Flaviviridae;11072; +Murray Valley encephalitis virus;Murray valley encephalitis virus;Flavivirus;Flaviviridae;11079; +St. Louis encephalitis virus;Saint Louis encephalitis virus;Flavivirus;Flaviviridae;11080; +Tick-borne encephalitis virus;Tick-borne encephalitis virus;Flavivirus;Flaviviridae;11084; +Zika virus;Zika virus;Flavivirus;Flaviviridae;64320; +dengue virus type 1; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11053; +dengue virus type 2; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11060; +dengue virus type 3; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11069; +dengue virus type 4; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11070; +Hepatitis C virus genotype 1;Hepacivirus hominis;Hepacivirus;Flaviviridae;41856; +"Hepatitis C virus genotype 2 strain=HC-J6CH";Hepacivirus hominis;Hepacivirus;Flaviviridae;40271; +Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; +Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; +Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; +Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; +Gemycircularvirus C1c;Gemykibivirus humas3;Gemykibivirus;Genomoviridae;1673681; +Gemycircularvirus HV-GcV1;Gemycircularvirus HV-GcV1;Gemycircularvirus;Genomoviridae;1862824; +Gemycircularvirus HV-GcV2;Gemykibivirus humas5;Gemykibivirus;Genomoviridae;1862825; +Gemycircularvirus sp.;Gemycircularvirus sp.;Gemycircularvirus;Genomoviridae;1983771; +Human associated gemyvongvirus 1;Gemyvongvirus humas1;Gemyvongvirus;Genomoviridae;1985415; +Human gemycircularvirus GeTz1;Gemykibivirus humas4;Gemykibivirus;Genomoviridae;1792832; +Human genital-associated circular DNA virus-1;Gemygorvirus sewopo1;Gemygorvirus;Genomoviridae;1488574; +Orthohantavirus sinnombreense;Orthohantavirus sinnombreense;Orthohantavirus;Hantaviridae;3052499; +Hepatitis B virus;Hepatitis B virus;Orthohepadnavirus;Hepadnaviridae;10407; +Hepatitis E virus rat/R63/DEU/2009;Rocahepevirus ratti ;Orthohepevirinae;Hepeviridae;879096;Human Hepatitis E virus doesn't have complete genome +Rubella virus;Rubivirus rubellae;Rubivirus;Matonaviridae;11041; +Beiji nairovirus;Beiji nairovirus;Orthonairovirus;Nairoviridae;2304647; +Songling virus;Songling virus;Orthonairovirus;Nairoviridae;2795181; +Yezo virus;Yezo virus;Orthonairovirus;Nairoviridae;2825847; +Human alphaherpesvirus 1;implexvirus humanalpha1;Simplexvirus;Orthoherpesviridae;10298; +Human alphaherpesvirus 2;Simplexvirus humanalpha2;Simplexvirus;Orthoherpesviridae;10310; +Human alphaherpesvirus 3;Varicellovirus humanalpha3;Varicellovirus;Orthoherpesviridae;10335; +Human betaherpesvirus 5;Cytomegalovirus humanbeta5;Cytomegalovirus;Orthoherpesviridae;10359; +Human betaherpesvirus 6A;Roseolovirus humanbeta6a;Roseolovirus;Orthoherpesviridae;32603; +Human betaherpesvirus 6B;Roseolovirus humanbeta6b;Roseolovirus;Orthoherpesviridae;32604; +Human betaherpesvirus 7;Roseolovirus humanbeta7;Roseolovirus;Orthoherpesviridae;10372; +human gammaherpesvirus 4;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;10376; +Human gammaherpesvirus 8;Rhadinovirus humangamma8;Rhadinovirus;Orthoherpesviridae;37296; +Human herpesvirus 4 type 2;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;12509; +Influenza A virus (A/California/07/2009(H1N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;641809; +Influenza A virus (A/Korea/426/1968(H2N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;488241; +Influenza A virus (A/New York/392/2004(H3N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;335341; +Influenza A virus (A/goose/Guangdong/1/1996(H5N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;93838; +Influenza A virus (A/chicken/Mexico/23-12/2012(H5N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1399123;No complete genome +Influenza A virus (A/Shanghai/02/2013(H7N9));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1332244; +Influenza A virus (A/Hong Kong/1073/99(H9N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;130760; +Influenza B virus (B/Lee/1940);Influenza B virus;Betainfluenzavirus;Orthomyxoviridae;518987; +Influenza C virus (C/Ann Arbor/1/50);Influenza C virus;Gammainfluenzavirus;Orthomyxoviridae;11553; +Influenza D virus (D/swine/Oklahoma/1334/2011);Influenza D virus;Deltainfluenzavirus;Orthomyxoviridae;1173138; +Bourbon virus;Bourbon virus;Thogotovirus;Orthomyxoviridae;1618189; +Dhori virus (strain Indian/1313/61);Dhori virus;Thogotovirus;Orthomyxoviridae;11319; +Thogotovirus;Thogotovirus;Thogotovirus;Orthomyxoviridae;35323; +Gammapapillomavirus sp.;Gammapapillomavirus sp.;Gammapapillomavirus;Papillomaviridae;2049444; +Human papillomavirus;Human papillomavirus;;Papillomaviridae;10566; +Human papillomavirus 116;Gammapapillomavirus 9;Gammapapillomavirus;Papillomaviridae;915428; +Human papillomavirus 121;Gammapapillomavirus 10;Gammapapillomavirus;Papillomaviridae;915429; +Human papillomavirus 126;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1055684; +Human papillomavirus 127;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;746832; +Human papillomavirus 132;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;909331; +Human papillomavirus 134;Gammapapillomavirus 7;Gammapapillomavirus;Papillomaviridae;909333; +Human papillomavirus 135;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1070408; +Human papillomavirus 136;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070409; +Human papillomavirus 140;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070413; +Human papillomavirus 154;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1195796; +human papillomavirus 166;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315259; +Human papillomavirus 167;Gammapapillomavirus 21;Gammapapillomavirus;Papillomaviridae;1420545; +Human papillomavirus 172;Gammapapillomavirus 22;Gammapapillomavirus;Papillomaviridae;1434987; +Human papillomavirus 175;Gammapapillomavirus 23;Gammapapillomavirus;Papillomaviridae;1434782; +Human papillomavirus 178;Gammapapillomavirus 24;Gammapapillomavirus;Papillomaviridae;1478160; +Human papillomavirus 179;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1472342; +Human papillomavirus 184;Gammapapillomavirus 25;Gammapapillomavirus;Papillomaviridae;1472343; +Human papillomavirus 187;Gammapapillomavirus 26;Gammapapillomavirus;Papillomaviridae;1851130; +Human papillomavirus 201;Gammapapillomavirus 27;Gammapapillomavirus;Papillomaviridae;1682340; +Human papillomavirus 204;Mupapillomavirus 3;Mupapillomavirus;Papillomaviridae;1650736; +Human papillomavirus KC5;Human papillomavirus KC5;Gammapapillomavirus;Papillomaviridae;1647924; +Human papillomavirus type 161;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315264; +Human papillomavirus type 85;Human papillomavirus type 85;;Papillomaviridae;652810; +Human papillomavirus;Human papillomavirus;Papillomavirus;Papillomaviridae;10566; +Sosuga virus;Pararubulavirus sosugaense;Pararubulavirus;Paramyxoviridae;1452514; +Henipavirus hendraense;Hendra virus;Henipavirus;Paramyxoviridae;3052223; +Henipavirus nipahense;Nipah virus;Henipavirus;Paramyxoviridae;3052225; +human metapneumovirus;Human metapneumovirus;Metapneumovirus;Paramyxoviridae;162145; +Human orthorubulavirus 2;Human orthorubulavirus 2;Orthorubulavirus;Paramyxoviridae;2560525; +Human respirovirus 1;Human Respirovirus 1;Respirovirus;Paramyxoviridae;12730; +Human respirovirus 3;Human Respirovirus 3;Respirovirus;Paramyxoviridae;11216; +Measles morbillivirus;Morbillivirus;Morbillivirus;Paramyxoviridae;11234; +Mumps orthorubulaviru;Mumps virus;Orthorubulavirus;Paramyxoviridae;2560602; +Bocaparvovirus primate1;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;3052040; +Bufavirus-3;Bufavirus-3;;Parvoviridae;1391667; +Cutavirus;Protoparvovirus primate3;Protoparvovirus;Parvoviridae;1867125; +Human bocavirus 2c PK;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511882; +Human bocavirus 3;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;638313; +Human bocavirus 4 NI;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511883; +Human erythrovirus V9;Human erythrovirus V9;Erythroparvovirus;Parvoviridae;72197; +Human parvovirus 4 G1;Tetraparvovirus primate1;Tetraparvovirus;Parvoviridae;1511919; +Parvovirus NIH-CQV;Parvovirus NIH-CQV;;Parvoviridae;1341019; +Orthobunyavirus bwambaense;Orthobunyavirus bwambaense;Orthobunyavirus;Peribunyaviridae;3052384; +California encephalitis virus;Orthobunyavirus;Orthobunyavirus ;Peribunyaviridae;35305; +Catu virus;Orthobunyavirus catuense;Orthobunyavirus;Peribunyaviridae;1678225; +Fort Sherman virus;Orthobunyavirus shermanense;Orthobunyavirus;Peribunyaviridae;273345; +Guaroa virus;Orthobunyavirus guaroaense;Orthobunyavirus;Peribunyaviridae;80941; +Ilesha virus;Orthobunyavirus ileshaense;Orthobunyavirus;Peribunyaviridae;273341; +Madrid virus;Orthobunyavirus madridense;Orthobunyavirus;Peribunyaviridae;348013; +Alenquer virus;Phlebovirus alenquerense;Phlebovirus;Phenuiviridae;629726; +Chandiru virus;Phlebovirus candiruense;Phlebovirus;Phenuiviridae;629725; +Cocle virus;Phlebovirus cocleense;Phlebovirus;Phenuiviridae;1649829; +Dar es Salaam virus TZ-189;Tanzavirus daressalaamense;Tanzavirus;Phenuiviridae;2576944; +Echarate virus;Phlebovirus echarateense;Phlebovirus;Phenuiviridae;1000646; +Heartland virus;Bandavirus heartlandense;Bandavirus;Phenuiviridae;1216928; +Maldonado virus;Phlebovirus maldonadoense;Phlebovirus;Phenuiviridae;1004889; +Punta Toro virus;Phlebovirus toroense;Phlebovirus;Phenuiviridae;11587; +Sandfly fever Turkey virus;Phlebovirus siciliaense;Phlebovirus;Phenuiviridae;688699; +Severe fever with thrombocytopenia virus;Bandavirus dabieense;Bandavirus;Phenuiviridae;1003835; +SFTS virus HB29;Bandavirus dabieense;Bandavirus;Phenuiviridae;992212; +aichivirus A1;Aichivirus A;Kobuvirus;Picornaviridae;1313215; +Cosavirus A;Cosavirus A;Cosavirus;Picornaviridae;1330491; +Cosavirus D;Cosavirus D;Cosavirus;Picornaviridae;2003650; +Cosavirus E;Cosavirus E;Cosavirus;Picornaviridae;2003651; +Cosavirus F;Cosavirus F;Cosavirus;Picornaviridae;2003652; +Cosavirus JMY-2014;Cosavirus JMY-2014;Cosavirus;Picornaviridae;1582094; +Coxsackievirus B3;Enterovirus B;Enterovirus;Picornaviridae;12072; +enterovirus A114;Enterovirus A;Enterovirus;Picornaviridae;2760809; +Human cosavirus;Human cosavirus;Cosavirus;Picornaviridae;1233383; +Human cosavirus B;Cosavirus B;Cosavirus;Picornaviridae;586420; +rosavirus A2;Rosavirus A;Rosavirus;Picornaviridae;1511807; +Salivirus A;Salivirus A;Salivirus;Picornaviridae;1330524; +Salivirus FHB;Salivirus FHB;Salivirus;Picornaviridae;1547495; +Salivirus NG-J1;Salivirus A;Salivirus;Picornaviridae;651733; +Encephalomyocarditis virus;Encephalomyocarditis virus;Cardiovirus;Picornaviridae;12104; +Hepatovirus A;Hepatitis A virus;Hepatovirus;Picornaviridae;12092; +Human polyomavirus 6;Deltapolyomavirus sextihominis;Deltapolyomavirus;Polyomaviridae;746830; +Human polyomavirus 7;Deltapolyomavirus septihominis;Deltapolyomavirus;Polyomaviridae;746831; +Human polyomavirus 9;Alphapolyomavirus nonihominis;Alphapolyomavirus;Polyomaviridae;943908; +LI polyomavirus;Alphapolyomavirus quardecihominis;Alphapolyomavirus;Polyomaviridae;1965344; +Merkel cell polyomavirus;Alphapolyomavirus quintihominis;Alphapolyomavirus;Polyomaviridae;493803; +MW polyomavirus;Deltapolyomavirus decihominis;Deltapolyomavirus;Polyomaviridae;1203539; +New Jersey polyomavirus-2013;Alphapolyomavirus terdecihominis;Alphapolyomavirus;Polyomaviridae;1497391; +STL polyomavirus;Deltapolyomavirus undecihominis;Deltapolyomavirus;Polyomaviridae;1277649; +Trichodysplasia spinulosa-associated polyomavirus;Alphapolyomavirus octihominis;Alphapolyomavirus;Polyomaviridae;862909; +BK polyomavirus MM;BK polyomavirus;Betapolyomavirus;Polyomaviridae;1417981; +Betapolyomavirus tertihominis;KI Polyomavirus;Betapolyomavirus;Polyomaviridae;1891764; +Merkel cell polyomavirus;Merkel cell polyomavirus;Orthopolyomavirus;Polyomaviridae;493803; +WU Polyomavirus;WU polyomavirus;Betapolyomavirus;Polyomaviridae;440266; +Akhmeta virus;Akhmeta virus;Orthopoxvirus;Poxviridae;2200830; +Monkeypox virus;Monkeypox virus;Orthopoxvirus;Poxviridae;10244; +NY_014 poxvirus;NY_014 poxvirus;Centapoxvirus;Poxviridae;2025360; +Molluscum contagiosum virus subtype 1;Molluscum contagiosum virus;Molluscipoxvirus;Poxviridae;10280; +Orf virus;Orf virus;Parapoxvirus;Poxviridae;10258; +Yaba monkey tumor virus;Yaba monkey tumor virus;Yatapoxvirus;Poxviridae;38804; +Yaba-like disease virus;Yaba-like disease virus;Yatapoxvirus;Poxviridae;132475; +Human lung-associated vientovirus FB;Vientovirus;Torbevirus;Redondoviridae;2571082; +Banana virus X;Banna virus;Bannavirus;Reoviridae;307671; +Eyach virus;Eyach virus;Coltivirus;Reoviridae;62352; +Rotavirus A;Rotavirus A;Rotavirus;Reoviridae;28875; +Rotavirus C;Rotavirus C;Rotavirus;Reoviridae;36427; +Central cimpanzee simian foamy virus;Central cimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170194; +Eastern chimpanzee simian foamy virus;Eastern chimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170195; +Guenon simian foamy virus;Guenon simian foamy virus;Simiispumavirus;Retroviridae;2170197; +Human endogenous retrovirus K113;Human endogenous retrovirus K;;Retroviridae;166122; +Human immunodeficiency virus 1;Human immunodeficiency virus 1;Lentivirus;Retroviridae;11676; +Human immunodeficiency virus 2;Human immunodeficiency virus 2;Lentivirus;Retroviridae;11709; +Human T-lymphotropic virus 4;Human T-lymphotropic virus 4;Deltaretrovirus;Retroviridae;318279; +Human foamy virus;Human foamy virus;Spumavirus;Retroviridae;11641; +Tibrovirus congo;Tibrovirus congo;Tibrovirus;Rhabdoviridae;1987017; +Chandipura virus;Vesiculovirus chandipura;Vesiculovirus;Rhabdoviridae;11272; +Lyssavirus duvenhage;Lyssavirus duvenhage;Lyssavirus;Rhabdoviridae;38767; +Ekpoma virus 1;Tibrovirus alphaekpoma;Tibrovirus;Rhabdoviridae;1987020; +Ekpoma virus 2;Tibrovirus betaekpoma;Tibrovirus;Rhabdoviridae;1987021; +European bat lyssavirus 2;Lyssavirus helsinki;Lyssavirus;Rhabdoviridae;57483; +Le Dantec virus;Ledantevirus ledantec;Ledantevirus;Rhabdoviridae;318848; +Mundri virus;Mundri virus;;Rhabdoviridae;2913478; +Lebombo virus;Lebombo virus;Orbivirus;Sedoreoviridae;40057; +Orungo virus;Orungo virus;Orbivirus;Sedoreoviridae;40058; +Human associated huchismacovirus 1;Human associated huchismacovirus 1;Huchismacovirus;Smacoviridae;2169934; +Human associated huchismacovirus 2;Human associated huchismacovirus 2;Huchismacovirus;Smacoviridae;2169935; +Human associated huchismacovirus 3;Human associated huchismacovirus 3;Huchismacovirus;Smacoviridae;2169936; +Human associated porprismacovirus;Inpeasmacovirus humas1;Inpeasmacovirus;Smacoviridae;2530494; +Human associated porprismacovirus 3;Porprismacovirus humas4;Porprismacovirus;Smacoviridae;2496633; +Human feces smacovirus 2;Porprismacovirus humas1;Porprismacovirus;Smacoviridae;1820158; +Human feces smacovirus 3;Porprismacovirus humas3;Porprismacovirus;Smacoviridae;1820159; +Human smacovirus 1;Human smacovirus 1;Huchismacovirus;Smacoviridae;1595998; +Mammalian orthoreovirus 3 Dearing;Mammalian orthoreovirus;Orthoreovirus;Spinareoviridae;10886; +Ross River virus;Ross River virus;Alphavirus;Togaviridae;11029; +"Chikungunya virus strain=S27-African prototype";Chikungunya virus;Alphavirus;Togaviridae ;37124; +Human torovirus;Human torovirus;Torovirus;Toroviridae;67605; +Circo-like virus-Brazil hs1;Circo-like virus-Brazil;;;1346815; +Hudisavirus sp.;Hudisavirus sp.;;;2021738; \ No newline at end of file From 25241c0d5a64b91ac816185d17de4f348a7be4f6 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:02:30 +0200 Subject: [PATCH 04/25] Update .nf-core.yml Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- .nf-core.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.nf-core.yml b/.nf-core.yml index 633a8ff..f45d9f7 100644 --- a/.nf-core.yml +++ b/.nf-core.yml @@ -15,7 +15,7 @@ lint: - assets/email_template.html - assets/email_template.txt - docs/README.md - - viral_pathogen_List.csv + - viral_pathogen_list.csv multiqc_config: - report_comment From 87791e4e649905bebefda286ad85c5da71089b18 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:02:53 +0200 Subject: [PATCH 05/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index e1507e0..9077ebf 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -25,7 +25,7 @@ }, "taxid": { "type": "string", - "description": "The taxonomy ID of the species identified in classification results. A list of taxids separated by spaces." + "description": "The taxonomy ID of the species identified in the classification results or a list of taxids separated by spaces." }, "viral_pathogen_genome": { "type": "string", From 2788b9e85adeb10c58c17ac56df552839442c51c Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:22:50 +0200 Subject: [PATCH 06/25] add test_taxid.config and rename the pathogen list name --- .nf-core.yml | 2 +- conf/test_taxid.config | 36 +++++++++++++++++++ ...pathogen_List.csv => viralPathogenList.csv | 0 3 files changed, 37 insertions(+), 1 deletion(-) create mode 100644 conf/test_taxid.config rename viral_pathogen_List.csv => viralPathogenList.csv (100%) diff --git a/.nf-core.yml b/.nf-core.yml index f45d9f7..d55deec 100644 --- a/.nf-core.yml +++ b/.nf-core.yml @@ -15,7 +15,7 @@ lint: - assets/email_template.html - assets/email_template.txt - docs/README.md - - viral_pathogen_list.csv + - viralPathogenList.csv multiqc_config: - report_comment diff --git a/conf/test_taxid.config b/conf/test_taxid.config new file mode 100644 index 0000000..51dce1f --- /dev/null +++ b/conf/test_taxid.config @@ -0,0 +1,36 @@ +/* +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + Nextflow config file for running minimal tests +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + Defines a input taxid list to run a fast and simple pipeline test. + + Use as follows: + nextflow run genomic-medicine-sweden/meta-val -profile test_taxid, --outdir + +---------------------------------------------------------------------------------------- +*/ + +params { + config_profile_name = 'Test profile' + config_profile_description = 'Minimal test dataset to check pipeline function' + + // Limit resources so that this can run on GitHub Actions + max_cpus = 2 + max_memory = '6.GB' + max_time = '6.h' + + // Input data + input = 'assets/samplesheet_v1.csv' + + taxid = '211044 11676' //separated by space + + // Extract reads + extract_kraken2_reads = true + fastq_output = true + + extract_centrifuge_reads = true + extract_diamond_reads = true + + // Genome references + genome = 'R64-1-1' +} diff --git a/viral_pathogen_List.csv b/viralPathogenList.csv similarity index 100% rename from viral_pathogen_List.csv rename to viralPathogenList.csv From aab25e2e3d3c4202ad08142fb8f64da3d92f7e95 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:24:22 +0200 Subject: [PATCH 07/25] update the test.config --- conf/test.config | 3 --- 1 file changed, 3 deletions(-) diff --git a/conf/test.config b/conf/test.config index e07e314..0b6517e 100644 --- a/conf/test.config +++ b/conf/test.config @@ -20,11 +20,8 @@ params { max_time = '6.h' // Input data - //input = '../final_test_data/samplesheet_v3.csv' input = 'assets/samplesheet_v1.csv' - taxid = '211044 11676' //separated by space - // Extract reads extract_kraken2_reads = true fastq_output = true From c065fe886b39871d610893b995407b72f4f26747 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Mon, 24 Jun 2024 13:29:10 +0200 Subject: [PATCH 08/25] add a new line to viralPahogenList.csv --- viralPathogenList.csv | 594 +++++++++++++++++++++--------------------- 1 file changed, 297 insertions(+), 297 deletions(-) diff --git a/viralPathogenList.csv b/viralPathogenList.csv index 940bbbe..78e208b 100644 --- a/viralPathogenList.csv +++ b/viralPathogenList.csv @@ -1,297 +1,297 @@ -Organism_Name;Species;Genus;Family;Taxid;Notes -Human mastadenovirus A;Human mastadenovirus A;Mastadenovirus;Adenoviridae;129875; -Human mastadenovirus B;Human mastadenovirus B;Mastadenovirus;Adenoviridae;108098; -Human mastadenovirus C;Human mastadenovirus C;Mastadenovirus;Adenoviridae;129951; -Human mastadenovirus D;Human mastadenovirus D;Mastadenovirus;Adenoviridae;130310; -Human mastadenovirus E;Human mastadenovirus E;Mastadenovirus;Adenoviridae;130308; -human adenovirus 52;Human mastadenovirus G;Mastadenovirus;Adenoviridae;332179; -Human mastadenovirus F;Human mastadenovirus F;Mastadenovirus;Adenoviridae;130309; -Lyssavirus rabies;Rabies virus ;Lyssavirus;Alpharhabdovirinae;11292; -Anelloviridae sp.;Anelloviridae sp.;;Anelloviridae;2055263; -Gyrovirus 4;Gyrovirus homsa3;Gyrovirus;Anelloviridae;1214955; -Gyrovirus GyV3;Gyrovirus homsa1;Gyrovirus;Anelloviridae;1163715; -Gyrovirus Tu243;Gyrovirus homsa4;Gyrovirus;Anelloviridae;1415627; -Gyrovirus Tu789;Gyrovirus homsa2;Gyrovirus;Anelloviridae;1415628; -Small anellovirus 1;Small anellovirus;;Anelloviridae;289366; -Small anellovirus 2;Small anellovirus;;Anelloviridae;289367; -Torque teno midi virus 1;Gammatorquevirus homidi1;Gammatorquevirus;Anelloviridae;687379; -Torque teno midi virus 10;Gammatorquevirus homidi10;Gammatorquevirus;Anelloviridae;2065051; -Torque teno midi virus 11;Gammatorquevirus homidi11;Gammatorquevirus;Anelloviridae;2065052; -Torque teno midi virus 12;Gammatorquevirus homidi12;Gammatorquevirus;Anelloviridae;2065053; -Torque teno midi virus 13;Gammatorquevirus homidi13;Gammatorquevirus;Anelloviridae;2065054; -Torque teno midi virus 14;Gammatorquevirus homidi14;Gammatorquevirus;Anelloviridae;2065055; -Torque teno midi virus 2;Gammatorquevirus homidi2;Gammatorquevirus;Anelloviridae;687380; -Torque teno midi virus 3;Gammatorquevirus homidi3;Gammatorquevirus;Anelloviridae;2065044; -Torque teno midi virus 4;Gammatorquevirus homidi4;Gammatorquevirus;Anelloviridae;2065045; -Torque teno midi virus 5;Gammatorquevirus homidi5;Gammatorquevirus;Anelloviridae;2065046; -Torque teno midi virus 6;Gammatorquevirus homidi6;Gammatorquevirus;Anelloviridae;2065047; -Torque teno midi virus 7;Gammatorquevirus homidi7;Gammatorquevirus;Anelloviridae;2065048; -Torque teno midi virus 8;Gammatorquevirus homidi8;Gammatorquevirus;Anelloviridae;2065049; -Torque teno midi virus 9;Gammatorquevirus homidi9;Gammatorquevirus;Anelloviridae;2065050; -Torque teno mini virus 1;Betatorquevirus homini1;Betatorquevirus;Anelloviridae;687369; -Torque teno mini virus 10;Betatorquevirus homini10;Betatorquevirus;Anelloviridae;2065036; -Torque teno mini virus 11;Betatorquevirus homini11;Betatorquevirus;Anelloviridae;2065037; -Torque teno mini virus 12;Betatorquevirus homini12;Betatorquevirus;Anelloviridae;2065038; -Torque teno mini virus 18;Betatorquevirus homini18;Betatorquevirus;Anelloviridae;1859149; -Torque teno mini virus 5;Betatorquevirus homini5;Betatorquevirus;Anelloviridae;687373; -Torque teno mini virus 6;Betatorquevirus homini6;Betatorquevirus;Anelloviridae;687374; -Torque teno mini virus 8;Betatorquevirus homini8;Betatorquevirus;Anelloviridae;687376; -Torque teno mini virus ALA22;Betatorquevirus homini27;Betatorquevirus;Anelloviridae;1535290; -Torque teno mini virus ALH8;Betatorquevirus homini16;Betatorquevirus;Anelloviridae;1535291; -Torque teno mini virus SHA;Betatorquevirus homini26;Betatorquevirus;Anelloviridae;2057931; -Torque teno virus;Torque teno virus;;Anelloviridae;68887; -Torque teno virus 9;Alphatorquevirus homin9;Alphatorquevirus;Anelloviridae;687348; -TTV-like mini virus;TTV-like mini virus;Betatorquevirus;Anelloviridae;93678; -Torque teno virus 6;Torque teno virus;Anellovirus;Anelloviridae;687345; -Mammarenavirus chapareense;Mammarenavirus chapareense;Mammarenavirus;Arenaviridae;3052302; -Mammarenavirus lujoense;Mammarenavirus lujoense;Mammarenavirus;Arenaviridae;3052314; -Mammarenavirus juninense;Mammarenavirus juninense;Mammarenavirus;Arenaviridae;2169991; -Mammarenavirus lassaense;Mammarenavirus lassaense ;Mammarenavirus;Arenaviridae;3052310; -Mammarenavirus choriomeningitidis;Mammarenavirus choriomeningitidis;Mammarenavirus;Arenaviridae;3052303; -Mammarenavirus machupoense;Mammarenavirus machupoense;Mammarenavirus;Arenaviridae;3052317; -Sabia virus;Mammarenavirus brazilense;Mammarenavirus;Arenaviridae;2907957; -Mammarenavirus whitewaterense;Mammarenavirus whitewaterense;Mammarenavirus;Arenaviridae;3052331; -Astrovirus MLB2;Astrovirus MLB2;;Astroviridae;683172; -Astrovirus MLB3;Astrovirus MLB3;;Astroviridae;1247114; -Astrovirus VA1;Mamastrovirus 9;Mamastrovirus;Astroviridae;645687; -Astrovirus VA3;Astrovirus VA3;;Astroviridae;683174; -Astrovirus VA4;Astrovirus VA4;;Astroviridae;1247113; -Bastrovirus 7;Bastrovirus BAS-1;;Astroviridae;1803394; -HMO Astrovirus A;HMO Astrovirus A;Mamastrovirus;Astroviridae;682382; -Human astrovirus BF34;Burkina Faso astrovirus;Mamastrovirus;Astroviridae;1518575; -Borna disease virus 1;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714621; -Borna disease virus 2;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714622; -Norovirus GI;Norwalk virus;Norovirus;Caliciviridae;122928; -Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866;Norwalk virus;Norovirus;Caliciviridae;1529909; -Norovirus GII;Norwalk virus;Norovirus;Caliciviridae;122929; -Norovirus GII.17;Norwalk virus;Norovirus;Caliciviridae;552592; -Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299;Norwalk virus;Norovirus;Caliciviridae;1529918; -Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS;Norwalk virus;Norovirus;Caliciviridae;1529924; -Norovirus GIV;Norwalk virus;Norovirus;Caliciviridae;262897; -Sapovirus Hu/GI/Sapporo/MT-2010/1982;Sapporo virus;Sapovirus;Caliciviridae;758863; -Cyclovirus NG12;Cyclovirus mmadu;Cyclovirus;Circoviridae;742922; -Cyclovirus NG14;Cyclovirus mutum;Cyclovirus;Circoviridae;742923; -Cyclovirus PK5006;Cyclovirus insaan;Cyclovirus;Circoviridae;742915; -Cyclovirus PK5034;Cyclovirus homa;Cyclovirus;Circoviridae;742916; -Cyclovirus PK5222;Cyclovirus manukha;Cyclovirus;Circoviridae;742917; -Cyclovirus PK5510;Cyclovirus maanav;Cyclovirus;Circoviridae;742918; -Cyclovirus SL-108277;Cyclovirus manitan;Cyclovirus;Circoviridae;1520935; -Cyclovirus TN25;Cyclovirus bashri;Cyclovirus;Circoviridae;742924; -Cyclovirus VN;Cyclovirus nhanloai;Cyclovirus;Circoviridae;1348500; -Human associated cyclovirus 10;Cyclovirus humana;Cyclovirus;Circoviridae;2038728; -Human circovirus VS6600022;Human circovirus VS6600022;Circovirus;Circoviridae;1525173; -Human cyclovirus VS5700009;Cyclovirus munthu;Cyclovirus;Circoviridae;1345637; -Human fecal virus Jorvi2;Human fecal virus Jorvi2;;Circoviridae;2017081; -Human fecal virus Jorvi3;Human fecal virus Jorvi3;;Circoviridae;2017082; -Human fecal virus Jorvi4;Human fecal virus Jorvi4;;Circoviridae;2017083; -Human PoSCV5-like circular virus;Human PoSCV5-like circular virus;;Circoviridae;1965018; -Human stool-associated circular virus NG13;Circovirus eniyan;Circovirus;Circoviridae;743300; -Indian encephalitis associated cyclovirus;Cyclovirus manusyan;Cyclovirus;Circoviridae;1755290; -Betacoronavirus England 1;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1263720; -Human coronavirus HKU1;Human coronavirus HKU1;Betacoronavirus;Coronaviridae;290028; -Middle East respiratory syndrome-related coronavirus;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1335626; -SARS coronavirus Tor2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;227984; -Severe acute respiratory syndrome coronavirus 2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;2697049; -Hepatitis delta virus;Hepatitis delta virus;Deltavirus;Deltaflexiviridae;12475; -Bundibugyo ebolavirus;Orthoebolavirus bundibugyoense;Orthoebolavirus;Filoviridae;565995; -Orthomarburgvirus marburgense;Orthomarburgvirus marburgense;Orthomarburgvirus;Filoviridae;3052505; -Sudan ebolavirus;Orthoebolavirus sudanense;Orthoebolavirus;Filoviridae;186540; -Tai Forest ebolavirus;Orthoebolavirus taiense;Orthoebolavirus;Filoviridae;186541; -Bombali virus;Ebolavirus;Ebolavirus;Filoviridae;2010960; -Orthomarburgvirus marburgense;Lake Victoria marburgvirus;Marburgvirus;Filoviridae;3052505; -Hepacivirus platyrrhini;Hepacivirus platyrrhini;Hepacivirus;Flaviviridae;3052236; -Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; -Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; -Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; -Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; -Human hepegivirus;Pegivirus columbiaense;Pegivirus;Flaviviridae;1704090; -Human pegivirus 2;Pegivirus columbiaense;Pegivirus;Flaviviridae;1729141; -Zika virus;Orthoflavivirus zikaense;Orthoflavivirus;Flaviviridae;64320; -West Nile virus strain NY-99;West Nile virus;Flavivirus;Flaviviridae;1968826; -Japanese encephalitis virus;Japanese encephalitis virus;Flavivirus;Flaviviridae;11072; -Murray Valley encephalitis virus;Murray valley encephalitis virus;Flavivirus;Flaviviridae;11079; -St. Louis encephalitis virus;Saint Louis encephalitis virus;Flavivirus;Flaviviridae;11080; -Tick-borne encephalitis virus;Tick-borne encephalitis virus;Flavivirus;Flaviviridae;11084; -Zika virus;Zika virus;Flavivirus;Flaviviridae;64320; -dengue virus type 1; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11053; -dengue virus type 2; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11060; -dengue virus type 3; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11069; -dengue virus type 4; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11070; -Hepatitis C virus genotype 1;Hepacivirus hominis;Hepacivirus;Flaviviridae;41856; -"Hepatitis C virus genotype 2 strain=HC-J6CH";Hepacivirus hominis;Hepacivirus;Flaviviridae;40271; -Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; -Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; -Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; -Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; -Gemycircularvirus C1c;Gemykibivirus humas3;Gemykibivirus;Genomoviridae;1673681; -Gemycircularvirus HV-GcV1;Gemycircularvirus HV-GcV1;Gemycircularvirus;Genomoviridae;1862824; -Gemycircularvirus HV-GcV2;Gemykibivirus humas5;Gemykibivirus;Genomoviridae;1862825; -Gemycircularvirus sp.;Gemycircularvirus sp.;Gemycircularvirus;Genomoviridae;1983771; -Human associated gemyvongvirus 1;Gemyvongvirus humas1;Gemyvongvirus;Genomoviridae;1985415; -Human gemycircularvirus GeTz1;Gemykibivirus humas4;Gemykibivirus;Genomoviridae;1792832; -Human genital-associated circular DNA virus-1;Gemygorvirus sewopo1;Gemygorvirus;Genomoviridae;1488574; -Orthohantavirus sinnombreense;Orthohantavirus sinnombreense;Orthohantavirus;Hantaviridae;3052499; -Hepatitis B virus;Hepatitis B virus;Orthohepadnavirus;Hepadnaviridae;10407; -Hepatitis E virus rat/R63/DEU/2009;Rocahepevirus ratti ;Orthohepevirinae;Hepeviridae;879096;Human Hepatitis E virus doesn't have complete genome -Rubella virus;Rubivirus rubellae;Rubivirus;Matonaviridae;11041; -Beiji nairovirus;Beiji nairovirus;Orthonairovirus;Nairoviridae;2304647; -Songling virus;Songling virus;Orthonairovirus;Nairoviridae;2795181; -Yezo virus;Yezo virus;Orthonairovirus;Nairoviridae;2825847; -Human alphaherpesvirus 1;implexvirus humanalpha1;Simplexvirus;Orthoherpesviridae;10298; -Human alphaherpesvirus 2;Simplexvirus humanalpha2;Simplexvirus;Orthoherpesviridae;10310; -Human alphaherpesvirus 3;Varicellovirus humanalpha3;Varicellovirus;Orthoherpesviridae;10335; -Human betaherpesvirus 5;Cytomegalovirus humanbeta5;Cytomegalovirus;Orthoherpesviridae;10359; -Human betaherpesvirus 6A;Roseolovirus humanbeta6a;Roseolovirus;Orthoherpesviridae;32603; -Human betaherpesvirus 6B;Roseolovirus humanbeta6b;Roseolovirus;Orthoherpesviridae;32604; -Human betaherpesvirus 7;Roseolovirus humanbeta7;Roseolovirus;Orthoherpesviridae;10372; -human gammaherpesvirus 4;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;10376; -Human gammaherpesvirus 8;Rhadinovirus humangamma8;Rhadinovirus;Orthoherpesviridae;37296; -Human herpesvirus 4 type 2;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;12509; -Influenza A virus (A/California/07/2009(H1N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;641809; -Influenza A virus (A/Korea/426/1968(H2N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;488241; -Influenza A virus (A/New York/392/2004(H3N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;335341; -Influenza A virus (A/goose/Guangdong/1/1996(H5N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;93838; -Influenza A virus (A/chicken/Mexico/23-12/2012(H5N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1399123;No complete genome -Influenza A virus (A/Shanghai/02/2013(H7N9));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1332244; -Influenza A virus (A/Hong Kong/1073/99(H9N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;130760; -Influenza B virus (B/Lee/1940);Influenza B virus;Betainfluenzavirus;Orthomyxoviridae;518987; -Influenza C virus (C/Ann Arbor/1/50);Influenza C virus;Gammainfluenzavirus;Orthomyxoviridae;11553; -Influenza D virus (D/swine/Oklahoma/1334/2011);Influenza D virus;Deltainfluenzavirus;Orthomyxoviridae;1173138; -Bourbon virus;Bourbon virus;Thogotovirus;Orthomyxoviridae;1618189; -Dhori virus (strain Indian/1313/61);Dhori virus;Thogotovirus;Orthomyxoviridae;11319; -Thogotovirus;Thogotovirus;Thogotovirus;Orthomyxoviridae;35323; -Gammapapillomavirus sp.;Gammapapillomavirus sp.;Gammapapillomavirus;Papillomaviridae;2049444; -Human papillomavirus;Human papillomavirus;;Papillomaviridae;10566; -Human papillomavirus 116;Gammapapillomavirus 9;Gammapapillomavirus;Papillomaviridae;915428; -Human papillomavirus 121;Gammapapillomavirus 10;Gammapapillomavirus;Papillomaviridae;915429; -Human papillomavirus 126;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1055684; -Human papillomavirus 127;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;746832; -Human papillomavirus 132;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;909331; -Human papillomavirus 134;Gammapapillomavirus 7;Gammapapillomavirus;Papillomaviridae;909333; -Human papillomavirus 135;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1070408; -Human papillomavirus 136;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070409; -Human papillomavirus 140;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070413; -Human papillomavirus 154;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1195796; -human papillomavirus 166;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315259; -Human papillomavirus 167;Gammapapillomavirus 21;Gammapapillomavirus;Papillomaviridae;1420545; -Human papillomavirus 172;Gammapapillomavirus 22;Gammapapillomavirus;Papillomaviridae;1434987; -Human papillomavirus 175;Gammapapillomavirus 23;Gammapapillomavirus;Papillomaviridae;1434782; -Human papillomavirus 178;Gammapapillomavirus 24;Gammapapillomavirus;Papillomaviridae;1478160; -Human papillomavirus 179;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1472342; -Human papillomavirus 184;Gammapapillomavirus 25;Gammapapillomavirus;Papillomaviridae;1472343; -Human papillomavirus 187;Gammapapillomavirus 26;Gammapapillomavirus;Papillomaviridae;1851130; -Human papillomavirus 201;Gammapapillomavirus 27;Gammapapillomavirus;Papillomaviridae;1682340; -Human papillomavirus 204;Mupapillomavirus 3;Mupapillomavirus;Papillomaviridae;1650736; -Human papillomavirus KC5;Human papillomavirus KC5;Gammapapillomavirus;Papillomaviridae;1647924; -Human papillomavirus type 161;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315264; -Human papillomavirus type 85;Human papillomavirus type 85;;Papillomaviridae;652810; -Human papillomavirus;Human papillomavirus;Papillomavirus;Papillomaviridae;10566; -Sosuga virus;Pararubulavirus sosugaense;Pararubulavirus;Paramyxoviridae;1452514; -Henipavirus hendraense;Hendra virus;Henipavirus;Paramyxoviridae;3052223; -Henipavirus nipahense;Nipah virus;Henipavirus;Paramyxoviridae;3052225; -human metapneumovirus;Human metapneumovirus;Metapneumovirus;Paramyxoviridae;162145; -Human orthorubulavirus 2;Human orthorubulavirus 2;Orthorubulavirus;Paramyxoviridae;2560525; -Human respirovirus 1;Human Respirovirus 1;Respirovirus;Paramyxoviridae;12730; -Human respirovirus 3;Human Respirovirus 3;Respirovirus;Paramyxoviridae;11216; -Measles morbillivirus;Morbillivirus;Morbillivirus;Paramyxoviridae;11234; -Mumps orthorubulaviru;Mumps virus;Orthorubulavirus;Paramyxoviridae;2560602; -Bocaparvovirus primate1;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;3052040; -Bufavirus-3;Bufavirus-3;;Parvoviridae;1391667; -Cutavirus;Protoparvovirus primate3;Protoparvovirus;Parvoviridae;1867125; -Human bocavirus 2c PK;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511882; -Human bocavirus 3;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;638313; -Human bocavirus 4 NI;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511883; -Human erythrovirus V9;Human erythrovirus V9;Erythroparvovirus;Parvoviridae;72197; -Human parvovirus 4 G1;Tetraparvovirus primate1;Tetraparvovirus;Parvoviridae;1511919; -Parvovirus NIH-CQV;Parvovirus NIH-CQV;;Parvoviridae;1341019; -Orthobunyavirus bwambaense;Orthobunyavirus bwambaense;Orthobunyavirus;Peribunyaviridae;3052384; -California encephalitis virus;Orthobunyavirus;Orthobunyavirus ;Peribunyaviridae;35305; -Catu virus;Orthobunyavirus catuense;Orthobunyavirus;Peribunyaviridae;1678225; -Fort Sherman virus;Orthobunyavirus shermanense;Orthobunyavirus;Peribunyaviridae;273345; -Guaroa virus;Orthobunyavirus guaroaense;Orthobunyavirus;Peribunyaviridae;80941; -Ilesha virus;Orthobunyavirus ileshaense;Orthobunyavirus;Peribunyaviridae;273341; -Madrid virus;Orthobunyavirus madridense;Orthobunyavirus;Peribunyaviridae;348013; -Alenquer virus;Phlebovirus alenquerense;Phlebovirus;Phenuiviridae;629726; -Chandiru virus;Phlebovirus candiruense;Phlebovirus;Phenuiviridae;629725; -Cocle virus;Phlebovirus cocleense;Phlebovirus;Phenuiviridae;1649829; -Dar es Salaam virus TZ-189;Tanzavirus daressalaamense;Tanzavirus;Phenuiviridae;2576944; -Echarate virus;Phlebovirus echarateense;Phlebovirus;Phenuiviridae;1000646; -Heartland virus;Bandavirus heartlandense;Bandavirus;Phenuiviridae;1216928; -Maldonado virus;Phlebovirus maldonadoense;Phlebovirus;Phenuiviridae;1004889; -Punta Toro virus;Phlebovirus toroense;Phlebovirus;Phenuiviridae;11587; -Sandfly fever Turkey virus;Phlebovirus siciliaense;Phlebovirus;Phenuiviridae;688699; -Severe fever with thrombocytopenia virus;Bandavirus dabieense;Bandavirus;Phenuiviridae;1003835; -SFTS virus HB29;Bandavirus dabieense;Bandavirus;Phenuiviridae;992212; -aichivirus A1;Aichivirus A;Kobuvirus;Picornaviridae;1313215; -Cosavirus A;Cosavirus A;Cosavirus;Picornaviridae;1330491; -Cosavirus D;Cosavirus D;Cosavirus;Picornaviridae;2003650; -Cosavirus E;Cosavirus E;Cosavirus;Picornaviridae;2003651; -Cosavirus F;Cosavirus F;Cosavirus;Picornaviridae;2003652; -Cosavirus JMY-2014;Cosavirus JMY-2014;Cosavirus;Picornaviridae;1582094; -Coxsackievirus B3;Enterovirus B;Enterovirus;Picornaviridae;12072; -enterovirus A114;Enterovirus A;Enterovirus;Picornaviridae;2760809; -Human cosavirus;Human cosavirus;Cosavirus;Picornaviridae;1233383; -Human cosavirus B;Cosavirus B;Cosavirus;Picornaviridae;586420; -rosavirus A2;Rosavirus A;Rosavirus;Picornaviridae;1511807; -Salivirus A;Salivirus A;Salivirus;Picornaviridae;1330524; -Salivirus FHB;Salivirus FHB;Salivirus;Picornaviridae;1547495; -Salivirus NG-J1;Salivirus A;Salivirus;Picornaviridae;651733; -Encephalomyocarditis virus;Encephalomyocarditis virus;Cardiovirus;Picornaviridae;12104; -Hepatovirus A;Hepatitis A virus;Hepatovirus;Picornaviridae;12092; -Human polyomavirus 6;Deltapolyomavirus sextihominis;Deltapolyomavirus;Polyomaviridae;746830; -Human polyomavirus 7;Deltapolyomavirus septihominis;Deltapolyomavirus;Polyomaviridae;746831; -Human polyomavirus 9;Alphapolyomavirus nonihominis;Alphapolyomavirus;Polyomaviridae;943908; -LI polyomavirus;Alphapolyomavirus quardecihominis;Alphapolyomavirus;Polyomaviridae;1965344; -Merkel cell polyomavirus;Alphapolyomavirus quintihominis;Alphapolyomavirus;Polyomaviridae;493803; -MW polyomavirus;Deltapolyomavirus decihominis;Deltapolyomavirus;Polyomaviridae;1203539; -New Jersey polyomavirus-2013;Alphapolyomavirus terdecihominis;Alphapolyomavirus;Polyomaviridae;1497391; -STL polyomavirus;Deltapolyomavirus undecihominis;Deltapolyomavirus;Polyomaviridae;1277649; -Trichodysplasia spinulosa-associated polyomavirus;Alphapolyomavirus octihominis;Alphapolyomavirus;Polyomaviridae;862909; -BK polyomavirus MM;BK polyomavirus;Betapolyomavirus;Polyomaviridae;1417981; -Betapolyomavirus tertihominis;KI Polyomavirus;Betapolyomavirus;Polyomaviridae;1891764; -Merkel cell polyomavirus;Merkel cell polyomavirus;Orthopolyomavirus;Polyomaviridae;493803; -WU Polyomavirus;WU polyomavirus;Betapolyomavirus;Polyomaviridae;440266; -Akhmeta virus;Akhmeta virus;Orthopoxvirus;Poxviridae;2200830; -Monkeypox virus;Monkeypox virus;Orthopoxvirus;Poxviridae;10244; -NY_014 poxvirus;NY_014 poxvirus;Centapoxvirus;Poxviridae;2025360; -Molluscum contagiosum virus subtype 1;Molluscum contagiosum virus;Molluscipoxvirus;Poxviridae;10280; -Orf virus;Orf virus;Parapoxvirus;Poxviridae;10258; -Yaba monkey tumor virus;Yaba monkey tumor virus;Yatapoxvirus;Poxviridae;38804; -Yaba-like disease virus;Yaba-like disease virus;Yatapoxvirus;Poxviridae;132475; -Human lung-associated vientovirus FB;Vientovirus;Torbevirus;Redondoviridae;2571082; -Banana virus X;Banna virus;Bannavirus;Reoviridae;307671; -Eyach virus;Eyach virus;Coltivirus;Reoviridae;62352; -Rotavirus A;Rotavirus A;Rotavirus;Reoviridae;28875; -Rotavirus C;Rotavirus C;Rotavirus;Reoviridae;36427; -Central cimpanzee simian foamy virus;Central cimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170194; -Eastern chimpanzee simian foamy virus;Eastern chimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170195; -Guenon simian foamy virus;Guenon simian foamy virus;Simiispumavirus;Retroviridae;2170197; -Human endogenous retrovirus K113;Human endogenous retrovirus K;;Retroviridae;166122; -Human immunodeficiency virus 1;Human immunodeficiency virus 1;Lentivirus;Retroviridae;11676; -Human immunodeficiency virus 2;Human immunodeficiency virus 2;Lentivirus;Retroviridae;11709; -Human T-lymphotropic virus 4;Human T-lymphotropic virus 4;Deltaretrovirus;Retroviridae;318279; -Human foamy virus;Human foamy virus;Spumavirus;Retroviridae;11641; -Tibrovirus congo;Tibrovirus congo;Tibrovirus;Rhabdoviridae;1987017; -Chandipura virus;Vesiculovirus chandipura;Vesiculovirus;Rhabdoviridae;11272; -Lyssavirus duvenhage;Lyssavirus duvenhage;Lyssavirus;Rhabdoviridae;38767; -Ekpoma virus 1;Tibrovirus alphaekpoma;Tibrovirus;Rhabdoviridae;1987020; -Ekpoma virus 2;Tibrovirus betaekpoma;Tibrovirus;Rhabdoviridae;1987021; -European bat lyssavirus 2;Lyssavirus helsinki;Lyssavirus;Rhabdoviridae;57483; -Le Dantec virus;Ledantevirus ledantec;Ledantevirus;Rhabdoviridae;318848; -Mundri virus;Mundri virus;;Rhabdoviridae;2913478; -Lebombo virus;Lebombo virus;Orbivirus;Sedoreoviridae;40057; -Orungo virus;Orungo virus;Orbivirus;Sedoreoviridae;40058; -Human associated huchismacovirus 1;Human associated huchismacovirus 1;Huchismacovirus;Smacoviridae;2169934; -Human associated huchismacovirus 2;Human associated huchismacovirus 2;Huchismacovirus;Smacoviridae;2169935; -Human associated huchismacovirus 3;Human associated huchismacovirus 3;Huchismacovirus;Smacoviridae;2169936; -Human associated porprismacovirus;Inpeasmacovirus humas1;Inpeasmacovirus;Smacoviridae;2530494; -Human associated porprismacovirus 3;Porprismacovirus humas4;Porprismacovirus;Smacoviridae;2496633; -Human feces smacovirus 2;Porprismacovirus humas1;Porprismacovirus;Smacoviridae;1820158; -Human feces smacovirus 3;Porprismacovirus humas3;Porprismacovirus;Smacoviridae;1820159; -Human smacovirus 1;Human smacovirus 1;Huchismacovirus;Smacoviridae;1595998; -Mammalian orthoreovirus 3 Dearing;Mammalian orthoreovirus;Orthoreovirus;Spinareoviridae;10886; -Ross River virus;Ross River virus;Alphavirus;Togaviridae;11029; -"Chikungunya virus strain=S27-African prototype";Chikungunya virus;Alphavirus;Togaviridae ;37124; -Human torovirus;Human torovirus;Torovirus;Toroviridae;67605; -Circo-like virus-Brazil hs1;Circo-like virus-Brazil;;;1346815; -Hudisavirus sp.;Hudisavirus sp.;;;2021738; \ No newline at end of file +Organism_Name;Species;Genus;Family;Taxid;Notes +Human mastadenovirus A;Human mastadenovirus A;Mastadenovirus;Adenoviridae;129875; +Human mastadenovirus B;Human mastadenovirus B;Mastadenovirus;Adenoviridae;108098; +Human mastadenovirus C;Human mastadenovirus C;Mastadenovirus;Adenoviridae;129951; +Human mastadenovirus D;Human mastadenovirus D;Mastadenovirus;Adenoviridae;130310; +Human mastadenovirus E;Human mastadenovirus E;Mastadenovirus;Adenoviridae;130308; +human adenovirus 52;Human mastadenovirus G;Mastadenovirus;Adenoviridae;332179; +Human mastadenovirus F;Human mastadenovirus F;Mastadenovirus;Adenoviridae;130309; +Lyssavirus rabies;Rabies virus ;Lyssavirus;Alpharhabdovirinae;11292; +Anelloviridae sp.;Anelloviridae sp.;;Anelloviridae;2055263; +Gyrovirus 4;Gyrovirus homsa3;Gyrovirus;Anelloviridae;1214955; +Gyrovirus GyV3;Gyrovirus homsa1;Gyrovirus;Anelloviridae;1163715; +Gyrovirus Tu243;Gyrovirus homsa4;Gyrovirus;Anelloviridae;1415627; +Gyrovirus Tu789;Gyrovirus homsa2;Gyrovirus;Anelloviridae;1415628; +Small anellovirus 1;Small anellovirus;;Anelloviridae;289366; +Small anellovirus 2;Small anellovirus;;Anelloviridae;289367; +Torque teno midi virus 1;Gammatorquevirus homidi1;Gammatorquevirus;Anelloviridae;687379; +Torque teno midi virus 10;Gammatorquevirus homidi10;Gammatorquevirus;Anelloviridae;2065051; +Torque teno midi virus 11;Gammatorquevirus homidi11;Gammatorquevirus;Anelloviridae;2065052; +Torque teno midi virus 12;Gammatorquevirus homidi12;Gammatorquevirus;Anelloviridae;2065053; +Torque teno midi virus 13;Gammatorquevirus homidi13;Gammatorquevirus;Anelloviridae;2065054; +Torque teno midi virus 14;Gammatorquevirus homidi14;Gammatorquevirus;Anelloviridae;2065055; +Torque teno midi virus 2;Gammatorquevirus homidi2;Gammatorquevirus;Anelloviridae;687380; +Torque teno midi virus 3;Gammatorquevirus homidi3;Gammatorquevirus;Anelloviridae;2065044; +Torque teno midi virus 4;Gammatorquevirus homidi4;Gammatorquevirus;Anelloviridae;2065045; +Torque teno midi virus 5;Gammatorquevirus homidi5;Gammatorquevirus;Anelloviridae;2065046; +Torque teno midi virus 6;Gammatorquevirus homidi6;Gammatorquevirus;Anelloviridae;2065047; +Torque teno midi virus 7;Gammatorquevirus homidi7;Gammatorquevirus;Anelloviridae;2065048; +Torque teno midi virus 8;Gammatorquevirus homidi8;Gammatorquevirus;Anelloviridae;2065049; +Torque teno midi virus 9;Gammatorquevirus homidi9;Gammatorquevirus;Anelloviridae;2065050; +Torque teno mini virus 1;Betatorquevirus homini1;Betatorquevirus;Anelloviridae;687369; +Torque teno mini virus 10;Betatorquevirus homini10;Betatorquevirus;Anelloviridae;2065036; +Torque teno mini virus 11;Betatorquevirus homini11;Betatorquevirus;Anelloviridae;2065037; +Torque teno mini virus 12;Betatorquevirus homini12;Betatorquevirus;Anelloviridae;2065038; +Torque teno mini virus 18;Betatorquevirus homini18;Betatorquevirus;Anelloviridae;1859149; +Torque teno mini virus 5;Betatorquevirus homini5;Betatorquevirus;Anelloviridae;687373; +Torque teno mini virus 6;Betatorquevirus homini6;Betatorquevirus;Anelloviridae;687374; +Torque teno mini virus 8;Betatorquevirus homini8;Betatorquevirus;Anelloviridae;687376; +Torque teno mini virus ALA22;Betatorquevirus homini27;Betatorquevirus;Anelloviridae;1535290; +Torque teno mini virus ALH8;Betatorquevirus homini16;Betatorquevirus;Anelloviridae;1535291; +Torque teno mini virus SHA;Betatorquevirus homini26;Betatorquevirus;Anelloviridae;2057931; +Torque teno virus;Torque teno virus;;Anelloviridae;68887; +Torque teno virus 9;Alphatorquevirus homin9;Alphatorquevirus;Anelloviridae;687348; +TTV-like mini virus;TTV-like mini virus;Betatorquevirus;Anelloviridae;93678; +Torque teno virus 6;Torque teno virus;Anellovirus;Anelloviridae;687345; +Mammarenavirus chapareense;Mammarenavirus chapareense;Mammarenavirus;Arenaviridae;3052302; +Mammarenavirus lujoense;Mammarenavirus lujoense;Mammarenavirus;Arenaviridae;3052314; +Mammarenavirus juninense;Mammarenavirus juninense;Mammarenavirus;Arenaviridae;2169991; +Mammarenavirus lassaense;Mammarenavirus lassaense ;Mammarenavirus;Arenaviridae;3052310; +Mammarenavirus choriomeningitidis;Mammarenavirus choriomeningitidis;Mammarenavirus;Arenaviridae;3052303; +Mammarenavirus machupoense;Mammarenavirus machupoense;Mammarenavirus;Arenaviridae;3052317; +Sabia virus;Mammarenavirus brazilense;Mammarenavirus;Arenaviridae;2907957; +Mammarenavirus whitewaterense;Mammarenavirus whitewaterense;Mammarenavirus;Arenaviridae;3052331; +Astrovirus MLB2;Astrovirus MLB2;;Astroviridae;683172; +Astrovirus MLB3;Astrovirus MLB3;;Astroviridae;1247114; +Astrovirus VA1;Mamastrovirus 9;Mamastrovirus;Astroviridae;645687; +Astrovirus VA3;Astrovirus VA3;;Astroviridae;683174; +Astrovirus VA4;Astrovirus VA4;;Astroviridae;1247113; +Bastrovirus 7;Bastrovirus BAS-1;;Astroviridae;1803394; +HMO Astrovirus A;HMO Astrovirus A;Mamastrovirus;Astroviridae;682382; +Human astrovirus BF34;Burkina Faso astrovirus;Mamastrovirus;Astroviridae;1518575; +Borna disease virus 1;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714621; +Borna disease virus 2;Orthobornavirus bornaense;Orthobornavirus;Bornaviridae;1714622; +Norovirus GI;Norwalk virus;Norovirus;Caliciviridae;122928; +Norovirus GI/Hu/JP/2007/GI.P3_GI.3/Shimizu/KK2866;Norwalk virus;Norovirus;Caliciviridae;1529909; +Norovirus GII;Norwalk virus;Norovirus;Caliciviridae;122929; +Norovirus GII.17;Norwalk virus;Norovirus;Caliciviridae;552592; +Norovirus GII/Hu/JP/2007/GII.P15_GII.15/Sapporo/HK299;Norwalk virus;Norovirus;Caliciviridae;1529918; +Norovirus GII/Hu/JP/2011/GII/Yuzawa/Gira2HS;Norwalk virus;Norovirus;Caliciviridae;1529924; +Norovirus GIV;Norwalk virus;Norovirus;Caliciviridae;262897; +Sapovirus Hu/GI/Sapporo/MT-2010/1982;Sapporo virus;Sapovirus;Caliciviridae;758863; +Cyclovirus NG12;Cyclovirus mmadu;Cyclovirus;Circoviridae;742922; +Cyclovirus NG14;Cyclovirus mutum;Cyclovirus;Circoviridae;742923; +Cyclovirus PK5006;Cyclovirus insaan;Cyclovirus;Circoviridae;742915; +Cyclovirus PK5034;Cyclovirus homa;Cyclovirus;Circoviridae;742916; +Cyclovirus PK5222;Cyclovirus manukha;Cyclovirus;Circoviridae;742917; +Cyclovirus PK5510;Cyclovirus maanav;Cyclovirus;Circoviridae;742918; +Cyclovirus SL-108277;Cyclovirus manitan;Cyclovirus;Circoviridae;1520935; +Cyclovirus TN25;Cyclovirus bashri;Cyclovirus;Circoviridae;742924; +Cyclovirus VN;Cyclovirus nhanloai;Cyclovirus;Circoviridae;1348500; +Human associated cyclovirus 10;Cyclovirus humana;Cyclovirus;Circoviridae;2038728; +Human circovirus VS6600022;Human circovirus VS6600022;Circovirus;Circoviridae;1525173; +Human cyclovirus VS5700009;Cyclovirus munthu;Cyclovirus;Circoviridae;1345637; +Human fecal virus Jorvi2;Human fecal virus Jorvi2;;Circoviridae;2017081; +Human fecal virus Jorvi3;Human fecal virus Jorvi3;;Circoviridae;2017082; +Human fecal virus Jorvi4;Human fecal virus Jorvi4;;Circoviridae;2017083; +Human PoSCV5-like circular virus;Human PoSCV5-like circular virus;;Circoviridae;1965018; +Human stool-associated circular virus NG13;Circovirus eniyan;Circovirus;Circoviridae;743300; +Indian encephalitis associated cyclovirus;Cyclovirus manusyan;Cyclovirus;Circoviridae;1755290; +Betacoronavirus England 1;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1263720; +Human coronavirus HKU1;Human coronavirus HKU1;Betacoronavirus;Coronaviridae;290028; +Middle East respiratory syndrome-related coronavirus;Middle East respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;1335626; +SARS coronavirus Tor2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;227984; +Severe acute respiratory syndrome coronavirus 2;Severe acute respiratory syndrome-related coronavirus;Betacoronavirus;Coronaviridae;2697049; +Hepatitis delta virus;Hepatitis delta virus;Deltavirus;Deltaflexiviridae;12475; +Bundibugyo ebolavirus;Orthoebolavirus bundibugyoense;Orthoebolavirus;Filoviridae;565995; +Orthomarburgvirus marburgense;Orthomarburgvirus marburgense;Orthomarburgvirus;Filoviridae;3052505; +Sudan ebolavirus;Orthoebolavirus sudanense;Orthoebolavirus;Filoviridae;186540; +Tai Forest ebolavirus;Orthoebolavirus taiense;Orthoebolavirus;Filoviridae;186541; +Bombali virus;Ebolavirus;Ebolavirus;Filoviridae;2010960; +Orthomarburgvirus marburgense;Lake Victoria marburgvirus;Marburgvirus;Filoviridae;3052505; +Hepacivirus platyrrhini;Hepacivirus platyrrhini;Hepacivirus;Flaviviridae;3052236; +Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; +Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; +Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; +Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; +Human hepegivirus;Pegivirus columbiaense;Pegivirus;Flaviviridae;1704090; +Human pegivirus 2;Pegivirus columbiaense;Pegivirus;Flaviviridae;1729141; +Zika virus;Orthoflavivirus zikaense;Orthoflavivirus;Flaviviridae;64320; +West Nile virus strain NY-99;West Nile virus;Flavivirus;Flaviviridae;1968826; +Japanese encephalitis virus;Japanese encephalitis virus;Flavivirus;Flaviviridae;11072; +Murray Valley encephalitis virus;Murray valley encephalitis virus;Flavivirus;Flaviviridae;11079; +St. Louis encephalitis virus;Saint Louis encephalitis virus;Flavivirus;Flaviviridae;11080; +Tick-borne encephalitis virus;Tick-borne encephalitis virus;Flavivirus;Flaviviridae;11084; +Zika virus;Zika virus;Flavivirus;Flaviviridae;64320; +dengue virus type 1; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11053; +dengue virus type 2; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11060; +dengue virus type 3; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11069; +dengue virus type 4; Orthoflavivirus denguei;Orthoflavivirus;Flaviviridae;11070; +Hepatitis C virus genotype 1;Hepacivirus hominis;Hepacivirus;Flaviviridae;41856; +"Hepatitis C virus genotype 2 strain=HC-J6CH";Hepacivirus hominis;Hepacivirus;Flaviviridae;40271; +Hepatitis C virus genotype 3;Hepacivirus hominis;Hepacivirus;Flaviviridae;356114; +Hepatitis C virus genotype 4;Hepacivirus hominis;Hepacivirus;Flaviviridae;33745; +Hepatitis C virus genotype 5;Hepacivirus hominis;Hepacivirus;Flaviviridae;33746; +Hepatitis C virus genotype 7;Hepacivirus hominis;Hepacivirus;Flaviviridae;1544901; +Gemycircularvirus C1c;Gemykibivirus humas3;Gemykibivirus;Genomoviridae;1673681; +Gemycircularvirus HV-GcV1;Gemycircularvirus HV-GcV1;Gemycircularvirus;Genomoviridae;1862824; +Gemycircularvirus HV-GcV2;Gemykibivirus humas5;Gemykibivirus;Genomoviridae;1862825; +Gemycircularvirus sp.;Gemycircularvirus sp.;Gemycircularvirus;Genomoviridae;1983771; +Human associated gemyvongvirus 1;Gemyvongvirus humas1;Gemyvongvirus;Genomoviridae;1985415; +Human gemycircularvirus GeTz1;Gemykibivirus humas4;Gemykibivirus;Genomoviridae;1792832; +Human genital-associated circular DNA virus-1;Gemygorvirus sewopo1;Gemygorvirus;Genomoviridae;1488574; +Orthohantavirus sinnombreense;Orthohantavirus sinnombreense;Orthohantavirus;Hantaviridae;3052499; +Hepatitis B virus;Hepatitis B virus;Orthohepadnavirus;Hepadnaviridae;10407; +Hepatitis E virus rat/R63/DEU/2009;Rocahepevirus ratti ;Orthohepevirinae;Hepeviridae;879096;Human Hepatitis E virus doesn't have complete genome +Rubella virus;Rubivirus rubellae;Rubivirus;Matonaviridae;11041; +Beiji nairovirus;Beiji nairovirus;Orthonairovirus;Nairoviridae;2304647; +Songling virus;Songling virus;Orthonairovirus;Nairoviridae;2795181; +Yezo virus;Yezo virus;Orthonairovirus;Nairoviridae;2825847; +Human alphaherpesvirus 1;implexvirus humanalpha1;Simplexvirus;Orthoherpesviridae;10298; +Human alphaherpesvirus 2;Simplexvirus humanalpha2;Simplexvirus;Orthoherpesviridae;10310; +Human alphaherpesvirus 3;Varicellovirus humanalpha3;Varicellovirus;Orthoherpesviridae;10335; +Human betaherpesvirus 5;Cytomegalovirus humanbeta5;Cytomegalovirus;Orthoherpesviridae;10359; +Human betaherpesvirus 6A;Roseolovirus humanbeta6a;Roseolovirus;Orthoherpesviridae;32603; +Human betaherpesvirus 6B;Roseolovirus humanbeta6b;Roseolovirus;Orthoherpesviridae;32604; +Human betaherpesvirus 7;Roseolovirus humanbeta7;Roseolovirus;Orthoherpesviridae;10372; +human gammaherpesvirus 4;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;10376; +Human gammaherpesvirus 8;Rhadinovirus humangamma8;Rhadinovirus;Orthoherpesviridae;37296; +Human herpesvirus 4 type 2;Lymphocryptovirus humangamma4;Lymphocryptovirus;Orthoherpesviridae;12509; +Influenza A virus (A/California/07/2009(H1N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;641809; +Influenza A virus (A/Korea/426/1968(H2N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;488241; +Influenza A virus (A/New York/392/2004(H3N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;335341; +Influenza A virus (A/goose/Guangdong/1/1996(H5N1));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;93838; +Influenza A virus (A/chicken/Mexico/23-12/2012(H5N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1399123;No complete genome +Influenza A virus (A/Shanghai/02/2013(H7N9));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;1332244; +Influenza A virus (A/Hong Kong/1073/99(H9N2));Alphainfluenzavirus influenzae;Alphainfluenzavirus;Orthomyxoviridae;130760; +Influenza B virus (B/Lee/1940);Influenza B virus;Betainfluenzavirus;Orthomyxoviridae;518987; +Influenza C virus (C/Ann Arbor/1/50);Influenza C virus;Gammainfluenzavirus;Orthomyxoviridae;11553; +Influenza D virus (D/swine/Oklahoma/1334/2011);Influenza D virus;Deltainfluenzavirus;Orthomyxoviridae;1173138; +Bourbon virus;Bourbon virus;Thogotovirus;Orthomyxoviridae;1618189; +Dhori virus (strain Indian/1313/61);Dhori virus;Thogotovirus;Orthomyxoviridae;11319; +Thogotovirus;Thogotovirus;Thogotovirus;Orthomyxoviridae;35323; +Gammapapillomavirus sp.;Gammapapillomavirus sp.;Gammapapillomavirus;Papillomaviridae;2049444; +Human papillomavirus;Human papillomavirus;;Papillomaviridae;10566; +Human papillomavirus 116;Gammapapillomavirus 9;Gammapapillomavirus;Papillomaviridae;915428; +Human papillomavirus 121;Gammapapillomavirus 10;Gammapapillomavirus;Papillomaviridae;915429; +Human papillomavirus 126;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1055684; +Human papillomavirus 127;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;746832; +Human papillomavirus 132;Gammapapillomavirus 12;Gammapapillomavirus;Papillomaviridae;909331; +Human papillomavirus 134;Gammapapillomavirus 7;Gammapapillomavirus;Papillomaviridae;909333; +Human papillomavirus 135;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1070408; +Human papillomavirus 136;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070409; +Human papillomavirus 140;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1070413; +Human papillomavirus 154;Gammapapillomavirus 11;Gammapapillomavirus;Papillomaviridae;1195796; +human papillomavirus 166;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315259; +Human papillomavirus 167;Gammapapillomavirus 21;Gammapapillomavirus;Papillomaviridae;1420545; +Human papillomavirus 172;Gammapapillomavirus 22;Gammapapillomavirus;Papillomaviridae;1434987; +Human papillomavirus 175;Gammapapillomavirus 23;Gammapapillomavirus;Papillomaviridae;1434782; +Human papillomavirus 178;Gammapapillomavirus 24;Gammapapillomavirus;Papillomaviridae;1478160; +Human papillomavirus 179;Gammapapillomavirus 15;Gammapapillomavirus;Papillomaviridae;1472342; +Human papillomavirus 184;Gammapapillomavirus 25;Gammapapillomavirus;Papillomaviridae;1472343; +Human papillomavirus 187;Gammapapillomavirus 26;Gammapapillomavirus;Papillomaviridae;1851130; +Human papillomavirus 201;Gammapapillomavirus 27;Gammapapillomavirus;Papillomaviridae;1682340; +Human papillomavirus 204;Mupapillomavirus 3;Mupapillomavirus;Papillomaviridae;1650736; +Human papillomavirus KC5;Human papillomavirus KC5;Gammapapillomavirus;Papillomaviridae;1647924; +Human papillomavirus type 161;Gammapapillomavirus 19;Gammapapillomavirus;Papillomaviridae;1315264; +Human papillomavirus type 85;Human papillomavirus type 85;;Papillomaviridae;652810; +Human papillomavirus;Human papillomavirus;Papillomavirus;Papillomaviridae;10566; +Sosuga virus;Pararubulavirus sosugaense;Pararubulavirus;Paramyxoviridae;1452514; +Henipavirus hendraense;Hendra virus;Henipavirus;Paramyxoviridae;3052223; +Henipavirus nipahense;Nipah virus;Henipavirus;Paramyxoviridae;3052225; +human metapneumovirus;Human metapneumovirus;Metapneumovirus;Paramyxoviridae;162145; +Human orthorubulavirus 2;Human orthorubulavirus 2;Orthorubulavirus;Paramyxoviridae;2560525; +Human respirovirus 1;Human Respirovirus 1;Respirovirus;Paramyxoviridae;12730; +Human respirovirus 3;Human Respirovirus 3;Respirovirus;Paramyxoviridae;11216; +Measles morbillivirus;Morbillivirus;Morbillivirus;Paramyxoviridae;11234; +Mumps orthorubulaviru;Mumps virus;Orthorubulavirus;Paramyxoviridae;2560602; +Bocaparvovirus primate1;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;3052040; +Bufavirus-3;Bufavirus-3;;Parvoviridae;1391667; +Cutavirus;Protoparvovirus primate3;Protoparvovirus;Parvoviridae;1867125; +Human bocavirus 2c PK;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511882; +Human bocavirus 3;Bocaparvovirus primate1;Bocaparvovirus;Parvoviridae;638313; +Human bocavirus 4 NI;Bocaparvovirus primate2;Bocaparvovirus;Parvoviridae;1511883; +Human erythrovirus V9;Human erythrovirus V9;Erythroparvovirus;Parvoviridae;72197; +Human parvovirus 4 G1;Tetraparvovirus primate1;Tetraparvovirus;Parvoviridae;1511919; +Parvovirus NIH-CQV;Parvovirus NIH-CQV;;Parvoviridae;1341019; +Orthobunyavirus bwambaense;Orthobunyavirus bwambaense;Orthobunyavirus;Peribunyaviridae;3052384; +California encephalitis virus;Orthobunyavirus;Orthobunyavirus ;Peribunyaviridae;35305; +Catu virus;Orthobunyavirus catuense;Orthobunyavirus;Peribunyaviridae;1678225; +Fort Sherman virus;Orthobunyavirus shermanense;Orthobunyavirus;Peribunyaviridae;273345; +Guaroa virus;Orthobunyavirus guaroaense;Orthobunyavirus;Peribunyaviridae;80941; +Ilesha virus;Orthobunyavirus ileshaense;Orthobunyavirus;Peribunyaviridae;273341; +Madrid virus;Orthobunyavirus madridense;Orthobunyavirus;Peribunyaviridae;348013; +Alenquer virus;Phlebovirus alenquerense;Phlebovirus;Phenuiviridae;629726; +Chandiru virus;Phlebovirus candiruense;Phlebovirus;Phenuiviridae;629725; +Cocle virus;Phlebovirus cocleense;Phlebovirus;Phenuiviridae;1649829; +Dar es Salaam virus TZ-189;Tanzavirus daressalaamense;Tanzavirus;Phenuiviridae;2576944; +Echarate virus;Phlebovirus echarateense;Phlebovirus;Phenuiviridae;1000646; +Heartland virus;Bandavirus heartlandense;Bandavirus;Phenuiviridae;1216928; +Maldonado virus;Phlebovirus maldonadoense;Phlebovirus;Phenuiviridae;1004889; +Punta Toro virus;Phlebovirus toroense;Phlebovirus;Phenuiviridae;11587; +Sandfly fever Turkey virus;Phlebovirus siciliaense;Phlebovirus;Phenuiviridae;688699; +Severe fever with thrombocytopenia virus;Bandavirus dabieense;Bandavirus;Phenuiviridae;1003835; +SFTS virus HB29;Bandavirus dabieense;Bandavirus;Phenuiviridae;992212; +aichivirus A1;Aichivirus A;Kobuvirus;Picornaviridae;1313215; +Cosavirus A;Cosavirus A;Cosavirus;Picornaviridae;1330491; +Cosavirus D;Cosavirus D;Cosavirus;Picornaviridae;2003650; +Cosavirus E;Cosavirus E;Cosavirus;Picornaviridae;2003651; +Cosavirus F;Cosavirus F;Cosavirus;Picornaviridae;2003652; +Cosavirus JMY-2014;Cosavirus JMY-2014;Cosavirus;Picornaviridae;1582094; +Coxsackievirus B3;Enterovirus B;Enterovirus;Picornaviridae;12072; +enterovirus A114;Enterovirus A;Enterovirus;Picornaviridae;2760809; +Human cosavirus;Human cosavirus;Cosavirus;Picornaviridae;1233383; +Human cosavirus B;Cosavirus B;Cosavirus;Picornaviridae;586420; +rosavirus A2;Rosavirus A;Rosavirus;Picornaviridae;1511807; +Salivirus A;Salivirus A;Salivirus;Picornaviridae;1330524; +Salivirus FHB;Salivirus FHB;Salivirus;Picornaviridae;1547495; +Salivirus NG-J1;Salivirus A;Salivirus;Picornaviridae;651733; +Encephalomyocarditis virus;Encephalomyocarditis virus;Cardiovirus;Picornaviridae;12104; +Hepatovirus A;Hepatitis A virus;Hepatovirus;Picornaviridae;12092; +Human polyomavirus 6;Deltapolyomavirus sextihominis;Deltapolyomavirus;Polyomaviridae;746830; +Human polyomavirus 7;Deltapolyomavirus septihominis;Deltapolyomavirus;Polyomaviridae;746831; +Human polyomavirus 9;Alphapolyomavirus nonihominis;Alphapolyomavirus;Polyomaviridae;943908; +LI polyomavirus;Alphapolyomavirus quardecihominis;Alphapolyomavirus;Polyomaviridae;1965344; +Merkel cell polyomavirus;Alphapolyomavirus quintihominis;Alphapolyomavirus;Polyomaviridae;493803; +MW polyomavirus;Deltapolyomavirus decihominis;Deltapolyomavirus;Polyomaviridae;1203539; +New Jersey polyomavirus-2013;Alphapolyomavirus terdecihominis;Alphapolyomavirus;Polyomaviridae;1497391; +STL polyomavirus;Deltapolyomavirus undecihominis;Deltapolyomavirus;Polyomaviridae;1277649; +Trichodysplasia spinulosa-associated polyomavirus;Alphapolyomavirus octihominis;Alphapolyomavirus;Polyomaviridae;862909; +BK polyomavirus MM;BK polyomavirus;Betapolyomavirus;Polyomaviridae;1417981; +Betapolyomavirus tertihominis;KI Polyomavirus;Betapolyomavirus;Polyomaviridae;1891764; +Merkel cell polyomavirus;Merkel cell polyomavirus;Orthopolyomavirus;Polyomaviridae;493803; +WU Polyomavirus;WU polyomavirus;Betapolyomavirus;Polyomaviridae;440266; +Akhmeta virus;Akhmeta virus;Orthopoxvirus;Poxviridae;2200830; +Monkeypox virus;Monkeypox virus;Orthopoxvirus;Poxviridae;10244; +NY_014 poxvirus;NY_014 poxvirus;Centapoxvirus;Poxviridae;2025360; +Molluscum contagiosum virus subtype 1;Molluscum contagiosum virus;Molluscipoxvirus;Poxviridae;10280; +Orf virus;Orf virus;Parapoxvirus;Poxviridae;10258; +Yaba monkey tumor virus;Yaba monkey tumor virus;Yatapoxvirus;Poxviridae;38804; +Yaba-like disease virus;Yaba-like disease virus;Yatapoxvirus;Poxviridae;132475; +Human lung-associated vientovirus FB;Vientovirus;Torbevirus;Redondoviridae;2571082; +Banana virus X;Banna virus;Bannavirus;Reoviridae;307671; +Eyach virus;Eyach virus;Coltivirus;Reoviridae;62352; +Rotavirus A;Rotavirus A;Rotavirus;Reoviridae;28875; +Rotavirus C;Rotavirus C;Rotavirus;Reoviridae;36427; +Central cimpanzee simian foamy virus;Central cimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170194; +Eastern chimpanzee simian foamy virus;Eastern chimpanzee simian foamy virus;Simiispumavirus;Retroviridae;2170195; +Guenon simian foamy virus;Guenon simian foamy virus;Simiispumavirus;Retroviridae;2170197; +Human endogenous retrovirus K113;Human endogenous retrovirus K;;Retroviridae;166122; +Human immunodeficiency virus 1;Human immunodeficiency virus 1;Lentivirus;Retroviridae;11676; +Human immunodeficiency virus 2;Human immunodeficiency virus 2;Lentivirus;Retroviridae;11709; +Human T-lymphotropic virus 4;Human T-lymphotropic virus 4;Deltaretrovirus;Retroviridae;318279; +Human foamy virus;Human foamy virus;Spumavirus;Retroviridae;11641; +Tibrovirus congo;Tibrovirus congo;Tibrovirus;Rhabdoviridae;1987017; +Chandipura virus;Vesiculovirus chandipura;Vesiculovirus;Rhabdoviridae;11272; +Lyssavirus duvenhage;Lyssavirus duvenhage;Lyssavirus;Rhabdoviridae;38767; +Ekpoma virus 1;Tibrovirus alphaekpoma;Tibrovirus;Rhabdoviridae;1987020; +Ekpoma virus 2;Tibrovirus betaekpoma;Tibrovirus;Rhabdoviridae;1987021; +European bat lyssavirus 2;Lyssavirus helsinki;Lyssavirus;Rhabdoviridae;57483; +Le Dantec virus;Ledantevirus ledantec;Ledantevirus;Rhabdoviridae;318848; +Mundri virus;Mundri virus;;Rhabdoviridae;2913478; +Lebombo virus;Lebombo virus;Orbivirus;Sedoreoviridae;40057; +Orungo virus;Orungo virus;Orbivirus;Sedoreoviridae;40058; +Human associated huchismacovirus 1;Human associated huchismacovirus 1;Huchismacovirus;Smacoviridae;2169934; +Human associated huchismacovirus 2;Human associated huchismacovirus 2;Huchismacovirus;Smacoviridae;2169935; +Human associated huchismacovirus 3;Human associated huchismacovirus 3;Huchismacovirus;Smacoviridae;2169936; +Human associated porprismacovirus;Inpeasmacovirus humas1;Inpeasmacovirus;Smacoviridae;2530494; +Human associated porprismacovirus 3;Porprismacovirus humas4;Porprismacovirus;Smacoviridae;2496633; +Human feces smacovirus 2;Porprismacovirus humas1;Porprismacovirus;Smacoviridae;1820158; +Human feces smacovirus 3;Porprismacovirus humas3;Porprismacovirus;Smacoviridae;1820159; +Human smacovirus 1;Human smacovirus 1;Huchismacovirus;Smacoviridae;1595998; +Mammalian orthoreovirus 3 Dearing;Mammalian orthoreovirus;Orthoreovirus;Spinareoviridae;10886; +Ross River virus;Ross River virus;Alphavirus;Togaviridae;11029; +"Chikungunya virus strain=S27-African prototype";Chikungunya virus;Alphavirus;Togaviridae ;37124; +Human torovirus;Human torovirus;Torovirus;Toroviridae;67605; +Circo-like virus-Brazil hs1;Circo-like virus-Brazil;;;1346815; +Hudisavirus sp.;Hudisavirus sp.;;;2021738; From 0ff8eede297da7ae6bcc66a9470c0e3abf4c70ce Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Wed, 10 Jul 2024 10:35:32 +0200 Subject: [PATCH 09/25] screen pathogens for short reads and update moduels of extractcentrifugereads and extractdiamondreads --- .../test_data/reference/accession2taxid.map | 102 + assets/test_data/reference/reference.fna | 5826 +++++++++++++++++ conf/modules.config | 31 +- conf/test.config | 1 + conf/test_full.config | 12 +- conf/test_taxid.config | 4 +- modules.json | 42 +- modules/local/extractcentrifugereads.nf | 3 + modules/local/extractdiamondreads.nf | 3 + .../nf-core/samtools/flagstat/environment.yml | 8 + modules/nf-core/samtools/flagstat/main.nf | 46 + modules/nf-core/samtools/flagstat/meta.yml | 51 + .../samtools/flagstat/tests/main.nf.test | 36 + .../samtools/flagstat/tests/main.nf.test.snap | 32 + .../nf-core/samtools/flagstat/tests/tags.yml | 2 + .../nf-core/samtools/idxstats/environment.yml | 8 + modules/nf-core/samtools/idxstats/main.nf | 48 + modules/nf-core/samtools/idxstats/meta.yml | 52 + .../samtools/idxstats/tests/main.nf.test | 36 + .../samtools/idxstats/tests/main.nf.test.snap | 32 + .../nf-core/samtools/idxstats/tests/tags.yml | 2 + .../nf-core/samtools/index/environment.yml | 8 + modules/nf-core/samtools/index/main.nf | 48 + modules/nf-core/samtools/index/meta.yml | 57 + .../samtools/index/tests/csi.nextflow.config | 7 + .../nf-core/samtools/index/tests/main.nf.test | 87 + .../samtools/index/tests/main.nf.test.snap | 74 + modules/nf-core/samtools/index/tests/tags.yml | 2 + modules/nf-core/samtools/sort/environment.yml | 8 + modules/nf-core/samtools/sort/main.nf | 63 + modules/nf-core/samtools/sort/meta.yml | 71 + .../nf-core/samtools/sort/tests/main.nf.test | 104 + .../samtools/sort/tests/main.nf.test.snap | 114 + .../samtools/sort/tests/nextflow.config | 8 + modules/nf-core/samtools/sort/tests/tags.yml | 3 + .../nf-core/samtools/stats/environment.yml | 8 + modules/nf-core/samtools/stats/main.nf | 49 + modules/nf-core/samtools/stats/meta.yml | 63 + .../nf-core/samtools/stats/tests/main.nf.test | 65 + .../samtools/stats/tests/main.nf.test.snap | 72 + modules/nf-core/samtools/stats/tests/tags.yml | 2 + nextflow.config | 7 +- nextflow_schema.json | 58 +- .../nf-core/bam_sort_stats_samtools/main.nf | 50 + .../nf-core/bam_sort_stats_samtools/meta.yml | 70 + .../tests/main.nf.test | 134 + .../tests/main.nf.test.snap | 354 + .../bam_sort_stats_samtools/tests/tags.yml | 2 + .../nf-core/bam_stats_samtools/main.nf | 32 + .../nf-core/bam_stats_samtools/meta.yml | 43 + .../bam_stats_samtools/tests/main.nf.test | 188 + .../tests/main.nf.test.snap | 350 + .../nf-core/bam_stats_samtools/tests/tags.yml | 2 + .../nf-core/fastq_align_bowtie2/main.nf | 45 + .../nf-core/fastq_align_bowtie2/meta.yml | 67 + .../fastq_align_bowtie2/tests/main.nf.test | 189 + .../tests/main.nf.test.snap | 126 + .../fastq_align_bowtie2/tests/nextflow.config | 8 + .../fastq_align_bowtie2/tests/tags.yml | 2 + ...athogenList.csv => viral_pathogen_list.csv | 0 workflows/metaval.nf | 51 +- 61 files changed, 9008 insertions(+), 60 deletions(-) create mode 100644 assets/test_data/reference/accession2taxid.map create mode 100644 assets/test_data/reference/reference.fna create mode 100644 modules/nf-core/samtools/flagstat/environment.yml create mode 100644 modules/nf-core/samtools/flagstat/main.nf create mode 100644 modules/nf-core/samtools/flagstat/meta.yml create mode 100644 modules/nf-core/samtools/flagstat/tests/main.nf.test create mode 100644 modules/nf-core/samtools/flagstat/tests/main.nf.test.snap create mode 100644 modules/nf-core/samtools/flagstat/tests/tags.yml create mode 100644 modules/nf-core/samtools/idxstats/environment.yml create mode 100644 modules/nf-core/samtools/idxstats/main.nf create mode 100644 modules/nf-core/samtools/idxstats/meta.yml create mode 100644 modules/nf-core/samtools/idxstats/tests/main.nf.test create mode 100644 modules/nf-core/samtools/idxstats/tests/main.nf.test.snap create mode 100644 modules/nf-core/samtools/idxstats/tests/tags.yml create mode 100644 modules/nf-core/samtools/index/environment.yml create mode 100644 modules/nf-core/samtools/index/main.nf create mode 100644 modules/nf-core/samtools/index/meta.yml create mode 100644 modules/nf-core/samtools/index/tests/csi.nextflow.config create mode 100644 modules/nf-core/samtools/index/tests/main.nf.test create mode 100644 modules/nf-core/samtools/index/tests/main.nf.test.snap create mode 100644 modules/nf-core/samtools/index/tests/tags.yml create mode 100644 modules/nf-core/samtools/sort/environment.yml create mode 100644 modules/nf-core/samtools/sort/main.nf create mode 100644 modules/nf-core/samtools/sort/meta.yml create mode 100644 modules/nf-core/samtools/sort/tests/main.nf.test create mode 100644 modules/nf-core/samtools/sort/tests/main.nf.test.snap create mode 100644 modules/nf-core/samtools/sort/tests/nextflow.config create mode 100644 modules/nf-core/samtools/sort/tests/tags.yml create mode 100644 modules/nf-core/samtools/stats/environment.yml create mode 100644 modules/nf-core/samtools/stats/main.nf create mode 100644 modules/nf-core/samtools/stats/meta.yml create mode 100644 modules/nf-core/samtools/stats/tests/main.nf.test create mode 100644 modules/nf-core/samtools/stats/tests/main.nf.test.snap create mode 100644 modules/nf-core/samtools/stats/tests/tags.yml create mode 100644 subworkflows/nf-core/bam_sort_stats_samtools/main.nf create mode 100644 subworkflows/nf-core/bam_sort_stats_samtools/meta.yml create mode 100644 subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test create mode 100644 subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test.snap create mode 100644 subworkflows/nf-core/bam_sort_stats_samtools/tests/tags.yml create mode 100644 subworkflows/nf-core/bam_stats_samtools/main.nf create mode 100644 subworkflows/nf-core/bam_stats_samtools/meta.yml create mode 100644 subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test create mode 100644 subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test.snap create mode 100644 subworkflows/nf-core/bam_stats_samtools/tests/tags.yml create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/main.nf create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/meta.yml create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test.snap create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/tests/nextflow.config create mode 100644 subworkflows/nf-core/fastq_align_bowtie2/tests/tags.yml rename viralPathogenList.csv => viral_pathogen_list.csv (100%) diff --git a/assets/test_data/reference/accession2taxid.map b/assets/test_data/reference/accession2taxid.map new file mode 100644 index 0000000..7762521 --- /dev/null +++ b/assets/test_data/reference/accession2taxid.map @@ -0,0 +1,102 @@ +NC_002205.1 518987 +NC_002206.1 518987 +NC_002207.1 518987 +NC_002208.1 518987 +NC_002209.1 518987 +NC_002210.1 518987 +NC_002211.1 518987 +NC_002204.1 518987 +NC_004910.1 130760 +NC_004911.1 130760 +NC_004912.1 130760 +NC_004908.1 130760 +NC_004905.2 130760 +NC_004909.1 130760 +NC_004907.1 130760 +NC_004906.1 130760 +NC_006307.2 11553 +NC_006308.2 11553 +NC_006309.2 11553 +NC_006310.2 11553 +NC_006311.1 11553 +NC_006312.2 11553 +NC_006306.2 11553 +NC_007357.1 93838 +NC_007358.1 93838 +NC_007359.1 93838 +NC_007362.1 93838 +NC_007360.1 93838 +NC_007361.1 93838 +NC_007363.1 93838 +NC_007364.1 93838 +NC_007373.1 335341 +NC_007372.1 335341 +NC_007371.1 335341 +NC_007366.1 335341 +NC_007369.1 335341 +NC_007368.1 335341 +NC_007367.1 335341 +NC_007370.1 335341 +NC_002023.1 211044 +NC_002021.1 211044 +NC_002022.1 211044 +NC_002017.1 211044 +NC_002019.1 211044 +NC_002018.1 211044 +NC_002016.1 211044 +NC_002020.1 211044 +NC_007378.1 488241 +NC_007375.1 488241 +NC_007376.1 488241 +NC_007374.1 488241 +NC_007381.1 488241 +NC_007382.1 488241 +NC_007377.1 488241 +NC_007380.1 488241 +NC_026422.1 1332244 +NC_026423.1 1332244 +NC_026424.1 1332244 +NC_026425.1 1332244 +NC_026426.1 1332244 +NC_026429.1 1332244 +NC_026427.1 1332244 +NC_026428.1 1332244 +NC_026438.1 641809 +NC_026435.1 641809 +NC_026437.1 641809 +NC_026433.1 641809 +NC_026436.1 641809 +NC_026434.1 641809 +NC_026431.1 641809 +NC_026432.1 641809 +NC_036616.1 1173138 +NC_036615.1 1173138 +NC_036619.1 1173138 +NC_036618.1 1173138 +NC_036617.1 1173138 +NC_036620.1 1173138 +NC_036621.1 1173138 +NC_060925.1 9606 +NC_060926.1 9606 +NC_060927.1 9606 +NC_060928.1 9606 +NC_060929.1 9606 +NC_060930.1 9606 +NC_060931.1 9606 +NC_060932.1 9606 +NC_060933.1 9606 +NC_060934.1 9606 +NC_060935.1 9606 +NC_060936.1 9606 +NC_060937.1 9606 +NC_060938.1 9606 +NC_060939.1 9606 +NC_060940.1 9606 +NC_060941.1 9606 +NC_060942.1 9606 +NC_060943.1 9606 +NC_060944.1 9606 +NC_060945.1 9606 +NC_060946.1 9606 +NC_060947.1 9606 +NC_060948.1 9606 diff --git a/assets/test_data/reference/reference.fna b/assets/test_data/reference/reference.fna new file mode 100644 index 0000000..cf8c4d3 --- /dev/null +++ b/assets/test_data/reference/reference.fna @@ -0,0 +1,5826 @@ +>NC_002205.1 Influenza B virus (B/Lee/1940) segment 2, complete sequence +ATGACGTTGGCTAAAATTGAACTACTAAAGCAGCTGTTAAGGGACAATGAAGCCAAAACGGTGTTGAGACAGACAACGGT +AGACCAATACAACATAATAAGAAAATTCAATACATCAAGAATTGAAAAGAACCCTTCATTAAGAATGAAGTGGGCCATGT +GTTCCAATTTTCCCTTAGCTCTGACCAAGGGTGATATGGCAAATCGAATCCCCTTGGAATACAAGGGAATACAACTTAAA +ACAAATGCTGAAGACATAGGAACTAAAGGACAAATGTGTTCAATAGCAGCAGTTACCTGGTGGAATACATATGGGCCCAT +AGGGGATACTGAAGGGTTTGAAAAGGTCTACGAAAGCTTTTTTCTCAGAAAGATGAGACTTGACAATGCCACTTGGGGCC +GAATAACCTTTGGCCCTGTTGAGAGAGTAAGAAAAAGAGTACTACTAAACCCGCTCACCAAGGAAATGCCCCCAGATGAA +GCGAGCAATGTAATAATGGAAATATTATTCCCTAAAGAAGCAGGAATACCAAGAGAATCTACTTGGATACATAGAGAACT +GATAAAAGAAAAAAGAGAAAAATTGAAGGGAACGATGATAACTCCCATTGTACTGGCATACATGCTTGAGAGAGAACTAG +TTGCCCGAAGAAGGTTCCTGCCAGTAGCAGGAGCAACATCAGCAGAGTTCATAGAAATGCTACATTGCTTACAAGGTGAA +AATTGGAGACAAATATATCATCCAGGAGGGAATAAACTAACTGAATCTAGATCTCAATCAATGATTGTAGCTTGCAGGAA +GATAATCAGAAGATCAATAGTTGCATCAAACCCACTAGAGCTAGCTGTAGAGATTGCAAATAAGACTGTGATAGACACTG +AACCTTTAAAATCATGTCTGGCAGCCCTGGATGGAGGTGATGTAGCCTGTGACATAATAAGAGCTGCATTAGGATTAAAA +ATTAGACAAAGACAAAGATTTGGGAGACTTGAACTAAAGAGAATATCAGGAAGAGGATTCAAAAATGATGAAGAGATATT +AATCGGAAACGGAACAATACAAAAGATTGGAATATGGGACGGAGAAGAGGAATTCCATGTAAGATGTGGCGAATGCAGGG +GGATATTGAAAAAAAGCCAAATGAGAATGGAAAAACTACTGATAAATTCAGCCAAAAAGGAGGACATGAAAGATTTAATA +ATCTTATGCATGGTATTTTCTCAAGACACTAGGATGTTCCAAGGAGTGAGAGGAGAGATAAATTTTCTTAATCGAGCAGG +CCAACTTTTATCCCCCATGTACCAACTCCAACGATACTTTCTGAATAGGAGCAATGACCTTTTTGATCAATGGGGATATG +AGGAATCACCTAAAGCAAGTGAGCTACATGGGATAAATGAATTAATGAATGCATCTGACTATACATTGAAAGGGGTTGTA +GTAACAAAAAATGTGATTGATGATTTTAGTTCTACTGAAACAGAAAAAGTATCTATAACAAAAAATCTTAGTTTAATAAA +AAGGACTGGGGAAGTTATAATGGGAGCCAATGACGTAAGTGAATTAGAATCACAAGCACAGCTAATGATAACGTATGATA +CACCCAAGATGTGGGAAATGGGAACAACCAAAGAACTGGTACAAAACACTTACCAATGGGTGCTTAAAAATTTAGTAACA +TTGAAGGCTCAGTTTCTTTTGGGAAAAGAAGACATGTTCCAATGGGATGCATTTGAAGCATTTGAAAGCATAATCCCTCA +GAAGATGGCTGGTCAGTACAGTGGATTTGCAAGAGCAGTGCTCAAACAAATGAGAGACCAAGAGGTTATGAAAACTGACC +AATTCATAAAATTGTTGCCTTTCTGTTTTTCGCCACCAAAATTAAGGAGCAATGGAGAGCCTTATCAATTTTTGAGGCTT +ATGCTGAAAGGAGGAGGGGAAAATTTCATCGAAGTAAGGAAAGGGTCCCCCTTGTTCTCCTACAATCCACAAACGGAAAT +CCTAACTATATGCGGCAGAATGATGTCATTAAAAGGAAAAATTGAGGATGAAGAAAGAAATAGATCAATGGGGAATGCAG +TACTGGCAGGCTTTCTTGTTAGTGGCAAATATGACCCTGATCTTGGAGATTTCAAAACCATTGAGGAACTTGAAAGACTA +AAACCGGGAGAAAAAGCCAACATCTTACTTTACCAAGGAAAGCCCGTTAAAGTAGTTAAAAGGAAAAGATATAGTGCTTT +ATCCAATGATATTTCACAAGGGATTAAGAGACAAAGAATGACAGTTGAGTCCATGGGGTGGGCCTTGAGCTAA +>NC_002206.1 Influenza B virus (B/Lee/1940) segment 3, complete sequence +ATGGATACTTTTATTACAAAGAATTTCCAGACTACAATAATACAAAAGGCCAAAAACACAATGGCAGAATTTAGTGAAGA +TCCTGAATTACAGCCAGCAGTACTATTCAACATCTGCGTCCATCTGGAGGTCTGCTATGTAATAAGTGATATGAACTTTC +TTGATGAGGAAGGAAAGACATATACAGCATTAGAAGGACAAGGAAAAGAGCAAAATTTGAGACCACAGTATGAAGTGATT +GAGGGAATGCCAAGAAACATAGCATGGATGGTTCAAAGATCCTTAGCCCAAGAGCATGGAATAGAGACTCCAAGGTATCT +GGCTGATTTATTTGATTATAAAACCAAGAGGTTTATCGAAGTCGGAATAACAAAGGGATTGGCTGATGATTACTTTTGGA +AAAAGAAAGAAAAGTTGGGGAATAGCATGGAACTGATGATATTCAGCTACAATCAAGACTACTCGTTAAGTGATGAATCT +TCATTGGATGAGGAAGGAAAAGGGAGAGTGCTAAGCAGACTCACAGAACTTCAGGCTGAGTTAAGTTTGAAAAACCTATG +GCAAGTTCTAATAGGGGAAGAAGAAATTGAAAAAGGAATTGACTTCAAACTTGGACAAACAATATCTAAACTGAGGAATA +TATCTGTTCCAGCTGGTTTCTCCAATTTTGAAGGGATGAGAAGTTACATAGACAACATAGACCCTAAAGGAGCAATAGAG +AGAAATCTAGCAAGGATGTCTCCCTTAGTATCAGTTACACCCAAAAAGTTGAAATGGGAGGACCTGAGACCCATAGGGCC +TCACATTTACAACCATGAGCTACCAGAAGTTCCATATAATGCCTTTCTCCTCATGTCTGATGAGTTGGGGCTGGCCAATA +TGACTGAAGGAAAGTCCAAGAAACCGAAGACCTTAGCTAAGGAATGTCTAGAAAGGTATTCAACACTACGTGATCAAACT +GACCCAATATTGATAATGAAAAGCGAAAAAGCTAACGAAAACTTCTTATGGAGGTTATGGAGGGACTGTGTAAATACAAT +AAGCAATGAGGAAACAGGCAACGAATTACAGAAAACCAATTATGCCAAGTGGGCCACAGGAGATGGACTAACATACCAAA +AAATAATGAAAGAAGTAGCAATAGATGACGAAACGATGTACCAAGAAGAACCCAAAATACCCAATAAATGTAGAGTGGCT +GCTTGGGTTCAGGCAGAGATGAATCTACTGAGTACTCTGACAAGTAAAAGGGCCCTGGATCTGCCAGAAATAGGGCCAGA +TGTAGCACCCGTGGAGCATGTAGGGAGTGAAAGAAGGAAATACTTTGTTAATGAAATCAACTACTGTAAAGCCTCTACAG +TTATGATGAAGTATGTACTTTTTCACACTTCATTATTAAATGAAAGCAATGCTAGTATGGGAAAATATAAAGTAATACCA +ATCACCAACAGAGTGGTAAATGAAAAAGGGGAAAGCTTTGACATGCTTTATGGTCTGGCGGTTAAGGGGCAATCTCATTT +GCGGGGGGACACGGATGTTGTAACAGTTGTGACTTTCGAGTTTAGTAGTACAGATCCTAGAGTGGACTCAGGAAAGTGGC +CAAAATATACTGTCTTTAAAATTGGCTCCCTATTTGTGAGTGGAAGAGAAAAACCTGTGTACCTATATTGCCGAGTGAAT +GGTACAAACAAAATCCAAATGAAATGGGGAATGGAAGCTAGAAGATGTCTGCTTCAATCAATGCAACAAATGGAGGCAAT +TGTTGATCAAGAATCATCGATACAAGGGTATGATATGACCAAAGCTTGTTTCAAGGGAGACAGAGTGAATAATCCCAAAA +CTTTCAGTATTGGGACTCAGGAAGGCAAACTAGTAAAAGGGTCCTTTGGGAAAGCACTAAGAGTAATATTCACCAAATGT +TTGATGCATTATGTATTTGGAAATGCTCAATTGGAGGGGTTTAGTGCCGAATCTAGGAGACTTCTACTGTTAATTCAGGC +ATTAAAAGACAGGAAGGGCCCTTGGGTATTTGACTTGGAGGGAATGTACTTTGGAGTAGAGGAATGTATTAGTAACAATC +CTTGGGTAATACAGAGTGCATACTGGTTTAATGAATGGTTGGGCATTGAAAAAGAAGGAAGTAAAGTGTTAGAATCAATA +GATGAAATAATGGATGAATGAACGAAGGGCATAGCGCTCAATTT +>NC_002207.1 Influenza B virus (B/Lee/1940) segment 4, complete sequence +AGCAGAAGCGTTGCATTTTCTAATATCCACAAAATGAAGGCAATAATTGTACTACTCATGGTAGTAACATCCAATGCAGA +TCGAATCTGCACTGGGATAACATCGTCAAACTCACCTCATGTGGTTAAAACTGCCACTCAAGGGGAAGTCAATGTGACTG +GTGTGATACCACTAACAACAACACCTACCAAATCTCATTTTGCAAATCTCAAAGGAACACAGACCAGAGGAAAACTATGC +CCAAACTGTTTTAACTGCACAGATCTGGACGTGGCCCTAGGCAGACCAAAATGCATGGGGAACACACCCTCCGCAAAAGT +CTCAATACTCCATGAAGTCAAACCTGCTACATCTGGATGCTTTCCTATAATGCACGACAGAACAAAAATCAGACAACTAC +CTAATCTTCTCAGAGGATATGAAAACATCAGGTTATCAACCAGTAATGTTATCAATACAGAGACGGCACCAGGAGGACCC +TACAAGGTGGGGACCTCAGGATCTTGCCCTAACGTTGCTAATGGGAACGGCTTCTTCAACACAATGGCTTGGGTTATCCC +AAAAGACAACAACAAGACAGCAATAAATCCAGTAACAGTAGAAGTACCATACATTTGTTCAGAAGGGGAAGACCAAATTA +CTGTTTGGGGGTTCCACTCTGATGACAAAACCCAAATGGAAAGACTCTATGGAGACTCAAATCCTCAAAAGTTCACCTCA +TCTGCCAATGGAGTAACCACACATTATGTTTCTCAGATTGGTGGCTTCCCAAATCAAACAGAAGACGAAGGGCTAAAACA +AAGCGGCAGAATTGTTGTTGATTACATGGTACAAAAACCTGGAAAAACAGGAACAATTGTTTATCAAAGAGGCATTTTAT +TGCCTCAAAAAGTGTGGTGCGCAAGTGGCAGGAGCAAGGTAATAAAAGGGTCCTTGCCTTTAATTGGTGAAGCAGATTGC +CTCCACGAAAAGTACGGTGGATTAAATAAAAGCAAGCCTTACTACACAGGAGAGCATGCAAAGGCCATAGGAAATTGCCC +AATATGGGTGAAAACACCCTTGAAGCTGGCCAATGGAACCAAATATAGACCGCCTGCAAAACTATTAAAGGAAAGAGGTT +TCTTCGGAGCTATTGCTGGTTTCTTGGAAGGAGGATGGGAAGGAATGATTGCAGGTTGGCACGGATACACATCTCATGGA +GCACATGGAGTGGCAGTGGCAGCAGACCTTAAGAGTACACAAGAAGCTATAAACAAGATAACAAAAAATCTCAACTATTT +AAGTGAGCTAGAAGTAAAAAACCTTCAAAGACTAAGCGGAGCAATGAATGAGCTTCACGACGAAATACTCGAGCTAGACG +AAAAAGTGGATGATCTAAGAGCTGATACAATAAGCTCACAAATAGAGCTTGCAGTCTTGCTTTCCAACGAAGGGATAATA +AACAGTGAAGATGAGCATCTCTTGGCACTTGAAAGAAAACTGAAGAAAATGCTTGGCCCCTCTGCTGTAGAAATAGGGAA +TGGGTGCTTTGAAACCAAACACAAATGCAACCAGACTTGCCTAGACAGGATAGCTGCTGGCACCTTTAATGCAGGAGATT +TTTCTCTTCCCACTTTTGATTCATTAAACATTACTGCTGCATCTTTAAATGATGATGGCTTGGATAATCATACTATACTG +CTCTACTACTCAACTGCTGCTTCTAGCTTGGCTGTAACATTAATGATAGCTATCTTCATTGTCTACATGGTCTCCAGAGA +CAATGTTTCTTGTTCCATCTGTCTGTGAGGGAGATTAAGCCCTGTGTTTTCCTTTACTGTAGTGCTCATTTGCTTGTCAC +CATTACAAAGAAACGTTATTGAAAAATGCTCTTGTTACTACT +>NC_002208.1 Influenza B virus (B/Lee/1940) segment 5, complete sequence +GGCAGAAGCACAGCATTTTCTTGTGAGCTTCGAGCACTAATAAAACTGAAAATCAAAATGTCCAACATGGATATTGACAG +TATAAATACCGGAACAATCGATAAAACACCAGAAGAACTGACTCCCGGAACCAGTGGGGCAACCAGACCAATCATCAAGC +CAGCAACCCTTGCTCCGCCAAGCAACAAACGAACCCGAAATCCATCTCCAGAAAGGACAACCACAAGCAGTGAAACCGAT +ATCGGAAGGAAAATCCAAAAGAAACAAACCCCAACAGAGATAAAGAAGAGCGTCTACAAAATGGTGGTAAAACTGGGTGA +ATTCTACAACCAGATGATGGTCAAAGCTGGACTTAATGATGACATGGAAAGGAATCTAATTCAAAATGCACAAGCTGTGG +AGAGAATCCTATTGGCTGCAACTGATGACAAGAAAACTGAATACCAAAAGAAAAGGAATGCCAGAGATGTCAAAGAAGGG +AAGGAAGAAATAGACCACAACAAGACAGGAGGCACCTTTTATAAGATGGTAAGAGATGATAAAACCATCTACTTCAGCCC +TATAAAAATTACCTTTTTAAAAGAAGAGGTGAAAACAATGTACAAGACCACCATGGGGAGTGATGGTTTCAGTGGACTAA +ATCACATTATGATTGGACATTCACAGATGAACGATGTCTGTTTCCAAAGATCAAAGGGACTGAAAAGGGTTGGACTTGAC +CCTTCATTAATCAGTACTTTTGCCGGAAGCACACTACCCAGAAGATCAGGTACAACTGGTGTTGCAATCAAAGGAGGTGG +AACTTTAGTGGATGAAGCCATCCGATTTATAGGAAGAGCAATGGCAGACAGAGGGCTACTGAGAGACATCAAGGCCAAGA +CGGCCTATGAAAAGATTCTTCTGAATCTGAAAAACAAGTGCTCTGCGCCGCAACAAAAGGCTCTAGTTGATCAAGTGATC +GGAAGTAGGAACCCAGGGATTGCAGACATAGAAGACCTAACTCTGCTTGCCAGAAGCATGGTAGTTGTCAGACCCTCTGT +AGCGAGCAAAGTGGTGCTTCCCATAAGCATTTATGCTAAAATACCTCAACTAGGATTCAATACCGAAGAATACTCTATGG +TTGGGTATGAAGCCATGGCTCTTTATAATATGGCAACACCTGTTTCCATATTAAGAATGGGAGATGACGCAAAAGATAAA +TCTCAACTATTCTTCATGTCGTGCTTCGGAGCTGCCTATGAAGATCTAAGAGTGTTATCTGCACTAACGGGCACCGAATT +TAAGCCTAGATCAGCACTAAAATGCAAGGGTTTCCATGTCCCGGCTAAGGAGCAAGTAGAAGGAATGGGGGCAGCTCTGA +TGTCCATCAAGCTTCAGTTCTGGGCCCCAATGACCAGATCTGGAGGGAATGAAGTAAGTGGAGAAGGAGGGTCTGGTCAA +ATAAGTTGCAGCCCTGTGTTTGCAGTAGAAAGACCTATTGCTCTAAGCAAGCAAGCTGTAAGAAGAATGCTGTCAATGAA +CGTTGAAGGACGTGATGCAGATGTCAAAGGAAATCTACTCAAAATGATGAATGATTCAATGGCAAAGAAAACCAGTGGAA +ATGCTTTCATTGGGAAGAAAATGTTTCAAATATCAGACAAAAACAAAGTCAATCCCATTGAGATTCCAATTAAGCAGACC +ATCCCCAATTTCTTCTTTGGGAGGGACACAGCAGAGGATTATGATGACCTCGATTATTAAAGCAATAAAATAGACACTAT +GGCTGTGACTGTTTCAGTACGTTTGGGATGTGGGTGTTTACTCTTATTGAAATAAATGTAAAAAATGCTGTTGTTTCTAC +T +>NC_002209.1 Influenza B virus (B/Lee/1940) segment 6, complete sequence +AGCAGAAGCAGAGCATATTCTTAGAACTGAAGTGAACAGGCCAAAAATGAACAATGCTACCTTCAACTGTACAAACATTA +ACCCTATTACTCACATCAGGGGGAGTATTATTATCACTATATGTGTCAGCCTCATTGTCATACTTATTGTATTCGGATGT +ATTGCTAAAATTTTCATCAACAAAAACAACTGCACCAACAATGTCATTAGAGTGCACAAACGCATCAAATGCCCAGACTG +TGAACCATTCTGCAACAAAAGAGATGACATTTCCACCCCCAGAGCCGGAGTGGACATACCCTCGTTTATCTTGCCAGGGC +TCAACCTTTCAGAAGGCACTCCTAATTAGCCCTCATAGGTTCGGAGAGATCAAAGGAAACTCAGCTCCCTTGATAATAAG +AGAACCTTTTGTTGCTTGTGGACCAAAAGAATGCAGACACTTTGCTCTGACCCATTATGCAGCTCAGCCGGGGGGATACT +ACAATGGAACAAGAAAGGACAGAAACAAGCTGAGGCATCTAGTATCAGTCAAATTGGGAAAAATCCCAACTGTGGAAAAC +TCCATTTTCCACATGGCAGCTTGGAGCGGATCCGCATGCCATGATGGTAGAGAATGGACATATATCGGAGTTGATGGTCC +TGACAATGATGCATTGGTCAAAATAAAATATGGAGAAGCATATACTGACACATATCATTCCTATGCACACAACATCCTAA +GAACACAAGAAAGTGCCTGCAATTGCATCGGGGGAGATTGTTATCTTATGATAACAGACGGCTCAGCTTCAGGAATTAGT +AAATGCAGATTTCTTAAAATTAGAGAGGGTCGAATAATAAAAGAAATACTTCCAACAGGAAGAGTGGAGCACACTGAAGA +GTGCACATGCGGGTTCGCCAGCAATAAAACCATAGAATGTGCCTGTAGAGACAACAGTTACACAGCAAAAAGACCCTTTG +TCAAATTAAATGTGGAAACTGATACAGCTGAAATAAGATTGATGTGCACAAAGACTTATCTAGACACTCCCAGACCGGAT +GATGGAAGCATAGCAGGGCCTTGCGAATCTAATGGAGACAAGTGGCTTGGAGGCATCAAAGGAGGATTCGTCCATCAAAG +AATGGCATCTAAGATTGGAAGATGGTACTCCCGAACGATGTCTAAAACTAACAGAATGGGGATGGAACTGTATGTAAAGT +ATGATGGTGACCCATGGACTGACAGTGATGCTCTTACTCTTAGTGGAGTAATGGTTTCCATAGAAGAACCTGGTTGGTAT +TCTTTTGGCTTCGAAATAAAGGACAAGAAATGTGATGTCCCTTGTATTGGGATAGAGATGGTACACGATGGTGGAAAAGA +TACTTGGCATTCAGCTGCAACAGCCATTTACTGTTTGATGGGCTCAGGACAATTGCTATGGGACACTGTCACAGGCGTTG +ATATGGCTTTATAATAGAGGAATGGTTGGATCTGTTCTAAACCCTTTGTTCCTATTTTATTTGAACAGTTGTTCTTACTA +GATTTAATTGTTTCTGAAAAATGCTCTTGTTACTACT +>NC_002210.1 Influenza B virus (B/Lee/1940) segment 7, complete sequence +AGCAGAAGCACGCACTTTCTTAAAATGTCGCTGTTTGGAGACACAATTGCCTACCTGCTTTCACTAATAGAAGATGGAGA +AGGCAAAGCAGAACTAGCTGAAAAATTACACTGTTGGTTCGGTGGGAAAGAATTTGACCTAGATTCTGCTTTGGAATGGA +TAAAAAACAAAAGGTGCCTAACTGATATACAAAAAGCACTAATTGGTGCCTCTATATGCTTTTTAAAACCCAAAGACCAA +GAAAGAAAAAGGAGATTCATCACAGAGCCCCTGTCAGGAATGGGAACAACAGCAACAAAGAAGAAAGGCCTAATTCTAGC +TGAGAGAAAAATGAGAAGATGTGTAAGCTTTCATGAAGCATTTGAAATAGCAGAAGGCCACGAAAGCTCAGCATTACTAT +ATTGTCTTATGGTCATGTACCTAAACCCTGAAAACTATTCAATGCAAGTAAAACTAGGAACGCTCTGTGCTTTATGCGAG +AAACAAGCATCGCACTCGCATAGAGCCCATAGCAGAGCAGCAAGGTCTTCGGTACCTGGAGTAAGACGAGAAATGCAGAT +GGTTTCAGCTATGAACACAGCAAAGACAATGAATGGAATGGGAAAGGGAGAAGACGTCCAAAAACTAGCAGAAGAGCTGC +AAAACAACATTGGAGTGTTGAGATCTCTAGGAGCAAGTCAAAAGAATGGAGAAGGAATTGCCAAAGATGTAATGGAAGTG +CTAAAACAGAGCTCTATGGGAAATTCAGCTCTTGTGAGGAAATACTTATAATGCTCGAACCACTTCAGATTCTTTCAATT +TGTTCTTTCATTTTATCAGCTCTCCATTTCATGGCTTGGACAATAGGGCATTTGAATCAAATAAAAAGAGGGGTAAACTT +GAAAATACAAATAAGGAATCCAAATAAGGAGGCAATAAACAGAGAGGTGTCAATTCTGAGACACAATTACCAAAAGGAAA +TCCAAGCCAAAGAAACAATGAAGAAAATACTCTCTGACAACATGGAAGTATTGGGTGACCACATAGTAGTTGAAGGGCTT +TCAACTGATGAGATAATAAAAATGGGTGAAACAGTTTTGGAGGTGGAAGAATTGCAATGAGCCCAATTTTCACTGTATTT +CTTACTATGCATTTAAGCAAATTGTAATCAATGTCAGTGAATAAAACTGGAAAAAGTGCGTTGTTTCTACT +>NC_002211.1 Influenza B virus (B/Lee/1940) segment 8, complete sequence +CGCAGAAGCAGAGGATTTATTTAGTCACTGGCAAACGGAAAGATGGCGGACAACATGACCACAACACAAATTGAGGTGGG +TCCGGGAGCAACCAATGCCACTATAAACTTTGAAGCAGGAATTCTGGAGTGCTATGAAAGGTTTTCATGGCAAAGAGCCC +TTGACTATCCTGGTCAAGACCGCCTACACAGACTAAAACGAAAATTAGAATCAAGAATAAAGACTCACAACAAGAGTGAG +CCTGAGAATAAAAGGATGTCTCTTGAAGAGAGAAAAGCAATTGGGGTAAAAATGATGAAAGTGCTTCTGTTTATGGATCC +CTCTGCTGGAATTGAAGGGTTTGAGCCATACTGTGTGAAAAATCCCTCAACTAGCAAATGTCCAAATTACGATTGGACCG +ATTACCCTCCAACCCCAGGAAAGTACCTTGATGACATAGAAGAAGAGCCGGAAAATGTCGATCACCCAATTGAGGTAGTA +TTAAGGGACATGAACAATAAAGATGCACGACAAAAGATAAAGGATGAAGTAAACACTCAGAAAGAGGGGAAATTCCGTTT +GACAATAAAAAGGGATATACGTAATGTGTTGTCCTTGAGAGTGTTGGTGAACGGAACCTTCCTCAAGCACCCTAATGGAG +ACAAGTCCTTATCAACTCTTCATAGATTGAATGCATATGACCAGAATGGAGGGCTTGTTGCTAAACTTGTTGCTACTGAT +GATCGGACAGTGGAGGATGAAAAAGATGGCCATCGGATCCTCAACTCACTCTTCGAGCGTTTTGATGAAGGACATTCAAA +GCCAATTCGAGCAGCTGAAACTGCGGTGGGAGTCTTATCCCAATTTGGTCAAGAGCACCGATTATCACCAGAAGAGGGAG +ACAATTAGACTGGCCACGGAAGAACTTTATCTCTTGAGTAAAAGAATTGATGATAGTATATTGTTCCACAAAACAGTAAT +AGCTAACAGCTCCATAATAGCTGACATGATTGTATCATTATCATTACTGGAAACATTGTATGAAATGAAGGATGTGGTTG +AAGTGTACAGCAGGCAGTGCTTATGAATGTAAAATAAAAATCCTCTTGTTACTACT +>NC_002204.1 Influenza B virus RNA 1, complete sequence +AGCAGAAGCGGAGCTTTAAGATGAATATAAATCCATATTTTCTTTTCATAGATGTACCTATACAGGCAGCAATTTCAACA +ACATTCCCATACACCGGTGTTCCCCCTTATTCTCATGGAACGGGAACAGGCTACACAATAGACACCGTGATTAGAACACA +CGAGTACTCAAACAAGGGAAAACAATACATTTCTGATGTTACAGGATGTGTAATGGTAGATCCAACAAATGGGCCATTAC +CCGAAGACAATGAACCGAGTGCCTATGCACAATTGGATTGTGTTCTGGAGGCTTTGGATAGAATGGATGAAGAACATCCA +GGTCTGTTTCAAGCAGGGTCACAGAATGCCATGGAGGCACTAATGGTCACAACAGTGGACAAATTGACTCAGGGGAGACA +GACCTTTGATTGGACGGTGTGTAGAAACCAACCTGCTGCAACGGCACTGAACACAACAATAACCTCTTTTAGGTTGAATG +ATTTAAATGGAGCCGACAAGGGTGGATTAGTGCCCTTTTGCCAAGATATCATTGATTCATTAGACAAACCTGAAATGATT +TTCTTCACAGTAAAGAATATAAAGAAAAAATTGCCTGCTAAAAACAGAAAGGGTTTCCTTATAAAAAGAATACCTATGAA +GGTAAAAGACAGAATAACAAGAGTGGAATACATCAAAAGAGCATTATCATTAAACACAATGACTAAAGATGCTGAAAGAG +GCAAACTAAAAAGAAGAGCAATTGCCACCGCTGGGATACAAATCAGAGGATTTGTATTAGTAGTTGAAAACTTGGCTAAA +AATATCTGTGAAAATCTAGAGCAAAGTGGTTTACCCGTAGGTGGAAACGAAAAGAAGGCCAAACTATCAAATGCAGTGGC +TAAAATGCTCAGTAATTGTCCACCAGGAGGGATCAGTATGACTGTGACAGGAGACAATACTAAATGGAATGAATGCTTAA +ATCCAAGAATCTTTTTGGCTATGACTGAAAGAATAACCAGAGACAGCCCAATTTGGTTCCGGGATTTTTGTAGTATAGCA +CCGGTCTTGTTCTCCAATAAAATAGCTAGATTGGGAAAAGGGTTCATGATAACAAGTAAAACAAAAAGACTAAAAGCTCA +AATACCTTGTCCCGATCTGTTTAATATACCATTAGAAAGATATAATGAAGAAACAAGGGCAAAACTGAAAAAGCTAAAAC +CTTTCTTCAATGAAGAAGGAACGGCATCTCTTTCGCCAGGAATGATGATGGGAATGTTTAATATGCTATCTACAGTATTA +GGAGTAGCCGCACTAGGGATAAAAAACATTGGAAACAAAGAATACTTATGGGATGGACTGCAGTCTTCGGATGATTTTGC +TCTGTTTGTTAATGCAAAAGATGAAGAGACATGTATGGAAGGAATAAACGATTTTTACCGAACATGTAAGCTATTGGGAA +TAAACATGAGCAAAAAGAAAAGTTACTGTAATGAAACTGGGATGTTTGAATTTACCAGCATGTTTTACAGAGATGGATTT +GTATCTAATTTTGCAATGGAACTCCCTTCATTTGGAGTCGCTGGAGTGAATGAATCAGCAGACATGGCAATAGGAATGAC +AATAATAAAGAACAATATGATCAACAATGGGATGGGCCCAGCAACGGCACAAACAGCCATACAATTATTCATAGCTGACT +ATAGATACACCTACAAATGCCACAGGGGAGATTCCAAAGTGGAAGGGAAGAGAATGAAAATTATAAAGGAGCTATGGGAA +AACACTAAAGGAAGAGATGGTCTATTAGTAGCAGATGGTGGGCCTAATCTTTACAATTTGAGAAACCTGCATATTCCAGA +AATAATATTAAAATACAACATAATGGACCCTGAGTACAAAGGACGGTTACTGCATCCTCAAAATCCCTTTGTAGGACATT +TGTCTATTGAGGGTATCAAAGAAGCAGATATAACACCTGCACATGGCCCAATAAAGAAAATGGACTACGATGCGGTATCT +GGAACTCATAGTTGGAGAACCAAAAGGAACAGATCTATACTAAACACTGATCAGAGGAACATGATTCTTGAGGAACAATG +CTACGCTAAGTGTTGCAACCTTTTTGAGGCTTGCTTTAACAGTGCGTCATACAGGAAACCAGTAGGCCAGCACAGCATGC +TTGAAGCTATGGCCCACAGATTAAGAATGGATGCACGACTGGACTATGAGTCAGGAAGGATGTCAAAAGAGGATTTCGAA +AAAGCAATGGCTCACCTTGGTGAGATTGGGTACATGTAAGCTCCGGAAATGTCTATGGGGTTATTGGTCATCGTTGAATA +CATGCGGTGCACAAATGATTAAAATGAAAAAAGGCTCGTGTTTCTACT +>NC_004910.1 Influenza A virus pb2 gene for polymerase Pb2, genomic RNA, strain A/Hong Kong/1073/99(H9N2) +GCCAAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAACTAAGAAATTTGATGTCGCAATCTCGCACTCGCGA +GATACTGACAAAAACCACTGTGGATCATATGGCCATAATTAAGAAGTACACATCAGGAAGACAGGAGAAGAATCCCGCTC +TTAGAATGAAATGGATGATGGCGATGAAATACCCGATCACAGCTGACAAAAGAATAATGGAGATGATCCCTGAAAGGAAT +GAGCAAGGCCAAACTCTTTGGAGCAAAACAAATGACGCTGGATCAGACAGGGTAATGGTATCACCTCTGGCTGTAACGTG +GTGGAACAGAAATGGACCAACAACAAGTACAGTCCATTATCCAAAGGTGTATAAAACCTACTTTGAAAAGGTTGAAAGAT +TAAAACACGGAACCTTTGGCCCTGTTCATTTCCGGAATCAAGTCAAAATACGCCGCAGGGTTGACATGAACCCTGGCCAT +GCAGATCTCAGCGCTAAAGAAGCACAAGATGTCATCATGGAGGTCGTTTTCCCAAATGAAGTTGGAGCCAGGATATTGAC +ATCAGAATCACAGCTGACAATAACAAAGGAAAAGAGGGAGGAACTCAAGAATTGTAATATTGCTCCTTTAATGGTGGCAT +ATATGTTGGAAAGAGAATTGGTTCGCAAGACCAGATTCCTACCCGTGGCTGGCGGGACAAGCAGCGTATATATAGAAGTA +TTGCATTTGACTCAAGGAACTTGCTGGGAGCAGATGTACACACCAGGAGGGGAGGTAAGAAATGATGATGTTGACCAAAG +TTTAATCATTGCTGCTAGGAACATTGTCAGGAGAGCAACAGTATCAGCAGACCCATTGGCTTCACTCCTGGAAATGTGCC +ATAGCACACAAATTGGCGGAGTAAGAATGGTAGACATCCTTAAACAAAACCCAACAGAAGAGCAAGCTGTAGATATATGC +AAGGCAGCAATGGGTTTGAAAATCAGCTCATCCTTCAGCTTTGGAGGGTTCACTTTCAAAAGAACAAAGGGGTCTTCTGT +CAAAAGAGAGGAAGAAGTGCTTACAGGCAACCTCCAAACATTGAAGATAAAAGTACATGAAGGATATGAGGAATTCACAA +TGGTTGGACGAAGAGCAACAGCCATTCTAAGAAAAGCAACCAGAAGGATGATCCAACTGATAGTCAGCGGAAGGGACGAG +CAATCAATTGCTGAGGCAATTATTGTGGCAATGGTGTTCTCACAAGAAGATTGCATGGTAAAGGCAGTCCGAGGTGATTT +GAATTTCGTAAACAGAGCAAATCAACGACTGAATCCCATGCACCAACTCCTGAGACACTTTCAAAAGGATGCAAAGGTGC +TGTTTCAAAACTGGGGAATTGAACCCATCGACAATGTCATGGGTATGATTGGAATATTGCCTGACATGACCCCCAGCACG +GAAATGTCACTAAGAGGAGTGAGAGTTAGCAAAATGGGGGTGGATGAATATTCTAGCACTGAAAGGGTGGTCGTGAGCAT +TGACCGTTTCTTAAGGGTCCGAGATCAGCGAGGAAATGTACTCCTATCCCCTGAAGAAGTTAGTGAAACACAGGGAATGG +AAAAGTTGACGATAACTTATTCATCGTCTATGATGTGGGAGATTAACGGGCCAGAATCAGTGCTAGTTAACACATATCAA +TGGATCATTAGGAATTGGGAGACTGTAAAGATCCAATGGTCCCAAGAACCCACCATGCTATACAATAAGATGGAGTTTGA +ACCATTTCAATCTTTAGTACCAAAGGCTGCCAGAAGCCAATATAGTGGATTTGTGAGAACGCTATTCCAGCAGATGCGTG +ATGTTTTGGGAACGTTCGACACTGTTCAAATAATCAAACTACTACCATTTGCAGCAGCCCCACCGGAACAGAGTAGGATG +CAATTTTCTTCTCTGACTGTGAATGTGAGGGGATCAGGAATGAGAATACTTGTGAGAGGTAACTCCCCTGCATTTAACTA +CAACAAGACAACTAAGAGGCTTACAATACTTGGGAAGGACGCAGGTGCGCTTACAGAGGACCCAGATGAAGGAACAGCAG +GAGTAGAGTCTGCAGTATTGAGAGGATTTCTAATCCTCGGCAAAGAAGACAAAAGATATGGACCAGCATTAAGCATCAAT +GAACTGAGCAATCTTACGAAAGGGGAGAAAGCTAATGTATTGATAGGGCAAGGAGACGTAGTGTTGGTAATGAAACGGAA +ACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTCGAATTGTTT +AAAAACGACCTTGTTTCTACT +>NC_004911.1 Influenza A virus pb1 gene for polymerase Pb1, genomic RNA, strain A/Hong Kong/1073/99(H9N2) +GCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCAGCGCAAAATGCAATAAGT +ACCACATTCCCTTATACTGGAGATCCCCCATATAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAACAGAAC +ACATCAATATTCAGAAAAAGGGAGGTGGACAACAAACACAGAGACCGGAGCACCCCAACTCAACCCTATTGATGGACCAT +TACCTGAAGACAATGAGCCGAGCGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCAC +CCAGGACTCTTTGAAAACTCATGTCTTGAAACGATGGAAGTTGTCCAGCAAACGAGAGTGGATAAGCTGACCCAAGGTCG +CCAGACTTATGACTGGACATTGAATAGAAACCAGCCGGCTGCAACTGCTTTGGCCAACACCATAGAAGTATTCAGATCGA +ACGGTCTAACAGCCAATGAGTCAGGAAGGTTAATAGATTTCCTCAAGGACGTAATGGAATCAATGGATAAGGAAGAAATG +GAAATAACAACACATTTCCAGAGAAAGAGAAGAGTGAGGGACAACATGACCAAGAAAATGGTCACACAAAGAACAATAGG +GAAGAAGAAGCAAAAGCTGACAAAAAAGAGCTACCTAATAAGAGCACTGACACTGAACACAATGACAAAAGATGCTGAAA +GGGGAAAATTGAAAAGACGAGCGATTGCAACACCCGGAATGCAAATCAGAGGATTCGTGCACTTTGTCGAAGCACTAGCA +AGGAGCATCTGTGAAAAACTTGAGCAATCTGGACTCCCCGTTGGAGGGAATGAGAAGAAGGCTAAATTGGCAAATGTTGT +GAGAAAGATGATGACTAACTCACAAGACACAGAGCTCTCCTTTACAGTTACCGGAGACAACACCAAATGGAATGAGAATC +AGAATCCTCGAATATTTCTAGCAATGATAACATACATCACAAGGAACCAACCTGAATGGTTTAGAAATGTCTTGAGCATT +GCCCCTATAATGTTCTCAAATAAAATGGCGAGGTTAGGAAAAGGATACATGTTCGAGAGTAAGAGCATGAAGCTACGGAC +ACAAATACCAGCAGAAATGCTTGCAAACATTGACTTGAAATACTTCAACGAATCGACGAGAAAGAAAATTGAGAAAATAA +GACCTCTACTAATAGAGGGCACAGCCTCATTGAGTCCAGGGATGATGATGGGCATGTTTAATATGCTAAGTACGGTCTTA +GGAGTCTCAATCTTAAATCTTGGGCAGAAGAGGTACACCAAAACCACATACTGGTGGGATGGGCTCCAATCCTCTGATGA +TTTCGCTCTCATAGTGAATGCACCAAATCATGAGGGAATACAAGCAGGAGTGGATAGATTCTATAGGACTTGCAAGCTAG +TTGGAATCAACATGAGCAAAAAGAAGTCTTACATAAATCGGACAGGAACATTTGAGTTCACAAGCTTTTTCTACCGCTAT +GGGTTTGTAGCCAACTTCAGCATGGAGCTGCCCAGCTTTGGAGTTTCCGGAATTAATGAATCGGCTGACATGAGCATTGG +AGTTACAGTGATAAAGAATAATATGATAAACAACGACCTTGGACCAGCAACAGCCCAGATGGCTCTTCAGCTGTTCATTA +AAGACTACAGATACACCTACCGATGCCACAGAGGTGATACACAAATTCAAACTAGAAGATCATTTGAATTGAAGAAGCTG +TGGGAGCAGACCCGCTCAAAGGCAGGACTGTTGGTTTCAGATGGAGGGCCGAATTTATACAACATCCGGAATCTTCACAT +TCCAGAAGTTTGCTTGAAGTGGGAGTTGATGGATGAAGATTACCAGGGAAGACTGTGTAACCCTCTGAACCCGTTTGTCA +GTCATAAGGAAGTTGAATCCGTCAACAATGCTGTGGTAATGCCAGCCCATGGTCCGGCCAAGAGCATGGAATATGATGCC +GTTGCAACTACACATTCATGGATTCCCAAGAGAAATCGCTCCATTCTCAACACTAGCCAAAGGGGAATTCTTGAGGATGA +ACAAATGTACCAGAAGTGCTGCACTCTATTCGAGAAATTCTTCCCTAGCAGTTCATATCGGAGGCCAGTTGGAATTTCCA +GCATGATGGAGGCCATGGTGTCTAGGGCCCGAATTGATGCACGGATTGACTTCGAGTCTGGAAGGATTAAGAAAGAAGAA +TTTGCTGAGATCTTGAAGATCTGTTCCACCATTGAAGAGCTCGGACGGCAAGGGAAGTGAATTTGGCTTGTCCTTCATGA +AAAAATGC +>NC_004912.1 Influenza A virus pa gene for polymerase PA, genomic RNA, strain A/Hong Kong/1073/99(H9N2) +AAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAGTGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAAGACA +ATGAAGGAATATGGGGAAGACCCGAAAATTGAAACAAATAAGTTCGCTGCAATATGCACACACTTAGAAGTCTGCTTCAT +GTATTCAGACTTCCATTTCATTGACGAACGAGGCGAATCAATAATTGTGGAATCTGGTGATCCAAATGCATTGTTGAAGC +ACAGGTTTGAAATAATTGAAGGAAGAGACCGAGCAATGGCCTGGACAGTGGTGAATAGCATCTGCAACACAACAGGAGTC +GATAAACCCAAATTTCTTCCGGATCTATACGACTACAAGGAAAACCGATTCACTGAAATTGGTGTGACACGGAGGGAAGT +TCACATATATTACTTAGAAAAAGCTAACAAGATAAAATCCGAGAAAACACATATCCACATCTTTTCATTCACTGGAGAAG +AAATGGCCACTAAAGCTGACTACACCCTTGATGAAGAGAGCAGGGCAAGAATAAAAACCAGACTATTCACCATAAGACAG +GAAATGGCAAGCAGGGGTCTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAATTGAAGAAAGATTTGAAAT +CACAGGGACCATGCGTAGGCTTGCCGACCAAAGTCTCCCACCTAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGG +ATGGATTCAAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCGAAAGAAGTGAACGCCAGAATTGAGCCATTT +CTGAAGACAACACCACGTCCCCTCAGATTGCCTGATGGACCTCCCTGCTCCCAGCGGTCGAAATTCTTGCTGATGGATGC +TCTGAAATTAAGCATTGAGGACCCGAGCCATGAGGGGGAGGGGATACCGCTATATGATGCGATAAAATGCATGAAAACAT +TCTTCGGCTGGAGAGAGCCCAACATCATCAAGCCACACGAGAAGGGCATAAATCCCAATTATCTTCTGGCTTGGAAGCAG +GTGCTGGCAGAACTCCAGGATATTGAAAATGAGGATAAAATCCCAAAAACAAAGAACATGAAGAAAACAAGCCAATTAAT +GTGGGCACTCGGGGAGAATATGGCACCGGAAAAATTGGACTTTGAGGACTGCAAAGATATTGGCGATCTGAAACAGTATC +AAAGTGATGAGCCAGAGCTCAGATCGATAGCAAGCTGGATCCAGAGTGAGTTCAACAAGGCATGTGAATTGACCGATTCG +AGCTGGATAGAACTCGATGAGATAGGGGAAGATGTTGCCCCAATTGAGCACATTGCAAGCATGAGAAGGAACTACTTCAC +AGCGGAAGTGTCTCATTGCAGGGCCACTGAGTACATAATGAAGGGGGTTTACATAAATACAGCTTTGCTCAATGCATCTT +GTGCAGCCATGGATGACTTCCAACTGATTCCAATGATAAGCAAATGCAGAACAAAAGAAGGAAGAAGGAAGACAAACCTG +TATGGGTTCATTATAAAAGGAAGGTCCCATTTGAGAAATGATACTGACGTGGTGAACTTTGTGAGTATGGAATTCTCCCT +TACTGACCCAAGGCTGGAGCCACACAAATGGGAAAAGTACTGTGTTCTTGAAGTAGGGGAAATGCTCTTGCGGACTGCAA +TAGGCCAGGTGTCAAGGCCCATGTTCCTGTATGTGAGAACTAACGGAACCTCCAAAATTAAGATGAAATGGGGGATGGAA +ATGAGACGCTGCCTTCTTCAATCTCTTCAACAGATTGAGAGCATGATCGAGGCTGAGTCTTCTATCAAAGAGAAAGACAT +GACCAAAGAATTCTTTGAAAACAGATCGGAGACATGGCCAATTGGAGAGTCACCTAAGGGAGTGGAGGAAGGCTCAATCG +GGAAGGTGTGCAGAACCTTACTAGCAAAATCTGTGTTCAACAGCCTATATTCATCTCCACAACTCGAAGGATTTTCAGCT +GAATCGAGAAAACTACTACTCATTGTTCAAGCACTTAGGGACAACCTGGAACCTGGAACCTTTGATCTTGAAGGGCTATA +TGGAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATG +CACTAAAATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTC +>NC_004908.1 Influenza A virus ha gene for Hemagglutinin, genomic RNA, strain A/Hong Kong/1073/99(H9N2) +GCAAAAGCAGGGGAATTACTTAACTAGCAAAATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGCAAGCA +ATGCAGATAAAATCTGCATCGGCCACCAGTCAACAAACTCCACAGAAACTGTGGACACGCTAACAGAAACCAATGTTCCT +GTGACACATGCCAAAGAATTGCTCCACACAGAGCATAATGGAATGCTGTGTGCAACAAGCCTGGGACATCCCCTCATTCT +AGACACATGCACTATTGAAGGACTAGTCTATGGCAACCCTTCTTGTGACCTGCTGTTGGGAGGAAGAGAATGGTCCTACA +TCGTCGAAAGATCATCAGCTGTAAATGGAACGTGTTACCCTGGGAATGTAGAAAACCTAGAGGAACTCAGGACACTTTTT +AGTTCCGCTAGTTCCTACCAAAGAATCCAAATCTTCCCAGACACAACCTGGAATGTGACTTACACTGGAACAAGCAGAGC +ATGTTCAGGTTCATTCTACAGGAGTATGAGATGGCTGACTCAAAAGAGCGGTTTTTACCCTGTTCAAGACGCCCAATACA +CAAATAACAGGGGAAAGAGCATTCTTTTCGTGTGGGGCATACATCACCCACCCACCTATACCGAGCAAACAAATTTGTAC +ATAAGAAACGACACAACAACAAGCGTGACAACAGAAGATTTGAATAGGACCTTCAAACCAGTGATAGGGCCAAGGCCCCT +TGTCAATGGTCTGCAGGGAAGAATTGATTATTATTGGTCGGTACTAAAACCAGGCCAAACATTGCGAGTACGATCCAATG +GGAATCTAATTGCTCCATGGTATGGACACGTTCTTTCAGGAGGGAGCCATGGAAGAATCCTGAAGACTGATTTAAAAGGT +GGTAATTGTGTAGTGCAATGTCAGACTGAAAAAGGTGGCTTAAACAGTACATTGCCATTCCACAATATCAGTAAATATGC +ATTTGGAACCTGCCCCAAATATGTAAGAGTTAATAGTCTCAAACTGGCAGTCGGTCTGAGGAACGTGCCTGCTAGATCAA +GTAGAGGACTATTTGGAGCCATAGCTGGATTCATAGAAGGAGGTTGGCCAGGACTAGTCGCTGGCTGGTATGGTTTCCAG +CATTCAAATGATCAAGGGGTTGGTATGGCTGCAGATAGGGATTCAACTCAAAAGGCAATTGATAAAATAACATCCAAGGT +GAATAATATAGTCGACAAGATGAACAAGCAATATGAAATAATTGATCATGAATTCAGTGAGGTTGAAACTAGACTCAATA +TGATCAATAATAAGATTGATGACCAAATACAAGACGTATGGGCATATAATGCAGAATTGCTAGTACTACTTGAAAATCAA +AAAACACTCGATGAGCATGATGCGAACGTGAACAATCTATATAACAAGGTGAAGAGGGCACTGGGCTCCAATGCTATGGA +AGATGGGAAAGGCTGTTTCGAGCTATACCATAAATGTGATGATCAGTGCATGGAAACAATTCGGAACGGGACCTATAATA +GGAGAAAGTATAGAGAGGAATCAAGACTAGAAAGGCAGAAAATAGAGGGGGTTAAGCTGGAATCTGAGGGAACTTACAAA +ATCCTCACCATTTATTCGACTGTCGCCTCATCTCTTGTGCTTGCAATGGGGTTTGCTGCCTTCCTGTTCTGGGCCATGTC +CAATGGATCTTGCAGATGCAACATTTGTATATAA +>NC_004905.2 Influenza A virus (A/Hong Kong/1073/99(H9N2)) segment 5, complete sequence +AGCAGGGTTAATAATCACTCACTGAGTGACATCAACATCATGGCGTCGCAAGGCACCAAACGATCCTATGAACAGATGGA +AACTGGTGGAGAACGCCAGAATGCCACTGAGATCAGGGCATCTGTTGGAAGAATGGTTGGTGGAATTGGGAGGTTTTACG +TACAGATGTGCACTGAACTCAAACTCAGCGACCAAGAAGGAAGGTTGATCCAGAACAGTATAACAATAGAGAGAATGGTT +CTCTCCGCATTTGATGAAAGGAGGAACAGGTACCTAGAGGAACATCCCAGTGCGGGGAAGGACCCGAAGAAGACCGGAGG +TCCAATCTACCGAAGGAGAGACGGGAAATGGGTGAGAGAGCTGATTCTGTATGACAAAGAGGAGATAAGGAGAATTTGGC +GTCAAGCGAACAATGGAGAAGACGCAACTGCTGGTCTCACTCATATGATGATCTGGCATTCCAACCTAAATGATGCCACA +TACCAGAGAACAAGAGCCCTCGTGCGGACTGGAATGGACCCCAGAATGTGCTCTCTGATGCAAGGATCAACCCTCCCGAG +GAGATCTGGAGCTGCTGGTGCAGCAATAAAGGGAGTCGGGACAATGGTAATGGAACTAATTCGGATGATAAAGCGAGGCA +TTAATGACCGGAACTTCTGGAGAGGCGATAATGGACGAAGAACAAGGATTGCATATGAGAGAATGTGCAACATCCTCAAA +GGGAAATTTCAAACAGCAGCACAAAGAGCAATGATGGATCAGGTGCGAGAAAGCAGAAATCCTGGGAATGCTGAAATTGA +AGATCTCATCTTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCCGTAGCCCATAAGTCCTGCTTGCCTGCTTGTGTGT +ACGGGCTCGCTGTGGCCAGTGGATATGATTTTGAGAGGGAAGGGTACTCTCTGGTTGGGATAGATCCTTTCCGTCTGCTT +CAGAACAGTCAGGTCTTCAGTCTTATTAGACCAAATGAGAATCCAGCACATAAAAGTCAATTGGTATGGATGGCATGCCA +TTCTGCAGCATTTGAGGACCTGAGAGTCTCAAGTTTCATTAGAGGAACAAGAGTGATCCCAAGAGGACAACTATCCACTA +GAGGAGTTCAGATTGCTTCAAATGAGAACGTGGAAGCAATGGATTCCAGCACTCTTGAACTGAGAAGCAGATATTGGGCT +ATAAGGACCAGGAGTGGAGGAAACACCAATCAACAGAGAGCATCTGCAGGACAAATCAGTGTACAGCCCACTTTCTCAGT +ACAGAGAAATCTTCCCTTCGAAAGACCGACCATTATGGCTGCGTTTAAGGGGAATACCGAGGGCAGAACATCTGACATGA +GGACTGAAATCATAAGGATGATGGAAAGTGCCAGACCAGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAGCTCTCG +GACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGA +GGAATATGACAATTGAGGAAAAATACCCTTGTTTCTA +>NC_004909.1 Influenza A virus na gene for neuraminidase, genomic RNA, strain A/Hong Kong/1073/99(H9N2) +ATGAATCCAAATCAAAAGATAATAGCACTTGGCTCTGTTTCTATAACTATTGCGACAATATGTTTACTCATGCAGATTGC +CATCTTAGCAACGACTATGACACTACATTTCAATGAATGTACCAACCCATCGAACAATCAAGCAGTGCCATGTGAACCAA +TCATAATAGAAAGGAACATAACAGAGATAGTGCATTTGAATAATACTACCATAGAGAAGGAAAGTTGTCCTAAAGTAGCA +GAATACAAGAATTGGTCAAAACCGCAATGTCAAATTACAGGGTTCGCCCCTTTCTCCAAGGACAACTCAATTAGGCTTTC +TGCAGGCGGGGATATTTGGGTGACAAGAGAACCTTATGTATCGTGCGGTCTTGGTAAATGTTACCAATTTGCACTTGGGC +AGGGAACCACTTTGAACAACAAACACTCAAATGGCACAATACATGATAGGAGTCCCCATAGAACCCTTTTAATGAACGAG +TTGGGTGTTCCATTTCATTTGGGAACCAAACAAGTGTGCATAGCATGGTCCAGCTCAAGCTGCCATGATGGGAAGGCATG +GTTACATGTTTGTGTCACTGGGGATGATAGAAATGCGACTGCTAGCATCATTTATGATGGGATGCTTACCGACAGTATTG +GTTCATGGTCTAAGAACATCCTCAGAACTCAGGAGTCAGAATGCGTTTGCATCAATGGAACTTGTACAGTAGTAATGACT +GATGGAAGTGCATCAGGAAGGGCTGATACTAAAATACTATTCATTAGAGAAGGGAAAATTGTCCACATTGGTCCACTGTC +AGGAAGTGCTCAGCATGTGGAGGAATGCTCCTGTTACCCCCGGTATCCAGAAGTTAGATGTGTTTGCAGAGACAATTGGA +AGGGCTCCAATAGACCCGTGCTATATATAAATGTGGCAGATTATAGTGTTGATTCTAGTTATGTGTGCTCAGGACTTGTT +GGCGACACACCAAGAAATGACGATAGCTCCAGCAGCAGTAACTGCAGGGATCCTAATAACGAGAGAGGGGGCCCAGGAGT +GAAAGGGTGGGCCTTTGACAATGGAAATGATGTTTGGATGGGACGAACAATCAAGAAAGATTCGCGCTCTGGTTATGAGA +CTTTCAGGGTCGTTGGTGGTTGGACTACGGCTAATTCCAAGTCACAAATAAATAGGCAAGTCATAGTTGACAGTGATAAC +TGGTCTGGGTATTCTGGTATATTCTCTGTTGAAGGAAAAACCTGCATCAACAGGTGTTTTTATGTGGAGTTGATAAGAGG +GAGACCACAGGAGACCAGAGTATGGTGGACTTCAAATAGCATCATTGTATTTTGTGGAACTTCAGGTACCTATGGAACAG +GCTCATGGCCTGATGGAGCGAATATCAATTTCATGTCTATATAAGCTTTCGCAATTTT +>NC_004907.1 Influenza A virus (A/Hong Kong/1073/99(H9N2)) segment 7, complete sequence +GGGGAATTCCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCA +TCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTTGAGGATGTTTTTGCAGGGAAGAACACAGATCTTGAGGCTCTCAT +GGAATGGCTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGGTTTGTGTTCACGCTCACCGTGCCCA +GTGAGCGAGGACTGCAGCGTAGACGATTTGTCCAAAATGCCCTAAATGGGAATGGAGACCCAAACAACATGGACAGGGCA +GTTAAACTATACAAGAAGCTGAAGAGGGAAATGACATTCCATGGAGCAAAGGAAGTTGCACTCAGTTACTCAACTGGTGC +GCTTGCCAGTTGCATGGGTCTCATATACAACCGGATGGGAACAGTGACCACAGAAGTGGCTCTTGGCCTAGTATGTGCCA +CTTGTGAACAGATTGCTGATGCCCAACATCGGTCCCACAGGCAGATGGCGACTACCACCAACCCACTAATCAGGCATGAG +AACAGAATGGTACTAGCCAGCACTACGGCTAAGGCCATGGAGCAGATGGCTGGATCAAGTGAGCAGGCAGCAGAAGCCAT +GGAAGTCGCAAGTCAGGCTAGGCAAATGGTGCAGGCTATGAGGACAATTGGGACTCACCCTAGTTCCAGTGCAGGTCTAA +AAGATGATCTTATTGAAAATTTGCAGGCTTACCAGAAACGGATGGGAGTGCAAATGCAGAGATTCAAGTGATCCTCTCGT +TGTTGCAGCAAGTATCATTGGGATATTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTC +GCTTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTGCCTGAGTCTATGAGGGAAGAGTATCGGCAGGAACAG +CAGAATGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAGATCTTCCT +>NC_004906.1 Influenza A virus (A/Hong Kong/1073/99(H9N2)) segment 8, complete sequence +AGCAAAAGCAGGGTGACAAAGACATAATGGATTCCAACACTGTGTCAAGCTTTCAGGTAGACTGCTTTCTTTGGCATGTC +CGCAAACGATTTGCAGACCAAGAACTGGGTGATGCCCCATTCCTTGACCGGCTTCGCCGAGATCAGAAGTCCCTAAGAGG +AAGAGGCAGCACTCTTGGTCTGGACATCAGAACTGCCACTCGTGAAGGAAAGCATATAGTGGAGCGGATTCTGGAGGAAG +AATCTGACGAGGCACTTAAAATGACTATCGCTTCAGTGCCTGCTTCACGCTACCTAACTGAAATGACTCTTGAGGAAATG +TCAAGGGATTGGTTAATGCTCATTCCCAAGCAGAAAGTGACAGGGCCCCTTTGCATTAGAATGGACCAGGCAGTAATGGG +TAAAACCATCATATTGAAAGCAAACTTTAGTGTGATTTTTAATCGACTTGAAGCTCTGATACTACTTAGAGCGTTTACAG +ATGAAGGAGCAATAGTGGGCGAAATCTCACCATTACCTTCCCTTCCAGGACATACTGACGAGGATGTCAAAAATGCAATT +GGGGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCACTTGGAGAAG +CAGTGATGAGAATGGGAGATCTCCACTCCCTCCAAAACAGAAACGGAAAGTGGAGAGAACAATTGAGCCAGAAGTTTGAA +GAGATAAGATGGTTAATTGAAGAAATGCGACATAGGTTAAGAATTACAGAGAATAGCTTTGAGCAAATAACCTTTATGCA +AGCCTTACAACTATTGCTTGAAGTGGAGCAAGAGATAAGAACTTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCT +TGTTTCTACT +>NC_006307.2 Influenza C virus (C/Ann Arbor/1/50) PB2 gene for polymerase 2, complete cds +AGCAGAAGCAGAGGATTGGAAATGTCTTTTCTATTGACAATAGCAAAGGAATACAAAAGACTATGCCAAGATGCTAAGGC +AGCTCAAATGATGACAGTAGGAACTGTATCAAACTACACTACGTTCAAGAAATGGACTACATCAAGGAAGGAAAAGAATC +CTTCACTAAGAATGAGATGGGCAATGAGCAGCAAATTCCCAATAATAGCTAACAAGAGAATGCTGGAAGAAGCTCAAATT +CCTAAAGAACACAACAATGTAGCCCTTTGGGAAGACACAGAAGATGTTTCAAAAAGGGATCATGTTCTTGCAAGCGCCTC +TTGTATAAATTATTGGAATTTTTGTGGACCTTGTGTCAACAATTCAGAAGTGATCAAAGAAGTTTATAAATCTAGATTTG +GAAGATTAGAAAGAAGGAAAGAAATAATGTGGAAAGAACTTAGATTTACATTAGTTGATAGACAACGAAGAAGAGTTGAC +ACTCAGCCTGTAGAACAAAGATTGAGAACTGGAGAAATTAAAGACTTGCAAATGTGGACTTTGTTCGAAGATGAAGCTCC +TCTTGCTAGCAAATTTATTTTAGACAATTATGGTCTAGTCAAAGAAATGAGATCAAAGTTTGCAAACAAACCTCTGAATA +AAGAAGTAGTTGCACACATGTTAGAAAAACAATTCAATCCGGAAAGTAGATTCTTGCCTGTTTTCGGAGCTATAAGGCCA +GAAAGAATGGAATTGATCCATGCATTAGGAGGAGAAACTTGGATACAAGAAGCTAACACTGCAGGGATTTCCAATGTTGA +TCAAAGGAAAAATGATATGAGAGCAGTATGTAGGAAAGTTTGTCTTGCAGCAAATGCAAGTATAATGAACGCCAAAAGCA +AACTGGTTGAGTATATAAAAAGTACAAGTATGAGAATTGGAGAAACAGAAAGAAAGCTTGAAGAACTTATACTTGAAACC +GATGATGTCTCACCTGAAGTAACATTATGTAAATCTGCTTTAGGAGGACCATTAGGAAAAACTCTATCTTTTGGGCCCAT +GCTACTCAAGAAAATTTCTGGTTCCGGAGTAAAAGTTAAAGATACAGTATATATCCAAGGTGTCAGAGCAGTACAATTTG +AATACTGGAGTGAGCAAGAAGAATTCTATGGAGAATATAAGTCAGCCACCGCTTTATTCAGCAGAAAGGAAAGATCACTA +GAATGGATTACAATAGGAGGAGGAATAAATGAAGACAGAAAGAGACTTCTAGCTATGTGCATGATATTTTGCAGAGATGG +AGATTATTTTAAAGACGCCCCTGCAACAATAACAATGGCAGATTTAAGTACGAAGTTAGGAAGAGAAATTCCATATCAAT +ATGTGATGATGAATTGGATACAAAAATCAGAAGATAATCTCGAAGCCTTATTATACAGTAGGGGAATTGTAGAAACCAAT +CCAGGAAAAATGGGGAGCTCAATGGGAATTGATGGTTCCAAAAGAGCAATTAAATCTTTAAGGGCTGTCACAATACAATC +AGGAAAGATTGACATGCCAGAATCAAAAGAAAAAATTCACCTTGAGCTCTCTGATAATCTTGAAGCATTTGATTCATCAG +GAAGAATTGTTGCAACAATTTTAGACCTTCCTAGTGACAAAAAGGTAACATTTCAGGATGTAAGCTTTCAACATCCTGAT +CTGGCAGTATTGAGAGATGAGAAAACGGCCATAACAAAAGGGTATGAAGCGCTAATCAAAAGGCTAGGAACAGGGGACAA +TGATATTCCTTCCTTAATTGCAAAGAAGGATTATTTGTCTCTTTATAATTTACCAGAAGTAAAATTAATGGCTCCCTTAA +TCAGACCCAATAGAAAAGGAGTTTATTCCAGAGTTGCTAGAAAATTAGTGTCTACACAAGTTACTACTGGACATTATTCA +TTACATGAATTGATAAAGGTCTTACCCTTTACTTATTTCGCCCCAAAACAGGGAATGTTTGAAGGAAGGCTTTTCTTTAG +CAACGATAGCTTTGTTGAGCCTGGAGTAAATAACAATGTATTTTCTTGGAGTAAGGCTGACAGTTCTAAAATATATTGTC +ATGGAATAGCGATAAGGGTACCTTTAGTTGTTGGAGATGAACACATGGACACTTCGTTAGCACTATTAGAAGGGTTTAGT +GTTTGTGAAAACGACCCCAGAGCACCAATGGTAACAAGACAAGATTTAATTGATGTGGGATTTGGGCAAAAAGTTAGACT +CTTCGTAGGCCAAGGGAGCGTTAGAACCTTCAAGCGAACTGCCTCACAAAGGGCTGCATCAAGCGATGTAAATAAGAATG +TGAAAAAGATAAAGATGTCTAACTAAAAATCCTCTTGCTACTGCT +>NC_006308.2 Influenza C virus (C/Ann Arbor/1/50) PB1 gene for polymerase 1, complete cds +AGCAGAAGCAGAGGATTATGGAAATCAACCCATATTTGATGTTTCTAAACAACGACGTCACATCGCTGATATCAACAACA +TACCCCTATACAGGGCCACCTCCAATGTCACATGGATCATCAACCAAATACACTTTGGAAACTATTAAAAGAACATATGA +CTACTCAAGAACATCAGTTGAAAAAACATCGAAAGTTTTCAATATACCAAGAAGAAAGTTTTGCAATTGTCTTGAAGACA +AAGATGAGTTGGTAAAACCAACAGGAAACGTTGATATCAGTTCCTTGTTGGGCCTTGCAGAGATGATGGAGAAAAGAATG +GGGGAAGGATTTTTTAAGCATTGTGTAATGGAGGCAGAAACAGAAATACTTAAAATGCACTTCTCTAGACTTACGGAAGG +AAGACAAACATATGATTGGACTTCTGAAAGAAACATGCCAGCGGCCACTGCTTTGCAACTGACAGTTGATGCCATAAAAG +AAACAGAAGGACCATTTAAAGGGACAACAATGCTTGAATATTGCAATAAAATGATAGAAATGCTTGATTGGAAAGAAGTT +AAATTCAGAAAAGTCAAAACAATGGTGAGAAGGGAGAAAGATAAAAGAAGTGGGAAGGAGATAAAAACTAAAGTACCTGT +AATGGGAATTGACTCAATTAAACATGATGAGTTTTTAATTAGAGCATTAACTATTAATACCATGGCCAAAGATGGGGAAA +GAGGGAAATTGCAAAGAAGAGCAATTGCAACACCCGGTATGATAGTAAGACCATTTTCAAAAATTGTTGAAACTGTAGCA +CAGAAAATATGTGAGAAATTGAAAGAAAGCGGTCTACCTGTTGGTGGTAATGAGAAGAAAGCAAAACTTAAGACTACTGT +TACTTCTCTCAATGCCAGGATGAACAGTGATCAGTTTGCAGTTAATATAACTGGAGACAATAGTAAATGGAATGAATGCC +AACAACCTGAGGCTTATTTAGCACTTTTGGCTTACATCACCAAAGACTCCTCTGATTTAATGAAAGACTTATGCAGTGTT +GCTCCAGTGCTTTTCTGTAATAAGTTTGTGAAACTTGGACAAGGAATAAGACTTTCAAATAAAAGAAAAACAAAGGAAGT +CATAATAAAAGCTGAGAAAATGGGAAAATACAAGAATCTAATGAGAGAAGAATATAAAAACCTTTTTGAACCCTTAGAGA +AATATATTCAGAAGGATGTCTGTTTTTTACCTGGAGGAATGCTTATGGGAATGTTCAACATGCTGTCAACAGTTCTTGGA +GTAAGTACATTATGTTATATGGATGAAGAACTAAAAGCCAAAGGATGTTTTTGGACTGGACTCCAATCTTCTGATGACTT +TGTTCTTTTTGCAGTTGCTTCAAACTGGTCAAATATACATTGGACAATAAGACGGTTTAATGCTGTATGCAAGTTAATTG +GTATAAACATGTCTCTTGAAAAATCGTATGGTTCTCTCCCAGAACTCTTTGAATTTACAAGTATGTTCTTTGATGGAGAA +TTTGTGTCCAATCTTGCTATGGAATTGCCAGCTTTCACTACTGCAGGAGTTAATGAAGGAGTTGATTTTACAGCTGCAAT +GTCAATTATTAAGACAAATATGATAAATAACAGCTTATCACCTTCTACTGCTTTAATGGCCTTAAGGATATGTCTCCAAG +AATTTAGAGCGACTTATAGAGTCCATCCTTGGGATTCAAGAGTGAAAGGTGGGAGAATGAAAATAATAAATGAGTTCATA +AAAACCATAGAAAATAAAGATGGATTATTAATTGCTGATGGTGGGAAACTGATGAACAACATTAGCACCCTTCATATTCC +TGAGGAAGTACTGAAGTTTGAAAAAATGGATGAACAATATAGAAATAGGGTATTCAACCCCAAAAATCCCTTTACTAACT +TTGACAAAACTATTGATATATTTAGAGCACATGGCCCAATAAGGGTTGAAGAAAATGAAGCAGTAGTTTCAACTCATAGC +TTCAGAACTAGAGCAAACAGAACCCTATTGAATACAGATATGAGAGCAATGATGGCAGAAGAGAAAAGATATCAAATGGT +TTGCGACATGTTTAAAAGCGTGTTTGAATCAGCGGACATAAATCCTCCAATTGGGGCTATGAGCATTGGAGAGGCCATAG +AAGAAAAACTATTAGAGAGAGCTAAAATGAAAAGAGACATTGGGGCAATAGAAGATTCAGAATATGAAGAAATAAAAGAC +ATTATAAGGGATGCAAAGAAAGCTAGAATTGAAAGTAGATGAGGAGGGGCTGTTAAACCCTTTCCTCCTACTTGCACATA +TTTTTGTTATTCCATTAAATGAAAAAATCCTCTTGCTACTGCT +>NC_006309.2 Influenza C virus (C/Ann Arbor/1/50) P3 gene for polymerase 3, complete cds +AGCAGAAGCAGGGGATCCGAAATGTCAAAAACTTTTGCCGAAATAGCAGAGGCTTTTCTAGAGCCAGAAGCTGTAAGAAT +AGCCAAAGAAGCAGTAGAAGAATATGGGGATCACGAAAGAAAAATAATACAAATTGGAATACACTTTCAAGTTTGCTGCA +TGTTCTGTGATGAGTATTTGAGTACAAATGGGAGTGATAGATTTGTGCTCATTGAAGGAAGAAAAAGAGGAACTGCAGTG +TCTTTACAAAATGAGCTATGTAAAAGTTATGATCTTGAACCACTACCTTTTCTTTGTGACATTTTTGACAGGGAGGAAAA +ACAATTCGTTGAAATTGGAATAACAAGAAAAGCAGATGATAGCTATTTTCAATCCAAGTTTGGTAAACTTGGAAATAGCT +GCAAGATATTTGTATTCTCCTATGATGGAAGATTAGACAAAAATTGTGAAGGCCCTATGGAGGAACAAAAATTGAGAATT +TTCAGTTTTCTTGCAACTGCTGCTGATTTTCTTAGGAAAGAAAACATGTTTAACGAAATCTTCTTACCAGACAATGAAGA +AACCATCATTGAAATGAAGAAAGGAAAAACATTTCTAAAATTGAGGGATGAAAGTGTTCCTTTACCTTTTCAAACTTATG +AACAGATGAAAGATTACTGCGAAAAATTTAAAGGAAATCCAAGAGAATTAGCTTCTAAAGTAAGCCAAATGCAAAGCAAT +ATTAAATTACCAATAAAACATTATGAGCAGAATAAATTTCGACAAATACGTCTACCAAAGGGACCAATGGCACCCTATAC +CCACAAGTTCTTAATGGAAGAAGCATGGATGTTTACAAAAATTAGTGATCCAGAAAGATCAAGAGCTGGTGAAATTCTCA +TTGATTTCTTCAAGAAAGGGAATCTTTCTGCAATCAGACCCAAAGACAAACCATTACAAGGGAAATATCCCATACATTAC +AAAAATCTTTGGAATCAGATTAAAGCAGCAATTGCCGATAGAACCATGGTAATAAATGAAAATGATCATTCAGAGTTTCT +AGGAGGAATTGGAAGAGCCTCTAAAAAGATCCCAGAGGTTTCTCTGACACAAGATGTAATAACAACAGAAGGATTAAAAC +AATCAGAAAATAAGTTACCAGAACCAAGATCTTTCCCTAAATGGTTCAATGCTGAGTGGATGTGGGCAATAAAAGATTCT +GACCTTACTGGATGGGTGCCCATGGCAGAATACCCTCCTGCTGATAATGAATTGGAAGATTACGCTGAACATCTAAATAA +AACCATGGAAGGGGTCTTGCAAGGAACAAATTGCGCAAGAGAAATGGGGAAATGCATTCTTACTGTTGGGGCACTAATGA +CTGAATGTAGACTATTTCCTGGGAAAATAAAAGTGGTGCCCATATATGCTAGAAGTAAAGAAAGGAAATCAATGCAAGAA +GGGCTTCCGGTGCCCTCAGAAATGGACTGTTTATTTGGTATATGCGTCAAGTCAAAATCACATTTAAACAAGGATGATGG +AATGTACACAATAATAACATTTGAATTCTCAATAAGAGAGCCTAATTTAGAAAAACATCAAAAATATACTGTATTTGAAG +CAGGACACACAACAGTTAGAATGAAGAAAGGAGAGTCAGTTATTGGAAGAGAAGTCCCTCTTTATTTATACTGTAGGACA +ACTGCCCTTTCCAAAATCAAGAATGACTGGCTATCAAAGGCTAGAAGATGTTTCATCACAACTATGGACACAGTGGAAAC +CATATGTCTAAGAGAGTCAGCAAAGGCTGAAGAAAATCTAGTTGAAAAGACATTAAACGAAAAACAGATGTGGATTGGGA +AGAAAAATGGAGAGTTAATTGCTCAACCTTTAAGAGAAGCTTTAAGAGTACAGCTGGTACAACAATTCTATTTCTGCATC +TATAATGACAGTCAATTAGAAGGCTTTTGTAATGAGCAGAAGAAAATCCTAATGGCTCTTGAAGGTGACAAGAAAAATAA +ATCATCTTTTGGATTTAATCCAGAAGGATTATTAGAAAAGATTGAAGAGTGTCTTATAAATAATCCGATGTGCCTTTTTA +TGGCTCAAAGGTTGAATGAACTTGTAATTGAGGCCTCAAAAAGAGGCGCTAAGTTTTTCAAAATTGATTGATCATTATAA +GAAAAAATCCCCTTGCTACTGCT +>NC_006310.2 Influenza C virus (C/Ann Arbor/1/50) HEF gene for hemagglutinin-esterase-fusion, complete cds +AGCAGAAGCAGGGGTTTAATAATGTTTTTCTCATTACTCTTGATGTTGGGCCTCACAGAGGCTGAAAAAATAAAGATATG +CCTTCAAAAGCAAGTGAACAGTAGCTTCAGCCTACACAATGGCTTCGGAGGAAATTTGTATGCCACGGAAGAAAAAAGAA +TGTTTGAGCTTGTTAAGCCCAAAGCTGGAGCCTCTGTCTTGAATCAAAGTACATGGATTGGCTTTGGAGATTCAAGGACT +GACAAAAGCAATTCAGCTTTTCCTAGGTCTGCGGATGTTTCAGCAAAAACTGCTGATAAGTTTCGTTCTTTGTCTGGTGG +ATCCTTGATGTTGAGTATGTTTGGACCACCTGGGAAGGTAGACTACCTTTACCAAGGATGTGGAAAACATAAGGTTTTTT +ATGAAGGAGTTAACTGGAGTCCACATGCTGCTATAAATTGTTACAGAAAAAATTGGACTGATATCAAACTGAATTTCCAG +AAAAACATTTATGAACTGGCTTCACAATCACATTGCATGAGCTTGGTGAATGCCTTGGACAAAACTATTCCTTTACAAGC +GACTGCAGGGGTTGCAAAAAATTGCAACAACAGCTTCTTAAAAAATCCAGCATTGTACACACAAGAAGTCAATCCTTCAG +TAGAAAAATGTGGGAAAGAAAATCTTGCTTTCTTCACACTTCCAACCCAATTTGGAACCTATGAGTGCAAACTGCATCTT +GTGGCTTCTTGCTATTTCATCTATGATAGTAAAGAAGTGTACAATAAAAGAGGATGTGACAACTACTTTCAAGTGATCTA +TGATTCATCTGGAAAAGTTGTTGGAGGACTAGATAACAGGGTATCACCTTACACAGGGAATTCTGGAGACACCCCAACAA +TGCAATGTGACATGCTCCAGCTGAAACCTGGAAGATATTCAGTAAGAAGCTCTCCAAGATTCCTTTTAATGCCCGAAAGA +AGTTATTGCTTTGACATGAAAGAAAAAGGACCAGTCACTGCTGTCCAATCCATTTGGGGAAAAGGCAGAGAATCTGACCA +TGCAGTGGATCAAGCTTGCTTGAGCACTCCAGGGTGCATGTTGATCCAAAAGCAAAAGCCATACATTGGAGAAGCTGATG +ATCACCATGGAGATCAAGAAATGAGGGAGTTGCTGTCAGGACTGGACTATGAAGCTAGATGCATATCACAATCAGGGTGG +GTGAATGAAACCAGCCCTTTTACGGAAGAATACCTCCTTCCTCCCAAATTTGGAAGATGCCCCTTGGCTGCAAAGGAAGA +ATCCATTCCAAAAATCCCAGATGGCCTTCTAATTCCCACCAGTGGAACTGATACCACTGTAACCAAACCTAAGAGCAGAA +TTTTTGGAATCGATGACCTCATTATTGGTTTGCTCTTTGTTGCAATCGTTGAAGCAGGAATTGGAGGCTATCTGCTTGGA +AGTAGAAAAGTATCAGGAGGAGGTGTGACAAAAGAATCAGCTGAAAAAGGGTTTGAGAAAATTGGAAATGACATACAAAT +CCTAAGATCTTCTACAAATATCGCAATAGAAAAACTGAATGACAGAATTTCTCATGATGAGCAAGCCATCAGAGATCTAA +CTTTAGAAATTGAAAATGCAAGATCTGAAGCTTTGTTAGGAGAATTGGGAATAATAAGAGCCTTGTTGGTAGGAAATATA +AGCATAGGATTACAAGAATCTTTATGGGAACTAGCTTCAGAAATAACAAATAGAGCAGGAGATCTAGCAGTTGAAGTCTC +TCCAGGTTGCTGGGTAATTGACAATAACATTTGTGATCAAAGTTGTCAAAACTTTATTTTCAAGTTCAACGAAACTGCAC +CTGTTCCAACCATTCCCCCTCTTGACACAAAAATTGATCTGCAATCAGATCCTTTTTACTGGGGAAGCAGCTTGGGCTTA +GCAATAACTGCTGCTATTTCATTGGCAGCTTTGGTGATCTCTGGGATCGCCATCTGCAGAACTAAATGACTGGGACAATT +TTAAAAAATGGATAATATATTAGTCAATATTTTGTACAGTTTTATAAAAAACAAAAATCCCCTTGCTACTGCT +>NC_006311.1 Influenza C virus (C/Ann Arbor/1/50) segment 5, complete sequence +AGCAGAAGCAGGAGATTTGATTTTCAAAAATGTCTGACAGACGTCAAAACAGAAAGACGCCAGATGAGCAACGCAAAGCC +AATGCTCTCATAATAAATGAGAACATTGAAGCCTACATTGCCATTTGTAAGGAAGTGGGCCTTAATGGCGATGAAATGTT +GATCCTGGAAAATGGCATAGCAATTGAAAAAGCTATAAGAATATGTTGTGATGGAAAGTATCAGGAAAAAAGGGAAAAGA +AAGCAAGAGAAGCCCAAAGAGCGGACAGCAACTTCAATGCAGATTCCATTGGGATCAGACTAGTTAAAAGAGCTGGTTCA +GGCACCAATATAACCTACCATGCAGTTGTTGAATTGACAAGCCGCTCAAGAATTGTTCAAATTCTCAAATCTCATTGGGG +AAATGAACTAAACAGAGCAAAAATTGCAGGAAAAAGACTCGGCTTCTCTGCACTCTTTGCTTCTAACTTAGAAGCAATTA +TTTATCAAAGAGGAAGAAATGCAGCAAGAAGAAACGGTTCTGCTGAATTGTTCACTCTCACTCAAGGGGCTGGAATCGAA +ACTAGATATAAATGGATAATGGAAAAGCACATCGGAATTGGAGTTCTTATAGCTGACGCAAAAGGTTTAATAAATGGAAA +GAGAGAAGGCAAAAGAGGAGTTGATGCCAATGTAAAATTGAGAGCAGGAACGACTGGTTCCCCTCTGGAAAGAGCCATGC +AAGGAATTGAGAAAAAAGCGTTTCCTGGGCCTTTAAGAGCACTAGCAAGAAGAGTTGTAAAAGCAAACTACAATGATGCC +AGAGAAGCTCTAAATGTCATCGCAGAAGCATCACTCCTGTTAAAGCCTCAGATAACCAACAAGATGACAATGCCTTGGTG +TATGTGGTTGGCTGCCAGACTTACTCTGAAAGATGAGTTTGCCAATTTCTGTGCATATGCAGGAAGAAGAGCCTTTGAAG +TCTTCAATATTGCAATGGAGAAAATTGGAATTTGTTCCTTTCAAGGGACAATAATGAACGATGATGAAATTGAATCAATA +GAGGACAAGGCTCAAGTATTAATGATGGCATGCTTTGGACTTGCTTATGAAGACTTCAGTTTGGTCTCTGCTATGGTTAG +CCACCCTCTTAAGTTGAGAAACAGAATGAAAATAGGAAACTTCAGAGTCGGTGAAAAAGTTTCAACAGTGCTTTCTCCCT +TATTGAGATTCACAAGATGGGCAGAGTTTGCTCAAAGATTTGCTCTTCAGGCAAATACTTCAAGAGAAGGCGCTCAAATC +AGCAATTCAGCAGTTTTTGCAGTGGAAAGGAAGATAACCACAGATGTCCAAAGAGTTGAAGAGCTACTAAATAAAGTTCA +AGCTCATGAAGATGAACCATTACAAACACTTTACAAAAAAGTAAGAGAACAAATTTCCATAATTGGAAGGAACAAGTCTG +AAATAAAGGAGTTTCTAGGGTCTTCAATGTATGATTTAAATGATCAAGAAAAACAAAATCCAATAAATTTCAGGTCTGGA +GCACACCCTTTCTTTTTCGAATTCGACCCAGACTACAACCCCATAAGAGTGAAAAGACCCAAAAAACCAATAGCAAAGAG +AAATTCAAATATCAGCAGATTGGAAGAAGAAGGAATGGATGAAAATTCAGAGATTGGACAAGCCAAGAAGATGAAACCTT +TGGATCAATTGACCAGCACTAGTAGCAACATTCCTGGAAAAAATTAAAGTCAGATTAAATTCATCACATATTTTATGATC +AACTGTTGTATTGCTATATATAATTCAAAAATCTCCTTGCTACTGCT +>NC_006312.2 Influenza C virus (C/Ann Arbor/1/50) M1, CM2 genes for matrix protein, CM2 protein, complete cds +AGCAGAAGCAGGGGATTTCAAAACAATGGCACATGAAATACTGATTGCTGAAACAGAGGCATTTCTAAAAAATGTTGCTC +CTGAGACCAGGACAGCAATAATTTCAGCAATAACAGGAGGAAAATCAGCCTGCAAATCAGCAGCTAAACTGATTAAGAAT +GAACATCTTCCCCTAATGTCTGGAGAAGCCACCACAATGCACATCGTTATGAGGTGCTTATATCCTGAAATAAAACCATG +GAAAAAGGCAAGCGACATGCTGAATAAAGCAACTTCTAGTTTGAAAAAATCAGAAGGAAGAGACATAAGAAAGCAAATGA +AAGCAGCTGGAGACTTCTTGGGAGTGGAGTCAATGATGAAAATGAGGGCCTTCAGAGATGACCAAATAATGGAAATGGTT +GAAGAAGTATATGATCACCCAGACGACTACACACCAGACATCCGAATAGGAACAATCACAGCTTGGTTGAGATGCAAAAA +CAAGAAAAGTGAAAGATACAGGAGTAATGTCTCAGAAAGTGGAAGAACAGCTTTAAAAATTCATGAAGTAAGAAAAGCCA +GCACAGCAATGAACGAGATTGCTGGTATTACTGGCCTTGGAGAAGAAGCACTATCTCTCCAAAGACAAACAGAAAGTTTG +GCCATATTATGTAATCACACTTTTGGAAGTAATATAATGAGACCCCACTTGGAAAAAGCAATAAAAGGAGTTGAAGGCAG +AGTTGGAGAGATGGGACGAATGGCAATGAAATGGTTAGTTGTTATAATATGTTTCTCTATAACAAGTCAACCTGCTTCTG +CTTGCAATCTAAAGACCTGTCTAAAACTATTTAACAATACTGATGCGGTAACTGTTCATTGTTTTAATGAAAACCAAGGA +TACATGCTAACATTAGCCTCTTTGGGATTAGGGATAATTACTATGTTGTATTTATTAGTAAAAATCATAATTGAACTTGT +CAATGGTTTTGTGCTCGGCAGATGGGAGAGATGGTGTGGAGATATAAAGACCACAATTATGCCTGAAATTGACTCGATGG +AAAAAGATATTGCCCTTTCTAGGGAGAGACTTGACCTGGGAGAGGATGCTCCTGACGAAACCGACAACTCACCAATTCCT +TTTTCCAATGATGGTATTTTTGAAATTTAATTACCTTGAAAAAATCCCCTTGCTACTGCT +>NC_006306.2 Influenza C virus (C/Ann Arbor/1/50) segment 7, complete sequence +AGCAGAAGCAGGGGTACTTTTCCAAAATGTCCGACAAAACAGTCAAATCAACAAATTTAATGGCATTTGTAGCCACAAAA +ATGTTAGAGAGACAAGAAGATTTAGACACATGCACTGAAATGCAAGTAGAAAAAATGAAAACGTCAACAAAAGCCAGGTT +GAAAACAGAATCTTCTTTTGCACCTAGAACATGGGAAGATGCAATAAAAGATGGTGAGCTTCTATTCAACGGGACGATTC +TGCAAGCAGAGTCTCCTACAATGACGCCAGCGTCCGTAGAAATGAAGGGGAAGAAATTTCCTATTGATTTTGCTCCAAGA +AACATAGCACCAATTGGGCAAAATCCAATATATTTGTCACCATGTATTCCTAACTTTGATGGAAACGTCTGGGAAGCAAC +GATGTATCATCATCGTGGAGCAACTTTGACAAAGACAATGAATTGCAACTGTTTTCAAAGAACAATTTGGTGCCATCCAA +ATCCTTCACGTATGAGATTGAGCTATGCATTTGTTTTGTATTGCAGAAATACTAAGAAGATCTGTGGATACCTCATCGCT +AGACAAGTGGCCGGAATTGAAACAGGAATTAGAAAATGTTTCAGATGCATTAAAAGCGGATTCGTTATGGCTACCGATGA +AATCTCTCTCACTATACTCCAAAGTATCAAATCAGGAGCCCAGCTCGATCCCTATTGGGGAAATGAAACACCAGATATTG +ACAAGACTGAAGCTTATATGCTCTCGCTTAGAGAAGCTGGACCTTAACCTGAGCAAAGCAGTCTTAGGAATCCAAAATTC +TGAAGATCTTATTTTGATCATATATAACAGAGATGTTTGTAAAAACACTATATTAATGATAAAATCTTTGTGTAATTCAC +TTATATAATTGTTTTAAGTTGTTATTCCAAAGTTAAAAAACCCCTTGCTCCTGCT +>NC_007357.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) polymerase (PB2) gene, complete cds +AGCAAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAACTAAGAGATCTAATGTCGCAGTCCCGCACTCGCGA +GATACTAACAAAAACCACTGTGGATCATATGGCCATAATCAAGAAATACACATCAGGAAGACAAGAGAAGAACCCTGCTC +TCAGAATGAAATGGATGATGGCAATGAAATATCCAATCACAGCAGACAAGAGAATAATGGAGATGATTCCTGAAAGGAAT +GAGCAAGGACAAACGCTTTGGAGCAAGACAAATGATGCTGGGTCGGACAGAGTGATGGTGTCTCCCCTAGCTGTAACTTG +GTGGAACAGGAATGGGCCGACAACAAGTACAGTCCATTATCCAAAGGTTTACAAAACATACTTTGAGAAGGTTGAAAGGT +TAAAACATGGAACCTTCGGTCCCGTTCATTTCCGAAACCAAGTTAAAATACGTCGCCGGGTGGATATAAACCCGGGCCAT +GCAGATCTCAGTGCTAAAGAAGCACAAGATGTTATCATGGAGGTCGTTTTCCCAAATGAAGTGGGAGCTAGAATATTGAC +ATCAGAGTCGCAATTGACAATAACAAAAGAGAAGAAAGAAGAGCTCCAGGATTGTAAAATTGCTCCTTTAATGGTGGCAT +ACATGTTGGAAAGAGAACTGGTCCGCAAAACCAGATTTCTACCGGTAGCAGGCGGAACAAGCAGTGTGTACATTGAGGTA +TTGCATTTGACTCAAGGGACCTGTTGGGAACAGATGTACACTCCCGGCGGAGAAGTAAGAAATGATGATGTTGACCAGAG +TTTGATCATCGCTGCCAGAAACATTGTTAGGAGAGCAACAGTATCAGCGGACCCACTGGCATCACTCTTGGAGATGTGTC +ACAGCACACAAATTGGGGGAATAAGGATGGTGGACATCCTTAGGCAAAACCCAACTGAGGAGCAAGCTGTGGATATATGC +AAAGCAGCAATGGGTTTGAGGATCAGTTCATCCTTTAGCTTTGGAGGCTTCACTTTCAAAAGAACAAATGGATCATCCGT +CAAGAAGGAAGAGGAAGTGCTTACAGGCAACCTCCAAACATTGAAAATAAAAGTACATGAGGGGTATGAAGAATTCACAA +TGGTTGGGCGGAGAGCAACAGCTATCCTGAGGAAAGCAACTAGAAGGCTGATTCAGTTGATAGTAAGTGGAAGAGATGAA +CAATCAATCGCTGAAGCGATCATTGTAGCAATGGTGTTCTCACAGGAGGATTGCATGATAAAGGCAGTCCGAGGCGATCT +GAATTTCGTGAACAGAGCAAACCAAAGATTGAACCCCATGCATCAACTCCTGAGGCACTTCCAAAAAGATGCAAAAGTGC +TGTTTCAGAACTGGGGAATTGAACCTATTGACAATGTCATGGGGATGATCGGAATATTACCTGACATGACTCCAAGCGCA +GAGATGTCACTGAGAGGAGTGAGAGTTAGTAAGATGGGAGTAGATGAATATTCCAGCACGGAGAGAGTGGTGGTGAGTAT +TGACCGTTTCTTGAGGGTCCGAGATCAGCAGGGGAACGTACTCTTATCTCCTGAAGAGGTTAGTGAAACACAGGGAACAG +AGAAGTTGACAATAACATATTCATCCTCAATGATGTGGGAAATCAACGGTCCTGAGTCAGTGCTTGTTAACACTTATCAA +TGGATCATCAGGAATTGGGAGACTGTAAAGATTCAATGGTCTCAAGATCCCACAATGCTGTACAATAAGATGGAGTTTGA +ATCGTTCCAATCCTTGGTGCCAAAGGCTGCCAGAAGCCAATATAGTGGATTTGTGAGAACACTATTCCAACAGATGCGTG +ATGTTTTGGGGACATTTGATACTGTCCAAATAATCAAGCTGCTACCATTTGCAGCAGCCCCACCGGAGCCGAGCAGAATG +CAGTTTTCTTCTCTAACTGTGAATGTGAGAGGCTCAGGAATGAGAATACTCGTGAGGGGTAACTCCCCCGTGTTCAACTA +CAACAAGGCAACCAAAAGGCTTACAGTCCTCGGAAAGGACGCAGGTGCATTAACAGAAGATCCAGACGAGGGAACAGCCG +GGGTGGAATCTGCAGTATTGAGGGGATTCCTAATTCTAGGCAGAGAGGACAAAAGATATGGACCCGCATTGAGCATCAAT +GAACTGAGCAATCTTGCAAAAGGGGAGAAGGCTAATGTATTGATAATGCAAGGAGACGTGGTGTTGGTAATGAAACGGAA +ACGGGACTTTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTTGAATAGTTT +AAAAACGACCTTGTTTCTACT +>NC_007358.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PB1) and PB1-F2 protein (PB1-F2) genes, complete cds +AGCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTTTACTTTTCTTAAAAGTGCCAGCGCAAAATGCTATAAG +TACCACATTCCCTTATACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAACAGAA +CACATCAATATTCAGAAAAGGGGAAATGGACAACGAACACAGAGACTGGAGCACCCCAACTCAATCCGATTGATGGACCA +CTACCTGAGGATAATGAGCCGAGTGGGTATGCACAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCCCA +CCCAGGGATCTTTGAAAACTCGTGTCTTGAAACGATGGAAGTTGTTCAGCAAACAAGAGTGGATAAGCTGACCCAAGGTC +GCCAAACCTATGACTGGACATTGAAAAGAAACCAGCCGGCTGCAACCGCTTTGGCCAACACTATAGAGGTCTTCAGATCG +AATGGTCTAACAGCCAATGAATCGGGAAGGCTAATAGATTTCCTCAAAGACGTGATGGAATCAATGGATAAGGGAGAAAT +GGAAATAATAACACATTTCCAGAGAAAGAGAAGAGTGAGGGACAACATGACCAAGAAAATGGTCACACAAAGAACAATAG +GGAAGAAAAAACAAAGGCTGAACAAAAGGAGCTACCTAATAAGAGCACTGACACTGAACACAATGACAAAAGACGCAGAA +AGAGGCAAATTGAAGAGGCGGGCAATTGCAACACCCGGGATGCAAATCAGAGGATTCGTGTACTTTGTCGAAACACTAGC +GAGGAGTATCTGTGAGAAACTTGAGCAATCTGGACTCCCCGTCGGAGGGAATGAAAAGAAGGCTAAATTGGCAAATGTCG +TGAGGAAGATGATGACTAACTCACAAGATACAGAGCTCTCTTTTACAATTACTGGAGACAACACCAAATGGAATGAGAAT +CAGAACCCTCGGATGTTTCTAGCAATGATAACATACATCACAAGGAACCAACCTGAATGGTTTAGAAATGTCTTAAGCAT +TGCTCCTATAATGTTCTCAAACAAGATGGCAAGATTAGGGAAAGGATACATGTTCGAAAGTAAGAGCATGAAGCTACGGA +CACAAATACCAGCAGAAATGCTTGCAAGCATTGACTTGAAATACTTCAACGAATCAACGAGAAAGAAAATCGAGAAAATA +AGACCTCTACTAATAGATGGCACAGCCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAATATGCTGAGTACAGTCTT +AGGAGTTTCAATCCTGAATCTTGGGCAGAAGAGGTACACCAAAACCACATACTGGTGGGACGGACTCCAATCCTCTGATG +ATTTCGCTCTCATAGTGAATGCACCAAATCATGAGGGAATAGAAGCAGGGGTGGATAGGTTCTATAGGACTTGCAAACTA +GTTGGAATCAATATGACCAAGAAGAAGTCTTACATAAATCGGACAGGAACATGTGAATTCACAAGCTTCTTCTACCGCTA +TGGGTTCGTAGCCAACTTCAGTATGGAGCTGCCCAGCTTTGGAGTGTCTGGGATTAATGAATCGGCTGACATGAGCATTG +GTGTTACAGTGATAAAGAACAATATGATGGACAACGACCTTGGACCAGCAACAGCTCAGATGGCTCTTCAGCTATTCATT +AAGGACTACAGATACCCATACCGATGCCACAGGGGGGATACACAAATCCAAACGAGGAGATCATTCGAGCTGAAGAAGCT +GTGGGAGCAGACCCGCTCAAAGGCAGGACTGTTGGTTTCAGATGGAGGACCAAACCCATACAATATCCGGAATCTCCACA +TTCCGGAGGCTGGCTTGAAGTGGGAATTGATGGATGAAGACTACCAGGGCAGACTGTGTAATCCTCTGAACCCGTTTGTT +AGTCATAAGGAAATTGAGTCTGTCAACAATGCTGTGGTAATGCCAGCTCATGGCCCAGCCAAGAGCATGGAATATGATGC +AGTTGCGACTACACATTCATGGATTCCCAAGAGGAATCGTTCCATTCTCAACACCAGCCAAAGGGGGATTCTTGAGGATG +AACAGATGTATCAGAAGTGCTGCAATCTATTCGAGAAATTCTTCCCTAGCAGTTCATATCGGAGGCCAGTTGGAATTTCC +AGCATGGTGGAGGCCATGGTGTCTAGGGCCCGAATTGATGCACGAATTGACTTCGAGTCTGGAAGGATTAAGAAAGAAGA +GTTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCGGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATG +AAAAAATGCCTTGTTTCTACT +>NC_007359.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) polymerase (PA) and PA-X protein (PA-X) genes, complete cds +AGCAAAAGCAGGTACTGATCCAAAATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATTGTCGAGCTTGCGGAAAA +GGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAAACGAACAAATTTGCCGCAATATGCACGCACTTAGAAGTCTGTT +TCATGTATTCAGATTTCCACTTTATTGATGAACGGGGCGAATCAACAATTATAGAATCTGGCGATCCCAATGCATTATTG +AAACACCGGTTTGAAATAATCGAAGGGAGGGACCGAACAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGG +AGTTGAGAAGCCTAAATTTCTCCCAGATTTGTATGACTACAAGGAGAACCGATTTATTGAAATTGGAGTGACACGGAGGG +AAGTTCACACATACTATCTAGAAAAAGCCAACAAGATAAAATCTGAGAAGACACACATTCACATATTCTCATTCACTGGA +GAGGAAATGGCCACCAAAGCGGACTACACCCTTGATGAAGAAAGCAGGGCCCGAATCAAAACCAGGCTGTTCACTATAAG +GCAGGAAATGGCCAGTAGGGGTTTATGGGATTCCTTTCGTCAGTCCGAGAGAGGCGAAGAGACAGTTGAAGAAAGATTTG +AAATCACAGGGACTATGTGCAGGCTTGCCGACCAAAGTCTCCCACCTAATTTCTCCAGCCTTGAAAAATTTAGAGCCTAT +GTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCGAAAGAAGTAAACGCCAGAATTGAGCC +ATTTCTGAAGACAACACCACGCCCTCTTAGATTACCTGATGGGCCTCCCTGCTCTCAGCGGTCGAAGTTTTTGCTGATGG +ATGCCCTTAAATTAAGCATCGAAGACCCGAGTCATGAGGGGGAGGGGATACCGCTATATGATGCAATCAAATGCATGAAA +ACATTTTTCGGCTGGAAAGAGCCCAACATTGTAAAACCACATGAAAAAGGCATAAACCCCAATTACCTCCTGGCTTGGAA +GCAGGTGCTGGCAGAGCTCCAAGATATTGAAAACGAGGAGAAAATTCCAAAGACAAAGAACATGAGGAAAACAAGCCAAT +TGAAGTGGGCACTTGGTGAGAATATGGCACCAGAGAAAGTAGACTTTGAGGATTGCAAAGATGTTAGCGATCTAAGGCAG +TATGACAGTGATGAACCAAAGCCTAGATCACTAGCAAGCTGGATCCAGAGTGAATTCAACAAGGCATGCGAATTGACAGA +TTCAAGTTGGATTGAACTTGATGAAATAGGGGAAGACGTTGCTCCAATTGAGCACATTGCAAGTATGAGAAGGAACTATT +TCACAGCGGAAGTATCCCATTGCAGGGCTACTGAATACATAATGAAGGGAGTGTACATAAACACAGCTTTGTTGAATGCA +TCCTGTGCAGCCATGGATGACTTCCAACTGATCCCAATGATAAGCAAATGCAGAACCAAAGAAGGAAGACGGAAAACTAA +CCTGTATGGATTCCTTATAAAAGGAAGATCCCATTTGAGAAATGACACCGATGTGGTAAACTTTGTGAGTATGGAATTCT +CTCTTACTGATCCGAGGCTGGAGCCACACAGATGGGAAAAGTACTGCGTTCTTCGGATAGGAGACATGCTCTTACGGACT +GAAATAGGCCAAGTGTCAAGGCCCATGTTTCTTTATGTGAGAACCAATGGAACCTCCAAGATCAAGATGAAATGGGGCAT +GGAAATGAGGCGATGCCCTTTTCAATCCCTTCAACAGATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAAAAAG +ACATGACTAAAGAATTCTTTGAAAACAAATCAGAAACATGGCCAATTGGAGAATCACCCAAGGGAGTGGAGGAAGGCTCC +ATCGGGAAGGTGTGCAGAACCTTACTGGCTAAATCTGTTTTCAACAGTCTATATGCATCTCCACAACTCGAGGGGTTTTC +AGCTGAATCAAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGC +TATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACA +CATGCACTAAGATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>NC_007362.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) hemagglutinin (HA) gene, complete cds +GCAGGGGTATAATCTGTCAAAATGGAGAAAATAGTGCTTCTTCTTGCAATAGTCAGTCTTGTCAAAAGTGATCAGATTTG +CATTGGTTACCATGCAAACAACTCGACAGAGCAGGTTGACACAATAATGGAAAAGAACGTTACTGTTACACATGCCCAAG +ACATACTGGAAAAGACACACAATGGGAAGCTCTGCGATCTAAATGGAGTGAAGCCTCTCATTTTGAGAGATTGTAGTGTA +GCTGGATGGCTCCTCGGAAACCCTATGTGTGACGAATTCATCAATGTGCCGGAATGGTCTTACATAGTGGAGAAGGCCAG +TCCAGCCAATGACCTCTGTTACCCAGGGGATTTCAACGACTATGAAGAACTGAAACACCTATTGAGCAGAACAAACCATT +TTGAGAAAATTCAGATCATCCCCAAAAGTTCTTGGTCCAATCATGATGCCTCATCAGGGGTGAGCTCAGCATGTCCATAC +CATGGGAGGTCCTCCTTTTTCAGAAATGTGGTATGGCTTATCAAAAAGAACAGTGCATACCCAACAATAAAGAGGAGCTA +CAATAATACCAACCAAGAAGATCTTTTAGTACTGTGGGGGATTCACCATCCTAATGATGCGGCAGAGCAGACAAAGCTCT +ATCAAAACCCAACCACTTACATTTCCGTTGGAACATCAACACTGAACCAGAGATTGGTTCCAGAAATAGCTACTAGACCC +AAAGTAAACGGGCAAAGTGGAAGAATGGAGTTCTTCTGGACAATTTTAAAGCCGAATGATGCCATCAATTTCGAGAGTAA +TGGAAATTTCATTGCTCCAGAATATGCATACAAAATTGTCAAGAAAGGGGACTCAGCAATTATGAAAAGTGAATTGGAAT +ATGGTAACTGCAACACCAAGTGTCAAACTCCAATGGGGGCGATAAACTCTAGTATGCCATTCCACAACATACACCCCCTC +ACCATCGGGGAATGCCCCAAATATGTGAAATCAAACAGATTAGTCCTTGCGACTGGACTCAGAAATACCCCTCAGAGAGA +GAGAAGAAGAAAAAAGAGAGGACTATTTGGAGCTATAGCAGGTTTTATAGAGGGAGGATGGCAGGGAATGGTAGATGGTT +GGTATGGGTACCACCATAGCAATGAGCAGGGGAGTGGATACGCTGCAGACAAAGAATCCACTCAAAAGGCAATAGATGGA +GTCACCAATAAGGTCAACTCGATCATTGACAAAATGAACACTCAGTTTGAGGCCGTTGGAAGGGAATTTAATAACTTGGA +AAGGAGGATAGAGAATTTAAACAAGCAGATGGAAGACGGATTCCTAGATGTCTGGACTTATAATGCTGAACTTCTGGTTC +TCATGGAAAATGAGAGAACTCTAGACTTTCATGACTCAAATGTCAAGAACCTTTATGACAAGGTCCGACTACAGCTTAGG +GATAATGCAAAGGAGCTGGGTAATGGTTGTTTCGAGTTCTATCACAAATGTGATAATGAATGTATGGAAAGTGTAAAAAA +CGGAACGTATGACTACCCGCAGTATTCAGAAGAAGCAAGACTAAACAGAGAGGAAATAAGTGGAGTAAAATTGGAATCAA +TGGGAACTTACCAAATACTGTCAATTTATTCAACAGTGGCGAGTTCCCTAGCACTGGCAATCATGGTAGCTGGTCTATCT +TTATGGATGTGCTCCAATGGATCGTTACAATGCAGAATTTGCATTTAAATTTGTGAGTTCAGATTGTAGTTAAAAACACC +>NC_007360.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) nucleocapsid protein (NP) gene, complete cds +AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCAACATCATGGCGTCTCAGGGCACCAAACGATCTTATGAACA +GATGGAAACTGGTGGAGAACGCCAGAATGCTACTGAGATCAGAGCATCTGTTGGAAGAATGGTTGGTGGAATTGGGAGGT +TTTATATACAGATGTGCACTGAACTCAAACTCAGCGACTATGAAGGAAGGCTGATTCAGAACAGCATAACAATAGAGAGA +ATGGTTCTCTCTGCATTTGATGAAAGGAGGAACAAATACCTGGAAGAACATCCCAGTGCGGGGAAGGACCCAAAGAAAAC +TGGAGGTCCAATCTACCGAAGAAGAGACGGAAAATGGGTGAGAGAGCTGATTCTGTATGACAAAGAGGAGATCAGGAGAA +TTTGGCGTCAAGCGAACAATGGAGAAGATGCAACTGCTGGTCTCACTCACATGATGATCTGGCATTCCAATCTAAATGAT +GCCACATACCAGAGAACAAGAGCTCTCGTGCGTACTGGGATGGACCCTAGAATGTGCTCTCTGATGCAAGGATCAACTCT +CCCGAGGAGATCTGGAGCTGCTGGTGCGGCAGTAAAGGGAGTCGGAACGATGGTGATGGAACTAATTCGGATGATAAAGC +GAGGGATTAACGATCGGAATTTCTGGAGAGGTGAAAATGGGCGAAGAACAAGAATTGCATATGAGAGAATGTGCAACATC +CTCAAAGGGAAATTCCAAACAGCAGCACAAAGAGCAATGATGGATCAGGTACGGGAAAGCAGAAATCCTGGGAATGCTGA +GATTGAAGATCTCATATTTCTGGCACGGTCTGCACTCATCCTGAGAGGATCAGTGGCCCACAAGTCCTGCTTGCCTGCTT +GTGTGTACGGGCTTGCCGTGGCCAGTGGATATGACTTTGAGAGAGAAGGGTACTCTCTGGTCGGGATTGATCCTTTCCGT +CTGCTGCAAAACAGCCAGGTCTTTAGTCTAATTAGACCAAATGAGAATCCAGCACATAAAAGTCAATTGGTGTGGATGGC +ATGCCATTCTGCAGCATTTGAAGATCTGAGAGTCTCAAGCTTCATCAGAGGGACAAGAGTGGCCCCAAGGGGACAACTAT +CTACTAGAGGAGTTCAAATTGCTTCAAATGAGAACATGGAAACAATGGACTCCAGCACTCTTGAACTGAGAAGCAGATAT +TGGGCTATAAGGACCAGGAGTGGAGGAAACACCAACCAGCAGAGAGCATCTGCAGGACAAATCAGTGTGCAGCCTACTTT +CTCGGTACAGAGAAATCTTCCCTTCGAAAGAGCGACCATTATGGCGGCATTCACAGGGAATACAGAGGGCAGAACATCTG +ACATGAGGACTGAAATCATAAGGATGATGGAAAGCTCCAGACCAGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAG +CTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAA +TGCAGAGGAATATGACAATTGAAGAAAAATACCCTTGTTTCTACT +>NC_007361.1 Influenza A virus (A/Goose/Guangdong/1/96(H5N1)) neuraminidase (NA) gene, complete cds +AGCAAAAGCAGGAGATTAAAATGAATCCAAATCAGAAGATAATAACCATTGGATCAATCTGTATGGTAGTTGGGATAATT +AGCTTGATGTTACAAATTGGGAACATAATCTCAATATGGGTCAGTCATTCAATTCAGACAGGGAATCAACACCAAGCTGA +ACCATGCAATCAAAGCATTATTACTTATGAAAACAACACCTGGGTAAATCAAACATATGTCAACATCAGCAATACCAATT +TTCTTACTGAAAAAGCTGTGGCTTCAGTAACATTAGCGGGCAATTCATCTCTTTGCCCCATTAGCGGATGGGCTGTACAC +AGTAAGGACAACGGTATAAGAATCGGTTCCAAGGGGGATGTGTTTGTTATAAGAGAGCCGTTCATCTCATGCTCCCACTT +GGAATGCAGAACTTTCTTTTTGACTCAGGGAGCCTTGCTGAATGACAAGCACTCCAATGGGACCGTCAAAGACAGAAGCC +CTCACAGAACATTGATGAGTTGTCCTGTGGGTGAGGCTCCCTCCCCATATAACTCAAGGTTTGAGTCTGTTGCTTGGTCG +GCAAGTGCTTGCCATGATGGCACCAGTTGGTTGACAATTGGAATTTCTGGCCCAGACAATGGGGCTGTGGCTGTATTGAA +ATACAACGGCATAATAACAGACACTATCAAGAGTTGGAGGAACAACATACTGAGAACTCAAGAGTCTGAATGTGCATGTG +TAAATGGCTCTTGCTTTACTGTAATGACTGACGGACCAAGTAATGGGCAGGCCTCATATAAGATCTTCAAAATGGAAAAA +GGGAAAGTAGTTAAATCAGTCGAATTGAATGCCCCTAATTATCACTATGAGGAGTGCTCCTGTTATCCTGATGCTGGCGA +AATCACATGTGTGTGCAGGGATAATTGGCATGGCTCAAATCGGCCATGGGTATCTTTCAATCAAAATTTGGAGTATCAAA +TAGGATATATATGCAGTGGAGTTTTCGGAGACAATCCACGCCCCAATGATGGAACAGGCAGTTGTGGTCCGGTGTCCCCT +AACGGGGCATATGGAGTAAAAGGGTTTTCATTTAAATACGGCAATGGTGTTTGGATCGGGAGAACCAAAAGCACTAATTC +CAGGAGCGGCTTTGAAATGATTTGGGATCCAAATGGGTGGACTGGAACGGACAGTAGCTTCTCGGTGAAACAAGATATCG +TAGCAATAACTGATTGGTCAGGATATAGCGGGAGTTTTGTCCAGCATCCAGAACTGACAGGATTAGATTGCATAAGACCT +TGTTTCTGGGTTGAGCTAATCAGAGGGCGGCCCAAAGAGAGCACAATTTGGACTAGTGGGAGCAGCATATCTTTTTGTGG +TGTAAATAGTGACACTGTGGGTTGGTCTTGGCCAGACGATGCCGAGTTGCCATTCACCATTGACAAGTAGTTTGTTCAAA +AAACTCCTTGTTTCTACT +>NC_007363.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 7, complete sequence +AGCAAAAGCAGGTAGATATTGAAAAATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCAGGCC +CCCTCAAAGCCGAGATCGCGCAGAGACTTGAGGATGTCTTTGCAGGAAAGAACACCGATCTCGAGGCTCTCATGGAATGG +CTAAAGACAAGACCAATCCTGTCACCTCTGACTAAAGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCG +AGGACTGCAGCGTAGACGCTTTGTCCAGAATGCCTTAAATGGAAATGGAGATCCAAACAATATGGATAGGGCAGTTAAGC +TATACAAGAAGCTGAAAAGAGAAATAACATTCCATGGGGCTAAGGAGGTCGCACTCAGCTACTCAACCGGTGCACTTGCC +AGTTGTATGGGTCTCATATACAACAGGATGGGAACGGTGACCACAGAAGTGGCTTTTGGCCTAGTGTGTGCCACTTGTGA +GCAGATTGCAGATTCACAGCATCGGTCTCACAGACAGATGGCAACTACCACCAACCCACTAATCAGGCATGAGAACAGAA +TGGTGCTGGCCAGCACTACAGCTAAGGCTATGGAGCAGATGGCTGGATCGAGTGAGCAGGCAGCGGAAGCCATGGAGGTT +GCTAGTCAGGCTAGGCAGATGGTGCAGGCAATGAGGACAATTGGGACTCATCCTAGCTCCAGTGCCGGTCTGAAAGATAA +TCTTCTTGAAAATTTGCAGGCCTACCAAAAACGAATGGGAGTGCAAATGCAGCGATTCAAGTGATCCTCTTGTTGTTGCC +GCAAGTATCATTGGGATACTGCACTTGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGCCTTAA +ATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGGGTACCTGAGTCTATGAGGGAAGAGTATCGGCAGGAACAGCAGAGTG +CTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>NC_007364.1 Influenza A virus (A/goose/Guangdong/1/1996(H5N1)) segment 8, complete sequence +GTGACAAAGACATAATGGATTCCAACACGATAACCTCGTTTCAGGTAGATTGTTATCTATGGCACATAAGAAAGCTACTC +AGTATGAGAGACATGTGTGATGCCCCCTTTGATGACAGGCTCCGAAGAGACCAAAAGGCATTAAAGGGAAGAGGCAGCAC +ACTTGGACTCGATTTAAGAGTGGCTACAATGGAGGGGAAAAAGATCGTTGAGGACATCCTGAAGAGTGAGACAAATGAAA +ACCTCAAAATAGCCATTGCTTCCAGTCCTGCTCCTCGGTATATCACCGATATGAGCATAGAGGAGATGAGCCGAGAATGG +TACATGCTGATGCCTAGGCAGAAAATAACTGGAGGCCTTATGGTGAAAATGGACCAAGCCATAATGGATAAAAGAATTAT +CCTTAAAGCAAATTTCTCAGTTCTATTTGATCAACTAGAGACATTAGTCTCTCTGAGGGCATTCACAGAAAGTGGTGCTA +TTGTGGCTGAAATATTTCCCATTCCCTCCGTACCAGGACATTTTACAGAGGATGTCAAAAATGCAATTGGAATCCTCATC +GGTGGACTTGAATGGAATGATAACTCAATTCGAGCGTCTGAAAATATACAGAGATTCGCTTGGGGAATCCATGATGAGAA +TGGGGGACCTTCACTCCCTCCAAAACAGAAACGCTACATGGCGAAACGAGTTGAGTCAGAAGTTTGAAGAGATCAGATGG +CTCATTGCTGAATGTAGAAATATACTGACAAAGACTGAAAATAGCTTTGAACAGATAACATTTTTGCAAGCATTGCAACT +CTTACTTGAAGTTGAGAGTGAGATAAGGACCTTCTCTTTTCAGCTTATTTAATACTAAAAAACAC +>NC_007373.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 1, complete sequence +AGCAAAAGCAGGTCAATTATATTCAGTATGGAAAGAATAAAAGAACTACGGAACCTGATGTCGCAGTCTCGCACTCGCGA +GATACTGACAAAAACCACAGTGGACCATATGGCCATAATTAAGAAGTACACATCGGGGAGACAGGAAAAGAACCCGTCAC +TTAGGATGAAATGGATGATGGCAATGAAATACCCAATCACTGCTGACAAAAGGATAACAGAAATGGTTCCGGAGAGAAAT +GAACAAGGACAAACTCTATGGAGTAAAATGAGTGATGCTGGATCAGATCGAGTGATGGTATCACCTTTGGCTGTAACATG +GTGGAATAGAAATGGACCCGTGGCAAGTACGGTCCATTACCCAAAAGTATACAAGACTTATTTTGACAAAGTCGAAAGGT +TAAAACATGGAACCTTTGGCCCTGTTCATTTTAGAAATCAAGTCAAGATACGCAGAAGAGTAGACATAAACCCTGGTCAT +GCAGACCTCAGTGCCAAAGAGGCACAAGATGTAATTATGGAAGTTGTTTTTCCCAATGAAGTGGGAGCCAGGATACTAAC +ATCAGAATCGCAATTAACAATAACTAAAGAGAAAAAAGAAGAACTCCGAGATTGCAAAATTTCTCCCTTGATGGTTGCAT +ACATGTTAGAGAGAGAACTTGTCCGAAAAACAAGATTTCTCCCAGTTGCTGGCGGAACAAGCAGTATATACATTGAAGTC +TTACATTTGACTCAAGGAACGTGTTGGGAACAAATGTACACTCCAGGTGGAGAAGTGAGGAATGACGATGTTGACCAAAG +CCTAATTATTGCGGCCAGGAACATAGTAAGAAGAGCTGCAGTATCAGCAGATCCACTAGCATCTTTATTGGAGATGTGCC +ACAGCACACAAATTGGCGGGACAAGGATGGTGGACATTCTTAGACAGAACCCGACTGAAGAACAAGCTGTGGATATATGC +AAGGCTGCAATGGGATTGAGAATCAGCTCATCCTTCAGCTTTGGTGGGTTTACATTTAAAAGAACAAGCGGGTCATCAGT +CAAAAAAGAGGAAGAAGTGCTTACAGGCAATCTCCAAACATTGAAGATAAGAGTACATGAGGGGTATGAGGAGTTCACAA +TGGTGGGGAAAAGAGCAACAGCTATACTCAGAAAAGCAACCAGAAGATTGGTTCAGCTCATAGTGAGTGGAAGAGACGAA +CAGTCAATAGCCGAAGCAATAATCGTGGCCATGGTGTTTTCACAAGAGGATTGCATGATAAAAGCAGTTAGAGGTGACCT +GAATTTCGTCAACAGAGCAAATCAACGGTTGAACCCCATGCATCAGCTTTTAAGGCATTTTCAGAAAGATGCGAAAGTGC +TTTTTCAAAATTGGGGAATTGAACACATCGACAGTGTGATGGGAATGGTTGGAGTATTACCAGATATGACTCCAAGCACA +GAGATGTCAATGAGAGGAATAAGAGTCAGCAAAATGGGTGTGGATGAATACTCCAGTACAGAGAGGGTGGTGGTTAGCAT +TGATCGGTTTTTGAGAGTTCGAGACCAACGCGGGAATGTATTATTGTCTCCTGAGGAGGTCAGTGAAACACAGGGAACTG +AAAGATTGACAATAACATATTCATCGTCGATGATGTGGGAGATTAACGGTCCTGAGTCGGTTTTGGTCAATACCTATCAA +TGGATCATCAGAAATTGGGAAGCTGTCAAAATTCAATGGTCTCAGAATCCTGCAATGTTGTACAACAAAATGGAATTTGA +ACCATTTCAATCTTTAGTCCCCAAGGCCATTAGAAGCCAATACAGTGGGTTTGTCAGAACTCTATTCCAACAAATGAGAG +ACGTACTTGGGACATTTGACACCACCCAGATAATAAAGCTTCTCCCTTTTGCAGCCGCTCCACCAAAGCAAAGCAGAATG +CAGTTCTCTTCACTGACTGTAAATGTGAGGGGATCAGGGATGAGAATACTTGTAAGGGGCAATTCTCCTGTATTCAACTA +CAACAAGACCACTAAAAGACTAACAATTCTCGGAAAAGATGCCGGCACTTTAATTGAAGACCCAGATGAAAGCACATCCG +GAGTGGAGTCCGCCGTCTTGAGAGGGTTTCTCATTATAGGTAAGGAAGACAGAAGATACGGACCAGCATTAAGCATCAAT +GAACTGAGTAACCTTGCAAAAGGGGAAAAGGCTAATGTGCTAATCGGGCAAGGAGACGTGGTGTTGGTAATGAAACGAAA +ACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAATGTTGAATAGTTT +AAAAACGACCTTGTTTCTACT +>NC_007372.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 2, complete sequence +AGCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACTCTACTGTTCCTAAAGGTTCCAGCGCAAAATGCCATAAG +CACCACATTCCCTTATACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAACAGAA +CACACCAATATTCAGAGAAGGGGAAGTGGACGACAAATACAGAAACTGGGGCACCCCAACTCAACCCAATTGATGGACCA +CTACCTGAGGATAATGAGCCAAGTGGATATGCACAAACAGACTGTGTCCTGGAGGCTATGGCCTTCCTTGAAGAATCCCA +CCCAGGTATCTTTGAGAACTCATGCCTTGAAACAATGGAAGTCGTTCAACAAACAAGGGTGGACAAACTAACCCAAGGCC +GCCAGACTTATGATTGGACATTAAACAGAAATCAACCGGCAGCAACTGCATTAGCCAACACCATAGAAGTTTTTAGATCG +AATGGACTAACAGCCAATGAATCAGGAAGGCTAATAGATTTCCTCAAGGATGTGATGGAATCAATGGATAAAGAGGAAAT +GGAGATAACAACACACTTTCAAAGAAAAAGGAGAGTAAGAGACAACATGACCAAGAAAATGGTCACACAAAGAACAATAG +GGAAGAAAAAACAAAGAGTGAATAAGAGAGGCTATCTAATAAGAGCTTTGACATTGAACACGATGACCAAAGATGCAGAG +AGAGGTAAATTAAAAAGAAGGGCTATTGCAACACCCGGGATGCAAATTAGAGGGTTCGTGTACTTCGTTGAAACTTTAGC +TAGAAGCATTTGCGAAAAGCTTGAACAGTCTGGACTTCCGGTTGGGGGTAATGAAAAGAAGGCCAAACTGGCAAATGTTG +TGAGAAAAATGATGACTAATTCACAAGACACTGAGCTTTCTTTCACAATCACTGGGGACAACACTAAGTGGAATGAAAAT +CAAAACCCTCGAATGTTTTTGGCGATGATTACATATATCACAAAAAATCAACCTGAGTGGTTCAGAAACATCCTGAGCAT +CGCACCAATAATGTTCTCAAACAAAATGGCAAGACTAGGAAAAGGATACATGTTCGAGAGTAAGAGAATGAAGCTCCGAA +CACAAATACCCGCAGAAATGCTAGCAAGCATTGACCTGAAGTATTTCAATGAATCAACAAGGAAGAAAATTGAGAAAATA +AGGCCTCTTCTAATAGATGGCACAGCATCATTGAGCCCTGGGATGATGATGGGCATGTTCAACATGCTAAGTACGGTTTT +AGGAGTCTCGGTACTGAATCTTGGGCAAAAGAAATACACCAAGACAACATACTGGTGGGATGGGCTCCAATCCTCCGACG +ATTTTGCCCTCATAGTGAATGCACCAAATCATGAGGGAATACAAGCAGGAGTGGATAGATTCTACAGGACCTGCAAGTTA +GTGGGAATCAACATGAGCAAAAAGAAGTCCTATATAAATAAAACAGGGACATTTGAATTCACAAGCTTTTTTTATCGATA +TGGATTTGTGGCTAATTTTAGCATGGAGCTTCCCAGTTTTGGAGTGTCTGGAATAAACGAGTCAGCTGATATGAGTATTG +GAGTAACAGTGATAAAGAACAACATGATAAACAATGACCTTGGGCCAGCAACAGCCCAGATGGCTCTCCAATTGTTCATC +AAAGACTACAGATATACATATAGGTGCCATAGAGGAGACACACAAATTCAGACGAGAAGATCATTCGAGCTAAAGAAGCT +GTGGGATCAAACCCAATCAAGGGCAGGACTATTGGTATCAGATGGGGGACCAAACTTATACAATATCCGGAACCTTCACA +TCCCTGAAGTCTGCTTAAAGTGGGAGCTAATGGATGAGAATTATCGGGGAAGACTTTGTAACCCCCTGAATCCCTTTGTC +AGCCATAAAGAAATTGAGTCTGTAAACAATGCTGTAGTGATGCCAGCCCACGGTCCAGCCAAAAGTATGGAATATGATGC +CGTTGCAACTACACACTCCTGGAATCCCAAGAGGAACCGCTCTATTCTAAACACTAGCCAAAGGGGAATTCTTGAGGATG +AACAGATGTACCAAAAGTGCTGCAACTTGTTCGAGAAATTTTTCCCTAGTAGTTCATATAGGAGACCGATTGGAATTTCT +AGCATGGTGGAGGCCATGGTGTCTAGGGCCCGGATTGATGCCAGAATTGACTTCGAGTCTGGACGGATTAAGAAGGAAGA +GTTCTCTGAGATCATGAAGATCTGTTCCACCATTGAAGAACTCAGACGGCAAAAATAATGAATTTAGCTTGTCCTTCATG +AAAAAATGCCTTGTTTCTACT +>NC_007371.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 3, complete sequence +AGCAAAAGCAGGTACTGATTCGAAATGGAAGATTTTGTGCGACAATGCTTCAACCCGATGATTGTCGAACTTGCAGAAAA +AGCAATGAAAGAGTATGGAGAGGATCTGAAAATTGAAACAAACAAATTTGCAGCAATATGCACCCACTTGGAGGTATGTT +TCATGTATTCAGATTTTCATTTCATCAATGAACAAGGCGAATCAATAGTGGTAGAACTTGATGATCCAAATGCACTGTTA +AAGCACAGATTTGAAATAATCGAGGGGAGAGACAGAACAATGGCCTGGACAGTAGTAAACAGTATCTGCAACACTACTGG +AGCAGAAAAACCAAAGTTTCTACCAGATTTGTATGATTACAAGGAGAATAGATTCATCGAAATTGGAGTGACAAGAAGAG +AAGTCCACATATATTACCTTGAAAAGGCCAATAAAATTAAATCTGAGAACACACACATTCACATCTTCTCATTCACTGGG +GAGGAAATAGCCACAAAGGCAGACTACACTCTCGACGAGGAAAGCAGGGCTAGGATTAAAACCAGGCTATTTACCATAAG +ACAAGAAATGGCCAACAGAGGCCTCTGGGATTCCTTTCGTCAGTCCGAAAGAGGCGAAGAAACAATTGAAGAAAAATTTG +AAATCTCAGGAACTATGCGTAGGCTTGCCGACCAAAGTCTCCCACCGAAATTCTCCTGCCTTGAGAATTTTAGAGCCTAT +GTGGATGGATTCGAACCGAACGGCTGCATTGAGGGCAAGCTTTCTCAAATGTCCAAAGAAGTGAATGCCAAAATTGAACC +TTTTCTGAAGACAACACCAAGACCAATCAAACTTCCTAATGGACCTCCTTGTTATCAGCGGTCCAAATTCCTCCTGATGG +ATGCTTTGAAATTGAGCATTGAAGACCCAAGTCATGAAGGAGAAGGGATTCCATTATATGATGCGATCAAGTGCATAAAA +ACATTCTTTGGATGGAAAGAACCTTATATAGTCAAACCACACGAAAAGGGAATAAATTCAAATTACCTGCTGTCATGGAA +GCAAGTATTGTCAGAATTGCAGGACATTGAAAATGAGGAGAAGATCCCAAGGACTAAAAACATGAAGAAAACGAGTCAAC +TAAAGTGGGCTCTTGGTGAAAACATGGCACCAGAGAAAGTAGACTTTGACAACTGCAGAGACATAAGCGATTTGAAGCAA +TATGATAGTGACGAACCTGAATTAAGGTCACTTTCAAGCTGGATACAGAATGAGTTCAACAAGGCCTGCGAGCTAACTGA +TTCAATCTGGATAGAGCTCGATGAAATTGGAGAGGACGTAGCCCCAATTGAGTACATTGCAAGCATGAGGAGGAATTATT +TCACAGCAGAGGTGTCCCATTGTAGAGCCACTGAGTACATAATGAAGGGGGTATACATTAATACTGCCCTGCTCAATGCA +TCCTGTGCAGCAATGGACGATTTTCAACTAATTCCCATGATAAGCAAGTGCAGAACTAAAGAGGGAAGGCGAAAAACCAA +TTTATATGGATTCATCATAAAGGGAAGATCTCATTTAAGGAATGACACAGATGTGGTAAACTTTGTGAGCATGGAGTTTT +CTCTCACTGACCCGAGACTTGAGCCACATAAATGGGAGAAATACTGTGTCCTTGAGATAGGAGATATGTTACTAAGAAGT +GCCATAGGCCAAATTTCAAGGCCTATGTTCTTGTATGTGAGGACAAACGGAACATCAAAGGTCAAAATGAAATGGGGAAT +GGAGATGAGACGTTGCCTCCTTCAGTCACTCCAGCAGATCGAGAGCATGATTGAAGCCGAGTCCTCGATTAAAGAGAAAG +ACATGACCAAAGAGTTTTTTGAGAATAAATCAGAAGCATGGCCCATTGGGGAGTCCCCCAAGGGAGTGGAAGAAGGTTCC +ATTGGGAAAGTCTGTAGGACTCTATTGGCTAAGTCAGTGTTCAATAGCCTGTATGCATCACCACAATTGGAAGGATTTTC +AGCGGAGTCAAGAAAACTGCTTCTTGTTGTTCAGGCTCTTAGGGACAACCTCGAACCTGGGACCTTTGATCTCGGGGGGC +TATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTCAATGCATCTTGGTTCAACTCCTTCCTGACA +CATGCATTAAAATAGTTATGGCAGTGCTACTATTTGTTATCCGTACTGTCCAAAAAAGTACCTTGTTTCTACT +>NC_007366.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 4, complete sequence +AGCAAAAGCAGGGGATAATTCTATTAACCATGAAGACTATCATTGCTTTGAGCTACATTCTATGTCTGGTTTTCGCTCAA +AAACTTCCCGGAAATGACAACAGCACGGCAACGCTGTGCCTTGGGCACCATGCAGTACCAAACGGAACGATAGTGAAAAC +AATCACGAATGACCAAATTGAAGTCACTAATGCTACTGAACTGGTTCAGAGTTCCTCAACAGGTGGAATATGCGACAGTC +CTCATCAGATCCTTGATGGAGAAAACTGCACACTAATAGATGCTCTATTGGGAGACCCTCAGTGTGATGGCTTCCAAAAT +AAGAAATGGGACCTTTTTGTTGAACGCAGCAAAGCCTACAGCAACTGTTACCCTTATGATGTGCCGGATTATGCCTCCCT +TAGGTCACTAGTTGCCTCATCCGGCACACTGGAGTTTAACAATGAAAGCTTCAATTGGACTGGAGTCACTCAAAATGGAA +CAAGCTCTGCTTGCAAAAGGAGATCTAATAACAGTTTCTTTAGTAGATTGAATTGGTTGACCCACTTAAAATTCAAATAC +CCAGCATTGAACGTGACTATGCCAAACAATGAAAAATTTGACAAACTGTACATTTGGGGGGTTCACCACCCGGGTACGGA +CAATGACCAAATCAGCCTATATGCTCAAGCATCAGGAAGAATCACAGTCTCTACCAAAAGAAGCCAACAAACCGTAATCC +CGAGTATCGGATCTAGACCCAGGATAAGGGATGTCCCCAGCAGAATAAGCATCTATTGGACAATAGTAAAACCGGGAGAC +ATACTTTTGATTAACAGCACAGGGAATCTAATTGCTCCTCGGGGTTACTTCAAAATACGAAGTGGGAAAAGCTCAATAAT +GAGATCAGATGCACCCATTGGCAAATGCAATTCTGAATGCATCACTCCAAATGGAAGCATTCCCAATGACAAACCATTTC +AAAATGTAAACAGGATCACATATGGGGCCTGTCCCAGATATGTTAAGCAAAACACTCTGAAATTGGCAACAGGGATGCGA +AATGTACCAGAGAAACAAACTAGAGGCATATTTGGCGCAATCGCGGGTTTCATAGAAAATGGTTGGGAGGGAATGGTAGA +CGGTTGGTACGGTTTCAGGCATCAAAATTCTGAGGGAACAGGACAAGCAGCAGATCTCAAAAGCACTCAAGCAGCAATCA +ACCAAATCAATGGGAAGCTGAATAGGTTGATCGGGAAAACAAACGAGAAATTCCATCAGATTGAAAAAGAATTCTCAGAA +GTAGAAGGGAGAATTCAGGACCTCGAGAAATATGTTGAGGACACTAAAATAGATCTCTGGTCATACAACGCGGAGCTTCT +TGTGGCCCTGGAGAACCAACATACAATTGATCTAACTGACTCAGAAATGAACAAACTGTTTGAAAGAACAAAGAAGCAAC +TGAGGGAAAATGCTGAGGATATGGGCAATGGTTGTTTCAAAATATACCACAAATGTGACAATGCCTGCATAGGGTCAATC +AGAAATGGAACTTATGACCATGATGTATACAGAGATGAAGCATTAAACAACCGGTTCCAGATCAAAGGTGTTGAGTTGAA +GTCAGGATACAAAGATTGGATCCTATGGATTTCCTTTGCCATATCATGTTTTTTGCTTTGTGTTGCTTTGTTGGGGTTCA +TCATGTGGGCCTGCCAAAAAGGCAACATTAGGTGCAACATTTGCATTTGAGTGCATTAATTAAAAACACCCTTGTTTCTA +CT +>NC_007369.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 5, complete sequence +AGCAAAAGCAGGGTTAATAATCACTCACCGAGTGACATCAAAATCATGGCGTCCCAAGGCACCAAACGGTCTTATGAACA +GATGGAAACTGATGGGGATCGCCAGAATGCAACTGAGATTAGGGCATCCGTCGGGAAGATGATTGATGGAATTGGGAGAT +TCTACATCCAAATGTGCACTGAACTTAAACTCAGTGATCATGAAGGGCGGTTGATCCAGAACAGCTTGACAATAGAGAAA +ATGGTGCTCTCTGCTTTTGATGAAAGAAGGAATAAATACCTGGAAGAACACCCCAGCGCGGGGAAAGATCCCAAGAAAAC +TGGGGGGCCCATATACAGGAGAGTAGATGGAAAATGGATGAGGGAACTCGTCCTTTATGACAAAGAAGAGATAAGGCGAA +TCTGGCGCCAAGCCAACAATGGTGAGGATGCGACAGCTGGTCTAACTCACATAATGATCTGGCATTCCAATTTGAATGAT +GCAACATACCAGAGGACAAGAGCTCTTGTTCGAACTGGAATGGATCCCAGAATGTGCTCTCTGATGCAGGGCTCGACTCT +CCCTAGAAGGTCCGGAGCTGCAGGTGCTGCAGTCAAAGGAATCGGGACAATGGTGATGGAACTGATCAGAATGGTCAAAC +GGGGGATCAACGATCGAAATTTCTGGAGAGGTGAGAATGGGCGGAAAACAAGAAGTGCTTATGAGAGAATGTGCAACATT +CTTAAAGGAAAATTTCAAACAGCTGCACAAAGAGCAATGGTGGATCAAGTGAGAGAAAGTCGGAACCCAGGAAATGCTGA +GATCGAAGATCTCATATTTTTGGCAAGATCTGCATTGATATTGAGAGGGTCAGTTGCTCACAAATCTTGCCTACCTGCCT +GTGCGTATGGACCTGCAGTATCCAGTGGGTACGACTTCGAAAAAGAGGGATATTCCTTGGTGGGAATAGACCCTTTCAAA +CTACTTCAAAATAGCCAAATATACAGCCTAATCAGACCTAACGAGAATCCAGCACACAAGAGTCAGCTGGTGTGGATGGC +ATGCCATTCTGCTGCATTTGAAGATTTAAGATTGTTAAGCTTCATCAGAGGGACAAAAGTATCTCCGCGGGGGAAACTGT +CAACTAGAGGAGTACAAATTGCTTCAAATGAGAACATGGATAATATGGGATCGAGCACTCTTGAACTGAGAAGCGGGTAC +TGGGCCATAAGGACCAGGAGTGGAGGAAACACTAATCAACAGAGGGCCTCCGCAGGCCAAACCAGTGTGCAACCTACGTT +TTCTGTACAAAGAAACCTCCCATTTGAAAAGTCAACCATCATGGCAGCATTCACTGGAAATACGGAGGGAAGGACTTCAG +ACATGAGGGCAGAAATCATAAGAATGATGGAAGGTGCAAAACCAGAAGAAGTGTCATTCCGGGGGAGGGGAGTTTTCGAG +CTCTCAGACGAGAAGGCAACGAACCCGATCGTGCCCTCTTTTGATATGAGTAATGAAGGATCTTATTTCTTCGGAGACAA +TGCAGAAGAGTACGACAATTAAGGAAAAAATACCCTTGTTTCTACT +>NC_007368.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 6, complete sequence +AGCAAAAGCAGGAGTAAAGATGAATCCAAATCAAAAGATAATAACGATTGGCTCTGTTTCTCTCACCATTTCCACAATAT +GCTTCTTCATGCAAATTGCCATCCTGATAACCACTGTAACATTGCATTTCAAGCAATATGAATTCAACTCCCCCCCAAAC +AACCAAGTGATGCTGTGTGAACCAACAATAATAGAAAGAAACATAACAGAGATAGTGTATCTGACCAACACCACCATAGA +GAAGGAAATGTGCCCCAAACTAGCAGAATACAGAAATTGGTCAAAGCCGCAATGTGACATTACAGGATTTGCACCTTTTT +CTAAGGACAATTCGATTAGGCTTTCCGCTGGTGGGGACATCTGGGTGACAAGAGAACCTTATGTGTCATGCGACCCTGAC +AAGTGTTACCAATTTGCCCTTGGACAGGGAACAACACTAAACAACGTGCATTCAAATGACACAGTACATGATAGGACCCC +TTATCGGACCCTATTGATGAATGAATTAGGTGTTCCATTTCATCTGGGGACCAAGCAAGTGTGCATAGCATGGTCCAGCT +CAAGTTGTCACGATGGAAAAGCATGGCTGCATGTTTGTGTAACGGGGGATGATAAAAATGCAACTGCTAGCTTCATTTAC +AATGGGAGGCTTGTAGATAGTATTGTTTCATGGTCCAAAAAAATCCTCAGGACCCAGGAGTCAGAATGCGTTTGTATCAA +TGGAACTTGTACAGTAGTAATGACTGATGGGAGTGCTTCAGGAAAAGCTGATACTAAAATACTATTCATTGAGGAGGGGA +AAATCATTCATACTAGCACATTGTCAGGAAGTGCTCAGCATGTCGAGGAGTGCTCCTGCTATCCTCGATATCCTGGTGTC +AGATGTGTCTGCAGAGACAACTGGAAAGGCTCCAATAGGCCCATCGTAGATATAAACATAAAGGATTATAGCATTGTTTC +CAGTTATGTGTGCTCAGGGCTTGTTGGAGACACACCCAGAAAAAACGACAGCTCCAGCAGTAGCCATTGCTTGGATCCTA +ACAATGAAGAAGGTGGTCATGGAGTGAAAGGCTGGGCCTTTGATGATGGAAATGACGTGTGGATGGGAAGAACGATCAGC +GAGAAGTTACGCTCAGGATATGAAACCTTCAAAGTCATTGAAGGCTGGTCCAAACCTAATTCCAAATTGCAGATAAATAG +GCAAGTCATAGTTGACAGAGGTAATAGGTCCGGTTATTCTGGTATTTTCTCTGTTGAAGGCAAAAGCTGCATCAATCGGT +GCTTTTATGTGGAGTTGATAAGGGGAAGAAAAGAGGAAACTGAAGTCTTGTGGACCTCAAACAGTATTGTTGTGTTTTGT +GGCACCTCAGGTACATATGGAACAGGCTCATGGCCTGATGGGGCGGACATCAATCTCATGCCTATATAAGCTTTCGCAAT +TTTAGAAAAAAACTCCTTGTTTCTACT +>NC_007367.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 7, complete sequence +AGCAAAAGCAGGTAGATATTGAAAGATGAGCCTTCTAACCGAGGTCGAAACGTATGTTCTCTCTATCGTTCCATCAGGCC +CCCTCAAAGCCGAGATCGCGCAGAGACTTGAAGATGTCTTTGCTGGGAAAAACACAGATCTTGAGGCTCTCATGGAATGG +CTAAAGACAAGACCAATTCTGTCACCTCTGACTAAGGGGATTTTGGGGTTTGTGTTCACGCTCACCGTGCCCAGTGAGCG +AGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTCAATGGGAATGGAGATCCAAATAACATGGACAAAGCAGTTAAAC +TGTATAGGAAACTTAAGAGGGAGATAACGTTCCATGGGGCCAAAGAAATAGCTCTCAGTTATTCTGCTGGTGCACTTGCC +AGTTGCATGGGCCTCATATACAATAGGATGGGGGCTGTAACCACTGAAGTGGCATTTGGCCTGGTATGTGCAACATGTGA +ACAGATTGCTGACTCCCAGCACAGGTCTCATAGGCAAATGGTGGCAACAACCAATCCATTAATAAAACATGAGAACAGAA +TGGTTTTGGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCTGGATCAAGTGAGCAGGCAGCGGAGGCCATGGAAATT +GCTAGTCAGGCCAGGCAAATGGTGCAGGCAATGAGAGCCGTTGGGACTCATCCTAGCTCCAGTACTGGTCTAAGAGATGA +TCTTCTTGAAAATTTGCAGACCTATCAGAAACGAATGGGGGTGCAGATGCAACGATTCAAGTGACCCGCTTGTTGTTGCC +GCGAGTATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTTTTCAAATGCGTCTATCGACTCTTCAA +ACACGGCCTTAAAAGAGGCCCTTCTACGGAAGGAGTACCTGAGTCTATGAGGGAAGAATATCGAAAGGAACAGCAGAATG +CTGTGGATGCTGACGACAGTCATTTTGTCAGCATAGAGTTGGAGTAAAAAACTACCTTGTTTCTACT +>NC_007370.1 Influenza A virus (A/New York/392/2004(H3N2)) segment 8, complete sequence +AGCAAAAGCAGGGTGACAAAGACATAATGGATTCCAACACTGTGTCAAGTTTCCAGGTAGATTGCTTTCTTTGGCATATC +CGGAAACAAGTTGTAGACCAAGAACTGAGTGATGCCCCATTCCTTGATCGGCTTCGCCGAGATCAGAGGTCCCTAAGGGG +AAGAGGCAATACTCTCGGTCTAGACATCAAAGCAGCCACCCATGTTGGAAAGCAAATTGTAGAAAAGATTCTGAAAGAAG +AATCTGATGAGGCACTTAAAATGACCATGGTCTCCACACCTGCTTCGCGATACATAACTGACATGACTATTGAGGAATTG +TCAAGAAACTGGTTCATGCTAATGCCCAAGCAGAAAGTGGAAGGACCTCTTTGCATCAGAATGGACCAGGCAATCATGGA +GAAAAACATCATGTTGAAAGCGAATTTCAGTGTGATTTTTGACCGACTAGAGACCATAGTATTACTAAGGGCTTTCACCG +AAGAGGGAGCAATTGTTGGCGAAATCTCACCATTGCCTTCTTTTCCAGGACATACTATTGAGGATGTCAAAAATGCAATT +GGGGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTAAAAATCTACAGAGATTCGCTTGGAGAAG +CAGTAATGAGAATGGGGGACCTCCACTTACTCCAAAACAGAAACGGAAAATGGCGAGAACAGCTAGGTCAAAAGTTTGAA +GAGATAAGATGGCTGATTGAAGAAGTGAGACACAGACTAAAAACAACTGAAAATAGCTTTGAACAAATAACATTCATGCA +AGCATTACAACTGCTGTTTGAAGTGGAACAGGAGATAAGAACTTTCTCATTTCAGCTTATTTAATGATAAAAAACACCCT +TGTTTCTACT +>NC_002023.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 1, complete sequence +AGCGAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAACTAAGAAATCTAATGTCGCAGTCTCGCACCCGCGA +GATACTCACAAAAACCACCGTGGACCATATGGCCATAATCAAGAAGTACACATCAGGAAGACAGGAGAAGAACCCAGCAC +TTAGGATGAAATGGATGATGGCAATGAAATATCCAATTACAGCAGACAAGAGGATAACGGAAATGATTCCTGAGAGAAAT +GAGCAAGGACAAACTTTATGGAGTAAAATGAATGATGCCGGATCAGACCGAGTGATGGTATCACCTCTGGCTGTGACATG +GTGGAATAGGAATGGACCAATGACAAATACAGTTCATTATCCAAAAATCTACAAAACTTATTTTGAAAGAGTCGAAAGGC +TAAAGCATGGAACCTTTGGCCCTGTCCATTTTAGAAACCAAGTCAAAATACGTCGGAGAGTTGACATAAATCCTGGTCAT +GCAGATCTCAGTGCCAAGGAGGCACAGGATGTAATCATGGAAGTTGTTTTCCCTAACGAAGTGGGAGCCAGGATACTAAC +ATCGGAATCGCAACTAACGATAACCAAAGAGAAGAAAGAAGAACTCCAGGATTGCAAAATTTCTCCTTTGATGGTTGCAT +ACATGTTGGAGAGAGAACTGGTCCGCAAAACGAGATTCCTCCCAGTGGCTGGTGGAACAAGCAGTGTGTACATTGAAGTG +TTGCATTTGACTCAAGGAACATGCTGGGAACAGATGTATACTCCAGGAGGGGAAGTGAAGAATGATGATGTTGATCAAAG +CTTGATTATTGCTGCTAGGAACATAGTGAGAAGAGCTGCAGTATCAGCAGACCCACTAGCATCTTTATTGGAGATGTGCC +ACAGCACACAGATTGGTGGAATTAGGATGGTAGACATCCTTAAGCAGAACCCAACAGAAGAGCAAGCCGTGGGTATATGC +AAGGCTGCAATGGGACTGAGAATTAGCTCATCCTTCAGTTTTGGTGGATTCACATTTAAGAGAACAAGCGGATCATCAGT +CAAGAGAGAGGAAGAGGTGCTTACGGGCAATCTTCAAACATTGAAGATAAGAGTGCATGAGGGATATGAAGAGTTCACAA +TGGTTGGGAGAAGAGCAACAGCCATACTCAGAAAAGCAACCAGGAGATTGATTCAGCTGATAGTGAGTGGGAGAGACGAA +CAGTCGATTGCCGAAGCAATAATTGTGGCCATGGTATTTTCACAAGAGGATTGTATGATAAAAGCAGTTAGAGGTGATCT +GAATTTCGTCAATAGGGCGAATCAGCGACTGAATCCTATGCATCAACTTTTAAGACATTTTCAGAAGGATGCGAAAGTGC +TTTTTCAAAATTGGGGAGTTGAACCTATCGACAATGTGATGGGAATGATTGGGATATTGCCCGACATGACTCCAAGCATC +GAGATGTCAATGAGAGGAGTGAGAATCAGCAAAATGGGTGTAGATGAGTACTCCAGCACGGAGAGGGTAGTGGTGAGCAT +TGACCGGTTCTTGAGAGTCCGGGACCAACGAGGAAATGTACTACTGTCTCCCGAGGAGGTCAGTGAAACACAGGGAACAG +AGAAACTGACAATAACTTACTCATCGTCAATGATGTGGGAGATTAATGGTCCTGAATCAGTGTTGGTCAATACCTATCAA +TGGATCATCAGAAACTGGGAAACTGTTAAAATTCAGTGGTCCCAGAACCCTACAATGCTATACAATAAAATGGAATTTGA +ACCATTTCAGTCTTTAGTACCTAAGGCCATTAGAGGCCAATACAGTGGGTTTGTGAGAACTCTGTTCCAACAAATGAGGG +ATGTGCTTGGGACATTTGATACCGCACAGATAATAAAACTTCTTCCCTTCGCAGCCGCTCCACCAAAGCAAAGTAGAATG +CAGTTCTCCTCATTTACTGTGAATGTGAGGGGATCAGGAATGAGAATACTTGTAAGGGGCAATTCTCCTGTATTCAACTA +CAACAAGGCCACGAAGAGACTCACAGTTCTCGGAAAGGATGCTGGCACTTTAACCGAAGACCCAGATGAAGGCACAGCTG +GAGTGGAGTCCGCTGTTCTGAGGGGATTCCTCATTCTGGGCAAAGAAGACAGGAGATATGGGCCAGCATTAAGCATCAAT +GAACTGAGCAACCTTGCGAAAGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGAGACGTGGTGTTGGTAATGAAACGAAA +ACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAGTGTCGAATAGTTT +AAAAACGACCTTGTTTCTACT +>NC_002021.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 2, complete sequence +AGCGAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACCTTACTTTTCTTAAAAGTGCCAGCACAAAATGCTATAAG +CACAACTTTCCCTTATACCGGAGACCCTCCTTACAGCCATGGGACAGGAACAGGATACACCATGGATACTGTCAACAGGA +CACATCAGTACTCAGAAAAGGCAAGATGGACAACAAACACCGAAACTGGAGCACCGCAACTCAACCCGATTGATGGGCCA +CTGCCAGAAGACAATGAACCAAGTGGTTATGCCCAAACAGATTGTGTATTGGAAGCAATGGCTTTCCTTGAGGAATCCCA +TCCTGGTATTTTTGAAAACTCGTGTATTGAAACGATGGAGGTTGTTCAGCAAACACGAGTAGACAAGCTGACACAAGGCC +GACAGACCTATGACTGGACTTTAAATAGAAACCAGCCTGCTGCAACAGCATTGGCCAACACAATAGAAGTGTTCAGATCA +AATGGCCTCACGGCCAATGAGTCTGGAAGGCTCATAGACTTCCTTAAGGATGTAATGGAGTCAATGAAAAAAGAAGAAAT +GGGGATCACAACTCATTTTCAGAGAAAGAGACGGGTGAGAGACAATATGACTAAGAAAATGATAACACAGAGAACAATAG +GTAAAAGGAAACAGAGATTGAACAAAAGGAGTTATCTAATTAGAGCATTGACCCTGAACACAATGACCAAAGATGCTGAG +AGAGGGAAGCTAAAACGGAGAGCAATTGCAACCCCAGGGATGCAAATAAGGGGGTTTGTATACTTTGTTGAGACACTGGC +AAGGAGTATATGTGAGAAACTTGAACAATCAGGGTTGCCAGTTGGAGGCAATGAGAAGAAAGCAAAGTTGGCAAATGTTG +TAAGGAAGATGATGACCAATTCTCAGGACACCGAACTTTCTTTGACCATCACTGGAGATAACACCAAATGGAACGAAAAT +CAGAATCCTCGGATGTTTTTGGCCATGATCACATATATGACCAGAAATCAGCCCGAATGGTTCAGAAATGTTCTAAGTAT +TGCTCCAATAATGTTCTCAAACAAAATGGCGAGACTGGGAAAAGGGTATATGTTTGAGAGCAAGAGTATGAAACTTAGAA +CTCAAATACCTGCAGAAATGCTAGCAAGCATTGATTTGAAATATTTCAATGATTCAACAAGAAAGAAGATTGAAAAAATC +CGACCGCTCTTAATAGAGGGGACTGCATCATTGAGCCCTGGAATGATGATGGGCATGTTCAATATGTTAAGCACTGTATT +AGGCGTCTCCATCCTGAATCTTGGACAAAAGAGATACACCAAGACTACTTACTGGTGGGATGGTCTTCAATCCTCTGACG +ATTTTGCTCTGATTGTGAATGCACCCAATCATGAAGGGATTCAAGCCGGAGTCGACAGGTTTTATCGAACCTGTAAGCTA +CATGGAATCAATATGAGCAAGAAAAAGTCTTACATAAACAGAACAGGTACATTTGAATTCACAAGTTTTTTCTATCGTTA +TGGGTTTGTTGCCAATTTCAGCATGGAGCTTCCCAGTTTTGGTGTGTCTGGGAGCAACGAGTCAGCGGACATGAGTATTG +GAGTTACTGTCATCAAAAACAATATGATAAACAATGATCTTGGTCCAGCAACAGCTCAAATGGCCCTTCAGTTGTTCATC +AAAGATTACAGGTACACGTACCGATGCCATAGAGGTGACACACAAATACAAACCCGAAGATCATTTGAAATAAAGAAACT +GTGGGAGCAAACCCGTTCCAAAGCTGGACTGCTGGTCTCCGACGGAGGCCCAAATTTATACAACATTAGAAATCTCCACA +TTCCTGAAGTCTGCCTAAAATGGGAATTGATGGATGAGGATTACCAGGGGCGTTTATGCAACCCACTGAACCCATTTGTC +AGCCATAAAGAAATTGAATCAATGAACAATGCAGTGATGATGCCAGCACATGGTCCAGCCAAAAACATGGAGTATGATGC +TGTTGCAACAACACACTCCTGGATCCCCAAAAGAAATCGATCCATCTTGAATACAAGTCAAAGAGGAGTACTTGAAGATG +AACAAATGTACCAAAGGTGCTGCAATTTATTTGAAAAATTCTTCCCCAGCAGTTCATACAGAAGACCAGTCGGGATATCC +AGTATGGTGGAGGCTATGGTTTCCAGAGCCCGAATTGATGCACGGATTGATTTCGAATCTGGAAGGATAAAGAAAGAAGA +GTTCACTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATG +AAAAAATGCCTTGTTCCTACT +>NC_002022.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 3, complete sequence +AGCGAAAGCAGGTACTGATCCAAAATGGAAGATTTTGTGCGACAATGCTTCAATCCGATGATTGTCGAGCTTGCGGAAAA +AACAATGAAAGAGTATGGGGAGGACCTGAAAATCGAAACAAACAAATTTGCAGCAATATGCACTCACTTGGAAGTATGCT +TCATGTATTCAGATTTCCACTTCATCAATGAGCAAGGCGAGTCAATAATCGTAGAACTTGGTGATCCTAATGCACTTTTG +AAGCACAGATTTGAAATAATCGAGGGAAGAGATCGCACAATGGCCTGGACAGTAGTAAACAGTATTTGCAACACTACAGG +GGCTGAGAAACCAAAGTTTCTACCAGATTTGTATGATTACAAGGAAAATAGATTCATCGAAATTGGAGTAACAAGGAGAG +AAGTTCACATATACTATCTGGAAAAGGCCAATAAAATTAAATCTGAGAAAACACACATCCACATTTTCTCGTTCACTGGG +GAAGAAATGGCCACAAAGGCCGACTACACTCTCGATGAAGAAAGCAGGGCTAGGATCAAAACCAGGCTATTCACCATAAG +ACAAGAAATGGCCAGCAGAGGCCTCTGGGATTCCTTTCGTCAGTCCGAGAGAGGAGAAGAGACAATTGAAGAAAGGTTTG +AAATCACAGGAACAATGCGCAAGCTTGCCGACCAAAGTCTCCCGCCGAACTTCTCCAGCCTTGAAAATTTTAGAGCCTAT +GTGGATGGATTCGAACCGAACGGCTACATTGAGGGCAAGCTGTCTCAAATGTCCAAAGAAGTAAATGCTAGAATTGAACC +TTTTTTGAAAACAACACCACGACCACTTAGACTTCCGAATGGGCCTCCCTGTTCTCAGCGGTCCAAATTCCTGCTGATGG +ATGCCTTAAAATTAAGCATTGAGGACCCAAGTCATGAAGGAGAGGGAATACCGCTATATGATGCAATCAAATGCATGAGA +ACATTCTTTGGATGGAAGGAACCCAATGTTGTTAAACCACACGAAAAGGGAATAAATCCAAATTATCTTCTGTCATGGAA +GCAAGTACTGGCAGAACTGCAGGACATTGAGAATGAGGAGAAAATTCCAAAGACTAAAAATATGAAAAAAACAAGTCAGC +TAAAGTGGGCACTTGGTGAGAACATGGCACCAGAAAAGGTAGACTTTGACGACTGTAAAGATGTAGGTGATTTGAAGCAA +TATGATAGTGATGAACCAGAATTGAGGTCGCTTGCAAGTTGGATTCAGAATGAGTTCAACAAGGCATGCGAACTGACAGA +TTCAAGCTGGATAGAGCTTGATGAGATTGGAGAAGATGTGGCTCCAATTGAACACATTGCAAGCATGAGAAGGAATTATT +TCACATCAGAGGTGTCTCACTGCAGAGCCACAGAATACATAATGAAGGGGGTGTACATCAATACTGCCTTACTTAATGCA +TCTTGTGCAGCAATGGATGATTTCCAATTAATTCCAATGATAAGCAAGTGTAGAACTAAGGAGGGAAGGCGAAAGACCAA +CTTGTATGGTTTCATCATAAAAGGAAGATCCCACTTAAGGAATGACACCGACGTGGTAAACTTTGTGAGCATGGAGTTTT +CTCTCACTGACCCAAGACTTGAACCACACAAATGGGAGAAGTACTGTGTTCTTGAGATAGGAGATATGCTTCTAAGAAGT +GCCATAGGCCAGGTTTCAAGGCCCATGTTCTTGTATGTGAGGACAAATGGAACCTCAAAAATTAAAATGAAATGGGGAAT +GGAGATGAGGCGTTGTCTCCTCCAGTCACTTCAACAAATTGAGAGTATGATTGAAGCTGAGTCCTCTGTCAAAGAGAAAG +ACATGACCAAAGAGTTCTTTGAGAACAAATCAGAAACATGGCCCATTGGAGAGTCTCCCAAAGGAGTGGAGGAAAGTTCC +ATTGGGAAGGTCTGCAGGACTTTATTAGCAAAGTCGGTATTTAACAGCTTGTATGCATCTCCACAACTAGAAGGATTTTC +AGCTGAATCAAGAAAACTGCTTCTTATCGTTCAGGCTCTTAGGGACAATCTGGAACCTGGGACCTTTGATCTTGGGGGGC +TATATGAAGCAATTGAGGAGTGCCTAATTAATGATCCCTGGGTTTTGCTTAATGCTTCTTGGTTCAACTCCTTCCTTACA +CATGCATTGAGTTAGTTGTGGCAGTGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>NC_002017.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 4, complete sequence +AGCAAAAGCAGGGGAAAATAAAAACAACCAAAATGAAGGCAAACCTACTGGTCCTGTTATGTGCACTTGCAGCTGCAGAT +GCAGACACAATATGTATAGGCTACCATGCGAACAATTCAACCGACACTGTTGACACAGTGCTCGAGAAGAATGTGACAGT +GACACACTCTGTTAACCTGCTCGAAGACAGCCACAACGGAAAACTATGTAGATTAAAAGGAATAGCCCCACTACAATTGG +GGAAATGTAACATCGCCGGATGGCTCTTGGGAAACCCAGAATGCGACCCACTGCTTCCAGTGAGATCATGGTCCTACATT +GTAGAAACACCAAACTCTGAGAATGGAATATGTTATCCAGGAGATTTCATCGACTATGAGGAGCTGAGGGAGCAATTGAG +CTCAGTGTCATCATTCGAAAGATTCGAAATATTTCCCAAAGAAAGCTCATGGCCCAACCACAACACAACCAAAGGAGTAA +CGGCAGCATGCTCCCATGCGGGGAAAAGCAGTTTTTACAGAAATTTGCTATGGCTGACGGAGAAGGAGGGCTCATACCCA +AAGCTGAAAAATTCTTATGTGAACAAGAAAGGGAAAGAAGTCCTTGTACTGTGGGGTATTCATCACCCGTCTAACAGTAA +GGATCAACAGAATATCTATCAGAATGAAAATGCTTATGTCTCTGTAGTGACTTCAAATTATAACAGGAGATTTACCCCGG +AAATAGCAGAAAGACCCAAAGTAAGAGATCAAGCTGGGAGGATGAACTATTACTGGACCTTGCTAAAACCCGGAGACACA +ATAATATTTGAGGCAAATGGAAATCTAATAGCACCAAGGTATGCTTTCGCACTGAGTAGAGGCTTTGGGTCCGGCATCAT +CACCTCAAACGCATCAATGCATGAGTGTAACACGAAGTGTCAAACACCCCTGGGAGCTATAAACAGCAGTCTCCCTTTCC +AGAATATACACCCAGTCACAATAGGAGAGTGCCCAAAATACGTCAGGAGTGCCAAATTGAGGATGGTTACAGGACTAAGG +AACATTCCGTCCATTCAATCCAGAGGTCTATTTGGAGCCATTGCCGGTTTTATTGAAGGGGGATGGACTGGAATGATAGA +TGGATGGTACGGTTATCATCATCAGAATGAACAGGGATCAGGCTATGCAGCGGATCAAAAAAGCACACAAAATGCCATTA +ACGGGATTACAAACAAGGTGAACTCTGTTATCGAGAAAATGAACATTCAATTCACAGCTGTGGGTAAAGAATTCAACAAA +TTAGAAAAAAGGATGGAAAATTTAAATAAAAAAGTTGATGATGGATTTCTGGACATTTGGACATATAATGCAGAATTGTT +AGTTCTACTGGAAAATGAAAGGACTCTGGATTTCCATGACTCAAATGTGAAGAATCTGTATGAGAAAGTAAAAAGCCAAT +TAAAGAATAATGCCAAAGAAATCGGAAATGGATGTTTTGAGTTCTACCACAAGTGTGACAATGAATGCATGGAAAGTGTA +AGAAATGGGACTTATGATTATCCCAAATATTCAGAAGAGTCAAAGTTGAACAGGGAAAAGGTAGATGGAGTGAAATTGGA +ATCAATGGGGATCTATCAGATTCTGGCGATCTACTCAACTGTCGCCAGTTCACTGGTGCTTTTGGTCTCCCTGGGGGCAA +TCAGTTTCTGGATGTGTTCTAATGGATCTTTGCAGTGCAGAATATGCATCTGAGATTAGAATTTCAGAAATATGAGGAAA +AACACCCTTGTTTCTACT +>NC_002019.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 5, complete sequence +AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCAAAATCATGGCGTCCCAAGGCACCAAACGGTCTTACGAACA +GATGGAGACTGATGGAGAACGCCAGAATGCCACTGAAATCAGAGCATCCGTCGGAAAAATGATTGGTGGAATTGGACGAT +TCTACATCCAAATGTGCACAGAACTTAAACTCAGTGATTATGAGGGACGGTTGATCCAAAACAGCTTAACAATAGAGAGA +ATGGTGCTCTCTGCTTTTGACGAAAGGAGAAATAAATACCTGGAAGAACATCCCAGTGCGGGGAAGGATCCTAAGAAAAC +TGGAGGACCTATATACAGAAGAGTAAACGGAAAGTGGATGAGAGAACTCATCCTTTATGACAAAGAAGAAATAAGGCGAA +TCTGGCGCCAAGCTAATAATGGTGACGATGCAACGGCTGGTCTGACTCACATGATGATCTGGCATTCCAATTTGAATGAT +GCAACTTATCAGAGGACAAGGGCTCTTGTTCGCACCGGAATGGATCCCAGGATGTGCTCTCTGATGCAAGGTTCAACTCT +CCCTAGGAGGTCTGGAGCCGCAGGTGCTGCAGTCAAAGGAGTTGGAACAATGGTGATGGAATTGGTCAGGATGATCAAAC +GTGGGATCAATGATCGGAACTTCTGGAGGGGTGAGAATGGACGAAAAACAAGAATTGCTTATGAAAGAATGTGCAACATT +CTCAAAGGGAAATTTCAAACTGCTGCACAAAAAGCAATGATGGATCAAGTGAGAGAGAGCCGGGACCCAGGGAATGCTGA +GTTCGAAGATCTCACTTTTCTAGCACGGTCTGCACTCATATTGAGAGGGTCGGTTGCTCACAAGTCCTGCCTGCCTGCCT +GTGTGTATGGACCTGCCGTAGCCAGTGGGTACGACTTTGAAAGAGAGGGATACTCTCTAGTCGGAATAGACCCTTTCAGA +CTGCTTCAAAACAGCCAAGTGTACAGCCTAATCAGACCAAATGAGAATCCAGCACACAAGAGTCAACTGGTGTGGATGGC +ATGCCATTCTGCCGCATTTGAAGATCTAAGAGTATTGAGCTTCATCAAAGGGACGAAGGTGGTCCCAAGAGGGAAGCTTT +CCACTAGAGGAGTTCAAATTGCTTCCAATGAAAATATGGAGACTATGGAATCAAGTACACTTGAACTGAGAAGCAGGTAC +TGGGCCATAAGGACCAGAAGTGGAGGAAACACCAATCAACAGAGGGCATCTGCGGGCCAAATCAGCATACAACCTACGTT +CTCAGTACAGAGAAATCTCCCTTTTGACAGAACAACCGTTATGGCAGCATTCACTGGGAATACAGAGGGGAGAACATCTG +ACATGAGGACCGAAATCATAAGGATGATGGAAAGTGCAAGACCAGAAGATGTGTCTTTCCAGGGGCGGGGAGTCTTCGAG +CTCTCGGACGAAAAGGCAGCGAGCCCGATCGTGCCTTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAA +TGCAGAGGAGTACGACAATTAAAGAAAAATACCCTTGTTTCTACT +>NC_002018.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 6, complete sequence +AGCGAAAGCAGGGGTTTAAAATGAATCCAAATCAGAAAATAATAACCATTGGATCAATCTGTCTGGTAGTCGGACTAATT +AGCCTAATATTGCAAATAGGGAATATAATCTCAATATGGATTAGCCATTCAATTCAAACTGGAAGTCAAAACCATACTGG +AATATGCAACCAAAACATCATTACCTATAAAAATAGCACCTGGGTAAAGGACACAACTTCAGTGATATTAACCGGCAATT +CATCTCTTTGTCCCATCCGTGGGTGGGCTATATACAGCAAAGACAATAGCATAAGAATTGGTTCCAAAGGAGACGTTTTT +GTCATAAGAGAGCCCTTTATTTCATGTTCTCACTTGGAATGCAGGACCTTTTTTCTGACCCAAGGTGCCTTACTGAATGA +CAGGCATTCAAATGGGACTGTTAAGGACAGAAGCCCTTATAGGGCCTTAATGAGCTGCCCTGTCGGTGAAGCTCCGTCCC +CGTACAATTCAAGATTTGAATCGGTTGCTTGGTCAGCAAGTGCATGTCATGATGGCATGGGCTGGCTAACAATCGGAATT +TCAGGTCCAGATAATGGAGCAGTGGCTGTATTAAAATACAACGGCATAATAACTGAAACCATAAAAAGTTGGAGGAAGAA +AATATTGAGGACACAAGAGTCTGAATGTGCCTGTGTAAATGGTTCATGTTTTACTATAATGACTGATGGCCCGAGTGATG +GGCTGGCCTCGTACAAAATTTTCAAGATCGAAAAGGGGAAGGTTACTAAATCAATAGAGTTGAATGCACCTAATTCTCAC +TATGAGGAATGTTCCTGTTACCCTGATACCGGCAAAGTGATGTGTGTGTGCAGAGACAATTGGCATGGTTCGAACCGGCC +ATGGGTGTCTTTCGATCAAAACCTGGATTATCAAATAGGATACATCTGCAGTGGGGTTTTCGGTGACAACCCGCGTCCCA +AAGATGGAACAGGCAGCTGTGGTCCAGTGTATGTTGATGGAGCAAACGGAGTAAAGGGATTTTCATATAGGTATGGTAAT +GGTGTTTGGATAGGAAGGACCAAAAGTCACAGTTCCAGACATGGGTTTGAGATGATTTGGGATCCTAATGGATGGACAGA +GACTGATAGTAAGTTCTCTGTGAGGCAAGATGTTGTGGCAATGACTGATTGGTCAGGGTATAGCGGGAGTTTCGTTCAAC +ATCCTGAGCTAACAGGGCTAGACTGTATAAGGCCGTGCTTCTGGGTTGAATTAATCAGGGGACGACCTAAAGAAAAAACA +ATCTGGACTAGTGCGAGCAGCATTTCTTTTTGTGGCGTGAATAGTGATACTGTAGATTGGTCTTGGCCAGACGGTGCTGA +GTTGCCATTCACCATTGACAAGTAGTCTGTTCAAAAAACTCCTTGTTTCTACT +>NC_002016.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 7, complete sequence +AGCGAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCGTCAGGCC +CCCTCAAAGCCGAGATCGCACAGAGACTTGAAGATGTCTTTGCAGGGAAGAACACCGATCTTGAGGTTCTCATGGAATGG +CTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCG +AGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAACGGGGATCCAAATAACATGGACAAAGCAGTTAAAC +TGTATAGGAAGCTCAAGAGGGAGATAACATTCCATGGGGCCAAAGAAATCTCACTCAGTTATTCTGCTGGTGCACTTGCC +AGTTGTATGGGCCTCATATACAACAGGATGGGGGCTGTGACCACTGAAGTGGCATTTGGCCTGGTATGTGCAACCTGTGA +ACAGATTGCTGACTCCCAGCATCGGTCTCATAGGCAAATGGTGACAACAACCAACCCACTAATCAGACATGAGAACAGAA +TGGTTTTAGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCTGGATCGAGTGAGCAAGCAGCAGAGGCCATGGAGGTT +GCTAGTCAGGCTAGGCAAATGGTGCAAGCGATGAGAACCATTGGGACTCATCCTAGCTCCAGTGCTGGTCTGAAAAATGA +TCTTCTTGAAAATTTGCAGGCCTATCAGAAACGAATGGGGGTGCAGATGCAACGGTTCAAGTGATCCTCTCGCTATTGCC +GCAAATATCATTGGGATCTTGCACTTGATATTGTGGATTCTTGATCGTCTTTTTTTCAAATGCATTTACCGTCGCTTTAA +ATACGGACTGAAAGGAGGGCCTTCTACGGAAGGAGTGCCAAAGTCTATGAGGGAAGAATATCGAAAGGAACAGCAGAGTG +CTGTGGATGCTGACGATGGTCATTTTGTCAGCATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>NC_002020.1 Influenza A virus (A/Puerto Rico/8/1934(H1N1)) segment 8, complete sequence +AGCAAAAGCAGGGTGACAAAGACATAATGGATCCAAACACTGTGTCAAGCTTTCAGGTAGATTGCTTTCTTTGGCATGTC +CGCAAACGAGTTGCAGACCAAGAACTAGGTGATGCCCCATTCCTTGATCGGCTTCGCCGAGATCAGAAATCCCTAAGAGG +AAGGGGCAGCACTCTTGGTCTGGACATCGAGACAGCCACACGTGCTGGAAAGCAGATAGTGGAGCGGATTCTGAAAGAAG +AATCCGATGAGGCACTTAAAATGACCATGGCCTCTGTACCTGCGTCGCGTTACCTAACCGACATGACTCTTGAGGAAATG +TCAAGGGAATGGTCCATGCTCATACCCAAGCAGAAAGTGGCAGGCCCTCTTTGTATCAGAATGGACCAGGCGATCATGGA +TAAAAACATCATACTGAAAGCGAACTTCAGTGTGATTTTTGACCGGCTGGAGACTCTAATATTGCTAAGGGCTTTCACCG +AAGAGGGAGCAATTGTTGGCGAAATTTCACCATTGCCTTCTCTTCCAGGACATACTGCTGAGGATGTCAAAAATGCAGTT +GGAGTCCTCATCGGAGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCGCTTGGAGAAG +CAGTAATGAGAATGGGAGACCTCCACTCACTCCAAAACAGAAACGAGAAATGGCGGGAACAATTAGGTCAGAAGTTTGAA +GAAATAAGATGGTTGATTGAAGAAGTGAGACACAAACTGAAGGTAACAGAGAATAGTTTTGAGCAAATAACATTTATGCA +AGCCTTACATCTATTGCTTGAAGTGGAGCAAGAGATAAGAACTTTCTCATTTCAGCTTATTTAATAATAAAAAACACCCT +TGTTTCTACT +>NC_007378.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 1, complete sequence +AGCAAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAACTACGGAATCTGATGTCGCAGTCTCGCACTCGCGA +GATACTAACAAAAACCACAGTGGACCATATGGCCATAATTAAGAAGTACACATCAGGGAGACAGGAAAAGAACCCGTCAC +TTAGGATGAAATGGATGATGGCAATGAAATATCCAATTACAGCTGACAAGAGGATAACAGAAATGGTTCCTGAGAGAAAT +GAGCAAGGACAAACTCTATGGAGTAAAATGAGTGATGCCGGGTCAGATCGAGTAATGGTATCACCTTTGGCAGTGACATG +GTGGAATAGAAATGGACCAATGACAAGTACGGTTCATTATCCAAAAATCTACAAGACTTATTTTGAGAAAGTCGAAAGGT +TAAAACATGGAACCTTTGGCCCTGTCCATTTTAGAAACCAAGTCAAAATACGCCGAAGAGTTGACATAAACCCTGGTCAT +GCAGACCTCAGTGCCAAGGAGGCACAAGACGTAATCATGGAAGTTGTTTTCCCCAATGAAGTGGGGGCCAGGATACTAAC +GTCGGAATCACAATTAACAATAACCAAAGAGAAAAAAGAAGAACTCCAAGATTGCAAAATTTCTCCTTTGATGGTTGCAT +ACATGTTAGAGAGAGAACTTGTCCGAAAAACGAGATTTCTCCCAGTTGCTGGTGGAACAAGCAGTGTGTACATTGAAGTG +TTACACTTGACTCAAGGAACATGTTGGGAACAGATGTACACCCCAGGTGGAGAAGTGAGGAATGATGATGTTGATCAAAG +TCTAATTATTGCAGCCAGGAACATAGTGAGAAGAGCAGCAGTATCAGCAGATCCACTAGCATCTTTATTGGAGATGTGCC +ACAGCACACAGATTGGCGGGACAAGGATGGTGGACATTCTTAGGCAGAACCCAACGGAAGAACAAGCTGTGGATATATGC +AAGGCTGCAATGGGACTGAGAATCAGCTCATCCTTCAGTTTTGGCGGGTTCACATTTAAGAGAACAAGCGGGTCATCAAT +CAAGAGAGAGGAAGAAGTGCTTACGGGCAATCTCCAAACATTGAAAATAAGGGTGCATGAGGGGTACGAGGAATTCACAA +TGGTGGGGAAAAGGGCAACAGCTATACTCAGAAAAGCAACCAGGAGATTGGTTCAGCTGATAGTGAGTGGAAGAGACGAA +CAGTCAATAGCCGAAGCAATAATTGTAGCCATGGTGTTTTCACAAGAAGATTGCATGATAAAAGCAGTTAGAGGTGACCT +GAATTTCGTTAATAGGGCAAATCAGCGATTGAATCCCATGCATCAACTTTTAAGACATTTTCAGAAAGATGCAAAAGTGC +TCTTTCAAAATTGGGGAATTGAACATATCGACAATGTAATGGGAATGATTGGAGTATTACCAGACATGACTCCAAGCACA +GAGATGTCAATGAGAGGGATAAGAGTCAGCAAAATGGGCGTGGATGAATACTCCAGCACAGAGAGGGTAGTGGTAAGCAT +TGACCGGTTTTTGAGAGTTCGAGACCAACGAGGAAATGTACTACTATCTCCTGAGGAGGTCAGTGAAACACAGGGGACAG +AGAAACTGACAATAACTTACTCATCGTCAATGATGTGGGAGATTAATGGCCCTGAGTCAGTGTTGGTCAATACCTATCAG +TGGATCATCAGAAACTGGGAAACTGTTAAAATTCAATGGTCTCAGAATCCTACAATGCTATACAATAAAATGGAATTTGA +GCCATTTCAGTCTTTAGTTCCTAAGGCCATTAGAGGCCAATACAGTGGATTTGTTAGGACTCTATTCCAACAAATGAGGG +ATGTACTTGGGACATTTGATACCACCCAGATAATAAAGCTTCTTCCCTTTGCAGCCGCCCCACCAAAGCAAAGTAGAATG +CAGTTCTCTTCATTGACTGTGAATGTGAGGGGATCAGGAATGAGAATACTTGTAAGGGGCAATTCTCCTGTATTCAACTA +CAACAAGACCACTAAGAGACTAACAATTCTCGGAAAGGATGCTGGCACTTTAACTGAAGACCCAGATGAAGGCACATCCG +GAGTGGAGTCCGCTGTTCTGAGAGGATTCCTCATTCTGGGCAAGGAAGATAGAAGATATGGACCAGCATTAAGCATCAAT +GAACTGAGTACCCTTGCAAAAGGAGAAAAGGCTAATGTACTAATTGGGCAAGGAGACGTGGTGTTGGTAATGAAACGAAA +ACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAATGTTGAATAGTTT +AAAAACGACCTTGTTTCTACT +>NC_007375.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 2, complete sequence +AGCAAAAGCAGGCAAACCATTTGAATGGATGTCAATCCGACCTTACTTTTCTTGAAAGTTCCAGCGCAAAATGCCATAAG +TACTACATTCCCTTATACTGGAGATCCTCCATACAGCCATGGGACAGGAACAGGATACACCATGGACACAGTCAACAGAA +CACATCAATATTCAGAAAAGGGGAAGTGGACAACAAACACGGAAACTGGAGCGCCCCAACTTAACCCAATTGATGGACCA +CTACCTGAGGACAATGAACCAAGTGGATATGCACAAACAGACTGCGTCCTGGAAGCAATGGCTTTCCTTGAGGAATCACA +CCCAGGAATCTTTGAAAATTCGTGTCTTGAAACGATGGAAGTTATTCAACAAACAAGAGTGGACAAACTGACCCAAGGTC +GTCAGACCTATGACTGGACATTGAACAGAAATCAGCCGGCTGCAACTGCGCTAGCCAACACTATAGAGGTCTTCAGATCG +AATGGACTGACAGCTAATGAGTCGGGAAGGCTAATAGATTTCCTCAAGGATGTGATAGAATCAATGGATAAAGAGGAGAT +GGAAATAACAACACACTTCCAAAGAAAAAGAAGAGTAAGAGACAACATGACCAAGAAAATGGTCACACAACGAACAATAG +GAAAGAAGAAGCAAAGATTGAACAAGAGAAGCTATCTGATAAGAGCACTGACATTGAACACAATGACTAAAGATGCAGAG +AGAGGTAAATTAAAAAGAAGAGCAATTGCAACACCCGGTATGCAGATCAGAGGGTTCGTGCACTTTGTCGAAACACTAGC +GAGAAATATTTGTGAGAAACTTGAACAGTCTGGGCTTCCGGTTGGAGGTAATGAAAAGAAGGCTAAACTAGCAAATGTTG +TTAGAAAAATGATGACTAATTCACAAGACACAGAGCTCTCTTTCACAATTACTGGAGACAACACCAAATGGAATGAGAAT +CAAAATCCTCGAGTGTTTCTGGCGATGATAACATACATCACAAGAAATCAACCTGAATGGTTTAGAAACGTCCTGAGCAT +TGCACCCATAATGTTCTCAAATAAAATGGCTAGACTAGGGAAAGGTTACATGTTCGAAAGCAAGAGCATGAAGCTCCGAA +CACAAATACCAGCAGAAATGCTAGCAAGTATTGACCTGAAATACTTTAATGAATCAACCAGAAAGAAAATTGAGAAAATA +AGGCCTCTCCTAATAGATGGCACAGTCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAACATGCTAAGTACAGTCTT +AGGAGTCTCAATCCTGAATCTCGGGCAAAAGAAATACACCAAAACNACATACTGGTGGGACGGACTCCAATCCTCTGATG +ACTTCGCTCTCATAGTGAATGCACCAAATCATGAGGGAATACAAGCAGGGGTGAATAGATTCTACAGAACCTGCAAGCTA +GTCGGAATCAATATGAGCAAAAAGAAGTCCTACATAAATAGGACAGGGACATTTGAATTCACAAGCTTTTTCTATCGCTA +TGGATTTGTAGCCAATTTTAGCATGGAGCTGCCCAGCTTTGGAGTGTCTGGAATTAATGAATCGGCTGATATGAGCATTG +GGGTAACAGTGATAAAGAACAATATGATAAATAATGACCTTGGGCCAGCAACAGCCCAAATGGCTCTTCAACTATTCATC +AAAGACTACAGATACACGTACCGGTGCCACAGAGGGGACACACAAATTCAGACAAGGAGATCATTCGAGCTAAAGAAGCT +GTGGGAGCAAACCCGCTCAAAGGCAGGACTTTTGGTGTCGGATGGAGGATCAAACTTATACAATATCCGGAATCTCCACA +TTCCAGAAGTCTGCTTGAAATGGGAGCTAATGGATGAAGACTATCAGGGGAGGCTTTGTAATCCCCTGAATCCATTTGTC +AGTCATAAGGAAATTGAGTCTGTAAACAATGCTGTGGTAATGCCAGCTCACGGTCCAGCCAAGAGCATGGAATATGATGC +TGTTGCTACTACACACTCCTGGACCCCTAAGAGGAACCGCTCCATTCTCAACACAAGCCAAAGGGGAATTCTTGAAGATG +AACAGATGTATCAGAAGTGTTGCAATCTATTTGAGAAATTCTTCCCTAGCAGTTCGTACAGGAGACCAGTTGGAATTTCC +AGCATGGTGGAGGCCATGGTGTCTAGGGCTCGGATTGATGCACGGATTGACTTCGAGTCTGGACGGATTAAGAAAGAGGA +GTTCGCTGAGATCATGAAGATCTGTTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATG +AAAAAATGCCTTGTTTCTACT +>NC_007376.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 3, complete sequence +AGCAAAAGCAGGTACTGATTCGAAATGGAAGATTTTGTGCGACAATGCTTCAATCCGATGATTGTCGAACTTGCGGAAAA +GGCAATGAAAGAGTATGGAGAAGATCTGAAAATCGAAACAAACAAATTTGCAGCAATATGCACTCACTTGGAAGTATGCT +TCATGTATTCAGATTTTCATTTCATCAATGAGCAAGGCGAGTCAATAATGGTAGAGCTTGATGATCCAAATGCACTTTTG +AAGCACAGATTTGAAATAATAGAGGGAAGAGATCGCACAATGGCCTGGACAGTAGTAAACAGTATTTGCAACACCACAGG +AGCTGAGAAACCGAAGTTTCTGCCAGATTTGTATGATTACAAGGAGAATAGATTCATCGAGATTGGAGTGACAAGGAGAG +AAGTCCACATATACTATCTTGAAAAGGCCAATAAAATTAAATCTGAGAATACACACATCCACATTTTCTCATTCACTGGG +GAAGAAATGGCCACAAAGGCCGACTACACTCTCGATGAGGAAAGCAGGGCTAGGATCAAAACCAGACTATTCACCATAAG +ACAAGAAATGGCCAACAGAGGCCTCTGGGATTCCTTTCGTCAGTCCGAAAGAGGCGAAGAAACAATTGAAGAAAGATTTG +AAATCACAGGGACAATGCGCAGGCTTGCCGACCAAAGTCTCCCGCCGAACTTCTCCTGCCTTGAGAATTTTAGAGCCTAT +GTGGATGGATTCGAACCGAACGGCTACATTGAGGGCAAGCTTTCTCAAATGTCCAAAGAAGTAAATGCAAAAATTGAACC +TTTTCTGAAAACAACACCAAGACCAATTAGACTTCCGGATGGGCCTCCTTGTTTTCAGCGGTCCAAATTCCTGCTGATGG +ATGCTTTAAAATTAAGCATTGAGGACCCAAGTCACGAAGGGGAGGGAATACCACTATATGATGCGATCAAGTGCATGAGA +ACATTCTTTGGATGGAAAGAACCCTATATTGTTAAACCACACGAAAAGGGAATAAATCCAAATTATCTGCTGTCATGGAA +GCAAGTACTGGCGGAACTGCAGGACATTGAGAATGAGGAGAAGATTCCAAGAACTAAAAACATGAAGAAAACGAGTCAGC +TAAAGTGGGCACTTGGTGAGAACATGGCACCAGAGAAGGTAGACTTTGACAACTGTAGAGACATAAGCGATTTGAAGCAA +TATGATAGTGACGAACCTGAATTAAGGTCACTTTCAAGCTGGATCCAGAATGAGTTCAACAAGGCATGCGAGCTGACCGA +TTCAATCTGGATAGAGCTCGATGAGATTGGAGAAGACGTGGCTCCAATTGAACACATTGCAAGCATGAGAAGGAATTACT +TCACAGCAGAGGTGTCCCATTGCAGAGCCACAGAATATATAATGAAGGGGGTATACATTAATACTGCCTTGCTTAATGCA +TCCTGTGCAGCAATGGACGATTTCCAACTAATTCCCATGATAAGCAAGTGTAGAACTAAAGAGGGAAGGCGAAAGACCAA +TTTATATGGTTTCATCATAAAAGGAAGATCTCACTTAAGGAATGACACCGACGTGGTAAACTTTGTGAGCATGGAGTTTT +CTCTCACTGACCCGAGACTTGAGCCACACAAATGGGAGAAGTACTGTGTCCTTGAGATAGGAGATATGCTACTAAGAAGT +GCCATAGGCCAGATGTCAAGGCCTATGTTCTTGTATGTGAGGACAAATGGAACATCAAAGATTAAAATGAAATGGGGAAT +GGAGATGAGGCCTTGCCTCCTTCAGTCACTACAACAAATCGAGAGTATGGTTGAAGCCGAGTCCTCTGTCAAAGAGAAAG +ACATGACCAAAGAGTTTTTTGAGAATAAATCAGAAACATGGCCCATTGGGGAGTCCCCCAAAGGAGTGGAAGAAGGTTCC +ATTGGGAAGGTCTGCAGGACTTTATTAGCCAAGTCGGTATTCAATAGCCTGTATGCATCCCCACAATTAGAAGGATTTTC +AGCTGAATCAAGAAAACTGCTTCTTGTCGTTCAGGCTCTTAGGGACAATCTTGAACCTGGAACCTTTGATCTTGGGGGGC +TATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCGTCTTGGTTCAACTCCTTCCTAACA +CATGCATTAAGATAGTTGTGGCAATGCTACTATTTGCTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACT +>NC_007374.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 4, complete sequence +AGCAAAAGCAGGGGTTATACCATAGACAACCAAAAGCATAACAATGGCCATCATTTATCTCATACTCCTGTTCACAGCAG +TGAGGGGGGACCAGATATGCATTGGATACCATGCCAATAATTCCACAGAAAAGGTCGACACAATTCTAGAGCGGAATGTC +ACTGTGACTCATGCCAAGGACATCCTTGAGAAGACCCATAACGGAAAGCTATGCAAACTAAACGGAATCCCTCCACTTGA +ACTAGGGGACTGTAGCATTGCCGGATGGCTCCTTGGAAATCCAGAATGTGATAGGCTTCTAAGTGTGCCAGAATGGTCCT +ATATAATGGAGAAAGAAAACCCGAGATACAGTTTGTGTTACCCAGGCAGCTTCAATGACTATGAAGAATTGAAACATCTC +CTCAGCAGCGTGAAACATTTTGAGAAAGTTAAGATTTTGCCCAAAGATAGATGGACACAGCATACAACAACTGGAGGTTC +ATGGGCCTGCGCGGTGTCAGGTAAACCATCATTCTTCAGGAACATGGTCTGGCTGACACGTAAAGGATCAAATTATCCGG +TTGCCAAAGGATCGTACAACAATACAAGCGGAGAACAAATGCTAATAATTTGGGGAGTGCACCATCCTAATGATGAGGCA +GAACAAAGAGCATTGTACCAGAATGTGGGAACCTATGTTTCCGTAGCCACATCAACATTGTACAAAAGGTCAATCCCAGA +AATAGCAGCAAGGCCTAAAGTGAATGGACTAGGACGTAGAATGGAATTCTCTTGGACCCTCTTGGATATGTGGGACACCA +TAAATTTTGAGAGCACTGGTAATCTAGTTGCACCAGAGTATGGGTTCAAAATATCGAAAAGAGGTAGTTCAGGGATCATG +AAGACAGAAGGAACACTTGAGAACTGTGAAACCAAATGCCAAACTCCTTTGGGAGCAATAAATACAACACTACCTTTTCA +CAATGTCCACCCACTGACAATAGGTGAATGCCCCAAATATGTAAAATCGGAGAAATTGGTCTTAGCAACAGGACTAAGGA +ATGTTCCCCAGATTGAATCAAGAGGATTGTTTGGGGCAATAGCTGGTTTTATAGAAGGAGGATGGCAAGGAATGGTTGAT +GGTTGGTATGGATACCATCACAGCAATGACCAGGGATCAGGGTATGCAGCAGACAAAGAATCCACTCAAAAGGCATTTAA +TGGAATCACCAACAAGGTAAATTCTGTGATTGAAAAGATGAACACCCAATTTGAAGCTGTTGGGAAAGAATTCAGTAACT +TAGAGAAAAGACTGGAGAACTTGAACAAAAAGATGGAAGACGGGTTTCTAGATGTGTGGACATACAATGCAGAGCTTCTA +GTTCTGATGGAAAATGAGAGGACACTTGACTTTCATGATTCTAATGTCAAGAATCTGTATGATAAAGTCAGAATGCAGCT +GAGAGACAACGTCAAAGAACTAGGAAATGGATGTTTTGAATTTTATCACAAATGTGACAATGAATGCATGGATAGTGTGA +AAAACGGGACATATGATTATCCCAAGTATGAAGAAGAATCTAAACTAAATAGAAATGAAATCAAAGGGGTAAAATTGAGC +AGCATGGGGGTTTATCAAATCCTTGCCATTTATGCTACAGTAGCAGGTTCTCTGTCACTGGCAATCATGATGGCTGGGAT +CTCTTTCTGGATGTGCTCCAACGGGTCTCTGCAGTGCAGAATCTGCATATGATTGTAAGTCATTTTATAATTAAAAACAC +CCTTGTTTCCTGA +>NC_007381.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 5, complete sequence +ATGGCGTCCCAAGGCACCAAACGGTCTTATGAACAGATGGAAACTGATGGGGAACGCCAGAATGCAACTGAGATCAGAGC +ATCCGTCGGGAAGATGATTGATGGAATTGGACGATTCTACATCCAAATGTGCACCGAACTTAAACTCAGTGATTATGAGG +GGCGACTGATCCAGAACAGCTTAACAATAGAGAGAATGGTGCTCTCTGCTTTTGACGAGAGAAGGAATAAATATCTGGAA +GAACATCCCAGCGCGGGGAAGGATCCTAAGAAAACTGGAGGACCCATATACAAGAGAGTAGATGGAAAGTGGATGAGGGA +ACTCGTCCTTTATGACAAAGAAGAAATAAGGCGAATCTGGCGCCAAGCCAATAATGGTGATGATGCAACAGCTGGGCTGA +CTCACATGATGATCTGGCATTCCAATTTGAATGATACAACATACCAGAGGACAAGAGCTCTTGTTCGCACCGGAATGGAT +CCCAGGATGTGCTCTTTGATGCAGGGTTCGACTCTCCCTAGGAGGTCTGGAGCTGCAGGCGCTGCAGTCAAAGGAGTTGG +GACAATGGTGATGGAGTTGATCAGGATGATCAAACGTGGGATCAATGATCGGAACTTCTGGAGAGGTGAGAATGGACGGA +AAACAAGGAGTGCTTACGAGAGAATGTGCAACATTCTCAAAGGAAAATTTCAAACAGCTGCACAAAGAGCAATGATGGAT +CAAGTGAGAGAAAGCCGGAACCCAGGAAATGCTGAGATCGAAGATCTAATCTTTCTGGCACGGTCTGCACTCATATTGAG +AGGGTCAGTTGCTCACAAATCTTGTCTGCCCGCCTGTGTGTATGGACCTGCCATAGCCAGTGGGTACAACTTCGAAAAAG +AGGGATACTCTCTAGTGGGAATAGACCCTTTCAAACTGCTTCAAAACAGCCAAGTATACAGCCTAATCAGACCGAACGAG +AATCCAGCACACAAGAGTCAGCTGGTGTGGATGGCATGCAATTCTGCTGCATTTGAAGATCTAAGAGTATTAAGCTTCAT +CAGAGGGACCAAAGTATCCCCAAGGGGGAAACTTTCCACTAGAGGAGTACAAATTGCTTCAAATGAAAACATGGATACTA +TGGAATCAAGTACTCTTGAACTAAGAAGCAGGTACTGGGCCATAAGGACCAGAAGTGGAGGAAACACTAATCAACAGAGG +GCCTCTGCAGGTCAAATCAGTGTACAACCTGCATTTTCTGTGCAAAGAAACCTCCCATTTGACAAACCAACCATCATGGC +AGCATTCACTGGGAATACAGAGGGAAGAACATCAGACATGAGGGCAGAAATCATAAGGATGATGGAAGGTGCAAAACCAG +AAGAAATGTCCTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCCTCTTTTGAC +ATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTACGACAATTAA +>NC_007382.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 6, complete sequence +ATGAATCCAAATCAAAAGATAATAACAATTGGCTCTGTCTCTCTCACCATTGCAACAGTATGCTTCCTCATGCAGATTGC +CATCCTGGTAACTACTGTGACATTGCATTTTAAGCAACATGAGTGCGACTCCCCCGCGAGCAACCAAGTAATGCCGTGTG +AACCAATAATAATAGAAAGGAACATAACAGAGATAGTGTATTTGAATAACACCACCATAGAGAAAGAGATCTGCCCCGAA +GTAGTGGAATACAGAAATTGGTCAAAGCCGCAATGTCAAATTACAGGATTTGCACCTTTTTCTAAGGACAATTCAATCCG +GCTTTCTGCTGGTGGGGACATTTGGGTGACGAGAGAACCTTATGTGTCATGCGATCCTGGCAAGTGTTATCAATTTGCAC +TCGGGCAGGGGACCACACTAGACAACAAACATTCAAATGACACAATACATGATAGAATCCCTCATCGAACCCTATTAATG +AATGAGTTGGGTGTTCCATTTCATTTAGGAACCAGGCAAGTGTGTGTAGCATGGTCCAGCTCAAGTTGTCACGATGGAAA +AGCATGGTTGCATGTTTGTGTCACTGGGGATGATAAAAATGCAACTGCTAGCTTCATTTATGACGGGAGGCTTATGGACA +GTATTGGTTCATGGTCTCAAAATATCCTCAGGACCCAGGAGTCGGAATGCGTTTGTATCAATGGGACTTGCACAGTAGTA +ATGACTGATGGAAGTGCTTCAGGAAGAGCCGATACTAGAATACTATTCATTGAAGAGGGGAAAATTGTCCATATTAGCCC +ATTGTCAGGAAGTGCTCAGCATGTAGAGGAGTGTTCCTGTTATCCTCGATATCCTGACGTCAGATGTATCTGCAGAGACA +ACTGGAAAGGCTCTAATAGGCCCGTCATAGACATAAATATGGAAGATTATAGCATTGATTCCAGTTATGTGTGCTCAGGG +CTTGTTGGCGACACACCCAGAAACGACGACAGATCTAGCAATAGTAATTGCAGGAATCCTAACAATGAGAGAGGGAATCC +AGGAGTGAAAGGCTGGGCCTTTGACAATGGAGATGACGTGTGGATGGGAAGAACGATCAGCAAGGATTTACGCTCAGGTT +ATGAAACTTTCAAAGTCATTGGTGGTTGGTCCACACCTAATTCCAAATCGCAGATCAATAGACAGGTCATAGTTGACAGC +AATAATTGGTCAGGTTACTCTGGTATTTTCTCTGTTGAGGGCAAAAGATGCATCAATAGGTGCTTTTATGTGGAGTTGAT +AAGGGGAAGGCAACAGGAGACTAGAGTATGGTGGACCTCAAACAGTATTGTTGTGTTTTGTGGCACTTCAGGTACTTATG +GAACAGGCTCATGGCCTGATGGGGCGAACATCAATTTCATGCCTATATAA +>NC_007377.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 7, complete sequence +AGCAAAAGCAGGTAGATATTGAAAGATGAGCCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCGTCCCGTCAGGCC +CCCTCAAAGCCGAGATCGCACAGAGACTTGAAGATGTCTTTGCTGGGAAGAACACAGATCTTGAGGCTCTCATGGAATGG +CTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTGGGATTTGTATTCACGCTCACCGTGCCAAGTGAGCG +AGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTCAATGGGAATGGGGATCCAAATAACATGGACAGAGCAGTTAAAC +TGTATAGAAAGCTTAAGAGGGAGATAACATTCCATGGGGCCAAAGAAGTAGCGCTCAGTTATTCTGCTGGTGCACTTGCC +AGTTGCATGGGCCTCATATACAACAGGATGGGGGCTGTGACCACTGAAGTGGCCTTTGCCGTGGTATGTGCAACCTGTGA +ACAGATTGCTGACTCCCAGCATAGGTCTCACAGGCAAATGGTGACAACAACCAATCCACTAATAAGACATGAGAACAGAA +TGGTTCTGGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCTGGATCGAGTGAGCAAGCAGCAGAGGCCATGGAGGTT +GCTAGTCAGGCCAGGCAAATGGTGCAGGCAATGAGAGCCATTGGGACTCCTCCTAGCTCCAGTGCTGGTCTAAAAGATGA +TCTTCTTGAAAATTTGCAGGCCTATCAGAAACGAATGGGGGTGCAGATGCAACGATTCAAGTGACCCCCTTGTTGTTGCT +GCGAGTATCATTGGGATCTTGCACTTTATATTGTGGATTCTTGATCGTCTTTTTTTCAAATGCATTTATCGCTTCTTTAA +ACACGGTCTGAAAAGAGGGCCTTCTACGGAAGGAGTACCTGAGTCTATGAGGGAAGAATATCGAAAGGAACAGCAGAGTG +CTGTGGATGCTGACGATAGTCATTTTGTCAGCATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT +>NC_007380.1 Influenza A virus (A/Korea/426/1968(H2N2)) segment 8, complete sequence +ATGGATTCTAACACTGTGTCAAGTTTTCAGGTAGATTGCTTCCTTTGGCATGTCCGAAAACAAGTTGTAGACCAAGAACT +AGGTGATGCCCCATTCCTTGATCGGCTTCGCCGAGATCAGAAGTCCCTAAGGGGAAGAGGCAGCACTCTCGATCTAGACA +TCGAAGCAGCCACCCGTGTTGGAAAGCAGATAGTAGAGAGGATTCTGAAGGAAGAATCCGATGAGGCACTTAAAATGACC +ATGGCCTCCGCACCTGCTTCGCGATACCTAACTGACATGACTATTGAGGAATTGTCAAGGGACTGGTTCATGCTAATGCC +CAAGCAGAAAGTGGAAGGCCCTCTTTGCATCAGAATAGACCAGGCAATCATGGATAAGAACATCATGTTGAAAGCGAATT +TCAGTGTGATTTTTGACCGGCTAGAGACCCTAATATTACTAAGGGCTTTCACCGAAGAGGGAGCAATTGTTGGCGAAATT +TCACCATTGCCTTCTCTTCCAGGACATACTATTGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGAGGACTTGAATG +GAATGATAACACAGTTCGAGTCTCTAAAACTCTACAGAGATTCGCTTGGAGAAGCAGTAATGAGAATGGGAGACCTCCAC +TCACTCCAAAACAGAAACGGAAAATGGCGAGAACAATTAGGTCAAAAGTTCGAAGAGATAAGATGGCTGATTGAAGAAGT +GAGACACAGATTGAAGATAACAGAGAATAGTTTTGAGCAAATAACATTTATGCAAGCCTTACAGCTACTATTTGAAGTGG +AACAAGAGATAAGAACTTTCTCGTTTCAGCTTATTTAA +>NC_026422.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 1 polymerase PB2 (PB2) gene, complete cds +ATGGAAAGAATAAAAGAACTAAGAGATTTGATGTCACAGTCTCGCACTCGCGAGATACTGACAAAAACAACTGTGGACCA +TATGGCCATAATCAAGAAATATACATCAGGAAGACAGGAGAAGAATCCTGCCCTTAGGATGAAGTGGATGATGGCAATGA +AATATCCAATTACGGCAGACAAAAGGATAATGGAGATGATCCCGGAAAGAAATGAGCAAGGTCAGACCCTTTGGAGCAAG +ACAAATGATGCTGGATCAGACAGAGTGATGGTGTCACCTCTGGCTGTGACGTGGTGGAACAGAAATGGACCAACGACAAG +CACAGTCCATTATCCAAAGGTCTATAAAACCTATTTTGAAAAGGTCGAAAGGCTAAAACATGGAACCTTCGGCCCCGTTC +ACTTCAGAAACCAGGTTAAAATACGCCGCAGGGTCGACATAAACCCGGGCCATGCAGATCTTAGTGCTAAAGAAGCACAG +GATGTCATCATGGAGGTCGTATTCCCAAACGAAGTTGGAGCCAGAATATTGACATCAGAGTCACAGTTAACGATTACCAA +GGAAAAGAAGAAGGAGCTTCAGGACTGCAAAATTGCCCCTTTAATGGTGGCTTACATGTTGGAGAGAGAACTGGTTCGCA +AAACAAGATTCCTACCAGTAGCTGGAGGGACAAGCAGCGTGTATATCGAGGTGTTGCATTTGACCCAAGGGACCTGCTGG +GAGCAAATGTACACACCGGGAGGGGAAGTGAGAAATGATGATGTTGATCAGAGTTTAATTATTGCTGCTAGAAATATTGT +TAGAAGAGCAACAGTATCAGCAGACCCGTTGGCTTCGCTTTTGGAGATGTGCCATAGTACACAGATTGGCGGGATTAGGA +TGGTTGACATCCTTAGACAAAACCCAACAGAAGAACAGGCTGTGGATATATGTAAGGCAGCAATGGGTCTAAGGATCAGT +TCATCCTTCAGCTTTGGAGGTTTCACTTTCAAAAGGACAAGTGGGTCATCTGTCAAAAGGGAAGAAGAAGTGCTCACAGG +CAACCTCCAAACATTGAAAATAAGAGTACATGAAGGATATGAGGAATTCACAATGGTCGGGCGAAGAGCAACAGCCATTC +TAAGGAAAGCAACCAGAAGACTGATCCAACTGATAGTGAGTGGGAAAGACGAGCAATCAATCGCCGAGGCAATCATAGTG +GCAATGGTATTCTCACAAGAGGATTGTATGATAAAGGCAGTGAGAGGTGATTTGAACTTTGTCAACAGAGCAAACCAGCG +GCTAAATCCCATGCATCAACTCCTGAGGCATTTCCAAAAGGATGCAAAGGTCCTGTTTCAAAACTGGGGAATTGAACCCA +TTGACAATGTAATGGGGATGATCGGAATATTGCCTGACATGACCCCCAGCACAGAGATGTCATTGAGAGGAGTGAGAGTT +AGTAAAATGGGAGTAGATGAATATTCCAGCACTGAGAGAGTGGTCGTGAGTATTGATCGTTTCTTGAGGGTCCGAGACCA +GAGGGGAAACGTACTCCTGTCTCCTGAAGAGGTTAGTGAAACACAGGGAACAGAAAAGCTGACTATAACATATTCATCGT +CCATGATGTGGGAGATCAATGGTCCGGAATCAGTGCTAGTTAACACATATCAATGGATCATTAGAAATTGGGAAAATGTA +AAGATTCAATGGTCCCAAGATCCTACAATGCTATACAATAAGATGGAATTTGAACCCTTTCAATCCCTAGTGCCTAAAGC +TGCCAGGGGCCAATATAGTGGGTTCGTGAGGGTTCTATTCCAACAGATGCGTGACGTACTGGGAACATTTGACACTGTCC +AAATAATAAAGCTATTACCATTTGCAGCAGCCCCGCCGAAGCAGAGTAGGATGCAGTTCTCTTCTCTAACTGTGAATGTG +AGGGGTTCCGGAATGAGAATAGTTGTGAGAGGCAATTCTCCTGTGTTCAACTACAACAAGGCAACCAAGAGGCTTACGGT +GCTTGGAAAGGATGCAGGTGCATTGATGGAAGACCCCGATGAGGGAACAGCAGGAGTGGAATCTGCGGTATTGAGGGGAT +TTCTGATTCTGGGCAAAGAAGACAAAAGATATGGGCCAGCATTGAGCATCAACGAATTGAGCAATCTTGCGAAAGGAGAG +AAGGCTAATGTGTTGATAGGGCAAGGAGACGTTGTGTTGGTGATGAAACGGAAACGGGACTCTAGCATACTTACTGACAG +TCAGACAGCGACCAAAAGGATTCGGATGGCCATCAATTAA +>NC_026423.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 2 polymerase PB1 (PB1) and PB1-F2 protein (PB1-F2) genes, complete cds +ATGGATGTCAATCCGACTTTACTTTTCTTGAAAGTGCCAGTGCAAAATGCTATAAGTACCACTTTCCCTTATACTGGAGA +CCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTCAACAGAACACATAAATACTCAGAAAAAGGAA +AGTGGACAACGAACACAGAGACTGGAGCACCCCAACTCAATCCAATTGATGGACCATTACCTGAGGACAACGAGCCGAGT +GGGTATGCACAAACGGATTGTGTATTGGAAGCAATGGCTTTCCTTGAAGAATCTCACCCAGGGATCTTTGAAAACTCGTG +TCTCGAAACGATGGAAATTGTTCAGCAAACAAGAGTGGATAAACTGACCCAAGGCCGCCAGACCTATGACTGGACGTTGA +ATAGAAATCAGCCGGCTGCTACCGCATTGGCCAACACTATAGAGGTATTCAGATCGAATGGCCTGACAGCCAATGAATCA +GGAAGGTTGATCGATTTCCTCAAGGACGTGATGGATTCAATGGATAAGGAAGAAATGGAGATTACAACACATTTCCAGAG +GAAGAGGAGAGTGAGGGACAACATGACCAAGAAAATGGTCACACAGAGAACAATAGGAAAGAAAAAACAAAGACTGAACA +AAAGGAGCTACCTAATAAGAGCACTTACATTGAACACAATGACAAAGGATGCTGAAAGAGGCAAGCTGAAAAGGAGGGCA +ATCGCAACACCCGGGATGCAAATCAGAGGATTCGTGTATTTTGTAGAAGCACTAGCGAGGAGCATCTGTGAGAAACTTGA +GCAATCTGGCCTCCCTGTCGGAGGGAATGAGAAGAAAGCTAAATTGGCAAATGTTGTGAGGAAGATGATGACTAATTCAC +AAGATACAGAGCTCTCCTTCACAATTACTGGGGACAACACCAAATGGAATGAGAATCAAAACCCCCGGATGTTTCTAGCA +ATGATAACATACATCACAAGAAACCAGCCAGAATGGTTTAGAAATGTCTTAAGCATTGCTCCTATAATGTTCTCAAACAA +GATGGCGAGATTAGGAAAAGGGTACATGTTCGAAAGTAAGAGTATGAAGTTACGGACACAAGTACCAGCGGAAATGCTCG +CAAATATTGACCTGAAATACTTCAACAAATCAACAAGAGAGAAAATCGAGAAAATAAGACCTCTACTGATAGATGGCACA +GCCTCATTGAGTCCTGGAATGATGATGGGCATGTTCAACATGTTGAGTACAGTCTTAGGAGTTTCAATTCTGAATCTCGG +GCAGAAGAAGTACACCAAAACCACATATTGGTGGGACGGACTCCAATCCTCAGATGACTTCGCCCTCATAGTGAATGCAC +CGAATCATGAGGGAATACAGGCAGGAGTAGATAGGTTCTATAGAACCTGCAAATTAGTTGGGATAAACATGAGCAAGAAG +AAATCCTACATAAATCGGACAGGAACATTCGAATTCACAAGCTTTTTCTACCGCTATGGATTCGTAGCTAACTTCAGTAT +GGAGTTGCCCAGTTTTGGAGTGTCCGGGATTAATGAGTCAGCTGACATGAGCGTTGGTGTTACAGTAATAAAGAACAATA +TGATAAACAACGATCTTGGACCAGCAACAGCCCAAATGGCCCTTCAGCTATTTATCAAAGACTACAGATACACATACCGA +TGTCACAGGGGTGATACGCAAATTCAAACGAGGAGAGCATTCGAGCTGAAGAAGCTGTGGGAGCAGACCCGTTCGAAGGC +AGGACTGTTGGTTTCAGATGGAGGGCCAAACCTGTACAATATCCGGAACCTCCACATTCCAGAGGTCTGCTTGAAATGGG +AATTGATGGATGAAGACTACCAAGGCAGGTTGTGTAATCCTATGAACCCGTTTGTCAGTCATAAGGAAATTGATTCAGTC +AACAATGCTGTGGTGATGCCAGCTCATGGCCCAGCCAAAAGCATGGAGTATGATGCCGTTGCAACCACACATTCATGGAT +TCCTAAGAGGAATCGCTCCATTCTCAACACCAGCCAAAGGGGGATTCTTGAGGACGAACAGATGTACCAGAAGTGCTGCA +ACCTATTCGAAAAGTTCTTCCCCAGCAGTTCGTACAGGAGGCCAGTTGGAATTTCCAGCATGGTGGAGGCCATGGTGTCT +AGGGCCCGAATTGATGCACGAATTGACTTCGAATCTGGAAGGATTAAGAAAGAAGAGTTTGCTGAGATCATGAAGATCTG +TTCCACCATTGAAGAGCTCAGACGGCAAAAATAGTGAATTTAGCTTGTCCTTCATGA +>NC_026424.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 3 polymerase PA (PA) and PA-X protein (PA-X) genes, complete cds +ATGGAAGACTTTGTGCGACAGTGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGA +TCCGAAAATCGAAACAAACAAATTCGCATCAATATGCACACACTTAGAAGTCTGCTTCATGTACTCTGATTTCCACTTCA +TCGACGAACGAGGCGAATCAACTATAATAGAATCTGGCGATCCAAATGCGCTGCTGAAACACCGATTTGAAATAATCGAA +GGGAGAGACCGAACAATGGCCTGGACAGTGGTGAATAGTATCTGCAACACCACAGGAGCCGAAAAACCCAAATTTCTCCC +GGATCTGTATGACTACAAGGAAAACCGTTTCATTGAAATTGGAGTGACGAGGAGGGAAGTCCACATATATTACCTAGAGA +AAGCCAATAAAATAAAATCCGAGAAGACACACATCCATATTTTTTCATTCACTGGAGAAGAGATGGCCACCAAAGCAGAT +TACACTCTTGACGAAGAAAGCAGGGCAAGAATCAAAACCAGGCTGTTCACCATAAGGCAGGAAATGGCCAGCAGGGGTCT +ATGGGATTCCTTTCGTCAGTCTGAAAGAGGCGAAGAAACAATTGAAGAAAGATTTGAAATCACAGGAACCATGCGCAGGC +TTGCCGACCAAAGTCTCCCACCGAACTTCTCCAGCCTTGAAAACTTTAGAGCCTATGTGGATGGATTCGAACCGAACGGC +TGCATTGAGGGCAAGCTTTCTCAGATGTCAAAAGAAGTGAACGCCAGAATTGAGCCATTTCTAAGAACAACACCACGCCC +TCTCAGATTGCCTAATGGGCCTCCCTGCTCTCAGCGGTCGAAATTCTTGCTGATGGATGCTCTGAAATTAAGCATTGAGG +ACCCGAGCCACGAAGGGGAGGGGATACCGCTATATGATGCGATCAAATGCATGAAAACGTTCTTCGGGTGGAAAGAGCCC +AACATTATCAAACCACATGAGAAAGGCATAAACCCCAATTATCTCCTGACTTGGAAGCAGGTGCTAGCAGAACTTCAGGA +CATTGAAAATGAAGAGAAGATTCCAAGGACAAAGAACATGAAGAAAACAAGCCAATTAAAGTGGGCACTCGGTGAGAACA +TGGCACCGGAGAAGGTGGACTTTGAGGATTGCAAAGATGTCAACGACTTGAAACAGTACAACAGTGATGAGCCAGAGCCC +AGATCACTAGCATGTTGGATCCAGAATGAATTCAACAAGGCGTGTGAACTGACTGACTCAAGCTGGGTAGAACTTGATGA +AATAGGGGAAGATGTTGCCCCAATCGAACACATTGCAAGCATGAGACGGAACTATTTTACAGCAGAGGTGTCCCACTGCA +GGGCTACTGAATATATAATGAAGGGAGTGTACATAAATACAGCTTTGCTCAATGCATCTTGTGCAGCCATGGATGACTTT +CAACTGATTCCAATGATAAGTAAATGTAGAACCAAAGAAGGAAGACGGAAAACAAACCTGTATGGATTCATTATAAAAGG +AAGATCTCATTTGAGGAATGATACCGACGTGGTAAACTTTGTAAGTATGGAATTTTCCCTTACCGACCCAAGGTTGGAAC +CACATAAATGGGAAAAGTATTGTGTTCTTGAAATAGGGGACATGCTCCTGCGAACTGCAGTAGGCCAAGTGTCAAGACCC +ATGTTTCTGTATGTGAGAACCAATGGGACCTCCAAGATCAAGATGAAATGGGGTATGGAAATGAGACGCTGCCTTCTTCA +ATCTCTCCAACAGATTGAGAGCATGATTGAAGCTGAATCCTCCGTCAAAGAGAAAGACCTGACCAAAGAATTCTTTGAAA +ACAAATCAGAAACATGGCCAATTGGAGAGTCACCTAAAGGAGTGGAGGAAGGTTCCATCGGGAAGGTGTGCAGAACCTTA +CTAGCAAAATCTGTATTCAACAGCCTATATGCATCTCCGCAACTCGAGGGGTTCTCAGCTGAATCGAGAAAACTGCTACT +CATTGTTCAGGCGCTTAGGGATAACCTGGAACCTGGAACCTTTGATCTTGAAGGGCTATATGAAGCAATCGAGGAGTGCC +TGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTAAGATAGTTGTGGCAA +TGCTACTATTTGCTAT +>NC_026425.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 4 hemagglutinin (HA) gene, complete cds +ATGAACACTCAAATCCTGGTATTCGCTCTGATTGCGATCATTCCAACAAATGCAGACAAAATCTGCCTCGGACATCATGC +CGTGTCAAACGGAACCAAAGTAAACACATTAACTGAAAGAGGAGTGGAAGTCGTCAATGCAACTGAAACAGTGGAACGAA +CAAACATCCCCAGGATCTGCTCAAAAGGGAAAAGGACAGTTGACCTCGGTCAATGTGGACTCCTGGGGACAATCACTGGA +CCACCTCAATGTGACCAATTCCTAGAATTTTCAGCCGATTTAATTATTGAGAGGCGAGAAGGAAGTGATGTCTGTTATCC +TGGGAAATTCGTGAATGAAGAAGCTCTGAGGCAAATTCTCAGAGAATCAGGCGGAATTGACAAGGAAGCAATGGGATTCA +CATACAGTGGAATAAGAACTAATGGAGCAACCAGTGCATGTAGGAGATCAGGATCTTCATTCTATGCAGAAATGAAATGG +CTCCTGTCAAACACAGATAATGCTGCATTCCCGCAGATGACTAAGTCATATAAAAATACAAGAAAAAGCCCAGCTCTAAT +AGTATGGGGGATCCATCATTCCGTATCAACTGCAGAGCAAACCAAGCTATATGGGAGTGGAAACAAACTGGTGACAGTTG +GGAGTTCTAATTATCAACAATCTTTTGTACCGAGTCCAGGAGCGAGACCACAAGTTAATGGTCTATCTGGAAGAATTGAC +TTTCATTGGCTAATGCTAAATCCCAATGATACAGTCACTTTCAGTTTCAATGGGGCTTTCATAGCTCCAGACCGTGCAAG +CTTCCTGAGAGGAAAATCTATGGGAATCCAGAGTGGAGTACAGGTTGATGCCAATTGTGAAGGGGACTGCTATCATAGTG +GAGGGACAATAATAAGTAACTTGCCATTTCAGAACATAGATAGCAGGGCAGTTGGAAAATGTCCGAGATATGTTAAGCAA +AGGAGTCTGCTGCTAGCAACAGGGATGAAGAATGTTCCTGAGATTCCAAAAGGAAGAGGCCTATTTGGTGCTATAGCGGG +TTTCATTGAAAATGGATGGGAAGGCCTAATTGATGGTTGGTATGGTTTCAGACACCAGAATGCACAGGGAGAGGGAACTG +CTGCAGATTACAAAAGCACTCAATCGGCAATTGATCAAATAACAGGAAAATTAAACCGGCTTATAGAAAAAACCAACCAA +CAATTTGAGTTGATAGACAATGAATTCAATGAGGTAGAGAAGCAAATCGGTAATGTGATAAATTGGACCAGAGATTCTAT +AACAGAAGTGTGGTCATACAATGCTGAACTCTTGGTAGCAATGGAGAACCAGCATACAATTGATCTGGCTGATTCAGAAA +TGGACAAACTGTACGAACGAGTGAAAAGACAGCTGAGAGAGAATGCTGAAGAAGATGGCACTGGTTGCTTTGAAATATTT +CACAAGTGTGATGATGACTGTATGGCCAGTATTAGAAATAACACCTATGATCACAGCAAATACAGGGAAGAGGCAATGCA +AAATAGAATACAGATTGACCCAGTCAAACTAAGCAGCGGCTACAAAGATGTGATACTTTGGTTTAGCTTCGGGGCATCAT +GTTTCATACTTCTAGCCATTGTAATGGGCCTTGTCTTCATATGTGTAAAGAATGGAAACATGCGGTGCACTATTTGTATA +TAAGTTTGGAAAAAACACCCTTGTTTCT +>NC_026426.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 5 nucleocapsid protein (NP) gene, complete cds +ATGGCGTCTCAAGGCACCAAACGATCCTATGAACAGATGGAAACTGGTGGGGAACGCCAGAATGCTACTGAGATCAGGGC +ATCTGTTGGAAGAATGGTTAGCGGCATTGGGAGATTCTACATACAGATGTGTACAGAACTCAAACTCAGTGACAATGAAG +GGAGGCTGATTCAGAACAGTATAACAATAGAGAGAATGGTACTCTCTGCATTTGATGAAAGAAGGAACAGATACCTGGAA +GAGCACCCCAGTGCAGGAAAGGACCCTAAGAAAACTGGAGGTCCAATTTACAGGAGAAGAGACGGAAAATGGGTGAGAGA +GCTGATCCTGTATGACAAAGAGGAAATCAGGAGAATTTGGCGACAAGCGAACAATGGAGAGGATGCAACTGCTGGTCTTA +CCCATCTGATGATATGGCATTCCAACCTGAATGATGCTACCTATCAGAGAACGAGAGCTCTCGTGCGTACTGGAATGGAT +CCCCGGATGTGCTCTCTGATGCAAGGATCAACTCTCCCGAGGAGATCTGGAGCTGCAGGTGCAGCAGTGAAGGGGATAGG +GACAATGGTGATGGAACTGATTCGGATGATAAAACGAGGGATCAACGACCGGAATTTCTGGAGAGGCGAAAATGGAAGAA +GGACAAGAATTGCATATGAGAGAATGTGCAACATCCTCAAAGGGAAATTCCAAACAGCAGCACAAAGGGCAATGATGGAT +CAAGTGCGAGAGAGCAGAAATCCTGGGAATGCTGAAATAGAAGATCTCATTTTTCTGGCAAGGTCTGCACTCATCCTGAG +AGGATCAGTGGCTCATAAATCCTGCTTGCCTGCTTGTGTGTACGGACTTGCAGTGGCTAGTGGATATGACTTTGAGAGAG +AAGGGTACTCCTTGGTTGGAATAGATCCTTTCCGTCTGCTTCAAAACAGCCAGGTCTTTAGTCTCATTAGACCAAATGAG +AACCCAGCACATAAGAGCCAACTAGTGTGGATGGCATGCCACTCTGCAGCGTTTGAGGACCTTAGGGTCTCAAGTTTCAT +TAGAGGGACAAGAATGGTCCCAAGAGGACAGCTATCCACTAGAGGGGTTCAAATTGCTTCAAATGAGAACATGGAAGCAA +TGGACTCCAATACTCTTGAACTGAGAAGTAGATATTGGGCTATAAGAACCAGAAGCGGAGGGAACACCAACCAACAGAGG +GCATCTGCAGGACAGGTCAGCGTTCAACCCACTTTCTCAGTACAGAGAAACCTTCCTTTCGAAAGAGCAACCATTATGGC +AGCATTTACAGGAAATACTGAGGGTAGAACGTCTGACATGAGGACTGAAATCATAAGAATGATGGAAAGTGCCAGACCAG +AAGATGTGTCATTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGAC +ATGAATAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAATTGAAGAAAAAAA +>NC_026429.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 6 neuraminidase (NA) gene, complete cds +ATGAATCCAAATCAGAAGATTCTATGCACTTCAGCCACTGCTATCATAATAGGCGCAATCGCAGTACTCATTGGAATGGC +AAACCTAGGATTGAACATAGGACTGCATCTAAAACCGGGCTGCAATTGCTCACACTCACAACCTGAAACAACCAACACAA +GCCAAACAATAATAAACAACTATTATAATGAAACAAACATCACCAAYATCCAAATGGAAGAGAGAACAAGCAGGAATTTC +AATAACTTAACTAAAGGGCTCTGTACTATAAATTCATGGCACATATATGGGAAAGACAATGCAGTAAGAATTGGAGAGAG +CTCGGATGTTTTAGTCACAAGAGAACCCTATGTTTCATGCGACCCAGATGAATGCAGGTTCTATGCTCTCAGCCAAGGAA +CAACAATCAGAGGGAAACACTCAAACGGAACAATACACGATAGGTCCCAGTATCGCGCCCTGATAAGCTGGCCACTATCA +TCACCGCCCACAGTGTACAACAGCAGGGTGGAATGCATTGGGTGGTCAAGTACTAGTTGCCATGATGGCAAATCCAGGAT +GTCAATATGTATATCAGGACCAAACAACAATGCATCTGCAGTAGTATGGTACAACAGAAGGCCTGTTGCAGAAATTAACA +CATGGGCCCGAAACATACTAAGAACACAGGAATCTGAATGTGTATGCCACAACGGCGTATGCCCAGTAGTGTTCACCGAT +GGGTCTGCCACTGGACCTGCAGACACAAGAATATACTATTTTAAAGAGGGGAAAATATTGAAATGGGAGTCTCTGACTGG +AACTGCTAAGCATATTGAAGAATGCTCATGTTACGGGGAACGAACAGGAATTACCTGCACATGCAGGGACAATTGGCAGG +GCTCAAATAGACCAGTGATTCAGATAGACCCAGTAGCAATGACACACACTAGTCAATATATATGCAGTCCTGTTCTTACA +GACAATCCCCGACCGAATGACCCAAATATAGGTAAGTGTAATGACCCTTATCCAGGTAATAATAACAATGGAGTCAAGGG +ATTCTCATACCTGGATGGGGCTAACACTTGGCTAGGGAGGACAATAAGCACAGCCTCGAGGTCTGGATACGAGATGTTAA +AAGTGCCAAATGCATTGACAGATGATAGATCAAAGCCCATTCAAGGTCAGACAATTGTATTAAACGCTGACTGGAGTGGT +TACAGTGGATCTTTCATGGACTATTGGGCTGAAGGGGACTGCTATCGAGCGTGTTTTTATGTGGAGTTGATACGTGGAAG +ACCCAAGGAGGATAAAGTGTGGTGGACCAGCAATAGTATAGTATCGATGTGTTCCAGTACAGAATTCCTGGGACAATGGA +ACTGGCCTGATGGGGCTAAAATAGAGTACTTCCTCTAA +>NC_026427.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 7 matrix protein 2 (M2) and matrix protein 1 (M1) genes, complete cds +ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATTCCATCAGGCCCCCTCAAAGCCGAGATCGCACAGAG +ACTTGAGGATGTTTTTGCAGGGAAGAACGCAGATCTCGAGGCTCTCATGGAGTGGATAAAGACAAGACCAATCCTGTCAC +CTCTGACTAAGGGGATTTTAGGGTTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGGTTTGTC +CAAAACGCCCTAAATGGGAATGGAGACCCAAACAACATGGACAAGGCGGTTAAATTATACAAGAAACTGAAGAGGGAAAT +GACATTTCATGGAGCAAAGGAAGTTGCACTCAGTTACTCAACTGGTGCGCTTGCCAGCTGCATGGGTCTCATATACAACA +GAATGGGGACTGTGACCGCAGAAGGGGCTCTTGGACTAGTATGTGCCACTTGTGAGCAGATTGCTGACGCACAACATCGG +TCCCACAGGCAGATGGCGACTACTACTAACCCACTAATTAGGCATGAGAATAGAATGGTACTAGCCAGCACTACGGCTAA +GGCTATGGAGCAGATGGCTGGATCAAGTGAACAGGCAGCGGAAGCCATGGAAGTTGCAAGTCAGGCTAGGCAAATGGTGC +AGGCTATGAGAACAGTTGGGACTCACCCTAACTCCAGTACAGGTCTAAAAGATGATCTTATTGAAAATTTGCAGGCCTAC +CAGAACCGGATGGGAGTGCAACTGCAGCGGTTCAAGTGAGCCTCTAGTCGTTGCAGCTAACATTATTGGGATATTGCACT +TGATATTGTGGATTCTTGATCGTCTTTTCTTCAAATGCATTTATCGTCGTTTTAAATACGGTTTGAAAAGAGGGCCTTCT +ACGGAAGGAATGCCTGAGTCTATGAGGGAAGAATATCGGCAGGAACAGCAGAATGCTGTGGATGTTGACGATGGTCATTT +TGTCAACATAGAGCTGAAGTAAAAA +>NC_026428.1 Influenza A virus (A/Shanghai/02/2013(H7N9)) segment 8 nuclear export protein (NEP) and nonstructural protein 1 (NS1) genes, complete cds +ATGGATTCCAATACTGTGTCAAGCTTCCAGGTAGACTGCTTTCTTTGGCATGTCCGCAAACGATTTGCAGACCAAGAAAT +GGGTGATGCCCCATTTCTAGACCGGCTTCGCCGAGATCAGAAGTCCCTGAGAGGAAGAAGCAGCACTCTTGGTCTGGACA +TCAGAACTGCCACGCGTGAAGGAAAGCATATAGTGGAGCGGATTTTAGAGGAAGAGTCAGATGAAGCATTTAAAATGAGT +ATTGCTTCAGTGCCAGCTCCACGCTATCTAACTGACATGACTCTTGAAGAAATGTCAAGAGATTGGTTAATGCTCATTCC +CAAACAGAAAATAACAGGGTCCCTATGCATTAGAATGGACCAAGCAATAGTGGACAAAAACATCACATTGAAAGCAAATT +TCAGTGTGATTTTCAATCGGCTTGAAGCCCTGATACTACTTAGAGCTTTTACGGAAGAAGGAGCAATTGTAGGCGAAATC +TCACCATTACCTTCTCTTCCAGGACATACTGACAAGGATGTCAAAAATGCAATTGAGATCCTCATCGGAGGATTTGAATG +GAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCGCTTGGAGAAGCAGCGATGAGGATGGGAGATCTCCAC +TCTCTACAAAGTAGAAACGGGAAATGGAGAGAACAGTTAAGCCAGAAGTTCGAAGAAATAAGATGGTTGATTGAAGAAGT +ACGACATAGATTAAAAATTACGGAGAATAGCTTTGAGCAAATAACTTTTATGCAAGCCTTACAACTATTGCTTGAAGTGG +AGCAAGAGATAAGAACTTTCTCGTTTCAGCTTATTTAATGA +>NC_026438.1 Influenza A virus (A/California/07/2009(H1N1)) segment 1 polymerase PB2 (PB2) gene, complete cds +ATGGAGAGAATAAAAGAACTGAGAGATCTAATGTCGCAGTCCCGCACTCGCGAGATACTCACTAAGACCACTGTGGACCA +TATGGCCATAATCAAAAAGTACACATCAGGAAGGCAAGAGAAGAACCCCGCACTCAGAATGAAGTGGATGATGGCAATGA +GATACCCAATTACAGCAGACAAGAGAATAATGGACATGATTCCAGAGAGGAATGAACAAGGACAAACCCTCTGGAGCAAA +ACAAACGATGCTGGATCAGACCGAGTGATGGTATCACCTCTGGCCGTAACATGGTGGAATAGGAATGGCCCAACAACAAG +TACAGTTCATTACCCTAAGGTATATAAAACTTATTTCGAAAAGGTCGAAAGGTTGAAACATGGTACCTTCGGCCCTGTCC +ACTTCAGAAATCAAGTTAAAATAAGGAGGAGAGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCCAAGGAGGCACAG +GATGTGATTATGGAAGTTGTTTTCCCAAATGAAGTGGGGGCAAGAATACTGACATCAGAGTCACAGCTGGCAATAACAAA +AGAGAAGAAAGAAGAGCTCCAGGATTGTAAAATTGCTCCCTTGATGGTGGCGTACATGCTAGAAAGAGAATTGGTCCGTA +AAACAAGGTTTCTCCCAGTAGCCGGCGGAACAGGCAGTGTTTATATTGAAGTGTTGCACTTAACCCAAGGGACGTGCTGG +GAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTTGACCAAAGTTTGATTATCGCTGCTAGAAACATAGT +AAGAAGAGCAGCAGTGTCAGCAGACCCATTAGCATCTCTCTTGGAAATGTGCCACAGCACACAGATTGGAGGAGTAAGGA +TGGTGGACATCCTTAGACAGAATCCAACTGAGGAACAAGCCGTAGACATATGCAAGGCAGCAATAGGGTTGAGGATTAGC +TCATCTTTCAGTTTTGGTGGGTTCACTTTCAAAAGGACAAGCGGATCATCAGTCAAGAAAGAAGAAGAAGTGCTAACGGG +CAACCTCCAAACACTGAAAATAAGAGTACATGAAGGGTATGAAGAATTCACAATGGTTGGGAGAAGAGCAACAGCTATTC +TCAGAAAGGCAACCAGGAGATTGATCCAGTTGATAGTAAGCGGGAGAGACGAGCAGTCAATTGCTGAGGCAATAATTGTG +GCCATGGTATTCTCACAGGAGGATTGCATGATCAAGGCAGTTAGGGGCGATCTGAACTTTGTCAATAGGGCAAACCAGCG +ACTGAACCCCATGCACCAACTCTTGAGGCATTTCCAAAAAGATGCAAAAGTGCTTTTCCAGAACTGGGGAATTGAATCCA +TCGACAATGTGATGGGAATGATCGGAATACTGCCCGACATGACCCCAAGCACGGAGATGTCGCTGAGAGGGATAAGAGTC +AGCAAAATGGGAGTAGATGAATACTCCAGCACGGAGAGAGTGGTAGTGAGTATTGACCGATTTTTAAGGGTTAGAGATCA +AAGAGGGAACGTACTATTGTCTCCCGAAGAAGTCAGTGAAACGCAAGGAACTGAGAAGTTGACAATAACTTATTCGTCAT +CAATGATGTGGGAGATCAATGGCCCTGAGTCAGTGCTAGTCAACACTTATCAATGGATAATCAGGAACTGGGAAATTGTG +AAAATTCAATGGTCACAAGATCCCACAATGTTATACAACAAAATGGAATTTGAACCATTTCAGTCTCTTGTCCCTAAGGC +AACCAGAAGCCGGTACAGTGGATTCGTAAGGACACTGTTCCAGCAAATGCGGGATGTGCTTGGGACATTTGACACTGTCC +AAATAATAAAACTTCTCCCCTTTGCTGCTGCCCCACCAGAACAGAGTAGGATGCAATTTTCCTCATTGACTGTGAATGTG +AGAGGATCAGGGTTGAGGATACTGGTAAGAGGCAATTCTCCAGTATTCAATTACAACAAGGCAACCAAACGACTTACAGT +TCTTGGAAAGGATGCAGGTGCATTGACTGAAGATCCAGATGAAGGCACATCTGGGGTGGAGTCTGCTGTCCTGAGAGGAT +TTCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTAAGCATCAATGAACTGAGCAATCTTGCAAAAGGAGAG +AAGGCTAATGTGCTAATTGGGCAAGGGGACGTAGTGTTGGTAATGAAACGAAAACGGGACTCTAGCATACTTACTGACAG +CCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG +>NC_026435.1 Influenza A virus (A/California/07/2009(H1N1)) segment 2 polymerase PB1 (PB1) gene, complete cds; and nonfunctional PB1-F2 protein (PB1-F2) gene, complete sequence +ATGGATGTCAATCCGACTCTACTTTTCCTAAAAATTCCAGCGCAAAATGCCATAAGCACCACATTCCCTTATACTGGAGA +TCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTAAACAGAACACACCAATACTCAGAAAAGGGAA +AGTGGACGACAAACACAGAGACTGGTGCACCCCAGCTCAACCCGATTGATGGACCACTACCTGAGGATAATGAACCAAGT +GGGTATGCACAAACAGACTGTGTTCTAGAGGCTATGGCTTTCCTTGAAGAATCCCACCCAGGAATATTTGAGAATTCATG +CCTTGAAACAATGGAAGTTGTTCAACAAACAAGGGTAGATAAACTAACTCAAGGTCGCCAGACTTATGATTGGACATTAA +ACAGAAATCAACCGGCAGCAACTGCATTGGCCAACACCATAGAAGTCTTTAGATCGAATGGCCTAACAGCTAATGAGTCA +GGAAGGCTAATAGATTTCTTAAAGGATGTAATGGAATCAATGAACAAAGAGGAAATAGAGATAACAACCCACTTTCAAAG +AAAAAGGAGAGTAAGAGACAACATGACCAAGAAGATGGTCACGCAAAGAACAATAGGGAAGAAAAAACAAAGACTGAATA +AGAGAGGCTATCTAATAAGAGCACTGACATTAAATACGATGACCAAAGATGCAGAGAGAGGCAAGTTAAAAAGAAGGGCT +ATCGCAACACCTGGGATGCAGATTAGAGGTTTCGTATACTTTGTTGAAACTTTAGCTAGGAGCATTTGCGAAAAGCTTGA +ACAGTCTGGGCTCCCAGTAGGGGGCAATGAAAAGAAGGCCAAACTGGCAAATGTTGTGAGAAAGATGATGACTAATTCAC +AAGACACAGAGATTTCTTTCACAATCACTGGGGACAACACTAAGTGGAATGAAAATCAAAATCCTCGAATGTTCCTGGCG +ATGATTACATATATCACCAGAAATCAACCCGAGTGGTTCAGAAACATCCTGAGCATGGCACCCATAATGTTCTCAAACAA +AATGGCAAGACTAGGGAAAGGGTACATGTTCGAGAGTAAAAGAATGAAGATTCGAACACAAATACCAGCAGAAATGCTAG +CAAGCATTGACCTGAAGTACTTCAATGAATCAACAAAGAAGAAAATTGAGAAAATAAGGCCTCTTCTAATAGATGGCACA +GCATCACTGAGTCCTGGGATGATGATGGGCATGTTCAACATGCTAAGTACGGTCTTGGGAGTCTCGATACTGAATCTTGG +ACAAAAGAAATACACCAAGACAATATACTGGTGGGATGGGCTCCAATCATCCGACGATTTTGCTCTCATAGTGAATGCAC +CAAACCATGAGGGAATACAAGCAGGAGTGGACAGATTCTACAGGACCTGCAAGTTAGTGGGAATCAACATGAGCAAAAAG +AAGTCCTATATAAATAAGACAGGGACATTTGAATTCACAAGCTTTTTTTATCGCTATGGATTTGTGGCTAATTTTAGCAT +GGAGCTACCCAGCTTTGGAGTGTCTGGAGTAAATGAATCAGCTGACATGAGTATTGGAGTAACAGTGATAAAGAACAACA +TGATAAACAATGACCTTGGACCTGCAACGGCCCAGATGGCTCTTCAATTGTTCATCAAAGACTACAGATACACATATAGG +TGCCATAGGGGAGACACACAAATTCAGACGAGAAGATCATTTGAGTTAAAGAAGCTGTGGGATCAAACCCAATCAAAGGT +AGGGCTATTAGTATCAGATGGAGGACCAAACTTATACAATATACGGAATCTTCACATTCCTGAAGTCTGCTTAAAATGGG +AGCTAATGGATGATGATTATCGGGGAAGACTTTGTAATCCCCTGAATCCCTTTGTCAGTCATAAAGAGATTGATTCTGTA +AACAATGCTGTGGTAATGCCAGCCCATGGTCCAGCCAAAAGCATGGAATATGATGCCGTTGCAACTACACATTCCTGGAT +TCCCAAGAGGAATCGTTCTATTCTCAACACAAGCCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAGAAGTGCTGCA +ATCTATTCGAGAAATTTTTCCCTAGCAGTTCATATAGGAGACCGGTTGGAATTTCTAGCATGGTGGAGGCCATGGTGTCT +AGGGCCCGGATTGATGCCAGGGTCGACTTCGAGTCTGGACGGATCAAGAAAGAAGAGTTCTCTGAGATCATGAAGATCTG +TTCCACCATTGAAGAACTCAGACGGCAAAAATAA +>NC_026437.1 Influenza A virus (A/California/07/2009(H1N1)) segment 3 polymerase PA (PA) gene, complete cds +ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGRAAAGGCAATGAAAGAATATGGGGAAGA +TCCGAAAATCGAAACTAACAAGTTTGCTGCAATATGCACACATTTGGAAGTTTGTTTCATGTATTCGGATTTCCATTTCA +TCGACGAACGGGGTGAATCAATAATTGTAGAATCTGGTGACCCGAATGCACTATTGAAGCACCGATTTGAGATAATTGAA +GGAAGAGACCGAATCATGGCCTGGACAGTGGTGAACAGTATATGTAACACAACAGGGGTAGAGAAGCCTAAATTTCTTCC +TGATTTGTATGATTACAAAGAGAACCGGTTCATTGAAATTGGAGTAACACGGAGGGAAGTCCACATATATTACCTAGAGA +AAGCCAACAAAATAAAATCTGAGAAGACACACATTCACATCTTTTCATTCACTGGAGAGGAGATGGCCACCAAAGCGGAC +TACACCCTTGACGAAGAGAGCAGGGCAAGAATCAAAACTAGGCTTTTCACTATAAGACAAGAAATGGCCAGTAGGAGTCT +ATGGGATTCCTTTCGTCAGTCCGAAAGAGGCGAAGAGACAATTGAAGAAAAATTTGAGATTACAGGAACTATGCGCAAGC +TTGCCGACCAAAGTCTCCCACCGAACTTCCCCAGCCTTGAAAACTTTAGAGCCTATGTAGATGGATTCGAGCCGAACGGC +TGCATTGAGGGCAAGCTTTCCCAAATGTCAAAAGAAGTGAACGCCAAAATTGAACCATTCTTGAGGACGACACCACGCCC +CCTCAGATTGCCTGATGGGCCTCTTTGCCATCAGCGGTCAAAGTTCCTGCTGATGGATGCTCTGAAATTAAGTATTGAAG +ACCCGAGTCACGAGGGGGAGGGAATACCACTATATGATGCAATCAAATGCATGAAGACATTCTTTGGCTGGAAAGAGCCT +AACATAGTCAAACCACATGAGAAAGGCATAAATCCCAATTACCTCATGGCTTGGAAGCAGGTGCTAGCAGAGCTACAGGA +CATTGAAAATGAAGAGAAGATCCCAAGGACAAAGAACATGAAGAGAACAAGCCAATTGAAGTGGGCACTCGGTGAAAATA +TGGCACCAGAAAAAGTAGACTTTGATGACTGCAAAGATGTTGGAGACCTTAAACAGTATGACAGTGATGAGCCAGAGCCC +AGATCTCTAGCAAGCTGGGTCCAAAATGAATTCAATAAGGCATGTGAATTGACTGATTCAAGCTGGATAGAACTTGATGA +AATAGGAGAAGATGTTGCCCCGATTGAACATATCGCAAGCATGAGGAGGAACTATTTTACAGCAGAAGTGTCCCACTGCA +GGGCTACTGAATACATAATGAAGGGAGTGTACATAAATACGGCCTTGCTCAATGCATCCTGTGCAGCCATGGATGACTTT +CAGCTGATCCCAATGATAAGCAAATGTAGGACCAAAGAAGGAAGACGGAAAACAAACCTGTATGGGTTCATTATAAAAGG +AAGGTCTCATTTGAGAAATGATACTGATGTGGTGAACTTTGTAAGTATGGAGTTCTCACTCACTGACCCGAGACTGGAGC +CACACAAATGGGAAAAATACTGTGTTCTTGAAATAGGAGACATGCTCTTGAGGACTGCGATAGGCCAAGTGTCGAGGCCC +ATGTTCCTATATGTGAGAACCAATGGAACCTCCAAGATCAAGATGAAATGGGGCATGGAAATGAGGCGCTGCCTTCTTCA +GTCTCTTCAGCAGATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAGGAATTCTTTGAAA +ACAAATCGGAAACATGGCCAATCGGAGAGTCACCCAGGGGAGTGGAGGAAGGCTCTATTGGGAAAGTGTGCAGGACCTTA +CTGGCAAAATCTGTATTCAACAGTCTATATGCGTCTCCACAACTTGAGGGGTTTTCGGCTGAATCTAGAAAATTGCTTCT +CATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATCGAGGAGTGCC +TGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAGTAG +>NC_026433.1 Influenza A virus (A/California/07/2009(H1N1)) segment 4 hemagglutinin (HA) gene, complete cds +ATGAAGGCAATACTAGTAGTTCTGCTATATACATTTGCAACCGCAAATGCAGACACATTATGTATAGGTTATCATGCGAA +CAATTCAACAGACACTGTAGACACAGTACTAGAAAAGAATGTAACAGTAACACACTCTGTTAACCTTCTAGAAGACAAGC +ATAACGGGAAACTATGCAAACTAAGAGGGGTAGCCCCATTGCATTTGGGTAAATGTAACATTGCTGGCTGGATCCTGGGA +AATCCAGAGTGTGAATCACTCTCCACAGCAAGCTCATGGTCCTACATTGTGGAAACACCTAGTTCAGACAATGGAACGTG +TTACCCAGGAGATTTCATCGATTATGAGGAGCTAAGAGAGCAATTGAGCTCAGTGTCATCATTTGAAAGGTTTGAGATAT +TCCCCAAGACAAGTTCATGGCCCAATCATGACTCGAACAAAGGTGTAACGGCAGCATGTCCTCATGCTGGAGCAAAAAGC +TTCTACAAAAATTTAATATGGCTAGTTAAAAAAGGAAATTCATACCCAAAGCTCAGCAAATCCTACATTAATGATAAAGG +GAAAGAAGTCCTCGTGCTATGGGGCATTCACCATCCATCTACTAGTGCTGACCAACAAAGTCTCTATCAGAATGCAGATG +CATATGTTTTTGTGGGGTCATCAAGATACAGCAAGAAGTTCAAGCCGGAAATAGCAATAAGACCCAAAGTGAGGGRTCRA +GAAGGGAGAATGAACTATTACTGGACACTAGTAGAGCCGGGAGACAAAATAACATTCGAAGCAACTGGAAATCTAGTGGT +ACCGAGATATGCATTCGCAATGGAAAGAAATGCTGGATCTGGTATTATCATTTCAGATACACCAGTCCACGATTGCAATA +CAACTTGTCAAACACCCAAGGGTGCTATAAACACCAGCCTCCCATTTCAGAATATACATCCGATCACAATTGGAAAATGT +CCAAAATATGTAAAAAGCACAAAATTGAGACTGGCCACAGGATTGAGGAATATCCCGTCTATTCAATCTAGAGGCCTATT +TGGGGCCATTGCCGGTTTCATTGAAGGGGGGTGGACAGGGATGGTAGATGGATGGTACGGTTATCACCATCAAAATGAGC +AGGGGTCAGGATATGCAGCCGACCTGAAGAGCACACAGAATGCCATTGACGAGATTACTAACAAAGTAAATTCTGTTATT +GAAAAGATGAATACACAGTTCACAGCAGTAGGTAAAGAGTTCAACCACCTGGAAAAAAGAATAGAGAATTTAAATAAAAA +AGTTGATGATGGTTTCCTGGACATTTGGACTTACAATGCCGAACTGTTGGTTCTATTGGAAAATGAAAGAACTTTGGACT +ACCACGATTCAAATGTGAAGAACTTATATGAAAAGGTAAGAAGCCAGCTAAAAAACAATGCCAAGGAAATTGGAAACGGC +TGCTTTGAATTTTACCACAAATGCGATAACACGTGCATGGAAAGTGTCAAAAATGGGACTTATGACTACCCAAAATACTC +AGAGGAAGCAAAATTAAACAGAGAAGAAATAGATGGGGTAAAGCTGGAATCAACAAGGATTTACCAGATTTTGGCGATCT +ATTCAACTGTCGCCAGTTCATTGGTACTGGTAGTCTCCCTGGGGGCAATCAGTTTCTGGATGTGCTCTAATGGGTCTCTA +CAGTGTAGAATATGTATTTAA +>NC_026436.1 Influenza A virus (A/California/07/2009(H1N1)) segment 5 nucleocapsid protein (NP) gene, complete cds +ATGGCGTCTCAAGGCACCAAACGATCATATGAACAAATGGAGACTGGTGGGGAGCGCCAGGATGCCACAGAAATCAGAGC +ATCTGTCGGAAGAATGATTGGTGGAATCGGGAGATTCTACATCCAAATGTGCACTGAACTCAAACTCAGTGATTATGATG +GACGACTAATCCAGAATAGCATAACAATAGAGAGGATGGTGCTTTCTGCTTTTGATGAGAGAAGAAATAAATACCTAGAA +GAGCATCCCAGTGCTGGGAAGGACCCTAAGAAAACAGGAGGACCCATATATAGAAGAGTAGACGGAAAGTGGATGAGAGA +ACTCATCCTTTATGACAAAGRAGAAATAAGGAGAGTTTGGCGCCTAGCAAACAATGGCGAAGATGCAACAGCAGGTCTTA +CTCATATCATGATTTGGCATTCCAACCTGAATGATGCCACATATCAGAGAACAAGAGCGCTTGTTCGCACCGGAATGGAT +CCCAGAATGTGCTCTCTAATGCAAGGTTCAACACTTCCCAGAAGGTCTGGTGCCGCAGGTGCTGCGGTGAAAGGAGTTGG +AACAATAGCAATGGAGTTAATCAGAATGATCAAACGTGGAATCAATGACCGAAATTTCTGGAGGGGTGAAAATGGACGAA +GGACAAGGGTTGCTTATGAAAGAATGTGCAATATCCTCAAAGGAAAATTTCAAACAGCTGCCCAGAGGGCAATGATGGAT +CAAGTAAGAGAAAGTCGAAACCCAGGAAACGCTGAGATTGAAGACCTCATTTTCCTGGCACGGTCAGCACTCATTCTGAG +GGGATCAGTTGCACATAAATCCTGCCTGCCTGCTTGTGTGTATGGGCTTGCAGTAGCAAGTGGGCATGACTTTGAAAGGG +AAGGGTACTCACTGGTCGGGATAGACCCATTCAAATTACTCCAAAACAGCCAAGTGGTCAGCCTGATGAGACCAAATGAA +AACCCAGCTCACAAGAGTCAATTGGTGTGGATGGCATGCCACTCTGCTGCATTTGAAGATTTAAGAGTATCAAGTTTCAT +AAGAGGAAAGAAAGTGATTCCAAGAGGAAAGCTTTCCACAAGAGGGGTCCAGATTGCTTCAAATGAGAATGTGGAAACCA +TGGACTCCAATACCCTGGAACTGAGAAGCAGATACTGGGCCATAAGGACCAGGAGTGGAGGAAATACCAATCAACAAAAG +GCATCCGCAGGCCAGATCAGTGTGCAGCCTACATTCTCAGTGCAGCGGAATCTCCCTTTTGAAAGAGCAACCGTTATGGC +AGCATTCAGCGGGAACAATGAAGGACGGACATCCGACATGCGAACAGAAGTTATAAGAATGATGGAAAGTGCAAAGCCAG +AAGATTTGTCCTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGAC +ATGAGTAATGAAGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAGTTGA +>NC_026434.1 Influenza A virus (A/California/07/2009(H1N1)) segment 6 neuraminidase (NA) gene, complete cds +ATGAATCCAAACCAAAAGATAATAACCATTGGTTCGGTCTGTATGACAATTGGAATGGCTAACTTAATATTACAAATTGG +AAACATAATCTCAATATGGATTAGCCACTCAATTCAACTTGGGAATCAAAATCAGATTGAAACATGCAATCAAAGCGTCA +TTACTTATGAAAACAACACTTGGGTAAATCAGACATATGTTAACATCAGCAACACCAACTTTGCTGCTGGACAGTCAGTG +GTTTCCGTGAAATTAGCGGGCAATTCCTCTCTCTGCCCTGTTAGTGGATGGGCTATATACAGTAAAGACAACAGTGTAAG +AATCGGTTCCAAGGGGGATGTGTTTGTCATAAGGGAACCATTCATATCATGCTCCCCCTTGGAATGCAGAACCTTCTTCT +TGACTCAAGGGGCCTTGCTAAATGACAAACATTCCAATGGAACCATTAAAGACAGGAGCCCATATCGAACCCTAATGAGC +TGTCCTATTGGTGAAGTTCCCTCTCCATACAACTCAAGATTTGAGTCAGTCGCTTGGTCAGCAAGTGCTTGTCATGATGG +CATCAATTGGCTAACAATTGGAATTTCTGGCCCAGACAATGGGGCAGTGGCTGTGTTAAAGTACAACGGCATAATAACAG +ACACTATCAAGAGTTGGAGAAACAATATATTGAGAACACAAGAGTCTGAATGTGCATGTGTAAATGGTTCTTGCTTTACT +GTAATGACCGATGGACCAAGTAATGGACAGGCCTCATACAAGATCTTCAGAATAGAAAAGGGAAAGATAGTCAAATCAGT +CGAAATGAATGCCCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATTCTAGTGAAATCACATGTGTGTGCAGGG +ATAACTGGCATGGCTCGAATCGACCGTGGGTGTCTTTCAACCAGAATCTGGAATATCAGATAGGATACATATGCAGTGGG +ATTTTCGGAGACAATCCACGCCCTAATGATAAGACAGGCAGTTGTGGTCCAGTATCGTCTAATGGAGCAAATGGAGTAAA +AGGGTTTTCATTCAAATACGGCAATGGTGTTTGGATAGGGAGAACTAAAAGCATTAGTTCAAGAAACGGTTTTGAGATGA +TTTGGGATCCGAACGGATGGACTGGGACAGACAATAACTTCTCAATAAAGCAAGATATCGTAGGAATAAATGAGTGGTCA +GGATATAGCGGGAGTTTTGTTCAGCATCCAGAACTAACAGGGCTGGATTGTATAAGACCTTGCTTCTGGGTTGAACTAAT +CAGAGGGCGACCCAAAGAGAACACAATCTGGACTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAACAGTGACACTGTGG +GTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTTACCATTGACAAGTAA +>NC_026431.1 Influenza A virus (A/California/07/2009(H1N1)) segment 7 matrix protein 2 (M2) and matrix protein 1 (M1) genes, complete cds +ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTTTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAG +ACTGGAAAGTGTCTTTGCAGGAAAGAACACAGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCTTGTCAC +CTCTGACTAAGGGAATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTC +CAAAATGCCCTAAATGGGAATGGGGACCCGAACAACATGGATAGAGCAGTTAAACTATACAAGAAGCTCAAAAGAGAAAT +AACGTTCCATGGGGCCAAGGAGGTGTCACTAAGCTATTCAACTGGTGCACTTGCCAGTTGCATGGGCCTCATATACAACA +GGATGGGAACAGTGACCACAGAAGCTGCTTTTGGTCTAGTGTGTGCCACTTGTGAACAGATTGCTGATTCACAGCATCGG +TCTCACAGACAGATGGCTACTACCACCAATCCACTAATCAGGCATGAAAACAGAATGGTGCTGGCTAGCACTACGGCAAA +GGCTATGGAACAGATGGCTGGATCGAGTGAACAGGCAGCGGAGGCCATGGAGGTTGCTAATCAGACTAGGCAGATGGTAC +ATGCAATGAGAACTATTGGGACTCATCCTAGCTCCAGTGCTGGTCTGAAAGATGACCTTCTTGAAAATTTGCAGGCCTAC +CAGAAGCGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTCGTCATTGCAGCAAATATCATTGGGATCTTGCACC +TGATATTGTGGATTACTGATCGTCTTTTTTTCAAATGTATTTATCGTCGCTTTAAATACGGTTTGAAAAGAGGGCCTTCT +ACGGAAGGAGTGCCTGAGTCCATGAGGGAAGAATATCAACAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTT +TGTCAACATAGAGCTAGAGTAA +>NC_026432.1 Influenza A virus (A/California/07/2009(H1N1)) segment 8 nuclear export protein (NEP) and nonstructural protein 1 (NS1) genes, complete cds +ATGGACTCCAACACCATGTCAAGCTTTCAGGTAGACTGTTTCCTTTGGCATATCCGCAAGCGATTTGCAGACAATGGATT +GGGTGATGCCCCATTCCTTGATCGGCTCCGCCGAGATCAAAAGTCCTTAAAAGGAAGAGGCAACACCCTTGGCCTCGATA +TCGAAACAGCCACTCTTGTTGGGAAACAAATCGTGGAATGGATCTTGAAAGAGGAATCCAGCGAGACACTTAGAATGACA +ATTGCATCTGTACCTACTTCGCGCTACCTTTCTGACATGACCCTCGAGGAAATGTCACGAGACTGGTTCATGCTCATGCC +TAGGCAAAAGATAATAGGCCCTCTTTGCGTGCGATTGGACCAGGCGATCATGGAAAAGAACATAGTACTGAAAGCGAACT +TCAGTGTAATCTTTAACCGATTAGAGACCTTGATACTACTAAGGGCTTTCACTGAGGAGGGAGCAATAGTTGGAGAAATT +TCACCATTACCTTCTCTTCCAGGACATACTTATGAGGATGTCAAAAATGCAGTTGGGGTCCTCATCGGAGGACTTGAATG +GAATGGTAACACGGTTCGAGTCTCTGAAAATATACAGAGATTCGCTTGGAGAAACTGTGATGAGAATGGGAGACCTTCAC +TACCTCCAGAGCAGAAATGAAAAGTGGCGAGAGCAATTGGGACAGAAATTTGAGGAAATAAGGTGGTTAATTGAAGAAAT +GCGGCACAGATTGAAAGCGACAGAGAATAGTTTCGAACAAATAACATTTATGCAAGCCTTACAACTACTGCTTGAAGTAG +AACAAGAGATAAGAGCTTTCTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTAC +>NC_036616.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 1 polymerase PB2 (PB2) gene, complete cds +GGCATAAGCAGAGGATGTCACTACTATTAACGCTCGCAAAAGAGTATGCAAATCTCACAAAGGATAAGAAATCATGCAAA +TTGCTGTCGCAAGGGACCGTGTCAAGCTACACCACTTTTAAGAAATGGACAACATCGAGAAAAGAGAAAAACCCATCCCT +TCGAATGAGATGGGCAATGGGAAGCAAGTTCCCAATTATGGCAAACAGAGAAATTTTGGAAGAAGCTGGGATACCAGAAC +AATGGGAAGGGATAGACCTTTGGTCAAAAAAGGATGATGTTTCAAAGTTGGGGATGGTGTTAGCGTCTCCAGCAGCCATA +ACTTACTGGAATTTTTGTGGACCTGGAGTGGACAATTCTTCTGTAATAAAAGATGTTTATAAAGCAAAATTTATGAAAAA +AGAAAGATGGAGAGAGACTCTATGGGGACCAATGAACTTTGAATTGGTGGGTAAACAAAGAAGAGTGGTTGAAACTCAAC +CAGTGGAAATAAAGCTAAACCAAAAAGAAATAAAAGAACTAACGATGTGGGTTCTTTTTGAAGATGAAGCAAACCTTGCA +AGCAAATTCATACAGGAAAATTTCTCACTTGTCCTGTCATTAAGAGAACTTTACAAGGGAAAGGCAGTAAATAAAGATGT +TGCAGCTTTCATGATTGCCCACCAATTTTCTCCCGAGAAGAGGTTCTTACCCACTTTTGGCCCCATTAGACCAGAAAGAA +TGGAGCTACTCCACTGTTTAGGGGGTGATTTCTGGAAGATAGAGGCAGTAACTGCAGGGAGCCTGAACGAAGAACAAAAG +AAGAGAGATGTTAGAGCAGTTGCTAGAAAAATTTGCCTTAGAGCAAGTGTGGACTTATTTACTCCAGCAGAGAAGATAAG +GGACTATATAGCAAGTGTGACAATGAGATTTGGAACAGTAGAAAGAACATTCGAAGACGTAATAAGAAACAGTGATGACA +TATCTGCGGAAGTAACCTTATGCAAGGCGGCACTTGGGTGCGAATTGGGCAAAAGCATGAGCTTTGGGAATCTAAATCTG +AGGAAAGTCAGTGGAGAAGCAGAAACAATGGAAAAAACAGTATATTGGGGATTAAAGCCCATAAAATATAAATGCTGGAG +AGGAGAGGAAACATTTTATTGTGAACTGAGGAAGGTAACTTGTATGTTTAGAAGGTCTGAAGGCCTAGATTGGGCTAACA +TTGGACCTGGTTCACCTGAAGAAAGAAGAGAGCTTTTGGCAATGGTGATGATATTCTGCAGAGATGGGAGATTCTTTGAA +TCTGCACCAGTTAATATTGATGAATCATTCTTTAGGACAAGACTGAATAAAGAAATACCTTATCAATATGTGCTGCTAAA +ATGGGTAAGGCAATCGAGAGACAACTTGGATGCCTTGTTGAGTACAAGAGGACTAATACCTGCTCATATTGGACAATTCG +GAAAAGGAATGGGAATAGATGGAAGTAGCTCATCTTCTATGGTTTACAAGGGAGTCATGTTGTCGAAGACACCGATAGAC +ATAGTGGAGAGCAAAGAGAAGCACAGACTGTTTTTAAATGACAATATAGAAGCAGTGACAGAGAGAGGAGCAATGGTTGC +ATCCATAATGGACCTATCAGAGGATAATAGAGAAACATTTAACGATGTGACTTTTAACCATGTCGACTTAGCTGTTCTCA +AAGATGAAAAGACTGCAATAATAAAGATATATCGATCACTAGTGGAAAGAATAAACACTGATGATGATGGCCTACCTGCT +TTGATAATGGGTAAAAGATATTTAGAGTTGTATCAATTAGATGAAGTAAAAGACGCGGTCGGGCTAATACCAAAAAGGAT +GCTGGGGGCGTATTCCTACCAAGCAAGACAGCTCATACAGTCACAGATCAAAAATGACAGTTATAGCCTTCCTGAAATAA +TAAAGTTACTGCCCTTCTGTTACAGCCCTCCAAAGAAAATGTTATTTGATGGGACTTTCCATTTCAAAAATCAAATGTAT +GTTAGGCCTGGAATAAACACAAACCTTTTCAGTTTTAGTAAGACCGACAAAAGCAAGATATATGTGAACGGAAGCGCAGT +AAAAATAAAGCTTGTGCTCGGAGACGATGAAATGGACACCAGTCTTGCCTTTGTTGAAGGATTTCAAGTTTGTGAATATG +ATCCAAGAGCACCTTTGATACCAAGAAGAGATTTGAGACTGATTGGGTTCGGAAAGAAAGTTAGAGTTTTTGTTGGTCAG +GGACAGGAGAAAACCCTGGTGAGGACGAGCTCCAAAAGAGCCGCCTCCCATGATGTAAGCAAAAACATTCGTAGAATGCG +TCTGGAAGTTTGAAGCACATTGAAAAAATCCTCTTGCTACTGCT +>NC_036615.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 2 polymerase PB1 (PB1) gene, complete cds +GGCATAAGCAGAGGATTTTATAACAATGGAAATAAACCCATATCTACTCATGTTAAACAATGATATAACGTCAATGATAT +CATTGACATACCCATATACTGGGGCACCTCCTATGTCACATGGAACATCGACCAAATACTCAATGGAGACTGTGTCAAGA +ACTTACTCCTACAGTAGAACTAAAAAAGAGGTACCTTCGGGAATATTCCCAATAGAGAGAAGGAAATTCTGTAACACAAT +AGAAGACAAAGAAAACCTAGAAAAACCGAATGGAAATGTTGATATAAATTTCATGTTATCGCTGGCAGAAATGCTGGAAG +AAAAGATGGGGAAAGGGTTCTTCAAATTCTGTGCCAATGAAGCTGAAGCTGAAATTTTGAAGATGCACTTCAGCAAGCTC +ACTGAAGGAAGGCAAACTTATGACTGGACAAGTGAAAGAAATATGCCAGCAGCCACCGCTCTTCAGCTAACAGTAGACGC +TATACAAGAAACACAGGGAACATTCAAAGGAACTACCATGGTTGAATATTGCAACAAGATATTAGAAATGATGGATTGGC +CGGAAGTGAAATTCAAAAAGGTCAGAATGATTGTTCAGAGGCATTGGGACCCGAAAACCAAAAAAGAAATAAAAATGAAG +TCTCCAACATTGATGATAACAAAGATTGGAAGAGAAGAATTCATAAAGAGGATATGCACGATAAATACCATGGCCAAAGA +CGGAGAAAGAGGAAAATACAAAAGAAGAGCTATAGCCACCCCCGGGATGGGAATCAGGCCATTCTCAAAAATTGTGGAAA +CTTTAGCACAAAAGATTTGTGAGAGACTAGCAGAGAGCGGTTTGCCTGTTGGGGGAAATGAGAAGAAAGCCAAACTAAAA +ACTACGGTCTCTTCAACAAACTCAAAACTACAAGAAGGGCAGTTCATGGTAAACATAACAGGGGACAACAGCAAGTGGAA +TGAATGTCAGCAACCAGAAGCTTATCTTGCAATGTTGGCATACATTACTAAAGACAGCAGCAACTTAATGAAAGATCTCT +GCTCAGTAGCACCAACATTGTTCTGCAATAAGTACGTAAAAATGGGACAAGGTTTCCGAGCAAAAAACAAAAGAAAAACC +AAAGAAATAGTGATACCCGCAAAAAAGATGAAAGAAAGGAAAGAATTGATGAACGCGGAATGGAGGGACCTATTTGAAAC +AATAGAACCTTACATGGATGGAGAGTGCTGCTTCTTGGGGGGAGGAATGCTGATGGGAATGTTTAACATGTTGTCAACTG +TTTTTGGAGTCATGACATTAAATTACAGGGAGGAAGCATTGGCCAGAAGGAACTGTTACTGGACTGGGCTACAAAGTTCA +GATGATTTTGTGCTCTTTTGCATCTCTAGGACTTGGCCAGAGATGGAGATGACTATTCTAAAATTCATCGCTGTTTGCAA +GTTGATGGGAATAAACATGTCTTTGGAAAAATCCTACGGGTGCTTGCCTGAACTTTTTGAGTTCACAAGCATGTTCTTTT +CCGGGGATTTTGTCTCAAACATAGCCTTGGAGTTACCTGCTTTCACAACAGCTGGAATGAATGAAGGAACCGACTTCACA +GCTGCGATGTCTGTCATAAGAACAAACATGATTAATAATGGACTTTCTCCTGGGACTGCTTTAATGGCCCTGCGAATTTG +TCTGCAGGAATTTAGAGCAACATACAGAGTACACCCTTATGATTCTGGAGTGAAGAATCATCGAATGAAAATCATAAGGA +AATTCATTGAAACTATTGAAAACAAAGATGGATTGCTGATATCAGATGGCGGGAAATTAATGAACAATATCTCAAGTTTG +CACATCCCTGAAGAAATATTGAAAGAGGATTTGATGGATCCCTCCTACAGGAACAGAGTTTTCAATCCTAGGAACCCCTT +TACACAGTTTGAGAAGACAGTTGACATCTTTAAGGCAAGTGGACCTATAAGGGTAGAGGAGAACGAGGCAGTTGTATCAA +CGCATTCCTTTAGAACAAGGAGCAATAGGACATTGCTAAATACAGACATGAGGGCAATGGCTCTCGAAGAGAAAAGATAC +CAAGTTGTTTGCAACATGTACCGATCGGTCTTCGAAAGTGCAGACGTTAACACCCCAATAGGATCAATGTCGATGGGAGA +GGCAATTGAAGCCAAAATCCTTGACCGGGCCAGAACCCAGTTTGAAAATGGAATCATAGGGGGAGAAGAATATTCTGAAA +TCAAAAGACTAATCGAGGACGCCAAGCGTCAACGACTGTCTGTTTAAGCTTTGCGTTGTTTAATAACAGAAAAATCCTCT +TGCTACTGCT +>NC_036619.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 3 polymerase 3 (P3) gene, complete cds +GGCATAAGCAGGAGATTTAGAAATGTCTAGTGTAATCAGAGAAATCGCAAAGCGATTCTTGGAACAAGCAACGATAAACA +TCGCTGAAGAAGTGGTCAGAGAATATGGAGACCATGAAAGAACAATGATATCTGTTGGAGTTCATTTCCAAGCTTGCTGC +CTTATAAGTGATGAATATACCCTTGAGGATGAGACAACCCCAAGATACGTTCTTTTGGAGGGATTGAAAAGACAAGAGGC +TATAAGCAAGCAGAATAACATTTGCTCCACTTTGGGATTGGAGCCCTTGAGAAATCTAGCAGATATTTTTGATCGAAAAA +CAAGAAGATTCCTTGAGGTAGGAATTACAAAGAGAGAATCCGATGAGTATTACCAGGAAAAGTTCAACAAAATAGGAAAT +GACATGGACATACATGTTTTCACATATGAAGGCAAATATTTCAGCAACAATCCCAATGGGTTGGAAGACATCCAAAAGAC +AAGAATTTTTACATTCCTATCTTTTGTGTCAGACGAATTGAGAAAAGAGAACATGTTCACAGAAATGTATGTTACAGAAG +AAGGGGCACCTGAACTTGAAATGTACAAGTCAAAGCTTTTCATTGCGATGAGAGACGAGAGCGTGCCTTTGCCTTACATA +AACTATGAGCACCTTAGGACAAGATGTGAAACATTCAAAAGAAATCAGGCTGAATGCGAAGCAAAGGTAGCGGATGTGGC +TTCACGGCTAAAAATCAAACTGGAACATCTAGAAGAAAATAAACTGCGGCCGCTAGAGATACCGAAGGAGAAAGAGGCTC +CCTATACACACAAATTTTTGATGAAAGATGCTTGGTTCTTTGCAAAACCTCATGATTCGGAGAGAGCACAACCGCAACAG +ATATTGTATGATTTCTTTGAAGCAGCAAACATGGGGTTCATGACGACATCCCCAAAACCGATATTCGGAAAGCAAGGACT +GATGTATCACTCCCTCTGGGGGCAGACAAAAAGAGCAATAAAGGACAAGAGAAATGAGTTGGAGCCTTCAGAACAGAGAG +ACTTCCTTTGTGGAATTGGAAGAGCCTCCAAGAAAATACAGGAGGACAAATGGCAAGAATCCAGAGAGGAAGAGTTTAAA +CAAGAAGAGACTAAAGGGGCAGCTAAGAGGGGGTTCCCAACATGGTTTAATGAAGAATGGCTTTGGGCAATGAGGGACTC +AGGGGATGGGGACAATAAAATAGGGGATTGGATACCCATGGCAGAAATGCCTCCCTGCAAGAATGAGATGGAAGATTATG +CAAAAAAGATGTGTGAAGAATTAGAATCCAAAATACAGGGAACAAATTGTGCTAGGGAAATGTCCAAGTTGATACATACA +ATTGGGAGCTTACATACAGAATGTAGGAACTTTCCCGGAAAGGTCAAGATAGTGCCTATATACTGCAGAGGGACACTGAG +AGGGGAATCAACTGACTGTTTGTTTGGAATAGCAATAAAAGGGAAATCCCATTTAAACAAAGATGATGGAATGTATACTG +TTGTAACTTTTGAGTTTTCCACTGAAGAACCAAATCCAAGCAAACATGAAAAATATACGGTCTTCGAAGCTGGAACAGTG +CCTGTGGAAGCCGTGGTGTTAACTCCCAAAAGGGAAAGAGTTCTCAAAGAGAAGAAATTGTTCCTTTATTGCAGAACTAC +TGGAATGAGCAAGTTAAAGAACGATTGGTTTTCTAAATGCAGGAGATGTCTTATACCAACAATGGAGACTGTAGAGCAGA +TAGTGCTGAAAGAATGCGCTCTGAAAGAAGAAAACAGAGTTTCAGAGATGTTGGAGAATAAGAGAGCTTGGATTGCCCAT +GAGAACGGAGAGAATCTTACAAGATTGGTATCAACAAAGCTCAAGGACTTGTGTAGAATGCTAATTGTGACACAATTTTA +TTACTGTATATATAACGACAATCAATTGGAAGGATTCTGTAACGAGCAAAAGAAATTCCTTATGTTTCTTCAAGCAGATA +AGGACTCAAAATCTGCATTTACTTTTAATCAGAAAGGGTTATATGAAAAAATTGAAGAGTGTATTGTCAGCAATCCATTA +TGTATTTTCCTAGCTGATAGGCTAAACAAATTATTTCTTGTAGCCAAGTCCAATGGAGCTAAGTACTTTGAATGACCAAA +GGCCTTGTAATGTTAAAAATCTCCTTGCTACTGCT +>NC_036618.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 4 hemagglutinin-esterase precursor (HEF) gene, complete cds +AGCATAAGCAGGAGATTTTCAAAGATGTTTTTGCTTCTAGCAACAATTACAGCAATAACTGCTTGCCAAGCAGAAAGAGA +ACTGATATGCATAGTGCAAAGAGTGAATGAAAGCTTCTCTCTTCACTCTGGATTTGGAGGAAATGTTTACAGCATGAAGA +CTGAGCCAATGACTGGATTCACAAACGTGACCAAAGGTGCTAGTGTCATCAACCAAAAAGACTGGATTGGATTCGGAGAT +TCAAGAACAGACTTGACTAATGATCAGTTTCCAGCGTCTTCAGATGTTCCATTGGCAGTGGCGAAGAAGTTTCGGTCATT +GTCAGGGGCTTCGTTGATGTTGTCAGCTTTTGGGCCTCCTGGCAAGGTTGACTACCTCTATCAAGGATGTGGGAAAGAAA +AAGTATTTTATGAAGGGGTAAACTGGTCCCCTGAGGCAGGAATTGATTGCTTTGGATCAAACTGGACTCAGACAAAGAAG +GACTTCTATTCGAGGATATATGAAGCTGCTAGAAGCAGCACATGCATGACTCTTGTAAATTCTCTTGACACCAAGATATC +ATCAACAACAGCCACGGCTGGAACCGCATCTTCTTGTTCTTCAAGTTGGATGAAAAGCCCGTTGTGGTATGCAGAATCTT +CTGTTAATCCTGGAGCTAAACCTCAAGTTTGTGGGACTGAGCAATCGGCAACTTTTACTTTGCCGACAAGCTTCGGAATT +TACAAATGCAACAAGCATGTAGTGCAGCTTTGTTACTTTGTGTACGAAAACAAAGCAAAATTTAACACTTTTGGCTGTGG +AGATTATTACCAAAATTACTATGATGGGAATGGAAACCTGATAGGGGGAATGGATAACAGAGTGGCAGCATACAGAGGAA +TAGCAAACGCTGGAGTTAAAATTGAATGTCCTTCCAAAATCTTGAACCCTGGGACTTACAGCATTAAATCAACACCAAGA +TTCCTTCTAGTACCAAAAAGGTCATACTGCTTCGACACTGATGGAGGGTACCCTATACAAGTAGTTCAATCTGAGTGGTC +AGCTTCACGAAGATCAGATAATGCCACAGAAGAAGCATGCCTACAAACAGAAGGATGTATTTTCATCAAAAAGACAACCC +CTTATGTAGGAGAAGCAGATGACAACCATGGAGACATTGAGATGAGGCAACTCTTGAGTGGGCTTGGCAACAACGACACA +GTGTGCGTTTCCCAAAGTGGATACACAAAAGGAGAGACCCCTTTTGTAAAGGATTATTTGAGTCCTCCCAAGTATGGCAG +ATGTCAGTTGAAAACTGACAGTGGAAGAATCCCAACTCTACCTTCTGGGTTGATAATACCGCAAGCAGGGACTGACTCTT +TAATGAGAACTTTGACGCCAGCAACAAGGATCTTCGGAATAGATGACTTAATCTTCGGGCTTTTATTCGTGGGGTTTGTC +GCAGGAGGGGTCGCAGGAGGTTACTTCTGGGGAAGATCAAATGGAGGGGGTGGTGGTGCCTCGGTGAGCAGTACGCAGGC +TGGATTTGACAAAATCGGAAAAGATATACAGCAGCTTCGGAATGACACAAATGCAGCAATTGAAGGCTTCAACGGGAGAA +TTGCCCATGATGAGCAAGCCATTAAGAATTTGGCAAAAGAAATCGAAGATGCAAGGGCAGAGGCTTTGGTAGGGGAACTT +GGTATAATAAGATCCCTCATAGTTGCCAACATAAGCATGAATCTAAAAGAATCTTTATATGAACTAGCAAACCAAATAAC +AAAAAGAGGAGGAGGAATTGCACAAGAAGCAGGCCCAGGGTGTTGGTATGTTGACTCCGAAAACTGTGATGCAAGCTGCA +AAGAGTACATTTTCAACTTCAATGGAAGTGCCACTGTCCCCACATTGAGGCCAGTTGACACCAAGGTTGTAATAACATCG +GATCCTTATTACTTGGGTTCGACCATAGCTCTCTGTCTTTTGGGGCTGGTGGCGATTGCTGCTTCTGTTGGTGTGATTTG +GATCTGTTGCAAGAAATAGAATCTTAGAAAAAATCTCCTTGCTACTGCT +>NC_036617.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 5 nucleoprotein (NP) gene, complete cds +GGCATAAGCAGGAGATTATTAAGCAATATGGACTCAACAAAAGCCCAAACGCCTGAAGAGCAGAGAGCAAAGAATGCCAA +AACCATCCTTGAGAACATACAGATATATGAAAGGATGTGTGATCTCTTTGGGGTGTCAGAAGATGACAAACTGATAATTG +AGAACAGTATTTCAATTGAGAGGATGATAAGAGTTGTAACAGATAAGAAATACCAAGACAAAAAACTAAAGAATGCTGGA +AGTGATCCTGAAAAGATTGCAAATGCAGGGAAAGTTTTCTGTCGATTGGTGGAGTCAACAGCTGGGAAATGTAGTGCAAG +ATTGGGAATGGCACTGAAACCCAACGTTGAGGCAGTCCTGACCGATGTACTCGGGAATGAACTGGATAGGGCTGCTGTGC +TTGGGAAAAGAATGGGGTTTTCAGCAATGTTCAAATCAAACCTGGAAGAGGTTTTGTACCAAAGAGGAAAGAATCAGCTT +AAAAAGAGGAATGCTGCAGAAACTTTCACTCTTTCACAAGGTGCTTCGCTAGAGGCAAGATTTAGGCCCATAATGGAAAA +ACACCTAGGTGTTGGGACTGTTGTGGCGTCAATAAAGAATATCCTGGCAAGCAAAAAGAACGGGAACTACAGGAACAAGA +TGGTGAGGAAACCTGGAGGAAACAGAGAGAGCTGGTCACCATTGGAGAGAGAGATATCCTTTCTGAACAAGAAGTTGTTT +CCTGGACCAATGAGGCAGCTCTGCAAGAAATTCGAATACTTGAACGAGCAAGAGAAGCAACTGGCCTTAAACCTTATGCT +GGATGCAAGTCTCATCCTAAAACCGCAAGTGACTCACAAAATGATAATGCCTTGGTCAATGTGGCTGGCTGTGAAGAAGT +ATGCAGAAATGAACAAGGGATCACCCAGTCTTGAAGACCTCGCAGCCTATTCTGGAGTAAGAGCCTTTATGGCCTTCAAT +ACAGCTTGCTACATGAGTAAATTCACCATTGGGAAGGGAATTGTGGGAGATGCAGAGATCATGGAAAATGGAAACGACAA +GATGCAAACTCTTGCAATGGCTTGTTTTGGACTGGCGTATGAAGACACCGGGATTGTTGCTGCAATGATCTCCCAACCCA +TGAAGAAAAGATATCAGTTGAGAGTGGGGAACTTCAATCCTCCAGAAAAAGGAACAATAAAAGGAACAAGCGCCGGCTAT +TTCCACAAGTGGGCTGAATTTGGAAATAGGCTGCCTTTCAACAGTTTTGGAACTGGTGAATCCAAACAGATAAGCAACTC +AGGAGTGTTTGCAGTGCAGAGGCCCAGCACTACTAACATTCAAAGACTGGCAGAGCTAATGGCTAGGAATACCGGAGAAA +CCAGCGACAACTTTACTCAGTTGGTTCAGAAAATAAGAGAACAAGTGGGGGCCTTTGCTGATCAAAAAGCAAATCTTCGA +GAGTTCACCGGAGGATATATTTATGACATTACTGACGTAACGAAGAGCAACCCCAAGATACCTCAGTTGGGTGGGGACTC +TTTCTTCTTTGAGTTCACCGGAAGCGACGTTCCAAGAACTGGAGCCAAAAGAAGAGTGGGAGGAGCTGATGATGTGACCC +CTGGAACTTCCCAGCCCAAGAAAAGAGGAAGGCAAGGTGCCGGAGCAGAATCAAGTATGGACATTGAAACAGTTGGTGAA +GATTAACTCATCTTTGGATGGTTCTGTTGCAGTCCCCAGTGGGTGTTAAAGATGTTGGTTTGTCTTATTTAACAAAAAAT +CTCCTTGCTACTGCT +>NC_036620.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 6 P42 (P42) gene, complete cds +GGCATAAGCAGAGGATATTTTTGACGCAATGGCACAAGAACAACTACTTGCTGAACTTGAGGGATACCTCAGAGGAGTTA +ACCCAATGACCAGGCAAACGATTATGAAGTCTGCAAGAGGTGGGATGGATAGTGCTAAGGAGGCAGCAAAAGCAGCGAAG +AAGGGAGAAATGCAACTAACAAGTGGAGAGAGCATAGTGGTGCACATATGCCTGAGAGCCATGTACCCTGGAATAAAGCC +ATGGTCAGAAGCCAAAAAAGATCTTGATAAAGCTACAGAAGGACTGAGTGGAAAAGACTGCAAAAATATAAGAAAAGCTC +TGAGGAAGGCAGGAGACCTGACAGGGATAAAGGAGATGATGATGATGTATGAAATGAGGGAGGACAAAAAAGCAGAAATG +GTAGAGCAAATCTACGATGACCCAGAGGATTTTACAGAAGATGTAAGGCTTGGGACCGTTGCTGCCTGGCTTCAATGCAA +AAACAAAAGGAGCGAGAAATATCATCACAAGATGTCAATGTCTGGAAGCACTGCACTTGCCTTGGGAGATGCCCAAAAGG +CCGGAATGGCCATAGAAAATATGGCTAGTGTTGTGCCAATGAAAAAAGAGGCCCAGGCACTGCACAAAGACGCAGAAGTT +TTGATTGAACTGGCAAGAATAGCATATGGGTCAAGAGCAATGGAAGGGCACCTGCAAAATGCAATGGACGGAATTGGAAG +CAAAGTCAGTGGAATGGCTAATCTTGCCCTAAAAAGGTCAGTTCTTACTTTGTTAATGTTGGTAATTTGTGGGATCCCCA +CTTGTGTAAATGCTGAAACTGTGGAAGAATTTTGTAGAAAGAAACTAAATCAGACGGAAGAAAAGGTTTATGTCCATTGT +TTCAATGAGGATGATGGTCGGGCAATGACTTTAGCTGCTTTGATACTTGGATGCTTTAGTATGCTTTACATTTTAATAAA +GGCAATACTGATGCTTTTGTTGACAATCATAAATGGAAGACCAAATGGAAGTTGGGATGACTTGAAACATGTTGTAAAAT +GTTTTTCAGAGACTGGAAGTGAGAACTTCGCCAGGGATATAATGGTCCTGGAATCCAGGCGAGATGGGGAGGAGACAAGC +TCCCCAGAGGAGGGACTAGGCCCTCCATTGAGTGGATTCAATGAAAATGGTGTATTCATGGAAACATTATAATCGCGAAA +AAATCCTCTTGCTACTGCT +>NC_036621.1 Influenza D virus (D/swine/Oklahoma/1334/2011) segment 7 nonstructural protein 2 (NS2) and nonstructural protein 1 (NS1) genes, complete cds +AGCATAAGCAGGGGTGTACAATTTCAATATGTCTGAAAATAAGTCAGTGAACACAACAAATATCAGAGCAGCAATCTCCG +AATTGGCATTGGGCGCAGCCAGCTGGATGGATTCCTCTGGGTTAATGACTTTCGAGAAAATGAGAAAGTCTGCTGAGAAT +TCACTGAGAGTCGAACAGGTTTATGAACCGAGAACTTGGGAAGATGCAGTGGCTGAAGGTAGAGAAATTCTAGGATTCAC +TACTATTGCTGCCTTAAGAAAACCAGAGGAGACTCATGCTGTTGAATTGGGGAAGAACATTATCTATCCCTTAGGAGGAA +ACCCTTTCTATCTAAGCCCATGTACCATTGACACTCTGTATGAGCCAAAGCTCATAAGACAAGGAGAAGTCTTTGGAGTA +AAATATCGGAACTGCAATTGCTTTGTAAAAACTGCTGAACTATTAGTGACCGACATGGGAGAAATCATTGTGCTCTTTTG +CAGAAACACTGAGAAACCAGCTTACTGCCTTAAGAATTTCCGTAGAGGAGATGACCCAGAGAAGTCAGTACGAAAGATAC +TCAGAATTTGGAGAAGTGGACTTGTTGTTGCCGTTGATGCGGAATCTAGAGATGAAATCAGACGATACAAATCTGGATGT +GAAACAGATCCCTTCTGGAGAAGAGAAGGCGCAACTACTGGAGAGGTTCAGGAGTTGCTTGGTGTCATTGATAAGGTTGA +AATCCAAGCTGGGAGTAGCGATGGTGAACTCTTTGACTAACCAGGATATGAGGGCCGCTTTGGATGAAATCAAGTCAGTT +TCGAGAACAATTTCAATGTTAAAAGAATGTATTCGTTCTTTAGTATGAAAAAACCCCTTGCTACTGCT +>NC_060925.1 Homo sapiens isolate CHM13 chromosome 1, alternate assembly T2T-CHM13v2.0 +CGTGGTCTGGGATGTGGCCCCGGTGAGGACCCGGCCCCATCAGGCACAGGGTGGATGTCT +GTGGAGTGAGGTGTGTGTGACATATTCATGTGACCACCCGTGCAGCGTCACGCGCCTGGC +CCTGCCGATGACAAGGGTGTGGGCCTGCGTGGGCATGACTGTGTGTGTGACACAGAGTGA +TGTTGCTGTGACCCGTGGCTGCACTCCCCACATCACCGGCTTTCACAGCCTTCCGGTAAA +GTGCTGTGTTCTCCCTTCTGTGTCTTCGCTGGGACCTGGGGCAAGGGTGGGTGTGGCCCC +CACAGCTGGAGTCAGCTTCTGTGGGGCCTTCCCGAGCCCTCCCCACCCTGGACCAGAGGC +CCAGCTGGTTGGAGCAGGAAGTACCTGGGCTCTGGGGTCAGGGATGGGAAGGCTGAGGAG +GCCTGCGTGAGCTGGACCTGGCCTGGGCCCTCCTGGCCGTGCCTGCCTGGTGGTGCAGGA +TTCCTGGGGCTGATGACAGACGGGGTAGGGCTGGGGTTGGCGAGCCTCCTGCCGATACCT +CACGTAGCTGACCTCTGACTCTTCCCCAGCCAGGCTGGCCCTGGGAGTTGCCGGAGAGTC +AGTGGATCTGCAGGCTGCACGCTGGCTGTTACCTTTGCTTCTGGGTTCCCACAGGGGTCA +TGGTTCTGTGGTTCTCCAGTCAGGGACCCTAGCAGGGCCATGGGGCGTGACTTCCTGGAG +GTGTGGCCTAGTATGGCCACGGCAGAGGATGGGGGAAGAGAAAGGCCCCCTTTGTCAGCC +CCCGGGCTCTGAACCAAGCTGAAGCCCTCCCCCTGGTCCAGCCTGCCCTGCCCCAAGTGT +CCTGGgcctctccccatctccctgggGAGCCTCACATTGCTGAGTCgccagccaactcca +gaaacccccagCCTGTCTGCAGCCAGAGGGGCTGGGAATTGGACCCCCTAGAACCTTGGG +CCCACCTGTCCCAGTGGCTGCTGGGAGTCTAATTCTGTCAGGGTATCCTctgggttgagg +ctgcagcagggGCACCCAGGGTGAGGCCCTCTTGCCAAAGATGgatacaaataatttatt +ttaaaaggtacaatTCACAAGGTTGGAGGGGTAGCTGGAAGTTTCTGTGGTTACCTTGCA +CTGGGGGGCTGCCCTGCCTCCACTCTCTCCCCACAGTCCGAGGGCAAGATGAGCACCCCC +ACCCAATGGCAGGACCAGCCCTGCGGGGAAATGTCAGCATGAGTGGAAGCACGGCAAGGC +CCCTTCCTTCTTGGCAAGGGGCTTCCCTGGCAGGCAGTTCAcagggtgtgtgggtggggg +ggaTGCTGACCAGCTGCTCTCCTGGACCCTTCCTGTACgagcctgtttttttttgttttg +ttttgagacagggtctccctctgtcgcccaggctggatgcagtggtgcaatcttggctca +ctgccacctccacctccccggttcaagcagttctcctgcctcagcctccccagtagctaa +gaggcacccaccacgatgcccggttaatttttgtatttttagtagagatggggtttcacc +atgttggccaggctggtgtcaaaatcccgacctcaagtggtctttctgcctcagccctcc +agagtgctgagatgacaggcgtgagccaccgcgcccggtgagACTGTGGTTCTTGGAGGC +TTTGGGGATCCTCTTGTCCACCCCATCAGGACCCAGCCTGGAGAATGAGGGGTGGACAAG +CTAAATGGAGCCTGGTCTTGGTGGGGCCCCGGTGGAGTCCTCAGAGATGCCAGGCTCCTT +TCGCGTCCTCGGGGACCGACTTCCAGTGGCTGCTGTGCCCTTGGGCCCCCCAGTGGGGGA +CGCCCCATGGAGCTGGGCGAGGGCGGCTGACCTGGGCAGAGGCTGCTGGCCCTAATTGTC +AGTCAGAGGCCCGAGGGGGGAGGCGGCTGTGCTGGTGGCCGGGGGCCgggggggcagggg +caggcagcGCAGGTTCCCGGTCTTGAGCGCGCACTGCACCGGCCAGAGTGCCACACAGAA +GAGCATCAGCAGCAGGGCAGAGACCAGTGCCATGCGCCTCCAGTCCCTGCAGCGCGCCCA +GCAGCGGGCCAGGCGGCCCCGGCGGGGGGCAGGGTCCCGGGCGGGCACGGGCGGCTCGGC +AGGCTTGCTCAAACCCACGTCCACGCATACGAAACCGGGCtcgcggccaggtgtggtggg +cagTGGCTGGCAGCACAGCTTGGTGCCCTCCAGCCACACAGGCTCCTCACGCCGCAAATG +CGCCGGCATCCGGGCCTGCAGCTGGCGGCTGGTGCACAGCGCGGGGGCTCCGGCGGGCGG +CACGGCCGTGGGCTGCCTGCAGAAGGGGCAAGGTACAGCCTCACCACCGGGGCGGCCCAC +AGGCTGAGCAGCCGCCAGCCGGGCCAGGCACTCCAGGCAGAAGACGTGGGTGCAGGAGAG +CTCCTTGGGTGTCTTGAAGATGTTGTCATAGCCTGAGAAACAGATGGAGCACTCCAGGGG +GGAGGCCACCCTCTCCGAGCCAGGGGTGCCAGGGGACCTGGGGCTGCCGGCCGAGCTGGG +GGACCTGGGCATCGAGGCTATGGAGCTGCTCCGGCGAGGGGGTGGCACAGCCGTGTGCCA +CACCTGCTGGCCTGACGACATGTCTCTGAGCTGTGGGACAGGGACTGTGGTAAGCAATCA +CCGGCCGCCCCTTTCTGGTGGTGTTttatctctccctcccctctctcgcCCCAGAGATCC +CAGGGAAGGACTCTGTTTCCTGCGCGCCACTCCAGAAAGTTCCTCCGGTGCCCCTGGAGG +TCATTCTGCCCCACGTGCAATCCTGTCCTCTCCACCCCATCACATGGCTGCACCGGGGTG +AGCCTCCCACAGGGCCCCAGGCCTGCTCCGGGAATGCAGGCCGTGTGTAGGGGGGTCTCA +CTGACCGCTCGGCAGACACCTCCTGTTGGCCCTGCCCCACCTGGCTGGCCCTGCTGCCCG +GGCAGAAATAATGGTGAGGATGACAATAGCCACAGTCGTCACTGTTTATGTCGGAGCTCT +GCAAGGCTGGGCCCACATCACGGGACTCACACAACGCCACAGTGTGGAAAAGGCCGCCCA +GAGCATGGGTGACTCGGCCAGGGCCACCCCAAGGGAGCTGGCGGGCCCTGGACCCTGGCA +GATACGGCTCTCAGGCAGGCCAGGGACTCCAAGTCAAGTGAAGTGAGTTTGAACTCAGAT +CCCAGGATGGGTGCCTGGCTTGGGCGGTGCAGGCCTGATTTGTAGGCAGCTATGtgaggg +tggggtgtgggggtCTCTGGGTCTGGGGACCGGGCTGAGCCCCGGGGGCTTTGGGACGAC +AGGGAGGgcccaggcaggggcaggggtcagtGCCCGAGGAAGGTGCACGTCAGGCACGAC +CTGCGGCCTGCGGGGCCGGCTTGTCTAGCTGCTGAGGGTCTGATGTGCACAGTGTGGGGG +TGGGACTTGGATAAGCCCAGCCATTCCCTCTGGGCCAGCCCACTGCCTCATGGTCAGGTG +ATGGTCAGGGCACCCTCAGCCGCCCACTGAGTGGGTGTTTCTTCTCCCTGACCCAATCCC +ACTTCATGGCAGGGACCCTGGGGGACGGACACTGGGGGATGCTGCTCTGCCCCTGGGCat +ggctcaggtgggcatctcAGCTGACCTGGGACCCTGCTCCACCTCCCGCCCCTCCCCTGC +ACCCAGGATCCGCTGCAGGGAGCCACAGGGGTCCCACCTGGAGGGAAGTGGGCaagggtg +acagtgagactcaaGGGCCTGGCCGTGCGTCCCCGTGGGGCCCAGGAGGCTGCCCCAGAA +GTGACTCCTGGCActgccccgccccacccctgACTTGCCAGTGAGTCCCAGACAGGCTGG +CGGGATGACACAGGTCACTGTGACCACCTGAGTCACACGCCGTCACTGCGAGGCCGTGAG +TGCCCCAGGCACCGGGACCTGGGGACTGTGCTCTGCGGCCTGTGTACCCCACAGAACCGG +TTCCTTGGCACGAGGCCCCACCCCTCCACGATGGTGCCCCACCCTGAGCCTGTGCAGGTA +AGGGGTGAACACGGGCTGAGCTGGCCTTACCTGGTGGCCGGGGGTCAGCGGGCCTGGGCG +TGGTCCTCCTCGCCGGCCACGGTTGGGCTCCAAGGCCCTGGGCTGCCCTGCCCTGGCAGT +GTCTGCTTCCTCTTCTCCGGGCCCGGCCCGGCCTGTGCTTCACCCAGCAGGTATCCCTCC +CCGGGGCCGGCCACCAGCAGCTGTCCCGGTGGCACTGGTCTGGCAGGTGTGGCTTCTGCT +CTGTCCAAGACAGGCGGGGACACAAGGAATGCGTGCGCCGTCACCCGCACAGAGCTCTGG +TCTGAGGCAGGTGTGAGTTGCTGGGTGTGGGCTCCCAAGCAGGTCTATTTATACCCTATG +GGCCAAGGGTGTGGCCGCAAGCCTCAGGGATTGGCTGGCTTCATCCTCTCCTTGGCGGGC +CAGGCagctggagggcagggagggaggggtgagggTCGGAGCCGGGTAGGGGTCAGCACA +GCCGCTGCAGCCTGGGCAGGTCTGGGCTGGGGTGTGTGCTTGGACAAAGCCCTCTCTCCC +TATAGCCCCAGGAGGCTGGAGCACCTGCTGGAAGCTGCTCACCGCAGTTCCAGGTCCCTG +TGGCCCCTGAGCTCCTGGGTGGGCCTCCTAGCAGGGGCCCTCCCCGAGCCCCCCACAACC +TATGCCCAGCCTGCCCCTGCCCTTTGCTCACTGCTGCCTGCCCTCACAGCCCATTCCTGC +CACTTCCCTGCCCACACCCACCCATGTGCTCACCTGCCTCATCCATACACATACGTGGCT +GCTCTCACACATGGGCCATGTGTTCACACGCTCTATGCCCCCGTGTCCACAGGCTCTCAC +ACACGTGCCGTGTCCGGAAGCTCACATATGCCATGTCCACACTCACACACGCCGTGTCCA +CACTCACACGCCGTGtccacactctcacacacatgcCATGTCCACATGCTCTCACACACG +TGCCctgtgtccacacacacacacatgccatgTCCACATGCCCTAGCAGACTACAGGACT +GGTCTGTGCAAAGACCAGGGCTGGAGCTGGTTGAGAgtctgggggctgaggctggcaggg +ctgggatggAGGATGTGTGGGTCTCAGAGGAGCAGCCAGTGGCATGGGCTGCCCCGTCCC +CCGCACACCCCGCTGTGGGCCCGAGGGCCTGGTGTAGAGCTGCACCCCCAGGCTGTCCAG +CTGCCAGCTCCCCACCTCACTGAGGCGTCTCTCTCCCAGCCCAGTGGACCTCATGCAAGG +GGAGGTCCGACCCGGCTGCCACAGCCCCATCCCCGCCATGAGGCCTGGGCCGGACCTGAG +CTGGGACTccacacaccagcctgggggGGTGTCACactgggtggggctgggagtgAGGGA +CCCACCCTAGTGGGAGAGCTGGCCGGGCCACCCCACAGACTGCCCTCAGGCAACTCCCAT +GCAGGTGCCCGCCGACCCCTCAGTAGGGACCCAGAGGCTCCCCCAGGGCTGCCGCGGGCA +TCCTGGAGCCCAAGGGATGCTGGGAAGTGGGAACCAGGACTGCAGAGGCCAGGGGGCAAC +ACCCCGAGGAGGAGCACAGGGACTTGGGCTCAGGAAGGGCCGGACCCCTGCCAGTTCCAT +GAGGACTCTCAGTCGGGGGTTGGGGGGACCCCTGCCAGTTCCATGAGGACTCTcagtcag +gggttggggggaccCCTGCCAGTTCCATGAGGACTCTCAGTCGGGGTTGGGGGGGTTCAG +AGAGCGGATTTGGGTGCTCAGACAGGGAGGGGTGGATGCTCAGAGAGCGGGGCgcgggct +ggggctgggctttCAGACAGGGAGGGCTGGGGACTCAagagctggggaggggtgggagct +CTGTGAGGGGCTCCGTGCGGGGTGGCTGAGGCTATGGGAACTCtgtggggggaggctgag +gctatggggactccgtggggggaggctgaggctatggggactccgtgccgggaggctgag +gctatggggactccgtggcgggaggctgaggctatggggactccgtggggggaggctgag +gttatGGGGACTCcgtgctgggaggctgaggctatggggACTCCATCGGGGGAGGCTGAG +TCTATGGGGACTCcgtggggggaggctgaggctatggggactccgtgccgggaggctgag +gctatggggACTCCGTGGGGCAGGCTGAGGCTACGGTGACTCCGTGCAGGGCTGTGAGGC +TACGGGGACTCCGTGGGGGGTGGCTGAGGCTACGGGGACTCCGTGGGGGGTGGCTGAGGC +TACGGGGACTCcgtggggggaggctgaggctacggggactccgtggggggaggctgaggc +tacggggactccgtggggggaggctgaggctacggggactccgtggggggaggctgaggc +tacggggactccgtggggggaggctgaggctacggggactccgtggggggaggctgaggc +tacggggactccgtggggggaggctgaggctacggggactccgtggggggaggctgaggc +tacggggactccgtggggggaggctgaggctacggggactccgtggggggaggctgaggc +tacggGGACTCCGTGCCGGGAGGCTGAGTCTACGGGGACTCCGTGCGGGGAGGCTGAGTC +TATGGGGACTCCGTGAGGGGTGGCTGAGTCTATGGGGACTCCGtgcggggaggctgaggc +tatggggACTCCGTGCGGGGTGGCTGAGGCTATGGGGACTCCGTGCCGGGAGGCTGAGTC +TATGGGGACTCCGTGCCGGGAGGCTGAGTCTATGGGGACTCCatggggggaggctgaggc +tatggggactccgtgccgggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtcgggggaggctgaggc +tatggggactccgtcgggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtgccgggaggctgaggctatggggactccgtgccgggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggtggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggtggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtgccgggaggctgaggctatggggactccgtgccgggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggtggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggtggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggactccgtggggggaggctgaggctatggggactccgtggggggaggctgaggc +tatggggACTCTGTGCAGGGCCGCTGTGAGGCCCTGAAAGCGCTCGTCGGAGGCTCCTGC +TTCCTGAGGACCGTGACTCGGGTCACATGCCGCCTCCAGGAAGCACCCTGGCCCCTGCAG +CTCTGGGAACGTCCTCCCGACAGCTCCTGGGAATATCCTGGCACTGAGGTCACTCTGGGC +TCCCGGCTGACACTCGTGCCGGAGGCAAAGGTGAGGAAAGGCCGGAGGAATGTGTGGTCT +CGGCGCCAGGCCAGGCCTCCCTGTGCAGGAGAGGAGCCAGCAGCTCCCCTTCTCTCAGCT +CAGACGGTCTCTCAGGGCTCTCGGGAGGCTCGGAGCAGCTTGGCTGGCAGATTCCAGGGC +AGGGGGTGGGCCCGCCTGGTCCCCTCCGTCGCAGCCAGTGGGCGGGAGGCTGGGCTGGTG +AGCGTGTGGGCGTGTGTGAGCACACGTGCCCATGCTTGAGACGTGGATGCTGGTGTGAGC +ACCTGACCCCTCACCTCCTTCACTCGGTCTCCTCACGCCCTCTCAGGGACTCCTTCCCCT +CCAGGCCTCGGTTACGGGTCACACCTGGCACTGCCAGGCCTGGGGACGTGGTGCGGCCGG +TGCGGGGAGGGGCCTTCCAGGCTGCTGTGGGGCCCCCGGCCtcgccccaccccgccccgc +cccgtgCTGGGCCATTGCCTCAAATGCAGCGGCTCTGTTGGCCGTGGGACTGGAATTCTT +TCCCAAGGGCCCAGATGTGCAGAGGGGAGGCCGGTGTGGGGGAGCAGGGCTCCGGGACGT +GCACTTGGGTCTAGCTTTGCCCCTGACGTGCTGGGGCCGCCCCTAGGCCCAGCTCAGTGT +GTCCCTCCTGTGCCCAGTGAGGAGGGCGTGCCCCTCGCTGCCACAGGTCCTGGCTGACCA +CGTGCTGCCCAAGGGCCAATCGCGAGTGCGCAGGTGGGGGACGTGGGGAGCCAGCTGAGG +GGGATATGTGGAGGTGTCAGGATGACCCTGGGTTTTTGGTTTGGGCCACTgggtgggagg +agaaggaggggaccCAGAATTGAGAGATGGGGCCTGGGGGGCTGCTCAGAGGGTGGGCTG +GGAGGTGCCTGTCTGTGTCTGGCCTGGCCTCCAGACCCTGCCTGGCTGGACCTGCTGTTC +GTGCCTGTTTCCGATTTTATCCTCCAAACCAGACGCCCAGCCTGGTGCAAATGCAGGAGT +GGAGTTTCCAGGGGGATGTGGactccttccctccacccccacctcggtccctgtctcctt +ccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccctgtct +ccttccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccct +gtctccttccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgt +ccctgtctccttccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCT +CGgtccctgtctccttccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCC +ACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccctgtctccttccctccgC +CCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccctgtctccttccct +ccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccctgtctcctt +ccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCATCTCTgtccctgtct +ccttccctccgCCCCCACCTCGgtccctgtctccttccctccgCCCCCACCTCGgtccct +gtctccttccctctgcTCCCATCTCGGTCCCTGTCTCCTTCCCCACAGGAGGAGTCTGGG +GGCTCCCGCGTCACAGGGGCGTGGCCCAGGGCATCAGGTGGGGCGGTGGGTACTGGGCTC +AGAGTGGCCTTGGGCTGTCCagtccctccctttctccccaggACCAGTGACCCTCCCAGC +CCCAGGACACTTCTTGGGCCAGGGCCCAGGGCAGAGCCAATGCTCCCCCAGATACTCCCT +GGCTGCAAACCTCAGGCTGGGGGTTTTTGGGGACAGGGATGCAGGTGTCTAAGGACACGA +CCCTCCAGGCAGTGGACGTTTCTGCCTGGGTGGAGGGCACGGTTACGAGAGCAGGGCCCG +CGCTCTGGCATCCTGGTGCCCGGGCCCTCTGCCCTCAAGGC +>NC_060926.1 Homo sapiens isolate CHM13 chromosome 2, alternate assembly T2T-CHM13v2.0 +GAATTCCCACAGTATTCCCGGGGATAGAGTTGAAGTCTTATGTGTAGAAGGAACTCATTT +GATTATTAATCATATTCCCAGAGTcatggaaaaaaattatgtttccagGTTTCAACGTCT +GCTGAACATACCTCCCCCAGTGCACTGGTGACTGAATTTCTGGGGTAATTCGGagccctc +ctccctgccctcagAGGCTGGTGAAGACAGCGCTTTCTAACTGGACATTCACTGTCACAG +CAGCATTTCAACACCACGTCCCTTCTCCACAGACGGACATAGAGGTTTGGGAATAAAATA +GAGGTCTGCAGCATAGTGCCTGGCGGGAGACCAGGTGCTGAGATGCCAGATCCTCTCTGC +CACCTGTGATTACAGCATCTAGGATTCAGCATGGTCCCGCGTTGTCCACGTCCACCTGGG +GTCTCCTGGTGTGCACACTGCCTGCAGGCTCCCAGGCTTGGGGTCTATACTGCACCTGCC +TCAGAGGCATCTCAGGGCCACCCATGGATGTTTGATAAACAGGCCTTGGAATCATAAAag +tgtttgtgtttctgttcATCTGTGTATCTGCATGTGTGTGAttaggtatgtgtgtgtatc +tgtgtgtccctgtgtgtcaCTGTTtcagtatgtgtgcatgtgtatctgtgtattgtgtgt +gtgtgcatgtgcacatgtgtgtgtgcctgtgtattgtgtgtgtgtgcgtgtgctgATCAT +CATGTTTATGGAGGAATTGGGCACGGTCCCTTTGAGAACTGGGAATCTGGTCAAGATGAC +GTCTCaggttttcttctattaattctgATTCAGTCTTCTGAGatttacagagaagcaaag +taCAATAGGTATGGGTGATCATAACAATCTGGTTATTCAGGCATGTGCAAAGTGTTCACC +AGTGTTCTCATTTGCAAAAACACAGAACttactatttttctttgctttggagatatatat +atacaaaatgccATAAGGAAATTCATGTACCAAAAGCTAAAATAGTCTAAATAGCCAATT +AGTTTTTAAATACATTCATTGGTCAggcttcttgtttttcttcttctttaaaatattcag +tttacTATTCAACAGGAAATGAGTtgggaaaaataacaaaagttaaaACCAGCTGTTTGG +ATGTCTATGCTAATGTCCAGTTCAAGAAAGGGAAAATCGGCTAAGGAacaagttttgttt +gttgttgttttgatgaTGTCTTCTAATGATTAAACTTACAGTAGGAGGCCTTCATGGTag +gaattgttttatttatatttttttcaaaaaatgtcttTCCTGTGTTATTTACAATAGCAC +ATGTTTTTCTGGAATAGATCTCTGGGGAGGCGAAGTTGATGGTATTTCAGCACAAAATGG +CAAAAGTTTGGGGCGGTGGGCAGGAGGCCCTTGCCACTGTGGCGCCAGGAGACTGGGTAA +GGCGCCCACCACAGGGCTGGGGATCTCAGGGGCGTCTGAAGAGGAAGAGCTGGCTCGGGG +CGCTCGGGGTAGCACAGCCACACATCCAACCACGGCGCGAGAATCAAGGTGCCAGAATCA +CAGGACGCGGGAATCACGGGACGCAGGAATCACGGGACGCGGGAATCACGGGACGCGGGA +ATCACGGGACGCGGGAATCACGGGACGCGGGAATCACGGGACGCGGGAATCACAGGGTGC +CGGAATCAAGGGACGCCAGAATCACGGGGCGCGGGAATCAAGCTTCTCCATAAATGACTG +ACGCAGGGGAGACATGCCAGAATTCTCTGAGTGGTGTATTTAATACAATGACAAATAATT +CGTATGTGGTCTTTTCAGTAAATGTTGTCCAGTGACTACTCTCCCTCAACAATTTAGCTC +ATACACGGGTTGGGCTCAACACACGCAAACAGCTTTTCACCGAGCTTTGACGGAAATGAG +GCTGCGCTGAGGCGGCGCTGCGGCTGTGGAGATGCCCAATTCGTGGCGCCAGCGGGGGAG +GCGGCGCCAGCGGCTGCGCCACGTTTTTTCAGGAATTTGTCCTTCTTCAGAAAAGGAGAA +CACTGCTTCCTGCTAAGCATTTGGATTAGGAGACGCTGGCAAGATTACAGACATGTTGCG +ACCCCCATGCTGAACCTAGAACCTCATACTGGTTTTCAGTCAACATTGGTGAAGGACACA +GTCCACTGCCTGCGGAGGCCCCGAGGAACACGCGTGTAAAAGCTGCGCCCAGACCCGCAG +ATCCCACAGCAGCAGCCTTTGGTCTCGCGCCAAGACCTGCCCCACCAGATCCCACCCGCC +CCACCGGCCTGCCCCACCAGATCAAACCAGAGCAGCAGCCTTCCGTCCAGCGCCGAGACC +TGACCCATCAGATCCCCGCCTTTGCTGGGGTACTGCGGTGGCCACAACTCGCATGGAGCG +CCGCCtgggaaagggaggagaggaCGCATGAGATCAGAAACACTGGCTGCCGTAAACACT +TACAATGAAAATAACGTAACAAATAAGCGAAAggtaaaatgtgaaagaaatCCAACAGGT +CTGCAAAAATGGCTGCCTGGCATCACTGAATCCTAAAATCTTCTTGGTGTGGAAGACTCT +GTTATGATTTCACAATATGGCAGCACCAGGTCCCTGGGCGCACACCCAGCCCGATAAACA +CACCAGCATTTGCCACCACGAGTGACCTAACTCAGCGTGGGCCCAGGATAAGGCCAGTTC +TAAATTATCACAATGCTTTTACAATTCTCTAAAACGTGTCTCTATAATTCATATGCCTTA +GTCTTGCctgttcttttatatatattacagGTTTTTTCCTACCATCCTGCACTCACTCCA +GAACACAAATTGATTAATTGGAAGAGTGATAGGTGGTAGAACTGCCTGGCACATTCCCtg +ttcccttctctcctttccttccttctctcccttcctccttccctccttccctcccttcct +cccctcctcccttcttcccttcctcctttccccgcttccttctctccctcccttcctttc +ttcctcccttaattcctttgttcctttcttcctccctttctgccTTCCCTTATTTCTTTC +ATTGTTATCCGAACATATTTAATTGGATTTTCATAGAATTCAATGAAACATAATTGTACT +ATAAGAGTTTTGCTGAAATGGTCAAGCCCTATCCAGCCCTATCTAGGACAATCTGTGGTG +ATTAAGCCATGAAGTGAATTAATTCTTGCATTCATTGATCTATTTAACAAGCATTTGATC +CTATTACTTGCTTGCCATTGTGCTGGGTGCTAGATGTGAGGCCGGGAGCCCCCGACAGAT +GGAACCTATCCGGAGGAGGCTGTGCTGACCGGCTCTTCTGCGAGCCTCTGGGATTGTCAC +CAGGGATGGGTTTATCCCTTTCTTCTTGGCTGTAAATCTTCAGTTAAATTTTCACCTCAG +AACTTTCAGTGTCTCTCTTTTTCAATTCCTTCCACATTCATATGCCTCTTACGACTTTCT +tagaagtattcttttttttcttcacaaatgCTATGTTTTCATCCTTTATTCCCAAAGAGA +CTGTcctgtgtagaaaaaaaaattcaccctgCCTTTAGGGACAAAAGAACTAGGTTTGGG +TGACGCCTCCTTGTCACTGGGCACTCCTGGGAGTCGCAACTTCCGAGCCAACTTCTTCTA +TTAAATATCTGTGGAAGCCTCTACTTCGTAGGATTCTTATAAGGAACCACTAAAATAATG +CTCAGAGCATTACTACAATCAAATTATAAGTTTTATCATTATTCTATTCATGTTAACCTG +GAACTTTAATCTTTACCTGTTTCATCTTTaaatcttttcaaattattttcagttcAAAAT +GTCACATTTTTCATGAAGTGACCTAAAAAAATCACCAAATGAAAATCATATCAACCTAAT +TGGAAGTGTCGTGGCACCTTGCCCCTCACTTTAGAGAGTCGATTCTTCTCCTGAGATAAT +CATGCTGGAGCCAGCCTGGATTCTGGTGTCAGGCGGCGGCCCTGAAACTTGCCAACGCCA +CTTCTCCTGGTGTAGCCTTCACAAAGGGTGCCCACCAATTGCACGGGCAGGTAAACGAAG +GCCTGGAGTTTGAAATACATGTTTCCTCCTGGCCCTCCCTTCACTGTAAGGGCTTTTGTA +TAGCCAATTTGAGAAAAATGACGTTTTTAGGTGTAGGCAGTTTGAGATCATTTTCAAGCT +TTAGCACAGCTTTATTTATGCACACTGCCTACTCCCTAATGTAGAATTATCACGTGGAAT +CCTTAGTGGAGTCCACCTCCCTAACGATGCTGTTTTCTATGGCATGCTAAAGATAATTAG +TTGTATCTTTTCCCACAATTTCTATACAAGAAGTCATATTTAAAACTCCAAATCAACTTG +AAATTAAATCTTTGTAATTCCTTATTGTGTAGAATGAAAGGTGCTCTGTGTActtgcaaa +aataattaaattaggaaaaaaaagaatttagaaacaGATTCATGTCCTCACGGCGGGTGG +CACTGTCAGCTGCTCCCAGGGCCAGCCCTGCCGGCATGCTCAGCTTTGACCTAAGTCTCA +GCTTCCTCCGAGGGGATGGAAAGACCCCAGGGTGCACAGCGTCTCCTCCTTCCCCTAGCC +TCTAGGTCAGAGCTTGACCCGTAACAGGTCTTTGTTAAACATTTGCAAAGTGAACGTTGC +CTCAATCCCTCGGAACAATAACCACACCAGCAGGTCAAATCACTGCCTGGAGTGGAGGAG +CTCATTTCAGAGAgaagttgtgttttgttttgttttgttttgttttgttttaatggcaAA +GAGATCAAAATGCCTTTTCTTGGTCATTAACTCATTTTGGTTGAGAGCATGAGAACCCAC +CTCAGCCCTGTGTATTCTGTCACCCTTTTgtggacatttttctttctttgttcttggcCT +GTTTTGTTGCTGTGTGCTGGTCTCAGTGTTCTGTTTCGATTCTCACAAGCTTCATGTGAT +ACTTCTTTAAAAATGGCAATGATAAATCAGTTGTTGAAACTCAGTTTTGCTCTAAGGAAT +GGCAAATTGTCCACATTCCGCATGCTGTATTTGTTGGGAAACTGGAAAATTTCCAGCGCA +ATTAGAATTAGGATATGCTTTAAAGGTCTTGACTCTCTCAAAAACCCTCCAATTTTCCGT +CCCCTTGGAATAGCTGAGACGACCTATGGCCAGTGTCCATATGACAATGCTGACCCCAGA +AAATTAGAAGAGCGGCTAGAAGGAATTCTCATGGGGCCCAGATGTAGAACCACATGGCTT +TCAGAATCAAAGCCTATAAGTACAGTCTTTGCTGGAGATCTGATGATGCATGTCAGCAAA +GACAGGCAGCCTGGGAGTGTTAAGAACTGAAAGCTAGGCTCTCACAAAGTGATGATGCCT +ATAGTTTAAGTTCAGAGTAAGCCAGCCCTCTAGCTTTCCTGGAAGCCCAAGGCAGTAGGG +AAAGCATATTTGgatacaccaaaaaaaaattgactattGAATGGTATGAAGTGTATTGCC +TTTATCCGTCATAACCTGTGGGGGCTGGCGATGTGGCAGAAGAAAGGATGCTTCCGGTGT +GGCCACTACAATCATGGAAGACATCAAAGAGGGACGGATGCAGCCTCCAGGGAGATGGCA +TGCTGAGGGAACCAGACAGGAGAGAGGTTCTCTGTTGGTCCAGCAGTCACATGTTCCTCT +GAGCTGAGAACATCTCTTTAATTCTTCTCCCAGATAGCATGGAATTCTACTCTAACTTCC +GTAATATGTTGGATAATTTTAATGGGTGTTCCATTTGAAGAGGGCTATCTACAATTCGTA +TGATATTGGTCAGTTAAACACCCACAGGTGAATTGACGATTTTCTTTTAGTCTAAGTCCT +GAAAacctttattctattattttattattacactaTCATCATTTCTTAGAGAACAATAAC +TAAGTATTTATTTTGtcaatttgatgtttttcttagATACTTTTGCTAGTTCATTGCAGC +AAAGAACACCAGTGGGCAATCTGATAACTATGCGGAATCTGGGCAAGGCCTAAGATGCAG +CTGACAGTAACTGAGGCCTGTGGCTTGGTTAGGGCCAGAAACAGAGAACAGAAGGAGAGG +GATTTGTTTTATTCCCATTGACCCAGGGCAGGGAGGGACATCCTCACCTAGACAAGGTTG +GAACTTTGTAGGTCTTCCCATGATTCCTGCCTGCTTTGCAAGCACAAAGCAAACATATCT +TTCCAAAGAAGATCTTTGGTTGTGGAATCCTGGAATCTCACCATTAGAAGGGACAGCATG +GACAACCTGTCTCACAATGCAATGGGGTAGGTCAGTGAAGTGGCTTAACTCTTCTGGCTC +AGAGTTTCTCAAATTAGGACCCTCAATCCACATGCTTACAGACCACCTGGGATCTTGTCA +AAATGCATGTCCTCTGCCCCCACTCCAGTTTCTTGGGCTGAAAATTTGACCACCTGCTTT +GTAAGCAGATTTCCAGGAAAGTCCTATGCACCCTGGAGTCAAGGAGGCCACGGAGCCAGG +CAAGCCATTCCACTGTGCATGGCTCTCAGAACGTCCTTTCTTGCTGTGAACTGAAGTCTG +TGGTCCTGTGAATTTCTGTCATTAGCTCTCTTTCTGCCCTTGAGTCTTCCCAGGACAAGT +CTTGCCTTGTGTTGGAATCTACTTGCTACAGAGATGCAGCCCTGTGCCGTTAGCAGTCAG +AGGGCATGCAGAGGAGCATAACTGAGAGGGCTCAATGTGGGGGATAGGCAGAGTTATGGG +GCCACTCAAGGAGGCCCCAAGGGGTGGCAAGACACCCCAGCATTACAGACAGTGGGAGCA +GTCACCACCCTCATCAGAAGGGATAGGAAGGGACGTGGGGCACAGTGGCAGCCTGGCGAG +AGCCAACCTAGGCAAGGCCTCAGATGCTGCACAATCTTTGGCATGACTGAAAGGGGAAGG +CAAAAACCCACTCCAGCCTCGATTTCTCTGCACACTGTTTTCTTGCTAGGGCTCCCTATT +GGGAACCCAATTCTCAAGCCTGGAAGCCAAAGGGCAAAAGGGCCCAATGGGTTCATGGCC +AAAGGCAAAGAGCAGAGCCAATAGGGTGAGCACAGACTTGGGTTCACACAGAGAGACCCA +GGTCCTGAGGTCTATGTGATTCCTGTCCCAGGAGCCCCCAGGAAGACATGCCTCCCTCCC +AACGCTGTCCTGGTTGGCCCCTGTGCGCAAGACCTCATCCTCTTCTCCATTGCtatggct +ttgttttgtttgagcaTCTCTTCTACTTTAAATATATTGGTTTTCACTGAACTCATGTGC +CTAGTTTTTCCTGTGTTACATGACTGCAATTTTCaggccaggttttttttttttaattcc +tataTATTCTTAGTATCTTGTGATTATTAAGTGATTAgcatctgagtgtgtgtgtgtgtg +atgaataAAACTGAATTAGCTCAGTTACTCCCAGTTCAGCCGATGATGAAGGAAATGTGG +ATTTCCTAAGGAGTCTGATGTGAAGATtccattaaactaaaaagctttctACGGTACAAA +GAAGACATACGTTAGAAGGCCCTTAATAGTTTTCCAATTAAGCAAAGAGGTGATTTATAT +GAGGATTTCCAGTTGTTCTCTCTCTGCAACTGTGAAAGGACAAGGACTCACCACTTCCTT +TGTCTCCATCCATCCAGAGTTGTGTAGCCACTGCACCCTGAGAACTTCAGGGCTACAGAG +AACAACAAGCATGCTCGGCACCTCAAGGGGCCATACAGATGCTGCCAAGGACGCAGGAAG +AAGGCTGGTGTGGGGTGGGAACCTGAGGCGGGGGCTGTGTTTGAAGAGGACAATCGCAGC +AAGATCACACAGACTGTCACGACAATCCAGCCCTGAGGTAGCTCAGTGCGCCTCCAGGAG +GGGCTTTGTCTCCTATTTGTCACCTATAAGAATTCTGAGGGGAACATTTGTCCTCCAGTT +ATTGTCTTAATGAATTTCAACTGAGACACAGATTTCTGCCATAAGGCCTGGCCCAGAGGG +GATGCCCAGGGTGGCAGGGAGGCTTCCATCCTAGTAACTTCCACTTGCCCCTGGGGAGCT +TTCACAGTGGACAGGCACCTCAGGCAAATGCTTCGTCTGTACTTTGCAAAAACACCTCAA +TCAAGTGCCACGGGCACTGGCATCCAGGCCTCACCATCCTGAGGCTGCTACTGACCAAAG +GCCAGAATGGGCAACAGGGAAAGATCACAGAcatttttaacagaatttttCAGAACATGG +ACTTTGGCATGACCTAGTGGAATGGAGTTTCCTTTTCTAGGGAAGACCAATggtctttat +tgtttcttttaggCTTAATTAGTTATGAAGGAATCCTTGTctaaataaaaaggaagcatT +TAGAGTTCGTGACTGTTGTGGGTCCAGAGTTGATGAGTTTAGGAGTCCTATAATCCTGTG +ACCGTGTGGTTCCTATGGGCCATGTGGTTTATGTGGTCCTGTGGTCTATGTGTTCCATGT +GGTTTATGTGGTGCTGTGATTCTGTGGTCCTGTGGTCTATGTGCTCCATGTGACTTAGTG +GTGCTGTGATTCTGTGGTCCATGTGGTCCTTGTGGTCCATTGGTCAATGATCCTGTGGTC +CATGTGGTCCCTTTGTCTGTGTGGTCCCTGTGGTGCCATAATTCCTGTGATTACTGCAGT +CGATGTGGTCCTGTGTCTAGTGGTCCATGTTGTCCTGTGGTTCATGTTGTCTATGTAGTC +CTAGGGTCCTCGTGGTCATGTGACCCATGCTTTCCTGTGGTTCTGTTGTCCTGCGGTCTT +GGGGTTCCTGGGGTCCTATTGCCCATGTGGTCCTGTGGTCCTTCTGATCCATTGGTTCTA +TGATCCTGTGGTCCATGTGGTCCTGTGGTGCTATGATTCTGTGTTACCATGGTTCATGTG +CTCCTGCAGTCTGTGTGGTCCATGTGGTGCTATGATTCCTGTGGTTCCTGTGGTTGATGT +GGCCCTGTGATATATGTGGTTGATGTGGTCCTGTGTTTAGTGGTCCATGTGGTTCATGTG +ATCCATGTGGTCCTGGAATTCCTAAGGCCCTATTGCTCATGTGGTCCTGTGGTCCATGTG +GCCAGTATGGTCCTGTGTCTATGTGGTCCACGCTATCCAAGTGGTCTTGGGGTCCTGTGA +TCCATGTTGTCCTGAGTCCCTGTAGTTCTATTGTCCACGTTGTCTTGTGGTCTGTGGCCC +ATGTGCTTTGGAGGTCTGCATGGTCCTTGTGGTCCTTAGGCCCTGGTGTCCTGAGATACA +TGTGTTCCTCAGGTTTTGAGTTCCTTGTTTCTTCAAGAACTGTGTTCCTGGGGTTTTTGC +ATCCTAAGGTTCATCAGGTCCTATGGTCTTGTGATCTTCATATTTTGTGGTCCATGTATT +CCTGTATATTGTGGTCATGTGGTGCATGTGGTTCTTGAGTCCTCACATTTTGAGTTTCAT +GGGGTCCTGTGGTCTTGTTATCTGTATGTTTTGTGGTCCATGTGTTCCTGTGTCTTGTTG +TCATGTGATCCAGGTGGTCTATGTGGTCCTTGGGTCCTTGTATGCTGAGTTTCATGGGAT +CCCATGGGCCTGTGATGGAGTTTAATACCAAAACAACAAAGCAGGGTAGATGTGAGTTCA +GAGGCTACTACTGCCTTTCTTCCATCTTAATCTGGAAAGCTTCACTCTGATGAGTGAGTC +CATGGTGTTCCCTTCGGGCTAGAAGCCTTTTGTAGACAGTGTTCTAAGGTTTCTGCTGTG +GGTCAGGAAGCTCCTGGGAATAGTCCTGAAAAGTCTGTTGTTTGCAAGAATGGAGGGAGT +GCTTCACATGACTCATTGTGTTTTGACTTCTGTGTTTCACTTTGGCTGTTTCACCTTGCA +GTCTGAGAAGCTCCTCAACCCagattttcctcatttctttaaaaagagattAATTATCCT +TAATTAGCCTTGACTCCAAGTTGTAGATGAAGCAGCTTGGA +>NC_060927.1 Homo sapiens isolate CHM13 chromosome 3, alternate assembly T2T-CHM13v2.0 +tcataaaaaactcttattattttgagctatgttccattaatacctagtttattaagaatt +tttaagatgaaggaatgttgaattttactgaaggccatttctgcatctattgagatcatc +atgtggtttttgtcattggttctgtttatgtgatggattatgtttattgatttgcatatg +ttgaaccagccttgcatcccagggatgaagctggctTGTTATTGGTGGATCagcttttta +tgtgctgctgccagtattttattgaggatttttccattgatgttcatcagggatagtggc +ctatagtcttctttttttgttgtgtttctgctgGGTTTTGGTTTCAGGACGaagctgacc +tcataaaatgagttagggaggagttcctctttttcagttgtttggaatagttttagaatg +AATGGTACCAGCTGCACTTTCTACCCCTagtagaattcagtagtgaatCAGTCTGGCACT +GGGCTTTTTTTGTtcggtaagctattaattactgcctcaatttcagaacttgttatttgt +ctactcagggattcagtttcttcctggtttagacttgggaaagtgtatgtgtccagaaat +gtatctatctcttctagattttctagtttgtttgcatggaggtgttcatagtattctctg +atggtagtttgtatttctgtgtggtcagtggtgacatcccctttatcattttttattgtg +tctatttgattcttctcttttttcttctttattcctctAGCTAGCAgactattttgttaa +ttttaaaaaaaataccagctcctgcattcattgatttttgacatgtttttcatgtctcta +tctccttcagttccactctgatcttagttatttcttctcttctgctagcttttggatctg +tttgctcttgcttctcttgttCTTCTAATTGTGAAGGTAgggttgatttgagatctttct +agctttctgatgcagacatttagtgctataaatttccctcttaacactgctttagctgtg +tgtcagagattctggtacattgtctctttgttctcattggttcaaagaacttcttcattt +ctgtcttaatttcattatttactcaggagtcattcaggagcaggttgttcaatttccaca +tagttgtgtggttttgagtgagtttgttCATCtcgagttctaatttgatttcactgtggt +agGAGAGACTCTtggttatgatttcagttattttgcatttcctgaggagtattttacttc +caattatgtggccaattttaAAACAGATGCCATGcagtactgagaagaatgtatattctg +ttgatttggggtggagagttctgtaggtatCTATTaagtccacttgatccagagctgagt +tcaaatccagaatatacttgttaattttctgtctcattaatctgtctaatattgacagtg +gggtgttaaagtctcccattattattatgtgggagtctaagtctctttgtagatatctga +gaacttgttttatgaatctgggtgctcctgtattaggtgcgtatatatttaggatagtta +gcttttcttgttagttcatccctttatcattatgtaatgcccttctttgtcttttttgat +cgttgttgatttaaagtctgtttctgaGACTcaaattgcaacccctgctttttctgtttt +ccctttgctttgtaaattttcctccatccctttattttgagcctatgtgtgtctttgtat +gtaagatgggttttctgaatacagcacactgatgggtcttgactctttatccaatttgcc +agatCTGTGtcttaattggagcatttagcccatttacatttaaggttaatattgttatgt +gtgaatttgatcctgtcattgtgatgttagctggttattttgctcgttagttgatgcagt +ttcttcctagcatcaatgatctttacaatttggcatgtttttgcagtggctggtaccagt +tgttcctttccatgtttagtgctacCTTAAAGATATCAGATACAAATTTAGCAGCTGAAA +CCTGTGGCCATCCCTTAGTCTCTCAACTAGGCAGCAGTGAAAACACTATGCAGTAAGAAA +AAGAACTAATCTTGTGTGCAgaaagcaaaaaatttaaaaatacacagattattTTCAATG +TTCTCTACTGCTAGCACTACAATCCCTTATTCCATTCCTCAGATCCTGAGACACCCAATG +ACTTCATTAGAGAGAGTCCTTCTTGCTTAACCTAAACTCAGTTGAGTTTTCATCATTTGC +AGCCAAAAGAATTCTAAAGAACACAGacattatttgtttacatataatTTGTTTTCCCTT +CCTATCAAATAATGTTTTCTCCATAGATGGggagcacacaccacacacacacatgcacac +atacagatgcatgcacgcacacacacacacacacacacacatattatgaGAAGTAATTTC +TCACACTGGCTGGAAATCTTGACATTTAGAGTTCAAATTACTAAATTGAGACTTTTATTC +TTTTGGGGATGATAGAGAGACAATAGAAGACTCAATAAGGcacaagacattttttaaata +ttcataatgTGATGTGACTTGAAATATCAATAAGTGGAGACGGATTTTGGAGGAAACTGG +CAATGATATTAAAGCAATGACTTGTATCCACTTACgtctttataaaaattttcctttAGA +ATGACTCTTGTGATTTTTTCTGCTTTGATCCTGGGATAAAACTTATTTCTGAGATCTACT +ATCCAGAAGAACTTCTGGATTTTTAACattattccatttttctaaaGTGTCACAATAATC +AGGGGAGGAGGGTAAAAATTATTGAAGATTCTGGCCCATAATATACAATCGGTCATATTT +TGGCTAATGAGTGCATGGATGATTAGATAATCTAATTAAGTTGATATGTACTGTAAATCT +CATAGTTTGACTTTCACATCAAgggacatttttttcttgtgtgttaATATCAAtcctgta +tttatatttatagaacataAAATTGCAGCATTTTAAACTTATAATTGTTTGCCCTGGACT +CTTAGATCCTCGTTACTTGAGGTGTGCTCCGGAGATCAGCAACAGTCACATCATTTGCAA +CATTTTGGGACTGGTTAAAGTATAGATCTCAGTCTCATCCCTGACAGCTGAATAAGAATC +TGTATTTGAAATAAACCCCCAAGTGTTCTGAAGCACATTAAAGTTAAAGAGGCTTTGCAA +CACATGACacattttttatgttgttttgaaattatgaaatataataaaCCTAACCTTGAT +AAAATGTCGTGTTATGTTTTCCACTTAAGCTGCATAGTTTTTTTCATGCCACAGATATTA +ATGACTAATTTGCTGTGCTAAATCACAGGAATTGGTAATCAAATGAGAATGGCTTTAAAC +CTATACTTTGATgaaattgacatttaaaaatatagtaaacgtttttttaaagcaataatg +cAGAAGTATGGGGCATCATTTAGTTTTATGTTATGGGCTTTTTTTGCAGAAAAAGTATGA +TTtctaaattaaatgtattttagagATCTACAAAGCTACCAGATGTATTGATTCTTATGT +TTGTTGGTGTTTTCATATAACATTGATATTATTCAGAGCACACCAGTTGGCTAGAAAATT +TTAGGGTTTATTTCATTGGCAATATCATATTATCTCTTGATACTAATTGGtattaaattc +agaaaaatcaCCAACTGCATTAGCAGTTGTGCATGAATATCTGAGTATGCTGTTATTTCA +AATCTGGAAGTCATTGTAAGGACatcttttttttagaatttaagtTAATATTGTGCTACA +TGACTGTTTGTAGCATTGAAGGGGAACTAATCTTTATCAATCATTTAATTACAATGAATT +AAAGTATATATGTAATTacctacattttattaaaattggaCATATTTATAAGGAATTCTA +GGTGAAATATTAGTCTTAGCATTATGTGAACTGGACTCTGATTACACAGAACTTCCCAAT +GCATCTTTGTACTGCACCAAATTAACTCTAGACTCCTAAGCCCTTTACAGCTTGATGAAG +CAAAAATTCTTCTGATAATTAAATCCAAGGGGAATTTTACTACATTCTTATTTTTCCACA +AAAATAACTAAGAAGTTCTTTTAACACGAACAAattctttcaagaaatatttattgagtc +cctcTATGAAGAACATAATTCAGATTAGCAGGTGggaaaaaacaaatcacaaaacaaCTG +TCTCTTTCCTGTATAGTCCATAAGCagaatatgtacatatacatctGTCTTTGGGCGTGT +GACCATCATTGAAGAGAAAGGCTAatcatttcatcttattttaaaatatatttcaagttc +tctatatgatttttaaataagttgtAGGCCTTACTAAGCACTGATATTATGCTAGCAAAT +TTAGTAAGCATTCAAttttattatctcattgaatgtattaaaaatttgATGAACTGTATA +GTATGTGTTGTTAATCCCATTTTGCACATCAGAAAACAGAGGCTCTGCAAGCTTTTGGCT +ATCTTGTTCAAGATCACAGAAATAGTCAGTTGTGGATCCAGAAATTATAGCCATCCTTCA +GAGTGTATGTGTATCGAGTTTATTGTAAGCTTCTGattatgttgaataacaatgAATAAG +CACTAAATAAGGAAACCTTTACAAACAGCATAAGAAGGCTCATCTTGAGGACACTGCCCT +TAGACACAGTAGCACAGAACTACCATCAAAAGGGTGAAATAATTTACATGGAATCCTAGT +GCTTGTCAACAAGCAcaggttttctatttttgcctCCACTGACAGAGAGGATGAGTTTTA +GTACAGACAATGCCAGTCTGCTAGTACAACCTACTGTCCTGTGACagcacaaaaattaac +ttatccaaaaggatagaaaatgaaaagaaagtttgagtCCGCTTATCATGTGTGCCAGAG +TGTGACCACAGTCGTTGTTTACCATTCCCCTCtctcactgtaatttttttcccaCTGGAT +GCCTCTGAGTATTACTTTCCAACTTGATGATATTTCTTGGAAAAATAGCACCCTGGCAGG +CCAAAGTTAGAGAAGTCCAGTTGGTACCTGacactcacttttttttctttttttcattcc +acACCCAACCTTTCAAGAGAGAAATGCAAGGCAGGCAAACTGGTGAGTCCCCTGAAGGCC +CTTGAAGTGACTAATGTACACTCTATTTTGCAATCACATGGGGCCTGTGAAAGCACGTGG +GGCCTGTGACTATTTTTATCTAACTGGGTTAGAGTTGGACTCCCCATAGACCCAAAAGTA +TAGGAATCTAGATCATCATTTAGGAGGTAGCTTCGATTGAAATGCTGGAGGCTTGAACAG +GAGTCCTCTTGgtaacaaagaaatgaaaggctCCTATCTTGAGTTCTGCATGGAAGACTC +CCTCTTACACTTTTTACTGTTGTTTTCAACTAATACAAGGactactgatttttcttttta +tattaaagttACACTTGGCCTAAAGTTTTATATTTGTGAGTAGTTTCTACAATTTTGCAC +AGTTTAATATGTTATGTATTTAGTCTCAATTATCACTCTCCACCTCCTACTTGTAATACA +TTTGTAACTGGTAGGAACTAGTTCATTTAAACCGTATTAATCACACTCTGTCTGAATTAA +TATTTGTTAGCACTGATTATACTGATGGCTACTTCACATTTATACTTCACCTCCCCTCCC +TTTTTGCCAGCTACCATAAACCCAGctgtattttattctaaaagaaaaaagaaagaaaaa +aatctgggcCCAGAGCTAAGTGTCAAAGATAATAGaaacaaagtgctgagatttttCCTG +GTGGAATAATGGACACTTTTCTTACACAGACTCTTTATAAAGTGACATGTTTATTTAGTT +TCTGAGCAGTAATGAAATGATCAAAACAGTATTGCAATTTATAAAGTATAATACTTGGAC +ATACCAAGCCTTTTATTCTCTCAAGTCCCCTCGCAGAAATGACAAACACAAAGGCTAGGT +CAGTTACTATTCAGTAGTGCATCAGAGCTGGCTTGTATATTACTGGTGTCTCATCCCAAT +TCCTTGTTAATGATGTCACCTTGTTGACTGGGAAAAAAAGGCATAGTAGGAGTTATTTGC +TCTACAGGAGTAAGTAAATGCTACAAATTAGGGCTCCCTTTCTCACCTCTCCTCCTGGAA +GGGAGCAATAATGCTCCTCATTGTTGAGCATTTACCAGTGCACCATTGCCTATGACCATA +TCACGCTTGCTGTCTTGTATCATCAGCACTAGTTCTTCCTTAACAAATGCATGCCATTAT +GCACAAGTCTAACCAAACATACACTCAGAATGACTGCAAATTCATTGGAAAACATCCAAC +ACAAAGCTCACACTTGGTATTTTTTGGCTTCCTTGGGCACAAATTAGGATCTCAGgcaat +atttgctgagtgaataaattggcatatataataaaataaaagccttatCTATTTGCATAT +TTACCACCATCTTCAGAAACAGATGCATTTCATGTAGACTAACTCTGTCAGTAACCATAG +CATGCTAGTCTATAATCATTGTTGGAAAGTTTCacaggataaaataaaaagttattgaaa +AGGGAGTACTGAACTCAAAATCAAACTGAACTACTTGCTAAATTTGGGATATTAGTAgag +ttattcatattttatacattttattttctcatctgaaactgTAGACAATAATATCTACCA +TGGGTTTATTATGAGGATTCAAGTAATATTTAGCACGTAATCTGTATTCAAAAATTGCAA +TAGACACTGCCGATACACAACAATAACACTtgctatttttacatttattatcttctTAAA +TATAGTCTGCTGAGGATCACTGATGTTTCTAAACATCATGTGActggaataaaaaataac +ataagatTTTCCAGATATGAAGTCACTGGTAATTCATTGAACAACACTGAATATAAATTT +CAACGATTGGGATCTTTCATTGAGTCACAGAATTCAAGTAGGTATGGCCTAAGCATTTAC +TTTACAAAATAGTAAGATGTACTTTTAATTGTCTAGCTGAAGTTTGCTATTAAATTTACC +TAAATAAGAGATTTAAAttaatggtttgttttttttttgagagaagtctcgCTCTTAtcc +cccaggtttgagtgcaatggcttaatcttggctgactgcaacctccgcctcccaagttca +aatgattctcctgcctctgcctcccaaatagcttggATTACCTCGcttgccaccactcct +ggctaatttttgtattttttagtagagatggggtttcaccatgttggccaggctggtctc +aaactcctgacctcaggtgatccgcctgcctcggactcccaaagtgctgggattacaggc +atgagccactgcgcccggccattaaTGATAAATTTTTAAGAGCAGAGAAAAGCAATTTCC +TAAatatcaaagaactaaaaacaggcATTTTTTGGCCTTTGATGTTACCCTCAAGGAAAT +AGGTGATAATACAATAAttttactctaaaataatgattctCAAACATTAGAGAGCAGAAA +AATCACCAGAGAAGCCTGTGGGGAAAAGTGCAGATTATTCACATTCCTTCTACTGCCTTC +CTATCCAGGGAGGGAGagtagagaaggaagaagggaaggagaagagagaggaaggaaagg +gagagaggaaagaatgagtgagaggaaaggagggagggagataaaaaaagggagggagga +agaaaaggaaataggtGACTATTTCCCAAAGAGATTAATGTTTACATCagtctcctattt +tttttttgagtcttgggATTTGAAAAATACATTGGGATTTAAAGTGATGTCATTCAGATA +GATTTATCTCTTAAGGTATATCGGCTTATTTGAAATGGTatcattaagttaaaatgaaat +taagtcaAATATGATTTTCCACATCCACGTTCCAGGCCACATAATGAAATAAGAATAGCA +CCAGCTTTAATCAAATGCAGGTGATATAACTGTACAACAGAAAGCCTTCAGAAGGGATGT +AGATTGGTGAAGCTATGCCACAGAGTCACCAATGATACAAAATTGCACTTGATACAGTCC +TGCATCCCAGGGTGCCCTGTAAAATTATTATGCTCTTCATAACTCATATCCCTTTATTAA +TGTAACACGGCATAAAAAAGGCAAAACCAGTGGTATCCTGGAAGTCAGAAGGACTACACT +CCTTGCAGAAATCTGTCACTAGCATGACTTTAGGTAACGATGGCATAATAAGAATTCCCT +AATAGTTTTTTGACTTATAAATGTCTTTCTTGATCTTTTTGTTCTTACTATTAGTTTTTA +TGGACCAAGTTATCTGCATTAAAGGTCAATTTCTTGGTCCTTCTGCTAAATTGTAAgcaa +atgtttttgctttttaagccTAGTAATTTATCAAGAATAGCAGCTATACACCATGTACCA +TGAGTGGATATATAGCTGCTTTGAAAGTGTGCAAACTGACACATATTTGCTTCAAAGTTT +TAAATCCTTGATTTTTTATGAGAGTAAAATTTTAGGCTTGAATAGTGGTCAGATTTAGAA +GCACTGGACTGAATTTTGTCTTAACTCCAGAATccaaaaattattctttctataAAAGAC +tttacagtcatgtgtcacataACAGTATTCAGGTCAATGATGGACCACAGGTACAACAGT +GgtttcataagattataatggagctaaaaatTCCTATCACTTAGTGACGTTGTAGTTGTC +GTAGCACAAAACATTACTCGCatctttgtggtgatgctggCATGAACAAACCTACTGTAC +TGACAGTCctataaaagtctagcacatgGAATTAGTACATACTACCAGAGAATGATTATA +AACACCTGTGTTACTGGTTCGTGTATTTATGATACtccattttttatcattattttggaG +TATATTGCTTCTACTTATGTAAAAAAGTTAACCGTAAAACAGGCTTAGACAGGCACTTCA +GGAGGTATTCTAGAAGAAAGCATTGCCATCATAGTGGATGATAGCTCCATGTATGTTATT +GCCCCGGGAGACCTTCCAGTGGGGCaaaatgtggaggtggaagacagtgatattgatgat +cctgaccttcTGTGGGCCtcagctaatgtgtgtgtttgtgtcttagcttttaataaaaaa +gtttagaaagaaaaaagtagaaaaatgcttatagaataaggatataaagaaatataattt +tttgtacagctgcacaatatatttatgttttaagctaaatgttattataagaataaaaaa +gttaaaaaacttataaagtaaaaatgttacagtgaGCAAAGGTTAGTTTATTattacaga +gaatttttttttatttttttgagaggaagtcttgctctgtcgcccaggctagagtgcagt +ggcgcgatcttggctcgctgcaacctcagcctctggagttcaaatgattctgctgtctca +gcctcctgaatagctgggattacaggcgcatgttgccaggcccggctaatttttgtattt +tagtagagacggggtttcaccatgttgctcaggctggtctcgaactcttgagctcaggca +atccgcccatctcggcctcccaaagtgctaggattactggcatgaaccactgcgcctggc +caatattttgtataaatgtaaAGTAGCCTacgtgtacagtgtttataaagtctgaagtag +tgtacagtaatgtcctaggccctcacattcacttaccactcactcactgactcacccaga +gcaacttccagtcctgcaagttcTATTgaatggtaagtgccctatacggtgtaccatttt +taatcttttataccatattttagtGTACCTTTTTACGTTTAGATACGTTGAGATACATAA +TGTAGTCCCTGTGTTACACTGACCTACAGTAGTTAGCTCAG +>NC_060928.1 Homo sapiens isolate CHM13 chromosome 4, alternate assembly T2T-CHM13v2.0 +TCACTGAGAAACACTTCTCTTCATAGGAGATTTTTTTAGTGGGAGGGAGATGAGCTAGCT +GAGGGGTCAGGGCTCACCAGGCTGACAGCTCTATTGGGGGCTGATCAACTGCTCATCTCT +CCTCCGTGATGTGTTTATTTCAGAAATCAATGTGATCATTGAGTGCTGTGTCTTTTTCAG +AACAGCCTTCTTGTAGGACACATGTAGATGCCCTCAGCTTCATCGTCCTGCTGGTTACTT +TAACGCTGGGTACTGTCCTGTCTTTAATTAACTGCCCTTTGCCCTTAGTTACCTCATGAC +AACTTGGGATCTATTTAACTTGCCCATTTGCTCACCTTCAGTTATGCCCATTAAGCCCAG +CAGTGATcccacagaaaaatatttttgtcagaAGAACCCTTGCTCATTTAAATTATCTGT +AGAATATATTCGATCCATAGCccagaaacataaaaacaatattaGCAAAAGTTTAATCCA +ATGctaatgttcatttatttattatagacgtggggtcttgctatgttgcccaggtgggtc +ctgaactcttggcctcaagcagtcttcccgcttcagcctcctcaagtgtTGAGATGaaag +gcatgagctgctgtgtccagcctatttatttatttttaatgacatagATTTTGTTGTGTT +TCAACTCCCCCAAATCCTGTAACCTGAATAAACCCCTAGATTTTAAGATGACTGTTGCGT +TTTCCCCGGGGAGTGAAGATCCAGGGAAATTAGGTGAGTTGTTTATACGTGTGTTTCCCC +TTCAAAGGTGGATAATAATGTCACGAGGCATTTGGATAAAGTATTAAAAAGAGGAGATTG +GGACATATTAATCCTCCACTACCTGGGGCTGGACCACATTGGCCACATTTCAGGGCCCAA +CAGCCCCCTGATTGGGCAGAAGCTGAGCGAGATGGACAGCGTGCTGATGAAGATCCACAC +CTCACTGCAGTCGAAGGTGAGGCTCGCCGTCGCTCACTGTCTGCTGATGTGGTTTCACGT +GGATGTTCCCTAGAATAAATGCAACCGCCTGAGTTATTCAGGGTGCATGTGTGAATGTCC +ACCATCAGTCTGCTAGCCAGGGGCCGCATGCCACACGGGCAGCACTGTCTCAGTGTCCAC +TGCACTGACTCCGTCTTCCAGCAGCCCTGCAGAACAGCAGCTCTCACTCCTACCCGTGTA +TGCATTCATTCAACTAATACCTCCTGAAGACCTTTTGTGCCACTCTCTCTGTTCTGTATC +ACTCTCTCTGTTCTGTGCCACTCTGTTCTGTGTCACTTTCTGTTCTGTGTCACTCTCTGT +TCTGTGTCACTCTCTCTTCTGTGTCACTCTCTGTTCTGTGTCACTCTCTCTGCTCTGTGC +CACTGTCTCTGTTCTGTGTCACTCTGTCTgttctgtgtctctgtttctgttCTATGTCAC +TTTTTGTCCATGCATTTGGGTGCATCAGTGAAACAGTCGATAATCCCTCGTGAAGCTCAC +GCTCTAGCCAGGAGAGATGAGAAAGATGAGTAAATAAGTATGTGAGGAGGTGATGGGTGC +TGCAGAAACtcagagggcaggaggaggggcttTCAACAGCGTGTtgagagaagccttccc +tgaagaCGTGTGCAGGGTGAGCAGAGACttgaagggagggaggggcagaccATGTGGTCT +GTGCACGAGTGTTCCAGGAGGACCAGCAGCGAGGGTCAGGCACAGCCTGCCTGGCTTGTC +CCGGAGCAGCAAAGGATGTGTGGCTGCAACCCCAGGGGCAGAGAAGCCTGGTGGGTGCCC +CCACATGGCTCAGAGCTCTTGCCTTTTGCTGTGTGTTGTGTTCTCACCAGAGTCCTGTGA +AAGattccatttgacagatgaggcgACCAAGGCACAGAGTAGAATGCGTCCAGAGTCTCA +CAGCTTGGCAGTGGCAAAGACAGAAACCAGATACAAACCGTCTGCCATCAGAGGGCAGAA +ATGCAGCCTGCTGTGCTCCATGAGCTGTGTACAATTCTGTGAACTTCATTTATGGCATTA +TTTGACTGTGACCCTGTGATCTGGCTATGAgctcataggaaaaaaaaatctaattcatTG +AGAAAGAGCTACAACTCTATAAAGTAAAGCTAAAACCGAAAATTGTCTTCTTAAGATGAT +GTGCTCTCTTCAGTCTGAACGCAGttgaaatgtttttcctttgccTTAAAGGAGAGAGAG +ACGCCTTTACCCAATTTGCTGGTTCTTTGTGGTGACCATGGCATGTCTGAAACAGGAAGT +CACGGGGCCTCCTCCACCGAGGAGGTGAATACACCTCTGATTTTAATCAGTTCTGCGTTT +GAAAGGAAACCCGGTGAGAATTTAGGAATGTTAACAGTTGGAAATTGtattacatttgtt +ttctatagtctggttttaattttgaaaacctATTTTTTAGAAGCTCCATAAGGTTGAAGT +CCCCAAGCAATGTGAGCATGAAAAGTAATTGGGCAAAAGGCTTTTGGGATCTGAAGTTAC +GTTCCTTCCCGAATCCTTAAAATACAGTTATTCTTTGTCAGAATTTTGTTGTATGAATGT +TGCTGCCTGGATATCTGGAACTGTTGAGAAAAATTGCCAGTAGCTCAGAGACATCTGGAC +AGCATGTGTGAACTGAAGGAAACGTGAATACCTCggcttttttaaaagtttgcattATTG +TAAACCATCTATTGAATAGCAGTGTCAACAAGAGTCATGGGACCCGGCCAGAGCAGGACA +GACAGAGGCCCCGTCTGTCAGTATTCAGACAcgccccaaacacacacacaccccactctg +ACCTGTGCCCAGACTCAGCCGCCAGCCTATGCACTCTGCCCTCGCGGCCGCCGGCCTTGC +TGTCCTGTCGGCGGCTGCCTTCCACTTGCGCCTGGCTTCTGCTGCCACACTCGCTGCCTC +ACTCTTGGTGAGCTCAGCGGTAATTTCTGCCGTCAGGCACAGCAGACGCTTTCGGGCGCT +GCTCTCACTGACCCTTCAGCACCCTTAGTGCTGCTGGTCCCGTAGCTTCTGGGACCTCAC +ATCTTTCtggttttcctccttttctctcctttgccAGCCTAGTTTCCTTTCCCTGGTCTT +TTTTACTGGACTGCCTTCTTGTTTCGTTCTGCATTAGCCCTGGAGATACGGTCTCATCTG +CCTCTGTGGTTGTAAATGCCGTGGATAGGCCCCACACCGGTCAGATTGATCTCTCTAAGT +GTCCCCATTCATCATTCTTGGCATAATTTGTCATTGCAGACTTATTGatggattttgttt +atttatgggATTCATGTAACATCTGCCTCCACATTACACTTTAAGCCAGATGAGGACAGG +ACCATGTCTCTTTTGCCCACCATGATCTCCACCTGACCTCTTATATCTTTTTATGAAGCT +TCTTggccgagaccagctcggtccgGGAGACTTTGACCcagcagcgctagaggaattaaa +gacacacacacagaaatacagaggtgtgaagtgggaaatcaggggtctcacagccttcag +agctgacagcCCTGAAGAGAGATTTAGCCACGTATTTATTAAcggcaaaccagtcattag +cattggtTCTACTGAttctaaattaactaaaagtatcccttatgggaaacgaagggatgg +gctgaattaaaggaatagaTGGGGCTAGTTAAccgcagcaggagcatgtccttaaggcac +ggttctctcatgctattgtttgtggcttaagaatgcctttaagcggttttccaccctggg +cgggccaggtgttccttaccctcattcccgtaaacccacagccttccagcgtgggcgtca +tggccatcatgaacatgtcacagtgctgcagagattttgtttatggccagttttagggcc +agtttatggccagattttgggagGCTTGTTCCCAACACTTCTTCATCTTGAATGTCTGAC +CTGAGCAGAGCTAGGAATGGTGGGGGCAGCTGCATGCGTGCAGGCTGCCTGCAAGTGCCG +GACTCATCACCAGCTTCAGTCCTGAGAGttggttctgttttgttttctttattctcatcA +TACCTGTTTCGTGAGCCAGGACTGTACTCTGGTGTACTCACAGCATTGGGCCACCATCAT +CACAGTCAATTTTACATCATTTTCCTCACCtcagaaagaaaccccatactCTTCTGCAGC +CAccttcctcttccccagcccagtcttctctccctcccccaaccctaggTAATCAGCGTC +ATTGTCTGTAGATTTGCCTCTTCTGCATGTTTTGTGTAAATGAAACCATATGGTCTcgtg +tgcctggcttctttcatgtagGATAGTGTTTTTCCAGGTTCATAGTTATAGCATGTATCA +AGACTTCatttctaggccaggcactgtggctctcacctgtaatcccagcactttgggaga +ctgaggtgggtggatcacctgagatcgggagttcgagaccagcctgaccaacatggagaa +accccgtctctactaaaaatacaaaattggctgggtgtggtggcgcatgcctgtaacccc +agctacttgggaggctgaggcaggagaatcacttgagcccaggaggcggaggttgcagtg +agccgagatcgtgccattgcactccagcctgggcaacaggagtgaaactccccatcttta +aaaaaaaaaaaaaaaaaaaagaagacttcatttcttttgttattaaatAGTCTTCCATTG +CATGGATTTAACACATTCATTGACCATTCTtgagctgatggacatttgggttgtttccac +tttctgGCTGTGATGAATAATGACGCTGTGATCATCTGTGTGTAgctttttgtgtggatg +tatatTTCCTATGTTGTCATTTTCTTACCCAGTATAGCTGTGCCCCCACCCGCCACCTCT +GTGCTGTTATTGTCAAATATGTTGCTTTTCTGTATGTTATAAACTGATGGCATAGTGATA +TAGACATGGTTTTATATAATTGCTTTTAAAtcaggagaggaaagaagaaaatgcttttat +aGTGTCTTTCATAATTATATGATTACCTTTACTGATGCTCTTTGCTTTTTTATGTACCTG +AAATTTGATCTAGAGTCACTGgctttcagcctgaagaacttcttttagtatttcttgtaa +ggcagattTGCTAgcaaagaattttttgttttagaaaatatccGGGATgtctattttgtc +ttctttttggaAGGAGTTTTGCTGACTGTAAGACTGGGTTggctgttttttctttcagca +ctttgaatgtgCTGTCTCAccgccttctggcctccatggtttctgatgaaaagTCAATTC +TTAATCTAATTGGGTTtcccatttctttgtcttttaccATTTTTGCTATAATGTATCTGT +ATTTTATGTTTACTCAACTTggagttcattgagcttcttgcaTGTGTAGGTTGATgtgtt +tcatcaaatttggaaaattttcagttgTTTAAATTGCATAATCTCTATTGATCTATCTTT +AAATTGCTGgttctttcttctgccagttcAAGTCTATTGTTAAACCCCTTTAGTGAATTT +TCTGTTTCAgttatcatactttttttttttttttttttttgagatggagtcttgctctgt +cacccaggctggagtgcagtgacacgatctcggctcactgccacctccgcctcccgggtt +caagctattctcctgcctcagcctcccgagtagctgggattacaggcacccaccaccacc +ggttaatttttgtatttttagtagagacagggtttcacattattggccaggccgatctca +aactcctgaccttgtgatctgcccacctcggcctcccaaccattatcatatttttttaaC +ACCAGAGTTTCatttgatgctttttaaaaaataatttctggccgggcgcggtggctcatt +tgtgatcccagcactttgggaggccaaggcgggcggatcacaagggcagaagttcgagac +cagcctgaccaacacggtgaaaccccgtctctactaaaagtacaaaaattagccagatgt +ggtgatgggcgcctgtagtcccagctactcaggacgctgaggcaggagaatcacttgaac +ccgggaggcagaggttgcagtgagccgagatcgcaccactgcactccagcttggcgacgg +agtgagactccatctaaaaatagtaataataataataataatttttatctctttattgat +attctctatttgatgaGGAAAAGAAGAGCATGGGGAGATGGGAAGGAGATCGCATAATCC +TCTATCGGGAGCTGGGGGAATGAGAGGGAGATCGTATAACCAACCCTCCTTCTGGAGCTG +GGGGAAAGGGAGCTCTGTGTTCTGGGCTGCACCCACCACAGGAGAGTTTCTGCCCCACTG +GGctaggagggggagggagggagcaggccACGGTTCAAGGGCTGCAGACTCTTAGGCTTC +TTACCAAGGCCTAGTGGATTTTCTTGAATAAAGATTTCTTTGTTTGTTCTGTATCCCTAG +ACAATTTCCAGAGACTGTgaatggtggtagtggtggtttttaaaatgtttaccacTTATG +CTTGTTTTATTGATAAGCAAGTTTATGGAGCTACTCTTAACACTATTCCCTATAGTTCTG +AAggatttttatcttaaaaatgcacggaaatttttgttttgttatgttaataaaaataaa +tgttaaaatgcttattattttgaaaataagcgGTTTTGGATTGTGTAGTGAGTGACTTCA +GAGACCTTCAGCCCACCACCGCCCACCCCTAGAGTGCTGACCTCCCTGTGTGGGCAGTAC +AGGTCTGGCCACTCCAGAGTCAAGGGGTGTGGGAAGGAGAGCATGCCTGTACCTGGACTT +CCACAGAGGGCAGAGCAGGTCTGTTTTATTTTCGGCCTCTTGCTACTAGAATGTTTGACC +CTGTTTGTTGTTCTGTTCCCCTGGTACCTGGCACCTAGTGGATGTTTTATCATTTGTGGA +TTGAATGTTGAAGACTCAGCAGGCGAGCCAGTGGAGGTAGAGACCGGCGGTGAAAGGATG +CTGCTGGGCTGTGGGAATGGTTTTCTGAAGTGCTGGAACTTCTTTCATGGCCCCTTATCG +TCAGTGGGGCGCAATCCACAGGCCTACCCTGTGTTTGTATTTCAGAATTACAGTTATTAA +AATAGTTTGTGCAGGCAAGAACTGGTCACAAACCAATCAAAGGTGCAAAATCAAGAGGCC +AGAAATAGACCTCAGTGTATCTGGGGACTTGGTGACAAAGGTGGCATCTCAGATTAGTGC +AGAGAAGAcatggtgctcaataaatgatgctggtaCCCCTGGCTGACCTTTTGGAAAAAG +GTAATGCAGACTCTCTGCCTTATTCTTTACAACAATATCAATCCAGGTCAAAGCATGTTA +ACGTCTTTAAAAGACTACAGTATGGAAAATTCTGGATGTAGAACGGTAGTCACAGTCGTA +TAATAAACCCCCAAGTCCAGCTTCACCAGTTACTGGCCAATTACAGCCAATCTTCTTTCA +TCCGTGCCCACACTCATTTCCCTTCTCCTTTATTATTTGGAAGCAGACCTCTAAAAGGTA +CGTGCTCTTTACCCCCATAATCTTGATACCcttatcacatttaaaaaatagtgttaaTTC +CTTAATATCACTGAGTAGTGTTCATATCTCTAatatctgtttctctctctttaggTGTTT +CAGCTTGTTTGAATCAGGCTACAAATAAGACCATACACTGTGATTTGTTTATGTGTCTCT +TAAGTCTCTGTAAATCTGTAGGTCCCCAGCCCCAAAACTCTTTGCTTTACTACAGTTTAC +TCGTGCACATTTCCTTCTTGAGACCTACAGTCAGCGATTTCTCCAGGATGCCCTGCTTCT +TTTTAGTGGAAGGTGGTATTTCAAGATCACTGTCTCAGAGCTACCAGTGCTAGCTCTGAG +TGGTTGGTCATTGTTTctagacagaaagaagaaattgtTTTAAGATAAAATGATCTTGTG +TTTGTATCGATTCACCTTCAAAACTGTAAAATGACTTCTTAGGTCTTACATCTGTACTTT +CTTCTTCCTAAGTTTAGAATCTTGGTTGTCAGCAACTCCAGATATGATAGAATTAGCATA +TCACATAATGACTCATTGGCTTTATCCCGCAATAGACACGCAACAGTCTCAGAATAACAA +TGCCAGTGCTGCCACTACCAGTATGAGGGTCAAAAGCAATTTAAGgtgggtttgtttttg +tctttgtgttttattttttgtgtcagCTCAAAGCACTTAATGTaagaaaatactagaaga +aagaAGTACTGGAAGAAAACGGCCACACTGGAGTGGAAGGTTCTTTCTAAGCATGACCTA +GAAGCCGTCATTAGAGAGTTGGCCAAGACCTGATTAATAAATTTGACCAAATTAAAAACT +CGCTACAAAAAACTTACCACAATCAAAGTAAAACCTCCCCAGACTCACACCTGAGTATCT +AAAGACACCTCACGCACCACCTATCCTGAGTAGCCGTCCCTGTGGCCTCTTGGCGCCCTG +CCGGTGTACGTTGAATTCCAGGGTGTGGAGCTGTTTGCTGTctttacagatgaaaacact +TCGACCAAGTTGAGTTTCTGCTCCGAAATCATAGTGGATGGTGGCAGAGCAGTGGCCTAG +GCCCATGGTGCTGACATCACAGCCATTCTTGCAAGGAGATGGTAGGATAGCCACTCACTG +TTCAGGCTTGAGCTTTAGCCAGCAGGCAGATGTCCAGCTTGTCCAAGTTGATTAGAGCAC +CCGGCCCAGCTGAACCTGCCTCATTCTGCGCTCCCCTATAGAAGCACCCACAGCTGCCCA +GGAGCCGTGAAGGGTTTATTTTCTCCATGAGCAACAGCATGTGTGCTCGTAGAGGGCAGA +GCATGGGATGCTCCAAATCCAGAGGGGCCGGGCTGTCAGCGATCCCAGCCTCACTTCATT +CTCCGGTTGGCTGTTGACCTTGCCAAAGTGACAGTCCCTCCGTGTCTGCGGGACCACCTG +CTTCCTCTGTGTTCAGCCCATGCTCCGTAGCCCTTACTGTATGGAATTCCTCACATGAGC +CTCTCTCGCAGCCTGTTGCAGGCTACTGAAGGAAAGACACCGTCCCTGGCATAGAATGGG +TTCGGTAACTATCAACACAGCAAGCACAGGAGGTGATTCCTGTACGATTCTGTGTTGAGT +GGTGTGAAGAGACGGATCATTTGGCTCATGTTAGTTGTAGAAGGTCTAATTCAAGAATGA +GTACCATCTTACACTTTCTAGAAGTCTgttacttaaaatgttttctttcttctaggtGAT +ATCCGACATCCAAAGCACGTCCAACAGACGGATGTGGCTGCGACACTGGCGATAGCACTT +GGCTTACCGATTCCAAAAGACAGTGTAGGGAGCCTCCTATTCCCAGTTGTGGAAGGAAGA +CCAATGAGAGAGCAGTTGAGATTTTTACATTTGAATACAGTGCAGCTTAGTAAACTGTTG +CAAGAGAATGTGCCGTCATATGAAAAAGGTCAGTCAACTCACCGTTTCGAGCTCTGTCAG +AGCTGTGTGTTTCCACTGAGCTCGGGTTTCTCCGATGTGTTTCTGTGGTATGCAGTTTGT +CACAGGAGTATTTTTTCATCACTACTCTTTGATGATACagattgtgtttctgttttctta +gaaCTTTGAACTATCACCATTGGCAGCACCCTCAGATGCAGTTATCTAAAGTTCtttcat +aaatttattcattcaacaactatttaccAGGATCTTGTTATGAATGAGAGGCTGTTAACA +GGCACTGGAGACAGAGCAGGTAcgaggctctgccctcatggaaccttccagagggaggag +agaaaaggaagtgaTCGATGGCCGATGGTGACGAGTACCTTAGGAAAAGAATaaacaggg +ctgggtgcggtggctcacgcctgtaatcccagcactttggg +>NC_060929.1 Homo sapiens isolate CHM13 chromosome 5, alternate assembly T2T-CHM13v2.0 +CTCACtttggggtggggttggggttggggtgcAGGTGGAGCCTCTGAAAGGCTTTGAGGA +GTTTGCAAATGCCCTGCAGGGGAGCAACTTCAGGTCTCGCTGACCTTTATCCCTCAGGAG +AGGATCTCCAGTGAGGCTGTGCTCTCCGGGAATTCTTTTGTGCAGGTAGACGGTGAGGGC +AGCTTCCCAAGCCTGTTAACTGCACCTGTGCCTGCTCACGTGGCCACAGCCGCCACTATC +AAGGAGCTCTGGGTCCTGCCCGCGAAGCCAGGACTTTGTCACGAGCTTTGCCCGGACGCA +GCAGCCGGAAGCGGTTGGGAGGATTGATTCTTGATATTGATGCCACCCAGAGAGGACAAA +GGTGGAAAGACACACGAAAGGGGCCCGAGACGGGGGCTGGAGACGCGCGGAACCCGGGCT +GCGGAGAGGGTGCTGGGGTGCgcggcagggccagggcagcccGCACAGGGTGCATTCTCA +CGCAAGGTGTGCCCCGTGTCTCCATCATTTGCCCCAAATGCAGGAGGGCCCGGGGTCCTC +CCGAGGGGCCCCATGCTGCTCCCTGTCCTGTGGGGCCACCCTGCCAAGCGGGGCACCACT +CCAGAGCTGGGACAGCAGCAAACCAGAGCCAGACCCCACAGGTTCCCCACCTTCTGGGCG +CTGCTCCCAGGGACCTGTCTGGCCACTTCCCAGCAGGCTGTTTTAACCCGTGCAGAGCTG +GTTTCCTATGATAATCTCGACTTTTCTGGGCAGTTGTAAAGACTGAAAATCAGACTCCTT +CAGAGAGAGTGGGTTGACTTTGTTCTCAAACCCAAGGAAAACGAAGGATAAAACGTGTTA +TTTATTATCCTTGTTTTAAAGTTattgggggccgggcgcggtggctcacgcctgtaatct +cagcactttgggaggccaaggtgggtggatcacaaggtcatgagatcgagaccagcctgg +ccaatatggagaaacaaaaaaaaaatacaaaatacaaaaattagccaggagtggtggcag +acacctgtagtcccagctactcgggaggctgaggcaggagaatcgcttgaacccgggagg +tggagattgtggtgagccgagatcgagattgggccactgcactccagcctgggagacaga +gtgatactgtctcaaaaaataaataaataaataaataaataaataaataaataaataaag +ttattggGTCAGGTAAGAAGGAGGGATCcggctgctgcttcttttttttttttttttttt +tttttttttttttttttttttgagacggagtctggctctgttgcccaggctggagtgcgg +tggcgcgatctgggctcactgcaagctccgctcccgggttcacgccattctcctgcctca +gcctcccgagtagctgggactacaggcgcccgccaccacgcccggctaattttttgtatt +tttagtagagacgaggtttcaccggttttttttttcttaaatagtgtctagctctgttgc +ccaggcgagcaccaccaggcctggctaattttactattttttgtagagatttttttcacc +atgttgcccatgctggtctaaaactcttgggctcatgtgatcctccagcctcggcttccc +aaagtgctgggattacaggtgtgagccaccgcgcccattcTGGGGGGATCCAAAGACACT +GGCACCCCATCCTCAACCCCCAACACCCCAATCCCTGCCCCACAGACGCCTGAATCCCCA +CCCCACAGTCGACACCCGAATCCCCACAGACGCCCGAATCCTCACCCTGCAGACGCCCGA +ATCCCCACCCCGCAGACGCCCGAATCCCCACCCCACAGACGCCCGAATCTCCACCCCACA +GACGCCCGAATCCCCACCCCACAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCT +CACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGC +CCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCC +CGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAA +TCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAG +ACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCCACCCCGCAGACGCCCGAATCCCC +ACCCCGCAGACGCCCGAATCCTCACCCCACAGACGCCCGAATCCCCACCCCACAGACGCC +CGAATCTCCACCCCACAGACGCCCGAATCCTCACCCCACAGACGCCCGAATCCCCACCCC +ACAGACGCCCGAATCTCCACCCCACAGACGCCCGAATCCCCACCCCACAGACGCCCGAAT +CTCCACCCCACAGACGCCTGAATCTCCCCGCTACACCCAAATGCCCACCCACACCCATGT +GGCTCCAGTTCCCATTCGGCTTCTTGGCGCCCGCCCCTCACACCAGTGGAGCCAGGGGAA +GGGGTGACCAGTGCTCAGGCGCGGAGCCCAGCTATGGAATCACAAGCAGCCCAGAGCGCG +CCCGGGATGGAGATGCCGCAGGGAGACGCAGGCCTCAGGATGGAGTAGCCGCAGGCAGAC +GCAGTCCTCAGCGCGCCAGGGATGGAGATGCCGCAGAGAGACGCAGCCCATAGTGTGCCC +GGGATGGAGATGCCGCAGGGAGACGCAGCCCACAGTCTGCCGGGGATAGAGATGCCGCAG +GGAGACGCAGGCCTCAGCGCGCCCGGGGATGGAGATGCCGCAGGGAAACTCAGGCCTCAG +CGCGCCCGGGGATGGAGATGCCGCAGGGAGACGCAGCCCATAGCGCGCCTGGGATGGAGA +TGCCGCAGGGAGACACAGCCCATAGTGTGCCCGGGATGGAGATGCCGCAGGGAGACACAG +CCCATAGTGTGCCCGGGATGGAGATGCCGCAGGGAAACTCAGGCCTCAGCGCGCCCGGGG +ATGGAGATGCCGCAGGGAGACGCAGCCCATAGCGCGCCTGGGATGGAGATGCCGCGGGGA +GACACAGCCCATAGCGCGCCCGGGATGGAGATGCCGCAGGGAGACGCAGGCCTCAGCATC +ACCATCGCCCCCACGCCGTAAAGGACAAGGACATTAGAGAGGAAGACCTCCCGGGAGTCA +CACATGAGAACTAAAGTTTAAAACTCAACAGAGGATTGAAAGAGGAGGTTAAGAATTTCT +CTCAGGCCacaggtggtggctcacacctgtgatcccagcactttgggaggctaacgcagg +agaatcgcttgagcccaggagttccagaccagcctgggcatcatagtgagaccccgtctc +tacaaaatacaaaaactagccaggcatggtggtgctttgcctgtggtcccagctacttgg +gaggctgaggcagtaggatcacttgagcctgggaggtggaggctgctgtgagctgagatc +gcaccactgcattccagcctgggtgatagagccagatcctgtctcaaaaaaaaaaaaaat +tatctcagaagatagagaaaaaaagacacataaagaaaatgtagggccaggcacagtggc +cacacctgtgatcccaccactttgggaggctaatggtggagcggatcacttgaggccagg +agttaaagaccagcctgggcagcatggtgaaactctgtctctactaaagtaaattacaaa +aattagctgggtaccgtggcgcatgcctgtaatcccagctactcaggaggctgaggcata +agaatcgcttgaagccaagaggtggaggctgcagtgagctgagctcatgccactgcactg +cagcctgggcgagagagtgagatggaaggaaggaaggagggagggagggaaggagggagg +gagggagggaaagaaggaaggaagggagggagggagggaggaaggaagggtttGAGGGCA +GAGTAGGCTGGTCCCATGTGGGCCGAACGTGGAACCCTGGAACTCAGGCGTGGGCAGAAG +ATGGAGAACCGCGGACAGGCATCACCACAGCCATTCCCAAAACCAAGCTTGCGGTTCCAG +ACTCAGTGAACTGCCAGGGACCTGGCACAGCAGGTGAAGTTAGCTGTACCCCAAAGCATG +TCAGGGAGTGAGAGGAGAatggggtgcggggagggggaggaggcctCCTGCAAAGAACCA +GGAATGAGGAAGGCCTCCGTGTCTCGCATGGATGCCAGAAGAAGCTGGCACAGGGCCTGA +TGATTTGGAAGGGAAACCAGTTCCCGCGGCGCGAATCAAGCAAGGCAAAGGCATCTCAGA +GGGGCCCTGCGGGCAGCCGGCGTTGTCCCTCCTGCAGTCAGCGCTCCACTGCCCCACACT +CAGCTGGCTTCCCAGGGCCTGAGCAAGGATGGGGGAGGCTTCGGGAGAAGAGGGGCTCCA +ACGATGTGGAGGAGAATGTGTTGGGGAGACAGGTGCTGGGCTGGACCGGGGAGCCGCTGG +AGGCCTGGGGGCATTGGAAGCAGGAGGATCCGTGGGTGCTTGGGCCCCTGGCGGAGCGCG +GCAGCTTGTTGGGAGCTGGGAGCAGAGCCACTTACTGTGAGCTCAGAGAGGCTGCCAAGA +GCAGCGACAGAGACCATCGTTCCCTCCAGGCAAAGCCAGATGCTGTGTGGGAAAGGAAAC +GTGGCCGTACGCTGCCACGGAGCTCTAAGGTGTTCGTGTGGGACGGAAGCACTGGTGGAA +AGGCCAGAACCCGTGGGACACACCCTCGAGAGCCGCCGGCAGCACGCTTGGTCCCGGCCT +GGAGACAGGGGCCAGCACAGTCAGGCTCTCTCTGAGCCCAGGGGTGGAGACCTCACTGGG +CTTTACTGTGGTGACCACTGGGGAGCGGGGCCCAGGGGACAAGGTGGGCAGGGGCTGCTG +TTTTCTCGAGTGAACCCTAGAACTACTTGATTTTTCATCTGACAAAGCTAACAGAGGAAA +AGATGAGGCCCATGGATGCATGAGCTCTCTGCCTGGCAGGCAAACATGCCCAGTGCATTT +TCAGGCATTTGCTGAGGGCCCGCTACCCACAGGCTGGAACAGACTCAGCCCGgaaaggcc +caggcaggcggCCGTGGATGCCATCTCCTGTGAGTCGATGGGGTCAGCTGCCTGGGGAAT +CCTGCGGGGGGAAGGCGAGGGAAATGGAGGTGGAGGAGCTGTGGGAAAGGCCAGGGCTGC +TGGGTGCAGGGGTGGGCGGGAAGATGCACCAGCAGCACACGCAGCTTTCTCTAGGCACTG +CTGTGCTCCAAGACCTCCTGTGGCTCCCACTGTCTCATAGCTGTGCCTGGACACCTGCTG +CCCCACCAGGTCTTCCTGTGTCTCCCCTGGCCACAGCCCTTCTTCCTGTCTCTGCAGGTC +CCACCCTGCATTCTTGTAACCTCCCATCACGACTCCCTCCAGCCTCATAATAAGGGCTCA +GATACCTGCCCATCCACATGTGAGATCCCAAAATATCGAACACACACCAGCAAAACTGTG +AGCCGCAAGGAGAGCACTTTGGTCCCACTGGCCTTGCTGGGCAGGGGCAAGAGTGTCTCA +CTGTTCTCGGATGGCAAGGCCGGCATTTAAGTGGacaaaagacctaaatgtaaaagacag +aactataaaatttctagaagatagCATGGAAGAAAAGCTACATAaccttgggtttggtga +tgaATTTTTAGatcaacaccaaaagcatgagctataaaagaaaaaattggtaagttggac +tttattaaaattaaaaactttttctctgcaaaagaagacatttgcaaaacacatatctcc +TAAAGAGTTTATCATTCAAACATACAAAGGACTCTAAAAACtcataggaaaaataaacaa +cccaGTGAGAAATGAGCCAAACATCTGGGCAGACCCCACACCAAAGACAGGCAGATGGCA +AGTAAGCCCCTGAAATATGCACGACAGCCCATGTCATGGCGGAGCTGCAAATTAAAACAC +ACGGAGACACCACCACGTACCCGTCAGCGTGGCCGAAACCCAGGACACGGATAGCACCGA +AGGCTGGCGAGGATGTGGCCACAGGAGTGTGCACCCAGCACTGCTGGAGGCACAGGGTGG +CGCGGCCACTTGGAAGACAGCGTGGCAGTTTCCTACAAACCTAAGCAGGCCATGACCAGA +AAACTCAACGGTCAGGCCCGCAGGAGTTGAAATCCTCCGTCTACACAAAAGCCTGCACAT +GGaggtttatagcagctttattcataatcaccaaaatcACCTGGAAGCAGCtgagatgtc +cttcagtagatggATAGATCCAGACAGTGGAATAtcattcagtgctaaaaagaaatgagc +tgtcaagccaTGAATAGACACGGAGGAAACACAGATGCAAtgactaagtgaaagaagccg +cTTTGAGAAGGCTGCACGCTATAGGTTTCTAACTACacgacattctggaaaaggcacaaC +TATGGAGACAGTAGAAAGATCAGTGGCTGCCACGGGTTAGGGGGAGAGAGGGAtgaacag +gcagagcacagaggatttttagggcagtgaagctCCTCTGGATGAGACTGTAATGCTGGA +TCCATGTCGTTGTACCCATGTCCAAACTCACAGAAGTGTAACACCAAGAATGAgacctaa +tgtaaactgtggaccttaattaataataatgtaccaaGAACGAGCCCTAACGTAAACCGT +GGAccttaattaataataatgtatcaagaATGAGCCCTAATATAAACTGTGGAccttaat +taataataatgtatcaagaACGAGCCCTAACGTAAACCGTGGAccttaattaataataat +gtatcaagaATGAGCCCTAATATAAACTGTGGAccttaattaataataatgtatcaagaA +TGAGCCCTAATATAAACTGTGGAccttaattaataataatgtatcaagaGTGGCTAAACT +ATGACAAATGTATCACACCAATGCCACCTGTTAATAGGGGGAGTGGGGGGTGGAACGGCT +GGGGTGTGGCTGGAGGGAACTTGATACTATCAGCTCAATATTCTGTAAATCTACAACTTT +ACTAAGAAATTTAAGTCTATTCGTTTTCTAAGAAAGGGTGTCCCCGAAGCTGTGGGGGGG +GCACTCCTTTTGGGGTGAGCTGGAGAAGGCCAGGCTGAGGGGACCAGgacagcattccag +gcagagaacgTGCACGGTGGGCAGGCTGAGTCCTGGCGGAGCCCAGGCTGCGGCACCCCT +GGAGGAAGGGCCGGGCGTGCAGAGGCCCAGCAGCCAGTCTCATCCTGACCCACCTATCAA +TTCTGACTCCACGGTGCTGACACTACTGTCCGGCGTCACCAAGATCAGAGCAAATACCAG +TCCCACTTTTCACTGGAAGATAAGAGGGGGAAAGGCGGTTACAGAGGTTTCCACTGCAGC +AAAACCCGAGACAGCAGAAACTGGGGCTGGAGAATTGCCTCCTGCAGCGATACTGAGACT +TAGGAACCTGGGCACcaggagggtgagggagggggGCGTGCACCTACTGTGAGCTGCGTG +GTGTGGGCTGGGACCACTGAGATGCCAGCTGCTGCAGACTCCAGCAGACCACAAAGCCAG +GGGTGCTTTTGGAACATGATAGTGGCACTGGTTACAGCCGGGATGTGGCATCCCCTTTGG +AGTTTTGGATTGGCAACATTTACCATGGGCAGTATCTGGGAGCTTCATTTTGTTGATGCT +TTTTGGGAAGGAGAAAGGCCGGGAGGAAGGCTGGCAAATGGCACAGCCGCTGTGCCGGGA +CGCAGGTGCTAGATGGGCCTTCACACATgggagcccccaccccctgctctAACAGAGCTC +AAGTGCCCCCTAAAAGCACGTGGCCCCTCTGAGGATGCAGAGTTGGGCGGGAGGAGAGCG +CCAGGTGCACGAGTGATACCCAGGGTCTGTGCCACTGGGGTGTGCGGGGCAGAGAACGCG +TCAGCCCCATGGACAGTTGGGTGGGTCCTGGCCACGGGGTCCCTGAGACACAGTGGATGC +TGAGACGGCCACGTCTGACTTCACAGCACACACATGCCACCTCCATGGGACACACGTGCT +CCTCAGGGGCCCAGGGACAGCTCTGGTGGGCAGACAGCAGCCCCGGGCCACCCTCGCCTT +CTCCCCCTGTGATGGTACACAGTAAGAATGAGGAAGTAGTTCCTGACAGCTCCTTCTCAG +GAAGCTTTAACTTCCCACGGCCAGCCCTTGTGTTGCGGATTTAGGTCGAACGCAGCTCTC +CCATTTGTCAGCACCTCTGGCGACAGGGCTGCGCCCCAGGGCTCCTCTCCCTCTGAAGGC +AGGCGGGCCACGCACAGCCACTGGAGCTTCTCCTGGGAGCAGCACTCAGCCAACCCGAGC +CAGTTCCGCCTGAAGAGATTCCCCCACTGTGTGCTGGGTGTGGGCGGTGGGCAAAATCCA +GAGAAGCAGAGACAATGGTGCCTGGCAAGGCCCCAGCCCCGGCTCGGGAGGGCACCCTGC +TTTCTGGGAAGAGATTACTTCCCTAATCACAGTTGGCTCTAACTAATCCTAAAATGAACC +TTCAGATCTTGAGAAAACCAGGATTAAAGACAGAAACCTGGAAGTGGCGCTCACATGGGC +GAGCCCTCGGGGAGGCGTGCTCAGGCAGTCCCGGTTCCAAGACGCTTCACacactccctc +ttcctccctgacCTGAGGTCTCCCAGGCTCTGTGCCGCCAGGGCTGTCCCTCCAGGGGCT +CTGTCCCTCAGGGGGCTCTGAGGCCCAGCCTCCGGCCTGTGCCCTCCCTCCTCACCTCTG +CAGAGTCACCCAAGACCAGTGGCCGCTGGCTCCCCCTTCCTGGGGCCCACCCTGCCCCCC +GAGGCCCATCGGGTCTTGCCTGTCGGGGGCTTTGCTCACTGTGGCCCCTCAGGCAGTCCT +GCCCAGTGGCTCCCACATCCAGTAGGTGGGGAAGGAGTGGTACGGCCCGCTGAGGGCCCC +ATGAGGGCCGGGTTCTAAGGGGAATCTGCCTTCACCGTCTGGTCAGCCCCGTGTCCTCTG +CACCAAACATCTGGGGCTGAATCTGAGGACGGAGCCCGCAGTAGCTGCTGTTCTTCCACA +CTTTGTGTCACCCCCAAAGCTCTTAAAAACAGGCATTTTCAACTTTCCCATTCAGGCTTA +AAGAAACCCTTTCCCAACAAAGAACTCAAACCCTTGGACTTTGGCATGACAGCTCAGCAG +GCGGTGAGCCTGCAGGTTCCCCGATCCACCAGAAAGGAGGAAGCTGCCAGTGCGTCCCTG +GCTCCCGCTCCTTCCCTCTGCCCTAGCCCTGCACAGTCCAGAAGGGGACCCTGGCTCTGT +CCCTCCCCAGGGCTGGCTCCCAGAGCCAGATAGGGGGTCCCGGCTGGGATGGTCCAGCAC +AAAGCCCTCGGGGATGCACTCAAAGGCCGCCCTCCAGGGACCAGGAGCTTGGCACAGGTC +ACCTGGTCTTTCCCTAAGGCAGAGCCTTCCATGGGGAGACATGGGGAGATTTCTCggccc +cccacccctcaccccagaGTCCATGGGGAGATTTCTCGGTCTCCCACCCCAGAGTCCATG +CCATCAGCCTGGAGTCTCTGTCACAGCCCTAACCACCCCCAGCACAGCAGCACAAACGGC +CAGGCCCATTCCCAGGATGTGCCGCTCCCCATTTGTGGAATTCCCACAGCCCCTCCTGCT +CTGCCcgcccctccctccttcctttcagGCCCCTGTGGACGGTGCACACACGGGAACCCC +TTGGGCACCCTGGCTGCTCTCCTGACTCCACCTGGACACGGCCCCAGGCTCCATCTCAAT +TCTTCCTAGACTGACGACACGACACTTTGGAAATGGACTTGACACACAGCCAGCCCCAAG +GGAAGGCTGGCAGTCGGACAGAACAGGGAGCCCAGAGCTCAGGCTTGTAAGGGCACTCGC +CAATGTGAGGGAGCAACCCAGAGCTGAACATGGTCATCACA +>NC_060930.1 Homo sapiens isolate CHM13 chromosome 6, alternate assembly T2T-CHM13v2.0 +cttccaaaagggtgagaaaataaatgtatgttgtttaagccactcggTCTAGTAtacttt +gttataacagccctACCAAACTACTAACAGcaggtacagaaaaaaaaaacttcgaAATCA +TTCTAAAGTTTGATACCAAATTAATATCGAGAGAAATTTTTTACCCCTAAAAGAACTAGA +tgccatgaaaataaatgaatccaagaATAAAAGCTCTTGAAATTTTCAAAAAGGTCCAAA +GACACATGACTTATACAGTCATAATAATGTAGTAACTGACCACCGgtttaaacaaaattg +aaataaggCACAAAAGGCGGATGTGTGTTTGGGGGCAGGCAAGACAGGTAAACCAGGGAG +TGACCATCTTTTATCTCACATAATGGGAGGCTGACAGCTAATGTCTAAAACGGACCACCA +AGAAATGGCAGATTAGAAGAATCTGGAAATGTTGCAGTGGATGGCAGGAGAGAGTGGAAT +GAGTCTGGGGTATGTTGTATAATAGAGTATTTGACCTCTGTCCCTGGTTTCTGGGAGCGA +GTCTTAAATCCTTGGTGTTTTCCGGCAATAGGAGGGTCTTTGTTATTCATGATCCTCTCA +AACCACGCCCTAGTATAGGCCAAGATGACTCAACAGCAGGACTGGCCATTCCAGAAAGAC +CATGGGATTAGAGGGTTAGGGTTTTGAGCAAAGCACCAGCAAACCAACCTCCTGTGGAGA +GGCGGGGCTGCAGATTAGGTTCAGTCCAACACgacttaatcaatcatgcctacgtaactt +atttaatacaaataaaatggcaaaacaacaaaaaaggaagtcCAGAAAAACATTATCATT +CATCCAATAAACCCAATGAGACAACTCAAGGTTACCTTGagttcctctccttccctctgg +cACCCCCTGAATCAAATAATCAGTATCTTTTGTCTGAATCAAAAATCAACTATTCCTCTC +AATCCTACTGTTTCCTCCTGTTGCTCTCCCACTTAAGACCTTCGTCTTCTCCCCTCAATG +CTGCAACAGACGTATAACTGGTAACTCTGCCCCATTTTCTCTCCACTGCAATCCACCCTC +AGCAAATGCCAGAGTTAGTTCTCTAAAATATGGAGCTAATCAATATTATCCCTACCTTTA +AAATAATCTTCTATGAAATCCACTGTTTTGTGGTCTGCACAGCCCACAACCTCCTCCACA +TCCCGTTCAAAGCCTGCCACAGCTAGACCCGTCCACATTGCCTACTTCATCTCCACCACT +CCTCTCCTCTGACATTCCCCACATGAGCCCATTCACCTCTTATGAACCTGCCACATGCTT +GTATTCATGTAATTCAACCTCTTTCCACTAAAGAGAAATTTCCAAGTTTATTAAATCTTT +ACCAATATTTCAAGTCATGCTCAAATGTTATTTTAGTCTCCCTGATCCCTCCTTCTATTA +AACTTCTACTACATAATGTTAATATTCACTGTgttaaattttagatattttatttgtttc +tccttTGAAAACACatctttaatcaattttatatCCCCACTTCTCAAGCTGTGGGATCTG +ACATGCTCATGTCAGGACTGAACTGAATTAGAGGACATCTAGCTGGTATCCGCTGGAGAG +CtgcttgcttggtgtgtggggaaaacTTCACACACACCTGGTATCAGGAGTGTGTACTGA +GTTAGTGGCTGTGTGAACATAGAAAGTAGGAAAAACACTTGGATTTTTTCCTATCTCTTT +ATAAGCAAATAAGCAGATAACCGAAATGGACCCTAAGAtgaaccagacagaagaattagT +AGATAAGAACTTAAAAGAGTCTATaacaaatgttattaaaatatatgtaatcatAATGAA +TAAACAGATGGTTGTTCTACATAGaggaattaaaattataaaattattttttaaaaagaa +atgcaatgcGAATTCTAGAACTGAAAGGTATACtgtctgaaatgaaaaatacactgaTTA +GGCTGCACAGTAGGTAGAAGATATTTGAAGAAACAGTCAGTGAACATGATTATAGATCAA +TATAGTTATAGAAATAGATTTATCTAAAGATATATAGTTCTTTAAagtactggaagaaaa +aaagtctgaaattaaAGTTGTAAAAGGcatttttcaagtaaaaaaaaaaaggttcattgC +AAACAAATCTGTATGACAAGAAATGCTGAAAGAAGTTCTTCAATCTCAAGGGGAAGTGAT +ACCACAAAGCAATTTGGTAGGAGAGTTTATAATGATGAAAGGACAAATTCATCAGAAAGA +TATAACAATCAAAACTGTATACACCTAATACAAGAGCTTCAAAACCCATTAAACAAAAAC +TGATTGATAGGGAGAGATAAATACACAatcatagtttgaggttttaaTATTCCCTTTCAA +TATTAATAACtagatattaaaaaacaaacaaaaaacatagaagATATGAACAGCACTGTT +GGTCATCCTGACCTGACATTTATAAAACTCCTTTTCAGGTGCTCATGGAAtgttcaccaa +gatagaccatatgctgGGCCATAAAGTAAGTCACAGGCAATTCCCAAAGACCGAAATTCC +GAAGATTACAAAGGAATCTTCGTTAGCAATAGAAACACAATATCCAGAAAAGTATCCAGG +TATTTGGAAATtaatacacttctaaataacccaacATTCAAAGTAGAAATTAAGagggaa +acaaaatattttgaaatgaatgataagaaacatttatcaaaatttgtggaatgccACCAA +AGCAGTAACTtaagatcttagagaaaaaatatttaaaattaagaatctaTGTTtccacct +tttttaaaaaaactagaaaaataagggCTAAATAAACTCAAAGTAAAGGGGAAGGAGGGC +AGGAAAAGGAAGCAGAatgacagaaataggaaaaaaataaacagtggaaACCAATAACAT +AagtaaaaagaatttgaaaaaaattaaagccaaaaGTTCTTCACCAACAATTAATGAATT +GATGTTTCAAAAAAACTCtctagaaatgaaacaaaaattatcaatTTCAGTAATGAAAGA +GGGAATAACCATAGATACTAAAGACATTTAAATAGCAATAAAGACAATGAACAGCTTTAT +GCTGATAAATTttacaacttagatgaaatgaattccttgaaagacaagTTACCCAAACTA +AacaagatgaaatagaaaatctcaatatcttcataaagattaaataaattaaattcattA +TCAAAACTTTCCTACAAAGAAAACTCAAACCTAGATGCCTTCACAGATGGATTCCataaa +acatttaaggaagaagaaatatcaagcctatatgaaatatttcaaaaagcaaaagaggaa +tacatcatgatcaagtagggtTTATTCCAACCAAGCAAGGCCAGTTTTTCAAACATCAAT +CACTGTGAATTACCATattaaaagtaaaggaaaaaccGTATGTTACCCTAAATAGATGTC +AAAGAAGCCTTTGATAAAACTCATGATTAAAAACTATTCAcgattaaaaactctcaacaa +actaagaCTACAGAGCATCTCCTCAATCTAATAAAGAACTAtttgagtggggaggatcac +ctAACATCctacttaatggtgaaatacaGAATGCTTTCCCCCCTTTCGAACAGTAACATA +GAAAAGATACCTCTCTTTCCTTGCCTATTCAACACTGTTCTAGAAGTTCTAGCAGTGCAA +TAGGGcgaattaaagaaataaaaagcagaaagatggcaaaggaagaagtaaacatctatt +tgcagatgacatgattgcttATAtaaaaaatcctaagaaatctACTAAGCAACTAATAGC +ACTAATAGCCGAATTTAGCAAAGTCTTAGTATTCAtggtcaatatataaaaatcagttat +ttacatattttagtaggaaatgattagaaaataaaattttttaaattttgaaaatgccat +tataaaaccaaatacctaaaaatacacttaataaaagaaatgtacaagACTTCTACATTA +AAAACTACAATATACTgcagagacaaaacaaagacCTAAATAAGTGAAGATCTATATCAT +GACCATGGATCAGAAGACTCAATGTTGTTAAAGtatcaattctccccaaactgaTTATAA +ATTCATGCAAGCTTATATAGAGATATTGTCAAGGTCATTCTAAAATTCCAGTAGATATTC +GAAGATCTAGCAAGAGCCAAACCAATcttaggaggaagaaaaaagttgTAACACAGTTCA +TGACTTCAAGACTTATTAgaaatctacagtaatcaagacagtgttgtTGACATTAGGATA +AACTAATGGACGAATGAAATAGACTAGAATCCAGAAACAAACACATATGATTATATGAGT +TTTGACAAGGCACCAAAGTaattcaatgggaaaaatattttaatggtgtTGAAAAAACTG +GATagctacataaaaaaaaaaaaaggaatgttaacTGCAACCTCACATcacttacaaaaa +ttatttcaaaatggctcataaacataaaaactaaaattataaactataaagaagataaca +taggagattATCTCCATTACCTGGGCGTAGGTAAAGACTTGTGTTCAATATGACAAACAC +AAGTACAATGAAAAACACTAAATTTTCTGACTTCATCCAAATTAAAATCTTCTGCttatc +aagagaaaataaataggcAACTACTGCCTAGAAGGAAATATTCACAATAGATACAAATGA +CAAAGGACTTTATACAAACAACACATAAAGAACTTTTGCAATCTGATAACAAAGGAAGCA +accctttttttttgagcaaaagaTTTGAGGAGACTCTTCATAAAGGCAGATATATGAACT +CAGTTTTTAATATGGTATGTGACAAAGAAGTGTACTGGtagatttatgtgtgtgtgcaag +tgtgtatTTTCTAGCTTTGTACATTGAGAGAGGCTAGAAGCAATAATACAACAGTAGCGA +TGAGCATATCTAACTCCCAAATACCATTTTTCAATGAAAGGAACCAGTgaccttggagaa +atggctgatgcagggctgaggcagggcaaGGACAAGGTAAGCCTGAAAGATTCTGCTGTA +CCAGTAAGGAAGTGTATGTCAaaaggccacagagccagactgaAGCAGTGCCCACTGTCC +AAACCAGACAATCTGAGAACcaaaaattagtattttcttGACCTTGACATTTTCAAAGAG +TACAGGTTATTTTATGGAATGCCTATCAATTTGGCTCTGTCTGATCATCCCTGTTGATTT +GATTTGGCTTATGTATCTTTCACAGGGACTTCACAGATCCTTCTCAGTGATTCATATCAA +GAAAGGCTCCTCATGTTTGTCTGTTTCAACTTTGGATTAGACAGTATGGtaccaatattt +tatttcctgattttggtaaCTGTATTATAATATAAGAGAATGTCCTTATTCTTAATAACT +acatactgaagtatttaggagTCAAGGAATGATGCCTCATCCCACTTTCAAATGGTTCAC +AAAAACATAGACAGATGGACAGAATGATACAGAAAttggggaaaaaggaaacaactGGTG +GGCGTGGTTAAAGGGCTTCCTGGAGTTACTAGTCACCAAAATGAAGGAAGTAAGTAAGGG +GTTTATAGGAGTTACTTTTACTATTCTGGAAAGTTTTCTATAAGTTTGAAgttatagcaa +aataaaaagttatcaaATAATGCTttggtaatattttgaaattaaacacAAACACATCCC +ATTAACATTAGCCTGCTAAGCTACACAACATATTAGGCTCATTGTTCCTGAAAAttgaaa +gatatttattttcacatttgacATCAGCAAAATGCACAAATAAGCAATGAATAAACTGAT +ATTACATAAAGATACTAGGTAATTTAATAGTTACgtttatataaaattgtatgtttcaga +attattattttactggAATACACTATTGCTACCTCTTTAAACATGCTTCTAAACGCAGAC +AAAAGTGTGGAAAGCTTGTTTTGACAATGTGCTAGAAAACTATTATAAACTGATAAACAT +GAGATTTAGTATGGTagcatattaataaaaattataggaCAGCAAAGGCATATTTCAACA +CAAAGTTCTTCAACAACTGCTTCAATAAACAGACATCATGTTGCTCCAAAGATACCAAAA +CACTGCAGGGAGagcaaatattaagaaaaatgtggATAATTAACCCACCACATTAATTAA +TGCTTACAAACCAATTTGTGAGAGGAAAATACTTTCTTCAATTGGCATGGAAAATTAGGC +TCCACTGAGTGGTGATTCAATTATTTTCTTGACACTATTAAGGTATGTCCTCAGTATTAC +AGCACAAATTAAATAAGCATGTGGTTAAAAGTGAGTACTTTCAGATTCTGGTCTAGATCA +CATAAAGAACCaaatttttaagtagaaatatGCTGCTCTCCTTGTTTCCAGAAAAACAGT +AGTATTAaaacttaatgaaaataattaccGTTGACATTAATGTTACTGAAAAGATGATTA +GTACAAACATCAGACTGTCAGAGATCCTCAGCGGTTTTGATTATCAGCAGGGGTGGTATT +TCACAGAATCAGAGCCAAAGGAGAGCTGACACAACTGGTATCTAGTCTCTTCACCTGAAG +ACACTGTAACCTAGAGATGCTGAGTGTCTTTTTCAAGAGCACACACCTGATGAGTTGTCA +AACAGACCAGATTCCTGGTGACCGGATCTGTAAGAGTCTAGTATCCTCTTCCTTCTGTAC +CACCATATGTCCTGTGAGGTCATTTGTGAATGTGACCGCTCGCATTCTAATAACCTTCAT +TGTGTCTCCAGTGACTGGGGCTCTGGCTCACTCTGGTGTGAAACATAACTGCAATTAGAA +TACCTCTGGTCTCAAAGAACGCAAAACTAAAAAACTAGGACAGGGCAATTCCAATTTACT +CCCACTATTTCAAATCCATTTTGAGGTCATTTACACAGGGCTCTTAATCTTAACTATGTT +ACCCTCAAAATCTGTCCAACTAAAAGTAATGTCTGGTCATAAAAGGTAATGTCTGGGCCA +CCATGGATAGCCATGAATCAAAAAGTCTGATCTACTTTCTTATTTATGACTGAAGAGTAC +AGGCAGGTGTCTTCCAGACGCACAAAGCAGACAACTGAAAAGCCAACAGGCATTACACTG +GTTCATTTGCAACAATCGTATTTCCTTACCATGAAGAATTACCTACATATATCCAAACCA +GAACAGACCATTATGCCAGGAAGACCTGtcatttaatttacaaatataagAACATATCTG +CTTTTCACACTGCAGTATCCGTAGCACATCCAACAGTGCCTGCGACATAATATACACTCA +GTAATTTGTGAATGAACTATAGGAAGAGATGTCTCTTCTCAACCTGCCTTCAGTTAAAAA +CATACTACAAGATAGTATGTTCTTATGTTTGTTGATATGTTCTTATCAATAAGTAATGCT +CTTATGTTTAAAAtctctaataaaagaaataatttcttatcaCTCTCAGGAAAGAGTCTA +AGGCTTTAAGGAAACAGAATTCAGCTTCTGAACATTTTCAGTTTGACGATCCATGCCAGA +CTCCCTTGAGTTTAAAGGAACGCTCTAGTCTACAGTTGTCATTGTCTACAAATTTTCCTC +ACAAATATTCCAATTGCCATAAAACAATGACATCAAAAATGTGTCATAAGCTCTTTCTTA +TATAAATACACTAAACGGAGGTCAACAAAAGTCTGACTTTGCCTGTCATAAACCTCATTT +GTTTAACTAAAGCAATATATAGTCTTTTAACTTCATAGCCATTTAAGACAATTAAGAAAG +CACTAAGGAATAAAGTGAATAAGCCTATCCTAAAAGCACATaccacaaacttttaaaaac +tctttttttttttttttttttttgagacaaggtatcactctgtcaaccaggctggagagc +agtagcgtgaccacggctcactgcagcctcgaactcctgggctcaagcaatccttccacc +tcagccttacaagtagctgggaccacaggcatgcaccaccatgcctgcctaatttttgtt +atattttttttttaatagagacagggtcttgctcttgaactcctaggctcaagcaatctg +cccacttccgcctcccaacgtgctgggattacaggcatgagccactgcactgggccctaA +CTCTTTTCTTTGTAAGAGACGGAGCCTCGTTGTGTTTCCCATGCTGGAGGGCCGTGGAAA +TTCACAGGTGCGATCAGGGTGCATTACTGCCTCCAACTTCTggcttccagtgatcctcct +tcctcagcctccagagtagctggaactacaggcccgcaccactgtgcccggccacaaacT +AATTTTATCTTTGGAAAGCATAGGGATAAAGAGGTATAACAGCTATTATTACTCATGTAA +GGAAAGTTAATACAGATGAGAATCAGGAACTTTTATTAGGTCAGATTCTGGTACAAGAAA +ACTAATAATATACAAAGTACTAAATAATGCAAATGGGCAAATAATAAACGTTGGGGGAAT +GGGAGTACTTACTGGGAActtcacatatatacacaggtATATAAGATGGGCTACAAATTA +TTACTTACTGGCTCCTAGCCTAAGAACCACACTACACACTTACGTACTATCCATTACCAA +AGAGAATTACtggtttgcttaaaaaaaaatcataattctgATGTGTTTCCAGACTCATGT +TAATTCACCAAGTATTTCTCAAATGCCTGGACCCGAATGGGGATAACCAGAACTAGGAGG +GTCCTTATGGAAATTAACCGTGGAAAGAGACACTTGTCTGATTTCTTTTGATAATGGCAA +CCTATTCACtgaataaatatacacacaagagtaatttctttttagcagtaaaatgtttaa +aaagtacaaGTCTGTCATATGAATAAGCCAGTTTAGCTTTCAGCAAATGGTATCTAGTGG +GACAATAAATTCTGGATATAAGAAAGCACTTTAATACATTTTCCAATGATTTATTTTCTA +CAGATACAGTGAAACATAAAAGGCATAGTGTTTTCTTGCTTCTCAGTAGTCTCCCTATGA +GAAACAATGGAAGATGCTTAAATAATTTGTAAACTTGAgactttgactttttttaatgta +agactTTATTTTCATTGAATTATCATTTTGTGTGGCAAATAAATTCCTTCCTGCCTGCAA +GAGCAAAGGACATCTTCAAACAAGGACAAAATGATAATGCCCCTCCAAAAggtttgagat +tttttaaatttaaattttatctttatagaTTAAGTAAAACAATCATATGGTACTCTAGAT +TTATTGTAATGAACAAAAGTATATCCAAGCTGTAAGTCTATTGAAACATTTATGAACAGT +CTGGAGACTGGGTTCTAAACTGAGTTCTGGCATTAGGAAATAAAAACGCTTGTTCACTTT +TACGCACTGTGAAACGTTTCTTATCTATAAACAAGATGATTGGATGAGATCAGCTCTAAG +GCATCTCTGAGCTCTTGTTCCTAGGAGAGTCCTTTACAAAGCTTTTAAATTCAGCAACTA +ATGCATGACTATAGAAACGGGCACTCTCTAGTTTTTCacaattaaactaaaaactttaat +aatagcttgctattcattttaaaatttctgtattgTAAAACGTTTTTACTGTATAATTAC +ACAATATTAGttaaaacattatatttagaTGGTCTATTGATGTTTAATATTATAGGCAAC +GTATCTCTGCAGATTAGGGAATAACCTAAGTAGAAgaataaattatcttttccattttca +aaagctACATTACAAAACTAGGCTATAAAACTTTTGATAGATACTCCCTGTTAATGAATT +ATTAAAAGTAAACCATAATAATTCATGAAAGACTAAactgtaaaattatttatgttcTAA +AACAAACTAttagatttttcatttctgttggtaTTATTAAG +>NC_060931.1 Homo sapiens isolate CHM13 chromosome 7, alternate assembly T2T-CHM13v2.0 +TCAGCTCTGAGTCAGTttcaattgattgatttttctcctttcaagAGTCAGACTTTCCTG +CATCTTTATATGGCTGTTATTTTTGTTGGGTGCCACACATTGTAAAATTTGCTTTGTTGG +TAACATGGTCCACACTTGAGGCTAGACCTTCTGAATAATCTCCCCCATTCCATGAATCCT +GAGATGTTCCAGTTTGGCAGATAAAAACAGCCTCAATTCCTGACTCTGTGTGTGCTACAT +ACTGTTCCCTCTAATAATTTCAGGTAGGTTTTCTTCCCCTTGCCTTGAACACCCAAGCAC +CAATCCATCCTCTCTTAAATATTTAAGGACCATACACAATTTTATGGAGTTTCCTTTCAT +GCAATTATGTGTCCTAAGAACTCAGCCACTGTGGTCTCCCCACACTCTCTGCTGTATCTC +CTCCACACAGGGGGTCTGCTGGGCTCCATCTCATTTCCCGCTCCCTACCTCACAGCCCAG +AAAGTGTCCCCAGGCAGTGACTATAGAAGATGAGGATTCTTCAGGGCTTGTCTCATTGCT +TCCCTTCTCTCTGGGATCACCACCCTTCACTTTCTGGTGCCCAGTTTCTTGAAGACCatg +atttcatatattttgtctgtttttaggTTGTTTCTGGTAGGAGGGTAAATCTGGTCCTCT +TGTCAATGCATCTTGGTGACACAAGTTCTCACATATAGATTTAGTTGTGTAGAAGAAATA +TGGTTGCTCTAGTTTTCTGTAACTCAATGATCTCAGGGCCAAGGGTTACACCTATTCTAT +TTCCTCCCATCTTCCCAGCACCTAGAGCAGTACTTgctacatagtaggtgctcagtaaat +gatcAACCCACTGTGTGACTGAGAGTTTTCTCCCTCATTtaatttccctccttttctcct +gttaTACGTGTGTAATGGAACGGCCCTCAGGGTGTTGGGACCCTGGCCAGGGGTAACAGA +CAGAGGTGTTGGGGCCCTGGCCAGGGCGAGCAGATAGGACAGGGGAGATAGAAGCAGTGA +GATAAGCTCACCCACTGCCAGGGCTGTGGGTACAGATCAGGCAACGGCTGTGAGGACATG +GGGAGGGGGGTATGGAGGAAGAGGATAAACCCCACCCAGGTGTATTAGGGGAGGGGGCTT +CTCAAGGGAGTCCAGGCCTGTGAGAAGGAGGCAGAGGACTTAGCCAGgggcaaaggaaga +gaaaagacagcAGACCCATCAGCACATGGCCCCCACGAGAAGCCATCAGGTGAGCCAATG +ATTCCATATGCTCCAGCCTCATGTGAATGATGACATTTAACAGCATGGACATGGTATGCT +CTGctgtgtttttgtgtttcttgaCATGCAGCTTACATGAAGTGCACAAATCTCAAGTGT +GCAGCTCAGGGTGGGACCCAACGTGGCACTGAGGGGCCATAGGGGTGGGAGATGAGGGGC +TTCTGCTCCCAGGGCCAGGGTGGGACACCCGTCTCGAAGGAGCAGGAAACAGATGGGCTG +ACCACAGTGGCATCAGCCCCTGGAGCAGGCACCCAGCGTCTGCAAAGAAGGGGTGGAGGA +TCCGGAAGTGAGGTCAACCTAGAACCCCCTGTCACAGCCCCACCCAGGCCCAGCAAGACC +ACCTCCAGCCCAGCCACACTCCAAGTGCCCCCATCAGCACAGTGAGGACAGCAAGTCCAA +GGCcgggcacacacacaaaaaaaagccGAGGGGAGCAGGGCTGGGCGGGCCCCTGGGGAT +CCTCCCTCTCCTGGGCTCAGCAGAAAGCATGGGCATGAGGCTTCCGTCCACACTCCACTC +ACCCCAGCCTGACCCTCCTGCCAGGGATACAGAGAACTCTGGCCAAGTCCAAGCCAAGGG +CTCATGCCTGGGGTGAAGGAGGGTGGGTCAGAGACTCTTtgccaaaaaaaccccacagaa +tgAGCAAAGCAATGTTGGGGGGCAGTGGTGGCCTCCCCAAGATGTGTGCAAGGCAGGCAG +GTGCATTCTGCCACCTCAGTGGCCAGGAGCAAGTCTcacagcctctctgggcctcaattt +ccctcTCTGTAGAGGACGATGGTGAGACAGTTCCATCCACAGGTGCGTGGGAAGGGCAGG +CCTGCAGGATGGACAAGGGTGGGCGAGGTTATGGGCCTCACTCTCTGAATCCTGGAACAC +CATCCTTGGGGTCCCGTGCACACTCTCTCCCACCGAGGGACTTAGAAATGTTGACAAGGG +AATGTCTGAGCAGTTTAAAGGGGACAGCAGTGGCCggcagggatgggggtggggaggggt +ggggaggcccAGCAACGTTGAAGACGTCACAGTGCCACTGGAGGAAGCGGGTCCTCACAC +CTGCAGAGGAGACAGATACCGTGAGCTTTCGAGGATGCCAGTTCCCTGTGATGCCGGCCT +CAGGGCCACACTGTGCTGGGTGGCTCAGGAAAAAGGCCTCAGGGAGCACAGAATGCACCG +TGCAATGGTTCCTTAAAAAGGTCAATAGGCCTCGGCCCCAGCCCATCGATCTCACTCCTG +GATATCTGACCGAGACAAACGAAGACAGCCACAAAAACAGCCACAGGAGAATGTTTATAG +GAGCTTTCAGGTAGGAGGTGGGCCTCAGACACTGGACCAGATGGAGGACTAACTAAAACA +GGGCCAGAGGAGAAGCAGCTTTCCACAGAAACCTCCACCAACGTGCCACATCAATTTACC +ATTGCGATGGCAACACCTGGGAGTCACCGTGcttttccatggcaatgacccagtGAGCCA +AAAGTTCCTACCCCTTCCCTAGAAAGGTCTGCATAAACGGCCTTTTCATCTGGGTGACAT +TAAATGTGGATATAAACATGGctgcaaaactgccctgagctgctactctctACTTGCGGG +GTACCCCTGCTCTGCAGAAGCAGCCGCGGAGCTCTAACACTGCCGCTTCCATAAAGCTGT +TTTATTCTCCCTACCACCAGCtgacccttgaattctttcctaggTGGAGCCAAGAACCCT +CACAGGCTAAGCCCCACATTGGGGTTCACCCGTCCTGCATCAGCTTCGCTTACGGGAGCC +AAAGCCAGGAAAAAACACACGTCTGACAACAGGAGAACACGTTCATACACCAGATGAGCA +CAGGAGAAATCACCCGACAAGAGCACGCGTTCATACACTAGATGAGCACAGGAAAAATTA +CCCAACAGGAGAACGTGTTCATACACTAGATGAGCACAGGAGAAATTACCTGACAGGAGA +ATGAGTTCATATACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAACCCATTCATAC +ACTAGATGAGCACAGGATGAAATTACCCAACAGGAGAACGCGTTCATACACTAGATGAGC +ACAGGGTGAAATTACCCAACCGGAGAACCCGTTCATACACTAGATGAGCACAGGATGAAA +TTACCCAACAGGAGAACCCGTTCATACACTAGATGAGCACAGGATGAAATTACCCAACAG +GAGAACGAGTCCATACACTAGATGAGCACAGGGTGAAATTACCCAACAGGAGAACGCGTT +CATACACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAATGCATTCATACACTAGAT +GAGCACAGGGTGAAATTACCCGACAGAAGAACGAGTTCATACACTAGATGAGCACAGGGT +GAAATTACCCGACAGGAGAACGCGTTCATACACTAGATGACCACAGGAGAAATTACCCGA +GAGGAGAACGTGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAACGAG +TTCATACACTAGATGAGCACAGGGTGAAATTACCCGACAGGAGAACGCGTTCATACACTA +GATGAGCACAGGAGAAATTACCCAACAGGAGAACGTGTTCATACACTAGATGAGCACAGG +AGAAATTACCCAACAGGAGAACGCGTTCATACACTAGATGAGCACAGGAGAAATTACCCA +ACAGGAGAACGAGTTCATACACTAGATGAGCACAGGGTGAAATTACCCGACAGGAGAACA +CGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAACAAGTTCATACACT +AGATGAGCACAGGGTGAAATTACCCGACAGGAGAACGCGTTCATACACTAGATGAGCACA +GGAGAAATTACCCAACAGGAGAACGCGTTCATACACTAGATGAGCACAGGAGAAATTACC +CAACAGGAGAACGCGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAAC +GAGTTCATACACTAGATGAGCACAGGGTGAAATTACCCGACAGGAGAACGCGTTCATACA +CTAGATGAGCACAGGGTGAAATTACCCAACAGGAGAAGGCGTTCATACACTAGATGAGCA +CAGGAGAAATTACCCAACAGGAGAACGCGTTCATACACTAGATGAGCACAGGAGAAATTA +CCCAACAGGAGAACGAGTTCATACACTAGATGAGCACAGGGTGAAATTACCCGACAGGAG +AACGAGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGGAGAAAGCGTTCATA +CACTAGATGAGCCCAGGGTGAAATTACCCGACAGGAGAACGAGTTCATACACTAGATGAG +CACAGGAGAAATTACCCAACAGGAGAACGAGTTCATACACTAGATGAGCACAGGAGAAAT +TACCCAACAGGAGAACCCGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGGA +GAACGCGTTCATACACTAGATGAGCACAGGGTGAAATTACCCAACAGGAGAACGAGTTCA +TACACTAGATGAGCACAGGAGAAATTACCCGACAGGAGAACGCGTTCATACACTAGATGA +GCACAGGAGAAATTACCCGACAGGAGAACGAGTTCATACACTAGATGAGCACAGGGTGAA +ATTACCCAACAGGAGAACCCGTTCATACACTAGATGAGCACAGGGTGAAATTACCCAACA +GGAGAACGAGTTCATACACTAGATGAGCATAGGGTGAAATTACCCGACAGGAGAACGAGT +TCATACACTAGATGAGCACAGGTGAAATTACCCAACAGGAGAACATGTTCATACACTAGA +TGAGCACAGGGTGAAATTACCCGACAGGAGAACGCGTTCATACACTAGATGAGCACAGGA +GAAATTACCCAACAGGAGAACGCGTTCATACACTAGATGAGCACAGGAGAAATTACCCAA +CAGGAGAACGAGTTCATACACTAGATGAGCACAGGAGAAATTACCCAACAGAAGAACAAG +TTCATACACAGGATGGAGCGCAGGATGGAATCACCACTCAGCGAGAGAAGGAAGCCAGCC +ACGACACATCAACAATGAGTCCCAGAAGCAGCACCCTGCGTGAAGAGCCAGGCGCACAGA +CATGAAATCCTAGCACAAGCAAAACCGGCCAAGCTAAAACTCAGCTCAGTGTTGCTTTGG +GAGGGCCGGTGCCGGGGACAGGTCGCCGGGAACCTCTGGGGGACATACATGTTCTGCCTC +AGTAGGCTTATGTTGAAACCAGCTGAACGGTACAGCTAAGATCTGAACTCTCTGCTGCAT +CCAAATTCCACTTCCAGAAAAGACTGCcaaggaaatgaatgaaatcaaaaatcaaaagcc +TCACAAAAGTAATCAATGGGTAGAAGTGGGGATGACAGCCACCCTGAGTCAGGGAAGGGG +CAGGCGGGCTCTGGGTGCTGGCTGTGTTCTGTTTCCCGGCGTGGTGCTCCCTCCTTGGAC +AGGCTCACTTTGTAGTGAAAGGATTGTGCTGTGCATCTGAGATGTGTGTGGTTTTCCACA +CGCGTGCGATATGTGGATATTCAAAACCACAGAATTTAAAAGTAGGTTCTGCCTAGACTG +GGAGCCACGTATGTCCAGGGTGGAGGCCACACAGCCCCCTGGCCCACAGCACCCTCCTGG +CCGTGGCCATGCCCCTTCACCACCCCAGGACCACACTATTGACCTGAGTGCAGCTCCCTG +AGCGGTGACGGGGGAGTCCACCTGCTGAGGGAAGTGAGGGGAGTCTGTGGGACGCCCAGC +TCTCCAAGGCATGGCAGGAGCTCCGGACTTGCTTTCGCTTCCCGCCTCTCAGGCCCTGGG +CCTGAACCCCCACACCCCCCATGGAGGGGCTGTTCCCCTCTGAGGCCGAGCCTGGCCCCC +CCAGAGCATCTGTCTCTGAGTCTGTGCCTGTCCCTCTGCGAAGGTGAAGTCCAGACAGCT +TTGAAGCCCCCATGCTCCCATCCTCGGGGTGGCCCGGGACCAAAGACGAGGCAGGAGCCA +GCTGTCAGAGTCTCTGGAACCCAGCAGGAGAGGGTAAGGGCTGGACTACCAGCTGGTGTT +TTGAAAGAATGAAGACCTGCAGCTCCAGGGGGAGGGCCTGGCCTGGCCAGCCGCCGAGCC +TCCACCCCCTCACCAGAAACCCCTTGGGCTGCGGGCCACCGCCtgactctccctccctcc +tccagacCACCCTGGTACTCACTCAACCTGCCTTCGCCAACAGCTGGGGGCGGGGAATCT +TTTGCATGACCGGCCCTGGGCCTGACTCCTCTGGTGCAGGAAGAACCAGATCCAGCAAGG +GGGTCCTCCCATCCCTGGTGGGGCCAAACCTTCTCCAACAAGCCCTCAGACAGAGCAGTG +TACGGAGGCTTCCTTTGAATGTCGAGGTTTTCCAAAGATCAAAACAGAAAGCAAGGTATT +TTGGAAACACCTCATGTGCCAACTAATTAAGTGTCTGGCTGTTAGCAAGCCCCTCACAGA +GGAGGGAAGAGCCAGCCGGATCCTCAGCCACCCTCCATAGAAGTCAGATAAGGAGAGAGT +TTCTCATCAGAAAAGTACAggcaagaaaaccaaaaatagacaaatggaattgcaTCAAAC +CTAGGAGTCTCTGCACAGCGACGgaagcaatcaacagagtgaaaagggaaacccacagag +tgggagaaaatatttgcaaaccgtctatctgataaggggttaatctccagaataaataaa +gaactcttacaactcagcaacaccaacaaaaccaaacaacacgatttaaaaaatgggcca +aggacttgggtagacatttctccaaagaagacagacaaatggcCACCAACatctgaaaag +atgttcaacacctCTCATCAgtggggaaatgaaaatcaaaaccacagttagaTATTGAGA +GCTCCATAGATAAGATTTCCACATGATCCAGGAATTGCACTGTTGGGGACACACCCAACA +GAATCGAAGGCAGGATCTTGGAGAGATGGTTGGACACCCCTGATCTTGGAGAGACGGTTG +GACAGCCCTAATCTTGGAGAGACAGTCGGACAGCCCTGATCTTGGAGAGACAGTCGGACA +GCCCTGATCTTGGAGAGACGGTAGGACAGCCCTGATCTTGGAGAGACGGTCAGACAACGC +TGATCTTGGAGAGATGGTCAGACAACCCTGATCTTGGAGAGATGGTCGGACACCCCTGTT +CACAGCTGCATGATTCACAATGTAACCCCAGAGTCCATCAAGGCATGAGTGGGGAAGTGC +AATGTGGTCCGTCCACATGGTGGGAAAATTTTCAGCCTTAAACAGGAAGGAAGTTCCAAC +CCCTGCTACAGCCTGGAGGGGCCTTGAGGACGTCatactcagtgaaataagccagactct +GAAGGACAAATACCGTCTAATTCCACTTATATCAGGTAGTAGAGAAATTCACATAATAGA +GacagagagtggaatggtgggtgccagaggctggggtgagaggaatGGGGAGTCcatgtt +taatggggacagagttcaGTTTTGGAAGGTGAGAAAGTTCTCAAAATCTGTTGCATAATC +ATGTCGACATATTTAACACTACTCACCCATATGCTTAAAATGGCTAAGGTAGTAAATTGT +ATGATATGTGTTTTTACCACAAAAATAAAGagagggagacacagagagagaaatagagag +attCTCCTCCCACATCCTGAAACCTGAATTTTCACAAAGGGTCCTGACCATCACAAGAAT +AAGGCTGTACACTCGTGGTGCCCGCAGCCACCCTACTGACTTGGATGGCTGCAGAGTGGG +CACAAGATTGGGGGGTTGGGGGATACCGCATCAGGACCGCTCCCCACACCCAAGGCTGTG +GCTGCCCCTCCCTGAGCTTCTTCATCTCTCCTCAAAAACCTGACAACTGCACCCTCTGCT +TCACGGAGGGCAACCAGTAAGGGCTAATGAGACGGGGACTCACTGTATGAACCGAGGGTG +GCAGCTGAGGCAACTGTGGTCAGAGAGAAGAAACGTCCTGACCCCAGTGGCCCAGGGCTT +GTTACCAACAGAACCACAGCTGGAGCTCAagcctccttcctccctgctaACAGGTCTCAA +AAAAACTGCCaaacattcatccatccacccacccatccatccaccatccacccaccCGTC +TATGCACCCACCCagtcatccatctatccattcatccacccatctatccacaacccatcc +atccacccatctatccacccacccacccatccatccatctatccacctacccatccatcc +atctatctatccacccacccacccatccatctatccattcatccatccatctatccacaa +cccatccatccatccatctatccacccacccacctatccatccatctatccacccatcca +cccatccatctatccattcatccatccatctaaccACAACCCATtcatccaccatccacc +caccatccaccatccatccatctgtctatccacctatccacccatccatctatccattca +cccatccatccacccacccattcatgaAACAAATATTCATCATATGCTTCTGTGCTGGAA +GCATAGAGAGGATGAGACCAGAAATGCCCCTGCCCTTCTGGCACTCACAGCCTAGGTGGG +GAAGATGAATACATGGTAGGTAGATAGGCAAGTGACAAAAACAATACCAACCAGGTTACT +AGGATCTCAGGAGAAGGCAGCAGtcattttacaaaagtaaaataggATACAGGAGTGGTG +AGTGGTGGGGacagcagtgggggtgggggagtccCCTGTTGGGAGGGGACCCTGGAGCTG +CTACCTGCAGCACCGGCAGCtgtggggatggagggaggaagctCCCACCTGGGGAAAAGG +CTTCGGccagggaggcaggcagaggacAGCACCTGTGGCTGGAACAGGAAGGGCGAGGGA +GGCGCTAGGTGGGAAGAAGGGCTGTGGAAGCCCCTGGAGAGTCAGAAGGAGACACCGCCA +GGCCCTGCTCTGCACCACGCGTGGGGCGAGGGAGGGGAGCCGCCCCTTATCTAGGGTTCG +ATGAACAACGTGATCCCGGGTTCAGTGGCAGCAGCTCAGGCCAGACTTTGTATCCTCCAT +CGTACTGACTCCTCCCACACCCCTTCCAGGGTCTGTCCACCCAGACATGAGACATGGGGG +GTATCCAGGGCCTTCGCTCTGTGCTGGAGGAGGCACGGGGAGACCTGAAGGCTTTGAAGG +CCCCAAGATGAATCCCTTTACCTCAACTAATCCGGGCTCAAAGGCAGCCCTGCCCCCAGA +AGGGTGGCCCTGGCAGGGTTGTGGGAGCCCTCACCTGGAGAAGGGGCCGCCGGGCCGGCT +AATCCCCACCAGACGATTAGGGCCTGATCAGGTTTCCTGACCGACCACTGAGGCCCGGCT +TTCCCAGGGCCCGGATGTGTGCGGGACCTCGGAAGACCAAGGTGCTCTCAGGGTCATTCA +GACCGTGCTAAGTGCAAAGAAAAGGGAGATGGCTCCGAGTGTCCAAAGGGTAATGATCTG +GGATTAGCACCACAGCCCAGCTGGCTCACTCTGCCCGCCTGCTCCCCGCCCGGCCCACCT +CGCCCCGGCCCCACTCAGCCCCGCCAGGACCTTGGCTGGGGGACCCTGCTGTTCTCTGGG +CCCCTCCAGCCTCCCCCTCCCTAACAGAGCCTCGTCATGGA +>NC_060932.1 Homo sapiens isolate CHM13 chromosome 8, alternate assembly T2T-CHM13v2.0 +CATACGTCCACACCAGGCCACACAAGAACATGTGCATGGATTCTCATAGCAATGTTACTG +ACAATAGCTAAAAAGGAGAAACAACCAAacattcatcaactgatgaatggagaaacaaaa +tgtggtctattcatacaatggaatattattcagccttaaaaaagaaagttagttctgacc +catgctacaacatgaatgaacctttaaaaaattatgctacATGAAAAAACCCAGACACAA +AGGGTCATAtgttgcatgattccatttatatgacatgtcCAGAACAGACAAATctataaa +gaaaacagattagtggtttccagaggctggaGGGACTGGGGAATGGGGGCTGAGTGGTTA +CGGgataatgagttttttttttgttttttttttttttttttttttttttttttgagacag +ggtctcactgcattgtctaggctggagtgcagtggcacagtcttggctcactgaagtctt +gtcttctcaggctcaagtgaccctcccacctcagcctcttgagtagctgcgaTATAGGTG +TACatcatcatacctggctaatttttgtactttttgctagagatgggtgactcgccatgt +tgcccaggctggtctccaactcctaagctcaagtgatccacccacctcagcctcccaaag +tgctgtgataacagggtgagccactttgcccggccAAGTGTTTCTTTTTGGTGTGGTaag +aatattctggaattagatggTGGTAATGGAATGGTTGTACAACAGTGTCAATATACTAAA +AAGCAGTAAATTGTATACTTTGAATTGGTTGATTTGAAATGGTAAATTTGAGGTTACCTT +TCTGGGGTGCAGCCTTATCTATCTCTGCCCTTGTGACACGACCTGATCATCACAAATTCC +CTTTTAAGCCAGGGCCAAGTGGTTTTGGTTGCTTGTAATTGAAGGGTCTAAATTGTCCAA +GCAACTGACCCAAGGGCATCAGACTTGACAGACCAGAGTCTGAACCCTCAGAAATCACAT +GTGAGACCATGTCACCGAGGGAACCGAAGCAGGGGCAGCATCTGCACCCTCACCCTGGGG +GGTTCAGCCCTCAAGGGCCATAGCCTGTTTCTCCGTGTGCCCACCAATCCTGATTCTGTA +TTGGCACCTCCACCTGGACACGGCTCCAACTGTTCAGCAAAAGGCTCGTGCACCCAACCT +TCTCATTTGCTCCctggaaaaataatcttttaccCTTTGAGACTAGGTCAACTCACATCa +gtattttgacttttaattCAACATCTTCATATTAAAGAGTATATTACAGATGCCACTGAA +ACGAAGTGGCTGAATGCTGAAGCTTTGTGAAAAGACGTCACCCAAAGGATCACCAAAAAC +TTCAAAGGCCAAGTGCTTTGTCAGACTCAAATGGACCCAGCCACTTAAAAGTGAAAAGCC +AATCACTTTAGGCAAGAAAATATATATCTTCTAGAATGAAACTGGCCTGGAATTTACAga +tattattttttcacttaggaatgatccatcatccatccatgcatACAGCTTCAACTGCCC +CACCTAATTTCATCTTCCTACCACCAGATATGTTACTGGTAAACAATCACCGTTAAAACT +TTAGGTAGGttagaacaaagaaaaagtaaatcgaccttaaaaatacaattttaaaaaaga +ttaaaaatgttgGTTCagtaaaattcagagaaaaacaggaaatgttAGGGATGCCCTGCT +TCTTGTAAGGCATAACAGTGCACATGCTCCCCATTATCATCACCGTCAGAGCCGTACATT +CTTATAATCAATAAACCTACGCTGACACACGTTGCCACCCCGGTCTGCAGTTTACATTGC +GGTTCACTCTCGTACATCCTGTGAGTTGAAGCAAACGCAGAATGAGATGCGCCCACCATG +ACAGCATCGTACAGGGCAGTTTCACCGTCGTGCAAATCCTCTGGGCTCCACCTGCTCCTC +CCAGTCCTCGGCATCATACAGGGCAGTTTCACCGTCCTGCAAGTCCTCTGGGCTCCACCT +GCTCCTCCCAGTCCTCGGCATCGTACGGGGCGGTTTCACCGTCCTGCAAGTCCTCTGGGC +TCCACCTGCTCCTCCCAGTCCTTGGCATCGTACGGGGCGGTTTCACTGTCCTGCAAGTCC +TCTGGGCTCCACCTGCTCCTTCCAGTCCTCGGCATCGTACGGGGCGGTTTCACCGTCCTG +CAAGGCCCCTGGGCTCCACCTGCTCCTCCCAGTCCTCGGCAGTCACTGATCTTTTTCGGG +TCTCCTCagttttgcttttccacagtGTTACAGAGTTGGAATTGCAatgtgtagcctttt +cagatcggtttctttcacttactaaTAAGCATTTAAGGTCCcatcatgtcttttcatggc +ttgacagttcatttctttttagccctGAATAATTTTCcgttgtctggatgtaccacaatt +tgcttattcattcacttactgaaggacatcttcGTTGCTTCCAAGTTtcggcagttatga +ataaagctgctataaacatccatgtgcaggtttattgACGTTTTCCATCTATTTGGATAA +ATGTCAAGGGGCATAACTGCTGGATCCTACAGGTAAGAGTATGTTCAGTTGTGTAAGAAA +CTAcccaactgtcttccaaagtggctgccctGTTTTGCATTCCCATCTGCAGTGATGAGA +GTCCTTGTTCctccagcatttggtgttgttagtgttctggattttgtcCATTCTAGTAGG +TATGTGGTGGTGTCTCattgtcttaatttgcatttccctgataacatATGATGTGAAACA +TCTTTACATAGGATTATTTGCCATCTACATATTTTCCTTGGTGAGGTCCACATCTTTGGC +CCATTTTCTTATTAAGTTTTAAGAATTCTTCAAACATTTTGAGTAACAGTCCTTTGTCAg +gtatgtcttttgaaaatattttctctaagtcTGTGGCCTGTCTCTTCATTCTCTTGACAA +TGTCATTCGCAGAGcacaagattttaattttaatgatgtcCAGGTTATCAACTGGACATC +TacttatcaattctttctttgaTTGATCAAGCCTTTGGTGTTGTAGCTAAAAAGTCACTG +CTGAACCCGAGGGCACCTAGATTGCCTCCCATGTAATCTTCTAACcgtttatagttttgc +attttacactCAGGtgtaagatctttttttttttttttgagatggagtcttgctctgtca +cccaggccggactgcagtggcaacatctcagctcactgcaacctctgctcctgggttcaa +gcaattcttctgcctcagccgaccgagtggctgggactacaggcgcccgccaccatgccc +agctgattttttgtatttttattagagacagggtttcaccatgttagccaggatggtgtc +gatctcctgacctcgtgatccgcccatcttggcctcccaaagtgctgggattataggtgt +gatccaccgcgcccagtccAGATCCATTTTTAGTAAGATTTTTTTGTGAAAGGTTTAAGG +TCTGTGTCTATATTTTTATGCATGTGGATGTCTAGTTGTGCCAgccccatttgttgaaaa +gaccattCACTGAATAGCCTTTGTTTGCTCCTGTATCAAAGATAAGTCAGTggtatttat +gtgggtctatttctgtactctctattctgtcccattaatctatgtgtctaCTCTTTTGCC +AAAAATacgctgtcttgattactgtagatttcTGGTAAGTAACTCTTGAAGTCATGTAAT +GCCagtcctttattttgtttttctcctttaatattCTGTTGGCTATTCTCAGTCTTTTGC +GTCTCCAtctaaactttagaatcagtttatcaatatccacaaaataacttgctgggatat +TAATCAGGATTGTATTGAATGTGTACATCAAGTTAGGAAGAATGAGTATCTCTATAATAt +cgagtcttcctatccatgaacatggaatatctgtTCAATTTTtagtcttctttgatttct +ttcatcagagttctATAGCTTCTTCATATAGATGTTGTACACATTTGTTAGATctacact +aaaatattttattatggggGGGTGGTAATATAAATGATaccgtgttttgttttgttttgt +tttgtttttgagacggagtcttgctctgtggcccaggctggagtgcagtgacatgatgtc +ggctcactgcaacctctgcctccagggttcaagtgattctcctgcctcagcctctcgagt +agctgggactacaggtgtgcaccaccatgactggctaattttttgtatttttagtagaga +cagggtttctactgtctactgtgttagccaggatggtctcaatctcctgaccctgtgatc +cgcccaccttggcctcccaaagtgctgggtgtttttaatttcaaattccacttgttcttT +GCTGACATATAGGAAAGCAGTTGACTTCCGTGTATTAACTTTGTATCGTACAACCCCACT +ATAATCCTTTATTAGTTCCAGAAGTCTTTTTTGTTGcttctttcagattttcattacctg +ctttttctttaaaaactttgttATACTGattgaaaaagcaagaaaatttcTAACAGGCAC +AATGGACAGTGCATTAGCTTTCTAGGGCTGCCACTACAAAGCCCCACAGACTGGGCGAAG +TCAACAACAGACATTTGTTCTCTCACAGCCCGGAAGGCTGGAAGGCCAAGGTCATAGTCT +CAGCAGGGCTGCCTTTGGACCTTGGCTTGCAGACGCCGTTCTCTCTCAGTTGTCACAGGG +TCAAGCCTCTCTACGTATGTGTGTCCTGATCTCATCTTCTAATATGGACACCAGTAATAC +TGGATTAGGGTGCACCCTGACGACTTCATTGACCCTTAATCAACTTTAGGACCccatctc +caaacacagtcacattctgaagtatggggggttagggcttcaacatacaaatttgctGGT +GGCGGCTGTGAGGCGGGGAGCGCAATTCAGCCTATAATAAGTATATTCTTTAAATGGCAA +AAGTATGTGCAAAAGCAGTCATTTACTCCTTAATTGGAACGTTATCCTACTACACTGGGA +GCTTGTACCATTTGAAAACATTAAGCCATATgggaaaaatgtagaaaagaacATGGAATA +CACGGATTTGTCCCATGGGAAAAGCATGCTTAGTGTAACCCCGTATCTAGGAGACGTGAA +GGGAACTTTTTCCTTCTCACTTGTCTTCTATCCTTGACCAGAACGGTGTCTGTGGCACTC +ATCACATCGCAGGTTAGACAGGCTTTCTGAGCCGGCCTGGAAATGGAATCACCACACAGA +ATATTACGTCTGTGGGAAGATGTGTTCAGAGTCAATGGAGATCTGACCTGTGGGGCTGGA +AGGTGATTTGTGGGATGACGAGGACCTGCCTGCTGAGATCCTGGTGCGCAGCTCCATTAT +AAGGTGTGTGAAAACCAGAGACCACGCAGCTCTCAGGAACACAAATGCGTGGAGAACAAA +TGCCCAGTGAGAGACCACCACTATACAAACACGAACGAGACCCCCAGAAATGGCACCCAG +GAACCCACGTCTGGCTTCATAGACTTATGTGTTTACTGGGGAACCGAATGGACCCGCCCA +CATGTGCTGCACCCAGGCGGCCTCTTCTGGCATCTCTCAGTGGGATGTGCTGCACCCAGG +CGGCCTCTTCCGGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCCGCATC +TCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCCGCATCTCTCGGTGGGATGTGCT +GCACCCAGGCGGCCTCTTCCCGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCT +TCCCGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCGGCATCTCTCGGTG +GGATGTGCTGCACCCAGGCGGCCTCTTCCGGCATCTCTCGGTGGGATGTGCTGCACCCAG +GCGGCCTCTTCCCGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCCGCAT +CTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCGGCATCTCTCGGTGGGATGTGC +TGCACCCAGGCGGCCTCTTCCCGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTC +TTCCGGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCGGCATCTCTCGGT +GGGATGTGCTGCACCCAGGCGGCCTCTTCCGGCATCTCTCGGTGGGATGTGCTGCACCCA +GGCGGCCTCTTCCGGCATCTCTCGGTGGGATGTGCTGCACCCAGGCGGCCTCTTCCGGCA +TCTCTCGGTGGGATGTGCTGCACCCAGATGTTCTCATCCCACGTCTCTCAGTAGGATGTG +CTGTACATAGGTGGTCTATTCCCGTGTCTCTCGGTGGGATGTGCTGCACAGAGGTGACCT +CTTCCTGCATCTCTCGGTGGGATGTACTCCACCCAGGTGTTCTCTTCCCACGTCTCTCAG +TTGGATGTGCTGCGCACAGCCGGTCTATTCTCGTGTCTCTTGGTGGGATGTCTTACACCC +AGGTGGTCTATTCCCGTGTCTCTCGGTGGGATGTGCCGCACCCAGGTGGTCTATTCCCGT +GTCTCTCAGTGGGATGTGTTACATCCAGGTGGTCTCTTCCCACATCTCTCAGTGGGATGT +GCTGCACCCAGGTGGCCTCTTCCCGCATCTCTCAGTGGGATGTGGTCCACCCAGGTGGTC +TCTTCTCGTGTCTCTCAGTAGGATGTGCCGTAGACAGGTGGTCTATTCCCGTGTCTCTCA +GTGGGATGTGCTGCACCCAGGTGGTCTCTTCCCGTGTCTCTCAGCGGGGTCCTCTCACAG +TCTCACAGGTGAGCGGAGTTGCACTGCAGGGACCAGAGCTGATGGGACTCTCATGGCAGA +TGATCCTGCAGCCACCAAGAGCTTAACATGGGGCTGTCATGGGACAGACGTCTGCCAAAG +ACCACGGGACAAGAACCTCAGAAGCCTGTCCCTGAGTGGGCACAAGCCAACGGGGCCAAG +GGGGCCACCACAGTGACTGGGGGCATGGTGTATGGTGGGGAAGGCGCCTGTCTTCCTCAG +AGGACAGGAAGGCTGGCCCAAGCCCCAGTTTCAGTCCAATCGCCATCTTCAGAGCACACA +AGTAAATGACCCCAAAAAGGCAGCACCCTGACCTGGCCTTGGCTGGGGAGTCCACAGGGG +CCTTGGCAGAGCTTGTGTGGAGAGCGAtgcctgccctgcccacctgcTGCAGGCCCTCTG +CAGACCTGCAGACAGATGCCCGAGGCCCAAAAGACACATTCTCCAAGGCAAGTGATGATG +ACGGAGGTTAACTTCAGTTTCTGAGACCCACCCACATCTGCAGACAAACTCACCTGTCAA +AGGCTCAGCATGTTTCTGGCTCACTTTCTCAGAGGTCACTTTCTTTGGTGGATTTTGGAC +GGCCAGCGTCTGGGGTTCCCTCTTTCCTTGGCCACTTGGAACAGGAGGAAAAAGTCTCTG +CAGCACCTTCTCCACAAACACTGTACAGACAACCGattaaaagaaaaggaggaaaaggaa +tgaattatgCAGTTTATCTGAATCACACGTGACTTTTActctacacaaacacacacatcc +tgAAAGCACCAACGGAGACCCAAGTCCCTGGTCCTCCCACGCTGGGCACTGCACACCAGG +ATCCCCCAGACTCTGCCCGCAGAGGAACCCTTGAGGCTGGCCCGAGGACCCCCCACCATC +CTGCCATCAGCTGACCCTCTCTCCAGGGCATCACCCTGCATCCAGGAGGCTGTGCACTGC +TGGCAGGTGCTGCCTCTGGCTGCAGGTCCCTCGGTTCCTCCCTGTGAGGTTCAGGCACAT +GCAGGCCATGACCCCTGTCAGTGGGGGCTGTGGTCCTGGGTGGACGGTGTCAGTGGCCCA +CAGTGCTTGGAGCCAGGTGAGTGAATGGAGCAGGTCTGGCGGGCCCTGAGGCAGGGCAGG +CACCACCCCGCGCCCTCTGGGAACCCACGGTCTGCACTCTCTCCCTTAAACTGAACGTGT +CAACAACTGCGAATGGGGAGAATTCCGTGCATCTGACGTGGTTTAACGACTAAACAGAGA +TTCTTTACTTTGCTTGTTTTAGTTTACGTTGTTTAAACTGTGGGACAAACGGtcataatg +aataaatatttctgccCTGATTTAAGTGTGGTTAATAAACAGGCAGCTGCTTTGGAATAA +CCAAAAGTCGCACAGTGGAAATCAGCACTCCTGAAACAACTGCCTGGTGCCTTTAGGAAC +AGGGAGGCAGGGACTTGGCCTGACTGGAGGCGTGCAGGGATCTGTCATAGGCCCCCTGAG +AGGAGACGCTGGGGGTGGCTTCTAGGCGAGGCAGGGAGGCTCCACGGCCCTACCTGGGAA +CACTGTAGCTGAAGGCACAAATCCTTCCTAATTCTGGCCTCTGGGACAAACACGTGATAG +AAATAACCCTCCTACAGGCCCCGCTGTTAAGAACACTATGTGGGTTTCCACGCAACGCTC +ACCAGAGCTCCCCGTGCCCTCCGTGGATGGACCATGAAAACCCTGAGCACAGAGCTCAGT +GGGAGTGAGGTGCAGTGTGGTCATGAACAAGGTGGCTGCTCACTCAGACTCTCCACCTCC +GCGGCTCCCAGAGAGTGAGCACAAAGCCTGCTTTTGCTGGGAGGAAACGACCTCTGGTTA +AGTGGAAAACCTGAACTGAAACGATGTGATCCCTGAGACCCCGGGCTCTTCACCAGGTCC +TGGCAATGAGAGGGTCCCCATACGCTATATTTTGAATATGATGCAGAAGTGCACTAGCAC +AGGATACCTCAAAAGCTCCTGCTGGCTGTGGTGAGCGGGTCCCACCCCTACAGAAAGGCC +TTGCCTCAAGCATACCTGCCCGGCGGAGACACCTTGGCTCTCAGGGAGCAACAGGTGGTC +TgtgaaatgcttttaaaaatgtgctgCAGTGCTCCCAGGTATGTTCAAAAGAAGGTTCCA +AGACTTCAGATAAAAATCCAATGGTCACATTTCCTTCAAatgtcaaagaagaaaatgtcC +TGTGCCAGATGACCAAGCTGGTGATGAGCAGAGGAGATGGTAGGCAGATAAGATGCACTT +TATCCAACATCTTCATAAGCCAAAACAAATTCTAAGACAAAACCATAACCAGCCGTCCAA +TTCTGCAAACAAGGACAGGGGCGCTCAGAGCTAAAGCCTTGCTGGGCCTGGGGCAGCCAA +CGCGGACATGTGGCTGAAGTCGCCTCCCCAGGCACAGCTGCCTGCGAGTGTCTGGAGCCA +GGAAAATGCTATGGAGAAATCCCAGGCCATGGTCAGAGCCAGGCAATGCTGCAGAACGCC +TGAGGCTGGGCAGGCACAAGACAGTCCCAGGGACGGGGGCAGGCCAGGGCAGGCCCTGAC +TAAACAGCCACCGCCAGGAGACGCTGGGCCCAAGCAAGCATCAGATGACAGAGTTTTCTG +AAACAAGGCAGCTGATCCCAAAGAAAATGGCAGAACACGCCAGGGTAAGGATCGGAGCGC +ACTGAGAAACGGCACAACACATCAGCGTTTGGATCAGAGCGCACTGAGAAACCGCACAAC +ACACCAGGGTACAGATTGGAGTGCACTGACAAACTGCACAACACACCAGGGTACAGATCG +GAGCGCACGGAGAAACCGCACAACGCACAACACACCAGGGtacagattggagtgcaatga +caaACCGCACAACACACCAGGGTATGGATCGGAGTGCACGGAGAAACCGCACAACACACC +AGGGTACGGATTGGAGCGCACTGAGTCTGGCCCCAGGTCACGGTCTTTCAAGGCTTCCTG +AGGCAGATTTCGGAGCTAAAAGCGACATAATAAGAatgtgccttaaaaaaaaagaaaggt +agggAGCATTTTCACTGAATTCCATCCACTGCctgaaataa +>NC_060933.1 Homo sapiens isolate CHM13 chromosome 9, alternate assembly T2T-CHM13v2.0 +TCATGTTCAACTACAGAAAACAACAAGTGAAACTTTGTTTGCTCCAAATTGGAAACTGAA +ATATGGAAACAGCAGTGTGGAAGGAAATTTAACATATGAAGGTGATTTATCAGAAAACGA +AAAGGCAAAGGATACTTTATTCAATTATATTTAAAGGAGGGACCTAAACTGAAAGccaga +aacaacagaaaatgtTGTAGAATCTTTCACAGAGGAGCCAAGTGAAGTTTTTCCATACCC +TGATTTTCTCCCTCCTACGGAGCTTCAGTACCCTGGACTTGCACAGATGAGGCCCTCACA +AAATCTGAAAATTGGAAAGCAACAGGGGAACCTTCAGAAAGCTCTATTATTGGAAATGGA +AAGATTACAACATATGACTATACAAAAAGAGAGGTCAAAGTTACAAACTACTTTCTGTAC +CCCAGCAGTTACTGAATGACTTTCTTCCTCCAAAGCTATACTGAGAGTGGGACAGCCAAA +ACTTTCTGATTCACTGAGTCTTCAGACATCTCGTGTagataaaagttgagaaaaaagaaa +aaaaaaaccaatcgGGTTCTTTCAAGCTTGAGCAAAATGCTTCAAAATGGATTTGGAGCA +ATGctggaaaatataaatgaaattctaGACCACCAACTCTAAAAAGTTCATCCACCACAA +AACAGTTGGTTGCAACTTAGGACTTTAAAACtcttaaaagttcatttttaaatccGTGGC +AAGAACTTTCAGCAAGGACCAGACAACGCACTGACTGGTTAAAGTGGCCTCAATAAGGTG +TCTGCCCCCAAGGTTTTCAGTACCAGTCTCCatcttttcttgaaaatgagaagaaataaa +tcaAGGCACCAAGAACCAATCAcaaactttataaaaaaaaaatagtgttgcaTAGACCAT +TCTATATTTAGAAGCTATTTGTTGCCTTCATTTATAGCTAAGGGCTTATGTATTgactaa +aaataattcttttctttcatatatcTCAGTGTGAGCAAATCTATTCCAAGAAGCCCAGCT +AAAATATGGTTCATTGTTCCCAGATACAGGTATTCGCCCAcgcacagacatacacacaca +cacacacacacacacacaccccaattgCTTGATATGATATCGATTGGAATTTGTGAAAAT +TACTGCTGagagtattttaattttcttaattgttactttttaaaaaaatagagatgaggt +ctcactttattgcccaggctggtctcaatccaattcctgggctcaagctatcctcctgct +ttGGGATCTCCaaatgatgggattataggcacaagcgcCCAGCCTCGCGAGAGTCTTTAT +ATAAATCCAAGGGCTTCTATGCTGACATGTTTGACAATCTTTCGCATGTTATATTTCAAG +AAATGTTTCACTTAGTAAACGGTTCTATTCAAAGATTGTTCTTTTGTGACAGTTTTCCAG +TATAATTCTATCATCAGTAAATGGTATAATGGGTAGGGGGAGGAAGAAAGTACTGAAACA +TACTACAGCATGGATGAGCCTTGCAactattatgttaagtgaaagaagctagtagCATGT +TGTTATGTTCCTAGTTATATGCAACGTCCAGAATcagcaaatccatagagacagaaagta +aattagtggtaGCCAGCGGCTGGGAgtagggaggaatggggagtgactaatgggtatggg +gtttcttacTGGGATGtcaatgttctggaattagtggtgatggttgtgtgactttgggaa +taTATtcaaaaccactgaattatacattttGGGAGTAAATTGTATGGCATGTGAATTGTA +TGtcaataaaataactaaattaaaaatgaaatttcaagtaTAAATCCACTAAAAATTCAG +AATCTGCCATACTTTTGATTGATTCGTTTTGCTTACTCTTGAGGGCCTATCAATGTTTAC +TGACTAAATGCaaagagggagaaataaaggAGAGGTGAAGGCTGGGAATTCTGGGGATgg +agagcactttttttttttttttcttagagtcgtgctctgtcgcccaggccaaagtgcagt +ggcatgatctcggctcactgcaacctcagcttcccgggttcaaggattctcctgcctcag +cctcccgagtagctgggattacaggtgcacgtcaccacgcccagcgaatttttttgtatt +ttttagtagacatggggtttcaccatgttggccaggccggtgttgaactcctggcctcaa +gtgatccacccatctcggcctcacaaagtgctgggattataggtgtgagccagtgcaccc +ggtCGAGggcactatttatttatttatttttgagacagggtcacactctgtagCCTGgac +tagaatgcagtggctcaatctctgctcactgccgcctcgacctccagggctcaggcgatc +ctcctaccttagcctccagagtagctgggactacaggcgcgcgccatcgcgcccagctga +ttttttttttttttttttttttttttggtgaaaacagaatttcactgtattgcccagaac +tcctggggtcaactgatctacctgtctcggcctcccaaagtgtgaggattataggcctga +gccactgcgcctggccgacgAGCACTTTTAAAATGCAGGAGTCTTCCTGCCTCTGATATC +TCATCCCTTATCACCATGCAAACAATTCTCCTTTTCATAGAAGAGTAGACATTTGGggcg +gggtggtggtggtgggggattTTAGAAAATATCTACTGCATCCAAATGCCCTACTCTACA +GACGAAAAAGCAAGGCCCAGGAGGAGGAAAGAGTTTGCTTACTGCCACCCAGTGAGCTGG +CAAAGGCGCTGAGATTCAAAATGAGCTTTCCTGCCTTCACATATCTTCCGGCTGCCCTTT +GCCTATTCCCTAAACAGTCAGGAGCCATCAAGTTCAGGAATTTGCAGGTGTGCTTCGCTG +TGAACTGTGGAAAAGCAGCGTCTTCTCCCCAGAGGCAAGCATGTCGCCTTGTGAAGTTTG +ATGGCTCTTCACTTGCACACTCACAAAAAAGACTGAGCGTGTGTAACGCCCTGCTGGATG +TGTGCGGTGCTAGAGAgcttgggggtgaggggaggactCTCTCCCTTAAGAAAATCAGTT +GACTGCAGAGCTAACATTGTTTTTTGAGTAATACCTGGTTTTTATAAAGTCGTCCCTTCA +GTTCCCAAGCTCCTCTTCTGTTTGTTCAAGCCACCTTCAATTTGAAAAAGACTGAAGTCA +CAGCTTCTCAATCCCTACTAATTTCTCATGGACCTACTGGATTGCTCCAAATCGAGTATT +TGGGACTGAACTAGGAAGCCAGTTCAATCCTGAGCCCCCGAGGCAGGCGTTGGGTCTTCT +GTGGAGTCCCCAGAGACCTGCAACCTTCTGAACACGCATCCTCCCCTTTCCGCCGAGGAC +TCTGTCCTGCAGCCGAGCCAGGGCGAATGCACGGAGGTCACAAGGGAGGTGCCCTTGGAG +GCGGGAGGTTTCTGGCCGCCGGGGCGACCGTGCTGACGAGGCACCTGCAGGAAACAGAGC +TCTGCACGCTCCGGTCCCCCTCACccggggagggagaggaggtacAGAGGCGCTGGGGGA +GGACGTCGAGCAGGCCAGCCTCGTTGCCAGAACCCCCGCCCCAGCCGGAGATGGGAGCAC +CGCACCGTCTCACGGGGGCTGGATTTCTTCTCCCCTTGCGGGTGTGTGTGCGAGGATGGA +CGTGGTAAATACGGGTTGGCAGAAGGAGCGAACCGCGGTGGAGGAAGTTCTTCTGCTTAG +TTCTCGCCGCGGCGAGGCCCGCGGGCCAGGCGCGGCGACGAAGGTGCACGAAGGTGCCCC +GCGGGCCTGGTGGAGTTGCAGCGGCGCGCAGGCGCACTGAGGGCCGCCCGCGGCCGGCTC +CGCGGTACAAAGAGCGCCCCCGCGGGGAGCCGGGCGTCCTCTGGGCGGAGGGAGCAGCCG +GGGCTTCGCCGGCCCGCGCCGTTCTTCTCACGCGCCGCTCCGGGGCGCAGCCACAGCTGT +CGCCCACCGCGGGTGAGAGGCTTGCTGGTCCGCCCCGGCTTCCCCGCCCCGGCGGCGGCC +GTGCGGTTCGGGCTTTAATTCTGGCGCTTGCCAGCCGGGGCCGACTCCGCCCCCTGCGCC +CCGCCCTTCCCCGAGCTCCGGGTCCGCGGCGGAGCGAGCGAGCGGCCGGCAGGTTGGGAG +GAGCGGCCGAAGGTGAGTGACGCGGCGGGGCCGTGCCGCGCCCCGTGCCGCGCTGCGCCC +CGTGCCGCGGCGAGGTTGTCCCGGAGCGCGAGGCCCCTACCCCTGCCTCGGGCTGGCCCC +GCGCGGAGCCGACTTGGCGCGCGCCGGGGTTGCGCGGCGGCCGTGGCGGTGGCGGAGGGC +AGCCCCCGCGGGCTCCCGCTCGTGCGGGTGAACCCGGCGGCCTCGGGGCGGTCCTGGGGG +GGGGTCCGAGAGGTGGCGTCGGCCCCGCGGCCGTCGGAGTTTGGCGCGCTCTGCAGCGGC +GGCGCTCGGCCGgtctggaggagggagaggcgcgCCGGGCACGGAGCAGCGAGAAAGTTC +GGGCCGGGCCGGCCGGCGGGAGGGTGCGGGCGCCTGGCTACCCCGGCCCGGCGCTCTGTC +CCTCGGATGCCTCTGGGCCCTTCCCTAGCCCGGGGCGGAACGGGGGACCCTCTCTGAAGC +GGCTCTCCGTGGAGTTGGATGTTGCCCTTCGCGGGAGGGAGTGGCGGTCAAGACCCCTTT +ATCCTCGGCCCCAGAGGGGCAGGTGGCCTCGGGTCGCCCTCCGCCAACTCCGAGGTGGCT +TCGGCCGGGGCTGGAGGGCGGGGAGGCGGGGGAGGGGCGTGGGCGCTGCGGCCTCTGGGG +CGGCCCAACCCGGCGCGGGCAGCGTGGGTTTCCGAGGTCCCGCGGTTCCAGGTCGAGGGA +AGGTGTAGGGGCCCTGAAGCGGGCTGGTCCCCGAATGTTGCGTTTTCTGTGCCGCTTTGG +GCAACACGCAGTGGCGCTCGCGGCAGCCACGGCTCCTTGACCGTTCATCTCCTTCACCCG +GGTCCCGTGGAACTTTCAGAGGCAACTGTTCTTGGTGGCTCTTGCGGGTCAGCACGAGCC +GTGCTGCACGAGCGTGACCTAGTGAAGGCCTTGGGCGAGTTGGCGTTAACAATTTATGGC +GTCCGCCAGCGCTCGCTTTCCGCACGTGGCCTCTGCGGAGGGTCAGCCCATCTTATTAAA +TAGTGGATTCTATTAGACCCTGATACCCGAGGCTAATAAGGAAGCTTAATCATCCAGATG +TGTAATCGTGCAGTTCCTTTCCTCACCGTCATTGCCCCCCACCTCTGGAGCTGAATGGAA +ATGAGGGTCTGTTTGCTTATATTGAATTCCTGAGTTTATTCAAGTTCATTTTTAGGTGGC +GTTAACAGCTAAGTAGCTGTTCATCTGCCAGTTTCTCCTTTCATCCAACTTTCTCTACTA +AAATGTTGAGCacgttttatttaaaaaaaattgaagtgtaataaacatataaatttacTC +TTCTAAGGTcaaaattcagtggtttttaatatatccGTAAAGTTATGAAATCATCACTAC +CATCTGATTCCATTTCGTTGCCCCCAAAAAGAACCCCTATACCGATTAGCAGTCATTCTT +CCATCTCCCAGCCCTTCTCCCTCATTTTAAGGCAGCTACTTAGGAAGTTTTTCTAAGATA +GAGACtgagtgagaaaactgagaggtGATTAACTTTGATCCTTTTTCTGTTACTAGGTTT +GGGGAAAGGTGCTGCTGAAgcaatggaagaaaaattaagtaTTGGCTGTCCTATGGGGAG +GTTAAAATGAATAAGGATGGAAGAGAAGCTGCCAGTAGAGGAATAATTGCCTCCTGTAGA +GACCCACAAGTTGGGAATACATTTTATCCCCTTAGGGCACAGGGATGCTTTCTGGGCTCT +AGACTTGCCTAGTCCATAAATCACTCTAGTCGAGGTTCTGCCTCAGCGAAAGTGagttct +gggtgtgtgtgtgtgtgtgtgtgcgtgtgcgtgcgcGCTCGGCAGGgaatgttagaagga +aaaaagactaggcttaaaagtaattttttaaaatatccaaactggccccaaagaaagaaa +ccaaaaaaccACAGGCAAATGGCCACTGGAATTGATACATTCAAGACTAGTTTCATTTCA +TGAGTATCAGTTCACAAATAGTTCTGAGTTAATGTGTGCATACATTAACTTTTTATCCca +agtgggaggaggaggatggaaaAGGATCTAGTTGGGGGCAGTGCAAGGAACTGGGAAGAG +GAATGGGATAATGGCCGAAAGGGGCAGTGCTTGTGGGAGCTGAGGACTGTTGAGATGGAA +TAACTATAGGGTGAGCAGATTCTGAAAGAGCAGAGTGGGTCTGTGAAAAGTTGGACACTT +CACTCGGGCTTTTTGTTGGATAATGtgtgcatgttttaaaaatcatttttagtaaGGAGA +GTTGAAGCTATCCAAATTATGCAACATCCACTACACTTCTCACTCACCCTTCAATAAGAA +AAGTCAACTTGTTTTCAAGTGTTTCGGGAAGTTTTAGGCCTGTTGCATGGGTGACAGCtt +atgccatcttttttttttttttttggtaatttagaacattgacatagcgagactccgtct +ctacaaaaaaaataaaaaataaccggatatggtggcacatgcacctgtagtcccagctac +ttgggaggctgaggcaggaggattgctttagcccaggagtttgaggctgcagtgaactat +gatcatgccactgcactccagcctagatgaccgAGCAATATCCTCTCTCAAAACAAGATG +AGCTGTACCATAGGTATACATATCCCACACCCCCAGCCCTGccgacggagttttgctctt +gtcagccaggctacagtgcaatgtcacagtatcagctcactgcaacctccgcctcccagg +tttaagcgattctcctgcctcagcctcccaagtagctgggattacaggcacctgccacca +tgcccggctaatttttttttttttttttttgagatggagtctcgatctgttgccaggctg +gagtgcagtggcgcgatctcagctcactgcaacctccgcctcctgggttcaagcgattct +cgtgcctcagcctcccgagtagctgggactacaggcaccgtgtcaccacacccagctaat +ttttgtatttttagtagagacagggtttcactatgttggccaggatggtctcaatctctt +gacatcgtgatgtgcccacctcggcctctcaaagtgtcaggattacaggtgtgagccacc +atgccagtttttgtatttttagtagagacggggtttcaccgtgttggtcaggctggtctc +caactcctgaccttgtgatccgcccacctcagcctcccaaagtgctgagggattacaggc +atgcgcccccacacttggctaatttttgtatttttgttagagacgggggttttaccatgt +tggccaggctggtcttgaactcgtgacgtCAGGTTATccatccgcctctgcctcccaaag +tgttgggattacaggtgtgagacaccctgctcagcctttttttttttttttttttttttt +tttttttttgagatggagtttctttcttgttgcccaggctggagtgcattggggtgatct +cagctcactgcaacctctgcctcccgggttcaagcgattctctgcctcagcctcctgagt +agctgggattgcaggcatctgccaccatgcccggctaattttgtatgtttagtagaaacg +gggtttctccatgttggtcaggctggtctcgaactcccgacctcaggtgatccgcctgcc +ttggcctcccaaagtgctggcattacaggcgtgagccactgtgcccagcctgtagcTATA +CATCTTAAGAGTACATCTTCACAAATTGTCACAAAGTGAACATAAACATATAACAAGTAC +TCACGGAAAGAACCAAAATATTGCCAGCATTGCAGAAGTGCCCCTATACTCTTGTCCAAT +CACTGCCCCTCCCGAAGAGTAACCGTTGTGCCAACTGTGGATTAGTTTTATCTGTTTTCA +TGCTCTACACAGACTCACACGGTATATAGCTTTTAGTATCCTGGTTTCTTTCTCAACATT +ATATTTGTGAGATTCAGCTGTGTTGTTGCTTGTGGCTGTAGTTCAGTTATTTTCACTGCT +GTGTAATATTCAATTGTATGActacaatttatcaatttttaggTTTGAGGGGCATTTACA +TAGTTTCCAGTTTCTTACATGGTAAGTAGTGTGACTATGAACATTCTAATTCTAGTACAC +GTCTTGATACACAATATCCAATACAAATGTGTACATTTGTACAAATTCTATTCAGAAGTA +GAATTTCCCAGTTCCAAACTAGGATTCAGTTTAGAGGTACAGTCATGCGGATTTCTGAAG +TGGTTGTAGAGTTTATACTTCTACCCGTAGTGTGAGAGAGTTCTGTTGTGTCCTTTTTAA +ATTGGAAGAGCAGTAGATCTGCAGAGTTTGGCAAATGGACAAAATATgacctatttatta +ttttttttttggaggcggagtcttgctctgtcaccaggatgagtgcagtggcgcgatctt +gactcactggaacctctgcctcctgagttcaagcaattctcctgcctcagcctcccgatt +agctggaactacaggcacacgccaccacgcccagctaatttttgtacttttagtagacac +ggggtttcaccatgttggccgggatggtctccatctcctgacctcgtgatccacccacct +cggcctcccaaagtgctgtgattacaggcgtgagccactggcccaATATGACCTATATTT +ACCCCATCCTAGCAGACTAATTATTTGTTGTCTTCACTTCCAGTGCTTTTccatgtctgt +tcatgtttttatgAAGTCACAATTCTAatattcaattttgtattttgtttcttaacaCAG +TATCTTAATATTGCTTCAGTCTCTGACTTTTTAATCCCTGCATATGCCTAAGGATATGCT +TTCATTTAATAATCCTCTTATTAGAAATGTGTGTTAATTTCTGGTGTTTTACTAGTACAT +ACCGTTGTGGAAATCATCTTTGTGCATATAGTTTTTACCTCCCTCTTGGGTATTTCATAA +ATTTGAGATTTTTGTTTATGTGGCTTGGGATCTTTGTTAAACTGCTGCCTGCAGAGTTAT +CCTTGAACCTAATATGGAATTGattaaagaaatcttttttatttttttgagacaggatat +cattgtgtcacccaggctggagtgcagtgacaggatcagAGCTCGCTGTAACCGTGAACt +gctgggcccaagcaatcctcccgcctcagcctgcctcccgagtagctgggactacaggca +tgtgccactgcactcagctaatttttccttttttttttttttagttgtagagatggggtc +ttgctaggttgtccaggcgggtctcaaactcctggcctcaaacaatcctccctccttgcc +ctcctaaaagtgctgggattacaggtgtgagccactgcacccagtctaagAAATCTTTAA +ATTGCTAATATGTTACCTGCAAAAGGGTGTCTCATTGGGTTAAATTGCAATTCTGAAAAT +AATGGTGAGGTTGACCATgataacttctttaaaaatagcataaattGAACCTTTGTGGCA +ATTTCATTTAGGTATCActgattaattttctttatatggtCCTGTTTACAAAGGTATTGA +GCCAAGAGCTTGAAAGGATATAAGAAGGATCATACCATTAAGTAGTTGATTGTCCAGAAA +TTAtatctaataattaaaaataccagTTAGGCAAAATTCTTACACATGACCAAGGAGTGT +TCATTCTACAAATGCAGTGCTTGTTTAAGTTCTGAGGGAGAAGTCTTTCTTGTCTAGATG +ATTAGGAGCTGCTTCCCCCAAAAGTAAGACTTGAGCTCAGC +>NC_060934.1 Homo sapiens isolate CHM13 chromosome 10, alternate assembly T2T-CHM13v2.0 +CCGGCACCTCATCAACACAGAGTCACTAACTTCCCAGCAGTGTCTCTAGTCCCTCTACAA +GGATATACAGATATACACGCAGGAGCTATCTTAGGAGGCAACAAGACGCTCTTCAGGAAA +CAGGAGAAAGCAAAACATTTGAGGAACGGACAGGGGCATCTCCACCTTCTACTGCCACAA +TTTGTGTGTTAGTGATCAAGCCAAGGTTCTCAACCTTTCCAATCTATTAACCCCCTGCCT +GAGGCTCTCGACTGATCCCCAGCTGTACTTCCTGGCAATAAACAACCTGCCCAGCTGTGA +TTCCTGTGTGCACCTGACACCAGGGAGATGGAGCTGCCTGCCCAGCGGTGCTTCCTGTGG +GTGCCCCTGACCCCACAGGAGATGGGGACCACCTGCCCAGCTATATTCCCTCTGTGGGCA +CCTGACACCAGGGAGATGGAGCCACCTGCCCAGCTGTGCTTCCTGTGGGTGCCCCTGACG +CCACAGGAGATGGGGACCACCTGCCCAGCTATATTTCCTCTGGGTGCACCTGACACCAGG +GAGACAGAGCTGCCTGCCCAGCTGTGCTTCCTGTGGGTGCCCCTGACACCACAGGAGATG +GGGACCACCTGCCCAGCCATATTTCCTCTGGGCGCACCTGACAACAGTAGGATGCTGCAT +GTGCCTACACTGACAGCTACAGCATCATCTCCTGCTGTAAAAACTCCCTTTCAGAGGTAA +CAGGACAATGGGGCAGGTTTTCTCCTGGAGAAGTAAAGAAGCTGAGAAATCCAGGGGATT +AGGAACGCAGGTGACAAAAGGAGGTTGTGACATCTACACGATGTCACATTTGGCAGCACA +AGGGAGTGCTGGTATGTGCTGCTAGGTACTGTTATTCCCAGAACCACCTCACACTGCATG +GCATTGACATGCTTCCCATGCTCGTTACCCTTCGGAAGACACATTTAAATAACCTTGACT +TGCTGGGATGCAGCTGGAGAGAGATGCCTGGAGACCACCAGCCCAGAGTCAAGGCTCCAT +TTTCTCCTGCTTGCAGGACTTCTGCATGAAGCTAAGGCATCCAAATGTGCATAAGATTTA +TGAAGAGCAGACAAGCTGCATGACATCTTCTGAGAGGGAAGCTGTGCCATGTCAGGGGTT +GGGACAGCAGCAGCAAGGGGGATCAGCCCAAGGCCTGGGGAGAGGCAGTTGGGAAATCTC +AGTGTGTGTAGCCCTGGGGTCTGAGGCTTTCAACTGTCCATGTGGCTCCCACAGCTCAAG +TCCAGCGTGTGGTCATGACCCAGGGCAGGGCCACTCACAGAGCACAGTTCATCTCAAATG +TGATGGGGACGCTGAATGATACGCCAACGTACCAGAATAGAATCCCCAGTACTCACATGC +AGAAGGCACTCCCAGCAACACGCATGCCTACACCACCCTGCACCAAGGGGCTGGGCACTC +CTGCAGTCTGCAGCTGCCTCCTATCCCCCAACACACAGTGGCCTCCCGGGACAACATTCT +ATTTGCCGGCCACAGCCTGGAGCCCCCAAAGCACGGAGGAGGGGCTTAGCGAGCCACGCA +ACGTTCCCACCTCACACCCAGGAAACGAGCCCCTCACTGAAGTGGGTCCTGCACCCGCCA +GCTGTGCATGATCAGAGGTGTGAGGTTATGGACATGGTCACACACTGTGCACAGAGGTGT +GAGGTCACAGACCTGGTCACCCACTGTGCATGATCAGAGGTGTGAGGGCATGGACCCGGT +CAACCACTGTGCAAGACGAGAGGCGTGTGGTCAAGGACCTGGTCACCCACTGTGCACGAT +AAGAGGTGTGAGGTCACGGACCCGGTCACCCATTGTGCACGATAAGAGGTGTGAGGTCAC +AGACCCGGTCACCCGCTGTGCACGATGAGAGGTATGCGAGGTTAGGGACCTGGTCACCCA +CTGTGCAGTCAGAGCCATGCGACGTTACAGACCTGGTCACCAGCTGTGCCCAATCAGAAG +CTTTTGAGGTTAGGGACCTGGTCACCCGCTGTGCACAGAGGCGTGAGGTTACGGACCTGG +TCACCCGCTGTGTCCAATCAGAGACGTATGAGGTTACAGACCTAGTCACCAGCTGCAAAC +AATCAGAAGCTTTCAAGGTTAGGGACCTGGTCACCCGCTGTGTCCAACCAGAGCTGTGCG +AGGTTACAGACCTAGTCACCAGCTGTGCCCAATCAGAAGCTTTTGAGGTTAGGGACCTGG +TCACCCGCTATGCACAGAGGCGTGAGGTTACGGACTTGGTCACTCGCTGTGCACTATCAG +AGGTGTGTGAGGTTAGGGACCCGGTCACCCGCTGTGTCCAATCAGAGGCGTGCGAGGTTA +GGGACTGTGTGCGCGGTGACGGACCTGGTCATCAGCCAAGATTCCTGATGTTTCCAGTGT +CATCTCAGCTTCCTTCAAAACTTGAAATCTTTAGATATTTCCCAAAAGCTCGTCCGTCTT +TGAAAACGATACATATGCGCACAGGTGAGTTTGTTCCCGCACATTCCTTTCAGTACTGAC +GATTGAAGATCGAAGGTTAGAGCATTCCAGCCCAGTGCCCATGTCCCACCCCATCTGTGA +AAACCTGAGCACAATCAGAGGCTGCAGACAATCTCTGCATCATCCTCAGAAACTGTTCCT +GACCATTCACCTGAGGCCACCAAGTTTAAATGAGGGGCCCAAGTTTTAAAAGACAGGAGA +AGACTTTTCCACAATCTTTTTCTGAAGACAGAGTCCATGCGTTGTATCATCAGCACCATT +TGTGCCTGTCCTGGTCAGGAAGAGCTGCAACCACGTCTCTGTGCTCTTCCAGTGCAGGGT +GctgcccttccctccctttccaagCACAGAGCAGCTCCTGATGACCCAGCACCTCTGCTC +AGCCACCTTCCCCCAACGCCTTCCTCCCTCACGCCAGAGGAGCTCGTGCAGCCAGGCTTT +CTGGCTCACCACCGCGATTCAGTCACTTACACCCTCATTCCAGGCTGAAAATCTCTTCTG +AAAATATCCAAATCTTACCCATGTCAGGCTCCATCTTTTCCCCAGAGCCCCTCACCCACT +CCAGAGCAGCATCTCCGGTGCCCGTGCAGCCTGGGCGCAGATCCACAGGCTCAGAGTGCC +CAGGCCCTCAGCCCCTCCATGTGTGCCCTTACTCCCTTGCTCCCCAGCGTTAATGCCCCC +ATCCTCGATTTCCTGGTAGGCAAAAGGGGGTTAATTCTAACAGTGCTTACCTAACTGGAT +AATTTCATACCGCATCCGGCCCAGCATACTGCCTTGATAAATGACAGGTCCTGCTGCACT +GTTACCATTGTGCTGGTTCCGGATTTCCTGTGAGCCGCTAAGCTCTTCGCAGCAAAGACC +ACTCAATGGTCTGGTCCAGGACTCtctgggatggatggatgggtgagtggctGATGGACA +AGTGTGATGCTGAATGGGATCATGCAAAGCTGGCCCCACGTATTTTGGTCAACGTAAGAA +AAAAGCCTCCCATGTTTGCTTGCTGCCACCCTAACCGCAGCGTCCAGAAGAAGCCACTTA +AAGGCAACTGTACCGCACATACAGGAGATGGCGAGACGAGACTGGCTGGAGATGGGAAGT +TGTGTACTACTGATCAGGGCTGCATGACCCAAAAAAGGCATCACTCGAAAACACGGCTGT +TCCAACAGCAGTGCTGGAAGGCGGCCACTCTGACCCGACCGTCCACCTCCAGGGTCAGCC +ACCTGGCACCTCTTGGATGTCTCATCCTGGGCACCCCTTCACAGAGTAAATGAGCCTTTT +AACTTCAGCCTGTCCTCGCTAGAACACTGACTCCCACCTCCCATGTCCTGAACCGGCCTG +TTCCAGGGACTGCTGTGGACAGACGAGCAGGCCCAAGATATCTAGTGGCATTTCCTGGCA +AGGACACTCACGATGCTTGACCATACAACTAGGGGTCGATTGGTTTTTTAGACTGACTGT +AATTCCCTGGTGGCACGCGTGGATACTGATTCACCCGGGGAGGGGCATAGAGGAGACTGA +AGGAAAACCCGTCCTAACCGCGCCAGGTATTCCCGCACGCACCGACATCTTCAGACTTCT +GCAGCATCTTCCTCCTACAGacaaactgaagctcagagacaCTAAGGAGCTTGTCCAAGA +CCAGCAACAAGTATGTGAGCAGCTGGGATTCAACCAGGTCCTTCCCTGGATCCATCCGCG +CTGCTCCCCCTCCCACCCCGAGGCAGCTCCAGATGGACACAGCAGGTCGGAACATCCCAC +ACCCCAAAGACAGACTACGGAGCAGAGCCGGCTTCCGCAGCGGAAACTCACACACAGCCC +ATTCCCATTCTTGCCGAATATCTCAGGGACTCTGTGCGGTAAGGGCTGCAGGTGTGACCT +CACTCTGCGCCAGGAGATCCGGGTGGTAGGCAGTGTTTTGGAGGGTGCTCGTCCAGACGA +GAGAGAGGCATCTAAGGGGGCTCATAAGCAGATCCATGAGACACAGGACACCTCAGAGAA +GGGCCGACAAACCCCACAAAGTCGCTCCCATCCTGGAGAGCAGCTTGGAGAGGACGGGGC +GCCGCAGTCTCCTCCCAGCCCACGCTTCGGCATGGAGAGCAGCTTGGAGAGGACAGGGCC +GCCGCAGTCTCCTCCCAACCCACGCTTCAGATGGGTCTCGCTGCAGCCTGTGGTGCTCAT +CAGGCTAAGCAGCAAGAGGAAGCTTCCCAGGGCAGGAGTTCTCCTTTCACAGCAAAAGTG +GCACAGGCAATGCAGCAGGGCTACTTCAGCCCAGGGCTCAGGAACCACGGGGTGCAGCGC +GGCCTGCAGCAAACCAGACACATCAGAAGCCAAGGTCCCACTTTAACATTCAGTGACATC +GAACGGAGGGAGTTATCTGTAGCAATCGCCTTCCTGGGGGACCCGTACAACACGCATGAC +CACTGAAACTGACTGAGTCCCTTCTAGGTCCTGGGGGCTACCCCACTTTACACTCATTGG +TTCCATTCACAAATCTATGTGGGGCAGTTGTTAGCCCCagtttagagatgaggaaaatgc +TGCTTGGAGAAACTAAATGATAAAACCAGACTTCAACACACCTTGCCGTCTCCAAGACCC +CTGCTCTGTGTCCTAGGGTCTCAGGGGCTGGGTATTCGGCATTTTAAGTGACTAATCATA +GGCAGTTTTCTTCTCTCCTGCACCTATATTTAGCCTGAACGTGCACGTACATGCTCAGCT +GCAGGTGCACTGCCGTATGTGGACCAGCAACGCTCTTTCCCGCCTGGGGTTCTCGTGACC +ACCTTCCGGAAAGCTCTCGCCTGCTTTACAGCCGTGCCAGGCAGGCCTGGGCAGCCGCAC +AGTGAAATTACTGCAGGGTCAGAGCCAAGTGCTGGCTGAGATTTTAACAGCGAAGACAGC +AGAGCAATGGGGATAAGCTGAACAAAACTCTATTGCAGCACAGACGGAAATCTAGAAGCA +AAAGAAGCTGACACCCCTGAGAGAGCAGCTGACTGCATCTCACTGTGACGTTAACAGCAG +CCTGCTGTTTCCAGCGCCTCCGTGTGCCGGGGTTTCCAGTCAGCATTTGTGTTTATCTGC +TCTTGAGCTGCCTGATCAAACCTCCGTAAAGATCAGGGATATCTAAATTGACCCAATATC +TGCATGCTGGCTGCTCAGAGCTGGTGGTGTGGGACAGCCAGGACATCACTTAGTCATACG +GGGGCACAAACATGTCACTTGCCACTCATGTCtttatctcattaaaacctaTTTTCTCCT +GAATATTGACCACAGCAAAGTCTATTAGCCTTCGAGATGCAGTTGAAACATCGACGTGCT +TTGTTCAAGAGGTTTAAGACACACGTAAGTCTTTCTTGCCATGCTCAATACACACAGCCG +TTTCTGAAGTCGGTGTTTCTGGAACAAAAGCCTTGGCCTGCCCCAGTGAACATTCACGCT +GAACACACTGTCGCGATGCTGCTTGGCCAGCCAGCAGGGGGCAGGAGAGAGCAGCAGGTG +CCAGCGTGGAGTTCCTGCAAACTCGCCTCAATCAAGGGCGGTGTGTCCTGCCAATCCAGC +GGCTTCCTCCAAGGGGAAGCGGCCTCTTCAGCTGCCACAGCACTGATTTCAGGCGGCTCA +GCCAATGGGGCAACAGATTCAACAGAGTTCCATGTCGTTAAAGGAAAACTTCTGTTACCA +GGCAACCTTAATATCAGATTCAACGTAAAATAACCAACAAGATTGTTTCCAAACCAAGGT +GCTACTAGTGCCTTATCCTTCAATGCTGCTTAAACACGGAGAAGTATGAGGAAAAAAGAA +CATAGCATTTACTTCTTAAAAAATAACACGTCTTCCAGGTTCATTTTACCCATAAAGACT +TAGAACTGTGGCTTCCCTAGAGGAACGTGGTGGGAGGTGGATCCCGACACTGACCCAGCC +TCCCCCAAGTCAGTCACCCCTCCACGGGGTTCACACCTCTCCAGGCCCTGTCACCTCAAC +AATGAAGGGTGGCGGCTCCGAGCTCTCTTCACAGGGAGCACCGAACAGGAGctagagaga +gacacagacacacccacaacCGCTTAAAAATCCTGAAATGCAATACATATTTAAGGACTT +CATTATTAGTTTTTCAAAACTGTAAGAACAAAGTGAGCCTGGCTTTAACCTGTGTGACAC +GATAACACCGTGTATATCTGTCCTTTACTGTCTGTTCCTTCTCCAGCTGCTGCTGCCTGG +CTGGCCGACTGCGGGAGAAGAGCCTCTGGTACTCCCGGGAGGCCCTCGGTAAAAGCGTGA +GCACCACAATCACCTCTCAGGACACCGCACACGTTAGGGTCGCCCACAGACGGCCGTTCC +CAGTGCCTTCTTATAAAGGCATGAACGGGCCTCCTGCTCTTTGTAAATGTCAACCTTCCT +AAGCGATGTCGTGTTGACAATTTTTAACTGCAGTCCACCTATACTTCtttgtttctgtct +tgtttttatcctAGAGGCATattattatggaaaattaaatTTGCAAGGTTGAAGCGTTTT +TTAAAGTTGACTTCTAATcctggaagggaaaaaaatgggccagatgtggtgctcacacct +gtaatcccagcagtttgggaggctgaggcaggcagattgcttgagcccaggagctcaaga +ccagcctgggaaacatggcaaaaccctgtctctactaaaaataaaaaataaaaataaaaa +taaaaaattagctgggtgtggtgatatgtatctagtcccagctactcagggtgctgaggt +gggaggatcacctgagaggtgatcacccaggaggtgaaggctgcagtcagccaagatttg +cgttgctgcactccagcctgggcgacagagtgagaccccatctcaaaaaacaaaaagcaa +aaacaactgtATACATCATTATAGAAAGGAGCTGgccgggcagtggctcacgcctggaat +cccagcactttggaaggtcggggtgggcagatcacctgaggtcaggagtttgagaccagc +ctggccaatatggcaaaaccccatctctaataaaaacacaaaaattagccaggcatgatg +gtgggtgcctgtaatcccagctactagggaggctgagggaggagaatcacttcagcctgg +gaggtggaagttgcagtgagccgagattgcgccactgtactccactccagcctgggtgac +aacagcgagACCccacttcaggaaaaaaaaaaaaaaaaaaaaaagggagctaatgttttt +catttaagggaagggagaagaacaTTCAGTATTTATACATCTCACGCACACATCTGCAGT +GGGGCCCTAAAGTATTCAAGATACACATTCCTACAAATATAGCTCAAAACTACTCACCAA +GTTTCATGCTAAAAGCACATGCATTTTAAGAGTgctacattatattttttaagcatCTGT +ATCCAATATTTTAGCATACTGGCAGTTTTCCCTTCAGGTGCTGTATGCCTAAATTATTAC +ATGTTTAGTCGTTCATGTTAGAATTTATGACTCGCtttagacaaaagaaataaacataag +cTACTAAATTAATGACTTAGGGGAAAAGTTACTACAATAACTTAGAAGTCAAACTTTGCA +AACTGAATTTGTTGGACCATGTAAGCCAGatgatcagtttttaaaattgtttgttgCGTG +TTTCCCTCAAGGACGGAAGTCTCCCCTTTACTCTCATCCACTGCATGCTGCAGCCCGCAC +CTCTCATCCACCACAGCACACTGCGGCCCGCGCCTCTCCTCCACCGCGCCACACCACGGC +CCGTGGCTCTCGTCCACCACAGCACACCGCAGCCCATGCTTCTTGTCCACCGTGCCACAC +CGCGGTCCACTGCGCCACACTGCAGCCTGCAATTCACCCTGTACCACGCCTTCCACACCT +TACCTGAAAGTGAAAGTCACTAAGTATAaccaagaaggaaatgaaaagtagaTAAAtgac +ctccacccccaccccatgtcCAGCCTGCACATGTTTAAACATTCATcaaagtaaaaccaa +aaactcACGTTAGCTCACGATTGTAACTGGTAGAATCATGTGCATGGCAATTTTAAAAGT +CTCATTAAGTAAAAACCTAATCGAACCTCTCAAGAAATACAAAGTTTATACAAAAAGACA +TCTGCAAACATCGACAGTGAGGAAAGGACTTCACTCACCATCCAGCCTGTCCTGGAAGCC +ACGGCCAAATGCCAGGTTGTATAGatccaaaaagcagaaaaaacagTGCTGAAATGTGTA +CAGTCTTGGCAATGTACAAATTCAGATGTAGGATGCTCAGAAACCTTGAATTTCCAATCA +GAGAACAGGAACATGAGCAAGTTCCCCAGCAGTGCCCACCTTCTGCCTATAGCATGTGTA +ACAGGAATGCTGGCCACCTCGGGGGGACAGAGGCTTCCTGGTGCATTCGCCCTGCCAGCC +GCACAGCTGGCCCCACCACAAACACCTGCTAATACTGAAGAACCACCCCCCTTCCTTGGG +CTTTGCTCACTCTAGCCAGGAGAGCGTATTTACACAGTGCATTATCGACTCAGTTCTCGT +TCAATACGTCAAGCTTGTTGAAGGCATGGCAACCCCACTCCTGGCCCAATTAAGTGAACT +GAGCAGAACAAATGCCCCCAGTTCGACGGCACTCAGTCACAACAGCAACGGCCACCATTC +ACAGGGTGCTGGCTTCGTGCCGGGAACAGTTCCAGGCGTCTTCTTTGTCCGAGGAATTTA +CACTGCAACCCTGCAGGGCCGTTCGCAATGTTCACCAGAGGGTTCTGAGGCAGCCAAGTC +CAGGCTGTCTGTGGGCCTCACCGCATGGCCGTCCGTGTCCCCCTGCAGACCAGACCTCAC +TCCAAGGACCGCGGGTTCCAGGGCTGCCTTGAGGCACATGCTCCCTTCGCCACCTCCTCC +TGGCCCCTGACACCGACCCTCACCATTGCTGCCAACACCGTATTTCCTCATGGCTCCTGA +GGGACCTGGTCTTTCTGCACGTCCCTGCTCCCTGCGTCCGGCTTGGAGGATGCCCGTATC +AACGCCAACATTCACGTAATCACCACCCCCCTTCCATGGGGGGCTTTATGCCTAGGAGTC +TCAATATCAGAATGTCGGATTCCTGTGCTTGGAGGATTTATTCCCACTGTGGAAGTGAAG +GGGGTAAAATTCTAGGTGCCTGCAATAACCTCATTTCTGTAGCTAAGCAACTTCAGTAGT +AGCAAAAAACAagctttttttaacttcttttatacaagctaaaaacaatttttacGTCCA +CGTTCTCATCAGCTCCCACCTGGTGAGCAGGCAGATagtaattttcagaaaaacaaattg +ttCCATAATTTTAACACTTAGTGTTATCACTATTAAGAATTATAAACGTTAATTACATAA +CTATCCAAAATGcctcagggaaaaaaatgtcATCCAATTGGTTCTTTAAAGTGTTACAAA +TGCAGCTGAGTTTTAATAGTAACTTGTCCATAATTGtcaaa +>NC_060935.1 Homo sapiens isolate CHM13 chromosome 11, alternate assembly T2T-CHM13v2.0 +ttagctgggtgtggtggcgggcgcctgtaatcccagctgctcgggaggctgaggcaggag +aatcgcttgaacctgggaggcagagatcgcgccagtgtcctccagcctgggtgacagagc +aagactccatctcaaaaagaaaaaaagaagtcaagttTCAATTTTAACTTGTGTTAGTGT +GTGATCCTGTCTTTGTGTGCTGTGGAACTTGGTGCTGGTGGGACACAGGCTGCTCACCCC +ATCCCTTGAGCTTTGCGTTTATTCCTGGGATTCTGCATGTGAATGGGAGCCTGTGCTGTA +TCTGGGAGATGCTGACTGGGTTGCGGGCACGTCCGAGGGTCAGGGTGGGGCCGagtgcag +cctcctcctccagtGGGCCTGTGTGTGGAGTGGTGGCATTCTGGGTGTCCCTGAGGCCTG +GTCGTTTCCATCTTCTTCCTGAGCCCACATGGAGATGACGAGGGGTTTCCTGCTGGTCTC +TTGCAGAACAGGGTTGAGTGGTGTCCTCACGTTGATCTAGCTTCTGGGTCTCCCATTCTG +CATGTGAGCAGGTTGATGGGCTGTTGTCTCTTCCACGGTTAGCCTCCCTTAGGCTGGGGC +TCCTTCACCCCTCTTTTCTTAGAGACATTACTGCCCAGAGTGAGAACCCCTCACGTGGGG +TGGCCGTGTGGTTCCAAGACAGGGTCCTGTGGAGGCCCTGTTAGCTTCCCCACTGGAGGC +CTCCCTCACAGCAGGCTCCTGTCCCGgcatctgcactccagccaggcagaGTCCTGCTCC +CGTGCACACCACACCCTGTCTGTCTGTGCTGTGGGCCCTTGGCGGGGTTCTGGGTGTCTG +GAGCCCCTTGACCTTGTTCCTCCTACAAGGTGACCTCGTCAGGAAGCCCCAGGATGAGAC +TGTCCCTGGCTCCTCCAAAGGTCACTTCAGACATGTGCACCCTTTGGAGAGGTCCCTGCT +GTTTCTCAGAACTGCTGGGGATGGAGGCTGAGCCCGAGAGTGCTTGCTCCTCGCGCTCCC +TTCTTGCTATGGTCTCCGGAGATGCCTCCCAGGCCACGAGCCCTCCTGGCGTGGTTTTAC +TGGGACCTGGCTTTGCAACAAAAATAGTTGTTTTAACCTCCCTAACCACTCCCAtccctc +ttttgtttttctctataaCGTGTAGGGTTTCTTAGCTCTCCTGTATTGGTCTCACTCCAC +TGGAAGGAAGGCTCAGGAACGCAGGCTGTGTCTTCTCCCGGGTGTGGCTGGGGCGGGGGC +TCAGGGAATGGCTGTGATGGCCCAGTGTCCAGGAGGCTCCGGGCCCCACCCCCCGCCTTG +CTGCATGACCTTCACAGTGTCACTTACCGGCCCTGACTTGCCTGCGGGCACCACGCACAC +GGCATGAAGGTGCCCTGGCCCGGGGCACGGACACAGCCAGAGCCACCGCGCTCCTGGCTG +TCATCACGTCGTTGGCTTTGCGATCTAAACCTgcttgttgttttggtttttctttctttc +tgttttctttcattcttttttttttttttttttttttttgagacagaatctcactctgtc +acccaggctggagtgcagggatgtgatctcagcttactgcggTCCCCGACTCCTGGGCCG +AAGTAAtctcccctcaccctccctcttcccaagtagctgggaccagacatgcgccaccac +atccagttaattttttttttttttttggtagaaatagggtctcactatgtttcccgagct +ggtctccaactcctgggctcaagtgatcctcctgcctcagcctcccaaagctctggaatt +acaggtgtgagccacggtacCTGCCCCCAAACACTCCTGACTCTTCTTATCCTAACCGGG +GTCATCTTACTCTCCTCACCGAAATCTGATGTCACCTGTATGGAGGAAAGGGTGGGCCTC +ATGGAGGGGCAGGCCAGGGACAAGGGGACTCCTGGgccccagctgagcccagcccgtTTC +CCCTCAAGGGCTGTCTCCAGGAGGACACGTTCTGTAAGTGTAGTGTTCAGCAGAGGGTGA +GTTTCTGGGTCGCCGAATCCAGGCACCCTTAGGAATGGGGGCCTAAGAGGGCCTTCTGAC +GTGGGTTCTCTGCTGTGATTGTGGGCAGGTCTCTCAGTACTGAAGGGCCCCACGGTGTGG +AGCTCAGCAGGAAGGCTGAGGTTCCCTGCGGTTTCCTCATGGCTTAGGACTCAAATGCAA +ATGTATCTAAAGAAAAAGGTGGTTGATAGTCACAATGAAACTTTTATTTACCTCTGGTTG +TCTTAAATGCCTAGTATTGTAAAATATGGCAGAAGAATTCactttcatgcctgtaatccc +aacactttgggaggccaaggtgggcagatcccttgagttcatgagtttgagaccagcctg +gaaaacatggcaagaccccgtctctacaaaaaatacaaaaaaatccaacCTGACccacat +ggcaagaccccatctgcacaaaaaatacagaaagttccAGCCTGGAGCCTCCACCTGCAG +TCCTGCAGCTCCACCCTGGCTCTTCATGAAATCGGCTAAGTCCAGGTGTGGGTGCGTTCA +GTGCAGCACCCACGTGCAGGTGACACGCCCATGCACCGCCACAACCACGCTCACACCAGA +ACATTCCATCATCCGGAAGGCCCGTGTCTCCGCTCCAGTCTGCTTTTCGTGGATGCAAAC +TCATTTCCTTGAGTCGTGTGTGGGTGACAGCAGATGGGAGGTTTCTTTTGTGCCTGGCGT +CTGTAgcgtgtttttctttttctttttttatcttttgagacgggatctcacgATGTTCAt +gatgttgccccggctggtcttgagctcctggcccaaaacagtcctcctgcctgggcctcc +caagggGCGTGTCTTTGAGATCTATCCACGTTGAGGTCGTTGCCAGCAGCACATTCCTCT +GAGTGCTGAGCCATGCTCCGCTGGTCGGAGGGACCACAGTGTTTCCTCCACTGATAGAGT +TTTGGTTTGTTTCCCGTTTTAGGTTATTATACCTGAAACATCTGCATGTAAGTCTTTGAC +TGGACCTGTGTTTTCATCTGTCTCAGGCCCACGTTTGGGAGTGTGTCTTTGACTGGACCT +GTGTTTTCATCTGTCTCAGGCCCACGTTTGGGAGTATGTGGCTGGCTGGATAGCAGACGT +AGCATAGGCCTCACTTTTCTGTGCCGTTTTGCAGTCCCACCTGCAGTGTGTGAGCATCTT +GCTCCGAGACCTCACCAGCACTCTGCATTGTGATGTTCTTAATTTCAGCCGTTCCAGCAG +ATGTGCACTGATGCTGTGTCGTGGCTTGGATTTGTGATGCTTTTAATTTCAGCCGTTCCA +GCGGATGTGTACTGATGTGTCCTGGCTTGGATTTGCTTTCACGGTGACCAGTGCTGCTCC +TCGTTtgttcatgtgcttattggccatttgtatgttttccttgtgaagtgtctgttcaat +tttttgcctattttttcattaaattgtttattgagctgtatgagttctttataaattctg +gataaaaagtattttttttctttttttttttttgagattgagtctcgctctgtcgcccag +gctggagtgcagtggcgcgatctcggctcactgcaggctccgcctcccgggttcacgcca +ttctcctgcctcagcctcccgagtagctgggactacaggcgcccacccaccacacccggc +taattttttgtatttttagtagagatggggtttcaccgtgttagccaggatggtctcgat +ctcctgacctcctgatccgcccgcctcggcctcccaaagtgctgggattataggcgtgag +ccaccgcgcctggcctgatttttttttttttttttttttttgagacagatcttgctctgt +ctcccaggctagagtgcagtggcacaatcatcctagcgcactgcaacctcaacctggGCT +TAAGCGAATCtgccacctcccgagtagctgggactacaggtgcctgccaccacgcctggc +taattttttatagagatggggtctcactgtgttacccagtctggtcctgaacgcctgggc +tcaagcaatcctcttgtctcagcctcccaaagcgttgggactacagacgcgtgcaGCCTA +CAAagttttatcagatatatgtattgtgaatattttctcccagtttgtgacttgcctttt +catttctttagggcACAAATAGTTTACATTTCATGGAGGCAAGTCCTGGGCAACATGCTT +TAAGTGCATTGTTCACTTAATTTTCATGATGTCCTTGGAAGTCAGAAGCTTCCCCATTTa +gatatgaggaaactgaggcacggagggGTGCATCATCTCTCCAAGGACACACTCCAGTGG +ATGTAGGACCTGGGTTAGACGTGAGGACACACTCCGGTGAATGTAGGACCTGGGTTAGAC +GTGAGGACACACTCCGGTGGATGTCGGACCTGGGTTAGACGTGAGGACACACTCCGGTGG +ATGTCGGACCTGGGTTAGACGTGAGGACACACTCCGGTGGATGTCGGACCTGGGTTAGAC +GTGAGGACACACTCCGGTGGATGTCGGACCTGGGTTAGACGTGAGGACACACTCCGGTGG +ATGTCGGACCTGGGTTAGACGTGAGGACACACTCCGGTGGATGTCGGACCTGGGTTAGAC +GTGAGGACACACTCCGGTGGATGTCGGACCTGGGTTAGACGTGAGGACACACTCCGGTGG +ATGTAGGACCTGGGTTAGACGTGAGGACACACTCTGGTGGATGTAGGACCTGGGTTagac +atgaggaaactgaggcacagaggggtgcATCATCTCTCCGAGGACACACTCCGATGGATG +TAGGAACTAGGTCTCTGCCTCCATTTGCAGATGGTCATGCAGAGGGGGTCTCAGGCGAGT +GTCTGGCACAGGCAGTGGCTGGGGTCTGGTGGCCCCCAGTTCTGATACTAGGCTGGTTGT +GGGCTTTTCCACCAGCGATGGGACAGGACAAGACTGCAAAGGGAGcgccctgcctcctcc +tcccacgTCTGGGCTCTGACAGGCCAGAGGACGGGCAGACCCACGGCTCGTGGCTCACTC +CAGCTAGCAGCGGTCACTCTGCAGGCCTCTGCTCAGGCCCCTTCTCAGCTCTTGGTGTCT +TGGGCTGCTGCACTGAATCTCAGATGTTATTTCATGAACCCAAAGAGTTGTTGTCTCGGC +TTGTCTTGCGCAGTGAAAAGCGCGTGTTTTACGTGTCCAGTTGCTCTTAATAGCAGATAC +CTGCCCTGGACGCCAGTGGCAGCATGTGCCCTCTGAGCAGCGGCCTTCAGCTTCCCAGGA +ACACGGGGCTCTTCCTGTCCAGCCTCCTGGGGGCTGGTCTCAGCCCTGACTGGCCAGCAG +ACGCAGGGTCATCTCGGAGTTACCCAGCTAGGGACTCGCAGCCAGTTGCTGGTTGGGAGT +TGGAGAGTGGAGTTTAAGCCCTCTCCTTGACGTAGAGAGGATTTGGGGCCTGTTACGTGA +GTATTTAGCAATGCTGCCCAAGCTCTGACACCATGCTTATGCGTTTTTGGATTTCAGGCG +AGCCCACACCTTAACCGTGCTCTTCATCCTCACCTGTACGCTTGGCTATGTGACGCTGCT +GGAGGAAACACCTCAGGACACGGCCTACAACACCAAGAGGTAAGCTGCCCTCTCGTCCTG +CCTTCTGAAACTGCCCTGTGCCCCGTGTGGTGGGTGTGGCACCCTTACTGCTCGGGCTGC +CGGGGGCTCAGAAGGCCTTCACCAGAGGGCTGCGTGGGGCCGCCGGCCTCTCCCTTGAGT +GTGTCTGATGTGCAGACTCCAGGGCTGCCCTTGGTGCTGCGTGGCGTTCCCGGTCAGCCC +CCGTCGCCTGTCACTGGGAGCCAGGAGTCTGTGTCATCTCCACGTGACCGGCAGCCTGTG +CTGCGTTTCCTCTGAGTTTTGCATGTTGAGGTTGGAACGAGCTGCAGCAGCTACAGGGCT +GAGCCCTTGAGTTTGGGCGTCTCCGGGGGTGAGGTTCCTGCGGTGGCCGCGTGCTGGTTC +CGTTAGCCAGCGGGGCTCTTGCACGGACAGGGGCCGACACGGACCGCAGACCATCTGGTC +AGCAGCCAAGCGAGTAAACTCGTCTTCTCAGGTTTGTCTCCACAGGCAGGCAGGCTAGAC +CTTGGGTGTGTCCTCTGCCTGAATTCCATGGATTCTGACGCCAGTCTCAGAAGTGCGTGT +GGAAGAGAAGCTGGTTTTAGAGCCTGTGAATCAGTCTTGAGTTTTCTGTGCCTGACTCTC +CTCTCGCGTTGCTCTTCCGACGCGCGCACAGGGTGTGTCTGCCCAGGGCTGCCTCCTGCC +CAGCAAGGCTGCTGACACCATCAGGGCCTGGCCCCACTTGCTCCGGCGGGATGGTGGGAG +GAAGCCGGAGCAGGGTCTGAGACCAGCAGCAGGATGGGGACAGAGGTGGAAGGAGGCATT +GGAGGCCTGTTGGTGTCGGGGCCACAAGTTGGCTCTGGTTGGCGGGAGCCCTGGGGTTTG +TAGGACTTAGCTGTCCCTACAGCTCTTGGGCCAGCACTTCATTTTGTAAAGCAAGAGTCT +CGCTATCTTCGTGACTGTTGGGTGGGGTGATGGGTGGGCATGGTGTGAACGTCATCACGC +TTGCACGGGCGTTGGTGGCCCTGTTTGCCCACTGATTTGACACCAGCCCTGTGGGCTCTA +GAACACAAGCATGCCCAGTGCCCTGTCTGTAGGGGAGCGGATGCTTTAGAATCACGCACA +GCAGACCTCATAACTGAGTCCATCTCCCTGGGGGCAGTGGGGCATTTCTGGTTAGAAATT +ACTGTTGAGGTGCCTGGACCCAGGACTCTGCAGCCTGCTCCCCAGATGAGCTCACCCTCC +ATCCtcacctgggaggcgcaggtggCCTCTCCTGTCCTGGTCTCCCTACCCTGCTCCTGG +CTGCATGCTCTGTGGGTTCTCTCCCACCTTGCTGTCATCCCTCTCCCAGTCAGCTTTGCT +GGCCCTTCCCCCTTTTTCTGAGCCTGAGGTGCCAGCTTGCTCCCAGGCCTGGCCTGGCCA +GTGCCTCCCGTGCTCCAGGCCCAGCTCGCTCCTTCTCCCTTTCTTAGGCAGTCCCAGCGG +GGGTCACGTGCAGAACCTGCAGGCCCGGTGTGCACTGTGTAACTAGGCTCCAGAAATAGA +TGAGGGAGCATGTGCCGTGCCTGGGGCCCCTGTGGAGGGGCCACCTGGGGACGCTGGACC +TGTGGCTCTGGAGGCAGTGAGGCAGTGGGCAGGAGCCCCGTGTGTGCCTAGAGGGAGCTT +TCAAGGAGGACTTGGTCTTTCTTGAATTCATCCATCAGCACCTGGCTAGGAGGGTCTGTG +GCATCTGCCGGGCACAGCAGGGTAGGTGGATTAGGAAGCAGGACCGGGTCTCACCTCAAG +TGTCCCACATGGCAAGAATTGTCAAGAGCAGGAGTGCAGGGGGTGTCTTGGGAGCACTCC +CCGAAAGCATTCACCAGGCCCCCACCAGGCGCATCACAAAGCCTCACCACCCCAagccag +gccctgccctcccAGGCCTGGTTCCTATGGGAAGCACTAGGTGACCCAGACCCAGAGGGG +CCAGGAGCTTAGACCCCTGAGGGGGCAGCAGTGGTGGGCACGTCCCCCACTTCACCCAGC +ACTGGCCTCTCCTGAGTGGCCCCCGACGTGAGAGGCTGGGTTCTGCCATCCTGTCCTCTC +CAGCAGGGAGCCCCTGCGTGTGTTCATTGAGAGGGGCCAGGAGACGGGAATTCACGGGGC +CCTGGGCACTCTTCTCTGAGGTTCTGTTCTGGGGACACTAAACGCGCTCCCAACTCACAT +TCTCTTTCCCCCTCACCCTCTTTGAGGGCACAAAAGAAGCCACCTGTCCTTCTCTGCTGC +TGGCACCTAGAACCTGCTCTGGGCTCCTTCCTGGAAGGCTCGGCTGCCCCAGGTCACCCT +GGCACTGACCGTGGCTCTGTGGCTCCTTCCAGTGAAATTGCCGTGGTGCACCTGTCCTGA +GTCCATTCTCATGGCCTGGACCCGCACTGCTGCATACCAGAAGCCCAGCTCCTGGGCAGC +CACCCTACCTGCCCCTACGCAGGGTGTCCACACAGAGGGTGTCCGCACACAGGGTGCCCA +CACACAGGGTGTCCCCACACAGGGTGTCCAGAAGGCTGTGGGGGCTGGTTTACTTTTAAT +ACTAGAATTATCTGATGTCCTCAAGAGTAGATTTTCTTATATAGAAAATAccttctaggc +caggcgcggtggctcacgcctgtcatcccagcactttgggaggctgaggcgggcagatca +cgaggtcaagagatcgagaccaacctaaccaacatggtgaaatcctgtctctactaaaaa +tacaaaaattagccgggcgcggtggctcatgcctgtagtcccagctactcgggaggctga +ggcaggacaatcgcatgaacctaggaggtagagcttgcagtgagctgagatcgcactact +gcactccacctgccgaaaaagcgagactccgtctcaaaaaaaaaaaaagaaaagaaaaga +aaataccttctAGAAATTaggcttaattttattttttatttattttatttttttttgaga +tggagtctcgctctgtaccccaggctggagtgcagtggtgtgatctcggctcaccgcaag +ctccgtctcccgggttcacgccattctcctgcctcagcctcccgagtagctgggaataca +gggcccaccaccatgcccagacagtttttgtatttttagtggagacggggtttcaccgtg +ttagccaggttggaattttttttttttttttggtcaatgttgaccaggttggcctcgaac +gtGTAGCCTCGCCTCCCCAAGCGCCAGAACAAACagcctgagccactgcagctcccagcc +ttatttttttgttttcagacagactctcgctctgttgtccaggctggagtgcagtggcac +aatcctggttcgctgcaggctccacctcccgggttcccgccattctcctgcctcagcctc +ccgagtagctgggactacaggtgcccgccaccatgcccggttaattttttgtatttttag +tagagacggggtttcaccgtgttagccaggatggtctcgatctcctgacttcgtgatccg +cccgcctcagcctcccaaagtgctgggattacaggcgtgagccaccatgcctggccagcc +ttatttttaaaaattaatatttatgttattaaagttaaaaagttataaaactagTGTGTC +TTTATTCAGCTTGCTGTCATTGTTCTTTTTATGGATCTAACAGGTTCCCCACCTTAgggg +atgattttctttttcttttttttttctttttttggagacagggtcgtgctctgttgccca +ggctggagtgcagtggcgtgatggcccactgcaaccttcacctcccaggttcaatcagtt +cttgtgcctcatcctctgtggtagctgggactatagccgtGCACcgccacgccccactaa +tttttttatattttggtagagacaggtttcaccatgttgcccaggctggttttgaactcc +tgagcacagacagtacacccgcctcagcctcccaaattgctaggattacaggcgtgagcc +actgcgcccggccccgttttgtttttcttgagtcAACGTTATTGACCTATAATTTACTAT +AATCTGTGTCTGATTCACGCGTACGGCTGATGAGTTTTAACAGACTCAGAGCCCCGTGTG +CCCACCACTGCATGGGGGTGCGAAAGTGTTCACTGTTCCCTGCGCTCAGAGTGCCTCACC +CCGGCTCGGGCAGTGCGGAGGCATCTCCCCTGCGCTCAGAGTGCCTCACCCCGGCTCGGG +CAGTGCCAGTGCATCTGCCTGGGTGAGAGCAGGGTCTGTGCTGCCGGCCCCGGCTTCCTG +TGAACGCAGTTGCTCCTCCGGCCTGGCCTCTCCCGCTGGAG +>NC_060936.1 Homo sapiens isolate CHM13 chromosome 12, alternate assembly T2T-CHM13v2.0 +CAAATCCAGCCTCCTCTCTCCACCCCGCAgccgcccccccgcccccgaactctttttttc +tgagatggcgtctcactctgttgcccaggctggagtgcagtggtgtgatctcagctcact +gcaacctccgcctcccgggcccaagccatccttccacttcagcccccaaatagctgggac +tgtaagCACGGgctaccatggctggctaatttttagccCGGGaatttgagtctgcagtga +gctttAAATTGCAcccctgcgctccagcctgagcaacagagtgagattctgtcaaaaaaa +caaacaaacaaaaaaaccccacatactGTTATTAATTATCATCACCATGTTGTCAAATCT +TCTCTTTCTGAACCCTTCTGCCCTTAATTCCCTTAACCCTTCTGTCTCTTAACCCTTCTG +CCCTCCCCCACAAAAACCCTTGTGTGAAAATGTAGTCTTAAAAAGAATTcatcacaggtt +tttttttttttgagatggagtttcgctcttgttgcccaggatggagtgcagtggcgcgat +ctcggctcactgcaacctccgcctcttgggttcaagcgatcctcctgcctcagcctcccg +agtagctgggattacaggtgcgcaccaccacgcctggctaatgttttctgtatttttagt +agagacagggtttcaccatattggccaacatggtctcaatctcctgaccttgtgatctgc +ccgccttgggctcccaacatgctgggattacaggcgtgaaccaccacgcctggcctcacc +AGAGGTTTTAACAGATGTTCTATACTATGTAATGAGTGAATTAATTAGTTATTTGGTAGC +TCTGTTTTGAGACAACTTGGGGCTTCCCTCTCCTCCTAGAATTAACTAACAGCTGGTGAA +AGAGCAGAGGGACAGTGACCACCAGGCCAACCTCGCCCAGAGAACTGACAGCAGCATCAG +CGGCTCTTACAGCAGCCCCCTTTCCTCTgttcccactgcagcctccaaccctGGACTCCC +TAAGCccagaggggaaaggaagggccGTCTGCCCAGCCATTTGAACCCTGATCCATCTTG +GATTGGAGAATTGCTTTGGAGAAACCTGAAATCAAGAATTGGCGCTTGCTGAGATTTGCC +TGGGGGAACATTTGCCCCATCCTTGAGTTTGGCTTTTGCATTTTCTGGCCTTTCTCATGC +TTTCCTGTCCATTTTCAGAATGTTCCCACTGCATGAAGTATTGTCTCCCTGCCACACTTC +ATTGTCATGGGGGAGAGTGTCCTGAAGACCCTTGTTTCATGTTGCTGGGGCCCAGGATTG +CTGTCTGCAGAGAGATAGGGGTCTGAATAGGTCTACCTCTCAAATTATCCTGCTTCTGGG +GTTGATAGGAGTTGGGGGAGGAGACTGAGGAGCTGGAGACAAAGCTCTGTGGAACCCACC +AAGGATTTTAAACCCTCTCCCATGAAGAGCCCTAGATCAGTGACAAGTGGGAGAGTTGCC +ATTTGCAACTCCATCcatctatttttgtcttctttcatttgCATAGATCTGAGCCAGGTA +AGCATCAGCTGATACTCTTCTTATAAATCAGATTGTAACCCGATTTGTCTGTCTCATTTT +TTTACCCTCTAATACAGCACAGGTACAGTATGCCTATAGGTATGTCCCTGAAACATTCTA +TgcagttcagatttttttttttaggaactattttaaattcattagGCAGGCTTTATTATT +TCAGGCATCCATGATGGATCTGCTAGCAACAGGAAAATCGTTcttcatttgtgtgtgttt +attatcAAATCATAGAGTGTAACACTTACAATGGTCCTTAAATATCATCATTTTATAACT +AAGAAAACCAAGGATCAGGAGGTCACTGGGATCACAAAGCCAGTGAAAGAACAAGGACCA +AAACCTTGGTCTCCTGACTTCTAGCCCACTGCTCTTTCAATCACAGGGACAATGAAATAC +AGAGAAGTTTAAAACTGTTATCTtcctatattttcatttccatctcttttttctacttaa +aaacattttatttctattttttaaaattcaaaagtataTAATATTAAAAGGTGCTTTCAC +AGAAGTAAGCACCATAAAAAATTCAATATGCCTTCTAAGTGTTTTCTATGCCTCTGTGAT +gcctgtacacatacacatagaggCTCCTATACTTACaagtgcatttttatttatttttta +ttttatttattttttttgagacagagtctcactctgtcacccaggctggagtgcagtggc +gcggtctcggctcactgcaagctccgcctcccgggttcacgccattctcctgcctcagcc +tcccgagtagctgggactacagacacataccaccacgcctggctaattttttgtatcttt +agtagagacggggtttcaccgtgttagccaggatggtctcgatctcctgacctcgtgatc +cgcccgcctcggcctcccgaagtgctgggattacaggcgtgagccaccgtgcccggccaa +gtgcatttttaaatgaatttttaattttagaatagtttttcatTTACCCAACATTGCAAA +GGTAGTCTGGAGAGCTCTCACTTTGCTCACACCCAGTTTCCTCTATTATTAGCATCTTGC +ATTAAGCCCCGGTACATTTGTCATGATTAATGAACCAATATCGGATGTTATTATTAACTC +AAGTTCATACTGTATCCTGAATTCCTTTCAGATATCCCTTTTCTGTTCCTAGACCTCTGT +AGTCATTGGGTCTCCCTAAGTTCCTACTGGCCATGACAGATTTAAGCGTTTTTTTGATAG +TGTCACTTTTGTGATATATATGGCAACCTTTTTTCACATAACTATATGTTTTGAACACCT +TTCTGGGTTAGTGTGTGTGGCCTTCCACACCCTTTTAACTCACCACAGTGTTCTGTTGAG +TGGCTTTACCCCATCATTTTACACTGCCCTTGGCACAGAGCCCCCGTCTGGAAGTGTCAC +TGGGCCTGGGTGCTGTCTGGTGGATTAGACAGACGCTTCCGCTGTCTTGGAATTTGGACA +CTGTGGGAACAGAGAACATGGATGTAAATGACCTGACAGAGCTCAGAGAAAAGGAGCCAC +GTGGCCTGGGGCACTGCTGTTGTGGCGACCCTTCACCCCACGCCCTCCACCCTACATCCC +TCACCCCACACCCTACGCCCTGCGAGTGGCTCTGTGTTTACATACAAGAGTTTACATCTG +TGGTGGAAGCACTTTCTCACAAAAGGGTAGGGCTTATTCTAGGAGGCCCTACCAAAGAAA +AGCACTAGGTAGCAGCATTCCAGCTGTAGGGCCCGTGACTGTGGCATGCGGAACATTCCT +GCCCCTGGAAATCCAGTAGTAGCTTGGTGGACGTCTGTCCCTGGAAATCCAGTAGTAGCT +TGGTGGACACCTGCCCCTGGAAATCCAGTAGTACCTTGGTGGACACCTGCCCCTGGAAAT +CCAGTAGTAGCTTGGTGGACACCTGCCCCTGGAAATCCAGTAGTAGCTTGGTGGACACCT +GCCCCTGGAAATCCAGTAGTAGCTTGGTGGACACCTGTCAGGAGTGCTTGAGTAGAGCGT +TGATACTAACCTGTGAAAGAAATTTCCCATGATCATCCATTGTAACTGGAAGAGATCTGA +AAAATGACTCGGCCCAAGGTCCCACAGCCAGTGGAGACAGAATGTCTTCTCTTACTGTCT +TTTCCGCTGGCCCTGCCAGCCCAGACCTGTCCCTAGGGGGACATCCAATTCATATTCGTT +AATGAAGAGAAAGCTTCCAGATCCTTCAAGGTGTCTCTGTTACCTCAGAAGGTCCAGTGC +ATATTTTGAAACaacttacttttgttttttttagacagggtcttgctccatcacccaggc +cacccaagctggagttcagtgatgcaatcatggcttactgcagcttcgaactcccaGGCT +tgagcaatcttcccacctcaggctcttgagtgcctgggactacaggtgtgtgccaccatg +cctggctaatttttaaaaatttgttatagagatagggtcttactacattgcccaggctgg +tctcaaactcatggtcTCAAGCAATAAAACagctttttaatgtttaaattataCCCGAGG +TTTGGTTCTCTGCAGATGTCCCCCAGAATTGGGCACAGCCTCCGATCGGCCTTATTCCTC +TCACTTAATATTTGTCACTATTCCAAACCCCATGTTCAACACTTCACCCATTACCTTTTC +CCTCTGACCTCTGATTTGCACAGGCCCTTCCAGCAGAGCTCCAGGCTGTTCTTGCCCAAG +CAGAGATTACAAACATACTACTTTGAGGACTGACCCTCCCAGACTTACCACTTCAGCCGA +AGTAAGGGAGAACTAGATAACTCTCTTTGTCTCATGCTACAAAGTGCCCCAGGAGGCCTT +TCATACACAATTATTTTTCAGTAAGGAGCCAGGGAACCAGGGTCTTTTCCTCTCATGCAC +CTTGTGAGGTTGGCAGGACAGCGTGTGACTCATGCCTGGACAGAGGCGCATACCTTTAAC +AGCCTTGCTGGGGAGGTGCCCCACTTAGGAGTGGTGGAGATACACTCTACTGGTTTTTCC +TACCCAGCAGGTGTCTAAGACAGACACACTCAGACAACACTGCTTTCCCCATCACTGCCT +GTCATCCAACACTTCAAAGATGATGGACAACGTGTCTGAAGCTGATGGGGCGGAGGACCC +CTGCACACCTGCACCTACTAACCTACTGCTGTACCTtcgccccacccccagccccctttG +AGAGCTCAGATCCCGCCTAGGAGGGGATGGATGGGCTTGTTAACAGCTGACAAGTGCTCT +GCAAAATGCAGCTGTTTAATCATAAATGAACATTAGAAGGTGGCCTGGGGCCACTGTGCT +TTAGGAAACTCATGCGCGTGGAGAGGACAGGAGGAAAGGAGATTTCCAGGGCAGGAGAAA +CTTGGGAAGCAACACTGAATGGGAAGAGAGGGAGGCTTTCTAGGGGATTTAAATGATACT +GAAACCCGGATACGGAATAGGAGAAAAAATACCAACTTGCTCTCAGGGTGTCTTTACTCT +CCCCAGTGCAGATTTCATTGACCTAAATCAGGTCTCTGCTCCTATTTGCTGGTACCTAGT +TCAAGAGAGTCTTATAAATACACAAAGCCGGAAATGCCTGGGTAGGGGGGTGGCAAGAGC +ATGCGGTTCCACTCCAGGACAGGATCTGACTCAAATCACACTTCCCTCCTGGATTCCAGA +CTGTCAGGAGGGATGCCTCCGAGGTGGTGTTTGGAAGGAGGTGCTGAGAGCGGAGCTGGG +TTATTCTAAGCGTGGCCCAGGGAAGATCTTGCCAGACTTGTTAATGTGTGACCCCACCCA +GTGCCATGCTCAGCAAGGCAGAGAAGTGTGCTGTGGGTGgtgggagcaagaaagagagga +ggCCAGGACATCTCTATTCCACACATACCCTGTTTCATCCCTTGCTGCATTTCACTAAAA +TTATCCACTCGCCCCTACGAGACCTGCTGTGTCCTCCTTGAGTCCTTGTTTGGCATACCT +TTGTTCCCTTCCATGGCCGAGTGAGTTCAGTCCACATTCATTGAACTGAAAGCTCACAGG +TCTTGGAGCCTGGAGAAATAATCGGAACCATTCCCTTTCGTCTCCAGGCAAGATGAGCGA +TGGACCCAGGTTGCCTAACCTAGTTAGCTGCATGACACTCCAGAGCATCCAGCTCAAAGC +AGGCATTGACAGGGATGGGGCACCCAGAGAAATGGCGCTGGTGCTGCTGTAGGGGTAAGA +TGTAGCAGCAAGGGGCGGGCAAGAGGGCTCCAGATGATTTCTGCCATGCTGAGCTAGCTG +CCTGCTGGCTTTGTAAGCAGTGGAATAAGAAGACTATTGTGTCAACTCTTTGAGGGGGTG +TGGCCTTCCTTGGGGTGAGAAAGCACAATGGGAAGGGCTAGCAGCTCCCCCGATCCTCTT +CCTACTGTGACCTGAGAGACACTCCATGGGGGGGTTGGACGCTGGGGGGCTGGTCAGGGG +AGTTGGCTGGGCTGGGAGGGAAACGGGCCCTTTCAAGAGCAAGTCAGACTCTGGTGAGCT +GTTTACCCGCCTCATGCCCAAGGGTGCAATGTGAGTCATTTAATTTAATTGGTTTAATAA +GTAAACGGTCTGGGTACAAAGAGGAGGGGGTTGGGTATGAGAGGGAGGGGCGGGGCAAAC +CCTGCAGAGCTGCTTTGGAAAGAAACCTGTTGCCAGCCCTCTAGGGATGGTCACAATTAA +ACAGGGAGTGGAGATGCTTTGGGAAGTAGGGAGAAGGGAGAGCCCCAGATGTTGAAGTGG +AAAGAGGAGTAGAGGCTATAAGTCGGCCAGCCTCAGATTCTCAGTGCCCATCTGAGTATT +CGATTCACTGGTGCTGGTATATCCACAGGGCTGTGCAACCATTGCCACTACCTAATTCCA +GAGCATTTTCCTCACCCTAGAAAGGAACCTCACCCATTATCAGTCACTCCCAAttctccc +cacctccagcactggaaCCACGACTCTCCTTTtggtctctatggatttgcctattctttt +ttttttttttttttttttttttgagacagggtcttactctggtgcccaggctggagtgca +gtggcagctcactgcaatttctgcctgcCAAGCTCAAGgtattctcccacctctgcctcc +tgagcagctgaactacaggcgtgtgccaccacgctcggctaatttttgttttttgttttt +tttggtaccTTCCACcatccaccttccaccttccgcCTTCTGCCTTCCGCCTTCCACCTT +CGACCTTCTTCCACCTTcgaccttccaccttccaccttccgccttctgccttccaccttc +caccttccttccaccttccaccttccaccttcaaCCTTCCGCCTTCCGCCTTCCACCTTC +TGTCTTCCaccttccttccaccttccaccttccaccttcttccaccttccaccttccacc +ttcttccaccttccaccttccaccttcttccaccttccaccttcttccaccttcttccac +cttccaccttccaccttccaccttcttccaccttccaccttccaccttctaccttccttc +caccttccaccttccgcCTTCGAccttcttccaccttccaccttccgcCTTCCACCTTCG +ACCTTCTTCCACCTTcgaccttccaccttccaccttcttccaccttcGAGCTTCCACCTT +Ccgccttccaccttccaccttccaccttccaccttccttccaccttccaccttccacctt +cgACCTTCCGCCTTCCGCCTTCCGCCTTCCACCTTCTGTCTTCCACCTTCCTTCCACCTT +CCGCCTTCCaccttccttccaccttccaccttccaccttcttccaccttccaccttccac +cttcttccaccttccaccttccaccttcttccaccttcttccaccttccaccttccacct +tccaccttcttccaccttccaccttccaccttcttccaccttccaccttccaccttcctt +ccaccttccaccttccgcCTTCGAccttcttccaccttccaccttccaccttcttccacc +tttgaccttccaccttccaccttccgcCTTCCGCATTCCGCCTTCCAtcttccttccacc +ttccaccttccgcCTTCCACCTTCTaccttctgccttccaccttcGACCTTCTTCCACCT +TCAACCTTCCACCTTcgaccttccaccttccaccttccaccttcttccaccttcgagctt +ccaccttccaccttccaccttccgcCTTCCGCCTTCCACCTTCCGCCTTCCGCCTTCCAC +CTTCCGCCTTCcgccttccaccttccaccttccaccttccaccttcttccaccttccacc +ttccaccttcttccaccttcttccaccttcttccaccttccaccttccaccttcttccac +cttccaccttcttccaccttccaccttccaccttccttccaccttccaccttccgcCTTC +GAccttcttccaccttccaccttccaccttcttccaccttTGACCTTCCACCTTCCGCCT +TCCGCCTTCCGCCTTCCAtcttccttccaccttccaccttccaccttccgcccaccttcc +accttccaccttccaccttctaccttctgccttccaccttcGACCTTCTTCCACCTTCAA +CCTTCCACCTTcgaccttccaccttccaccttccaccttcttccaccttcgagcttccac +cttccaccttccaccttccgcCTTCCACCTTCcgccttccaccttccaccttccaccttc +ttccaccttccaccttccaccttcgATCTTCCTTCCACCTTCcgccttccaccttccacc +ttccaccttcttccacctttgaccttccaccttccaccttccgcCTTCCGCCTTCTGCCT +TCCTTCCACCTTCCGccttccaccttcttccaccttccaccttccgccttctgccttcca +ccttcCGCCTTCCaccttccttccaccttccaccttccacatTCCACCTTCTACCTTCCG +CCTTCCGCTTTccaccttctgccttccaccttccaccttccaccttcttccaccttccac +cttccactttccaccttccaccttcgatcttccttccaccttccaccttccgccttccac +cttccaccttccaccttcttccaccttccaccttccaccttcttccacctttgacctttc +accttccaccttccgccttccaccttctgccttccttccaccttccgccttccaccttcc +accttcgaccttccaccttccaccttccaccttccaccttcttccaccttccaccttcca +ccttccaccttccactaCCGTTCTTGGATTTTGccaacaaagaacaaagaattGAGGGCA +AATCtgtagagtaaagtgaaagcaaatttattaaaaaagtaaaggagTAAAACAATGACT +ATTCCACAAGCAGAGCAGCCCTgaaggctgctggttgcccattttatGCTTATTTCTTGA +TTAGATGCTAAACGGTGTGGGTTATTCGTGCCTCTCATTTTTAGGCCATATAGGGTTAAC +TTCCTGATGTCGCTGTGAtgtttgtaaactgtcatggtgctggcgGGAGCATAGCAgcga +ggacaaccagaggtcacttttatcaccatcttggttttggtgggttttagccggcttctt +tcctgcagtctgttttatcagcaaggtctttatgacctgtatcttatgCCTCCTATCTTA +TACCTCCTATCTCATTCTGTGATTAAGAATGGCTTAACTTACTGGGAATGCAGTCCAGCA +GGTCTTAGCCTTATTTTAGCCAGCCTCTATTCAAGGTGGAGTTGCTCCAGCACCTCTGAC +AATAGCTCACTACGGCCTCGAACATTTTTGTATAGACgcggtctccctatgttgcccagg +ctgatccctaactcctggcctcaagcagtcctctgacctcagtttcccaaagcatgcgga +ttacaggcgtgagccactgtgcccagtccatttctttttattgctaagttaTATTCTGTT +gtgtggatagaccacattttgcttcTCCATTCATAGTTGAtgatggacatttgcattgtt +tccgctttttggctattaggaataatgctgCGCTGAGGCTTTCATTTCTGTTGGGTGTAT +ACCTGGGAAtagaactgctgggtcaaatagtaacTCCATGTTTTGAGGGACTGTCAGATT +TTTCCAAAtcggctacaccattttacattctcaccagccatgtatgagggttccaatttc +tctatgttcttgccaacacttgttattgtccgtttttgtttttttttttttttttgagac +ggagtctcgctctgtcccccaggctggagtgcagtggcgcgatcttggctcactgcaagc +tccacctcccgggttcacgccattctcctgcctcagcctcc +>NC_060937.1 Homo sapiens isolate CHM13 chromosome 13, alternate assembly T2T-CHM13v2.0 +CTAtagtgtacataaaatatcaaagtacccaaaCTATacattatatactgtacataaaat +atgaaattacatcaaatacattttatattaggtacataaaatatgaaagtacaTCAAATA +TAGATTaaatactgtacataaaataccAAAGTACcccaaatatataatttatactgtACA +TGAAATATCAAAGTTCacaaactatatattatatactgtacataaaatatcaaagtaccc +aaGGTATATATTCTATACTGTacaaaaaatatcaaagtacccaaagcacgtattatatac +tgtacataaaatatgaaagtacatcatatatatattttattctgtacataaaatatcaaa +gtacaccaGATATATATTCTAtagtgtacataaaatatcaaagtacccaaaCTATacatt +atatactgtacataaaatatgaaattacatcaaatatatattaagtacttaaaatatgaa +agtacatcaaatatagattatatactgtacataaaatatcaatgtaccccaaatatatat +tttatactctaCATGAAATATCAAAGTTCaaaaatcatatattatatactgtacataaaa +tatcaaagtacccaaGGTATATATTCTATACTATACAAAAAATATCAAGGTACCCAAagc +atgtattatatattgtacataaaatatgaaagtacatcaaatatatattttattctgtac +ataaaatatcaaagtacaccaGATATATATTCTAtagtgtacataaaatatcaaagtacc +caaaCTATacattatatactgtacataaaatatgaaattacatcaaatatatattttatt +aggaacataaaatatgaaagtacaTCAAATATAGATTATATGCTGTACATTAAATACCAA +AGTaccccaaatatatattttatactgtaCATGAAATATCAAAGTTCacaaactatatat +tatatactgtacataaaatataaaagtaccCAAGGTATATATTCTATACTGTacaaaaaa +tatcaaagtacGCAAAGCacgtattatatactgtacataaaatatgaaagtacatcacat +atatattttattctgtacataaaatatcaaagtacaccagatatatatactatagtttac +ataaaatatcaaagtacccaaaCTATacattatatactgtacataaaatatgaaattaca +tCAAATTTATATTAggtacataaaatatgaaagtacatcaaatatagattatatactgta +cataaaatatcaaagtaccccaaatatatattatatactctacatgaaatatcaaaattc +acaaactatatattatatactgtatataatatatcAAAGTACCCAAGGTATATTTTCTAT +ACTGTacaaaaaatatcaaagtacccaaagcatgtattatatactgtacataaaatatga +aagtacatcaaatatatattttattctgtacataaaatatcaaagtacaccaGATATATA +TTCTATAGTGtacataaaataacaaagtacacaaactataaattatatactgtacataaa +atatgaaattacatcaaatatatattaggtacataaaatatgaaattacatcaaatatag +attatatactgtacatataaTATCAATGTaccccaaatatatattttattctctacATCA +AATATCAAAGTTCACAAAGCATacattatatactgtacataaaatatcaaagtacccaaG +GTATATATTCTATACTGTacaaaaaatatcaaagtacccaaagcatgtattatatactgt +acataaaatatgaatgtacatcaaatatatattttattctgtacataaaatatcaaagca +CACCAGATATATATTCTATAGTGtacataaaataacaaagtacacaaactataaattata +tactgtacataaaatatgaaattacatcaaatatatattaggtacataaaatatgaaagt +acatcaaatatagattatatactgtacatataaTATCAATGTaccccaaatatatatttt +attctctacATGAAATATAAAAGTTCACAAaccatatattatatactgtacataaaatat +caaagtacccaaGGTATATATTCTATACTGTACAAAAAACATCAAAGTACCCAAagcatg +tattatatactgtacataaaatatgaaagtacatcaaatatatattttattctgtacata +aaatatcaaagtacaccaGATATGTATTCTAtagtgtacataaaatatcaaagtacccaa +aCTATacattatatactgtacataaaatatgaaattacatcaaatatatattaggtacat +aaaatatgaaagtacatcaaatatagattatatactgtacataaaatatcaatgtacccc +aaatatatattttatactctaCATGAAATATCAAAGTTCACAAACCATAtcttatatact +gtacataaaatatcaaagtacccaaGGTATATATTCTATACTGTacaaaaaatatcaaag +tacccaaagcatgtattatatactgtacataaaatatgaaagtacatcaaatatagattt +tattctgtacataaaatatcaaagtacaccaGATATATATTCTAtagtgtacataaaata +tcaaagtaccaaAACTATacattatatactgtacataaaatatgaaattacatcaaatat +atattaggtacataaaatatgaaagtacatcaaatatagattatatactgtacataaaat +atcaatgtaccccaaatatatattttatactctaCATGAAATATCAAAGTTCACAAACCA +TAtcttatatactgtacataaaatatcaaagtacccaaGGTATATATTCTATACTGTaca +aaaaatatcaaagtacccaaagcatgtattatatactgtacataaaatatgaaagtacat +caaatatagattttattctgtacataaaatatcaaagtacaccaGATATATATTCTAtag +tgtacataaaatatcaaagtacccaaaCTATacattatatactgtacataaaatatgaaa +ttacatcaaatatatattatattaggtacataaaatatgaaagtacaTCAAATATAGATT +ATATACTGTACATTAAATACCAAAGTaccccaaatatatattttatattgtacatGAAAT +ATCAAAGTTCacaaactatatattatatactgtacatgtAATATCAAAGTACCCGAGGTA +TATATTCTATActgtacaaaaaataacaaagtaccaaaagcatttattatatactgtaca +taaaatatgaaagtacatcaaatatagattttattctgtacataaaatatcaaagtacac +caGATATATATTCTAtagtgtacataaaatatcaaagtacccaaaCTATacattatatac +tgtacataaaacatgaaattacataaaatatatattatattaggtacataaaatatgaaa +gtatatCAAATATAGATTATATACTGTACATTAAATAGCAAAGTaccccaaatatatatt +ttatactgtaCATGAAATATCAAAGTTCacaaactatatattatatactgtacatgtAAT +ATCAAAGTACCCGAGGTATATATTCTATActgtacaaaaaataacaaagtaccaaaagca +tgtattatatactgtacctaaaatatgaaattacatcaaatatatattttattctgtaca +taaaatatcaaagtacaacAGATATATATTCTAtagtgtacataaaatatcaaagtaccc +aaaCTATacattatatactgtacataaaatatgaaattacatcaaatatatattaggtac +ataaaatatgaaagtacatcaaatatagattatatactgtacataaaatatcaaagtacc +ccaaatatatattatatactgtacatgaAATATCAAAGTTCacaaactatatattatata +ctgtacataaaatatcaaagtacccaaGGTATATATTCTATACTGTacaaaaaatatcaa +agtacccaaagcatgtattatatactgtacataaaatatgaaagtacatcaaatatatat +tttattctgtacataaaatatcaaggTACACCAGATATATATTCTATAGTGTACATAAAA +TAGCAAAGTACACAAACTAtaaattatatactgtacataaaatatgaaattacatcaaat +atatattaggtacataaaatatgaaagtacatcaaatatagattatatactgtacataaa +atatcaatgtaccccaaatatatattttatactctaCATGAAATATGAAAGTTCACAAAC +CATATAttgtatactgtacataaaatatcaaagtacccaaGGTATGTATTCTATACTGTa +caaaaaatatcaaagtacccaaagcatgtattatatactgtacataaaatatgaaagtac +atcaaatatatattttattctgtacataaaatatcaaagtacaccaGATATATATTCTAt +agtgtacataaaatatcaaaggaCCCAAACTATacattatatactgtacataaaatatga +aattacatcaaatatatattaggtacataaaatatgaaagtacaTCAAATATAGATTACA +TACTGTACATTAAATACCAAAGTACCccgaatatatattttatactgtgCATGAAATATC +AAAGTTCacacactatatattatatactgtacataaaatatcaaagtacccaaGGTATAT +ATTCTATACTGTacaaaaaatatcaaagtacccaaagcatgtattatatactgtacataa +agtACGAAAgtacatcaaatatatattttattctgtacataaaatatcaaggTACACCAG +ATATATATTCTAtagtgtacataaaatatcaaagtacccaaactataaattatatactgt +acataaaatatgaaattacatcaaatatatattatattaggtacataaaatatgaaagta +caTCAAATATAGATTATATACTCTACATTAAATACCAAAGTAccccaaatatatatttga +tactgTACATGAAATATCAAATTTCacaaactatatattatatactgtacataaaatatc +aaagtacccaaGGTATATATTCTATACTGTACAAAAAATATCAAACTACCAAAagcatgt +attatatactgtacctaaaatatgaaagtacatcaaatatatattttattctgtacataa +aatatcaaggTACACCAGATATATATTCTATAGTGTATATAAAATAGCAAAGTACACAAA +CTAtaaattatatactgtacataaaatatgaaattacatcaaatatatattaggtacata +aaatatgaaagtacatcaaatatagattatatactgtacataaaatatcaatgtacccca +aatatatattttatactctaCATGAAATATCAAAGTTCACAAACCATATAttgtatactg +tacataaaatatcaaagtacccaaGGTATGTATTCTATACTGTacaaaaaatatcaaagt +acccaaagcatgtattatatactgtacataaaataggAAAgtacatcaaatatatatttt +attctgtacATAAAGTATCAAAGTACACCAGACATATATTCTATAgagtacataaaatat +caaagtacccaaaCTATacattatatactgtacataaaatatgaaattacatcaaatata +tattatattaggtacataaaatatgaaagtacaTCAAATATAGATTATATACTGTACATT +AAATACGAAAGTaccccaaatatatattttatactgtaCATGAAATATCACAGTTCacac +actatatattatatactgtacataaaatatcaaagtacccaaGGTATATATTCTATACTG +Tacaaaaaatatcaaagtacccaaagcatgtattatatactgtacataaaatatgaaagt +acatcaaatatatattttattctgtacataaaatatcaaagtacaccaGATATATATTCT +AtagtgtacataaaatatcaaaggaCCCAAACTATacattatatactgtacataaaatat +gaaattacatcaaatatatattaggtacataaaatatgaaagtacaTCAAATATAGATTA +CATACTGTACATTAAATACCAAAGTACCccgaatatatattttatactgtaCATGAAATA +TCAAAGTTCacacactatatattatatactgtacataaaatatcaaagtacccaaGGTAT +ATATTCTATACTGTacaaaaaatatcaaagtacccaaagcatgtattatatactgtacat +aaagtACGAAAgtacatcaaatatatattttattctgtacataaaatatcaaggTACACC +AGATATATATTCTAtagtgtacataaaatatcaaagtacccaaactataaattatatact +gtacataaaatataaaattacatcaaatatatattatattaggtacataaaatatgaaag +tacaTCAAATATAGATTATATACTCTACATTAAATACCAAAGTAccccaaatatatattt +gatactgTACATGAAATATCAAATTTCacaaactatatattatatactgtacataaaata +tcaaagtacccaaGGTATATATTCTATACTGTACAAAAAATATCAAACTACCAAAagcat +gtattatatactgtacctaaaatatgaaagtacatcaaatatatattttattctgtacat +aaaatatcaaggTACACCAGATATATATTCTATAGTGTATATAAAATAGCAAAGTACACA +AACTAtaaattatatactgtacataaaatatgaaattacatcaaatatatattaggtaca +taaaatatgaaagtacatcaaatatagattatatactgtacataaaatatcaatgtaccc +caaatatatattttatactctaCATGAAATATCAAAGTTCACAAACCATATAttgtatac +tgtacataaaatatcaaagtacccaaGGTATGTATTCTATACTGTacaaaaaatatcaaa +gtacccaaagcatgtattatatactgtacataaaataggAAAgtacatcaaatatatatt +ttattctgtacATAAAGTATCAAAGTACACCAGACATATATTCTATAgagtacataaaat +atcaaagtacccaaaCTATacattatatactgtacataaaatatgaaattacatcaaata +tatattatattaggtacataaaatatgaaagtacaTCAAATATAGATTATATACTGTACA +TTAAATACGAAAGTaccccaaatatatattttatactgtaCATGAAATATCACAGTTCac +acactatatattatatactgtacataaaatatcaaagtacccaaGGTATATATTCTATAC +TGTacaaaaaatatcaaagtacccaaagCATGTATTACaaactgtacataaaatatgaaa +gtacatcaaatatatattttattctgtacataaaatatcaaagtacaccaGATATATATT +CTAtagtgtacataaaatatcaaagtacccaaaCTATacattatatactgtacataaaat +atgaaattacatcaaatatatattatattaggtacataaaatatgaaagtacatcaaata +tagattatatactgtacataatatATCAAAGTAccccaaatatatattatatactctaCA +TGAAATATCAAAGTTCacaaactatatattatatactgtacataaaatatcaaagtaccc +aaGGTATATATTCTATACTgcacaaaaaaatcaaagtacCCAAAGCATgaattatatact +gtatttaaaatatgaaagtacatcacatatatattttattctctacATAATATATCAAAG +TACACCAGATATATATTCTATAGTGTACGTAAAATAACAAAGTACACAAACTAtaaatta +tatactgtacataaaatatgaaattacatcaaaaatatattaggtacataaaatatgaaa +gtacatcaaatatagattatatactgtacataaaatatcaatgtaccccaaatatatatt +ttatactctaCATGAAATATCAAAGTTCACAAACCATATAttgtatactgtacataaaat +atcaaagtacccaaGGTATGTATTCTATACTGtacaaaaaatatcaaagaacCCAAagca +tgtattatatactgtgcataaaatatgaaagtacatcaaatatatattttattctgtaca +taaaatatcaaagtacaccaGATATATATTCTAtagtgtacataaaatatcaaagtaccc +aaaCTATacattatatactgtacataaaatatgaaattacatcaaatatatattaggtac +ataaaatatgaaagtacatcaaatatagattatatactgtacataaaatatcaatgtacc +ccaaatatatattttatactctaCATGAAATATCAAAGTTCACAAACCATGTAttgtata +ctgtacataaaatatcaaagtacccaaGGTATCTATTCTATACTGTacaaaaaatatcaa +agtacccaaagcatgtattatatactgtacataaaatatgaaagtacatcaaatatatat +tttattctgtacataaaatatcaatgtACACCAGATATATATTCTATAGTgttcataaaa +tatcaaagtacccaaaCTATacattatatactgtacataaaatatgaaattacatcaaat +atatattatattaggtacataaaatatgaaagtacaTCAAATATAGATTATATACTGTAC +ATTAAGTACCAAAGTaccccaaatatatattttatactgtaCATGAAATATCAAAGTTCa +caaactatatattatatactgtacataaaatatcaaagtactcAAGGTATATATTCTATA +ctgtacaaaaaataacaaagtaccaaaagcatgtattatatactgtacctaaaatatgaa +attacatcaaatatatattttattctgtacataaaatatcaaagtacaccaGATATATAT +TCTAtagtgtacataaaatatcaaagtacccaaactatttattatatactgtacataaaa +tatgaaattacatcaaatatatattatattaggtacataaaatatgaaagtacatcaaat +atagattatatactgtacataaaataacaatgtaccccaaatatatattttatactctaC +ATGAAATATCAAAGTTCACAAACCATATCTTAtaaactgtacataaaatatcaaagtacc +caaGGTATATATTCTATACTGTacaaaaaatatcaaagtacccaaagcatgtattatgta +ctgtacataaaacatgaaagtacatcaaatatatattttattctgtacatgaaatatcaa +agtacccaaaacatgtattatatactgtacataaaatatgaaagtacatcaaatatatat +tttattctgtacATGAAATATCGAAGTATACCAGATATATATTCTAtagtgtacataaaa +tatcaaagtacccaaaCTATacattatatactgtacataaaatatgaaattacatcaaat +atatattatattaggtacataaaatatgaaagtacatgaaatatagattatatactgtac +ataaaatatcaaggtaccccaaatatatattatatactctaCATGAAATATCAAAGTTCt +caaactatatattatatactgtacataaattATCAAAGTACCCAAGGTATATATTCTATA +ctgtacaaaaaataacaaagtacctaaaacatgtataatatactgtacataaaatatgaa +agtacatcaaatatatatttttttctgtacataaaatatcaaagtacacccGATATATAT +TCTAtagtgtacataaaatatcaaagtacccaaaCTATACATTATATactgtaaataaaa +tatgaaattacatcaaatatattttatattaggtacataaaatatgaaagtacatcaaat +atatattttattctgtacataaaatatcaaagtacaccaGA +>NC_060938.1 Homo sapiens isolate CHM13 chromosome 14, alternate assembly T2T-CHM13v2.0 +GGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaAGAATAGAAAGG +GACAGGGCTGAAGAACACAggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggatagGGCTGAAGAACAGAGGTCGCTTCATTTAGAAACgaggcggggt +cagaggaatagaaagggataggactgaagaacacaggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggataggcctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggacaGGACAGAAGAACACAggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggatagggctgaagaacacaggtcgctgc +atttagaaaggacgcggggtcagaggaatagaaagggacaGGACAGAAGAACACAggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacag +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacaGGACAGAAGAAC +ACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAA +GAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggaca +gggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gatagGGGTGAAGAACAGAGGTCactgcatttagaaaggaggcggggttagaggaataga +aagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaagga +ggcggggttagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggatgGGCCTGAAGAACAGAggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggatagggatgaagaacacaggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggatagGCCTGAAGAACAGAggtcg +ctgcatttagaaaggaggcggggtcagaAGAATAGAAAGGGATAGGCCTGAAGAACAGAg +gtcgctgcatttagaaaggaggcggggttagaggaatagaaagggacagggctgaagaac +acaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacaggactgaa +gaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacagggc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggaca +GGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacagggctgaagaacacaggtcactgcatttagaaaggaggcggggtcagaggaa +tagaaagggacagggctgaagaacacaggttgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggataggactgaagaacacaggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggataggcctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacaGGACAGAAGAACACAggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggatagggctgaagaacacaggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAAGAACAGAg +gtcgctgcatttagaaaggaggcggggtcagTAGAATAGAAAGGGAGAGGACAGAAGAAC +ACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggctgaa +gaacacaggtcgctgcatttagaaaggaggcggggttagaggaatagaaagggatagggc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggata +gggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggatgGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggatgGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggatgcg +gggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggataggcctgaagaacacaggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAAGAACAGAGGTCG +CTTcatttagaaaggaggcggggtcagaggaatagaaagggatgGGGCTGAAGAACAGAg +gtcgctgcatttagaaaggaggcggggtcagTAGAATAGAAAGGGACAGGACAGAAGAAC +ACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacagggctgaa +gaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacagggc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggagG +GGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatGGAAAGG +GACGGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtTAGA +GGTATAGAAAGGGACAGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggatagGCCTGAAGAACAGAggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacagggatgaagaacacaggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggatagGGCTGAAGAAAACAggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggactgggctgaagaacacag +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAAGAAC +AGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggctgaa +gaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggataggac +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggaca +GGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggatagGGCTGAAGAACAGAGGTCGCTTcatttagaaaggaggcg +gggtcagaggaatagaaagggatgGGGCTGAAGAACAGAggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacGGGGCTGAAGAACAGAggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggatagGCCTGAAGAACAGAggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggctgaagaacacag +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAAGAAC +AGAGGTCGCTTCATTTAGAAACgaggcggggtcagaggaatagaaagggataggactgaa +gaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggataggcc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggaca +GGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacaggactgaagaacacaggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggacaGGGCTGAAGAACATAggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcactgcatttagaa +aggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcg +ctgcatttagaaaggaggcgggctcagaggaatagaaagggataggactgaagaacacag +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGACAGAAGAAC +ACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatgGGGCTGAA +GAACAGAGGTCGCAgcatttagaaaggaggcggggtcagaggaatagaaagggacaGGGC +TGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggata +gggctgaagaacacaggtcgctgcctttagaaaggaggcggggtcagaggaatagaaagg +gatagGGCTGAAGAACAGAGGTCGCTTcatttagaaaggaggcggggtcagaggaataga +aagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggatagGGCTGAAGAACAGAGGTCGCTTCATTTAGAAACga +ggcggggtcagaggaatagaaagggataggactgaagaacacaggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggataggcctgaagaacacaggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggacaGGACAGAAGAACACAggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggctgaagaacacag +gtcgctgcatttagaaaggacgcggggtcagaggaatagaaagggacaGGACAGAAGAAC +ACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacagggctgaa +gaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggacaGGAC +AGAAGAACACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggata +gGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggatagGGGTGAAGAACAGAGGTCactgcatttagaaaggaggcggggttaga +ggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcattt +agaaaggaggcggggttagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggatgGGCCTGAAGAACAGAggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggatgaagaacacag +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGCCTGAAGAAC +AGAggtcgctgcatttagaaaggaggcggggtcagaAGAATAGAAAGGGATAGGCCTGAA +GAACAGAggtcgctgcatttagaaaggaggcggggttagaggaatagaaagggacagggc +tgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggaca +ggactgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagg +gacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggacaGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggacagggctgaagaacacaggtcactgcatttagaaaggaggcggggt +cagaggaatagaaagggacagggctgaagaacacaggttgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacaggtcgctgcatttagaaagga +ggcggggtcagaggaatagaaagggataggactgaagaacacaggtcgctgcatttagaa +aggaggcggggtcagaggaatagaaagggataggcctgaagaacacaggtcgctgcattt +agaaaggaggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcgctgc +atttagaaaggaggcggggtcagaggaatagaaagggacaGGGCTGAAGAACAGAggtcg +ctgcatttagaaaggaggcggggtcagaggaatagaaagggacaGGACAGAAGAACACAg +gtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagggctgaagaac +acaggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggatagGGCTGAA +GAACAGAggtcgctgcatttagaaaggaggcggggtcagTAGAATAGAAAGGGAGAGGAC +AGAAGAACACAggtcgctgcatttagaaaggaggcggggtcagaggaatagaaagggata +gggctgaagaacacaggtcgctgcatttagaaaggaggcggggttagaggaatagaaagg +gatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaataga +aagggatagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcagaggaa +tagaaagggacagggctgaagaacacaggtcgctgcatttagaaaggaggcggggtcaga +ggaatagaaagggatgGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcggggt +cagaggaatagaaagggatgGGGCTGAAGAACAGAggtcgctgcatttagaaaggaggcg +gggtcagaggaatagaaagggacagggctgaagaacacagg +>NC_060939.1 Homo sapiens isolate CHM13 chromosome 15, alternate assembly T2T-CHM13v2.0 +TATGGGGACATTGTGAgaaatctctgcactgatcacccaggtgatgtaactgttGTGTAA +CCTCTGCCTACAGGGGAATTGTGAGAGATCTCGTCACTCATTACCCAAGTGATGTAACCA +TTGCCTAGGCTTTGCGTAcagggggctttgtgacatacctttgcactgatcacccaggtg +atgtaacacaTCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactgatcact +taGGTGATGTAACACTTTTATAATCACTGCCTACAGGGAATTTTGAcaaatctctgcact +gatcacctaggtgatgtaactcttgtctaccCTCTGTCCAATggggcattgtgaaatatc +tctgcactgatcacccaggtgattcAACTCTTGACTAGGAACTGCCTACAGAGgttattg +tgaaatatctctgcactgatcaacAAGGTGGTGTAAACCTTGTCCAAGTGCTGCCTACAG +GGGCGTTTCCATATATCCCTGAACTGATGAcaaaggtgatgtaactctttcCTAGGCTAT +GCCTACAGGGTACATTGGACATatatctgcactgatcacccaggtgatgcaaaTCTTGCC +TAGGGTTTGCCTTCAGGGGACATCGTGACATATCTCTTCAATGATCACTCATGTGATGCA +TCTCTTGCCTATGCTTTGCCtacaggggacattgtgacatatctcacCACTGATCTCCCA +GGTGCTGTAACTTTAGTCTAGGCTCTGGCTACacggcattgtgacatatcactgcactga +tcaaccaggtgatataactcttgtataggctctgcctacagggggaTTGTGACCTACCTc +tacactgatcacccaggtgatacaACTCTTCTCTAGTATCTGCCTACAAGTACTTTGTGA +CATATccctgcactgatcacccaggtgatctAACTCTGGTCTAAGCTCTTCCTAAAGGGG +CATTGTGACagatctctgcactgatcactctGGAGATGTAAGGATTGTCTAGGCTCTGCT +TCAAGGGGCCTTgtcacatatctctgcactgatcacccaggtgatgtaactcttgtttAG +GCTCTGCTTCGAGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGATGTAACA +CTTTGGTAGGCTCGGTCTACAGGGGAATcttgacatatctctgcactgttAACCGAGGTG +AtttaactcttgtctaggctgtGCCCACAGGGGGATTGAGACATATCTCTGCAGTAATCC +CGAGGTGATACAACTCTTGCCTGGTCTCCGCCTACTGTGGACATTGTGACATAACTCTGC +ACTGATCTCCCAGGTGCTGTAACTTTAGTCTAGGCTCTGGCTACacggcattgtgacata +tcactgcactgatcacccaggcgATATAACTCTTCTCTAGGATCTGACCACAGGGTGCTT +TTTGACATATCCCTgcaatgatcacccaggtgatatacCACTTGCcaaggctctgcctac +aggggcattacaatgtatctctgcactgatcacctaggtcTTGTAGCTATTTTCTAGGAT +CTGCCTACAGGGTGCTTTGTGACGTGTCCCAGCAAGGATTACCCAGGTGATGTACCTCTC +ATCAAGTCCCTGCCTACAGGCACATTGTGatgtatctctgcactgatcacctcgGTCATG +TAAATTTTTTCTAGGCTCTACCAACGACGGCATtctgacatatctctgcactaaTCATCC +aagtgatgtaactcttgtctaggatGTGCCTAAATTAACTTTTTGACATAACCCTGTACT +GATCATCCAGGTGTTGGAGCTTTTGTCTGGGCTCTGCCtaagggggcattgtgacatatt +tctgcatTGATCACCCAGGTGGCGAACTCTACTCTCggatctgcctatgggggcattttg +agaaatctctgcactgatcaccaaGGTGATGTAACTGTTGTGTAACCTCTGTCTACAGGG +GAATTGTGAGAGATCTCGCCACTGATTACCCAAGTGATGTAATCGTTGTCTAGGCTTTGC +GTAcagggggctttgtgacatacctttgcactgatcacccaggtgatgtaacacaTCTAA +GTTCGGCCTAAAggagctttgtgacatatctctgcactgatcgcTTAGGTGATGTAACAC +TTTTATAATCACTGGCTACAGGGAATTTTGACAAACCTCTGCACTGgtcacctaggtgat +gtaactcttgtctaccCTCTGTCCAACggggcattgtgaaatatctctgcactgatcacc +caggtgattcAACTCTAGACTAGGGACTGCCTACAGAGgttattgtgaaatatctctgca +ctgataaACTAGGTGGTGTAACCCTTGTCcaagctctgcctacaggggcgttTCCACATA +TCCCTGAACTGATGACagaggtgatgtaactcttgcctAGGCTTTGCCTACAGGGAACAT +TGGACATATATCTGCACTGATTacccaggtgatgcaactctttcctaggctttgcctaca +ggggacattgtgacatatctcttcAATGATCACTCATGTGATGCATCTCTTGCCTAGGCT +TTGCCtacaggggacattgtgacatatctctgcactgatgtCCCAGGTTCCGTAACTTTA +GTCTAAGCTCTGGCTACacggcattgtgacatatcactgcactgatcaaccaggtgatat +aactcttgcataggctctgcctacagggggaTTGTGACCTacctctgcactgatcaccca +ggtgatataaCTCTTCTCTAGGATCTTCCTACAGGGTACTTTGTGACATATCCCTGCACT +GGTCACCCAGGTGATTTATCTCTGGTCTAAGCTCTGCCTAAAGGGGCCTTgtcacatatc +tctgcactgatcacccaggtgatgtaactcttgtctaggctctgcttcctgggcatATTG +TGACATATCTATGCACTGATCACCTTAGTGATGTAACACTTTGGTAGGCTAGGCCTACAG +GGGAATcttgacatatctctgcactgttAACCGAGGTGAtttaactcttgtctaggctgc +GCCCACAGGGGGATtgagacatatctctgcactgatcccGAGGTGATACAACTCTTGCCT +GGTCTCTGCCTACTgtggacattgtgacatatctctgcactgatctccCAGGTGCTGTAA +CTTTAGTCTAGGCTCTGGCTACacggcattgtgacatatcactgcactgatcacccaggc +gATATAACTCTTCTCTAGGATCTGACCACAGGGtgctttgtgacatatccctgcaatgat +cacccaggtgatatacCACTTGCcaaggctctgcctacaggggcattgcaatgtatctct +gcactgatcacctaggtcTTGTAGCTATTTTCTAGGATCTGCCTACAGGGTGCTTTGTGA +GGTGTCCCAGCAAGGATTACCCAGGTGATGTACCTCTCAtcaaggctctgcctacaggCA +CATTGTGatgtatctctgcactgatcacctaggaCATGTAACTTTTTTCTAGGCTCTACC +TACGatggcattgtgacatatctctgcactaaTCATCCaagtgatgtaactcttgtctag +gatGTGCCTAAATTAACTTTTTGACATAACCCTGTACTGATCATCCAGGTGATGGAGctt +ttgtctaggctctgcctaagggggcattgtgacatatttctgcatTGATCCCCCAGGTGT +CGAACTCTTCTCTCATatctgcctatgggggcattgtgagaaatctctgtactgatcacc +caggtgatgtaactgttGTGTAACCTCTGCCTACAGGGGAATTGTGAGAGATCTCGCAAC +TGATTACCCAAGTGATGTAACCGTTGTCTAGGCTTTGCGTACAGGGGACTTTGTGACATA +CctttgcactgatcacccaggtgatgtaacacaTCTAAGTTCGGCCTAAAggagctttgt +gacatatctctgcactgatcacttaGGTGATGTAACACTTTTATAATCACTGCCTACAGG +GAATTTTGAcaaatctctgcactgatcacctaggtgatgtaactcttgtctaccCTCTGT +CCAACggggcattgtgaaatatctctgcactgatcacccaggttaTTCATCTTTTCACTA +GGAACTGCCTACAGAGgttattgtgaaatatctctgcactgataaACTAGGTGGTGTAAC +CCTTCTCCAAGCTCTGCCTACAGGGACGTTTCCACATATCCCTGAACTGATGACagaggt +gatgtaactcttgcctaggctttgcctacagggaacattgtgacatatctcttcAATTAT +CACTCATGTGATGCATCTCTTGCCTATGCTTTGCCtacaggggacattgtgacatatctc +ttcACTGATCTCCAAGGTGCTGTAACTTTATTCTAGGCTCTGGCTACacggcattgtgac +atatcactgcactgatcaACCAGGTGATATAACCCTTGtataggctctgcctacaggagg +ATTGTGACCTacctctgcactgatcacccaggtgatataactcttctctaggatctgcct +acagggtactttgtgacatatccctgcactgatcacccaggtgatctAACTCTGGTCTAA +GCTCTGCCTAAAGGGGCATTGTGACagatctctgcactgatcactctGGTGATGTAAGTA +TTGTCTAGGCTCTGCTTCAAGGGGCCTTgtcacatatctctgcactgatcacccaggtgt +tTTAACTCTTGTCTAAGGCTCTGCTTCCAGAGCATATTGTGACATATCTATGCCCTGATC +ACCTTAGTGATGTAACGCTTTGGTAGGCTCGGCCTACAGGGGAATcttgacatatctctg +cactgttAACCGAGGTGActtaactcttgtctaggctgtGCCCACAGGGGTATtgagaca +tatctctgcactgatcccGAGGTGATACAACTCTTGCCTGGTCTCTGCCTACTgtggaca +ttgtgacatatctctgcaatGATCTCCCAGGTGCTGTAACTTTAGTCTAGGCTCTGAATT +CACGGGCATTGTGACttatcactgcactgatcacccaggcgATATAACTCTTCTCTAGGA +TCTGACCACAGGGtgctttgtgacatatccctgcaatgatcacccaggtgatatacCACT +TGCcaaggctctgcctacaggggcattgcaatgtatctctgcactgatcacctaggtcTT +TGTAGCCTATTTTCTAGGATCTGCCTACAGGGTTCTTTGTGACGTGTCCCAGCAAGGATT +ACCCAGGTGACGTACCTCTCATCAAGACTCTGCCTACAGGCACATTGTGatgtatctctg +cactgatcacctaggtcaTGTAACTTTTTTCTAGGCTCTACCTACGatggcattgtgaca +tatctctgcactaaTCATCCaagtgatgtaactcttgtctaggatGTGCCTAAATTAACT +TTTTGACATAACCCTGTACTGATCATCCAGGTGATGGAGcttttgtctaggctctgccta +agggggcattgtgacatatttctgcatTGATCACCCAGGTGGCGAACTCTTCTCTCggat +ctgcctatgggggcattgtgagaaatatctgcactgatcacccaggtgatgtaacagtTG +TGTAACCTCTGCCTACAGGGGAATTGTGAGAGATCTCGTCACTGATTACCCAAGTGATGT +AACCGTTGTCTAGGCTTTGTGTACAAGGGGCTTTGTGACATACatttgcactgatcaccc +aggtgatgtaattCATCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactga +tcattTAGGTGATGTAACACTTTTATAATCACTGCCTACAAGGAATTTTGAcaaatctct +gcactgatcacctaggtgatgtaactcttgtctaccCTCTGTCCAACggggcattgtgaa +atatctctgcactgatcacccaggtgattcAACTCTTGACTAGGAACTGCCTACAGAGgt +tattgtgaaatatctctgcactgataaACTAGGTGGTGTAACCCTTGTCCAAGCTCTGCC +TTCAGGGGCGTTTCCACATATCCCTGAACTGATGACAAAAGTCATGTAACTCTTGCCTAG +GCTTTGCCTACAGGGAACATTGGACATatatctgcactgatcacccaggtgttGCAACTC +TTGCCTTGGCTTTGCCTACAGGGGACATCGTGACATATCTCTTCAATGATCTCTCATGTG +ATGCATCTCTTGCCTAGGCTTTGCCtacaggggacattgtgacatatctctgcactgatc +tccCAGGTGCTGTAACTTTAGTCTAAGCTCTGGCTAcaaggcattgtgacatatcactgc +actgatcaaccaggtgatataactcttgcataggctctgcctacagggggaTTGTGACCT +acctctgcactgatcacccaggtgatataaCTCTTCTCTAGGATCTTCCTACAGGGTACT +TTGTGACATATccctgcactgatcacccaggtgatttATCTCTGGTCTAAGCTCTGCCTA +AAGGGGCCTTGTCACATATCTCTGCACTAATCACTCTGGTGATGTAAGTATTTTCTAGGC +TCTGCTTCAAGGGGCCTTGTCACATacctctgcactgatcacccaggtgatgtaactctt +gtctaggctctgcttcCAGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGAT +GTAACACTTTGGTAGGCTCGGCCTACAGGGGAATcttgacatatctctgcactgttAACA +GAGGTGActtaactcttgtctaggctgtGCCCACAGGGGGATtgagacatatctctgcac +tgatcccGAGGTGATACAACTCTTGTCTGGTCTCTGCCTTCTgtggacattgtgacatat +ctctgcaatGATCTCCCAGGTGCTGTAACTTTAGTCTAGGCTCTGGCTACacggcattgt +gacatatcactgcaaTGATCACCCAGGCGATATAACTCTTCTCTAGGATCTGACCACAGG +GTGCTTTGTGATATATCCCTGCAATGATAACCCAGGTGATATACCACTTGCcaaggctct +gcctacaggggcattgcaatgtatctctgcactgatcacctaggtcTTGTAGCTATTTTC +TAGGATCTGCCTACAGGGTTCTTTGTGACGTGTCCCAGCAAGGATTACCCAGGTGACGTA +CCTCTCATCAAGACTCTGCCTACAGGCACATTGTGatgtatctctgcactgatcacccag +gtcaTGTAACTTTTTCTAGGCTCTACCTATGatggcattgtgacatatctctgcactaaT +CATCCAAgtgatgtaacccttgtctaGGATGTGCCTAAATTAACTTTTTGACATAACCCT +GTACTGATCATCCAGGTGATGGAGcttttgtctaggctctgcctaagggggcattgtgac +atatttctgcatTGATCACCCAGGTGGCAAACTCTTCTCTCggatctgcctatgggggca +ttgtgaGAAATCTCTGCACTGAtaacccaggtgatgtaactgttGTGTAACCTCTGCCTA +CAGGGGAATTGTGAGAGATCTCGTCACTGATTACCCAAGTGATGTAACCGATGTCTAGGC +ATTGCATAcagggggctttgtgacatacatttgcactgatcacccaggtgatgtaacaca +TCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactgatcacttaGGTGATGT +AACACTTTTATAATCACTGCCTACAGGGAATTTTGAcaaatctctgcactgatcacctag +gtgatgtcACTCTTGTCTACCCTCTGTGCAACGGGGccttgtgaaatatctctgcactga +tcacccaggtgattcAACTCTTGACTAGGAACTGCCTACAGAgtttattgtgaaatatct +ctgcactgataaACTAGGTGGTGTAAACCTTGTCcaagctctgcctacaggggcgttTCC +ACATATCCCTGAACTGATGAcaaaggtgatgtaactcttgcctAGGCTTTGCCTACAGGG +AACATTTGACATatatctgcactgatcacccaggtgatgcaactcttgcctaggctttgc +ctacaggggacattgtgacatatctcttcAATGATCACTCATGTGATGCATCTCTTGCCT +AGGCTTTGCCTACAGgtgacattgtgacatatctctgcactgatctccCAGGTGCTGTAA +CTTTAGTCTAGGCTCTGGCTACacggcattgtgacatatcactgcactgatcaACCAGGT +GATATAACTCTTGTATAGGCCTCTGCCTACAGGGGGATTGTGACCTAccactgcactgat +cacccaggtgatataactcttctctaggatctgcctacagggtactttgtgacatatccc +tgcactgatcacccaggtgatctAACTCTGGTCTAAGCTCTGCCTAAAGGGGCATTGTGA +CagatctctgcactgatcactctGGTGATGTAAGTATTGTCTAGGCTCTGCTTCAAGGGG +CCTTGTCATATacctctgcactgatcacccaggtgatgtaactcttgtctaggctctgct +tcCAGGGCATATTGTGACATATCTAGGCACTGATCACCTTAGTGATGTAACACTTTGGTA +GGCTCGGCCTACAGGGGAATcttgacatatctctgcactgttAACCGAGGTGATTTAACT +TTTGTCTAGGCTGTGCCCACAGGGGGATtgagacatatctctgcactgatcccGTGGTGA +TAAAACTCTTGCCTGGTCTCTGCCTACTGTGGACATtgagacatatctctgcactgatct +ccCAGGTGCTGTACTTTAGTCTAGGCTGTGGCTACacggcattgtgacatatcactgcac +tgatcacccaggcgATACAGCTCTTCTCTAGGATCTGACCACAGGGTGCTTTGTGACATC +TCCCTAcaatgatcacccaggtgatatacCACTTGCcaaggctctgcctacagggcaTTG +CAatgtatctctgcactgatcacctaggtcTTGTAGCTATTTTCTAGGATCTGCCTACAG +GGTGCTTTGTGACGTGTCCCAGCAAGGATTACCCAGGTGATGTACCTCTCAtcaaggctc +tgcctacaggCACATTGTGatgtatctctgcactgatcacctaggtcaTGTAACTTTTTC +CTAGGCTCTACCTACGatggcattgtgacatatctctgcactaaTCATCCaagtgatgta +actcttgtctaggatGTGCCTAAATTAACTTTTTGACATAACCCTGTACTGATCATCCAG +GTGATGGAGcttttgtctaggctctgcctaagggggcattgtgacatatttctgcatTGA +TCACCCAGGTGGCGAACTCTTCTCTCGGGtctgcctatgggggcattgtgaGAAATCTCT +GCACTGAtaacccaggtgatgtaactgttGTGTAACCTCTGCCTACAGGGGAATTGTGAG +AGATCTCGTCACTGATTATCCAAGTGATGTAACCGTTGTCTAGGCTTTGCAAAcaggggg +ctttgtgacatatatttgcactgatcacccaggtgatgtaacacaTCTAAGTTCGGCCTA +AAGGAGCTTTGTGACAtgtctctgcactgatcacttaGGTGATGTAACACTTTTATAATC +ACTGCCTACAGGGAATTTTGAcaaatctctgcactgatcacctaggtgatgtcACTCTTG +TCTACCCTCTGTGCAACGGGGccttgtgaaatatctctgcactgatcacccaggtgattc +AACTCTTGACTAGGAACTGACTACAGAGgttattgtgaaatatctctgcacttaTAAACT +AGGTGGTGTAAAACTTGTCcaagctctgcctacaggggcgttTCCACATATCCCTGAACT +GATGAcaaaggtgatgtaactcttgcctAGGCTTTGCCTACAGGGAACATTGGACATata +tctgcactgatcacccaggtgatgcaactcttgcctaggct +>NC_060940.1 Homo sapiens isolate CHM13 chromosome 16, alternate assembly T2T-CHM13v2.0 +ccttttgttttccattttcttttattttgagacattgtcttgctctgtcacctgggctga +agtaccgtggtgcaatcacagctcactgcagcctggacctctcaGGCTcactccatcctc +ccacctcctcctcctgaggacctgggactacaggtgcgcattgCCAATGCCTGGctagtc +ttttaatttttaatagagatggagtttcactacgttgcccagactgatcttgagctcctg +ggctgaagggatcctcccaccttggcctcccaaagtactgggatcacaggcatgagccgt +caCACCTGGCCATGgatgaaaacttttttctttttgtttctcttctcttttcttggcttt +cttttctttttgagacagtcttgctctgtcttgctCTGTGAAGTGACATCATCACAGCTC +TCAATAGTTTTCACTTCCCagacctcccaagctcaaatgatcctccctcctcagcctccc +gagcagctgagaccacaggcgcatgccaccatacccagatgattttttaattttttgtag +agacaggcccagactggtcttgaactcctgggctctagcagtcctcccacctcggtctcc +cagaatgttggaattacaggcaggagccaccgcgtcccacttgttttccattttctgtca +ttttagggGCTAGGGGCTAGGGGCTAGAGGAAGCAGAGGTGAACGTCATCATGCATCTTT +TTCTAACTGTCTTCTTGCTCACCCCTTTCAGAAAAGCATTGAGCTGGCCGGGCGTAgtag +gtcacgcctgtaatcccagcactttgggaggctgaggtgggtggatcacctgaggttggg +agttcaagaccagcctggccaaaatggagaaaccccatctctactaaaaaaatacaagat +tagccaggtgtgttagcaggtgcctgtaatcccagctactcaggagactgaggcaggaga +atcacctgaaccctggaggcggagcttggagtgagccgagattgtgccattgtactccag +cctgggcaacaagagcgagactccatctcaaaaaaagaaagaaaaagagaagcattGAGC +TCTTAGGAACGTGACGTGCATCCCCAGCTACACTTCTGTTACCACTTCAGCATCACCTTC +CTCCCCACTTCATCAAGTCTTTTACTCCAGACAGGCTGCAGCTGGTGACATGAAAGACCG +GTCAAGGCCAGCTAAGGCATCTGCTTGAGGCCTCCCGTGCCTAGGATGGGGCGCAGCCTG +CAGTTGGCTGTCACAGCCTTGTGTCAGAAACAccctttaaaatttaatgtttccTTCACG +GGTACCCTTTGGCATAAAAAAAGCCCAATCTgagccggacgcagtggctcacgcctgtaa +tcccagcacattgggaagccaaggtgggtggatcacgaggtcaggagttcaagaacagcc +tgaccaacatggtgaaaccccgtctctactaaaaatacaaaaattagttaggcatggtgg +cacacatgcctgtaatcccagctactcaggagcctgaggtaggagaactgcttgaaccca +gaaggcagaggttacagtgagcccagatcacgccactgcactctagcctgggcgacagag +caagactgtctcaaaaaaaaaaaaaaaaaaaaaagctccatcTGCAGTTATCTGTCGTTA +GAGTTTACAAAACAGAGACCTCTTCTGCAGTGTGTCTATccacatgtaaatatatgtaca +caaGATTTAATCTGTTGTTTTGCCCCAAATCTGCCACAAGAGGCTaaggaagagcaaaat +aaacGTCGCGATTCGCTTCTCACAGTTCTCAGCCCTTCGCGCTGAACTATTGCTGAGATG +GTGGGTTTTGCCAGCAGCCATTGTAGCCCCCGGGCCTGGCTGCATTGCTCACCTCCCTCA +GCCTTGTTCTGTCCCTGTCCATGAGATGGAAGTGGCTTTCTCCAGTCAGCTGTGTGTGCA +GAGACCGGGGGCTCCGGGCAGAGCCGAGTCCATCAGGACTGGAGGAAGTGCTCACAGCAG +GCAGGCTCCCTGGGCCCTGGGTGGGAGGCCTCAGGGATCCCCGTACCTCCTTGCTCACCA +GCCAGGCTCGACCTACTGCCCTGTGGGGCAGGTCAGGCTTTTTCCACAGCTCCCTCTCTG +GGAGGAGGGTCCTTCCAAGTGAGGGTGTGGTGTAGCTGGAGAATCCCTCTTTCTAGGGGA +TTTAAATAAGCAGCCCCAGCCggacgcggtggttcacgcctgtactcccagcactttggg +gggccgaggcgcacagatcacgaggtcaggagtttgagaccagcctggccaacatagtga +aaccccatctctactaaaaaaaacaatacaaaaagttagctgggcatggtggcaggtgcc +tgtaatcccagctacctgggaggctgaggcaggagaatggcttgaacccggaaggcagag +gttgcagtgagctgagattgcaccactgcactccagcccaggtgacagtgcaagactctg +tcgcaaaaaaaaaaaaaaaaaaaaaaaaaaaaattaaataagtaaataaataagcagcCG +CATGACCCATGCTGAGGACCCTCTGCCTCACGTTGgtggccacgtgtggtggctgcACGC +TGGGTGCCTGGGGATGGCTGTGTCCCCGAGTCAGCCCCAGAAGTGCCTACGCCTCTAGGA +CAGCTCAGAAGTGCTGACAGGTCGTGGCCTCTCAGGATGGGCTCTGGGTTGCAGCTTCAT +GCCTGGAGTGGCTCATGTTTGGGGGCAAGGTCATGGGCGTTTAAGAGCAGCGACTGGCCA +AGAACATGATCTGTATCAGCAGCAgcttttgagaatctgatgaaatcCCCAGAGCCCCAG +AAGGGCACCGGTGTGTTCCAGCTGGTGCACGTTCACAGGGCTTGTCTCCTCAGAGCGTTT +ATGGGGAAAAAGATGGAAATGTTCAAGCCCAGTCCGTACTGAGAAGCAAATCGAACTTCA +TACACTTGGTAGACATTTTCAgtggaaaaatattaacattttatggaATTCTTACTCTGC +TACGTCCCTAGCCAAGCTGTTTGTATGCATGACCTTGGTTAAACCTCAGTTGCCTCTAGA +CCCCCATTTCATAGGCAAGGAAGCTGGGAGAGGGTCCCCCCATTTCATAGGCAAGGAAAC +TCGGAGAGGGTCCCCCCATTTCATAGGCAAGGAAGCTCGGAGAGGGTCTCCCATTTCATA +GGCAAGGAAGCTGGGAGAGGGTCCCCCCATTTCATAGGCAAGGAAGCTCGGAGAGGATCC +CCCCATTTCATAGGCAAGGAAGCTGGGAGAGGGTCCCCCCATTTCATAGGCAAGGAAGCT +CGGAGAGGGTCCCCCATTTCACAGGCAAGGAAGCTGGGAGAGGGTCCCCCATTTCATAGG +CAAGGAAGCTGGGAGAGGGTCCCCCCATTTCACAGGCAAGGAAGCTGGGAGAGGGtcccc +ccatttcacagacaagtTCAGAGAGGCTCCCCCCATTTCATAGGCAGGGAAGCTGGGAGA +GGGtccccccatttcacagacaagtTCGGAGAAGGTCCCCCATTTCATAGGCAAGGAAGC +TGGGAGAGGGTCCCCCCATTTCACAGGCAAGGAAGTTCAGAGAGGGtccccccatttcac +agacaaggaagTTCGGAGAGGATCCCCCATTTCATAGGCAAGGAAGCTGGGAGATGGTCC +CCCCATTTTATAGGCAAGGAGTCTGGGAGAGTGTCCCCCCATTTCATAGGcaaggaggct +gggagagggtcCCCCCATTTCATAGGcaaggaggctgggagagggtcCCCCCATTTCATA +GGCAAGGAAGCTCGGAGAGGGCCAGTGCTTTTTAACGGTCACGCAGTTCTGAGCATCAGG +CTGTCAGCCTGGAGCCTGGCTTGGTACTGAGGTTCCCAGGATGTATAAAGAACTGAACAC +GCACCTTTGCTGTTGGCTCTTCTGTGCGAGTGCTCTGAGAGTTTTCTGTACTCCCGGCAA +GTTTGGGTTGGTACAGATTCACCACAGCGAATCTGACCACGTGGTGACCACAAGCACGCG +CTTACTGCGCGCCTAAGTTCACACTCCCTGGAGAAGCTCCTGCCCCAAGGCCGCAGCCTA +TGGGCCTTTGCGTCTACTCAGGACCATGAGGCTGTGTCCCCGAGCCTGGCCCGGGTAGTA +ACTGGCATGGCCTGCGGTGCTGGGGGCGTGTCCACAGGAGCTGGTGCCACAGAGGACACG +TGTGTCTGCTGTCTTCCTGGACTCGGTCGGACCAGTTTCCCAGTGTGTCCGTGAGGGTGA +CACTGAGTGAGACTTCTGGGATCCACACCTTTCCTGGGACCCTCACTCTTCCTGCCACAG +AAAGCACCTgtgaaagtctgagatcaagaaTGTGCACAGGGGAGGTGTCTGCAGGTCAAG +GTCCTGAGCTGATGTCTCACAGGCCTCTGGTAGAGACGAGATTGTTCGTGTCTCTGCGAA +GAAGGGCATGTTTTATTGCAGCCAAGTACAAAGTCCTCTCTGCCACTCGCTGGCTGGGAC +TGAGGTCATGTTCTGTCAGGTTCCAAAGAGCGCCAGGAAGACTCTGAGACCACAGAGCAC +GGCCTGctttctcccagcccctggtaaagATGTCCAGCCTGGGACCTCCCCCTGTATATA +GTGCTTTAAGTGGGAGAAGACCACCACCCAGATCAGGGGAGGACCTGTCCCCTGCAATGC +TGCTGCCTGCTTTTCAGATTGACTTGGGAGTGCTTGTGCTGACGGAGCATGTCCTGtggt +ttttccctttcttccctctgttGTTGTGCCTTTTCTGTAGGTACCTGCACCAGTCAGGGG +CCCTGACCATGGAGGCCCTGGAGGACCCTTCCCCCGAGCTCATGGAGGGCCCAGAGGAGG +ACATTGCTGACAAGGTAGGCCCTGGAGGGCTGGGTAGGTGGCAAGTAGGGGATTTAGAAC +ACAGCCACGCCTAAGGGCCGCTGCAGACACCCCGGGAGGTGGGGACAGCACAGCCGGAGG +TGACCCCATGTCCTCCAGGGCTCCCCAGACTGTCCATCCAGCCCCGATGCTCTTTGGCAG +GTTTCCCCAAGGGGTCTCGTGGCCATGTGAGAAAAAGGAGTCTTCCTGTTGTGCACGAAG +GGCCAGCTGGGAGGAGTGGACTGGGCAGTGAGTGAGCACCCTCGGGTATCCCACCCCCAC +TGTGTCTGAGTCGGGCTGGGGGACACCCAGACATTCAGTCCACCAGGCCCATGGAGACGC +GACCTGGGGCACCCATGATTTGGGAGAAAAGGGCTGGCCCTGCAGTTACTGCAGAGCCAA +CAGCCTGAGGAACGGGCTTCTCCTGGGGCCTTGAATGGAATGGGTGACAGCAGCCAGGGC +AAGGCAGCCTTGCCGTGGTCAAGACCCGCTtttcagccagatgtggtggctcacgcctgg +aatcccagcacattaggaggcctaggcgggcagatcacttgaggtcaggagtttgagatc +agcctggccaacatagtgaaaacccgtctctactaaaaatacaaaagttagccacgcatg +gtggcgggcaactgtaatcccagctatttgggaggctgaggcaggagaatcacttgaacc +tgggaggtggaggttgcagtgagccgagattgcacgactgcactccagcctgggcgacag +agggagactccgtctcacctTCTGCACCCCCTCACCTTCTGTGACCCCTTCACTTACTCC +TGTACCCCCTCAATTCCTCCTGTACCCCTCATCTCCTCCTGTACCCCCTCACCACCTCCT +GTACCCCCTCACCACCTCCTGTACCCCCTCACTACCTCCTGTAccccctcacctcctcct +gtACCCCCTCACCTCCTTGTGTACCCCCTCACCTCCTGTAccccctcacctcctcctgta +cccccccacctcctcctgTACCCCCTCACCTCCTCTTGCACTCCCATCTCCTCCTGTACC +CCCTCACCTCCTTGTGCACCCCCTCACCTCCTGTAccccctcacctcctcctgtaccccc +tcacctcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCTGTACCCCCTC +ACCTCCTTGTGCACCCCCTCACCTCCTGTAccccctcacctcctcctgtaccccctcacc +tcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCTGTACCCCCTCACCTC +CTTGTGCACCCCTCACCTCCTGTAccccctcacctcctcctgtACCCCCCTCACCTCTTC +CTGTACCCGCCTCACCTCCTCCTGCACTCCCATCTCCTCCTGTACCCCCTCACCTCCTTG +TGCACCCCTCACCTCCTGTAccccctcacctcctcctgtACCCCCCTCACCTCTTCCTGT +ACCACCTCCTCCTGTACCCCCTCACCTCCTCTTGCACCCCCCTTGCCTCCTGTACCCCCT +CACCTCCTTGTGCACCCCCTCACCTCCTGTACccccctcacctcctcctgtACCCGCCTC +ACCTCCTCCTGCACTCCCATCTCCTCCTGTACCCCCTCACCTCCTTGTGCACCCCCTCAC +CTCCTCCTATACCCCCTCACCTCCTCCTATAccccctcacctcctcctgcACTCCCATCT +CCTCCTGTACCCCCTCACCTCCTTGTGCACCCCTCACCTCCTGTAccccctcacctcctc +ctgtaccccctcacctcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCT +GTACCCCCTCACCTCCTTGTGCACCCCCTCACCTCCTGTAccccctcacctcctcctgta +ccccctcacctcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCTGTACC +CCCTCACCTCCTTGTGCACCCCTCACCTCCTGTAccccctcacctcctcctgtaccccct +cacctcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCTGTACCCCCTCA +CCTCCTTGTGCACCCCTCACCTCCTGTAccccctcacctcctcctgtaccccctcacctc +ctcctgtaccccctcacctcctcctgcACTCCCATCTCCTCCTGTACCCCCTCACCTCCT +TGTGCACCCCTCACCTCCTGTAccccctcacctcctcctgtACCCCCCTCACCTCTTCCT +GTACCACCTCCTCCTGTACCCCCTCACCTCCTCTTGCACCCCCCTTGCCTCCTGTACCCC +CTCACCTCCTTGTGCACCCCCTCACCTCCTGTACccccctcacctcctcctgtACCCGCC +TCACCTCCTCCTGCACTCCCATCTCCTCCTGTACCCCCTCACCTCCTTGTGCACCCCCTC +ACCTCCTCCTATAccccctcacctcctcctgtACCCCCTCACCTCCTTGTGCACCCCCTC +ACCTCCTGTAccccctcacctcctcctgtaccccctcacctcctcctgtaccccctcacc +tcctcctgtACCCCCTCACCTCCTTGTGCAACCCTCACCTCCTGTAccccctcacctcct +cctgtacccccctcacctcctcctgtaccccctcacctcctcctgcACTCCCATCTCCTC +CTGTACCCCCTTACCTCCTTGTGCACCCCTCACCTCCTGTAccccctcacctcctcctgt +ACCCCCCTCACCTCTTCCTGTACCCTTCACTTCCTCCTGTAccccctcacctcctcctgc +ACCCCCCTTACCTCCTGTAccccctcacctcctcctgtACCGCCTCACCTCCTCCTATAC +CCCCTCACCTCCTCCTATACCCCCTCACCTCTTCCTGCaccctcctcacctcctcctgcA +CCCCCATCTCCTCCTGTACCCCCCTCACCTCCTGTACCCCCTCATCTCCTGTACCCCCTT +ACCTCCTCCTGCACCCCTCACCTCCTGTAccccctcacctcctcctgctcccccacctcc +tcctatACCCCCATCTCCTCCTGTACTCTCTCACCTCCTCCTGTacctcctcacctcctc +ctgtACTTCACCTCCTCTTGCATCCCCACCACCTCCTCCCTACAACTTCTCTAGCATCTC +AAGTCTGCTGACCCAGGCCAAGTCCTCCTCTGCTCCCTTCACTCCTTCTCCTACCTCCGC +AGGTGTCTGATTCTCATCTTGGTGTGAACTCTCTGAGGGAGGGACCGAGACATGGATCTG +TCTGTCCCTTGCATCCATGGGCACCTGGGCTGCCTCTGTGAGCTGCATCTGGCTGAGCAG +AGACCCAACTGTGTGTTGGGGGGCTGAGTCTTGCTGCCCACCAGCCAGCCAGTCCAAAGG +CACCCCTGGGCCCCGAGCCCTCAGAGCTGCGGCACTGTGTGCATTTGTGGGTCGAATGAC +AGTGCTCCCCAAGACCCCGGCCCCATTAGGAGCTGCACCTTTGTGGGTTTATGGGACAAG +TTGGATCCAACACCAGCCTAGCTAGGTGGATCTGATTCTGTGCTGAGAAAATCCCCAGGC +GGCCTCCCAGGTTGTTCCCTTGGGGGTGCAGGCCCTTCTGCTTCTGGCTGCCTGACCCTG +AAGCCTGGTCTCATTGCCAAGGTTGTCTTCCTGGAAAGGCGTGTGCTGGAGCTGGAAAAG +GACACGGCAGCCACCGGTGAGCAACACAGccgcctgaggcaggagaacctgcAGCTGGTG +CACAGGTGAGCCTGGGCCAGGAGACCCGGGCCTCTGCGTGGCGCCTCCTGTGCCCGCCTG +TCAGCCCCCATTTACTTCTCTTTACCTCACACAGCAGGGGCTTGGCCACCCGTCCATCCC +CGTTGGAAGCCGGCTGAGGGGGTGGTGCCAGGTGGTCATCTGAGCCTACCCAGTGGGCTG +CAGGCAGGCGACCCGAGGCTCTGACTGGTGCTCTCATGGAACCCTAGACACACAGAGGGC +CAGAGGAGGGCACTGCCTCCCTCTCGGGAGCGCTGAGACCTGACCCACACAGAGGAGGAA +CTGACTGCGAACCCACGCAGTGCTCAGCCTCACCAGCAGGCCTGGAGGTGCAGCTCTCCC +ACCACTCTGGTCCATACGGGGTTTGCCCGTCCTGGAAGAATGCAGGTTAGAGAAGTCGCT +CAGCAGCAGAAAGCGAAATGAGCAGTGACTGCTGAGTACGCGACAGGACGCGCAGTCTCA +TCGCTGTGGGCAGGAGTGCTGGGGAGGAAGCGAAGTGTGACGCCGTGTTTGCAGAGAAAG +AGTGGGAGCTGCTTGCCTCACTCTGGTTTGCAGACTTTTCTTAGAATACCGTGTAATTCT +CGGTGTTTTTCACACGAGGCACGCCATGTTGTCTCATAGCCGATTTGCAGGACTGTTTCC +GGTGCAAAGTAAGATGAGCTTGTCCCAGGAGTCAGCTACCCAGGCTATGACACCTGTAGC +TGGGCACCGGCAGCCTCTTGTGGGCAGAGGAGGCAGCCAGGAGGCCTATGAGGCACCTGT +GGGATCTGCAGAAGAGGTTCTTCCTGTGAGCTTCTGTCCCTGCCCAGCTGCGCGGGCACA +TCCCGGCTCTTCCACATATTCTCAGCTCGGCCAAGGGCCCTGTCCCTTGAAGCTTCAGTG +TCTTCATCACCACTGAGCAGGTAGATTCAGGGCTCTGAGCAGCCTGCACACACGTGTGTT +GGCAGCAGGGCATTTGTGGTCAGCATCCCCAAAGCCCCCAAGCCCTCACCCTCACGGTAC +TAACATTTGTGACCATCTGCCCTGTGAGCGCTGAGAATTGGAATGCCTCATGGGATTGTG +GGCATAACTTGCACATCATTTTAATTCTAACAAAGCAAAGCATGTGCTCTTGTGGAGTGA +AGACCCTGGGCTTGGCGGCTGCCCGTTCTCCAGGATTCTCAGCAGAAGAGGGCCTGCTAC +CAGCCCCTGCTGCAGAGTGGAGaggggccaggcatgctggtgaaGGGGCTGGACTCCCGT +AGTGCGCTACACATAAGCAGTGCCACCAAAGACCACTGTCT +>NC_060941.1 Homo sapiens isolate CHM13 chromosome 17, alternate assembly T2T-CHM13v2.0 +tgagaggagaggagagcaaCAACTGAACAATGAAGAGGGGATGATTTAAAGACCAGTTCT +gccaaaacatttcaaatatgaaAACCAAAAAGGAAGGAGCTGGGGAAAAAGGCTCAAGTG +TTCCTAGCTGACCCCTGACCACCACCACAGAGCACCACCTCGGCCAGGAGACACTGGGCT +CCAGGCCAGGAGCTTGGCCCTGGCCGAGTGAGTTCAGGCAGAAAGGGGCTGTGCCGCCCT +GAGAAACCAGTACCCCCAGCCCAGTCCTCCCGGGACAGAAGGTGTCTGACAGTTGGCCAA +CTGCCATTCTGACAGTCCTGTACCTGTGTTTTACAATAAAGCATTGTCTTTGCAAACTTG +AGTAAGCTCCTGTCAGTTTTTCATGGTCTCTACGTGGTTACCCTGTTCAGCTGCCTCAGC +TTGTCCAGAAGGGCCTTCCCTGCCCTCGTTCCCTTACCACTTTTGGCCTTTGGGGGATTT +TTCCTTGGAGAGGTCCTGGGACAGACCCAGGTTCACAGGCTACCCTGGTCCTCAGATGCA +ACAGGGCCATTTGTTCCTCTGTGGTCCTATAGCTCCCTAAATGTAAAAGACAAATCACCA +GGAAGTAGGGCCCAGCCAGAGAGGGTGAAGAATGGCTCAAAACAAGTGCTTGGCAAGAAT +GTCATTCAAGCATCCTTCACTGGGACCTACTTCCCGTCCGGTTATCTGGATTACCAGCTC +ACAGAGCCTGTCCTGATGCTCTCCGGACCCTGCCCAGCCAGAGGCCGTGGGAGCTCAGGG +GGCTACTCCCAGGGTGGGGCCTGTGCTCAATGCTGAACCCTCATGCTTGTCGCCGGGCAG +ATCTCCGTAGGGCTGAATCCAGTGCCACATATATCTACGCTTGAAACCAGGCAGGAGCAT +GGCTTGGGAAGGTCCGAGAGGAGAGCCAGCAAGAGGAATCAGGGGGCTGCTAAAGCCAAC +CTCATACTTCTCAGGAGAAACTCAGGATTCCTTCAGTGGGATCTCTGTtcctatttcctt +tccttttctgtttttttgagacagtctcactttgtcacccagactggagtgcagtggtgc +aatctcagttcattgcaacctctgccttctgggctaaagtgatcctcctgtctcagcctc +tcaggtagctgggactacaggcgtgcgccaccacgccccactaatatttcccgggtagct +gggactacaggcgtgcgccatcaggCCCCGCTATTatttcccaggtagctgggactacag +gcatgcaccaccacgccccactaatatttcccgggtagctgggactacaggcatgcgcca +tcaggCCCCGCTATTAtttcccaggtagctgagactacaggcatgcgccaccacgcccca +ctaatatttcctgggtagctgggactacaggcgtgcgccaccacgccccactaatatttc +ccgggtagctgggactacaggcgtgcgccaccacgccccactaatatttcccgggtagct +gggactacaggcgtgcaccaccacgccccactaatgtttcccgggtagctgggactacag +gcgtgcgccaccacgccccactaatatttcccgggtagctgggactacaggcgtgcgcca +ccacgccccactaatatttcccgggtagctgggactacaggcgtgcgccaccacgcccca +ctaatatttcccgggtagctgggactacaggcgtgcgccaccacgccccactaatgtttc +ccgggtagctgggattacaggcgtgcgccaccacgccccactaatgtttcccgggtagct +gggactacaggcgtgcgccaccacgccccactaatatTTCCCGGGTAGTTGGGAcgacag +gcgtgcgccactacgcccCACTAATatttcccgggtagctgggactacaggcatgcgcca +ccacaccccactaatatttcctgggtagctgggactacaggcatgcgccatcaggCCCCG +CTATTatttcccaggtagctgggactacaggcatgcaccaccatgcccagctaatatttc +ccgggtagctgggactacaggtgcccacgacaCCTGCTAATAtttcttgggtagctggga +ctacaggcatgcaccaccatgcctgttaatatttcctgggtagctgggactacaggcgtg +caccaccatgccccgctaatatTTCCCGGgtaactgtgactacaggcgcccaccaggcCT +GCTAATATTTCCTGGGTAGCAGGgactacacgtgtgcaccaccacacctgctaatatttc +ccgggtagctgggactacaggcgcccaccacgcctgctaatattttctgggtagctggga +ctacaggcgcccaccacgcctgctaatatttcctgggtagctgggactacacgtgtgcac +caccacgcctgctaatatttcccgggtagctgggactacaggcgcacaccaccacgcccc +gctaatatttcccgggtagctgggactacaggcgtgcaccaccacgcccagctaatattt +cccgggtagctgggactacaggtgtgcaccaccacgcctgctaatatttcccaggtagct +gggactacaggtgcccacgacgCCTGCTAATatttcccgggtagctgggactacaggtgc +ccacgacgCCTGCTAATAtttcctgggtagctaggactacacgtgtgcaccaccacacct +gctaatattttccgggtagctgggactacaggcgcgcaccaccacgccccgctaatattt +cccgggtagctgggactacaggcgcgcaccaccatgccccgctaatatttcccgggtagc +tgggactacaggcgtgcaccaccacaccccactaatattttccgggtagctgggactaca +ggcgtgcaccaccacgcctgcttATATTTcccggatagctgggactacaggcgtgcacca +ccacaccccgctaatatttcccgggtagctgggactacaggcatgcaccaccacaccccg +ctaatatttcccgggtagctgggactacaggcgtgcaccaccacaccccgctaatatttc +ccgggtagctgggactacaggcatgcaccaccacaccccgctaatatttcccgggtagct +gggactacaggcgtgtaccaccacaccccgctaatatttcccgggtagctgggactacag +gcatgcaccaccacgccccgctaatatttcccgggtagctgggactacaggcgtgcacca +ccacgccccgctaatatttcccgggtagctgggactacaggcatgcaccaccacgccccg +ctaatatttcccgggtagctgggactacaggcgtgcaccaccacgccccgctaatatttc +ccgggtagctgggactacaggcgtgcaccaccacgccccgctaatatTTCCCgggtagat +gggactacaggcgtgcgccaccacgccccgctagtatttcccgggtagctgggactacag +gcgtgcgccaccacgccccgctagtatttccttttctgaccTGCATTTtctttaaggcta +ttttcacCTGTTTTGTGAcccatttttttcccttgttactaaaaagaaatcaatattgaA +CATTAGTTAGCAAGCAGAGAAGTATACATATTTTTGATGTGCTAAGTAGGAAAAGAGTGC +TTTGTGGTTTCAGCTGCATTTTATTCTAATAAAGTCGTGAGTGAGCCCAAGTAGGCAGGA +CCTTGTGGTCTGGCCTCAAAATTGGGCTGCTGCCACCACCGCTCTGCAGTCCATTGCCTG +AAAGGCCAGCCCGattcacctgctccaccctgtcTAAAGACCAGCCCGATTCACCCGCTT +CACCTGCTCTGAGGCTGGTCTCATGGGACAAAGAGGGAATTGCACTGAAGTCTCAGGGTT +TTAGGACCAGAAGGGTAGGAGCTAGAGAAGGTGGCAGAGGTGAAGGTTGAACAAGTGAGT +GGGACTCCAGGTACAAGTCCCAGCCTGCCCCCGGCTTCAACCACAGTAGCTCAGTTTCAC +GGTCTTACACATTAGCTCCGTGGCCTGGAGTAAGTTTCAAATGAGCACAGCGCCTACTTC +CTACGGCTGATGAAGCACAGTGACTGACTGCAGGTAAACGCACCTAATATAGCGTGGGTC +ACCAAGTGGATGTTCAAAGCATGACAGCTATGGGTGTTTCAGATtctacattctattttt +tttttttttttgagatggagtctcactctgtcgcccaggctggagtgcagtggcgcaacc +ttggcagcacccaccaccacgcctgactaattttttgtatttttagtcgtgatggggttt +tgtcacggtagccaggctgctctcaaactcctgaccttaagtgatcatcccacctcagcc +tctcaaagtgctgggattataggcatgagccaccgcacccggcctctacaTTAGATTTTG +TTACAAGAAAGGATTTGGAAATCACTGATTTGGCCCATCtctctcattttaaaacaattg +aaaaataacTTTGTTAAAGTACACACAAAGTATGTAAATGCATTTGTATaagaaaatttc +caaaaaaaCTATACCagagtaaatggaaaaaaatatttccttgctTCTCTACCTACTCTC +ACTCCAACTTCCTTCCCAAGAGACATCCACTGTTACCATTTCCAGACTTCTTTCTTATAC +atttacacacataaacatgctttttactttttccatAAAAGACATtatacctcccaaagt +gctgggatgacaggcgtgagctgctgcgtCCGGCCCCCGTTCTACCACTTTTAAACTGCT +GTGTAGCATCTCACAGTATGGATgcactgtaatttatttaaccatcttCAATAATAAACA +TTACAGACACAGCCAAGCCTTTTGCTTTTAAGGCTGCAGTTCACCTCTTTCTTTGTGCAT +CTTCCTCTAcatgtatggatttttttttagactTCTGGTTTAGATGTAAAATTGTTGCTT +GACAGGACATGCATATTTACATTTCTGAAAGTTCTGATAATGACAATTTATGCACCAAAA +AGGTTGTATCAAGCTGTATACTAGCCCTAAAATCCTGTACTGTtagtcttgtaatttttt +tctgtttgcaaaCCTGATGTAGGAAAAatatcctgttttcttttttttcatgtttattag +ccAACTGAATTTCTTCAGTCAATCGTCTGTCTGACTCTGTACTCATTTTTCTAACGGGTT +ACTCGTATTTTCCTTATGGATttttaggagttctttacatGTGCTAGATATTAATCGTTT +GTGTCATGCAGCTTCAACTGTTTTTTAATCCCTTGATTATGTTTCTGGTCTCTTTTTCCA +AAAGAACGTTGTTCTCTTTATGTTGTTAAACCTTTTAGTACTTTTCTTCATGGCTTTTGG +GTTTTATGTCTTATTTAGTCTCCCTAATATTCTGTTATTAAAGgataggtgggcatggtg +gctcacacctggaatcccagcactctgggaggccgaggcgggcagatcacctgaggtcag +gagtttgagaccagcctggtcaacatggtgaaaccccgtctctactaaaaatacaaaaat +tagccaggcttagtggtgtgcacctgtaatcccagctatccaggaggctgaggcaggaga +attgcttgaacctgggaggcagaggttgcagtgggccgatatcgccccactgcactccag +cctgctgacagagcaagactctgtctaaaaaacaaaatgaaaaaacaaaaaaataaaaaa +ataaaggatagtcttttcttctcatttaacAGGGAAGGCAGTTCACTACATTACAGCAGA +ATCGGGATTAGACCACAAGTCTTGACTGCTGGTCCAAGGATTTTGCTACTAAATCACTTT +GCTTCTCTATTGTTACccgcagtttaaaaaaaaaaacaaatctagcTCTAAAGAAAATTC +AAAGGTATGATTCTCTCAACTTGgatttcttcttccctccctcctttcttctttcccctt +ccaTTCCTGCCTGCATGGGTTCTGTGTACACTCTGCACGACTCGAGGAGACGGATGAGTC +AGCTACAATTCCTGTATTCAAGGAGCTCAATGTCTACGCATATGTAATGATGCAAACAGA +AATTACCATAGAACAGAGTCACTTGGTTTCCCAGTGGACAGGAAATCTGAAGAGAGCACC +TTGATGTGTTAGCAGGGAGCCTGGGCCTCCAACGAGAAGAGGTttactcctttctctttc +ttttctttttttttagagatagggtgtcactctgtcactcatcatagctcactgcagcct +caactcctgggctgaagtgatcctcctgcctcagcctcccaagtgattGGGACTAAGGGG +tgcacccgactaatttttttttttttgtagggatgaggtctcactatgttgcccaggctg +gtctcgaactcctggtctcaagcaatcctgccttggcctcccaaagtgctgggattatac +aggtgtgagccactgcatcagaCCAAAAAGAAGAGGTTTCCGGAGTGAAAATTTGGACCT +GGTCTTTGACTACACAGAGACAAACGTTTAACCGGCAGTACTATGTTCCACCTTTCCAAT +GGAGGCACGTAGTCCCCAGGCCTGTATACCTGGCTTTGGGGTTTACAGAGACTCATTGAC +CTAGTTTGTTCACCAGAGATGTTAAAAGGTAAACCCTAAAGTAAAAACATATCCTAATTG +TAACCAAATCTGATAACTGATAAAGAAATAAGGTATTTGTGACTGAGTAAGGCCTCTGAC +TCACAAAATTActagtctgtaaaatgggatcaaTACTTAAGAAAAATGATGACAGGGCAT +TCTAGAAACATGATGTACTGCGTAAGAGACAAACAATAAATCCACACAGAGTGTTCTGTA +TCATCACTTTCCCAGCAGCTCAGTGAAATCACTGCAATGAGGGGTTAAGCACCGAAGCCA +ATGGATAGAGTCACCATACAGTGAAACCCTGAATCCCAACCACCCAACCCACTGATTTCA +CGTGGCAGCTCCCTAGGGAAGGTCTTACCAGGGTCCCATCGGTCAGGGTGCAGCCGGAGA +AGCGTTTTGCAAGAAACCCCTCAAAGTTAGTTGTTCTTTGAATAGCAAAAAGAAGCAATT +TCACTTCAATTTCCTTCGCTCTGGTACGCATAATCTTGGCAAGTTCTGCCCTTCAAAACA +AAGAGATAAGAATACTATCAAACAAGCTGATCATTCATTCAGTAGAGATAAGGTAAATGG +CCTTAgcttatattcagaaaaaaaaaatgtatgtggtCATTTCAAACCCTGAGGTCTGTT +ACCACCTTAGTCTAAAACCTGGGGAATAGAAATACATATTCTAAACAAGATTTTTAAGGT +GAAATTATCCACCAGGCAAAAAAATCAGGGGTCATggatgatatatatatacttatattt +atttgtttgtttatttatttatttatttatttgagatggagtctccctctgtcgcccagg +ctggaacctccacctcctgggttcaaatgattcttttttttttttgtatttttagtagag +atagtgtttcaccatgttggccaggctggtctcaaactcctgacctcaagagatccgccc +acctcggcctcccaaagtgctgggattataggtgtgagccaccagtaATTTGGTTACATA +GTTACTACGTTGCCTGTATCTTTGAACAGTTTAATAATTGGATAATAATACATATGGAGc +acctaattttttattagtGTATATAGCCTATATAATTTCACAAGTCATTAATTACTGAAT +TATAAAGCCCTCCCTCTTCCTGAGGGCCCAATAATCATCTCTTCAACTAGAGAGCAGGAG +TCCTGGAAACACACGCAAGGGACAGGATCCCTGCGGGAAAAGTGGCAAGCACGCTTAGCT +GGTCCCTGCCCGAGAAGCTCCTGTGCAGCTCTCACTCAAACGTTCCATCTCAGAAGCTCA +GTTGCTGGTGAACAGGGACATGTGAGTTCTTAGTAAGGACTAAGCTACCATCTTCtcaca +caaataaatgacaaaatgaaacaaagagtcTCTGAGTTTATTTGAGAATGATGTATCTGT +AGGATTTTAGCCAAAATTCTAACAATAGAAGCTTGGCAGCAACACTGCCATTAGCCGAGA +CAACAATGGCAGGTACTGGCGCTCACAAGAAACGTGCTGGCTCTAGCATACGTCCAGCCT +CTCCCAGGCTCCATTTCTCACTGAGCTGGTTTGCAAGTCTGCTGAACTGTAGGCTAAAAA +GAATTAGCTAACAGTTTCTCAAGGAATTcactctttattttgttaattgggATTTAGAAG +GTGACAATCTCAACTCATCTTAAACCAATGCTAAAAGGTTCTCTAAATCTACAGGAGtca +atgtgtttctttttttttcttcctctttctttctttttcccttccactcgccctccctcc +ctccctccctcccttcctcacttccttccttctctgtctttctctctcttcttttttttt +ttttgagacaggttctcactctgtcacccagggctggagtgcaatggcatgataatGGCC +TACTGCAACcttgacctgggctcaagcaatcctcccacctcagcctctctagtagctggg +attacaggtgcttgccaccatgaccagctaatttttgcattttttgtagagatggggttt +tgccatgttgcccaggcttgtctcaaactcctaggctcatatgatccacctgccttggcc +tcctgaaatgctaggattataggcataaaccaccaagcctggcccaatGTGTTTCTTAGA +ATAACAGCCACACAGAATGGAGCTCAgtgcacctgtagttgcagctacttgggtggctga +agcaggagggctgcctgagcccgggagttcaaggctgggGTACGCTATTaccatgcctgt +gaatagccattgtactccagcctgggcaacactgcgagacccccatctcttaaaaaaaaa +aaaaaaagccacacagaATGTATGTGAACACCAAGCGTGAACACTACCATGAACTATGGA +CCATCACTCTGGGTAATGATGATGTGTCCGTGTAGTTTCATGAGCTGTGATAAATGCATC +GCTCTGGCGGAAGGTGCCGACCATGGGGAAGACTATGCACGTGGGGCCGGGAGCACCTGG +GAACTCTCTGTGTCTTCTGCTCAATtctgctgtgaacctaaaactgctctaaaaggTAAA +ATCTATTTTAAGAAAAGCCAATATCCCTTAAAACACTTTTGCCCCACAATGTGTTTGAAA +CATGCAATTTGACTTTACTTTccatgattttaataaaaaagacGGCCATGGATTATGGGA +AAAGGTGGTTGAGTTATGCTAGATAtgggcttttttttctctttttcacccGGCATTAGA +TCTAACTGTGTACTACTGGGAGGAAATATATAACTAATAAGAACCAGTTACCAACACTGT +TGTAGTCTAGCcgcaaataaagaataaaaggagttcaagaccagcccgaacaacacagca +aaactcttgtctctacaaaaaatacacacacaaaaattagccggtgtggtggcacacacc +tgtcatctcagctactcaggaggctgaggtgggagaatcacttgagcctaggaggtcaag +gctgctgtgagccatgatcacaccactgcactccagtctgggtgacaaagtgagaccccg +tctcaaaaaaaaaaaaaagtctgactcTGGCTTTAGCTTTGTCATAGATATACTGATTTA +ACCTTCCTGggctttgggtttttttaatataaagagaCTATCTGTCCTTGGGCTACACTC +ATGGATAACGTAGAGAGGATGAACAAAAGACGGTCTTTAAAATGCTTGGAAAGCTCAGac +gcaggccaggtgcagtggctcatgcctgtaatcccggcacttcgggaggctaaaatgggc +gggcagatcacctgaggtcgggacttcaagaccagcctggc +>NC_060942.1 Homo sapiens isolate CHM13 chromosome 18, alternate assembly T2T-CHM13v2.0 +TCTtccttcttgttctctctcttgAATTCCTTGTTCTGGCAGCAGCCAGCTGCCACattg +tgaggacactcaagcaatTTCACAcagcaaggaactgaggcctcctgccaagaGCTATGT +GAACAGGCCACTTAAGTAGCAGACCCTCCAGCcacagtcaagccttcagatgactgcagc +tctGGCTGAGATCTTGACACAACCTCATGAAAAACAGTGAGTCAGGACCATCTAGCTaag +ctgctcttgaattcctggtccACAAAAACTATGAGATGatgaatatttattgttttaaat +tgccAAGTTTTAGAGtaacttgttatgcagcaataaacaactaatacaaatacaaattca +GAATTTTGACTTACCTTGTAGTATTGTAAAATTCTTGATGAGCTGACCATGCTTGGAGTC +TACTAGCTTCATTTCTTCCATAATCACTGATAAGTTGGCTACTTCAGTGTCTAACCTCGA +CCTCATCAAATCTTGTTGCATCCTGAGAGAAACAGAATCCAAACGGATGTTGGCCAGGGT +ATTATTCAAGGAGGTCAGATCATCTGTGTGTTTGGTAAGGGTATCTGTGCAAGTGGTCCT +GACTTCATTTAGATTGCTGGTCAGCGTCCGCAGGTGGTGGGCTGTGTAACTGATATTGCT +AATGATGTTCACAATATCCGTCTCAAAGAGCTGGAAGCGTTCCTCCAGTTGGTTGAACTT +GATGGCTGTTCTATTCTCTGCATCTTTGTGTAAGTCCTGCAGGTCTTTCAGGTTCTGCTC +GTTGGCTTGAGAGATAGTGGTGATGTTCTCCATCTGACCTGTGAATGAGTTGAGCTGGCT +GTTCATATCCTCCAGGGTGTCGTTGTTGGCTTTGGCCAACGCAGAGTTGTTGGCAGCCAG +CGTCTGCAAGCTCTGCACTTTCTCCTTCAGCCAATCCGTGTCCTTCTTGGCTTGAAGAAA +AACCTGCTGCAGATTTTGAAAGTCGTTCTTGATTCGCTGGATAGCCTGGCTTGTGTCATC +CACAGACCGCTGCAGATTCGTGATGAGGTTCCTCTGCTGCACCTGGGTCAGGTTCAGGTT +GTTGAGGTTCATGATGACCACATTATGAGAATACATTTGGTTCTGCAGATTGCCCTGGAG +CACGCTGGTATCTTGCTGCAGATTCGTGACATAGCCATTATACGCCTGGAGGGTTTTGTT +TACAGTGGTGATGAGGAAAGAGTTATTCTCCAAAGTTTCTTTCAATTGACTCTGCCTGTC +CACCAGAGCATCCCCGCTCGCCTGTAACTTCTCCAGCGTATCCTTGTTCTTGCTGGTTTT +TTCTGTAATCTCACGAAGTTGCTGACGGAGATCTAGAATGTCTGATCTGAAGGTGGAGAG +TTCTGAGTTGGTGCTGATAGCTTTCTTCCCAGTTTGGTCACCTGGAATAAGAAATATCTG +TGACTTATATTGGTGGTATGGAGAAGTGTTCAGGCAAGGCCAAAGATCCCGAACACACTT +AATCGGTATGCACTGTATTTTAGATGCAAAATTGGCAGTATAAGCGGACAGCTCTGCATT +AGTAAAATGTACATATCTATTAAAACTGGGTCCTGGGGAATCGGAAAAGAAGCTCAGAAC +TAGGAATGACAAACTTGGCTGAACATTTTTCTCAAAGAGGGAGGGGGAATTTACTAGATT +TTAGGGCAGTGGGCAGGCTGTCAAGAAGAAACTAACCTTttaaatttcccaaattttttt +ttaatgaaagcaaaaatCAAGGAATAGAATATGCTAGGATCTTTCACTTTATAACTTAAT +TTCTACAATTCTATGTAGtttaaagtatttcaaaaatgCTCAGTAAATTCCTATTTATGT +GACAGTTTTTAATAAAgggtatttgtgttttttttcagtCAGGATTGATCTTCAGATATT +ATTTGGCACATAATAGTTTTCTTGGCAGGACTTAATTCCAAAACTGACccttaactttaa +aatttaagcATTTGAATTAAATCATGAGGGGAGACTCAACATGCAACACAAAAATTGAAT +GTCCTTCCGGGTGAATGGGGAGTTTATAGCAACATCATTCTAAGAAGCTGTGGTCATTTA +TGTAGAGTCAGGGGATTTCATGGTTTAGTCTTGTCACAGATTACCTAATTTTTTCAGGTC +ACTTTCCACTGCTGTGAGCTTGTCATCATAGGTTTGGCGAGATGTTTCCATGCCACCTGT +GACATTGTCCATTTTCTCTACAACTAAGATTTGGAAAATGATGCATTAGTATACATATct +gctcatattttatttttcagtttcaaaacAAGAGATCATTTCATTATGGAACAAAGGAAA +CAGATTGAACGAAAACAGTGTAACTGAAATCAAATATAGGAAAGAAAAGCCAtctttttg +gaaaaataacttACTTGTCACAAAACCCAGGGGTACAATTTACTTAGTTGAGAATTGTAT +GTTCTTAACTATTCTTATGATTCTGTAATGCCTTGGATGTTTCAGAAATCATTTggaact +aatttaaaaattttcatgcaTTTTAGAAGTCCCTAATCTGCTATTTCCTATATTAATTTC +CATAGATGAAGGCAAGGCACACTGTGATAATTTACAAAATGTTGTCACTCATCAGCTTCC +CTAACATTCTTGGCAGGTGGGACTCATTTACCTAGAAAAGGATTCCATTGGCAAGGAAAA +CCCAGCTCAATTCTATACACAAAATCGGCATAGAAAGGTTGCAAAGTCAAGAGTGTCTGC +CACTTTCTGTTATGAGTTCCACCACAAGGCCCTGAAAATCTGCTTTTTGTTAGTGACAAC +TGATTCTGTAGTTTGTCAGTTCTCAAGTAGATGCCTGAGTGGTGTTTCCAAACAATGATT +TGCCAAGAAGTATTTTTTGGTAGTATTTTCTTGATTGCATATGATAGGGAAAGTAATGCc +actgatagggtttggctgtgtccccacccaaatctcaccttgaattatactcccctaatt +cccatgtgttgtgggagggacttggtgggagataatttgaataatgggggtggtttcccc +tatactgttctggtggtagtgaataagtctcacaagatctgatggtcttatcaggggttt +ccacttttgcatctttctaattttctcttgCCGTCCCAAATGTTAacccccaagacaatg +gggaaaatgtcttcagggcatgtcagagcCTTCCTGGCAGCCCTTTCCATCActggcctg +gaggcccaggagaaaatggtttcgtgggccaggcccagggtccccatgctgtgtgcagcc +tagggacttggtgccctgcttcccagccactccagccatggctgaaaggggccaatgtgg +AGCTGGggccgtggcttcagagggtgcaagtctcaagccttggcagctttcatgtgttgt +tgagcctgtgagtgcacagaaatcaataattgaggtttgggaacctccgcctggatttca +gaggatgtatgggaaCTCTTGGATATCCAGGGAGAGGTTTGCTGCACGGGTGGGATGtgc +atgaagaacctctgctagggcagtgtggaagggaaatgtggtgtcggagcccccacacag +agtccctactggggcactgcctagtggagctgtgagaagagggccaccgtcctccagacc +ccagaagggtagatccactgacagtttgcaccgttcacctggaaaagccacagatgctCA +ACACCAGCCATGAAAGCAGCAGGgagagaggctgtaccctgcaaagccacaggggtggag +ctgcccaagaccatgggaacccacctcttgcgtCAGCATGACCGGGATGTgcgacctgga +gtcaaaggagataattgtggagctttaaaatttgactgccctgctgactttgaacttgca +tggggcctgtaacccctctgttctggccaatttctcccatttggaaaggctatatttacc +caatacctgtaaccctcattgtatctaggaagtaactagcttgcttttgattttacaggc +tcataggcggaagggacttgccttgtctcagatgggaCTTTGGACTGCGGACTTtagggt +taatgctgaaatgagttaaaactttgtgggactgttgggaaggcatgatttgttttgaaa +cgtgaggacatgagatttggcaggggccaggggtggaatgatacagtttggctgtattct +cgcccaaatctcatcttgaattatatctcccagaatttacatgtgttgtgggaaggaccc +agtgggagataatttgaatcatgggggcggtttcccccatactgttctcatggtagtgaa +taagtctcacgagatctgatgggtttccactttttcatctttctcactttctcttgctgc +tgccgtgtaagaagtgccttttgcctcccaccatgattctgaggcctccccagccatgtg +gaactgtaattccagttaaacctcttgttcttcccagtctcgggtatgtctttatcagca +gcgtggaaacggactaatacagccacACTAAATAAAAGCTTCAGTTCTTATTCATTTTCA +GAAGGCAGTAATTCTCTACAGTTATGAATTCAAGTACACgtttctaaaatgttaaataag +agGATGTTTCTCCAAAAGTGATTTATGTGAGATACAGCTTCTAGCAGCTTGGGATCAAGT +CTGACTGTCCTTCTTAGTAtcaatagcttaaaaaaaaaagacttcagaccgggcatggtg +gctcacgcccgtaattccaacactttgggaggctggggtgggtggatcatttgagctcag +gagatcaagaccagcctggccaacatggtgaaaccccatctctactaaaaatacaaaaat +tagccggttgtggtggtacacgcctgtaacctcagctacttaggaggctgaggcaggaga +attgcttgaacctgggaggtggaaccaggagaattgcttgaacctgggaagtggaggttg +cagtgagccgagatcacgccattgcactccagcctgggcaacagagcgagactctgtctc +aaaaaaaaaaaaaaaaaagacttcaaaaaaTGAGAACATGCTTTATATATCAATTATGAG +CCAACGGATCTAATTTATTGTATTCATCACATGTTCTACCCACGCATGACTGTGTGAGAT +TCTCCTGGCTCCTCTCAGGAAGAAGTAGTAAGTTCCCATGTGTTTGTGTGACCCAAAGTG +AACTGGCTCCTTGGATCCTGGAATTGTCCCTGGAGAAGCTCACTGTTTTCCCTCAAGCTT +CTACCGTCTGGTCATAATGAAATGTGTGCACTGCGACAAACACTCTCTCACACGAGCCTT +TCCATGTGTTCTCTCTACCTAGAATGttcttccctgttttttttttttactgagctAAGT +CCTATTTGCTCTTCAAGACTCTGCTTGTCACTTCCTGTGGGAACCCTTTGCCGAGGTGCA +CCTTGCAGAATTCCCCTGGCAAGTAGTCCTTTCTCTATTATGGGACTCACTGCACTGTGC +TGTCATGACTTATCTACTATTATATCCTTTAGGGCAGGAAAATTTACATTCAATTCCATC +TCTTCCTCTTAGCTCAGTGTGTGGCACTTTGTAGGTAgtcaatgaatatatatttattat +gtcatttatttatttaattttttattagacggagtttcactcttgttgcccaggttggag +tacaatggaaTGATcttagctgactgcaacctccgcctcccaggttcaagtgattctcct +gcttcagcctcccgagtagctgggattacaggagcctgttaccacgcccggctaattttt +gtatttttattatactttaagttttagggtacatgtgcacaacgtgcaggtttgttacat +acgtatacatgtgccatgttcgtgtgctgcacccattaactcgtcaatttttgtattttt +agtagagatggggtttctctatgttggccaggctggtctcgaactcctgacctcagatga +tctgcccaccttggcctcccaaagtgctaggattacaggaatgagggatttatttaaata +agtaGCAATCTGCCGGCTGAGCTACAGGGCAAGCAAACACGTGTTTCCCAACCAACCCAG +GGAAGCCTGAGCATTGGCAGTGAGTATGACATTTCGCtgagtaattattatttttaaaat +tactacatAGACAGAGAGATGCAGTTCTAATAATCTGTACCTTAGGGTTGCTTCATAGGT +ACACATACTCCTAAATCCCTGGAAACTCTCAAGAATAAAATGTTGCATATGTGTTTTTAG +CAAAGCTAATTTTTAAGAACTAAAATACAGAATGTTTACAGGTTTAGGTTCAGTTTTGAT +CCTCAAATCAAAACATATGCCTCGGTCTGTCCTCAAACCACATGCAGGATCTCAAGTCCT +GCCCTTCTTTCCTGGAAGCCAAAGAAACCTTCAAATATGCTGACAGTCAGTCATTTTCTA +ccctttctactttttcttccattttagttttgaaaaacagAGAACTGTCATGGACAGATA +ACTCAGGTTTGTGTAGAATAAATACAAAAGGGATAaatacattcattaaaaaaaagaaca +aaaaaaatctgtCGACGTTttcttctgtgcagcaaaaggaAACTATTTTCCCTGCCCACA +AGTGCTAATGAACAGTTTACATGCACTGGGGGGTGTGTGTCTTTGTTTAACAATAGGATC +TGGTATAAAGCTGGAAATGTTAGGATTGCAATGCTGGAACCTGCTACTGCATAAAAATAC +CAGACTGGTGGAGATCCAGAACTTACCCTTGCTGTAACAGCACACAGCACTTTCATTGAC +TTTTATTCTGAATTTATTAGCACCAATTCTCAATCAGGAATACAGTCGCAGAGCCATCCT +GTATTACCCTGGAAATTCCCAGTCTATAGACATAGACCTCAGTTTGCAGACCATTCTCAC +ATGAGAAAAATGAGCAGGATACACAGAAGGGTGACCAGCAGTCTGGTTTCTCATAGGCTC +TCCTGTATTGGGAATTGTTTCTTAAGGTAGAATTTTTCTACAGAATATTGGTGTTTCAGG +TATTATACCTGAAGATCTGTCCCTCTTCAAGTATCCAAAGTATAATTCTCTAGGATACTC +TGACAATAAAACCTTTTTTATAAAAGCACTTCGGTATCATCCCTTGGCCTGGGCCACTAA +CTTCTTCTTCCCTCGTCTTGACTCCACTTCTCCTTGAAGGTCCGCTCCACACCTCACTAC +CCCATTGTACTCAGCCACACCTACAAGTTGATTCCACTGCACACCAACTCGATCTTTATt +tgaatgataataataatagcctcTATTTATCGAGTGCCTGCTCTTTGCCGGATGCACTAC +ACCATCACTGCAGTTAATCCTTCCAACTGCTGTTTTGTAGATGAAGAGATTGAGGCTCAC +AGATGTTCAGTAACTTGCTAAAAAGTCACACAGCTTGTCAGTGACTATGTGGGATACCAG +GCTGGAAGGTTTAACTCCAAAATCCATGCTCTTTCTATGACTCCGTATCACCTCTCtttt +ggtatttctttttcctaaatcTGGTTTCCTCCAATAAAGAATCCCTTAAGGGGAAgaatt +atttctgtttatattctctttaaagttaacatcaccagaCATTTACCAAGTATCTGCCAT +GTAGGTGGCATAGTGCTAGACATTGAGGATTCAAGAGACACAGGCCATGGTCTCGGCCCT +GAGGACAGAGCACAGAGCTCCTAGCTGGTGCTCACACGTTTTTGTACCAGACTGATCATG +GCACTGTGGGATAAATACTTCCTCTCTCTGGGACCTGGGGCTTCCCAGTAACATTAGTTA +CACTCCTCTGGAATTTAATAAAGGCATTTCTACCTTGAACACCATTTTAGGTTTCcttac +agaaatacagaaaatctgATTGTAGGGTGTTATCCTGGATCCTAAAGCGCTCTCCAGTGT +GATTTGATGTGTATTTTGAAAGCCTAAATAGTAATCCAGTTGTAAACTGCTACACTGACC +CAGCTTAGCAGCAAAGTAGACTACCAGTGACTAGGAATGTTGAATTAAAGGAGATCCTTA +TTGAGAAAGATTcagatttctgtcttttttctttttcctaattacCTTTAGAAGGTTGCC +TGTTGGAAAGGATAATGGAGTAGGATTTTCCTGTTCAGGAAATATTCTGGAAGAAACATG +ACACATTGAACTTAAGAGATGACTCCTGCTATGGAAGCTCTGTTGACTAATGATAAAAAG +CCCGGGGCAGAGGATGTACCAAGCTCAACTGTCCAAGAACATGTTTTCTGCAAAGTGGCT +GATACGCCTCACAGTCACGACCACTGCACAGACCCTGTCTGGGTGACTGAGCGATTCTCT +GGCTTCTTCAGCAAATTCTCTTGATGGAAGCTCATTGTATTCTAACTTGTGGCTATGTAA +GTgacatgaaagaagaaaagaacaatttTGAGCAAAACAGTATGAAGTTGCCTTTGCCAG +CTctgataaataaaagtttttactCCTTTCCTTTCGATTTCTCCTTCAGAGGAATGCCTT +ATTGTGTTTCTTTCattgaatattcttttctttctttcttttgtaacgGAGAGAGTTTCT +CTAGACTTCAAAGGGGGAATGTGTGAAGGGAGAACTGGGTTTTATCTTTCTGCCTCTTAC +AACATTGGGTCACTAGAATCTTACCAGCAAGAAAGAGGAGTCACTGTGTGAGTAAAGAGA +AAGCACATCtggaaaatatcaacattttagtTCATTAATGGTGTGTTTGGAAAGCAAAAG +TGCAtgttgtattatcttttttttggtCAGTGGAGGCCTGAAGGAGGGGGGcactgaagg +aaagaaaagaggggcAAGACATCATCTCGTTTCCCCTTGTACTTGCTCCCCATTATCTCT +TCTTCCTTCATCTTGGTGAGACTGCCCCCACAGAGCAGGCCAAGCCAATCTCCAAAACAT +TAGGTTTCCAGGCAGGGCTTTTAGGGGCAGCTATCCCCTAGATGCAGATTGGCTTAGAGG +TCCCTGAGCATCTGCTGTTTGCCTTCCTGGAAGGCAGCCCTAATGCAcaatccatcaatc +catccatgcatccatccatccatccatccatccatccatccatccatccatcctcccatt +aATTCATTCAGTGAACTTTCCTGGGCAATGGTTAAATATCATGAGACTAGGTGCTGGTGG +gagatataataaataaaaggtagTCTCTTGTCTTCATGGAAACTCGTagtttgggtggtg +acacagacaAGTCCACTGACTCTAATGACACAGTGTGACAGGGGCTAAGAGTAAATGCTG +GGTGCTATGGGAACAAACAGGAAGGGGCCTAATTCAGCTTTCGGGAGCTGCCATGTGTCT +ACATGAGACatgaagggtgggagggaggcactTTAGCTGGAGAGCAGAGAAAAGGTGCTG +TGGGCAAATGGACCAGCACACGCACAACACGCCAGAGCCAGGAAGGGCTTTCCATGGATA +AAAAGGGAGGAAATATCTGTACcttaacaaacaaacagaaaaaaaagaaaggagaaaaaa +agcctcttctttgactctttttgtataattctGAATGCATAAATGTCCCAGACTTTATTT +CCTAGCACAGGTAAAAATTACAACATGTTATATATTTGCCAAACCACTCTCATCTCTCTT +TTAGCAGTAAATGTGATTACACAGTACTGAGGCTTAAAAGTACTTATtaaatggctgatt +tcaagcttcTCCTTTATCTTGGCTCACTAGGAAAAGTCATGGAGAAGTGAGTAATGACCT +AAATAATCTAAACAAAAGGAAGAGAGATAGTCCGGATTACCTGGGACATGGAAAACCCTC +CTTTCTCTCATCAGCTTCCCACCCCACCTCTGCCCAGCGCTAATCATGATTTAATAGCCT +TCCTTAATCACTTACTCTGTTTGCTGCTTCATCTAAAAACT +>NC_060943.1 Homo sapiens isolate CHM13 chromosome 19, alternate assembly T2T-CHM13v2.0 +acccggccttaatttttgtatttttagtacagacggggtttcaccacattggccaggctg +atctccaactcctgacctcaggctatctgcccaccttgacctcccaaagtgctgggatta +taggcgtgagccactgcacccggcccgcAAGCGGGGACTTGATTTTCAAAGCATGATGGG +GATTCAGAGAAGATTTTGAGCTGATTTACGTTACATTATGAAATCgatccttttaaattt +atgattgatttaaaataatttttgtacagCTTTATTAGGAAATTATGCACTAtacaattt +acttatttaaagaCTACATttcttgctgggcacagtggctcacgcctgtcatcccagcac +tttgggaggccaaggagggtggatcacctgaggttaggtgtttgagaccagcctggccaa +cacggcgaaaccctgtcgctactaaaaatacaaaaaaattagccggacgtggtgatgcgc +ttctgtaatcccagctactcgggaggctgaggcaggagaatcgcttgaacccaggaggca +gaggttgcagtgagctgagatcacggcactgcattccaggctgggtaacagagtgagact +ccatctcaaaaaaaaaaaaaaaaaaatggccaggtgcagtggctcatacctgtaatccca +gcactttgggaggctgagatgggtggatcacaaggtcaggagttcgagaccagcctggct +aacatggtgaaaccccatctgtactaaaaatacaaaaattatccaggcgtggtggcaggt +gcctgtagtcccagctactcgggagactgagtcaggagaatggcatgaacccaggaggcg +gagcttgcagtgagccgagatcgtgccattgcactccagcctgggtgacagagcgagact +ctgtctcaaaaaaaaagaaaaaaaaagttttttttagagactgggtcttgctgtgtcgcc +caggctggtctcgaactcctggcctcaagtgatcctccctcctcagcctcccgaagtgct +gggatcacaggggtgagccacccaCATCCGGCCTGATGTGCGTTTTGAAGGACTCCTGTG +GCTGTGGGGCCCAGTGGGGCCTGGGGAGGTCCTGGAGAGGGGGTTGGGAGGTGGCCTGGG +GGGAACATGATGGGGGTGATGAGAGGGGGATGGGAGGGATGAAGGGCAGCCCACACGTAT +CAGCCTAAAAGTTTCGGGGAACACTGGGGACTTCATTAGGATGGCACATCTGCTTGGGGT +CCTGGGCCTCTGAGCTGGGCAAGGACAGTCGCGGCAGGCAGCAGGGGCATGTAGCCCCAA +CCTGGCTCTTTGTCCCCCATCCTGGCAGGCAGCTCCTTTGGGACCCAGATCATCGGGGGC +CGGGAGGTGATCCCCCACTCGCGCCCGTACATGGCCTCACTGCAGAGAAATGGCTCCCAC +CTGTGCGGGGGTGTCCTGGTGCACCCAAAGTGGGTGCTGACGGCTGCCCACTGCCTGGCC +CAGCGGTGAGtaccctgccctgcccaccccagGGGTCCGGGGAATCCATCCGACGGCGCT +CATTCTCTGCAGGGGGTGGGCTCTGGGAGATTTAGGCCCATTGTGGGACCCCCGTCCCCT +CCCGGTGACGACTTAGGCAGGTTTAAGTGACCTGCGGCTGTGGGACTCCTGGAGAAGGTT +TACTCCTTGCAAGAGGCACTGGCAGGGCCAGCTCCTTCCACACCGCAGCCTGGGTCAGAG +CCTGGCTCCTTTCACGGCTGAGCCACAGTCCTGGTGTGGACAGAGTGCATTGTGTCTGtc +cattcacctgctgatggACCCAACTTAGGCGGGGGCTTCTGCTATAAGGAAGGAGGGTCA +GGTGGGGGTGTTTGCCACCTGTGGCCAGGAGGTCGAAGCCGGCCTTCGAGAGTGGCTCGG +GAATCGACCTGGTTCCCGGGGATCAGGAAGCCGCTAAATGACCCATCATGGAGTTGCCCT +ACCTCAGGACTGGTCCGTCATACAGAGCCCAGATCAAGATGGTCAAAGTAACAAAAAGGG +ACCTGCCGGCTTGTGTAACTGCAAAGTCTAGGAGGAGGCCTGGCTTCAGGTGCGGCTTGA +TCCAGGTGCTCACAGGAGGTGCTGTGGAGCCCATCTGTCTCCCAGCTCTGCTGCACTACC +AGGAAGCCTGTCTCACAAGGTGGAAAGATTGACCCTCCTCAGTCCCATGGAAAGAGGGCT +TGGCTCTCTAAAGTTGGGGCACACTTAGGAGGATTGGCATGTGTCAACCCCTGTACAAAT +CACTGTGGTTGAGCCTGGGGCCCCAAGTGAAGGGAATTCCCAGGGCTGGTTTTCGTGAAG +CTGTAGGCTTGGGGTTGGATTTTTGGACACACAGCCCTTGCCTGGGGCCAGGGCCGGGCA +GAAGTCTGGGGCAGGGGTGAgagcagggagggcttcctggaggaggtgggttGCAAAGAC +ACAGGGAAGGACTGGCCAAGCCAAGGCCTGTGAGGGGCAGCGGCTGTGAGTGATGGCCAT +GGACAACGGGCACAGTGGGGGCCGGGACTGCATGTGGCGGGTCGTCCACGCCGGGCCAGG +CCGCAGCACCCTGATTCCCTCTGTCCCCAGGATGGCCCAGCTGAGGCTGGTGCTGGGGCT +CCACACCCTGGACAGCCCCGGTCTCACCTTCCACATCAAGGCAGCCATCCAGCACCCTCG +CTACAAGCCCGTCCCTGCCCTGGAGAACGACCTCGCGCTGCTTCAGGTGTGCAGGGACGG +GACAGGGAGAACTGGGCACCCTCCTGTCCCCCACGGGTGCCCCTCACCCCCACTGCGCCC +TCCCCCCGCTGCCGACCCTCCCCCCGCACTGCTGCCCCTCCCCCCGCACTACTGCCCCCT +CCCCCATTGCCCACCCTCCCCCCACTGCCACCCCTCCCCCCGCTGCCGCCCCCTGCCCCC +GCACTCTCACCCCCTCCCCCTGCTCACCTGCCCCTTCCTGTCACTCGTAGCTGGACGGGA +AAGTGAAGCCCAGCCGGACCATCCGGCCGTTGGCCCTGCCCAGTAAGCGCCAGGTGGTGG +CAGCAGGGACTCGGTGCAGCATGGCCGGCTGGGGGCTGACCCACCAGGGCGGGCGCCTGT +CCCGGGTGCTGCGGGAGCTGGACCTCCAAGTGCTGGACACCCGCATGTGTAACAACAGCC +GCTTCTGGAACGGCAGCCTCTCCCCCAGCATGGTCTGCCTGGCGGCCGACTCCAAGGACC +AGGCTCCCTGCAAGGTGAGGGGCGCCcgggtggggctgggggaatgAGGCTGGCGGGAGG +GCCGGGGCCAGGGCAGCCGCCGGGCAGGTTCCTGGCTCTCCCGTTCTCTGGGGAGtcctg +tcaggggctggggggcgGGGAAGCACTGGCAGGGGTCCCGTTTCTCAggtgcagaaactg +aggctcagacaggtttAGCAACCTGCGCAAGACCACACAGCCGGGAAGCGGCAGAGCTGT +GACTTCTGCTCCAGCCAAGACGGTCCGGCGGGGGAAGAAGGAGCAGGGTTCACAGGGCCA +GCGGGAGATGGGGAGGGGACGCGCGTGGGCCGGGAGCAGCCCCTGTGTCTCCTTGAGCCT +GGGGATAACAGGCCTGGCCCTGCTCCCCTCGGCGGGCCCTGCTCCCCTCGTCCCCTCAGC +AGGCGCAGAGGCTGAGCTGCGGTGTGTCGTCCCTGCAGGGTGACTCGGGCGGGCCCCTGG +TGTGTGGCAAAGGCCGGGTGTTGGCCGGAGTCCTGTCCTTCAGCTCCAGGGTCTGCACTG +ACATCTTCAAGCCTCCCGTGGCCACCGCTGTGGCGCCTTACGTGTCCTGGATCAGGAAGG +TCACCGGCCGATCGGCCTGATGCCCTGGGGTGATGGGGACCCCCTCGCTGTCTCCACAGG +ACCCTTCCCCTCCAGGGGTGCAGTGGGGTGGGTGAGGACGGGtgggagggacagggaggg +acCAATAAATCATAATGAAGAAACGCTCAGAGCCCGCCTGAGTCCCAGCCCACCTCTGTC +CATGCTGGCTGTGGGGCTTCCGACAAACCTgtttccctcagcctcccgagtaactgggtc +tacaggcgcccgccaccacgccaggctaacttttggtatttttagtagagaaggggtttc +tccatgtttgtcaggctggtctccaactcttgaccttgtgatctgcccacctcggcctcc +caaagtgctgggattacaggcgtgagccaccgcgcccggcccttcccTGTTTTAAAAAGG +GAGGTTGTGGATCCCAAGGCTTCTCCCAGGAGGGGGCGGCGTTGGCCAGGACTGGAGCGG +TGGCCGGGTCTGCAGGCTGGCAGGGGTGCGCGGCCGTCCTCCCCGCGTGGCTCCTGGGGC +TGGGCCTTGAACAGCATCCCAGGATCTTCTTTTTTAGTAACAGCTTTTATCAAGTTACAA +CTCACATAGCAGATGAGTCTCCCTGTAAACTGCGATTCAGGGGCCTTTGGTACCTGCACA +GAGCTGGGCAACCACCACCGTGACATGTCACCCCAGCACCCCGAAAACAGGCCCGTCCCC +AGTCACCCCAGCACCCCGAAAACAGGCCCGTCCCCAGTCACCCCAGCACCCCGAAAACAG +GCCCGTCCCCAGTCACCCCAGCACCCCGAAAACAGGCCCGTCCCCAGTCACCCCAGCACC +CCGAAAACAGGCCCGTCCCCAGTCACCCCAGCACCCCGAAAACAGGCCCGTCCCCAGTCA +CCCCAGCACTCCGAAAACAGGCCCGTCCCCAGTCACCCCAGCACCCCGAAAACAGGCCTG +TCCCCTGTCACCCCAGCACCCCGAAAACAGTCCTGTCACCCCAGCACCCCGAAAACAGCC +CTGTCCCCACTGTCACCCCAGCACCCCGAAAACAGGCCTGTCCCCACTGTCACCCCAGCA +CCCCGAAAACAGGCCCGTCCCCACTGTCACCCCAGCACCCCGAAAACAGGCCTGTCACCC +CAGCACCCCGAAAACAGGCCTGTCCCCCTGTCACCCCAGCACCCCGAAAACAGGCCTGTC +CCCACTGTCACCCCAGCACCCCGAAAACAGCCCTGTCCCCACTGTCACCCCAGCACCCCG +AAAACAGGCCCGTCCCCACTGTCATCCCAGCAGCCCGAAAACAGGCCTGTCCCCACTGTC +ACCCCAGCAGCCCGAAAACAGGCCCCATCTCTATCACCCCAGCACCCCAAAAGGAAGCCC +CACCCCCATTGTCATTCCAGCACCCCGAAAATAGACTCTGTCCCCACTGTCACCCCAGCA +CCCCAAAAGGAGGCTCGTCCCCATCGGCCGTCACTCCccgtccccaccccagccccggTG +CCCTCACATCCCCTCCCTGTCTCTGGATGGGCCTGTGCTGACATTTCATGGACAGGGGAT +CACGCTGCgtggccttctgtgtctggcgTCTCCCGCTGAGCGTGACGTCCTCAAGCTGCA +CCCGCGCGCTGGCTGGGTCCGAGCCGTGCTCCTGCTCCGGGGGGTCGAGCTCCAGCTCGA +GGGGGGCCTCGCTGCGTTTGTGGGTGCGTCCCTGGGTGCACATCTGGGCGGCTTCGTCTG +CGTCCGTCCGTCTGAAGCTTTGCTGGGAGCCGCCTGTGTGCGTTTTCGTGTGGACCTAcc +tgctccttcctccctccagatTAGACCCGTGGGAGTGGCATCTCGGGCTGTTCAGTGACT +CTGTTTCAGCGCCGCGCTGTTTTCCTGCagaatcttttaatttcattaccaactctttct +ttcttttcttttctttcttccctttcttccccttcttctctttccctcccttccccttct +tctctttccctcccttccccttcttctctttcccttccttccccttccctcccctcccct +cctctctttctttctttcctttcttccccgtctccccttcccctcccctcccctctcctc +ccctcccctctcctcccctcctctctttctttctttctttcttttcttttctttttttct +tttattttcctttcttttcttctgatggAGTCTCAGTgcgtcacccgggctggagtgcag +tggcacgatctcggctcactgcaagccatctcaggttcaagcgatgcttgtgtctcagcc +acctgagtagctgagggatcacagacgtgcaccaccacgcccagctaactttttttgtat +ttttagtagagactaataGAAAcacaggtttcaccacgttgaccaggctggtcttgaact +cctgacctcaggtgacccgcccacctcgccctcccaaagtgctgggattacaggcatgag +ccactgtgcccacgttaatggttttttattattttattttatttttagacagttcccact +ctgttgcccaggctggagtgcagcctcagcctcccaagtagctggaattataggggtcca +ccaccaagcccagctaatttttttggatttttactagagacggggtttcaccatgttggt +caggctggtctcgaactcctgacctcaaataatccacccgcctcggcttcccaaagtgct +gggattacaggtatgagccactgtgcccggccgggtTAGTGTTGTAatagacttaatttt +taaaaccatttttggTCTGCAGGAGATGTGTGGCGGCTGTATCCACAGGGTCCCCCGCGT +CCCCGCCCCCAGGCTCCTGGCCGCTCCCCTCTCCAGTCCAGCAGGAGTCACGGCTGACGA +ACTCACATGAATGCGTGATTAACTACTAAGGACCTACGCTTGGCTCGGATTTCCTCAGTT +TCCCCTAATGTCTCTTCCTGCACAGGGTCCCACCCGGGACCGAACCTGCCGTTTTGCCGC +AGCCTCTCCTCGGCACCCCCAGGCTCCGACCGTTTCTCAGAACTCCGTGTCTGGAGGCCG +GCTGGACGGGATTTATGTAGATTACGGGTGTGGACCACTGCACCCGCCAGCTATCTCATG +TTTTTCTCTCGATTGGACTGGAGTCACAGTGTTTTTGGGAGAGGCAAGTGCATTTTTAat +ctttaacttttttaatttttttatgttatttttttagagactcctgggctccagcaatcc +tcccacctcagcctcctaaaggattacaggtgtgagccaccgcgcccggcctaatcttTA +ACTTTTTATGGCATCATTGGCAGTGGAAGGTTCTCAGGTCACAAGTGAAGAGCCTCATAA +CTCACAAACCAGGCACGCCCCTGTTCCCGGCACCTGGGTCCAGATACAACCCCCTGCCAC +GAAGCCCCTCCTTAGCCAAGTACCCAAGtccagtgtctttttttttttttgagattccag +tctcgctctgtcccccaggctggagtgcagtggtgcaatctcagctcactgcaagctcca +cctcccgggttcatgccattctcctgcctcagcctccccagtagctgggactacaggcgc +ccgccaccacgcctggctaattttttaaatatttttagtagagacggggtttcacggtgt +tagccaggatggtctcgatctcctgacctcgtgatccacccacctcggcctcccaaagtg +ctgggattacaggcatgagccactgcgccccgccccaAGTCCAGTCTCTAACCCCAGAGA +TGGGCCCTGCCTGtttgggttctttttttgttttttgtttttgtttttgttttgacacgg +agtctcgctctgtcgcccaggctggagtgcagtggtgcaatctcggctcactgcaacctc +cgcctcctgggttcaagcaatcctcctgcctcaacctcccgagtagctgggactataggc +acgcgccaccacgcccggctaatttttgtatttttagtagagacggggtttcaccagatt +ggccaggctggtcttgaactcctgacctcatgatccgccagccttggtctcccaaagtac +tgggatgacaggcgtgaggcaccacgcccagcccctttgggtttttaaattgttcattca +tggccaggcatggtggctcgcgccggtaatcccagcacatcgggaggctgaggcgggcgg +atcacgaggtcaggagttcaagatcggcctggccaacatggtgaaaccctgtctctacga +aaattacaaaaaaaattagctgggcatggtggtgggcacctataatcccagctacttggg +aggctgaggcaggagaatcacttcaagcCGGGAAagggaggttgcagggagctgagatca +caccactgcactctagcctgggcgacaagagcgagactccgtctcagaaaaaaaaaaaaa +caaaaccataaataaaaaattttttaaaaaatgataaatgtttgcaaCTCTAGCTATGTT +AATGTCTGATCAGCACACATTGTATGTATTGAAAcgtcactatgtaccccatgaatatgt +acaattattatgtgttctttttttttttgagacagagtattttgctcttgttgcccaggt +tggagtgcagtggcacgatctcggctcaccgcaacctccgcctcccagattcaagcgatt +cccctgcctcagcctcccgagtagctgggattacaggcacccgccaccacgcccggctac +tgtttgtatttttagtagagacggggtttcgccatgttggccacgctggtctcaagctcc +tgatgtcgtgatccgcccgcctcagcctcccaaggtgctgggattacaggcgtgagccac +cgcgcccggcatgtgttcattttttttaaaaaaaaaaaaggataaaaaggccaggcacgg +tggctcacgcctgtaatcccagcacttttggaggccaaggctggtagatcacttgagccc +aggagttcgagaccagcctggccaacatggtgaaaccccgtctctactaaaaatacaaaa +aaattaaaattaaaaataaaaacaaataaagaaaagataaaaagaaagccaGGCCTCTTG +GCAATGAAAGCTGCCCGGGGCagccctctccctcttcctggtGCAGGTGTGTTGCCAGCG +TGGATGTCCTTCGTGGACGTGaacttattttacaaaagagCACTTGTCCAGAGCTAGTCC +TGAGCCTGCGGTTTCTGGGAGTCACCAGCTCGAATGACGCAGGACAAGTACACTTTGGGG +TGGCACGTCCTGGTGCTGTTATTTTGGGGTGGGGTGTCCTTCCGTGGTACGGCTGGACCA +CGTTGCCTCTGTCCACTCACTGCCCTCGAGGGATGGGTGAGCTGTTTCCACCTTTGGCTG +CCGTGACCTGGGCTGCTGTGAACTTCGCAGACGTTTGTGTTTCTTTCCCGCACGGAAACT +TGGACAGAAGCTCCTTGTCACGTCCCACAGTCACACGGCCCCTGCACGTGCTTAAAAGAA +gctgtggtgttttttttttgttttttttttttttgttgttgttgtttgcttttttttttg +agacggagtctctgtttccaggctggagtgcagtggcgcaatctcggctcactgcaacct +cctcctcccgggttcaagtgattctcctgcctcagcctcccgagtagctgagattacagg +cacccaccaccacgcccggctaatttttgtattttcagtagagatggggtttcaccatgt +tggtcaggctggtctcgaactcctgacctcaggtgatccacccgcttcggcctcccaaag +tgctgggatgacaggtgtaagccaccgtacccagcgGAAGCTGCGATTTTCCTTATTCCT +TGACATCCTCAAGGGAGACCCTGATGTAGAGGCAGGGAGGCTAGGAAGGAGGAAGCATCC +AGCCCAGTGGGGTGGACCCGTCAGAAATGCTCAGAGGcggccgtgcatggtggctcacac +ctgtcatcccagcattttgggaggccgaggcgggcggatcacctgaggtcgggagttcga +gatcagcctggccaacacagagaaaccccgtctctactaaaaatacaatgttagccgggc +gtggtggcgcatgcctgtaatcccagctactggggaggctg +>NC_060944.1 Homo sapiens isolate CHM13 chromosome 20, alternate assembly T2T-CHM13v2.0 +tttCTTCTGTCAGCATAACACCTAGTCAATTGTTCATGAGATGTGTCAAGCTCTTGACTC +AGGTGTGTcctttcatccattcatccattcatccattcatccgcCTGCCCATTTGTCCAG +TCATTCATCAGTCTGTCACTTAATGGGTGTCTACTTGTACTAAGCACTGTACTGGGGATA +AAAAGATGAATTACTCCCTCCCAGCCCTTGAAGGGCTCACAGTAGGGACACAaacaatta +ttatatataatagaatctGAGGGATTATGAAAATCCAGAGGaaagaatgactttttttct +tcttctttttttttgagacggagttacgctctttgttgcccaggctggagcgcagtgttg +cgatctcagctcactgcaacctccacctcctgggtttgagcagttctcctgcctcagcct +cccgagtagctgggattacaggcattcaccaccacgcctggctaattttttgtattttta +gtggagacggggttttgccatgttggccaggctggtcttgaaatcctgatctcaggtgat +ctgcctgcctcggcctcccaaagtgctgggattacaggagtgagccaccacacctggcca +agaatgaCTACTTCTAAAGCAGTCAGGAAAGGCTTCACCAAGAATATATTCTGGatcctt +cttttaatttttttttttttttttgagacagagtttcactcttgttgcccaggatggagt +gcaacggcacgatctcagctcaccgcaacctccacctcccaggttcaagcaattctcctg +cctcagcctcccgagtagctgggattacaggcatgcaccaccatgcctggctaattttgt +atttttagtagagacagggtttttccatgttggtcaggctggtctcgaactccccacctc +aggtgatccgcccaccttggcctcccaaagtgctaggattacaggcatgagccaccgcat +ctggcccttctttttaatttttatttatttatttagacagggtctcactctgttgccttg +gctggagtgcagtggcacaatcatagctcactgcagcctcaacctctagggctcaagcga +tccttccacctcagccttctatgccaccatgcctaattttaaaaaaattttttgtagagg +tggggtctcattatgttgcccagactgatcttgaactcctgggctcaagcaatcctcttg +cctcaacctcccaaagtgctaggatcgcagatgtgagccaccacactgggctctggtacg +ttcttaaagaaaattttgcCACAGGGAAGAGTGTGTTAAGGGGAAAGTACTCCAGGCAGA +AGAGTTATGTGCAAAGACCTTGTCACATGAAAGAAACACCATGTCCAGGAAACAAAGAGT +TCTATGAAGCTGAAGTGCCAGGTAAAGGGAGAGAACAGAAGCAGGTAGCACCGCAGTAAA +AGAGGCTGGGCTGGATTCATCCCGCAAAGGAGTCTGGGTTTATCCTGTACTcaggaggaa +gacagggagggatTTTACTTTGGGCCTGAGGGCCATCCTTTGGAAGACCAGGCTGTACGT +TTTCAAGAGGGGTCAAAAACATGCAGGAAACAGAGAAGCCTTTTTATATAACATCGGTGG +AGGCAAACCATGAGAAGAATTTAATTtccaacaaagagaaaaaacctaacatatttaatt +tttttttaacttgggaGTACCCCTGCACtttccacacatcacaaattgaCAGCACTTGAG +TGGCAATACTGAATACTGCTTGAGGGAAGCTGATATTCAGAAGTCTTGTTAACCTATTTG +CTAAGAGTATgataatttttcttcagtttgttTAGACATACATCCACCCCATCTCTCTTT +CTAAATAAGCTATTCGGCAATCTGGGAGAAAGGAAATCTTgtatcttggggaaaaaaacc +acTATGCAGTCAACTGAATTTCCATGAGGTTTTGGCAAACCATTTGCCAGAATGTTACTT +AATTCTGAACTCAAATCCTCAAATCATACCTCCCATAACTCATTTCTCTTAAGACTctgt +tccaatttttttttttttttttgagacagggtcttactctgtcacccaggctggagaata +gtggcacgatcatggctcactgcagcctcaaccttctgggctcaagtgatcctcctgcct +tagcctcccaggtagctgggaccacagacaaaCTCCactggcccagctaatttttgcgta +tatatattttgtagagaaaaaaagtgttgcccaggctgatctcaaactcctgggctctag +tgatccacccacctcgacctcccaaagtgctgggattacaggcgttgagccaccatacct +ggcctccaATTCTACTTTTAATCCTGCATTTCAAAATTTACTtactatttcaaaattttt +ggCACTCTGTGGGAACGCAACAAATACGTGCAGAATATAGTAAGTGATTTAGTTTAGTTA +TTGTTCCTCTGGAAAAAACTGGCTTGCAGTAAATGACATTATTTTTCCCATACTGTTAAG +GTGATGCTCACTGCAGAACTCTCTAAACAGATCTGCAGACTCTTTGGCCTGTTTCTAACA +CTACCGGTGTTTCCCAGAGGAGGATGCTGTCCCAACGTGGATTTCGGCTGCTGTTTTTTT +CAGGCCCCAACACCACCCTCCTCAACCCCACAGCCTAGTGATTAAATGTCAGTGGCAGAT +GGAGAAAGCACTCCCACGTGTGCCACTCTGACAAATACTTTATTCCAACTAAATGTATAG +GCTCTCACTGTGACataaaaagggaagaggaaacagaaaattcaaGTGAGCTAAAGATGT +ATGAATTACAGAGTGAGATCAACTGCTAGACGACACAGGGAGGGAGTTAGCAGCGTCTCC +ACTGAAAGACAAATTCACAGACATCCTGTTTATTTCCGAAAGAGAAACATCATAGAGCTA +TTCTTGGGATGTTCaggaaaagattaaaataaatgccTATTATCTATTGTATTTCGAGAT +AAACTTTATAGATTTAGAGCAGGACACACATTTCTGGACTTGAGAACGCTGTATCTGGCT +TGGAATAAAAGCCCACATTTCATCTAGAGGTAGAATGTATGTCATTCTAATCTCCCTCAA +TCCTTTCTTCTCCAATTTCTTTATTGCCCCACTTACAAGATAGTGCACTATTATTCCAAA +GCTGATACCTTCCAAATTCCTTTATAGTAGAGGTCTTGGCTATCATAACCATGATGGAAC +GAATGACCGTCCTACAGCTGGCTGCAAAATATAAGACTGCTATAAATAAATCCCTGATGC +CTGAAAagtaattcattcaacaaaggaAGATAGGTATGACTTTGGCCTACTCTTCATTAG +AacgcttatttttatttatttatttatttatttataaagaggGCAAAGCAGACTTTATTT +GAGGGGCACCACAGCAATAGGTATAGCAACAACTGCAACAGGGTTTTGTAGTCAGGGAGG +GAGATCAGACTCAACTCCCTAAAATGCTAATTTTAACAATGGGACACTTTATCTGAACTG +TGGTTCTTAATGGTTCAGATAAAGATGACACAACCCACTATTGGCTTAAACTTCTCCCAA +CTCTGGCTACAGAATCCAGGTAAAGATTTCTGCCCCCTCAGAGTAATAGGCATGTCCAAA +ATCACCTGGATTAGGGCACTTAATACACTGGGAAGGGACGATAACAACTAAAGATGACCA +CTATCCATGCCTCCTCTAAaagttttttcatatattttttcatatcacCAAAACAAATAC +TAACTTGGATCAACTAATTTATATAATGGAATCTCGTGTGAGCGTACAAAATTCCATACT +GATTATTTGGTTTAAGCCTGCATTATCATAAAGGCTTTACAGTCTTTAAACTGAAATTAA +GCTCAAATTAAGAAATGCTAGTCTTAAAACAATGGAAGGGGGGGGCCGTtttgtgtggag +ggagggagacagacataCCCCTACACCCACCCACAACTACTGATATTGACATTGGAAATT +AACTTGAAAatttatgcctgtagtcccagctactcaggaggctgaggtgggaggagcact +taagtccaggagttgggAGATGACAGTGAGCTTTgactgtgacactgcactccaacccgg +gtgacagggcaagatcccatctctcaaaaaaaaaaaaaaatgctttaactCGACGTCTGT +ACCAGAAGACCACAGCAGGAGAGGAAAACCTTATTTCAGTCTGGGTAAGAGTTCtattaa +acacaaaataaaacaaactagcCTCTGTTTCTGGAGGTCTTCATTAGTAGTTTCTACAAA +ACAGTATCCAAATTAGCAAAGATTCTGTTAACTACCTGGAAAAAGCAGGTACCAAGAAAG +AATGTTTCACtacaatggaaaaaaacagtCTAGTAAGTAAACCAATCTGACTATAAACGC +TACAAAAGAGGGATTCTAGCATTAGTAACTTTGCCAACAATACTCTGatatgattaaaaa +acaaaacaataacaaaaacaaaaaacctcatctTTAAATTTGTCCCATTCATCCAGAGAA +GCAAAATCAAGGAAACTAGAGGGGGTAAAGTCTTGCAACAGATACACAGCTGCACTGCCA +ACAGGTCACAAGACCCATGCTGCCTAGGGCATTGACTGTTATGCCATGAGGACAGACATC +ACACAAACACCAGTAATTAAAGGGTTACGGTGCCAAAGGGTTCAGAGCTCCACTTCCATT +CAGTATCAGAAcataagaaaaagggaaaaacagaaaatgagcccaaataaaatataaaat +aaaatatagataccAGGAGCTTCCTCAAAATATGTGGGTTGTATTAATAACGTGTTTGGC +TCTGTTACGGGCACCATCCATCAGAGGACTGGAAATAGGGAAAGTCACCTTAGTCTTCCT +CAaggaaaaaagattatttaactTGGTTCACGGTGTACATTCATAATTTTAACTGtcatg +tatttattgaatgaaaaacaTTTGAGAACATCATGTGCAACAAAAACATGATTTCACAGA +AATTGTCCaaactaaaagagtataaaaaTAGAAGCGCTTTTTATacaattatttacttat +tattattattgagatagggtctccatctgtcacccaggccggagtgcagtggcgcaatca +tagagTAGCCTctaagtcctgggctcaagcgatcctcctgcctcagcctccagagtcgtT +GGGATCACAGGCTCGAGCCTCCACACCCgactaacttttaaaaactttttgtagagatga +ggcctcgcTGTGTTTCCCAGCCTgatctcgaaatcctggcctcaatcgatcctccaacca +tggcctcccaaagcgctgggattacaggcgcgagccatggtgcccggccgcTTTTACAca +attgaaaaacattaaaataggtGGCAGAAGACAGACAGAAAGTCGATTCGTGGTTGCCAG +GCGTCGTGAATACCGGGGAACGCGGAGTGCCTATTAATGGGTAAGGGTTTCGTTTTGGAA +TCAGACAGCGGCGATGgctgcacaactttgtgaattttCTAAGAATCACTGAACTGTGCA +CCTTAAAGGAAGAACTGTGTGGTAATTACATCGGCGGTACGCGGGCAGCGCGTCAATCAA +GCCGGCGACGGTGAATGCAGTTCGGGAGAGCTGATACCCCTCGGGGAGGCGGCTCCGGGA +GCCTGCGGACGTGGCGGACGCCTGGGACGGGGTGGGCCTGGCCTCCGCGCTCGAGGAGTC +CCAGTCCTCTCCAGATGGAAGAAAGCCGGGGCGCGAAGCCGCCGCCCGCTCTTCTGCCTG +GGGACGCGACTCTGCCGCCAGGCTCCCTCGGGTCAGCTCGGCACCCGCCCGAGCCCCCCC +AGTTCCAGGCCCTCTCCTCATCAGACGTGCCCTGGGCCCTCAGCCTGTTCCTCTCGCCGC +CCGGAACCCCGCAGCAGCCCCGGGTCCCCAGCCCGCGCCCCTCCGGCGCCGCCTCCGCCA +GCTGCCCCTGCCCCCCGGGCGGCCCTCGCAGGCCGCTCCCGGCGCCCCGGTCGGCTTCCG +TACCTGCCTTCTCCGCGCCGCCGTCCCAGTGGCCGGAGGTGGGGCCGTCGCCCTGCGCAC +TCCGGAGGGCCATGCCCCGGGGCCCCGGGCCCCCACCCGAGCCCCGGCTGGTGGCGGAGC +CGGGAGAAGACGCGGCTCCGACCGCGGGACGTAGCACCCGCTCGGCATCGGCAGGCTCCC +CTCCGTCGGCCAGCGGCGCGCAGGCGCGCAGGCGCCCCGCTGGCCCCGCCCCGCGCCGGC +ACGTGACCCTGCGCTACGCCCGGCCGGCGGCGGGGGAGGCTGCGGAAAGAGCGCGGTGAG +CGCTCTGAGGAGTTGGCTTCGTCTGCGCTGTAGACTCTACGGTGTAGAGTGTGGCGCTCT +TGAGCGAGTGTGCTCGAGACCAGCTGTCGTTTCCTTTGcttctttcatctgtaaaatagt +attgatgataataaaaatattgaactcaCAAGGTTATTGAGAGTGTTTAGAACATCACCA +AGCATATAGTAAATACTCCACAATTATGACCAATTTTTGCTTACCAAGGATTATTTTTTT +ACCTCCTGTCTCGTCTCCCCACACGAACTCCTGTCATCAGTTCTTGGGTACTTGGGGATC +TAGCAGGTTCATGTCATACGGGTCCGCAGGTTATGCACTGCACAAGGCCTGGGAGCGCCA +TTTACGTAGACGTTCACGTGAACCGTGCCCCCTTAAGTTGTGCGAAATAGTGGCCACTCA +TCTAAAGCAGCGCTCTGGCTTATCAGGTCTGATTTCCTTCTCGTCTTCAGTGATATTCCT +TTCTTTCCAATTAGACATCCATTCCCTTGGTTATATCCCTGGTATTGTGATTGTGGCCTC +CCGAATTTCTAGTGCTAGGTCTTCATGCTGAAGTTCCCATAATTCCAGTTGCTTGATGAC +TCTCTTCCACCTCCCACCCGCAACCACAACAGTTCTTTATTATCCTGAGACCTCCAGCCc +atgaaactcctgacctcgtgatccgcccgcctcagcctctcaaagtgctgggattacagg +cgtgagccaccgcgcacagccaAGTTTTACAGTTCTATTCATAAATCTAGTAAATTATAT +CAGTTATTTGGTCCCATTAATAAACTAAGCTAATTAAAATCCTTTGAACATTTGAAACTG +CATTTATAAATTCAATTCGTTTTTCTAAGTATCACAGGTTTCTAACAAAGCCTTTCAAGT +CCTTGTGTAATTCTTGTAAATGTAATACATTTATAAGAATACTGAGTCATGAGTGCTTTC +AAATGTGTCAATACAAACGAGATTTCATCTTAAAATCAAAAGTCTAAATCTATTCAAATA +CATATTTGTAATTAGTACAAGAATAATCTGTTAGAATtctcaaaattatctttttttttt +ttttgagacagagtctcactctatcacccagactggagtgcaatagcgatcatagctcac +tgcagcctcaagctcctgggctcaagctagcCTCCTgttgcagcctcccgagtagctgag +actgtaggcacacactaccatgcctggctagtttttttagtttttatagagGGGGTGGgg +aatctccctatgttgcccaggccggtctcaaactgccttcgcctcccaaagctctgggat +tacaggcgtgaatcacagTGCCAAGCTCTTGAAATTATCTTGAACATTATAGGAATTTAA +AGTATCACATTTACACAGATGCCTTAATGCAAAATTATTAATACTAGAAGTTTGAAAACA +TTTCTAGTCTTTGTTCTAAATCATCTgtgaggctcatgcctgtaatcccagcactttggg +aggtgaagggctgcagatcacttgaggtcaggagttcaagaccagcctcaccaacatggt +gaaaccccatctctactaaaaatacaaaaattagctgggcatggtggtgcctgcctgtaa +tcccagctacttgggaggctgaggcaggagaattgcttgaacctgggaggcagaggttgc +agtgagccaagattgcgccactgcactccagcctaagagacggagtgagactccatctca +aaaaataaataaataaaatgaaataaatcatcaTTGAGGTTAAAAGATGCTTAGTGCCCA +CTGAAGGAAGATTTAAGTCATCCCAGTTTAAGAGTAACGTGCTCAAGCAATTTGAGATAT +TTATTCCCTTCTCAGTTTACTGCGCTGGTCATCCAGCCAGCTGGATTCTTGCTTTTGGTA +GTGATGGAACAGTGACCCCCACCCCATTCCCACCACCACAACTCTAGGACTAAACAGTTG +TGTGGTCGTTGTGAAGCTTGGGCCAGAATTTACTTTCAAAAAATGTCCCGCTTCATGTAT +AATATAAAGACCTTACAATAAATTCCCATTTCTTCCCTCCTGTTCTTCTTGCTGTTGtcc +tacattttactttttaaaatcccttccttctcttgcttTCTCCCCTCTACCCACCAACCA +CTTGCAAACAACCACTGATCTACATCCTGTCACTATAgattggttttcattttctggaat +tttttatggacggaatcatatagtatgtagtcttttttgtctggcttcttttactcagcg +TAATTATTTTATAAGCAATCATGTTGCATTAATCaatagttcatttgtttttgttgttaa +gtAGAATTTCATCTTAGAAATATACCACGATTCattttatcagtattttaaatttttgca +tgtGCTGCAAGTACACAATTCATTGCTAATATGCTTGCCTTAGACCAGGCGGTTAGCAAA +AAAGATGGTCTGCCCACCTGCAAGCCAAAACCACTCTACTGCCTGATTTTGCACGGCTCA +TGAACTAAGAATGGCTTTTACCTTGATAAATGTTGAAAAATCACAACTTAATTGTAGCAC +ATTAAAACTATATGGAATTTAAATCTCAGTGTCCATAAACCTTTACTGAAACAGAGTCAC +GCTCATTCATTTACCTActgtctatggctgttttcatgCTGCAACGGTAGAGTTCAGTGG +TTGCAACAGAGATATGGcctacaaaacctaaaatatttattatctgctcctttatgtatt +tatttattttatgtgtgtatgtatgtatgtatttttttgagatggagtttcactcttgtt +gcccaggctggagtgcaatggcgcaatcgcagctcactgcaacctccgcctcccaggtcc +acgtgattctcctgcctcagcctcccgagtagctgggattagcccgccaccatgcctggc +taatttttttgtatttttagtagagacggggttttgccatgttggtcaggctggtctcaa +actcccgacctcaggtgatccgcccgcctcaggctcccaaagtgctgggattacaggcat +gagccaccgcacccggcctatctgctcctttatagaaaaagattggcaggacgtggtggc +tcacacctgtaatcccagcactttgggaggccgaggcaggcagattacatgaggccagga +gttcgagaccagcttggccaaagtggtgaaaccccgtctttactaaacatacaaaaatta +gccaggcatagtggcacaggtctgtaatcccagctactcaggaggctgaggcaggagaat +cacttgaacccaggaggcggagactgcagtgagccgagatcacaccattgcactccagcc +tgggtgacagagtgagactccacataaaaaaaaaaaaaataaaaaaaaaaaaagttttgt +gacCCTctattgtagagatggaggtattggggctgttgcccaggctggccttcaactcct +ggcctcaagggatcctcctgcttcagcctcccaaaaatgaTGGGATTTCAAGTTTGAGCC +CCATGCCCAGCTCACTTCAGTTATTTCtaaggtaatttaaaaaagattttaattgtACTT +ACCTTCATTCAATTTCCAGTGCTCTTAATTTCATTGTGTAG +>NC_060945.1 Homo sapiens isolate CHM13 chromosome 21, alternate assembly T2T-CHM13v2.0 +TGCCTACAGGGGACATTGGACATatatctgcactgatcacccaggtgatgcaactcttgc +ctaggctttgcctacaggggacattgtgacatatctcttcAATGATCACCCATGTGATGC +AACGCTTGCCTAGGCTTTGCCtacaggggacattgtgacatatctctgcactgatttCCC +AGGTGCTGTAACTTTAGGCTAGGCTCTGGCTACACGGCATTGTGATATATCACTGCACTG +AACAACCAGGTGATATAACCCCTGTATAGGCTCTGTCTACAGGGGGCTTGTGACATATCT +CTCCACggatcacccaggtgatataGCTCTTCTCTAGGATCTGCCTACAGGGtgctttgt +gacatatccctgCACTGATCACCCTGGTGATCTAACTCTTGTCTAAGCTCTTCCTAAAGG +GGCATTGTGACagatctctgcactgatcactcagGTGATGTAACTGTTGTCTAGGCTCTG +CTTCAAGGGGCCTTGTCAcaaatctctgcactgatcacccaggtgatgtaactcttgtct +aggctctgcttcCAGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGATGTAA +CACTTGTGTAGGCTCGGCCTACAGGGGAATCTTGACATACTCTGCACTGTTAAACGAGGT +GATTTAACTCTTCTCTAGGCTGTGCCCACAGGAGGATtgagacatatctctgcactgatc +ccGAGGTGATCCAACTCTTGCCTGGTGTCTGCCTActggggacattgtgacatatctctg +cactgatctccCTTGTGCTGCAACTTTAGTCTAGGTTCTGGATACacgacattgtgacat +atcagtGCACTGATCACATAGGTGatataactcttgtctaggctctgcgtACAATGgtct +tgtgacatatctctgcactgatcatccaGGTGATATAACTATTCTCTAGGATCTGACCAC +AGGGtgctttgtgacatatccctgcaatgatcacccaggtgatatacCACTTGCcaaggc +tctgcctacaggggcattgcAATGTATCTCAGCACTGATCACCTAGGTCTTGTAACTCTT +TTCTAGGATATGCCTACAGGGTGCTTTGTGACGTATCCCAGCAAGGATTACCCGGGTGAT +GTACCGCTCAtcaaggctctgcctacaggCACATTGCGatgtatctctgcactgatcacc +taggtcaTGTAACCTTTGTCTAGTCTCTGCCTACGatggcattgtgacatatttctgcac +tAATCATCCAactgatgtaactcttgtctaggatcTGCCTACATTAACTTTGTGATATAA +TCCTGTACTGATCATCCAGGTGATGGGGtttttgtctaggctctgcctaagggggtattg +tgacatatttctgcatTGATCACCCAGGTGGCGAACTCTTCTCTTGTATCTGCCTATGCG +GGCATTGTGAcaaatctctgcactgatcacccaggtgtcGTAACTGTTGTGTAACCTCTG +CCTACAGGGGAATTGTGAGAGATCTCGCCACTGATCACCCAAGTGATGTAACCATTGTCT +ACGCTATGCGTAcagggggctttgtgacatacctttgcactgatcacccaggtgatgtaa +cacaTCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactgatcacttaGGTG +ATGTACCACTTTTATAAGCACTGCCTACAGGGAATTTTGACAAATCTGTAcactgatcac +ctaggtgatgtaactcttgtctaccCTCTGTCCAACggggcattgtgaaatatctctgca +ctgatgaCCCAGGTGATTCAACTCTTGACTAGGAACTGCCTACAGAGgttattgtgaaat +atctctgcactgataaACTAGGTGGTGTAACCCTTGTCCAAGTTCTGCCTACAGGGGCGT +TTTCACATATCCCTGAACTGATGAcaaaggtgatgtaactcttgcctAGGCTTTGCCTAC +AGGGGACATTGGACATatatctgcactgatcacccaggtgatgcaactcttgcTTAGGGT +TTGCCtacaggggacattgtgacatatctcttcAATGATCACCCATGTGATGCAACTCTT +GCCTAGGCTTTGCCtacaggggacattgtgacatatctctgcactgatttCCCAGGTGCT +GTAACTTTAGGCTAGGCTCTGGCTACACGGCATCgtgacatatcactgcactgaACAACC +AGGTGATATAACCACTGTATAGGCTCTGCCTACATGGggcttgtgacatatctctgcacg +gatcacccaggtgatataGCTCTTCTCTAGGATCTGCCTACAGGGTGCTTTGTGATATAT +ccctgcactgatcacccaggtgatctAACTCTGGTCTAAGCTCTTCCTAAAGGGGCATTG +TGACagatctctgcactgatcactcagGTGTTGTAACTGTTGTCTAGGCTCTGCATCAAG +GGGCCTTGTCACAACTCTCTGCattgatcacccaggtgatgtaactcttgtctaggctct +gcttcCAGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGATGTAACACTTGT +GTAGGCTCGGCCTACAGGGGAATcttgacatatctctgcactgttAACCGAGGTGATTTA +ATTCTTCTCTAGGCTGTGCCCACAAGGGATtgagacatatctctgcactgatcccGAGGT +GATCCAACTCTTGCCTGGTCTCTGCCTActggggacattgtgacatatctctgcactgat +ctccCTTGTGCTGCAACTTTCGTCTAGGCTCTGGCTACacgacattgtgacatatcagtG +CACTGATCACATAGGTGatataactcttgtctaggctctgcctacaatggtcttgtgaca +tatctctgcactgatcacccaggtgatataaCTATTCTCTAGGATCTGACCACAGGGtgc +tttgtgacatatccctgcaatgatcacccaggtgatatacCACTTGCcaaggctctgcct +acaggggcattgcAATGTATCTCAACACTGCTCACCTAGGTCTTGTAACTCTTTTCTAGG +ATCTGCCTACAGGGTGCTTTGTGACGTATCCCAGCGAGGAGTACCCAGGGGATGTACCGC +TCAtcaaggctctgcctacaggCACATTGCGATgaatctctgcactgatcacctaggtca +TGTAACCTTTGTCTAGTCTCTGCCTATGATGGCATTGTGACATATGTCTGCACTAATCAT +CCaagtgatgtaactcttgtctaggatcTGCCTACATTAACTTTGTGACATAATCCTGTA +CTGATCATCCAGGTGATGGGGtttttgtctaggctctgcctaagggggcattgtgacata +tttctgcgTTGATCACCCAGGTGGTGAACTCTTCTCTTggatctgcctatgggggcattg +tgacaaatctctgcactgatcacccaggtgatgtaactgttGTGTAACCTCTGCCTACAG +GGGAATTGTGAGAGATCTCGCCACTGATCACCCAAGTGATATAACCATTGTCTAGGCTTT +GCGTACAGGCGGCTTTGTGACATACCTTTGCACTGATCAGCCAGGTGATGTAACACATCT +AAGTTCGGCCTATAggagctttgtgacatatctctgcactgatcacttaGGTGATGTAAC +ACTTTTATAAGCACTGCCTGCAGGGAATTTTGACAAATCTGTAcactgatcacctaggtg +atgtaactcttgtctaccCTCTGTCCAACggggcattgtgaaatatctctgcactgatga +CCCAGGTGATTCAACTCTTGACTAGGATCTGCCTACAGAGgttattgtgaaatatctctg +cactgataaACTAGGTGGTGTAAACCTTGTCCAAGTTCTGCCTACAGGGGCGTTTTCACA +TATCCCTGAACTGATGAcaaaggtgatgtaactcttgcctaggctttgcctacaggggac +attgtgacatatctcttcAATGATCACCCATGTGATGCAACTCTTGCCTAGGCTTTGCCt +acaggggacattgtgacatatctctgcactgatttCCCAGGTGCTGTAACTTTAGGCTAG +GCTCTGGCTACACGGCATTGTGATATATCACTGCACTGAACAACCAGGTGATATAACCCC +TGTATAGGCTCTGTCTACAGGGggcttgtgacatatctctgcacggatcacccaggtgat +ataGCTCTTCTCTAGGATCTGCCTACAGGGtgctttgtgacatatccctgCACTGATCAC +CCTGGTGATCTAACTCTGGTTTAAGCTCTTCCTAAAGGGGCATTGTGACagatctctgca +ctgatcactcagGTGATGTAACTGTTGTCTAGGCTCTGCTTCAAGGGGCCTTGTCAcaaa +tctctgcactgatcacccaggtgatgtaactcttgtctaggctctgcttcCAGGGCATAT +TGTGACATATCTATGCACTGATCACCTTAGTGATGTAACACTTGTGTAGGCTCGGCCTAC +AGGGGAATCTTGACATACTCTGCACTGTTAAACGAGGTGATTTAACTCTTCTCTAGGCTG +TGCCCACAGGAGGATTGAGACATATCCCTGCACTGATCCCGAGGTGATCCAACTCTTGCC +TGGTCTCTGCCTActggggacattgtgacatatctctgcagtgATCTCCCAGGTCCTGCA +ACTTTAGTCTAGGCTCTGGCTACacgacattgtgacatatcactgcactgatcacccagg +tgatataactcttgtctaggctctgcctacaatGGTcatgtgacatatctctgcactgat +cacccaggtgatataaCTATTCTCTAGGATCTGACCACAGGGTGCTTTGGGCATATCCCT +gcaatgatcacccaggtgatatacCACTTGCcaaggctctgcctacaggggcattgcAAT +GTAtgtctgcactgatcacctaggcCTTGTAACTCTTTTCTAGGATCTGCCTACAGGGTG +CTTTGTGACGTATCCCAGCAAGGATTACCCAGGTGATGTACCGCTCAtcaaggctctgcc +tacaggCACATCGCGATGTATCTCTCCACTGATCACCTAGGTCATGTAACcattgtctag +gctctgcctacgatggcattgtgacatatctctgcactaaTCATCCAAgtgatgtaacac +ttgtctaGGATCTGCCTAAATTAACATTGTGACATAACCCTGTACTGATCATCCAGGTGA +TGGGGcttttgtctaggctctgcctaagggggcattgtgacatatttctgcatTGATCAC +CCAGGTGGCGAACTCTTCTCTTggatctgcctatgggggcattgtgacaaatctctgcac +tgatcacccaggtgacgTAACTGTTGTGTAACCTCTGCCGACAGGGGAATTGTGAGAGAT +CTCGCCACTGATTACCCAAGTGATATAACCATTGTCTAGGCTTTGCGTACAGGCGGCTTT +GTGACATACctttgcactgatcacccaggtgatgtaacacaTCTATGTTCGGCCTAAAGg +cgctttgtgacatatctctgcactgatcacttaGGTGATGTAACACTTTTATAACCACTG +CCTACAGGGAATTTTGACAAATCTGTACACTGATCACCTAGGTGACGTAACTCTTGTCTA +CCCTCTGTCCAACGGgtcattgtgaaatatctctgcactgatcacccaggtgattcAATT +CTTGACTAGGATCTGCCTACAGAGgttattgtgaaatatctctgcactgataaACTAGGT +GGTGTAAACCTTGTCCAAGCTCTGACTACAGGGGCGTTTTCACATATCCCTGAACTGATG +ACAGAGGTGATGTAACACTTGCCTAGGCTTTGCCTACAGGGGACATTGGTCATATATCTG +CACTGATCTCCCAGGTGATGCAACTCTGGCCTAGGCTTTGCCtacaggggacattgtgac +atatctcttcAATGATCACCCATGTGATGCAACTCTTGCCTAGGCTTTGCCTAaagggga +cattgtgacatatctctgcactgatctccCAGGTGCTGTAACTTTAGTCTAGGCTCTGGC +TAGacggcattgtgacatatcactgcactgatcaACCAGGTGATACAACTCTTGtatagg +ctctgcctacagggggcttgtgacatatctctgcactgatcacccaggtgatataGCTCT +TCTCTAGGATCTGCCTACAGGGtgctttgtgacatatccctgcactgatcacccaggtga +tctAACTCTGGTCTAAGCTCTGCCTAAAGGGTCATTGTGACagatctctgcactgatcac +tcagGTGATGTGACTGTTGTCTAGGCTCTGCTTCAAGGGGCCTTgtcacatatctctgca +ctgatcacccaggtgatgtaactcttgtctaggctctgcttcCAGGGCATATTGTGACAT +ATCTATGCACTGATCACCTTAGTGATGTAACACTTGTGTAGGCTCGGCCTACAGGGGAAT +cttgacatatctctgcactgttAACCGAGGTGAtttaactcttgtctaggctgtGCCCAC +AGGGGGTTTGAGACATATCTCTTCACTGATCCCGAGGTGATCCAACTCTTGCCTGGTCTC +TGCCTActggggacattgtgacatatctctgcactgatctccCAGGTGCTGCAACTTTAG +TCTAGGCTCTGGGTACACGACATTGTGAaatatcactgcactgatcacccaggtgatata +actcttgtctaggctctgcctacaatggtcttgtgacatatctctgcactgatcacccag +gtgatataaCTATTCTCTAGGATCTGACCACAGGGTGCTGTGTGACATATCCCTgcaatg +atcacccaggtgatatacCACTTGCCAAGGCTCTGCCTACATGGGCATTGCAATGTATCA +CTGCATTGATCACCTAGGTCTTGTAACCCTTTTCTAGGATCTGCCTACAGGGTGCTTTGT +GACGTATCCCAGCAAGGATTACCCAGGTGATATACCGCTCAtcaaggctctgcctacagg +CACATTGCGatgtatctctgcactgatcacctaggtcaTGTAAGCTTTGTCCAGGCTCTG +CCTACGatggcattgtgacatatctctgcactaaTCATCCAAgtgatgtaacacttgtct +aGGATCTGCCTAAATTAACTTTTTGACATAACCCTGTACTGATCATCCAGGTGATGGAGc +ttttgtctaggctctgcctaagggggcattgtgacatatttctgcatTGATCACCCAGGT +GGCGAACTCTTCTATTggatctgcctatgggggcattgtgacaaatctctgcactgatca +cccaggtgacgTAACTGTTGTGTAACCTCTGCCGACAGGGGAATTGTGAGAGATCTCGCC +ACTGATCACCCAAGTGATGTAACCATTGTCTACGCTTTGCGTACAGGTGGCTTTGTGACA +TACctttgcactgatcacccaggtgatgtaacacaTCTATGTTCGGCCTAAAggagcttt +gtgacatatctctgcactgatcacttaGGTGATGTAACACTTTTATAACCACTGCCAACA +GGGAATTTTGACAAATCTGTACACTGATCACCTAGGTGACGTAACTCTTGTCTACCCTCT +GTCCAACGGgtcattgtgaaatatctctgcactgatcacccaggtgattcAACTCTTGAC +TAGGATCTGCCTACAGAGgttattgtgaaatatctctgcactgataaACTAGGTGGTGTA +AGACTTGTCcaagctctgcctacaggggcgttTTCACATATCCCTGAACTGACGACAGAG +GTGATGTAACACTTGCCTAGGCTTTGCCTACAGGGGACATTGGACATATATCTGCACTGA +TCTCCCAGGTGATGCAACAATGGCCTAGGCTTTGCCtacaggggacattgtgacatatct +ctgcactgatctccCAGGTGCTGTAACTTTAGTCTAGGCTCTGGCTACACGGCcttgtga +catatcactgcactgatcaACCAGGTGATATAACTCTTGTAttggctctgcctacagggg +gcttgtgacatatctctgcactgatcacccaggtgatataGCTCTTCTCTAGGATCTCCC +TACAGGGtgctttgtgacatatccctgcactgatcacccaggtgatctAACTCTGGTCTA +AGCTCTACCTAAATGGGCATTGTGACagatctctgcactgatcacccaggtgatgtactT +GTTGTCTACGCTCTGCTTCAAGGGGCCTTgtcacatatctctgcactgatcacccaggtg +atgtaactcttgtctaggctctgcttgCAGGGCATATTGTGACATATCTATGCACTGATC +ACCTTAGTGATGTACCACTTGTGTAGGCTCGGCCTACAGGGGAATCTTGACAAATCCCTG +CACTGTTAACCGAGGTGAtttaactcttgtctaggctgtGCCCACAGGGGGTTtgagaca +tatctctgcactgatctcgAGGTGATCCAACTCTTGCCTGGTCTCTGCCTActggggaca +ttgtgacatatctctgcactgatctccCAGGTGCTGCAACTTTAGTCTAGGCTCTGGGTA +Cacgacattgtgacatatcactgcactgatcacccaggtgatataactcttgtctaggct +ctgcctacaatggtcttgtgacatatctctgcactgatcacccaggtgatataaCTATTC +TCTAGGATCTGACCACAGGGTGCTGTGTGACATATCCCTgcaatgatcacccaggtgata +tacCACTTGCCAAGTCTCTGCCTACATGGGCATTGCAATGTATCTCTACACTGATCACCT +AGGTCTTGTAACTCTTTCTAGGATCTGCCTACAGGGTGCTTTGTGACGTATCCCAGCAAG +GATTACCCAGGTGATGTACCGCTCAtcaaggctctgcctacaggCACATCGCGatgtatc +tctgcactgatcacctaggtcaTGTAACctttgtctaggctctgcctacgatggcattgt +gacatatctctgcactaaTCATCCAAgtgatgtaacacttgtctaGGATCTGCCTAAATT +AACTTTGTGACATAACCCTGTACTGATCATCCAGGTGATGTGGcttttgtctaggctctg +cctaagggggcattgtgacatatttctgcatTGATCACCCAGGTGGCGAACTCTTCTCTT +GGATCCgcctatgggggcattgtgacaaatctctgcactgatcacccaggtgacgTAACT +GTTGTGTAACCTCTGCCGACAGGGGAATTGTGAGAGATCTCGCCACTGATCACCCAAGTG +ATGTAACCATTGTCTAGGCTTTGCGTACAGGCGGCTTTGTGACATACctttgcactgatc +acccaggtgatgtaacacaTCTATGTTCGGCCTAAAggagctttgtgacatatctctgca +ctgatcacttaGGTGATGTAACACTTTTATAACCACTGCCTACAGGGAATTTTGACAAAT +CTGTACACTGATCACCTAGGTGACGTAACTCTTGTCTACCCTCTGTCCAACGGgtcattg +tgaaatatctctgcactgatcacccaggtgattcAACTCTTGACTAGGATCTGCCTACAG +AGgttattgtgaaatatctctgcactgataaACTAGGTGGTGTAAGCCTTGTCcaagctc +tgcctacaggggcgttTGCACATATCCCTGAACTGATGACAGAGGTGATGTTACACTTGC +CTAGGCTTTGCCTACAGGGGACATTGGACATATATCTGCAGTGATCTCCCAGGTGATGCA +ACTCTGGCCTAGGCTTTGACtacaggggacattgtgacatatctcttcAATGATCACCCA +TGTGATGCAACTCTTGCCTAGGCTTTGCCTAaaggggacattgtgacatatctctgcact +gatctccCAGGTGCTGTAACTTTAGTCTAGGCTCTGGCTACacggcattgtgacatatca +ctgcactgatcaaccaggtgatataactcttgtataggctc +>NC_060946.1 Homo sapiens isolate CHM13 chromosome 22, alternate assembly T2T-CHM13v2.0 +tgacatatctctgcacggatcacccaggtgatataGCTCTTCTCTAGGATCTGCCTACAG +GAtgctttgtgacatatccctgcactgatcacccaggtgatctAACTCTGGTCTAAGCTC +TTCCTAAAGGGGCATTGTGACagatctctgcactgatcactcagGTGATGTAACTGTTGT +CTAGGCTCTGCTTCAAGGGGCCTTGTCAcaaatctctgcactgatcacccaggtgatgta +actcttgtctaggctctgcttcCAGGGCATATTGTGACATACCTATGCACTGATCACCCT +AGTGATGCAACACTTGTGTAGGCTCGGCCTACAGGGGAATcttgacatatctctgcactg +ttAACCGAGGTGATTTAACTCTTCTCTAGGCTGTGCCCACAGGGGGATtgagacatatct +ctgcactgatcccGAGGTGATCAAACTCTTGCCTGGTCTCTGCCTActggggacattgtg +acatatctctgcactgatctccCTTGTGCTGCAACTTTAGTCTAGGCTCTGGCTACacga +cattgtgacatatcagtGCACTGATCACATAGGTGatataactcttgtctaggctctgcc +tacaatggtcttgtgacatatctctgcactgatcacccaggtgatataaCTATTCTCTAG +GATCTGACCACAGGGtgctttgtgacatatccctgcaatgatcacccaggtgatatacCA +CTAGCcaaggctctgcctacaggggcattgcAATGTATCTCAGCACTGATCACATAGGTC +TTGTAACTCTTTTCTAGGATCTGCCTACAGGGTGCTTTGTGACATATCCCAGCAAGGATT +ACCCAGGTGATGTACCGCTCAtcaaggctctgcctacaggCACATTGCGatgtatctctg +cactgatcacctaggtcaTGTAACTTTGTCTAGTCTCTGCCTACGatggcattgtgacat +atttctgaaCTAATCATCCaagtgatgtaactcttgtctaggatcTGCCTACATTAACTT +TGTGACATAATCCTGTACTGATCATCCAGGTGATGGGGtttttgtctaggctctgcctaa +gggggcattgtgacatatttctgcatTGATCACCCAGGTGGCGAACTCTTCTCTTggatc +tgcctatgggggcattgtgacaaatctctgcactgatcacccaggtgtcATAACTGTTGT +GTAACCTCTGCCTACAGGGGAATTGTGACAGATCTCGCCACTGATCACCCAAGTGATGTA +ACCATTGTCTAGGCTTTGCGTAcagggggctttgtgacatacctttgcactgatcaccca +ggtgatgtaacacaTCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactgat +cacttaGGTGATGTAACACTTTTATAAGCACTGCCTACAGGGAATTTTGACAAATCTGTA +cactgatcacctaggtgatgtaactcttgtctaccCTCTGTCCAACggggcattgtgaaa +tatctctgcactgatgaCCCAGGTGATTCAACTCTTGACTAGGATCTGCCTACAGAGGTT +actgtgaaatatctctgcactgataaACTAGGTGGTGTAACCCTTGTCCAAGTTCTGCCT +ACAGGGGCGTTTTCACATATCCCTGAACTGATGACAAAGGTGATGTAGCTCTTGCCTAGG +CTTTGCCTACAGGGGACATTGGACATATATCTACACTGATCAaccaggtgatgcaactct +tgcCTAGGCGTTGCCtacaggggacattgtgacatatgtCTTCAATGATCACCCATGTGA +TGCAACTCTTGCCTAGGCTTTGCCtacaggggacattgtgacatatctctgcactgattt +CCCAGGTTCTGTAACTTTAGGCTAGGCTCTGGCTACacggcattgtgacatatcactgca +ctgatcaACCAGGTGATATAACCCCTGtataggctctgcctacagggggcttgtgacata +tctctgcacggatcacccaggtgatataGCTCTTCTCTAGGATCTGCCTACAGGAtgctt +tgtgacatatccctgaactgatcacccaggtgatctAACTCTGGTCTAAGCTCTTCCTAA +AGGGGCATTGTGACagatctctgcactgatcactcagGTGATGTAACTGTTGTCTAGGCT +CTGCTTCAAGGGGCCTTGTCAcaaatctctgcactgatcacccaggtgatgtaactcttg +tctaggctctgcttcCAGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGATG +TAACACTTGTGTAGGCTCGGCCTACAGGGGAattttgacatatctctgcactgttAACCG +AGGTGATTTAACTCTTCTCTAGGCTGTTCCCACAGGGGGATtgagacatatctctgcact +gatcccGAGGTGATCCAACTCTTGCCTGGTCTCTGCCTActggggacattgtgacatatc +tctgcactgatctccCTTGTGCTGCAACTTTAGTCTAGGCTCTGGCTACACGATATTGTG +ACATATCAGTGCACTGATCACATAGGTGatataactcttgtctaggctctgcctacaatG +GTCTTGTGacgtatctctgcactgatcacccaggtgatataaCTATTCTCTAGGATCTGA +CCACAGGGtgctttgtgacatatccctgtaatgatcacccaggtgatatacCACTAGCca +aggctctgcctacaggggcattgcAATGTATCTCAGCACTGATCACCTAGGTCTTGTAAC +TCTTTTCTAGGATCTGCCTACAGGGTGCTTTGTGACATATCCCAGCAAGGATTACCCAGG +TGATGTACCGCTCAtcaaggctctgcctacaggCACATGGCGatgtatctctgcactgat +cacctaggtcaTGTAACTTTGTCTAGTCTCTGCCTACGatggcattgtgacatatttctg +cactAATCATCCaagtgatgtaactcttgtctaggatcTGCCTACATTAACTTTGTGACA +TAATCCTGTACTGATCATCCAGGTGATGGGGtttttgtctaggctctgcctaagggggca +ttgtgacatatttctgcatTGATCACCCAGGTGGCGAACTCTTCTCTTggatctgcctat +gggggcattgtgacaaatctctgcactgatcacccaggtgtcATAACTGTTGTGTAACCT +CTGCCTACAGGGGAATTGTGAGAGATCTCGCCACTGATCACCCAAGTGATGTAACCATTG +TCTAGGCTTTGCGTAcagggggctttgtgacatacctttgcactgatcacccaggtgatg +taacacaTCTAAGTTCGGCCTAAAggagctttgtgacatatctctgcactgatcacttaG +GTGATGTAACACTTTTATAAGCACTGCCTACAGGGAATTTTGACAAATCTGTAcactgat +cacctaggtgatgtaactcttgtgtACCCTCTGTCCAACggggcattgtgaaatatctct +gcactgatgaCCCAGGTGATTCAACCCTTGACTAGGATCTGCCTACAGAGgttattgtga +aatatctctgcactgataaACTAGGTGGTGTAACCCTTGTCCAAGTTCTGCCTACAGGGG +CGTTTTCACATATCCCTGAACTGATGACAAAGGTGATGTAGCTCTTGCCTAGGCTTTGCC +TACAGGGGACATTGGACATatatctgcactgatcacccatgTGATGCAACTCTTGCCTAG +GCTTTGCCTACAttggacattgtgacatatctctgcactgatttCCCAGGCTCTGTAACT +TTAGGCTAGGCTCTGGCTGCacggcattgtgacatatcactgcactgatcaACCAGGTGA +TATAACCCCTGTATAGGCTATGCCTACAGGGggcttgtgacatatctctgcacggatcac +ccaggtgatataGCTCTTCTCTAGGATCTGCCTGCATGATGCTTTGTGACATAACcttgc +actgatcacccaggtgatctAACTCTGGTCTAAGCTCTTCCTAAAGGGGCACTGTGACag +atctctgcactgatcactcagATGATGTAACTGTTGTCTAGGCTCTGCTTCAAGGGGCCT +TGTCAcaaatctctgcactgatcacccaggtgatgtaactcttgtctaggctctgcttcC +AGGGCATATTGTGACATATCTATGCACTGATCACCTTAGTGATGTAACACTTGTGTAGGC +TCGGCCTACAGGGGAATcttgacatatctctgcactgttAACCGAGGTGAtttaactctt +gtctaggctgtGCCCACAGGGGGATtgagacatatctctgcactgatcccGAGGTGATCC +AACTCTTGCCTGGTCTCTGCCTActggggacattgtgacatatctctgcactgatctccC +TTGTGCTGCAACTTTAGTCTAGGCTCTGGCTACacgacattgtgacatatcagtGCACTG +ATCACATAGGTGATATAACTcctgtctaggctctgcctacaatgctcttgtgacatatct +ctgcactgatcacccaggtgatataaCTATTCTCTAGGATCTGACCACAGGGtgctttgt +gacatatccctgcaatgatcacccaggtgatatacCACTAGCcaaggctctgcctacagg +ggcattgcAATGTATCTCAGCACTGATCACCTAGGTCTTGTAACTCTTTTCTAGGATCTG +CCTACAGGGTGCTTTGTGACATATCCCAGCAAGGATTACCCAGGTGATGTACCGCTCAtc +aaggctctgcctacaggCACATTGCGatgtatctctgcactgatcacctaggtcaTGTAA +CTTTGTCTAGTCTCTGCCTACGatggcattgtgacatatttctgcactAATCATCCAAGT +GATGTAACTCTTGCCTAGGATCTGCCTACATTAACTTTGTGACATAATCCTGTACTGATC +ATCCAGGTGATGGGGtttttgtctaggctctgcctaagggggcattgtgacatatttctg +catTGATCACCCAGGTGGCGATCTCTTCTCTTGGATCTGCCTAAGGGGCATTGTGAcaaa +tctctgcactgatcacccaggtgacgTAACTGTTGTGTAACCTCTGCCGACAGTGAAATT +GTGAGAGATCTCGCCACTGATCACCCAAGTGATGTAACCATTGTCTAGGCTTTGCGTACA +GGGAGCTTTGTTACATACctttgcactgatcacccaggtgatgtaacacaTGTATGTTCG +GCCTAAAggagctttgtgacatatctctgcactgatcacttaGGTGATGTAACACTATTA +TAACCACTGCCTACAGGGAATTTTGACAAATCTGTACACTGATCACCTAGGTGACGTAAC +ACTTGTCTACCCTCTGTCCAACGGgtcattgtgaaatatctctgcactgatcacccaggt +gattcAACTCTTGACTAGGATCTGCCTACAGAGgttattgtgaaatatctctgcactgat +aaACTAGGTGGTGTAACCCTTGTCgaagctctgcctacaggggcgttTTCACATATCCCT +GAACTGATGACAGAGGTGATGTAACACTTGCTTAGGCTTTGCCTACAGGGGACATTGGAC +ATATATCTCCACTGATCTCCCAGGTGTTGCAACTCTGCCCTAGGCTTTGCCTACAGGGGA +CATTTTGACATATCTCTTCAATGATCACCCATGTGATGCAACTCTTGCCTAGCCTTTGCC +TAaaggggacattgtgacatatctctgcactgatctccCAGGTGCTGTAACTTTAGTCTA +GGCTCTGGCTACacggcattgtgacatatcactgcactgatcaaccaggtgatataactc +ttgtataggctctgcctacagggggaTTGTGAAATATCTCAGCACTGAACACCCAGGTGA +TTCAACTCTTGACTAGGAACTGCCTACAGAGgttattgtgaaatatctctgtaCTGATAA +ACTAGGTGGTGTAACCCTTGTCcaagctctgcctacaggggcgttTCCACATATCCCTGA +ACTGATGACAAAGGTGATGTAACCCTTGCCTAGGCTTTGCCTACAGGGGCATTGGACATa +tatctgcactgatcacccaggtgatgcaactcttgcCTAGGCTTTGCCTACAGGGGACAC +TGTGACATATCTCTTCAATGATCACTCATGTGATGCATCTCTTGCCTAGGCTTTGCCAac +aggggacattgtgacatatctctgcactgatctccCTGGTACTGTAACTTTAGTCTAGGC +TCTGGCTACacggcattgtgacatatcactgcactgatcaaccaggtgatataactcttg +tataggctctgcctacagggggaTTGTGACCTACCTCTGCACTGATCTCCCAGGTGATAT +AACTCTTCTCTAGGATCTGCCTACAGGGTGCTCTGTGACATATccctgcactgatcaccc +aggtgaccTAACTCTGGTCTAAGCTCTGCCTAAAGGGGCATTGTGACagatctctgcact +gatcactcagGTGATGTAACTATTGTCTAGGCTCTGCTTAAAGGGGCCTTGTCacatatc +actgcactgatcacccaggtgatgtaactcttgtctaggctctgcttcCAGGGCATATTG +TGACATAACTATGCACTGATCACCTTAGTGATGTAACACTTGTGTAGGCTCGGCCTACAG +AGGAATcttgacatatctctgcactgttAAACGAGGTGAtttaactcttgtctaggctgt +GCCCACAGGGGGATtgagacatatctctgcactgatcccGAGGTGATCCAACTCTTGCCT +GGTCTCTGCCTActggggacattgtgacatatctctgcactgatctccCAGGTGCTGTAA +ATTTTGTCTAGGCTCTGGCTACACGGCATTGTGACTTATCACTGCACCGATCACCCAGGC +GATacaactcttgtctaggctctgcctacaatggtcttgtgacatatctctgcactgatc +acccaggtgatataaCTCTTCTCTAGGACCTGACCACGGGGtgctttgtgacatatccct +gcaatgatcacccaggtgatatacCACTTGCCAAGGCTCTGCTTACAGGGGCATTGCAAT +GTATCTCTGCATTGATCACCTAGGTCTTGTAGCTATTTTCTAGGATCTGCCTACAGGGTG +CTTTGTGACGGGTCCCAGGAAGGATTACCCAGGTGATGTACCTCTCAtcaaggctctgcc +tacaggCACATTGCgatatatctctgcactgatcacctaggtcaTGTAACTTTTGTCTAG +GCTCTACCTACGatggcattgtgacatatctctgcactaaTCATCCAATTGATGTAACAC +TTGTCTAGGATGTGCCTAAATTAACTTTTTGACATAACCCTGTACTGATCATCCAGGTGA +TGGGGCTTTTTTCTAGGCTCTGCCtaagggggcattgtgacatatttctgcatTGATCAC +CCAGGTGGCGAACTCTTCTCTCggatctgcctatgggggcattgtgagaaatctctgcac +tgatcacccaggtgatgtaactgttGTGTAACCTCTGCCTACAGGGGAATTGTGAGATAT +CTCGCCACTGATTACCCAAGTGATGTAACCATTGTCTAGGCTTTGCGTAcagggggcttt +gtgacatacctttgcactgatcacccaggtgatgtaacacaTCTAACTTCGGCCTAAAGG +AGCTTTGTGAcacatctctgcactgatcacttaGGTGATGTAACACTTTTATAATCACTG +CCTACAGGGAATTTTGAcaaatctctgcactgatcacctaggtgatgtaactcttgtcta +ccCTCTGTCCAACGGGGCATTGTGAAATATATCTGCACTGAACACCAAGTGATTCAACTC +TTGACTAGGAACTGCCTACAGAGgttattgtgaaatatctctgcactgataaACTAGGTG +GTGTAACCCTTGTCcaagctctgcctacaggggcgttTCCACATATCCCTGAACTGATGA +CAAAAGTGATGTAACTCTTGCCTAGGCTTTGCCTGCAGGGGACATTGGACATatatctgc +actgatcacccaggtgatgcaactcttgcCTAGGCTTTGCCTTCAGGGGACACTGTGACA +TATCTCTTCAATGATCACTCATGTGATGCATCTCTTGCCTAGGCTTTGCCAAccggggac +attgtgacatatctctgcactgatctccCTGGTACTGTAACTTTAGTCTAGGCTCTGGCT +ACacggcattgtgacatatcactgcactgatcaaccaggtgatataactcttgtataggc +tctgcctacagggggaTTGTGACCTacctctgcactgatcacccaggtgatataactctt +ctctaggatctgcctacagggtgctttgtgacatatcccttcactgatcacccaggtgac +cTAACTCTGGTCTAAGCTCTGCCTAAAGGGGCATTGTGACagatctctgcactgatcact +cagGTGATGTAACTATTGTCTAGGCTCTGCTTAAAGGGGCATTGTCACATATCCCTGcgc +tgatcacccaggtgatgtaactcttgtctaggatcTGCTTCCAGGGCATATTTTGACATA +ACTATGCACTGATCACCTTAGTGATGTAACACTTGTGTAGGCTCGGCCTGCAGAGGAATc +ttgacatatctctgcactgttAAACGAGGTGAtttaactcttgtctaggctgtGCCCACA +GGGGGATtgagacatatctctgcactgatcccGAGGTGATCCAACTCTTGCCTGGTCTCT +GCCTActggggacattgtgacatatctctgcactgatctaACAGTTTCTGTAAATTTTGT +CTAGGCTCTGGCTACAAGGCTTTGTGACctatcactgcactgatcacccaggcgATACAA +CTCTTGTCTACGCTCTGCCTACAATGgtcttgtgacatatctctgcactgatcacccagg +tgatataaCTCTTCTCTAGGATCTGACCACGGGGtgctttgtgacatatccctgcaatga +tcacccaggtgatatacCACTTGCcaaggctctgcctacaggggcattgcaatgtatctc +tgcactgatcacctaggtcTTGTAGCTATTTTCTAGGATCTGCCTACAGGGTGCTTTTTG +ACGGGTCCCAGCAAGGATTACCCAGGTGATGTACTTCTCAtcaaggctctgcctacaggC +ACATTGCgatatatctctgcactgatcacctaggtcaTGTAACTTTTGTCTAGGCTCTAC +CTACGATggtattgtgacatatctctgcactaaTCATCCAAgtgatgtaacacttgtcta +GGATGTGCCTAAATTAACTTTTTGACATAACCCTGTACTGATCATCCAGGTGATGGGGct +tttgtctaggctctgcctaagggggcattgtgacatatttctgcatTGATCACCCAGGTG +GCGAACTCTTCTCTCGTatctgcctatgggggcattgtgagaaatctctgcactgatcac +ccaggtgatgtaactgttGTGTAACCTCTGCCTACAGGGGAATTGTGAGAGATCTCGCCA +CTGATTACCCAAGTGATGCAACCATTGTCTAGGCTTTGCGTAcagggggctttgtgacat +acctttgcactgatcacccaggtgatgtaacacaTCTAAGTTCGGCCTAAAGGAGCTTTG +TGAcacatctctgcactgatcacttaGGTGATGTAACACTTTTATAATGACTGCCTACAG +GGAATTTTGAcaaatctctgcactgatcacctacgtgatgtaactcttgtctaccCTCTG +TCCAACggggcattgtgaaatatctctgcactgaacACACAAGTGATTCAACTCTTGACT +AGGAACTGCCTACAGAGgttattgtgaaatatctctgcactgataaACTAGGTTGTGTAA +CCCTTGTCcaagctctgcctacaggggcgttTCCACATATCCCTGAACTGATGAcaaagg +tgatgtaactcttgcctAGGCTTTGCCTACAGGGGACATTG +>NC_060947.1 Homo sapiens isolate CHM13 chromosome X, alternate assembly T2T-CHM13v2.0 +caccacattggccaggctggtcttgaactcctgacttcagatgatcctcctgcctcagcc +tcccagagtgttgggattacaggcgtgagccacggtgcccggccagaCGTCATGTCTTAG +GAAATCAGAAAGTGGGTAGTTTCCGCACTCTGAGGAGAAAAAGAGACGTCCGGCGAAGAG +AAAGGAGAGTGAAAGGATGTCTCCTCTTGTCTGTAGCCTGTTCTCAATCGTGAGTGAGCC +AATTGCCAGAAACTGAGGGTGCTTCATTTGGCCAGGCAAGCTTCTCAACAGAATGTCTAA +GTACTTGTTAATGCTGAGAAGCTCTccaagctactgcactccagcctgggtgacagagca +cgacctTGTCTGAAAacaattaattaatcaattaattaatataatgaaATCATACTGAAC +TCAGGAGACCATtggggtgggcagggctggggttgGAAAGGAACATAAAATATGGTGCAA +TGGACTTTGCTCCAGTCTCCCTCCCCATCTCTTCTCGCCAAGAGTCTCTGGAGGGAGCAT +GGGGAAGATGCTTTGGGAATCTGTAACTTCTTGTCTTGTAAACAGAATATCTAAGTAATT +GTTAATGCTGAGAAGTTATAGATTTCCAAAGCCTTTCTCCAGGCTACGGACAAGGGTCAT +GGGTTACTCAGTGTTACAGAAAGAATGACATGGAGATGTTTGTTACATCTTAAGGAACCA +TGAGGGGCCAGAGTATTTTACTCTAAGTGTAGATGGTACATTGGCCACGCCTGTCCCAAC +ACCACCAATGGTGGCACCTAACTTTTGTGTTTGTGCcccacatttcttcttcttttctga +cGTAAATGCAAGTGATATTCCTTGGAAACCATGCTGCAGCAAGAGGCCATCTGACTACTA +GTGATACCCTGTAGCTCACCTACAGCAGCTCACTTGAAGCAGCTCACCCATAGCTCAGGT +ATAGCTCACCTGCAGCGGCTCACCTGTAGCTCACGTGTAGCTCACTTGTAGCAGCTCACT +GGTAGCTCACCTGCAGCAGCTCACCTGTACCTCACCTGTACCTCACCTGCAGCAGCTCAC +CTGTAGCTCACCTGtacgtgagccaccgtacccggccagcaagaccccatttctaaaata +aatacacaaaaattagccggacgcggtggcgcgtgtctgtagttgtagctactcaggagg +ctgaggtgggaggattgctggaggctgggaggtagaggctgcagtgaaccgtgatccagc +cactgtactctagcctggatgacatagcaaaaccttgtctcaaaaaacaaaaacaaaaaa +caaaacaaagaaacaaacaaaaaacccacgcACAccggaaaacaaaacaaaaagcaaaaa +ggaaagaaaagagagccaggtcccaaatatatatttccttgGAGAACCATTTGCAAAGAG +CAcacttaaggccgggcgcggtggctcacgcctgtcatcccggcactttgggaggccgag +gtgggtggatcacgaggttgggagatcgagaccatcctggccaacatggtgaaaccccat +ctctactaaaaatacaaaaaatcagccaggtgctgtggcaggtgcctgtagtcccagcca +ctcaggaggctgaggcaggagaatggcatgaacctgggaggtggaggttgcagtgagccg +agatcgcgcccctgcactccagcctgggcgacagagcgagactccttctcaaataaataa +ataaataaataacaaagagcaAACTTAAAATTGTCTCAGAAATCCCACGGGATATTGGAT +CTCCCTCATGGCTATCTGATGACACTTTGAGTGTCTGGGACCCCGTGCCTATTTTCTGGG +GTTCCCAGAAGCTGCCGTTCTGAAAGTGTGGCTCTCGGGGACGTGGCACAGGTGTGGATG +TCTGTTTTAAATGTCAGGCGTTTGGACGTTGAGGAACGTGAGGCTGAAGGTCGCCTTCGC +CGACCCCCTGAGTTTAGGGTCCTGCCTTTTAAAATCTTCCCAGCACTCTGTTGTTCACGC +AAGCGTCCCATCTGTTTGGGTGGCCGTGCCGTCTGCATCTGTCTCGAACCTTCACAGCTT +TGCAGAATATCCTGTTTCTCAATACGGATGGAGAAACACGAGACGCGTTTTCTGGGTTAT +TTTAGCCGTCACGGAGAACCCCAGACTCATGTGTGCTAATGACCTCATTAATGATACTCT +GAGGCAGACAGCCCTGCCTGATCttaacaacattttttaaatttctttttttgttgttgt +tgttacagcaTCATTCATATAACGTAGGAAACCGTGATCAGTAGCTTTTAGGATATTTGC +AACAGGGTGTAACCATCTGTTAGACTCCAGAGCGTTTTTATCACGCTGAAAAGAAACCGC +AAGCCCATTCCGCCATCAGTCTCAGGTTTCTCCATTTAGCCTGGGCAACCATTAACCTGC +TTCCCATCTCTCTACACCTCTCCTACtctgaatatgtatatatacgtgtgtatatatatg +tgcatctatgtgtgtgtgtacatgtaaatatatgtgtgtatatgtgtatatatgtgggta +tatatagtgtgtatatatctgtatatacgtgtgtatacatatgtgaatctatgtgtgtgt +gtacatgtaaatatatgtgtatatgtgtgtatatatagtgtatatatgtgcatctatgtg +tgtgtgtacgtgtaaatatatgtgtatatgtatatatgtgtatatgtgtgtatatatagt +gtttatatgtgcatctatgtgtgtgtgtacgtgtaaatatatgtgtatatgtatatatgt +gtatatgtgtgtatatatagtgtgtatatatatgtgcatatatgtgtgtgtacatgtaaa +tatatgtgtatatatgtatatatgcatatatatagtgtatatatgtctgcttatatgtat +atatgtgtggacatatgtatatatttgtgtgtatgtgtatatagagtgtatatatgtgta +tatgtgtatatatgtgtatatatgtatatatatcagtgtatgtatgtgtgtatatatgta +tatatgtgtatatatgtatatatatcagtgtatgtatgtgtgtatatatgtatatatgtg +tatatatgtatatatatcagtgtatatatgtgtatatatgtatatatgtgtatatatgta +tatctctgtatatatgtatatctgtgtatatatgtgtgtatatatgtatatatagtgtat +atatgtgtgtatatatatgtacatatgtatatatatgcacatatgtatatatatgcactt +ttttttcccattcagccTATAAGTACGAGGCAGGCCATGTTcatttatattaagaaatat +gTAGACTGCCAAATGAGGCAATCATATTTCTGAAGCCAGCCAATGCAAACCCTCCTTCTT +TCAGAAGGGACGTCTCcccaggcaaaaagaaaaaaaaaaaaaagtcagcttcGCAAGATC +TCTTACCGTGAGCGGAAAATGCAGTTAAGTTAAGAGAGCCGGCCAGCCAGGCTCCCGATG +GCGGTGTGACGGGTGGCGTGGACGACGCTGGGAGAACCACGGGGAAGATGGGTGATACGA +TGCTCCTTCTAATTGACACCTCTAGGTCCAGGGCAAGTTAATGATGAGCTTGGACCGCGT +TGCCACCGGTTCGAATGGCCTTTGCCAGTTTTCTCTGCACGGAGCAGCGTTCGGCTTCAC +ATTTTTGCCTCTTAACTTCATCCACTTGGTCTGTTTCTGAAAAGCACCTTCTCCTCTGGC +ATGGAGCTTAGAATGTTGTGGCGGGTCATGGGGTCtgtcattttctcttattttaattat +tattcatttatttatttttgagacagtgtctcactctgtcacccaggctggagtgcagtg +gtgcaatctcagctcactgcaacctccacctcccgggttcaagcgattctcctgcctcag +cctcctgagtagctggtactacaggcatccgccaccacgcccggctaatttttgtatttt +tagtagagatggggtttcaccatgttagccagaaaggtctcgatctcttgacctcgtgat +ccacctgcctcggcctcccaaagtgctgggattacaggcacccgccaccgcacctggcta +atttttttttttgtatttttagtagagacggggtttcaccatgttggtcaggctggtctc +gaactcctgacctcaaataatcctcccaaagagctgggattacaggtgtgtcatttttaa +attttcatagagatggggtcctgtTATATTGCTGAGGCTGATCTGgatctcccagcctca +agcaattatcttgcctcagcctcccaaagtgctgggattacaagtgtgagccactgcgcc +tgggtcAGGCTCAcggagttttttatttttattttttttattttttttgagatggcgtct +cactctgtcgcccaggctggagtgcaatggcatgatcttggctcactgcaacctctgcct +cccaggctcaagtgattctcctgcctcagcctcccgagtagctgggattacaggcgcccg +tcacctgcctaattttttcctttgtttttgagaccaagtcttgctctgtcccccaggctg +gagtgcaatggatccatcttggctcactgcaacctgtgcctcctgggttcacgccattct +cctgcctcagcctcctgagtagctgggactacaggcgcccgccaccacgcccggctaatt +ttttgtatttttagtagagacggggtttcaccatgttagccaggatggtctcgatctcct +gaccttgtgatccgcctgcctcggcctcccaaagtgctgggattacaggtgtgaaccact +acacctggctaatttttgtatctttagtacagatggggtttcaccatgttggccaggctg +gtctcgaactcctgaccttgtgatccacccacctgagcctcccaaagtgctaggattaca +aatgtgagccactgcacccagcccaggctCATGGAGTTTTTAGTAAGAGCCCATGCTCAC +AGCCTGTCTTAAGGGAGACCTTCTCCAGATCCTGGGTGGTGCCGTTTCATGGACAACAAA +TTCATTCTCAAAAAGCGTAGCCCCAGTGGAAGACCTTGGGTCCTTCCACTCGGAGTGTGT +CAGTTCATCACCATAACCGTTTGTTGAGGTGTGTTCAAAACATCTATAGCCAAATTCCAC +AGGAGGAATGGGATGAGGACTCTAAGCTTCTGGACTTGATGTAGAAACcgggtctttgca +gatgtcttTAAGGGAAGGATCTGAAATGAGGTcatcctggattagggtgggtCTTAAATC +CAATAACAGGTGTCCTTGTAAGGGACAGAAGAGGACCATAAATCTAATGACTACGGTCCT +CCTAAGAGATGGAAGAGGAGACATAGACACaggcacagacacagaggagaaggccacgtg +gagacGGAGGCAGCGACTGGAGTGAtccggccacaagcccagggacgcctggagccccca +ggagctgggagaggcaggaaggatcctcccctagagcctccagagggaactTCTTATGGT +TGAAGTGGATTGAACTATGGTACCCCCCAAAAATATGTTCATATTCTAACCCAAGAACCT +GTGAAAGGAGGTAGAGACTGGAGTGATggggccacaagcccagggatacCTGGAGCaccc +agaagctgggagaggcaggaaggatcctcccctagagcctccagaaggaactggATACAA +CTGAAGTGAAGTGAACCGTGGCCCCTCAAAAGACCTGTCCATGTATTGATCATCTGGAAT +CTGTGAATGGGACATTATTTGGAAATACGGtctctgcagatgtgattaagtggAAGATct +ggagatgagatcatcctagaTTAGGGTGGACCATAAATCTAATGAcaggtgtccttctaa +gagacagaagaggagacacagacacagaggaggaggccacgtggagacagaggcagagac +tggagtgatgcagccacaagcccagggatgcctggagcccccaggagctgggagaggcag +gaaggatcctcccttAGAGTCtccagagggagcacagccctgagACTCCTTGACCTCAGA +CTCCTGGTCTccaggactgggagaggcaggaaggaccctcccttagagcctctggaggga +gcatggccctgagACACGTTGACCTCAGACTCCTGGTCTccaggactgggagaggcagga +aggaccctcccttagagcctctggagggagcatggccctgagACACCTGGACCTCAGACT +TCTGGTCTCTatggctgggagaggcaggaagtcTCCTCCTcaagagcctctggagggagc +atggccctgagACTCCTTGACCTCAGACTCCTGGTCTCCAggcctgggagaggcaggaag +gaccctcccttagagcctctggagggaacATGGTCCTGAGACTCCTTGACCTCAGACTCT +TGGTCTCCAGGACTTGACGGGGATGAATTCCTGCGGCATGCATCGTCATTCCTGGTCCTT +TGTTACGGCTGACTCAGGAATCTAAGAAACTGACCTGCGGGGTTTTGCCCATCAGGATGG +TGGCTTCTCCGGCTGTGGATTTGTTGCTTTTCCATCTTCTCTGCGGCTGACACTCTTACG +GGGAGTAATGGTGCAGAGAATTTCGGTTGCCTCCCAGAGCTGCAGCCGGAAGACGCAAGG +ACCAACGAAAACATTTGCATCGTGGCTCTCTGTGAGGAAGAGTCCTGCTGTGAAAGCATT +TTTATTCCGAAAGAGGATCATCTTTGGGAGCAGAACCATGGAAAAGTCTCTTTCGGCAGC +CCACGGAATGATGGGCCGGCCACATTTTGGATACATCTCATGCTTCTTACTGTTTTCAAA +TGGTTTTGGCTTGAATGGAATTCcaagcccattttttttttcctctttcccaagTACTTT +TTGTTCTTGAGTCTTGCAATCCTATGAATTCCAAGGGAAGCTGAATGTCTATCTTTTTGA +TACGTGGACACTGTCATCCTGCAAACAAAACCGTAGACGTCTTTGGGGGGGTCGTGAACT +TGGCAGTGAAGTTCGAAGGTCTCCAGTGCTTCTCACATCCGAAGTCAGAGCCCACATTTC +TCCGTCAGTTTGTAACCCTGGCAAAAGAAGGTCTTCGGCTTGCTTGTTTTCCTGAAAAAC +AGGAAGTTTTATTTTGCCAAGAATGAATGGAATGGGAAGCCAAAGCGTTTGATATGCACA +AGGGAAAATGCAGGATTTTTTTGTGTGCAAAGTTTACGTGGGGCTACACACCCTATTTCC +TCTTTCCTCACAATGATGCCACGAAATTGATTTTATTCCCTGCGGCTACTACATTTACCG +TTCAAGTGCTGaattcctcccctcccctgccctccccactcccctcccctgacctccccc +ctcccctcccctgccctccccatcccctccccctccccctctactccccctcctcccatc +ccatctcctttccccctcccccatcccatccctcccgtcctcccctcccctcccctcttc +ccctcccctctccttcaccCCCTcacatcccctcccctcccctcctaccctcccctcctc +ccctctccttccccttcccccctcccctcctccccttccctctgttcctcccctcctccc +ctcccctcctcccctcccctcctcccctcccctctcctttcccactcccccctcccatcc +cctcctccactcccctcctcccctactctcctcccctcctcccgtcccctcctcccctcc +cctcttctcttcccctcccctcccctcctccctctcctcccctttccccctcccccttcc +catcccctcccatcctcccctccctcccatcttcccctcccctcccctcctctcttcccc +tcccctcccctcccccacttctcactctcctcccccctcccatcccctcccctcctcttc +tcttctcttcttttctcttcttttcttttttttcttcttcttttttttttttctaatggt +cttcctctgtcacccaggctggagtgcagtggtgcgatcttggctcactgcagcctccac +ctctctggctcaagagatccttccacctcatcctTCTGATtctgttacttatttttattt +ttttaattaattaattaatcttttttttgagatggagtctggctctgttgcccagtctgg +agtgcagtggcgctacctcggctcactgcaagctccacctcctgggttcacgccattctc +ctgcctcagcctcccgggtaactgggactacaggcacccgtcaccacacccgactaattt +ttgtatttttagtagagacgggatttcaccgtgttagccaggatgatctcggtctcctga +cctcatgatctgccctcctcagcctcccaaaatgctggtatgacaggcatgagccaccgc +gcccagcctaattaattttttacattttactttaacttctgagatacatgtgctaattaa +ttaattttttaaattttactttaaaaaagtcaTACTTTACTTAAGTAAAAGTAAGTAAAT +GTGTGTTAACTAAACacattctggggtacatgtgcacaaagcgcaggttagttacatatg +tatacatgtgccatggtggtttgctgctcctatcaacccattatctaagttttaagcccc +acatgcactaggtatttgtcctaatgctctccatcCTCTTGCCTTCTATCcccccacagg +ccctggtgtgtgatgttcccctccctgtgtccatgtgttctcactgttcaactcccactt +acgagtgagaacatgcagtgtttggttttctgaggATGCGGaaaaataggaaagctttta +ctctcgatggtgggaggtgaataagttcaaccattgtggaaggcagtgtgatgattcctt +gaggatctagaacaagaagtAACAttggacccagccatcccattactgggtatataccga +aaggattgtaaatcatgctgctataaagacacatgcacacgtatgtttattgaggcacta +ttcacaatagcaaagacttggaaccaacccaaatgtccatcaacaatagactggataaag +aaaatgtggcacacagacaccatggaatactatgcagccatgaaaaaggatgagttcatg +tcctttgcagggacatggatgaagctggaaaccatcattctcagcaaactcacacaggaa +cagaaaaccaaacgccacgtgttctcactcataagtgggagtcaaacaatgacaacacat +ggacacagggaggggaacatcacacactgggggcctgttggggggtgaggggctagggga +tggagggcattaggacaaatacctaatgtagatgatgggttgatgggtgcagcaaaccac +catgacacatgcatacctatgtaacaaacctgcacgttctgcacttgtaccccagaactt +aaagtaaaatttaaaaacaaacaaacaaacaaaaaaacaaaggccaggcctggtgactta +cacctataatcccagcactttgggaggccaaggttaggagtttgagaccagcctggacaa +catagcaaaagcctgtctctactaaaaatacaaaaaaaaattaacagggagtggtggtgg +gcacctgtaatcccagctacttgggaggctgaggcaggagaatcacttgaacccgggagg +ccgaggttgcggtgagccgagatcgtgccattgcactccaggctgggcgacagagtgaga +ctctgtctcaaaaaataaataaataaataaatgtaaaaaaataaaaataggtcgggcacg +gtggctcacgtctgtaatcccagcactttggaaggccgaggtgggtggatgacagggtca +agagattgagaccatcctggccaacatggcaaaatgccgtctctactaaaaaatacaaaa +attaggcgggcgtggtggcgggtgcctgtaatcccagctac +>NC_060948.1 Homo sapiens isolate NA24385 chromosome Y, alternate assembly T2T-CHM13v2.0 +GTACagccctagattttttttttttttaaccaaaaaggcTGAGTAATTTTGAAAAATCGA +AACATAACAGTGTGTCATCATTTCCTCCCAAGAAAAAGCTCACTCCACGTGAGTAGAAAG +ACATCTACCTGGTCCCTGTAGAATCTGAACGTTTCTCTTTAGAGACGGaatttcaatctt +gttgcccaggctggagtgcagtggcacaatctcggctcaccgcaacctccgcctcccggg +ttcaagccattctcctgcctcagcctcccgagtagctgggattacaggcacctgccacca +ggcctgggtaactttctggtatttttagtagagacagggtttcagcctcccgagtagctg +ggattacaggcacctgccaccaggcctgggtaactttctggtatttttagtagagacagg +gtttcagcctcccgagtagctgggattacaggcacctgccaccaggcctgggtaactttc +tggtatttttagtagagacagggtttcagcctcccgagtagctgggattacaggcacctg +ccaccaggcctgggtaactttctggtatttttagtagagacagggtttcggcctcccgag +tagctgggattacaggcacctgccaccaggcctgggtaactttctggtatttttagtaga +gacagggtttcggcctcccgagtagctgggattacaggcacctgccaccaggcctgggta +actttctggtatttttagtagagacagggtttcggcctcccgagtagctgggattacagg +cacctgccaccaggcctgggtaactttctggtatttttagtagagacagggtttcagcct +cccgagtagctgggattacaggcacctgccaccaggcctgggtaaCTTTCtggtagtttt +agtagagacagggtttcggcctcccgagtagctgggattacaggcacctgccaccaggcc +tgggtaactttctggtatttttagtagagacagggtttcggcctcccgagtagctgggat +tacaggcacctgccaccaggcctgggtaactttctggtatttttagtacagacagggttt +cggcctcctgagtagctgggattacaggcacctgccaccaggcctgggtaaCTTTCtggt +agttttagtagagacagggtttcagcctcccgagtagctgggattacaggcacctgccac +caggcctgggtaactttctggtatttttagtacagacagggtttcggcctcctgagtagc +tgggattacaggcacctgccaccaggcctgggtaaCTTTCtggtagttttagtagagaca +gggtttcagcctcccgagtagctgggattacaggcacctgccaccaggcctgggtaattt +ttttgcatttttggtggagacagttttttgccgtgttggcccggctggcctcaaactcct +gacctcaggttgaCCTGCCCGCTTTGtccctcgcaaagtgctgggattacaggcgtgagc +caccgcacctggcctgaatctGAACTTTTAAAAGGGAGTTACTGACTCTCAACTGTGCGG +GGACGGTTTCAGTTTGATTTAATATGGAAAGAGGGCCAAGTGTCATCCTCACAAATGGGT +CCCCGAAGCAGATCAAACGCAGAGAACTGTGAGGGTGGGACACGAGTGTCTGTGGACACT +GGCTGCCTTTGGCTTTTCTCCTGCGAGAGAAGTTGGGTGACTTTCTGTAGGTGGATGAGT +GATCCCTGAATGAGTGTGGGGTACGTGTATGCTAGCTGCTTCTTTCTCCCTGAAACTCTC +GGATGGAAGGAAGTAAGAAATTCAGCTTGGGCTGTGACCAGTTCTCACCACCAAcgccct +cttctctctcccttcccttctccttccttccttccttccttccttcctttctttttcttt +ctttctttctctctttctttcttttctttctttgtttctttctttttctttctttctgtt +tctttcctttttatctttctctctttttctttctcttttccttttttctttctttctttc +tttttctttctttcttcgatgaagtctcactctgtcacccaggctggagtgcagtggtgc +aatcccagctcactgcatcctctacctcctggcttcaagaaattctcctgcctcagcctc +ccaagtagctgggatgacaggcacccaccaccattcccggataatttttgtattttttag +tagagactgggtttcgccatgttggccaggctggtcttgaactcctgacctcacatgatc +cacccgcctcggcctcccagagtgctgggattacggggtgaggcaccgcgcccggcctcc +tctctctttttctgagatGTTTAGGAAGGACTGGGCTGATGGGGACCCTCTGTATGTGAT +GTGCGTGGGTTTGGTTTCCCGGAAGGCCCTCCAGAGACACGTTTGCGTGAACATTCAGCA +TGGAAACAACATACGTCTCTCCACAGGAGGTGAGAAATTGAATTTATGGGGTGGGTGTAC +GCTGGCGATTCTTGGTGCTTTTTGCTCAAAACAAGGTTCTTTTGAAAGTCACGTTCCTGC +TTTCCCTGTGGCTTCCCGGTGAGCTCGCTCGCAGAGCAAGGAATACCACCCAGAGAGCAA +CGTGGGCTGTGTTCCGTTGTAACGCCGTTGCAGAGAGAGGATTTGGTGTGTGAGATCCGT +ACCAGCTCCAGCACACTGATAGGAACACGTTGCTGGCCGAACTGAACGATGCTGGGTTGG +GTCCTGATTGATACGtattttcttccctcctctccccaaaaCTTGGCCAAATAGTCCGTG +GAGGGTTGTCAGTCGCCGCAGTTGAGCAAAAAACACTTCTTCCTTTGAGTGGCTGTTCTG +GTGAAATCTGTTTCTGACATAtccacttttctctctcttttctctctctctgactgcGAA +GCacccacagggagaaggaattgGATGTATCGGATGTTGCtattagattttctttctccG +TTCGAGTCTCTGACTGGTGCATACTTTGCAAAGGTGTGTTCCTGGCAATTGCCAAGAGTT +AGAAAAATGCACCTTCTCTGGTGGCCGTTGGGGTGTTGTTTCACAGGCAGTGGTGACAGG +GCCCCTTGGCTGTGGCTGTCTTCTCCAGCGCCGTGGATAAAGAGATGGGACAGATTCTGT +GCCTCTGTACGATTTAGAGCGTAACTGACCGCGTCCAACACCCGTTTTTCCACTTACAAA +GCTGGTGGTGCGACGGGCTTGGTGTCTCCCGTACGGGAAGGAGGCCTTTGGGCCGCTCCA +AAGACGCCCTGTCGTAGGAATGGCCTCTCCATCCCGCCAAAGTCCAGCCAGGCCCCCGAA +ATGGTCCCATTTCCTTGGAAGCCTGAGTTTCTGTTCTGGTCTTGCTGCTGTCCTTGGCCA +CGTCAGCACGTGGGAGCATCTGTGGATACCGCAGAGTCTGGGGACAGCTGGGCGTTTAAC +CGAAATGAAGCCGAGACGGGTTTCAGGTTTTGGTGCCAAGCTCTGGTCAGGATGAAAGGG +AAATACCAGAGTCCTGTGTCCTCACCTCTGGGTTTCATGCTGACCTTTCTAACATTTGTT +TTCCCCTAAGAACAAGCAGAAGCCTCCAGCTCCCTTTAGCTCCACAGTTTTCCCGGGGAC +ATAGCGAGGATGGCACACGGCAGCCACTCCCACGACACACATTTCGGAGGCACTTTGCTG +GAAGCCGCTTGTCTCCTCCAGCTTTGGGAGgtctggggaggagagaggctTTCGGTGGAC +AcgtttgacattaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaactggtgccTAATTT +ATTAAAGAGAATTAGCTTAGCGAGTATATGCTGATATTCTTCGACACACGTGGGTAAGTT +GATgccatttataaatgttttattgaaattTGATATTTAATGAGAAGCCGGTTAAGGAAT +GTAGACAATATCCCGTTTCAAAGCTATGAAATGTGCTATTTATTGAAAGGGGATGTGGCT +TCACGAGTTCAGCCCATTGTACGTGCAGGTCCCGTGGGAAGGAGGCAAAAGCCCCTGCTT +CTTACTTTGTGATGTATGTggatttgttatttattttttttttccttggtcgGACGTTCA +TAAATATGTACTATTTTAATTATGTCGAGTGTAAATTTGACATCGcgttgcatttatttt +tatatttctgaaaactgttgctttttctttttccctcccccaTTGACGACATAGCGGCCC +CCGCGTCCGGGTTACAAATACATCTACAGATATTTTCAGGGATTGCTTCAGATGAAAACA +AATCACACACCGTTTCCCAAACCAACAGTCTTCACATTTCTATCCCTCTGTTATTGTCGG +CAGGCGGTGAGgggtagaaaaaaaacaaacaaacaaacaaaaaaaaaaccaaaaaaaacc +accCTGAGTTTCTCTGGTGACGCCCTCATTCTCCTAACGTTCAATAATCTCAATGTTGAG +TTGCAGCAACAGACTGTATTTTTGTGACGCCCCGTAGTATGAATGtacatcttgtaaaac +tgagatataaataaacttataaatatttgtattcaagtgttaaaaaaaaaaaaattctca +acctCTCCCCTGAGGACAGgcttattggaaaaaaaaaaaaaaaaaaaaaatcctgagtcG +GCCGTGGCTGAACACAGAGTGTTGTTCTGCTCCGTGCATTTCCAGGGTGGGTACCCAGTG +TTGCCCCCCAGCCTTAGATCGGGAGGTACCATTGACTTTTGCTTGTATCCCATCCCCTTC +CTTTACTGAAACCTACCTCCCCGCTTCTCAGCCAACGTCCCCCCAGAAGGTGgcaaaaaa +aacagaggaaaaagccCTGATTTGAATCAAGTCAGAGCTGCTAATTCTCCactttcttta +attaattaatttatttttttttttgagactgagtctcgctctgtcgcccaggccggagga +gtgcaggggcgcgatctcggctcaccgcgacctccgcctcccgggttcaagcgactctcc +tgcctcagcctcccgagtagctgggatgacagtcacctgcaccaccgcgcccggctcatt +tttgtatttttagtagcaatggggtttcaccgtgttggtcaggctggtctcgaactcctg +acctcgtgatccacccgcgtctGGGCCCGGCCGGTGATGTGTgtgcttttaacttttatt +ttgttccaGTTTTCGACAGTGGCACGGATTTTCCAGCACGGTCTTGCAAGGATGATTGAG +TCATTTTTgagacaaaaaatataataataataaatggaaaaagaaatcgacttttaaaaa +tgacaaatttttttttttttttttgcatagatttttctctctttatgtaAAGGAAAGTTC +ATGATTGGATTTGGCCGGCCTGACTGCTTCCCGGCTGTGATAAAAAACACATGTGAGctg +ggagggaagtgggggagggaCACAGCTGCCCACACAGGGTTCCCACCGCGGTTACAGGGT +GGGCAGTGCTGGGGGAGCTTTCTCTGTGGGGGGCTCAGAGCCTGAGGACAGGTGAGCCTC +TCCGACACCTCCCCAGTTGCCTGGAGTCTAAACCGTCCGTTGTCTGTACCGTCCGTTCTT +CCTGCTGACTCCTGGTAGTTCCTGAAAGCTTCTCTTGGCCAGAGAAGGGGTTTCAGAGGC +CGTGTGTCCAGGCCATTCTGCAAAGTGCAACTTGAccgttcctttccttttctggcctGC +GTGGTCTGAAGCTCAGAGCCCTCTCTTCAcccagcctgtgtgtgtcttgcCGGACAGAAG +AAAAATGGTGCTTTTTGCGTGTTAGCAGAGGTGCTTTTCATGGCTGACCTCAACGCGTCC +ATCTCCAGCCTTGACCAAGCTGTTTTTTAGGGGCAAACGCAGGCAAGTTCTGAATGCACA +CAGTTATTTCATGGTTAAACTATTCagctttggccgggcgcagtgtggctctcacgcctg +tcatcccagcactttgggaggccgaggcgggtggatcacctgaggtcaggagttcgagac +cagcctggccaacacggtgaaactctatctctactaaaaatacaaaaattagccgggcgt +ggtggtgtgtatctgtaatcccagctactcaggaagctgaggcaggagaatcgcttggac +ccaggaggcggaggttgcactgagccgagatcgcgccattgcactccagcctgggcgaca +gagccagacgctgtctcaaaaaaatgaataataaaataaaataacaggaactaaataaaa +taaaacgttCAGCTTTGTTCTGCAAATCCACTCCTATTGTTTTACGTGGTTTGAGAGACT +CTGTCCCTTAGAAATAGATGTTTGTTGCCAATTGTAATGAATCTGTttcaaaaatgaaca +gaatattcAAATGGTTTGAGAGATCTTTTCCCTTAGAAATAGCTTGTTGCCAATCACAaa +gaatgtttttcaaaaatgaatggAATCTTCCTGGATATCGCTTCcagatcttcatttttt +ttgcataGTTCAACCTGAAAAGTAAGTGTCTCAGCCCtgaatttctttctgatttttcca +TGGGTTGTCTTGCAGACTTCTCTGGACTtgaccacatttaaaaaaaaaaaaattaacttt +ttcacACGGACACGGTTTCAATAGGAATGAGATCTTTGAGTTTTTATGTAACAGATTCTT +ACCATCAGTTCTCAGATTCCCAAATTACACACAAAAAGCCACGGACTTCGCCTCCTGCTA +ACATGTCCTTCtgtttctgaggcttctgttggTGTTAGACTTTCATGTTTAATAGCAGAC +AATGTagggatttaaagaaaaatgcagagaaagcAAAAACACTGACCAAACACACGGAGA +TAAGCTTTCTAAAGCCTTTGTTCTTGGAGTtgtcgttaaaaaaaaaaagttgttttaaac +tTTGCAAGCATGCCTATATTGAACTCATAAGCAAGAGAGCCAAGAAAAATAGTGTCGGTC +GTCTACTCTACACGTTTTCCCAAAACAGacgtattttaatttcttttgtttgaacTCACA +GATGCTGAgagttaaaagttaaatttttgtcATGAACAATAATGGccaaaaccacagtta +cttttgcactatagcataataagaaaaatacaggctgggctcggtggctcacacctgtaa +tcaaagcactttTGGAGGCGAAACAgccagatcccttgagcccaggagattgagaccagc +ctgggcaacatagcgagaccctcatctctacaaaaaaggtttgttacatatgtaacaaac +ctgcacattgtgcacatgtaccctaaaacttaaagtataataataaaaaaattaaaaaaa +aattcaccaatcAACTGCCTGCTggtgccttcaagagactcacctaacacataaggactt +gCATAAACTTATAAAACAATTCAATGGAAGAATCCTTGAAAGTATTCTGAGAAGACAGTA +TAATAAACTGATTTCTAAAAAGGctataaaaaattgaataaatcatTGTTGGGCATCCTG +TGCTGAAATATAATGCAgccaataaaaattacaaaatgaataaacattttataacaatta +aaaaaagtcaaataattaggcaggcatggtggtgctctcCTACGGTTGAAGCTATTCAGC +AGGCAAGAggatactttgtttttgttttttaattttttttgagacagagtctcgctctgt +tgccaggctggagtgcagtggcgtgatctcagctcactgtaatttctgcctcccgggttc +aagcgattttcctgccccagcctcccgagtagctgggattacaggtgcccgccaccacac +ctggctaatttcttttgtatttttagtagagacgaggtttccccatgttggccaggctgg +ttttgagctcccgacctcgggtgatccacccgcctcagcctcccaaagtgctgggatgac +aggcgtgagccaccgcgcctggcccaggaggattatttgatcccaggaggtggaggctgc +aggaagccatgattgcaccactgcactccagcctggctgacagagtgagaccacatctct +aaataaatgaataaatacaggcagaaactttttttgttttgttttgatggagtcttgctc +tgtcaccaggcaggagtgcagtggtgccatctcagctcactgcaacctccacctcctggg +ttcaagcaatcctcctgcctcagcctcccgagtagctgggattacaggtgcccgccacca +cgcccggctaattttttgtatgtttagtagagacgggatttcaccgtgttagccaggatg +gtcttgatctcttgactttgtgatctgcctgcctcagcctcccaaagtgctgggattaca +ggcatgagcccaggagttcaagaccagcctcagcaacaaagtgagaccttttctctccaa +aaaatcaaaaatttagccagctgtggtggctcctgcccgtgatcccagtactgtgggagg +ctgaggcagaattgcttgagcccaggagttcgagaccaacctcaGCAAAAaggactctct +ctctgtctctctctctctctctctctctctctctctctctctctctatatatatatatat +atatatatatatatgagtttcaAAAATTGCTGGGTGACCAGCTTATCTACTGGTTTTCCC +CTTGGGAAAGTGAAATTGTCATGTATTGAAGATTTCCAAGGAAGTTGTATTGAATGAGAA +ACAAACTCAATCTGTTCGTGTTTAAAGAGCTGCAGTGCGTTTGCTGTGTTTCCCATAAAA +CTGCACTTCCAAAAGACACGCTGAGAAAGGAGACCAGGATTTGTAATTCAGAAATTGGAA +AGCAAGTTAGGCTGgacgtggtagctcatgcttgttgtaatctcagcactctgggaggct +gaggcaggaggatcacttgagcccaggagttcaagaccagcccgtgccacatggtgaaac +cctgtctctccaaaaaataaaacatttagccagatgtggtgactcatgcctgtaatcccg +gtattctgggaggctgaggcagagttgcttgagcccaggagttcaagaccagcctcggca +acaaagtgagaccctgtctctccaaaaaataaaacatttagccagctgtggtgactcatg +cctgtaatctcagtactctgggaggctggggcagaatggcttgagcccaggagttcgaga +ccaacctcagcaacaaagtgagatcttgtttctccaaaaaatcaaaaatttagccagctg +tgctggctcatgcctgtaatcccggtactctgggaggctgaggcagaatcgtttgagccc +aggagttcgagaccaacctcagcaacaaagtgagatcttgtttctccaaaaaaatcaaaa +atttagccagctgtgctggctgatgcctgtaatcccggtactctgggaggctgaggcgga +attgcttgagctcaggagttcaagaccagcctcagcaacaaagtgagatcttgtttctcc +aaaaaataaaatatttagccagctgtggtggctcaagcgtgtgatcctagcattttggga +ggccgaggcgggcggatcacgaggtcatgagatcgagaccatcctggctaacacggtgaa +accccgtctctactaaaaatacaaagaaaattagccgggcgtggtggcgggcgcctgcag +tcccagctactcgggaggctgaggcaggagaatgccgtgagcctgggaggcggaccttgc +agtgagtcaagatcgcgccactgacctccagcctgggccacagagcgagactccgtctca +aaaaaaaaaaaaattgctgcccaacctgtgtttgcaccactgccctccagcctgggcaac +agagcaagactccgtctcaaaaaaaaaaaaaaaaaaagctgcccaagctgtgtttgcacc +actgccctccagcctgggcaacagagcaagactccgtctca diff --git a/conf/modules.config b/conf/modules.config index 26f5151..f1f3d52 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -40,7 +40,7 @@ process { ext.args = { params.fastq_output ? "--fastq-output" : ""} ext.prefix = { "${meta.id}_${taxid.toString().replaceAll(' ', '-')}" } publishDir = [ - path: { "${params.outdir}/reads/kraken2" }, + path: { "${params.outdir}/extracted_reads/kraken2" }, mode: params.publish_dir_mode, pattern: '*.{fastq,fasta}' ] @@ -49,7 +49,7 @@ process { withName: EXTRACTCENTRIFUGEREADS { ext.prefix = { "${meta.id}" } publishDir = [ - path: { "${params.outdir}/reads/centrifuge" }, + path: { "${params.outdir}/extracted_reads/centrifuge" }, mode: params.publish_dir_mode, pattern: '*.fastq' ] @@ -57,7 +57,7 @@ process { withName: EXTRACTCDIAMONDREADS { ext.prefix = { "${meta.id}" } publishDir = [ - path: { "${params.outdir}/reads/diamond" }, + path: { "${params.outdir}/extracted_reads/diamond" }, mode: params.publish_dir_mode, pattern: '*.fastq' ] @@ -69,6 +69,29 @@ process { mode: params.publish_dir_mode, saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] - + } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { + publishDir = [ + path: { "$params.outdir/pathogens/bowtie2/align" }, + mode: params.publish_dir_mode, + saveAs: { filename -> filename.equals('versions.yml') ? null : filename } + ] + } + withName: 'SAMTOOLS_SORT' { + ext.prefix = { "${meta.id}_aligned_pathogens_genome_sorted"} + } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { + publishDir = [ enabled: false ] + } + withName: 'BOWTIE2_BUILD_PATHOGEN' { + ext.args = '--large-index' + publishDir = [ + path: { "$params.outdir/pathogens/bowtie2/build" }, + mode: params.publish_dir_mode + ] + } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BOWTIE2_ALIGN' { + ext.args = '--no-unal' + publishDir = [ enabled: false] } } diff --git a/conf/test.config b/conf/test.config index 0b6517e..71ce54e 100644 --- a/conf/test.config +++ b/conf/test.config @@ -21,6 +21,7 @@ params { // Input data input = 'assets/samplesheet_v1.csv' + pathogens_genome = 'assets/test_data/reference/reference.fna' // Extract reads extract_kraken2_reads = true diff --git a/conf/test_full.config b/conf/test_full.config index b0ad611..2c39976 100644 --- a/conf/test_full.config +++ b/conf/test_full.config @@ -15,9 +15,15 @@ params { config_profile_description = 'Full test dataset to check pipeline function' // Input data for full size test - // TODO nf-core: Specify the paths to your full test data ( on nf-core/test-datasets or directly in repositories, e.g. SRA) - // TODO nf-core: Give any required params for the test so that command line flags are not needed - input = params.pipelines_testdata_base_path + 'viralrecon/samplesheet/samplesheet_full_illumina_amplicon.csv' + input = '../final_test_data/samplesheet_v3.csv' + pathogens_genome = 'assets/test_data/reference/reference.fna' + + // Extract reads + extract_kraken2_reads = true + fastq_output = true + + extract_centrifuge_reads = true + extract_diamond_reads = true // Genome references genome = 'R64-1-1' diff --git a/conf/test_taxid.config b/conf/test_taxid.config index 51dce1f..a2ce629 100644 --- a/conf/test_taxid.config +++ b/conf/test_taxid.config @@ -11,7 +11,7 @@ */ params { - config_profile_name = 'Test profile' + config_profile_name = 'Test user defined taxid profile' config_profile_description = 'Minimal test dataset to check pipeline function' // Limit resources so that this can run on GitHub Actions @@ -21,8 +21,8 @@ params { // Input data input = 'assets/samplesheet_v1.csv' - taxid = '211044 11676' //separated by space + pathogens_genome = 'assets/test_data/reference/reference.fna' // Extract reads extract_kraken2_reads = true diff --git a/modules.json b/modules.json index 93a1f1a..2992ed0 100644 --- a/modules.json +++ b/modules.json @@ -8,7 +8,7 @@ "bowtie2/align": { "branch": "master", "git_sha": "e4bad511789f16d0df39ee306b2cd50418365048", - "installed_by": ["modules"] + "installed_by": ["fastq_align_bowtie2", "modules"] }, "bowtie2/build": { "branch": "master", @@ -39,11 +39,51 @@ "branch": "master", "git_sha": "b7ebe95761cd389603f9cc0e0dc384c0f663815a", "installed_by": ["modules"] + }, + "samtools/flagstat": { + "branch": "master", + "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519", + "installed_by": ["bam_stats_samtools"] + }, + "samtools/idxstats": { + "branch": "master", + "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519", + "installed_by": ["bam_stats_samtools"] + }, + "samtools/index": { + "branch": "master", + "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519", + "installed_by": ["bam_sort_stats_samtools"] + }, + "samtools/sort": { + "branch": "master", + "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519", + "installed_by": ["bam_sort_stats_samtools"] + }, + "samtools/stats": { + "branch": "master", + "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519", + "installed_by": ["bam_stats_samtools"] } } }, "subworkflows": { "nf-core": { + "bam_sort_stats_samtools": { + "branch": "master", + "git_sha": "0eacd714effe5aac1c1de26593873960b3346cab", + "installed_by": ["fastq_align_bowtie2"] + }, + "bam_stats_samtools": { + "branch": "master", + "git_sha": "0eacd714effe5aac1c1de26593873960b3346cab", + "installed_by": ["bam_sort_stats_samtools"] + }, + "fastq_align_bowtie2": { + "branch": "master", + "git_sha": "0eacd714effe5aac1c1de26593873960b3346cab", + "installed_by": ["subworkflows"] + }, "utils_nextflow_pipeline": { "branch": "master", "git_sha": "5caf7640a9ef1d18d765d55339be751bb0969dfa", diff --git a/modules/local/extractcentrifugereads.nf b/modules/local/extractcentrifugereads.nf index efcd331..00aa204 100644 --- a/modules/local/extractcentrifugereads.nf +++ b/modules/local/extractcentrifugereads.nf @@ -17,6 +17,9 @@ process EXTRACTCENTRIFUGEREADS { tuple val(meta), path("*.fastq"), emit: extracted_centrifuge_reads path "versions.yml", emit: versions + when: + task.ext.when == null || task.ext.when + script: def args = task.ext.args ?: '' def prefix = task.ext.prefix ?: "${meta.id}" diff --git a/modules/local/extractdiamondreads.nf b/modules/local/extractdiamondreads.nf index 097ff14..9b8a222 100644 --- a/modules/local/extractdiamondreads.nf +++ b/modules/local/extractdiamondreads.nf @@ -17,6 +17,9 @@ process EXTRACTCDIAMONDREADS { tuple val(meta), path("*.fastq"), emit: extracted_diamond_reads path "versions.yml", emit: versions + when: + task.ext.when == null || task.ext.when + script: def args = task.ext.args ?: '' def prefix = task.ext.prefix ?: "${meta.id}" diff --git a/modules/nf-core/samtools/flagstat/environment.yml b/modules/nf-core/samtools/flagstat/environment.yml new file mode 100644 index 0000000..68b8155 --- /dev/null +++ b/modules/nf-core/samtools/flagstat/environment.yml @@ -0,0 +1,8 @@ +name: samtools_flagstat +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::samtools=1.20 + - bioconda::htslib=1.20 diff --git a/modules/nf-core/samtools/flagstat/main.nf b/modules/nf-core/samtools/flagstat/main.nf new file mode 100644 index 0000000..754d84b --- /dev/null +++ b/modules/nf-core/samtools/flagstat/main.nf @@ -0,0 +1,46 @@ +process SAMTOOLS_FLAGSTAT { + tag "$meta.id" + label 'process_single' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/samtools:1.20--h50ea8bc_0' : + 'biocontainers/samtools:1.20--h50ea8bc_0' }" + + input: + tuple val(meta), path(bam), path(bai) + + output: + tuple val(meta), path("*.flagstat"), emit: flagstat + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + def prefix = task.ext.prefix ?: "${meta.id}" + """ + samtools \\ + flagstat \\ + --threads ${task.cpus} \\ + $bam \\ + > ${prefix}.flagstat + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + def prefix = task.ext.prefix ?: "${meta.id}" + """ + touch ${prefix}.flagstat + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/samtools/flagstat/meta.yml b/modules/nf-core/samtools/flagstat/meta.yml new file mode 100644 index 0000000..9799135 --- /dev/null +++ b/modules/nf-core/samtools/flagstat/meta.yml @@ -0,0 +1,51 @@ +name: samtools_flagstat +description: Counts the number of alignments in a BAM/CRAM/SAM file for each FLAG type +keywords: + - stats + - mapping + - counts + - bam + - sam + - cram +tools: + - samtools: + description: | + SAMtools is a set of utilities for interacting with and post-processing + short DNA sequence read alignments in the SAM, BAM and CRAM formats, written by Heng Li. + These files are generated as output by short read aligners like BWA. + homepage: http://www.htslib.org/ + documentation: http://www.htslib.org/doc/samtools.html + doi: 10.1093/bioinformatics/btp352 + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: BAM/CRAM/SAM file + pattern: "*.{bam,cram,sam}" + - bai: + type: file + description: Index for BAM/CRAM/SAM file + pattern: "*.{bai,crai,sai}" +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - flagstat: + type: file + description: File containing samtools flagstat output + pattern: "*.{flagstat}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" +maintainers: + - "@drpatelh" diff --git a/modules/nf-core/samtools/flagstat/tests/main.nf.test b/modules/nf-core/samtools/flagstat/tests/main.nf.test new file mode 100644 index 0000000..24c3c04 --- /dev/null +++ b/modules/nf-core/samtools/flagstat/tests/main.nf.test @@ -0,0 +1,36 @@ +nextflow_process { + + name "Test Process SAMTOOLS_FLAGSTAT" + script "../main.nf" + process "SAMTOOLS_FLAGSTAT" + tag "modules" + tag "modules_nfcore" + tag "samtools" + tag "samtools/flagstat" + + test("BAM") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam.bai', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot(process.out.flagstat).match("flagstat") }, + { assert snapshot(process.out.versions).match("versions") } + ) + } + } +} diff --git a/modules/nf-core/samtools/flagstat/tests/main.nf.test.snap b/modules/nf-core/samtools/flagstat/tests/main.nf.test.snap new file mode 100644 index 0000000..e9f85ef --- /dev/null +++ b/modules/nf-core/samtools/flagstat/tests/main.nf.test.snap @@ -0,0 +1,32 @@ +{ + "flagstat": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,4f7ffd1e6a5e85524d443209ac97d783" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.04.3" + }, + "timestamp": "2024-02-12T18:31:37.783927" + }, + "versions": { + "content": [ + [ + "versions.yml:md5,f606681ef971cbb548a4d9e3fbabdbc2" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:41:52.516253882" + } +} \ No newline at end of file diff --git a/modules/nf-core/samtools/flagstat/tests/tags.yml b/modules/nf-core/samtools/flagstat/tests/tags.yml new file mode 100644 index 0000000..2d2b725 --- /dev/null +++ b/modules/nf-core/samtools/flagstat/tests/tags.yml @@ -0,0 +1,2 @@ +samtools/flagstat: + - modules/nf-core/samtools/flagstat/** diff --git a/modules/nf-core/samtools/idxstats/environment.yml b/modules/nf-core/samtools/idxstats/environment.yml new file mode 100644 index 0000000..eb6c880 --- /dev/null +++ b/modules/nf-core/samtools/idxstats/environment.yml @@ -0,0 +1,8 @@ +name: samtools_idxstats +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::samtools=1.20 + - bioconda::htslib=1.20 diff --git a/modules/nf-core/samtools/idxstats/main.nf b/modules/nf-core/samtools/idxstats/main.nf new file mode 100644 index 0000000..2ea2a5c --- /dev/null +++ b/modules/nf-core/samtools/idxstats/main.nf @@ -0,0 +1,48 @@ +process SAMTOOLS_IDXSTATS { + tag "$meta.id" + label 'process_single' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/samtools:1.20--h50ea8bc_0' : + 'biocontainers/samtools:1.20--h50ea8bc_0' }" + + input: + tuple val(meta), path(bam), path(bai) + + output: + tuple val(meta), path("*.idxstats"), emit: idxstats + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + def prefix = task.ext.prefix ?: "${meta.id}" + + """ + samtools \\ + idxstats \\ + --threads ${task.cpus-1} \\ + $bam \\ + > ${prefix}.idxstats + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + def prefix = task.ext.prefix ?: "${meta.id}" + + """ + touch ${prefix}.idxstats + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/samtools/idxstats/meta.yml b/modules/nf-core/samtools/idxstats/meta.yml new file mode 100644 index 0000000..344e92a --- /dev/null +++ b/modules/nf-core/samtools/idxstats/meta.yml @@ -0,0 +1,52 @@ +name: samtools_idxstats +description: Reports alignment summary statistics for a BAM/CRAM/SAM file +keywords: + - stats + - mapping + - counts + - chromosome + - bam + - sam + - cram +tools: + - samtools: + description: | + SAMtools is a set of utilities for interacting with and post-processing + short DNA sequence read alignments in the SAM, BAM and CRAM formats, written by Heng Li. + These files are generated as output by short read aligners like BWA. + homepage: http://www.htslib.org/ + documentation: http://www.htslib.org/doc/samtools.html + doi: 10.1093/bioinformatics/btp352 + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: BAM/CRAM/SAM file + pattern: "*.{bam,cram,sam}" + - bai: + type: file + description: Index for BAM/CRAM/SAM file + pattern: "*.{bai,crai,sai}" +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - idxstats: + type: file + description: File containing samtools idxstats output + pattern: "*.{idxstats}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" +maintainers: + - "@drpatelh" diff --git a/modules/nf-core/samtools/idxstats/tests/main.nf.test b/modules/nf-core/samtools/idxstats/tests/main.nf.test new file mode 100644 index 0000000..a2dcb27 --- /dev/null +++ b/modules/nf-core/samtools/idxstats/tests/main.nf.test @@ -0,0 +1,36 @@ +nextflow_process { + + name "Test Process SAMTOOLS_IDXSTATS" + script "../main.nf" + process "SAMTOOLS_IDXSTATS" + tag "modules" + tag "modules_nfcore" + tag "samtools" + tag "samtools/idxstats" + + test("bam") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam.bai', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot(process.out.idxstats).match("idxstats") }, + { assert snapshot(process.out.versions).match("versions") } + ) + } + } +} diff --git a/modules/nf-core/samtools/idxstats/tests/main.nf.test.snap b/modules/nf-core/samtools/idxstats/tests/main.nf.test.snap new file mode 100644 index 0000000..4eacdb9 --- /dev/null +++ b/modules/nf-core/samtools/idxstats/tests/main.nf.test.snap @@ -0,0 +1,32 @@ +{ + "versions": { + "content": [ + [ + "versions.yml:md5,7acbcb2a8ec6436ba7b2916d3ff13351" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:46:46.617989517" + }, + "idxstats": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,df60a8c8d6621100d05178c93fb053a2" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.04.3" + }, + "timestamp": "2024-02-12T18:36:41.561026" + } +} \ No newline at end of file diff --git a/modules/nf-core/samtools/idxstats/tests/tags.yml b/modules/nf-core/samtools/idxstats/tests/tags.yml new file mode 100644 index 0000000..d3057c6 --- /dev/null +++ b/modules/nf-core/samtools/idxstats/tests/tags.yml @@ -0,0 +1,2 @@ +samtools/idxstats: + - modules/nf-core/samtools/idxstats/** diff --git a/modules/nf-core/samtools/index/environment.yml b/modules/nf-core/samtools/index/environment.yml new file mode 100644 index 0000000..260d516 --- /dev/null +++ b/modules/nf-core/samtools/index/environment.yml @@ -0,0 +1,8 @@ +name: samtools_index +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::samtools=1.20 + - bioconda::htslib=1.20 diff --git a/modules/nf-core/samtools/index/main.nf b/modules/nf-core/samtools/index/main.nf new file mode 100644 index 0000000..b523c21 --- /dev/null +++ b/modules/nf-core/samtools/index/main.nf @@ -0,0 +1,48 @@ +process SAMTOOLS_INDEX { + tag "$meta.id" + label 'process_low' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/samtools:1.20--h50ea8bc_0' : + 'biocontainers/samtools:1.20--h50ea8bc_0' }" + + input: + tuple val(meta), path(input) + + output: + tuple val(meta), path("*.bai") , optional:true, emit: bai + tuple val(meta), path("*.csi") , optional:true, emit: csi + tuple val(meta), path("*.crai"), optional:true, emit: crai + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + """ + samtools \\ + index \\ + -@ ${task.cpus-1} \\ + $args \\ + $input + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + """ + touch ${input}.bai + touch ${input}.crai + touch ${input}.csi + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/samtools/index/meta.yml b/modules/nf-core/samtools/index/meta.yml new file mode 100644 index 0000000..01a4ee0 --- /dev/null +++ b/modules/nf-core/samtools/index/meta.yml @@ -0,0 +1,57 @@ +name: samtools_index +description: Index SAM/BAM/CRAM file +keywords: + - index + - bam + - sam + - cram +tools: + - samtools: + description: | + SAMtools is a set of utilities for interacting with and post-processing + short DNA sequence read alignments in the SAM, BAM and CRAM formats, written by Heng Li. + These files are generated as output by short read aligners like BWA. + homepage: http://www.htslib.org/ + documentation: http://www.htslib.org/doc/samtools.html + doi: 10.1093/bioinformatics/btp352 + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: BAM/CRAM/SAM file + pattern: "*.{bam,cram,sam}" +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bai: + type: file + description: BAM/CRAM/SAM index file + pattern: "*.{bai,crai,sai}" + - crai: + type: file + description: BAM/CRAM/SAM index file + pattern: "*.{bai,crai,sai}" + - csi: + type: file + description: CSI index file + pattern: "*.{csi}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" + - "@ewels" + - "@maxulysse" +maintainers: + - "@drpatelh" + - "@ewels" + - "@maxulysse" diff --git a/modules/nf-core/samtools/index/tests/csi.nextflow.config b/modules/nf-core/samtools/index/tests/csi.nextflow.config new file mode 100644 index 0000000..0ed260e --- /dev/null +++ b/modules/nf-core/samtools/index/tests/csi.nextflow.config @@ -0,0 +1,7 @@ +process { + + withName: SAMTOOLS_INDEX { + ext.args = '-c' + } + +} diff --git a/modules/nf-core/samtools/index/tests/main.nf.test b/modules/nf-core/samtools/index/tests/main.nf.test new file mode 100644 index 0000000..bb7756d --- /dev/null +++ b/modules/nf-core/samtools/index/tests/main.nf.test @@ -0,0 +1,87 @@ +nextflow_process { + + name "Test Process SAMTOOLS_INDEX" + script "../main.nf" + process "SAMTOOLS_INDEX" + tag "modules" + tag "modules_nfcore" + tag "samtools" + tag "samtools/index" + + test("bai") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot(process.out.bai).match("bai") }, + { assert snapshot(process.out.versions).match("bai_versions") } + ) + } + } + + test("crai") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.recalibrated.sorted.cram', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot(process.out.crai).match("crai") }, + { assert snapshot(process.out.versions).match("crai_versions") } + ) + } + } + + test("csi") { + + config "./csi.nextflow.config" + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert path(process.out.csi.get(0).get(1)).exists() }, + { assert snapshot(process.out.versions).match("csi_versions") } + ) + } + } +} diff --git a/modules/nf-core/samtools/index/tests/main.nf.test.snap b/modules/nf-core/samtools/index/tests/main.nf.test.snap new file mode 100644 index 0000000..52756e8 --- /dev/null +++ b/modules/nf-core/samtools/index/tests/main.nf.test.snap @@ -0,0 +1,74 @@ +{ + "crai_versions": { + "content": [ + [ + "versions.yml:md5,802c9776d9c5e95314e888cf18e96d77" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:42:04.203740976" + }, + "csi_versions": { + "content": [ + [ + "versions.yml:md5,802c9776d9c5e95314e888cf18e96d77" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:42:09.57475878" + }, + "crai": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.paired_end.recalibrated.sorted.cram.crai:md5,14bc3bd5c89cacc8f4541f9062429029" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.04.3" + }, + "timestamp": "2024-02-12T18:41:38.446424" + }, + "bai": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.paired_end.sorted.bam.bai:md5,704c10dd1326482448ca3073fdebc2f4" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.04.3" + }, + "timestamp": "2024-02-12T18:40:46.579747" + }, + "bai_versions": { + "content": [ + [ + "versions.yml:md5,802c9776d9c5e95314e888cf18e96d77" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:41:57.929287369" + } +} \ No newline at end of file diff --git a/modules/nf-core/samtools/index/tests/tags.yml b/modules/nf-core/samtools/index/tests/tags.yml new file mode 100644 index 0000000..e0f58a7 --- /dev/null +++ b/modules/nf-core/samtools/index/tests/tags.yml @@ -0,0 +1,2 @@ +samtools/index: + - modules/nf-core/samtools/index/** diff --git a/modules/nf-core/samtools/sort/environment.yml b/modules/nf-core/samtools/sort/environment.yml new file mode 100644 index 0000000..36a12ea --- /dev/null +++ b/modules/nf-core/samtools/sort/environment.yml @@ -0,0 +1,8 @@ +name: samtools_sort +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::samtools=1.20 + - bioconda::htslib=1.20 diff --git a/modules/nf-core/samtools/sort/main.nf b/modules/nf-core/samtools/sort/main.nf new file mode 100644 index 0000000..596c6f7 --- /dev/null +++ b/modules/nf-core/samtools/sort/main.nf @@ -0,0 +1,63 @@ +process SAMTOOLS_SORT { + tag "$meta.id" + label 'process_medium' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/samtools:1.20--h50ea8bc_0' : + 'biocontainers/samtools:1.20--h50ea8bc_0' }" + + input: + tuple val(meta) , path(bam) + tuple val(meta2), path(fasta) + + output: + tuple val(meta), path("*.bam"), emit: bam, optional: true + tuple val(meta), path("*.cram"), emit: cram, optional: true + tuple val(meta), path("*.crai"), emit: crai, optional: true + tuple val(meta), path("*.csi"), emit: csi, optional: true + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + def prefix = task.ext.prefix ?: "${meta.id}" + def extension = args.contains("--output-fmt sam") ? "sam" : + args.contains("--output-fmt cram") ? "cram" : + "bam" + def reference = fasta ? "--reference ${fasta}" : "" + if ("$bam" == "${prefix}.bam") error "Input and output names are the same, use \"task.ext.prefix\" to disambiguate!" + + """ + samtools cat \\ + --threads $task.cpus \\ + ${bam} \\ + | \\ + samtools sort \\ + $args \\ + -T ${prefix} \\ + --threads $task.cpus \\ + ${reference} \\ + -o ${prefix}.${extension} \\ + - + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + def prefix = task.ext.prefix ?: "${meta.id}" + """ + touch ${prefix}.bam + touch ${prefix}.bam.csi + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/samtools/sort/meta.yml b/modules/nf-core/samtools/sort/meta.yml new file mode 100644 index 0000000..341a7d0 --- /dev/null +++ b/modules/nf-core/samtools/sort/meta.yml @@ -0,0 +1,71 @@ +name: samtools_sort +description: Sort SAM/BAM/CRAM file +keywords: + - sort + - bam + - sam + - cram +tools: + - samtools: + description: | + SAMtools is a set of utilities for interacting with and post-processing + short DNA sequence read alignments in the SAM, BAM and CRAM formats, written by Heng Li. + These files are generated as output by short read aligners like BWA. + homepage: http://www.htslib.org/ + documentation: http://www.htslib.org/doc/samtools.html + doi: 10.1093/bioinformatics/btp352 + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: BAM/CRAM/SAM file(s) + pattern: "*.{bam,cram,sam}" + - meta2: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'genome' ] + - fasta: + type: file + description: Reference genome FASTA file + pattern: "*.{fa,fasta,fna}" + optional: true +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: Sorted BAM file + pattern: "*.{bam}" + - cram: + type: file + description: Sorted CRAM file + pattern: "*.{cram}" + - crai: + type: file + description: CRAM index file (optional) + pattern: "*.crai" + - csi: + type: file + description: BAM index file (optional) + pattern: "*.csi" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" + - "@ewels" + - "@matthdsm" +maintainers: + - "@drpatelh" + - "@ewels" + - "@matthdsm" diff --git a/modules/nf-core/samtools/sort/tests/main.nf.test b/modules/nf-core/samtools/sort/tests/main.nf.test new file mode 100644 index 0000000..fb38ed9 --- /dev/null +++ b/modules/nf-core/samtools/sort/tests/main.nf.test @@ -0,0 +1,104 @@ +nextflow_process { + + name "Test Process SAMTOOLS_SORT" + script "../main.nf" + process "SAMTOOLS_SORT" + tag "modules" + tag "modules_nfcore" + tag "samtools" + tag "samtools/sort" + + test("bam") { + + config "./nextflow.config" + + when { + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'fasta' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + process.out.bam, + process.out.csi.collect { it.collect { it instanceof Map ? it : file(it).name } } + ).match("test_bam") + } + ) + } + } + + test("cram") { + + config "./nextflow.config" + + when { + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.sorted.cram', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'fasta' ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot( + process.out.bam, + process.out.csi.collect { it.collect { it instanceof Map ? it : file(it).name } } + ).match("test_cram") + } + ) + } + } + + test("bam_stub") { + + config "./nextflow.config" + options "-stub" + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'fasta' ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll ( + { assert process.success }, + { assert snapshot(file(process.out.bam[0][1]).name).match("bam_stub_bam") }, + { assert snapshot(process.out.versions).match("bam_stub_versions") } + ) + } + } +} diff --git a/modules/nf-core/samtools/sort/tests/main.nf.test.snap b/modules/nf-core/samtools/sort/tests/main.nf.test.snap new file mode 100644 index 0000000..5a27de1 --- /dev/null +++ b/modules/nf-core/samtools/sort/tests/main.nf.test.snap @@ -0,0 +1,114 @@ +{ + "cram": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam:md5,21c992d59615936b99f2ad008aa54400" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T08:13:54.512837189" + }, + "bam_stub_bam": { + "content": [ + "test.sorted.bam" + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T07:29:00.761845507" + }, + "test_cram": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam:md5,22b2093be34a7637f5fbc84272b89d06" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam.csi" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T09:16:51.924951855" + }, + "test_bam": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam:md5,21c992d59615936b99f2ad008aa54400" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam.csi" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T08:28:12.15952312" + }, + "bam_stub_versions": { + "content": [ + [ + "versions.yml:md5,7a360de20e1d7a6f15a5e8fbe0a9c062" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T07:29:00.765038811" + }, + "bam": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam:md5,21c992d59615936b99f2ad008aa54400" + ] + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-05-31T08:13:48.538030517" + } +} \ No newline at end of file diff --git a/modules/nf-core/samtools/sort/tests/nextflow.config b/modules/nf-core/samtools/sort/tests/nextflow.config new file mode 100644 index 0000000..f642771 --- /dev/null +++ b/modules/nf-core/samtools/sort/tests/nextflow.config @@ -0,0 +1,8 @@ +process { + + withName: SAMTOOLS_SORT { + ext.prefix = { "${meta.id}.sorted" } + ext.args = "--write-index" + } + +} diff --git a/modules/nf-core/samtools/sort/tests/tags.yml b/modules/nf-core/samtools/sort/tests/tags.yml new file mode 100644 index 0000000..cd63ea2 --- /dev/null +++ b/modules/nf-core/samtools/sort/tests/tags.yml @@ -0,0 +1,3 @@ +samtools/sort: + - modules/nf-core/samtools/sort/** + - tests/modules/nf-core/samtools/sort/** diff --git a/modules/nf-core/samtools/stats/environment.yml b/modules/nf-core/samtools/stats/environment.yml new file mode 100644 index 0000000..1cc83bd --- /dev/null +++ b/modules/nf-core/samtools/stats/environment.yml @@ -0,0 +1,8 @@ +name: samtools_stats +channels: + - conda-forge + - bioconda + - defaults +dependencies: + - bioconda::samtools=1.20 + - bioconda::htslib=1.20 diff --git a/modules/nf-core/samtools/stats/main.nf b/modules/nf-core/samtools/stats/main.nf new file mode 100644 index 0000000..982bc28 --- /dev/null +++ b/modules/nf-core/samtools/stats/main.nf @@ -0,0 +1,49 @@ +process SAMTOOLS_STATS { + tag "$meta.id" + label 'process_single' + + conda "${moduleDir}/environment.yml" + container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ? + 'https://depot.galaxyproject.org/singularity/samtools:1.20--h50ea8bc_0' : + 'biocontainers/samtools:1.20--h50ea8bc_0' }" + + input: + tuple val(meta), path(input), path(input_index) + tuple val(meta2), path(fasta) + + output: + tuple val(meta), path("*.stats"), emit: stats + path "versions.yml" , emit: versions + + when: + task.ext.when == null || task.ext.when + + script: + def args = task.ext.args ?: '' + def prefix = task.ext.prefix ?: "${meta.id}" + def reference = fasta ? "--reference ${fasta}" : "" + """ + samtools \\ + stats \\ + --threads ${task.cpus} \\ + ${reference} \\ + ${input} \\ + > ${prefix}.stats + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ + + stub: + def prefix = task.ext.prefix ?: "${meta.id}" + """ + touch ${prefix}.stats + + cat <<-END_VERSIONS > versions.yml + "${task.process}": + samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//') + END_VERSIONS + """ +} diff --git a/modules/nf-core/samtools/stats/meta.yml b/modules/nf-core/samtools/stats/meta.yml new file mode 100644 index 0000000..735ff81 --- /dev/null +++ b/modules/nf-core/samtools/stats/meta.yml @@ -0,0 +1,63 @@ +name: samtools_stats +description: Produces comprehensive statistics from SAM/BAM/CRAM file +keywords: + - statistics + - counts + - bam + - sam + - cram +tools: + - samtools: + description: | + SAMtools is a set of utilities for interacting with and post-processing + short DNA sequence read alignments in the SAM, BAM and CRAM formats, written by Heng Li. + These files are generated as output by short read aligners like BWA. + homepage: http://www.htslib.org/ + documentation: http://www.htslib.org/doc/samtools.html + doi: 10.1093/bioinformatics/btp352 + licence: ["MIT"] +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - input: + type: file + description: BAM/CRAM file from alignment + pattern: "*.{bam,cram}" + - input_index: + type: file + description: BAI/CRAI file from alignment + pattern: "*.{bai,crai}" + - meta2: + type: map + description: | + Groovy Map containing reference information + e.g. [ id:'genome' ] + - fasta: + type: file + description: Reference file the CRAM was created with (optional) + pattern: "*.{fasta,fa}" +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - stats: + type: file + description: File containing samtools stats output + pattern: "*.{stats}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" + - "@FriederikeHanssen" + - "@ramprasadn" +maintainers: + - "@drpatelh" + - "@FriederikeHanssen" + - "@ramprasadn" diff --git a/modules/nf-core/samtools/stats/tests/main.nf.test b/modules/nf-core/samtools/stats/tests/main.nf.test new file mode 100644 index 0000000..e3d5cb1 --- /dev/null +++ b/modules/nf-core/samtools/stats/tests/main.nf.test @@ -0,0 +1,65 @@ +nextflow_process { + + name "Test Process SAMTOOLS_STATS" + script "../main.nf" + process "SAMTOOLS_STATS" + tag "modules" + tag "modules_nfcore" + tag "samtools" + tag "samtools/stats" + + test("bam") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam.bai', checkIfExists: true) + ]) + input[1] = [[],[]] + """ + } + } + + then { + assertAll( + {assert process.success}, + {assert snapshot(process.out).match()} + ) + } + } + + test("cram") { + + when { + params { + outdir = "$outputDir" + } + process { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.recalibrated.sorted.cram', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.recalibrated.sorted.cram.crai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + {assert process.success}, + {assert snapshot(process.out).match()} + ) + } + } +} diff --git a/modules/nf-core/samtools/stats/tests/main.nf.test.snap b/modules/nf-core/samtools/stats/tests/main.nf.test.snap new file mode 100644 index 0000000..2747fd6 --- /dev/null +++ b/modules/nf-core/samtools/stats/tests/main.nf.test.snap @@ -0,0 +1,72 @@ +{ + "cram": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,c9d39b38c22de2057fc2f89949090975" + ] + ], + "1": [ + "versions.yml:md5,b3b70b126f867fdbb7dcea5e36e49d4a" + ], + "stats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,c9d39b38c22de2057fc2f89949090975" + ] + ], + "versions": [ + "versions.yml:md5,b3b70b126f867fdbb7dcea5e36e49d4a" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:45:24.403941966" + }, + "bam": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d522a1fa016b259d6a55620ae53dcd63" + ] + ], + "1": [ + "versions.yml:md5,b3b70b126f867fdbb7dcea5e36e49d4a" + ], + "stats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d522a1fa016b259d6a55620ae53dcd63" + ] + ], + "versions": [ + "versions.yml:md5,b3b70b126f867fdbb7dcea5e36e49d4a" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "23.10.1" + }, + "timestamp": "2024-05-28T15:45:06.711251947" + } +} \ No newline at end of file diff --git a/modules/nf-core/samtools/stats/tests/tags.yml b/modules/nf-core/samtools/stats/tests/tags.yml new file mode 100644 index 0000000..7c28e30 --- /dev/null +++ b/modules/nf-core/samtools/stats/tests/tags.yml @@ -0,0 +1,2 @@ +samtools/stats: + - modules/nf-core/samtools/stats/** diff --git a/nextflow.config b/nextflow.config index d5df827..275f971 100644 --- a/nextflow.config +++ b/nextflow.config @@ -11,13 +11,12 @@ nextflow.enable.strict = true // Global default params, used in configs params { - // TODO nf-core: Specify your pipeline's command line flags // Input options input = null taxid = null - pipelines_testdata_base_path = "https://raw.githubusercontent.com/nf-core/test-datasets/createtaxdb" - viral_pathogen_genome = params.pipelines_testdata_base_path + "/data/fasta/haemophilus_influenzae.fna.gz" + // Pathogen screening + pathogens_genome = null // References genome = null @@ -42,7 +41,6 @@ params { hook_url = null help = false version = false - pipelines_testdata_base_path = 'https://raw.githubusercontent.com/nf-core/test-datasets/' // Config options config_profile_name = null @@ -193,6 +191,7 @@ profiles { } test { includeConfig 'conf/test.config' } test_full { includeConfig 'conf/test_full.config' } + test_taxid{ includeConfig 'conf/test_taxid.config' } } // Set default registry for Apptainer, Docker, Podman and Singularity independent of -profile diff --git a/nextflow_schema.json b/nextflow_schema.json index 9077ebf..8438de2 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -27,13 +27,32 @@ "type": "string", "description": "The taxonomy ID of the species identified in the classification results or a list of taxids separated by spaces." }, - "viral_pathogen_genome": { + "pathogens_genome": { "type": "string", "format": "file-path", "pattern": "^\\S+\\.fn?a(sta)?(\\.gz)?$", - "description": "Path to a concatenated genome file containing all RefSeq viral genomes from a list of viral pathogens.", - "fa_icon": "fas fa-file-csv", - "default": "https://raw.githubusercontent.com/nf-core/test-datasets/createtaxdb/data/fasta/haemophilus_influenzae.fna.gz" + "description": "Path to a concatenated genome file containing complete genomes from a list of viral pathogens.", + "fa_icon": "fas fa-file-csv" + }, + "extract_kraken2_reads": { + "type": "boolean", + "default": true, + "description": "Extract classified Kraken2 output by taxonomic ID." + }, + "extract_centrifuge_reads": { + "type": "boolean", + "default": true, + "description": "Extract classified centrifuge output by taxonomic ID." + }, + "extract_diamond_reads": { + "type": "boolean", + "default": true, + "description": "Extract classified diamond output by taxonomic ID." + }, + "fastq_output": { + "type": "boolean", + "description": "Turn on saving extracted kraken2 reads in fastq format.", + "default": true }, "outdir": { "type": "string", @@ -277,13 +296,6 @@ "description": "Validation of parameters in lenient more.", "hidden": true, "help_text": "Allows string values that are parseable as numbers or booleans. For further information see [JSONSchema docs](https://github.com/everit-org/json-schema#lenient-mode)." - }, - "pipelines_testdata_base_path": { - "type": "string", - "fa_icon": "far fa-check-circle", - "description": "Base URL or local path to location of pipeline test dataset files", - "default": "https://raw.githubusercontent.com/nf-core/test-datasets/", - "hidden": true } } } @@ -304,27 +316,5 @@ { "$ref": "#/definitions/generic_options" } - ], - "properties": { - "extract_kraken2_reads": { - "type": "boolean", - "default": true, - "description": "Extract classified Kraken2 output by taxonomic ID." - }, - "extract_centrifuge_reads": { - "type": "boolean", - "default": true, - "description": "Extract classified centrifuge output by taxonomic ID." - }, - "extract_diamond_reads": { - "type": "boolean", - "default": true, - "description": "Extract classified diamond output by taxonomic ID." - }, - "fastq_output": { - "type": "boolean", - "description": "Turn on saving extracted kraken2 reads in fastq format.", - "default": true - } - } + ] } diff --git a/subworkflows/nf-core/bam_sort_stats_samtools/main.nf b/subworkflows/nf-core/bam_sort_stats_samtools/main.nf new file mode 100644 index 0000000..b716375 --- /dev/null +++ b/subworkflows/nf-core/bam_sort_stats_samtools/main.nf @@ -0,0 +1,50 @@ +// +// Sort, index BAM file and run samtools stats, flagstat and idxstats +// + +include { SAMTOOLS_SORT } from '../../../modules/nf-core/samtools/sort/main' +include { SAMTOOLS_INDEX } from '../../../modules/nf-core/samtools/index/main' +include { BAM_STATS_SAMTOOLS } from '../bam_stats_samtools/main' + +workflow BAM_SORT_STATS_SAMTOOLS { + take: + ch_bam // channel: [ val(meta), [ bam ] ] + ch_fasta // channel: [ val(meta), path(fasta) ] + + main: + + ch_versions = Channel.empty() + + SAMTOOLS_SORT ( ch_bam, ch_fasta ) + ch_versions = ch_versions.mix(SAMTOOLS_SORT.out.versions.first()) + + SAMTOOLS_INDEX ( SAMTOOLS_SORT.out.bam ) + ch_versions = ch_versions.mix(SAMTOOLS_INDEX.out.versions.first()) + + SAMTOOLS_SORT.out.bam + .join(SAMTOOLS_INDEX.out.bai, by: [0], remainder: true) + .join(SAMTOOLS_INDEX.out.csi, by: [0], remainder: true) + .map { + meta, bam, bai, csi -> + if (bai) { + [ meta, bam, bai ] + } else { + [ meta, bam, csi ] + } + } + .set { ch_bam_bai } + + BAM_STATS_SAMTOOLS ( ch_bam_bai, ch_fasta ) + ch_versions = ch_versions.mix(BAM_STATS_SAMTOOLS.out.versions) + + emit: + bam = SAMTOOLS_SORT.out.bam // channel: [ val(meta), [ bam ] ] + bai = SAMTOOLS_INDEX.out.bai // channel: [ val(meta), [ bai ] ] + csi = SAMTOOLS_INDEX.out.csi // channel: [ val(meta), [ csi ] ] + + stats = BAM_STATS_SAMTOOLS.out.stats // channel: [ val(meta), [ stats ] ] + flagstat = BAM_STATS_SAMTOOLS.out.flagstat // channel: [ val(meta), [ flagstat ] ] + idxstats = BAM_STATS_SAMTOOLS.out.idxstats // channel: [ val(meta), [ idxstats ] ] + + versions = ch_versions // channel: [ versions.yml ] +} diff --git a/subworkflows/nf-core/bam_sort_stats_samtools/meta.yml b/subworkflows/nf-core/bam_sort_stats_samtools/meta.yml new file mode 100644 index 0000000..e01f9cc --- /dev/null +++ b/subworkflows/nf-core/bam_sort_stats_samtools/meta.yml @@ -0,0 +1,70 @@ +# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/subworkflows/yaml-schema.json +name: bam_sort_stats_samtools +description: Sort SAM/BAM/CRAM file +keywords: + - sort + - bam + - sam + - cram +components: + - samtools/sort + - samtools/index + - samtools/stats + - samtools/idxstats + - samtools/flagstat + - bam_stats_samtools +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: BAM/CRAM/SAM file + pattern: "*.{bam,cram,sam}" + - fasta: + type: file + description: Reference genome fasta file + pattern: "*.{fasta,fa}" +# TODO Update when we decide on a standard for subworkflow docs +output: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - bam: + type: file + description: Sorted BAM/CRAM/SAM file + pattern: "*.{bam,cram,sam}" + - bai: + type: file + description: BAM/CRAM/SAM index file + pattern: "*.{bai,crai,sai}" + - crai: + type: file + description: BAM/CRAM/SAM index file + pattern: "*.{bai,crai,sai}" + - stats: + type: file + description: File containing samtools stats output + pattern: "*.{stats}" + - flagstat: + type: file + description: File containing samtools flagstat output + pattern: "*.{flagstat}" + - idxstats: + type: file + description: File containing samtools idxstats output + pattern: "*.{idxstats}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" +authors: + - "@drpatelh" + - "@ewels" +maintainers: + - "@drpatelh" + - "@ewels" diff --git a/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test b/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test new file mode 100644 index 0000000..821a3cf --- /dev/null +++ b/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test @@ -0,0 +1,134 @@ +nextflow_workflow { + + name "Test Workflow BAM_SORT_STATS_SAMTOOLS" + script "../main.nf" + workflow "BAM_SORT_STATS_SAMTOOLS" + tag "subworkflows" + tag "subworkflows_nfcore" + tag "subworkflows/bam_sort_stats_samtools" + tag "bam_sort_stats_samtools" + tag "subworkflows/bam_stats_samtools" + tag "bam_stats_samtools" + tag "samtools" + tag "samtools/index" + tag "samtools/sort" + tag "samtools/stats" + tag "samtools/idxstats" + tag "samtools/flagstat" + + test("test_bam_sort_stats_samtools_single_end") { + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert workflow.out.bam.get(0).get(1) ==~ ".*.bam"}, + { assert workflow.out.bai.get(0).get(1) ==~ ".*.bai"}, + { assert snapshot( + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.stats, + workflow.out.versions).match() } + ) + } + } + + test("test_bam_sort_stats_samtools_paired_end") { + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert workflow.out.bam.get(0).get(1) ==~ ".*.bam"}, + { assert workflow.out.bai.get(0).get(1) ==~ ".*.bai"}, + { assert snapshot( + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.stats, + workflow.out.versions).match() } + ) + } + } + + test("test_bam_sort_stats_samtools_single_end - stub") { + + options "-stub" + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot(workflow.out).match() } + ) + } + } + + test("test_bam_sort_stats_samtools_paired_end - stub") { + + options "-stub" + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.bam', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot(workflow.out).match() } + ) + } + } +} diff --git a/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test.snap b/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test.snap new file mode 100644 index 0000000..044536f --- /dev/null +++ b/subworkflows/nf-core/bam_sort_stats_samtools/tests/main.nf.test.snap @@ -0,0 +1,354 @@ +{ + "test_bam_sort_stats_samtools_single_end": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,2191911d72575a2358b08b1df64ccb53" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,613e048487662c694aa4a2f73ca96a20" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d32de3b3716a11039cef2367c3c1a56e" + ] + ], + [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:20:38.911799" + }, + "test_bam_sort_stats_samtools_paired_end": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,4f7ffd1e6a5e85524d443209ac97d783" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,df60a8c8d6621100d05178c93fb053a2" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,cca83e4fc9406fc3875b5e60055d6574" + ] + ], + [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:20:51.171967" + }, + "test_bam_sort_stats_samtools_single_end - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.csi:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "4": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "5": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "6": [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ], + "bai": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "bam": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "csi": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.csi:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "flagstat": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "idxstats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "stats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:13:52.386146" + }, + "test_bam_sort_stats_samtools_paired_end - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.csi:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "4": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "5": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "6": [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ], + "bai": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.bai:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "bam": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "csi": [ + [ + { + "id": "test", + "single_end": false + }, + "test.bam.csi:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "flagstat": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "idxstats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "stats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,494b5530a1aa29fd5867cf655bebbfe1", + "versions.yml:md5,9fcb0cd845bfb1f89d83201bb20649b4", + "versions.yml:md5,bacc323ec4055d6f69f07a09089772d1", + "versions.yml:md5,ce946e97097c6a9ccf834a3f91f6da30", + "versions.yml:md5,d6c8dae685f1b7d050165fc15c7a20b5" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:14:06.231663" + } +} \ No newline at end of file diff --git a/subworkflows/nf-core/bam_sort_stats_samtools/tests/tags.yml b/subworkflows/nf-core/bam_sort_stats_samtools/tests/tags.yml new file mode 100644 index 0000000..30b69d6 --- /dev/null +++ b/subworkflows/nf-core/bam_sort_stats_samtools/tests/tags.yml @@ -0,0 +1,2 @@ +subworkflows/bam_sort_stats_samtools: + - subworkflows/nf-core/bam_sort_stats_samtools/** diff --git a/subworkflows/nf-core/bam_stats_samtools/main.nf b/subworkflows/nf-core/bam_stats_samtools/main.nf new file mode 100644 index 0000000..44d4c01 --- /dev/null +++ b/subworkflows/nf-core/bam_stats_samtools/main.nf @@ -0,0 +1,32 @@ +// +// Run SAMtools stats, flagstat and idxstats +// + +include { SAMTOOLS_STATS } from '../../../modules/nf-core/samtools/stats/main' +include { SAMTOOLS_IDXSTATS } from '../../../modules/nf-core/samtools/idxstats/main' +include { SAMTOOLS_FLAGSTAT } from '../../../modules/nf-core/samtools/flagstat/main' + +workflow BAM_STATS_SAMTOOLS { + take: + ch_bam_bai // channel: [ val(meta), path(bam), path(bai) ] + ch_fasta // channel: [ val(meta), path(fasta) ] + + main: + ch_versions = Channel.empty() + + SAMTOOLS_STATS ( ch_bam_bai, ch_fasta ) + ch_versions = ch_versions.mix(SAMTOOLS_STATS.out.versions) + + SAMTOOLS_FLAGSTAT ( ch_bam_bai ) + ch_versions = ch_versions.mix(SAMTOOLS_FLAGSTAT.out.versions) + + SAMTOOLS_IDXSTATS ( ch_bam_bai ) + ch_versions = ch_versions.mix(SAMTOOLS_IDXSTATS.out.versions) + + emit: + stats = SAMTOOLS_STATS.out.stats // channel: [ val(meta), path(stats) ] + flagstat = SAMTOOLS_FLAGSTAT.out.flagstat // channel: [ val(meta), path(flagstat) ] + idxstats = SAMTOOLS_IDXSTATS.out.idxstats // channel: [ val(meta), path(idxstats) ] + + versions = ch_versions // channel: [ path(versions.yml) ] +} diff --git a/subworkflows/nf-core/bam_stats_samtools/meta.yml b/subworkflows/nf-core/bam_stats_samtools/meta.yml new file mode 100644 index 0000000..809bf73 --- /dev/null +++ b/subworkflows/nf-core/bam_stats_samtools/meta.yml @@ -0,0 +1,43 @@ +# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/subworkflows/yaml-schema.json +name: bam_stats_samtools +description: Produces comprehensive statistics from SAM/BAM/CRAM file +keywords: + - statistics + - counts + - bam + - sam + - cram +components: + - samtools/stats + - samtools/idxstats + - samtools/flagstat +input: + - ch_bam_bai: + description: | + The input channel containing the BAM/CRAM and it's index + Structure: [ val(meta), path(bam), path(bai) ] + - ch_fasta: + description: | + Reference genome fasta file + Structure: [ path(fasta) ] +output: + - stats: + description: | + File containing samtools stats output + Structure: [ val(meta), path(stats) ] + - flagstat: + description: | + File containing samtools flagstat output + Structure: [ val(meta), path(flagstat) ] + - idxstats: + description: | + File containing samtools idxstats output + Structure: [ val(meta), path(idxstats)] + - versions: + description: | + Files containing software versions + Structure: [ path(versions.yml) ] +authors: + - "@drpatelh" +maintainers: + - "@drpatelh" diff --git a/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test b/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test new file mode 100644 index 0000000..76e7a40 --- /dev/null +++ b/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test @@ -0,0 +1,188 @@ +nextflow_workflow { + + name "Test Workflow BAM_STATS_SAMTOOLS" + script "../main.nf" + workflow "BAM_STATS_SAMTOOLS" + tag "subworkflows" + tag "subworkflows_nfcore" + tag "bam_stats_samtools" + tag "subworkflows/bam_stats_samtools" + tag "samtools" + tag "samtools/flagstat" + tag "samtools/idxstats" + tag "samtools/stats" + + test("test_bam_stats_samtools_single_end") { + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.sorted.bam.bai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.stats, + workflow.out.versions).match() } + ) + } + } + + test("test_bam_stats_samtools_paired_end") { + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam.bai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success }, + { assert snapshot( + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.stats, + workflow.out.versions).match() } + ) + } + } + + test("test_bam_stats_samtools_paired_end_cram") { + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.sorted.cram', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.sorted.cram.crai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.stats, + workflow.out.versions).match() } + ) + } + } + + test ("test_bam_stats_samtools_single_end - stub") { + + options "-stub" + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.single_end.sorted.bam.bai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot(workflow.out).match() } + ) + } + } + + test("test_bam_stats_samtools_paired_end - stub") { + + options "-stub" + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:true ], // meta map + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam.bai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/sarscov2/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success }, + { assert snapshot(workflow.out).match() } + ) + } + } + + test("test_bam_stats_samtools_paired_end_cram - stub") { + + options "-stub" + + when { + workflow { + """ + input[0] = Channel.of([ + [ id:'test', single_end:false ], // meta map + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.sorted.cram', checkIfExists: true), + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/illumina/cram/test.paired_end.sorted.cram.crai', checkIfExists: true) + ]) + input[1] = Channel.of([ + [ id:'genome' ], + file(params.modules_testdata_base_path + 'genomics/homo_sapiens/genome/genome.fasta', checkIfExists: true) + ]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot(workflow.out).match() } + ) + } + } +} diff --git a/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test.snap b/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test.snap new file mode 100644 index 0000000..a3ddcc5 --- /dev/null +++ b/subworkflows/nf-core/bam_stats_samtools/tests/main.nf.test.snap @@ -0,0 +1,350 @@ +{ + "test_bam_stats_samtools_paired_end - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ], + "flagstat": [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "idxstats": [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "stats": [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:20:06.699297" + }, + "test_bam_stats_samtools_single_end - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ], + "flagstat": [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "idxstats": [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "stats": [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:19:57.708621" + }, + "test_bam_stats_samtools_paired_end_cram - stub": { + "content": [ + { + "0": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "1": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "2": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "3": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ], + "flagstat": [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "idxstats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "stats": [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,d41d8cd98f00b204e9800998ecf8427e" + ] + ], + "versions": [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + } + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:20:17.051493" + }, + "test_bam_stats_samtools_single_end": { + "content": [ + [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,2191911d72575a2358b08b1df64ccb53" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,613e048487662c694aa4a2f73ca96a20" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,4a0c429c661d6aa0b60acb9309da642d" + ] + ], + [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:19:25.801394" + }, + "test_bam_stats_samtools_paired_end": { + "content": [ + [ + [ + { + "id": "test", + "single_end": true + }, + "test.flagstat:md5,4f7ffd1e6a5e85524d443209ac97d783" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.idxstats:md5,df60a8c8d6621100d05178c93fb053a2" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.stats:md5,7afd486ad6abb9a2a3dac90c99e1d87b" + ] + ], + [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:19:36.158768" + }, + "test_bam_stats_samtools_paired_end_cram": { + "content": [ + [ + [ + { + "id": "test", + "single_end": false + }, + "test.flagstat:md5,a53f3d26e2e9851f7d528442bbfe9781" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.idxstats:md5,e179601fa7b8ebce81ac3765206f6c15" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.stats:md5,16b59a1f2c99d9fe30f711adc3ebe32d" + ] + ], + [ + "versions.yml:md5,3c485730f712b115bcdc235e7294133b", + "versions.yml:md5,90f593a26a2d53e0f0345df7888f448e", + "versions.yml:md5,9ae003814e63a0907d52eec64d5d3ca3" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T12:19:46.625907" + } +} \ No newline at end of file diff --git a/subworkflows/nf-core/bam_stats_samtools/tests/tags.yml b/subworkflows/nf-core/bam_stats_samtools/tests/tags.yml new file mode 100644 index 0000000..ec2f2d6 --- /dev/null +++ b/subworkflows/nf-core/bam_stats_samtools/tests/tags.yml @@ -0,0 +1,2 @@ +subworkflows/bam_stats_samtools: + - subworkflows/nf-core/bam_stats_samtools/** diff --git a/subworkflows/nf-core/fastq_align_bowtie2/main.nf b/subworkflows/nf-core/fastq_align_bowtie2/main.nf new file mode 100644 index 0000000..cafaa9b --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/main.nf @@ -0,0 +1,45 @@ +// +// Alignment with Bowtie2 +// + +include { BOWTIE2_ALIGN } from '../../../modules/nf-core/bowtie2/align/main' +include { BAM_SORT_STATS_SAMTOOLS } from '../bam_sort_stats_samtools/main' + +workflow FASTQ_ALIGN_BOWTIE2 { + take: + ch_reads // channel: [ val(meta), [ reads ] ] + ch_index // channel: /path/to/bowtie2/index/ + save_unaligned // val + sort_bam // val + ch_fasta // channel: /path/to/reference.fasta + + main: + + ch_versions = Channel.empty() + + // + // Map reads with Bowtie2 + // + BOWTIE2_ALIGN ( ch_reads, ch_index, ch_fasta, save_unaligned, sort_bam ) + ch_versions = ch_versions.mix(BOWTIE2_ALIGN.out.versions) + + // + // Sort, index BAM file and run samtools stats, flagstat and idxstats + // + BAM_SORT_STATS_SAMTOOLS ( BOWTIE2_ALIGN.out.bam, ch_fasta ) + ch_versions = ch_versions.mix(BAM_SORT_STATS_SAMTOOLS.out.versions) + + emit: + bam_orig = BOWTIE2_ALIGN.out.bam // channel: [ val(meta), aligned ] + log_out = BOWTIE2_ALIGN.out.log // channel: [ val(meta), log ] + fastq = BOWTIE2_ALIGN.out.fastq // channel: [ val(meta), fastq ] + + bam = BAM_SORT_STATS_SAMTOOLS.out.bam // channel: [ val(meta), [ bam ] ] + bai = BAM_SORT_STATS_SAMTOOLS.out.bai // channel: [ val(meta), [ bai ] ] + csi = BAM_SORT_STATS_SAMTOOLS.out.csi // channel: [ val(meta), [ csi ] ] + stats = BAM_SORT_STATS_SAMTOOLS.out.stats // channel: [ val(meta), [ stats ] ] + flagstat = BAM_SORT_STATS_SAMTOOLS.out.flagstat // channel: [ val(meta), [ flagstat ] ] + idxstats = BAM_SORT_STATS_SAMTOOLS.out.idxstats // channel: [ val(meta), [ idxstats ] ] + + versions = ch_versions // channel: [ versions.yml ] +} diff --git a/subworkflows/nf-core/fastq_align_bowtie2/meta.yml b/subworkflows/nf-core/fastq_align_bowtie2/meta.yml new file mode 100644 index 0000000..b18e405 --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/meta.yml @@ -0,0 +1,67 @@ +# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/subworkflows/yaml-schema.json +name: fastq_align_bowtie2 +description: Align reads to a reference genome using bowtie2 then sort with samtools +keywords: + - align + - fasta + - genome + - reference +components: + - bowtie2/align + - samtools/sort + - samtools/index + - samtools/stats + - samtools/idxstats + - samtools/flagstat + - bam_sort_stats_samtools +input: + - meta: + type: map + description: | + Groovy Map containing sample information + e.g. [ id:'test', single_end:false ] + - ch_reads: + type: file + description: | + List of input FastQ files of size 1 and 2 for single-end and paired-end data, + respectively. + - ch_index: + type: file + description: Bowtie2 genome index files + pattern: "*.ebwt" + - save_unaligned: + type: boolean + description: | + Save reads that do not map to the reference (true) or discard them (false) + (default: false) + - sort_bam: + type: boolean + description: | + Use samtools sort (true) or samtools view (false) + default: false + - ch_fasta: + type: file + description: Reference fasta file + pattern: "*.{fasta,fa}" +# TODO Update when we decide on a standard for subworkflow docs +output: + - bam: + type: file + description: Output BAM file containing read alignments + pattern: "*.{bam}" + - versions: + type: file + description: File containing software versions + pattern: "versions.yml" + - fastq: + type: file + description: Unaligned FastQ files + pattern: "*.fastq.gz" + - log: + type: file + description: Alignment log + pattern: "*.log" +authors: + - "@drpatelh" +maintainers: + - "@drpatelh" diff --git a/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test b/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test new file mode 100644 index 0000000..2fabb42 --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test @@ -0,0 +1,189 @@ +nextflow_workflow { + + name "Test Subworkflow FASTQ_ALIGN_BOWTIE2" + script "../main.nf" + config "./nextflow.config" + workflow "FASTQ_ALIGN_BOWTIE2" + + tag "subworkflows" + tag "subworkflows_nfcore" + tag "subworkflows/fastq_align_bowtie2" + tag "subworkflows/bam_sort_stats_samtools" + tag "bowtie2" + tag "bowtie2/build" + tag "bowtie2/align" + + test("test_align_bowtie2_single_end") { + setup { + run("BOWTIE2_BUILD") { + script "../../../../modules/nf-core/bowtie2/build/main.nf" + process { + """ + input[0] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + } + when { + workflow { + """ + input[0] = Channel.of([[ id:'test', single_end:true ], [ file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) ]]) + input[1] = BOWTIE2_BUILD.out.index + input[2] = false + input[3] = false + input[4] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + file(workflow.out.bam_orig[0][1]).name, + workflow.out.fastq, + workflow.out.log_out, + file(workflow.out.bam[0][1]).name, + file(workflow.out.bai[0][1]).name, + workflow.out.csi, + workflow.out.stats, + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.versions + ).match()} + ) + } + } + + test("test_align_bowtie2_paired_end") { + setup { + run("BOWTIE2_BUILD") { + script "../../../../modules/nf-core/bowtie2/build/main.nf" + process { + """ + input[0] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + } + when { + workflow { + """ + input[0] = Channel.of([[ id:'test', single_end:false ], [file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true)]]) + input[1] = BOWTIE2_BUILD.out.index + input[2] = false + input[3] = false + input[4] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + file(workflow.out.bam_orig[0][1]).name, + workflow.out.fastq, + workflow.out.log_out, + file(workflow.out.bam[0][1]).name, + file(workflow.out.bai[0][1]).name, + workflow.out.csi, + workflow.out.stats, + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.versions + ).match()} + ) + } + } + + test("test_align_bowtie2_single_end - stub") { + + options "-stub" + + setup { + run("BOWTIE2_BUILD") { + script "../../../../modules/nf-core/bowtie2/build/main.nf" + process { + """ + input[0] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + } + when { + workflow { + """ + input[0] = Channel.of([[ id:'test', single_end:true ], [ file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true) ]]) + input[1] = BOWTIE2_BUILD.out.index + input[2] = false + input[3] = false + input[4] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + file(workflow.out.bam_orig[0][1]).name, + workflow.out.fastq, + workflow.out.log_out, + file(workflow.out.bam[0][1]).name, + file(workflow.out.bai[0][1]).name, + workflow.out.csi, + workflow.out.stats, + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.versions + ).match()} + ) + } + } + + test("test_align_bowtie2_paired_end - stub") { + + options "-stub" + + setup { + run("BOWTIE2_BUILD") { + script "../../../../modules/nf-core/bowtie2/build/main.nf" + process { + """ + input[0] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + } + when { + workflow { + """ + input[0] = Channel.of([[ id:'test', single_end:false ], [file(params.test_data['sarscov2']['illumina']['test_1_fastq_gz'], checkIfExists: true), file(params.test_data['sarscov2']['illumina']['test_2_fastq_gz'], checkIfExists: true)]]) + input[1] = BOWTIE2_BUILD.out.index + input[2] = false + input[3] = false + input[4] = Channel.value([ [ id:'genome' ],file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true)]) + """ + } + } + + then { + assertAll( + { assert workflow.success}, + { assert snapshot( + file(workflow.out.bam_orig[0][1]).name, + workflow.out.fastq, + workflow.out.log_out, + file(workflow.out.bam[0][1]).name, + file(workflow.out.bai[0][1]).name, + workflow.out.csi, + workflow.out.stats, + workflow.out.flagstat, + workflow.out.idxstats, + workflow.out.versions + ).match()} + ) + } + } +} diff --git a/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test.snap b/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test.snap new file mode 100644 index 0000000..c849096 --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/tests/main.nf.test.snap @@ -0,0 +1,126 @@ +{ + "test_align_bowtie2_single_end": { + "content": [ + "test.bam", + [ + + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.bowtie2.log:md5,7b8a9e61b7646da1089b041333c41a87" + ] + ], + "test.sorted.bam", + "test.sorted.bam.bai", + [ + + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.sorted.bam.stats:md5,d499a70739ffa0a96880eaad229dcf7c" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.sorted.bam.flagstat:md5,e9ce9093133116bc54fd335cfe698372" + ] + ], + [ + [ + { + "id": "test", + "single_end": true + }, + "test.sorted.bam.idxstats:md5,e16eb632f7f462514b0873c7ac8ac905" + ] + ], + [ + "versions.yml:md5,0b1901279f738fa8e22cabea6e2a48bd", + "versions.yml:md5,60be918ac1032f74137ad27024c002ef", + "versions.yml:md5,8644be336f2fd05a04b95050a4de9094", + "versions.yml:md5,aab337e63eac9055aadb9a35cec16053", + "versions.yml:md5,dd60999d74ea42ae4f5483c9d94507f3", + "versions.yml:md5,ddb252583f75777033ee6467e4b6d545" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T13:07:32.050239" + }, + "test_align_bowtie2_paired_end": { + "content": [ + "test.bam", + [ + + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.bowtie2.log:md5,bd89ce1b28c93bf822bae391ffcedd19" + ] + ], + "test.sorted.bam", + "test.sorted.bam.bai", + [ + + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam.stats:md5,c02dbd116c1f49339dda208cb950261d" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam.flagstat:md5,49f3d51a8804ce58fe9cecd2549d279b" + ] + ], + [ + [ + { + "id": "test", + "single_end": false + }, + "test.sorted.bam.idxstats:md5,29ff2fa56d35b2a47625b8f517f1a947" + ] + ], + [ + "versions.yml:md5,0b1901279f738fa8e22cabea6e2a48bd", + "versions.yml:md5,60be918ac1032f74137ad27024c002ef", + "versions.yml:md5,8644be336f2fd05a04b95050a4de9094", + "versions.yml:md5,aab337e63eac9055aadb9a35cec16053", + "versions.yml:md5,dd60999d74ea42ae4f5483c9d94507f3", + "versions.yml:md5,ddb252583f75777033ee6467e4b6d545" + ] + ], + "meta": { + "nf-test": "0.8.4", + "nextflow": "24.04.2" + }, + "timestamp": "2024-07-03T13:07:48.653475" + } +} \ No newline at end of file diff --git a/subworkflows/nf-core/fastq_align_bowtie2/tests/nextflow.config b/subworkflows/nf-core/fastq_align_bowtie2/tests/nextflow.config new file mode 100644 index 0000000..2f85e80 --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/tests/nextflow.config @@ -0,0 +1,8 @@ +process { + withName: '.*:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_.*' { + ext.prefix = { "${meta.id}.sorted" } + } + withName: '.*:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { + ext.prefix = { "${meta.id}.sorted.bam" } + } +} diff --git a/subworkflows/nf-core/fastq_align_bowtie2/tests/tags.yml b/subworkflows/nf-core/fastq_align_bowtie2/tests/tags.yml new file mode 100644 index 0000000..267bcc7 --- /dev/null +++ b/subworkflows/nf-core/fastq_align_bowtie2/tests/tags.yml @@ -0,0 +1,2 @@ +subworkflows/fastq_align_bowtie2: + - subworkflows/nf-core/fastq_align_bowtie2/** diff --git a/viralPathogenList.csv b/viral_pathogen_list.csv similarity index 100% rename from viralPathogenList.csv rename to viral_pathogen_list.csv diff --git a/workflows/metaval.nf b/workflows/metaval.nf index 4439e3f..407f646 100644 --- a/workflows/metaval.nf +++ b/workflows/metaval.nf @@ -4,17 +4,24 @@ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ */ -include { FASTQC } from '../modules/nf-core/fastqc/main' -include { MULTIQC } from '../modules/nf-core/multiqc/main' -include { paramsSummaryMap } from 'plugin/nf-validation' -include { paramsSummaryMultiqc } from '../subworkflows/nf-core/utils_nfcore_pipeline' -include { softwareVersionsToYAML } from '../subworkflows/nf-core/utils_nfcore_pipeline' -include { methodsDescriptionText } from '../subworkflows/local/utils_nfcore_metaval_pipeline' -include { EXTRACT_VIRAL_TAXID } from '../modules/local/extract_viral_taxid' -include { KRAKENTOOLS_EXTRACTKRAKENREADS } from '../modules/nf-core/krakentools/extractkrakenreads/main' -include { EXTRACTCENTRIFUGEREADS } from '../modules/local/extractcentrifugereads' -include { EXTRACTCDIAMONDREADS } from '../modules/local/extractdiamondreads' -include { TAXID_READS } from '../subworkflows/local/taxid_reads.nf' +// Extract reads of taxIDs +include { EXTRACT_VIRAL_TAXID } from '../modules/local/extract_viral_taxid' +include { KRAKENTOOLS_EXTRACTKRAKENREADS } from '../modules/nf-core/krakentools/extractkrakenreads/main' +include { EXTRACTCENTRIFUGEREADS } from '../modules/local/extractcentrifugereads' +include { EXTRACTCDIAMONDREADS } from '../modules/local/extractdiamondreads' +include { TAXID_READS } from '../subworkflows/local/taxid_reads.nf' + +// Maping subworkflow +include { BOWTIE2_BUILD as BOWTIE2_BUILD_PATHOGEN } from '../modules/nf-core/bowtie2/build/main' +include { FASTQ_ALIGN_BOWTIE2 } from '../subworkflows/nf-core/fastq_align_bowtie2/main' + +// Summary subworkflow +include { FASTQC } from '../modules/nf-core/fastqc/main' +include { MULTIQC } from '../modules/nf-core/multiqc/main' +include { paramsSummaryMap } from 'plugin/nf-validation' +include { paramsSummaryMultiqc } from '../subworkflows/nf-core/utils_nfcore_pipeline' +include { softwareVersionsToYAML } from '../subworkflows/nf-core/utils_nfcore_pipeline' +include { methodsDescriptionText } from '../subworkflows/local/utils_nfcore_metaval_pipeline' /* @@ -33,7 +40,7 @@ workflow METAVAL { ch_versions = Channel.empty() ch_multiqc_files = Channel.empty() - // Create channels + // Create input channels ch_input = ch_samplesheet.branch { meta, fastq_1, fastq_2, kraken2_report, kraken2_result, kraken2_taxpasta, centrifuge_report, centrifuge_result, centrifuge_taxpasta, diamond, diamond_taxpasta -> // Define single_end based on the conditions @@ -77,6 +84,26 @@ workflow METAVAL { ) ch_versions = ch_versions.mix( TAXID_READS.out.versions ) + /* + SUBWORKFLOW: Short reads pathogens screening + */ + ch_reference = Channel.fromPath( params.pathogens_genome, checkIfExists: true) + .map{ file -> [ [ id: file.baseName ], file ] } + BOWTIE2_BUILD_PATHOGEN ( ch_reference ) + ch_versions = ch_versions.mix( BOWTIE2_BUILD_PATHOGEN.out.versions ) + FASTQ_ALIGN_BOWTIE2 ( + ch_input.short_reads, // ch_reads + BOWTIE2_BUILD_PATHOGEN.out.index, // ch_index + false, // save unaligned + false, // sort bam + ch_reference // ch_fasta + ) + ch_versions = ch_versions.mix(FASTQ_ALIGN_BOWTIE2.out.versions) + + /* + SUBWORKFLOW: long reads pathogens screening + */ + // // MODULE: Run FastQC // From 59185cae00ccf716e9bf9bbefd6551c7830d9fdb Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Wed, 10 Jul 2024 10:41:57 +0200 Subject: [PATCH 10/25] remove extra left-padding spaces in config/modules.config --- conf/modules.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/conf/modules.config b/conf/modules.config index f1f3d52..d14fd24 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -88,7 +88,7 @@ process { publishDir = [ path: { "$params.outdir/pathogens/bowtie2/build" }, mode: params.publish_dir_mode - ] + ] } withName: '.*:FASTQ_ALIGN_BOWTIE2:BOWTIE2_ALIGN' { ext.args = '--no-unal' From 003feba9e99ee0f45247bf189c08bf3828fdd701 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Wed, 10 Jul 2024 14:30:44 +0200 Subject: [PATCH 11/25] add pathogen screening for long reads --- conf/modules.config | 27 +++++- conf/test.config | 5 +- conf/test_full.config | 5 +- conf/test_taxid.config | 5 +- nextflow.config | 4 + nextflow_schema.json | 13 +++ subworkflows/local/longread_screenpathogen.nf | 34 ++++++++ workflows/metaval.nf | 85 ++++++++++--------- 8 files changed, 133 insertions(+), 45 deletions(-) create mode 100644 subworkflows/local/longread_screenpathogen.nf diff --git a/conf/modules.config b/conf/modules.config index d14fd24..ff80419 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -24,7 +24,7 @@ process { publishDir = [ path: { "${params.outdir}/fastqc/input" }, mode: params.publish_dir_mode, - pattern: '*.{html,zip}' + pattern: '*.{html}' ] } @@ -87,11 +87,34 @@ process { ext.args = '--large-index' publishDir = [ path: { "$params.outdir/pathogens/bowtie2/build" }, - mode: params.publish_dir_mode + mode: params.publish_dir_mode, + pattern: 'bowtie2' ] } withName: '.*:FASTQ_ALIGN_BOWTIE2:BOWTIE2_ALIGN' { ext.args = '--no-unal' publishDir = [ enabled: false] } + withName: '.*:LONGREAD_SCREENPATHOGEN:MINIMAP2_INDEX' { + ext.args = '-x map-ont' + publishDir = [ + path: { "$params.outdir/pathogens/minimap2/index" }, + mode: params.publish_dir_mode, + pattern: '*.mmi' + ] + } + withName: '.*:LONGREAD_SCREENPATHOGEN:MINIMAP2_ALIGN' { + ext.args = '--sam-hit-only' + publishDir = [ enabled: false] + } + withName: '.*:LONGREAD_SCREENPATHOGEN:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { + publishDir = [ + path: { "$params.outdir/pathogens/minimap2/align" }, + mode: params.publish_dir_mode, + saveAs: { filename -> filename.equals('versions.yml') ? null : filename } + ] + } + withName: '.*:LONGREAD_SCREENPATHOGEN:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { + publishDir = [ enabled: false ] + } } diff --git a/conf/test.config b/conf/test.config index 71ce54e..744e5d6 100644 --- a/conf/test.config +++ b/conf/test.config @@ -24,12 +24,15 @@ params { pathogens_genome = 'assets/test_data/reference/reference.fna' // Extract reads + perform_extract_reads = true extract_kraken2_reads = true fastq_output = true - extract_centrifuge_reads = true extract_diamond_reads = true + // Screen pathogens + perform_screen_pathogens = true + // Genome references genome = 'R64-1-1' } diff --git a/conf/test_full.config b/conf/test_full.config index 2c39976..24bb6e4 100644 --- a/conf/test_full.config +++ b/conf/test_full.config @@ -19,12 +19,15 @@ params { pathogens_genome = 'assets/test_data/reference/reference.fna' // Extract reads + perform_extract_reads = true extract_kraken2_reads = true fastq_output = true - extract_centrifuge_reads = true extract_diamond_reads = true + // Screen pathogens + perform_screen_pathogens = true + // Genome references genome = 'R64-1-1' } diff --git a/conf/test_taxid.config b/conf/test_taxid.config index a2ce629..00a1082 100644 --- a/conf/test_taxid.config +++ b/conf/test_taxid.config @@ -25,12 +25,15 @@ params { pathogens_genome = 'assets/test_data/reference/reference.fna' // Extract reads + perform_extract_reads = true extract_kraken2_reads = true fastq_output = true - extract_centrifuge_reads = true extract_diamond_reads = true + // Screen pathogens + perform_screen_pathogens = false + // Genome references genome = 'R64-1-1' } diff --git a/nextflow.config b/nextflow.config index 275f971..e1e47c4 100644 --- a/nextflow.config +++ b/nextflow.config @@ -64,12 +64,16 @@ params { validate_params = true // Extract kraken2 Reads + perform_extract_reads = true extract_kraken2_reads = true fastq_output = true extract_centrifuge_reads = true extract_diamond_reads = true + // Screen pathogens + perform_screen_pathogens = true + } diff --git a/nextflow_schema.json b/nextflow_schema.json index 8438de2..85c49e1 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -34,6 +34,13 @@ "description": "Path to a concatenated genome file containing complete genomes from a list of viral pathogens.", "fa_icon": "fas fa-file-csv" }, + "perform_extract_reads": { + "type": "boolean", + "default": true, + "description": "Extract reads assigned to taxonomic IDs.", + "help_text": "Enable the option to extract reads assigned to taxonomic IDs based on the classification results from classifiers Kraken2, Centrifuge, and Diamond." + }, + "extract_kraken2_reads": { "type": "boolean", "default": true, @@ -54,6 +61,12 @@ "description": "Turn on saving extracted kraken2 reads in fastq format.", "default": true }, + "perform_screen_pathogens": { + "type": "boolean", + "default": true, + "description": "Screen viral pathogens for each sample", + "help_text": "Turns on the option to screen viral pathogens by mapping reads against genomes of a list of viral pathogens. Use BOWTIE2 for short reads and Minimap2 for long reads." + }, "outdir": { "type": "string", "format": "directory-path", diff --git a/subworkflows/local/longread_screenpathogen.nf b/subworkflows/local/longread_screenpathogen.nf new file mode 100644 index 0000000..c7459a9 --- /dev/null +++ b/subworkflows/local/longread_screenpathogen.nf @@ -0,0 +1,34 @@ + +// +// Screen pathogens for long reads +// + +include { MINIMAP2_INDEX } from '../../modules/nf-core/minimap2/index/main' +include { MINIMAP2_ALIGN } from '../../modules/nf-core/minimap2/align/main' +include { BAM_SORT_STATS_SAMTOOLS } from '../nf-core/bam_sort_stats_samtools/main' + +workflow LONGREAD_SCREENPATHOGEN { + take: + reads // [ [ meta ], [ reads ] ] + reference // [ [ meta ], [ reference ] ] + + main: + ch_versions = Channel.empty() + ch_multiqc_files = Channel.empty() + + ch_minimap2_index = MINIMAP2_INDEX ( reference ).index + ch_versions = ch_versions.mix( MINIMAP2_INDEX.out.versions ) + + MINIMAP2_ALIGN ( reads, ch_minimap2_index, true, 'bai', false, false ) + ch_versions = ch_versions.mix( MINIMAP2_ALIGN.out.versions.first() ) + + BAM_SORT_STATS_SAMTOOLS ( MINIMAP2_ALIGN.out.bam, reference ) + ch_versions = ch_versions.mix(BAM_SORT_STATS_SAMTOOLS.out.versions) + + emit: + index = MINIMAP2_INDEX.out.index // channel: [ val(meta), [ index ] ] + bam = BAM_SORT_STATS_SAMTOOLS.out.bam // channel: [ val(meta), [ bam ] ] + bai = BAM_SORT_STATS_SAMTOOLS.out.bai // channel: [ val(meta), [ bai ] ] + versions = ch_versions // channel: [ versions.yml ] + mqc = ch_multiqc_files +} diff --git a/workflows/metaval.nf b/workflows/metaval.nf index 407f646..558c538 100644 --- a/workflows/metaval.nf +++ b/workflows/metaval.nf @@ -5,23 +5,24 @@ */ // Extract reads of taxIDs -include { EXTRACT_VIRAL_TAXID } from '../modules/local/extract_viral_taxid' -include { KRAKENTOOLS_EXTRACTKRAKENREADS } from '../modules/nf-core/krakentools/extractkrakenreads/main' -include { EXTRACTCENTRIFUGEREADS } from '../modules/local/extractcentrifugereads' -include { EXTRACTCDIAMONDREADS } from '../modules/local/extractdiamondreads' -include { TAXID_READS } from '../subworkflows/local/taxid_reads.nf' +include { EXTRACT_VIRAL_TAXID } from '../modules/local/extract_viral_taxid' +include { KRAKENTOOLS_EXTRACTKRAKENREADS } from '../modules/nf-core/krakentools/extractkrakenreads/main' +include { EXTRACTCENTRIFUGEREADS } from '../modules/local/extractcentrifugereads' +include { EXTRACTCDIAMONDREADS } from '../modules/local/extractdiamondreads' +include { TAXID_READS } from '../subworkflows/local/taxid_reads' // Maping subworkflow -include { BOWTIE2_BUILD as BOWTIE2_BUILD_PATHOGEN } from '../modules/nf-core/bowtie2/build/main' -include { FASTQ_ALIGN_BOWTIE2 } from '../subworkflows/nf-core/fastq_align_bowtie2/main' +include { BOWTIE2_BUILD as BOWTIE2_BUILD_PATHOGEN } from '../modules/nf-core/bowtie2/build/main' +include { FASTQ_ALIGN_BOWTIE2 } from '../subworkflows/nf-core/fastq_align_bowtie2/main' +include { LONGREAD_SCREENPATHOGEN } from '../subworkflows/local/longread_screenpathogen' // Summary subworkflow -include { FASTQC } from '../modules/nf-core/fastqc/main' -include { MULTIQC } from '../modules/nf-core/multiqc/main' -include { paramsSummaryMap } from 'plugin/nf-validation' -include { paramsSummaryMultiqc } from '../subworkflows/nf-core/utils_nfcore_pipeline' -include { softwareVersionsToYAML } from '../subworkflows/nf-core/utils_nfcore_pipeline' -include { methodsDescriptionText } from '../subworkflows/local/utils_nfcore_metaval_pipeline' +include { FASTQC } from '../modules/nf-core/fastqc/main' +include { MULTIQC } from '../modules/nf-core/multiqc/main' +include { paramsSummaryMap } from 'plugin/nf-validation' +include { paramsSummaryMultiqc } from '../subworkflows/nf-core/utils_nfcore_pipeline' +include { softwareVersionsToYAML } from '../subworkflows/nf-core/utils_nfcore_pipeline' +include { methodsDescriptionText } from '../subworkflows/local/utils_nfcore_metaval_pipeline' /* @@ -71,38 +72,42 @@ workflow METAVAL { /* SUBWORKFLOW: TAXID_READS */ - TAXID_READS ( - ch_extract_reads.reads, - ch_extract_reads.kraken2_taxpasta, - ch_extract_reads.kraken2_result, - ch_extract_reads.kraken2_report, - ch_extract_reads.centrifuge_taxpasta, - ch_extract_reads.centrifuge_result, - ch_extract_reads.centrifuge_report, - ch_extract_reads.diamond_taxpasta, - ch_extract_reads.diamond_tsv, - ) - ch_versions = ch_versions.mix( TAXID_READS.out.versions ) + if ( params.perform_extract_reads ) { + TAXID_READS ( + ch_extract_reads.reads, + ch_extract_reads.kraken2_taxpasta, + ch_extract_reads.kraken2_result, + ch_extract_reads.kraken2_report, + ch_extract_reads.centrifuge_taxpasta, + ch_extract_reads.centrifuge_result, + ch_extract_reads.centrifuge_report, + ch_extract_reads.diamond_taxpasta, + ch_extract_reads.diamond_tsv, + ) + ch_versions = ch_versions.mix( TAXID_READS.out.versions ) + } /* - SUBWORKFLOW: Short reads pathogens screening + SUBWORKFLOW: Screen pathogens */ ch_reference = Channel.fromPath( params.pathogens_genome, checkIfExists: true) .map{ file -> [ [ id: file.baseName ], file ] } - BOWTIE2_BUILD_PATHOGEN ( ch_reference ) - ch_versions = ch_versions.mix( BOWTIE2_BUILD_PATHOGEN.out.versions ) - FASTQ_ALIGN_BOWTIE2 ( - ch_input.short_reads, // ch_reads - BOWTIE2_BUILD_PATHOGEN.out.index, // ch_index - false, // save unaligned - false, // sort bam - ch_reference // ch_fasta - ) - ch_versions = ch_versions.mix(FASTQ_ALIGN_BOWTIE2.out.versions) - - /* - SUBWORKFLOW: long reads pathogens screening - */ + // Short reads + if ( params.perform_screen_pathogens ) { + BOWTIE2_BUILD_PATHOGEN ( ch_reference ) + ch_versions = ch_versions.mix( BOWTIE2_BUILD_PATHOGEN.out.versions ) + FASTQ_ALIGN_BOWTIE2 ( + ch_input.short_reads, // ch_reads + BOWTIE2_BUILD_PATHOGEN.out.index, // ch_index + false, // save unaligned + false, // sort bam + ch_reference // ch_fasta + ) + ch_versions = ch_versions.mix( FASTQ_ALIGN_BOWTIE2.out.versions ) + // Long reads + LONGREAD_SCREENPATHOGEN ( ch_input.long_reads, ch_reference ) + ch_versions = ch_versions.mix( LONGREAD_SCREENPATHOGEN.out.versions ) + } // // MODULE: Run FastQC From 2a7a354b430f1113600dce2590253d30b36ec2cf Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 11 Jul 2024 09:07:52 +0200 Subject: [PATCH 12/25] update the CHANGELOG --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 9d7b41b..71328ac 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -11,6 +11,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - Extract Kraken2 reads with KrakenTools - Extract Centrifuge reads - Extract DIAMOND reads +- Screen pathogens via mapping against genomes from a list of pethogens: Bowtie2 for short reads and Minimap2 for long reads ### `Fixed` From 17e72b6445a61e338ecb5b001b332f9fb3cb3f20 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:37:40 +0200 Subject: [PATCH 13/25] Update conf/modules.config Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- conf/modules.config | 1 + 1 file changed, 1 insertion(+) diff --git a/conf/modules.config b/conf/modules.config index ff80419..d67204a 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -54,6 +54,7 @@ process { pattern: '*.fastq' ] } + withName: EXTRACTCDIAMONDREADS { ext.prefix = { "${meta.id}" } publishDir = [ From 484429b14b2f0f176d067a4b894230ac47896153 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:38:04 +0200 Subject: [PATCH 14/25] Update conf/modules.config Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- conf/modules.config | 1 + 1 file changed, 1 insertion(+) diff --git a/conf/modules.config b/conf/modules.config index d67204a..c321bc3 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -71,6 +71,7 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { publishDir = [ path: { "$params.outdir/pathogens/bowtie2/align" }, From 22aa86a65b0b868464bcf7ba3e3329e1dcbb44be Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:04 +0200 Subject: [PATCH 15/25] Update conf/modules.config Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- conf/modules.config | 1 + 1 file changed, 1 insertion(+) diff --git a/conf/modules.config b/conf/modules.config index c321bc3..2c15606 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -79,6 +79,7 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] } + withName: 'SAMTOOLS_SORT' { ext.prefix = { "${meta.id}_aligned_pathogens_genome_sorted"} } From 6a5e515d0b232166cb647a150b59c08d2b31c3f8 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:14 +0200 Subject: [PATCH 16/25] Update conf/modules.config Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- conf/modules.config | 1 + 1 file changed, 1 insertion(+) diff --git a/conf/modules.config b/conf/modules.config index 2c15606..ea22df8 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -94,6 +94,7 @@ process { pattern: 'bowtie2' ] } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BOWTIE2_ALIGN' { ext.args = '--no-unal' publishDir = [ enabled: false] From 3b912c77edca4597ebacb1956233f14a1e69606f Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:25 +0200 Subject: [PATCH 17/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index 85c49e1..3f5a32e 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -44,7 +44,7 @@ "extract_kraken2_reads": { "type": "boolean", "default": true, - "description": "Extract classified Kraken2 output by taxonomic ID." + "description": "Extract reads classified by kraken2 according to taxonomic ID." }, "extract_centrifuge_reads": { "type": "boolean", From b19db4fb51ed2d947cc1642f7390b3867a7e8ed4 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:36 +0200 Subject: [PATCH 18/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index 3f5a32e..1d0574d 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -49,7 +49,7 @@ "extract_centrifuge_reads": { "type": "boolean", "default": true, - "description": "Extract classified centrifuge output by taxonomic ID." + "description": "Extract reads classified by centrifuge according to taxonomic ID." }, "extract_diamond_reads": { "type": "boolean", From 7b1b179fe8381fe121d95db0f6b9ad63d91927a4 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:44 +0200 Subject: [PATCH 19/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index 1d0574d..d3b2921 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -54,7 +54,7 @@ "extract_diamond_reads": { "type": "boolean", "default": true, - "description": "Extract classified diamond output by taxonomic ID." + "description": "Extract reads classified by diamond according to taxonomic ID." }, "fastq_output": { "type": "boolean", From c2cc381474035f8b22cdb6afd9eeb76589813b66 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:39:51 +0200 Subject: [PATCH 20/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index d3b2921..953d412 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -65,7 +65,7 @@ "type": "boolean", "default": true, "description": "Screen viral pathogens for each sample", - "help_text": "Turns on the option to screen viral pathogens by mapping reads against genomes of a list of viral pathogens. Use BOWTIE2 for short reads and Minimap2 for long reads." + "help_text": "Turns on the option to screen viral pathogens by mapping reads against genomes of a list of viral pathogens. Bowtie2 is used for mapping of short reads and minimap2 for long reads." }, "outdir": { "type": "string", From eac76ca442bf2f30e8031abc15bc5bf595ed8509 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 13:55:14 +0200 Subject: [PATCH 21/25] Trail whitespace --- conf/modules.config | 16 ++++++++++++---- 1 file changed, 12 insertions(+), 4 deletions(-) diff --git a/conf/modules.config b/conf/modules.config index ea22df8..510f724 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -36,6 +36,7 @@ process { pattern: '*viral_taxids.tsv' ] } + withName: KRAKENTOOLS_EXTRACTKRAKENREADS { ext.args = { params.fastq_output ? "--fastq-output" : ""} ext.prefix = { "${meta.id}_${taxid.toString().replaceAll(' ', '-')}" } @@ -54,7 +55,7 @@ process { pattern: '*.fastq' ] } - + withName: EXTRACTCDIAMONDREADS { ext.prefix = { "${meta.id}" } publishDir = [ @@ -63,6 +64,7 @@ process { pattern: '*.fastq' ] } + withName: MULTIQC { ext.args = { { params.multiqc_title ? "--title \"$params.multiqc_title\"" : '' } } publishDir = [ @@ -71,7 +73,7 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] } - + withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { publishDir = [ path: { "$params.outdir/pathogens/bowtie2/align" }, @@ -79,13 +81,15 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] } - + withName: 'SAMTOOLS_SORT' { ext.prefix = { "${meta.id}_aligned_pathogens_genome_sorted"} } + withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { publishDir = [ enabled: false ] } + withName: 'BOWTIE2_BUILD_PATHOGEN' { ext.args = '--large-index' publishDir = [ @@ -94,11 +98,12 @@ process { pattern: 'bowtie2' ] } - + withName: '.*:FASTQ_ALIGN_BOWTIE2:BOWTIE2_ALIGN' { ext.args = '--no-unal' publishDir = [ enabled: false] } + withName: '.*:LONGREAD_SCREENPATHOGEN:MINIMAP2_INDEX' { ext.args = '-x map-ont' publishDir = [ @@ -107,10 +112,12 @@ process { pattern: '*.mmi' ] } + withName: '.*:LONGREAD_SCREENPATHOGEN:MINIMAP2_ALIGN' { ext.args = '--sam-hit-only' publishDir = [ enabled: false] } + withName: '.*:LONGREAD_SCREENPATHOGEN:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { publishDir = [ path: { "$params.outdir/pathogens/minimap2/align" }, @@ -118,6 +125,7 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? null : filename } ] } + withName: '.*:LONGREAD_SCREENPATHOGEN:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { publishDir = [ enabled: false ] } From bed5faadc492153d23cdf99ae5e7321619266bee Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 14:35:34 +0200 Subject: [PATCH 22/25] move the multiqc to the end of modules.config --- conf/modules.config | 19 ++++++++++--------- 1 file changed, 10 insertions(+), 9 deletions(-) diff --git a/conf/modules.config b/conf/modules.config index 510f724..6e140c1 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -65,15 +65,6 @@ process { ] } - withName: MULTIQC { - ext.args = { { params.multiqc_title ? "--title \"$params.multiqc_title\"" : '' } } - publishDir = [ - path: { "${params.outdir}/multiqc"}, - mode: params.publish_dir_mode, - saveAs: { filename -> filename.equals('versions.yml') ? null : filename } - ] - } - withName: '.*:FASTQ_ALIGN_BOWTIE2:BAM_SORT_STATS_SAMTOOLS:SAMTOOLS_(SORT|INDEX)' { publishDir = [ path: { "$params.outdir/pathogens/bowtie2/align" }, @@ -129,4 +120,14 @@ process { withName: '.*:LONGREAD_SCREENPATHOGEN:BAM_SORT_STATS_SAMTOOLS:BAM_STATS_SAMTOOLS:.*' { publishDir = [ enabled: false ] } + + withName: MULTIQC { + ext.args = { { params.multiqc_title ? "--title \"$params.multiqc_title\"" : '' } } + publishDir = [ + path: { "${params.outdir}/multiqc"}, + mode: params.publish_dir_mode, + saveAs: { filename -> filename.equals('versions.yml') ? null : filename } + ] + } + } From d16c39008497ed1ba33ad046faad35fbe5af33c1 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 14:53:57 +0200 Subject: [PATCH 23/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index 953d412..da7e162 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -38,7 +38,7 @@ "type": "boolean", "default": true, "description": "Extract reads assigned to taxonomic IDs.", - "help_text": "Enable the option to extract reads assigned to taxonomic IDs based on the classification results from classifiers Kraken2, Centrifuge, and Diamond." + "help_text": "Enable the option to extract reads assigned to taxonomic IDs based on results from Kraken2, Centrifuge, and Diamond classifiers." }, "extract_kraken2_reads": { From 36cc4221b1ded38c28c7fcd6b78b3e3375ce7b40 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 14:57:01 +0200 Subject: [PATCH 24/25] Update nextflow.config Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow.config b/nextflow.config index e1e47c4..fa5a7a4 100644 --- a/nextflow.config +++ b/nextflow.config @@ -16,7 +16,7 @@ params { taxid = null // Pathogen screening - pathogens_genome = null + pathogens_genomes = null // References genome = null From 93468704b4ccb50d1269a2fe7dc91a4b5d39c302 Mon Sep 17 00:00:00 2001 From: Lili Andersson-Li <64467552+LilyAnderssonLee@users.noreply.github.com> Date: Thu, 18 Jul 2024 14:57:29 +0200 Subject: [PATCH 25/25] Update nextflow_schema.json Co-authored-by: Sofia Stamouli <91951607+sofstam@users.noreply.github.com> --- nextflow_schema.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow_schema.json b/nextflow_schema.json index da7e162..0158ef0 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -27,7 +27,7 @@ "type": "string", "description": "The taxonomy ID of the species identified in the classification results or a list of taxids separated by spaces." }, - "pathogens_genome": { + "pathogens_genomes": { "type": "string", "format": "file-path", "pattern": "^\\S+\\.fn?a(sta)?(\\.gz)?$",