diff --git a/tools/virAnnot/.shed.yml b/tools/virAnnot/.shed.yml
new file mode 100755
index 00000000000..46e552c8f8e
--- /dev/null
+++ b/tools/virAnnot/.shed.yml
@@ -0,0 +1,22 @@
+categories:
+- Metagenomics
+description: virAnnot wrappers
+homepage_url: https://github.com/marieBvr/virAnnot
+type: unrestricted
+long_description: VirAnnot was built to ease the assembly, blast search, taxonomic
+ annotation and OTUs assignation of viral metagenomic NGS data. It is designed to
+ identify viruses in plant metagenomic data but it can be used to assemble and annotate
+ any sequences with the NCBI taxonomy.
+name: virannot
+owner: melefebvre
+remote_repository_url: https://github.com/galaxyproject/tools-iuc/tree/master/tools/virAnnot
+auto_tool_repositories:
+ name_template: "{{ tool_id }}"
+ description_template: "Wrapper for the virAnnot tool suite: {{ tool_name }}"
+suite:
+ name: "suite_virannot"
+ description: "Add taxonomic info to HTS data and assign viral OTUs"
+ long_description: "VirAnnot was built to ease the assembly, blast search, taxonomic
+ annotation and OTUs assignation of viral metagenomic NGS data. It is designed to
+ identify viruses in plant metagenomic data but it can be used to assemble and annotate
+ any sequences with the NCBI taxonomy."
\ No newline at end of file
diff --git a/tools/virAnnot/blast2tsv.py b/tools/virAnnot/blast2tsv.py
new file mode 100755
index 00000000000..ea3d48b854e
--- /dev/null
+++ b/tools/virAnnot/blast2tsv.py
@@ -0,0 +1,284 @@
+#!/usr/bin/env python3
+
+
+# Name: blast2tsv
+# Author(s): Sebastien Theil, Marie Lefebvre - INRAE
+# Aims: Convert blast xml output to tsv and add taxonomy
+
+
+import argparse
+import csv
+import logging as log
+import os
+
+from Bio import Entrez
+from Bio import SeqIO
+from Bio.Blast import NCBIXML
+from ete3 import NCBITaxa
+
+ncbi = NCBITaxa()
+
+
def main():
    """
    Entry point of blast2tsv: parse the command line, configure logging,
    read the BLAST XML results and write the TSV/abundance outputs.
    """
    args = _set_options()
    _set_log_level(args.verbosity)
    _write_tsv(args, _read_xml(args))
+
+
def _guess_database(accession):
    """
    Guess the Entrez database to query from the format of the accession.

    RefSeq accessions are resolved through their 3-character prefix
    (two letters and an underscore). Any other accession used to raise
    ``KeyError``; it is now classified with a best-effort heuristic based on
    the GenBank/ENA/DDBJ layout: exactly three leading letters denotes a
    protein record, anything else is treated as a nucleotide record.

    :param accession: accession string, e.g. ``NC_045512.2`` or ``QHD43416.1``
    :return: ``'nuccore'`` or ``'protein'``
    """
    database_mappings_refseq = {'AC_': 'nuccore', 'NC_': 'nuccore', 'NG_': 'nuccore',
                                'NT_': 'nuccore', 'NW_': 'nuccore', 'NZ_': 'nuccore',
                                'AP_': 'protein', 'NP_': 'protein', 'YP_': 'protein',
                                'XP_': 'protein', 'WP_': 'protein'}
    prefix = accession[0:3]
    if prefix in database_mappings_refseq:
        return database_mappings_refseq[prefix]
    # Not a known RefSeq prefix: count the leading letters of the accession.
    # NOTE(review): heuristic only; accessions from other sources
    # (e.g. UniProt or PDB identifiers) may be misclassified.
    leading_letters = 0
    for char in accession:
        if not char.isalpha():
            break
        leading_letters += 1
    return 'protein' if leading_letters == 3 else 'nuccore'
+
+
def _lookup_taxonomy(accession):
    """
    Resolve an accession to ``(tax_id, taxonomy, organism)``.

    The taxid is fetched with Entrez esummary and expanded to a lineage with
    the module-level ete3 ``ncbi`` object. Any lookup failure is logged as a
    warning and yields three empty strings so one bad accession does not
    abort the whole run.
    """
    try:
        handle = Entrez.esummary(db=_guess_database(accession), id=accession)
        try:
            taxid = str(int(Entrez.read(handle)[0]['TaxId']))
        finally:
            # release the connection even when the reply cannot be parsed
            handle.close()
        log.info("Taxid found for " + accession)
        lineage = ncbi.get_lineage(taxid)
        names = ncbi.get_taxid_translator(lineage)
        taxonomy = [names[tid] for tid in lineage][1:]  # drop the first lineage element
        return taxid, ';'.join(taxonomy), taxonomy[-1]
    except (RuntimeError, KeyError, IndexError, ValueError, OSError) as err:
        log.warning(type(err).__name__ + " - Taxid not found for " + accession)
        return "", "", ""


def _read_xml(options):
    """
    Parse XML blast results file.

    For every alignment, the HSPs lying on the same strand as the first HSP
    are merged (identities, lengths, e-values and bit scores are summed) and
    the result is annotated with NCBI taxonomy. The entry is stored under the
    query id as a dict when it passes the e-value/overlap/score thresholds of
    ``options``, otherwise as the one-element list ``[query_length]``.

    NOTE(review): every alignment of a query overwrites the previous entry,
    so the last alignment wins; the original docstring said "Keep only the
    first hit" - confirm which behaviour is intended.

    :param options: parsed arguments (xml_file, algo, max_evalue, min_qov,
        min_hov, min_score)
    :return: dict mapping query id to the annotated hit or ``[query_length]``
    """
    log.info("Read XML file.")
    xml_results = {}
    with open(options.xml_file, 'r') as results:
        # NCBIXML.parse is lazy, so iteration must happen while the file is open
        for blast_record in NCBIXML.parse(results):
            for aln in blast_record.alignments:
                if not aln.hsps:
                    # nothing to merge; previously this reused stale values
                    continue
                final_hit_count = 0
                for hit in aln.hsps:
                    # frame is (query_frame, hit_frame); fall back to 0 when absent
                    strand = hit.frame[1] if len(hit.frame) > 1 else 0
                    if final_hit_count == 0:
                        first_hit_frame = strand
                        cumul_hit_identity = hit.identities if hit.identities else 0
                        cumul_hit_score = hit.bits
                        cumul_hit_evalue = hit.expect
                        cumul_hit_length = hit.align_length if hit.align_length is not None else 0
                        final_hit_count = 1
                    elif (first_hit_frame > 0 and strand > 0) or (first_hit_frame < 0 and strand < 0):
                        # all HSPs in different strand than 1st HSPs will be discarded.
                        cumul_hit_identity = cumul_hit_identity + hit.identities
                        cumul_hit_length = cumul_hit_length + hit.align_length
                        cumul_hit_evalue = cumul_hit_evalue + hit.expect
                        cumul_hit_score = cumul_hit_score + hit.bits
                        final_hit_count += 1
                hsp = {}
                hsp["evalue"] = cumul_hit_evalue / final_hit_count  # The smaller the E-value, the better the match
                hsp["query_id"] = blast_record.query_id
                hsp["query_length"] = blast_record.query_length  # length of the query
                hsp["accession"] = aln.accession.replace("ref|", "")
                hsp["description"] = aln.hit_def
                hsp["hit_length"] = aln.length  # length of the hit
                hsp["hsp_length"] = aln.hsps[-1].align_length  # alignment length of the last HSP
                hsp["queryOverlap"] = _get_overlap_value(options.algo, hsp, 'hsp', hsp["query_length"])[0]
                if cumul_hit_length == 0:
                    hsp["percentIdentity"] = round(cumul_hit_identity, 1)  # identity percentage
                else:
                    hsp["percentIdentity"] = round(cumul_hit_identity / cumul_hit_length * 100, 1)  # identity percentage
                hsp["score"] = cumul_hit_score  # The higher the bit-score, the better the sequence similarity
                hsp["num_hsps"] = final_hit_count
                hsp["hit_cumul_length"] = cumul_hit_length
                hsp["hitOverlap"] = _get_overlap_value(options.algo, hsp, 'hit', hsp["query_length"])[1]
                hsp["tax_id"], hsp["taxonomy"], hsp["organism"] = _lookup_taxonomy(hsp["accession"])
                passes_filters = (hsp["evalue"] <= options.max_evalue
                                  and hsp["queryOverlap"] >= options.min_qov
                                  and hsp["hitOverlap"] >= options.min_hov
                                  and hsp["score"] >= options.min_score)
                if passes_filters:
                    xml_results[hsp["query_id"]] = hsp
                else:
                    # rejected hits only keep the query length
                    xml_results[hsp["query_id"]] = [hsp["query_length"]]

    return xml_results
+
+
def _get_overlap_value(algo, hsp, type, qlength):
    """
    Set hsp or hit overlap values for hit and query.

    :param algo: BLAST flavour; 'BLASTX', 'TBLASTN' and 'TBLASTX' apply a
        factor 3, any other value uses plain ratios
    :param hsp: dict providing "hsp_length", "hit_length" and, when ``type``
        is not 'hsp', "hit_cumul_length"
    :param type: 'hsp' to use the HSP length, anything else to use the
        cumulated hit length
    :param qlength: length of the query
    :return: list ``[query_overlap, hit_overlap]``, each rounded and capped at 100

    Overlaps default to 0 when their denominator is 0 or missing. Previously
    a falsy ``qlength`` raised UnboundLocalError and a zero HSP length raised
    ZeroDivisionError for TBLASTX.

    NOTE(review): except for TBLASTX the query overlap divides ``qlength`` by
    itself, so it always ends up at 100 for a non-empty query; the formulas
    are kept unchanged here - confirm the intended numerator.
    """
    q_align_len = qlength
    h_align_len = hsp["hsp_length"] if type == 'hsp' else hsp["hit_cumul_length"]
    hit_length = hsp["hit_length"]
    query_overlap = 0
    hit_overlap = 0

    if algo == 'BLASTX':
        if q_align_len:
            query_overlap = (q_align_len * 3 / q_align_len) * 100
        if hit_length:
            hit_overlap = (h_align_len / hit_length) * 100
    elif algo == 'TBLASTN':
        if q_align_len:
            query_overlap = (q_align_len / q_align_len) * 100
        if hit_length:
            hit_overlap = (h_align_len * 3 / hit_length) * 100
    elif algo == 'TBLASTX':
        if q_align_len and hsp["hsp_length"]:
            query_overlap = (q_align_len * 3 / hsp["hsp_length"]) * 100
        if hit_length:
            hit_overlap = (h_align_len * 3 / hit_length) * 100
    else:
        if q_align_len:
            query_overlap = (q_align_len / q_align_len) * 100
        if hit_length:
            hit_overlap = (h_align_len / hit_length) * 100

    # percentages cannot exceed 100
    if query_overlap > 100:
        query_overlap = 100
    if hit_overlap > 100:
        hit_overlap = 100

    return [round(query_overlap, 0), round(hit_overlap, 0)]
+
+
def _write_tsv(options, hits):
    """
    Write the annotated hits to ``<output>/blast2tsv_output.tab`` and then
    build the abundance files from it.

    :param options: parsed arguments (rn_file, fasta_file, output, algo)
    :param hits: dict returned by ``_read_xml``; a value is either the hit
        dict or the list ``[query_length]`` for queries without a kept hit
    """
    # optional mapping contig id -> remaining columns of the read-count file
    rn_list = {}
    if options.rn_file is not None:
        with open(options.rn_file) as rn:
            for line in rn:
                fields = line.split('\t')
                rn_list[fields[0]] = fields[1:]
    with open(options.fasta_file) as fasta_handle:
        fasta = SeqIO.to_dict(SeqIO.parse(fasta_handle, 'fasta'))
    headers = "#algo\tquery_id\tnb_reads\tquery_length\taccession\tdescription\torganism\tpercentIdentity\tnb_hsps\tqueryOverlap\thitOverlap\tevalue\tscore\ttax_id\ttaxonomy\tsequence\n"
    # makedirs also creates missing parent directories
    os.makedirs(options.output, exist_ok=True)
    tsv_file = options.output + "/blast2tsv_output.tab"
    log.info("Write output file: " + tsv_file)
    with open(tsv_file, "w") as f:
        f.write(headers)
        for h, hit in hits.items():
            # a contig missing from the read-count file gets an empty count
            read_nb = ''.join(rn_list.get(h, [])).replace("\n", "")
            if isinstance(hit, dict):
                sequence = str(fasta[h].seq) if h in fasta else "\"\""
                columns = [
                    options.algo, h, read_nb, str(hit["query_length"]),
                    hit["accession"], hit["description"],
                    hit["organism"], str(hit["percentIdentity"]),
                    str(hit["num_hsps"]), str(hit["queryOverlap"]),
                    str(hit["hitOverlap"]), str(hit["evalue"]),
                    str(hit["score"]), str(hit["tax_id"]),
                    hit["taxonomy"], sequence,
                ]
                f.write("\t".join(columns) + "\n")
            else:
                # no kept hit: str([n])[1:-1] strips the list brackets
                f.write(options.algo + "\t" + h + "\t" + read_nb + "\t" + str(hit)[1:-1] + "\t")
                f.write("\n")
    _create_abundance(options, tsv_file)
+
+
def _create_abundance(options, tsv_file):
    """
    Extract values from the tsv file and create the abundance files.

    Rows with exactly 16 columns and a non-empty taxonomy (column 15) are
    grouped by taxonomy; for each taxonomy the read numbers (column 3, empty
    counts as 0) and the number of contigs are accumulated. Two files are
    written to ``options.output``: ``blast2tsv_reads.txt`` and
    ``blast2tsv_contigs.txt``, one line per taxonomy with the count followed
    by the tab-separated lineage.

    :param options: parsed arguments; only ``options.output`` is used
    :param tsv_file: path of the tab file written by ``_write_tsv``
    """
    log.info("Calculating abundance.")
    abundance = {}
    with open(tsv_file, 'r') as current_file:
        log.debug("Reading " + tsv_file)
        csv_reader = csv.reader(current_file, delimiter='\t')
        next(csv_reader, None)  # skip the header line
        for row in csv_reader:
            if len(row) != 16 or row[14] == "":
                log.debug("No annotations for contig " + row[1])
                continue
            nb_reads = row[2]
            if nb_reads == "":
                current_reads_nb = 0
                log.debug("No reads number for " + row[1])
            else:
                current_reads_nb = int(nb_reads)
            counts = abundance.setdefault(row[14], {"reads_nb": 0, "contigs_nb": 0})
            counts["reads_nb"] += current_reads_nb
            counts["contigs_nb"] += 1
    log.debug(abundance)

    # both files share the same layout, only the counter differs
    for file_name, counter in (("/blast2tsv_reads.txt", "reads_nb"),
                               ("/blast2tsv_contigs.txt", "contigs_nb")):
        with open(options.output + file_name, "w") as out_file:
            for taxo, counts in abundance.items():
                out_file.write(str(counts[counter]))
                out_file.write("\t")
                out_file.write("\t".join(taxo.split(";")))
                out_file.write("\n")
        log.info("Abundance file created " + options.output + file_name)
+
+
def _set_options():
    """
    Declare the blast2tsv command-line interface and return the parsed
    arguments (read from ``sys.argv``).
    """
    argument_table = (
        (('-x', '--xml'), dict(help='XML files with results of blast', action='store', required=True, dest='xml_file')),
        (('-rn', '--read-count'), dict(help='Tab-delimited file associating seqID with read number.', action='store', dest='rn_file')),
        (('-c', '--contigs'), dict(help='FASTA file with contigs sequence.', action='store', required=True, dest='fasta_file')),
        (('-me', '--max_evalue'), dict(help='Max evalue', action='store', type=float, default=0.0001, dest='max_evalue')),
        (('-qov', '--min_query_overlap'), dict(help='Minimum query overlap', action='store', type=int, default=5, dest='min_qov')),
        (('-mhov', '--min_hit_overlap'), dict(help='Minimum hit overlap', action='store', type=int, default=5, dest='min_hov')),
        (('-s', '--min_score'), dict(help='Minimum score', action='store', type=int, default=30, dest='min_score')),
        (('-a', '--algo'), dict(help='Blast type detection (BLASTN|BLASTP|BLASTX|TBLASTX|TBLASTN|DIAMONDX).', action='store', type=str, default='BLASTX', dest='algo')),
        (('-o', '--out'), dict(help='The output file (.csv).', action='store', type=str, default='./blast2tsv', dest='output')),
        (('-v', '--verbosity'), dict(help='Verbose level', action='store', type=int, choices=[1, 2, 3, 4], default=1)),
    )
    cli = argparse.ArgumentParser()
    for flags, settings in argument_table:
        cli.add_argument(*flags, **settings)
    return cli.parse_args()
+
+
def _set_log_level(verbosity):
    """
    Configure the root logger from the ``--verbosity`` option.

    Levels 1 and 2 log at INFO with a short format; levels 3 and 4 log at
    DEBUG with the file name and line number added. Levels 2 and 4 are
    accepted by the argument parser but previously configured nothing, which
    silenced the INFO messages.

    :param verbosity: integer verbosity level (1 to 4)
    """
    if verbosity >= 3:
        log_format = '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s'
        level = log.DEBUG
    else:
        log_format = '%(asctime)s %(levelname)-8s %(message)s'
        level = log.INFO
    log.basicConfig(level=level, format=log_format)
+
+
+if __name__ == "__main__":
+ main()
diff --git a/tools/virAnnot/macros.xml b/tools/virAnnot/macros.xml
new file mode 100755
index 00000000000..291f8cbac18
--- /dev/null
+++ b/tools/virAnnot/macros.xml
@@ -0,0 +1,25 @@
+
+
+
+ biopython
+ ete3
+ clustalo
+ curl
+ r-base
+ pyaml
+ openpyxl
+ xlsxwriter
+ xlrd
+ pandas
+ krona
+ zip
+
+
+
+
+
+
+ 10.1094/PBIOMES-07-19-0037-A
+
+
+
diff --git a/tools/virAnnot/otu.py b/tools/virAnnot/otu.py
new file mode 100755
index 00000000000..b0100c966a0
--- /dev/null
+++ b/tools/virAnnot/otu.py
@@ -0,0 +1,442 @@
+#!/usr/bin/env python3
+
+
+# Name: virAnnot_otu
+# Author: Marie Lefebvre - INRAE
+# Requirements: Ete3 toolkit and external apps
+# Aims: Create viral OTUs based on RPS and Blast annotations
+
+
+import argparse
+import csv
+import logging as log
+import os
+import random
+import re
+
+import pandas as pd
+import xlsxwriter
+from Bio import SeqIO
+from Bio.Align.Applications import ClustalOmegaCommandline
+from ete3 import NodeStyle, SeqGroup, SeqMotifFace, Tree, TreeStyle
+
+
def main():
    """
    Run the OTU pipeline:
    1 - collect sequence, query_id and taxonomy of viral hits from RPS files
    2 - align the protein sequences of each domain, compute the distance
        matrix and generate trees
    3 - gather statistics (read number) per OTU
    4 - build the HTML report
    """
    args = _set_options()
    _set_log_level(args.verbosity)
    collection = _cut_sequence(args)
    for stage in (_align_sequences, _get_stats, _create_html):
        stage(args, collection)
+
+
def _cut_sequence(options):
    """
    Retrieve viral hits and sequences from RPS files.

    The RPS, FASTA and (optional) BLAST file lists are sorted in place and
    matched by position. For every RPS row whose superkingdom column contains
    "Viruses", the matched region of the contig is cut out, reverse
    complemented when the frame is negative, and translated. Proteins of at
    least ``options.min_protein_length`` residues are stored as
    ``collection[cdd_id][query_id]`` with the keys "nuccleotide", "protein",
    "full_description", "nb" and "taxonomy". Each ``collection[cdd_id]`` also
    carries "short_description" and "full_description".

    :param options: parsed arguments (rps, fasta, blast, min_protein_length)
    :return: the collection dict described above
    """
    log.info("Cut sequences")
    collection = {}
    # sort once so that the i-th rps, fasta and blast files belong together
    options.rps.sort()
    options.fasta.sort()
    if options.blast is not None:
        options.blast.sort()
    for i, rps_file in enumerate(options.rps):
        log.debug("Reading rps file " + str(rps_file))
        with open(rps_file[0], 'r') as rps_current_file:
            rps_reader = csv.reader(rps_current_file, delimiter='\t')
            next(rps_reader, None)  # skip the header line
            for row in rps_reader:
                if row[1] == "no_hit":
                    continue
                query_id = row[0]
                cdd_id = row[2]
                startQ = int(row[5])
                endQ = int(row[6])
                frame = float(row[7])
                description = row[8]
                superkingdom = row[9]
                # only viral contigs are kept
                if not re.search("Viruses", superkingdom):
                    continue
                # NOTE(review): the FASTA file is re-parsed for every viral hit
                seq = _retrieve_fasta_seq(options.fasta[i][0], query_id)
                if seq is None:
                    # contig absent from the FASTA file; previously crashed on len(None)
                    log.warning("No sequence found for " + query_id)
                    continue
                # slicing clamps the end to the sequence length
                seq = seq[startQ - 1:endQ]
                if frame < 0:
                    seq = seq.reverse_complement()
                prot = seq.translate()
                if len(prot) < options.min_protein_length:
                    continue
                log.debug("Add " + query_id + " to collection")
                if cdd_id not in collection:
                    collection[cdd_id] = {}
                entry = collection[cdd_id][query_id] = {}
                entry["nuccleotide"] = seq
                entry["protein"] = prot
                entry["full_description"] = description
                if options.blast is not None:
                    with open(options.blast[i][0], 'r') as blast_current_file:
                        blast_reader = csv.reader(blast_current_file, delimiter='\t')
                        for b_query in blast_reader:
                            if b_query[1] == query_id:
                                entry["nb"] = b_query[2]
                                if len(b_query) > 10:
                                    entry["taxonomy"] = b_query[14]
                                else:
                                    entry["taxonomy"] = "Unknown"
                            else:
                                # defaults, kept unless a matching row sets them
                                if "nb" not in entry:
                                    entry["nb"] = 0
                                if "taxonomy" not in entry:
                                    entry["taxonomy"] = "Unknown"
                else:
                    log.info("No blast file")
                    entry["taxonomy"] = "Unknown"
                    entry["nb"] = 0

                # keep pfamXXX and RdRp 1; tolerate a description without a comma
                collection[cdd_id]["short_description"] = "".join(description.split(",")[:2])
                collection[cdd_id]["full_description"] = description
    return collection
+
+
def _retrieve_fasta_seq(fasta_file, query_id):
    """
    From fasta file retrieve specific sequence with id.

    :param fasta_file: path of the FASTA file
    :param query_id: identifier of the wanted record
    :return: the ``.seq`` of the record, or ``None`` (after printing a
        message) when the identifier is not in the file
    """
    # the context manager closes the handle that was previously left open
    with open(fasta_file) as handle:
        contigs_list = SeqIO.to_dict(SeqIO.parse(handle, 'fasta'))
    try:
        return contigs_list[query_id].seq
    except KeyError:
        print("KeyError for " + query_id + " file " + fasta_file)
        return None
+
+
def _create_tree(tree, fasta, out, color):
    """
    Create phylogenic tree from multiple alignments.

    :param tree: path of the guide tree file; when it cannot be opened the
        function logs a message and returns without rendering
    :param fasta: path of the aligned FASTA file
    :param out: path of the image to render
    :param color: path of the tab-separated file mapping leaf name to colour
    """
    # only check that the tree file is readable; its content is loaded by ete3
    try:
        with open(tree, 'r'):
            pass
    except IOError:
        log.info("Unknown file: " + tree + ". You may have less than 2 sequences to align.")
        return

    seqs = SeqGroup(fasta, format="fasta")
    t = Tree(tree)
    ts = TreeStyle()
    ts.show_branch_length = True
    colors = _parse_color_file(color)
    for name in t.get_leaf_names():
        seq = seqs.get_seq(name)
        seqFace = SeqMotifFace(seq, seq_format="()")
        for leaf in t.get_leaves_by_name(name):
            if name in colors:
                ns = NodeStyle()
                ns['bgcolor'] = colors[name]
                leaf.set_style(ns)
            leaf.add_face(seqFace, 0, 'aligned')

    t.render(out, tree_style=ts)
+
+
def _parse_color_file(file):
    """
    Read a tab-separated colour file into a dict.

    :param file: path of a file whose first column is a name and whose second
        column is a colour
    :return: dict mapping first column to second column; rows with fewer than
        two columns (e.g. blank lines) are skipped, later rows win on
        duplicate names
    """
    colors = {}
    with open(file) as fh:
        for fields in csv.reader(fh, delimiter="\t"):
            if len(fields) < 2:
                continue
            colors[fields[0]] = fields[1]

    return colors
+
+
def _align_sequences(options, hits_collection):
    """
    Align hit sequences with pfam reference.

    For every domain of ``hits_collection`` a directory named after its short
    description is created under ``options.output`` and receives:
    ``seq_to_align.fasta`` (proteins), ``color_config.txt`` (one random colour
    per sample, the sample being the part of the contig id before the first
    underscore) and ``otu_cluster.csv``. Domains with more than one contig
    are aligned with Clustal Omega, plotted as a tree, turned into an
    identity matrix and clustered by the external ``seek_otu.R`` script;
    single-contig domains get a copy of the input as alignment and a
    one-line cluster file.

    :param options: parsed arguments (output, tool_path, perc)
    :param hits_collection: dict built by ``_cut_sequence``
    """
    # local imports: only this function needs them
    import shutil
    import subprocess

    log.info("Align sequences")
    os.makedirs(options.output, exist_ok=True)
    color_by_sample = {}
    metadata_keys = ("short_description", "full_description")
    for cdd_id in hits_collection:
        cdd_output = options.output + "/" + hits_collection[cdd_id]["short_description"].replace(" ", "_")
        os.makedirs(cdd_output, exist_ok=True)
        file_seq_to_align = cdd_output + "/seq_to_align.fasta"
        file_color_config = cdd_output + "/color_config.txt"
        log.info("Writing to " + file_seq_to_align)
        count = 0  # count number of contig per domain
        # mode "w" truncates a file left over from a previous run
        with open(file_seq_to_align, "w") as f, open(file_color_config, "w") as f_c:
            for query_id in hits_collection[cdd_id]:
                if query_id in metadata_keys:
                    continue
                sample = query_id.split("_")[0]  # get sample from SAMPLE_IdCONTIG
                # same color for each contig of the same sample
                if sample not in color_by_sample:
                    color_by_sample[sample] = "#" + ''.join(random.choice('ABCDEF0123456789') for _ in range(6))
                f.write(">" + query_id + "\n")
                f.write(str(hits_collection[cdd_id][query_id]["protein"]) + "\n")
                f_c.write(query_id + '\t' + color_by_sample[sample] + '\n')
                count += 1
        file_seq_aligned = cdd_output + '/seq_aligned.final_tree.fa'
        tree_file = cdd_output + '/tree.dnd'
        file_cluster = cdd_output + '/otu_cluster.csv'
        # create alignment for domain with more than 1 contigs
        if count > 1:
            log.info("Run clustal omega...")
            clustalo_cmd = ClustalOmegaCommandline("clustalo", infile=file_seq_to_align, outfile=file_seq_aligned,
                                                   guidetree_out=tree_file, seqtype="protein", force=True)
            log.debug(clustalo_cmd)
            stdout, stderr = clustalo_cmd()
            log.debug(stdout + stderr)

            # create tree plot with colors
            file_matrix = cdd_output + "/identity_matrix.csv"
            log.info("Create tree...")
            _create_tree(tree_file, file_seq_aligned, tree_file + '.png', file_color_config)
            _compute_pairwise_distance(options, file_seq_aligned, file_matrix, cdd_id)
            log.info("Retrieve OTUs...")
            # argument list instead of a shell string: paths need no quoting
            otu_cmd = [os.path.join(options.tool_path, 'seek_otu.R'), file_matrix, file_cluster, str(options.perc)]
            log.debug(' '.join(otu_cmd))
            subprocess.call(otu_cmd)
        # only one contig
        else:
            log.debug('cp ' + file_seq_to_align + ' ' + file_seq_aligned)
            shutil.copyfile(file_seq_to_align, file_seq_aligned)

            first_contig = next(key for key in hits_collection[cdd_id] if key not in metadata_keys)
            with open(file_cluster, "w") as f:
                f.write('OTU_1,1,' + first_contig + ',')
+
+
def _compute_pairwise_distance(options, file_seq_aligned, file_matrix, cdd_id):
    """
    Calculate pairwise identity between aligned protein sequences
    from a cdd_id.

    Positions where either sequence holds 'X' or a gap are ignored. The
    identity of a pair is ``identical / compared * 100`` and is forced to 0
    when fewer than 20 positions were compared. The matrix is written to
    ``file_matrix``, one line per sequence: the id followed by its row.

    :param options: parsed arguments (not used by this function)
    :param file_seq_aligned: path of the aligned FASTA file
    :param file_matrix: path of the CSV file to write
    :param cdd_id: domain identifier, only used in the log message
    """
    log.info("Compute pairwise distance of " + cdd_id)
    # parse the alignment once instead of once per sequence
    records = [(record.id, str(record.seq)) for record in SeqIO.parse(file_seq_aligned, "fasta")]
    matrix = {}
    for id1, seq1 in records:
        row = []
        for _, seq2 in records:
            identic = 0
            compared = 0
            for base, base2 in zip(seq1, seq2):
                # unknown residue or gap in at least one sequence, next
                if base in ('X', '-') or base2 in ('X', '-'):
                    continue
                if base == base2:
                    identic += 1
                compared += 1
            # set minimum overlap to 20
            if compared < 20:
                percentIdentity = 0
            else:
                percentIdentity = (identic / compared) * 100
            row.append(percentIdentity)
        matrix[id1] = row
    log.debug("Write " + file_matrix)
    with open(file_matrix, "w") as f:
        for seq_id, values in matrix.items():
            f.write(seq_id + ',' + ', '.join(map(str, values)) + "\n")
+
+
def _get_stats(options, hits_collection):
    """
    Retrieve annotation and number of read
    for each OTUs.

    For every domain, ``otu_cluster.csv`` is read (OTU name in column 1,
    contigs from column 3 to the one before last) and one worksheet is added
    to ``<output>/otu_stats.xlsx`` with a row per OTU: read totals per sample,
    the taxonomy of the last contig of the OTU and the contig list. Each
    sheet is then exported to ``cluster_nb_reads_files.tab`` in the directory
    named after the sheet.

    NOTE(review): the worksheet is named after the short description; this
    presumably has to satisfy Excel's sheet-name rules - confirm.

    :param options: parsed arguments; only ``options.output`` is used
    :param hits_collection: dict built by ``_cut_sequence``
    """
    file_xlsx = options.output + '/otu_stats.xlsx'  # Create a workbook
    workbook = xlsxwriter.Workbook(file_xlsx)
    log.info("Writing stats to " + file_xlsx)
    reserved_keys = ('contigs_list', 'global_taxonomy')
    for cdd_id in hits_collection:
        domain_hits = hits_collection[cdd_id]
        otu_collection = {}
        cdd_output = options.output + "/" + domain_hits["short_description"].replace(" ", "_")
        worksheet = workbook.add_worksheet(domain_hits["short_description"])  # add a worksheet
        file_cluster = cdd_output + '/otu_cluster.csv'
        samples_list = []
        with open(file_cluster, 'r') as clust:
            for cluster_row in csv.reader(clust, delimiter=','):
                contigs_list = cluster_row[2:len(cluster_row) - 1]  # remove last empty column
                otu_entry = otu_collection[cluster_row[0]] = {}  # key -> otu number
                otu_entry['contigs_list'] = contigs_list
                for contig in contigs_list:
                    sample = contig.split('_')[0]
                    if sample not in samples_list:
                        samples_list.append(sample)
                    contig_hit = domain_hits[contig]
                    taxonomy = contig_hit["taxonomy"] if 'taxonomy' in contig_hit else 'unknown'
                    # add read number of the contig and annotation
                    otu_entry.setdefault(sample, {})[contig] = {
                        'nb': contig_hit["nb"] if 'nb' in contig_hit else 0,
                        'taxonomy': taxonomy,
                    }
                    # the last contig of the OTU decides the global taxonomy
                    otu_entry['global_taxonomy'] = taxonomy

        # calculate total number of reads for each sample of each OTU
        for otu_entry in otu_collection.values():
            for sample, contigs in otu_entry.items():
                if sample in reserved_keys:
                    continue
                contigs['total_nb_read'] = sum(int(contig['nb']) for contig in contigs.values())

        # header line
        worksheet.write(0, 0, '#OTU_name')
        for column, samp in enumerate(samples_list, start=1):
            worksheet.write(0, column, samp)
        worksheet.write(0, len(samples_list) + 1, 'taxonomy')
        worksheet.write(0, len(samples_list) + 2, 'contigs_list')

        # one line per OTU: read total of each sample, 0 when the sample is absent
        for row, (otu, otu_entry) in enumerate(otu_collection.items(), start=1):
            worksheet.write(row, 0, otu)
            for column, samp in enumerate(samples_list, start=1):
                if samp in otu_entry and samp not in reserved_keys:
                    worksheet.write(row, column, otu_entry[samp]['total_nb_read'])
                else:
                    worksheet.write(row, column, 0)
            # an OTU without contigs has no taxonomy recorded
            global_taxonomy = otu_entry.get('global_taxonomy', 'unknown')
            worksheet.write(row, len(samples_list) + 1, global_taxonomy.replace(';', ' '))
            worksheet.write(row, len(samples_list) + 2, ",".join(otu_entry['contigs_list']))
    workbook.close()

    read_file = pd.ExcelFile(file_xlsx)
    try:
        for sheet in read_file.sheet_names:
            cluster_nb_reads_file = options.output + "/" + sheet.replace(" ", "_") + "/cluster_nb_reads_files.tab"
            data_xls = pd.read_excel(file_xlsx, sheet_name=sheet, dtype=str, index_col=None)
            data_xls.to_csv(cluster_nb_reads_file, encoding='utf-8', index=False, sep='\t')
    finally:
        read_file.close()
+
+
def _create_html(options, hits_collection):
    """
    Create HTML file with all results.

    Writes ``<output>/map.txt``, a tab-separated file listing for each domain
    the relative paths of its result files and its descriptions, then runs
    the ``rps2tree_html.py`` script found in ``options.tool_path`` on it.

    :param options: parsed arguments (output, tool_path)
    :param hits_collection: dict built by ``_cut_sequence``
    """
    import subprocess  # local import: only this function needs it

    # create mapping file with all informations to use to create HTML report
    map_file_path = options.output + "/map.txt"
    headers = ['#cdd_id', 'align_files', 'tree_files', 'cluster_files', 'cluster_nb_reads_files', 'pairwise_files', 'description', 'full_description\n']
    # mode "w" replaces a map file left over from a previous run
    with open(map_file_path, "w") as map_file:
        map_file.write("\t".join(headers))
        for cdd_id in hits_collection:
            cdd_output = hits_collection[cdd_id]["short_description"].replace(" ", "_")
            columns = [
                cdd_id,
                cdd_output + '/seq_aligned.final_tree.fa',
                cdd_output + '/tree.dnd.png',
                cdd_output + '/otu_cluster.csv',
                cdd_output + "/cluster_nb_reads_files.tab",
                cdd_output + "/identity_matrix.csv",
                cdd_output,
                hits_collection[cdd_id]["full_description"],
            ]
            map_file.write("\t".join(columns) + "\n")
    log.info("Writing HTML report")
    # argument list instead of a shell string: paths need no quoting
    html_cmd = [os.path.join(options.tool_path, 'rps2tree_html.py'), '-m', map_file_path, '-o', options.output]
    log.debug(' '.join(html_cmd))
    subprocess.call(html_cmd)
+
+
def _set_options():
    """
    Declare the OTU tool command-line interface and return the parsed
    arguments (read from ``sys.argv``).
    """
    argument_table = (
        (('-b', '--blast'), dict(help='TAB blast file from blast2ecsv module.', action='append', required=False, dest='blast', nargs='+')),
        (('-r', '--rps'), dict(help='TAB rpsblast file from rps2ecsv module.', action='append', required=True, dest='rps', nargs='+')),
        (('-f', '--fasta'), dict(help='FASTA file with contigs', action='append', required=True, dest='fasta', nargs='+')),
        (('-p', '--percentage'), dict(help='Percentage similarity threshold for OTUs cutoff.', action='store', type=int, default=90, dest='perc')),
        (('-vp', '--viral_portion'), dict(help='Minimun portion of viral sequences in RPS domain to be included.', action='store', type=float, default=0.3, dest='viral_portion')),
        (('-mpl', '--min_protein_length'), dict(help='Minimum query protein length.', action='store', type=int, default=100, dest='min_protein_length')),
        (('-tp', '--tool_path'), dict(help='Path to otu_seek.R', action='store', type=str, default='./', dest='tool_path')),
        (('-o', '--out'), dict(help='The output directory', action='store', type=str, default='./Rps2tree_OTU', dest='output')),
        (('-rgb', '--rgb-conf'), dict(help='Color palette for contigs coloration', action='store', type=str, default='rgb.txt', dest='file_rgb')),
        (('-v', '--verbosity'), dict(help='Verbose level', action='store', type=int, choices=[1, 2, 3, 4], default=1)),
    )
    cli = argparse.ArgumentParser()
    for flags, settings in argument_table:
        cli.add_argument(*flags, **settings)
    return cli.parse_args()
+
+
def _set_log_level(verbosity):
    """
    Configure the root logger from the ``--verbosity`` option.

    Levels 1 and 2 log at INFO with a short format; levels 3 and 4 log at
    DEBUG with the file name and line number added. Levels 2 and 4 are
    accepted by the argument parser but previously configured nothing, which
    silenced the INFO messages.

    :param verbosity: integer verbosity level (1 to 4)
    """
    if verbosity >= 3:
        log_format = '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s'
        level = log.DEBUG
    else:
        log_format = '%(asctime)s %(levelname)-8s %(message)s'
        level = log.INFO
    log.basicConfig(level=level, format=log_format)
+
+
+if __name__ == "__main__":
+ main()
diff --git a/tools/virAnnot/rps2tree_html.py b/tools/virAnnot/rps2tree_html.py
new file mode 100755
index 00000000000..e7294601c0f
--- /dev/null
+++ b/tools/virAnnot/rps2tree_html.py
@@ -0,0 +1,153 @@
+#!/usr/bin/env python3
+import argparse
+import csv
+import logging
+import sys
+
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+
def main():
    """
    Read the map file given on the command line, render the report and
    save it as ``index.html`` in the output directory.
    """
    args = _set_options()
    records, columns = _read_map_file(args.map)
    page = _print_html(records, columns, args.out)
    with open(args.out + '/index.html', mode='w') as index:
        index.write(page)
+
+
def _get_google_script_headers(data, headers, out_dir):
    """
    Return the header fragment inserted into the page by ``_print_html``.

    As visible here the function concatenates two empty strings, each
    followed by a newline, and uses none of its parameters.
    NOTE(review): the empty literals presumably held markup that was
    stripped from this view - verify against the original file.
    """
    html = '' + "\n"
    html += '' + "\n"
    return html
+
+
def _get_google_js(data, headers, out_dir):
    """
    Build one Google Visualization table script per domain.

    For each entry of ``data`` the file ``cluster_nb_reads_files`` (relative
    to ``out_dir``) is parsed with ``_parse_csv``. The columns '#OTU_name',
    'taxonomy', 'contigs_list' and 'seq_list' are declared as strings, all
    others as numbers. In every row the first and the last two cells are
    emitted as quoted strings and the cells in between verbatim.

    Missing cells (``None`` from ``_parse_csv``) used to raise TypeError;
    they are now emitted as ``null`` for numbers and ``''`` for strings.
    Backslashes and single quotes inside string cells are escaped so they
    cannot terminate the JavaScript literal.

    :param data: list of dicts from ``_read_map_file``
    :param headers: map file headers (not used by this function)
    :param out_dir: directory containing the files referenced by ``data``
    :return: tuple ``(chart_names, java_scripts)``, two parallel lists
    """
    string_columns = ('#OTU_name', 'taxonomy', 'contigs_list', 'seq_list')

    def js_string(value):
        # quote a cell as a JavaScript string literal
        text = '' if value is None else value
        return '\'' + text.replace('\\', '\\\\').replace('\'', '\\\'') + '\''

    java_scripts = []
    chart_names = []
    for cdd in data:
        chart_name = cdd['cdd_id'] + '_' + cdd['description']
        chart_names.append(chart_name)
        mat, head = _parse_csv(out_dir + '/' + cdd['cluster_nb_reads_files'])
        js = ['var data = new google.visualization.DataTable();' + "\n"]
        for el in head:
            column_type = 'string' if el in string_columns else 'number'
            js.append('data.addColumn(\'' + column_type + '\', \'' + el + '\');' + "\n")
        js.append('data.addRows([' + "\n")
        for j, record in enumerate(mat):
            cells = [js_string(record.get(head[0]))]
            # sample columns: everything between the OTU name and the last two columns
            for column in head[1:max(len(head) - 2, 1)]:
                value = record.get(column)
                cells.append('null' if value is None else value)
            cells.append(js_string(record.get(head[len(head) - 2])))
            cells.append(js_string(record.get(head[len(head) - 1])))
            js.append('[' + ','.join(cells) + ']')
            if j != (len(mat) - 1):
                js.append(',')
            js.append("\n")
        js.append(']);' + "\n")
        js.append('var table = new google.visualization.Table(document.getElementById(\'' + chart_name.replace('-', '_') + '_div' + '\'));' + "\n")
        js.append('table.draw(data, {showRowNumber: false, width: \'70%\', height: \'70%\'});' + "\n")
        java_scripts.append(''.join(js))
    return chart_names, java_scripts
+
+
def _parse_csv(file):
    """
    Parse a tab-separated file with a header line.

    :param file: path of the file to read
    :return: tuple ``(matrix, headers)`` where ``headers`` is the first line
        and ``matrix`` holds one dict per following line, keyed by header.
        Empty cells and the literal ``null`` are stored as ``None``. Cells
        beyond the number of headers are ignored. An empty file yields
        ``([], [])``.
    """
    with open(file) as fh:
        data = list(csv.reader(fh, delimiter="\t"))
    if not data:
        return [], []
    headers = data[0]
    matrix = []
    for fields in data[1:]:
        record = {}
        for column, value in zip(headers, fields):
            record[column] = None if value in ('', 'null') else value
        matrix.append(record)
    return matrix, headers
+
+
def _print_html(data, headers, out_dir):
    # Assemble the whole report page as one string: fixed fragments, the
    # output of _get_google_script_headers(), then the per-domain content
    # from _print_data().
    # NOTE(review): in this view the fixed fragments are empty or split
    # across lines; the markup they held was presumably stripped - restore
    # the literals from the original file before editing this function.
    html = '' + "\n"
    html += '
' + "\n"
    html += '' + 'rps2tree' + ' '
    html += _get_google_script_headers(data, headers, out_dir)
    html += '' + "\n"
    html += '' + "\n"
    html += '
rps2tree ' + "\n"
    html += '' + "\n"
    html += _print_data(data, headers)
    html += '' + "\n"
    html += '' + "\n"
    html += '' + "\n"
    return html
+
+
def _print_data(data, headers):
    # Build the page section of every domain in `data`: its cdd_id and
    # description, its full description, then the names of its alignment,
    # cluster, read-count and pairwise files. `headers` is not used.
    # NOTE(review): in this view the fixed fragments are empty or split
    # across lines; the markup they held was presumably stripped - restore
    # the literals from the original file before editing this function.
    html = ''
    for cdd in data:
        html += '' + cdd['cdd_id'] + ' ' + cdd['description'] + ' ' + "\n"
        html += '' + cdd['full_description'] + '' + '
' + "\n"
        html += '
' + "\n"
        html += '' + "\n"
        html += '' + "\n"
        html += ' ' + "\n"
        html += '' + "\n"
        html += '' + cdd['align_files'] + ' ' + "\n"
        html += '' + "\n"
        html += '' + cdd['cluster_files'] + ' ' + "\n"
        html += '' + "\n"
        html += '' + cdd['cluster_nb_reads_files'] + ' ' + "\n"
        html += '' + "\n"
        html += '' + cdd['pairwise_files'] + ' ' + "\n"
        html += '' + "\n"
        html += '' + "\n"
        html += ' ' + "\n"
    return html
+
+
def _read_map_file(file):
    """
    Read the tab-separated map file.

    :param file: open text file (or any iterable of lines); the first line
        holds the headers, with a leading character (the ``#``) that is
        removed from the first header
    :return: tuple ``(map_obj, headers)`` where ``map_obj`` holds one dict
        per data line, keyed by header. An empty file yields ``([], [])``.
    :raises SystemExit: when a data line does not have as many columns as
        the header line
    """
    data = list(csv.reader(file, delimiter="\t"))
    if not data:
        return [], []
    headers = data[0]
    if headers:
        headers[0] = headers[0][1:]  # drop the leading '#'
    map_obj = []
    for fields in data[1:]:
        if len(fields) != len(headers):
            sys.exit('line and headers not the same length.')
        map_obj.append(dict(zip(headers, fields)))
    return map_obj, headers
+
+
def _set_options():
    """
    Declare the report generator command-line interface and return the
    parsed arguments (read from ``sys.argv``). ``--map`` is opened for
    reading by argparse.
    """
    cli = argparse.ArgumentParser()
    cli.add_argument(
        '-m', '--map',
        help='The map file produced by rps2tree.pl script.',
        action='store',
        type=argparse.FileType('r'),
        required=True,
    )
    cli.add_argument(
        '-o', '--out',
        help='The title for the HTML page.',
        action='store',
        type=str,
        default='./',
    )
    return cli.parse_args()
+
+
+if __name__ == "__main__":
+ main()
diff --git a/tools/virAnnot/rps2tsv.py b/tools/virAnnot/rps2tsv.py
new file mode 100755
index 00000000000..1d2a4be3bcf
--- /dev/null
+++ b/tools/virAnnot/rps2tsv.py
@@ -0,0 +1,124 @@
+#!/usr/bin/env python3
+
+
+# Name: rps2tsv
+# Author: Marie Lefebvre - INRAE
+# Aims: Convert rpsblast xml output to tsv and add taxonomy
+
+
+import argparse
+import json
+import logging as log
+from urllib import request
+from urllib.error import HTTPError, URLError
+
+from Bio.Blast import NCBIXML
+from ete3 import NCBITaxa
+
+# Module-level ete3 NCBITaxa handle, created once at import time and used
+# below to translate NCBI taxids into names.
+ncbi = NCBITaxa()
+
+
def main():
    """
    Script entry point: parse the options, configure logging, read the
    RPSblast XML results and write them out as a table.
    """
    opts = _set_options()
    _set_log_level(opts.verbosity)
    _write_tsv(opts, _read_xml(opts))
+
+
def _read_xml(options):
    """
    Parse XML RPSblast results file

    Every HSP whose e-value does not exceed ``options.max_evalue`` is turned
    into a dictionary and stored under its query id; a later HSP of the same
    query replaces an earlier one. Each stored HSP carries a ``taxonomy``
    string built from the InterPro taxonomy of its Pfam entry (empty when
    that information could not be retrieved).

    :param options: parsed arguments providing ``xml_file`` and ``max_evalue``
    :return: dict mapping query id to the HSP dictionary
    """
    log.info("Read XML file " + options.xml_file)
    xml_results = {}
    # The InterPro answer depends only on the Pfam accession, so each
    # accession is requested once instead of once per HSP.
    taxonomy_by_pfam = {}
    # NCBIXML.parse() reads lazily, so the file must stay open while iterating.
    with open(options.xml_file, 'r') as xml:
        for blast_record in NCBIXML.parse(xml):
            for aln in blast_record.alignments:
                cdd_id = aln.hit_def.split(",")[0]
                pfam_id = cdd_id.replace("pfam", "PF")
                for hit in aln.hsps:
                    if hit.expect > options.max_evalue:
                        continue
                    if pfam_id not in taxonomy_by_pfam:
                        taxonomy_by_pfam[pfam_id] = _fetch_pfam_taxonomy(pfam_id)
                    hsp = {
                        "frame": hit.frame[0],
                        "evalue": hit.expect,
                        "startQ": hit.query_start,
                        "endQ": hit.query_end,
                        "query_id": blast_record.query_id,
                        "cdd_id": cdd_id,
                        "hit_id": aln.hit_id,
                        "query_length": blast_record.query_length,
                        "description": aln.hit_def,
                        "accession": aln.accession,
                        "pfam_id": pfam_id,
                        # Always present, so the writer never hits a KeyError
                        "taxonomy": taxonomy_by_pfam[pfam_id],
                    }
                    xml_results[hsp["query_id"]] = hsp
    return xml_results


def _fetch_pfam_taxonomy(pfam_id):
    """
    Ask InterPro for the taxonomy of a Pfam entry and summarise it.

    :param pfam_id: Pfam accession used in the request URL
    :return: ``"name(count);name(count)"`` sorted by decreasing count, or an
        empty string when the request fails or returns no usable data
    """
    log.info("Requeting Interpro for " + pfam_id)
    url = "https://www.ebi.ac.uk/interpro/api/entry/pfam/" + pfam_id + "/taxonomy/uniprot/"
    try:
        with request.urlopen(request.Request(url)) as response:
            payload = json.loads(response.read().decode())
    except HTTPError as e:
        # HTTPError is a subclass of URLError, so it has to be caught first
        log.debug('Http error for interpro: %s', e.code)
        return ""
    except URLError as e:
        log.debug('Url error for interpro: %s', e.reason)
        return ""
    except ValueError as e:
        # json.JSONDecodeError derives from ValueError (empty or non-JSON body)
        log.debug('Invalid response from interpro: %s', e)
        return ""
    frequency = {}
    for item in payload.get("taxonomy_subset", []):
        lineage = [int(i) for i in item["lineage"]]
        names = list(ncbi.get_taxid_translator(lineage).values())
        taxonomy = names[1:]  # remove 'root' at the beginning
        if not taxonomy:
            # lineage made of the root only: nothing to count
            continue
        frequency[taxonomy[0]] = frequency.get(taxonomy[0], 0) + 1
    # e.g. {'Pseudomonadota': 9, 'cellular organisms': 4} -> most frequent first
    ranked = sorted(frequency.items(), key=lambda x: x[1], reverse=True)
    return ";".join("{}({})".format(k, v) for k, v in ranked)
+
+
+def _write_tsv(options, hits):
+ """
+ Write output
+ """
+ log.info("Write output file " + options.output)
+ headers = "#query_id\tquery_length\tcdd_id\thit_id\tevalue\tstartQ\tendQ\tframe\tdescription\tsuperkingdom\n"
+ f = open(options.output, "w+")
+ f.write(headers)
+ for h in hits:
+ f.write(h + "\t" + str(hits[h]["query_length"]) + "\t")
+ f.write(hits[h]["cdd_id"] + "\t" + hits[h]["hit_id"] + "\t" + str(hits[h]["evalue"]) + "\t")
+ f.write(str(hits[h]["startQ"]) + "\t" + str(hits[h]["endQ"]) + "\t" + str(hits[h]["frame"]) + "\t")
+ f.write(hits[h]["description"] + "\t" + hits[h]["taxonomy"])
+ f.write("\n")
+ f.close()
+
+
+def _set_options():
+ parser = argparse.ArgumentParser()
+ parser.add_argument('-x', '--xml', help='XML files with results of blast', action='store', required=True, dest='xml_file')
+ parser.add_argument('-e', '--max_evalue', help='Max evalue', action='store', type=float, default=0.0001, dest='max_evalue')
+ parser.add_argument('-o', '--out', help='The output file (.tab).', action='store', type=str, default='./rps2tsv_output.tab', dest='output')
+ parser.add_argument('-v', '--verbosity', help='Verbose level', action='store', type=int, choices=[1, 2, 3, 4], default=1)
+ args = parser.parse_args()
+ return args
+
+
+def _set_log_level(verbosity):
+ if verbosity == 1:
+ log_format = '%(asctime)s %(levelname)-8s %(message)s'
+ log.basicConfig(level=log.INFO, format=log_format)
+ elif verbosity == 3:
+ log_format = '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s'
+ log.basicConfig(level=log.DEBUG, format=log_format)
+
+
+# Run main() only when the file is executed as a script, not when imported.
+if __name__ == "__main__":
+ main()
diff --git a/tools/virAnnot/seek_otu.R b/tools/virAnnot/seek_otu.R
new file mode 100755
index 00000000000..96fdbe24b88
--- /dev/null
+++ b/tools/virAnnot/seek_otu.R
@@ -0,0 +1,48 @@
#!/usr/bin/env Rscript

## Usage: seek_otu.R <identity_matrix.csv> <output_file> <identity_threshold>
## Groups the rows of an identity matrix into OTUs with single-linkage
## hierarchical clustering and appends one line per OTU to the output file:
## OTU_<number>,<number of contigs>,<contig>,<contig>,...

## Redirect R error handling to stderr.
options(show.error.messages = FALSE, error = function() {
  cat(geterrmessage(), file = stderr())
  q("no", 1, FALSE)
})

## Avoid crashing Galaxy with a UTF8 error on German LC settings
loc <- Sys.setlocale("LC_MESSAGES", "en_US.UTF-8")

args <- commandArgs(trailingOnly = TRUE)
## All three positional arguments are read below, so require all of them.
if (length(args) < 3) {
  stop("Arguments missing for Rscrpit", call. = FALSE)
} else {
  # percentage of identity
  id_threshold <- as.numeric(args[3])
  if (is.na(id_threshold)) {
    stop("Identity threshold must be numeric", call. = FALSE)
  }
  # get input data (matrix); the first column provides the row names
  data <- read.csv(args[1], header = FALSE, sep = ",", row.names = 1)
  # create matrix from all remaining columns
  mat <- as.matrix(data)
  # turn identities into distances
  # NOTE(review): distances are 1 - identity and the tree is cut at
  # -id_threshold; presumably identities are percentages -- confirm.
  d <- as.dist(1 - mat)
  # create tree
  hc <- hclust(d, method = "single")
  # assign otu based on identity value
  otu <- cutree(hc, h = -id_threshold)
  # group contigs by otu
  # Print results to output file
  output <- args[2]
  # unique is used to know the number of different otu
  for (i in unique(otu)) {
    # retrieve contigs belonging to the same otu
    clust <- which(otu == i)
    # write otu number and number of contigs in this otu
    cat(
      paste("OTU_", i, ",", length(clust), ",", sep = ""),
      file = output, append = TRUE
    )
    for (n in names(clust)) {
      # write contigs name
      cat(paste(gsub(" ", "", n), ",", sep = ""), file = output, append = TRUE)
    }
    cat("\n", sep = "", file = output, append = TRUE)
  }
}
diff --git a/tools/virAnnot/test-data/blast2tsv_contigs.fa b/tools/virAnnot/test-data/blast2tsv_contigs.fa
new file mode 100755
index 00000000000..9b1c61681af
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_contigs.fa
@@ -0,0 +1,16 @@
+>ds2020-482-EDGG-1-Q4_42600
+TCGGTGGGGGGACCTTGCGGACATGGGCGGCGGACCGTAAGATGTATAGAGGTGGGGGTA
+GTAGTTTTGATGCCCTTTTGCTTTTGTGCCAAGCCA
+>ds2020-482-EDGG-1-Q4_107243
+TATATCTGTGCTTTGGAACACAATGATTCTCAAAGTCTATGTCGAGACTGGAAACTCTCT
+>ds2020-482-EDGG-1-Q4_2681
+CCTTCCTAGCGACCACGCACACGTCAAGACCGGCATCATCAATGTCGCGACAATCGTGAA
+CCACTTTAGTATAGTCCACATCAAGATCATCATAAGGTAGATAAAAGGAATCAATTTCCC
+TAGGAAAAAGTCCAGAATCATCTTCCTCATAAAAATCTGGTATCGAGGGATCAATGGTTC
+GCACCACCATCTCGAATGTATCAAAGATCGTCGCGAAATCAAACTTTGCGGTATGCTTAA
+CGACAAACTCGAAAAGGAAAAGTTTTACCCATTCGTCGTAGTTGTCATCTTTATGCACAC
+CGAACGTCGAGAAAAACCCAAAGAACGTGTGCGTGGTCGCTAGGAAGG
+>ds2020-482-EDGG-1-Q4_107857
+TCAAGATTGTCGAAAGTGCCACACAGATATTGGTTGCAGCTGTGATTACTGCAATTGGC
+>ds2020-482-EDGG-1-Q4_63163
+AAGTTCATGGACTTCATCCGAGGAGTTGCCGTCATTGGGGAAGGGCAGTGGGGGATTGAG
\ No newline at end of file
diff --git a/tools/virAnnot/test-data/blast2tsv_contigs.txt b/tools/virAnnot/test-data/blast2tsv_contigs.txt
new file mode 100644
index 00000000000..aef29a9b6a2
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_contigs.txt
@@ -0,0 +1 @@
+1 Viruses Riboviria Orthornavirae Kitrinoviricota Alsuviricetes Martellivirales Bromoviridae Ilarvirus Blackberry chlorotic ringspot virus
diff --git a/tools/virAnnot/test-data/blast2tsv_input.xml b/tools/virAnnot/test-data/blast2tsv_input.xml
new file mode 100755
index 00000000000..99ac6541b13
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_input.xml
@@ -0,0 +1,593 @@
+
+
+
+ tblastx
+ TBLASTX 2.10.1+
+ Stephen F. Altschul, Thomas L. Madden, Alejandro A. Schäffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), "Gapped BLAST and PSI-BLAST: a new generation of protein database search programs", Nucleic Acids Res. 25:3389-3402.
+ /save/tcandresse/refseq/refseq.short.fa
+ ds2020-482-EDGG-1-Q4_42600
+ No definition line
+ 96
+
+
+ BLOSUM62
+ 0.001
+ 11
+ 1
+ L;
+
+
+
+
+ 1
+ ds2020-482-EDGG-1-Q4_42600
+ No definition line
+ 96
+
+
+ 1
+ ref|NC_035070.1|
+ Spinach amalgavirus 1 isolate SRP059420 fusion protein and putative coat protein genes, complete cds
+ NC_035070
+ 3420
+
+
+ 1
+ 51.4703
+ 106
+ 6.20873e-08
+ 3
+ 95
+ 1338
+ 1430
+ 3
+ 3
+ 20
+ 24
+ 0
+ 31
+ GGGTLRTWAADRKMYRGGGSSFDALLLLCQA
+ GGGAMRSWEVDSQMYRGGGNSADALRLLGQA
+ GGG +R+W D +MYRGGG+S DAL LL QA
+
+
+
+
+
+
+ 7073
+ 36804204
+ 24
+ 96786528
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+
+
+ 2
+ ds2020-482-EDGG-1-Q4_60894
+ No definition line
+ 82
+
+
+
+
+ 7073
+ 36804204
+ 19
+ 97069448
+ 0.139224951877679
+ 0.315124495232289
+ 0.441609275168242
+
+
+ No hits found
+
+
+ 3
+ ds2020-482-EDGG-1-Q4_64647
+ No definition line
+ 80
+
+
+
+
+ 7073
+ 36804204
+ 18
+ 97126032
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 4
+ ds2020-482-EDGG-1-Q4_97438
+ No definition line
+ 64
+
+
+
+
+ 7073
+ 36804204
+ 13
+ 97408952
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 5
+ ds2020-482-EDGG-1-Q4_104226
+ No definition line
+ 61
+
+
+
+
+ 7073
+ 36804204
+ 12
+ 97465536
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 6
+ ds2020-482-EDGG-1-Q4_60048
+ No definition line
+ 83
+
+
+
+
+ 7073
+ 36804204
+ 19
+ 97069448
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 7
+ ds2020-482-EDGG-1-Q4_57812
+ No definition line
+ 84
+
+
+
+
+ 7073
+ 36804204
+ 20
+ 97012864
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 8
+ ds2020-482-EDGG-1-Q4_107243
+ No definition line
+ 60
+
+
+ 1
+ ref|NC_006276.1|
+ White clover cryptic virus 1 RNA2, complete genome
+ NC_006276
+ 1708
+
+
+ 1
+ 37.724
+ 76
+ 0.000859157
+ 2
+ 52
+ 495
+ 545
+ 2
+ 3
+ 14
+ 15
+ 0
+ 17
+ ISVLWNTMILKVYVETG
+ VSVLWNVMILKVYVNTG
+ +SVLWN MILKVYV TG
+
+
+
+
+
+
+ 7073
+ 36804204
+ 12
+ 97465536
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+
+
+ 9
+ ds2020-482-EDGG-1-Q4_99332
+ No definition line
+ 63
+
+
+
+
+ 7073
+ 36804204
+ 13
+ 97408952
+ 0.133969292349849
+ 0.313843789061929
+ 0.427993038537577
+
+
+ No hits found
+
+
+ 10
+ ds2020-482-EDGG-1-Q4_77228
+ No definition line
+ 74
+
+
+
+
+ 7073
+ 36804204
+ 16
+ 97239200
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 11
+ ds2020-482-EDGG-1-Q4_66730
+ No definition line
+ 79
+
+
+
+
+ 7073
+ 36804204
+ 17
+ 109330443
+ 0.123285876267438
+ 0.308001358455575
+ 0.370429799913588
+
+
+ No hits found
+
+
+ 12
+ ds2020-482-EDGG-1-Q4_2681
+ No definition line
+ 348
+
+
+ 1
+ ref|NC_011554.1|
+ Blackberry chlorotic ringspot virus RNA2, complete genome
+ NC_011554
+ 2879
+
+
+ 1
+ 72.0897
+ 151
+ 1.04985e-23
+ 137
+ 286
+ 117
+ 266
+ -3
+ 3
+ 28
+ 36
+ 0
+ 50
+ DNYDEWVKLFLFEFVVKHTAKFDFATIFDTFEMVVRTIDPSIPDFYEEDD
+ DMYKEWVSMFLFKFIVEHTAKFDFATIDCTFGMIVARLIPGYSDLDDEDE
+ D Y EWV +FLF+F+V+HTAKFDFATI TF M+V + P D +ED+
+
+
+ 2
+ 56.0524
+ 116
+ 1.04985e-23
+ 38
+ 148
+ 252
+ 362
+ -3
+ 3
+ 21
+ 28
+ 0
+ 37
+ EEDDSGLFPREIDSFYLPYDDLDVDYTKVVHDCRDID
+ DDEDEEHSPREIDSFYLPYDDLDVDYTTIDYRRDDVE
+ +++D PREIDSFYLPYDDLDVDYT + + D++
+
+
+ 3
+ 44.5971
+ 91
+ 2.20433e-07
+ 183
+ 275
+ 128
+ 220
+ 3
+ -2
+ 19
+ 20
+ 0
+ 31
+ TTISNVSKIVAKSNFAVCLTTNSKRKSFTHS
+ TIIPNVQSIVAKSNFAVCSTINLNKNMLTHS
+ T I NV IVAKSNFAVC T N + THS
+
+
+ 4
+ 28.1016
+ 55
+ 2.20433e-07
+ 73
+ 126
+ 274
+ 327
+ 1
+ -3
+ 12
+ 12
+ 0
+ 18
+ SPHQDHHKVDKRNQFP*E
+ SLHQDRRMEDKRNQSP*E
+ S HQD DKRNQ P*E
+
+
+
+
+
+
+ 7073
+ 36804204
+ 43
+ 873366817
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+
+
+ 19
+ ds2020-482-EDGG-1-Q4_107857
+ No definition line
+ 59
+
+
+ 1
+ ref|NC_003501.1|
+ Brome streak mosaic virus, complete genome
+ NC_003501
+ 9672
+
+
+ 1
+ 62.0091
+ 129
+ 4.20284e-11
+ 2
+ 58
+ 3274
+ 3330
+ 2
+ 1
+ 19
+ 19
+ 0
+ 19
+ QDCRKCHTDIGCSCDYCNW
+ QDCRKCHTDIGCSCDYCNW
+ QDCRKCHTDIGCSCDYCNW
+
+
+ 2
+ 55.1359
+ 114
+ 4.92676e-09
+ 3
+ 59
+ 3275
+ 3331
+ -1
+ -3
+ 19
+ 19
+ 0
+ 19
+ ANCSNHSCNQYLCGTFDNL
+ ANCSNHSCNQYLCGTFDNL
+ ANCSNHSCNQYLCGTFDNL
+
+
+
+
+
+
+ 7073
+ 36804204
+ 11
+ 97522120
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+
+
+ 20
+ ds2020-482-EDGG-1-Q4_83983
+ No definition line
+ 71
+
+
+
+
+ 7073
+ 36804204
+ 15
+ 97295784
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 21
+ ds2020-482-EDGG-1-Q4_92239
+ No definition line
+ 66
+
+
+
+
+ 7073
+ 36804204
+ 14
+ 97352368
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 22
+ ds2020-482-EDGG-1-Q4_31663
+ No definition line
+ 111
+
+
+
+
+ 7073
+ 36804204
+ 29
+ 96503608
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+ 23
+ ds2020-482-EDGG-1-Q4_63163
+ No definition line
+ 81
+
+
+ 1
+ ref|NC_011591.1|
+ Southern tomato virus, complete genome
+ NC_011591
+ 3437
+
+
+ 1
+ 44.1389
+ 90
+ 1.00223e-05
+ 1
+ 81
+ 3034
+ 3114
+ 1
+ 1
+ 17
+ 19
+ 0
+ 27
+ KFMDFIRGVAVIGEGQWGIEMDRWIRF
+ KVMDLIRGNATIGRGQWGNDVMDWIRF
+ K MD IRG A IG GQWG ++ WIRF
+
+
+
+
+
+
+ 7073
+ 36804204
+ 19
+ 97069448
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+
+
+ 24
+ ds2020-482-EDGG-1-Q4_91422
+ No definition line
+ 67
+
+
+
+
+ 7073
+ 36804204
+ 14
+ 97352368
+ 0.133956144488482
+ 0.317605957635731
+ 0.401214524497119
+
+
+ No hits found
+
+
+
diff --git a/tools/virAnnot/test-data/blast2tsv_output.tab b/tools/virAnnot/test-data/blast2tsv_output.tab
new file mode 100644
index 00000000000..ff57c251bd5
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_output.tab
@@ -0,0 +1,6 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-482-EDGG-1-Q4_42600 96
+TBLASTX ds2020-482-EDGG-1-Q4_107243 60
+TBLASTX ds2020-482-EDGG-1-Q4_2681 348 NC_011554 Blackberry chlorotic ringspot virus RNA2, complete genome Blackberry chlorotic ringspot virus 56.3 2 100 9.0 1.04985e-23 128.1421 339420 Viruses;Riboviria;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Blackberry chlorotic ringspot virus CCTTCCTAGCGACCACGCACACGTCAAGACCGGCATCATCAATGTCGCGACAATCGTGAACCACTTTAGTATAGTCCACATCAAGATCATCATAAGGTAGATAAAAGGAATCAATTTCCCTAGGAAAAAGTCCAGAATCATCTTCCTCATAAAAATCTGGTATCGAGGGATCAATGGTTCGCACCACCATCTCGAATGTATCAAAGATCGTCGCGAAATCAAACTTTGCGGTATGCTTAACGACAAACTCGAAAAGGAAAAGTTTTACCCATTCGTCGTAGTTGTCATCTTTATGCACACCGAACGTCGAGAAAAACCCAAAGAACGTGTGCGTGGTCGCTAGGAAGG
+TBLASTX ds2020-482-EDGG-1-Q4_107857 59
+TBLASTX ds2020-482-EDGG-1-Q4_63163 81
diff --git a/tools/virAnnot/test-data/blast2tsv_output_with_rn.tab b/tools/virAnnot/test-data/blast2tsv_output_with_rn.tab
new file mode 100644
index 00000000000..418c49d6a04
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_output_with_rn.tab
@@ -0,0 +1,6 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-482-EDGG-1-Q4_42600 12 96
+TBLASTX ds2020-482-EDGG-1-Q4_107243 63 60
+TBLASTX ds2020-482-EDGG-1-Q4_2681 8 348 NC_011554 Blackberry chlorotic ringspot virus RNA2, complete genome Blackberry chlorotic ringspot virus 56.3 2 100 9.0 1.04985e-23 128.1421 339420 Viruses;Riboviria;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Blackberry chlorotic ringspot virus CCTTCCTAGCGACCACGCACACGTCAAGACCGGCATCATCAATGTCGCGACAATCGTGAACCACTTTAGTATAGTCCACATCAAGATCATCATAAGGTAGATAAAAGGAATCAATTTCCCTAGGAAAAAGTCCAGAATCATCTTCCTCATAAAAATCTGGTATCGAGGGATCAATGGTTCGCACCACCATCTCGAATGTATCAAAGATCGTCGCGAAATCAAACTTTGCGGTATGCTTAACGACAAACTCGAAAAGGAAAAGTTTTACCCATTCGTCGTAGTTGTCATCTTTATGCACACCGAACGTCGAGAAAAACCCAAAGAACGTGTGCGTGGTCGCTAGGAAGG
+TBLASTX ds2020-482-EDGG-1-Q4_107857 402 59
+TBLASTX ds2020-482-EDGG-1-Q4_63163 88 81
diff --git a/tools/virAnnot/test-data/blast2tsv_read_nb.tab b/tools/virAnnot/test-data/blast2tsv_read_nb.tab
new file mode 100755
index 00000000000..3bdd1e4a96a
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_read_nb.tab
@@ -0,0 +1,6 @@
+ds2020-482-EDGG-1-Q4_42600 12
+ds2020-482-EDGG-1-Q4_107243 63
+ds2020-482-EDGG-1-Q4_2681 8
+ds2020-482-EDGG-1-Q4_107857 402
+ds2020-482-EDGG-1-Q4_63163 88
+ds2020-482-EDGG-1-Q4_47667 1
diff --git a/tools/virAnnot/test-data/blast2tsv_reads.txt b/tools/virAnnot/test-data/blast2tsv_reads.txt
new file mode 100644
index 00000000000..05703e70b99
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_reads.txt
@@ -0,0 +1 @@
+0 Viruses Riboviria Orthornavirae Kitrinoviricota Alsuviricetes Martellivirales Bromoviridae Ilarvirus Blackberry chlorotic ringspot virus
diff --git a/tools/virAnnot/test-data/blast2tsv_reads_with_rn.txt b/tools/virAnnot/test-data/blast2tsv_reads_with_rn.txt
new file mode 100644
index 00000000000..418c49d6a04
--- /dev/null
+++ b/tools/virAnnot/test-data/blast2tsv_reads_with_rn.txt
@@ -0,0 +1,6 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-482-EDGG-1-Q4_42600 12 96
+TBLASTX ds2020-482-EDGG-1-Q4_107243 63 60
+TBLASTX ds2020-482-EDGG-1-Q4_2681 8 348 NC_011554 Blackberry chlorotic ringspot virus RNA2, complete genome Blackberry chlorotic ringspot virus 56.3 2 100 9.0 1.04985e-23 128.1421 339420 Viruses;Riboviria;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Blackberry chlorotic ringspot virus CCTTCCTAGCGACCACGCACACGTCAAGACCGGCATCATCAATGTCGCGACAATCGTGAACCACTTTAGTATAGTCCACATCAAGATCATCATAAGGTAGATAAAAGGAATCAATTTCCCTAGGAAAAAGTCCAGAATCATCTTCCTCATAAAAATCTGGTATCGAGGGATCAATGGTTCGCACCACCATCTCGAATGTATCAAAGATCGTCGCGAAATCAAACTTTGCGGTATGCTTAACGACAAACTCGAAAAGGAAAAGTTTTACCCATTCGTCGTAGTTGTCATCTTTATGCACACCGAACGTCGAGAAAAACCCAAAGAACGTGTGCGTGGTCGCTAGGAAGG
+TBLASTX ds2020-482-EDGG-1-Q4_107857 402 59
+TBLASTX ds2020-482-EDGG-1-Q4_63163 88 81
diff --git a/tools/virAnnot/test-data/index.html b/tools/virAnnot/test-data/index.html
new file mode 100644
index 00000000000..ea195d7ab8e
--- /dev/null
+++ b/tools/virAnnot/test-data/index.html
@@ -0,0 +1,235 @@
+
+
+rps2tree
+
+
+
+
rps2tree
+
+
pfam02123 pfam02123_RdRP_4
+
pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+
+
+
+
+
+
pfam02123_RdRP_4/seq_aligned.final_tree.fa
+
+
pfam02123_RdRP_4/otu_cluster.csv
+
+
pfam02123_RdRP_4/cluster_nb_reads_files.tab
+
+
pfam02123_RdRP_4/identity_matrix.csv
+
+
+
+
pfam00680 pfam00680_RdRP_1
+
pfam00680, RdRP_1, RNA dependent RNA polymerase.
+
+
+
+
+
+
pfam00680_RdRP_1/seq_aligned.final_tree.fa
+
+
pfam00680_RdRP_1/otu_cluster.csv
+
+
pfam00680_RdRP_1/cluster_nb_reads_files.tab
+
+
pfam00680_RdRP_1/identity_matrix.csv
+
+
+
+
pfam00665 pfam00665_rve
+
pfam00665, rve, Integrase core domain. Integrase mediates integration of a DNA copy of the viral genome into the host chromosome. Integrase is composed of three domains. The amino-terminal domain is a zinc binding domain pfam02022. This domain is the central catalytic domain. The carboxyl terminal domain that is a non-specific DNA binding domain pfam00552. The catalytic domain acts as an endonuclease when two nucleotides are removed from the 3' ends of the blunt-ended viral DNA made by reverse transcription. This domain also catalyzes the DNA strand transfer reaction of the 3' ends of the viral DNA to the 5' ends of the integration site.
+
+
+
+
+
+
pfam00665_rve/seq_aligned.final_tree.fa
+
+
pfam00665_rve/otu_cluster.csv
+
+
pfam00665_rve/cluster_nb_reads_files.tab
+
+
pfam00665_rve/identity_matrix.csv
+
+
+
+
pfam01443 pfam01443_Viral_helicase1
+
pfam01443, Viral_helicase1, Viral (Superfamily 1) RNA helicase. Helicase activity for this family has been demonstrated and NTPase activity. This helicase has multiple roles at different stages of viral RNA replication, as dissected by mutational analysis.
+
+
+
+
+
+
pfam01443_Viral_helicase1/seq_aligned.final_tree.fa
+
+
pfam01443_Viral_helicase1/otu_cluster.csv
+
+
pfam01443_Viral_helicase1/cluster_nb_reads_files.tab
+
+
pfam01443_Viral_helicase1/identity_matrix.csv
+
+
+
+
pfam00078 pfam00078_RVT_1
+
pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses.
+
+
+
+
+
+
pfam00078_RVT_1/seq_aligned.final_tree.fa
+
+
pfam00078_RVT_1/otu_cluster.csv
+
+
pfam00078_RVT_1/cluster_nb_reads_files.tab
+
+
pfam00078_RVT_1/identity_matrix.csv
+
+
+
+
pfam01787 pfam01787_Ilar_coat
+
pfam01787, Ilar_coat, Ilarvirus coat protein. This family consists of various coat proteins from the ilarviruses part of the Bromoviridae, members include apple mosaic virus and prune dwarf virus. The ilarvirus coat protein is required to initiate replication of the viral genome in host plants. Members of the Bromoviridae have a positive stand ssRNA genome with no DNA stage in there replication.
+
+
+
+
+
+
pfam01787_Ilar_coat/seq_aligned.final_tree.fa
+
+
pfam01787_Ilar_coat/otu_cluster.csv
+
+
pfam01787_Ilar_coat/cluster_nb_reads_files.tab
+
+
pfam01787_Ilar_coat/identity_matrix.csv
+
+
+
+
pfam01573 pfam01573_Bromo_MP
+
pfam01573, Bromo_MP, Bromovirus movement protein.
+
+
+
+
+
+
pfam01573_Bromo_MP/seq_aligned.final_tree.fa
+
+
pfam01573_Bromo_MP/otu_cluster.csv
+
+
pfam01573_Bromo_MP/cluster_nb_reads_files.tab
+
+
pfam01573_Bromo_MP/identity_matrix.csv
+
+
+
+
+
+
diff --git a/tools/virAnnot/test-data/otu_s1.fa b/tools/virAnnot/test-data/otu_s1.fa
new file mode 100755
index 00000000000..94881e2fff1
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s1.fa
@@ -0,0 +1,6856 @@
+>ds2020-267_1
+CAGCACGTCCGCAAAAGGTCCTCGCTCCAAAACTGTCTCATCATCTCTATCGTGCCCTGA
+CCCGTTTTCATCTTTGTACCTAGCTCTACTTCTTCTATCCTTGTTGGCACTTCTATCGCC
+ATTACCCTCGCTATGTTGCCACGTTGTCCGTTGACCATAGGCCGCCACATCCTATAATGC
+CTCATGTCTCCAACTACTGCCCCACTCATTGTTATCTCTGTGTATACTGGACATGTTTGC
+CCTCTGTCTGGCCACAGCAGATTGGCTGCGGCTATAAACTTGTACAGTTTCACCTCGTCG
+TCATGTGGTGTCAGCACTATGTTCTTATCTATCACGACTCTAGCTTCATGTGGAAAGCAG
+TTCTCCTGATCTACCGGTATTCTGTGTAGTGAACCATACCCTAGGTGGCAACAGGGCAAC
+GACATGTGCACCAAATTCACGTGCGTGACTAGAGGCCTCTTGAAGTACATCTTCGCACGG
+TATTCAAACTCCGTTTGCATCATCCTTCCTTTCACACCTGCCACAATTGGGTTCCTGATG
+TGAAATTCTCCATATTCTAGTGACATTTCTAGGTTCACTGGCGTCACCAGGAACCCCAGC
+ATGTTTGACAGCCACGGCACCACTGCGTTGAATGTTGATAGCTCTCCAAGGTGTTGGTGC
+AGCTCACCAAGTCTGCAGTTCCTGAAGGAGTGTGGCAGTCTAATATCCAACTCCCTCACT
+TCAGACAGCTCCCAATGCCATATAGGAAAGTCTATGAAACTGCCTCTAATTGTGTTCTTA
+TCTTTCGTCTGCTTGAAGGAAGTACATCCCAGGCACACACAGTACCTCGTCACATCTCTG
+AAAGTTGCCTGACCAGGTGCAAACGTGGGTGGAGGCTGTGGTATCTTTGGTTCAATCAAC
+CTTATTATTTCAGCAGGTGCTATCCTGGTGAACATGTCTGCCTGTTTTGCCAGTTTCAGC
+AAAGAGTGCTCATCACCCTGCTTCTTGAATAGGCAGAAATGCGGCCCTGTGACATTGTGT
+TTGTGCCCACAGCTCAGCTTCAGCTGGCTATTCTGTGTAGAGTTGCCAAACCAGTTTATC
+TTTTCGCCGTAGTACATCCACCTACTTGGGTGCATTTCTTCTTCGTTAAGTGGCATGCCT
+TTCACCATCCCTTGCATAACCTGGGCCTCGGTATTGATGCCGTGTTCGTGGTCAAAAATA
+GGGCACTTGCCCTCTGCACCGCATGACATCAACGGCATGCCTTGCCATTTCCCGGTCAGT
+TCCTGGCAATTTTCAGGTGTCGGTGGTACCAGTGAGGTTCCTCCGCGCTTGAAAGTGTCA
+TCGTCATCACTCTGCTCTTCCATTATGTGACGTCTTATCCTTCCTAGCTCCTCTCTCGCT
+CGCTCAGTTCTGTAAGCCTTTTCTTCTTTTCTGTTCATCCATGGCACGTCCCATGATCGT
+GCGTCTTTTTCCCTTTGTTCCGAACTCGTGTCTGTTTGTGAATCGACAAACTCTTTCGCC
+TGCCTCAATTTTTCAGCCACATCATCACACTCGATTCTCACTTCTGGCTCTAGCACGACA
+TGCCCCTCACCTATAAGCAGGTTCTTCATGGTGTCCGCCCCCTCTGTATCTGACTCTGAC
+GCTTCGTCCTGCGTCTTAACAGGGCTTGGTGTAGGGCCACCATCGAACGTGACGTCAGTT
+TCTTGCTCTACATCCACCTCAACACTCAGCTTCTTAGAGTGAGCGCTTTTCCGTTCAGTG
+AACTTGTAGACCAACATGTTTGCGTTGTACATGAGCTGTCCCCTTATGTCTTCCGATTTG
+TCGCTTGGCCTACGCTGTTTCTGATCGAGCGCCTCGTCAACGTATTCAATGTCTGCTACG
+TGCTCAGTGCTCATCATCTTGGCGTCTATTACGTCCTCGATTGACGGTGTCCTCTTTAGA
+GTCTTCACCTCTAGTGTTCCGTCAACCACGACACCTGCCTCTTCGATTGCCTGGTTGCAC
+AGCGCGCACGACACAAGCTGCTTGCACTTCCTGCACACATGCTGCATTTTTATGTATCCA
+CAGCAACTTGTTTGGCACGGTGAAGACATCCTGACACACTTCTTGTTCTTCACCCTCGTC
+TTGGGGGTGCTCATCACTTCATGGACAGACTTGATATTGCGTTGCCCTTTTTGACCGGTT
+TCAGCCACACATACTTGATACGTGTGCACCAGGCTCAAGTAGTTTGGCCAGTTTGCATCA
+GCTGCCACCACCAGTGACGCAACATACCTCACACGCGGTGAGTAGTTAGCAAACAAAGTG
+TGTACCTGCTCCAATCTAGCAGCAGGTGTCATCTCGGTGCTGTTGAGTTTCTCATCCTTG
+TATTTTAAACCCCTTTTGGTCAAAGTGAGGGCGTAACCGGTGCAGGCGTGCCATACTAGT
+CTTGAAAGTGACCGTTTTGCGTGCTTGGTCAGTGGCAAGTAATAAACTTGCTTCGCATGT
+TCGAAAGCCCTCTTACTATGCCAGGTGTACTCGAGTTCACTTTCTTCTGCCAGCAGTGCT
+GCTGCATCTAGCCATTCTTACATGTCAGACTGATCAACGTACTGGCCTCCTGTTGCGGAC
+GTGCTGNNNNNNNNNNATCTAAGGAGCAGCACGTCCGCAATGATGGCCCCATACAGTAGT
+GATTTCTTGTCGAAACCACCAAATTCGAACACTGGCCTGTTGATACTTGAGCTAGTGATC
+AACATCTTAGCGTTTTCTGTCTCTGCAGTGAAAACAGACCTGTACGTTGCAGCTCCAATA
+ATGAGCTGTTTCAAATCCATTTGCTTGTCGTGCCATTTGGTCGGTGACACACATATTCCT
+CTCTTGGTTCTGATGCACATTAGCGCTCTGTACAAGTTTACGACTGACGCTGCTCCTGTC
+ACGTCGTTGATTGCTGACGTCAGTGACGCAAGGAACATCGATTTTGACGCCTGAGTTCCT
+ATTGGCCTACCGCTTGACGTCACCGGAACTGCAATCCTGCAGTTGCTATTTGTGGTAACA
+GCNNNNNNNNNNCAGCACGTCCGCAATTGCCTTCCATTGGGTTGCCAACTCCCAGTACCT
+TTTCGTCACTCACCCTCAGTTCGAAGCCATATCGCCTGAGTTCTGGTGCGATAGCCATCA
+CTCTCGCTTCTGCTCCCATTAACTGACCATTTATGATGTTGACATCAGATCTGTCGTTGC
+CATCAGCAACGCAAGCGTCATCAACCCATGCCATCAGCGAGTTCAATGCTCCTGCCGTTG
+CCCTCGCTGCTGATACATTAGTCAGCAGCACGCCTGCCTCATTTTGAGGGCCTTGGACAT
+ACTCATCATGTTGCGATGTCACCGAACAAGCGTAGCTACCTTCAGACTGAACGTCAGTAG
+TGTACCTGGTGCGCACTGCGCTACCTAGCACACTATCTGAAGTCAAAGCGCTTCTCGAGC
+TCATTATGCCCGCCCGCATGAAAGGTTCATCTTTGTCAACCACTTCATAAACACCATGAC
+CCGTCGGAGTTACAACGCTCTCGTCATGCTGCTTGTGTTTGCCACCAAAACCAGCGTATC
+TGTTGGTGGCGATTATTGGCGTGACTCTTGCTGCGACTGATTTTTCAGCAGAGTTGTATT
+GAAAAACTGGTACGCCCATCTTGTACAGTTGGCTGCAATGTCCCAA
+>ds2020-267_2
+CAGCACGTCCGCAACAGTTGGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGG
+GCGCCTTGCATGGACAAAGTTCTGCAGTGGCCTGACATAACGAACACGTTTATGTCATCA
+CTACTACTTGCCATGGCTGCACTACCACCAGAGTTATATGTACTAATGGTGGAGTGGAAC
+GGCTGGGCAAAGTGTGGCTCTATGGCAGAGTACATCGTAGAGGCAAAAAACCTGACGACT
+AAGATGAAGGCACTGGACAACCAGGTAACATTGGGTGACTTCGAACTCGACTTATCGCCT
+TTATTCGAGTGGGAAGTGCTAAATCACAGAGCGGTCTTGAAAGGCATCTATGACAAGGAA
+GTCACAGAGCGTAGAGATCAGAAACAGAGCATCAAGCTATCTGCTGCCGATCTGGAGGAA
+GAAATAGACAGCGTGTTTCAGGACGTGGGTTCCGTTCTAGACGCCAGGACAAAAGAGGGT
+GAAAAATCACCTCTGTATGCAACGTGGGATGATTGGTACGTTGACAGGGTGCAAACCACA
+CCAGCTGGGTCTGCATTCACAGTCAACAAGGACATGATGGAGGCAAGAAACATGCTGAAA
+GCCAATGGGGTCCAAAATCTGACCAAGACGCAAGTGATGGCGCAGATGAGGGACAAGCTC
+CCGCTGGCGTCTATCTTGGGTAGCGAGCCAATGATATTGGCCCAGATGTCATGGAAGTTG
+GAATGGTCAAAACTGAGGGCACTATTTGCTGCTAGCATGGAGCACTGGATGCCATCGGCA
+TTCGCCCTGGGGCAGATAGAAGAGTATCTACCCAGTGACTGCCCCATAGGTAAAGCTGCC
+GATGCGCACAACGTGTGCAGGCGCGTGATGGAAATGTCAACGCAAGGAGTGGTAGCATGC
+ATAGATGCAAAGAACTTCAACATCTTGCACACCCACGAGATAATGTCAGCAATACTGAAA
+TCCGCATCAAAGATGCTAGGAGATAGGCTGTCTAGTGAGCAACATGACTGCCTAAAGTGG
+CTGGCGAAAGCGGAGCTGAACCAGAAAGTGCTGGTCAAGACAGGTGAAGTAACTGAACAG
+TTGCTCCAGGTCGGCAGGAGAGACGGGTGGATTAACAAGCTAACTAAAGGTGACGGCACA
+GTGGTAGAAGCGGCTGACGTGACGGTTGGAATGTTTTCAGGTACTAGGTTCACGATGCTG
+TACAACACAGTGCTAAACAGGGCGTACTACAAAGTGGCGGAGAAACGTGCGAAGATAAAG
+ACTTTATCACTTCATTCGGGTGATGACGTGTATGCTGTTTTCGCTAACTATATAGACGTG
+TACAAGATGAAGCGTGAGATGGCGTTAATCGGCTACACACTGCAGTTAGGCAAGTGCTTC
+TTGCAGGGAGTCCGAGAATTCTTGAGAATATCTCATAAGAATGCAAACACTTCTCAATAC
+CTAGCGAGGTCCGCAGCAACGGCAATACATGGAAGAATAGAGGCAGATGAGCCTTCTGAT
+TTCGTGGCTTTTGTGGGGTCAATAATGAGAAGAGGTGCAGAGATGGTGGTCAGGCACGCG
+GCAAGAGCAGTGTTGCTAGATGTCATGAAGATACAGATAGCAGGAGCTTGCGCAAGGTGG
+GCGATTACAGCTATGGCGTGGGACTCATTCTTAATGTTGCCAAAAACAATGGGCGGTTGT
+GCTGCAAAAGCACGCCTGATGGAACAATGGAGTGGTTTTTCTATAGAAAGAACTGCAAGC
+GCCAGAGGTGGCATCGTAGACTATTTGGCTGAACAACCAGGTACCAAAACAGCGGCGAGG
+AGGCTGGTTGAGAAGTTGCAAATAATGAAGTACCACAAGAGAGTTGCACAAGCCGTTGCT
+GCGGCGATAGCACCTAAAGGAGTTTTGAAAAACTACGGTATGATAGTAAGGTGGATGAAC
+AAAGATGACATGGCACATATGTCGAGAGTGGCAGGGACACTAGGGCGAATAAGACAATCG
+AGAGAGTACATATTATCAAAAGCAGCAGGATTATTCAATACGCTAGCAATAAATGACAAC
+TTCTGGGGTGATGTGAGCGGTGTGTTCAGAGGCATACCGTCAGCGTGGCACGGCAGAGCA
+CTGACGTTCGCACTGTCTGAGAGGAGTGAGTCAGAAGCGCTGTTTGCAAATAAAATGTAC
+AAGCTACACTATAAAATGACAGAGTGGGCAAGAGCTGCAACAGAGAATAGACTGATAAGA
+ATGCAGCTAGATATGCCACCGGGGTAATGCTGGTGGTAATAAGTACGATAGAACTTGCCA
+TCCACTAGGGAAGTGGACACAAGCGGAGTAGGCGACCGGTGGCAAGTATAACAAGCCAGG
+CTGAACGGCCGTACGTGGCTCCCAGACGTACAAACATTGGCGCTATCAACTAGCGCCTAC
+ACAATATAAAATATGCGTTTAGTTGCGGACGTGCTG
+>ds2020-267_3
+CAGCACGTCCGCAATCTGAAACGGCTGTCTGGCACGCCTGCACTGGCTTCATTCTCTTCG
+TGACCAAGGCATGTCTGGTGTACGATGGGGGTGAGAATTCAACATCTGAAGTCACACCGG
+CAGCTAGGCTTGACCAGGTACACCGAGTGTACGCGGCGTACAGTAGCAGGGTTAGGTACG
+TAGTGTCTCTTCTAGTCGGCGAGGATGCCAACTGGCCGAACCCAATCGGACTAGTTCACG
+TCTACCAGCTGGCAGTCACGCCCGGGCACCCGAAAGACATGTTGTCTTCGGATGACATTC
+ACTCAGTTTTGAGCACACCCACCGCGAGGGTGAAGAACGGCAGGTGCACAAGGATGGATG
+CACCATGTCAAGTCAGTTGCTTTGCCCGCCTTGATGATTTGCACGAGTGTAGGCGATGCA
+AGTGCCGGGTGACGTGCGCACTGTGCATCAAGGCATTGTGCCTAACAGGTTACGCGCATG
+ATGGGAGTAGAAAATCGAACAGCCAGGAAACTACGCCTGCTACCGGGGGCGATGTACTCC
+ACGCTAAGACGATGGGATCCGAATACGTCGGTGAATTGCACGACACTGAATCTATAGTGG
+GTGCAAAGCCGATTGACTTGGCACCTGTAAACGTCGATGTGCGTTCCGAGCTGGTTGAAC
+TCGCAAGCAATCTGCTCAAGATGAACGGTAGGCGACCTAGTGCCCAGGTTAAGAAACTGA
+GCGTGGGCGACACTGACGAGAACAGGAATGAACATGGCTTCGAAAGTTTGTCTGAGTCGG
+ATAACAACGCACAAGAGCTCGATGCAGAATCAAGCGGTGATGTCAGCATGGTAGGTGAGA
+TAAGCGAGCAGCAAGTTAGGGATGCAATCGCTCACTCGGAAGCGGAAAGTCGACTGTTCG
+ATGACACAGCTGACGTGGATGACAAATTGTTTGAAGCGTGTTCGTACGTACCGGGTGACG
+CAAGCGAGGTTGGGGTATCGGACGTGGACGTGACTCCTAAGAAGAGTGCGATACGACCAC
+CAATATCATCAAGACGCTCATCCACGCCCACGCCTACCACGTCACGGGGGCTGAAGTTCG
+ACGTTGATATCATTGCAGACATACTACACGAGCCACCGAAAATGTGGGACCAGTCGCGCG
+AATTCGTTGAACAAACGGAACCACCGGTTAGCTTAGAGCAATGCACGGCTCTGGTGCCGA
+TGCACGCCGGTTTTGCGATGCCAGTGTGCAGCAAATTGGGCTACTGTGACATACTAAGCG
+ACAAATCAGCGCTGCAAGACGAGCTCGTGGTGAACGACGAAATCATCAATTTCAAGGTGC
+CAGAGCAAGAAGAAGCCGAAATGTCGGCATCAATCTTTGCGGTTGAAAGGAGTGGTGAGT
+GGATCAAGTTATTGCCACAGCGGCAGAAGCTGAAGCTCAGCTGCGGGCGAGATCACTCCA
+TGACAGGGCCCCACTGGTGTGTACTGAAGAAACAAGATGGCAACTCGTCACTGCGGAAGA
+TAATCAGTGATGCAGGCATGACGGACAGACTAGTAAGGTCACAGTTGATACGCAAGATTG
+TCCCTGGGAGACCATCAACACTGTACCTACCAGGCAGTGCGATGTTCAGGGACATCACCA
+AAAACTGTGTGTGTGCAGGGTGCTCGTCCTTCAAGAGGACGAACGACCCAAACATGGTCA
+AACGCAGTGCTGTGGACTTCCCAATATGGCACTACGATCTGGGGGAGCTGCATTCATTGG
+ACATCAAGATACCGGAAGGCCAGCGCGATTCAATCGTCGGCGACCTGATGGAGAATAGGG
+GCGCAATGGAGCAGTTCTGTGCCATCAAACCCTGGCTGTCAAACATGCTCGGGTTCATGG
+TCAAACCAGGCACAGTGAACCAAGTCGGTGGGTACGGAGATTTTCACTTCAGCAACCCCA
+GGATAAACGTCAGCACGCACCCAATGAGCCATGAATCAAACTACAACTTGCCGCTATTCT
+ATCGCAAACCACTGGTAATGCACATCAACAAGATACATGCGTCGCTGCCATGTTGCTCAA
+TGGGTTACGGCGACATCCTGACGTTCCCTCCAGACCTGGAGAACGGGATGCCATTCGAGG
+CAAGGATGAGAATAGACAAATCGATTGTGCTGAACTCACACGATGATGAAACAAAAATGT
+TTCTCATAGCGGCGCTGGCGACATTACTGTGGCCTAGGCCAGGGGAAGAAGACCCACAAA
+GAGCAAGTCTGAGTTTTTCAGGCGTGATGCTCGGTGACATGAGGCATTACTCGATGAGAA
+GAGTAGTGCGTGATGGCAAACTGACGGATGACTCCGTGCTTCGCGCAGTAACGGTGTCTG
+ATCGAATGGACAAGGTGGAAAAACTGAGTAAAGTGAGAGTAAGCGAAAAGACATTGCGGA
+CGTGCTG
+>ds2020-267_4
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTCAGCTACTCTCAGCACGTCCGCAA
+TACTAACAGCTCAGCGCGTCCGCAACACGACTGGGGCACACGTCCGCAACGTCCACGACT
+TATCACTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGTTCGGGCTTCCTAT
+TCCGCTTTATTAAGGTACACTAAGTAACTATTCCTATTAACTCCATCGGGTCCTTAGATC
+CTTTGAGTAGGTGTAGTAGTGGGCCGCTTTTATTGGTCCCATTCAACACGTCCATCAGGA
+AGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCTTCTTTGTGTACCTTGA
+ATAACGCTCGCAAAATCTCGTACCGCTTGATGTTACCATTCCTTGAAACGTTTATGTTCC
+TTTCTTTTGGTATCACCGCGTCGTATGTTGCGCGCATTATTCGTGAAATGAAATCCTGCA
+AAGGTCTTTCAAGTTGTAGTGATGCTTTCACCATCCTGGAGTAGTCCACCACTCCCGGTA
+ACACGCCTATCTGCGTGGCACCCTTCCTGAAGCCCGACGACCGTATCATCCACTTTACGT
+CCGATCTCTTGTCTTCACTTATGCCCCCCACACACCTGTGGGAGGTCTTTATTTTATAAC
+AGTCTGAAACTGTCATGTGCAATCGCTCACATTGTCTCGAGTAGTATTTGTTCCTCAATG
+ACGCCGCTAACCACATTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCG
+CTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGG
+TTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGATCTACGCGTAGAA
+ACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGG
+CATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCAC
+CGTTGTGGAGGCTGTTTTGCGATTGTACCACGTCAGGTACTATCAGTTGAGTGTAAATGT
+AGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAG
+CGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCC
+GAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGT
+ACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAAT
+CTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCAT
+CGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGG
+CGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTGCTCC
+ATTCATACTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTCGCGCCACGAGTCCA
+TATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAGGTATATGTCTTTGA
+ATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATGCTGCCGGCCGCACTCCACTGCC
+ACCTACTCTGCCAGTACTCCCGCCAATCAAACTTCCTCGGTCTCTTACCCGCTGAGATCG
+ATCTACTGAAGAGCTGCGAGGCCCTTTCATAAACCAATCCCTCCGGCATCTCGGCCAAGT
+TAGGGGACACCCTGTTCTTGTGCTCCTCCTCCCAGTTGACCAGTCTTGATTTGCGGACGT
+GCTGCTCCTTAGATANNNNNNNNNNGGACGTTCGGGCTTTGCGCTGGCAATGGAGAACAG
+TCCTGACCCTCTAGCGAGCTGCATCTCCTCGGGGGTGAGACCAGCTGCCCACAGTGCCAC
+GCCCGTAAGGAATGAGTTAGTAGCTTCTCTGGTTATTGATAAGGCCAGAGCTACGCTGTC
+AGAGTTGACTCCCAAAATGTCTACCACCTCCTTGAACGAAAAGTGAACATGATGCGACGC
+CGTTATCTTGGTGTGTTTTGCCGACATTGCTTCATGTAACTGCCACCCTCTGCCTTGCTG
+TCCATTTACTTTCCTCAATAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATC
+GTAAAGACCTGAGGTGTGCCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCAAGA
+TCTTTGCGGACGTGCTG
+>ds2020-267_5
+ATCGCACATGATAAAGCCCGATATCTAAGGAGCAGCACGTCCGCAACCCTCTGCCTCCAA
+CAATAAAGCAGATTTCTTTGCTCTTCTAACAGCTATTACTTACCACAATGGACCACCTCA
+CTTCCCTTTTCGAGCTTTTTGCTATCACACCGAAAACACAAAACAATCTACAGTTTGTTG
+GGATCTACCACAGACCTCCACACTCCGTTCGAGCAAACCTCCGCAACGTTGAAAAACACA
+AAATCACAGTCGCTCACGCCATGCACAAGTACCTTTACCCGCATGAAATCGACTTTGTTA
+TCAACCAAATGCGACGCTCAGACGTCACTGAAGATGCCATACTTGCTGACTTTTTCGACA
+ACAACGTCGAACCACTTGAACCTGTTCTTGACGAACACTTCGAACGTGGACTCTCCGCAA
+TGCTGGACGCTTTTCGCCCTCCGCAGAAATGCCTACCTGCCCACATCTATGATGTGCAGC
+ACCACTACCCATATAAATGGCAAGTGAACGCTGAAGCCCCCTTCTCCACCGATTCCTATT
+TCTTAGCGAATCGACCAACCTTCCGCGCAGTGTTTGAACGACTCGAATCGCTCTACACAC
+ACCTCGCAACCGATTGGCACCGCCGATACGGAAACAAAACCGACAATGATGATTTTATGA
+ATGATCATGTCCCTGCGAAATTTGGCCCTATGAAAGAAACAGTCTTCTCATGGACTCACC
+GATGGCACCACGTCATCAAATCCAACTTCACCGACACAGCTGGATTGTCTAAAGACTATT
+ACTTCAAAAACCGATACATCTTCCCAATGCTACTTCACACGAAGACAGCGATTGTCAAGA
+AAGACGACCCGAATAAGATGCGAACCATCTGGGGCTGTTCAAAGCCTTGGATCATCGCAG
+ACACCATGCTATGGTGGGAATACGTCGCGTACGCTAAGTTACAACCTGGAGCCACACCAA
+TGCTCTGGAGTTACGAAACCTTCACAGGTGGCTGGCTTAGACTCAACCACGCACTTTTCT
+CTTCATACATACGGCACTCGTACATCACACTCGACTGGAAACGCTTCGACAAGAAAGCGT
+ATTTCTGCATCATCGACAAAATTTTCGATGGCGTTGAAACATTCCTCGACTTTGACAACG
+GCTATTTGCCTACGAAAGATTATCCCGATACCAAATCGACTTGGACACAAGAACGTTCCA
+CCCGCCTCAAACGCCTGTTTGACTGGACAAAAGAGAACTTCTACCATGCACCAATTGTCC
+TACCCAATGGGCACATGTACGTCCGAAAATTCGCTGGAATACCCTCTGGCCTATTTATCA
+CTCAACTGATCGATTCCTGGTACAACTACACCATGCTCGCAACCATCCTATCCGCGATGG
+GCTTCGACCCTCGGTCCTGTATTATTAAAGTCCAAGGTGATGACTCAATCATCCGCCTCA
+GTGCACTCATCCCTCCGGATGCTCACGATTCTTTTTTAACTAAGGTCCAAGAACTCGCCG
+ACTACTACTTTCAATCAGTAGTCTCCGTGAACAAGTCTGAAGTACGCAACGAGCTCAACG
+GATGCGAAGTTTTATCGTACCGACACAGACACGGTTTACCATACCGCGATGAACTAGCTA
+TGCTAGCTCAACTGTATCACACGAAAGCACGCAACCCAAGTCCCGAAATCACAATGGCAC
+AATCCATCGGCTTCGCCTACGCTTCCTTCGGAAATCATGAAAGAGTACGTCTCGTACTAC
+ATGATATCTACGAATATTACAAGCATCAAGGCTACACACCCAACCGAGCCGGACTCAGCC
+TCGTCTTCGGAAACTCTCCTGACCTCATGATCCCGCACTACACACTTGATCACTTTCCCT
+CAATCAGGGAAATAAAAATGTTCCTGACTAATGCAAAATATGCCAATGAAGAAACCAACT
+CACGAACGTGGCCTTTAACCCACTTTCTCCATCTTCCTTGTCATCGCACTTAGTATTTGA
+GCAATTGCAATTACAACATAATTACAAAAAAAGGATTGCGGACGTGCTG
+>ds2020-267_6
+TGAGGCTATTGTGCTGTTCTTCTGACAGCCTGGAACCTATCATCACTGACGCTGATTCCA
+ATAGTGCTATTGCTAGTGTGTTGTTTTACTTGCCTGGGAGCCGCAAGCGGCTTGCAAAGC
+CTGGCGTTAATTGTACGTGCACCGGTTGCCTACACCGACGTTGACGGCGCTAGCTCTCCC
+TCAGCTAACGGGTCGTTAGTGACCAATTCTTTTGCGCCCATTTCGTGCTTGCTTGTCTGG
+GAGCCACAAGCGGCATTTGCAGCCTGGCGAGTTATTTGATACGTGTACCGAGTGCCTACC
+CCGACATTGACGGCGCCAACCTTCCCTAGGTTGACGGGAGCCACAAGTGTTTCACACTCA
+TGGCTCTAATTACAGTGGCCTTTGGCCCAAGTTGAGCCTATGTCTCGTTTGCGAGTAGTT
+CGTCGCCACTCCTATCCACCCCATCACTGTGGTATGTAGCTTGAACCTCCTGTTATCGAA
+CAGTGCTTTCTCCTCGCCTCTTTTCGCCAGCGCGAACGTTAGTGCTCTGGCGTGCCACGC
+TGACGGTATGCCTCTAAAGACTCCCGTCACGTCGCCCCAAAAGTGGTCGTTGATGGCCAG
+CGTGTTGAACAAGCCAGCTGCTTTGGATAAGATGTACTCACGTGACTGTCTTATCCTTTC
+CAGTTGACCCGTCACGGTCGCTAAATGCTCAAGATCGTCCTTGTTCATCCACCTGACTAT
+CATTCCATAGTTCTTGAGGACACCTTTTGGTGCTATGGCTGCTGCCACGGCTTGCGCAAC
+TCTTTTGTGGTACCGCCGTATGCCTAGTGCCTCTACTAACTGTCTCGCAGCAGTCTTGAC
+TCCTGGTTGCTGCGCCAGGTAGTCGACTATACCACCACGTGCGCTGGCAGTTCGCTCGAT
+AGAGTACCCACTCCACTCGTCTGCCTTTCGTGGTCGCGCAGCACACCCACCCATGACGTT
+TGGCAACACCAGAAATGCGTCCCAAGTCATGGCCGAAATTGCCCAGCGTGCACAAGCCCC
+TGCAATTTGCAGCTTCATCACGTCGAGCAACACGGTTCTCGTTGCATGTCTGACAACCAT
+TTCTGCACCACGTCTCATGATGGAACCCACGAATGCCACAAAGTCTGATGGTTCATCAGC
+CTCAATTCTACCATGTATTGCAGTAGCTGCAGACCTCGCCAGATACTGTGACGTGTTTGC
+GTTCTTGTGTGAGATCCTTAAAAACTCTCTCACACCCTGCAAGAAGCACTTCGCTAGTTG
+CAGTGTGTACCCAATGAACGCCATCGCTTTCTTCATTTTGTACACGTCAATGTAGCTGGC
+AAACGCAGAGTATACATCATCGCCAGAGTGTAGTGACAGTGTTTTGATCCCGGCGAGTTC
+TTCGGCCACCTTGTAGTATGCCCTGTTGAGTATCGTGTTATACAACATCGTGAACCTCGT
+TCCTGAAAACATGCCAACCGTGACCGTCGCTGCTTCCACCATGGTGCCGTCACCCTTCAT
+CATTTGGTTTATCCACCCTTCTTGTCTCCCTGCCGACAGCAGTTCCTCTGTGACCTCACC
+TTTCTTCACTAGTACCTTCTGGTTCAACTCAGCTTTGGACAGCCATTTGAGGCACTTGTG
+CTGTTCTTCTGACAGCCTGGAACCTAGCATCACTGACGCTGATTCCAATATAGATGCCAT
+CACCTCCTGGGTGTGCAAGATGTTAAAGTTCCTCGCATCTATGCATGCAACTACTCCCTG
+AGTAGACATCTCCATGACTCGTCGGCACACCCTGTGTGCATCGGCTGCCTTGCCGATGGG
+GCAGTCAGCTGGCAAGTACTCTTCAATCTGCCCAAGCGCTAAGCCGTTGCGGACGTGCTG
+>ds2020-267_7
+CAGCACGTCCGCAAAGTTCGCTCTCTTCATTGAGCTAATTGGTTAAAAGTCTACTTGTTA
+AGTAGCATTCACATCAAGGAAAGAATTTCGTCAAAATGGCATACCAAAAGCCCGACAAAT
+CGACCGTCTCCGGCACGACTCTTACGCCAGATGACTCAGCCTCACAAGCTGGTCCACAAA
+ATGATACCCCCAATCCTGCGAAGTCCGGACGCCCAAAGCGTTCATCAAAGATTTCAAAGG
+GCAAAGATCTACCTCCGGGTGCGATCAAGGTACCAAAAGGTGGCGCCAACATGACGGGGA
+AAGCATCTCCCGTACAGTCTGCAACCATTCCATTTCGGGATGGGGAGAAATAGACCTCAA
+CTCTCATAGAAATGAGATTGAGCCGGTCTTCACAGTCGACGCTCAGCCGTATGACGACCT
+TGTCAACGTGGTGTACTCATCACTTCAGTCGCGATACTCAAATGCGGCGAAGCACATCCC
+GTTTGGCCTCTTCCGCTACTACTGCATGCAATTGTGGTGGTATCGGGTTCTTTTTCTGCA
+TCGCACGAACGGCAATGCTCTCACATCTGACGAACGTCAGTTCATGAGCATCATGGAGAC
+TGGACAAGAGTTCCAAATCCCCTCCCAAATAGCACAGTATCTTGCCAACCTTGGCAATTT
+CATGCAAGGAGGAGAGAACTTCTTTTTCCGCCTGCCCCCACACGCCTTCGCCGAAGCAAC
+AGGCACTATCCACTCAGGATGGTTTGCCTCTGGTCTTCCCACCGCCAAGGTGGACACAAC
+TTCCTTCTGGAAGTACGCTCAACTTCCGAGTCCGGGCGTTTTCGTGTCCTATATGTGCAA
+CGAAGCACATTACAACACCCCTGGCCACCAGCCCAATCGTCTCTTCGATCTCTCAGAGAT
+CGCCCCCACCATTTCCGACGACAGTTATTCAGTTCCGACTGATAACATCGTTGGTTGGAG
+TAACGGCATTTACACTGCCACGCACGCCTCCTGGCGTTCGACATACTCCAATCTTGGCTG
+GTCAATCGACGGTTGTGCCCTTGACTCTCAGACAACATTCATGCTCTCGACATCGACCAT
+GCGTGCCGTGTCTGACCGTATTGCGTCCGTCACCGGACTCAAAGTGAACACGTCAACACA
+GTTGACACTCTCTGTGCAAGGCAATCCCCTGGATTGCTACTACCTTGCAACTGTGGACTA
+CGCCTCCAACCGCTCTCAGTGGCCAAAGGCACCTGGTCCTCATCAACAACAGAAAGTGAA
+CGGCTGTTTGCACACAGAACTCGCCCTCCACTCCCGCTACGCCATGGACTCAAAAGTCCT
+ATCACCCGCGTTCTCGTTCGGATATCGCCTAGAGCGATCGCTCATCTGGAACGGTACATA
+CGATACCGACAGACGTCCGGTCCACGCTCAGGCCAGCAACTATCAGCCCTGGCTGATACA
+GTCTGAAGCCGACGACAAATACCGCGATCCTGGCCCCGCATGGATGGCCCATATGAACGA
+TTCGTTCAATTTTGGTTCTTCATTGAACTTGAATTTACGACGATTTTCGACTCATGGCCT
+CATTCGTTCTGTCGCGCTTGACGCGTCCGTTGTCCTCAGTGACACCAAGTAGAAACTTCT
+TCTTCTACTACAGCAACTCTCTCTCTTGGTAAAGCTCACTGGTAACCGGTCCAAAACGAA
+ACTCTTAAAACAGTGGATACCCTCCGGGGCGCACGTCCGCAAGGGTCCGGCAGTTGCGGA
+CGTGCTACCCAAAGACCTTTGCGGACGTGCTG
+>ds2020-267_8
+CAGCACGTCCGCAAACTGGGGTGTCTGGTATGGTAACTTCTGTTTTTTGTTACTGATATG
+TCAATCAGTAAAGAACGCTTCCTCGAGGTGGAGTTCCGAATAGAGGGGCCGTGTTTCTTG
+ATATTTTTCGAAATCAGAAAAAGAACGTTGGCGTAGTGCTCTGTTGGAATAAGCCTCGGG
+TATGAACGCGTACTCGGGTAGGTTTCTATCTCTTCTTGAGATGAATTTCCGTGGCGAGGG
+TTGAGGTAGTAGCGCAGGGAAGAAAAATCCGCCGAAAGGATCGGTTTGTCGGATGGGAAG
+TGTGATTTCCTTCATCTCGAGACCGAGAGTGGAGAGATATTTGAATGCCTTTGAAGGCTT
+CTCTGCCACGTAGGCGTTGAGGGTTTTCTCTTGTATGCCGTTGGTGCTCATGATGTGTTT
+GATCGCATCATAGAATACATTGCATAGTTTTGGATCCATGCAGGAGTAGAGCTGTCCAAG
+TAGGCGTGCGCATGACTCGAGTGGTGAGTCAACTGGGCGTTCCGGGTAGATGGTGGAAGC
+GAAGATGAAGTCGTATGACCTTCGCGGTCCGGTAACTCGGTGGAAGTATCCGAGCCAGTG
+TATATTCTCAGGGTTATTACTGAGAATCGTCTTGTCCAGGTTAAGAATGCCATTGAAAAC
+ATCCTTTAAAACAACACCAAGTTCGACGAGATCAATCGGTCTATCTAGAAAGATGGACGA
+ATCATCTCCGTAGTAGTAGTCCTTAACGGGTAAGGCTCCAGTGACTCGGTAGATGGCAGT
+ACGCATTTGCACTGCGTTGACGATTGTGTCGAGAAGGTTGGTCCACATTGAACCAGATGG
+GATGCCAGTGCTCTTTTGTACTCGGAGACCGCGGGGTGTGCGTATCTTCGTGTTGATGAA
+GTAAGAGACCATGGCTTTCCATCGTCGTGCTGTTTGGTCTGAACGGACGTTCCATACTAT
+CCCTTCAGAATCTCTGACTTTTGAAAAGTCAAACCAATCAGAAATGAACGAGAATGTGTC
+TCGTATTATCCAATGGGTAACATTGGCGTCGAAGCGTGAAAAGTCGGTGGTGAGGGAAAC
+GATATTGTCGATCATGCTCCTCGCAAGATGCGAGTGGCCTGACTTCATTGTTTCCATTCC
+GATGCCGTAGCACGCGTCCTCTCTGTTGCAGAGTTCCTTCAATTCTGAGAAAAGAGGAAT
+GAAGAAGCGGGCCTCTTCAAGGATGACATCAGTTGGGTAACCCCAAACTGGACGTACTTT
+GACATTCGGTTGCTCACTTGCGACAACCCTGTTGAAAGCAAGGCAGTCGGGCAGCGACCA
+TGGGATTCCTCTTCCGATACTATCCCAAGCCCGATGTATCTTTCCGGTGGCAACTGGGTC
+TGCGAAGACCTCAGCTTTTGTCTTGTATCCTTGGTTGACCCAAGGGAAGCCGGGAGATGT
+CGTGGTGGGCATTGCGGAGTGCTTGGCAGCAGCTCCGAGGGTTAGCGGTATGATACGGTT
+AGCGGGGCGAAGTTCATCGAGTGTTTTCTTGATAATCGCAAGATAGTCACCATCAACACA
+CCGGGTGGTGGGTCGTTGGTCGTAATCCATGAGATTATCTTCGAGAACCGACTGGTCCGC
+GGACGGACGGTGCCATGTCGATGAGATGTTGCTAATGAAGTCACAGAGATCCGGAGAACC
+TGTCAATAGTTGCGGACGTGCTG
+>ds2020-267_9
+TATCTAAGGAGCAGCACGTCCGCAAGCCACGTACGGTGAAAAGAGAGCAGTCGCGCCTGG
+CGACTTGGGCTTGGTGGACTCGCTTGTGGTGAAGTCACAGATTGATTGGTGGCATTGCAA
+TGTCACTATGTGGGTGGCCGCTTACAAGTTGTCTGTGACGCTAGCTGCATCGTGTGGTGA
+CATGAACTTCAGTGGTGAGGAAGTTAATGAGATCATACAGTACACGTTCAGCCGCTCAAC
+ATACAGGAAGCTCGTAGCGAGCGACGCGGTGATGGACTCGACTAGAGACATTGCAGCAAG
+TGAGGTGACGCAGGCAGCGTCAACGCCAGTCAGGTGGGCTAGGCAAGTGAACCCAATCGT
+GCTGGTGCTCGACGATGTCGAGTACGCCATCACACGCAACGAAGTTAATGATGTCTTGAC
+AAAGGTATACGATAAGGTACACGCTGCAATCATGAAACAAGCTGGAAAAGGTTACGGTGA
+CTACAACAGTACTGGGCTTGAGCTGGTCTACAGCGAGGAGACAGGGCTATCAGCAGGTGA
+AACTCCGAGAGGGGTTTTGAACCCGGTTTTTGGTTACGCAAAGCTGGCAAATGGCGCAAT
+AACTGTGGAGCCATGCAAGTGCGCAGACTCAAACGCCGTACTCATGACGATGAGTGAAGG
+TGAGCAAAAACCAGGGCTGAGTGAGGTGTCAATCGGCAGCGAATCAGTCAAGGTAGTTAA
+ACGAAACAGAGGCGGAAGGACTTTGACCTATCTGATGCCAGAGACGATAAGCGGCATGGG
+GGCAGACAGGTCATATGTCTATCTTGCGGGGATGCACTTCAGAGAGGATGAGCTCAAGTA
+CTCACTGCCAACCCTGGAGTTCCTGTCACAGTTCACAACAAAGTACAAACCACTACAGCC
+GTCAGAAAGGTTGAGCAAGCTACGAGTGCTAACCGATCCAACTTCAACGCGAGTGCACCA
+CAGGCACATGTCTATGTTGACCGTGATGGCGACTTGCTGTCATGCGTGGGCTCCGTGCAT
+GGACACAGTGTTAGATTGGCCTGACATCACGAACACGTTTATGTCAGCGCTAATGCTAAC
+GATGGCTGCAGTGCCACCTGAACTGTATGTGCTCATGTGTGAATGGAACGGGTGGGCCAG
+CTGCAAAAGCATGGCAGAGTACGTAGTGACTGCGAAAGAACTTACAACAAAGATGAAAGC
+TCTAGACAACCAGGTGGCAATCGGCGATTTTGAGCTGGACCTGTCGCCACTGTTTGAGTG
+GGAGGTGTTGAATCACAGAGCTGTGACAAAAGGCATCTACGACAAGGAGCTAATCGAAAG
+ACGTGATGCAATGCAAAGCATTAAGCTCACGCCAGAGCAGCTCAGGCCGCACATCGATAG
+TGTATTCAGGGACATCAGTGCGATACTAGACAAGCGCACAAAGCATGGTGAGAAGTCGCC
+GATTTTTGCAAATTGGGACGATTGGTATGCTGATAGGGTGCAGGCAACACCTGCGGGATC
+AGCATTCACAGTCGAGGAGTCTCTTTTGCAGGCAAGACAAGTCTTAAAAGATAACGGCGT
+GCAGAACCTGACAAAGACACAAGTCATGGCGCAAATGCAGGATGGATTAAAACTGGATAC
+TCTACTCAGTCATGAGCCAGACATCATTGCGGACGTGCTG
+>ds2020-267_10
+CAGCACGTCCGCAATTTGGGTGGTCTGTTGAGACCATTAGATTGTTTCATTGCGTGTTGA
+ACGCATTGCGACAGAAACAGTTGAGTGGGGCTTAAAGTAGAAAAAAAGCAAACAACAATG
+GAAGGTCGTTCAGTAAAAAGAAATTAGAAAACAGAAAAAGAGAAAAACTCGGGGGTGTCG
+CGAGAATTTGCGCTTCTCTATTCAAATCTGAGTGCGGAGGGGGTGTGGTAGTAGCCGGAA
+ATCAACGGTGCAATGGTGTTGCTGACGTTGTATTGCGAAGTTCGACGACTATCGGGAATA
+CTGAAGATTGGTCCGACGTGGGTTGACTTAAAGTCAGGGCCAGAAGTGTCGGTGACATCT
+TTGTTGATGTCAGTCCAATCGGAGTTGAGCTGAGTGAGGATGCCGGCCTGTTCAGTGACT
+AGGTCGAGAAACTCTTCAGAGTGGAGGTGGATCGTAGTGATTCCAGTAAATTCTGGAATA
+TCATACCGGAGCGTGGAACCGGTCTGATAACGGACTTTGCGCGTGGTAACGGCATGAACA
+AGAATGTTCTTGTTTTGCCTAGTAGCCACGTACTTTGTACGTACATAGGAGATCCCAGTG
+CCAGTAGTGGTCACGGAGCCAAGGGAAACAGTGTCCTTGAAGAAATCACTGTAAGGCTGC
+ATGACGCGGATGACTTGAGCAAACCAACCGTAAGGTCGGTCAGCATGATTGCCGATGCCG
+CGAAAACCGAAGACCTGGTCGAGGTCGAGGGTATCGTCGTCGTCGGAGATGACATATTGA
+CTGTCACCGTCATTGGCGAAGGGGAGGGTGTTGCGCCACACGTTGGATGAGGTGGCGAGG
+CCGTTGAGGAGACCAACAGTGGTCTGGAAGTCGGACCGAGCACTAGGCGTAAGCATAGCA
+AAACGGGTCGCTTCGTCCTTGGAGGCGGGGGCGCCGAAGATCGTCGTATAGACGGTATCC
+GTGTGGGAAGCATTGGCTTGGACTGGGCCAGAGTTGACAGGCGAGATCAGGGAGATCAAT
+CGCATGAACTGATCAAGAATGAAGATCACATTCGGGAGAATGGTGTGAACTTTGTCTTGC
+CAGAGGAAACTGGTGCAGTTGATGTCATGGGCATTGGGTATGCCAAAGACAAGATTGCCA
+AAATTTTCGTTGGGGCCAGCGTTGGCGGCGAGAGACTGGAAGAAGATGGCGACAGGGCCA
+GGGATCTTCAAGTGTTCGGCCTTGAATTGGCTGTCGAGAAACTCGACAAACAAACGTTGA
+TCGTTGGTGATCATACCACCGTGAGATTGGTTCTTGAGAACCTGGTAGTAGAACAACACA
+GCGATGTAAAGCTGGGAGACGAAAGGGTGCCAGTCAGGGTTGGCGTCGGTGAAACGCTTG
+GTTCTGACCATCTGCGTGTCCATGATAGACAGGACGTAGAAGAGCTGAGTGGTGTCAGGC
+ACGACATAGGATATGTCATTGTGCTTGATGCCGAAGAAGGGGAGGTCGGAGACGCCTGAT
+AGCATCATTGAGAGACCCGGGTTCTTGGGGCCAGCGGAGCTTGCAGTGGGTTCGCGAGGG
+GCGAAACTCTTCTGCTTCTTGGCAGGAACCGAGTATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_11
+ATCTAAGGAGCAGCACGTCCGCAATAGATGTTGGGTTCCGGGGCTTGGAAGAAGTGGTGA
+AGCAAGTCGCTAAGAATGAGACGGCTTCTGGTTCTGACGTAGAGGCAGTTCTGGCTGACT
+TGGAGGTCATGGTATACGAGCGAGCTCAATCTAAAGACCTTGCTTGCAAAGGCGAAAAGG
+CAGTCGCACTACCGAAAGATGTGCACGCCAGCTCATTCATCCACGGCGTCTCGACGGGGT
+TCAAGAAGCGTCAGTGGGCGGAGGTGACGCTTAACAGTGAGAGTTTTTTGCCTGTCGATG
+AGAGCTTTGACATTTTTGATGGCGTGATCACAGCTGGCGCGTACTCAACTGAAAAACTAC
+TGATCAGCGCACTGCCTTGTGAAGAACATGTGTCAAATGGGCACGCTTCAGTGAACACTT
+TCGTGGTCGCGCCGAGAAACGGCAAAGTCAATTTCAGGGACGTGATGTCAGCTGATTCGG
+AATACAAGAACATGGCAAAGAACATCCTGACGATGCTTACATTTGCCAGTCTGGATGCCG
+AATATGAGAACGCTGAGATTGAAGGCTTCGTTAAGGCGAGGCAAACCTTCCCATTGATAT
+CGACATCTCACATTGCCGAGTTTGGACACGGGTCAACAACGAAGAGAGAATATGACGTGT
+CAACTGCTTCAAGCAACACGCTGATCAACCTCAAGACTAAAATTGATGGTGACCAGATAG
+AACTTGCTGGGTGCTCTGTGACACTGAAATGTGCGATACTGATCGCATATCAAGTCCATC
+CGGCTCTTTGGAATGATTTTTTTGAAGGGCTCGTACCCCCGCCATTTAGTGGCCAGCTCC
+CGAGCATGCAGGGCATTATGCGGCGGGCGATTGCGGAGTTAGACATCCAGAATGATGAGC
+TGAGACTATTGATCGCCGAGACAGCCGCTACAACTGGTAGAGTTTACGGCATGTCAGATG
+AGTCCATGGTGGAGCAGCTCACGATCTCATACGCCAGGGCTGTCCCTTTTGGCGACACGT
+TGTTCCCGAGGGACGGAGACAAATTGCCTGCTGCCGATGTATCTAGCTGGCAAGTCAGAG
+GCGTGCTCACGCTGGAACTAGCGTTCACTAGGCTATTCAGCTTGTTTGCGCACCAGACAG
+ATCGAAACAAGTACGAGAGGAGCACACACTACGATCAGCTCAGCTCGGCTGGTTTTGCAC
+TTTTTGCGAAAGACGAAGAAGGCCAGTTTGTTTTGCCTATCGCGTCCATTATTTCGACGA
+ACGTCTTCAGGAAGTCTGCGACTTCAACTGGCACTGTGAAGAAACAGTTCAAAGCAAGAC
+CAGTCGGACACGTATTGCGCGAATTAGTTACCAGTGACTTGCCACTCATGCGTAAAGGGG
+TAGCTAGTGCAAGGGACGTGTTGATGGCTGATAACCTACTAGGTGCCAAAGCAAGGGGTA
+GATACGCAACCGACGTCAAATCAGAGGGCAGTTATGCATGCTCTGTTGCCACAGAGCCGA
+ATGAGTATGTCTGCGGGCCACGTGACACAGATGGCTCGATGCTCACCAATGTGATGGCCG
+CCATGTTGCGGACGTGCTG
+>ds2020-267_12
+AACGATTGCGGACGTGCTGCTCCTAGATAATCTAAGGAGCAGCACGTCCGCAAGCACCGC
+CCGGTGGGACAAGTGACTAAGTGCACATGGTGGATGCCTTGGCGATATCAGGCGATGAAG
+GACGTAGTAGCTTGCGATAAGCTGCGGGGAGTGAGCAAACACACATTGATCCGCAGATTT
+CCGAATGGGGAAACCCGGCCGAAAGGTCATCGTATTCTGAATACATAGGGATACGAAGCG
+AACGTGGCGAACTGAAACATCTAAGTAGCTACAGGAAAAGAAATCAACCGAGATTCCCAA
+AGTAGTGGCGAGCGAAATGGGAAGAGCCTGCATGATTTAGCATCTTTGATAATAGAACGG
+AATGGAAAGTCCGGCCATAGAGGGTGATAGCCCCGTATATAAAATCATCGGTGTGGAACT
+AAGTATGCGACAAGTAGGGCGGGACACGTGAAATCCTGTCTGAACATGGGGGGACCATCC
+TCCAAGGCTAAATACTCGATATCGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAA
+AAGAACCCCGGAAGGGGAGTGAAATAGAACCTGAAACCGTGTGCATACAAACAGTAGGAG
+CAGACTTGTTCTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTACATTCAGTGG
+CAAGCTTAACCGCATAGGGAAGGCGCAGAGAAATCGAGTCCGAATAGGGCGAAATCAGTC
+GCTGGGTGTAGACCCGAAACCAAGTGATCTACCCATGGCCAGGTTGAAGGTGCGGTAACA
+CGCACTGGAGGACCGAACCCACTAATGTTGAAAAATTAGGGGATGAGCTGTGGGTAGGGG
+TGAAAGGCTAAACAAACTTGGAAATAGCTGGTTCTCTCCGAAAACTATTTAGGTAGTGCC
+TCTTGTATCACCGTCGGGGGTAGAGGCTCTATTGCGGACGTACTAAGGGGGAAAATTTGC
+GGACGTGCTGNNNNNNNNNNCAGCACGTCCGCAACTCCCGACCCATTGCAAACTCCGAAT
+ACCGACGAGTGCGAGCAAGGGAGACAGACATCGGGTGCTAACGTCCGGTGTCAAGAGGGA
+AACAACCCAGACCGCCAGCTAAGGTCCCAAAGTACAGCTAAGTGGAAAACGAAGTGGGAA
+GGCTAAAACAGTCAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGC
+TCACTGATCGAGTCGTCCTGCGCGGAAGATGTAACGGGGCTAAGCTGTACACCGAAGCTG
+CGGATATCCTTTTAGGATATGGTAGGAGAGCGTTCTGTAAGCCTGCGAAGGTGACTTGTA
+AAGGTTGCTGGAGGTATCAGAAGTGCGAATGCTGACATGAGTAGCGATAATGGGGGTGAA
+AAGCCCCCACGCCGTAAGCCCAAGGTTTCCTGTTCAACGTTCATCGGAGCAGGGTGAGTC
+GGCCCCTAAGGCGAGGCAGAGATGCGTAGCTGATGGGAAGCAGGTTAATATTCCTGCACC
+GTCGTATGATGCGATGGGGGGACGATTGCGGACGTGCTG
+>ds2020-267_13
+CAGCACGTCCGCAAGTGCCAGGGCCTCTTGGAGTGTTAGAGTCGTTGGCACAACACTCGG
+GTACGGATGCACAGGTCGTCAAGGTAATGTACTCTGACAACAACGACCAGGGAGAGTTCA
+CCGTCAGGCCACGTGAACTGAGCATGGCAATGAATGCACTGCTGCGTGGCTACGGAGTCA
+AGGCTGAGCAGTTCAACGCCGCCGTCGTGAAACTAGGCGAGACCGTTGCTCATGCGTTTC
+CCATGAGGTCAAAAACAGGATCTATCAGTGCGCCGGCTCTCGCGCTGAGATTGCNNNNNN
+NNNNCAGCACGTCCGCAAAAGATTGCCAATTGAGCACGTGTATGGGATCCAGGGGCAGCG
+TTCACTGAACGTGTTTGGAATGCAGAGCCCGCAAGACACAGGCATGTCGGAGAACATCAA
+TTATATGCCAAACTTGCTGGGTGCTTGCACATCGATGGCTGCTATGATGTGGCAGTCATC
+ACTCAAGACGAACAATGGTAGAATGCTGGTAGAAGATGGCTCTGATGTCATCGATGTGGC
+ATCAACGATGAGCGACACAGTGAAGACTTATGCTGATGGAGTAGAGGTGAGGAAAGATGA
+GTACTCTGCGATAGGTACTGGTGAATGGCGACAAGGTAGAGCAGCGGCAAGCTACTTCCA
+TGTGAGTGGCGTGAAGGAAACCAAGAGCATTGCTGACGCTGTCTCACGCTATGGAAGCAA
+TGCAATGGTAGAACATGCGGGTGTCAGAACAGCGGTAGGCACTGTCATCGATCAGGGTAT
+GGCTGGTGGCAGGGTAGCAACTGTCGCGGCCCACTCCAGAGAACTGACTTTCGATTTCGA
+TCGCGGTTCTGCGGTCAAGAAGTGGCACAGATTGCCACAAGTGCTGGATGAGCACCAAGT
+CACCCTTGACGGTGTTGGTGACGTGAGGGTGGTTACGGTAGCAGTGAATGTCGCTCACGT
+CCGTTTTGACACGTTCAGGGTGGCTGACGGTGAAGTTGGTGCAGCCGAGCTCAAGGTGAG
+GCGCACGCGTTATGGGATGGAATTGGGAACACTGGAGCACACGTTGATGCAGGCAATTGA
+CACGGCAAAGAAACCAATGACTGACACTGTCAACGTCGCCGCGACTGCAGGTATGAGCCC
+TCGCTCGGCATCTGACCTANNNNNNNNNNCAGCACGTCCGCAATTCAATGGCAGTGGCGA
+GTTCAACTCCAGGATACAGCATGTCATTGATCAAAGAAGCTGGTGCCAACGGGCCAGCAA
+AGATAACTCTCACTGGCAAAGTACCAGTGTGCACTGTTGGTGAGTTTGCGAAGCTGATGG
+GTAACATGACGATAGCGCCTGTTTCTGAAAAACCTGTCCCTTCCTCATTAGCCACATCTT
+GCGGACGTGCTGC
+>ds2020-267_14
+CAGCACGTCCGCAACCGGGTATCCACTGTTTTAAGAGTTTCGTTTTGGACCGGTTACCAG
+TGAGCTTTTACCAAGAGAGAGCGTTGTAGTAGAAAAGAAGTATTGATCTACTTGGTGTCA
+CTGAGGACGACAGATGCGTCAAGCGCGACAGAACGAATTAGGCCATGAGTCGAGAAACGT
+CGAAGATTCAGGTTCAAAGAAGAACCGAAATTGAACGAGTCGTTCATGTGTGCCATCCAT
+TCGATGCCAGGATCACGATATGTATTGTCGGCGTCAGACTGTATCAGCCAGGGCTGATAA
+TTGCTGGCCTGAGCAAAGACCGGTGATCTATCTGGATTGTATGTTCCAGACCAGATGAGC
+GATCGCTCAAGGCGGTAGCCGAACGAATACGCTGGTGACAGGACTTTGGAGTCCATGGCG
+TATCGAGAATGAAGGGCGAGTTCTGTGTGCAAACACGCGTTGACCTTCTGATTTTGATGA
+GGACCTGGTGCCTTTGGCCACTGGGAGCGGTTGGAGGCGTAGTCCTCTGTTGCAAGGAAG
+TAACAATCCAGGGGATTGCCTCGCACAGAAAGAGTCAACTGTGTTGACGAATTCACCTTG
+AGTCCTGTGACGGACGCAATTCGGTCAGACACGGCGCGCATGGTCGATGTGGAGAGCATG
+AACGTTGTCTGAGAGTCAAGGGCGCAACCATCTATGGACCAACCAAGATTAGAGTATGTC
+GCACGCCAGGAGGCGTGAGTGGCAGTGTAAGTGCCATTACTCCATCCAACGATGTTCTCG
+GTCGGAACCGAGTAACTGTCATCAGAAACGGAAGGTGAGATCTCAGAGAGATCAAAAAGA
+CGATTGGGCTGGGAGCCAGGGGTGCAAGAATGTGCTTCATTGCACAGGTAAGACACGAAA
+ACACCCGGACTCGGAAGTTGGGCGTACTTCCAGAAGGAAGTAGTGTCTACCCTAGCGTCG
+GGAAGACCAGAGGCGAACCATCCGGAGTGGATAGTGCCTGTTGCTTCGGCAAAGGTGTGG
+GGAGGTAGGCGAAAGAAGAAGTTTTCTCCTCCTTGCATGAAATTGCCTAAATTGGCAAGA
+TACTGAGCAATTTGGGAGGGTATTTGAAACTCCTGCCCCATCTCCATCACGTTCATGAAC
+TGACGTTCGTCAGAATTCAAGACGTTACCGTTTGCGCGATGCAGGTAAAGAACCCGGTAC
+CACCACAATTGCATGCAGTAGTAGCGGAAGAGGCCGAATGGGATGTGCTTCGCCGCATTT
+GAGTAGCGCGACTGAAGTGATGTGTACACCACATTGACCAGGTCGTCATATGGCTGTGCA
+GTTGCGGACGTGCTG
+>ds2020-267_15
+TATCTAAGGAGCAGCACGTCCGCAACCCAATGTGGCTCTAGGATGGTGGCACGGATCAAC
+GGTGAACGTGCTGGCGAGGTGGTACGCGGTGGACACCGATAACGAGTGGACACCTCTGAT
+CTCGAGGAGGTTCGCAGAAGATGCCAAGAGCACGGACGGGAGCTACGAGGAGACGCTAGC
+TTACTGCTTTACGTCACACATGTTGGCGGAAGGCGGAGCATATTTGACGATAGCTGCGGG
+GTCACAGTGGTCAACAGTAGGGGCTTCAATTGTGTCAGGGGCCGCCGTGCCAGTTGTGAC
+ACAAAAATGGGCTATAATGGATTGCTCCAGAAGCATAGACAATGGAAACAGCGACGGCGC
+TAGGCTAGGAGACCTGATGGCAAAGATGGTGCGAGAAGGCACGACAGCAATGGTCAAGAT
+TGATGCCGTGGTGCAGGTACGCAGCATGCCCACCGTGATGGAGGGTAATAGAGACACGAA
+TGCCCATGCCACGCAACACAGCAATGTGGTGACGTCAGCAATAAACCACCCCATGTTGGC
+GTTGACAACGTTGTACTACGTGCCTGGAGAGCAACAAGTAGTAGACTCTGTGATACTGCG
+AACAACGGACGACACCCACAGCTCCAAGATAAGAGGACAGAATGCTATGGGAGGCGCTGA
+GTTGGCTGAGATATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGANNNNNNNNNNCA
+GCACGTCCGCAATCTTCGGGGCCTTGGTGATCCTGCAACTGACCCAGATGCTGCAACCAC
+ATAGTATGAAAGTGCGGGTGGGAGGGTGGCAAGACATCAATGATGTCAAAACTACGTGCT
+TCATCGGGCACGTAGCTTTCTTTTGTTTTTCTTTTGTTTTGTTTTTGTTTATTCATGCGT
+CTTTATCTCATTTGTATCGTTTACCTCTGATTTTGCGTGAGTGTTCTTCAGTCTTGAACG
+TGTGCACATGGCAGACTGTGCCAAGCGATGGCTTCGTTGGCAAAGTATTCGCTGAAACAA
+AAACAAAAACAGAAGATACGGAACGAGTAACCGGCGTAGGTCAAATCAGCAAAACAGGCA
+GACGTGGCACCTGAGCTGGGAAATGGCACTTGAACAGGTGCACAACACGGCGAGTACCAG
+CCAAAGTACCGTTTTCACGAGGACGGTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_16
+CGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCCTCTT
+TGTGTACCTTGAATAGCGCGCGCAAAATCTCGTACCGCTTGATATTACCATTTTTTGAAA
+CGTTTATGTTCCTTTCTTTTGGTATTACCGCGTCGTATGTTGCGCGCATTATCCTTGAAA
+TGAAATCCTGCAAAGGTTTTTCAAGTTGTAATGATGCTTTCACCATTCTGGAGTAGTCCA
+CCACTCCCGGTAACACGCCTATTTGCGTGGCACCCTTCCTGAAGCCTGATGACCGTATCA
+TCCACTTTACGTCCGATCTCCTGTCTTCACTTATGCCCCCCACACACCTATGAGAAGTTT
+TTATTTTGTAACAGTCTGAAACTGTCATGTGCAATCGCTCACACTGTCTCGAGTAGTATT
+TGTTCCTCAGTGATGCTGCTAGCCACGTGGGCATGCCTCTCGACACCGAGTCGTCGAGGC
+GTGATTCCAACGCCTCTAGAAGGTCCCTCATGTCACTCGAAGGTTTTGATTCTATCCTCG
+AGTGTACTAAGGTCGCCATGGCCCTTGATAAATATTGTCCCTTAGATCCGCGCTTGTGAT
+CCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATAT
+TGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCA
+GCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATT
+GAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTA
+AAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGT
+TCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGTGCCCGA
+AGGTGTCTCTGTACGCATCTATCACTGCTTTCATTGACTGTACACTATGTTGACTGTTGA
+AGTCTTCAAAGTCTACGCAGTATTGAGTTCTACCCTCGAGAACCGCCCTCACTCTGCTAC
+GAACGTTCTCATCATTCGCAGCCTTGCCTACCGGGAATGGTGAAGGTAACACGTCTTCAC
+AGTTGTACAATTGCGGACGTGCTGG
+>ds2020-267_17
+CAGCACGTCCGCAAACCGACTTGGCTGACAGAACTGCCTACTTAGAGACCGTCAAGAGAA
+TCGTCAGTGATCGTGTGCTTGCTCGTGACAGGGCTCTGAAAAAGTACCAGCACTCGTGCG
+CACCGCAAGCAACTAGTGTCAATCCGGTGTTGGGAGCGCCAGCTCAGGGTTTTGGCGGCG
+TAGCAACTAATGACTACTACTTGACAGAGGGCAACTTGCTGCCCGTGGAAGAACATTTAG
+AAGCGTACGATGGAGTGTTGACTGCAGGCGCAATGTCGTCGGAGAGGATGGCGGTCGGTA
+AGGTGCCACTCAAAGCGCCAATGAGAGCAGGGTCTGTTACGGTCAACACTTTCGTGGTAA
+CGCCGAGGGCAGGAGAAGTGCGCATGGTGAACCTAAAAACTTCATTTAGAGAGACTCAGA
+ACATGAGTCGAAATGTGCTGACTGTTTTGACAGCAGCCAGTTTTGACGGCGAGTTTCTCA
+ACACCCCACTGGATGGCGTGATATCATTCAGAAGGCGGAGGCCGTTGATCTCGACTTCTC
+ACGTAGTCGAGACTGGGTCGGGCGTGGCCACGAGGCGAGAGTATGACGTGTCAATGGCAG
+AGTCGACGCAAATAATCAACATAAGGAAGAGTATGCGTGGCACGAAGATACGCTTTGCAC
+CTGGGACTCAACTTGTGCACTGCGCGCTGGTGCTAGCATATCATGTAGTACCACATGTTT
+GGAGCGCTGTCTTTGGGGACAAGGTGCCTGAACAGTACAGTGGGAAGACCCCGAATGCTG
+ACTACATGATTAGAGCTGCCATCGCACGTTTGGACTTCAAACCTAGTGAGCATCAGGTGT
+TAGTCGCCGAAGCGGCTGCAGCTTTGGCATGCGTGTATGGCATGTCTGACGAGTCCATGG
+TGGAATCGATCTCACCAGTTGTTTCTGTACTAGAGCCCACAGGTGACTTGGTGGTGTCCA
+ACATCTCGAGCACTGTTAGAGCCACGCAAGTGATCAAATGGCAGACTCAAGGCGTGCTAA
+CGTTCGAGCTCGCGCTAACTAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACA
+AGTACGAAAGATTG
+>ds2020-267_18
+CAGCACGTCCGCAAAGTGAAGCCGGTAAGAGGTCAGGCGACGTTGGCCAGAGCAAGGCTA
+TGGCTGCAGGTGACATAGGGAGAGTTGACGCAATGGTGATTGCGTCACAGACAAGCTGGT
+GGCACCCTGGCGTGACTATGTGGATTGCAGCCTACAAGCTAGCCGTAGCAATACTGGCTA
+GCGCCAAAACTCTGATGATGACCGAGAAGGAGATAGAGGCTCTTATCAACTACACGTTCA
+CAAGGACCACGTACAGGAAACTAGTAGCCAGCAACGCGCTAATGGATTCTACGAGAGACA
+TAGCAGCCAGTGAGGTGACCCAAGCAGCATCAACCCCAGTCAGGTGGGAGAGGCAGGTGC
+ACCCAATAGTCCTAGTACTAGACGATGCAGAGTACTCGATTACAAGAAAGACAGCTAGTG
+CAGAAATCACTAGCGTGTACGACAAAGTGCACTCGCACATGGCGCTAAGCCTTGGGTCTC
+TCTACGGTGACATGGCGCACACTAGGATGAAGCAGCCAAATAGGATTGGCACTGGTTTGT
+TGGCAAAATCAGGCAGGGCACAAAGGGCAAGTCCAGTTTTTGCCAAACTGAGATTGACTG
+ATAACACAGTGACAGTTACGGCGTGCCCTACATCAGACTCAGACGCAGTACTGATGTCGA
+TAAGCAAAGGCATTGAAAAGGCTGGCCTACACAACGTTACGCTGGGAAATGAAGTGGTGA
+AAGTTGTGAGGAAGCCTGAGTACGGCATGACACTGACGTACCTGATACCTTCGACAATCA
+GTGGGAAAGGTGCTGACAAGTCATATGTCTATTTGGCTGGCATGCACTTCAGGGAGGACG
+ATCTAACGTACTCTTTGCCTACGCTAGAGTTCTTGTCGCAGTTCACGACAGAATATGAAC
+CGGTCAAGCCTGACAAGCGGCAAAAGATGTTTCGCCTGCTAGTAGACCCAGTGACGACAA
+GGGTCCACCACAGGCACATGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGG
+CACTTGCGGACGTGCTG
+>ds2020-267_19
+CAGCACGTCCGCAATTCAACCTTCCTCGGTCTTCAGTCCATCAATGCCGTGGTGTGCCAT
+GCCGGCTTTCATACACCTTGCCATTAGTGACTGAATAGCACTTCTGTTCCTATCACAGAA
+ATTGGAGTACTCCCTCAGGTACCCATCCTCTGTAACAGAGTACTTGCTACTAATCGAGTC
+TACTTGGCTCACCACAGCGTGGTTTGAGCCAATTCTCGATTGTATCCTCATCGGCCTTAT
+TGACGCCCTGGATTCCATAGTGTGCAACAATACGGCATTCAGGATTATTTGGTCCTTGTC
+CGATTTGCCAGCTGCCTGTTGGTTCAGCAGTATCTGGCATGCATGTGCTGCGATGTCTGA
+AGTGACCGCTCTGGCCCCACCTAGCACTGCAATTGTCTTCAAGCTCTGCGGGGCGAAAGA
+CAGCATCATAGGGTCTTCATTTGGCAGGGGAGACATCATCGGATATACGCCCATTGCATA
+TTGCTTCTTCTGCACAATGGCTGACCCTACCCACTTCTTGAGATTCAAAGCTGCTTCCTG
+GTGGTCAATAAATCGTAGTTCATTATCACACACACAGTAGTTTGGATCCGCAAAAGCGTC
+TAGTGGGCTGGACCTCACGCCGGTTGACCTCAAGACCTTGATCATCTCCGGCTCTATGTT
+GACTTCGCTTGCAGAGCACATATCACTGATATCAGTTCGCGCAAGGTATCCTATGAAGTC
+TGCTAGCTTCTCATCAGGGTACATCACCCATGCACCTGGGTTCCCTCTTCCGCTTGCACC
+AGTTGGGCTGTTTGGTGCTCTTCTTGCTCGTTTGTGCTCCGGCAATTCTTCGCTGTCAAT
+GAATGGAGCGCCCTGATCATTCCTTTCTGACATATTCTCCATAAACATGTGGTGTGCCAT
+GTTTAGTTCTTATTTTCACTGTACTCCTTTGCAATTGAGTTCGTAAAGTAGTTTTGGTGT
+TTTATCGTCCAGCAGCTGAAAGATATTGCGGACGTGCTGC
+>ds2020-267_20
+CAGCACGTCCGCAAAGGCCCTCCCTTGACTTGATCTTAAATTGAATTATGGAATTCTCTC
+CCAGAGCTGCGGAACTAACGACTCTATTAGAAAGTAGAATTACCAACTTTTACACGAATT
+TTCAAGTGGATGAGATCGGTCGAGTGGTCTCAGTTGGAGATGGGATTGCACGTGTTTATG
+GATTGAACGAGATTCAAGCTGGGGAAATGGTTGAATTTGCCAGCGGTGTGAAAGGAATAG
+CGTTGAATCTTGAGAATGAGAATGTAGGGATTGTTGTCTTTGGTAGTGATACCGCTATTA
+AAGAAGGGGATCTTGTCAAGCGCACTGGATCCATTGTGGATGTTCCTGCGGGAAAGGCTA
+TGCTAGGGCGCGTGGTCGACGGGTTGGGAGTTCCTATTGATGGAAGAGGGGCTCTAAGCG
+ATCACGAGCGAAGACGTGTCGAAGTGAAAGCCCCTGGGATTATTGAACGTAAATCTGTGC
+ACGAGCCTATGCAAACAGGGTTAAAAGCGGTAGATAGCCTGGTTCCTATAGGCCGTGGTC
+AACGAGAACTTATAATCGGGGACCGACAAACTGGAAAAACAGCTATTGCTATCGATACCA
+TATTAAACCAAAAGCAACTGAACTCAAGGGCCACCTCTGAGAGTGAGACATTGTATTGTG
+TCTATGTAGCAATTGGACAGAAACGCTCAACTGTGGCACAATTAGTTCAAATTCTTTCAG
+AAGCGAATGCTTTGGAATATTCCATTCTTGTAGCAGCCACCGCTTCGGATCCAGCTCCTC
+TGCAATTTCTGGCCCCATATTCTGGGTGTGCCATGGGGGAATATTTCCGCGATAATGGAA
+TGCACGCATTAATAACCTATGATAATTGCGGACGTGCTGCTCCTTAGATAGAT
+>ds2020-267_21
+CAGCACGTCCGCAAATCCCGCTTGTTTCGTGAGTTGGCCATATTCCGGATAGAGCAGGCG
+CAGGTAGGTCTCCTCCGCTGGGCGGTAGGGAAGGGGGAGCTGAATGACCCCATCCACCAC
+TGGGTAGTCGGCTAGGAACCAATACTTTCCCAAGAACTGAATCCCTTGAAACTCCCCCTC
+AATGGCATCCAGTAGACGGGTGGTGGAGAAGGACTTCTTTCCCCACCAATCGATGGCCAC
+CATCCTCTGGACACACTCCGCAATCGTCTCCGTCGTGAGGTGGGCCAACCTGAGGGAGAC
+CGCCATGATATTGTCGTCCCCCAATGACTCCATCCATGCGTGCTCGTCAATGTTGTCGAT
+GGTGAGCCCCCCGTCCAGTTCGAAAAGCGCCGCATATCCGATGAGTAGGGTGATGATGGA
+CTGCAGGAGCGTGTTGTGGGAATGGCCACTTGTCGTGCCCACATACTTCTGCATGCGGAC
+CCCATCATCGCGATAGATTGGAGCCCGCAGCAGGCTTTCTGCCACAAAGGCCCAATAGGT
+GTCGTAATCGGGATTGTCCCCATCGTAATACTGCTTGCGACAGATGTTAATGGCGATGGT
+GACCATCCATTCATTGATGCTGGAGTCGAACTTCTTGGCGTCGAAGCAGAAGAACTTGTC
+GAAAGGCGCCATCCTGTCGATGAACTCCTGTGACCCCCCGTGGTACCATGATTGACCCAC
+CGCGATTGGATAGTTAGGGGCGGACCAGGCCTTCGTTAACTGGTTCTCTGTGACCCCACA
+CAACTTCAAGTCACGGTGGCTCATCATGAGGATCAGACGCCCCACGGGGGGGATCTTGGA
+TTCCTTGCGGACGTGCTG
+>ds2020-267_22
+CAGCACGTCCGCAATTGACTCTGGATCCGGCCTAACCGGAACACTGCCGAGTAGCAGTGT
+ATTTATAGCCCCGGCATAACCGGGACACCACCGCTGGCCAGCAGTGGTGAGAGCATCCTT
+TTCTAGGCTTAGCAAACCACATCTCCACTCCGAATACCAAGGTACTCAGAACGAAAATAT
+CGTTCGAAAGCTAACAAAAAGGAAAACTCTGGGATCAGGCATGACCGATGCTTGATTCAA
+GTAACCATCATTTCCCAAAGATGAATGGTCGCTGATTTGGGTGACGTGTCAGCACACGGG
+ACTACAGGTCAGACGTATGTTACGACCCTAACCAACTGCATTGCTAGCAGGATATAAAAG
+GTAAAGCTATCATTGGGATAGCTAGCCCTCCCCAACCGAATACATCAGCTAGCGAGAAAC
+GCGATACGGCTTACGACTGCAACGCCCTCACTATCGTAAGGCATACCGCTATCTCTACAC
+AAGATAATGCACCAGAAGGGGAAGTACTAGGTCTCCAGGACCCGGGTCGGGTCCGCTTCG
+TAAGGTAATACTTACGAAGAAACCGTTATGTGGTGGTTTTACGCCAGAGGTCATGAGATA
+TACGTATCTCTACAGACGGGCCTCGCTACTTCGTTGCCTGGGTGATAACGAGCACAAGGA
+CACCAGCCGATGGGGGGCAAAACCTCACCTCTCTCTACCCCCAAGAGAGGCCCAGCATGA
+CACTTGCTAGTGCCAGTTTGTGATCAGAGAGCCTCCTCCCCTTTGCTCGACTAAGTCGTA
+ACCTAAGAATGGAAGGTGGCGCTCCACTGATTTGCACAGGAGCTATGTTGCGGACGTGCT
+G
+>ds2020-267_23
+CAGCACGTCCGCAAGCCCACACTCAGCACGTCCGCAACGTCACAGGCATCAGCACGTCGC
+AACTTGGGCCTAATTGCGGACGTATCTAAGGAGCAGCACGTCCGCAAGCGCGGTATCACC
+GCACATCATAAGGGCGCTGAGGACGATGGGTGTTCAGGGGAATGAGCAAGGGGCTTTTTC
+CGACCCAAACTACTGCGTTCACGATAATCAGGTGCGGCGTATCGATAGGGTCAAGGCCGC
+AATGAACATGCGACGTTGGGTCGGGTCCGCTATCGTGCAGAGGAAAAAGACGTCTATGGG
+CACATACCCTGTTCTTTCACCGATACCAAATGACGACCCGATGATGATGAAATTTTCACC
+TTTCCCACTGCAATTAGAGCTTTACTTTGGTGGCAAGAGGGCAATGAACACAGACCAAGC
+AGCACAAGCGTGTCAAATAGTCATGAACCAGATGACAGAAGGCATGTCGTCTAAAGAGCA
+GGCGCTGATGCACACCGTACTGTTGCAGGGCTATCAGTCCAGGGGCTCAATTGCGCGCAT
+GGAGATCAAGTCGAGAATGGGGAAGATGAATCCCCCGATTGACTCAAACATGAGCATCAG
+CGATAAGTACTCGATGCATGAACCGGAGTATGAAGCGGCGTACGTACGCTTTTGCGACGC
+AAACGAAAACACTATAAGGGACTATATGGCCAGATGCATCAAGGTTGGCGTGGCTGCACA
+TGGCTTCGAGGGTACCAAGACTGAAGAAGCGGCTGCCATGGCGAAGCTGGCACGAAGGAA
+AGCAGGCACGTACGGTGAAAAGAGAGGCAATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_24
+AGTACCTTTTATCCGTTGAGCGATGGCCCTTCCATACAGAACCACCGGATCACTATGTCC
+TACTTTCGTACCTGCTCGACTTGTCAGTCTCGCAGTTAAGCACGCTTATGCCATTGCACT
+ATTAGCACGATGTCCGACCGTACCTAGCGTACCTTCGAACTCCTCCGTTACACTTTGGGA
+GGAGACCGCCCCAGTCAAACTGCCTACCATGCACTGTCCCCGACCCGGATTACGGGCCAA
+GGTTAGAACCTCAAATAAACCAGGGTGGTATTTCAAGGATGGCTCCACGCAAACTGGCGT
+CCACGCTTCTAAGCCTCCCACCTATCCTACACAGATCGATTCAAAGTCCAATGCAAAGCT
+ACAGTAAAGGTTCATGGGGTCTTTCCGTCTAGCCGCGGGTAGATTGCATCATCACAAACA
+CTTCAACTTCGCTGAGTCTCGGGAGGAGACAGTGTGGCCATCGTTACGCCATTCGTGCAG
+GTCGGAACTTACCCGACAAGGAATTTCGCTACCTTAGGACCGTTATTGTTACGGCCGCCG
+TTTACTGGGACTTCAATCAAGAGCTTGCACCCCATCATTTAATCTTCCAGCACCGGGCAG
+GCGTCACACCCTATACGTCCACTTTCGTGTTTGCAGAGTGCTGTGTTTTTATTAAACAGT
+CGCAGCCACCAGTTTATTGCAACCCCTTCGTCCTTCCCCCGCAGGGAGGTCAAACTACCA
+GGGCGTACCTTATCCCGAAGTTACGGTACCAATTTGCCGAGTTCCTTCTCCCGAGTTCTC
+TCAAGCGCCTTAGAATACTCATCTCGCCCACCTGTGTCGGTTTGCGG
+>ds2020-267_25
+AGTGATTCCAATCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCATCATT
+TTCACACGTAATAGTTGTATCACTAGGGGATATCCATATGGTAAGCGTACCGTCAGTCGA
+GGTATAGATTGTTTCTCCTTCGCAGTCAGGCGTGTATGTGAAGGCCTTGTTACAGAACGT
+TGAAAACGTGTCTGCGCCTGCATAACCGCCTGCCGCGACTATAGCATATGTAACTATGTG
+ACAGTCTACGTTGTTCTGATTACACGCCAAGTTGTCTACGATATAAGTTGCGGCGCCAGA
+TGACCCTGCGATGATCGAAGCTACACTCGGGCAAACGAAGGCGGCTAGTCTGCTCTGTGA
+TCCTAATCCGATAGTAAGACCGTTTCCCAGAGACCGGCAGCTATTGGTATCACGCTTACT
+GTGAGGCGCGGTATCAGTCGGGTCAGTACCCATGAGCATGTTGTGGACGTATTTGTGCTC
+CTCCTCATTACTCGTGTCCACAATTATCACCTGTCTGCTCGTGTTGTTGAGGTCGGGCAC
+CATCCACCTCATGTCCCACATTGAATCGCTGCCCTTCGTCAGTGCGCCAGCGCTGTCTAC
+GTATAAAAAAGCCCTGGCGCCCATTAGTCCGAGTGACCAGGCCAGCAGGAACAGCCCCAT
+GTTGAACATTGTTATCTCAGACGTGTATCACTCGATTGGTAGTTATCAAGTTGCAATCAC
+TTTAAAGCTATTATTTTCAGGGAGATGACAACGGTCAGTGCGTCGCCTTAAGCGTATCTA
+AGGAGCAGCACGTCCGCAATATA
+>ds2020-267_26
+CAGCACGTCCGCAAATCGCTCACAGTCTATGTTTGAACTTGTGGTGTCACTTTCAACCCG
+CGGTAGAGAGGTTGGAGAGCTTGGTTGGTGGACAAGAACAAAAGTCCGTCGATCATCATC
+TCCCCTTAAAGCCAAAGGAAGACAGTGATAGTAAACATATTACTAACTGCTAAGCACGTG
+CCCACCGCCGGGTGGGGGGGGTTATACCAGACATAGAGGAATACTATGTCAGAGGGAACC
+ACCCTGCTGCCTGAAGCCTTCGTGCAGCTTTTGAGGTGCTCTCGCTTTCTCCCGAGTTGA
+TGCATGTCAACAGGGAAGGGCCCGCACACCTCCCGTTCACGTTGAACGTTTCCCTTTTCC
+CACTGAAGGGACGGACGCTGGAGCTACGGTTGGTACTTTCGTACCGGTCGGCTCTGCTCG
+CCCGGAAAACGCTCTATGAACGGAAATGTCCTTGGAGGGTCGGTGGTTCGCCATAAGTCA
+GCAAACCACTACCAAGGACTAGTCGCTCATTCCATTAGCATTCTGGGTCTGGTTAGGACC
+CGCGCCCCAAGACACATAACCACGCTACCTATGTCTCCTGACTGGAATAACTAATGGACC
+GCGACGCATATCCGGGTGGTACCGTAATACCACTCTGGCAGACTGTGCATCGGTCTGTCC
+GGATATTGACTAGGAAGGGTTACAAGCTTGTAACCAGGAGCAGGACGTCAACCTGCCTTC
+CCCCATGCCCACCGTACTTACTTTGCGGACGTGCTG
+>ds2020-267_27
+ACAGCACGTCCGCAATTGATGCAGTTTCAACCTCGGCCCAGGCCTTTGTAGGGTTTGGTG
+GAGGCTTTGCCTCTTGAGTTTCATTGTGTTTTACATGCCGACGCAGTTTTTGATGCCTGT
+GGTGGAGTTTTTGATACAGGTCTTTGCCACCCTTACTACTCGAGGGTTCTGGCCTGACCA
+TAATGACTCTGGTGGGTCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGT
+CAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAA
+AATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGT
+TGCCTTCATTGATGAGTTGGGATTGCCTCACTATCTACGATCCTACACCCCTGTGGAAAT
+GACTAAACAGGCCCTGGACAAGTCTCTGTCTCTAATGGCTGAAGTCGGGTGGCCAGTGAA
+TGTGGCCACGGATGAGAGGGTTGATCCCATTGCGGAACGCATGGGATTCAAAGAGTGGGT
+CCTTTGTGGACGTGCTGNNNNNNNNNNCATTTGTAGAGTGGCTTGTCTGGAGATTCACTT
+GGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGC
+ACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCA
+TTCAGGGTG
+>ds2020-267_28
+TATCTAGGAGCAGCACGTCGCAATAATTTCCCCGTCAGCACATCCCAACACAGTAGCCTT
+GCGGACGTGCGCCCCAAGCAGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGAC
+GCACTGACCGTATAGCTGGTTCTCCCCGAAATGCATTTAGGTGCAGCGTTGCGTGGTTCT
+TGTTGGAGGTAGAGCACTGGATGGTCTAGGGGGCTTATCGGCTTACCGAAATCAGCCAAA
+CTCCGAATGCTGGCAAGTGTAGCGTGGCAGTGAGACGGCGGGGGATAAGCTTCGTCGTCG
+AGAGAGAAACTACAAAGCCCGAACGTCCTTACTTCCAGAGCACGTCCGCAAAGACCATCG
+CCTTTAAGTTGCGGACGTGCTGNNNNNNNNNNCAGCAGTCCGCAATCGAGTAGATCTCAG
+CACGTCCGCAAGGTGAGGCCCCTAAGGGTGTACTAAGTGGAAAAGGATGTGGGATCGCGA
+AGACAGCCAGGAGGTTGGCTTAGAAGCAGCCATCCTTGAAAGAGTGCGTAATAGCTCACT
+GGTCAAGTGATTCCGCGCCGATAATGTAGCGGGGCTTAAGTTATCCGCCGAAGCTGTGGC
+AACCTGTGTGGTTGGGAAGGGGGGGCGTACGGTCAGTGCGTCGCCTAGCGTATCTAAGGA
+GCAGCACGTCGCAAGGATGCATTCAGCACGTCCCAAGTTTAAGGCGGTGTTGGTTGCGGA
+CGTGCTG
+>ds2020-267_29
+CATGCGTAGGGGAAGTCCCCCTGCAGGAGGCCTTACGTCCGCAGAATTGGTTGAAGTTGT
+GTACCGCACACGCAAGTTGGGGTCCGTCGTAATGTCAACGATGACGATGCTGACTCCCCG
+TGCTGACATGCAAGTGAGTGCTCCCTGCATGATGTTTGAGGGGTTGAGCACTCCATCATC
+GAAAGCGCCCGGGTGAAAACCTCGAACCTGCTGTGAGAAGTTGTAAAACTCGCCGGCAAT
+AGGCCAAGACAACAGGGTCGCCGCCGTTGAGGCTTCATCAGGCCCTAACTTAATCAGCGT
+TCCTCCCGCGATTCGCTCTCTGACAGCCGTGTTGTGCATGTTCATGCGGGCCAAGAGCTT
+GAAGGCCCAGCCAGTCGGGTCAACATTGTCTCGGTACTGTGATCCCCTATTACCAGACGT
+CATCTTTGACGCCTCCTGAAGCTCGTGAACTGCAGCATTGCTCCGAACGGCGTCATTGTA
+CTGCTTGACATCCTCAGCTGCATCAGTGTTGACAATGTGGTGCAAGAGGACGTGAGCGCA
+AGATCGCAGCTTGTCAGCCGTCTTTGTCGTGACGGTAACGCCAACGTTTATGTTCCAGCC
+AACAACAATGGGGATGTTGTAGGACGTCTTGACAGGCACAGTGGCCTTCTTGTTGCTGTC
+TGTCATAGCAGCAGTGACATCGATGTGCTCGATCATGTTGAACGCGCTGACATTGCGGAC
+GTGCTG
+>ds2020-267_30
+CAGCACGTCCGCAAAATATTTCCCCTCAGCACGTCCGCAACAGGAGCCATGTCAGCACGT
+CGCAACTTACCTATTGATATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTGTCGACAACCTTGCAATCTCCATCCTATCCTCCTTGCTCTTCCTCTGCTCC
+TTCCTCGCCTTGACCTTCTTCCTCACCGACCCCTCAACTTGCCTGGAATGCCCCAAAATC
+CGATCCCCTGCATTCTCCTGGAACCTATGCTCGTACTCCTCTTGCCTTTCAATCTCCATC
+TCGTCCTCAGACACCATCTCCAAATCCTCCTCATTTACCTCGGGACCGCTTCCCTTGCTC
+CGNNNNNNNNNNAGCACGTCCGCAACAGCATTCTTATCTTTTTCTACCAATAACTCGCCA
+TTATCATCCTCTTCCTCCTCGGCAACGGCACTTAAGAATTCTTTCCTTCTGTGTTCTTGC
+TCTTCATCGTAGACCTTGGTGTTATTATCATCCTCCTTAAGTTCGGGGCCATCCTCGATC
+AAATGCTTAGCCACAGGGATACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCA
+CGTCCGCAAAAAGTCCCCGGTTCTATTGCGACGTGCTGGGCTATTGATCTTGCGGACGTG
+TGCCCGATAAGCATTGCGGACGTGCTGCCTCTCTCGACTTGCGGACGTGTGCTCCTTAGA
+T
+>ds2020-267_31
+CAGCACGTCCGCTATCTAAGGAGCAGCACGTCCGCAAGGGTTGGGCTTCGGCCACATACG
+TGCTTAGGATGCTGGCATAATGTCTTTAATCGACCCGTCTTGTAACACGGACCAAGGAGT
+CTAACATGCCCGCGAGTGTTTGGGTGGAAAACCCGAGCGCATAATGAAAGTGAAAGTTGA
+GACCTCTGTCGTGGAGGGCATCGACGCCCGGATCAGAACTTTTGGGACGATTCCGCGGTA
+GAGCGTGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAG
+GAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCGAATTTGGGTA
+TAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTGCCGAAGTTTCCCTCAGG
+ATAGCAGAAACTCATGTCAGATTTATGTGGTAAAGCGAATGATTAGAGGCCTTGGGGTTG
+AAACAACCTTAACCTATTCTCAAACTTTAAATATGTAAGAACGAGCCGTCTCTTGATTGG
+ACCGCTCGGCGATTGAGAGTTTCTAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCG
+GGATGAACCGAACGCGAGGTTAAGGTGCCGGAATTCACGCTCATCAGACACCACAAAAGG
+TGTTAGTTCATCTAGACAGCAGGACGAAGGCCATGAGGTTGCGGACGTGCTG
+>ds2020-267_32
+CAGCCGTCCGCAATGAGTCACGGGCAGCACGTCCCAATGGGCCTTTGCTTGCGGACGTGC
+TGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTAGTTTATTACCTCTTTACTGTTC
+AAAGATCAAAGAGAAAACCATTCTGTTATTCTGTTATTACATTACGTGGATACACATTTT
+CTATGGGAAACAACATAGACATTGTAGTTGTCCAACGAGATACTGCACATACTAATGTCT
+TGGGCGAGTCATGCGCACTTACCGTTTGTTTTATTATTTTAGAAATTTTATTTATGTTGT
+GCTTGTTTTATTGAACCCATTTCATATCATGGTTCAAACGTTAAAAATCGACTCCGAAGA
+AGTTCCCGTGGATCATTTGTCAACTGCTCAATCAATGACTTCTATAATGGGTATAATAAA
+ATGGGTATAGTATAATAAAATAATCTTTTTGTTAGCATTCCGACGAAGAAGTCATTGATT
+CTTTTGATCGGGATTCATATTGAAAATAATCAGAAATCTAGGAATTATAATCGCTTTTAA
+TCGCTTTCGATTATTTAAAATTAATTGAAATCAACACAAATAGATAAAGCAAAGAAATAG
+AATTGGGACATTATATACATTATCACTATGTATATTCTATATGTATATATGTAATTGATT
+TCCCTATAAATAGGCCAGGAACCACAGACGGTCAGTGCGTC
+>ds2020-267_33
+CAGCACGCCGCAACTATTGATCGGTAGCACGTCCGCAACGTCATGTCCCTCACACGTCCC
+AAACCAAAACCATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACC
+GTTGGTCTGCCCCCCCCCAGATCTCTCAAGTGGAAGTCTGACAAAATCTGCTAACTGACG
+GGACAATTGTTGGTGATACATAGCACCAGCAGACTCCTTGGTAACAGGCGATATAATACC
+AACACTCAGNNNNNNNNNNCACACGTCCGCAACCAATCTTGCATCTCTTGTTTGGAACCC
+AATTCTTCATCATTTTCCGCACTGGGCTGAGAAGTCGAGCCAGATAAAAGTTTCTGCCTC
+ATTTTCTCTGCTAGCATCACCATCTCTTTAGCCTTACTCATGAGAGCATTCAAGTCCTGG
+AAAGCGTCTTGCAAGCTCTTATCAGTACTCTCCCACATCTCCTGCTCCTTCCTTAGAATC
+CCTGACACTCCAACCATCCTCACCGCCCCTTCCCTCGTATACATCCCAGAGCTCGACCCA
+GGACCCTCCAGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAA
+GTATTCAAGCCTCAGCACGTCCGCAAACTCCCGGGGCAGCACGTCCCAAGAATCACACCG
+TTCAATTTGCGGACGTGCTG
+>ds2020-267_34
+CAGCACGTCCGCAAGCCAGTCGCAGTGCCGATGTCTCCTGGTTGCGTGTACGTTAGGCAA
+AACAGCCACAGGTTGTCAAGCTACGTACAACGAGACCTGTCGTACGGCAGAGATCAAGTG
+GTGAGAATGCTAGGGCAGAGGGCAGGCTGCATTGCCACAGTAGATGGACACGAGGCTGTG
+ACAAGCCCACACGACTACCCTGCGTGCGTGGTTGATTGTACTGCATATGAAATAGGTTTG
+GTGAACACGAACGCGAGGGCGCTAGCACTCGAAAAACCATCTTTCTTCAGCCAAGCCATA
+ACGCTGTGTCGGGACACGTGGTCGTTCAGGAATGTCAGGGCGTTCTCGTATAACCCGGAG
+GAGGTGGAGTCAATGATAAGGGCGATCAGCAGGAGCGACGAGTATGCAACCATGTTGTAT
+GCTTCTATGAATGATGGCACTGCACCACAAGAGCAAGCAGTCACCCTGGAGGAATTGATC
+ACAAATGCGTGCAGAGACGAAGACATGACATCGATCAAAGCGGGAGCTGGCCAGCGAATG
+AGGCATGAGCACAGGCTGTTCATGACAATCGTGGCCGGTGTCGTGGATGATATCAGGGGA
+TTGGAATTGGGCATAACACCGGAGGTGCGGTACGCGGCCAAAGAGACAGTGGCATTTGCG
+GACGTGCTG
+>ds2020-267_35
+CAGCACGTCCGCAAAAGTTGCCATCTCAGCACGTCCGCAACAGGGTGACCTTGCGACCGG
+AGCCTAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCATA
+TTGGGCCTGAGTAAGCGGACGAATAAGGAGAAGAGGGATTGGAATTATGGTTAGGGTTTG
+CGGTAATTGTCGGTGGCAAAGTGGCATAACTGGGAGCCGATTGATTCTGATCGTATGGCG
+GATGATACGATTGCTGCTGAGGCGGCGGTTGATAGGGCGCATGGGGCTCAAATGCAGGGA
+CGTTGCGGACGCTCTGACCCAAAGCTTTTGCAGACGTGCTGACGGAANNNNNNNNNNCAG
+CACGTCCGCAATATAAGGGAGGGAAAGAAGGTGGTTGAGGTGTGGGATTGAAGGTTTGCA
+AATTAGGGCTGGAGATTGGAGGAGGGGTATAGGAAGGAGCGGTGGGAGGGGCAGGATCAG
+GATTCAGAGAATACGGAGGGTAAGATTGGGAATAAGGCGAGTAATCGGAGGTGCTACGGT
+CAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATAGATTATCAGTCAGC
+ACGTCCGCAAGCTTTTTTCCTCAGCACGTCCACAAGACCCTAGTTGCGGACGTGCTG
+>ds2020-267_36
+CAGCACGTCCGCAACTACGACACGTTTTTGTAGCGCTCCCTGGCCGTGTCTGCGTTCTGC
+ATTGCTCGCGGCAAACACAGCAGGTTGTGTGCATGATCAAGTTGCAGACGCGTAACGTCC
+TCATCTTTTAGACACATTTGTGACCGCTGTGCCACGTGCACCTCTGCCATCGCTCTACCG
+CTGCCCAACATCTGGATGCTCGAGCAGATCATGCTGACCATCTCATCACCGTTGATTGAC
+GAATTCTCACTGATCTTGTTAAACTGAGGGCTGTTAGATGATGAAAACAGCCTGTCAACC
+GTTGGCTCGCAAAAGGGTTGTACCACTTTGTACACCCCTGCGTAAAACACGTCAGCATAG
+TCGTGGTGGGACAAGGCTGCAGGCTGGTAGGTAGACGCCACAGCTAGCGACGCCATTAAC
+ATCACGTTTTTAGAAGCCATGAAGTGCCTGGTCGTGACGTGTCCAATGAGGTCCAACATG
+TCGTTGATCGAGAAACCAACACTGTTGAACCAGTCTCTGTCGAGGTGGGGCGCTGACGAC
+CCTACACCTGCAATGAAGGACACATTGCACTCACTTGCCACCGCCATCAACTTCTGATGC
+CCCACAGCAGCCTCAATGGAAGGCGAGAACCCCGTATTTGCGGACGTGCTG
+>ds2020-267_37
+CAGCACGTCCGCAACTGTAATCCCCCAGCACGTCCGCAACATGTCCGCCGTCGGCACGCC
+GCAAACCATAGCTGAATGATTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCA
+CTGACCGTTCCACTTTTGTTCTATTTCACTCCCCTCCCGGGGTTCTTTTCACCTTTCCCT
+CGCGGTACTCTTCTCTATCGGTCACACAGGAGTATTTAGCCTTACGAGGTGGTCCTCGTG
+GATTCAATCGGAATTTCTCGTGTTCCGACCTNNNNNNNNNNAACACCTCTCAAGTGTTTC
+GTCTAGCCGCTAGATTCCATATCGCTGTCCCACAACCCCAGCAGTAAAAACTACTGGTTT
+AGGCTCTTCCCGCTTCGCTCGCCGCTACTAAGGGAATCGAGTTTTCTTTCTCTTCCTGCA
+GCTACTTAGATGTTTCAGTTCACTGCGTTGGCTCATACCCACCTATTTATTCAGCGAGCT
+GTATTTAGGGTTGCCCCATTCGGAAATCTCTGGATCAATGCCTGCTTCCGGCTCCCCAAA
+GCGTATCATACGGTCAGTGCGTCGCCTAAGCGCGTCCGCAAATTTGAGCCCATGTAAATT
+GCGGACGTGCTGACTGATCAAATATTGCGGACGTGCTG
+>ds2020-267_38
+CAGCACGTCCGCAAATACAGTTGCATCTATCTCCCCCTCAAATCTGACACTGGTAGAGGG
+TCGAGATTTGGAAGAAGAGAAAATGAAATAATAGTAAAGAGACTCAAACATGCCAGTCTC
+GTGGTAGAAACAAATGCAAGGAAAGGTGGAATGGAGATGGGCATCCGACAACTGGAGAAA
+AGGAATAAAAGATGGAAAAGAGTCAAAACATTAGGCACAAATGTGATGTGCTGNNNNNNN
+NNNGACGTGTATGCACACATAGAGAGAAAGGGATGAATATTGTATAGATAGGGTAGGTGA
+CGTGGACAAGTGTAAGAGGTGTTGAAACGGAAGCCAAGTTATTGGCGTGGGTGTGCATGA
+GAACGAAGAGATGAGGAGAAAACACCCGTGGGTAACACAGAGAAAAGTGAAAGGCAACAA
+GGGAGAAGAAATATATCAGACAAAAATGGGATGGAAATAGAGTGGAAGAAATAATTTAAG
+GAAATAAAGGGGAATAAAGTAAGAAGTATGTGATAGGTGGTGAGAAAAGAAACCATAAAT
+AAGAAAACACAAGATGTTGGCGTGAGAGAGAGAAATAGTCAAACAGGATAGGAAACGGTC
+AGTGCGTC
+>ds2020-267_39
+CAGCACGTCCGCAAACACTAACCCATCAGCACGTCCGCAAATATCCGGGTCTTGTGGACG
+TGCTGAGGGCCGGGTCCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTCTGCCTGGAGTTGGCTAGCGATTTCCTCTGCATGGGTAGGTGATAGTTGTGAT
+TCTTGTGCGAGGGACGTTAGGGGAGTATCCGCAGGTACTAGACTGGCGTAGCAGTTATCT
+AGAGTTGGTCGTGGACGATGCTGGCAGTTACTCGTCATCCAAAGCAGGTGTGGTGGACGG
+ATGCGTGATTGCGGACGTGCTGNNNNNNNNNNCAGCACGTCCGCAAATCGAGGTGGGCAC
+ACGTCCGCAACCGTGACTGTCCTCCAGAATAGGACTAAGCCCTGTATCTTGTAACGCAGA
+ATGAAGTTCACGCGGAGTAACATCCGCAATAGCAACTGTGGGGGCGATGAGGCGTAAACC
+GCAGTTCTGTAATGCAGGTGATAAGGGCTCACCCACGGTCAGTGCGTCGCCTTAAGCGGT
+CCGCAAGCTTCACGGTCTTCGAATTGCGGACGTGCTGAGGGGAAGAAGGTTGCGGACGTG
+CTG
+>ds2020-267_40
+TCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCTCGCTACC
+TGTACTTGCAAGCCCCTACTGCTGGTTGGCTGAATGAGAATGATATAGTTTCCCCTTCCA
+TCGTAAGCACGTGCGGTAAGGGGAAAGATCGTCCAGTTCGTTCCTCAGAATCACATACCC
+TGACGGCAGCCCCCGGAATAACAGTGTCAAATACTGACTCGGGTGCGATTATACATTCTC
+TCACGTTACAGTAGGGCGTAAAAAGACCCCTTGAACTTAGGTCTTCGAACACCACTTCGT
+GCCCGAAGACTCTGTAAGCGTTTGCTAGTCGCAAGGCATCTCTAGGCTCCATGACGAAAT
+CATCACCAATAGGTATAGACTGCATCCCTGTCAAATGTGAAATCCCGTCGTACCCATCAA
+CCACACAACCCGCTAACAATGCTCCCGAGACGTAAACAGGTACGGTCAGTGCGTCGCCTT
+AAGCGTATCTAAGGAGCAGCACGTCCGCAATCCGGTATCCCTCAGCACGTCCGCAACTGA
+TAGCTACTCAGCACGTCCCAACAGTCAACCCCTTGCGGACGTGCTG
+>ds2020-267_41
+TATCTAAGGAGCAGCACGTCGCAATAGTGACCCCCTCAGCACGTCCGCAACAGGTCCTCC
+TCAGCACGTCGCAAGAGTGTGGGTTTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAG
+GCGACGCACTGACCGTTTCCTCATTGCTCCATGTTGGGCGCACAAACTTGACATTCTGGA
+TTATCATCTAATAAATCACATGTAATAAAATTTTGTAACGTCATGTCGCTCATCATCGTT
+CCTTAAGTCAATTGTTTTTGGGAAGGTTAGTTTCTAAACCGCGTCATCGCTAGCATTTCA
+CTGTTACTGATAACTTGGGTTTTTTGGGCAATATCGACACGATTAGCAGATTTTTCATAG
+GTATGTTTGACGTGCCAATTGTTGCTCACCAGCGCCATTGCCATCGTTACCCTATCGGCT
+AAAACACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTATGT
+CTCGTTCCACGTCCAAAACCTGGCTCCTCAGCCGTCCGCAATTGACATCAGTTCAGCACG
+TCGCAAATCCATGCCCTTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_42
+CAGCACGTCCGCAAATTAGGCCGCCCCCCCCCCCTGACTGTACAAGAATATGCGGAGCTC
+AACATGTCTGGAAGCACAGGAGAACGTTCTTTTGCTGATATTATTACCAGTATTCGATAC
+TGGGTCATTCATAGCATTACTATACCTTCCTTATTTATTGCGGGTTGGTTATTCGTCAGC
+ACGGGTTTAGCTTACGATGTATTTGGAAGCCCTCGTCCAAACGAGTATTTTACAGAAAGC
+CGACAAGGAATTCCATTAATAACTGGCCGTTTTGATTCTTTGGAACAACTCGATGAATTT
+AGTAGATCTTTTTAGGAGGCCCCAATGACTATAGATAGAACCTATCCGATTTTTACAGTG
+CGATGGTTGGCTGTTCACGGACTAGCTGTACCTACCGTTTCTTTTTTAGGGTCAATATCA
+GCAATGCAGTTCATCCAACGATAAACCTAATCCGAATCATAGAGCCATTTACGGTCAGTG
+CGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAAGGGATTCTGACTCACACGTCC
+GCAAAGTACACCACCTATAGTTTGCGGACGTGCTG
+>ds2020-267_43
+CAGCACGTCCGCAACTACTCTCCCTTGCATCAGGCGGTGAAATGCGCTCTCTGCGTCGGC
+TTGTGCCAGGGGATTCGCCTCTTCCCTGGTCTTAAGTCCCATTGTAGCGTACTCAATGCC
+GGCGAACTTCTTGGGGTAGAACTTAACGGTGGCGAGATCTTCCACTGCCGGGAAGAAGAG
+GAAGTCGGGAAGGTCGAGTAACTTTGCCACTACATAGGCGGCCTTCTCTATGGAGTCGGT
+GTAGCGGGGGTCAGGGGTGTGATTTGGCCGATCGAAGTGGCGAAGGTGTGCCATCTCAAC
+TGGGGTGCAGGCCTTGACGAATGTGAATTCCTCCGGCTTGAAATTGTTGATGGGGGGGGG
+ATGGAGGAGGGTGTAGGCGACAACTTCGGGGTCGGGTGGCGCAATGTCGAGTTCCTTGTT
+TAGCTTCCCATAGGCTTCAACCCTACCGAGGATTCGTATATGTTGGAACATGTTGGTGAG
+TTCCATCACTTCGCGGGTCGCGGCCTCTTTGGACCTCATGGATCGCATACGCGTCCTACG
+CTTGATAGATTGCGGACGTGCTG
+>ds2020-267_44
+CAGCACGTCCGCAACATGCCTTGCCTGGAGACCAACCGCAAGGGGGGGTAGCCCTTCTCT
+GTGTTCTGGAAAGAACCAGACGCAAGAGCTACCTTACTTGTAGGGCTGACGGAGTCGAAC
+CGCCGGTGGTCACACCCTATACTCTTCTTGAAGTAGGACCGTCCTACCAATATATCTAAC
+CTTTTAAGCACACTCACTGATATATAGTTTTACTAGTTTCAGAAAACGACACCTAACGCC
+ACGTCCCGAGCCGGAGCTGTTTACCCCCGCCCCTTCCGTTTACGTAGACGCTACCTCGAA
+AAAAAGGCATGAACGCTTGGCATCTATCATCCACTAGTCCGTGTGCCTGAACCTCCAACA
+GACAGGCGGAAGAACGCCTTACCCTCGGCTTGATCGCCCGTGAAATCACAGAGCTTCCAC
+ACTAAGTGGTGTACCTCAGAGTAAGAACGATTTACCTATTATGGCTAACCGTAAAGGCCA
+AAAGTGAAACATAATTAGAGATCTAAGAAAGTCATATAAATAGAGTGAGTGTTGCGGACG
+TGCTG
+>ds2020-267_45
+CTAAGGAGCAGCACGTCCGCAATATGCCCCGTTTCAGTGTGCGTTTGTCCGTGCTAGACA
+AGGGTTTTTGGTATAGTGCCCTTGCCGCGTTGTAGCCGTCTTGGCTTGCCCATGCGTACT
+CCAGTTCTTGGTCATCTGCAAGTGTAGCTGCGGCATCCATTGCCTCAGCCAAGCTCTCTT
+GGTCAACGAATTGCCCACATTGCATAGCCGCGTAGGTTGCTGAAGACACTCTGGTACCAA
+GNNNNNNNNNNTCAGCACGTCCGCAAGACACACATGCTTTGACACCGTACCGCATTGTCT
+TCTTGTTGAAGCCACCAAACTCGTTGATTGGTCTGTTGAGGCTTGAGCTGGTAACCACAA
+CCTGATCAATAGTGCTTCCGCCTGAGAAGCTCAAACCAAAAGTTGCCGTTCCGACGATGA
+CTTGGTTGTTGTCGATCCTAGCTTGATGCCAGAACCTTGGGTTCGTTACTACACCCTTTT
+TCAATTTGATGCAGTTCAATGCTCTGTACAGGCACAAGATGTAGGGTTGCGGACGTGCTG
+>ds2020-267_46
+CAGCACGTCCGCAAGATTGACCAGGTGAGTAAGGATGCAGCTCCGTGGACCGCTCGTCGG
+GCCTGATAGGTGGTGGTATCACACCCTTCTCAAAGAAACCGTACGTGACACTCTCGCGTC
+ATACGGCTCCGTCCCGGAATCGGGACCTTTCTTTCAGAACCTTTGACCAACGGGTCCTCG
+AACCAACCTGTCCTCCCCCTCGGTAAGCGGTTTCTTTTCATTCATTCATTGATTGATTCA
+AGGTAGCTGTAGCTTGCTTCCAAGTCCAAGTGCTAGCGGTAGAAGCTAGTCGCCAGAAGC
+GAACTTCCGGGCCGGGAAGGAGCCAAAAAACGTGAGCGCCCCTGCAATCTTTCTAAAGCA
+ACAAGCGAGAAACCTTACTTTGAGAAAGAAGCGCCTTCTATTATAATATTAGTAAAGGCG
+TCTTAGCCTATCTATAGTAAGGGGCCTTTTCTTGCTCGTTAGCGCTTTCAATAAGGACGT
+TTAGGCTTTACTAATAGAATATATAGGGCTCTGCGCTTGCGGACGTGCTG
+>ds2020-267_47
+CAGCACGTCCGCAAGTTAATGGTATTGGATTGCGACGTGCTGAGGTCTCTTAATTGCGGA
+CGTGCTGAGACAGTGTGCTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCA
+CTGACCGTGTGGCCTTTACTATAGTTTGGTATTGGTGTTCGGTGTGGCTTGTGTAGGATA
+GGTGGGAGACTCAAGCGGGCACGCCAGTGTTCGTGGAGTCGTCGTTGAAATACCACTCTG
+GTCACTCTGGATATNNNNNNNNNNCGGGCAGGGAGACAGTGTCAGGTGGGCAGTTTGACT
+GGGGCGGTTGCCTCCTAAAATGTAACGGAGGCGCCCAAAGGTTCCCTCAGCCTGGTTGGC
+AATCAGGTGTCGAGTGCAAGTGCACAAGGGAGCTTGACTGTGAGAGTGGCAACCGAGCAG
+GAACGGTCAGTGCGTCGCCTTAAGCGCGTCCGCAACATACTCCTCGTCATTTGCGGACGT
+GCTGAGGAGGAACCTATTGCGGACGTGCTGAGGGACCAACTGTTGCGG
+>ds2020-267_48
+CAGCACGTCCGCAATACATCGCATATATTGGTAGTCCCCTCCTTAGTAAGCTGCAAACGT
+CAAGTGATATTGGAATAATGGAGTACCTGTACCTTGTTGATCAATCTCCGTTACGAATTC
+GAATGGTTGAATTTCCGTGTCCACTTGCCTAGTTATATCATCCAGGACAGTGTACCAATC
+GTTCTCGGAGAGGTAGGTGATAGGTGTTCCACTCAGCAATGTAATCTCTATGATTATATT
+ACCGGATCCAGTATCATATGTTATGCTAGGACCAGGGCCATTGGCATCACGTGCATCAGC
+TACAGCTTCTTGAATCTCTCCGTTGGCAGTTTCAAGGTCATCTTCGTCATAAGGAGGATC
+GTCTTGGTTCTCTTGAACTTGAACGCTAGACAACACAGTTACTCCAAGATCTGGTAGATC
+AAAGTATTCTATGTCACCTACTTCCTTCTTAATCAGTTGATCCTGAGAGAGAGGATTCTT
+AGCTGTAGCTCTACAAGTTACGAAAGCAGGCACGGTCAGTGCGTC
+>ds2020-267_49
+CAGCACGTCCGCAATTTAGCATAGGTACACGTCCGCAACACCCACTGCTTGCGGACGGCT
+GCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTACTATTAAGCTTTTTCCTACCCGG
+TTATTTTACCAGACATAGCGGGTTAGTATCCGTAAGCTATAACTCCCGCCCGTTGCCAGA
+GGCCGTTTAGTCCGGTAGACCTTTTAAAGTTGTTTTCTCTGTGTTTTTGTTTTTTTTTAA
+AAAATAAACCTCACATACAGCAACTGGTTGCCAGCCGATGTCACTCGGCCGACTACATCC
+CGTCCCTGTCCAAGGTTTTTAATACTGTGTTTTTGAAATTTGTAGTTTTAAAGACGTTGT
+TAGGAAGTTGAGGGCTAAGCGCTACTACCTTCCACACTACGTCACGTCCCCCGACTTGCT
+CTTAACAAGTCAAGCCGACGGACAGTAATCCGTCAACCGTTTAGTGATTCCAATCTACCT
+TGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCA
+>ds2020-267_50
+CAGCACGTCCGCAACGCCACCGAAGCCTACCTCGCCGACCATGTCTCGAATGTCGAAGCT
+ACCGCCCTGGAGATGGTGCGGGTGGATATAGTGGGTTTAATGGTTACTTCTTCTTACCGG
+AAGGGGTTGAACCAGACCCACTCAATACCGCCACAGCCCCTGATCCTAAGGAAGCTACCC
+CCAAGACGTTTGAGATCTTTCGTCGACGCCACTACCCTCATGAAGAGTCCAGTTAGACAT
+GGGTGCCTCACACAGTATCCCATCCTACAGCTCTTCGCCTCACGGCTCTCTGAAGCAGAA
+CTCCGCACCCTCGTAACCGAAGTGGGCGGAGATTCGACTGCAAGAGATATCCGGAGGGAG
+GCATTTGGCGCCGAATCCGTCACGAGGAACATCGTAGGTTTCATCCCGCTCGCCGACGCA
+TCCTCGCTAGCGTCCAGAACGGACTATGACAACATCATGGTCCAATACCAAGTTTATCTA
+TAATAGCCTGCTACATTTGCGGACGTGCTG
+>ds2020-267_51
+CAGCACGTCCGCAAGGAATTCCCCCTCAGCACGTCCGCAACGTATGCCCATCAGCACGTC
+CCAAACCCAACCCAATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTG
+ACCGTCGAGAAGCAACTAACTCGTTCCTAACGGGTGTGGCGCTGTGGGCGGCTGGCCTCA
+CTGATGACGAGATGATGCTTGCTAGGGGGTCAGGGCTGTTCTCCCTCGCAAGCGTCAAGG
+ATTACAAGCGCGAAGCTAAGCGCATAAGCGTGGAAGCAAAATCTCTACAAAACTTGGTAG
+ATGTGGACTTGAGAAAGTTCTTCGAACTAGAGGTGCTAGTCAATAGGGGACACGACGGTC
+AGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAAGACCTGAGTTTATT
+GCGACGTGCTGAGGGACTCGAGTTTGCGGACGTGCTGAGACGTAAACATTGCGGACGTGC
+TGCGCCTTAGATAGAGCGGA
+>ds2020-267_52
+CAGCACGTCCGCAATCGTTGCAGACTACAATCCGGACTACGATACACTTTCTGGGATTAG
+CTCCCCCTCGCGGGTTGGCGGCCCTCTGTATGTACCATTGTATGACGTGTGAAGCCCTAC
+CCATAAGGGCCATGAGGACTTGACGTCATCCCCACCTTCCTCCGGTTTGTCACCGGCAGT
+CTCATTAGAGTGCCCTTTCGTAGCAACTAATGACAAGGGTTGCGCTCGTTGCGGGACTTA
+ACCCAACATCTAACGAGGGCATGACAATTGCGGACGTGCTGNNNNNNNNNNCAGCAGGTC
+CGCAATGGGTGCCGCTTGTGCGGGTCCCCGTCAATTCCTTTGAGTTTTAATCTTGCGACC
+GTACTCCCCAGGCGGTCTACTTCACGCGTTAGCTGCGTTACCAAGACAATTAAGTCCCGA
+CAACTAGTAGACATCGTTTAGGGCGTGGACTACCAGGGTATCTAATCCTGTTTGAGGGAC
+CTGATGTTGCGGACGTGCTG
+>ds2020-267_53
+CAGCACGTCCGCAATCCCTTTCCTCTTCCTAACTCCTCCCCGGGTAGTTCCCAATGTTTG
+GCACTTTCCATACTTCGTGGGTGCAACATCAACAAATTCGCTCATGATCAAGTTACAACC
+TAAGATCTATGACCATATTATGTTAACTGTTCGTATTTCGTTCATTCCATCGGTATGCTC
+CCAGGTACCTGTAATTGTGATCCGTTTGCCAGAACTAAGGGGTCTTTCTGTGGAAACCTT
+CACGAACAATCGTCGTTTTTTGATGGTTTTTCCGCTTCTCACAGCTGCTCTTTCTACACC
+CCCGGATATCTGGTGCCAAACCGTCGCCCGTTTCCTTATTTCTTCGATAATAGAGTTGTC
+TATCTTTGTGGCATCGATTGTACAAGTTCGTGAAGAAGGCTGGACGAGTGGAATGAGGGA
+AAGCGGCTCGATCGACAAAAAAGAAGAGTAGCCCAACCCAAGAACCTTGCGGACGTGCGC
+TCCTTAGATAGA
+>ds2020-267_54
+CAGCACGTCCGCAAGGGTCGTTTGGTCTTCCAAGGAATCTGATCCTGAGAGAGTGTCGTC
+ATTAAAGAGTAGGTTTTACTCTTTCTTGGTAGGTTATGGTCGCAAGAGAGCTTCTGTGTT
+CAGGAAGATCTTTCTTCGTGAGAACCTAAGCACGATTTATTCGTGTCGGCGGTCTTTAAC
+GAGAGGTATGGGGATGAAAGTGACGGAGGAGGAGTTGAGGGACTGCGGTCTCCNNNNNNN
+NNNATCTAAGAGCAGCACGTCCGCAACAGGGCGGTGGTGGACGGAAGCCAATTGGGGCTG
+TTCCACTTGGGGTTTAAGCGAGTTTGTCACCCCTAGGATGACTCGTCTTACTGGTCTGAC
+CAGACGCCTCTTGTGGAAGTGGGTTTGTCTACGCCGGAACGAATCTGTTTTCGGACGGGT
+TCGCTTTTGTAAAGGAAAAGGACATAATTGCGGACGTGCTGGGGGCTATATTTTGCGGAC
+GTGCTG
+>ds2020-267_55
+CAGCACGTCCGCAAAAAAATCAGGTCAGCACGTCCGCAAGGGAATAGCCGTCAGCACGTC
+CACAAGATCACAGTTGCGGACGTGCTCGCTTAAGGCGACGCACTGACCGTACATGTATTC
+GTGCGGTACACATTTTGCTAGCAACTTCGGAGCCGCTACTTCGGGATGCGTACCCGGTGA
+CGGATATGCTCACTACGGAGGTTCAGCGTGGTTGAACTGCCGCGCGCTGCAAGAGTGCCA
+GAACGAGGGTAACGATGTAGTTAAGAGATCTGAACTCAATGTCACTAGCTCCGACGTTCG
+TGGAGCTATGTCTGGTGGTGTGGTGATGCCGGACTTTCTGTACGCGTACGGCACCACCTA
+CTTTATCCACGGACAAAACAAGTCCGGGGGTCACGTTGACGCTAAGATTTTTGACAACAC
+TGAATCTGAGGACTTGATGAAAGATCTGGTCAACATGACTGAAACCGACTTCGTTGCCAA
+ATAC
+>ds2020-267_56
+ACTCTGTATGCGTTCGCCAAACGCAACGCATCCCTAGGCTCCATGACGAAATCGTCGCCA
+ATGGGTATCGATTGCATCCCAGATAGGTGTGACACACCGTCATACTCATCGACTACGCAG
+CCAGCCAATAGTGCTCCTGAGACGTAAGCGGGTATGCAAGTCAGGCGCTTTGATAAGGGA
+TAGCCCTCCTCTATCAGCCTGGTCGCCTTGACTTCTTGGACTTCGGCAAGGTGTCCAAAT
+TCGAAGGCCAGCCAACACGAGTCGTTCGCGACAGTAGGAACCTCTTTCCCGAAAGGGACA
+GAGCACATTGCGGCTCTGCCTATTGGGGACATCATCATCCGGATTGCTACGGTCAGTGCG
+TCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGTCTTAACCCTCAGCACGTCCC
+AATACATTTTCCGTCAGCACGTCCGAAAATCTACCACTTGCGGACGTGCTGCTCCTTA
+>ds2020-267_57
+CAGCACGTCCGCAATACGTGGTCCCTCAGCACGTCCGCAAAACCTAACCGCTCAGCACGT
+CCGCAATGTGTTGACCCCGCTTAAGGCGACGCACTGACCGTCCGTAATCCGCTCATCCAA
+GCGGTACTATTCTGGGTTGCTACGGCATTCTTAGCAGTCGGTCTATTCGTGACACCAATC
+TTGAACGGTGGTAAAGATCCTAAATACCAAAAATTGGGTGTGGACATCATGGCGATTCAT
+CAAATCATGCCTGACAACTTAAACTTCTGGTTTGGTCACCAAGGTTATGAATTTATTGAT
+ATCGGTCGTTTCTGGCAGATCTTAAAATGGGTTGGCGTATTATTAAGGCGGGTACGGTCA
+GTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATTCCTTCTTCCTCAGCAC
+GTCCCAATAGTCCGTCCCTCAGCACGTCGCAAATGGAGGTCTGTTGCGGACGTGCTG
+>ds2020-267_58
+CAGCACGTCCGCAAGACAATATGGCTCAGCACGTCCGCAAGTCGACGCCCCTCAGCACGT
+CGCAACCATACCGACTACTTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGGTTGATTCTCTCCTGGCAAGGTGATAAAGGCACTGGCGTACTCTGCCAT
+GATGGCTTTACTGGTATGCATGGTATCGGTCAAATGCAAACGCGTCAACCCGCCATGCGC
+CACTTCTCGATCCATCATAAACTCAGGAATCACACCCACGGCTATACCGTTTTTTTCAAT
+CACACCATCGGCAACCGCGCCCATGCATCCAATCACCGCACCGCCATACACCAGACCTAA
+CCCCGCTTCAACCAACCCCCAAATTACGGTCAGTGCGTCGCCTTAAGCGAACGTCCGCAA
+GTTTTGAGGGGTGGGATTGCGGACGTGCTGACTCAGTAGTATTTGCGGACGTGCTG
+>ds2020-267_59
+CAGCACGTCCGCAAGCACACTTAATTGGGACGTGCTGAGTTGATTAATTTGCGGACGTGC
+TGCCCGATAACAATTGCGGACGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGC
+AAATGGCCATTCCTCGTCTCTGGATACCTAGGCACCCAGAGACGAGGAAGGGCGTAGTAA
+GCGACGAAATGCTTCGGGGAGTTGAAAATAAGCGTAGATCCGGAGATTCCCGAATAGGTT
+AACCTTTCGAACTGCTGCTTAATCCATGGGCAGGCAAGAGACAACCTGGCGAACTGAAAC
+ATCTTAGTAGCCAGAGGAAAAGAAAGCAAAAGCGATTCCCGTAGTAGCGGCGAGCGAAAT
+GGGAGCAGCCTAAACCGTGAAAACGGGGTTGTGGGAGAGCAATACAAGCGTCGTGCTGCT
+AGGCGAAGCGGTGGAGTGCTGCACCCTAGAGGGCAAGCTATTGCGGACGTGCTG
+>ds2020-267_60
+CGGATCTCACGCCCGATCTATCTAAGGAGCAGCACGTCCGCAAGATTTTTGGAGTTGCGA
+CGGCTGGGCCATATTCATTGCGGACGTGTGAGTGTAATATCTTTGCGGACGTGCTGCTCC
+TTAGATACGCTTAAGGCGACGCACTGACCGTGTACTTGTTGTTTCCATTCGGGTTGTTCC
+ATTCCATTCCATTCCATTCCACTCCATTCCATTGCACTCGGGTTTATTCCATTCCATTCC
+ATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCTTTCC
+GTTCCATACCATTCCATTCCATTCCATTCCATTCCATTCCGTTCCGTTCCGTTCCATTCC
+ATCCTATTCCAAACGGTCAGTGCGTCGCCTTAAGCTATCTAAGGAGCAGCACGTCCGCAA
+CTCTATCCTTGTAACTGGACGTGCTGAGGTACGGGCTTTTGCGGACGTGCT
+>ds2020-267_61
+CAGCACGTCCGCAAGGATGCACTCTCAGCACGTCCGCAATAAAGGGGCATGTGTTGCGGA
+CGTCGCTTAAGGCGACGCACTGACCGTCTTTTCGCCCTTGGGACACTCGATTCCCACCAG
+TTCTGGTACCTGATTGGCACATTCTTCATAGAGTGAGGAAACATCCTTAGCAACTTTTGA
+ATTGGGTTGTATTCTCAGGCTTCCAACCTCACCNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNTGAAGTCAACATGTTCTGTGCCAAGCAAACGAGGATCATTCTTCGTGAT
+AACGCTGGGTATCTTTTCACAGGGAGTTTCCAGGTGCCACTCGAGTGGTGTTTCCACCAA
+ACTGGAGGGCCACGAACACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGTAAGATTC
+CTTCGCACGTCCGCAATAGAGCTGTCTTTATTTGCGGACGTGCTG
+>ds2020-267_62
+CAGCACGTCCGCAAGTCTAAGCCCCTAAATCATAGTTAAGTGGGAAACGATGTGGGAAGG
+CATAGACAGCTAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTC
+ACTAGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAAACTATGTGCCGAAGCTGC
+GGATTTGACATTAGTCAAGTGGTAGGGGAGCGTTCTGTAAGCCGATGAAGGTGTATTGAG
+AAGTATGCTGGAGGTATCAGAAGTGCGAATGCTGACGTGAGTAACGACAATGCGAGTGAA
+AAACTCGCACGCTGAAAGACCAAGGGTTCCAGTCCAACGTTAATCGGGGCTGGGTGAGTC
+GACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAATCGGTTAATATTCCGATACT
+TGTTTATAATGCGATGGAGGGACGGTCTTTTGCGGACGTGCTGA
+>ds2020-267_63
+CAGCACGTCCGCAAACTTTTCATTGCGGACGTGACGCTTAAGGCGACGCACTGACCGTCT
+ATATGCACCTCTCTTGTCTCAGAACTGGGCCGTGGAGATTCAGGAACTATGGGAGTTTGG
+GAAGACATGGTTTGGAGGAACCCTTATCTGCGCATTCGGTGGCGCAAGGGACAATTCAAG
+GTTAAGATCATCAAGGTGAGTGCATGAGGATGCCATTGTTTTGTTTTTGGATTTTTTGAT
+GTTTTTCTCTGAATTTGCCTTACTTGCGGACGTGCTGNNNNNNNNNNGGGACACTGACCA
+CCAGCACCAACCTCCATCCCCCGGCACCTGCCTTTATCACCCATTTCCCAGGTGAGGACA
+GGTGCTCAAAGAGGGGCAGGGTTCCTCTGAGGTAACACAGCAGGGCGGCAACAACGGTCA
+GTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATC
+>ds2020-267_64
+CAGCACGTCCGCAATGATACGCCGATATTTGAGTACCTTTCCCGAGCAGATTCTGCATCT
+TGCGTCGACCTTGGTATCGTTAGCAGACTGTGTGCGTGGTCAAGCTGCAATCGCTCAACG
+TTGTTTTTGTTCAGGCACACAGTTGCGCGTTGTGCAACGTGCACCTCTGCTAGTGCTCTG
+CCAAAACACAGACTCTGTATGGTTGAGCACAACATGGCCAACATCGCGTCACCATTTTGA
+GGTGCTGCGCTATTTAGTCTCAGGGTCTCCTCCGTGTTGTGAGCCATCATCAGTCTGTCC
+ACCGCTGGCTCACAAAAGGGTTGGTTCACCCTGTACAACCCTGCATACAGCACGTCAGTA
+TAATCGTGGTGTGATGCCGCTGCTGACTGGAAAAGTGAAGCAATGGCGGCCGACGCTACT
+AGCATCACATTCTGCAATGCCAGAGACTTGCGGACGTGCTGC
+>ds2020-267_65
+CAGCACGTCCGCAAAGTGTACCCGATGTCTATTGCGGACGTGCTGACGGGTGCTCCTTTG
+CGGACGTGCTGAGGAGTCCTGATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGA
+CGCACTGACCGTCACCTTCGTGCTACCATCATATGCCAAGGTCGCCAAACTATTGTCCAG
+TGAAGAGTTACCTGTGCCTTGACCATAAGAAGATTCCATGCCCCAAATGGCAGTCACAAT
+AGAGGCCGGCACACCATACTGATTTTCAATGCGATCAAGTAGGGCGCTTTGGCTGGCAAA
+ATTGCGCTGACCCCCACTAACACGACTACTCGACGCGGCACCATCGATATATTCCCAAGG
+CATTTAGCAACGGTCAGTGCGTCGCCTTAAGCGTAGCAGCACGTCCGCAATAGTTGATGA
+GTCAGCACGTCGCAACAGACCCACTTCATTGCGGACGTGCTG
+>ds2020-267_66
+CAGCACGTCCGCAACTTTCCTCTTGTTGTCTCGCCACATCGATGAGGTGCTGCTTGACGA
+CCGAGAACCCAGTAGCTGCAAAATCCTTACGTCGCTCTTTCTCAGCATCACTGACATTAA
+CGGCGTCAGCGTGCTCCAATTTCTGAGTTCCTTTGACGCTCAAGAAGCTGTTGACTACCT
+CCGAGGCCACAGCATCGATTCTTTTTCCTTCCTCTTTCACCTCAGCCTTGTAAGCTGCTT
+CCTCCTTCGTCATCATTTCTCCGTTGATATCAATGGTCTCAGGGAGACCATTCGGGTTTG
+CCATGGCTCGCATCTTCTTCTCCGCGGTCTCGCGCGCTTTCTGGTTCTTCTGTCGGCGCG
+CCATCTTGTCTCTGTCCAGCGGCGATCTCTTCGAAAAAAGAAAAATTTGGTCGTAGTTGT
+TGCTTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_67
+TCTAAGGAGCAGCACGTCCGCAACGGCAGCAAAAGCGCCAGCCGAGGCAGCACTGAACCA
+TGAGCAGCGATTGTTTGTCACCATAATGGCAGGCATTGTGGACAAGGTCAGGGCGATTGA
+GCACGAAACATCTGAGGCTGCTCTGTATTCCATCAAGGAAGCAGTTGCCATCGGGTGGTG
+GAACGCGTCGACGGTTGCCTCATTGGCAAAGTGGTACGCCTTCGACTCAAAGAATGAGTG
+GGTGACGTTGACTTCAAAGAAGTTGGCCGGTGATGCGAGAGGGGCAATCGGCGAATACCA
+ACTGCCAATGGCCCACTGCTTCTTGTCTGCCCTATTAGCGCAGTCACAGACGTACATCGT
+GGTTGCATCACAGTCACAGTGGGCAACGATCGGATCGACTATCGTTGGTGGGGGCGCATC
+TCCTGTGATCACGCAGCCCAAGGAAATTGCGGACGTGCTG
+>ds2020-267_68
+AGCACGTCCGCAAGTAGTGGGGGATTGGGACGTGCTACTGGAAGTAAGGACGTTCGGGCT
+TGCGTTGTCTGCTATAAGATAGCTAGTTGGGGGCTTTCGACATAAAAAAGCCTATCCGGC
+TTGGCTTCGCTATGGCTCATGACTTGTATTGTAGTCGTAGTCTTGTAGTCGGCCCGGAAT
+GCCTTTGTAGTCTTTCTAATGCTAATGCCTTCTTCCTTAGCACAAGCGCTAAGCGATAAT
+AATTCCTTCATTCATTTTTTTTTAGTTGCGGTAGCTTCCGCGCCAGCAAGATACGGACGG
+CAAAGCCAAAGCAATACTAAACAAGCGAGAAAAGCCCTATATATTCTATTAGTAAAGCCC
+GAACGTCCTTACTTCCAGTAGCTAAGGAGCAGCACGTCCGCAAGGCGAGGCAAGTCAGCA
+CTCCGCAAATAAATTAGGTTGCGGACGTGCTG
+>ds2020-267_69
+CAGCACGTCCGCAAGCCATTGCCACTCAGCACGTCCGCAACGACGGCCACCCCACGTCCG
+CAACGTTGATCGAGTTAAAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTAAGCTCCCTGGTTGTTGAGACCAGTTTATTGAGATCGCCTTCCAGTCGCCC
+CATATCAGACGATATGCCCTTCTCACATTATTTTGTAATTAATTTATTGTTTTACCCGTG
+TTTTTCCGCTGATTTACATTTTGCGCCCGGTTGCATTTTCCACCAATTGCCCCTGTCGAC
+CTGCCATAGGGCTTAACAAGTCAACTCATCCACCTTTGGTCATCATTCAACGACTTATGC
+AGCACCGAACAAGTCGCCGTCTACACCAAGGTGCGCGTATTTGGCAACGAAGTCGGTTTC
+AGTCATGTTGACCAGATCTTTCATCAAGTCC
+>ds2020-267_70
+CAGCACGTCCGCAAACCTATTTTTGTGGACGTGCGAGGCACTGATAGTTGCGGACGTGCT
+GACGGATCACGCATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACC
+GTCATGATGTGGATGCGCTGCGTTGGCGCGCTGACACCAGTTCTAAATTACCATCTGCAC
+TTTCTGCAACTTACAGCACATCTGCCATGGCAGTAGTCAATAACTTAACTTCGCGATGGC
+CGAGGCTCTAAGCGCCACCAGATGAAACTTCAGTGGCAGGTCACCGAGAGGAAGAAATTA
+CCGGTACCAGCTAACACAGCAGAGCCCTGCTGACACGGTCAGTGCGTCAGGGGTTCGGAA
+ACGGTCAGTGCGTCGCCTTAAGCGTTCCGCAATCACTCGCCCTTGTTGCGGACGTGCTGA
+GGGACTTATTGTTGCGGACGTGCTG
+>ds2020-267_71
+CAGCACGTCCGCAACCTACTCCAATTGGGACGTGCTGAGGCTTGGGAGATTGCGGACGTG
+AGGGTCAAGCTTTTGCGGACGTGCTGAGGTCTTTCCCTCGTGTGCGGAACAACTAGCCGG
+TCTTTCGAGATAGAGTAGTCGCAGGTACAGAAAGCATGTTCAATTCCTCCCGTAACGGGG
+TGGGTCCCACGCAGGTTCGTGGTTCCCTTACTCGAGAGAGACTATTAGTACAAGAAGGCG
+GACGTTGGTTGATGGCAAGGCACATGGTGTGATTCTGCCATTAGTCGTCATCCCTGTATG
+CCTGTGGAGGTCAGCCCGGACAGATGCATATATATGACAGCGAAGCGAAAGCGACGGTGG
+CTCCATACCCTGGAAAGGTGGTTACTAACTTTGCGGACGTGCTGAGGGTGCGCTGCTTGC
+GGACGTGCTGAGGGGTGGAATCTT
+>ds2020-267_72
+CAGCACGTCCGCAAGCTCAGTACGGTGTTGGAATTGATGTCCGTGATCTCAAAAATATAT
+GACATAGAAGTGAGAGAAGAATTTAAATTAGGCAGCAAGATCGGCGAAGCCGGAAAGGTT
+CAGACGTCCATGCTGAGTAACATGGTAAACAAGATAACCAGCTCCGTAGTGAGGGAATTG
+GCTGACAAAATAATAAGCCAGAAATCATTGCAAGATTCGGGGAAGAAGATGGAGGAAGAG
+AAGAAAAAAGAAACTGAAATTAGAGAGAAAAGAAGCGCATATGCCATGCTGTCTAACAAA
+TCGTGCCAAATAGAAACGGATGCAGAAGCTGAAGTTTGGAGAAACGTGGAGTGCAAAGGT
+AGGGCGACATGTTTTGACAAAACGTAGGGGAGTAACGTTGCGGACGTGCTGCTCCTTAGA
+TACCTTGCGGACGTGCTG
+>ds2020-267_73
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTTCATCTGACTTGGGACGTGCTGAGC
+CAAGCATGTTGCGGACGTGCTGAGGTGTGATGCCTTGCGGACGTGCTGCTCCTTAGATAC
+GCTTAAGGCGACGCACTGACCGTATTGTACCCGCTGCGATGTCTTCGAATACTGCCAGTG
+CGGTTTCCAGTGCAGTGGCGCCAACTTCTACTGGCAGTGCCCTTGCCATGATAGATATTG
+AATTGGCAGACTAAACCTACGACTGAGATGAATTTATGAAACCGCACGCCTCACTGAGCC
+AATCCCTGCAAAAACTAACCACGCCTCTGGGAACGGAGCTTGAACGGTCAGTGCGTCGCC
+TTAAGCGTGTCCGCAACCGATGCCCAATAGCTTGCGGACGTGTGACATAAATACGATTGC
+GGACGTGCTG
+>ds2020-267_74
+ATCTAAGGAGCAGCACGTCCGCAAATTCGTGGGGTTGATCATGTCACCTCTCGTTGCGTA
+CTCTGTGTAAGTGAAAGCCAGGGTAGTCTCAGGTGAAGTTGGTGGCAGTGCGATAGTTGC
+ATGCTCAACCATGGTTGACATGACTCTGTTGGCTGTGTTCGCGAGCACTGCATCGTAAGA
+GAACAACCATCCCAGTATGGGCGCTGACAACACCTGCAGAGACAGTGGTGCCCTTCCTTG
+CACTCAGAAGGCTTTGACTTCCGTGATGGCTCTTTGCATCACTGACCCTGTGTGTGTCGT
+CATGATCGCGTCAGCGACATCTCCACCAAAACGCTCGCCTGATGCGCAAGCAAGGTCTGC
+CATGCCGATGGGGTGCGCGTATTTCTCAGACCCAGCCAGTATTGCGGACGTGCTGCTCCT
+TAGAT
+>ds2020-267_75
+CAGCACGTCCGCAACGGTTTGGGGGTATGGATGGGGTATGGCCGTTTGCACGTGCGAGTG
+TTACTCCTTTGCGGACGTGCTCGCTTAAGGCGACGCACTGACCGTGTGCTTCCCCGTCCT
+GCCATAACGATATCGCTGACTTTGCCCGAGGTTTCTGGAATGTCTTGCTCAAGCATGGCA
+ATTTTCAGATTGCCACTGATTTGGAATTCGCCACTGTCAGCCTTGACTTGACCGCTAATG
+ACTTTAAACAAAGTTGATTTGCCTTCACCATTGCTAAGACGGTCAGTGCGTCGCCTTAAG
+CAATCTAAGGAGCAGCACGTCCGCAAAGGCCAACTGGTCACACGTCCCAACTGGATCTTC
+TTGCGGACGTGCTGAGGGCTAATGCTTGCGGACGTGCTGAGGCTGATGGGCTTGCGGACG
+TGCTG
+>ds2020-267_76
+CAGCACGTCCGCAATAGAACTGGGGTTAGTTTGGGACGTGCTGACCCCCTCGGTTTGCGG
+ACGTGCTGAGTCGTGGCATCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTGGGGTTCCGGGTTGGAGGCAACACACTAGGAACGGGAGCAGGACAAATAAA
+CCCGAAAAAGGCAGCGCATCCCGGGCTCATCTATGACATCACAGTGGATGACTATATCAG
+CTTCTTGTGCAAGCAAGGCTACAACAGCACCAACATTGGCATACTTGTTGGAGGCAAAAA
+GAACATCTGACGGTCAGTGCGTCGCCTTAAGCGAAGCACGTCCGCAAGACTCAACATTTT
+CGGACGTGCTGAACGGAATCCGCTTGCGGACGTGCTGAGCCTCTGGTTATTGCGGACGTG
+CTG
+>ds2020-267_77
+TAAGGAGCAGCACGTCCGCAATGGTCACGGGGTGTTAATTCATCCCCCCACCCCCCCTCC
+ACCCGCGAGGGGGGGGAGAGTTCGACTGTTCTTCACCGAGCAGTTTGGGTGATTTTTGCC
+GACCAATGCGCGGGTACGTGTGATATACTGCATTAAGCGCACGGATTATTGGGAGCAAGT
+GGTGGGAGGAACCGGCATCTATCGGGTACAGGCAACGATGGCCACTCCGGGACCCACGCC
+TGGCAACAGGATACAAGAAAGGACGGTCAAGGTTTAGGATCTGTGGTCCCGCGAGGGAAA
+TCTCCTTTACCTCATAACAAGCCGTACACTGCGAATCCCTTGGCACCTCGGTGCTTTAAG
+AGTTCATGACCAGCCCAGTGCAGTGGGTGCCTTCTTAGGGGGTCTAGTTTGCGGACGTGC
+TG
+>ds2020-267_78
+CAGCACGTCCGCAATAGACTATGGGTAGCACGTCCGCAACAGGTACACCCTGAGGCTTGC
+GGACACGCTTAAGGCGACGCACTGACCGTACCCGCCCTGCTCCCCACTGACATTCACAGA
+AGCTTCTGTCTCGCGGTAACGGGCGGTGGCGGTATTGCTGCTGACTTGTGGACTGACGCT
+TTGCACATAAGGCTGTTCTGCAACTGCATTAGCATTCTCGTACGGTTAAAGTATTGGTGC
+CTAAGGAGCTGATATCATTGAGAATTTTTTGTTGAGAGCCTTGCCCTAGACCCACTACCG
+ATACCACAGAGGCAATACCGATAATCACCCCCTGCAGAGCACGGTCAGTGCCTCGCACTT
+AGCGTGCGGACGTGCTGACGGGGATCCTTTGCGGACGTGCTGAGGGGCATTGATTTGCGG
+AC
+>ds2020-267_79
+CAGCACGTCCGCAATTTAGGCCAATTACGTTGCGGACGTGCTGGACTGGTAAATTTGCGG
+ACGTGCTGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTGGGTGAGTTGAGTTTTGT
+GCTCAATTCACAACAAGTGGTATCAGAGCTGTGTTGGAGCAGCAAGTTGCTAGAGTGTTG
+AAGATGGCAGGTGACAAGGAAGCTGAAGGTGAAAGTAGCTCTATGCTGCAGAGGCTGCCA
+CAATCTGTCAACATGAAGGTGGAGTTAAAGCCCTTCACAGGGAAGGAGAACTTCACGCTT
+TGGCAAAGGAGGATGAAGTCAGCCCTTACACAACAACATCTCCATGTTGTGTTGGTGGGC
+AAGGAAAAGAAGCCAACAGGTATGTACACGGTCAGTGCGTCGCCTTAAGCGGGACGTGCT
+G
+>ds2020-267_80
+CAGCACGTCCGCAATCCTAGGTGAATCTTGCGGACGTGCTGACCATAATCACTTTGCGGA
+CGTGCTCGCTTAAGGCGACGCACTGACCGTGTCTGGTTCGTTGTGTGTGTTTTTTTTAAG
+GCTTATCCGGGGGCTGCTGCTCTGGGGCATCCAATTCTTCTTCTTTCTTTTGCTGCTGAT
+CTCACAGCGAGAGCAGCTCCTTCTTGTTCAGGGTCATAAGATGAGAGATCTTCCTCCGAT
+TCCGAGAAATCGGTCAAGCGGGGGGCTACCCTCGGCTCACCTCTCTATCTATAGAGGTCC
+CTCCCCAGAGAGGGGCACGCGGACGGTCAGTGCGTCGCCTAAGCGATCTAAGGAGCAGCA
+CGTCCGCAATGATATTCCCCTCAGCACGTCCACAAGATCGCCTTTGCGGACGTGCTG
+>ds2020-267_81
+CAGCACGTCCGCAAATTAGAACCCGTTCCAGAGCTAATACATGCAAACAACATGACACCG
+CCGGCTCGCCGGAGGCACATGTGCTTTTATTAGATTAAAACCATACCGCTCTTGGGCGGT
+TCACTTTAGACGAATCTGGATAATTTTGGCTGATCGTATGGTCTCGTACCGACGACACAT
+CATTCAAATGTCTGCCCTATCAACTATTGATGGTAGTATAGAGGACTACCATGGTTGCAA
+CGGGTAACGGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACAT
+CTAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCCGGCACGGGGAGGTAGTGACGAAA
+AATAACAATACAGGACTGGTGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_82
+GCAGCACGTCCGCAATTTCCACCCCATTAGTGTTACTACATTGAGCTCGGTTACGGCCTT
+AGAGGCGTTCAGGCATAATCCAACAGACGTAGCTTCATACCACTGTTCGATCGAACAAGT
+ATTGTACCAGAGGTCTGTACCAGCGGTTCCTCTCGTACAACGCTAGTATGCTCTTGTAAT
+AACGGTTCATCAGTAGGGTAAAACTAACCTGTCTCACGACGGTCTAATCCCAGCTCACGT
+TCCCTATTGGTGGGTGAACAATCCAACACTTGGTGAATTCTGCTTCACAATGATAGGAAG
+AGCCGACATCGAAGGATCAAAAAGCAACGTCGCTATGAACGCTTGGCTGCCACAAGCCAG
+TTATCCCTGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAA
+>ds2020-267_83
+CAGCACGTCCGCAACTTCATGGGCCTCTTATTGCGACGTGCTGAGTGTATTATATTTGCG
+GACGTGCTGACGGAAGTATAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGAAACTCCCCCCATCGTCAGCTTTCTTGGCGTCTGCAAGTTGTTCTATTT
+TTTCCTGAGCAGTCTCTTTAAGCATGGCTGCTTTTTCTTGAGCTGTTTCTTTTAAGGTTT
+CAGTTGTTTGCATGACACTGTCAATCACGGTGCTTTTATCATTAGTGCTATCTTTCGCAA
+GGTCTTTGCGACGGTCAGTGCGTCGCCTAAGCGTCGCTTAAGGCGACGCACTGACCGTAG
+TACACTCGTTACCACACGGTCAGTGCGTCCCCGACTATTCACGGTCAGTGCGTC
+>ds2020-267_84
+CAGCACGTCCGCAATGACGTTGGGATCTCCGTAACCGTGAATGTTGACTGGCTGAGCGGC
+TACCCACTGATTGTAACTGCGTCTCTGTCTGTTGCTGGTGCAAACTGCCTTCATCTGCAT
+GACCCATCCGAACAGCGCAGCAAGCATTACTGTTCCTGCTGTCTTTGCCGCGCTAACGCT
+GCTTGGTTCTATCGTTCTGAGTGCCTGTATCTCATCTGCATCAAGCTGCAGCCCACTTGC
+CGTGACACCAGCCACTGCTTTGCCATTCAATAGCTGTGAGACCACAGCGTTCTCACTCAC
+ACTGATGCCCTCATCTTCTGCCAGCACAGGCATCTCACCGATGACTCGCATGCTCACAAC
+CTCGTATGTGTTAACGATGTGGTATTGCGGACGTGCTGTCCTTAGATAGATC
+>ds2020-267_85
+GCAGCACGTCCGCAACCGGTCATCAGTTTGCCACGTTTCCCCCTTATCCAAGGTTTCCCC
+TAGCCGCAACTTGAATTGCCTGTCTTGTAGCGGCCTTTCATATGAATCGTGGAATTCTGT
+TTTCACTTCCTTCATCTTTCTTTGGTTGGGGTACGCCCTATCACTCTGATTCCAGTCCGC
+TTGCTGATCGAGAGTCGGGTAAACCGTCAACTGTTGTTGCTCCACCTTCTGGACACCCGA
+AACCGTTAGTGGCAAGGCAGCGTAGTCACTGCAATTCTTTCAGAACCTTCTTTCTCCATA
+TCTTAAGCACTAAGGGCCTGTTTTGTTTCTTACAGAATATGGGTATGTCCCACGAATGCT
+GGTTCCCGTGTATCGGGTCTACCCAAGTGCTTGCGGTTTGCGGACGTGCTG
+>ds2020-267_86
+CAGCACGTCCGCAACTTCATACACGTCCTCATAATGAAGCTACCCTTCAACTCCAAGGGC
+ACAGAGGCCTACATAGCCTCCCTCGAAGCCTCTCCCGTATTGCCACGTGTCAACTTCATC
+ACCCTCCCAAAAGTCCCAGACCTAGACAAGCACCTCAGCTCCCACTCCTTCCGCAACCAG
+TTCGTCGAAAGCCACAAAACCCACGTCAAAAACGCGGTCGCCGAACTCACCGAGTCAAAG
+TCCGAGTCAAGGCCTCGGCTTGCTGGGTTCGTCATCGACATGTTTTGCACAACAATGATC
+GATGTGGCGGATGATTTTGGGGTTCCTACGTACATGTTCTTCACTTCACCTGCTGGGTTT
+CTCGGGCTGCTGTTTAACCTACAAAGGGCCAAAATTGCGGACGTGCTG
+>ds2020-267_87
+GCAGCACGTCCGCAATAATGCGCCGCTCAGCACGTCCGCAATTGCAACCCGATAAGACTG
+GGGAACACCGATTGCGGAGATAAGGAAAGAGGCAAGGAGGGCGGTGAAGAGTGGGGAGGT
+GGTGTCGGTGGCGAAGGCGAATGAGGTTTTGTTTGAAGAGGATGAGGTGGTTGAGGAGGA
+GAGGCAGAGAGAAAGGGAATTGCAAGAGAGGAGTGAGAGGGAGAAAGAGTTTGTGGTGCA
+CGTGCCGTTGCCGGACGATAAGGAGATTGAGAAGAGGGTGCACGAGAAGCCCGAACGTCC
+TTACTTCCAGGCACGTCCGCAAACTACTCTGGCTCGCACTCCGCAAGTAATACCCCATAC
+AGATTGCGGACGTGCTGAGGGCCCACATCTTGCGGACGTGCTG
+>ds2020-267_88
+CAGCACGTCCGCAATTTTGGCCCCCTATGTCTTTTCACAATGTCAAACTAGAGTCAAGCT
+CAACAGGGTCTTCTTTCCCCGCTGATTTTGCGAAGCCCGTTCCCTTCGCTGTGGTTTCGC
+TAGATAGTAGATAGGGACAGTGGGAATCTCGTTAATCCATTCATGCGCGTCACTAATTAG
+ATGACGAGGCATTTGGCTACCTTAAGAGAGTCATAGTTACTCCCGCCGTTTACCCGCGCT
+TGGTTGAATTTCTTCACTTTGACATTCAGAGCACTGGGCAGAAATCACATTGCGTCAACA
+CCATTTTCTGGCCATCGCAATGCTATGTTTTAATTAGACAGTCAGATTCCCCTTGTCCGT
+ACCAGTTCTAAGTTGGGTGTTAAGCCTTGCGGACGTGCTG
+>ds2020-267_89
+AGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAG
+GCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACCGGGC
+TCATAGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGA
+GGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTG
+TTGCAGTTAAAAAGCTCGTAGTCGGACAATAACGGTCAGTGCGTCGCCTTAAGCGTATCT
+AAGGAGCAGCACGTCCGCAAACGATTCTCCCTCACACGTCCGCAATTTTACCCTCCTGAT
+ATTGGACGTGCTGACCGGTTGCACATTGCGGACGTGCTG
+>ds2020-267_90
+CAGCACGTCCGCAAAGGGAAACCGGTTAATATTCCGGTACCTCGATGTGGATTATCCGCG
+GCAACGCAACTGAAGGTGGAGACGTCGGCGGGGGCCCCGGGAAGAGTTCTCTTTTCTTCT
+TAACTGTCTATCACCCTGAAATCGGTTTGTCCGGAGCTAGGGTTTAATGGCAGGTAGAGC
+AGCACACCTTTGTGCTGTCCGGTGCGCTCTCGACGACCCTTGAAAATCCGCCGGAAGGAA
+TGATTTTCACGCGAGGTCGTACTCATAACCGCAGCAGGTCTCCAAGGTGAACAGCCTCTA
+GTTGATAGAACAATGTAGATAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAG
+GATTGGCTCTAGGGGTTGGGCATTGCGGACGTGCTG
+>ds2020-267_91
+CAGCACGTCCGCAATACCCGTATGATTGCGGACGTGTGAGGACATAGACCTTGCGGACGT
+GCTGCTCCTTAGATTCGCACTGACCGTCGATGTTGCCCTTTATGATTCGGATAAAATCAA
+TGACTCACTTGCATCAGCCATTAATATTCAAAGCTTAAATTCAGAGACATCCGATGATGA
+GGCGCGCGTTGAATTGACTTATAAAGACCAAACGCGCAATGCCAAATTGTATTACAACCA
+AGCCGATGAAGGCTTTACGCCAGCAACTTCACCTATTACTGCTGGGCGAGGACGGTCTCC
+ACGGTCAGTGCGTCGCCTATCTAAGGAGCAGCACGTCCGCAAAGTTTTGGCCCCAGCACG
+TCCCAACCCAACCCCGATTAATTGCGGACGTGCTG
+>ds2020-267_92
+CAGCACGTCCGCATGCTTCGCCGTCTTGCCATCACCATCAGTCATCATTCCACCGAAGTA
+AACATCGCTAACGTTCTTCAGCTTGTTGTTGACGTCCTCGTGCATAGCCTTCTTCGCCAC
+ACCGTATTCAGCCTCCTCTTTAGTCATCATGACGCCATCCGTCATGATGCCCTCAACCAG
+TCCATTGGGGTTCATCGCCTTCTTCACCCGCTCGGCCACCACCTCGTCTCGCTTAACTTG
+TTTCTTTGGTGCAGCCATCGTAACGTCCTTTCTCGCTTCTGGTGGTATCGTTGCAATTTG
+CGAAAAACAGTGATCTTTTGTGGGGTTCTTAGCAAAAGGTTGTGTTTGTTCGTAAGTGAA
+ATTCCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_93
+TATCTAAGGAGCAGCACGTCCGCAAATTCATTTCTCTCAGCACGTCCGCAAAGTGGTGGC
+CTCACACGTCCATCTATACTGGCTTTAAGTTGCGGACGTGCTGCTCCTTAGATACGCTTA
+AGGCGACGCACTGACCGTATTTGCAGGGGTATAAGAACAAAGTTCAATCATCTCTATCAG
+ATCACGATCTGATAAATTTTCACTCCCTATTTGAACTAGTCTGTTTAATAGTTCTAGATT
+AAATGCCTTAAATATATGAGTACCATCATAAGACCACAATTCAAATTCTAGATGAGTAAC
+ACGATTTCTCATGTTTTCTACGTCTAAGGCCCATTGATTGTACTAGGGTATGGAGGACGG
+TCAGTGCGTCGCCTAAGCGTATCTAAG
+>ds2020-267_94
+CAGCACGTCCGCAAATCGACCGGCGTACTGTTGGACGTGCTGAGTGATACCAGCTTGCGA
+CGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCATGAGGACCCTGACCAT
+GTATTGCTTAAGCAGGCTTATTTAGAGGGTGCTGTGGTAGTGACACCCAATCCCCGCGGA
+CATGCTATGTTGGCCAATAAGCAAAACCTGACATTGCTATCAGACTCCCAAATATTGCGC
+TCTTGGGGTCTGGATGAGGCTGCAGTGGAGAGGTACTGGAACACGGTCAGTGCGTCGCCT
+TAAGCGAATCTAAGGAGCAGCACGTCGCAAACTTCTTGCCCTAGCACGTCCGCAAGTGGG
+ATAGGGTGGATATTGCGGACGTGCCG
+>ds2020-267_95
+GGACGTTCGGGCTTGGGTGGAGTGATTTGTCTGCTTAATTGCGATAACGAACGAGACCTT
+AACCTGCTAAATAGCCAGGCCCGCTTTGGCGGGTCGCCGGCTTCTTAGAGGGACTATCGG
+CTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGC
+CGCACGCGCGCTACACTGACAGGGCCAGCGAGTTTATCACCTTGGCCGGAAGGTCTGGGT
+AATCTTGTGAAACCCTGTCGTGCTGGGGATAGAGCATTGCAATTATTGCTCTTCAACGAG
+GAATTCCTAGTAAGCGCATGTCATCAGCATGCGTTGATTACGTCCCTGCCCTTTGTACAC
+ACCGAGGAAAGCCCGAACGTCC
+>ds2020-267_96
+CAGCACGTCCGCAATCAGCCTGTTATCCCCAGAGTACCTTTTATCCGTTGAGCGATGGCC
+CTTCCATACAGAACCACCGGATCACTAAGACCTACTTTCGTACCTGCTCGACTTGTGGGT
+CTCGCAGTTAAGCGCGCTTTTGCCTTTATACTCTACGCGTGATTTCCGACCACGCTGAGC
+GCACCTTCGTACTCCTCCGTTACTCTTTAGGAGGAGACCGCCCCAGTCAAACTACCCACC
+AGACACGGTCCTCGTCCCGGATAACGGGACAGAGTTAGAACCTCAACATTACCAGGGTGG
+TATTTCAAGGACGGCTCCATTGGAACTAGCGTTCCAACTTCAAAGCCTCCCACCTATCCT
+ACACCCGTTGCGGACGTGCTGG
+>ds2020-267_97
+CAGGTATGTTTTCGGACGTGCTGACAATCAGGTCCTTGCGGACGTGCTGACCCCATACTA
+ATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCCTGGTCTCC
+CTCCATAGCCGAAATGACCATGGTCACACAGGAAGTAAGCCTTGACTTCCCCATTAAAAC
+GGTTTTCGATACGGCGCAATTCACCATAGCGCTCACCCGCTGAGATATTACAACCTGTCG
+AACAGCCATGACAAATGCTTGGTGCATATTGCATGTCCCAATCCACGGTCAGTGCGTCGC
+CTTTAGCGTATCTAAGGAGCAGCACGTCCGCAAACGAGATTTTGTGGACGTGCTGCCGGA
+TGAGCCTTGCGGACGTGCTG
+>ds2020-267_98
+CAGCACGTCCGCAACGTCCTTACACTCAGCACGTCCGCAAGACTATCAGCCTCAGCACGT
+CCCAACCGAGTCTCTTTTGCGGACGTGCTGCTCCTTAGAAAGGACGTTCGGGCTTTCCTG
+CTGCCATCCGATCCTGAAGTTTACCCTTTGCCCTTAGAATACGACCAAGGCGCTGCGCTT
+CTTGACGCCTTGAACCAGCATGTGACGATATCTGAATTATCACATTTGCCTCCAGAATGT
+CTATGGAATTATCACCTACCTTAGACAAAAATGCCATGTTAAGCCCGAACGTCCTTACTT
+CCAGTATCTAAGGAGCAGCACGTCCGCAATATTCACACTCTCAGCACGTCCGCAAAGGGA
+ATGGGATTGCGACGTGCTG
+>ds2020-267_99
+CAGCACGTCCGCAATGGGCATGGCATCGGTTTGAAACATCGGAATTGACGACTCTGGCCA
+TAAGATAATGTCCTGACCAAGGCGGATGAATTGCGGACGTGCTGCTCCTTAGATACGCTT
+AAGGCGACGCACTGACCGTAGCTCTGTCCCCCCCAGTCGAAAACTGGAGCTCTGATACCA
+CTTGTTGTGCGGAAGCGTCAACCAATTGCGAGTGAAAAATAAACAACAACTGGCAGGAGA
+TAAATGGAACCAAAACAAAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCAC
+GTCGCAATCCATCACGACTCAGCACGTCCCAATGTCTAGGCCCCAGCACGTACCCAATGA
+TTTCTTGCGGACGTGCTG
+>ds2020-267_100
+TCAATCGGCAGGAACAAAATTAGGTGTATAAACTTATTTTGCTTATTCGGACGGACCAAC
+TAGACTAGTTACGACATCACATTGATAGCCTCTACTCGTGTCCTAGCTCGTCTGAGAGCT
+AAATTTGCCTCAATTGTTTGTCTCTTGCCTTCAGCTTTCCTCAAGTTAGCTTCCGCTATT
+TCAAGAGTTTGTTGCGCTTCTTGTGGATCAATGTCACTACCCTTCTCTGCATCATTTACT
+AAAACCGTGATCTCATTATTGCCTATTCTAGCAAAACCACCCATCAGAGCCATCGTTAAC
+CATTGGTCGTTAAGGCGTATTCTCAAAATACCGATATCTACAGCTGTGGCAGGGCGTGAA
+CCTTGCGGACGTGCTG
+>ds2020-267_101
+CAGCACGTCCGCAATCAGTGTGTCCTCTGCTCATTGTCACGTGCACCTGACTGCTTCATG
+TGCTGTAGCCAACCAAACAGGCTAGTCAGCGCGACTGTACCTGCCATTTTAGCTGCACTG
+ACACTGTTGAGCTCGATTCTTGTCATAGCAGCTATCTCTTGTTCATCCAACTGCATGCCG
+GGAGCAGCTACACCAGCGACTGCCTTGCCGTTAAGTAAGTGCGCCATGACTGCATTTTCA
+CTGACGCTGATTCCTTCTGCCTCAGCCATGATCGGCAGCTCACCGATCACTCTGATCTGG
+TGCGGCTGAAACACAGTGATGATCTCACTTGTCAGCGTCTTGTCAGAAGACTTGGCCATG
+GTTGCGGACGTGCTG
+>ds2020-267_102
+GAGTTCTCTCAAGCGCCTTAGAATACTCATCTCGCCCACCTGTGTCGGTTTGCGGTACGG
+TCTCGTATGACTGAAGCTTAGAGGCTTTTCTTGGAACCACTTCCGATCGCTTCGTGAGCA
+TGCTCACTCGTCTCAACCCCTTGAATTCCGTGCCCGGATTTACCTAGACACCTTCTCCAA
+GTCAAGAACAGGCTCTTCCAACCGCCTGACGACCTTCCGCGATCCGTCCCCCCATCGCTC
+CATCGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATTGTTT
+AGTCCTCAGCACGTCCGCAAGATATTTTCCGTCAGCACGTCCCAAACTAAGGTAGGTGTA
+ATTGCGGACGTGCTG
+>ds2020-267_103
+TATCTAAGGAGCAGCACGTCCGCAACTACTTGGCTGTATTTGCGGACGTGTGAGGGAAAT
+ACCTTGCGGACGTGCTGAGGGTAAGCGTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTA
+AGGCGACGCACTGACCGTGGTTTGACTCCTAAAATGTCTACCACCTCCTTGAAGGAAAAG
+TGGACATGATGCGATGCTGTTATCTTGGTATGCTTTGCCGACATGGCTTCGTACAGCTGC
+AATCACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGCACCCA
+GCCCTCAGCACGTCCGCAAGATGATCTCACTCAGCACGTCGCAAAAGTTCCTGTATGGTT
+TGCGGACGTGCTG
+>ds2020-267_104
+CAGCACGTCCGCAACCTCTAGGCCCTCCTTGGGAACCATCACAAGTACGGCCGGCCTATA
+TTTAAACGAGAATGCCGTGTCGTCCAGCGGAGCCTAGAAGAAGGTGACTCGCGCAGACAG
+CGGACTCCTTTTCAATAGAAAGGAATAGCCAAACCAACCCAGCTGGCTGGTCAATCTCAG
+AGATCTTATCGGCCGGCAAACCGGAGACGGACGACCACGGTCCCGACCTTACCAGCACCG
+GAGGTGTACTAATCAATGAACCCCCGAAACCTACTTTCTTTTCTGACAAAATCAACCAAA
+GTACTCTTGCGGACGTGTGAGGTCTCTGAACTTGCGGACGTGCTGAGGGGGGCTATGTTG
+CGGACGTGCTG
+>ds2020-267_105
+CAGCACGTCCGCAATTTCTGATCCCTCAGCACGTCCGCAAGCCGCTGTCTCTCACACGTC
+CGCAACTACCAGGTTTTGCGGACGTGCTGCTCCTTAGATATAAGGCGACGCACTGACCGT
+CAAATGGTAGGTAGTTATTGCCAGCGTATGCCATGTGCTCTTCGCATTCAGCTAAGAGGA
+GTGCTGGCTCACTATGCATGGCCGCTGCAACACGTTGACCGAGCGATAACGGCACGGTCA
+GTGCGAATCTAAGGAGCAGCACGTCCGCAAATCAGTTTTCCTCAGCCGTCCGCAAATGTT
+CTCTCCTTGCGGACGTGCTGAGTAACTATGCATTGCGGACGTGCTGCTCTTAGATAGATC
+GGAAGACCAC
+>ds2020-267_106
+GCGACGCACTGACCGTCTATCCGTTCCTTCCTGCAATCTTGATTGAATGGTTTGAATCCA
+AGTAATCAACTTCAATAATTCTTCATCGGCAATGGCTTGCCAAGTCAGACAGCAGCTTTC
+ATCATAGTTTTTGCCGGGCGTATTCATCGCATCCGTAATGACCTCCGTGATAACATCTGT
+GATAACAGCATTGATAACATCAGCGTCGCCAGTTAAATTTTCGTCCAGTCGCATCGGGGC
+TGTTGGTTTGCTAGATGGGCAGTAACGGTCAGTGCGTCGCCTTAAGCGTCTAAGGAGCAG
+CACGTCCGCAAACGAGTAACGGTAGCGTTGCGGACGGCTGACAGCTTATTAATTGCGGAC
+GTGCTG
+>ds2020-267_107
+CAGCACGTCCGCAAATGTTACCCGATGGTCCTTGCGACGTGCTGAGGAGGTCTGAATTGC
+GGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGCATTCGCCGCTGCC
+ACCGAAGTTTTCTTTGCTTTCCCGACTTAGCTGCAATCAGCTGAGCCTTGAATTCTAGCA
+CAGATTTTGAAGATCTGTCAAACTTTTTGATCTCTTCTTTTGCTGCAATCGCTTTTTCAA
+AGCAACCACCGCAATCAGCGAAGCCTTAGATTGTACAACAGTTTTTACACCGCAATCAAC
+AAATTCCAAAACTTCTTCAACCAACCCCGATACAGACGGTCAGTGCGTCGCCTTAAGCGA
+ATCTA
+>ds2020-267_108
+CAGCACGTCCGCAATGGTCCGCCCTTCCTCTCCCTCTCCCTATGGTCGAGCTAGTTTAAC
+CTTCCTCCAAGACTTGAATCAGGAATATCTTTTCTGTACTATGCCCTGCGCCTGGTCTTT
+CTTCTTTATTGCCTTGGCCTTTCACCGGATCGATCCCTTCCACCATTCCTCCAACAGATG
+CGGATGAATTAGCTGCCGTTATTCTTTCAACATTTGCAGAGCTAACCCCTGAAGTGACTT
+CAGTCCCGTGTTAGAGCTAACTGCTGCTTCTTCTATAGCAAGTGCCGAGCGAGTGCATAT
+TGCGCTGAAGGCCCCCGCGTTGCGGACGTGCTGAGAGAAGGGATGTTGCGGACGTGCTG
+>ds2020-267_109
+CAGCACGTCCGCAAACATAGGGAGCCAATTGCGGACGTGCTGTCTGGAAGTAAGGACGTT
+CGGGCTTGTTCATACTACTCCCCATAGCGACACCATGTGCTACCGACGCAAGATTTGACG
+GTACGCAAAGACTTGCCATAGGCATGCCCTGTTTCAAAACCTGCGTTGATTAAGCGTTCC
+CAAATATCGGGCAATTGGTCAATACGTGCACCAAATAAATCCACACGTTACCCACCAGTA
+AAAGCCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAACATAGCGCCCCTCAGCAC
+GTCCCAAGTAGTGTGCCCTCAGCACGTCCACAATGTAGGTCTATTGCGGACGTGCTG
+>ds2020-267_110
+TATCTAAGGAGCAGCACGTCCGCAAGGTGCCCAGGGTGCCTTGCTTATGTCTTAAACGGT
+TAAGGGGATTAAAATGATTGCTGTTGTTATCATTGCTTTAGGTGTCATGATTTGCGGACG
+TGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTTGTAGTTTGCCTGTAGGTGC
+TGCAAATGCTCATTGAGCTGTTGCTGGTTATTTGTGAGTGCATGCTCTTCAAGTAATAAC
+TGCTGTAATTGGCGATTGATGTTATCAAGCCGTTGTTTGGCAATCGCTAATTGTTGCTCG
+GTATCATCGGGCGTGTAGGGCTGATGGGAGGCCAAATAACACGGTCAGTGCGTC
+>ds2020-267_111
+CAGCACGTCCGCAACGAGTAGCCACTCAGCACGTCCGCAACTCCCGGGACTTTGCGACGT
+GCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTAACAGCGTGGTTGGAACGCAA
+GAACTGTTTGTGCAGATCAGTTATTGTGTGTTCTGACTTACACGCCCGTGTCACTCCGGA
+TTTATCGGGATGGCGGTAAGTGCTTTGCCGTTGTCCACATAAAGACGGGGTGGACGTTTC
+ATTTACTCTTTTCCCAAATAAGAAGTGGAACGGACCTCGGTCAGTCCGACCTAAGTTTGC
+ATCGCAGAACATCCTGTATTGATTATAACGGTCCTTTACTTGCGGACGTGCTG
+>ds2020-267_112
+CAGCACGTCCGCAATCATTGGCTGGTGTTGCGGACGGGATGAAGAAGGATTTGCGGACGT
+GCTGCTCCTTAGATCCGCTTAAGGCGCGCACTGACCGTCCAGACTGGGATGGCGCATATT
+TGGCCGGTTAATATTTTCTATCTAAGCCTCCATGTTCCTAGGAACCTAGAGGATCCCCCC
+CCTCATCTTCCATTTCAGCAATCTCAACGTCGCGCAGCCACTTTGGCTTCCTGTTCGACC
+GTTTGTTCTTTCTCCTTCGGCTGTCGGAATTCGGGTACTTGACTCGATACGTGTTCTTAT
+CCATCATGACCAATCCATCAACGGTCAGTGCGTCGCCTTAAGCGAGATCG
+>ds2020-267_113
+CAGCACGTCCGCAACACATCCGTTCTTCACATCCAGGCACTCCAATGTCGCTTGTGAGTA
+GGGCTTCCCAGGCCCGAGTGAACGATGAGTTTGGTGAACGCATGTCTTGGGTAGACACGC
+TCGGTCCGCGGCCCCGTAAGAGGTACACCGGCGAGTGGCGGGTTCTCAATCGATGGAGTA
+GGGTTCCGTTGATCCCTGACATTGAGAATCACCTCACCAAACCGCCTCCCGTTTCTGCAC
+CCGTAACGTAAATGGATGCAAACACCGTCGGCTCGTTCCTTGCGAACGTGCTTGCGAGCC
+CTAGAGGGGGTCGCATTGACAAGAACGCCAACCGATTGCGGACGTGCTG
+>ds2020-267_114
+GACGCACTGACCGTGATCGGCTTTCTATTTTTTTTGTGTCCTTTATTCTTCCTTGCTTCG
+GATCGGAAAATTAAAGAATTGAGTGAATCATAAACCAAAGGAGGTTCATGGCCAAGGGTA
+AAGATGTCCGAGTAACAGTTATTTTGGAATGTACCAGTTGTCTTCGAAATCGTGTTAATA
+AGGAATCAACGGGCATTTCCAGATATATTACTCAAAAGAATCGACACAATACGCCTGGTC
+GATTGAAATTGAGAAAATTCTGTCCCTGTTGTTACAAACATACGATTCATGGGGAGATAA
+AGACATAGATCGACCCGACCGCAGCGCGCGATAGTGCGGACGTGCTG
+>ds2020-267_115
+CAGCACGTCCGCAAAGTGGTGGCGCTAAGCGAACTGATGTCAACTCTAGGAATGATACCC
+ATAGACGAGGCGCTGACTGCCGAAGCTTGCGGGTCAACAAGCCCAATCGAGTGGGGAAAA
+GAAGGAAGAGAAAGAATAATGAGCGAAAGAATAGAAACGTTACGTGAAGCTGCGTCTGAG
+CCTTCGGCGAGAACGACGACGCTATTTGTAGAAGAAAGGTGACAAGAAGAAAACATAGGA
+AGTACGCGGCTGGGTGCCAGCGAAAGAACGGAAGGATAAGCAAACAGAGGAGAAGAAGTG
+GATGGTGAAAAGAAAGAAAAGAGAAAGTTCATTGCGGACGTGCTG
+>ds2020-267_116
+CAGCACGTCCGCAGCGACGAGTTCATTGTAGCGCGCGTGCAGCCCAGGACATCTAAGGGC
+ATCACAGACCTGTTATTGCTCAATCTCGTTATTGCTAGACGCAATTTGTCCATTTAAGAA
+GCAAAGTGTCCTCTTAAGACAAACCAAACAGGTATGACTCCATCGCACGTGCCGAAGCAC
+ATGAAACTTCAACGCCATAGTCCTGCAGGCATCTATTTAAAAAAGTTTGAGTCTCGTTCG
+TTATCGGAATTAACCAGACAAATCACTCCACGAACTAAGAACGGCCATACACCACCACCC
+ATAGATTCGAGAAAGAGCTATGGGTTGCTAGTTGCGGACGTGCTG
+>ds2020-267_117
+ATCTAAGGAGCAGCACGTCCGCAACGCAAATGGCCTCAGCACGTCCGCAATTACCAACCC
+CCATTTGCGGACGTGCCTGGAAATAAGGACGTTCGGGCTTATTCCTCGTGCTATGAGCCG
+AAGAAATAGTAAGATATGGGTAAGAGTTCTCGCTGATCTCCCTATTACCCGGAAACCTAC
+AGAAGTAAGAATGGGAAGAGGAAAAGGAAATCCTACGGGTTGGATCGCTCGTGTGTCCAC
+GGGACAAATCCCATTTGAAATGGATGGTGTGAGTTTGTCAAATGCTCGACAAGCCGCTGT
+CAAAGTGTGGATTTCATTTTGTAAAAAATAAGGGGGACGTGCTG
+>ds2020-267_118
+CAGCACGTCCGCAAGGGTGCCCCACCCACACGTCCGCAATGAATCGTTTGTGGTTTGCGG
+ACGTGCTGCTCCTTAGATACGCACTGACCGTTGCGCCGCCATAGAACTCGACAGTTACAC
+CTACTTGTTCGACACTATATTTTGATTCTGCCCTTCTAAAAGGAACATCGGCTCTAACAA
+TTCCGTCTCCGTCTACCAAAACAACCGGAAACGTTTCAAAAAAGGTAGGCATACGACGTA
+CAAAAAGTTCGCGCCCCTCTTTATCTCTAAAGATAGGATGTCCTAACCACCCAACAGCTA
+TTCCATCCCCGTTGTCCATTGAGCCACGAACGGTCAGTGCGTC
+>ds2020-267_119
+ATCTAAGGAGCAGCACGTCCGCAAATGACCTGAAGTGAGAGACCCGAGAGTGGAAGTGGT
+GTCAGACGGACAGATAGAAGCAGAAATACCACTTGATGTTCAAACAGCCAATGAGATCAT
+GGAGTCGAAAGCAGTTTACAAGTTCAAAGGGTCCAGAGATTACGTCGAAGGGCTTGGAAG
+CACGTACGGAGTGACTTGGAAGCATGAAGGAAAGAAGAGGGCAGTGGCACTCATCGCTGC
+TGGGAACCTGATGGTGGGAGCAAGGCAGTCAACCGGGATGCACGATGAACTCAGCAGAGA
+CGTGGAGCTTTCCACAGGGGACGGAACTTGCGGACGTGCTGG
+>ds2020-267_120
+GACGCACTGACCGTAACCTTGACCTTGACGCACTGACCGTTCCCTTTCCCTTCGTATCTA
+TGGCACAACGGACGGTCAGTGCAGGAGCAGCACGTCCGCAACCCCGGCTTCGTATGATTT
+TGCTTACTATACCTGCTGCTGTAGCATTATAAACATTATTGTTACTCTTGCTCCCGTCGG
+GATAAATCTGACCCCTTCCCCTGTTCCCGCCTACGTATATGGGATATTTTAAGAAGTGAA
+CATCTTTCTTAGTAGCGGGGTCCGGGGAAAGAATAGGAAATGTGATTTCACTATATTTCT
+GACCAGGGACAGGACCTATCACCATTTGCGGACGTGCTG
+>ds2020-267_121
+GCAGCAGTGGGGACTCTTGGACAATGGGCGAAAGCCCGATCCAGCACTATCGCGTGAGTG
+AAGAAGGGCAACGCCGCTTGTAAAGCTCTTTCGTCGAGTGCGCGATCATGACAGGACTCG
+AGGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCTGCGGTAAGACGGGGGGGGCAAGTGT
+TCTTCGGAATGACTAGGCGTAAAGGGCACGTAGGCGGTGAATCGGGTTGAAAGCGAAAGT
+CGCCAAAAACTGGTGGAATGCTCTCGAAACCAATTCACTTGAGTGAGACAGAGGAGAGTG
+GAATTTCGTGTGTAGGGGTTACAGGTTGCGGACGTGCTG
+>ds2020-267_122
+ATCTAAGGAGCAGCACGTCCGCAATAAACTCCCGGTAGAAAGAGATTTCACTAATGAAAA
+AGCTTTCAATGCTGCCCGATATCCCTTCCTTTTCCAAATATTTTTACGAATCCGTTTTTT
+TGAAATAGAGGTGCGTTTTTTTGGAACTGCCATTAAAAAATTATATTATAATAGGTTCTT
+CGGTTGGATGTGAAAGACATCTATTGTTCAACTCTTCTCTATCTATTTATTCTCTAAATC
+ATACTCCCTTCATAAAAAAGGGGGGGGGGGTTGCGGACGTGCTGCTCCTTAGCTACGTTC
+GGGCTTGTTATAGGGGTTGGTTGAAAGCCCGAACGTCC
+>ds2020-267_123
+GACGCACTGACCGTCGCCCCCCGTGCTTCTGGCATGTTACATTCCTCTTCGTGCTGAGCC
+CCCCTTTCTCGTCGGTCCGCAGAGACAAAATGTAGGACTGGTGCCAACAGTTCATCACGG
+AAGAAAGGACTCGCTGAGCCGAGATCACTAACTAATACTAATCTAATACTAATGAAAATG
+CTAATATAATAGAAAAGAACTGTCTTTTCTGTATACTTTCCCCGGTTCCGTTGCTACCGC
+GGGCTTTACGCAATCGATCGGATCATATAGATATCCCTTCAACACAACCTAGTTCACTGC
+CAGGATCTCGGAGACACGCCACCAAGCCCGCACGTCCC
+>ds2020-267_124
+CAGCACGTCCGCAAATGTATCCTCCTGTGATTGGGACGTGCTGAGGGCCCATGAGTTGCG
+GACGTGCTGAGTGGCCTTGTGTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGGTTGTCACCCTACTCCATCCATACCACATATACTCTACATACACATCAT
+ATACACACATACCATACACACTGTCACACACACCGCATACACCACACACACCCACACATA
+CCACACACACATATACATCACAGACACCATACCCACTCACACACAGAAACATATACCCCG
+GCAAATACGGTCAGTGCGTCGCCTTAAGCGAGATCGG
+>ds2020-267_125
+CAGCACGTCCGCAATGTATCAGGGTTGGTTGCGGACGTGTGAGGGAGTGGCTATTGCGGA
+CGTGTGATGGGTATGAAGTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTCTTACTTGGCCTCTCGTCACATACCTTCATGTTGGGAGAGCTGTCTACGGCAT
+AGTCTAATTGCCATTCTTTAGGGGCTTCGCTGTCGCTTCTAAGAAAGATTTCAATAGCTC
+TTCTTATAATTTTGAACCGCTTTCCTGCGTCCACTTGTTCAACATGGTTGGTCGTGCCAT
+AGGATCTGGGTTGCGGACTTGCTGCTCCTTAGCTA
+>ds2020-267_126
+GACGCACTGACCGTGTTCCAGGCCCTCTCTTAACTGAGACAGAGATCCAATGCTTGAAGT
+AGGAATAAAATTGATTCCACCAAACCTAATATGTATGGTAGATCAGGTCATATTTTAAAA
+GTATTCCTTTCTTTTCTACTCATTTATATCTTCTAAATCTATTTTTTTTTCTGGCTCGGC
+TAAGTGGGATAGCCGAGCCATTTCCTTATTATGCTACCGATTCCTTTTATGCTACAGCCG
+GGACTACGGTCAGTGCGTCGCCTAAGCGCACGTCCGCAATCCAAGGAGCATGTAGTTGCG
+GACGTGCTGAGGGCATTAACATTGCGGACGTGCTG
+>ds2020-267_127
+CAGCACGTCCGCAATTTTCGCTACCTTAGGACAGTTAGAGTTACTGCCGCCGTTTACCGG
+GGCTTCCATTCAAAGCTTATAACACTTCTCCTTCCGACCTTCCAGCACCGGGCAGGTGTC
+AGACTCTATACATCGTGTTACCACTTAGCAGAGTCCTGTGTTTTTAATAAACAGTCGCTA
+CCCCCTGGTATGTGCCGCTTTCCTAATCAAAAGATAGGAGAGCACCCCTTCTCCCGAAGT
+TACGGGGTCATTTTGCCGAGTTCCTTCGACATGGTTCTCTCAAGCGCCCTAGTATACTCT
+ACTTGTTCACCCGTGTCAGTTTGCGGACGTGCTG
+>ds2020-267_128
+CAGCACGTCCGCAATATGGCTGAGCTTCCAGTACGTGGGGCGCAACGCCCACTCTCTACT
+GAGCATCCCGTCCGACATCAATTGCTGCTCGTCAGCAAAACGAGCCCCAGACTAGACTAT
+CTGGGGGAAGGTATACCGGGGTTTGTTAAGACCCGGATGCCCCATAGGAGGCCGTCATTA
+CACACTTGGGCGTTTGCTAAACGTTAACCCCAAGATTGCACCTATTGAGAGATCTCTCAT
+GCAGTGCTCCTGACTTACCTTCACCTTTTCCAAGACTTCCCCGCACGAGATGCCTATGCA
+TCACATACGTGGGCGGTGTTGCGGACGTGCTG
+>ds2020-267_129
+GGACGTTCGGGCTTCATCTAAGGGGTACCTCATGCTCTTCAAGGTCGAGGCTAGCGCTGG
+AGGTTCGAATGTGGATTTGATGGATCTGTCGACGCTTGACTTCGCTCTCATGGCCGAGTT
+TGATCAGCACATCCTCGAGTATATTCGGCAGCAAGTCATCGACGCCCTCGAGAAGGCTAA
+ACACGCCAGCGACGAGGCGATCGAGAAAGCCCTGAGGAAAGCCCGAACGTCCTTAATCTA
+AGGAGCAGCACGTCCGCAACCCGTATTCCCCGCACGTCCGCAACAATTAACTACTGATTG
+GGACAAGGCCACAGCATTGCGGACGTGCTG
+>ds2020-267_130
+CAGCACGTCCGCAACTGCAAATGGATAGACTCCAAGGTCCGAACTGTAATTGGTTCTCCT
+ATAACCCAGTATATAATGAGCACCATATGGAATTATGGTCCCAATCACAACTTTGCTTGG
+GAGACCACACCCATCAAAGTGGGCATGCCACTAAATGGGTTTTGGCTGTCCAAGTTGTTC
+TCTAAACATGCCAGGTGCCAAATGCACATTGAGGGTGACTTTGAAGCTTTTGACTCAACC
+ATCTCCGGGTCCGTTGTTGACCTTATTAAGGATGTGAGGAAGAAAGGGTATGAAATGCAT
+AGAGACAGGGCTTCAGTTGCGGACGTGCTG
+>ds2020-267_131
+CAGCACGTCCGCAATCCACGACCGCTAGCGAAGGTCCCAAAGTCATGGTTAAGTGGGAAA
+CGATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAA
+AGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATG
+CACCGAAGCTGCGGCAGCGACGCTTATGCGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCT
+GTGAAGGTGTGCTGTGAGGCATGCTGGAGGTATCAGAAGTGCGAATGCTGACATATGAAC
+AATGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_132
+CAGCACGTCCGCAAGTGCTAACGATAGTAGGTTGGGACGTGCTGAGAGTAATTAGTTTGC
+GGACGTGCTGAGTGGTTAGACTTTGCGGACGTGCTGCTCCTTATCGCTTAAGGCGACGCA
+CTGACCGTCGTTCTGGTGCTCCCTGTGCTTGTCCCCATAACTGTCACTGTAGCTATCACT
+TGGGCTATGACTTGCATACTCATGCACTGCCGAGGGTGCACTGTTCGGGGGATAATCTTG
+GCTAGCAGAAGCAGGATAAACATCATCCGACACTAGATAATCTTCCAATCCTTCAGTTTC
+ATGGCGGGTAAAACGGTCAGTGCGTCAG
+>ds2020-267_133
+CAGCACGTCCGCAATCAGTTTGTGGCGGTCACTGATTACTTCCGGTGGGGTTGACTGGAG
+GGATTGGTGACCGGGGTTGAATGGCATCAGACAGCGTGGCCTGAGGAGAAGCATGCAGCA
+TCCGGACTCTTGAAGGATGAAGACGTCAATTACCGTTGAGAGGGACGGTTCATGTAGGGG
+TACGTTAGCGAGTAAAAGACTAAGCGTAGAAAAGGAGATGCCGTGACCGCCATATTGAGC
+CGTTTCCGTTTTGTTCTCCCATCTCACCATAGATGAAAAGCTGGTACTAGTTGGATCCAT
+CGACTAGGGGATTGCGGACGTGCTG
+>ds2020-267_134
+CAGCACGTGCGCTCGCTTAAGGCGACGCACTGACCGTAGTAATGAGGGTTCCAGTTATGT
+GTTTTAGATTCTTCATTCCAAGTATATTCACTATGAATATCATAAAGAAGTTCTTGATCT
+AAACAAGTATAAGCTTTACTCTCTTGTTGCCTAACAATTTCTTCAATGATTTCATTAGCA
+CGAACAGTATAACCTTTACCAAGTAACCAGAAAGCCAAAGACGGTCAGTGCGTCGCCTTA
+AGCGAATCTAAGGAGCAGCACGTCCGCAATTACATTGGGCTGAGGTTTGCGGACGTGCTG
+AGGGGATCAGTTGCGGACGTGCTG
+>ds2020-267_135
+CAGCACGTCCGCAATGTGTTGCCCTCAGCCGTCCCGCAACCGTCTAGACCTTGCGGACGT
+GCTGCCACCGCTTAAGGCGACGCACTGACCGTGAATCTACAGGGACGCACTGACCGTACC
+CTTCTTCCTGACGCACTGACCGTGACTTCAACACTGACGCACTGACCGTCCGAGTATGCG
+TGACGCACTGACCGTCGTTGGATACTGACGCCTGACCGTTACGAGATCTCATACGGTCAG
+TGCTATCTAAGGAGCAGCACGTCCGCAACCTACCCGGGGTATATTGCGGATGTGCTGAGT
+CATGCGTATTTGCGGACGTGCTG
+>ds2020-267_136
+CAGCACGTCCGCAAGTATGCCTGGTTTCAGGATCTATTTCACTCCCCTCACAGGGGTTCT
+TTTCGCCTTTCCCTCACGGTACTGGTTCACTATCGGTCAGTCAGGAGTATTTAGCCTTGG
+AGGATGGTCCCCCCATATTCAGACAGGATACGACGTGTCCCGCCCTACTCATCGAGCTCA
+CAGCATGTGCATTTTTGTGTACGGGGCTGTCACCCTGTATCGCGCGCCTTTCCAGACGCT
+TCCACTAACACACACACTGATTCAGGCTCTGGGCTCCTCCCCGTTCGCTCGCCGCTACTG
+GGGAAATCTTGCGGACGTGCTG
+>ds2020-267_137
+CAGCACGTCCGCAACGTATGCCCCCTCGCGGAGCTAAGTCTTCGTTGCCGTCTTAAGACA
+ATCCACCGGTAGTGTGGCGCATAACTTGGGTTCTGGGCTAAAGTCGAGCGCAACTGCATA
+AGAAGCGTGCGATCCGTTCGGACCACTTTGTGTGTCTTACTCTGAGGGCTTTGTCACGGG
+GCGGTGATATGTGAGGTAGGCCCCTTTGAGAAAGGGTCTTTAAAGCGTGCCGTAGGACGT
+GCGCGCCTCATGTTACCGGGTACCCAAGGTCATAGGAACTGGGACTGCCTTGCGGACGTG
+CTGCCCCTTAGATAGATCGGCA
+>ds2020-267_138
+CAGCACGTCCGCAACCGCGTTCATCTCAGCACGTCCGCAAGCGACCTCACGTCAGCACGT
+CCGCAATGGCCATATCGTTGCGACGTGCTGCTCCTTAGATATAGGCGACGCACTGACCGT
+ATCGTCGCCCCTGGTGGCATGGGCCTGTAGTCCCAGCTACTCAGGAGGCTGAGTCAGGAG
+AATTGCTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCCGAGATCATGCCATTGCACTCCA
+GACTGAGGTGTTCGCTCTTGGGACGTGCTGAGAGGAAGATGTTTGCGGACGTGCTGAGCC
+TTATCCTATTGCGGACGTGCTG
+>ds2020-267_139
+CAGCACGTCCGCAAACAGCCTATCCTCGCACGTCCGCAACATCGCTTAAGGCGACGCACT
+GACCGTTTGTTGCTGGGTAGTGACGGCGTTATCTTAAACAACAGCCGAAAAAAACACCCA
+GACCCAAACGGCTGGGTGGGTGGAAGGTAACCCGTGGCTTGGTAAAGGCGAAGCCAAAAT
+TATTTTGGGTCAGGTCAATTCAACCAGCCCCAGTCAATTGGCCGGTTATACCGAAATTGC
+CGGGGGCAAAGCCGAGCTGGTGATTGCTAACCCAGCAGGGATTACCTGTTCGGGAGGTCT
+AGTTGGACGGTCAGTGCGTC
+>ds2020-267_140
+CAGCACGTCCGCAATGAGTTTGGGCGCTTAAGGCGACGCACTGACCGTCAAAGCAGCCAT
+CCTTAAAAGAGTGCGTAATAGCTCACTGGTCAAGCGTTCCTGCGCCGAAAATGAATGGGA
+CTAAGCATTGCACCGAAGCTGTGGGTTTGTCTTTAATTAGACAAGCGGTAGAGGATGCTA
+AACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATGCATGTGGG
+GTCAGCCGTCCGCAATAAATCACCCCTGAGCCATGCACGTGCTGAGGAAGAGCGCGTTGC
+GGACGTGCTGCTCCTTAGA
+>ds2020-267_141
+CAGCACGTCCGCAACGTGGTCATTCTCAGCACGTCCCAACCTAGTATGCCTCAGCACGTC
+GCAAAGACCGGAACCTTTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTT
+CGGGCTTTGCGTCTCCCCTAGATCGCATCTTGCGTTGGGGTGATGCTAAAGCTTGGCATG
+TCAGCAAGTTCAGTGCCTGCAGGGATAGACACTGTAACCCCAGCAATCGCTTGTGCCACT
+GTCAGGGTTTGGGTTGTGCCATCAGCATTGGTGAGCACGATGCTAGCAATGTCAGCCGCG
+TAGTTAAGCCCGAACGTCC
+>ds2020-267_142
+CAGCACGTCCGCAAACATTCACGGGTCAGCACGTCCGCACGCTTAAGGCGACGCACTGAC
+CGTATTGAATGCCGTGACGCACTGACCGTCACTGCGACCTTGTTTGTGTTGGTCATAACT
+GACGGTAATATCGGTATTATCATTAATATCTTTTACCAAGGGGTGCCCTACGGTCAGTGC
+GTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAATGATTGAAATTGCGGCGTGCT
+GAGCTGGAGTCCTTGCGGACGTGCTGAGTTGTAACCCCTTGCGGACGTGCTGAGGGCATA
+AGTTTTGCGGACGTGCTG
+>ds2020-267_143
+CAGCACGTCCGCAAACAACTGCCCTTAAAATGGATGGCGCTTAAGTCGTCTGCCTATACA
+CCGCCGCTACGGCACAGGCGGTTGCGTACTTGTGCGCAGCCGCATTAGGCCGTAGTGAGT
+AGGAGGGTACAATGGTGTGCGTCGAAGCTTTGGACGTGAGTCCGAGTGGAGCCGCCATTG
+GCACAGATCTTGGTGGTAGTAGCAAATAATCGAATGAGACCTTGGATGACTGAAGTGGAG
+AAGGGTTCCGTGTGAACAGTGGTTGATCACGGGTTAGTCGGTCCTAAGCACCAAGCAGCC
+ATTGCGGACGTGCTG
+>ds2020-267_144
+CAGCACGTCGCAATCCTAGCGTAGTCACACTCCGCAGACCTCTCTTGTTGCGGACGTGCT
+GCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCCCTAATTGCTGGTGTGGTCGTA
+GTGCCAGCAGTTGATGTCGTCGACGCTTGTGTGCGGTTTGGGCTGTATGGTGTCATCAAA
+GATGAGGTGCCGATGGCATTGGGTGTGGCATTTTCATGCTGTCTTAGCATGGGTTTAATC
+AGTTGCCATTGTTCTTTGGCGGTGAGTGTTTCACTGTTTAGAAAGCGGGACAGCGAGATA
+TACGGTCAGTGCGTC
+>ds2020-267_145
+CAGCACGTCCGCAATCGGTGTATACTCAGCACGTCCGCAAAGTCTGTCAGTTCAGCACGT
+CCCAACACCCCCCCACTCTTGCGGACGTGCGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTGTAAGGATATCTCCAGTTCCAAAGTTTGCCCTGCCTTGATGGCAATTCGCCAAC
+CATTGGGTACTCGCTCTCGTGTTTGCTTGGCTGTATCAGTCACATAGGCTTCGTACAACG
+CCCCAGTTAAGCAGACACTAATCTCCCCTCTAGTCGCATCCACATCGCTATCACCAAATG
+AACGGTCAGTGAGTC
+>ds2020-267_146
+ACAGCACGTCCGCAAGTCTTTTCGGTTGGAATCAAAAATGGGCTGTCTCCTCTCTGATGA
+TCTTTTCTATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATTTCTTTCTTA
+AAAAAAAAGAAAAAAAGGACATTCGACCCAATACCTTAACCATGTAATTTCTCCGACATT
+ATTTTCTATCGCCACATCAAGGTGACAGGATTCGAACCTATGGCCCTCTGTACCCAAAAC
+AGATGCGCTGACCAGACTGCGCTACACCTCGCGTCTCACCCCCCCCCATTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_147
+GATCTCGCTTAAGGCGACGCACTGACCGTCAAGTCGCCTCTCCATCTTAAGCTAAACCAC
+TCGCAGGCTTATTTGCTACTCACCGACCAAGCGGCGCACAACCCAACGGGCGATTTTGCC
+TTAGAAAATGGCAAGGTTAAGGCAGATGGTACGCCAAAATATACCTTTGCAGGGATTAGT
+GTGATGTCACCAAGATTATTGGATACGGGAGCCAACGGTCAGTGCGTCGCCTAAGCGTAT
+CTAAGGAGCAGCACGTCGCAAATGTCTGGCCCTATTGCGGACGTGCTGAGAAGACTAACC
+TTGCGGACGTGCT
+>ds2020-267_148
+CAGCACGTCCGCAACCTGACTACTCTCAGCACGTCCGCAAGTCTGATACCCTCAAAGTTG
+CGGACTATCTAAGGAGCAGCACGTCCGCAACAGGTGAGTAGTACGGTACGGATATGGGTA
+TCAGTTTTGTATCTTGCGAATAGCTGAGTATGGATTTGGGTATCATTTATGTATCTTTCC
+AATAACTGAGTAGTATAGATATGGGCATCATATTCTGAATTTGAATGTGTATCATTTTTC
+TATCTTGATAATAGGTAAGAAATATAAATTTGGGTATCCGATTTTGTATCCGGAGATGAT
+TGCGGACGTGCTG
+>ds2020-267_149
+CAGCACGTCCGCAATATTCGCACCATTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCA
+GTTCCAGTGTGGCTGGTCGTCCTCTCAGACCAGCTACTGATCGTCGCCTTGGTAGGCTTT
+TACCCTACCAACTAGCTAATCAGATATCGGCCATTCCAATAGCACAAGGTCCGAAGATCC
+CCTGCTTTCATCCACAGATCGTATGCGGTATTAGCTATCCTTTCGGATAGTTATCCCCCA
+CTACTGGGTATGTTCCGATATATTACTCACCCGTTCGCCACTCGCCACCAGACCCATGTT
+GCGGACGTGCTG
+>ds2020-267_150
+CAGCACGTCCGCAATTCACCCGGCATCGATCGATCGCGCGAGTACGCATCTAGTCAGCAC
+ATAGCGAACGAAAAAAGCATTCATCCTGGATTGGATTCTCTTCCTCAATCAAAATGTCTA
+TCAATTGATCCCCATTCATTCGGTCAAAGTCTCACCCTTGAGAGGTGCACCATGTTGATA
+GGAATCGGCAAAGACCCTCTTGTACACATCCTCGAGGGCAGCATTCATGGCAATCATCAC
+TAGTTTATCCCGAGGGCATGGTATGGCTTTGTTCTTGGTGTTGTTTAATAGATTTCGATT
+GCGGACGTGCTG
+>ds2020-267_151
+CAGCACGTCCGCAATCCTTCGTTCTTGATTAATGAAAACATCCTTGGCAAATGCTTTCGC
+AGTAGTTAGTCTTCAATCAATCCAAGAATTTCACCTCTGACGATTGAATACTGATGCCCC
+CGACTATCCCTATTAATCATTACGGCGGTCCTAGAAACCAACAAAATAGAACCACACGTC
+CTATTCTATTATTCCATGCTAATGTATTCGAGCAAAGGCCTGCTTTGAACACTCTAATTT
+TTTCAAAGTAAACGTCCTGGTTCCCTACCACACCCGGAAAGCCCGAACGTCCTTACTTCC
+AGAGATCGGAA
+>ds2020-267_152
+CTTCCAATCTATCTAAGGAGCAGCACGTCCGCAATGTTCTAACCATAAACGATGCCAGCT
+AGCAATTGAATGTAGCTACTAATTTCGGTTCATTCAGTCGCTTTCCGGGAAACCAAAGCT
+TTTGGGCTCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGC
+ACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAAACTTACCAGGTCC
+GAACATAAATGAGTAAGACAGATTGATAGCTCTTTCTCGAATCTATGGGTGCTGGTTTGC
+GGACGTGCTG
+>ds2020-267_153
+TATCTAAGGAGCAGCACGTCCGCAATCAGCCAGCCCTTGACATATGAACAACAAAACCTG
+TCCTTAACGGGATGGTACTTACTTTCATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGT
+CGTGAGATGTTTGGTCAAGTCCTATAACGAGCGAAACCCTCGTTTTGTGTTGCTGAGACA
+TGCGCCTAAGGAGAAAGTCTTTGCAACCGAAGTGAGCCGAGGAGCCGAGTGACGTGCCAG
+CGCTACTAATTGAGTGCCAGCACGTAGCAGTGCTGTCAGTAAGAAAGGAGCCTGACTTGC
+GGACGTGCTG
+>ds2020-267_154
+CAGCACGTCCGCAATCTTGCAGCCCTGAGCTCTCCCTTGATCGTGGGATCGCCTTCTGAA
+AGTTCAGCAAGCACTTTCAAATGGTTACCTTTAAAGGTAGCCTGTTCCTCACGAAGTCTT
+TCGTTGAGGGTCCTAATGGGCTCTGTTCCCATTATGGCAATCTCTCGGCTTTTTGCATCG
+AGAGCCATCTTGACATCCAGTTCTGTCAAGACTAATCCGTCCTTTCTCAAGGCCGAGATG
+ACCGCTCCTTCGACAAAGGAGCTGGGATTGATCTCGGTCGCATAGGCCAAGTACCTTGCG
+GACGTGCTG
+>ds2020-267_155
+CCGCAGGTCCGCGAACTGAGGGGAATTGATAGCTCAGCTTACTGGCTCATCAAATCCTTT
+CTAAGATGAGTCAATTGGGCCTGAGATTGATCTTTCATTTTTGTACGAAGGGTTCTGCGC
+ATCAGGTTTCAGTAAATTTCTTTCAAAGACAACAGGGAGTAGCCAAAGCTCTGGTCCAAT
+AAGAGCACTCACGTGGTTTTTCAAGCCGAAAGCACCACTAGGCGCAGGGGCCGAAGAAGT
+CCTTTTATCTCATTCCGTACCTGACGGTATCACGGAGCGTAGATTGCGGACGTGCTGCTC
+CTTAGATA
+>ds2020-267_156
+CAGCACGTCCGCAAGAGTTCTTCCCTCAACCAAGCTGTCTCTCGACTGTTAGTTTGTCTT
+ACGCCTTCCTGAGACGCAGACTACTGCCTACTGTTGCAAATAGTACGCAGGCTCATCATT
+TATAACGCGCGAGTAGCACCGCGCATAGCTATCAACTTCGCCTTAGTAACGCAGCTCACC
+CAGCCTGTCCTTACCGACCTAGAGTCACTCCCAGCCTAACTAGCTATCTACGGCGAAATG
+AAAAGACTAGCTAACTGGAGACGAAAGCACAAATGAAACGAGGTTGCGGACGTGCTGCTC
+CTTAGAT
+>ds2020-267_157
+ACAGCACCTCCACAAAAGGGGGACAGTAGGTTTATGAGAAAGGGATGCTCTTATCATGTT
+CTTGCTGAAAAGAAAAACCGAATTCCTCTATTTGATGTCGATTCATCCACACTTCCATTC
+TTTGTAGAGGAAGGCTAACTGCTTGCTGGCTGGGAGCTGTATGAGCGGTAACGTCCACGT
+ACGGCTCCGTGAGAAGGTCGGTGGACAGAAATGGCCTTGTTGTACCTCACTCTCGTCTTC
+AATGGGGTCTGCTCTTTTTTTTGGGAGAGTATGCCAATATGATCTCAATAAGGTTGCGGA
+CGTGCTG
+>ds2020-267_158
+CAGCACGTCCGCAAAGTTTATCCCCTCAGCACGTCCGCAATTACGAGGAGATGGGGTTTG
+CGGACGTGCGCTTAAGGCGACGCACTGACCGTGTTTCTGGGGCTGACGCACTGACCGTAT
+AATGCACCCTGACGCACTGACCGTGCAAAGGGGAATTGGACGGTCAGTGCGTATCTAAGG
+AGCAGCACGTCCGCAAGTGATCTACCCTCAGCACGTCCCAAGGCCACACCATTGCGGACG
+TCTGAGTGATCGGAGTTTGCGGACGTGGATGGCTCCTGATTTGCGGACGTGCTGCTCCTT
+AGATA
+>ds2020-267_159
+ATCTAAGAGCAGCACGTCCGCAATCGGTCACCCTCAGCACGTCCGCAAACTCCCGCCTCG
+AGCACCATCAATGACTATCAAGAAGCGTATTTTACTGTCATCAAGCAGCCAAGCATCGAT
+GCGGCTGCAGCCAGTGACCCAAACACCCTCAATCAATTTGACTATATACCCATCAACTTA
+CGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATACTCATCGGGT
+TTGGTGGGACTGTAGCCCAATTGGCTTGCGGACGTGCTGAGTACCGGCATTTTGCGGACG
+TGCTG
+>ds2020-267_160
+CAGCACGTCCGCAAGGGTGGCGGAATTAGTAGTAACTTTAGCTGTTCATCAGCCTGGGTG
+CCGCTGACGGATCGCTAGTCCTGGCTAGTTTTACGTTTACTGAGAGCCTACCCCAGCATT
+GACGAGAACCGATGTTTACCCTTACACCGGGCGCTTCCACCACCCCAGCCCCTCCCTCCC
+ACCGCATGTAGAGAAGGGCGCTAATAGTTGGCAGTTGACAGCTCAATCGCTGTGGCAACG
+TCGACATTGTACGCTCTCGTACGCCCACCTATCACTTCATCGACTCTCTGTTGCGGACGT
+GCTG
+>ds2020-267_161
+GACGCACTGACCGTTACTTGCCGGATTATACCAGTGTTTACCTTTCTTACTACAGAACAC
+CAGCTTTCCACATTAGACTTTTCCTGCTTTACAGCCTTTACATCTTCTCTTCTCTTCTCT
+TGCCTCTTCATACAGCCAACTTCTTCCCCCTACTCAAAATTTAAGTTTCATGCCAACATT
+TCAGAGGGAGCGCCTATACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCA
+CGTCGCAAAGGATTCCCCTTTTGTTGCGGACGTGTGAGGCTCAGTCGTTTGCGGACGTGC
+TG
+>ds2020-267_162
+GATCTATCTAAGAGCAGCACGTCCGCAATGGGCCTCCCTTACCTACATTATTCTATCGAC
+TAGAGACTTTTAACCTTGGAGACCTGCTGCGGATATTGGTACGGTCTATTGAGAATGTTT
+ACGTGGCCCTGGCATAGATTTTCAAGGTTCGAGGAAGACGCACGCGACACAGCAATATAG
+GCCATGCTCTTCTAGTCCATCAACCATATCTCTCTTCGAAAGACTTCCATGGTTGTACGA
+CTATAAAACAGAAAAGAAAACTCTTTCGGTGCGCACCGACGATTTCTCTAAGCCAACAGA
+A
+>ds2020-267_163
+CAGCACGTCCGCAACATCGCCCACATTGCCAACGCCTGTCTGCGGATTCTGGAACAAGCA
+AGACAGGAAAGTCGTAAGCCATATCCTCCCATCCATCATACGCCTGACGAAGTATCTCAC
+GTTGTTTGCAGTCCGGTCTCCATCTTGCTTGAGTGGCAGCCCTGTCACCGGAGGCCTGAT
+GTTGGCTTCGTCATTCGTTGTCGTGTAAGTCACCGTGACGGCTGGTGCACTCACTATGTC
+AACTATGACGATCCTTTCACCTGAACGTGACATCACCCCGAACTTATTGCGGACGTGCTG
+>ds2020-267_164
+TATCTAAGGAGCAGCACGTCCGCAAGGTGGACCCCCTCAGCACGTCCGCAAGTACAATTC
+GGTCAGCACGTCCGAAAGTCTCTAAGTTGCGGACGTGCTGCTCCGTAGACGCTTAAGGCG
+ACGCACTGACCGTTTCCCTGCTGCTCCAATGTGCAGCGGATTATGGCGATTATGTGTGAG
+CTGGATGAATACGATGCTATTTATGAGATTATCAATACAAAAATTGACGGGCTAACCTTG
+GGGATGAGTGTGGGCGTGCATCCCTGCGAAGACAGTGCCATGGCTACGGTCAGTGCGTC
+>ds2020-267_165
+GGACGTTCGGGCTTCACGGCAACACTTCCCAAGCCCTCAAACACCTTGCCTACACTTCCA
+ACTGCCCCAACTCTGCCCAAGACCACATTGCCTCCACTTCCCTCAACCTCATTGCCTACG
+CTTCCAACTGCTCCAACTTTGCCAAAGCCGGCCACGTTGCCACCGTTGCCCTCTACCCAA
+TTGCCTACTAACCCAACAAAAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGAGCAGCA
+CGTCCGCAACACAATCTCGCTCGCACGTCCGCAACTATGGCTGAATTGCGACGTGCTG
+>ds2020-267_166
+CAGCACGTCCGCAAGGTGGAGCCTCCAGCACGTCCGCATATGGAACTCGTTGCGACGTGC
+TGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCGAAGCGACTTCTGTTGAAAAA
+GGAGCGGATGAGGTGTGGTTAGGGGTGAAATGCCAATCGAACCTGGAGCTAGCTGGTTCT
+CCTCGAAATGTGTTTAGGCGCAGCGGTATTGATTATAGCCGGGGGGTAAAGCACTGATTC
+GGTGCGGGCTGAGGAGGTCACTTTGCGGACGGAGAGGTCGGGTCTTGCGGACGTGCTG
+>ds2020-267_167
+ACGTGCTCGCTTAAGGCGACGCACTGACCGTATCTGGAGAGGTCAATAATAGTCGCCCAA
+AGTGTCGCACTGGCAATGCGGCTTTCTTGCTTGGTCGCGGCAAGATAGCCTAACGTCAAT
+GCGGTCAACATACCCCCAATACAGTAACCTGTAATAATGATGGTTTTTTCACCCGAGCTC
+TCATCCCACGGTCAGTGCGTCGCCTAAGCGTCGTCCGCAATTTCGGTTGGTTCTTGCGGA
+CGTGTGAGGGATTAAGAGTTGCGGACGTGCTGAGGGGTGTTCCGTTGCGGACGTGCTG
+>ds2020-267_168
+CAGCACGTCCGCAAAGTAAGGTGGTTTGTGTTACCCCGTTTGTCTAGCATGTCCCAGTAC
+AGTGGTATGGCAATGCCCTTATAGACCACCCCTAGCATAAATATGTTGATGTTGCTTTTC
+CCCCATTTCCAGTTGGTGCGGTCAATGGTAATGGTGACTTTGCTAAGTCCAAATAGCCGA
+TATATCAATATGGCTAGTTGGTCATAGTCTATGACAGCACTGGCGATAAATCGCTGTAGC
+CTGCGGTATTGACTGTCCGTCTTGCCACTTTTAGGTAAGTTTCCTTGCGGACGGGCTT
+>ds2020-267_169
+CAGCACGTCCGCAATCCCTTTATAGTTGCGGACGTGCTGAGTGTAACTCGATTGCGGACG
+TGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCTGGTGGGGGTACCTTTAA
+TAAGATAGAGCTATTAGAGGAATATCCAGATAAAGAATATAATGGAGAGGATGTAGTAAT
+TTATAGTCTCGGAGAAAGGTATTTTTTTAAGAATTCAAGGGAGAGAACCTTTGGAAATTT
+TAAGCAGACTAAACCTTTGCAGCTTGAAGAGAAGTGGGCGACTACGGTCAGTGCGTCG
+>ds2020-267_170
+GACGCACTGACCGTCGCCCAAAGACAGGTTGGAGAAGGCAGTGGCAGCTGCATGGGCTTT
+GGGTTTTACAGATCTGGAAGGCAGTCCTGGCTCAGTCCCTGTACCTTAAGGAAACTCAAA
+CAACTTATTTGGCCTTTCTGATCATAATATATATCATTTTTGAAATGGGAGAAAACGGTC
+AGTGCGTCGCCTAAGCGTCTAAGGAGCAGCACGTCCGCAACCCGAGTTACTTGCGGACGT
+GCTGAGGGCGCGAAACTTGCGGACGTGCTGCCCTGTGCAGATTGCGGACGTGCTG
+>ds2020-267_171
+CAGCGCTTAAGGCGACGCACTGACCGTGCTTCCCTCCCCCTGTAATTGATTCTTCCTGGG
+TCGATGCCCGAGCGGTTAATGGGGACGGACTGTAAATTCGTTGGCAATATGTCTACGCTG
+GTTCAAATCCAGCTCGGCCCAATAATTCGCCGATCCACCATGAAATAATATAACCCATAG
+TGTTACGGTCAGTGCGTCGCCTTAAGCGTCACGTCCGCAACCATCGTAGTTTCGGACGTG
+CTGAGGGGATCAATTTGCGGACGTGCTGGGGTCCCTGGTCTTGCGGACGTGCTG
+>ds2020-267_172
+CCAGCACGTCCGCAAGTGGCAGGCCCTAGTATGTTCCTCATTTAATGAGTTCAGACCGAC
+GGTTTCTAGAAGAGAAGTTAGGACGTGTTTCACCTCCCTTACTTCTCCTTTTTCGGAGAG
+ATACTGTAATAGATAATCATCTATTAGTTGTGTCTTCTTTAACTGCTTGGTTTTAGGATC
+CAATACTGGATTATTACCAAAGAAGCTATGATCCCTACGAAGAGCTCCAAGCGTAAGCTT
+GGGGTCATTCCGGAATTTAGATCGAACACGGATGGCTATTTGCGGACGTGCTG
+>ds2020-267_173
+CAGCACGTCCGCAAACAATGTCCTCTGCTGTTTTCCTGTCTACATCGCTTTCGCGGCTTT
+CATCTCTTACGTCATCTTTATCCTTCACCACTTCAGCATATGTGGGTTTGCTTGATTCGA
+CACTTCTATTCGTTCCAGAATCCCTCGACTGCTCTTTGGGCTCTCCGTCGTTTCCTTCGC
+ATGTCGGCTCATTCTCTTCCGCGCCCATCTCACTCACCGCTTCATTTTCCACTAATCTAA
+GCGATGCTTTCTCACGCCTTCCTTTAGCCTCCTGTCTTTGCGGACGTGCTG
+>ds2020-267_174
+CAGCACGTCCGCAATCCAACTGCTCAGACTCCGCAATCAACTCGTCGTCAATTCTAATGT
+ACCGCTGATCCATACTTACTATTGGCAGATTTTCGTATGTGTTGAATCTCATGTTTGTGT
+CTCTCGAACTGCCGGAGGATAGTGCATGTAGGGGTAGATCTGGTTCCTCCTCTTCTTCCT
+CATCCTCATCCCCAGCATTGCTAGGTGGAGCACGAGGTCTTTCATTCAACGCACCTCCAA
+AGCTCCGCAGCACTCTGGAGTCATCATTGCCCCTCATTTGCGGACGTGCTG
+>ds2020-267_175
+CAGCACGTCCGCAACCGAACTGCACTCAGCACGTCCGCAAATGAGACCCCATGTAGATTG
+CGGACGCACTGACCGTCATTCAGCGGTTCAGGTACGGTCAGTGCGTCCCGGATATTACGG
+TCAGTGCGTCAGGGAAGATCCCACGGTCAGTGCGTCACGCTAGAAAGCACGGTCAGTGCG
+TCGCCTTAAGCGTCCGCAAGATCTTAGGGGTTGGGACGTGCTGGGATGGGCTGATTGCGG
+ACGTGCTGCCGGCGACCTATTGCGGACGTGCTGAGGGGATGGACATTGCGG
+>ds2020-267_176
+CAGCACGTCCGCAAGCCAAAGCCCCTTCTATTGCGGACGTGCGAATGGTATCGTGTTGCG
+ACGTGCTGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTTCGCATTTCCCTGGGGTG
+TCTTCATTCCAAGCACTCGCTATGTCACTCGCAGGTCGTGTGGGTACAGGCAATATTGCC
+GGTGTGGCAACGGCGATTACCTTTGGTGGTCCTGGTGCATTATTCTGGATGTGGATGGTG
+GCAGACACGGTCAGTGCGTCGCCTTAAGCGGCGACGTGCTGCTCCTTAGAT
+>ds2020-267_177
+AAGCCCACTATTTCAAACTTTGCTTTTGCTACACTTCTTTGCTCTCTTGACCATCTGTGT
+TTATTCCCAATGGCTTTTCCCCTGTTTGTTGATACCTATGAGCATGTTGCAAAACATGAC
+AAGAAATATTATGGATCTTTCCCAGCCACCTTCACTTTGGTTGCTGGAGGTGGGGTGATT
+GATCTTGAGAAAATGTTTTCTGGAGTCCGCAAACTAAAGCGCCATTTGACGCTACACCGA
+ATGTTTGCGGGCTGTGTTCTGGGCACAGAAGCTGCTTTGCGGACGTGCTG
+>ds2020-267_178
+AAGGAGCGCACGTCCGCAACCTACCAGCCTTAGCACGTCCGCAACTCAGGGGATTGGGAC
+GTGCTGAGGGGCTAGTGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTTGTCGCTGCATTGTGTTAGTAAAGGAATCCTTACATCGAAACTTCCGAAAGGA
+TGAAGGATAAACCTATATGCATACGTATAGTACTGCAATACTATCTCCAAATGATTAATG
+ACGGCCCCGTAGACGGTCAGTGCGTCGCCTTAAGCGAGATCGGAAGAGCG
+>ds2020-267_179
+GCGACGCACTGACCGTCCAAATATGCTTAAGACGGAAGAATCCCACGAGGCGAGTAATCT
+CACCCCATGAACACGCCACCGCCATCATACCTAAGAAGGCTGTTAGGCTCACCATCAACA
+GCGATAACCCATCAATGGCCAGAGGGAAACTGACCCCCAATGAGGGCATCCAAGGTAAAC
+ATGGCAGAGCACGGTCAGTGCGTCGCCTAAGCGTAAGGAGCAGCACGTCCGCAACGTAAT
+GTCGGTCAGCACGTCCCAATGATGAGACCCTAGTTTTTGCGGACGTGCTG
+>ds2020-267_180
+CACTGACCGTGTGGTCGCTGATGTGGAAAGAAAGTGATCCTATCGCCATCAAAATGGGCT
+TAGCCTGGGCAGTCATCGGTCTAATTTACTTGGCATTTAAAACCGGTGGTTTTAAGCGTC
+ATCCACCTATGCACAATGAACATGAGAGGGGCTGCGAAACGGTCAGTGCGTCGCCTTAAG
+CGTATCTAAGGAGCAGCACGTCCGCAACTTGTATTCTCTCAGCACGTCCGCAAGGGGTAT
+TTCCTCAGCACGTCCGCAAGCTACAGGCCTTAGGAATTGCGGACGTGCTG
+>ds2020-267_181
+CAGCACGTCCGCAATCACTGGTACCTTTTGCGACGTGCTGACGGTAATGATATTGGGACG
+TGCTGAGGCAGTGGCACTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTTCATCCGGCCTCCAGCTTCCAAGCGGCTGCACCGGCAATCAGTCCGCGAAACA
+TATCATTCATAATTAACACTCCCCTTTTTCGAACTATGTGTATTGAAAGCAGTCAGAAAC
+CGCCGCTTTCACAACATTCGGCAATCAGCGTTCCAAAGATGTGTTCAAA
+>ds2020-267_182
+ACGGTGATAACCGAGAGCTGCGGAGAGAGGCTAGCTCTTTGCTTGCACGGGGGTCTGCGG
+ATGTCTGGAAGTAAGGGCGTTCGGGCTTTCGATTCTGGACGTTCGGGCTTTCGCTGGTGG
+GTATGAAGCCCGAACGCCAGGATTCAAGGAAGCCCGAACGTCCTTACTTCCAGACACGTC
+CGCAAAATACCTGTGGTCGATTGCGGACGTGTGAGGATTCGTGTCTTGCGGACGTGCTGG
+GGAATTTATCTTGCGGACGTGCTGAGGGCGAGGATCTTGCGGACGTGCT
+>ds2020-267_183
+CAGCACGTCCGCAACACCAGATCCCTGTGGTAACTTTTCTGACACCTCTTGCTAAAAACT
+CATTAATGCCAAAAGGATCGATAGACCGGGCTTTCGCCGTCTCTATGTTTACTGAACATC
+GAGATCAAGCCAGCATTTGCTCTTTTGCTCTACGTGTGGTTTCTGTCCGCACTGAGCTGG
+CCTTGGGACACCTCCGTTATTATTTTAGAGATGTACCGCCCCAGTCAAACTCCCCACCTG
+GCAGTGTCCCTGACTTGGATCGCGCCAGGTGGGATTGCGGACGTGCTG
+>ds2020-267_184
+CAGCACGTCCGCAATCTATTCCGAGTTTAGGAACCTAGGTAATAGTATCCCGATCAAACA
+GCTGACGAAGGGGATGAGCGAAACAGGGAGTCTACTAGACGGGGTTCAACTAGCGGACAC
+TCTTGGAACGGCCGGAGTAAGAAGTCCCCAAGTGAGCGTATTATGGGGGACCGTCAAGCA
+CATCCGGCAAGAATCAAAGGGGATCTCGTTGTTGCATAGCTCAGGTCGGAGCAAGGCGCC
+ATCGGACGTTCAACGGGCAACCTTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_185
+CAGCACGTCCGCAACCCAACTCCCATCAATTAACCTTCCGGCACCGGGCAGGCGTCACAC
+CCTATACGTCCACTTTCGTGTTTGCACAGTGCTGTGTTTTTAATAAACAGTTGCAGCCAG
+CTGGTATCTTCGACTGATTTCAGCTCCACGAGCAAGTCGCTTCACCTACATATCAGCGTG
+CCTTCTCCCGAAGTTACGGCACCATTTTGCCTAGTTCCTTCACCCGAGTTCTCTCAAGCG
+CCTTGGTATTCTCTACCTGACCACCTGTGTCGTTTTGCGGAGGTGCTG
+>ds2020-267_186
+CAGCACGTCCGCAAAAGTCACACCTTTTCAGGGAGAGCTAATGCTTGTTGGGTATTTTGG
+TTTGACACTGCTTCACACCCAAAAAGAAGCGAGCTACGTCTGAGTTAAACTTGGAGATGG
+AAGTCTTCTTTCGTTTCTCGACGGTGAAGTAAGACTAAGCTCATGAGCTTATTATCCTAG
+GTCGGAACAAGTTGATAGGATCCCCTTTTTTACGTCCCCATGTCCCTCCCGTGTGGCGAC
+GTGGGGGCGTAAAAAAGGAAAGAGAGGACAGGGGAAGCCCGAACGTCC
+>ds2020-267_187
+GACGCACTGACCGTTTTTTTACCGATTTCAAGTACTGGGCATTTAATTCTTGCCGACTCT
+CTGTTAAATTTTTGGACCAAAGACAAAGCCGACTTGTTTATCGCCGTCATTCAGCTGGGT
+GCGATTTCAGCGGTAATTTATTTGTACTGGGGGAGGACCAGTGTCACGGTCAGTGCGTCG
+CCTTAAGCGGTCTAAGGAGCAGCACGTCCGCAAGAGCCATTTCGTTGCGGACGTGGACCT
+GACCGTTTTGCGGACGTGCTGAGGACAGCTAGCTTGCGGACGTGCTG
+>ds2020-267_188
+CAGCACGTCCGCAATATCCCCGTATTCGACATCGGCCCACGATTTCACGTTGAGGGGCGC
+AGGGGCCCAAAACACCTCTTTTTCGGCCTCGTCAGGATTCTGAGCTGTGCCGCTTTTCGA
+GCTCTTGGAGGAACCCTTCTCGTCCTTCTTCTTCTTCTTCAAGCTCCCGAGCGCCGCAAA
+CACGTTGGTGCTATTCAGAACCACAGACTCGTCCTTTCTGTTCCCGCCTCCCACCATTTC
+TTAACCCAGCGTAAGTCTAGACTTACCGAGCTTTGCGGACGTGCTG
+>ds2020-267_189
+CAGCACGTCCGCAATCGATCCATCCCCCGTTTTTCTTTTCTTTGCTGATTCCTCTCAATG
+AAATTTGCCATGTTGCACTAAGTTACTTACGGATGTATGCATGCAATCCGGGAACACTTT
+GGGGTGAACACCCATCCGAACAAGTAGGGTCAATAGTTCAGCATTTAGGCCGTAACATTT
+AGCAAAAAAAATCTTTAACCCAACAAGTGCTCTCCGAACCAAGCTAGATAGTCTCCTATC
+ACTAGGCTCACCAACCAACCTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_190
+TATCTAAGAGCAGCACGTCCGCAAACGGTGGCCCCTCAGCACGTCCGCAAAGTGGTTGTA
+TTTTGGGAGGAGTCGCGTAGAATTGCGGACGTGTGAAGAGACCACCAAACAGGCTTTGTG
+TGAGCAATAAAGCTGTTTATTTCACCTGGGTGCAGGTGGGCTGAGTCTGAAGAGAGTCAG
+CAAAGGGTGGTGGATTATCATTAGTTCTTATAGGTTTTAGGATAGGTGGTGAAGTTAAGA
+GCAATGTTTTGCAGGCAGGAGTTCGCGATGCACGGTCAGTGCGTC
+>ds2020-267_191
+GCTCCTTTATGTAAGATGGATAAATTCCCAGATTAAGACATGAACGAAATAAAAAAAAAT
+TCCACCCATAACATCTATGTCAGCTTTTCTGTCTGAATGTATTCAGAACAACCCGCTTTC
+TAGACGATCCCTAATAGAAAAGAGGGGGGCTAGGGGTTATAGTCGACGTTGATTCATCAT
+TTTTAACGTCTCTAATTCAAAACTGAACGTGAAACTTTGGTTTCATTCGGCTCCTTTATG
+TAAGATGGATAAATTCCCAGATTAAGACATGAACGAAATAAAAA
+>ds2020-267_192
+CAGCACGTCCGCAAGGCCACCGACCTAAGTTCCTTGGAACAGGACGTCATAGAGGGTGAG
+AATCCCGTATGCGGTCGGAAAGGCGCTCTATACGTAGCTCCTTCGACGAGTCGAGTTGTT
+TGGGAATGCAGCTCTAAATGGGAGGTAAATTTCTTCTAAAGCTAAATATTGGCCAGAGAC
+CGATAGCGCACAAGTAGAGTGATCGAAAGATGAAAAGCACTTTGGAAAGAGAGTTAAAAA
+GCACGTGAAATTGTTAAAAGGAAAGGGAATTTGCGGACGTGCTG
+>ds2020-267_193
+GACGCACTGACCGTGGGCTTCCCCGTTCAGATATCGCCGGATCACAGGATATTGCCGCCT
+CCCCGACGCTTTTCGCAGGCTGTCACGTCTTTCATCGCCTCTGACTGCCAAGGCATCCAC
+CATGTGCACTTCATTACTTGACTATACAACAGGGCAACCGCGACGGTCAGTGCGTCGCCT
+AAGCGTATCTAAGGAGCAGCACGTCCGCAATTTGGGTCCCCTCAGCACGTCCGCAAGAAG
+CCTCACTCAGCACGTCCGAAAGTGTGCCTATTGCTGACGTGCTG
+>ds2020-267_194
+CAGCACGTCCGCAAGCACCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAA
+TGGGGGCAACCCTGATCCAGCAATGCCGCGTGAGTGAAGAAGGCCCTCGGGTTGTAAAGC
+TCTTTTGTCAGGGAAGAAACGGAGTTCTCTAATATAGGATTCTAATGACGGTACCTGAAG
+AATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAA
+TCGGAATTACTGGGCGTAAAGCGGCCCCATTGCGGACGTGCTG
+>ds2020-267_195
+CAGCACGTCCGCAATTCGGTTGCCCTAAGCGTCGCCAGTATCAACCTACTCAAAGAGGTC
+GGTGCATGGCAGCGTATCGAACAAAGCAAACGCAAAGCCGACTATACCCAAATGCAGGTA
+TGGCAAACCAATGGCGTGGGCGAGCTAAATTTTGGTGATGCTCAAACACCGCAATTATTG
+GGCAGTATGGTTGAGCCCTTTATCATCGAAAAAGCGCTGTATGACGGTTTTGACAATGAG
+AGCCTTGTCCATCAGGGAGACATGTGACTTTGCGGACGTGCTG
+>ds2020-267_196
+CAGCACGTCCGCAATGAGATGACGGTGAGCTGGATATCAAGAAATACTATGATATCATCC
+AAGAAGATCGAGTTTATATTTTCTTGGATGGTTTGGATGATCGACTTGACAAAGCCCGAA
+GTGATGTGCTCCAAATGAGTCTATTTCCTACAGTAGAGCAAGCCTATGCTCATGTTCGAC
+GAGAAGATATTCGACAAGCTGTGGTGTTAGGAGCTCCAACACCAACCGGAGTGGGGTTGC
+GGACGTGCTGGGGAGAATGAATTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_197
+CAGCACGTCCGCAAATGCCTACTCATCAGAAACCAACCATCGCCATCAGAACCTAACTAA
+AGTTCAACTCCAAAATATTACCCAAATCTTGAACTTCACTGCAAATAATCTTTGATTAAT
+CCTCTAAACGAAGTAACCTCAAGATGTCCTTAATCCACCTCCATTGGTCGAAAGCCCATC
+TGAGTAGAACTCATAGTTGACCAAAATCAGCTTAAGAATCACAAGCCGAAACCAGTAGAG
+ACACAGAACCCCTGGCCCGTTGCGGACGTGCTGCTCTTAGATA
+>ds2020-267_198
+CAGCACGTCCGCAAACCTTCCCACCTTTTGACATGCCTGGACCGCCAGAGAGATCTGGCT
+TTCTCTTCGGAGACTAGGACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGAT
+GTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTTTCCTTATTTGCCAGCGGGTTAAGCCG
+GGAACTTTAAGGATACTGCCAGTGACAAACTGGAGGAAGGCGGGGACGACGTCAAGTCAT
+CATGGCCACGGAGATCGAATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_199
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAAAGTATCCCCTCCCTCAGTGAAACT
+ATGAACCCGGGCCCAGGCTCAAATTAATATTAATATAATAATAGAGTGGAAATGAAAATG
+TGATGGTTGGGGCAACTATATCATACAAGATACTTAACTGAAAATACTGTACGGAAGGTC
+GATGGTAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAATTGA
+AACCAGTCACACTCGCAAAAACATAGGACTTGCGGACGTGCTG
+>ds2020-267_200
+TATCTAAGGAGCAGCACGTCCGCAAGGCATTACGCCTATTGCAAAGGCTATTGGCTTTTG
+ACCCGAAGGATCGACCAACTGCTGAAGAGGCACTAGCTGATCCTTACTTCAAAGGTCTAG
+CCAAAGTTGAGAGAGAACATTCTTGTCAGCCTATTTCAAAGCTGGAATTTGAATTTGAAA
+GGCGAAGAGTCACAAAGGAGGACATTAGGGAACTAATTTACCGGGAAATACTAGAATACC
+ATCCTCAGCTACTTAAGGACTACTTGATTGCGGACGTGCTG
+>ds2020-267_201
+CAGCACGTCCGCAAATGGAGTTGAGTTTTTCTTAATGGGTGGTGTGCTTTCTCTCACGGC
+TGGCTAAGTGGCGATTGACACCAAGAGAGGGTGAATATCAGCCATGAAAGTAGAGATCAA
+GTTCCCGGTTCTATGAAGTCGAACAAGGGCGTGAATTCGAGATCGCGGGCAGCGACTCAC
+GACTAAGTGGACACACAGGTCGCTGAACGTGGTGCACGACAAGGACAGTCGGTTCTCGTT
+GGTGACAAACGGATACAACGCCCTACATTGCGGACGTGCTG
+>ds2020-267_202
+CAGCACGTCCGGAAGCACTGATCGGTCAGAGGTCAACATAATGGCTGGCTGCGTCGTCGG
+GTCAGAGGCACGTGTTACCACGGTAGCTACTGAGCTGAAACGTTACGGTTTTGAACTAAG
+GGTTAGCGATAAGCTCGCTCTAGGCGTCGGCAACCCAAGGAAAGACTACGCGTTCACGAC
+CAACGCTCAGCAGACAGTTGCGGCAAGGATAGAGCGAACAAGCCGTCAAATCGGTAAGCG
+CGCTGCTACAAGCACGTTCATGTCGAAGCTGACCGTGGCGT
+>ds2020-267_203
+CAGCACGTCCGCAAAGGAACCGCCCTCTTTGGATGGGTAGAAAGAATAAGTACAATTTTG
+AATGTTTTGCTTATCCACAAAGTAACAAATATTATAATTGGATCGTTCAATCATTTTTCA
+GTCATTCATTGAATGATAAATCACTACAAGTGAAGGAGATACACGATTTAAATAACGAAA
+GATCCAATATTTAAAAATTGTATCTAAAATGACTGGAAAAGTAGAAACAAGACCGATACG
+GCTTGCGGACGTGCTACCCAGGTGTTCTTGCGGACGTGCTG
+>ds2020-267_204
+CAGCACGTCCGCAATTGGATACCGGTCATTCACTGAATTCGTTGATAGAGTAGGCGGTGT
+GTCAAGGTACGGAGCACATTTTTACGTCGATCACCACGTGTTTGCATCTTCATTTGAGGA
+GGGCCACGTCCTTGGCGATGTTGTAGAAGAAGAGGACTATAACGCAGCAACCATTTGCGG
+ACGTTACGCGTCGGACATAACCTTTTCCTGCGAGTCAGAAACGCCAGATTTTGAATTGGT
+AGCAAGATTTCTGTCGTCGGAAGCTGCGGACGTGCTGAG
+>ds2020-267_205
+GACGCACTGACCGTTCGGGTTTTTCTGTTCTGTTGTGGGAAGGGGGGATTTTCGCATCTA
+CAAGTTGAGAGTGTGCTGGGGCAAGTGGGCTAACCCGAACTCCCTGTAAGGGGCTTTTCC
+TTCAATAGGAATAAGGGTAATGTAACTCTTGTTTGAGAACTTTAGCTACGTACTTAGGTT
+AGTTAGCTCAGCTTCTCCTATGTCTATTTGGATTAAGGAAGTGGGGTAATGGGCAGACAA
+GGAGGTCCTAATAATGGTGGGTCGAAAGCCCGAACGTCC
+>ds2020-267_206
+CAGCACGTCCGCAAGAAGCCGCCCCTTGTTTCAAAGAGAGGAGGACGGGTTATTCACATT
+TCATTTGATGGTCAGAAGGCCGTATGCTTTGGAAGAAGCTTGTACAGTTTGGGAAGGGGT
+TTTGATTGATCAAAAAGAAGAATCTACTTCAACCGATATGCCCTTAGGCACGGCCATACA
+TAACATAGAAATCACACTTGGAAAGAGTGGACAATTAGCTAGAGCAGCAGGTGCTGTAGC
+GAAACTGATTGCAAAAGAAGGGAAATTGCGGACGTGCTG
+>ds2020-267_207
+TCTGGAAGTAAGGACGTTCGGGCTTCCCTATACCTTCTGCATAATGAATTAACTAGAAAT
+AACTTTGCAAGGAGAGCCAAAGCTAAGACCCCCGAAACCAGACGAGCTACCTAAGAACAG
+CTAAAAGAGCACACCCGTCTATGTAGCAAAATAGTGGGAAGATTTATAGGTAGAGGCGAC
+AAACCTACCGAGCCTGGTGATAGCTGGTTGTCCAAGATAGAATCTTAGTTCAACTTTAAA
+TTTGCCCACAGAACCCCCTCAACAAAGCCCGAACGTCC
+>ds2020-267_208
+CAGCACGTCCGCAATACCCATGCGCTACAATGGCGACTACAGAGGGTTAATCCTTAAAAG
+TCGTCTCAGTTCGGATTGTCCTCTGCAACTCGAGGGCATGAAGTTGGAATCGCTAGTAAT
+CGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACAC
+CATGGGAGTTTGTTGCACCAGAAGTAGCTAGCCTAACTGCAAAGAGGGCGGTTACCACGG
+TGTGGCCGATGACTGGGGTAGATTTGCGGACGTGCTA
+>ds2020-267_209
+CAGCACGTCCGCAATATACCACGCGTTACTGGTTCCCGGAAGAGTTAATATCTCCATTAG
+CTAAACCCTTTCTTACCCTTCCCTTGGACTCGTATTTTGTTTGTACACAATCAACGGAGG
+CCTCCCCGACATATGTTGCAACGTCTTCAATAGCATGCTCTTATTTCGTCTTTCCCTTAA
+TAAGTCATCAAATTTGGTGCTTTTTGATCCCCAGTTGCTATGGAGAACAAAGGACGAAAT
+AAGAGCATGCTATTGAAGACGGTTTGCGGACGTGCTG
+>ds2020-267_210
+CAGCACGTCCGCAACGGTCGACCTCTCCTGATGTATCTGTCAGTAATGGAAGCATCCATG
+AGTTGTGTCCTTGGTCAGCACGATGAAACGGGTAGGAAGGAAAGAGCCTTATACTATCTC
+AGCAAGAAGTTCACTGATTATGAGACAAGGTATACGGTTCTAGAAAAGACCTGTTGTGCT
+CTTACACGGGCCTCGCAACGCCTACGCCACTACATGTTGAACTATACGACCATGCTGATT
+GCAAGGGTGGACCCGGTGAAGATTGCGGACGTGCTG
+>ds2020-267_211
+CAGCACGTCCGCAACCACGGCCCCCTATCGAAACGACAGAGTTGTCGTCGTTTATAGCCT
+CATCGACGACGAGACGGTTCGGCGACTTCTTCCGCTCCAGAATCGCGGTCGAGAAGTCCT
+TCTTCTTCGAGTCGGACGATTCGGCTGGGTGAGCCATGGTGGAGATTTCAGAGATCAGGA
+AAGTACGGTAGACGAAAAGCAAACAGACCAAGAGAGAGAGAGAGAGAAAGAGAACATTGC
+GGACGTGCTGAGGCCCATATTTTTGCGGACGTGCTG
+>ds2020-267_212
+CAGCACGTCCGCAATCCGAGACCCCACCACGCGAAATGCTTTTCATCGTTGCCATGAAAA
+TTGCCATTTTTTATTTTGGTCCTTTGTGGTTTTTGCCGTCCCACGTTTAATCAATAATGC
+CACACAGGCGATTGGATAAAGTGGGGCGGTGGGGGTCAAGGGGAGGGCCTACCGACGGTC
+AGTGCGTCGCCTTAAGCGTATCTAAGAGCAGCACGTCGCAAGATGTTAACAGTAGCATTG
+CGGACGTCTGAGGACAGCGTGTTTGCGGACGTGCTG
+>ds2020-267_213
+GGACGTTCGGGCTTCCTAAAGCGGTTATCCCTTCCGAACATAGCTACCCGGCGATGCGAC
+TGACGTCACAACCGGTACACCAGAGGTTCGTCAACTCTGGTCCTCTCGTACTAGGAGCAG
+ATCCTCTCAAATTTCCAGCGCCCACGGTAGATAGGGACCAAGCCCGAACGTCCAATCTAA
+GGAGCAGCACGTCCGCAACAATCAGGCGTTATTGCGGACGGCTGACGGGCTGCAAATTGC
+GGACGTGCTGAGTGGATACCGTTTGCGGACGTGCTG
+>ds2020-267_214
+TCTAAGGAGCAGCACGTCCGCAAGGATCGGCCGCTTCCGCAAAGACCTAAGGGTTGCGGA
+CGTGCTAGGGTTGAGGTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTCTACTGTTCGGTATGGCGTCGTTTGGGTAGTGAAGTGGTAGTGTTTGAAGCCA
+AGCCAGAATTTTTGGCAGCGGCAGACAAAGCGGTGAGCAAAGAAGCGGCAAAACTACTAA
+AAGCCCAAGGAGTAATGTCAAAACGGTCAGTGCGTC
+>ds2020-267_215
+TATCTAAGGAGCAGCACGTCCGCAATGTTCTCGTCGTTTCTTCGTGGTCGTAACAATCAC
+TTCAAGCAGTGGAAATAACAAAAGATGTGCTCCAAGTCCTTGGGCTCTTGAACAGAATTC
+AACCACACTGGAATGGATGGTACAAAGTCCTCCAGCTTTTCATACTTTTGGAGAACTTCC
+AGCTATCAAGGAAACCGTGAAGTAAAAGAAGAAAAGGTAGACCACTAATACTAAGAACCT
+AACAGAACAAGCAATGCCCCGTTGCGGACGTGCTG
+>ds2020-267_216
+ATCTAAGGAGCAGCACGTCCGCAAAGACTTCCGACTACTTGGGACGTGTGACTCCTTCTG
+GGTTGCGGACGTGCTGAGTGGTTTTGTCTTGCGGACGTGCTGCTCCTTAGATTATCTAAG
+GAGCAGCACGTCCGCAAACTAAGTCAGCTCAGCACGTCGCAAAACCGCGGAATTGGGACG
+TGAGGGGCTACGCATTGCGGACGTGCTGCTCCTTAGATAATCTCAGGGTTCGTTTGTTGC
+GGACGTGTGTCCGATTTAGTATTGCGGACGTGCTG
+>ds2020-267_217
+TGTAAGGACGTTCGGGCTTCGCCCACCCGGTGACGTTCGGGCTTATTGGAGTGGGTGTTG
+GAATTTTGAGAGGATTTGTCCCTAGTACGAGAGGACCGGGATGAACGTACCTCTGGTGGA
+GCAGTTGTCGCGCCAGCGGCAGTGCTGCATAGCTATGTACGGACGGGATAACCGCTGAAA
+GCATCTAAGCGGGAAACCCACCTCAAAACGAGAATTCCCTTGAGAACCGTGGAAGACGAC
+CACGTTGATAGACCGCGGTGGAAGCCCGAACGTCC
+>ds2020-267_218
+GGACGTTCGGGCTTCGGGATCGAGGTATCATTAGCCGAAGAAGACCCTGGCCAATCCACG
+TGGCCTGCTTGACGAACGTCAGCGACGGAGACATCGTAAATTGGTCCGCGGGCATCGCAA
+TAAATCCTCTGTCCTACTACAGGTGCCGCGATAACCTTTACCAAGTCCGAACGATTGTCG
+ACCACCAGATCCGCTGGTCTGCAATATTCACCCTAGCCCACAAGCACAAATCCTCGGCGC
+GGAATATAATCCTAAAACCGTTGCGGACGTCCTG
+>ds2020-267_219
+CAGCACGTCCGCAACATGCTAGCTCTTAATTTTTTTTTAATTTTCCTTTTTCCTTGCATG
+AAATTTTGTTGCCAAAATTAAATTTCATATGATAGTTGATTTGCTACCAAGTTGGTGTGC
+CTTTCTTGTGGTTTTGGTCTAAATTATCTTAGCAAGGTGCTATATTGGCCTCTCCGTCCA
+AGGAGAAAAGTGAGAATTCACAGACCATTGGGAGGAACTGTTCTACTGGAATTACCAAAT
+ATGCCGAACGGATGAACTCTTGCGGACGTGCTG
+>ds2020-267_220
+TGTATTCATTATACCGGTCCTTTACTTGCTGTTGCGCTGCGATACGTGCCCTGGTTAGGT
+TTGTAGGCTTACAAACACAATCAGAGGTGATCTCTGTGTAGTCGTGTAGAACCAATTGTA
+GCTCAGCGAAGCTACGCTTGGTTGAGGGGGGTGTCGACGGTCAGTGCGTCGCCTTAAGCG
+ACGTCCGCAACACGCACCCCATAACACTTGCGGACGTGCTGACCGAACAAGCATTGCGGA
+CGTGCTGAGAGGGGGATAATTGCGGACGTGCTG
+>ds2020-267_221
+GACGCACTGACCGTCCTTTCCCTGGTATCCGATTCTGCCGCTACAAACAATAAGTGCTTG
+CTATTAATTAAGTTTAACCATTCCCCCCGTTCTTTGCCTGATAGCCCAACTGAAGACAGT
+ATTCTAAGTACAGCTTCTTCATCATTCTCTTGAGCATCTTTAGGTCTCCCGACTAAGAAT
+TCTTGATATTTTCTGTTTCTTTCCGCTATATTGCCTTCCTCTGCATCTTTGATAGCTGCA
+CCTATTAACTCTAGGCAGCACGGTCAGTGCGTC
+>ds2020-267_222
+CAGCACGTCCGCAAGTCTCACCTGGTCGCTCCTTCTTCTTCTTCTTCTAATATTCTGTCA
+ATCGCTTCCAAGTTCAGCCCATGGAGATGGAAATGGAGGTGGTACAACAACTACTAGTAC
+TATTACTAGGGCGGTTGTTGTTGGGGAGCAGCAGCCACCACTGCCAGCTACAAATTACCA
+TGTCAGTACTTTGCTTCACACAACTCGGAAGCTTAAGCTTGGGGTTCACATGAAAATAAC
+CCATACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_223
+ATCTAAGGAGCAGCACGTCCGCAAACTAAATCGACTTTTACTTCCTCTAAATAATCAAGT
+TCGGTCAGCTTCCGTGCGACAAACAAATTACCACGAGGGTATCATGTTGTACACGTCCAG
+AGACCTCACTAAACAAGGGGCAGCACGTCCGCAAAGCCTAATCGCTTGCGGACGTGCTGA
+GGAGGTTGAGTTTGCGGACGTGCTGATGCTTAGATAGATCGGAAGCGCACGCGTCTGGCT
+TCCGTTCACTCCTGAGCTTCCCGTATGCTGTG
+>ds2020-267_224
+AAGCACGTCCGCAACCTCTCTCGACTGCCCAATCTCGTTCCCTCCCCAGAGTGCCAGTTG
+CTGAGTACATGCAGGGAGAGCCAATCCACAGTAGGTTGCGCAAATTGACCACTTCTCTTG
+CGGGGACTCTCCCAACGCACAAACTTGCGTTCATAGCGGGCGGCATACAACATGCACTCG
+ATACCCCCGTGTCGGTGTGCGTGGACGGTGTAACCACGCACAACGCATTGATGGATGTAC
+ACACAGACGTTAATGCTCTTGCTGACGTGCTG
+>ds2020-267_225
+ATCTAAGGAGCAGCACGTCCGCAAAGTTGAGGGGATGAGTTGTGGATAGGGGTGAAAGGC
+CAATCAAACACCGTGATAGCTGGTTCTCCCCGAAATGCATACGGTGCAGCGTTGCGTGTT
+TCTTGCCGGAGGTAGAGCACTGGATAGCCGATGGGCCCTACAAGGTTACTGACGTTAGCC
+AAACTCCGAATGCCGGTAAGTGAGAGCGCAGCAGTGAGACTGCGGGGGATAAGCTCCGTA
+GTCGAGAGGGGAAAACGAAAGCCCGAACGTCC
+>ds2020-267_226
+GGACGTCCGGGCTTGGTTGCTCCCCTCTGCCTTTGCACTCGAGGGCCAATCTCCGTCTGG
+CCCGAGGAAACCTTTGCACGCCTCCGTTACCTTTTGGGAGGCCTACGCCCCATAGAAACT
+GTCTACCTGAGAATGTCCCTTGGCCCGTAGGTCCTGACACAAGGTTAGAATTCTAGCTCT
+TCCAGAGTGGTATCTCACTGATGGCTCGGGCCCCCCCGGAAGGGGGCCTTCTTCGCCTTC
+CACCTAAGCTGCGGGGAATTGCGGACGTGCTG
+>ds2020-267_227
+CAGCACGTCCGCAACTGGCAACCCGCGCTTTAACGATTTTGTGCGACACTGATTTGATTA
+AACTCATTGGGTGTTTTGACCAACCCGTTAACTTGAATCACCATTTCTTGGTTTTGATTG
+GTGATAGTACCGACAGGTAATTCGACGTTCTGTGGGCGTAGCGCATTGCTAATTTGATTG
+ACTGAGACTTTATAGGCATTCATTTGGGTGGGATTGAGCAGCACACGGATTTGACGCTGC
+CGACCCACCGGGCCCAGATTGCGGACGTGCTG
+>ds2020-267_228
+CAGCACGTCCGCAAGCTCACATGGGTTATCTCTCTGCTCATCCACTACTACCTAATTTGG
+AATTATCATTCTCATCATTTCACTAAAATCAATTAAATTAAATTAAATTCATCACCTCTA
+TCAATTGATCCTCCAGAAGGCTTTTTCACCACTGCTTCTGGAGCCTCTGTAAAACAGACC
+AAAAGAAACCAAATTTACCACAAACACTCTGTAAAGTTTTCATCTTTTTACTGTTTCACT
+GTGTGAGAGAGACGAAATTGCGGACGTGCTG
+>ds2020-267_229
+CAGCACGTCCGCAATCCGCTGGCTGTATTTGTTGCTTTAGGTTTGTTTAGTAGAAGGTGC
+ACTGGGGTAGGCTCTGGTGGTAGTGGAGGTGGTGGAGGAGGAGCCGATTTTGGTGGTGGA
+GGAGGAGCCGATTGCGGTGATGGAGGAGGGGCTGATTTCGGTGGTGGAGGAGGAGGAGGA
+GGAGGTGATTTCGGTGGTGGAGGAGGTGGTGGAGGAGGAGGAGGAGGAGATTTCGGTGGT
+GGAGAAGGGATAGTTTGCGGACGTGCTG
+>ds2020-267_230
+CAGCACGTCCGCAAATCAGTGCCGCTACCTACTTCTACTAAGGCGGAGCTTAATAGGAGC
+AAGAGACTTGGTGGCAACAACCAGAATGAAATATTATTTAATCGTGGAAATGCCATGTCA
+GGTGCACCTATTAGAATCGGAACAGACCAATTACCAGATCCACCTATCATCGCCGGCATA
+ACCATAAAAAAGATCATTAAAAAAGCGTGAGCCGTTATTAAAACATTATAAAGTTGATGA
+TTACCACCATTCGCTTGCGGACGTGCTG
+>ds2020-267_231
+CAGCACGTCCGCAATGTTACCGCCCTCCCCTTAGATGTCTATGCATCCTTTAGCATCTCC
+CGATTTTTTTTTATATCGTTATATCTGCCCTCTCTCCATTTTTTTGAGAGAGAGCAGATG
+GATCCTATCCCCTATATCGAACACTAAATCCTATCTATTGATAGAAAGATCTTCGTCAAA
+TACCGGACTTTGCCTTTTTTTAGGAATTCCTCATATCCAAGGCAGCTTACCACAAGCACC
+CCATACGATACTAGTTGCGGACGTGCTG
+>ds2020-267_232
+CAGCACGTCCGCAAAACTGATGCAATAATGGTGGCTGCCTCAGCATCAGAAATGGAGGCT
+TCTCTAACTCTCATTAGTATCTGCTGCTTAAATGCCCTCCTCTCTCTCTGCCTCAGCCCT
+TCACCCACCTCCAATTGCACAGCAAATCTCGCCACACAACTAGAAAACGGGTGGTTCTCG
+AAGAACCTATTTTCCCTGCACTCTCTTGTTGTCTTCTTCTCCTTAACCCCACCACCACCA
+CCGGCTACCCCAGCTTGCGGACGTGCTG
+>ds2020-267_233
+GACGCACTGACCGTACCATCGCACCTTCAATAATCGATGAGCCAATCGCCACATGAGATA
+GTTGCACCAAAGCAAAGCCTAACAGTAAGCTCGTCACCAATAAGCCTAAACCCAATTATT
+TGTGACGGGCAAACACCATGCCCATGCCAACTGCAAGCACCACGTGAGTGAACATAGGAC
+GGTCAGTGCGTCGCCTTAAGCGACAGCACGTCCGCAATAATATGCCTCCACGTCCGCAAA
+TAACTGGCTATCTTTTGCGGACGTGCTG
+>ds2020-267_234
+GACGCACTGACCGTGGGGGTCCTCGTAGGCAATCGCTGTATTGTCGTCAATAGGTTTATC
+GGTGACTGCTTGAACGGCAGGACCTTTTGGGATAACTTTTACTACAGGTACCACAACCGC
+AGGTTTGGGTTGAGCATTCATAGGTGCACTTGCGCAACAGATTTGTTAGTGCTTTTGAAA
+CGGTCAGTGCGTCGCCTAAGCGCACGTCCGCAACATGAATCTCCTAAGCTTGCGGACGTG
+CTGGCGGAGGAACCTTGCGGACGTGCTG
+>ds2020-267_235
+CAGCACGTCCGCAATTCTTGGCTAGTGACGAGGCACTTCAACGGGTTGTACGAGTCGATT
+TACTTTGATGCACCAACCGAGGTGGAAGCCATGTTTTATGACAGGCTGCCGAACATGCCA
+GTCCGGAAGCCAAAAACAGAAAAACAGATAGACGGTCTAGGCTACACGAAGATCACGTCG
+AATCACCACATCCATTTCACTCCGTCCGAAGTGAGAAAGGCGGTTAGGAATGAAGCACGC
+GACAAGCCGAAGTTTGCGGACGTGCTG
+>ds2020-267_236
+CAGCACGTCCGCAAAGAACTCCGACTTCTGGAAGGGATGCATTTATTAGATAAAAGGCTG
+ACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCACAGCCATC
+GTGCTGGCGACGCATCATTCAAATATCTGCCCTATCAACTTTCGATGGTAGGATAGTGGC
+CTACCATGGTGGTGACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAG
+AAACGGCTACCACATCCAAGGAAGGC
+>ds2020-267_237
+GTTATCCCTGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAAAGGAT
+CGATAGGCCACGCTTTCACGGTTCGTATTCGTACTGGAAATCAGAATCAAACGAGCTTTT
+ACCCTTTTGTTCCACACGAGATTTCTGTTCTCGTTGAGCTCATCTTAGGACACCTGCGTT
+ATCTTTTAACAGATGTGCCGCCCCAGCCAAACTCCCCACCTGGCAGTGTCCCTGACTTGG
+ATCGCGCCTAAGTTGCGGACGTGCTG
+>ds2020-267_238
+CAGCACGTCCGCAAACTTTGTCAACTGGTTGTTGGGAGGGTTTCTTCTCAGTAACGTAGC
+TAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTG
+ACGGGGACCCGCACAAGCGGTGGATGATGTGGTTTAATTCGATGCAACGCGAAAAACCTT
+ACCTACCCTTGACATGTCTGGAATCCTGAAGAGATTTGGGAGTGCTCGAAAGAGAGCCAG
+AACTCCAGGTGCTTGCGGACGTGCTG
+>ds2020-267_239
+CGGAACTTCCGCAATCTCGGCCCTGGATAGAATTTCTTGGGTCTTCAACAAAAAAATTCT
+AAGTTTCAGTACAAATAATGATATATATTGTTAATTATTCAATTTAAATTTTAAATGGGG
+ATTCCTTGCTCAAAGATGTTCGTTTGTACGTGTATCAGATATATAACACATGAGGCTTGT
+GATAGGGCAGCACGTCCGCAAGACACAGACGGTATCTTGCGGACGTGCTGAGAGCGGCTA
+CCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_240
+GACGCACTGACCGTTTTTGGCAAGGTTTAAATCATGGCTAATCAAAAGCATCGCCATGCC
+CCGCTCGTTTTTTAGCCGATGCAGTAACCCCAAAATCTCATGGCGTAAAGTCACATCTAG
+GGCGGTGGAGGTGGGGTACTACGGTCAGTGCGTCGCCTTAAGCGATCTAAGGAGCAGCAC
+GTCCGCAACTCCTCATCCCTCAGCACGTCCGCAATCGATCGTTGGCCACGTCCGCAAGTG
+GGGTCAGGTACATTGCGGACGTGCTG
+>ds2020-267_241
+CAGTTCGTCCGCAACTCTACCCGGATGCCCTTGCGGACGTGCTGACGGGTAAACTATTGC
+GACGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGCCACCACATCCGCCTCAGC
+ACGTCTGCAACTCCGTAAATGTGCGACGTGGAGGTATAGGATCTTGCGGACGTGCTGCTC
+CTTAGATTATCTAAGGAGCAGCCGTCCGCAACACTGATGGCCTCAGCACGTCGCAATCCT
+ATCCCATTTAGTTTGCGGACGTGCTG
+>ds2020-267_242
+CAGCACGTCCGCGAATGCCTCGGCGCGTCCGGTGGCTGGGCCCGCGGCGCGGCCGCGGTG
+GGGGTGGCGCAGCCTGTGCGCCGCCGGGTGCGGGTGTGGTGCGGGCGTGGGGTGGGCCCG
+GGGTTGGGGGGGTGGGGGTGGGGAGGGGGGCGTGCCGATGGAGGTAAGGGGCGGGACGTG
+GGGGAGGGTCGAGGGTTGAGATTGCGAGGTGGTGAGGTCAGGGTCATTGCGGACGTGCTG
+AGAGGCTTTCAATTGCGGACGTGCTG
+>ds2020-267_243
+CAGCACGTCCGCAATTTCATCCTTTTTCAAACCTGCCCCCGATCAGTGCAATGGGATGTG
+TCTATTTATCTATCTCTTGACTCGAAATGGGAGCAGGTTTGAAAAAGGATCTTAGAGTGT
+CTAGGGTTGGGCCAGGAGGGTCTCTTAACGCCTTCTTTTTTCTTCTCATCGGAGTTATTT
+CACAAAGACTTGCCATGGTAAGGAAGAAGGGAGGAACAAGCACACTTGGAGAGCGCAGTA
+CAACGGGTCAAACGGTCAGTGCGTC
+>ds2020-267_244
+CAGCACGTCCGCAAGATGGACACCCTGTAGATTGCGGACGTGCGACAGATTATTCATTGC
+GGACGTGTGAGAGTCTATCTTTGCGGACGTGCTGCTCCTTAGATACAGGAAGTAGGACGT
+TCGGGCTTTCCAGCGGCACTTGCTGTCGCTTATAATAACACACACGTCCAGGTTTGAGAT
+TGACTATGGTGGCTTATCATATCATGTTGTTACATGTTAGTAACAAAGGTTCTTTTTGGT
+AGGGAGTGTATAAGCCCGAACGTCC
+>ds2020-267_245
+CAGCACGTCCGCAAAGCCTCCGCCCTGATTCTTGATTAATAAACATGCCCTAATAAAAGG
+AGATTGATTATCGGGAATGGGTTAGGAATCGTAATTCAACTTTCTAATTGAAACAAACAT
+TATATTTCAAGCTAATATTGATGATGATTGTTGTTGGAAACAAACATAATATTTCTAGCA
+GATATATATTATATCCAGCTCCTCCTATCCTATAACAGAAAGAAAGAAAGGAGGGATAAT
+GAAGATCGAGTTGCGGACGTGCTG
+>ds2020-267_246
+CAGCACGTCCGCAATACCTGACGCTTCACTTGTTTCCGAACAAAATCGTCTAGTCGCGCT
+CTTCACGAGCTAATTGGTAAAAAGTCTACTGTCTAGTAGCATATTCACATCAAGGAAAGA
+ATCTTCGTCAAAATGGCTTATCAAAAGTCAGACAAGTCAACTGTCTCCGGCACAACAATC
+ACGCCAGATGACTCAGCCTCGCAAGCTGGACCACACATCGACACCCCTACCAAGTATCAC
+ATGCACCGGAAAGCCCGAACGTCC
+>ds2020-267_247
+GACGCACTGACCGTGAAAACGCCTCTGACGCACTGACCGTCTGTCGTTGGCTGACGCACT
+GACCGTTGGGAACGCTCTGACGCACTACCGTTCTATAGGGGTGTGTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATATCATACCGTTGCGGACGGCTGAG
+GCTCGAGAATTGCGGACGTGCTGAGGTGTTTCTATTGCGGACGTGCTGAGCGCATATAGC
+TTGCGGACGGCTGCTCCTTAGATA
+>ds2020-267_248
+CAGCACGTCCGCAATACGTATCATCTTGCGACGTGCTGGGTGATTGACCTTGCGCACGTG
+CTGAGAGGAAGTGACTTGCCGACGTGCTGCTCCTTAGATAATCGAAGGGGCAGCACGTCC
+GCCAACTACTTTACCTCAGCCGTCCGCAAAACACCGAGCCATACTTGCGGACGTGCTGCT
+CCTTAGATTATCTAAGGAGCAGCACGTCGCATCAGTCACCGGTCAGCACGTCCGCAAAAG
+GGCCTCGGTATTGCGGACGTGCTG
+>ds2020-267_249
+TCAGCACGTCCGCAATCTGCGACCCCTGGAGTAATGTATTCTATGAATAATAAATAAATA
+TGAAGAATACTCTTTCAATCAAAGAAATATTTCAATTATTTTCGTGTTCGTATTTCGAAA
+GTAAAAAAACGTAAAAGGAATACAAAAGGTAGGAAATTTATTACAGCTGAATTCTTCATA
+AATTTTCTATTTCGATGAACTGACTCTTACAAAAGTTGTATATGGACCATGAGGAAGAAC
+AGACCCCCATTGCGGACGTGCTG
+>ds2020-267_250
+CAGCACGTCCGCAATACCCCACCACTATGAATGCTGGAAGCAACCCAACGCAAACTTGCA
+TAGGACATGCAAAGGGATATGATCAATACTCTCAACTCACCTGGGCACATAATGCACCAA
+TCGGTAGTTACAAGCAAAAGATCTTAAAACTCCTTCCTCTTTATTTTTCTCTCGATACTC
+TTCGACCCCTTTATCGCAATTAAAACTAAGCACAAAATTTATCTGCGCTGAAGAAAAAGG
+GCCACTCTATTGCGGACGTGCTG
+>ds2020-267_251
+CCGATCTATCTAAGGAGCAGCACGTCCGCAACAGGCAGTCTCACGATCGGGCATGAGCGT
+CCGGAAGTTGTCATTGTATACTCCCGCGGGTCGGAAGGCGGCGGGGGAAGGAGGAGGACA
+CTGGGCGGGATCTATCAGCAGCGAATTCCCCATACAGATAGAGGCGCCTATCAAAAAGAT
+ACTCCGAAGGCTTCGGGATCGAGGTATCATTAGCCGAAGAAGACCCTGGCCAATCCAACG
+GACCATACTTGCGGACGTGCTG
+>ds2020-267_252
+TCAGCACGTCCGCAATTCTATTTCACTCCATACCTAGCAAAAACAGGCTGGCTAAAAAAA
+TAAGACGACGTTTGAACAGGGGTCTTAGCTTGATGGCACTCACCAAGGTCAATTAAGCCC
+TATGTTAAATTAGTTAAATTGACGCCCAATAAATTTGACGGTTTCATCCTTGGCTTTTTT
+GACGGCAAGTTTGCGGTTTTGTCCTAGCAGTAATTTAATTTGCCACAGTTTTTCTTGATA
+CAAGGTTGTTGCGGACGTGCTG
+>ds2020-267_253
+GCGACGCACTGACCGTACTTTACCACAATTTATAGCTCGTGCAATTACCCAATCTCAAAC
+GGGTCATCTGGATTGATAGCCCAAAGTCCACTGAGGATTTTAGCTATATGCAAAAATTCT
+CAGCGTGGATTGCCTAAGGCGATGCCGATGATCCGGCAGTGGCGGAACGTGCCAAAAAGC
+TCAACCCCAATAACCCCCTCACTTTGCGGACGTGCTGAGGACATAGTAGTTGCGGACGTG
+CTGAGTATTATCTGGTTGCGGA
+>ds2020-267_254
+CAGCACGTCCGCAAAATGTCCTGGCTGGTTGGGACGTGCTGAGGCTCCTTACATTGCGGA
+CGTGCTGAGGCTAAAGTTGTTGCGACGTGCTGCTCCTTAGATCGCTTAGGCGACGCACTG
+ACCGTGGGCTTTGGGGTGTTTAAAGTGTAAAGCTGCAAAGGGTTGTTACCAATCGGTAAA
+TGTTGCTCGTGGGTCGCCCCTGCGGTGGGGAACGGTGTGGGAACGGTCAGTGCGTCAGGG
+TACTCCCAACGGTCAGTGCGTC
+>ds2020-267_255
+CAGCACGTCCGCAAACTGGCTGAGTTCTCTGTAGCTTTGCATACCACCAGTACCGCGGGA
+GAACAACTCAACGCTAAGTTCCCCCTGGACGACTTGAGGGGATACTGTTGCGGAGAAAGC
+AACTATGAGATGCTGGGTTTGGGTGGTGCTGTCGTCTACCACAGCTTGGTCAAGGATGCA
+GGTTGTCAGGCTCCAAGGTCAATTCTGAAAGGTTGCTGGAGCGAGGACGAGAAGGACGAA
+GAAGTCGTTGCGGACGGGCTG
+>ds2020-267_256
+CAGCAGTCCGCAATAGGCCCCGACTTCCGGGAGGGGTGTATTTATTAGATAAAAAACCAA
+CGCGGCTCGCCGCTCTTTTGGTGATTCATAATAACTTGTCGAATCGCATGGCCTTGCGCC
+GGCGATGCTTCATTCAAATATCTGCCCTATCAACTTTCGATGGTAGGATAGAGGCCTACC
+ATGGTTTCAACGGGTAACGGGGAATAAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACG
+GCTACCACATCCAAGGAAGGC
+>ds2020-267_257
+CAGCACGTCCGCAACAACCATCAATTAAATGTAGGAGCTATTCATGTTTTCACATGTAGA
+ACCGTATGCGGGTGACCCGATTTTGGGGCTGATGGACAAGCATAAACAAGACCCACGTGC
+CGACAAAGTTAATTTGGGTGTGGGTGTCTAATTTGATAATGAGGGTAAATTACCCGTCCT
+CAACTGTGTGCAAAAAGCTGAAGCACAAATCGCAAATCCACCAAAACCACGTCCCAGCCG
+GAATTCCTTGCGGACGTGCTG
+>ds2020-267_258
+CGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAA
+ATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAGAGTCTTGTAGAGGG
+GGGTAGAATTCCAGGTGTAGCCGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGA
+AGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGAT
+TGTAGTTTTGCGGACGTGCTG
+>ds2020-267_259
+CAGCACGTCCGCAACTCAAACGGGGCGCACGTCCGCAATAGATCCCTCTTTTTGCGACGT
+GCTGCTCCTTAGATTATCTAAGGAGCAGCACGTCAGCAAAATAGCCCCGTTAGCACGTCC
+GCAAACGAGATCGCTCAGCCGTCCGCAATTTATGGCCATGGATGTGCGGACGTGCTGCTC
+CTTAGATAATCTAAGGAGCAGCACGTCGCAAAACACCCGTCATGTTGCGGACGTGAGCGA
+AGGCCAGTTGCGGACGTGCTG
+>ds2020-267_260
+CGTCCGCAAGTCGGATTGGGTCAGCACGTCCGCAAGAAAGGAGCCCTCAGCACGTCCGCA
+ATATTTTCTCGGTCGCCGTCCGCAAGTCAGTGTTGGTTGCGGACGTGCTGCTCCTTAGAT
+ACGCTTAAGGCGACGCACTGACCGTCGTGGGGACGCACTGACCGTACTCTTTCCCCTGAC
+GCACTGACCTTCTCATCTGATTTGACGCACTGACCGTCGTTGTGGGACTTGGCGGAGGGG
+ACAAACTACGGTCTGTGCGTC
+>ds2020-267_261
+CAGCACGTCCGCAAGGGCATACTACTCCAGTGCTGCGCCATTGGACAAGCAGTTCATACA
+ATCTTACAGCGTATTTACTTTGTAGGTTACTTACTTGGTCAATATCATACTCAGTAAAAC
+GTTGCTCAAGCCTTGTGATTAGCGGTATTACATCACTAGCAAAGACCAGCTCAACACAGC
+CCAAGTCATCAATATAGCCAATTTTATCCACCCAACGGCTTTTGAAATGACCGAATTTGC
+GGACGTGCTGCTCCTTAGAT
+>ds2020-267_262
+CAGCACGTCCGCAACTTTACCCTCTTTTTGGATGACTCACAATTATATATACTATATATT
+TCTATACGATCAGATATCATGCAAACCCTTTCTATACTAATAGCATAGAACCTTACTCTA
+TATTAATCTAACAAATATTTCATCTAATACTAATAAAAGTTAAAATTTCTTTTTTTGAAA
+TTGAAGAAGTTCTATTTGCTCAATAAACTTACCTATATTTATTTTTGTTTGTCCAGGGGT
+AGCCGCTTGCGGACGTGCTG
+>ds2020-267_263
+TCAGCACGTCCGCAATCACATACCGCTCTCGCCATGCTGGCTTATCTAAATTATGATTTG
+ATGATTGGCAATTTGGAAATGGATGTGATGGATGGCGAGCTGCGCTTTAAGACGTCGCTT
+GATTTGGAAGTGACGGGGGTGAGCGAGCTCATTATGAGTTATTTGCTACAGAGTAATTTC
+TCGTTGTTTTCACGGCTGTATGACACCATTCGCGAGATGATTGAGCAGCCCAATACTACC
+ATGGATTTGCGGACGTGCTG
+>ds2020-267_264
+CAGCACGTCCGCAAGAATCGCTGGCTGATCCAAGGGAATTTCGTACATTGTATTCATTTG
+TCTTTGTCAAGCATCCTGACATAAAGGGAACCGTCTACTGGCAAGCGAAGTCATCTCGAC
+GATGTAGCACTCTACTAATACCATAATCTTTAGTCGGAATTTTGTGAAAGAAAGAAAGGG
+CGCTCCCACATACTACTAAAAGCTCCAGCTCGGGCAATAATCCTCTCCACTCAAAAAGAA
+AGGGTCTTGCGGACGTGCTG
+>ds2020-267_265
+CAGCACGTCCGCAACACCCTCTGCATGAAGTAAGTGTAATTCCTTAACGCGAAATAGAAT
+GGCTGAACATCACGTGAGTTTGCCCGCCTTGCAAACTCACAGAGGCAGTCCAATCCACAG
+AATCTACAAGATATGCTATTTCCATTTTTTTTCTTTTGTAATCAAGTTAGCCTACAAGTC
+AGTATCTCTGATACTGAGACTCTACAATAAGCAGCTCCCATGGAAGCCCACTAGAGGGCA
+TAGTGTTTGCGGACGTGCTG
+>ds2020-267_266
+CAGCACGTCCGCAAGTTGCCCGCCAGCGTTGGTATTTCCAGTCTGTATCCCGAAGCTGCG
+TTCGGGGTGATTGAGACTGACACGTCACTGTCTAAGCTCTCTGAGATGCCCCCCGCCACC
+CTGTGCACTCTTTTGATTGTGTAGAAGTCCTCCTTCTCCATTGAGCACACTAGTGCTTGC
+CTGACATAGGATATTTCCCTCACTAACGATATTGTGAGGAGGGAAATATACTATATCAGG
+CAAGCTTTGCGGACGTGCTG
+>ds2020-267_267
+CAGCACGTCCGCAACACCCATCCACTCTTTCAGCATCCTGCAAATCTTCTTCCTTCTTCT
+TCAGTGCTGCCAATGCAGCAAGAAGATCAGACTCCAGGATTTCAAGGTTAAACCCTAGCT
+GGATATCCTGAGGATGATGAGAATTTCGGTTCATCTGTTCTTCCAGTTTCTGAGTCTGTG
+CAAACAACCTCTCAAGAAGAATCCTTGCAGGTTCCGATGCTCCATTGTCACTAATGCTCG
+ACTTATTGCGGACGTGCTG
+>ds2020-267_268
+CAGCACGTCCGCAATGCATGGCCTCTGAGTTTGTGGAAACGAACCCTCTGCCAACCTGGG
+ACGGCACGACCCACGTCTCTAAGTCTGCCAAGTTAGAACACGGGAAGACCCGCGCAATAT
+TCGCCTGCGACACCCGGTCGTATTTTGGGTTTTCGTGGATCCTAGATGCGACCCAACAGG
+CCTGGAAGAACGAACGGGTTGTCATGGATCCGGGCAAAGGTGGGAAGTGTGGGATGACGC
+AACGATTGCGGACGTGCTG
+>ds2020-267_269
+GACGCACTGACCGTCAAGCTTTCCCTCCCGACAATTTCAAGCACTCTTTGACTCTCTTTT
+CAAAGTCCTTTTCATCTTTCCCTCGCGGTACTTGTTTGCTATCGGTCTCTCGCCCGTATT
+TAGCCTTGGACAGAATTTACCGCCCGATTGGGGCTGCATTCCCAAACAACCCGTCATTGC
+ACGGTCAGTGCGTCAGGGAAAGACGTGTGCCCCTAATAGCTTGCGGACGTGCTGCCACAG
+GAGCCTTGCGGACGTGCTG
+>ds2020-267_270
+CAGCACGTCCGCAACTTAGCCGTCCTCATCATCATGAACCAGAGTCATACAAAGTAGAAC
+AAGAGGAGGAGAAGGAGAAGAAGCACGGCAGTCTTTTGGAGAAGCTTCACCGATCCGACA
+GCAGCTCTAGCTCTTCGAGCGATGAAGAGGGAGGTGAAGGAGAAGAGAAAAAGAAGAAGA
+AGAAAGAAAAGAAGGGACTGAAGGATAAGATCTCTGGTCATCATGATCAGAAGGCGGTGG
+ACAAAGCCCGAACGTCCTT
+>ds2020-267_271
+GACGCACTGACCGTTTCGGTCTCGGGACGCACTGACCGTCGAATCGGGAATAAAACGAGG
+CATATCGACACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAATAAATCGGGGATC
+GGTTGGGACGTGCTGAGGGAACGCGTATTGCGGACGTGCTGGGGTATTACGGTTGCGGAC
+GTGCTGGGGGATCGGTTGGGACGTGCTGAGGGAATGCGTATTGCGGACGTGCTAGGGTAT
+TACGGTTGCGGACGTGCTG
+>ds2020-267_272
+GGACGTTCGGGCTTTTCGTGGTGTTTGGGTTGCAATCCGCAATACTCAATGACGCTGCAG
+TCTTGCTTGGTCAGGATTTGCCCTCTTGGCTCAAGGAATGTGATGCTATGGTTGACTATA
+TGCACTTGTTTGCTGTAGCTCCGCGAGATGTCATTGATCGTATGCAAAAGCCTCTCAGCC
+TTGGGAGGCAACTCAGAATTATCTACAGAAAATTGTGCAATAGATATCGAGCTTAGTTCC
+CGGGTTTGCGGACGTGCTG
+>ds2020-267_273
+CCGATCTATCTAAGGAGCAGCCGTCCGCAACAGGCGCAGTTTGCTCAGTTGCAGGGACAG
+CAGCAGTGCTCGTCGTAGAGCCGGTGGTCGCGGGTGCAGACATTTTGACGTGGTAGCGTA
+AATGTGTGGGATGTGGGGGGAGGTAATACCTGTTAGGAGAGCGTGGAATGAACTTTTATG
+TTGGAGGTGTCAGACTTTGAGATTTACGTTCCTCAGATAATTCAGGGCAAGTTCGTTGCG
+GACGTGCTGCTCCTTAGA
+>ds2020-267_274
+ATCTAAGGAGCAGCACGTCCGCAAAGCCAATTCTGTAATATTTGTGATTCATTTTGGCGT
+GAGCTAATAATGTCTTGGGCTAAGTCTAGCAGTTCAGGATTTTTGCCGTATCGCTGCTCA
+ATATTGGCAAGCGCGATGATTTCATCAAAATGACTCAGCATGGTATTGACAAAAATCATA
+TCCGGTGAGATGGGTATATAGTCAAATTGATTGAGGGCGTTTGGGTCACTGGAGTGCACA
+GTGATTGCGGACGTGCTG
+>ds2020-267_275
+CAGCACGTCCGCAAATTTGCCGCTCTTCTTATTCCCAGAATCCTTAGCCTCTTCCTAAAT
+AAGGCCCCTCCCTAGTCCTTATTCTCTATTCCTTATAAAATGAAAGATTCATTCTTTAGC
+CAGATCAACATCCTTCTTCCTATTACCTATCTCCAGATCAAGATCCTAACATGATTTAAG
+CCATAACTCTACTATGGAAGTACTTAGTAATCCTACTTCCTATTCACTATCTACTTCCTT
+CGTCAGCCTTCCTCCATA
+>ds2020-267_276
+TAAGGAGCAGCCGTCCGCAACAGAATCCCCCTCAATTCTCCAGCGCCCACGGCAGATAGG
+GACCGAACTGTCTCACGACGTTCTAAACCCAGCTCGCGTACCACTTTAAATGGCGAACAG
+CCATACCCTTGGGACCTACTTCAGCCCCAGGATGTGATGAGCCGACATCGAGGTGCCAAA
+CACCGCCGTCGATATGAACTCTTGGGCGGTATCAGCCTGTTATCCCCGGAGTAACTTTTA
+TCCGTTGCGGACGTGCTG
+>ds2020-267_277
+GTCGCAACGTGGAAGCCCCAGCACGTCCGCAATGGGACTCCAGTCAGCACGTCCGCAAAT
+TACAGGTGGTCGGGGAAGAGTGGAATTAGAGGAAATCGGAGGTGAATTGGGTCGGGGTGA
+GGTTCGATTGGAGATAATTACGGTTTGATTGCAGAGGTTGACATTTGGGGGTTAGGGTTT
+GGTAGAGAGGGCAAGAGAGAGAGAGAGAGATAGAGGCAGAAGCGCCGAGTCCAACTGTAG
+GAACTTGCGGACGTGCTG
+>ds2020-267_278
+CAGCACGTCCGCAATGTTGGCCCTGTGCTGCAAGATTCATTGTTCGCTTTCTCAGACCTT
+TAGCACTGCAGAGGATGGGCAGAGCCAGATTCTTCTTCACCTCTACCGTGGAGATTCAGC
+TATGGCCAAGTCAGCCCATTCTTTAGGCACCTTCCAGATCACTGGTATTGCTCCAATGCC
+ACGTGGAGAGCCCAGCGTTCGCGTAGAGTTCCTAGCTGACACTGGGGGCATCACTCTCAA
+AGCATTGCGGACGTGCTG
+>ds2020-267_279
+AGGACGTTCGGGCTTTTTCGGTCGAGTTGTTTTATAGACCGGGGTTGCCCAGGGCGGGGC
+CAGGCGGGAGAAAGATACTTCGGGGATAGAATTGGATAGAGAACCTGTACCAAGAGATGT
+GTCAATTGAATAACGCGAGAAAGCCTCAAATCCCGCCCAACTCTATTGAATGAATCAGTC
+CACCTGAACCCACAGGTCAAAGGGGAAAGCAACGAGGAATTTCAAAGTGGAAAGGTAAAC
+GCAAGCCCGAACGTCCTT
+>ds2020-267_280
+CAGCACGTCCGCAATAAGGGCCCCCCCCCCCTCCTTCCTTGTCTGATTCGAGGGGGATCC
+CGTTGAGTTCTTATGCTTTCATGTCTACAACTCAGTTCATCCGATTATTACAGGGATGAA
+CCTAATCCAGAATAGGAACCATAAAAGAAAATACCGATTAAACCGATCACAAGAATACCC
+GCTACAGTACCTATTATCCAAAGAGGAATCCTTCCAGTAGTATCGGCCTATCTTTGCGGA
+CGTGCTGCTCCTTAGAT
+>ds2020-267_281
+CAGCACGTCCGCAATGTCTAGCGCATGGAGGATCCGTTGAGAGTTTCTGTTGTCTCGGTA
+GGGAACTGTATGATCTTTTCCCCTATTGTATTGAATCAATAAAAAAAAGAGGTCAGTGCT
+ACGGCCCCCTATTGTTTGATCCAATATTGACCGGGGACGAGCCCCGACTTCCATAGGTCC
+TTGGTTTGACCTCCCGTAGTGGTCCTTGCTTTTAATAAAGTGGAGCGGGGAAATTTTCTC
+GACTTGCGGACGTGCTG
+>ds2020-267_282
+CAGCACGTCCGCAAGCCGGGTCCCCTGGAAAAGTGAAAGTAGAAAGGGAAGTGCATTTCG
+GTAGAGAAATCAAGTAGGGGTGCATTTCTGTAAATACTCGGGATTCTTTGGGCTAACATT
+TTCGGTTTAGGCGGTGAAAGAAAGTTTGGGAGGAGGTTAGGATGAAAAAAGGGTGAATGG
+AAATTCGCCCCTTCTTTTTTGATGGTTTAGGCCAGATTCAGTGTACTCAGCAGCGGAGTT
+CACTTGCGGACGTGCTG
+>ds2020-267_283
+CAGCACGTCCGCAAACTTGGGTAGGTGGAGAAGTCACTTGAAATGTTTTCAGAGATGAAA
+AAATGTGGCGTGGCACCTAATGAGATAACCTTTATTGGGGTTCTTGGGGCTTGTCGACAC
+ATGGGCTTAGTCGATGAGGGGCGCCGCCATTTTGATTCCATTGTCCAGGAACACAAGATA
+GAACCCAACGTTGATTTGAGATATTGATAAGGCGAATTACCTGCCTATTCAATGCCAAGC
+GAGAAGCCCGAACGTCC
+>ds2020-267_284
+CAGCACGTCCGCAATGAGGCTTGACTCACACGTCCGCAATGAATACCCACTTCTGTTTGC
+CACTGTTGTTTTCTTTCTTCTTTTCCTTCTTGGTTATGTCTTTCTCCTTCTTCTTTGATT
+TCTCCTCGTCTTTATCAATATGTTTCTCCTCATCCTTTTTATGTTTTGGCTTCTCTTTTA
+CCACTGACTTGGTCTTTAATTCAAGTTCCACCTCAGCCTTCTCCTTCTTTAAATCCCCTG
+GTCTTGCGGACGTGCTG
+>ds2020-267_285
+GACGCACTGACCGTGACTGCTCTCCTCCGTCAATGTGCGTTTGTCAGAAGACAAAGTGCT
+ATATACCATCAATCATGCCAAACCAAAAGCGCTACTGTTAAATTCAGAATTGTCACCGAT
+GATCAAAAGCCACACCCAAGATGCGCCATCAATCGAGCATTTGATTTGGTTGGATGATAA
+CAATACGCCAATACACCCATACAGACGGTCAGTGCGTCGCCTAAGCGGGAGAGCATACCA
+ACATTGCGGACGTGCTG
+>ds2020-267_286
+CGCACGTCCGCAAATTCATGGGGGTGTTTGGTAGTATTTAATTCGTAGTATTTAACCGGT
+GGCATATATATTTATAGTACTCAGTCCGAGACTCCGAGAGTGTCACATGTGTTGTTATTG
+CCAGTGGTTGCCGTTGTGAATGAGATAGAGCCGACTACTAGGGTTTCCATGAGCATGGCA
+AATATTAGCACAGTGAGGAACCTTGACGGCTGATTTCTGAAAAGACGTCGTAGTCTCTAA
+TTTTTGCGGACGTGCTG
+>ds2020-267_287
+CAGCACGTCCGCAATACTCCGGGGCTAGACATTGCTCTACATGATACTTATTATGTGGTT
+GCACATTTCCATTATGTACTTTCTATGGGAGCCGTTTTTGCTTTATTTGCAGGATTTCAC
+TATTGGGTGGGTAAAATCTTTGGTCGGATATACCCTGAAACTTTAGGGCAAATACATTTT
+TGGATCACTTTTTTCGGGGTTAATCTGACCTTCTTTCCAATGCATTTCTTAGGGCTATCG
+GTTTGCGGACGTGCTG
+>ds2020-267_288
+CAGCACGTCCGCAAGGGGTTTTTAGTTCCTGTGGAGGATGTATGGATCGAGACACGCAGC
+TTCGACAAGTCTTTCTACCGGATACTACTGGGAGAGGTCCAGCTCGCTTGTTTGCCACGA
+ATATAATTCCTTTTAACTCATTTTTTTTATGCTAGGTTGGATCTACGGCAGTGCAGTTCT
+ACTTGAGCTTAACGATCACCAAAGGTCAGGTGAAATAGGAACGGAAAGCCAATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_289
+GGACGTTCGGGCTTCTCATGTCCCCTTTCACCCGTAGGTCGTATGCGGTATTAATTCGAG
+TTTCCCCGAGCTATCCCCCACTACTAGGCAGATTCCTAAATGTTACTCACCCGTCCGCCA
+CTAATCATATCTAGCGAGCTAGATAATCATCGTTCGACTTGCCCTGTTAAGCCCGAACGT
+CCTTACTTCAGACGTCCGCAAGTAGCAGTAGGTAATCATTGCGGACGTGCTGAGGTGCTA
+ATTTGCGGACGTGCTG
+>ds2020-267_290
+CAGCACGTGCGCAAATATACTGATGTATTCAACGAGTCTATAGCCTTGGCCGACAGGCCC
+GGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAAC
+GAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTA
+CACACCGCCCGTCGCTCCTACCGATTGAATGGTCCGGTGAAGTGTTCGGATCGCGGCGAC
+ATTGCGGACGTGCTG
+>ds2020-267_291
+CAGCACGTCCGCAATCCTTCTCCCCTCACCGTCTGAACAAGGTCCGGCATGTTCCATTCC
+GGGGGTAATTGCTTATCGGACCTCGACACCCACTTGGTGTATTCCGAACAGAGCGCCTCA
+AATATTTGCTCACACTCAGGTGGAGCGCTTTGCGCGTCAGACCTAGTCGAAGAGGTACTT
+GACGAGAAAGACATACTCTCATCGTCCAGCATAAAATGTAAATCCCCGGGGGGCAGGATG
+CTTGCGGACGTGCTG
+>ds2020-267_292
+GACGCACTGACCGTGCATCCACGCCTGACGCACTGACCGTGGTTACACACCTGACGCACT
+GACCGTAAGTAGAGACCTGACGCACTGCCGTTAGTGAGACGGTGAATAACGGTCAGTGCG
+TCGCCTTAAGCGTCACGTCCGCAATACGTCAGGGATGGCCTTGCGGACAGTCCAACTCGC
+TTGCGGACGTGCTGAGGGAAGTTTGTTTGCGGACGTGCTGACGGGTAGGAGTTGCGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_293
+ATCTAAGAGCAGCACGTCCGCAAGTTGAGAACCCTCTTGACTACAGACGTTAGCACCCGC
+AGTCTGTCTCCCGGATATCACTCATCGGTATTCGGAGTTTGCATCGGTTTGGTAAGAGAG
+GCGGCTGGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCCGTCCGCAACCAA
+TTTCGGGTAGCACGTCCGCAACATCTGCTCCTCACACTCCGCAAATTAGACCCCATATCG
+TTTGCGGACGTGCTG
+>ds2020-267_294
+TCCGCAAGCATAATCCGCTCAGCACGTCCGCAAAGGCCTACCCCCAGCACGTCCGCAAGC
+TGGAAACGGTTGCTGTTGCGACGTGCTGGGCTTAAGACCTTGCGACGTGCTGAGTCATAT
+CTGCTTGCGGACGTGCTGCTCCTTAGATATCCGCAAGGCAACTGGAATTGCGGACGTGAG
+GAGAGGATAGTTGCGGACGTGCTGAGTGACCGTACTTTGCGGACGTGCTGCCTCGAGATG
+TTTGCGGACGTGCTG
+>ds2020-267_295
+CAGCACGTCCGCAAAAGCCCCACCCTGCTTGCAAAATGAAAGAAAAGCCCCTTTTTATAA
+GTTAAAAAGACTGTTATGAAAAAAAAGTGCTAGAATCTACATTTACACATTGATTCTTTT
+TTTTCGTGATTTTTGTTGAACCGTATGCATCAAAAGGTGCATGTACGGTTTCTAATGGAT
+ACAACTTTATCCCATTAAACCGACTTTATAGAGAAAGATTAATTTTTTGAGGACTGGGTA
+ATTGCGGACGTGCTG
+>ds2020-267_296
+CAGCACGTCCGCAAGCCGAGAGCGGTTAGTAACAGATTAAGTGGAGTATTCGTCACACAC
+GACGATACCGCACTTTTACAAGGGTTCAAGTTGTTTAGCTACACAAGGTGAGCAGAGGTT
+ATTAACATGGCATCTCACTCAAGCATGGCATAGCACACAAACATGGCAAGAGGTGAAGCA
+TAAATAAACTACCTAAGCTAGTCAATTTAAGTGGGGTGAAATCCTAGACATGGCAAACTA
+TTGCGGACGTGCTG
+>ds2020-267_297
+GACGCACTGACCGTGTCCTCCTCCCTATTACTCGTGTCCATGAAGAGACGAAATCTGCTC
+GCAACCGCGCTCCTTCGAGCTCCACACCGCTTTCGGGCGGATGAGAGGCACGAAAGAGCC
+GTCGTGAGAATCGAAGAAAGACGAATTTAAAGAACAATAAGCGGACGGTCAGTGCGTCGC
+CTTAAGCGACGTCCGCAAGGAACATCCGGTACTCATTGCGGACGTGCTGAGGAGTCCGTC
+TTGCGGACGTGCTG
+>ds2020-267_298
+GGACGTTCGGGCTTGACTACAGCAGTGAATGAGGACCTGCACAAGGAGTGGCAGGAATAC
+CTGGATGAGACCAAGCATCACGAGCAGGTGCTGACCCAGGTTTTTGAAGAACTGGGATTG
+GACACCGAAGAGATGAGTCCGGGCAGAGAGGTGGTGGCGCATAACGGCGCCTCCTTGGTG
+GCCGAGTATGCATAGATTAAAGCCCGAACGTCCTTATGCGGACGTGCTACCCGGAATCTG
+TTGCGGACGTGCTG
+>ds2020-267_299
+GACGCACTGACCGTTAACCACGCGCTTCAACCTGGCCATGGGTAGATCACTCCGCTTCGG
+GTCTAGGACACGCGACTCAATCGCCCTATTCAGACTCGCTTTCGCTACGGCTTCCCCACA
+CGGGTTAACCTCGCCACGTATCACTAACTCGCAGGCTCATTCTTCAAAAGGCACGCTGTC
+ACCCCACAAGGAGGCATACGGTCAGTGCGTCGCCTTAAGCGACGTGCTGGGGAGCGCTAG
+TTGCGGACGTGCTG
+>ds2020-267_300
+CAGCACGTCCGCAAATTAGTCTGCACTTTATTCCCTTCCCAAAAGCCATAACTCCTCCTG
+GGAACCTTCTCAATCCCCAGATAACTACTACAATCAAACTTCAGGACAGAAGAATTTCCA
+TCAGCATTGTGATGCCAAGTGAATTTTAGGTTAGATGACGTGTTGCTTAACTTATGGTTG
+TGAGCTCCCTTTTCTTCATTCTCCTGGATGTTGGAACCTGACTTGGGCAGGGACTCTGTA
+TTGCGGACGTGCTG
+>ds2020-267_301
+GGACGTTCGGGCTTTGTTTGGTCAATTGTCGCTTGAGTTCAATCCAACCTGCATCGTAAA
+CCGATTTGGCTAGTTTGCCTTTTTACTGTTAAATTGGGTTGTTCTAACGTAACCTACCAC
+GATTAGGAGGCGTGAACAAAAGCCCGAACGTCCTTAATCTAAGAGCAGCACGTCCGCAAG
+GCGTCACTAGTTGCGGACGTGTGAGGGGCTATGTATTGCGGACGTGCTAAGGCCCCCTAC
+TTGCGGACGTGCTG
+>ds2020-267_302
+GTCCGCAAAATTAACACCCTCAGCACGTCCGCAATACATTCCAGTCAGCACGTCGCAATC
+AGGCAAGTTTGCGAGGAGTGCTGTATGCTTGCGGACGTCTGCTCCTTAGATAAAGGACGT
+TCGGGCTTGACCAATCGCCTGGACGTTCGGGCTTGGTGATCCCCTGCCCGCTGTCCTTGA
+CTTGACCCAAGATAGTTCATCACAAAACTTACAAAACCTACCTAACCTATCAGAGCAGTG
+AAGCCCGAACGTCC
+>ds2020-267_303
+GGGGGGGTGTGTTTGGGTGTTGGTGTTGTGGGTGGTGGGTGGGGGTGGGGGGGGGGTTTT
+GGGTTTGTTTGGTGGTGGTGGTGGGGTTTGTGGGTTGGGTGTGCTGGTGGGTTTGGGGTT
+GGTTTTGGGGTGGTGGTGGGTTTTGGGGTGGGTGTGTGGGTGTTTTGTTGTGTGGGTTGT
+GTTGTTTATACGGTCAGTGCGTCAGGGTGGGATTAACGGTCAGTGCGTCAGGGGACGATC
+GACGGTCAGTGCGC
+>ds2020-267_304
+CAGCACGTCCGCAATGCATTTTCGGTCCCTGTTGAGAAAGGCAGATTCTCTCACCCGATC
+TGGGACTACTAATCTCTGCATAATCAAATGAGCACAAAATAAACTTACACTTTGTTTATA
+CCACTGTATTTGGGGTCTCTATTTCAGAAGCTCAGCCTGTGTCCTACTTATTCAACCCCT
+TAGAGGAATACAGCACTAATATAGAGGAAAAGGTAGTTTCCAGGTAAACTGGGGCCCATT
+TGCGGACGTGCTG
+>ds2020-267_305
+CAGCACGTCCGCAATGAGTTGGCACTGAGGGCCTTGAGGGCAACGGAAACGTTCTTTGCG
+ATAGCGGGATTGAGGATGTAGTGGCACGAAATATCCCAACCAACAGCACCGAACTGGTAG
+GAAAGAGAGTACCCATAAATCAATGCGTTGATAAAGGCATCTTCATGGAGTCTACCAGCA
+CAAAGGAAAATCATACCAATCAGTGGGCGGGCACAACCAATGCGGACAAGGGTTCAGTGT
+TGCGGACGTGCTG
+>ds2020-267_306
+CAGCACGTCCGCAATGGCATGGGGATTTAAGAGTTTCAAGAGGAGGATGGGAGGAAAAGC
+TTAAGGCTTGAAGGCTATGGTATTTATAGCTTGGAAGGGTATGAGGAGGACGGAAAATCT
+TGATTGTGATGGTTGATGAATAGCTGGGATGATTGCTGGAATGCTTGCTGCAGCCAAAGG
+GAGAAAGGAAAGTGGTTCGATGGTTGTTGGGGGCTTGAGCAACCAAGAGATGCTGGTGAT
+TGCGGACGTGCTG
+>ds2020-267_307
+CAGCACGTCCGCAAATGTCGTCCCCTCAGCACGTCCGCAAACACTCCGATATGGTTGCGA
+CGTGCTAAGACTTAGTACTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTGGTTCTTCCTATCACTCGTAACGCTCTCTCTCGCTCTCACTTTCCAACTCCTC
+CCATTCCCCTTTCCCAATCCAATGGCAGCAACCAAATCCAAAATCCTCTTCATCGGAGGC
+ACTGGCTACATCG
+>ds2020-267_308
+CAGCACGTCCGCAATCACCTCTGTATTTTCTTCAAACTCTGACCTACCGTCGGACGGTGA
+TTGGGATTCAAAGTTCTCCGGCTGGAGGTCATAGTTTGAAGCAAATAGCGAGAAGGAGAG
+GGAGAAAAGATAGGTCTGTATTTGAGGAAATAATTAATATTATTATTTCTTTTTTTGTAT
+TTAAAAAATGGGTTTTGGAATTTTTGAAAAAAATAAATTGCGAAGAGAAGGTTATAGAAT
+TGCGGACGTGCTG
+>ds2020-267_309
+CAGCACGTCCGCAACCTGGCGGCCATATAACTAAAAGTAAAGATAAAGTGAATTATTTTG
+TAAATGATATAAATTCATTGTTACATGTTATAATACCCATATTTGATTATGTAAATCTGA
+ATAGTTCAAAATATCATCACTTTGATATTTTTTATTTAAAAAAGGGGGTCGGTGTTATTA
+ACTAAAAATAAAAGTCATTTAACGGCTGAAGGTAAATTGGCAATAAAAGGTCAAGAACTT
+GCGGACGTGCTG
+>ds2020-267_310
+CAGCACGTCCGCAAACCTGGTGGGGTGCAACCTGTGCGGGTGGTCCGCAGCGGAGAAGCG
+GTATGGAATTTGTCCTCCGTTTCCTTAACCAGATGCTCGTCGTGTAGCCTGTTATTGGCG
+TGAGAGCACTTGATCTCGTCTTTGACGTGTTTAGTTCGTTGACTATCTCGGTCGCGACGT
+GAAACAAAGAGATATGACACCGCAAGGGGTCTATCGGGGTACCTCAACGGACTTATGCTT
+GCGGACGTGCTG
+>ds2020-267_311
+TATCTAAGGAGCAGCACGTCCGCAAATGTGTCCCGGTTGTTGTTCGATCAAATGCCAAGC
+CCGGATTTTTATTCGTGGAAGGTGATGCTGAGGTGGTACTTTATGCACAACTTGTATGCA
+GAGGTTATGGGGTTCTATACCCGTATGAGAATATGCGTCAGAGAACATGACAACGTTGTT
+TTCTCGATTGTTCTGAAGGCTTGTAGTGAATTGCGGGACTTCAATGAGGGGAGAACTATT
+GCGGACGTGCTG
+>ds2020-267_312
+GACGCACTGACCGTGGCGGTAGCCCTCCATTCCTGAGCGCACAGGCGCTTTCTTGGATTT
+TTGCCGCTCGCTCAAAGGCCGCAACATCACCGTATTTAACTACCGCATCAACACCAACCC
+CAAATACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAC
+CACTTCACTTGGGACGTGCTGAGGTGTGCAGCGTTGCGACGTGCTGAGCCCTAGTCGATT
+GCGGACGTGCTG
+>ds2020-267_313
+CAGCACGTCCGCAAGGACACACTCTCAGCACGTCCGCAAGATTTATCTCCTCACACGTCC
+GCAACAAGGGCCGATTATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTCCTTTGATCCTTCTGCAGGTTCACCTACAGAAACCTTGTTACGACTTTTACTT
+CCTCTAAGTGACCAAGTTTGCCTAAGTTTTCAGCGGCCTGCTACCGTTGCCGGTACAAGC
+TGCCAATCCCAA
+>ds2020-267_314
+GACGCACTGACCGTGAAAGCCTCCCTGACGCACTGACCGTTTCGTATGCTCTGACGCACT
+GCCTTATATCCCCTATGGGGGATGGGACGGTCAGTGCGTCAGGGAAGTGTCAACGGTCAG
+TGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCATTACCCGTTAGCAGT
+TGGGACGTGCTGAGGTGGCGAAATTTGGGACGTGCTGAGGGAGGGCGTATTGCGACGTGC
+TGCTCCTTGATA
+>ds2020-267_315
+CAGCACGTCCGCAAGCAGCCATAGGTCTGAGAAGCATTACCGCCAACTGGTGAATCATGC
+GTCTGAAGGCATTATTGTTGTGCAGAATCAGAAAATTGTTTTTGCTAATCCTCAGATATA
+CAAACTCACGGCACGCCAACCGGATTCTTTACTGGCATTCAATTTTACTGATTTAATTGA
+CGAAGCTGATCGGCTGATCGTACAGGATTACGAGCAGCGTTGCTTACAGGGGGAACGTTG
+CGGACGTGCTG
+>ds2020-267_316
+GACGCACTGACCTTTGTCACCACGTTTGTGATCAACGCGTAGAAACTCAGCTATTGCACC
+GAATGCGCACTTAGAGGGCTGCGTTCGTATGCAAAGCCTTTGTCCTCTCTGGAGTGTGAA
+ACGAGTTATTTCCAGTGACGTCGTCCCTAGAAGCACATCGTCACCGTTGTGCAGTGAAGA
+GCCGACTTCTTTCATCGGACCCAACATGAAGTCGGTGTAAACGGCATTTCGGACGAGTTG
+CGGACGTGCTG
+>ds2020-267_317
+CAGCACGTCCGCAATCGACCGCCATTAGCTTGGGACGTGCTGAGGAGATGGAGCTTGCGG
+ACGTGCTGAGTGCAGAATAGTTGCGGACGTGCTGCTCCTTAGATAGGAAGTAAGGACGTT
+CGGGCTTAGAATTATCCCTGGCGTTCGGCTTCCTACAGCGAGTGGAAAGCCCGAACGTCC
+TTACTTCCAGAAGTGCGTCAGCGGGTCGCATACGGTCAGTGCGTCAAGGATGTTTCGACG
+GTCAGTGCGTC
+>ds2020-267_318
+CAGCACGTCCGCAATCTGGACCCCTTTCCTTTGTTTCTACATCCCTATCCCAAAAGACTG
+AATTGAGTTCGTATAGGCATTTTGGATGCCTCTATTGAAATTGCCCTTCTGGCTATATTT
+TCTGCTACTCCGCTCATTGCAGAAAGTATTCTACAGGGTTTAACAACAGCTACCCAATAT
+TCGGGAGATCCTTTACCCGAACCCATAAGTGTATCTGTAGTGCTGAGTGTAACGTGTTTG
+CGGACGTGCTG
+>ds2020-267_319
+CAGCACGTCCGCAAATGAGTCCCCCTAGCTTGCGGACGTGCTCTGGAAGTAAGGACGTTC
+GGGCTTTATGGGAGCTCTGAGCGCATTCTGTTTTTCAAGGGTAATTCCTAGCCTTTCCGG
+ACCAGAGTTGGGCGTAGTTCCTGGATTGAAGTCTGCCTGAGAAGCTTGTACAGCAAGGCT
+CTAAGGTTGCGGCGTGCTGACGTATAGGGGTTTGCGGAGTGCTGAACTCACCAATGTTGC
+GGACGTGCTG
+>ds2020-267_320
+GGAGGCAACTTTCCCGTATGAGCATTCGGTACATGTATCAGTCCGTGGAAGAGTGAAAGG
+GTCACCACTACTGAGGATCTCCCCCCTAATCTTAGATAGGTCGTCTGAGGGTTCGCCGCG
+GTTCATTGCTGTGCTTACACACTAGGCTACCCTTCTCCGAAAGCTCCGCGGGACCACCTA
+CCACTAGTCTTCGGCCGGAGGGGTTTATTGCACAAAAACGCCAGTCCGCAAGCCCGAACG
+TCCTTAATCT
+>ds2020-267_321
+GGACGTTCGGGCTTTTTCAGTTGGGTATGAAGCCCGAAGTCCAAGGAACCTTGTAAGCCC
+GAACGTCCTTACTTCCAGACACTGACCGTCGGGGGACAATTACGGTCAGTGCGTCAGGGA
+AACCTAAAGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCTT
+TATGGTTGGGACGTGCTGAGCGGTAGTGGTTTGCGGACGTGCTGAGGGAGCGCAAGTTGC
+GGACGTGCTG
+>ds2020-267_322
+GGACGTTCGGGCTTAACATTGACTCTGGGTAACTGATGTGTAGGATAGGTGGGAGCCTGT
+GATCCGGCGTCGCTAGGCGTCGGTTAGGCAACGTTGAAATACCACCCTTCAGTTGCTTGG
+AGCCTAATCCCCGAGGGGGAGACATTGTTTGGTGGGTAGTTTGACTGGGGTGGTATCTAA
+GGAGCAGCACGTCCGCAACAGCGCCAGAGTGATTGGGACGTGCTGCCCGTGTCATATTGC
+GGACGTGCTG
+>ds2020-267_323
+CAGCACGTCCGCAAAGCCCGCGATGACTTTGTCGTTGTACAGACGGCGGACCTTTTTCAC
+GTTGCCTTTCATTACGGTATTGCCCAACGTGGCCTGACCATCACCAGCGATGACCACATG
+GCCGTTACGGCGTACGCTTACTATAGTTGTCACGAGCTGACCCCTTGGTTACGAATACAG
+AGTACAAACCCCGTACAAAAGTACGGGGCATAATGCAATTATAGATGGCTGAGGTGTTGC
+GGACGTGCTG
+>ds2020-267_324
+TTTCGATCTAGCTAAGGAGGAGCAAGTCGGCAATGAAGCCGCTTTGTATGAGGCGCTTGT
+TTCACGTTTGGGTGGAGAATATCTTGATGTCGCCTTCGATGCTGTAGGAGGGCCACATAT
+TGAACAGATTGCAAAAGCGATGTCTGTGGGAGGACCCGAATGCAACCGGTCAGTGCGTCG
+CCTTAAGCGATCCGCAAGTAGGTAGGTATAGTTGCGGACGTGCTGAGTACAGGTCACTTG
+CGGCGTGCTG
+>ds2020-267_325
+CAGCACGTCCGCAAGCTGATTCTCCTCAGCACGTCGCAATATCATTAGCCTCAGCACGTC
+GCAATAATCGGCCTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGA
+CCGTGCGCTTCGCGCTCCCCAATTGTTCGCGCCGAAATTTTCTGTAATCCAAAATGACCC
+GCTGAGATTCGTTGTCCAAATAGTCAAATTTGCGTGATTTGATGGCGTAATAAATGTCAA
+AAATAGACAA
+>ds2020-267_326
+CAGCACGTCCGCAAAGCGGCCCGCTAGCCGTCCGCAACTATCTTCCCCTCAGCACGTCCC
+AACTAGTTCCAGATTGCGGACGTGCTGCTCCTTAGATAAGCTGGAAGTAAGGACGTTCGG
+GCTTGTGGCTCCATCTTATTTAAGGAGCAGCACGTCCGCAAGTGCCAGCTCCTAACGTTT
+GGGACGTGCTGAGGGTACCTACATTGGGACGTGCTGAGGGCAGTGAGATTGCGGACGTGC
+TGCTCCTTAG
+>ds2020-267_327
+CAGCACGTCCGCAAGACATCACCTATTGCGACAAGTTAATGGACACTCCATACACTGCAT
+CCCCAATTGGCCGTTTAGAAGCCAATGGGCTAAGTGCTGGGCTTTTCCCGTTTCGCTCGC
+CGCTACTCAGGGAATCCTAGTTAGTTTCTTTTCCTCCCCTTATTAATATGCTTAAATTCA
+GGGGGTAGTCTCATATGAGTTGAGGTCGCAAGGGAATGGGTTTGCGGTCGTGCTGCTCCT
+TAGATAGAT
+>ds2020-267_328
+CAGCACGTCCGCAATGTTCACCATTTCCATAAACAAATGAGTACTATCCTCGACTGCTAC
+TAACTTTAGTGCGTTCTCAGTTCTGCCTGACGCTCTTAATATTACGATTGACGCCGGCGC
+CTGGTTTGGCCTCAATCGCAGCCTGACATAGTTATTTGACCTTAACGCTGAAGCGCTCGC
+CGTAGCCATCACTATGCCGTGCCAATCATAACCAGAACCTCCCACTGGCGGCGTATTGCG
+GACGTGCTG
+>ds2020-267_329
+CAGCACGTCCGCAATATAATATCTCTCAGCACGTCCACAACTTGATTCTTGCGGACCTGC
+TGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTGTGTAAGCGACTGGGGTACGCCGT
+TCTGGCAAATCTGTTTTATTGATGCAATATCGAGATTATTTGCTGTCCCAACAAATTAGT
+GCAGAAAATATTATTTATATCAATTTTGAGAGTTTTGAGTACCAGTGGGTTAAAGTTGCG
+GACGTGCTG
+>ds2020-267_330
+GACGCGCACTGCCGGCAGCCCGGCCCTCTGCTCTGCCCACCCGCGAAATAACCAGCACGT
+CCGCAACCATGATCCCCTAGCACGTCCGCAAACTAATTGGACTCCACGTCCGCAACTGAT
+TGGTGCTTGCGGACGTGGAGTCCAATTAGTTTGCGGACGTGCTAGGGGATCATGGTTGCG
+ACGTGCTGACGAGATCTTAATTGGGACGTGCTGAGGGACTGCGACTTGCGGCGTGCTGCT
+CCTTAGATA
+>ds2020-267_331
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTTTCGTTCCTCAGCACGTCCGCAAAG
+ATCCAATCCTCAGCACGTCCCAACCGGCTATGGTTTGCGGACGTGCTGCTCCTTAGATCT
+GGAAGTAAGCCCGAACGTCCTTACTTCCAGATCTAAGGAGCAGCACGTCCGCAAACGACA
+CTGACTCAGCCGTCCGCAACCCCTTCCCCTTCAGCACGTCCCAACCTTCCAATACTTGCG
+GACGTGCTG
+>ds2020-267_332
+CAGCACGTCCGCAAATTTCTCTCTTTCCAAAGTTCTTTTCATCTTTCCCTCACGGTACTT
+GTTCGCTATCGGTCTCTCGCCTATATTTAGCTTTAGATGGAATTTACCACCCATTTTGAG
+CTGCATTCCCAAACAACTCGACTCTTCGAGAGCACACCACAATGCATCGGTAGTCCGTGT
+CATATACGGGATTCTCACCCTCTACGACGCTCCGTTCCAGGAGGGGGGTATGCGTTGCGG
+ACGTGCTG
+>ds2020-267_333
+CAGCACGTCCGCAAGAGCCCCGTCTTCCTTCTCCTATTTCAATTCTTGACAAAGCTGGAC
+GAGCACATCATGCAAGTGTTCATATAGAGGATGGTGGAATAGTTTGAGTCTTGGCTCTTG
+TTTCATGTTGACAGTATCAGGTTCTTGATTAAGTTCCTCTGATGTGCTAACAATTTCCTG
+ACTTCATTTTATATAATAGATAGTGGAATAGTAGAAGATACCATGCATGGCCTATTGCGG
+ACGTGCTG
+>ds2020-267_334
+CAGCACGTCCGCAAGATCATGGTCCTCTGCTTTAGACTCGTCCCAGCCCATGGTCACCAT
+GAACTTCAACGCTCGTTTGTTGTAAGGGACATTGACTGTGGCTGGCAATTCAATTGAACG
+TGAAACCCACAGGGCCCGGTCTTCGCCAACTTCACGGATTAGGTCAACCTCATCCCTAAT
+CCACGCAAGGACTACGGAATACAACTTGAAAGGAGCAAATCCAGCGAACTTGGATTGCGG
+ACGTGCTG
+>ds2020-267_335
+CAGCACGTCCGCAACGAACCTCGAGTAAGACAACCAACCCTGGAGGCCATGGCTTGGCTT
+TATCCCGTAGGTAGTAAGAACAGAGAGAGCCTTCTGTGCTAGCAATACAGAGAGGTGGGG
+ATTGAATGAGGCGAGCGCTGACTGCAGCAAGACCACCAGACCCTAAAAAGAATAATAACA
+ACGTTCAGCAAGCCGAAGCCAGCCAGACAGGCACCACCAGATACAGGGCTTGGATTGCGG
+ACGTGCTG
+>ds2020-267_336
+GGACGTTCGGGCTTGGCTTCTAGGGTTTCTGTCAGGGTGCCGATCTGGTTGAACTTGATC
+AGGATCGAGTTGGCGATCTTTTTGTCGATGCCTTCTTTCAGGATCTTGGTGTTGGAGGAT
+TCCCTGAAAGCCCGAACGTCCTTAATCTAAGGAGCAGCACGTCCGCAACCCTTACCCAGT
+GACACTTGCGGACGTGTGAGGATCCGGCCATTGCGACGTGCTGACCCAAACTCTGTTGCG
+GACGGCTG
+>ds2020-267_337
+CAGCACGTCCGCAACTTCAAGGGTGTGTTTTCTTTTGTACCTGCGGGTTATTTTGCTTGA
+TTACATACATATACATGGAATAAAGCAGTTTTACTATCTACTTTGTGACCTGCTGAAGTG
+TTTTTGGTATCATTTATATTGCATTTTTGCAGATAATAGGAAATACAAAGGAGTTTAAGC
+AGAAACTGAAAGATAGCATCAGAAGGAAATCTGATTTGTTTAAGAATGGTAATTTGCGGA
+CGTGCTG
+>ds2020-267_338
+CAGCACGTCCGCAAGCTTTTTGGGGTGTCGAGAGATACCTACACGTCCGCTATTGAGTCC
+CTTGGGTCTTTTTCGTTGACTGAGGTTGAAGAAATTGTAGAAAAATACAAGAAGATGTGT
+CTTACTCCCCTCGAGTGCATGAGGAATTTATTATCTTTCATGTTGCAGATGAGGTGTGGT
+GCGAGAGGCCAAAAAAGAATGGATCCAAATAAAGATTTGTAGCGGCATCATGGTTGCGGA
+CGTGCTG
+>ds2020-267_339
+CAGCACGTCCGCAATACGAGACCGCTCCCAATAGATATTTGAGCATATATTCATGCCCTT
+TACCTGATGAACCAAGCAAGTTTGAACGCCAAATAAACAGATTGCGTGGGAAGTTGGCAG
+GGTTATCTGGGCTTTCACAGGCAAAACTTAATGAGCCATTTTGTAGGCTTTCGACCACAT
+AATCTTCCACTTTCATGCCTTTTGCTTTGGCTTCATTGGCAAAGGAGAGTGAGTTGCGGA
+CGTGCTG
+>ds2020-267_340
+GGACGTTCGGGCTTCTCGCACTGGGTCTGGAGCTGGGTCACGTGCTATCCTTAGGTTAAT
+AATGTTAACAATAAGTCAGTAATTTTTAAAAAAACACAAACTGATAGCATAAAAAAAAAG
+AATGGCGCTAAACCATTCTTTTTTGAAAATGTTTAGTTTTTATATCCACACGCATCAAGT
+CAATTGACGATGATTGACTTTGTCTAATTTTAACGCTTCCAACTATATGCTTATTGCGGA
+CGTGCTG
+>ds2020-267_341
+GACGCACTGACCGTTATAGGGCCTATTACACGGTCAGTGCGTCGGAAAAATGGGAACGGT
+CAGTGCGTCAAGGGACGCCCTACGGTCAGTGCGTCGCCTTAAGCGCTTAAGGCGACGCAC
+TGACCGTAGTTTAATGCCTGACGCACTGACCGTAACCATCTGCCTGACGCACTGACCGTG
+AACCTACCCGTGACGCACTGACCATTTCCCCCCGGACGGTCAGTGCGTCGCCTTAAGCGA
+CGTGCTG
+>ds2020-267_342
+CAGCACGTCCGCAACCCTCTATTGTTATCCATGGATCCTTTATTTATACTTATTCATTTA
+GAACTTATCCATTTAGAATAGAAGTATTGATCCAATAAAAAAAATTATGTTTCGTAATCT
+CATAATCCAATTTTTCAACTTTTCATTGATTCTTGGATACAAATCACGAGAATGTATATT
+ATTCCTCGAATTTTTTATTGAGAGGTAAAGGATTAAATCCAGGGGGATGCGATTGCGGAC
+GTGCTG
+>ds2020-267_343
+CAGCACGTCCGCAAAGGACTAACCTTCAGCACGTCCGCAAGTCAATACCTCTAGTTTGCG
+GACGTGCTGGGGAATTCCGGGTTCATGTGAACAGTTACAGTCCACAATCCCAACCAAGAA
+GGTGGTTCAATGTTTACCCAGACCTCTCGGCCAAGGATAAAACACACTGATACCTTCATT
+GTAGCGCGCGTGCAGCCCAGGACATCTAAGGGCATCACAGAGAGGACACATTTTGCGGAC
+GTGCTG
+>ds2020-267_344
+AGCAGCACTGACCGTCTCTGTTGCCATGACGCACTGACCGTCCTCATGCGACTGACGCAC
+TGACCGTCATGCACCACCTGACGCACTGACCGTTAATTATTGCCTGACGCACTGAACGTG
+GATTGTACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAAATGGTAGGTAATTGGGACG
+TGCTGGGGTCTGGAACTTGCGGACGTGCTGGGGCCCTTCAGTTGCGGACGTGCTGCTCCT
+TAGATA
+>ds2020-267_345
+CAGCACGTCCGCAACTGATCACCACTCGAGGGTTTTGGCCTGGCCCTGCCCATTCTGGTG
+GGTCGTTCGTCGAGTGGCTCGTCTGGCGCTTCACTTGGATTGTTGTTAACGCAACTGCCG
+TCGCTGAGTCTGTCAATGCCGAAGTTCGGAAAAGGCATAGTGATAAAATATCACCAGACT
+CTGTCCGCCTTGCAGCAATATTCAGGAGTTTCTTTATTCAAGGTGTTGCTCTTTGCGGAC
+GTGCTG
+>ds2020-267_346
+GGACGTTCGGGCTTTGTGTTGCATGTTTATCAAAAACAAGCACAACAATTGAGCATCTTT
+GTAGAAACGCTACAACCGCCGCTACAATTATTAATTTTTGGCGCGGGGCAAGATTGTTTA
+CCCTTGATGACCATGGCAAAGGCTCGTTACTAAGCCCGAACGTCCTTACTCAGTATCTAA
+GGAGCAGCACGTCCGCAAAAGGAATATTGTGGACGTGCTGAGGGGCAGTAAATTGCGGAC
+GTGCTG
+>ds2020-267_347
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACAAAGAACGCCTCCCTTCTATAACCA
+TTTCTTTACAGAAGGCATCTATTACCCGATCATAAAGATGTTTTTGTGATTTCAACGTAC
+AATTCACAACGATTGTAAAGTTAATATTGTCTCGATGAACAGCGTCTCGGAAACCTTTAT
+TAACTTGATGTTGTAAGTATTGAGTGAAACCCGGATGTGCTTGCGGACGTGCTGCTCCTT
+AGATA
+>ds2020-267_348
+TCTGGAAGTAAGGACGTTCGGGCTTTTCGTAGTGGCTCGTTGGGAGAGGGTGGGTTGTCG
+TAGCTGAGGGCTTTTCAGGGTGTCAGGTTCCGATTCGGAGCTGGTGGTGGAGGTTGGTGG
+GTTGGTAGTAACGGAAACTGCATCTGATATCGATGGTTGCTTGGTAGGTGTTGGTCTTGG
+TCTAAGAGACATGTTGGACTGTGGCAGCGGAGGTGGCGGAGGCCGTGACTGTTGCGGACG
+TGCTG
+>ds2020-267_349
+CAGCACGTCCGCAATACTAACGCTGTCCCCCCTCAGCTCACCCTAGCCCCGGGCCTTTTG
+CTCTTCTAACGTAAGCTCCAAGGCTTCACACCAAGTCTTCACTGACATAATATGCATGCT
+TAAGTAGGGTCAGGCAGAACCGTTGTTGCCTGATGGGAACTTCCCCCATATTGCTATCAA
+TGTCTTCATGTCGCACGACCTCTTAACATTACACCACTGAAACCAAATCCTTTGCGGACG
+TGCTG
+>ds2020-267_350
+AGCAGCACGGCCGCAAGATCCATCTGATGATCGATGTTGGGTATTTTACAATTTGCTTTA
+TTACATTATCATTATATAGGCTCGCCCCAGTTCGCTATTCTTGTGATTCCGAATGCTAGC
+TGGTGGGCTTTCAAAGGTATGGGACGATCAGGATGGCTTGGTCCAGCTCCCTTTAATCTT
+TAGATCAATCATATGCCCTCCCCAACCTTTTCTATCTAGTAGGGCGATATGATGCGGACG
+TGCTG
+>ds2020-267_351
+GACGCACTGACCGTATAATGACCCATGGACGCACTGACCGTCTTCTTATGCCTGACGCAC
+TGACCGTGTGGTCACTCTTGACGCACTGACCGTTGAACTACTGTGACGCACTGACTATGT
+CGACCACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCGCAAACTTCGGCCCTTAGCACG
+TCCACAAGATCCCAACCGTGGACAATTGCGGACGTGCTGAGGGATACTGCCTTGCGGACG
+TGCTG
+>ds2020-267_352
+AAAAAGGCGACAGAGGCTATTGCCCAGGTAAGCTCCCGGGTGGGACAAATTGTGAAGCCT
+ACCGAGTGCATCTATTCGACTTGCTTCTTGACGTACGGAAAGGAGATGATCCTGAGAGGC
+GCCTACTTGCGGACGTGCTCTCCGTAGATAGATCGAGGCGACGCCCTGACCGCTCGCAGT
+CCTCGACGCACCGACCGCCCCTTCGCCCCTGACGCACTGATCGTGACATGTACGGTCAGT
+GCGTC
+>ds2020-267_353
+GACGCACTGACCGTTCTGCGCTGGCTTTTTCTGAATGAGAACACGCTGACGCCGGTTGAA
+CATACTTCCTGGAAATTAAGTGCGCTGCGTATTTTTCTGCTGTCCGGTTTTCTTCTGGAA
+GGCGGAATTGCGATTCACAGTTCATTGCATGCCTATGCACAAGGCACTTACCCTGTACTG
+TGGGCTTATTCTAGGCGGTGTATAAAGCCCGAACGCCAGGGTGTTCCGCAAGCCCGAACG
+TCCTT
+>ds2020-267_354
+GGACGTTCGGGCTTTGGATTTTTGGTTTTTTCCTCTTTCTCTATCCCTATCCCGTAGGTA
+CAGCGTTTGAATCAATAGAGAACCTTTTTTTCTGTATCTGTATAAATGTATCTAATCGAT
+ATTATTACATTCCAATTCCTTCCCGATACCTCCCAAGGAAAATTCCGAATTGTATCTCAA
+ATTGCGGACGTGTGAGCGAAAGCCTTTTGCGGACGTGCTGGGCCCATGTATTTGCGGACG
+TGCTG
+>ds2020-267_355
+CAGCACGTCCGCAAACCCCCCTCTTAATAATCCCCGTAACCCCCGAGAGGAGCACGGGCC
+ACTTTGGCGTTAGGCCACGCCTTGCGATAATCCTCTCGCCCCAAGAGGACTAAATCGCGC
+CACTGCTCAAATGTCAGCCGCTTGGGAATTGGCACCTCAACACCCACATTGCTATAGTCC
+CGCGATACCATGCGTTTGAAGTTCGGGGGCCAATCGAGGGGCGGGGTCATTTGCGGACGT
+GCTG
+>ds2020-267_356
+TATCTAAGGAGCAGCACGTCCGCAAGGGGTGCGTCGCTGGCGCGCGGATTAACAACGACC
+ATCAACAAACAATCGATTCAGAACTGGCACGGACCAGGGAAATCCGACTGTCTAATTAAA
+ACAAAGCATTGTGATGGCCCCAACGGGTGTTGACACAATGTGATTTCTGCCCAGTGCTCT
+GAATGTCAATGTGAAGAAATTCAAGAAAGCGCGGGTAAACGGCGGATCCATTGCGGACGT
+GCTG
+>ds2020-267_357
+ACAGCACGTCCGCAAAGGTCGCCAGAAAAGTCAGCATAATCAGCCTCCGAAATCATCAAG
+CATGATGTTCTCATCTTCCACGCCAAGATATTTTAGCATCTTAATCACGGCGGCGTTCAT
+CATTGGTGGACCACACATATAGAACTCGCAGTCTTCCGGTGCCGGGTGCTGTTTGAGGTA
+ATTTTCATACAGCACGTTGTGGATGAAGCCCGTATAGCAGGGGAGTTTCCTTGCGGACGT
+GCTG
+>ds2020-267_358
+CAGCACGTCCGCAAAGCTCACTTCGTTGCTCTGTCTCTGTCTCGATCCCGCTCCCGTTCC
+TTGTATCTTTCTCGATCCCGATCACTATCCCTTTCTCTTTCTCTTTCTCTTTCTCGATTC
+CGATCCCGGTCCCTTCCTCTGTCCCTGTCCCTGTCCCTGTCCGAATATTCTCTGTCAGAA
+TACTCACGGCTCTGGCTGCGATGGGTCCGTAGATCATCACTGCTGGCTGCTTGCGGACGT
+GCTG
+>ds2020-267_359
+AGATACGCTTAAGGCGACGCACTGACCGTGGAGTCTCCCCTGGGGAACATACGAAAGCTT
+TGGAATATTATTTTCGGGCCCTAGAGCGAAACCCATTCTTACCACAAGCTTTTAATAATA
+TGGCCGTGATCTGTCATTACGTGCGACTATCTCCACTATAGAAATAAAAAAAGGAAATAA
+AGAAAAAATCCGTTAACGTTAGTAAATACTAGAAACAAAGTGTAGGCTTAACGGTCAGTG
+CGTC
+>ds2020-267_360
+CGCACGTCCGCAACTTTGGAGGAAGAATTAGAAAGTGGCTGTTGAAAGTTGGTCTCTTTC
+AATGGTCCTGCCTCAATAACAGGCTTGTCAATAATTTGGATCTCACTACTCTGAACTGTG
+TGCTTCTCAGTCTCAAGATCAACTGCCGCTGGTTGAGGAGCTGATCTGATGGTAGATGCA
+TGGGGAGGCACTAGGTCAGATTGAACTCTAGGCGGCACAGAAAGATGCTGTTGCGGACGT
+GCTG
+>ds2020-267_361
+CAGCACGTCCGCAATTCGACCCGCTTTTGGATAACAAGAAGGCGAGCTGATCTGCTTTGA
+TCAAGGAAAAAGCCCAGTCAGCCACCAACTCGGTGCAGGTCACGTGACCTGCAGCTCGGC
+CTTCGCTTTTTGAGGCTTCCTCTACCCACATCTCTATGTGCCCGCAGCACTTCCATATGG
+AGAAAGATAGGCTTACCATGTTCCATCAATAGCACCTAACTAATGGAACTTGCGGACGTG
+CTG
+>ds2020-267_362
+CAGCACGTCCGCAACCACCCCCCACTTTCGTTCTTGATTAATGAAAACATCCTTGGCAAA
+TGCTTTCGCAGTTGTTCGTCTTTCATAAATCCAAGAATTTCACCTCTGACTATGAAATAC
+GAATGCCCCCGACTGTCCCTGTTAATCATTACTCCGATCCCGAAGGCCAACAGAATAGGA
+CCGAAATCCTATGATGTTATCCCATGCTAATGTATCCAGAGCGTAGGCCTTGCGGACGTG
+CTG
+>ds2020-267_363
+CAGCACGTCCGCAAAATGTCCCCACTGATACCTAATCGATAACGAACCTGAATGGCTTTT
+TTAGGTCCAATTCCATCAATTTTTGTTGAGGCAATTCTTACTTGTTCATCGGCAACTGAT
+CTAGCTCCTGAAATATATGACATTCTTGATCCTTTCCTTTACTAGTCTTCTCGGCTGGAA
+TCAAAAATGGGCTGTCTCCTCTCTGATGATCTTTTCTATAGGTAGAACATTGCGGACGTG
+CTG
+>ds2020-267_364
+CAGCACGTCCGCAACGGTCAAGGGGCAGCACGTCCGCAAGGTATCCGGGCCATCATTTTT
+CCTTATTTCACTTACAAAATAGGCGTATCACCAACGCAATACGCCTTTGTATAGGTTGAT
+TGATAGGTTAGTTCACTGCATCTTTTAACGCTTTACCTGCCTTGAAAATTGGGGCTTTTT
+TGGCAGGTATTTGGATGGCTTCGCCTGTAGCAGGGTTACGCCTTTTTCTTTGCGGACGTG
+CTG
+>ds2020-267_365
+CAGCACGTCCGCAACTTTCACCTCGTCTTCTTCCATACGTTTCATCACTCTAGCACAAGC
+CTTGAGAGCAAAATTGTATGTGAAATGATCAGACCTAACATTCGTTTCCTGCATATAGTT
+GTAAATATGTATAGCTTTGATGGGGAAGACGCTGTTGGTGTAAGCCCTGATCATGTTGTT
+GCAGATGAGAGGGTCGTCCATGGTGGTCTCTTCGAACAGGGCTTAAGATTTGCGGACGTG
+CTG
+>ds2020-267_366
+CAGCACGTCCGCAAGTGGTAATTCCTCCCTGCTTAAGAGCCACAGCATGTACAACAAAGT
+TTGAACTTCTCAGCAAGATCTAGAAAGCCTGTCCCAACCCGGCTGCAGCCTCCTCTTGGC
+AGCCTCACCTTCAGGCCTTTGCTCCTACAGTTCTCTCTGCTTTGCATGCCTCTCCCATCC
+GCTTGTCCAACTTTTGCTCAACCTTGAACTTTTGCCCATCATAACTCAATTGCGGACGTG
+CTG
+>ds2020-267_367
+TCCGCAATTGCCGTCCCCCAGCACGTCCGCAATAGCAGTCCACTCAGCACGTCCGCAATA
+CGATCTCCCTCAGCACGTCCGCAAAGGGTAGTCAAATTGGGACGTGCTGACCGATGTGAC
+GTTGCGGACGTGTCTGGAAGTAAGGACGTTCGGGCTTAAATTTGCTTATGATGATATGGG
+CTAGTAGCGCAGCGGTGGCAACGCTTTTATCGATGATAGTGATCACCAGAAGCCCGAACG
+TCC
+>ds2020-267_368
+CAGCACGTCCGCAAATATTCCTGGGCAGCATGTCCGCAATTCGTATCACCTCACACGTCC
+GCAACTATACCCTGTTAATTGCGGACGCGCTTAAGGCGACGCACTGACCGTGTCACAACC
+CCTATGGCGTTTACCCTTTGGTTCGCCCCATCATTTGAAGAAGTCAAACAACGTAGAGCG
+GAACTTGCTTTGATAGAACGTGAGACAGGGGCGTGGAAGTGCGGACGTGCTGCCCCTTAG
+ATA
+>ds2020-267_369
+CAGCACGTCCGCAACATTTTATCCATTGGACGTGCTGAGAAGAGGCTTTTGCGGACGTGC
+TGAGTGGGCGGACTTTGCGGACGTGCTGCTCCTTAGATACTGTAAGTAAGGACGTTCGGG
+CTTCCGCATACACCTCTTGGTCACGCTCAAAGGTCAAGGTCATACCATCTTCAGGGACTG
+CCAGTCCTTGCACTTGTACTTCATCGCTCGGATGTAGCATCAGTAATAAGCCCGAACGTC
+CTT
+>ds2020-267_370
+TCAGCACGTCCGCAATCTTCGGTCCGTGCAGCATTTCCACGATATCGTTATGATCAATTA
+ATGGGACTTGGCCGGAAAGTGTTCTTGCCTCTATCATTAGCTCGGGTAGTCCCCGTTTCT
+GGTGTTTCAGTCACCTTTCAATGGCTCCCTTAATTATGCGCGAGGAATTTTCCTCTGGAA
+GCGGGCTAGTCCCCGAAAATGCTCGTTAAAGTTGGGGGGGCAGTTTGTTTGCGGCCGTGC
+TG
+>ds2020-267_371
+CAGCCCGGTCTGACTCAATCGTCTTCCGACTTGGGAAGAAGTGCCCCCGAAGCACTCCAT
+TCATCTGGTGATGAAGAATCTCCTATCGCTTCATCTTCCGCTGCCCTTTCATTCTCTTCA
+GTTGTCTTCCTTCTTCCGTGTGGAGGAATGCCGATAGAACTGTGGATACCTCAGCTTTGG
+GAGAGACCTCCGTTTTGGTCTTCCTAGAAAGTGAGGAGGCGCCAGATTTTGCGGACGTGC
+TG
+>ds2020-267_372
+CAGCACGTCCGCAACCGCATGCGATCTACGGGTGAAAGGGGGCGCAAGCTCTTGCTATTA
+GATGAGCCTAAATCAGATTAGCTAGTTGGTGGGGTAAAGGCCCACCAAGGCGACGATCTG
+TAACTGGTCTGAGAGGATGATCAGTCACACCGGAACTGAGACACGGTCCGGACTCCTACG
+GGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAGTTTGCGGACGTGCTGCTCCTAGA
+TA
+>ds2020-267_373
+CAGCACGTCCGCAAGCTATACATGCTGCATATCTTTTCAAAGAGGCTGGAAACCAACAAG
+TGAATGGAATTGTACCACCGAAACCAAGTTCTGCTGGCGATTTTCCAATTGGACAGGAGC
+AACTAGTTTCAGTGACGAGGGATCATAATTTTCCCGCTCTGCAACAATATGGGGGGGTCA
+AAGGGCTGGGAGATTTATTAAAAACAAATCTAGACAAGGGATTACATGTTGCGGACGTGC
+TG
+>ds2020-267_374
+CAGCACGTCCGCAATGACTCTCTGTTCAATTGCGACCTTATAATGCAATTGCATTCTCCG
+GTCCAATTGCTGTTTTTGTTTCTGTATTCCTAATTTATCCGCTAGGTCAGTCTGGTTGGT
+TTTTTTGCGCCCAGTTTTGGTGTAGCAGCTATTTCGATTCATCCTCTTTTTCCAAGGGTT
+TCATAATTGGACATTGAACCCATTTCATATGATGGGAGGTGCTGTGTGTTGCGGACGTGC
+TG
+>ds2020-267_375
+TCAGGGTATGGAGCCACCGTCGCATCGGTATAGCATATCGAGTGGAAAAGGCTGATAGGG
+GTCACCACTCCCCGTCCTATTTCCAATGCGAAGAATCCCAGTTGAGTTAAGAAAACAGAT
+AGGTCGAACCTATCCCAAGCATTTATAGCCCTCGTGAATTCTATCTAAGGGGTATCCAAA
+CCACCAACCCCAACTAGATCCAACCAATGCCATTTGTAAAGCCCGAACGTCCTTACTTCC
+AG
+>ds2020-267_376
+GGACGTTCGGGCTTCATTGACTCTTGGACGTTCGGCTTATCGTCCCTACTAGAAAGCCCG
+AAGTCCAGGCCCCTAATTAAGCCCGAACGTCCTTATAAGGAGCAGCACGTCCGCAACTGC
+TGCGCCCTAGCACGTCCGCAAGACGCAACGCCTCAGCACGTCAGTGCGTCAGGATGTAAG
+TGACGGTCAGTGCGTCAGGGCAGAACAGACGGTCAGTGCGTCGCCTTAAGCGAGATCGGA
+AG
+>ds2020-267_377
+CTGGAAGTAAGGACGTTCGGGCTTACCGGATTGCCCCCATCAGCGAAGCCAAACGCTATG
+AGCAAGCATGGCTAGGCAAAATCAATGTCGTCATTAAGTTGCCAGCTATCACGTGGGGGC
+ACAGTGGTATAGTTGCTGTCTTTATCTAAGGAGCAGCACGTCCGCAACAACTGGGATTTT
+GCGGACGGCTGGAGGGCCTGCATTGCGGACGTGCTGAGTGTCAATGTGTTGCGGACGTGC
+TG
+>ds2020-267_378
+CAGCACGTCCGCAAATACAACGGATTACTGAGGTTCTTTCCAGTTCCACGCGTACTTATC
+TGAAACTATACCTATCTTCGGTGCTTTGGAGAGGGAGTACCCAAACAAAGATGAGTTAGT
+TGAGGAGATGACGGGGGGTTCTGGAGGGGTTGACTGATGAAGAAACTTTAAACTTACACC
+TACCCCGCAGATGAAAGGTTTCTTACCTCAGCGCTCAAAGGAAAATGCTTGCGGACGTGC
+TG
+>ds2020-267_379
+CAGCACGTCCGCAATCATATAGGGGTCTTTGCGGACGTGTGAGTCGGGTCAAGTTGGGAC
+GTGCTGAGGGGGTACTAGTTGCGGACGTGCTGCTCCTTAGATACGTTCGGGCTTGTGGAA
+AATCGTAGGCTAAATGATTGTTGTCGCTATTTAATAGCGGATAAAAACGCTGTCCTTCAT
+GCCCTTTTACCACCGCGGCATTGTCTTTATAGGCGGACCGTGTTCAGTAAGCCCGAACGT
+CC
+>ds2020-267_380
+GACGCACTGACCGTGGCATTTCCGATGTTGATTAAACAATCATTCCCAGATGTGAATCCG
+CTTAAAGTGGCGTTTTTAGGACCTTTGGTTGGTGCGTTATTCCGTCCGTTCGGTGGCTGG
+CTTGCTGACAAATTGGGCGGTGCAAAAGTCACCTTAATCAACTATGGCGTGATGGCTATT
+GGGACGTGCTGAGGTGGTGGATATTGCGGACGTGCTAAGTGGCTGGGCTTGCGGACGTGC
+TG
+>ds2020-267_381
+GGACGTTCGGGCTTTGATGACCTCCTCTCGTGTTACTGCCAGCTTGTCAATGTAAGCTTA
+TCAAGGTTAAAATGTTGTTTTTTAAGTTAAGCCCGCTACCTATTTGAGCCGTTTGTCAGT
+TCGTAGCCAGTTAGCGTATTACCCCACGAGATAAGCCCGAACGTCCTTATCTAAGGAGCA
+GCACGTCCGCAAAGTATATTCGCTCAGCACGTCCGCAATAGGTACAGCCTTGCGACGTGC
+TG
+>ds2020-267_382
+CAGCACGTCCGCAAGGTCTCATTCATCCGCCCTCATGATTGGGTGAGCCACGAGGGGGAG
+AGAGACAATGTGGAGGGGTCGGATGACGTGGACATGGTTGCGGCGGGGCGCTCTAACTCT
+GACTCCGAGGCAGCCGAGGAGGAATCCTCGGAGGATAGTGATGATGAGGCCACGAAAGTG
+GAGGAAAGGGGAGTGGGGGGGGCCAATCCCCCCTCCACGGTGATTTCATTGCGGACGTGC
+TG
+>ds2020-267_383
+GGAAGTAAGGACGTTCGGGCTTGTTGTCCCCTCGGACGTTCGGGCTTGATCTACGGGGGG
+ACGTTCGGGCTTGTTACGTAACCTGGACGTTCGGCTTAGAGACCACCGTAAAAGCCCGAA
+CGTCCTTACTTCCAGACTCTAAGGAGCAGCACGTCCGCAACTTCTAGGCCTTAGGGGTTG
+GGACGTGCTGAGTGTATGGTCCTTGCGGACGTGCTGAGGGTCGGCCAATTGCGGACGTGC
+TG
+>ds2020-267_384
+ATCTAAGGAGCAGCACGTCCGCAATGGCCACTCACTCGCTTGAAGATGCCGAATAACCGC
+CGGTTCTTTAGTACTTGGTTGGAATACCCAAGAGATCCCACTGGATAAGGCCTATTCCCT
+GCTCGTAAATTAACGGTTTAAGTTCATTTTTTCTTACTGTCGCAAGCCATTCTTCCACTC
+TATGATTATGATATGATTCACTTTCAAACGGAACAGGGCCTCTCATTTGCGGACGTGCTG
+A
+>ds2020-267_385
+CAGCACGTCCGCAAATCCAGGGTGGTGACTTGGCGATGGGCGGCGGCGTCTGGGAGCCTA
+AGCTTGACCTCAACCTCCATTAGAGGTTTGAGAATGTGAGACATAATACGGCGAGTTATA
+TTTTGGTGTTTGGGGTGCATAACTTTCAATTAGAAGGGACGGGCCTTTGCGGACGTGCTG
+AGCCTTAAATAATTGCGACGTGCTGAGTGCAATGAATTTGCGGACGTGCTGCTCCTTAGA
+T
+>ds2020-267_386
+CAGCACGTCCGCAAGCAGTCGCACCTTCTCCTTTGAGCACTCCACCCGCCGCCGCTCCTT
+CTCCTTTGAGCACTCCACCCGCTGCTTCACCTTCTCCTTTGAGTACCTCACCTTCTCCTT
+CGGGCACTCCACCCTCGGCTGCTCCTTCTACATCTCCGGTCGCAGACTCTCCACCTTCTC
+CCCCATCGTCTTCTCCTGAATCTCCAGCCAATTCCCCTTGCGGACGTGCTGCTCCTTAGA
+T
+>ds2020-267_387
+GCGCACTTCCGATCTATCTAAGTAGCAGCACGTCCGCAATTGAAGGGATCTCACACGTCC
+GCAAAGGTCGTTCAGTCAGACGTCCGCAATATGCCTGTCATTGGGACGTGCTGACGGGTC
+CGCCGTTGCGGACGCGCTTAAGGCGACGCACTGACCGTGTCTTTTTGGCTGACGCACTGA
+CCGTTGGTAAGTCCCTACGCACTGACCGTTGTCGACAGCCTGGTGGGACGGTCAGTGCGT
+C
+>ds2020-267_388
+CAGCACGTCCGCAATCATCCGCCCATGCACATTTAGCACTTTGGATCCTGGTGTTGAACT
+TCCGCCCCAGACGTAATGACTCCCTAGCCACTTTCAAGCTGTGTGTGCCGATAAGGACAT
+CGTCTCCGTTGTGCAGGCTGTCCCCTACTTCTCGTGCCCCTTTAGTGATCTTGTCCGTAT
+AGATGCTGTTCAATACTGAGTTGATGAAAGTGGTCACCCCCATCACCTTGCGGACGTGCT
+G
+>ds2020-267_389
+CAGCACGTCCGCACCTGGCATGAGATGGTTGGTACCTAAGAGGATGCAGGGGATTGGAGC
+AAGTGGTGCGGTTGACATGATACCAGATAAGCCAATGCTTGGAAGCGCGTGTACACTAAC
+AGAACTGCAAGAAATTGTTGACAAACTGCAAATCATCCACCCCCCACAAATCAACCACAA
+TGGAGCGGAAATGCTGGCCAATGTATTGGCTAATGATAGCGACCTACTTGCGGACGTGCT
+G
+>ds2020-267_390
+GACGCACTGACCGTAAATCAGCCCATGAACTACGGCAGTGCGTCAAGGTCAGTATTACGG
+TCAGTGCGTCACGGGGGCGCAACGGTCAGTGCGTCAGAGCGTTATACAGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAATGTTTACCACTCAGCACGTCCGCA
+ATATTTCCTCACTCAGCACGTCGCAACCCCCAAGCCTTGCGGACGTGCTGCTCCTTAGAT
+A
+>ds2020-267_391
+CAGCACGTCCGCAAATTTCTGGGGCAGCACGTCCGCAAGAAGGTTTAAACGTCCGCAAGA
+CTGTATGGTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTTCGGGCTTGTC
+CATACAGGTAGCGGAGTTGAAGAAAGGGGTCGGTTTAGGACCGGAATCAGCTTCACTTCC
+CTGGCCCGTTTCCGTACCCGTTCTCGGCGGCCGGGAGCGGGTCCAGTAAGCCCGAACGTC
+C
+>ds2020-267_392
+CAGCACGTCCGCAAGTTGTCCGGCTTAAATCTTTAGCCCCTAACTTAAGTGCCGCTACAG
+CTCCATTTTCTATTACTTTTTTTGTTCTATCACATAACCACATTCCTTCGAAGACTGATA
+GTTGTGAAATTTCATATATGTTGTCTTCATCTAAGTAATATAGAAATTTGAAACTTGGTG
+TTGCGTCCGTTAAACGTAGATCAGTGAAGTACGCACCCATTCGTAGTTGCGGACGTGCTG
+>ds2020-267_393
+CAGCACGTCCGCAAGATTTTCAGGTTAGGGTAATTGTAATCCACAATTTTGAAATATCGA
+GCAGTGGCCTCAAGTTCATTTTCTTCTGAAGCAAAGTTCTCAGCACGGCGGTATTCCAGA
+GCCATCTTGCGTAAGTCCTCCAGGTCTTCATCAACCATTATCTTCAGGTTTCGGATCCCT
+TGTTTAAAATCTGAACCACAAAGGACCCACTCTTTGAATCCCATGCGTTCAGCTATGGGA
+>ds2020-267_394
+GACGCACTGACCGTCCGCCCAAATGTACGTATTTGGCAATCACTTGCTGATGGATGGGGA
+AATTACCGAGCGTTGCCCCTGCTTTACGGTCAGCAAAATAATGTTGCAGGGAGCGTGATG
+GGCACGGTCAGTGCGGATCTAAGGAGCAGCACGTCCGCAATGCTACTTGTATATGCTTGG
+GACGTGCGAGTGTTACTCCCTTGCGGACGTGCTGACGAAACTAATGTTGCGGACGTGCTG
+>ds2020-267_395
+GACGCACTGACCGTTGGACCCCACCTAGTCCAACCGAACCGGATAAATCGGTGACACGGG
+ATGCTGAGCTATTAATGGTAGGCAAACACATCAACGCCAACGACTTGACGGTGATTGTTG
+CAGGTGATTTTAACGATGAGGCGACGGTCAGTGCGTCGCCTATCTAAGGAGCAGCACGTC
+CGCAAAGGTACCCCTCTTGGATTGCGACGTGCTGACGAACAGTATCTTGCGGACGTGCTG
+>ds2020-267_396
+CAAGCGCCTCCGCAGGCACTCTTGCAATAGGAGAATATGCTTTTCATTCACCACTCTAGT
+CGACGGAGACAACTACTATCGGATTCAGTTGAGCCAGCCTTATGAGGGCCTTAGTGCGCT
+AGGTGGTAGTTCAGCTGTAAGTGTCAACCAGTCGGAAGGAGAACTCATAGCAGGGGGGGA
+ACCAATTTCAAGGGGAGAGAAAGTGAGATAATGAAGGGACGGGGAGAAGCCCGAACGTCC
+>ds2020-267_397
+CAGCACGTCCGCAAATCATTCTCCGTTTGGGACGTGCTGAGGACGTAATATTTGCGGACG
+TGCTGAGGGATAACCGTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTTC
+GGGCTTCACTCATGCATTGTACCAATATCAACCTTAGCCATGACCCTCTCCTCAAACTCA
+TTGAGCCTTCTCTCAAACATGCCCTCAAGTCTCTCAGGGGGTTAGTAAGCCCGAACGTCC
+>ds2020-267_398
+CAGCACGTCCGCAACGGGTAACTCGTATATTCTTCTCATCAAAGCCACCAAAGACTTTCC
+TGTTGCTTTATTCTCACACGTTTCCTCAATAATTTTTTCTCTCATGATTCTCACCGCCTC
+TATAGCCCACAATCTTTGCTGTGCATCGTAAGATGAGTGGTCCAATGACACCCTCCAAGC
+TTTAACTTTGTTATGTCTCTCTCTCTCCTCTGCTATCGCGGGCCCTTTGCGGACGTGCTG
+>ds2020-267_399
+CAGCACGTCCGCAACTTTCTTCGCCTCTTTTTTCGACAACCAGTATAGAAAGTATCTCGC
+CCCTCTGTAATTCTTATCCGTCCCCAGATGCTGAATGAGCTAATCCTGATCTTTCTCTCA
+TAGGGTGAGAACAAGCTCGACCACTCTTAAGCTAGCCCGAAGCTTGATCCCGCGGCCCCG
+ATGCTACACATCAGTTCTGAACTCTACACATAAGTTCCTTGGCATTGCGGACGTGCTGC
+>ds2020-267_400
+ATCGAAGGAGCAGCACGTCCGCAATCAGGGACCTCGTTTCTGAACAACTGACCCACGGTG
+AATATCCTGTGTCCTACTCTGAGTGCTGGCAACATCAATGCCTGGCTCATCGTTATGTCG
+GTAGGCACCACCAATCCATGTTTCTCCACGTTATCGCTCATCGTCGCTTTGTGGTTCACA
+GCCCCCATGAGGTCACCTACCGGCACGTTTCTCAGCATACCAGCCTTGCGGACGTGCTG
+>ds2020-267_401
+CAGCACGTCCGCAAGTCTTCCCTAGTACAAGCAACTAAATTCAGTTAGCCCTTTTCCTTG
+GGAATGAACTGGATTTAGTTGCTTGTACTGGGGATTGGCTTAGCAGGAAGATTGGATATG
+ATTCTACTCGAGCGAACCCTGCAATGATTATAAGAGCCCAAGTGAGTCTTCCTTATTTTA
+CTGGAAGTGCTTTAATTTAAGGTGAACTATAAGACGAAGAGTTAATTGCGGACGTGCTG
+>ds2020-267_402
+TATCTAAGGAGCAGCACGTCCGCAATGGCAAAACAATCCCGAAAGAGAGCAAGATTTACC
+AACAGGTAATGTAACGTGGCAAGCATTGAGCAAAGTTGCTGGACTAAGAGAAGTAGATAA
+ACGGCGTTTTATGGGATTATTGGGAAAAGTTGTATTTGGTGAGAATGGGAAGATCACACC
+GTATTTCACATCAAACGACAAAGTTATTGAGGAAGTGGACCCATCTTGCGGACGTGCTG
+>ds2020-267_403
+CAGCACGTCCGCAATGACCCTTACCCTAAACAATCTTATCCGGTAAAGCGAATGATTAGA
+GGCTTATTGGGGACGAAACGTTCTCAACCTATTCTCAAACTTTAAATGGGTAAGACCTAG
+ACTTTCTTGATTGAAGTCTTACAGGTTTAGATGTATGTTGTACTTAGTGGGCCACTTTTG
+GTAAGCAGAACTGGCGCTGTGGAATGAACAGAGCTTGCTGACGTGCTGCTCCTTAGATA
+>ds2020-267_404
+GCACGTACGGTAACGAGGGGGGTTCGCGTCTATACGTGTAGTGTGGTGGTTGGGCCTACC
+CACCCTATTTGTTCCATGATCTATGGGTCTACTGGAGCTACCCACTTCGATCAATTAGCC
+AAAATTTTGACTGGATATGAAATCACTGGTGCTCGATCTAGTGGTATTTTTATGGGGATT
+CTATCTATCGCTGTAGGATTCCTATTCAAGATCACTGCAGATCTTTTGCGGACGTGCTG
+>ds2020-267_405
+GACGCACTGACCGTTATTTCCGACCTGCACGAATGGAGTAACGATTTCCCTACTGTCTCC
+ACCATGAACTCGGTGAAATTGCATTACGAGTAAAGATGCTCGTTACGCGCAGCAGGACGG
+AAAGACCCCGTGACCTTTACTACAGCTTGGTATTGGTGTTCGGTGTGGCTTGTGTAGGAT
+AGGTGGGAGACTGTGAAGCTCAGACGCTAGTTCGGGTGGAGTCATTGTTGAAATACCAC
+>ds2020-267_406
+GGACGTTCGGGCTTCAGTTTTTTGGTGGTGGTGATGTTTGGATCGTTGATCTTGGTGTTG
+GGTTTTTGTTTTGATCGATCTTGATTCTTGCTAGAAAGTGATCAATTTAAGGCAGAGATA
+GATCACAAAGCTTCAGAAAAAGAAAAATGCTTGGAAATGGGGTGGTGGGGATTTTTTCAG
+AGTCAGTGAACAAGTGGGAGAGAAGAGCACCTTTGACTCCATCTCACTGTGCTAGGCTG
+>ds2020-267_407
+GGACGTTCGGGCTTCAGGATATGCTTAGAGAAATGTTTATTTGCTGAGATACTGGATGCT
+TACCGAAAGAGGGGAATTGCACGTAAGAAAAGAGAGAATCTTCATAGACTGGCTTCCACC
+AATCGAAGTTTCGCGCATTTCAGATGGTGGTAAAGTGAGACACATAAAGAGCTCTTCCTC
+ATTCAGTCTGATTATTCAGTAAGAGATGGTTTGACCCTTTTTCTTTTTGCGGCGTGCTG
+>ds2020-267_408
+CAGCACGTCCGCAACCCGTTTCGCTCCAAACCCTAAAAAATAGGGTAAGGCAAGGTAAAG
+AAAGTCAAGAGCAAAGGCAAGGTCAACGGGCGTGACACAGCGGAAACACACCAGCAAAGG
+CATAAGCAACAATATTGGCACCATAACAGGCAGGAGCAATACAAGGCACTGGCACCAACA
+AGAGTAATACAAGGCACTGGCACCAGCAAGTCAAGGTAGGGAAATTGCGGACGTGCTG
+>ds2020-267_409
+CAGCACGTCCGCAAGAGTTCCGCCCTCATCATCATCATCGAAGTCCTCAAACTCCATGTC
+AAACTGCTCTGCCAAAACCCTCCACAAGTGCTTCCACTTATACAAATCCCCATTGCTGCA
+ATTGAAAGCCTCATTCTTGGCATAAGGATCAACTGCTGCCCATATCTCATGCTCAGCAAT
+CAGATCAGCATCTGAGGCATCCCAGTACCCGTACCAAAATCCCGTTGCGGACGTGCTG
+>ds2020-267_410
+CAGCACGTCCGCAAGCACAAGATCCTCGGCGCGGAATATAATCCCAAAGTACTCCAAAGA
+CTCAATTATAGTAAATCAAGAAGGTGGTAAGACCCTTGCAGAGTTCCCCAACAGCATAGA
+GCTGGGGAAGCTCGGACCCGGTCAAGATCCGAACAACAAGGAGCACTCAACTACTAGTCT
+AGTCTAGTAGTTGTTTTTTTCTATTAGTTGCGACGCGAACCCAATTGCGGACGTGCTG
+>ds2020-267_411
+CAGCACGTCCGCAAAGTGAGGCCCCTTCTGACCCCTTCTTTATTGAGCCCCAGTCACTGG
+TGGATGGTTGAAGTCAGTCCTCCCCCTACACGGGGGCGAGAGTTTGGCACCTCTCGGACT
+GTTCTAGATCTCGGCATCAGAAATCATGTCGGACGTACCATCTTCGTTCCGATCTCAGCG
+AGCAATGTTTTCGCTTGTCTGATTGAAGGAATATGACTGCTTACTTGCGGACGTGCTG
+>ds2020-267_412
+CAGCACGTCCGCAAGCGTCTTTCCCCCCCTTTTTGTCTGTATGAATTTCTGACCGCGCGG
+AATCTCCATAGCCAATTTTCCATTTTTGATTATGAAATCATAGGGTGCCTTTGGTAAAAC
+TCTTATTTCACACGATCCAGGAACTTCCATAACGTTGGCGTGATTCAGTTTGAGCAACGG
+ATCCTGACGTGATACATCTTCGTAATGAAAATAGAGTGGAATGCTTGTGGACGTGCTG
+>ds2020-267_413
+CAGCACGTCCGCAATTTCTTCCTGATTGTAAAATTGAATTAGTGAGGTCCTTTGCGTGAA
+CCACATTAATTGCATATTTGCATCCTATGATAGCCAAGGAGGTTAGAACCTCCTTGCTCA
+TAATGTGATCTACATCCCAGTATTCTTCGCAAAAGAAGAATCGGTTATGGCTAAGTCCTG
+ATTTGCTAGCTTTCACTAGCATTGCCATGCTGACCTGGGCCAGATTGCGGACGTGCTG
+>ds2020-267_414
+GGACGTTCGGGCTTAAGGCTGGTGTTAATAGCGGAACTGACGGGGCGACAATATCAGCAT
+CAGTTAAGGGACAGGCAAGTAACCAATACTACTTGAATAATGGAACTCATATCCTACCAA
+ACTATTCGTCAGCAGACTTACTAATAGATGAATGGTTATCAATTTACGATAACACAGAAT
+TAGTTATAAAAGCGATGAGGACTACTTACGGAACATGAAGATGAAAGCCCGAACGTCC
+>ds2020-267_415
+CAGCACGTCCGCAAAAGTCTTCTCATGCGGGCGAAGGAGATGCATTTCTGGTACTGGTAG
+TACTGGACAAGCTCTCAGGGAATAATCTCTTTCTTATTTCTGCCTTTCTTTCCCATGACG
+ACTAGGAACGGGCAAATCAAAAATTTCACTTTGAATTCCGGACCTCAACATCCTGCTGCT
+CATGGTGTTTCACGATCAGTATTGGAAATGAACGGAGAAGCTCTTGCGGACGTGCTG
+>ds2020-267_416
+CAGCACGTCCGCAACGTTTTAGGGGTGTAATTTGCGGACGTGCTGACGGCTTGGTCTTGC
+GGACGTGCTGACACCATTACCTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGAC
+GCACTGACCGTTGCATGAGATATAACACGGTCAGTGCGTCACGGAACGGAGTACGGTCTG
+TGCGTCAGGGATACGACCACGGTCAGTGCGTCAGCAGTATGAAACGGTCAGTGCGTC
+>ds2020-267_417
+TATCTAAGGAGCAGCACGTCCGCAACATTCATGCCCTCAGCACGTCGCAATATCGGCCCG
+GTCAGCACGTCCCAACTCTCCCACCACCACCAGTACCTTACCATGCTTCCCCACCTGATC
+ACTCTAAACATGATCTAGTGCCGCCATTACCTCCAAATCATTACTCGTATGCTTCACCAA
+CAAGAGAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAT
+>ds2020-267_418
+CAGCAGTCCGCAAGTATTACTCAGTGTACTCCATTTGGTCCTTGTCGCTGAACCTCTTTG
+ATTTAGATGGAGGGGGACTTCCTTGATAGTCATTATCATAAATACCTTCATAGTTTACCT
+CCGCTGCAACAGCATTGTAGTAGTCCTGCCTCTTGCACCGGAAAACTTCTACATACCTCC
+GCCCCATGTTCTGACGATCTCTATGAAGAGCAAACTCAACCTGTTGCGGACGTGCTG
+>ds2020-267_419
+CAGCACGTCCGCAACAGACGCAGAGTTGAAACTCTCAAATTGTTTGGTGACGATCTTCAA
+CCAACCTACGTTTATATCGACAAGTCGAAAAACTTTTTCATCGGGAATGCTGCTTCCGCG
+AAATACGAGACAAATCTTAAGACTAAATCAGATGATGGTTGGTTGTATAAAGATATAAAA
+CGTTGGGTAGGTGTGAACAAACACAACTTTACGGTGTAGCGTTTGCGGACGTGCTG
+>ds2020-267_420
+AATGATAAGGAAGTGGAAAGCACCTTTGGCAAATGGACCTTGAGCCAGGCATCTGAGACA
+GGCAATAATGATGAATGGGATGATAGTTTGCTAACTAAGGAGGAAGTGGAGGCAAGGTTG
+CAGAAGAAGGACGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAATTCCTAATCGG
+CACTAGGTCGGGATATTTGCGGACGTGCTGAGGAATCTGGCCTTGCGGACGTGCTG
+>ds2020-267_421
+GACGCACTGACCGTTTCCTAATCCCTGACGCACTGACCGTAAGGCTCCTCGTGACGCACT
+GACCGTAGAAGGCACCCTGACGCACTGACCGTAATTCACAGGTTCGGCGACGGTCAGTGC
+GTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCCAATGCCCTCGCACGTCCG
+CAAGTGACTCTCGCCACACGTCGCAACCATAAGGGGGTAACATTGCGGACGTGCTG
+>ds2020-267_422
+CAGCACGTCCGCAACACACCCATCGTGTAACGCTCTCTCTCTCCGACGCAGTCATCTTCC
+TCCCTCAGCCATCCAAGCTTAATCCCACAGTTCACATCCACGAGGTACTGTTCACGTTCC
+TTTTCTTAGAAATTTGGGGTTTTTGTGTATTTGGTTTATGGTGTATGGATTTGTATTAAA
+TTGGTTGAGGGGTTTCTTCCAAATTGGTTTAGGGTTTGCGGGTTGCGGACGTGCTG
+>ds2020-267_423
+GGACGTTCGGGCTTTTCGTCGTGCCTTTGGTATCATGCTACCGGCGTATGGCAATGAAGT
+GATTTTTATGCTCAAAGGCAGTGCGCTGGCATCGACCATCACTTTGATGGATATCACCGG
+TGAGGCAAAGACTGAAGCCCGAACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCGC
+AAAAAGGCCCCACGTTTCTTGCGGACGTGCTGGGGTATGTCCCTTGCGGACGTGCG
+>ds2020-267_424
+GGACGTTCGGGCTTGGTGTAGGCTGTGGTCGGCTTTGTTCTACTTGTCGTTGCTTTTCGA
+CTTCCAATTGTGCATGTTGCTCTGCAAAGCTTTTTCCGCTTTCCATTGCTCGTACTTACT
+CATGGCGGAACCCCTACTAGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCA
+CGTCCGCAATTCATTGAAGATTGGGACGTGAGTACGTACACTTTGCGGACGTGCTG
+>ds2020-267_425
+CAGCACGTCCGCAAGTGTGTCGAACTCCCCCTCCCCCCCGCCAATAAGTCTGTCTTACAT
+TTGTGCAGTAAATCATGCTCAAACGCCTTCAATGGCTTAGTGTAGGTCTCTTATGTACAA
+TTTAAAATCCTCAATAAATGTGCCTAACTGAAAGTTTTAGCTCTGTGCCTCCTCTCTCAT
+ATAATCTCTTATTTGATTACTGATGCTTAACCTGACGAGATTTGCGGACGTGCTG
+>ds2020-267_426
+CAGCACGTCCGCAAACAGCACCGCTCAGCACGTCCGCAAAATCCTCCGCTCAGCACGTCC
+CAATGCGATAAGGCTTGCGGACGTGCGCTTTAGGCGACGCACTGACCGTAATCCCTCCTT
+TCGAAAATCCTGCTTAGCCGGAGCTCTCACTGAGAAGGCTGGCCTATAGGAGACTGCATT
+ATTGGCAGATACTCTGAACTCCATTTCTTTACGAGGCTTCCTAACCCTAACGCTG
+>ds2020-267_427
+GGACGTTCGGGCTTCTTTAGCTTCATACCTATCCTCAGAATCAGAACTCTTTTCTCTCTC
+AGAGCGCCGACTATCACGGTCTCTCTTATCTTTATCTTTATCTTTATCCCTGTGTCTCTC
+TCCATTCCTCTCTTTTTCACGTTGCCGATCTCGATGACTCCTCTTGGATTCCCCCTCCTT
+CCTGGATTTATGCTTGCCCTCTTCCATTTCTTTCTTCCTGATACACGACGTGCTG
+>ds2020-267_428
+CGAAAAAACCAAATTCAGCTCTACGTAAGATGGCCAAAGTACGTTTGAGCAATCAACATG
+ATACATTTGCTTACATTCCAGGCGAAGGTCATAATTTGCAGGAACATTCTATGGTGTTAA
+TAAGAGGAGGTAGAGTGAAAGATTTGCCAGGTGTGAAATTCCATTGTATTCGAGGAGTCA
+AGGATTTGCTGGGAATTCCGGATCGAAGAAGAGGGGCTACAACGGTCAGTGCGTC
+>ds2020-267_429
+GGACGTTCGGGCGTCTATTTACGGATGGCAGCCCAAGGCGCAATCTTTCAGGATCATGCA
+CGTCCGATGTTTCCGCCATGGCCCGGGACCCGATGAAGAAAGCCCGAACGTCCTTACTTC
+CAGTAGGAGCAGCACGTCCGCAAATGTACTCCGCTCAGCACGTCCGCAACGTGTCACCAC
+TCAGCACGTCCCAAGTGTCCACTGGCTATAGATTGCGGACGTGCTGCTCCTAGAT
+>ds2020-267_430
+CAGCACGTCCGCAAACGCTCACGCTTCAGCACGTCGCAATGTTCGTCCGGTCAGCACGTC
+CACAAACCCTGAATTGCGGACGTGGCGCTTAAGGCGACGCACTGACCGTGCAGCCCCTGT
+TATATTGTCGGTGCAGGGCTACTTGACCAGTGAGCTATTACGCTTTCTTTAAAGGATTGC
+TGCTTCTAAGCAAACCTCCTGGCTGTCAGTGCTTCCCCACTTCCTTTTCCACTTA
+>ds2020-267_431
+GGACGTTCGGGCTTTCACTCCCAGATATAAGCCCGAACTCCAGGATGCCAGGCAAGCCCG
+AACGTCCAGACAGAAGAATAAGCCCGAAACGTCCACCGGAACGCACAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAAGTCACCCATCGTGCGGAGAGTGAAT
+TATAATTGCGGACGTGCTGAGGGCGGTTTTTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_432
+CAGCACGTCCGCAACCTGCTTTCCCTCCGAATAAGCAAAATAAGTTTATACACCTAATTT
+TGTTCCTGCCGATTGAATAAGAATCAAATACAATCAAGTGGAATAAAATTCTAATGAAAT
+ACAAAAATTTTTAAAATTAAATTAACTAAAGAGAGAAGGTAGGAAGGGGGCAAATACGGT
+CAGTGCGTCGCCTTAAGCCCGAACGTCCAGCCCGCATGTCAAGCCCGAACGGCC
+>ds2020-267_433
+TATCTAAGGAGCAGCACGTCCGCAAACGCATGCACATTGGACAGCGATTGGTTGGGTTGC
+CCAAGGTACGGCTTTAATTGTGTGGGGAGTAACTGAGCGCTACCGTTTAAGCCGATATAT
+TGGTGTGGTTTTAGTTTTACTTAGTTCTATTGCGCTGTTTTATCAGGTGTGGGTAAACGA
+AGAGTTCCCAACGCTAAGCACAAGCATCACAGCCAAACGATTGCGGACGTGCTG
+>ds2020-267_434
+CTATCTAAGGAGCAGCACGTCCGCAACAATAATTCCTTATTGAAAAATTCGCTCACAGGG
+CTTCTGCAACTGGGTAATGCATGCTTGTGAGCGAATTTTTCAATAAGGAGCTCCCACAAT
+AAGAATGTGGGTCTGGGCTGCCAACCACAAGGTCACCAAAATCATTGTTTGTGTCAACCA
+ATGTTTCACGGGAATCCAGATATCTGTGAGACCAATTCGAAAGCCCGAACGTCC
+>ds2020-267_435
+CAGCACGTCCGCAATTTTGCAGCCATGTACGCCCTGGCCATGGCTGGTCTGTTCACGGTT
+TTGAGGTGTTCCGTTGCCTGCTCTTCAGCGGCCAATATCTCCTTGTATGACTTAGGCGGC
+TCACCGATGGCAAGCGTCGTTCCCAGCGCCTTTGCCATAAGGTTAGACAAATCCCCCGTC
+CTCACGATTTGAGACCCCCTGGCGGCGCCCACCCATGATGTTGCGGACGTGCTG
+>ds2020-267_436
+GACGCACTGACCGTACCTGTAACCATCAATACTTTTTCTTGCAGTAATAATTCCATCATA
+AACTGCATATCATCTTCGATTGGATAAATGTCACGGTCAATTTTTGGGAAACAATAAAAC
+GCCCCTTGTGGCATGGTGCACGAGATACCTTTAATGGCGTTTAGACGCTCGATAGCGATG
+TTGCGCTGCTGATACAGGAGCCAATACGGAACGGTCAGTGCGTCGCCTTAAGCG
+>ds2020-267_437
+GACGCACTGACCGTCGGACATTCCTTGACGCACTGACCGTTCCTGCGCTGGGACGCACTG
+ACCGTTATACCCCAAATCAACGCACTCTCGTACGAAGGCTAGCGATACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTACCAGGCTGTTGCGGACGTGGAG
+TAAGAGACATTGCGGACGTGCTGACCCCACCCCATTAAAATTGCGGACGTGCTG
+>ds2020-267_438
+CAGCACGTCCGCAACTGGCACCTTTTTCGGATGAAGACGAAGACTGTATTTCCGAAATCT
+GTCAAACACTTTCTTCAAATTCACCGTCTTCTTAAGCCCAAGACTTGGCGATCATGTCAT
+CGACATAGACCTCCATTTCCTTGTGAATCATATCATGAAACAGCGCAGTCATGGCTCGCT
+GGTACGGCGCCCCGTCATTCTTTAGACCAAACGGCAACACTGGCGGACGTGCTG
+>ds2020-267_439
+GACGCACAGACCGTCGATATGGCTCTAGCATAGGCAGTGCGTCCCGGGCACCTCACGGTC
+AGTGCGTCAGGAACATAATAACGGTCAGTGCGTCAGGGCATACTCTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGGACTATCTCTCAGCACGTCCGCA
+ACTTCTTTGTCGTCAGCACGTCCCAATAACTGGTGGATGCTTGCGGACGTGCTG
+>ds2020-267_440
+TCAGCACGTCCGCAAGCTAACCTTTGTAATTATTGTAATTTTTCTTTACTCTCTTTTCAT
+TTCAAATTTATTCAATTTTCTTTGAGCTTTCTCTCTCTAGCTCTTCCAATTTCGACGTTC
+TCTTTGTTTGAACACCTCCTTCTTTTCTTCCACCGACTTCCGTCATTTCCCGCGTCCCAG
+TTTTCTTCACTGATAATTCTTCCTCCTCCTCGTCGGATCCACGGTCAGTGCGTC
+>ds2020-267_441
+CAGCACGTCCGCAAGTTGAGTTCAGTGGTGTAAACGAGTTGTCCAGTGTGGTAACGGTAA
+GGGAGTACAGTAATGCCAGGTTGTGGAAATCTGTTGTTTGGAAGTTCGTTGTCGTCTAAG
+TGACGATAAAATTCGAAGGGTTCGTTACGGTCAATGTTCGCTTGAGTGTAGCGTTCATAT
+GTTTGAGAGAAGGTGTGTTCGTATTCTGATGTGCGATGACTTGCGGACGTTCTG
+>ds2020-267_442
+CAGCACGTCCGCAAACCACGCCTTTTATGAGCAGCTAAGTCAGCTGCAGATTTTGCAACA
+ACAGATTGCATCTTTGACCACTAGCACCACCAACTAAAAATTGCCCAGCAAACGCTACAA
+GCCGATATTCAGCAGCGTTTTGCGACATTGGGTTTTGTGGATGACGCCGATAATCGCGCT
+GCGGTGTTGGTTGATACCGAGCGAGAAAGGGTTGAACTATTGCGGACGTGCTG
+>ds2020-267_443
+AAGCAGGTATACGGGTCAGACGTTTAGATGCAGGGTAGCCCTCTTCTACTATCCTGGTTG
+CCTTGACTTCCTGAACTTCAGCCAGATGTCCAAATTCAAAGGCTAACCAACACGAATCAT
+TTGCGACGGTAGGCACTTCTTTTCCGAAAGGCACAGAACACATTGCAGCCCTACCTATTG
+GGGGGGGGAGGGCACGGTCAGTGCGTCGCCTAAGCGCTCTTGCGGACGTGCTG
+>ds2020-267_444
+CAGCACGTCCGCAATGTGGCAACCGTGTACGACGTTTCCGATGACACCCTGTCTATCAAG
+TGCCCCAGTATCAGCATATTATTGGCGTTTGTGTTGATAAGGGACGTGTAATAGGAACCA
+CTCGGCATCGTCCCAAAAAGGTTGACAAGGTACCCCGAAGGATGCTCAAGAAGCTTCTTG
+AGAAGCTGGCGCTTTGACACAGATGACATAGCCTAACGTTTGCGGACGTGCTG
+>ds2020-267_445
+CAGCACGTCCGCAAAGGGCCGGGGATTGCGGACGGCTGAGTAGAGGGTAGTTGTTATTTT
+TGCATGCAAGCTACTGACGTCTTTTTTTTTGAGTGTTCGATGGCTTTGGAGAAAGGTTTT
+TAGGATTAGTGCATCAGGGGAAGATGATGCATCTGATGAGCATAAAGGTATGGAGGTTGC
+GGACGTGGAGGTGTAGCTTCTTGCGGACGTGCTGAGGTCAGTCGGGTTGCGGA
+>ds2020-267_446
+GGACGTTCGGGCTTTTGAGTTTCCCTGGACTTCGGGCTTGTTTCTGCGGCTGGACTTCGG
+GCTTTGTCTCTGGGGGGACGTTCGGGCTTATCTACACCCTGGAAGTAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAACCGGCAAAACCTCAGCACGTCCGCA
+AGACGAACTACTCAGCCGTCCGCAAAGACCCCATCATTGCGGACGTGCTGCTC
+>ds2020-267_447
+GACGCACTGACCGTCGACGAGCCGATAGTACGGTCAGTGCGTCAGTTCTGTTCAGACGGT
+CAGTGCGTCAAGGTAGGGGCAACGGTCAGTGCGTCAGCGGAACTCGAACGGTCAGTGCGT
+CGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTTATATACGGTCAGCACGTCCGC
+AATGCGGTCTCCCTCAGCATGTCCCAAACCCAGTGCGTGTTGCGGACGTGCTG
+>ds2020-267_448
+GACGCACTGACCGTAGCTGCCTGCTTCTTGACTTACATTCTTGGCCCCTTCCCTGGCGAC
+CACTACCATTATGCGATATAAAGTGAAATCCAACCTAAATTCCCAAACAACTTGAGGTTG
+CTGACTCATCATGTGGGTCAAAAACTGAACTAATTCCACATTTCCAGTGCAGTGAACTCC
+ACTTAATATAACCATTTTAGTGATTTAAGGTAAGTGTTTACGGTCAGTGCGTC
+>ds2020-267_449
+GACGCACTGACCGTTCTCTTCAGGATGACGCACTGACCGTTGCCCTTTCGATGACGCACT
+GACCGTCCTGAGACAGTTGACGCACTGACCGTTCCATTATCGCTGACGCACTGCACGTCT
+GACGGTCAGTGTATCTAAGGAGCAGCACGTCCGCAATAGAGTCCCCCTCAGCACGTCCGC
+AATAACTAGACGCTCCACGTCCCACGACCCTGGCTTATGTTGCGGACGTGCTG
+>ds2020-267_450
+CAGAACGTCAGCAATCGGCGTACCCTAGCGCGTCCGCAAGGAACAATCCTTCAGCACGTC
+CCAACTATCGTGCAGCACGTCCGCAAGAGTCGTACCCCAGCACGTCCGCAAGTAACAATC
+CTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGCGCCGTACCCCAGCACGTCCG
+CAAGTAACAATCCTTCAGCACGTCCCAACTATCGGGGCATTGCGGACGTGCTG
+>ds2020-267_451
+CAGCACGTCCGCAAACCCAAAGCTCTCACTGCATCTTCCATCTCCTTCCTCCTCCCCTGC
+ACCGAAACGACGCCGTACGTACCCCTTCCCAACATTTCCAAACTCTCACGACCACTCGTT
+TTCCGTCTCTCGTCTGATCCGGAACCGGAACTACTCGACAATACGATGTCGTTTTCTGTA
+GACGAAAATGACACAGATAAAACCTTAGCCGGAACACATTGCGGACGTGCTG
+>ds2020-267_452
+CAGCACGTCCGCAAAGCTCCGTTGGTTAGAGCACTGCCTTGATAAGGCAGGGGTCATAAG
+TTCAAGTCTTATTAGACTCACCATTAGATGAGCTTAGTAAGCGCAAGCGAACTTAGCGAA
+ACTTATGTACCGCTACTTAATTACTGTAGCTGGTTAAAGTCTTATGTATCTTTACTCAAT
+TAAGTAACGACTCAATTAAGTAGCGGAGTGCGACATGATTGCGGACGTGCTG
+>ds2020-267_453
+TTGACAGAGACGGCACTCACAGGAATTAGTCTAGCAGCATGGTAGAAAGTCTTAGCCCAC
+AATTGCTTAAGTGGGGCAAAGCCCCCTATGTCTGAAATGAAATGGGAGCGCTTATACTTC
+TGCCATGTGCGGACGGGATTAGTCATGAAAGCACCAAGCCCGTATTTCTTTTCCCATTTT
+CCTATGATGTAGTTGAACGGGACCAGATTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_454
+CAGCACGTCCGCCACTGATCCGCCATTGTGAGCGGGCTGGCCGACGCGCGACCAACTCCC
+ATCCTATTGAAGCTGCTGATGTCTGTACAGCGGTAAGTGGGGGTGTCTGAATGCGGTACT
+CGGAAGTGAAATTGCACAGGTGCCAGCGAGGTACATAGCGTCACAGCTGCTAACGTTGCA
+TCAGGATTACAAGCAAGCGGTGCCGGAGGAAAAACGGATTGCGGACGTGCTG
+>ds2020-267_455
+CAGCACGTCCGCAACCTCACGCCTCTCAGCACGTCCGCAACCTCCTCTTCCCCCCTGAGT
+GGGAGGGCTGTAAACTCCTCTTTGTCCTTACCGACAAGTCCCTTGTCAACGCATTCCACT
+TCCCCCTGATTCCCACTCAGCAGAACTCCATGCTACACAACGCTGCGGCTGAGGCTCTCA
+TGCATCTCAAGTGCACCATCCACCTCAGCCCCATCATCAAGCCCGAACGTCC
+>ds2020-267_456
+GGACGTTCGGGCTTTGCGTGAGGGGTGTTGTGGGGCCATGTTGGACTCTTCTGCCGGAGG
+GTCGCGCCGCATGATGCTGGGAGTTGAACAGTCTGGGAAGTCTGGTGTAGAAGCCCGAAC
+GTCCTTACTTCCTATCTAAGGAGCAGCACGTCCGCAAAATGACAAGGTGGTTGCGGACGT
+GGCCCAAGTGGAATTGCAACGTGCTGACGGGCTGGGGTTTGCGGACGTGCTG
+>ds2020-267_457
+CAGCACGTCCGCAAGGCCTTTGGGGTGTATGACGGGCACGGTGGGGCTGAGGTGGCGAGG
+GCTTGCAGAGATAGGATGCATGAGTTGGTGGCGGAGGCAGTGGAACTGGAAAGGATTAAT
+AATAGTAATAATAAGAAGAAGAAAGATCCGGTGGATTGGGATTGGGAGAGGGTGATGGAG
+GGGTGTTTTGGTAAAATGGATGAGGAGGTGAGCGGGATTGCGGACGTGCTG
+>ds2020-267_458
+CAGCACGTCCGCAATTCATAGCCCCTCACTATAGAAGCTCCCATTGGAACTATGAGTACC
+CCAAATGAATGGGTGGCACATAATAGACCCAACTTCAATCGGTTACGTTGTTCATCACGA
+ATCTCTCACGTCAGCAAACATGTAAAGAGAGAGATAGAGACAATGTTTTATACAACACAT
+TGCCCGGGAGTTCCTTCCAGATGAAGACTACGAAGAGGTTGCGGACGGCTG
+>ds2020-267_459
+GACGCACTGACCGTATTAATGCATGTTGTAACGGTCAGTGCGTCAGCGCGTCGGGAACGG
+TCAGTGCGTCAGCAAGAGTTATACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAGC
+ACGTCCGCAAAGACCACGGGGTCAGCACGTCCGCAAGTGAGGCCTACTCAGCACGTCCCA
+ACTTACATTCCCTCAGCACTCCGCAAAAGGGTTCAAGTTGCGGACGTGCTG
+>ds2020-267_460
+CAGCACGTCCGCAATGGTATTAGTCTGAGAGGAGCAGAGGTAAGCACGTTAGAGCGTTCT
+TTTTTCACCTTTGTTTCTCATATAGAAGTCAAACTGAATGCATCTAATTTTGCTTCTCAG
+GCAAAAATCTATGGCGCACTACAACAGTCGTCAATTCGGATGGTCGCGCGTGATGTTGCA
+ACGTGGCAGGACTTTGATGCCTGCTCTGCTTTGGGATTTGCGGACGTGCTG
+>ds2020-267_461
+CAGCACGTCCGCAAACACTTCTGGGCGCCGTCGCAAAATGGTCGTGATATTGGGACGTGC
+TGAGGAGCGAGCCATTGCGGACGTGCTGCTCCACGCTTAAGGCGACGCACTGACCGTCGG
+TATACCCTTGACGCACTGACCGTCCTCACACATCTGACGCACTGACCGTCGTAGCAAGGA
+TTTTACGGTCAGTGCGTCACGCGACCTGCTACGGTCAGTGCGTCGCCTTAA
+>ds2020-267_462
+GACGCACTGACCGTAGTCTGAACACTGACGCACTGACCGTGATTGCGGGGTTAGAACGGT
+CAGGCGTCAGGGTAACGTTAACGGTCAGTGCGTCAAGGCATAGATTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCACAGGCCGGTCAGCACGTCCGCA
+ACGGCACTTTCCTCAGCACGTCCCAAGACCTAATCATTTGCGGACGTGCTG
+>ds2020-267_463
+CAGCACGTCCGCAACCCAGCCTTCCTCATTCACCACCACCACCGCCACATTCACCACCAC
+CACCAATTTATCCGTATCCATCACCTCCACCTCCCGTCCATTCCCCACCTCCCCCAGTGT
+ACCAGTCCCCTCCACCACCACCACCACTTTGTATGGAGCCACCCCCTCCACCTTCGCCAC
+CACCACCAGGTATTGAGTACTCACCGCCACCTACTCCTTGCGGACGTGCTG
+>ds2020-267_464
+CAGCACGTCCGCAAGCCGATACTTTTATAGCACCTTTAGCTGACTGGCTGTCACACTTTT
+TGCCACTCGGCCAATCGTTAGACCTTGAATTAAAATGGAAAATACCACAATCGCATAAGT
+CAACGTTAATAACAAATCTCGCTCGGCCCCGGCAGGTAATTGTAATACTAATGCCACTGA
+AATACCGCCTCGCAGTCCACCCACCAATCATGCTTTGCGGCCGTGCTGCTC
+>ds2020-267_465
+CAGCACGTCCGCAACTTGTCCCCTGTGCGCTTACCCAGGATCGTAGGTATACCCTCTGGT
+GTGGTGGACACGAGTGGGTCGTCTACTGGACAACCGCATAGGAAGTTCAGGATAGACAAC
+CTAATCGCTTTTGCATGGGCAATGCAAAACTTTAGGCCCCTTTTGTTATTAACTGATTCC
+AAGTAATCAGTTAGATCATCCAATACACGTGCTTTATTGCGGACGTGCTG
+>ds2020-267_466
+CAGCACGTCCGCAAAATATGCGCGGTGGAGATAAGAAATGATGATTAGAGTATTGGTCGT
+TGACGATCATGATTTAGTCCGAATGGGCATCGTACGGATGCTGTCAGATAGCCCTGACAT
+CGATATGATTGGTGAAGCTACTGATGGTGAAACCGCGATTATCAAAACCAAACAATTAAA
+CCCTGATGTGGTGTTACTTGATGTACGGAATGTACATTGCGGACGTGCTG
+>ds2020-267_467
+TTAGATTCGCTTAAGGCGACGCACTGACCGTTGTTATGCTGGTATACTATGTGTATATGT
+TTAATAGAACTACTTCTAACAACCTATGCATTCGGTTATCGTTTCCAATTGGATGATCCA
+TTAATGCAACTGACAGAGGATTATAAATGGATCAATTTTTTTGATTTTTACTGGAGATTG
+GGAATAGATGGAATTTCTATAGGAAGCCCTCAGCTTACGGTCAGTGCGTC
+>ds2020-267_468
+TAGCACGTCCGCAACATGCCGCCCATGATAAAGCACTGATACTAACCACCGCGGATGCAT
+TGGTGGTCTTCTTTGAAGTCTGGTGGTGTTGATGTCGTGGGGCCTGATGTGTGGTTCAAG
+TGATGGGGTGACGCAGTGAGGTAGCCGCGCCACTTAGTGGATTGGTGGTGTAAGCGTGTA
+GGCCGTGTGGTAGGTAAATCCGCCGCACTTTATGGTTGTGGCGTGGTGCG
+>ds2020-267_469
+CAGCACGTACGCAAGAAGCATGGGGTATTGAAACTTGGCAGGGGGGTGTGGAGCTTGAAG
+AAGTGATGCGGCCGGTACCTAAGGATGCGGCGGCTGGGTTACGTGGTTAGGAGGATGGGC
+CGGGCTGCGTTCGAGCTTGGTTTGAGAAGTGCGACTGGATTATGCCCGACCGGGTTTTTC
+AAATATAGCTTGGGCACGGCCAGGATACGGAGGTTTTTGCGGACGTGCTG
+>ds2020-267_470
+GGACGTTCGGGCTTCACTCCAATCCTAGCTTCACAACCACCACCACCCACAAGCCCTCCC
+ACTCCCTCTCTACCCCCACTTTTCTCAAATTCCCAACCGAATCCCCAAATCCAAGCCCGA
+ACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAATACACATGGGGTGCCCCGC
+AAAACCACATCGCTCACACGTCCGAAATGTATTCACTTGCGGACGTGCTG
+>ds2020-267_471
+GGACGTTCGGGCTTAGCGCACACCCTCTCAATCAGATTCCAGAAGATTCTTTGAGCTCTG
+ACTGCAGGAGTGCCTATGATCTGCTCGCCATTCTTTGCTGACCAGAGAACCAATTGTTAT
+TATACTTGCAATGAATGGGGCAGTGGCATGGAGATTGATAACACTTTCGGACGGGCTGAC
+AGTATGCAAAGTGCGGAAGTGCTGACAGCATAGTTATTGCGGACGTGCTG
+>ds2020-267_472
+CAGCACATACGCAATTGTCATCCCCTCAACACGTCCGCAACCTATACCCCCTTGACTTTG
+CGGACGTGCGCTTAGGCGACGCACTGACCGTGTATACCCCCCTCTGACACACTCTAGCCT
+TGCAGTCTCCAATGCAGTTCCCAGGTTGAGCCCGGGGATTTCACATCAGACTTACAAAAC
+CGCCTGCGCACGCTTTACGCCCAGTAATTCCGATTAACGCTTGCACCCT
+>ds2020-267_473
+CAGCACGTCCGAAAGTTATTCTTTATTGCGAAGTTCCAGTCTGTTAGCCTCAATCGTGAG
+TTCCTCCTCATCTCTGGGGAATCCGATCTCGATCTTGACGTTTCCCTCAGACTTGTTTCT
+GAAGTGGGGCATTTCAACGTGAGCGTCTTTGTAGCACCCAGATTTGAAGACCATAAAATC
+ATCTTCACCTTTGGTTGCCACATAGATCACTGACTTTGCGGACGTGCTG
+>ds2020-267_474
+CAGCACGTCCGCAACCGGTCTCGGCTGCTTACAGATAAATTATTGGCTTAGCATGAGAAG
+CTTGTGGCATGGGAGCAAAATCGACATGAGTTTAGCACCGAAGAGAAAATTGAGTGTTCT
+TGGGAGAAAAAGGGGTATTAAGGTAGGAGATGGAGAGTTTGCAAAGAGGTTTGGCTGAGA
+AAGGAGGGAAGGAAAGGAAAAGATGGCTTGGGCGATTGCGGACGTGCTG
+>ds2020-267_475
+CAGCACGTCCGCAATTCTGGGTCCTTGTACTGTAGCTTGACTTAAGCAAGCTATTTACTT
+AAAAAAAAACCGTCTTGATCTACGGCCATAACATCTAAAATCTTTTGTAATCGAGACCGA
+TACCGATACGCGCGAACTGGTTCTCGCCGTTCGGAAGGCATCGGTGGAGTCTATTCATTA
+CTTGTTTAAGCACCTCAATAACGACTAGGGCGGATTTGCGGACGTGCTG
+>ds2020-267_476
+CAGCACGTCCGCAATCTATAGGCCCTATACCCAAGTCAGACGAACGATTTGCACGTCAGT
+ATCGCTGCGGGCCTCCACCAGAGTTTCCTCTGGCTTCGCCCCGCTCAGGCATAGTTCACC
+ATCTTTCGGGTCCCGACAGGCATGCTCTCACTCGAACCCTTCTCAGAAGATCAAGGTCGG
+TCGGCGGTGCAACCCTCAAGAGGCATCATTAGTTGCGGACGTGCTGCTC
+>ds2020-267_477
+CAGCACGTCCGCAAACCAATATCGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGC
+CAAGGCAGGCAGATCACTTGAGGTAAGATGTTCGAGACCAGTCTGACCAACATAGAGAAA
+CCCCATCTCTACTAAAAACACAAAAAGCTTGGCATAGTGGCTCGCGCCTGTAATCCCAGT
+TACTCTGGAGGCTGATGCAGGAGAAGCCTATAGAATTGCGGACGTGCTG
+>ds2020-267_478
+CCGCAAGGTAATAAGTCTCAGCACGTCCGCAAAACCCCGGGCCTCAGCACGTCCGCAAAC
+CGTAATCCCCCACTCGAACGTATACCCATTAAGCCTTGCTCTACTCCTCTCCTTCCTCAC
+TTGTTCTCACATCAATCTCCAACCTTTTTATTGGATTTTCATCCTCTTTCACCTCCTTGC
+TCCTCATCCCCCAGATCCCCCCACTCCACCCAACAAGCCCGAACGTCCT
+>ds2020-267_479
+GGACGTTCGGGCTTGGAGCTTCCCATGGACTTCGGGCTTTGCCAAACCCCTGGCGTTCGG
+GCTTCAATTATAGCCTGGACTTCGGGCTTAGCTCACCGCTTTTAAAAAGCCCGAACGTCC
+TTACTTCCAGATCCGCAACCGTGTTAGGGTGGAGCAATTGCGGACATGCTGCCCCTAGTT
+TGCGGACGTGCTGAGGGATGTTATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_480
+GACGCACTGACCGTAGGTTCCCGACTGACGCACTGACCGTAGTTAATTCCCTGACGCACT
+GACCGTCTTCAGCGCCCCACACGTCCGCAATCTTTGGTCGGTGGCGTCTTGACCTAACTC
+GCATTGGTTACGGTTCAAAATCTGGTCTTCAATGGCGTTTCTAACGTATGGGTCGATATC
+GTAATACAACTCTAGCATGGCGGGGAGGATACCACTTGCGGACGTGCTG
+>ds2020-267_481
+CAGCACGTCCGCAATCGTACTTTCGTTCTTGATTAATGAAAACATCCTTGGCAAATGCTT
+TCGCTTAAGTTAGTCTTACGAGGGTCTACGAATTTCACCTCTCGCCTCGTAATACTAATG
+CCCCCAACTGCTTCTATTAATCATTACCTCTTGGTCTAAAAACCAATGAAAGTAGAACAG
+AGGTCCTGATTACTAGCAAGCTATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_482
+CAGCACGTCCGCAACGCACTCGGGTTCACTTCTTTACGGGTCGGTTACCTGCGAAGCGGA
+GGTTGCCAAACACCTACACCAGAGGGGGCAAGTAGCCACCGATGATTACGGGACTCTTGG
+CCCTGACCAGGCCCTGTTGCTTGCGAATGTATACAGGGTTTTCGGACACACGCTGGAGCT
+GCAACACTTTAAGACTCAGGAGAGATACGGACCTTTGCGGACGTGCTG
+>ds2020-267_483
+TAAGGACGTTCGGGCTTAGAGATGCGGGTGCTGATTCTGATAATTGGGGGAGGAAGAAGG
+AGGAGAGTAATGGTGGGTCTGGTTTTGATCGAGAAAGAAGAGTTGGGTTCGTGTCCAATG
+GTGGTGGTGCGGATTCTGAGGTTTGGGGGAAGAAGAAGGAGGAGAGTAATGGTGGTCCTC
+GGGGTTGTTTGCGGACGTGCTGAGGCGACTATAGTTGCGGACGTGCTG
+>ds2020-267_484
+CAGCACGTCCGCAAGCTTCCTCTAATAAAGCGGGAAATACCTCTTGGTGCTCATATGGCA
+GTGTTACATCTTTCATTGCATCTTTGTAGTTTTTCATGTGTTATGTCTTCTAACTATGTT
+ATCATGTTGAATATAGGGTTGGGATCCCTCCATTATGGATTCTGACATTTGCTATTTCTT
+ACAGGATTCTCCAATTCTTGGGATGCCAACAATTTTGCGGACGTGCTG
+>ds2020-267_485
+AGACGTTCGGGCTTTTTAGATCCCTTGGACTTCGGGCTTTTTCCCGTCCCTGGAGTTCGG
+GCTTAACTCAGGGGTTAAGCAAGCCCGAACGTCCTTACTTCCAGAAGCACGTCCGCAAGT
+AACAGAGGTTGGGACGTGCTGAGGTGAGCCCAATTGCGACGTGCTGAGAGATTTAGGGTT
+GCGGACGTGCGAGTGCATTTATTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_486
+CAGCACGTCCGCAATCGGAACCGGTTCGGAAGAATTCACAGGTAAGGGGCCCAGGTGTGA
+AGCCGTTGAAGCAACCGAAACCCAAGGCTAAGGACCCAAATAAGAGGGAGATGAGTATGG
+AGGAGAAGCACAAGTTGGGAGTTGGGTTGCAGAGTTTGCCGAAGGACAAGATGGAGCAGG
+TGGTGTAGATGATAAAGAAGAGGGGCGGAGTGCGGACGTGCTCTCCTT
+>ds2020-267_487
+GGACGTTCGGGCTTCTAAGGGAGTGTAGGTGGCTCATTAAGTCACATGTGAAATCCCCGG
+GCTTAACCTGGGAACTGCATGTGATACTGGAGAGATACAGCCAAGCCCGAACGTCCTTAC
+TTCCAGAGCAGCACGTCCGCAATCAGCCCGCCCTCAGCACGTCCGCAAGCCGTATTTCCT
+CAGCACGTCCACAATCCCCGCATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_488
+GGACGTTCGGGCTTCCATGCTGCAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTG
+AGCGAATCTCGGAAAGCCAGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAG
+TCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGCCTTGT
+ACACACCGCCCGTCAAGTCATGAAAATAGGTAACAAGCCCGAACGTCC
+>ds2020-267_489
+GGACGTTCGGGCTTGAATTCGGCAGTGGACGTTCGGGCTTTTACATTACGTGGCGTTCGG
+GCTTAGAACCCTGGCTGGACGTTCGGCTTTCATTACCGGGTTATATAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAATATTTCACAGCTCCCGTCCGCAATG
+CGCAGTTGCTTGGGACGTGCTGAGAAGAGTCCAGTTGCGGACGTGCTG
+>ds2020-267_490
+GGACGTTCGGGCTTTACCCCCCCACTCAATAATCCTACCGATATGTGTAAACAAATAATT
+CACAGCCTTATCTTGCGCGCAATTAAAGAGCATAGGGAAAGCATTTCGCTTACTGGAAGG
+GTCCTGCTCGGAGGCCAAGAACCGATCGATGATCTCCGGCGCGCTATCCAGCAATGTCTC
+CCCCGTGGTTTGCGGACGTGCTGAGGGAACAGCCTTTGCGACGTGCTG
+>ds2020-267_491
+GGACGTTCGGGCTTTCTGCCGCCCCTAAGGATCATATAAGAAACCATCTAGAATATGAAT
+CTTGAGAGTACACACGATGCTTGTAATGACCTAGCCATTCTACAATTAAAAGTTCGACTA
+GAACTGTAACCAAGGCACAGCTCGAAGCCCGAACGTCCTTATCTAAGGAGCACCACGTCC
+GCAAGACGTCTCACTTCCACGCAACTTAACTGCATTGCGGACGTGCTG
+>ds2020-267_492
+CAGCACGTCCGCAAAGTGTCTGGGATAGTCTTTGACTGTGATACAGGCATACCAACGGTT
+ACGGCTGTCTTGCACCAACTCGCAAGTGTTGATTTGATATAGGCTAAGGTTGTAGCTGTA
+CCATAGGTCAATGATTAGTTTCTGCCCTTTGGCTAAAGATAGTTGTAAGGTGGATTTTAA
+GCCCTTTTTGCCTGTTTGGTGAGGGATACCGCATTGCGGACGTGCTG
+>ds2020-267_493
+CAGTACGTCCGCAAGTGTCGGGTCTTGTTTTCTTTTGGGTTTGAGGTTGTGGAGGGAGTG
+AAAGGGGTGGTTGATGAAGATGAGGAAGGGGTGTGTTTGGGGATTTGGAGAAGAGAGAGG
+GCTTGGAGAGTGCAAGTGAGTGTGTTTGGGATTGATCTTCTGTGAATGGGTTTTCTGCTG
+AAGAAAATTGAGGTGGAGGAGGAAGAGGGGGGGTTGCGGACGTGCTG
+>ds2020-267_494
+GGACGTTCGGGCTTGACACCATTCCTGGACGTTCGGGCTTGGACGCGGGACTATAAGCCC
+AAGTCCAGATACGAATCGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAAGTTAC
+CGGGGTATGTTGCGACGTGGGGGAGAGGGAGATTGCGGACGTGCTGAGTATGAAAATTTT
+GCGGACGTGCTGCCCGCGAGCTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_495
+TCACTCCATCATAGTCTGATAGATCTTTTTAAGAATTGATTAATCGGACGAGAATAAAGA
+TAGGGTCCCATTATACATGTCAATATCGACAACAATGAAATTTATAGTAAGAGGAGGTCC
+AGATGGACGGTCAGTGCGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATACCG
+CGTCGATGTTGCGGACGTGCTGCCCAGAATCTCTTGCGGACGTGCTG
+>ds2020-267_496
+CAGCAGGTCCGCAACGTCGGTTTTGTGTCCGTATCGGCGGTGCCAATCGGTTGCGAGGGG
+TGTGTAGAGCGATTCGAGTCGGTCAAACACTGCGCGGAAGGTTGTTCGATTCGCTAAGAA
+ATAGGAATCGGTGGCGAAGGGGGCTTCAGCGTTCACGTGCCATTTATATGGGTAGTGGGG
+CTGCACATCATAGATGTGGGCAGGTCGTCAATTTTGCGGACGTGCTG
+>ds2020-267_497
+CAGCACGTCCGCAACTGAAGGTTCTTTCTATCTATGATCTTTCTATCTCTGTGCAGCTAC
+TTCACGCCATTCAAATAAATAGCTCATCCTCCAAATTCCAGACCCTTTTGGTTTCTGCAA
+AAATGTCGAGAGCTCAACCACACAGATGGCTCTCCCTACTCATCCTCTTCCTTGTACACC
+TTTCACACACATCTCACGCCGACGTGGACTCTGTTTCGGACGTGCTT
+>ds2020-267_498
+GACGGCACTGACCGTCTAAGTGTAGATAGTGTAGATGTATCGCAAGCTATGCCAACTATC
+GATGACGCATCTATGATGTTTGCCGCAGGCACAGGTGAGCTAGCGGATAAACACATCTCT
+GAGCCTATAACGGGTGTAGAGATGGCTGTACAGGACGCGGCTATTGGGACGTGCTGGCTG
+GGGTGACGTTGCGGACGTGTGACGCGTGCGTTGTTGCGGACGTGCTG
+>ds2020-267_499
+TAAGGAGCAGCACGTCCGCAACGAGTTAGGGGTCAGCACGTCCGCAAGTCGACTACGGTC
+AGCACGTCCCAAGTGGAGCCAATTTGCGGACGTGTCGCTTAGGCGACGCACTGACCGTTG
+GCGTATGGGGTACGCACTGACCGTGTGTCATCCCATTAGATACGGCCAGTGCGTCAGGTA
+AAAATCTACGGTCAGTGCGTCAGCCCCCCGAGAACGGTCAGTGCGTC
+>ds2020-267_500
+GACGCACTGACCGTGATTTATCCCCTGGACTACGGTCAGTGCGTCAGGCAACACTATACG
+GTCAGTGCGTCAACCCGTTCCTAACGGTCAGTGCGTCGCCTTAAGCGTGGCAGCACGTCC
+GCAACCAGATATCGATCATTGCGACGTGCTGACCGTACAATGATTGCGGACGTGGAGGCA
+GATGGACTTGCGGACGTGCTGAGCGAATTCCCTTTGCGGACGTGCTG
+>ds2020-267_501
+CAGCACGTCCGCAAGACTTCGCCCCTATTTCTATCCGTGTAATTTCGAATACTTGAACGG
+TCGATTCTTTTTTTTTCATCTTAGCTTTCACCTTTTCGAATGAAACCAGAGGAGTGTTTC
+ATTATGATCTGGATTACACTTTTATCTTTCATTTTATTCTTATCCTTTTCTTCGGGCAGA
+CCCTCTATAACATAACAAAAAAAAGGGGGCCTCTTGGGGACGTGCTG
+>ds2020-267_502
+CAGCACGTCCGCAACTTGTCCCCCGTTATGTTATAGAAGAACTGAACTTATTGCTGGGCT
+GGTTATTCAGAGCCAGCAATTGGCTGCCGGATTTCGTCCCGCAACTAGAAGAAGATCGCT
+TCGGGGGTCACTGTGGCGTGGCTGAATGTAGAGCAGTCTGCCCCTACAGCGTTTGATCAG
+TAGATTATTTAGAACTTCGGAGGGCCAGCCCATTGCGGACGTGCTG
+>ds2020-267_503
+GGGGAAACCTGGAATGTCCGGAGTAGTGTCCGGTGGCCCTGCCCTGAATGTATAGGGGTG
+TGGGTGGTAACGCGGGGAAGTGAAACATCTTAGTACCCGTAGGAAGAGAAAACAAGTGTG
+ATTCCGTGAGTAGTGGCGAGCGAAAGCGGAGGAGGCTAAACCGTGTGTGTTCAAGCCGGC
+AGGTGTTGGATGTGCGGGGTAGTGAGGGGACTTTGCGGACGTGCTG
+>ds2020-267_504
+ACATTACGTTCGCTTGCATCCGGCTGTCCATAAAGCTGCCATGGCAAAAGCAAACGGTAC
+CACCGCGCCCACAAAGCCCATATACAGCATCGGCGGGTGAAAAATTAACCCGGGGTCTTG
+CAGTAGTGGAGGGAGAGCCAGTTGCGGACGTGCTGCTCCTTAGATTGTCCGCAACTACGG
+CTTAATACTTGCGGACGTGCCAAGAGTGGTCCCTTGCGACGTGCTG
+>ds2020-267_505
+CAGCACGTCCGCAATAAAACCACTGGAAGTAAGGACGTTGGGGCTTCATTACGCTCGTTG
+GTAGTATCTACCTGACAACCTGTGTCGGTTTGGGGTACGATTTGATGTTACCTGATGCTT
+AGAGGCTTTTCCTGGAAGCAGGGCATTTGTTGCTTCAGCACCGTAGTGCCTCGTCATCGC
+GGACGTGCTGAGGTGCCGAATATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_506
+CAGCACGTCCGCAACTCCTACTGCCTAGCCCTTGGGACGTGCTGAGGGTCTCAATATTGC
+GGACGTGCTGCTCCTTAGATATAAGGACGTTCGGGCTTAAAGGTCCCTCTCGCCTCGTCA
+ATCACTTCGCCCATCTTCAGCGCCGTGCCCGAGGGGGCGTCCGCCTTGTGCTTGTGGTGC
+GCCTCGATGATCTCGATGTCATAGCCCGTATAAAGCCCGAACGTCC
+>ds2020-267_507
+CAGCACGTCCGCAAGAGCTTCCCGATCTCTTAGGATCGACTGACCCATGTCCAACTGCTG
+TTACCATGGAACCTTTCTCCACTTCAGTCTTCAAGGTTCTCACTTGAATATTTGCTACTA
+CCACCAAGATCTGCACTAGAGGCTGTTCCACCCAGCATCGCTGCCAAGGCTTCCACTCCC
+TCCTATAAGCCCGAACGTCCAGCATGTCAAATAAGCCCGAACGTCC
+>ds2020-267_508
+ATCTAAGGAGCAGCACGTCCGCAACGTACTACTGGTCAGCACGTCCGCAATTACCTGAGA
+CTCAGCACGTCCGCAATCAATTACGGGCCCGCAACTTCCCTGATTTGCGGACGTGCTGCT
+CCTTAGATATCTAAGGAGCAGCACGTCCGCAAAAACCTTTAAGTGGGACGTGCTGGGGGT
+TAATGATTGCGGACGTGCTGAGGGATGACGCCTTGCGGACGTGCTG
+>ds2020-267_509
+CAAGCTTTTAATAATATGGCCGTGATCTGTAATTACGTGCGACTATCTCCACTATAGAAA
+TAAAAAAAGGAGAGAAAGAAAAAATCCGTTAACGTTAATAAATACTAGAAACAAAGTGTA
+GGCTTAACGGTCAGTGCGTCGCCTTAAGCGAGGAGCAGCACGTCCGCAACTGGCGACCGG
+TGTAACATTGCGGACGTGTGAGTGTGATAATTTTGCGGACGTGCTG
+>ds2020-267_510
+GGACGTTCGGGCTTCTACTAAGGGCTGGACGTTCGGGCTTGCAAACTTCACTGGACGTTC
+GGCTTATAAACCCTACTAAGCCCGAACGTCCTTACTTCCAGAGCACGTCCGCAAGTTGTC
+TCGACTCAGCACGTCCCAACCTCGCACTTGTTGCGGACGTGCTGACCGAGTGACATTTGC
+GGACGTGCTGAGGTACGAATATTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_511
+CAGCACGTCCGCAAAGAATCCCCGCTTTGTGGCGGAAGAAGCTGGTGATGATGATTTCTG
+TGATGTGGGAAGTGTGAGAACAGCGGCTGCTCACCCCCATCACTCAGAAGAAGAGGAAGG
+AGATGGTCTTGAGGTTGAAGATGGTAGAGAAAGAGTGGAGAAGAAAGCAGTTCTTTATAT
+TTGGAAGTCTCAGAGGCAGAGCGAACGAGTATTGCGGACGTGCTG
+>ds2020-267_512
+CAGCACGTCCGCAAATTCGTTGGAATACCCTCTGGCCTATTTATCACTCAACTGTTCGAT
+TCCTGCTGATGGCGTGCCACGAAGTTCATTATGGAGCTCTACGGCCCGAAAGGCTTAGTG
+GGGTACTCCCTTGGGAGGGTTGGCCCGGTAATGAATGGACGGTCAAAAGACCATCAGTTC
+GGCTGGGTCCGTGCGTCATAGGAACGAAACTTTGCGGACGTGCTG
+>ds2020-267_513
+CAGCACGTCCGCAATTCAACACCAATCTTACCCTCAATGATCTCATGTTTCCCATCTTGG
+TCTTCTTCAAATTCATCCGAAGAACTCCCATTTTCTTCAACCCCTCCGTTCACACCAGCC
+ATAGCCATAGTAGCATCCGTCACCGCCTTTTTCTCCTTACTCGAAAAAGACTCCAACTTT
+TCAACACTACCCTAGGGAAGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_514
+CTAAGGAGCAGCACGTCCGCAAGGATCTCACCCCAGCACGTCCGCAACATCTCTCCCTTT
+GCTTTCGCTCCTCAGCGTCAGTTACTGCCCAGAGACCTGCCTTCGCCATCGGTGTTCCTC
+CTGATATCTGCGCATTTCACCGCTACACCAGGAATTCCAGTCTCCCCTACAGCACTCAAG
+TTATGCCCGTATCGCCTGCACGCCCAAATCGAAGCCCGAACGTCC
+>ds2020-267_515
+CAGCACGTCCGCAATTAGTCCTCCCCAGCACGTCCGCAAACTCTATACCCCCAGCACGTC
+CGCACTGCTCTCCGGCAGCACGTCCAGACAGTTACGTTTGCGGACGTGCTTCTGGAAGTA
+AGGACGTTCGGGCTTGGGGTGTGAGTTATTACCGCAAATTTTTTATCCTTTGGTCACAGG
+ACGCGCCAATGGTACAGGGAGGAGGTCTGTAAAGCCCGAACGTCC
+>ds2020-267_516
+CAGCACGTCCGCAAGGCAGGTTGGGTTGCAATCACCACGCCTACCAGCATGCCGACTATT
+CCCCAAACCACAGCCATGACAGAAAATTGGCGCACAACCCTATAGTTGTATGAGTTTTCT
+TTAGTTATCGTCATGATCTCACTCTGTTGTAAAAATACACTGAAAGAATAACAACCGCAC
+TGCACAACTACCATCACACACACCAATGATATTGCGGACGAGCTG
+>ds2020-267_517
+GACGCACTGACCGTCGCCATCCTCTTGACGCACTGACCGTAAGGGGACACCTGACGCCTG
+ACCGTTTCTATGCTGTTGGTCACGGTCAGTGCGTCGCCTTAAGCGTCGTCCGCAAATCCG
+CTGGGGTTGGGACGTGCTGAGATGGACCGGGTTGCGGACGTGCTGAGTGAATACTGTTTG
+CGGACGTGTGAGGAGTTATCGGTTGCGGACGTGCTGCCCTTAGAT
+>ds2020-267_518
+TATCTAAGGAGCAGCACGTCCGCAATACCAAGGGGCTGGAATTGCGACGTGCTGATGGGA
+TAAGTCTTGCGGACGTGCTGAGGGATTCGACCTTGCGGACGTGCTGTCTGGAAGTAAGGA
+CGTTCGGGCTTCCCGTGGCTTGTGGACGTGCAGTTAGCTATGTCGATGTTGTCAAGATCT
+GCCATGTTTTACTCATAGGAGCCTGCAAGTCAAGCCCGAACGTCC
+>ds2020-267_519
+CAGCACGTCCGCAAGCATCTAAGGCGGGTTGCGGACGTGCTGTCTGAAGTAAGGACGTTC
+GGGCTTGGATGCGCTTTGTGGAGGGCTGCACTATGATGCGGGAAACCCCAGTTTTGTCTC
+TGCCACTGTGGAGCAGCACGTCCGCAATGGAGATGGAGTGAGTTGCGGACGTCTGGGCCA
+ATAATGTTGCGGACGTGTGAGGGACGGCTGTTTGCGGACGTGCTG
+>ds2020-267_520
+CAGCACGTCCGCAAACTCAGTACTCTTGCAGTTGCCCTCAACTTCTCAACCTGCTCTCTG
+AACACCAACGCTTCTTCTTTCTTACCACGCAGTTGTTCGATTAGGTCCCCTACCTCCTCC
+TTCAACTTCACTCTTTCACCATTTGTTTCCGCAATCCAGTTCTTTGCAGTTTGAAGCTCC
+TTTGTTGTTCCTAGAATACACTTCTCGTACTTTGCGGACGTGCTG
+>ds2020-267_521
+TCTAAGGAGCAGCACGTCCGCAATTACAGCCCCCCAGCACGTCCGCAAGCAATTTAGGGC
+CTCACACGTCCCAAACCCCTATCTTTGCGGACGCGCTTAGGCGACGCACTGACCGTTTCC
+AAGCCCCTGACGCACTGACCGTGTCGCTGACTCTGACGCACTGACCGTCTTTATCCCCCT
+GACGCACTGACCGTGCGTTAGCGTGTCGGGTACGGTCAGTGCGTC
+>ds2020-267_522
+CAGCACGTCCGCAATAGTGGTCTCCTCAGCACGTCCCAATATATCTTAGGTCGCACGTCC
+GAAATCCCTCCCTCTTGCGGACGTGCTGCTCCTTAGACGCTTAAGGCGACGCACTGACCG
+TTATATTGGTGGTAGGTGAATCCGTGTTATAATTGGCAATATTTCAATGAAAGGAGCTAG
+GGTACTACGGTCAGTGCGTCACAGTGCGTTACACGGTCAGTGCGT
+>ds2020-267_523
+GACGCACTGACCGTACGAGTAGCCTGACGCACTGACCGTCCAGCGCTGTATGACGGTCAG
+GCGTCACACGAGAGATAACGGTCAGTGCGTCCCCCATGTGACACGGTCAGTGCGTCGCCT
+AAGCGTATCTAGGAGCAGCACGTCCGCAATGGACTACTCCTCAGCACGTCCGCAAACTAT
+GATCCCTCAGCACGTCCCAACCCAAGACCCTTTGCGGACGTGCTG
+>ds2020-267_524
+TCTAAGGAGCAGCACGTCCGCAACGTTAGACACGTCAGCACGTCCGCAAAGGATTTTCAC
+TCTCCGCAATTCCCCCTAACTTGCGGACGTGCTGCTCCTTAACGCTTAAGGCGACGCACT
+GACCGTTCGCAGGCCCCTGACGCACTGACCGTATCGTACATCCTGACGCACTGACCGTAT
+CATCAGCTGTGACCGTAATATCCCACCTCGCACGGTCAGTGCGTC
+>ds2020-267_525
+CTCCGGCGCGCCTGGACCCCAGCCGCGCGCACTACCCATCGCCCGAACGCGCCGCACGTC
+CGCAACTCCCAGGGGTCAGCACGTCCGCAACTTTTGCACACTCAGCACGTCCGCAATCGT
+AATGTGTTGGGACGTGCTGAGGGAATGACCCTTGCGGACGTGCTGAGTGCAATGTCTTGG
+GACGTGCTGAGGTGAGTGGAATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_526
+CAGCACGTCCGAAATCCCAGAAGTCTTCTGTTTTCCTTGCTCGCGGTTTCGTCAGTGCGG
+CTACACTGCTTAAACAGAAGCTCGAGCGTGGGTGTCTGTCACAGTATCCTATTATCCGCC
+TTTTTGGGAATCGCCTCGACCACAACAGTTTACGGCGACTTATCGTCCTCGCCGGCTGCA
+ATCCTGCTGCTCGTGATTTACGTGAAAAAGCTTGCGGACGTGCTG
+>ds2020-267_527
+CAGCACGTCCGCAAGGATGCCGGCATTGGGACGTGCTGAGAGTGTAAAGCCAGTCACACA
+AACAGATCAAAACGAAAAATCAAGAACAGCGTGTGATTGGGAGGTTTTCGGTTGCGCCTA
+GTCTGGATGACCATGAAGTGCAACGAGTTAATGCTGCTATAAATGAGGAAGAAGCCAATG
+TTCTTGATAATAATAATCAGAGACAGCGAATTGCGGACGTGCTG
+>ds2020-267_528
+CAGCACGTCCGCAATTTTCCGGCCCCCCAAAAGAACATTCATTCATTTCTTTCTTCCCCG
+TCGACCACGACGACTGAAACGACACGAAAAATCCAGACCCGGAAAGGAGAAGGGCCGGTG
+GTGGGCATTTGGGAAAGTCGGGCCGATCGGGTGTCTTCATTCAAGCGACGATACAGAAGA
+AGAACGAAACGAAGTGAGAGGCCAGGGTATTTGCGGACGTGCTG
+>ds2020-267_529
+ATCTAAGGAGCAGCACGTCCGCAAAGACTTCACCCCTTTTCTTAATACCCCTATTCTCCT
+TTCATCCGGAGCTGCCGTAACTTGGGCTCATCATGCTATACTCGCGGGGAAGGAAAAACG
+AGCTGTTTACGCTTTAGTAGCTACCGTTTCGCTGGCTCTAGTATTCACTGGCTTTCAAGG
+AATGGAATATTATCAAGCACCTGTCAACATTTGCGGGCGTGCTG
+>ds2020-267_530
+CGTCCGCAAGAGGCCATCACTCAGCACGTCCGCAAATTCTGGTGGCTGCCTCCTCGGGTA
+TTGAAGTCAGTTTGGTGCGCACAGACGCGGGACGGTTCATCTTAATTTCTTCTCTCACTC
+TCATTGCAATGCGCTCTACATCTCTATCGGACAGCGAACTGGTACGTGATGACCCCTCAT
+CCCGTGCAGAGCTAAGCGATTGCCTAGGCTTTGCGGACGTGCTG
+>ds2020-267_531
+CAGCACGTCCGCAAGATTCCGTGGGTTCCAAACTATATGCGGTCTCGCTATTCTTTGTTT
+GCATTCAAAGGTCTTGTGCCTGCGCTATCGAGTCACGTGCCTAACTTCCAAAGAATGAAT
+CATATGGTAGAGGAGCGAAAGTGGCCGGGGCGGCGGTGTAGAGCTATAAGGAGCGAAGCT
+CACACACACCGGCGTGAGGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_532
+CAGCACGTCCGCAATGATCGGCCTTTTTCCCATTTCTTTGAGCAATGATCTTCTCAATCT
+CTGAATCATAATCTGAATCTGAACTCTCACTGTCTTCATCCTCATCCTCACTCTCTTCAC
+TCTCAGCCACGTTTTTCCCATTCGTCCTACCCAGCTTCCTCTTCAACTTACTCAATTCAG
+ACGCAACATCAGCCTGAATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_533
+GATCTATCTAAGGAGCAGCACGTCCGCAATTGGCCAGGGCAGCACGTCCGCAAAACATAT
+TACCTCCACGTCCCAACCCAAAAACGACGCCAAAGAATTGTACGGTATCATCCCAACCTA
+ACCCGAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAGGAGT
+GAGGGATTGGGACGTGCTGCCCCCAAATGTTTGCGGACGTGCTG
+>ds2020-267_534
+GGACGTTCGGGCTTTCAGGCCACCCTGGAGTTCGGGCTTATCTTATTACCTGGACGTTCG
+GGCTTCTTGCACGGCCTGGACTCGGGCTTTAATTCGAAAGGGAAAGCCCGAACGTCCTTA
+GCACGTCCGCAAGATACACGGCATGTTGATTGCGGGTGCTGAGGGCGATAGGGTTGCGGA
+CGTGCTGAGTGGGCGTGAGTTGCGGACGTGCTGCTTCTTAGATA
+>ds2020-267_535
+TATCTAAGGAGCAGCACGTCCGCAAATCAAAGGAAATCCCTTGCGACGTGGCCCAAGGAA
+TATTGCGGACGTGCTGGGGGTGCACAATTGCGGACGTGCTGGGGAGGCATCCTTGCGGAC
+GTGCTGCTCCTTAGATAACGTCCGCAATCAGGGCCGGCTACTTGCGGACTGCTGAGGGTT
+CGAATCTTGCGGACGTGCTGCCCATACCCATTTGCGGACGTGCT
+>ds2020-267_536
+GGACGTTCGGGCTTACCAATACACCTCTTAAGCCCGAAGTCCAGGGGATCATTCAAGCCC
+GAACGTCCAGCGAGATGAGCAAGCCCGAACGTCCTTACTTCCAGTCTAAGGAGCAGCACG
+TCCGCAAGTAATACTCCTTAGCCGTCCGCAATGACATACCACTCAGCACGTCCGCAAATT
+GCACATTGTGGACGTGTGACCGACATAGGGTTGCGGACGTGCTG
+>ds2020-267_537
+CAGCACGTCCGCAAAGCATCACCCCTCACACATTGCGGACGTGTGAGAGCTATATCGTTG
+CGGACGTGCTAGGGCTGAATGTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGA
+CGTTCGGGCTTTATTAAATCCCTGCCACAACCCCATAAACAATACAAACCACACTAACAT
+ATCTAACAAAGTCATCGGAGTCGTAATTGTAAGCCCGAACGTCC
+>ds2020-267_538
+GGACGTTCGGGCTTCTGGTCATGGGTTAGAATTCTAGCTTCGCCAGAGTGGTATCTCACC
+GTTGGCTCCATACTCCCCACAAGGAATACTTCATCGCCTCCCACCTATCCTGCGCAAGCC
+AAGCCCGAACGTCCTTATTCCAGTATCTAAGGAGCAGCACGTCCGCAAACGGCTCTGACT
+CAGCACGTCCGCAAGCTGCATGCCTTTGAGATTGCGACGTGCTG
+>ds2020-267_539
+GACGCACTGACCGTGTCAGCTTCCGTCCATTTAACTAAAGAGCAGAAGGTTAGCTTACCC
+AGTAGCATTGAAGAGGTGTTATGCCGTGACTATTGATGGCAAATTCACGCCTGTTCATAA
+ATTAGATGTTTTTCGACTATTAATCAGACGGTCAGTGCGTCGCCTAAGCGTATCTAAGGA
+GCAGCACGTCCGCAAGAAAGGGGCCATCGATTGCGGACGTGCTG
+>ds2020-267_540
+GAAAGGAGTATGTCGCTGACGGACTAGGCTCTATTGAGGGAGTAAGTCGCTGACGGACTA
+GGCTTTAATGAAGGAGTCACTTAAGTGGTTGTTCCTACAATTGTTGAGAACAGAAGGGTG
+GACACAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAGTTTC
+TTAGTTTTGCGACGTGCTGCCCCTCAAGGGTTGCGGACGTGCTG
+>ds2020-267_541
+CAGCACGTCGCAATCATCCGGTGTTTGTTGCGGACGTGCGAGGAGTGCATAATTGCGGAC
+GTGCGCCCAGCGGTCATTGCGGACGTGCTGCTCCTTAGATATCTAAGGAGCAGCACGTCC
+GCAAGTTCTGACCCCTCACACGTCCGCAACCAGTGCACCATTGCGACGTGCTGAGGCTGA
+CGTATTGCGGACGTGCTGACAGGTGAATAATTGCGGACGTGCTG
+>ds2020-267_542
+TCCGCAAATATAACGGCCTCAGCACGTCCGCAAGTCGAGGCACCTCAGCACGTCCGCAAT
+CCGTGGGTCCTGTCCGCAACCTCCACCCGTATCGATTTGCGGACGTGCTGCTCCTAGATC
+GCTTAAGGCGACGCACTGACCGTATAACTAAGCCTGACGCACTGACCGTACCAACCGCCT
+GACGCACTGACTGTTCATAAGGGACTGCAAACGGTCAGTGCGTC
+>ds2020-267_543
+CAGCACGTCCGCAATGCCCCATGCCTTTTTTGGTTGGACCAGCCCAACCGGCGATTTCCG
+TCTTCCTGAATTGGGAGAGCAAGCACAAGTCTCTCTTCTTTTTTTCCTTTGAATTACTCA
+TATATATATCCTATGAATTTCATTTCGCACCGGAAACTATTCTAGGAGAAGTTCGAATCC
+GTTCCGTTCGGATATTGATCGGTCTTGATTTGCGGACGTGCTG
+>ds2020-267_544
+CAGCACGTCCGCAATTGCGTGGCCCTCCACCTCGTTGGGAAAAGTAAAAAGAAATAACAA
+GCCCTAAACTAAATATCAACTAGCAGCTTATCAACCACCGAACACAGACTCATGTTGGCG
+ATGCCATGGTCAAGTAAGAGGACGACCCATTCACCTCAAAAGAAAAATCTCGCCTCTCAA
+GTAAGCTATGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_545
+CAGCACGTCCGCAACTTGCCCGGCATGAATTTATCAGCCACCGTGTAATACAAATTATAT
+CAACGTAATTTTCACGTTTTGGACCATACAAATCCCATATATATAAAACCCAGAAACCAA
+AAACTACGAAAAAAAAGAAGAAGAAAAACGGTGTAATAATTAATACTCCGTTCCGTTCCC
+GTTCAATTGAATTGGCACCTGGTTAGCTTTGCGGACGTGCTGA
+>ds2020-267_546
+CAGCACGTCCGCAAGTTAGCCCGCCTCAGCCGTCCGCAACGCGATAACTCTCAGCAGTCC
+GCAACCAGATGGCTATACTTGCGGACGTGCAATCTAAGGAGCAGCACGTCCGCAATTTCG
+GGGTCTTGAGACGTGCTGCCGGACAATACTTGGGACGTGCTGAGGACTACGATTTGCGGA
+CGTGCTGGGCCATTAGGATTGCGGACGTGCTGCTCCTTAAGAT
+>ds2020-267_547
+GACGCACTGACCGTGGCTTTAGGGGTGAAAGGCTAATCAAATTCCGTGATAGCTCGTTCT
+CGTCGAAATATCTTTAGGGATAGCCTCGGATGAATCATTGTGGTGGTAGAGCACTGACTG
+GACTAGGGGCCTCACAAGGTTACCGAATTCAATCAAACTCCGAATGCCAATGAATTATGG
+TCGGCAGTCAGACTGCGAGTGCTATCAAGTTGCGGACGTGCTG
+>ds2020-267_548
+CAGCCCGTCCGCAAAACCGGTCTCCTCCGGCTAGTTTGTTGCCTTTACCTTTACCTTTAT
+CTTTATCTTTATCTTTTTTTCCTGTATCTGGCTCGATGTTTTCGGCATTTGGGGTCTGAC
+GCGGTGCGATACTATCAAAAATACTTGCCATCGATATATCAAAATTATATTTGAGCATGG
+CTTCACCACGGGCCTGGACTTGCGGACGTGCTGCTCCGTAGAT
+>ds2020-267_549
+GGACGTTCGGGCTTAAGATGGGGGGTGATAACGGGTCTGCTTGCAGACGAAGTGAGTGAT
+ACCCTGCTTCCAGGAAAAGCCACTAAGCTTCAGCTACACACGACCGTACCGCAAACCGGC
+ACTGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAATTTCTGC
+CTATTGCGGACGTGCTGAGAAGGGGTGTGTTGCGGACGTGCTG
+>ds2020-267_550
+GGACGTTCGGGCTTACCTTGCTCCCTGGACGTTCGGGCTTCGTAATTGGGTTGGACTTCG
+GGCTTTATCCCACCGCTGTAACTAAGCCCGAACGTCCTTACTTCCAGAATCTAAGAGCAG
+CACGTCCGCAATACGGGGTTGGTCAGCACGTCCCAAGTGATATTGCCTCAGCCGTCCGCA
+AGGTCCACACGCGTGGGTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_551
+CAGGTCGTCCGCAATGGCGAATCCCTCGGGTCGTCCGGAAGCAGTCTTGAGTCTTTGAGG
+AGGGGGGGGGGGGTGGGGGGGGGGGGCGGGGGGGGGGCGGGGGGCGGGGGGGGGGGGGGG
+GGGGGGGGGCGGTGGGGGGGGGGGGGGGGGTGGGGCGGGGGGTGGGGGGGGGGGGGGGGG
+GGGGGGTGTGCGGGGGGGGGGGGGGGGGGGGGGGGGTGGGGGC
+>ds2020-267_552
+GGACGTTCAGGCTTACTGACTCCCCTGGAAAAGAAACTGACTAGGATTCCCTTAGTAACG
+GCGAGTGAACCGGGAAAAGCTCAAATTTAAAATCTGGCGTCTTTCAGGCGTCCGAGTTGT
+AACCTATATGGATAAGCCCGAACGTCCTTACTTCCAGTCAGCACGTCCGCAAGAGCTTAT
+CCCCAGACTCCGCAATCTATTGTTCCTGATTGCGGACGTGCTG
+>ds2020-267_553
+TATCTAAGGAGCAGCACGTCCGCAAGCATGCCGGCCTCAGCACGTCCGCAAACCGATCCC
+CTCAGCACGTCCGCAATCTAACTGCTTTATATTGGGACGTGCTGCAGCATGGTTAGATGT
+GTAGGGGAGACGGGGGAACTCCGGTGGCGGGGGGTGGTGGGGGGTGGCGTGTTGGGGGGG
+TGGTGGTGGGTGGTTGGGTGGGTGGGGGGGGGGGGGGGGGGGG
+>ds2020-267_554
+CAGCACGTCCGCAATCGGTATTTTGTCTTGTGGGAGATTAAAGCTTAGGAGGCATGGAAG
+ACAAGCTCTGGTGATCCACGTTTTGGGAAAGCAGCGAAAACGAAGAGGTTGGTTGCGGAA
+AACAGGGTTTTGGTAACGAAAGATTTACAAACGGAGAAACGGAGAAACGGAGAAAGAGAG
+AGGTTTTTTTTTGGGGGGGTACTCTCCCTTGCGGACGTGCTG
+>ds2020-267_555
+CAGCACGTCCGCAAAACACATCCCCTCAGCACGTCCGCAATTTACCTGTATTTATTATTG
+CTTTCATTGCTGCACCTCCAGTAGATATTGATGGTATTCGTGAACCTGTTTCTGGATCTT
+TACTTTATGGAAACAATATTATTTCTGGTGCAATGCTTCCTACCTCTGCAGCTATAGGGT
+TTCACGTTTAACCGATATCAGAAGCGCCTTGCGGACGTGCTG
+>ds2020-267_556
+CAGCACGTGCGCAATACTGCCCAATTTTTTGGTGGGTATCAAAGTTTTCTGTCTACCCAT
+ATATATATATGAAAATCTTTTCTTTGCTACCTCTTCTCTTTCACGCCAATAACTTGGCTT
+CCTTTTCCCTTTATTTTATTGGACTTGTTTTGCACCATATGCCTCTTCCGTTTCAACACC
+TCTTACACTTGTCCACATCACCTACCCTTTGCGGACGTGCTG
+>ds2020-267_557
+CAGCACGTCCGCAAGATGAACAAGGTACCGGCTGCAATAGGATGAGACGCGCTTCCTCCC
+GGCACAAAAGGATCAAAACCCTCCACACCCCACGCTGGATTTACGGATTGTACCCTTCCG
+GTTAGTCCATAAGGATCGGACACCCATATTCCAGGACCATACAATCCTGTTACATGAAAT
+GCACCAAAACCAAAGCAAGCCTGCGCCGTTGCGGACGTGCTG
+>ds2020-267_558
+GGACGTTCGGGCTTTCTGGTTACCCTTCCCTAGTCGATTAGTGATTTTTGACTAAGAATG
+ATACCGTTATTATCCGCATACACATACATGCCAGAGTTGATAGTTAGACCGCCAAAGCTG
+ATTTCGATATCCGTCTCGCCCACACCTTTGCGATTGGATTTTCGGGGGATAGCGAAAACC
+AGTTGCGGACGTGCTGACGGATATGCTCTTGCGGACGTGCTG
+>ds2020-267_559
+TCTAAGGAGCAGCACGTCCGCAACGTAGCCTGGGCAGCACGTCCGAACTCTCTACTCCTC
+AGCACGTCCGCAAGGGACAAGGTCTTGCGGACGTGTGAGGGACGGCTATTGCGGACGTGC
+TGCTCAATCTAAGGAGCAGCACGTCCGCAACGTAGCCTGGGCAGCACGTCCGAACTCTCT
+AGTCCTCAGCACGTCCACAGTGATTGGTTTGCGGACGTGCTG
+>ds2020-267_560
+CAGCACGTCCGCAAATACTGTGGCCTCAGCACGTCCGCAAATTCCCTTCCCTCACACGTC
+CGCAACAGGACAACCCTCAGCACGTCCGCAAATACTCTGGCCTCAGCACGTCCGCAAATT
+CCCTTCCCTCACACGTCCGCAACAGGACACCCCTCAGCACGTCCGCAAAATAAACTGCAT
+GCCCTTGGGACGTGTGAGCGAATCACTATTGCGGACGTGCTG
+>ds2020-267_561
+CACGTCCGCAATTGGTGTTGTGGGGCGGGGGGGGCGGGCGGGGGGGGGTGGGGGGGGGTG
+GGGGGGGGGGGGGTGGGGGGGGGGGGGGGGGGGTGGGTGGGGGTGGGGGGGGGGGGGGGG
+GGGGGGGGGTGGGGGGGGGGGGGGGGGTGGGGGGGGGTGGGGTGGGGGGGGGGGGGGGGT
+GGGGGGGGGGGGGTGGGGGGGGGGGGGGGGTGGGGGGGGGGG
+>ds2020-267_562
+CAGCACGTCCGCAAGTAGCGCAGCCTCAGCACGTCCGCAAGCAGAACTCCCTCACACGTC
+CGCAATTATTCTCCTTCTGTTGCGGACGCCGCTTAAGGCGACGCACTGACCGTTAGATCC
+CTCCTGACGCACTGACCGTATCTAATCCCCTGACGCACTGACCGTCGGACCGTCTCTGAC
+GCACTGACCGTCAACTAAGGACTGTAAAACGGTCAGTGCGTC
+>ds2020-267_563
+TCATGGCCTCAAGCTTGGCTCGGTACTACCATTATAGGCGACTGTGCATTATCGATACGC
+CGCTCATAGACTTCGCAGGTGTTACCATGAACTGGGGCCTCGTGGTCGTGTGGGAGCTGA
+TCTGGGAAGCCCGAACGTCCTTACTTCCAGTATCTAAGGAGAGCACGTCCGCAATAGGTT
+GGGAGTCAGCACGTCCGCAATGGTGCGCTTGCGGACGTGCTG
+>ds2020-267_564
+GACGCACTGACCGTTCTACAGCCATTGTCACACGGTAAGTGCGTCAGGAATCCGGCCACG
+GTCAGTGCGTCAGGCAGAATCTCACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCA
+ATGGCGCTAATATTGGGACGTGCTGAGCGCATAACCATTGCGGACGTGCTGGGGTATCGG
+CATTGCGGACGTGCTGAGGAAATACGTGTTGCGGACGTGCTG
+>ds2020-267_565
+AAGCCTGGTTCTTTGACGCACTGACCGTTGGAGGCCCACTGACGCACTGACCGTGAACGA
+GTCCTTCTGGATTGTTGCCCAACGTTTTTGGGTCAATAGTTGCTGTTAGCCCCACCACTT
+CGCCATTGTCATCGGTGATGTGCTCCTCAATCTTTAGCACATAACTATTGCGTAAGCGGA
+TTTCTGGGTTTTACGGAGGCATCAGTAGACGGTCAGTGCGTC
+>ds2020-267_566
+CAGCACGTCCGCAATTGGTCCCGGCAGCACGTCGCAACCAAATAGACATTGCGGACGTGC
+TGCTCCTTAGACGCTTAAGGCGACGCACTGACCGTATTTGTCCGAGTTTAATTTCAATTC
+AATTAAGAGAACTAACAGTAAGTAATTACTAGATTACAAAGTATCCATTGCTTGGAATTC
+AAATTGTATCCATTGCTTGGAATTCAAATTTGATCTCCTTC
+>ds2020-267_567
+CAGCACGTCCGCAATTCCTCGTGACTCAGCACGTCCGCAAAACCTTTAGCCTCAGCACGT
+CCGCAACGGGGCTCCACTCAGCACGTCCCAAGTTTACCGCCATTAATTTGCACGTGCTGA
+GGAGTTCGAAATTGCGGACGTCTGGAAGTAAGGACGTTCGGGCTTCAGTCCACCCCTGGC
+GTTCGGGCTTAACTCACGGATTAGCGCAAGCCCGAACGTCC
+>ds2020-267_568
+CAGCACGTCCGCAAGTTATGATCGCCCCGTCCCAACCTCATCCCGCTGATCTTGCGGACG
+TTGCTCCTTAGCTTGCTTAAGGCGACGCACTGACCGTTGGATTGAGCCTTGGTATGGAAA
+CCTACCAAGTGAGAACTTTCAAATTCAGAGAAACCCTGGAATTAAAAATGGGCGATCCTG
+AGCCAAATCCTGTGTTATTAAAACAAACAAGGGGTTAATAA
+>ds2020-267_569
+CAGCACGTCCGCAACAAGCAATGGTGCGAAGCTATCATCTGCTGGATAATGGCTGAACGC
+CTCTAAGCCAGAATCCGTGCTAGAAGCGATAACGTTGGTCCCGCACATGCCTAGTGTTGG
+AATAGAGCTTTGCTCGTACACCATACAAGCCGCGTGCAGCCGGAAGGGGTAGCGTGGTTG
+ATTGCAATGTAAACAAGCGCGGGGAGCTTGCGGACGTGCTG
+>ds2020-267_570
+TCAGCCCGTCCGCAATAACCCACGGCTCACCCGCCCGCAATAGTTCGGCCCCAGCCGTCC
+GCAACCTGGCGAGGTCCTGGCGGACGTCTGGGGCCTAACTATTGCGGACGTGTGAGCAGT
+GGGTTATTGCGGACGTGCTGAGTCCGCAATCTCTTACGCCTCAGCACGTCCCAAGGTTTT
+AAGGGTGCGACGTGGAAAGGATCCCGCTTGCGGACGTGCTG
+>ds2020-267_571
+CAGCACGTCCGCAATACACATCCCTGCAGCTTTCTAGAAAGATCAGCCACCGTCTACGGT
+GACTGCCCCTCTCTTATTTACAACGATACCACCTACACGTGGACGCAGACCCACCGTCGA
+TGCATCCGAGTCGCTTCCTCTATATCATCGCTCGTCATCAAGAGTCGCCACGTGGTGTCT
+GTTCTCTCTCCCAACACTCCCCCCATATTGCGGACGTGCTG
+>ds2020-267_572
+CAGCACGTCCGCAAGCCGCAAATGGTATTTTTTTAATAGCCCTTGGTACTATCTTTTTGG
+GTACGCGCTTGTATCTTTAAGCATATTTTTCGCTAAATCAAAGCCAAATCATGTTGATGG
+TAGTTGCCATCTTATTGTTAATTTTTTTCCCCTTTTTTCCCTATTATAGGTAGAGGGCCC
+GCCATCTAAAATGCCAACAGTGGAACCTTGCGGACGTGCTG
+>ds2020-267_573
+GACGCACTGACCGTGTGCCACCCCTGACGCACTGACCGTCATTATGGGGCTGTAGACGTC
+AGTGCGTCAGGACTATGTGCACGGTCAGTGCGTCACGGGGGCACCTACGGTCAGTGCGTC
+GCCTTAAGCGTAGCACGTCCGCAATTGGTATCGGTTTGGGACGTGCTGAGCCGAAAGACT
+TTGCGGACGTGCTGAGGGGAAGAGATATTGCGGACGTGCTG
+>ds2020-267_574
+GACGCACTGACCGTTGGATTTGGGTGACGCACTGACCGTACGTATACCTCTGACGCACTG
+ACCGTACATCAGACCCTAACACACGGTCAGTGCGTCAGGTCGTACTTGACGGTCAGTGCG
+TCGCCTTAAGCGTGTCCGCAAATCCCATGCATTGCTCTTTGCGGACGTGTGGGCCTACAT
+ACTTGCGACGTGCTGAGGATTTCGTCCTTGCGGACGTGCTG
+>ds2020-267_575
+GGACGTTCGGGCTTATTCTATGCATTGGACTTCGGGCTTGTGCTATCCCTGGACTTCGGG
+CTTGAGCCTAAACATGGACTTCGGGCTTACAAATGCTGCTAGAAGCCCGAACGTCCTTAC
+TTCCAGCCACGTCCGCAAGCTCCTTACGCTCAGCCGTCCCACAACATCTACCATTTGCGG
+ACGTGCTGGGGACACATATTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_576
+GGACGTTCGGGCTTTTACGGCCCCCCCCCTTCTCATATCAATAACTAAAATGAAAAAAAG
+GGGAATATCAACGAATCCGGAAAAAAACGATTGATCTCTATCAATAAATGTCACACTAAG
+CCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAATTCTCATGATCTAG
+GACTTGCGGACGTGTGAGGGGCCTTGTGTTGCGACGTGCTG
+>ds2020-267_577
+CAGCACGTCCGCAACGCCGATACTATTGCGACGTGCTGGGGGTTTGTTATTGCGGACGTG
+CTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCTTGGACGTTGTTCTGACGCACTGA
+CCGTACACTCTCGCCTGACGCACGACCGTAGTATATCCCCGACAGCACGGTCAGTGCGTC
+GCCTTAAGCGAATCTATATCCCCTGGTTTGCGGACGTGCTG
+>ds2020-267_578
+CAGCACGTCCGCAACCATGGTCCCTCCACACGTCCGCAACGGCTCCAATATTGGGACGTG
+CTGAGGCGACGCACTGACCGTATGTAGGCCTCTGGACGCACTGACCGTTCTTCTCAAACT
+GACGCACTGACCGTGGTTACTAGCCTGACGCACTGACCGTGTCATTCGAACTCGAGATTT
+CTGTTCTCGTTGAGCACATTCCTAGGGACGGTCTGTGCGTC
+>ds2020-267_579
+GGACGTTCGGGCTTAGGTTACGGAATACAAAGCCCGAACGCCAAAGGATGCGAAGCCCGA
+ACGTCCTTAATCTAAGGGCAGCACGTCCGCAAACTCCTCCTCCTAGAAAACCTTCTATCC
+TTCAAAGCAGCTCCATCTTTTCGGGTCTTGTTCAGAATCAATGCGCGTTCCCTTTCTTTC
+TTTCGCTTCTCCCTTTCCAATCGTTCTTCCCTCAATTCTT
+>ds2020-267_580
+CAGCACGTCCGCAAACTTCCGGGTCTTTTCATTGCATTCACTTACAACAAGAAACAACCA
+CCAGCGTTTGGTGCAGCACCTGCATTTTGGTGCATTCTTCTTTCTTTCCTTGGTCTTTCG
+TTCCGTCATATTCCTAATAACTTATCCAATTACAACGTATTAACCGCTAATGCACCTTTC
+TTTTATCAAATCTCAGGGACAGCCCGTTGCGGACGTGCTG
+>ds2020-267_581
+CAGCACGTCCGCAATAACAGGCTGGTGACATATCGAAGAGACAGGACGTGCAAGGCAGTA
+GTACTGATGAGACCGGACGGATTTAAGCCGGACGTCATAGCGACCGTTTATGGGTTCGCG
+TACGGTTTGACCGAAAACGTCTTGACGATACCTCGAGGAGCCAAAGACGAAGGGAGTCAG
+GCCGGTGGGACAGGCGTATGGATCAAGACGGACGATAAGA
+>ds2020-267_582
+CAGCACGTCCGCAAACGGCACTGTCTCCAGACCCAGTGCCAGACCCAAAGCTGTGTGTCG
+TAACGATGTCATTGTCATCTCTCTTATTGTGCCGGATGCGCGATATCACGCGTTTTATGC
+TCGCGAGGTAACATGACATGCTCGAATGACAGAAAAATAACTGTTTGTTTACAGATAAGT
+GACAGCCAGGCGTCAGAGGTCTGAGGTTGCGGACGTGCTG
+>ds2020-267_583
+CAGCACGTCCGCAAGTCTAGCTAAGTCCCATGCCACTCTCCATGATGAGAAGTGCAATCT
+TGGATCCCTTAACATAGCATCCCAATTGTCCCTTCCATGTCTCCTCACACCTATCCATAG
+AAAATCCAACTCCTCTTCAGACCACATGGTACTATATGGCTTATATTTGTCATGAAAACT
+ACTCCTTTCATTGAAAGCTCAGCGGCTTGCGGACGTGCTG
+>ds2020-267_584
+GACGCACTGACCGTCTACTACTCCCTGACGCACTGACCGTGTGGACCCCCATGACGCACT
+GACCGTAAGTTTTCCCTTGACGCACTGACCATTTCATCCCCTACGGTCAGTGCGTCGCAA
+ACTAAAGTCCCTCAGCACGTCCGCAATAGTTCTGGCCTCAGCACGTCGCAAGTCCTTGTC
+CGTCCACGTCCGCAATAGCCAATTGTTTGCGGACGTGCTG
+>ds2020-267_585
+GACGCACTGACCGTACCACCTCAAATAACACTCAGTGCGTCAGACAATAAACTACGGTCA
+GTGCGTCAGACTATACCTAACGGTCAGTGCGTCGCCTTAAGCGGAGCAGCACGTCCGCAA
+TCGGCGTTTACTCAGCACGTCCGCAACGATAGACCTCTCACACGTCCGCACTAGCCGGGA
+ATTGCGGACGTGCTACCCGGAATTACTTGCGGACGTGCTG
+>ds2020-267_586
+GACGCACTGACCGTTACGGGGGGGGTGGTGTGGGTAAAAAACTAATAAATATTTAATTTA
+TCAACAACAATGCAAAATCACATGGGGGTGTATCCGTATTTGGCGGAGTAGGTGAGCGTA
+CTCGTGAAGGAAATGATCTTTACATGGAAATGAAAGAATCTGGAGTAATTAACGAACAAA
+ATATTGCAGAATCAAAAGTGTCTCCCACGGTCAGTGCGTC
+>ds2020-267_587
+CTCAGCACGCCCGCAATAGAAAACGAGTGAGTGTGAACGGTGTGGCAGAAGGAACTGCAA
+GAGGTGGTGTGCCTTTAGGTAGAATTGCTGTTTACAAAGTGTGCGAGCCAGTGGGTTGCA
+ATGGTGAACGAATTTTGGCTGCGTTCGACGATGCTATAGCGGATGGGGTAGATGTTTTAC
+CCATTTCTCTTGGAGACTAGCTTAGGCTTGCGGACGTGCG
+>ds2020-267_588
+CAGCACGTCCGCAAGAGCCTTTCCCTGATAACTTCTCGTTCGCCAGGCGACAATATATCC
+TTTTCCATCTCTACACCATTTACCCTTGTTTTAAGTGATACATTGCGCCTTGATTCTACA
+TTAAATACAAATTTTTTGTTATGGTTGTGAGAATCTGCCATGCCATTCATGTAATCCACG
+ACTCTTGCTGCTGATGCCATTTTGTTTGCGGACGTGCTG
+>ds2020-267_589
+GCAGCACGTCCGCAAAGAGTCAGGTTTTGTATTTTACAATACTAACAAATGGACGCTCAA
+AAAACTCAAGGAATCAGCCAGCAATAATCAGCAATTGCTACTTTCCAACTTTGAGGAGTA
+TTTAAATGGCTTTAGTGCTAAGTCAAAGACATATTAGTGCGGTTTAAATTACTTGACCAA
+GTTCGCCATATGGAGATGAGATTGTTTGCGGACGTGCTG
+>ds2020-267_590
+CAGCACGTCCGCAAGTGTTTCGCCTTCTTTCCTAATATCGTTCGTGATAACTGTAATACA
+GTTAAGACTCACGACATTACCATAGGGTTTCCTCTTAAGATTTCTTTTCTTATCGACATT
+GGTAACATTGTCGGTAGATTAGTCTTCTTACAGAGGGATATCCCAAATGGTCTAGGAAGG
+TGTTGACCTCCTAAGGTTCTCGTAATTGCGGACGTGCTG
+>ds2020-267_591
+CAGCACGTCCGCAAATCGCCGAAGATTGAGGAACAAGAAGAGATCTATTAAGAGAAAGAT
+TTATCCGAGAAAAAATCTTAACAGTTACATCCAATCACAAACTACACGAAAGTTGCCCCT
+TTTTCATGGGGATTTACCCATCACAGAGATGCACAGAGGAACAGAGCGAACTTCATATAT
+CCCTTTTCCACTCAAACCAGGAAACTTGCGGACGTGCTG
+>ds2020-267_592
+CAGCACGTCCGCAATTGTCATATCGTCCGTCGATGCTTTCGAACTTCTTCGTCAGCTTGT
+TGAGGAAGCCGACGTCAAGAGTCCTAGAGCCGGTCGACGTATTCGTCGAAGCAATTGGAG
+CTTTCTTGCCATGTGTTTGTGCCTTCAGAAGAACGGAGGGGGAGCCCATGCGGACTCCCC
+CTCGTGTACTACGAACAATCGTGGTTTGCGGACGTGCTG
+>ds2020-267_593
+CAGCACGTACGCAAAGTACTCTCTGGTGGAACCATGAAGGGAATGTAGTGCTTGTCGACG
+CGTTTGAACAGTGTATCACAGTCGACCTTAATTCTGATCTGGTAAGGCTTACCATTGTTT
+ATGCAAAGTGCTCCATTCAGGAGAGACGGCTTCTTTGGGAAAAACGGAAATTACTGTCCT
+AAGACATACAAGATCCATACCTGGTTGCGGACGTGCTGC
+>ds2020-267_594
+CAGCACGTCCGCAACCGCCCGCCCGTAAACCTAAGGGTTCCTCCGCAAGGTTCGTCCACG
+GAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTGAAT
+ATTCCTGTACTACCCCTTGTTGGTCCCGAGGGACGGAGGAGGCTAGGTTAGCCGAAAGAT
+GGTTATCGGTTCAAGGCAGAATGAGTTGCGGACGTGCTG
+>ds2020-267_595
+CAGCACGTCCGCAACAATGCGTATCTGAGGGCGGCCGTAGGGAAGACCTGGTACGAGGGT
+GCGCTATCGCTGCACACAGGCGACGATGTCTTTATCAGGGCGAACACCCTCGCCGACTGT
+TCCGTCATTCTCAGTGATGCGGTTGCCTTCGGATGCCGTATGAACCCAACCAAACAGTCA
+ATCGGATTCTACAATCGACTAGCCTTGCGGACGTGCTGA
+>ds2020-267_596
+TATCTAAGGAGCAGCACGTCCGCAACTTTTACTCGGTCAGCACGTCCGCAATGTTCGCTG
+CCTCAGCACGTCGCAATATGTTACTCATCAGCACGTCCGCAAGAAGATGAGGGTTCATTT
+GCGGACGTGCAGTGAGTCACTATTGCGGACGTGCTGAGTGGTAGTCAATTGCGGACGTGC
+TGAGGAGGTTTAAGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_597
+CAGCACGTCCGCAACTATCCGCCGATTGAATTATTTGGTCCCACTCGTTATCAATGGGAT
+CAAGGATACTTCCAACCAGAAATATATCGCAGAATTGGTGCTGGGTTAGCTGAAAATCAA
+AGTTTATCTGAAGCTTGGTCTAAAATTCCTGAAAAACTGGCTTTTTATGATTACATCGGC
+AATAATCCGGCAAAGGGGGGAAGCTTTGCGGACGTGCTG
+>ds2020-267_598
+TATCTAAGGAGCAGCACGTCCGCAATCAAAGAGGGATGCCATTGGGACGTGCTGAGGGGT
+TTGGCGTTGCGGACGTGTGCCTCACCGGCATTGCGGACGTGCTGCTCCTTAGGCGCTTAG
+GCGACGCACTGACCGTCGTCTACTCCTTGACGCACTGACCGTTCCTATGCTGGTGGACGC
+ACTGACCGTAATGAGGGGGTTCGGCACGGTCAGTGCGTC
+>ds2020-267_599
+GACGCACTGACCGTTCGTTGCCACCTCCCCATGGACATGCGAAGTGGCAGCAACAAACTA
+CTCGCCTTTATTCTAGAAAAACACCATGGTATCAAGCCGCACTGTGCCTACCTATTTTAC
+AACAAAACTGGCACACGGTTAAAAGTGCAGGGACCTGCTATTGCGGACGTGCTGAGTGAC
+AAAATGTTGCGGACGTGCTGAGGGTAGGTAATTGCGGAC
+>ds2020-267_600
+TCCTCCGGAGTGCCTGAAGTTCAGACCTGTCCCCTTCCGATCTATCTACGGACCAGCACG
+TCCGCAAGTCATGACCCCTCAGCACGTCCCAAGGTTGCTCCCTCAGCCGTCCGCAATTAT
+GTCAGTTTGCGGACGTGCTGCTCCTTAGAGATAGGAAGAGCGTCGTGTAGGGAAAGAGTG
+TGCCTCTATGTGTAGATCTCGGAGGTCGCCGTATCATTA
+>ds2020-267_601
+GACGCACTGACCGTAGCCAATTCCCTGACGCACTGACCGTGTCGTATCGCTTGACGCACT
+GACCGTAGGCAATCTACTGACGCACTGCCGTATGAAAGCCGGTAAGGCGGTCAGTGCGTC
+GCCTTAAGCGTCAGCACGTCCGCAAGCATTCACGTCTCAGCACGTCGCAACCAACCATCG
+CCATTTGGGACTGAGGGGTGACATATTGCGGACGTGCTG
+>ds2020-267_602
+GGACGTTCGGGCTTATATTGGGGGATAGAAGCCGAACGTCCAGGGATAAAGTAAAGCCCG
+AACGTCCAGGGGGCGCCGCAAGCCCGAACGTCCTTACTTCCAGCACGTCCGCAATAGTCT
+CGGTGTGCATTGCGACGTGCTGACCCAGTTCTGTTGCGGACGTGCTGAGGGGCTGAGAAT
+TGCGGACGTGCTGAGGCTGACGAGCTTGCGGACGTGCTG
+>ds2020-267_603
+GACGCACTGACCGTCGGAGAACTGGTGACGCACTGACCGTCATTGCAGAGGTTACGGTCA
+GTGCGTCAGGGGACGCACTGACCGTAGGGATGACCTGATGCACTGACCGTTGTAATTCGC
+CTACGTACGGTCAGTGCACGTCCGCAATTGAACCTGCTCCACGTCCCACCTGGTCAACCT
+TGCGGACGTGCTGAGCGTACCAGCGTTGCGGACGTGCTG
+>ds2020-267_604
+GACGCACTGACCGTCGTACCCCGATTCCTAGCCTTTGGTAGTGTTGATAAACGTATTACC
+GCCAAACTATCACTAGGGCAAGGGCTTTACGCCAATAACTTTACAAGCTGGTCAAGATAC
+TATGGCACGACCAACGTAACAGGCGAAACCACCAAAAAACGGTCAGTGCGTCGCCTTAAG
+CGAGGACGTGCTGAGCTGGAGCTTCTTGCGGACGTGCTG
+>ds2020-267_605
+GACGCACTGACCGTGGCTTGGATTTTAAGACAAGGAAGAAGAGAACAGAGAGAAGGGAAT
+GTTTAAATAGGAGCTGGGATTTCGAAGGTGGAATGTAAAGTTTGGGTCTTTAGCTGTATT
+TCGCTTTGTGGGCAAGTAATGGTAATGGTAATGGAGGATACTTCGAGAGCAAGGTTATAG
+TTGTGGACGTGCTGGGCGAACTGGGTTGCGGACGTGCTG
+>ds2020-267_606
+GGACGTTCGGGCTTTGTGCTGCGGGTGATTTTACCTACGGGTGAGCAAATTGAAATTTGC
+GGGGGTGAGGCGAATACCACCAACAACCGCATGGAGCTGATGGGGAGGGGGCCAATCAAG
+CCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAACTCTTCGCTCCTCA
+GCACTTCCGCAATTAGTGAATGATGTTTGCGACGTGCTG
+>ds2020-267_607
+AGGAGCAGCACGTCCGCAAAGGATTCGTCATCAGCACGTCCGCAATCCCAAGCCCGTCTC
+TATGGCGGGTGCTGAGCATCGATTATTGCTGAGGTGCTGTTCCTTAGATCATCTAAAGCG
+CATCACGTCCGACATTATTGTATCCTCAGCACCGCCGAATAGCATCTTCCTCCTCGTCCC
+AATTAATGGGGATTGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_608
+CAGCACGTCCGCAACCAACGTACCCTCTGATTTCGATACAATCCAAACCCTAATCTAACC
+CTAATTCCAATTATTGCAATTTCTTTCTCTTTCGTAAACCCTACTTTCCTTGAGTTCTTC
+GACACAATTATTCATTTTTACTGGATTTGATTGATTCATGGGCCGTAACTCCCTCGCTCC
+CGGGTTCCGATTCCACCCGAGAACTTGCGGACGTGCTG
+>ds2020-267_609
+CAGCACGTCCGCAACTATCATGCTATGGTCACAGAGCTCTTGTAGCTCAACATACCTGCA
+GCTGATGCCATCCGCATTGATGCAAGGGATGTTGAAAGTGATGACGGCACAGGCGTTTCA
+GAAACCGGTGCCAGCGTCATGTTTCCACACAACTTGGCCAGTTCACTGACTGTCGCAACA
+GGCACCTTGCCCATCAAGGTGTCATTGCGGACGTGCTG
+>ds2020-267_610
+CAGCACGTCCGCAATGCCGTAGCCCTGTGGACCGGGATGCTGGGCACTATCGTTTACAAC
+CAGAATCGCCAGCAAAACCGCGTGCGAATTTTCGAAAGCGGTTTGCGCTTTGTACCGGAT
+AATCAGGCAAATTTAGGCATCCGTCAGGATCTCCTGCTGGCTGGTGCTATCAGTGGCAAC
+CGTTATGAAGAGAGTGCCCGGAGATTGCGGACGTGCTG
+>ds2020-267_611
+CAGCACGTCCGCAATCGCTCTTAGATCCTCGTACCGCCAGTCCCCTTCTATTAGTGTCAG
+CAGAAGCTCAGTGGACCTCCGTAATGCCTCGTCCCAAAGATCTCATGCTTCCTATTTTGT
+TTCCCCCAATTCCTTTGGTTACCCATCTTTTTCACCCCTGAACTCAAGATACCTGTCTGT
+TGCACACATTCCAAGCCCTAACAATTGCGGACGTGCTG
+>ds2020-267_612
+CAGCACGTCCGCAAAGGGCCCACCCTCAGCACGTCCGCAACGCACTATCCCTCAGCACGT
+CCCCAAGTATCTAAGGAGCAGCACGTCCGCAACGGTGACCCCTTAACCATTGGACGTGCT
+GAGGGTTCGATACTTGGGACGTGCTGAGCGGACAGTTCTTGCGGACGTGCTGACAGATTG
+CCGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_613
+GACGCACTGACCGTACCACGCCCCTGACGCACTGACCGTGACGTAAGCGCTGACGCACTG
+ACCGTAACACTACCTGTGACGCACTGACCGTCCCTATACGGCTGACGCACTGACGTATTA
+GATCTGGTCCAACGGTCAGTGCGTCGCCTTAAGCGATCCGCAAGATTATAGAGGTTGGAT
+TGCGGACGTGCTGCCCGGACTATCTTGCGGACGTGCTG
+>ds2020-267_614
+GGACGTTCGGGCTTTGGTGTCATGGTTTGGGGTGGGGGTGTGTTATCTCAACTTGGTTGG
+CAAAGTACCCAGTTGCTTACCATTACCACAATGGCTCTACCCACCGTGTGCCGGAAGCCC
+GAACGTCCTTACTTCCATATCTAAGGAGCAGCACGTCCGCAATGGTCAGACCCTGATATT
+TGCGGACGTTGCGGGCTAGTTGCTTTGCGGACGTGCTG
+>ds2020-267_615
+CAGCACGTCCGCAAGTTCATCGGGATGTGTATAGTGATAGGATCACTCGATTCATGCGTC
+TTGGTTGGCAGGGGCTGGTTGGAAACACAGCAACAACCACACGCATCGAGAATGCAGAAT
+TGACCACACTTGGTGGTAATCATGTCGTTGACGTTCCCGTTCCTTTTTTATGAACGGAAG
+CTACGACTACAAACCCAGTTGGAATTGCGGACGTGCTG
+>ds2020-267_616
+CAGCACGTCCGCAAGTCGTCCGCTATCAGCACGTCCGCAATGGTTTTGTCCTCAGCACGT
+CCCAATACCGGATCCCTTGCGGACGTGCTGCTCACGCTTAAGGCGACGCACTGACCGTAC
+TTGCACGCCTGACGCACTGACCGTGAGCACATGAGTGACGCACTGACCGTCCAGACTACT
+TTAAACGGTCAGAGGAGTGGAACGACGGTCAGTGCGTC
+>ds2020-267_617
+GACGCACTGACCGTGTCCTATTCGTTGACGCACTGACCGTCACTCTGTTTCTGACGCACT
+GACCGTTACTAGCGCCCTGACGCCTGACCGTATCTGCGAGAATACGGTCAGTGCGTCGCC
+TTAAGCGTCAGCACGTCCGCAAGAGGCACCGGGCACACGTCCGCAATAGTCACCCGGTGA
+TTGCGTCGTGCTAAGGCTATATAATTGCGGACGTGCTG
+>ds2020-267_618
+GACGCACTGACCGTTTTAGCTACGGTCAGTGCGTCAGCCATATAAACACGGTCAGTGCGT
+CAGGGGCACGGCGACGGTCAGTGCGTCGCCTTAAGCGACTAAGGAGCAGCACGTCCGCAA
+TCCGTCGGCACTTGGGACGTGCTGAGGGAAACATCATTGCGGACTGACCGGTAACCTCTT
+GCGGACGTGCTGAGGGATAAACAGTTGCGGACGTGCTG
+>ds2020-267_619
+CAGCACGTCCGCAAATCCTAATCCTAACCCTAGAGAGCACAACAGCAGCAGTAATAGCCA
+TGGAGTGCGAGAGAAGAGAGACATTGATGGATGGATAGGATGAGTTTTTCCTGGAGCAAC
+TCCAATTGATCAGAAATTTGGGTTGCAGGGAGGGAAAACCCGAACCCTAAATTTTGGGGA
+CGTGGAAACGGAGGAGTGTAACATTGCGGACGTGCTG
+>ds2020-267_620
+GCAGCACGTCCGCAACTTCGGCCCCCTCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTAT
+GGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACTTTAGATAATACCTAGAGATAGTGGA
+CGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGG
+TGCGAGCGTTAATTGGGATACCATTGCGGACGTGCTG
+>ds2020-267_621
+CAGCACGTCCGCAACCATCTAGTTTTCCGAAACCGAACTGAATAGAATTGTGACTTTCCA
+AAAATGCTTGCTGAAAATCAAAGAAAGAAGGTCCATTTTCCCACGTAGTTCGTCGGTCAA
+ACCAACGATTCTCTTCTCAAAGTAATAGAGAGATCTTTTTCTAGTTAGACTTCTATCAAT
+GCAATGAAAGAACCATCCCTTATTTGCGGACGTGCTG
+>ds2020-267_622
+CAGCACGTCCGCAAAATCCATTGGGCAGCACGTCCGCAAAAAGCTCTCCTTTCACAAGGT
+GGACCTCCGGGACAAACCAGCACTGGATAAACTCTTTTCTTCAATAACATTTGATGCTGT
+CATACACTTTGCTGGACTCAAAGCAGTTGGTGAAAGTGCAGAAACCATTGCTGTATTATA
+ACAACAATTTAATCAGGACCGAATTGCGGACGTGCTG
+>ds2020-267_623
+CAGCACGTCCGCAACAATAGACCTCTGTGCTGCCATCTTCAAAGTTCGTATATCCACATT
+TCTAGGCTATAATCAAAATCTGATAAAAAGACGCCTCTAAAATCATCCCATGCTAGACAA
+GTGTGTTTCAATCACACAATCTTCCAACAAAAGATAGCCATCTTCAAAGTGCATATATGC
+ACATATATTGCATATCACAACCTATGTACACGTGCAA
+>ds2020-267_624
+CAGCACGTCCGCAAGCTAAAAGGTTTTGGTAGCCTCCTATCAACCAAACCCAATCGAAAT
+CAGTTAGGAAAGCCTCTCTAGCATGGTCCAAAGGGGCATTTGATGAAGTTGAATATTGAG
+GCACATTCCATTCGTTCCAAAATTTAGGGGTGTTTCGACATTTGCCCTTTTTTTTTATTT
+ATATAATTCCCACGGCTGCACGGTTGCGGCCGTGCTG
+>ds2020-267_625
+GCAGTTGACTCCTACATCCCTGCTCCACTGGGCTCGGGGCGATATAGCACAGTTGGTAGA
+GCTCCGCTCTTGCAATTGGGTCGTTGCGATTACGGGTTGGATGTCTAATTGTCCAGGCGG
+TAATGATAGTATCTTGTACCTGAACCGGTGGCTCACTTTTTCTAAGTAATGGGAGGGGGG
+CGCGTTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_626
+GACGCACTGACCGTCTTTCAGGTGATTAGATACGGTCAGTGCGTCAGTTAGCCATTAACG
+GTCAGTGCGTCAGGCCGCTTGGCACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAG
+CACGTCCGCAATCCATGGCCCCTTGCGACGTGCTGAGGACTAAATACTTGCGGACGTGCT
+GAGCAACAGCCCTTTGCGGACGGCTGCGCCTTAGATA
+>ds2020-267_627
+CAGCACGTCCGCAACTCCCTCACACTCAGCACGTCCGCAAGCATCTCCCCTCAGCACGTC
+CGCAACTCCCTCACACTCAGCACGTCCGCAACCAAGTAGAAGTGGACGTGGGGGAGCCAG
+ATTGCGGACGTGCTGAGCTGACTGGCCTTGCGGACGTGCTGATCCTTAGATAGATCGGAC
+GAGCGCACGCCTGAACGTGAAGCACTCCGGAGAAGAC
+>ds2020-267_628
+GGACGTTCGGGCTTGGATTACTCTGTGCGATCGGGAATCAGCAGTCGCTTCGCCATCTCT
+CGCAAGCTATCCGGGACAGCGATCTCGGAAAGCCCGAACGTCCTTTCTAAGGAGCAGCCG
+TCCGCAACAGGCATGGGGTAGCACGTCCGCAATCAAGTCTCCCTCAGCACGTCCCAACAT
+AACCCGGGTCTTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_629
+CAGCACGTCCACAAACCAGACTTTGCGGACGTGCTGAGGGCGGTTACCTTGCGGACTGCT
+GCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGTTTTGTTGATTGGTTTTAATGCC
+TTGGCGTATGTGTTGCCGCCCCTGCGTTCCAATACAGACAAAAAAGCGCTGCAAGAGGGC
+TTGCAAGATGGAGATATCCACCAACGGTCAGTGCGTC
+>ds2020-267_630
+GACGCACTGACCGTGTGAATACAGCTGACGCACTGACCGTGATTGTCTTGGGACGCACTG
+CCGTTGTGTGTACCCTGACGCCTGACCGTCGTCCAGTGGTATGATAACGGTCAGTGCGTA
+TCTAAGAGCAGCACGTCCGCAAGGGGCATCGAATTGCGGACGGCTGAGGGGAAGATGCTT
+GCGGACGTGTGAGCAGTTAGAGATTGCGGACGTGCTG
+>ds2020-267_631
+GACGCACTGACCGTAACCAGTACACTCCTTATTAACAGATGACCAATAAAAAAGGTTGGT
+AACTTACCAACCTTTTTTGGGTTTCTTTTTGACCTTTAAATACAAAAAATTTGATTACAG
+AAAATCAGTTTTTATAACTTTCATCTGCGGTCCGACGGTCAGTGCGTCGCCTTAAGCGTG
+CGGACGTGCTGAGGCGAGGGCCCTTGCGGACGTGCTG
+>ds2020-267_632
+CAGCACGTCCGCAACCATTGACCCGTTGCGACGTGCTGAGGGCTGGCCTATTGCGGACGT
+GCTGACCGAGACCAAGTTGCGGACGTAAGGACGTTCGGGCTTAGTGTGTCATCTGAGTTT
+GTGTCGGTTTGCTTACTTTCACTTAGGCATCCCTGGACGTTCGGCTTATGTGGGGGATGA
+AGCCCGAACGCAGGTCGCGAAGCAAGCCCGAACGTCC
+>ds2020-267_633
+GGACGTTCGGGCTTGAGTGGTAAGGTCTGCGAGGAGTGAGGCTTCAGCTGGATAAAGCTA
+ATTTCGAGCGGCTGAGCGGGGAGAAAAAGCCCGAACGTCCAGGCCTGAAATGAAGCCCGA
+ACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAACGGATTTTTCCTCAGCACG
+TCCGCAAGGTCACCGGTATTTCTTTGCGGACGTGCTG
+>ds2020-267_634
+CTTACAATAAGATTAACTCCAGTCTCTCAGCTGGGCAATAGAAGGAATTGAGTCTCTAAT
+CCCCACCTAGGACAGTAACCATAGAACTTCACTTCTTAGCATTAGCAAGGTAGCAAAGCA
+GCCCGGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAGCTCCATACCGTATATGT
+TGCGGACGTGCGAGTGTACCGGTGTTGCGACGTGCTG
+>ds2020-267_635
+GGACGTTCGGGCTTTGTAGTTTGTTTTGTAGAAAGGGGCTTCTTAAAATATCCCATAAAT
+AAGTAGGGGCTTCAAAGCTTGTTGTAGTTTAGGGGTGCGCAGGTTTGGAACCCCATACAG
+GGGGCTAGCGCGCAATGGCTTTCTCTGAAAGGGGCTCGCTTCTTCAAGCTCCGCTCCGCT
+TGCTGCTTTTCATTTTGTTAGGAGTAGGTGCTTGCTG
+>ds2020-267_636
+CAGCACGTCCGCAACCATCTCATCAAAAACTTTTCGAGCTTTCTTAATCTCACCAACAAC
+ACCAAACCCATGAACCAAAGTCGTGTAAGTAACAACATCAATCTCACACTTCCTCTTCTT
+CATTTGCAAAAAGAACTCCCAAGCTTCCTTAATCTGGCCAGCTCTAAAATACCCTTTAAG
+CATTATGTTAAACGTGGTTCGGTTTGCGGACGTGCTG
+>ds2020-267_637
+CAGCACGTCCGCAAGTTGGCCTCGGTGGCGCTTCAAGGAGTGACTAATGACTCACGCTCA
+CGAAGACATCAGGGTTGGCACACTGTGCCTTCCCTTCTTTGGTAACGGCTGGCTAATGCC
+ATGGGGTGAAGTGGTCAGCAATACATTAAAGGCGCAGCGGCTCGCTGAGGAATATCGGGA
+AAGTCAGGAGGACTTGTATAGCCTTGCGGACGTGCTG
+>ds2020-267_638
+GTCCGCAACTCAGCGGCCTCAGCACGTCCGCAAATTAAAACGCCCAGCACGTCCGCAATA
+TATCCGCCGTCAGCACGTCCGCAAGGCCAACCTGATACAGTTTGCGGACGTGCTTAAGGC
+GACGCACTGACCGTCCTCCAACCCCTACAGCACGGTCAGTGCGTCAGAGTAAACCCCACG
+GTCAGTGCGTCAGGGAAGGGCACACGGTCAGTGCGTC
+>ds2020-267_639
+AGGAGGCTACTCAGTAGACAGTCCCACCCTCACACGATTCTTTACCTTTCACTTCATCTT
+GCCCTTCATTATTGCAGCCCTAGCAGCACTCCACCTCCTATTCTTGCACGAAACGGGATC
+AAACAACCCCCTAGGAATCACCTCCCATTCCGATAAAATCACCTTCCACCCTTACTACAC
+AATCAAAGACGCCCTCGGCTTACTTCTCTTCCTTCT
+>ds2020-267_640
+CAGCACGTCCGCAAACATTTTCTTCTTCTTTTTCTTTTTCTTCTTCCTTCTCTCCTGCCT
+TGCGACACTCGTCTTCCTGCCCTAACATGCATTTGGGACAATCTACTATCGTTTGATGAG
+GGAGGGAGACTAGAGGAGCTTCTTCTTCCATATTAATTCCTACTATGACGGAGGGCTTGC
+GGACGTGCTGAGGGGGAAGGTATTGCGGACGTGCTG
+>ds2020-267_641
+CAGCACGTCCGCAATTCCCCACTGCTTTCTCTCCGGTTATAGTAAAATACCTGCGTTCTA
+TTGTTTCTTTATATTCAGATGTCATTCTACCTCTCAATCCCTGAAAGTCATCCATCATGT
+CCTTGAGTTTCTTCCCCAAACCACTAACCACTGAGGTCCTGGTTCGATCTGCGGAGGAGC
+CAGGGCCACAACCAGGAAGGCTTTGCGGACGTGCTG
+>ds2020-267_642
+CTTTTACAGAACTCCCCTCTTGTATCATCAAACCGTCACCCATTAATACAACACCAACAT
+TATTTGATTCCAAATTCAGAGCAATGCCTATCGTACCCTCTTCAAATTCTACTAATACAA
+CCTACCACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGATAATCGACTTGATATTGC
+GGACGTGCTGATGGCATACGCTTTGCGGACGTGCTG
+>ds2020-267_643
+CAGCACGTCCGCAATATGGTACCCCTGATCAGAATGGTACTCGAATTCATTTACGATCCC
+GAGTTTCCAGACACATCGCACTTCCGCTCGGGTCGAGGCCGCCACTCGGCCCTAAGACGG
+ATCAAAGAAGAGTGGGGAACCTCTCGCTGGTTTTTGGAATTCGACATCCGGAAGTGTTTT
+CACACCATCAACCGATCATCGTTGAGGACGTGCTGC
+>ds2020-267_644
+CAGCACGTCCGCAACTCTGTCTTTAATGGCTGAAGTTGGGTGGCCAGTGAATGTGGCCAC
+AGATGAGAAGGTTGACCCCATTGCTGAGCGCATGGGATTCAAGGAGTGGGTCCTTTGTGG
+CTCAGACTTCAAACAAGGGATTCGAAATCTGAAAATGATGGTTGATGAGTACCTTGAGGA
+CTTGCGCAAAATGCCTTTGGAATTGAGGACGTGCTG
+>ds2020-267_645
+TCTAAGGAGCAGCACGTCCGCAACAAACCGGCCATTATTGGGACTGGACCCAATACGCGT
+TGCGGAAGGCCATTTCATTTGCGGACGTGCTGAGCGGTGTCAGGTTGCGGACGTGCTGCT
+CCTTAGATAGCACGTCCGCAACGAGAATTGCCTCACACGTCCCAACCTCGAACTATTTGC
+GGACGTGCTGACGATCGTTTCCTTGCGGACGTGCTG
+>ds2020-267_646
+CAGCACGTCCGCAACCACGACCGTCTTTCCTTGGCGAATGTCTTCAATGGCCTCTGGGAT
+GGAAGCAAATCCTTTTGTGGGGCAATCCAAATCAAATTCATCATTATCAACTGGAAAACC
+ACTAGTTGTTGGAACAGTATCTGCTGAAAGTGTTCCAAATGCTACTGCATCCGGCTGTAT
+CTCAATCCCAACTGACTAAGCATTGCGGACGTGCTG
+>ds2020-267_647
+GACGCACAGACCGTATACCCAGAATTGGACGGTCAGTGCGTCACACGGGATTATACGGTC
+AGTGCGTCAGGCCAACCAAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCAC
+GTCCGCAAAAGCTCGACGGTCAGCACGTCGCAACACCTTAGCTCTTGCGGAACAGGACCA
+TAATTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_648
+TATCTAAGGAGCAGCACGTCCGCAAATTCATGGCATTCGACTTGGACGTGCTGAGGGAGC
+GCGAATTGCGGACGTGCTGAGGGACTGATTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+AGAGCGTCGTGTAGGGAAAGAGTGTGCCTCTATGTGTAGATCTCGGTGGTCGCCGTATCA
+TTAAAAAAGTTTAATTGCGGACGGCGCTCCTTAGGT
+>ds2020-267_649
+CTAAGGAGCAGCACGTCCGCAAATGTTCTCGGGTAGCACGTCCGCAAGAGGTCCTGCCTC
+AGCACGTCCGCAACTCATTTAATAAACCTATTAAAACTATACAGGCTGCTAATATTATGG
+GAGCTATTCTGTTAGAAATAGATCCACCTATTGAAAAAACAAATGAAAAGACTTTAAATT
+TTACTTTAGAAGGGGGTCGGGGTTGCGGACGTGCTG
+>ds2020-267_650
+GGACGTTCGGGCTTAGGGGGTGCCCCTGATTTTTCAGGGTAAGAAGGGGTAGAGAAAATG
+CCTCGAGCCAATGTTCGAGTACCAGGCGCCACGGCGCTGAAGTAACCCATGCCATTCCCA
+CCTTAAAGCCCGAACGTCCTTAATCTAAGGAGCAGCACGTCCGCAATGGCCTAGTTATTT
+GCGGACGTGTGAGGGTTGACGACTTGCGACGTGCTG
+>ds2020-267_651
+CCCTGGACGTTCGGGCTTGATTTTGATGGTGATGAGGAGGAAGAGGTGGAGGAGAATATG
+ACGTCGTTTAAAGGAAGGGAAATGGGGTCGAATTTTTTAGAGGATATTGAATTTTCTGAG
+TTGCTGGGAGGGTTTGGTTCCATTGATGGGTATTTTTTGGAGGATATGTTGGTTGACTTG
+TGACAGTGGTGATGATGATGCTTTGCGGACGTGCTG
+>ds2020-267_652
+GGACGTTCGGGCTTTGGATCAGGGGTAGCGTGAAGCCCGAAGTCCAGGCAAATGGTTAAG
+CCCGAACGTCCAGGAGCAACGCTAAGCCCGAACGTCCTTACTTCCAGTCTAAGGAGCAGC
+ACGTCCGCAATTCCTCTAGTTTGCGACGTGCTGAGCCAGTTTCCCTTGCGGACGTGCTGA
+CGGAGTCCTCTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_653
+CTTCCGATCTATATAAGGAGCAGCACGTCCGCAAAGACATACCCCTCAGCACGTCCGCAA
+TTAGCCTCCCCTCAGCACGTCCGCAAAGATGTACCTGTCAGCACGTCGCAACTCAGCTCC
+ATTCGATTGCGGACGTGCTGCTCCTTAGATACGTCCGCAACCCCAACCCAATTCATTTGC
+GGACGTGCTGAGTGGGATGGCTTTGCGGACGTGCTG
+>ds2020-267_654
+GGACGTTCGGGCTTGGTTTTGGTATTTGAGCTAGTGACGCAACTGGGCGGCGAGGCCGGG
+CCGAGAGTACACGACAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAACTTTACACC
+GATAGGATAGAGGGTCTGTATTGCGGACGTGCTGAGGCTAGAAAGATTGCGGACGTGCTG
+AGCGGCCTATGATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_655
+TATCTAAGGAGCAGCACGTCCGCAATAAGTGTTCCCTCAGCACGTCCGCAACGTACATTC
+TCTCAGCACGTCGCAACTAGGAGGATCTCCTTGCGGACGTGCTGCTCCTTAGATTATCTA
+AGGAGCAGCACGTCCGCAACTCCTATTCCGTCAGCACGTCCGCCACTTCATAGGGCTCCA
+CGTCCCAATTAGATAGCGTATTTTGCGGACGTGCTG
+>ds2020-267_656
+GGACGTTCGGGCTTGTTCATCCCTTTTATAAAGCCCGAAGTCCAAGCCCGCCAAAAAGCC
+CGAACGTCCTTACTTCCAGACACGTCCGCAAATCGCTGTTGTTGGACGTGCTGAGGCAGC
+GCTGATTGCGGACGTGCTGAGGGGAACAAGGTTGCGGACGTGCTGCTCGTTAGATAGATC
+GGAAGAGCGCCCGTCGGAACTCCTGGCAGTCGGGGG
+>ds2020-267_657
+GACGCACTGACCGTGACACTTCCCCTGACGCACTGACCGTGCCCCTACCACCGACGCCTG
+ACCGTGTTATCCATGTTTATACGGTCAGTGCGTCGCCTTAAGCGACACGTCCGCAACGGT
+ACAGGACTTATGTTGCGACGTGCTGAAGCCCTTTAATTTGCGGACGTGCTGAGTGGGGAC
+TTATTGCGGACGTGCTGAGGCCAGCGATATTGCGGA
+>ds2020-267_658
+TCACAATTGCATGCAGTACTAGGGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGC
+GAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGCGTAGG
+ATAAGCCCGAACGTCCTTACTTCCAGTGTCCGCAATTAGTTTCCCCTCGCACTCCCAAAA
+ATTCCGAAGTGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_659
+CAGGCGGAGTGCCGCCTACGAGGGTCTCCGGAGTGAATGGAGTGCGGACGTGTGCTCTTC
+CGATCTATCTAAGGGGCAGCACGTCCGCAACAAAGGGTCACTTGGGACGTGCTGAGAGCG
+GGGCGTTTGCGGACGTGCTGAGCTAATGTGAATTGCGGACGTGCTGCTCCTTAGATAGAT
+CGGAAGAGCGGCGTTCTGAACTTTAGTCACTGTGGA
+>ds2020-267_660
+GGACGTTCGGGCTTACCCGTCCACCCCCTCTCGAGTTTCCGGCTGTTTCCTAGATTGAAG
+TAGCCTTTCGTCACCCTACCAAACGAAAGAAGTCACTATCAAACAGCCCCCCCAACTAGT
+CGTATGGGGTGCTTGTGGTAAGCTGCCTTGGTTGTGGACGTGCTGGCGAGCAGGAATTGC
+GGACGTGTTGAGGAGCGTGGGTTTGCGGACGTGCTG
+>ds2020-267_661
+CAGCACGTCCGCAATATGCCGTGCATTCTCCCATTTCGTATACAATTTCATTATTGTTAT
+TTAAAATGATAGTAGAATCACTGCGATTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAG
+GCGACGCACTGACCGTGGGGTCTCTCCTGACGCACTGACTGTATTGTTGGCCCTGACGCA
+GTGACCTTTAAATGCCTCATGTACGGTCAGTGCGTC
+>ds2020-267_662
+GGACGTTCGGGCTTCCATTGGACGCTGAAAGCCGAACGTCCAGGGCCCAGGCCAAGCCCG
+AACGTCCAGGAGTGGTTGCAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAATACTT
+TGGATATTGGGACGTGCTGGAGGGGTCACGTTGCGGACGTGCTGAGTGTGAACTACTTGC
+GGACGTGCTGAGTGGTACGGATTTGCGGACGTGCTG
+>ds2020-267_663
+GGACGTTCGGGCTTTACCCCACCGATATGTTCTCCCCCCATTCCCCATGACCACCACGCA
+AGATCCAACCTTCAAACCCATACCACAACCACCCTCCACCCCAGAGGCAAACACAAGCCC
+GAACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCGCAAGGTTCAGCCTCTCACACG
+TCCGAAATTCAACTCCCTGGGTTTGCGGACGTGCTG
+>ds2020-267_664
+GACGCACTGACCGTGGGGTGGACCCTGACGCACTGACCGTGTGATGTACCTTGACGCGCT
+GACCGTCTGATGTTTCCTGACGCACTGATAGTCCTTAGCACGGTCAGTGCGTCGCCTTAA
+GCGTGCACGTCCGCAATCCGAAACCCCTCTGCATTGGGACGTGCTGAGAGGGTAGTGGTT
+GCGACGTGCTGCCCGACACTGTTTGCGGACGTGCTG
+>ds2020-267_665
+GGACGTTCGGGCTTTTATCTCGGGCTGGAGGAGCTCCTAATGTGTCTGATGCAGATACCA
+TCAATGGTCAACCTGGTGATCTTTACAATTGCTCGGGCCAAGACACAATCATAGTTCCTA
+TAGACTTCGGTGAGACCACCCTTCTTGTCTCCCTGCCGACAGCAGTGCCTCTGTGACCTC
+ACCTTTCTTCACTAGTTATATGTTGCGGACGTGCTG
+>ds2020-267_666
+GGACGTTCGGGCTTCATGGTTGTGGTATTGATCTTACGGGGGGAACGAAATCAAAGAATA
+TATAGACTTGTAGAGACCCTCTATGTAGTTGTCTATCTAGGGCGATCGGTCTACATCTTT
+CCCCATAGCCCCGGGGCTGTGTTTCGATCTCCTACGTGCGAAATCTGAGGGTTCTTATTG
+CGGACGTGCGAGTTGATGCGGATTGCGGACGTGCTG
+>ds2020-267_667
+GTCCGCAATAACAGCAAGGTCAGCACGTCCGCAACTGCACACCCTCAGCACGTCCGCAAC
+AATCACTGGGTGAATCTTGCGGACGCGCTTAAGGCGGCGCACTGACCGGCCAGGTCCCCG
+TGACGCACTGACCGTGTCCATAGCCTTGACCCACTGACCTTATAGAATCACAGGACGCCT
+GCCTTTTCTTTGTCGGTACCGTACGGTCAGTGCGTC
+>ds2020-267_668
+CAGCACGTCCGCAAGCGAGTCCCCCCCCTAGTTCATATCTTTGTTTCGTGTGTTCCCGGG
+AGTAATTCGATCTCTTCAATCTCGGGATACCACCTAAATAACTGCGGCCAGAGAGTAAAA
+TAGGTCGGGAAGAAAGAGTCTGAGGTTGGGTCGGACGACATACATCTTGGAAGGAAGGTT
+CATTCTTTAAATCAGCGATGGTTGCGGACGTGCTG
+>ds2020-267_669
+CTTGGTGCAGAAGATCTTTTTCCACTCTTTTCTTCATCTAGTAGGTCTCTGATAGGGAAA
+TAAGCTGCTTTCTTGCAAAGCTCAAGTAGATCTGAACCTGTGTAACCCTCACTCAAGCCA
+GCTGATACGGTCAGTGCGTCGCCTTAAGCGTGTCCGCAACGTTTAACTGGTAAGATTTGC
+GGACGTGCGAGTGGCTTTCAGTTGCGGACGTGCTG
+>ds2020-267_670
+CAGCACGTCCGCAAGGGAGACATTCTCAGCACGTCCGCAAACTCTACTGGCTGGTTATTG
+CGGACACGCTTAGGCGACGCACTGACCGTAATTGCCACCTTATCTTTAGGGTTTTGTTGC
+CCTATCTGGGCTTTCTTTGCCATGCCTTGCCACCTTGCCTTTGCTTGGCCTTTATTTGCC
+TTACCTTGCCTTACCCTTTCTTTTTAGGGTTTGGT
+>ds2020-267_671
+TATCTAAGGAGCAGCACGTCCGCAAGTGCTTATCGGTGATATGTGCGACGTGCTGAAGTG
+GCTTCTCTTGCGGACGTGTGACACTACTGGTGTTGCGGACGTGCTGCTCCTTACGCTTAA
+GGCGACGCACTGACCGTCCGACTCACCCTACGGTCAGTGCGTCAGGGAGACATGAACGGT
+CAGTGCGTCAGGCGAGGACACACGGTCAGTGCGTC
+>ds2020-267_672
+GGACGTTCGGGCTTCAGAATGAGGATGGTTAAGCCCGAAGTCCCCAGGTGGGGCAAGCCC
+GAACGTCCTTACTTCCAGAAGCACGTCCGCAATAACACCACAGTCAGCACGTCCCAACCG
+CCCTCTCCTTGCGGAAGTAACATGGGATACATTGCGACGTGCTGACCGCGCCTCTATTGC
+GGACGTGCTGATGGGTAACCGTTGCGGACGTGCTG
+>ds2020-267_673
+CAGCACGTCCGCAAACCTGAACTGTTGCGACGTGCTGACCCCTTAACTCTTGCGGACGTG
+TGAGACCATACGCCTTGCGGACGTGCTGCTCCTTAGATTGAGCAGCACGTCCGCAAGGCG
+GCTTTCCTCAGCACGTCCGCAAAACGCGTCTCTCACACGTCCGCAATGGCCCATAGGTTG
+CGGACGTGTGAGAGACGCGTTTTGCGGACGTGCTG
+>ds2020-267_674
+GACGCACTGACCGTCTAAATTCCGTTGCTGCGATTCATGCAGGGCGCAAAGCGGAAAACC
+AAGACACCTTGACAATGCAAACGCTGGTGCCAACAGGGGATATAACACGGTCAGTGCGTC
+AGTAGTGGGATCACGGTCAGTGCGTCGCCTAAGCGTGTCCGCAACTCACAGCCTGTTGCG
+GACGTACTGAGTAACGTGACATTGCGGACGTGCTG
+>ds2020-267_675
+TTCTGGGCGTGTCTATGTAAGGAGCCGCCCTGCGTCAAGGGGATGGAGATTGGGACGTGC
+TGAGGTGCGGTGTATTGCGGACGTGCTGAGGGTTCGCGGGTTGCGGACGTGCTGAGTGAT
+TACGTTTTGCGGACGTGCTGCTCCTTAGATACACGTCCGCAAACAGTTAGGAGTATGTTG
+GGACGTGCTGCCCACCTAGGCTTGCGGACGTGCTG
+>ds2020-267_676
+ATCTAAGGAGCAGCACGTCCGCAATCTTCCCCCGCTCAGCACGTCCGCAATGCATTATAG
+CTCAGCACGTCCGCAATGGTTGCGGAAGTGCTGGAGAATCCAGGTTTTGCGGACGTGTAA
+GGACGTTCGGGCTTGAAGTACCCGCTGGACGTTCGGGCTTTCAACACCGCCTAGGACAAG
+CCGAACACCAGGGGATTGATAAAGCCCGAACGTCC
+>ds2020-267_677
+TATCTAAGAGCAGCACGTCCGCAAGCTAATCACCCTAGCACGTCCGCAAACCCCAGGCCC
+TCACACGTCCGCAATATAAAGCCGATAATGTTGCGGACGTGCTGCTCCTTAGATATCTAA
+GGAGCAGCACGTCCGCAAGATTGGTCCGCTCAGCACGTCCCAACTACATCGACATGTTCT
+TGCGGACGGAGTGGGTAAACTTTGCGGACGTGCTG
+>ds2020-267_678
+GACGCACTGACCGTTCCCCGCCGCCCCCTCTTTGACTCAGACGTTGCCGAGCGTCCGGCT
+ATTACCAATACAGAGGCTTTGTGGATAGACGCTTTTGATGATTTTCAAACGTCTGATAAC
+TTAGATGCAAGCTTTATCCCTTTTGGCGAGTATGATGTTGCAAGCTTTGGCGGATTTTCA
+CCCTTTGATAACATGGGCAATACGGTCAGTGCGTC
+>ds2020-267_679
+CAGCACGTCCGCAAAGACATACTCGTCCCTATTTTTAAGTCCTGTAACGCGGGAGGTTAT
+GCTCCGCTTTGTTTATAATTATAAAGATTTTGCACTTCCTAAAAATGCGGTGTTAAGCAC
+ATTTATACGCAGGTTAAACTATCCGTCTGATTAAATTTCATCATTCGGAGAAAACGTTCC
+TAATGTGCAAATGCCAGAAATTTGCGGACGTGCTG
+>ds2020-267_680
+GGACGTTCGGGCTTTAGAGGACCGGGGCGTTCGGCTTACAATACAGCCTTGAAGCCCGAA
+CGTCCACCAGAAAAGTTAAGCCCGAACGTCCAAAGGTGGACGGAAGCCCGAACGTCCTTA
+CTTCCAGGCACGTCCGCAATGGAGTCACAGGTAACACGTTGGGACGTGCTGAGGTGACCT
+CTATTGCGACGTGCTGACGGTTTGCGGACGTGCTG
+>ds2020-267_681
+GGACGTTCGGGCTTGTGATCTGCAGTATGGTTTGGATCTGTGTCCCCACACAAATCTCAT
+GTTCAGTTCCCAATGTTGGAGGGGGGGCTGGTGGGAAGAGATTGGATCATGGGGAGGTAA
+AATAAAAAGCCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAAGAGTTGGTCGATT
+GCGACGTGTGAGTATCGATGGCTTGCGGACGTGCT
+>ds2020-267_682
+TCCGCAAACTCATCTCCCTCAGCACGTCCGCAATACCAGCCCCCTCAGCACGTCCGCAAT
+AATGGGCCCTCACACGTCCGCAATTGAACCCTTCGTAATTTGCGGACGACGCTTAAGGCG
+ACGCACTGACCGTAGTGCTGACCGTGACGCACTGACCGTGTTGTTCCCCTTGACGCACTG
+ACCGTGTAGATGGGGTAACAAACGGTCTGTGCGTC
+>ds2020-267_683
+GCAATTGCATGTCCCTCGCACGTCCGCAAGCTCTTACCCATCAGCACGTCGCAAGAGCCA
+ACGCCTCAGCATGTCGCAAATTGGAGGTCGTTGCGGACGTGCTGCTCCTCGCTTAAGGCG
+ACGCACTGACCGTGACGGAACCGGTCATATAAGGTCAGGCGTCAGGCGAATAAAAACGGT
+CAGTGCGTCAGCCATACTCCAACGGTCAGTGCGTC
+>ds2020-267_684
+CAGCACGTCCGCAATTCCAATGCCTTCTGACCTGCTCCATTTAATATTTAATAATGAGAA
+TAAGCAGACTAACTTAGACCAGGGAGACCGCATTGCGGACGTGCTGCTACGCTTAAGGCG
+ACGCACTGACCGTATAATTTAGCCTGACGCACTGACCGTACAATTGAGTCTGACGCCTGA
+CCGTTCCCAACCTGATGAAGCACGGTCAGTGCGTC
+>ds2020-267_685
+CAGCACGTCCGCAAAGGTGCCGATATCCTCACATGAGTCGCCGTATTGATCTTCTGATTT
+ACATTTTGGGCATGTACCCTTAATGAAACGGTCAGACAAGAACATCCCTTTTTTGGGTCA
+AATAATTGAGTTACAGGACGAACTGCAATATTTCCAGCTTCACGGTTTTTAATATAGATA
+TCTGTTGAACGCGCTTTGATTTGCGGACGTGCTG
+>ds2020-267_686
+CAGCACGTCCGCAAGTGCAGAAGGGTGGGAAGGAAAAGGGGGAAGCTTTCATTCATCCTG
+TTTGTTTATCATCATTTAATTTCTTACAGATATATGGAATATAATTTTAGGAATTTCAAA
+ATATTTCAAGTGATGTATTTTGTGTATCTTCAATTCTACCTCGTAATTCAATCCAATCCT
+ATTCACAAAATGGCCCGAATTTGCGGACGTGCTG
+>ds2020-267_687
+CAGCACGTCCGCAACGAATGTGGATTCGTGTCGGAGGAGTTTTGAGCGTGAGCTACCACT
+CATGCAGCGGCAAGGACCCGCAACTCTCGAGGGGGCCACCAACCGCCCGAATAACTCCTT
+TACTCAATGGATAGCGCTTATCCTCTTTCAATCAACAAAATGAGAAATGGGGGAGAAAGA
+AAGAGAGAAAGAGGTTAGGATTGCGGACGTGCTG
+>ds2020-267_688
+CAGCACGTCCGCAATCGCTATGCCCTATCAAAGAAACTAGCGGACTGATCACTAAATAGA
+TACAAATAGGTGCAAATTCTGACATCACCACAGCCCACTTGGTTCTTTCGCTCCTTGCTC
+GCGGAGCGGCATAACGGAAAAAAGTCGGAATTCTACAATTTCGTGGTCCGCTGGGCGAAC
+GCCGGATATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_689
+CAGCACGTCCGCAATGGAACCCGCCTCAGCACGTCCGCAATAACAAACCGCTCAGCACGC
+CCCACATTATTCTTCTCACACGTCCGCAATCCCCAGCGCCTACACCTTGCGGACGTGTGA
+GAAGAATAATGTGGGACGTGCTGAGCGGTTTGTTATTGCGGACGTGCTGAGGCGGGTTCC
+GTTGCGGACGTGCGCTCCTTAGATAGATCGGAAG
+>ds2020-267_690
+CAGCACGTCCGCAAGACCCGGCAGGTGTTGATTCTGCAGGACGGGCAACAGGTGCCGGGG
+CTGCGGAGAATGTGGTCGGTACATTTTTACCTGCCGAAACGTCTTTCAGGCGCTTGTATT
+CAGTGAGCACACGGCTGCCATAGCCTGAGTCGTTTTCAAAGGCGCTGGCACCGACATACA
+TTTTCAATACGGCTTTCACTTTGCGGACGTGCTG
+>ds2020-267_691
+CAGCACGTCCGCAATTCGGCCTGGGCAGCACGTCCCAAATATTATTCGCTTGCGGACGTG
+CTGTCGCTTAAGGCGACGCACTGACCGTTTTCTCCTGGCTTTTAGCACTTCATTGTCATC
+AAGCAGCACGGGTAGCACGTCTGCAAACGACAAGGATGGGACGTGTGACTGAAATCAGAT
+TGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_692
+GACGCACTGACCGTCTATGGGGCTGGGTGTAATGAAATTGTTGGGGAGTGGAAAGATGCC
+TCTCCACATTTCACATTTGAAGATGCCACTTTGGATGAGGCTATTAATGGTGTTGAAGAC
+TTGGATTACTTTGACTCCCTTGTGATCGGAACTTCGGAAGGCTATCCCTATGTTCTTGAG
+AGGGAGACAAATCAGAAAGGTAAGTCGCGATATT
+>ds2020-267_693
+GACGCACTGACCGTGGGTTAAGGCATGGGATACGGTCAGTGCGGTCAGGGAGGAGCACAC
+GGTCAGTGCGTCAGGCAGAGACTGACGGTCAGTGCGTCAGGGTAAGATCTACGGTCAGTG
+CGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCTAGCCGAGTAGCATTCGG
+ACGTGCTGACCTAGACGCAATTGCGGACGTGCTG
+>ds2020-267_694
+GGACGTTCGGGCTTGGTTTTATCTCTGGACGTTCGGGCTTGGGCCGCATCCTGGCGTTCG
+GGCTTTTCCCACACCCTGGACGTTCGGCTTTACCGTAACCATTAAGCCCGAACGTCCTTA
+CTTCCAGACAGCACGTCCGCAACATATTCGGCTTCCGCAATTACTCATAACTCATTGCGG
+ACGTGCTGAAGAGTGAAAACTTGCGGACGTGCTG
+>ds2020-267_695
+CAGCACGTCCGCAACGTTTCTGGCTTTTAATCAAGTTCGGAACCCCACCGACGGAACTTC
+GTTGGTCTCCAGTACAGGGGCACGGTTCACCTGCCCCATTATTGAAATTGGATCATCATC
+TGAGAGCTCTGTTGCAGCCAGTCAGAATACTTATTTTGAAGATGGTTTAAGCAGTGTTCA
+TACAAGTAATCAGGGGCCGATTGCGGACGTGCTG
+>ds2020-267_696
+TCTAAGGAGCAGCACGTCCGCAACACTTATCCCCTCAGCACGTCCGCAACAATCAATACC
+TCAGCACGTCGCAATCGGGGGCAGCTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAA
+GGACGTTCGGGCTTTGTTTCTCCCCTGGACGTTCGTGCTTAGAGCACTCCCTGGCGTTCT
+GGCTTCTTACCTGCTATACAAACCCCGAACGTCC
+>ds2020-267_697
+GCGACGCACTGACCGTGCCCCGATACATCCCCACCAAACCGCAACAACCCTCGTTTCACC
+TCCATTTGGGCAAAGCAGCTGTCATCACTGGCAATCACAATGTCGGCATTGAGCATGAGC
+TCGATACCCGCGGTAAAACAAAGCCCTTGTACCGCAACAACGTAAGGTTTAGTACGCGGC
+ATACCTACCACGTCCCCAACGGTCAGTGCGTCGC
+>ds2020-267_698
+CAGCACGTCCGCGAACGCGTTCGCCTCAGCACGTCCGCAATTTACCCGCCTCAGCACGTC
+GCAACCATCAGGTATTTGCGGACGTGCTGGAAGTAAGGACGTTCGGGCTTACTTCCAGCA
+CGTCCGCAATCATAGCTGGGTCGTCGCAAAGAGGTCCCAGGGTTTGCGGACGTGCTGAGA
+GGTTTAGCCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_699
+CAGCACTTGTCTCCTAAATTAGCAAGATCGCGCGTTCACCCTTTTGTTTCAAGCAGGTTG
+CTTAGTTATGGTGATAACCAAATTGTTAGCGAAGAGTTGTTTGTATCCGTCGGGTTACGC
+TATGACCCGGAAAAACATGCACAGCATCTGGCCAGATTTGGTATGACCCTAAAAATTGAC
+GAAACTGAAGTGACTATATATTGCGGACGTGCTG
+>ds2020-267_700
+CAGCACGTCCGCAACATGCCCAGCACGTCCGCAAATGTAAGTACCTCCGTCCCAACCCCG
+CCAGTTCCATTCCCGAACTTTCTCGCCAAATCCACATCTGCAAGCCCCCCTCCCTCCCCA
+AAACACACCCCTCTCCGCAATAGATCATTTGTGGACGTGCTGAGGCTCTGGCACTTGCGG
+ACGTGCTGAGGGGAACAAGATTGCGGACGTGCTG
+>ds2020-267_701
+CTTCTTCTCTGCCGAAAGGAAAGACAAAGGCGAGGGGGTACGGTCAGTGCGTCGCCTTAA
+GCGTATCTAAGGAGCAGCACGTCCGCAACTTTCAACGCCTGGTAATTGCGGACGTGCTGA
+GGCAACAACGTTTGCGGACGTGCTGAGAGGGAGAATGTTGCGGACGTGCGCTCCTTAGAT
+AGATCGGACGAGCACCCGGCGGACCTCCCGTCAC
+>ds2020-267_702
+TAGACCCTATCGATACGCCGCACCAGAGTATCGTGAACGCAGTAGTTTGGGTCGGAAAAA
+GCCCCGGGCTCATTCCCCTGACCACCCATCGTCCTCAGCGCCCTTCTGCTGTGCGGTGAT
+CCCGCGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAGGCACACGGGTCAGCGGTTGCG
+GACGTGCTCAGGGGTTAGGGTTGCGGCCGTGCTG
+>ds2020-267_703
+CAGCAGTCCGCAATCGGTGTCCCCTCAGCACGTCCGCAATGGACAACACCTCAGCACGTC
+CGCAATTATTCACCCTCACACGTCCCAACAAGTCGGCAGTTGCGGACGTGCTGCTCCTAT
+CTAAGGAGCAGCACGTCCGCAAGCGCTAATTCCTCAGCACGTCCCAAAGGGGGATCGGCA
+GCACGTCGCAATTGATAATCGTTGCGGACTGCTG
+>ds2020-267_704
+GGACGTTCGGGCTTTTGTGGTCGCCTATTTTGAAATTCCACCCTCCTTTATTCGAATAAG
+ATATATATGTATAATAATGCAAGTAATCTTTCCAACTCAACAAAACCCTTCAGCCCAGTT
+TTACAAATAAACTAGATGCTCCAACCGTAACCATTCTCGCACTCTAGTCCAAACACCTTC
+GTCCGCAACTTCTGCCGGGTTTGCGGACGTGCTG
+>ds2020-267_705
+CGTCCGCAGTGCCCAGCCCCTTGATCTTGCGGACGCGCTTAAGGCGACTCTCTGACCGTT
+TAAAGCACGATACCCGGTCAGTGCGTCAGGACATACTCCACGGTCAGTGCGTCAGGGGCA
+GGGCGACGGTCAGTGCGTCGCCTTAAGCGACACGTCCGCAACAACCTGGCCTTCATTGCG
+GACGTGCGAGCGCTAAAATATTGCGGACGTGCTG
+>ds2020-267_706
+CAGCACGTCCGCAACCCGATGATGCTCCCTGAGCAAGGGCTATTTATTAATGTGTTTATT
+CAAGAATGTGTTAAAGCTCAGTTTTATTGTGGTGGTAAGTTTATGCCTACTCATGTAGTT
+ATGGAAGTGTATGAGTATGTTCGTAATAGTTTTATTGCTAATCGTACTCCTGTTGTACAA
+GAACCTGCAGCTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_707
+AAGCACGTCCGCAAGATTCAGCCACTATTGTTAATGATGGTATTAGAGCACTCGGCAGAT
+TGGGAGGGATTTATGTCCATCCGACTAATATCCTCAGTCAGTTCTTCCAAGTTGGGTGCT
+AAAGTGGAATTTTCTGCAATTCAAACCATAAGACTTTAGATGATGATAAAAAGAAACAAA
+TACAATGAATAAGATAAGGTTGCGGACGTGCTG
+>ds2020-267_708
+TCGCTTAAGGCGACGCACTGACCGTACTTTTTAGGCTTGCCAGTACCGCAAACGGATTTT
+CTTTTTCCGCCACTGCCTGTGGCAACTCACCCACCTCAGTCACTGCCATTTCGCAGTCGT
+CATGCTTGGGCGCTAATGGCAAATCCACCAATAACTCATCTTCAACCACGGCAACTTGGA
+CGTGCTGAGGATCTGAACATTGCGGACGTGCTG
+>ds2020-267_709
+GGACGTTCGGGCTTAATACCTGCCCTGTTAAGCCCGAAGTCCCCGCTACAAGCCCGAACG
+TCCAGCGTAGTGAGCAAGCCCGAACGTCCTTACTTCCAGTAGGAGCAGCACGTCCGCAAT
+AATGATCCGGTGGTTGAGGAAAACGCGTTTGCGGACGTGTGACCCCGAATAAGTTGCGGA
+CGTGCTGAGGGGGTACAAATTGCGGACGTGCTG
+>ds2020-267_710
+CAGCACGTCCGCAACTCTGACCTTCTTATTTATAAGCCACAGCTCACTTCGACGTTTCCA
+ATTTCCCATAGAATCTCCGGGGCTTTCCTAGTCACTATAGTTTTGTTTTTTTATCTTCTT
+TGTCTGAAAATAGGTTTGATTTGCCCAGCACGTCCGCAAAAAGAAACCTATACTTGCGGA
+CGTGCTGACCCAGTTTCGGTTGCGGACGTGCTG
+>ds2020-267_711
+TATCTAGGAGCAGCACGTCCGCAATCTTCTGGTATTTGCGGACGGCTGAGGCCGACGTGC
+TTGCGGAGTGCTGAGGGTCCAACACTTGCGGACGTGCTGCCCTTAGATCCTGGAAGTAAG
+GACGTTCGGGCTTGTTCAGGGAGATAATAAGCCCGAAGTCCACCCTGAAAACGAAGCCTG
+AACGTCCAGGCGATTCTAGAAGCCCGAACGTCC
+>ds2020-267_712
+TATGTAGGGAGCAGCACGTCCGCAATGACCCCGCACTCAGCACGTCCAATCATGATGGTC
+TCAGCCGTCCGCAATACACTGGGAACCCTGGCCTGGTTAATTGCGATTCTGAGCGGCTTT
+GTTCCCATACTGATGGATGGAGGAGAGTTTGGTCAGAATGTATTCATTCTCACCGGATTT
+TCGCTGCTGGGATTGTCTTACGGTCAGTGCGTC
+>ds2020-267_713
+GACGCATGACCGTGAATAAGCCTGTTCTATTTTTATCGACATTGACAGGGATGCTATTGG
+GAATCGGATCGGTGATTAAGCCACCGATATCTGCAGGCATGGTAGGCAATGGCAAGGTAA
+TGGGTAAATTGCCAGTATTGTTATTGACTGCGTTGTCAATGGCATTGGCTAGGACCCCAC
+TAGCGACGGTCAGTGCGTCGCCTTAAGCGTATC
+>ds2020-267_714
+GGACGTTCGGGCTTACACACCGCCATAAAGCCAAGTCCAGGGAACCTATAAAGCCCGAAC
+GTCCAAGGGAACGCCTAAGCCCGAACGTCAGCACGTCCGCAAGACCGGGATACTTGCGAC
+GTGCTGAGCCATCACCACTTGCGGACGTGCTGAGGTGTGCCTGATTGCGGACGTGCTGAG
+AGATGTCCGATTGCGGCGTGCTGCTCCTTAGAT
+>ds2020-267_715
+TCCGCAACATAGGTCCGGTCAGCACGTCCGCAAACGGTCTCCCTCAGCACGTCCGCAAGA
+ATAGGGGGCAGCACGTCGCAAAGTAGATGGGATTTGCGGACGTGCTACGCTTAGGCGACG
+CACTGACCGTATAGGTACCCCTGACGCACTGACCGTCTTTATTTGCCTGACGCACTGACC
+GTTTAACAGGCCATAAGCGACGGTCAGTGCGTC
+>ds2020-267_716
+GACGCACTGACCGTTCTAAACACAGTCAGTGCGTCAAGGGGCCAGATACGGTCAGTGCGT
+CAGCGGATGTGATACGGTCAGTGCGTCGCCTTAAGCGATCTAAGAGCAGCACGTCCGCAA
+TAACCAACGGCTGACCTTTGGGACGTGCTGAGGAGTGTCGACTTGCGGACGTGCTGAGGG
+TGGGGCTCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_717
+GAGTCCGATGACGCAGAGCATGACGCACTTAGCCTAGATCGCACCGTTGACGAGACTCCG
+CCGATATTGATCCGCCACAGCACGTCCGCAAAGTTTCGTTCCTATGACGCACGGACCCAG
+TTTCCGTTGCGGACGTGTGTCCTTACATAGATGGGAGGGCCGTCCGGGCCGGCACCTGTG
+AGCCAGGATCGTTAGTGCACGGTGGGCGCCATA
+>ds2020-267_718
+ATCTAAGGAGCAGCACGTCCGCAATCGAATGTCGGTCAGCACGTCCCAATTCTAAGTGCC
+TCAGCACGTCCCAAAGCGTTTCGGTTGCGGCGTGCTGCTCCTTAGATACGCTTAAGGCGA
+CGCACTGACCGTTGTATTTGGCCTGACGCACTGACCGTGACACATGCCCTGACGCACTGC
+CGTGTTGTTGTGGGTCCATACGGTCAGTGCGTC
+>ds2020-267_719
+CAGCACGTCCGCAATTCCAATTCTATGCAAAATATATTCAGGCGTTTTATTCGGACAATT
+AGCTCGGCAAAAGCAAAAGGTTTGGTCAGATAATCATCGCCACCAATTTCAATGCCCTTA
+ATCCGATCGCTTAAATCATCTTTAGCGGTTAAAAATAAAACAGGCGTATGCTTTCCAGCA
+GCACGGTAGCCCACCAGCAAAGCCCGAACGTCC
+>ds2020-267_720
+GGACGTTCGGGCTTTAAGTTGGGGATAGAAGCCGAACGTCCAGGGGTGAAAGTAGGCCCG
+AACGTCCAGACCACTCAGCAAGCCCGAACGTCCTTACTTCCAGACTCTAAGGAGCAGCAC
+GTCCGCAAGATCGTGGGTGTTGGGACGTGCTGAGGTGAGCCAGCTTGGGACGTGCTGAGA
+GCCTGATAATTGCGGACGTGCTGCTCTTAGATA
+>ds2020-267_721
+GACGCACTGACCGTGCTCCTACCCCTGACGCACTGACCATCTTCACTCCAGTTACGGTCA
+GTGCGTCAGAGGCCCAGTAACGGTCAGTGCGTCAGAGGCCCAGTAACGGTCAGTGCGTCA
+GGCTGTTCAACGGAGACATTAACATACGGTCAGTGCACGTCCGCAAGATACCGGTTGTGG
+ACGTGCTGCCGAGGAACGCTTGCGGACGTGCTG
+>ds2020-267_722
+GGACGTTCGGGCTTGTGCCACCCACTCTCCGAGTACCTTTGTGACTATTTCGCTCAGCAT
+CTGGTTCCGAAACGGTATCAGGATGGTAAGGAAGGCCAAGTCGGTGGCGAGACGGAGCAA
+TGGGTTCGATACCGTTTCTTTATGTCCTTACTTCCAGCGTCCGCAACAACCGGTTTGTGG
+ACGTGCTGAGGGTATCACCTTGCGGACGTGCTG
+>ds2020-267_723
+CAGCACGTCCGCAATCCAGACACGCTCGCACGTCCGCAACGTCAGAAAGTAGGTAGAGTA
+TGCCGCTTCGCTTGCCCTTTCTCCTTCCTCTGCAATAGGAAGTGAAAGAACTGCCTGCCA
+TTTCTTAGGTTAGGCTGCTGTGTGATGCTTACTCCATCTCAACGGATAAGCTCAGCTGGC
+TTACTAATAGAAAGATACAAGCCCGAACGTCCT
+>ds2020-267_724
+GACGCACTGACCGTTGGATAGGTTGTTGGTGCGACAAGGGATAGTTTTATACTGAATGGC
+ATCGCCAGCGACTGGGGTAAAGTAAGGGAGGGGTAGCTCTACGGTCAGTGCGTCGCCTTA
+AGCGTCACGTCCGCAATATGCGACTCCTCAGCACCCGCAATGTACTCCCTGTACGTTGCG
+GACGTGCTACCCCATACTATTGCGGACGTGCTG
+>ds2020-267_725
+TCCGCAATAGGTCTCGTCTCAGCACGTCCGCAACTGACCCCCGCTCAGCACGTCGCAAGT
+GTCATACCATCACACGTCCGCAAGCCACACACCCAGAGCTTTGCGGATCGCTTAAGGCGA
+CGCACTGACCGTTCATACTGGCTGACGCACTGACCGTGGTTAATCCTCTGACGCACTGAC
+CGTACAAAGGCCACGGATGACGGTCAGTGCGTC
+>ds2020-267_726
+TATCTAAGGAGCAGCACGTCCGCAAATCAAGTCAGATGCGGTTGCGGCGTGCTGACCACC
+TAGCCTTGGGACGTGCTGAGGGGCCGCCAATTGCGGACGTGCTGCTCCTCTGGAAGTAAG
+GACGTTCGGGCTTAGGTCGCCCCCTCATTCTGCGTGTAAGGCAGACGCTCTACCAACTGA
+GTTAACGACCCCGATATACAAGCCCGAACGTCC
+>ds2020-267_727
+GACGCACTGACCGTATACCACCCCGTAACGAACGGTCAGTGCGTCAGGGCAACCTGGACG
+GTCAGTGCGTCAAGCGGAGTTCTACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAAAA
+CGAGTTATCTCACACCAGGGACCTGGGCTTGCGGACGTGCTGAGGGCAAGTAGTTTGCGG
+ACGTGCTAAGCTGATAAACTTGCGGACGTGCTG
+>ds2020-267_728
+CCGCAAAAAGAGCTCACTTACACGTCGTGCCGAGGGATTCTGGATTGCGGACGTGCTGAG
+GTCCTCCATCTTGCGGGCGTGCTGGCAAAAAGAGCTCACTTTTCGGACGTGCTGAGGGAT
+TCTGGATTGCGGACGTGCTGAGGACCTCTATATTGCGGACGTGCTGACCAAAAGAGCTCA
+CTTTTCGGACGTGCTGAGGGATTCTGGTTTTCG
+>ds2020-267_729
+CAGCAAGTCCGCAAAATTAGGCGGTTCTCGAAAAAAGATAGCGAAAAAAATTATTCCTAG
+AGTTGAGACTAAAAGGAATGTATAAACCAATGCTTCCATAGATTTGATCGTGGTTTACAA
+TTATAGCTTCCATACCTGTTTATTGGGGATCGTCTCCCGGATAAATAAAGAACAAGAGTC
+AAAGAAAAGGCGAATTATTGCGGACGTGCTGA
+>ds2020-267_730
+GGATCCTATAGACCAACATTCTCAGTTAGGGCACCGGCTAAACAGGATTTTCGAAAAGAC
+ACTTCGAACTATGCCCCGGGGCTGACCGCTGGCAGTGCCCGAGTGGCGGAGAGCACGGCA
+CTACAGGAACAGGTACCTGCAGAGATTGTAGAATAGAAAATTACAAGCCCTCTACACAGG
+TATCGCCGACTAGACACTTCTATACGCCAGTA
+>ds2020-267_731
+TCGCTTAGGCGACGCACTGACCGTGCTGGTACCCCTGATGGATTTAGAGTATGCTATTAA
+AGCTCTAGAAGAAATCTTAGACTAAACTTCTGACCCTACAGCTAACAGTATCGCTGCTGA
+CGCCTTAGAAAAAGTATCTCAAGGTGATTACTTTGAATGTGCGCGGTTTCCCTCTCTAGT
+AAGACAAGTGCCGAAACATTGCGGACGTGCTG
+>ds2020-267_732
+TCAGCCGTCCGCAATGGCCAGAAAGTGTATCCCTTGATGGATTTGAATTGTGTAATCCCA
+TTGGATTCCCAAAAGCAGAAGATCCTTTATGTATATTTTCCTTCATATATGATTTCTTGT
+CCTGGAGAACTTCAAATATAAGAACTTATATTTTAATGATGAACGTCATATTTTTGAAAA
+TGCATTAACAACCCTGGCTTGCGGACGTGCTG
+>ds2020-267_733
+TTCCCCCATTGCCACCCTCATCCACTCTGTAGGGGGGTGCGGTCAGTTCTCTCTTCGCCT
+GTTACGCCACCTACAGAGTGGAAGATTGTGGCAATGGGGGAATTTCTCGAATACAAGGAT
+TGCAGTGGACGAAGGCGAAGGAGCACACCCAACGCCCGAAGGGAATCGGCAGCACGTCGC
+AAAATCAGGGCCCGGTTATTGCGGACGTGCTG
+>ds2020-267_734
+CAGCACGTCCGCAATTGGTAGATCCTCAGCACGTCCGCAATACACCCTCGTTAGCTTGCG
+GACGCTTAAGGCGACGCACTGACCGTCGCGTGGGCCCTGTCATGGTAGGAATAGAATTTG
+CATCAACATCGATTGAGCGCTCAAATGAGCCTTCATCGACATTGTTGCCAATTTATCTAT
+CTCTCTGTCCTTTAAATACATCACAGCGTTCT
+>ds2020-267_735
+CAGCACGACCGCAATTTTCGTCACCTTGGGGTTTTACGGCTACGGATGATAAAGTAAATC
+ACTGTAATTGCTAAGTAGCATCAAGATTTTGCAGCCATGGTATCGCTTTATATTCAAACC
+GGATGATTAGTTGTCACCGTTCTGTCACGAATCAGTCAAGCCACTGTCACATATCCCCTC
+TAACATACTCTAGTAAGTGCGGACGTGCTGCT
+>ds2020-267_736
+CCCTCAGCACGTACGCAAATATGATTGGGTTCTATATTGGCACCTAAATGGGAAACCGAA
+TCGGACCAAACCCTTTGTCAGGCTATTGTTCTCTTGTTTTGTTCCCTAAAAGTCATAGAG
+TAAGACATCAATTTATCAATAAGATCAAATATTTTTTTGATTACATGATGGACTCCTCTG
+AAAAACATCGGCGCGCGTTTGCGGACGTGCTG
+>ds2020-267_737
+ATCGTCTGGACTTCGGGCTTCTAACAGCCCCTGAGAAAAGCCCGAACGTCCTTACTTCCA
+GAATCTAAGGAGCAGCACGTCCGCAATAGATCTACCTTTTATTGCGACGTGCTGAGGGCA
+ATGATGTTGCGGACGTGCTGAGGGTACTCCAATTGCGGACGTGCTGGGCCTTATCTCTTG
+TTGAAGGGCACACTCCGGAACTACAACCACCC
+>ds2020-267_738
+ATCTAAGGAGCAGCACGTCCGCAATTTGCTATCCCTCAGCACGTCGCAAGTCCCACTCCC
+TAATGTTTGCGGACGTGCTACCCTGTGTCCTTTGCGGACTGCTGCTCCTTAGACACGTCC
+GCAACCATCCCAGGCTAATTGCGGACGTGCGGGTCTATCCTCTTGCGGACGTGCTGAGGT
+GGCCAATCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_739
+GGACGTTCGGGCTTATGGCTGCAGATGGTCGATTTATCCAAGAAATTGAACTGGTTAAAG
+GGTATAATCAGCTCGACAAGGGTCGATTAAAAGCCCGAACGTCCTTACTTCCAGAGGAGC
+AGCACGTCCGCAAACGATGAGGGATATATTGGGACGTGCTGAGGAGGTATCTGTTGCGGA
+CGTGCTGAGGCCAATATATTGCGGACGTGCTG
+>ds2020-267_740
+GACGCACTGACCGTTTGTCCGTCCCTGACGCACTGACCGTTCCTGACTCCTGACGCACTG
+ACCGTATACTAGCGGCCGGAAGACGGTCAGTGCTAGCACGTCCGCAAAGACCCTACCATA
+TTGCGGACATGCTGACCGTAAGATCGTTGCGGACGTGCTGATCCACTGCAGGTTGCGGAC
+GTGCTGAGGGAATGAAACTTGCGGACGTGCTG
+>ds2020-267_741
+GACGCACTGACCGTATCTACTTTCCTGACGCACTGACCGTAGGTATAGGCCTGACGCACT
+GACCGTATTTGCATCCGTGACGCACTGACCGTCCTTATCCGGGGTGAAACGGTCAGTGCG
+TCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGGGCAGGAGACTGTGATTGCGAC
+GTGCTGAGCTGATGTAAATTGCGGACGTGCTG
+>ds2020-267_742
+CAGCACGTCGCAATACAATCGATCTAGCTTGCGGACGTGCTGAGGTATGCTATTTTGCGG
+ACGTGCTGAGGGGATACTGGTTGCGGACGTGCTGCTCCTTAGATTATCTAAGGAGCAGCA
+CGTCCGCAATCATGACCGAGTTACTATTGCGGAAGTGCTGAGGGAGTGACACTTGCGGAC
+GTGCTGACACTGACCGACTTGCGGACGTGCTG
+>ds2020-267_743
+GACGCACTGACCGTCTTAGTTTCAATAACGGTCAGGCGTCAGGGGCTGGAACACGGTCAG
+TGCGTCACGGAGGTAACAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAGCACGT
+CCGCAACAACGCTGGGGTATTTGGGACGTGCTGAGGGGCTAAGCTTTGCGGACGTGCTGG
+GGGATAGGCCTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_744
+GTCCGCAATCCGATGGTCTCAGCACGTCCGCAATTCATTGGGCCTCAGCACGTCCGCAAG
+TGCCCTTCCTCAGCACGTCCGCAGATCGGCGTAATTGCGGACGTGCGCTTAAGGCGACGC
+ACTGACCGTACCCGAACCCTTAAATGACGGTCAGTGCGTCAGCGGAATGCATACGGTCAG
+TGCGTCAGGGATACCCCGACGGTCAGTGCGTC
+>ds2020-267_745
+CAGCACGTCCGCAAGGGGGCCCTTAGTCTTTTGATTAGAGTAGGGGTCGCGAGAGAGCAG
+AGCGTACCGCCCTGCCATAGTCGCGAGTCTGTTTATAGTCGCGACTGTTGTCATAGTCAA
+CAAGGTTGAAACTTCCAGGAAAAAACTTCGAATTGGGAGGGCGATCCTCCCGGTGAACTG
+ACCGTACCCCATTCATGTTGCGGACGTGCTG
+>ds2020-267_746
+CAGCACGTCCGCAAGTAAAATGGCCTTTGGCTATATATTTCCCTGTAGAAATGTACTTTG
+TACAAAAGAAAATTGGGTCCTGGACAAGAAAATGGATTGTTCTAGAGGCATTCAGTTTAG
+TTTGCTTTCTTGTCACAGTTGTGGGGGTTATTGGATCAGTTCAAGGACTTATAAGTGCCA
+AACTTAGCTAGGGAGTCTTGCGGACGTGCTG
+>ds2020-267_747
+CAGCACGTCCGCAACGAAATATTTATTCACGAGATCTGACGATTGATGATTTTATGAAAG
+TAGGTTTGAATGAATTCCGCTCTTTGATTTTGGTCTTTCTTGGTCACTATAAATTGGTTT
+AAAATGCGAAGAATTGACACATGAGCTTGTAGGGCCCGTTGAAGTCCCCGAATAAGGGGG
+AAAAAAGAGGATGCTACTTGCGGACGTGCTG
+>ds2020-267_748
+CAGCACGTCCGCAATTGACCAGTCCTCCATTGTCCCCTCAGCCATGGAAAGAGAATCCAT
+GGGGAGTTACCACTGAAGCCGTTCAGTTCCACCAGAATATTAATTCTCAAACTAACATAA
+ATGGCGTTGCTTGGGGAGCACATGTGTACCATGCAAATGATTCCACTTTATCTGTTGCTG
+CTTTCAGAGGAGAGAGCTTGCGGACGTGCTG
+>ds2020-267_749
+CAGCACGTCCGCAACAGCGCATCAGTCATTCCTGGTTACTAAGAAACTGTTCGACTATAG
+AACTGATTGTGAGAATTACCAACCTTTGCGCCTTACCTGTCCTGTGGACAGTGTTGCGGT
+ATGAATCCACTCTTCGCGGATCCCACTTTCGACTGACCGAAGATCGTCTCTTCCCGCACC
+ATGATGTACATGTCAGCTTGCGGACGTGCTG
+>ds2020-267_750
+CAGCACGTCCGCAAGGCGGATACGCTCCCCAATCCACACCGCCATCTCACCAATCGCAAG
+GTCGCCAATACGGTGGATGGCAATGGCGTTTTCGATGTCAAACTGGCCTTTGGCTTTCAA
+TCAGTTTTTTGCCTTGATTGACTGCCAGCTGCTCGTAGCCATAATAAGTGAGCTTGCTAA
+CAGGGAGGCGTAAGGTCACGGTCAGTGCGTC
+>ds2020-267_751
+GACGCACTGACCGTAAACTCTGCCCTGACGCACTGACCGTCTTTTCTGCCCTGACGCACT
+GACCGTAGTCTATGGGGTTATACACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAATC
+TCTATGGCCTAACACTTGCGACGTGCTGAGGAGACGGACGTTGCGGACGTGCTGAGGGAA
+AGGTACTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_752
+CCGCAACTGCGTGGACCTCAGCACGTCCGCAACCAACTGAGCCTCAGCACGTCCGCAAAC
+ATCGTGTAGTGCGACGGCTAGGGGTGTGGTCTTGCGGACGTGCTACGCTTAAGGCGACGC
+ACTGACCGTTCATTGGACCTTGACGCACTGACCGTAAGTGTTTCCGTGACGCACTGACCG
+TCAATACCTGGAGTCGCACGGTCAGTGCGTC
+>ds2020-267_753
+TCCGCAATCGGTTGGGTCTCAGCACGTCCGCAAGCCTTTTTCACTCAGCACGTCCGCAAC
+TGAACACCCCTCAGCACTCCGCAACCGGGGCCAATTTGCGGACGTGCTGCTCCTAGATCA
+CTGACCGTACCAAACACCGTGCCCCACGGTCAGTGCGTCAAGGCTAGCAAAACGGTCAGT
+GCGTCAGGCAAGAATAAACGGTCAGTGCGTC
+>ds2020-267_754
+GACGCACTGACCGTTTGTCTTGCCCTGACGCACTGACCGTAAATAGTTCGTTGACGCACT
+GACCGTTGTTACCCCTTTACACACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAA
+GATCCAACCAGTGTAGATTGCGGAAGTGCTGAGGACGGACTACTGCGGACGTGCTGAGGG
+GTCACGGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_755
+GAGTGCCTGTAGTCGAAGGGGGTGTTGTTCGAATCTATGAAAGGTGCAGCACGTCCGCGT
+CCGCAAAGTGGTGGACTTGGGACGTGTGAGTGCCTTAGATTTGCGACGTGCTGACCGGTT
+GACTATTGCGGACGTGCTGCTCCTTAGATACGTCCGCAAGCCAACGGGGATGTAATTGCG
+GACGTGAGGGAAATAGTTTGCGGACGTGCTG
+>ds2020-267_756
+CAGCACGTCCGCAAACTTTCACAGCTCAGCACGTCCGCAAACCCCCGCGCTCAGCACGTC
+GCAATCACCCCTCATTGCGGACGCGCTTAAGGCGACGCACTGACCGTCAGCATCATCATG
+ACGGTCGTGCGTCAGGTGTCTTCGTACGGTCAGTGCGTCACGGGAGAAAACACGGTCAGT
+GCGTCAGGCGGCAAGACACGGTCAGTGCGTC
+>ds2020-267_757
+CTGGAAGTAAGGACGTTCGGGCTTTAGGTACCATGGTAAGCCCGAACGTCCAATCTAAGG
+AGCAGCACGTCCGCAAATTCAACGACCTCAGCACGTCCGCAAGGTATATTCCGTCAGCAC
+GTCCGCAACTGGCTCGGATTGCGGACGTGCTGAGTGTTACGTCTTTGCGGACGTGCTGAG
+GGGGCTAACGTTGCGGACGTGCTGCTCCTTA
+>ds2020-267_758
+TCTAAGGAGCAGCACGTCCGCAAGTCGGTGTCCCCAGCACGTCCGCAAGTGAGTGGCCTC
+AGCACGTCCGCAACTAAATTCGGGTCAGCACGTCACAAATATGCTCTTGCGGACGTGCTG
+CTCCTTGAATTCTGGAAGTAAGTACGTTCGGGCTTGCCAAGATCCTTGGAGTTCGGGCTT
+AGTACACCTGGAGTATGAAGCCCGAACGTCC
+>ds2020-267_759
+GGACGTTCGGGCTTTGGGGTGTGTATTTTACTTGTCTTTGGTGACTTTTGAAATTTTCTT
+TACGGTGGAGTTTCAAGAGTTTTCGTGGGTGTTCCTTGTGGGTAGTGTGTAGTTTGTTGC
+TTTGATTTTCTCTATGTACTTTGGGTAGCATTGTTTAAGGCTACATGGGTTTTGCGGACG
+TGCTGACATAGGCCCCGTTGCGGACGTGCTG
+>ds2020-267_760
+CAGCACGTCCGCAAGTACGTAACCGTCAGCACGTCGCAATGGGACACCTCTCCGCAAATG
+GGTGGTAGGTTGCGGACGTGCTGTCTGGAAGTAAGGACGTTCGGGCTTACTTAGGAGGGT
+ATGAAGCCCGAAGTCCAGGGAATTGATAAAGCCGACGTCCAGGGATGACAGCAAGCCCGA
+AGTCCAAGGCAAGAAACAAGCCCGAACGTCC
+>ds2020-267_761
+CAGCACGTCCGCAAAATTTGGGTTGTGGACGTGCTGAGCGGGATGTTTTGCGGACGTGCT
+GAGTGAGTGATAATTGCGGACGTGCGAGACGCTTAAGGCGACGCACTGACCGTCTTTGCT
+CGCCTGACGCACTGACCGTACCTTATCGCCTGACGCACTGACCGTCTTATTTTCCCTGAC
+GCCTGACCACGGTTGATACGGTCAGTGCGTC
+>ds2020-267_762
+GACGCACTGACCGTAACCTATACACTGACGCACAGACCGTAACCTATACACTGACGCACT
+GACCGTTAAACCGCGGCTCACTGACCGTTATGAAAGGCGTGACGACACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGCGCATTGCCCTCAGCACGTCCGCA
+AACCCCAGGCCTTAGAAATTGCGACGTGCTG
+>ds2020-267_763
+GGACGTTCGGGCTTGTAGATGCGGGTGATGTCGCTGGCATAGCCGTGGAAGCTGGCGCCG
+GCATCGATCAGGAAGCTGCGCAGCAGGTCGGGAGGTCATGGTAAAAGCCCGAACGTCCTT
+ACTAGTCCGCAAGATTCATCTGCTCACACGTCCGCAAACAAGACGTAATAGTTGCGGACG
+TGCTGAGGGACATTTCCTTGCGGACGTGCTG
+>ds2020-267_764
+GACGCACTGACCGTTTGAAACTGGGTGTTCTACGGTCAGTGCGTCAGCAGATCATTGACG
+GTCAGTGCGTCAGGGGAACCCCCACGGTCAGTGCGTCAGAATAGTTACTACGGTCAGTGC
+GTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATTGTATGTCCTTGGTTGCGACG
+TGCTGACCTGATAAAAGTTGCGGACGTGCTG
+>ds2020-267_765
+CAGCACGTCCGCAAAGGAACTTGGGTAGCACGTCCGCAAGGAGATACCAGTTAATTTGCG
+GACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTTGACGACGCTCTGACG
+CACTGACCGTTCTCTGACCCCTGACGCACTGACCGTTGCCACATCCCTGACGCACTGACC
+GTGATACCATTAGAGAGACGGTCAGTGCGTC
+>ds2020-267_766
+CAGCACGTCCGCAAGCGAGGTTGGATACCAATCCATGTCCCCTAACTGGTCTACCGTATG
+TCCAGGTCTGGGTTTGAACGGGGGGATGCCCCCCCACATAAATGGCATCATGACAATACA
+CCCCACGACATGCCAAGGCGCAGAGGGGTAGAGCGGCCGCTCGTTGATAAAACGGCCAAA
+CCACCAGGGGTAGGCGGTTGCGGACGTGCTG
+>ds2020-267_767
+CCGCAAAGTCAGATCCCTCAGCACGTCCGCAAGGACCCTTACCTCAGCACGTCCGCAAAT
+AACCTGGGCTGTTTTGCACGTGGAGTCGACTAAAGTTGCGGACGTGACTGGAAGTAAGGA
+CGTTCGGGCTTTTGTTAGGTGTTAGGTGAAGCCCGAAGTCCAGACGATGATATAAGCCCG
+AACGCCAGTGACGGGACAAGCCCGAACGTCC
+>ds2020-267_768
+CAGCACGTCCGCAAACTGAAGGGAGTGGGGCTTGGGTTGTGGCTGGAGGTGCGGGTGGTC
+TGAGTTTTATACAGCCCGTGTTTCTAAAATTGGTGTAATAGATTAGGGCCTTAGCATGCA
+CAGAAAGATTAATTGAATCTTTGTTTTGTCTTGCTAAAAGTGGAAGATGTTGGATTGAAG
+CAGAGATGTGGCAAAGGTTGCGGACGTGCTG
+>ds2020-267_769
+TAGCACGTCCGCAAGTGGGATTTGGTGGACACAGATGCGGCAAGGTTGCTCGAGTTGGTC
+CCTGAGTTCGTTTGTCAATGGCAAAATGCGGATTATGATGGGAATGACGAGGAAAGCAAT
+TTGGCGTTATGTAGTGCTCCGCCGAAATTCTGACGTTTTTGGCAGATGTCAGTTTTCGAG
+GGGGAAGGGTGCGGGCTTGCGGACGTGCTG
+>ds2020-267_770
+CAGCACGTCCGCAACGCTCTCCCCTCCGTACCGTAAGGTGCGTGGTTTTTTGCTTTGGGC
+GTTATTCCTCTCCTTGAAACTTTCTTACCTTCCTCTTGCAGACTCGACATTCAGGCCGGA
+TCTCGGTATTGTTAGCTGTCTGGATGTCTAAACGTTTATACGTATGCTTTGAGGATTCAA
+CGATATGGACGCTTCATTGCGGACGTGCTG
+>ds2020-267_771
+CAGCACGTCCGCAATCGCTTACCCCTCTACCATATAAGTATTCACCTACAGGAATATACA
+ATTTACTTTGACCCTACTCTAAGCATAACCAGTTATAACCTTCTGCTTCACCCAAGAATA
+ATTTTTGGATTACTTCAACAAGAAAATCACGATTACAAAAACTAGGAACACTATCTGCAG
+CATCACGGTCATCTATTTGCGGACGTGCTG
+>ds2020-267_772
+TACGAGGAATTGGAGCAAACGCACAGAAATGCTTTTCCTTCAGCCCAAATACCTAGATTT
+TTCCAAGATTTCAAGAGAGCTGAACTTAGTGATGAGGTTGGTAAGGGTAAAGAAAATAAG
+ATTAACCGCAATGATTTCGTGAAAATAGCAACCCACACGGGTGGCAAACAAAATACACTA
+CGAGACCGATATCCTCTTGCGGCCGTGCTG
+>ds2020-267_773
+CAGCACGTCCGCAATTTGACTGATGTGCAATATTATGTGACCCAGCAAAACGGCACTGAG
+CGTCCTTTTAGCCATGAATATGATCACCAATTTGAACCTGGAATTTATGTGGATATTGTG
+AGTGGTGAGCCGCTTTTTAGCTCATCGGACAAATATGACTCAGGTTGTGGTTGGAGAGGC
+ATTTTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_774
+CAGCACGTCCGCAATGCACGCTTCCTCTTCTTTCGAATGCTAATGTGTGGTTTTGTCCTA
+CTTCCAAAGTCACAGAGGGAGCTGGAGCCGATTTTTTGTTTGACTACCTTCAATCGACGG
+ATGGTGCTAAAGGAGTTGGGAGAAGAGTCCACCTATAGTTATAGTAGTTAGAAGCCCAGC
+TTCAATCGCTCAGAGGTTGGGGACGTGCTG
+>ds2020-267_775
+GGACGTTCGGGCTTCACCTGCACCCTGGACGTTCGGCTTGTATCCACTCTGGACGTTCGG
+CTTTATAGTGCCCCTAAAGCCCGAACGTCCTTACTTCCAGAAGGAGCAGCACGTCCGCAA
+TCGGTCCGTCCTCAGCACGTCCGCAAGGAACTTTCCCTCAGCACGTCCCAAGGCACCCCA
+ATTTCGTTGCGACGTGCTGCTCCTTAGATA
+>ds2020-267_776
+GCAGCAAGTCCGCAAAAACGAGCAAATTGCAAGAGAGGAGCTCTACCAACTGATCTATAT
+CCCCCCGAGCCAAGTGGAGCATGCATGAAGGAGTCAAATGCTTCTTCTATTCTTTTCCTT
+GGCGCAGCTGGGCCATCCTGGACTTGAACCAGAGACCTCGCCCGTGAAGTAAATCATCGC
+ACCTACAGTACAACTATTGCGGACGTGCTG
+>ds2020-267_777
+GGACGTTCGGGCTTTACCCCATCCCTCAGAAAAGCCCAAACGTCCAACGCTACGGTGAAG
+CCCGAACGTCCACTGCATGATGCAAGCCCGAACGTCCTTACTTCCAGGGCACGTCCGCAA
+AACAAGCCAGGTTAGTTGGGACGTGCTGAGGGGGTCAAGTTGCGGACGTGCTGAGGGACG
+TAACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_778
+GGACGTTCGGGCTTTGGTCCTACGGTGGCGTTCGGGCTTCAGAGAGGTAGGCAAGCCCGA
+ACGTCCTTACTTCCAGGATCTAAGGAGCAGCACGTCCGCAATCTATCATCCCTCACACGT
+CCGCAAAGGTATGCATTTCGGACGGCTGAGCGTAATACGGTTGCGGACGTGCTGCCCAAT
+TACGCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_779
+GGACGTTCGGGCTTAGCCGGTCCCGCTTTTTATGGTCTTTTCCACGTAAACGCAGTTGGT
+TTTATATCCATTGTTCAAATAGCCGTAAGCGGTGGTTCAGGAAATGTTTTAGAATAGGTT
+GTTACAGAATACGCTGTGGGACGTCGAGGAGTATTAATTTGCGGACGTGCTGAGGCGGAA
+GTTTTTGCGGACGTGCTGCTCCTTAGATAG
+>ds2020-267_780
+CAGCACGTCCGCAATAGCATGTAGCTGGTTGAGTAAGATTATTTTCCTAATGCTTTTCTG
+AATATGTCAAGCAAAGAGAAAGGTGACCTTTCCATAAAGAAATTCATGTGCCTTTATATC
+ATGGGCATCTTTGATGAGAAGCTTATGTGCCCAAGTGTTGGGCAAGTCTTATTTATTTAT
+TTATTTCCTAGGACACTTGAGGACGTGCTG
+>ds2020-267_781
+GACGCACTGACCGTGCGAAAGGCCCTTAATTACGGTCAGTGCGTCAGGGAACTAGGAACG
+GTCAGTGCGTCAGGGCAATAGAGACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAATC
+ATAGAGTATTGTTGTTGGGACGTGCTGAGGAAAAATTACTTGCGGACGTGCTGAGGATAA
+GTTGCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_782
+GGAGTGGCTGGAATACAGACGTGGCCGGGGCAACTCGAGTTCAGAAGTGTCCTCTTCCGA
+TCTATATAAGGAGCAGCACGTCCGCAAAGATCCGGGAGTATTTGGGACGTGCTGAGCCAT
+AATGTATTGCGGACGTGCTGACTCGAGCCCTTTTGCGGACGTGCTGCTCCGTAGATACGC
+TTAAGGCGACGCACTGAGCGTGGGGGCTGG
+>ds2020-267_783
+GACGCACTGACCGTCATTTGATTTCTACCAGTTCAACTAATGAGGAAAGGGTAGGAAGCA
+ATGTGAAAACCAGGCCTAGAGTTTTCGATAGCAAAAAGAGGCTTATACGTTATTCTGGGA
+TGCTTCGAACCTGTGTTTTGCAAGGGTCTTTGAATGAGGGGAAGGCTATTCATGGGCAGG
+GAGTAGAAAACGGGAAACGGTCAGTGCGTC
+>ds2020-267_784
+GACGCACTGACCGTCTCCACGGCTTTTAACACGGTCAGTACGTCAGGCGTTTATATGCGG
+TCAGTGCGTCACGTCACCAGGTGCGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAA
+GTTAAGGCAGTTAGGTTGGGACGTGCTGAGGGGTCTACCGTTGCGGACGTGCTGCCCCTG
+CAACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_785
+CAGCACGTCCGCAAGCGGATAACATTGGACGTGCTGACTGCTTGATAGTTGCGGACGTGC
+TGGGCCAAGGTTATTGCGGACGTGCTGCTCCTTAGATATCCCTTGACGCACATCTAAGGA
+GCAGCACGTCCGCAATTATTTGCACCTCAGCACGTCCGCAAATTACACTCGCTCAGCCGT
+CCCAAGCCGATTGTTGTTGCGGACGTGCTG
+>ds2020-267_786
+GGACGTTCGGGCTTCCTCCACTCGCTCAAAAAACATACTGCAAGCAAGGCCCAGTGGTCC
+GTGCGTCGATGCACTTGCTTGTATCCGCAAGCGTCTGACACCTTCATCACCTGCCACAAG
+CCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAAAGGGCAATACCTCAGCACGTCC
+GCAACAAGTGTGCCTCATTGCGACGTGCTG
+>ds2020-267_787
+GACGCACTGACCGTATTCAAATCCGTGACGCACTGACCGCTTGATGAGACCTACGCACTG
+ACCGTGTTAATCCATAGACACACGGTCAGTGCGTCGCCTTAAGCGATAAGGAGCAGCACG
+TCCGCAACCCAACCCCCCTAGCTAGGCGCCCTATCCGAATGCCATGAGATTTGCGGACGT
+GCTGAGGACATAGAACTTGCGGACGTGCTG
+>ds2020-267_788
+GGACGTTCGGGCTTCTGTCTCTCCTTGATAAATGGGCTTAGCCACCACGTTGTGAGTCAA
+GTTATTACCAAATCTTACCCCCATGATTAAGCCCGAACGTCCTTACTTCCAGAGGAGCAG
+CACGTCCGCAACACACTGGTCTTATGTTGGGACGTGCTGAGGGCGAATAACTTGCGGACG
+TGCTAGGGGTTAGGGGTTGCGGACGTGCTG
+>ds2020-267_789
+CAGCACGTCCGCAACCCGACTCCTATCACTTTTCAAAAATACAATCTTACTCCCCGAAAG
+CCGAAAAATATGAGTGAGAGGAGAGCCTACGAACCCCTACTTCATCACAAATATCTCAAA
+GCCTCCGCAGCTCACCCACACGAAGAAGACGGCAGATCCCTAAAAGCGGCGAAACACAGC
+ACACACCAAATCCATGTTGCGGACGTGCTG
+>ds2020-267_790
+CCGCAAAGATAATGGCCTCAGCACGTCCGCAAACATCATCACCTCAGCACGTCCGCAACT
+AACTCCGACTCAGCACGTCCACAATCATGTTTTTGCGGACGTGCTGCTCCTAGATACACT
+GACCGTAGCGTATGGGTTGAAAAGACGGTCAGTGCGTCAGGGGCGATCACACGGTCAGTG
+CGTCAGGGTGGATAGAACGGTCAGTGCGTC
+>ds2020-267_791
+CAGCACGTCCGCAAATGTTAACCCGTCAGCACGTCCGCAAGCCGCCCGCCCTCGCACGTC
+CGCAATCGTGTCTAGTGTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCA
+CTGACCGTTTTCTTCTACCTGACGCACTGACCGTTCATCAACGCCTACGTGTCGGTCAGT
+GCGTCAAGGTAACCACACGGTCAGTGCGTC
+>ds2020-267_792
+GACGCACAGACCGTCGTTAAGGGGATCCTTACGGTCAGAGCGTCAATAGATAAATCACGG
+TCAGTGCGTCAGGGGATGGGCTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAG
+CACGTCCGCAAGATGGTGGCGGTATTTGGGGACGTGTGAGGGTCGTGGAGTTGCGGACGT
+GCTGAGCTAAAAGTACTTGCGGACGTGCTG
+>ds2020-267_793
+TCCGCAAAGAAAGCCCCCTCAGCACGTCCGCAATCGTCACACGCTCAGCACGTCCCAATC
+TATAGGCCCCAGCACCGTCCGCAATATCGAGTCTGTTGCGGACGTGCTCTGGAAGTAAGG
+ACGTTCGGGCTTATCACCCCAAATGAAGCCCGACGTCCAGGGAGAAATTAAAGCCCGAAC
+GTCCAGGGAGGTTAGGAAGCCCGAACGTCC
+>ds2020-267_794
+AAACTTCGCACCCTCAGCACGTCCGCAAATTCGGCCTCCTCAGCACGTCCGCAAGGGTTG
+TAACTTGCGGACTACGGCGACCACCGAGGTCTACACATAGAGGTACACTGTGTCGCTAGA
+CGAGGGTTTTCCGATCTGTCGGGGGAGCAGCACGTCGCAAGTGGAGTGTTATTGCGGACG
+TGCGAGACGTGCTGTGTGGGGGGCGTGGTG
+>ds2020-267_795
+CAGCACGTCCGCAAACTCCTTTTCCTCATCTCATTAAGTTCTCTGATACAACACGTAAAC
+GCTCTAATTTTAATGATTATTTTATGATCCTATCTTTTCTTTTAACTTTGACTTTTTATT
+ACGACCAATTTTATTGTTTTATTGTTCGACAAAAGGTTCATTTATATACAATAATCGGAT
+TGTAGCGGGTTTAGTTTGCGGACGTGCTG
+>ds2020-267_796
+CAGCACGTCCGCAAGCCTTGTTCATTTGTTTCATGATGAGGCGATAGATGAGCGTTAGCT
+CCTCAATCGGGATGCGAACTTTCTCGCGTCCAATGACCTCCCGGAATTTCTTTCTGGCAG
+GTTCTGCCACCCACCTAGGCAGGTAACCCATGTTTCTCGTTTGAGAGAAACCTCCCATGG
+TATAGACCCTGAAGATTGCGGACGTGCTG
+>ds2020-267_797
+CAGCACGTCCGCAATTAGCCCTCCTTTAGAAAGGAATCTCCCCTACCATATATATATTTT
+TTCCTCAAATAAAAAGGTGACATGACAAAAATAGAAATAAAAATAAAAAGGTGCCAAATG
+TGCATCCAATCAATTTCTCATTACTGACGAACAAAATCAAAGAAACTACAGATTTCATTT
+GAAACCCTGAATAGATTGCGGACGTGCTG
+>ds2020-267_798
+CAGCACGTCCGCAACCCGGTCTGGCTATCTCTATCAATATTATAAAGTTTCTTGGTGGTT
+CAGTGCCTCCAGTCCCAAGCGGGGCTGGCCGAGATTCATTTCAGCCGAATCTTTCACTTC
+GACTCGATACTTGGTGAAGGATAGTTGCGACGTGCTGAGGAACAGAGGTTTGCGGACGTG
+CTGACGGTGTGGTATTTGCGGACGTGCTG
+>ds2020-267_799
+CCGATCTATCTAGGAGCAGCACGTCCGCAATGGTATTCCCCTCAGCACGTCCGCAAAAGC
+AATCCCCTAGCACGTCCGCAACGTGCTGGTACTCAGCACGTCCCAAGTTTAAGCACCTCC
+GGACCTTTGCGGACGTGCTAGGGGATTGCTTTTGCGGACGTGCTGAGGGGGCGGATATTG
+CGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_800
+GGACGTTCGGGCTTTTTCCGACCCCTGGACGTTCGGACTTCGACACCCAAGCCCGAACGT
+CCTACTTCAGGGCACGTCCGCAAACATGTCCCTGTCATATTGCGGACGCTGAGGGGCTTT
+GGCTTGCGGACGTGCTACCTCGAAATCGTTGCGGACGTGCTGAGGCTAATCCAATTGCGG
+ACGTGCTGCTCCTTAGATAGATCGGGAGA
+>ds2020-267_801
+TATCTAAGGAGCAGCACGTCCGCAACGCGTTATACCTCAGCACGTCCGCAATTCTCACAC
+GCTTTCCCTTGGGACGTGGAGGGCGGAGTCATTGCGGACGTGCTGAGGCAGGTCCTTTTG
+CGGACGTGCTGGATGACCATATGCTTGGGACGTGCTGATGGAGATATTGTTGCGGACGTG
+CTGAGGCAGGTCCTTTTGCGGACGTGCTG
+>ds2020-267_802
+GACGCACTGACCGTAACACAGCGCCTAACGCACGGTCAGTGCGTCAGCAAATTTCATACG
+GTCAGTGCGTCAGGTGGTGATGTACGGTCAGTGCGTCAGGAGGTAACCTACGGTCAGTGC
+GTCGCCTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGACATGAGTTCTCCACGTCCCAA
+CACACCCTGAAACATTTGCGGACGTGCTG
+>ds2020-267_803
+GACGCACTGACCGTCAAGATGATCATTAAAACGGCAGTGCGTCAGGAGGCAATACACGGT
+CAGTGCGTCAGCTACAATCACACGGTCAGTGCGTCAGGGGTATCGCTACGGTCAGTGCGT
+CGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCACGAGACTTGATTGGGACGTG
+CTGAGGAGTATGTCATTGCGGACGTGCTG
+>ds2020-267_804
+GACGCACTGACCGTTATGATTCTGCTGACGCACTGACCGTCCTCTCCCACATGACCACTG
+ACCTGTCTACACGCAAACGCACGGTCAGTGCGTCGCCTTAAGCGCGTCCGCAATCACACC
+TCTGTATTGCGCAGGAACTCACCTTGCGGACGTGCTGACTGAATGTTTGTTGCGGACGTG
+CTGAGAGGAAACGCGTTGCGGACGTGCTG
+>ds2020-267_805
+GGACGTTCGGGCTTGAAACTTTGGGTGAGTTGGTCTTTGTTAAAGAGTTTGGGGATATAT
+TTTAGAGCAGCAATGGCGTTAAGGGGTTGGTTGTACCATGACATAGGGTAGTCCTCAAAG
+CCCGAACGTCCTTACTTCCAGTGCACGTCCGCAATCTCTAGACTGTGGGGATTGGGACGT
+GCTGAGACCGTTATTTTGCGGACGTGCTG
+>ds2020-267_806
+GTCCGCAAAGCTTCCCCCTCAGCACGTCCGCAACCATCATGCCCTCAGCACGTCCGCAAA
+GAAGACGCCCTCAGCACGTCCGCAACTATAAACCCCTTTTTTTTTGCGGACGAATCTAAG
+GAGCAGCACGTCCGCAACGGTTTCAGCTTGGGACGTGCTGGGGCATTTTGTTTGCGGACG
+TGCTGGCCGGGATTATTGCGGACGTGCTG
+>ds2020-267_807
+CCGCAATGCATATTTCCTCAGCACGTCCGCAATTCAAACTCGCTCAGCACGTCCGCAAGT
+TTAATCCTCTCAGCACGTCCCAACGGATAGGCTTTGCGGACGTGCTAATCTAAGGAGCAG
+CACGTCCGCAAAGCTTTCCCGATCAGCACGTCCGCAAACCTCTTTCCCTCAGCACGTCGC
+AATACCCGTGGGCTCTTGCGGACGTGCTG
+>ds2020-267_808
+GTAAGGACGTTCGGGCTTCACACCACACTTGGCGTTCGGGCTTTCAAGATGGGGGGACTT
+CGGGCTTACAGGCGCGAGTAGAAGCCCGAACGTCCTTACTTCCAGTAGCACGTCCGCAAA
+CTAAGAACTGTTGGGACGTGCTGACGGAGAACATATTGCGACGTGCTGAGGGTTCTGTTA
+TTGCGGACGTGCTGAGTGAAAGGCCATTG
+>ds2020-267_809
+CAGCACGTCCGCAACTAACCACCCCTTTCTGTAACATAACTACACATCCAGTACCACATT
+GAATCAGCGTCCGTCCAGTCTATGTTCTCATCGCCTTCGTACAAGGCGTCGTTTCCGCTG
+GTAGTTCTGGTGCTTAAGTTTTGGAGCTGGACGCCTGGCACCTTGACGTCGAAGTTGAAC
+GAGGTGGTCGTATTTGCGGACGTGCTGC
+>ds2020-267_810
+CAGCACGTCCGCAATCTCTCCACTTCCCTCCTAGAATGGAAAGCCGCTTTCGGGGGAGAA
+CTCTTGCTCACAGGCTCCCCGAAACCAAGAGACGAGACAGAAGATGCATAAGATGCAGAG
+GATACTATGGATTCAGGGTGAGCCCCTATCCTATGTCTAGGAGTAGAGAAGAGAGCACCT
+TCACCCGGACTTCATTGCGGACGTGCTG
+>ds2020-267_811
+TTCCCGCACCATTTATCTCTTTTCCTTGGACATAAAGTCGCCTTACAGATGGACCCATCC
+CCTTCGGACATACAGCAATTACACTGATGTTCTTGGGGAAGTCAAGACCCACTGACTGCA
+AATGCCCTAAAAGGAAACCATGGGAAAGGCCCAGTATACTATTGGGCTTCATGTGTGAAA
+ATACTTTCTCATAATTGCGGACGTGCTG
+>ds2020-267_812
+CAGCACGTCCGCTATGTTTAACCACTCCTGTAATAATTGTTGAGCTATTTAGTCAATATT
+TGGCTTCTGTGCATAGTTACCCACATTACGCAGAGCCACTTTATGCCTCCAGTGATCATT
+TAGGACCACCACTCCTCCTTCTATTCCTCTAAGTTCAAATGTTGACCTCTGTACCGGGCT
+CAATCAGTATCATTGGCGGACGTGCTGC
+>ds2020-267_813
+GACGCACTGACCGTCGCCTATCTCCTTATCCACCCTATCCTTATCAAAGTTATTCTCAAG
+TGGTTTATTAAGACTACCTACGAGGGACAAAATGACGGTCAGTGCGTCAGGTAAGTGACT
+ACGGTCAGTGCGTCGCCTAAGCGTCAGCACGTCCGCAAGGTCCACTGGTTGCGGACGTGC
+TGAGGGCTACCTTATTGCGGACGTGCTG
+>ds2020-267_814
+CAGCACGTCCGCAAACCATTGTCTATTGCGGACGTGTGAGCTTTTGCCCATTGCGGACGT
+GCTGGGGACGAACAGTTGGGACGTGCTGAGAGCGATCGGATTGCGGACGTGCTGCTCCTT
+AGATATCCGCAACTATTCAGGGTTTGGGACGTGCTGAGGATGTGCAGGTTGCGGACGTGC
+TGAGGGCATGCTAATTGCGGACGTGCTG
+>ds2020-267_815
+CAGCACGTCCGCAAAGCCGAAGAAGTTATCATGGACGAGCCACATGCAGGGAAACTTGCA
+CGTGTGGTTCTGGCCGGGCTTTCCTGAGGTATCTAATAACCTTGCTTCTGCTCGCCGCTG
+GCGCACCTCTCCTAACTATTGCCCATTTATACTGGAATAATCTTTTTAGGAGGGACAATT
+TTACATATTTCTGCCAAATACTTCTATT
+>ds2020-267_816
+CAGCACGTCCGCAATTTGAATGCCCTCAGCACGTCCGCAACGTTTCCCGCCCAGCACGTC
+GCAAGCTATCACTCATGTTTTGCGGACGTGCTGCTCCTTAGGATTCGCTTAAGGCGACGC
+ACTGACCGTCGTTCATCTGGTGACGCACTGACCGTCCTTTTTGCCGTGACGCCTGACCGT
+GTACCCATCACATAACGGTCAGTGCGTC
+>ds2020-267_817
+CAGCACGTCCGCAATGTCCAGTAAGTGGCATTAGGACAATATAAATCCAGCCTAAAACAC
+GTTCCCAACCAGGGGTAGGGCGCTGTGGGCCGTAATCATTATTGCCTTCTGTACCTTTTG
+CCGCAAAGAGATAGATCATAAAAATCAGGTCTAAGGCGGGGATCTGCATACGTAAAGATA
+GCCACCCTGTATTCTTGCGGACGTGCTG
+>ds2020-267_818
+CGATCTATCTAAGGAGCAGCACGTCCGCAATGATGAAGCCGTACGTCTATGCCAAGCCAA
+CCGCAAGTTTTTAATCCCCAGTCTACCAATAAACCTGCCACCCATCATCAAGCCAACCGT
+AAAGACACGTCCGCAATCTTGATCTTGTGGACGTGCTGGGGGGGCTTCGTTGCGACGTGC
+TGACCGATCAACCTTTGCGGACGTGCTG
+>ds2020-267_819
+GGACGTTCGGGCTTGTATTGTGGGCTGGTTGAGCTGGGCAAGGGTAGGTTGTTTGGGGTT
+TTGCATCGGTGAGGTGCTACTAGCAACACTCGAGGCAAGCTCTGGCTGTTTGGCGAGCGG
+TTGTCCTGTTTTTGGGTCAGTGACGACAACTTGCGGTGCTGCATGGGTCAGGCTTGTCAC
+CTACCAGGAGCAGGAAGCCCGAACGTCC
+>ds2020-267_820
+CAGCACGTCCGCAAACAGACCGGTCTAGATTTGGGACGTGCTGAGCGACTGAGATTTGCG
+GACGTGCTGAGCGAGCCGCTATTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACG
+CACTGACCGTCGATGGGCATCTACGGTCAGTGCGTCAGCAGTAACAACACGGTCAGTGCG
+TCAAGGGTGCTCACACGGTCAGTGCGTC
+>ds2020-267_821
+AGACCGCAGACGGGAGTGTCCAGAGCGCATGGAGGCCAGACGCGTGCTCTTCCTATCTAT
+CTAAGGAGCAGCACGTCCGCAATCCGCGTCCCCTCAGCACGTCCGCAATCAAACACGCTC
+AGCACGTCCGCAAAGCTTTGATCCTCAGCACGTCGCAACATGAAGAGGGTGGACTTGCGG
+ACGTGTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_822
+CAGCACGTCCGCAAAGGATGGCACCTCAGCCCGTCCGCAAAATGTCTGGGTTATTGCGGA
+CGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGAAGGCTCCCTTGACGCA
+CTGACCGTGTCCTGGACCTTGACGCACTGACCGTCTTGAAACCCCTGACGCCTGACCGTA
+ATACCCAAGCTTGTACGGTCAGTGCGTC
+>ds2020-267_823
+GGACGTTCGGGCTTTACATTGAGGTTGCGATTGTACTTGTGACTCATGGTTGGTGGATTG
+GTTAGCTAATGCTTGGGCGTTGGCTAGGGTTTGTGCTGGTCGATTTTCTTGTTTTACCAC
+CAAATAATTAATGCAGGTGTGTGGCCAAGCCCGAACGTCCTTACTTCCAGATGCGACGTG
+CGAGGGGAAGGCAGTTGCGGACGTGCTG
+>ds2020-267_824
+GACGCACTGACCGTTTCCTGACCCTTGACGCACTGACCGTATGTAGAGCACTGACGCACT
+GACCGTACCGTCACCCATGCTACGACGGTCAGTGCGTCGCCTTAAGCGTCTAAGGAGCAG
+CACGTCCGCAAGCTATCCGGGGTAGCACGTCCGCAATACACACTGGGCAACGTCCGCAAC
+ATACAGGATTTCGCTTGCGGACGTGCTG
+>ds2020-267_825
+GGACGTTCGGGCTTAGGTTACGGATTGAAGCCCGAAGTCCAGGGTGTCTGACAAGCCCGA
+AGTCCAGGGGAGGCTCAAGCCCGAACGTCCTTACTTCCAGCGTCCGCAATTCTACCAACC
+TCAGCACGTCGCAATGCTCGTTGGGTGATTGCGGACGTGCGAGGAGATGGGCATTGCGGA
+CGGGGGGTGACTTTTTGCGGACGTGCTG
+>ds2020-267_826
+GACGCACTGACCGTGTCACCCTTACTCAGACGGCAGTGCGTCAGGGAGCGATCTACGGTC
+AGTGCGTCAGCCAACAACATACGGTCAGTGCGTCGCCTTAAGCGCTGGAAGTAAGGACGT
+TCGGCTTACTGACCCCTATCGAGAAGCCCGAACGCCAGACCATACAAGTTGCGGACGTGC
+TGATTGTGATCAAGTTGCGGACGTGCTG
+>ds2020-267_827
+CAGCACGTCCGCAAACGTTTCCGGGTAGCACGTCCGCAACAGTAATCAATTGCGGACTGC
+TGAGTACTTTGGACTTGCGGACGCCTGGAAGTAAGGACGTTCGGGCTTGCCAGTCTGGGG
+GACGTTCGGGCTTACGAGTGGCTGTAAGCCCGAAGTCCAGGCCCAAGAGCAAGTCGAACG
+TCACCCCTAATTCTAAGCCCGAACGTCC
+>ds2020-267_828
+GACGCACTGACCGTACCTACCTGGCTGACGCACTGACCGTCTCGGGTCCTCTGACGCACT
+GACCGTATTAGGGGACGTCGCACGGTCAGTTCACGTCCGCAAACGTTATGCACTCAGCAC
+GTCCCAATGTTGACCTGGTGAGCCTTGCGGACGTGCTGCCCGTTATTGTTGCGGACGTGC
+TGACTAGGTCGATTTTGCGGACGTGCTG
+>ds2020-267_829
+CAACTGTTTTGGCCTCAGCACGTCCGCAATCAAATCCCCCTCAGCACGTCCGCATTCCAG
+TAAGCTCAGCACGTCCCAACCTCGGGATCTTGCGGACGTGCTGCTCCTTAGTCGCTTAAG
+GCGACGCACTGACCGTTTATACCTCCCTGACGCACTGACCGTATTGGTTTCTCTGACGCA
+CTAACCGATTCTGCACGGTCAGTGCGTC
+>ds2020-267_830
+GGACGTTCGGGCTTGATGGTTAAGGTAAAGCCCGAAGTCCAGGCAACTCGGAAGCCCGAA
+GTCCACCAGCCTATAGAAGCCCGAACGTCCTTACTTCCAGAGTCCGCAATCGGTTGGGCT
+TGCGGACGTGTGACCGGCTTGAAGTTGCGACGTGCTGAGTGAAAAAGGTTTGCGGACGTG
+CTGAGTGATTGGTATTGCGGACGTGCTG
+>ds2020-267_831
+CAGCACGTCCGCAAATATTAGGGGTTCATAGTTGCGGAGCTGAGGCGAAGGGTATTGCGG
+ACGTGTGAGACCATTGGCCTTGCGGACGTGCTGCTCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTTCAGGTACCCCTGACGCACTGACCGTTAGCTTCTCGCTGACCACTGACCGTTT
+AGATAGCTATGTGCACGGTCAGTGCGTC
+>ds2020-267_832
+CAGCACGTCCGCAAACCCTTGCTTGTCCACGTACGCAAGTTAATTGGGTCAGCATTGGGA
+CGTGCTGAGGCGAGCCACATTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGT
+TCGGGCTTGCCTGCATCACTGGCGTCCGGGCTTTACATCTATCCTGGCGTTCGGGCTTCC
+ATAGTCCCATCTCAAAGCCCGAACGTCC
+>ds2020-267_833
+CAGCACGTCCGCAAATGAGGTTCGCTAATTTCTGCAGGAACAGGGAAGGTGGCTTAGAAA
+CCAGCCATTGAGAGAATAATGATACAACAAACAAACACTAATTGGACAATACTAGAAAAA
+ACCATGAATACGGAGCTCAAACCTGATTAAACTTTGAAAGCTGATCAACAGCATCATTTC
+CACCCAGTGCCGGTTGCGGACGTGCTG
+>ds2020-267_834
+CTCTCCCGATCTATCTAAGGAGCGCACGTGCGCAACAGGCCCCCCCTCGGAAAGAGAGGG
+ATTCGAACCCTCGGTACGAAAAACTCGTACAACGGATTAGCAATCCGACGCTTTAGTCCA
+CTCAGCCATCTCTCCCACGTCCGCAAATCCGGGTCGGTATTTGCGGACGTGCTGAGGGTC
+GTATAATTGCGGACGTGCTGCTCCTTA
+>ds2020-267_835
+CAGCACGTCCGCAATCGGCGCACACTCAGCACGTCCGCAAAGTGGTTTGGGTACAATCTA
+AAAAAAACGATTCCACATGAGGGAGAACCGGACAATTTCCCTCTTGAGTAATGGGAAATG
+GGAAGCGGGCTAGTCCCCGAAAATGCTCGTTAAAGTTGGGGGTTACAATTCACCCTGTGA
+CTAATTCCTTCGGTCGCGGACGTGCTG
+>ds2020-267_836
+GGACGTTCGGGCTTAACAACCCCCTTGGACTTCGGGCTTGCCTGTTCACCTGGACGTTGG
+GCTTTATTGTTGCGATGAAGCCCGAACGTCCTTACTTCCAGTATCTAGGAGCAGCACGTC
+CGCAAGTGAAGCCGACTGAAATTGCGACATGCTGAGGGCCAGTAGATTGCGGACGTGCTG
+AGGGCCCGGTGGTTTGCGGACGTGCTG
+>ds2020-267_837
+CAGCACGTCCGCAACAGGAAGTTCTTAACCGTTGTTCCTGTGGTGCTGTACTTGATAGCC
+TCACACACAACTGACTACCAGCACCCGATGCTCTTTTTCAACAGTCTTGCAGTCATTGTG
+CTAGTTATTGCCAAATTCTCCAATATGCACAAAGTCCGGATCTTCGGAATCAATGGAGAT
+AAGGAGTTGGGCCTTGCGGACGTGCTG
+>ds2020-267_838
+CAGCACGTCCGCAAAGACTTACCCCTCAGCACGTCCGCAAGAACCATGCCCTCAGCACTC
+CGCAATCTGATCTCGGTGTAAGCTATTGCCACGTGAACGTGTCGAGCGCTTGCTAGATGC
+CGGTACGCCATTTTTGGAAGTCTCACCGATGGCAGCGTATGGCATGTATGATGCCGATAT
+CACGGGTAACGGCTTGCGGACGTGCTG
+>ds2020-267_839
+GGACGTTCGGGCTTCGAACAACCCTTGGCGTTCGGCTTACAACCCTCCATGAAAGCCCGA
+ACGTCCTTAAGCACGTCCGCAAGACTTGACTACTTCCGCAAACCTTTGAGCCTCAGCACG
+TCCGCAACGTAACAGGGATACATTGGGACGTGCTGAGGCTCAAAGGTTTGCGGACGTGCT
+GAGGGCTCAGACCTTGCGGACGTGCTG
+>ds2020-267_840
+AATTTCTAGCCCCTCAGCACGTCCGCAAGTTGGCACACCTCAGCACGTCCGCAACCATAC
+CCAGTTCAATTTGCGGACGTGCTGAGCGGTGAGGATTTGCGGACGTGCTGAGACGTACAT
+GGTTGCGGACGTGCTGCCGGGTACCGTTTGCGGACGTGCTGAGCGGTGAGGATTTGCGGA
+CGGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_841
+CAGCACGTCCGCAATTTCCACTGGTTAGCACGTCCGCAAAAGATCTTACCTCACACGTCC
+GAAACCCCAGCACGTCCGCAATTTCCACTGGTCAGCACGTCCGCAAAAGATCTTACCTCA
+CACGTCCGCAACCCCAGCACGTCCGCAATTTCCACTGGTCAGCACGTCCGCAAAAGATAT
+GACTTCACACGTCCGGAACCCCTTGCA
+>ds2020-267_842
+GACGCACTGACCGTCGAAATGTGGATCAACACGGTCAGTGCGTCAGGAAAACAGCGACGG
+TCAGTGCGTCAGGGGTATAGTCACGGTCAGTGCGTCGCCTTAAGCGTACGTCCGCAACAG
+TATGCCCTTAGCGTTGGGACGTGCTGACGGAATTGTGGTTGCGGACGTGCTGAGGTAGGA
+CCGCTTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_843
+CTATCTAAGGAGCAGCACGTCCGCAACAAGACTACACTCGCACGTCCTCAAAAGTGTTAG
+GGTGTCCCAGCACGTCCGCAATAAGACTACACTCGCACGTCCGCAAAAGTGTGAGGGTGG
+CCCAGCACGTCCGCAATAGGACTACACTCGCACGTCCGCAAAAGTGTGAGGGTGGCCGAC
+TTGCGGACGTGCTGCTCCTTAGATAGA
+>ds2020-267_844
+TGCCGCAAGTACAGACGTATCCCCATCCGCTCTATCTAAGCATCAGCACGTCCGCAAAGA
+TTATGGCCTCAGCACGTCCGCAAGACACATTCCCTCACACGTCCGCAACGGATAGGCCAT
+CTAAATTGCGGACGTGCTGCTCCTTAGATACGCTTATGGCGACGCACTGACCGTTGAAGT
+CGAGGTATCGATTGTTTCTCCTTCGCA
+>ds2020-267_845
+GACGCACTGACCGTAGTATTGTCGCTCTGACCGTACTACAGGGCTTTTTACGGTCAGTGC
+GTCACGGGTCCAGTACGGTCAGTGCGTCAGGCCCAAACAGACGGTCAGTGCGTCGCCTTA
+AGCGGTCCGCAAATTGCTGCCTTTGGGACGTGCTGAGGGATCACTGATTGCGGACGTGCT
+GAGGGAGTTGCACTTGCGGACGTGCTG
+>ds2020-267_846
+TACGCACTGACCGTGTCATCATGGTTACGCCTGACCGTTGTATAGACCCTGACGCTGACG
+CACTGACCGTGTCATCATGGTGACGCCTGACCGTTGTATAGACCCTGACGCTGCCGTACA
+AGTTCGGGGCTACGGTCAGTGCGTCGCCTAAGCGTATCTAAGGAGCAGCACGTCGCAAGG
+CAGAATCGATTTATTGCGGACGTGCTG
+>ds2020-267_847
+GACGCACTGACCGTAGTTCCACCCCTACACACACGGTCAGTGCGTCAGGGCTAGAGGGAC
+GGTCAGGGCGTCAGGATAGGGCAAACGGTCAGTGCGTCAAGGGTAGCTAAACGGTCAGTG
+CGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCGCAAACTCAAGCCCCTCAGCCGTCCC
+AAATGTATACTGGTTGCGGACGTGCTG
+>ds2020-267_848
+TCCGCAATTCTCCCGGCTTAGCACGTCCGCAACTGTTGGTCACTCAGCACGTCCGCAATA
+TCGAGCACCTCAGCACGTCCCAACAGAGACCCAATTGCGGACGTGCTGGAAGTAAGGACG
+TTCGGGCTTTAGACTCCCCCTGGACGTTCGGGCTTCAGGCTCTCCTTGGACTTCGGGCTT
+AACTCTTCCCGGAAAGCCCGAACGTCC
+>ds2020-267_849
+GACGCACTGACCGTGACGTTACCCCTGACGCACTGACCGTGGAATTAGCCCTGACGCACT
+GACCGTAACAATGCCCTTGACGCACTGCCGTATTTACTGGACTAGCAACGGTCAGTGCGT
+CGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATTGCGAGTCCGTCAGCACGTCCGC
+AACTGGCCCATGATTGCGGACGTGCTG
+>ds2020-267_850
+GACGCACTGACCGTTTAACTCGTCCTGACGCACTGACCGTTATCGTGCCCCTGACGCACT
+GACCTTACAATAAGAGCGACGGTCAGTGCGTCGCCTTAAGCGTATCTAGGAGCAGCACGT
+CCGCAAACCATATGTCTTAGCAATTGGGACGTGCTGAGGAATGCAGGCTTGCGGACGTCT
+GACGGGCGAATATTTGCGGACGTGCTG
+>ds2020-267_851
+TCTAAGGAGCAGCACGTCCGCAAATAACTTGGGATTGGGACGGCTGACTGGGGGCGTTTG
+CGGACGTGCGAGTGATAATGTGTTGCGGACGTGCTGCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTTACTTTTCCCCTGACGCACTGACCGTTAAAAATCTTCTGACGCCTGACCGT
+CAAGAGGTCGGTGACGGTCAGTGCGTC
+>ds2020-267_852
+CAGCACGTCCGCAAATGCGTTTACCTCAGCACGTCCGCAATCTCATGGGTGTTGCTTCGC
+TTAAGGCGACGCACTGACCGGAGTTACAGCTTTAGGTATCAGCACTATGGCTTTCAACTT
+AAATGGTTTTAATTTCAATCAATCTGTAGTTGATAGTCAGGGTCGTGTAATTAATACTTG
+GGCTGATATTATTAACCGGGCTAACCT
+>ds2020-267_853
+CAGCACGTCCGCAAGGTTTAATTCCTGTTAGTTGCGACGTGCTGAGTGATGTTTAATTGC
+GGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTGCTTCTAGGGGTGAA
+TAACGGCAGAGAGGCAACGGGACGGTCAGTGCGTCAAGGGGCACCGAACGGTCAGTGCGT
+CAGTGGGGAATGGACGGTCAGTGCGTC
+>ds2020-267_854
+GGACGTTCGGGCTTACACTTTTCCCTGGACGTTCGGGCTTAGTGGACCCTTGGCGTTCGG
+CTTTCTATCGCCTGTAGCAAGCCCGAACGTCCTTACTTCCAGACGTCCGCAAGGCTTGAA
+CAGTCACGTCCAGGCGATTGGGGTAGATTTGCGGACGTGCTGAGGGTCAGGCCATTGCGG
+ACGTGCTGAGAGGGATACACTTGCGGA
+>ds2020-267_855
+TATCTAAGGAGCAGACGACTTAAGCGCCATCCATTTTAAGGGCTAGTTGTTTCGGCAGGT
+GAGTTGTTACACACTCCTTAGCGGTTTACAACTTCCATGTCCACCGTCCTGCTGTCTTAA
+ACAACCAACACCTAGGGCAGCACGTCCGCAAAACAGTTAGGCTGTATTGCGGACGTGCTG
+AGTGAGCCTCCCTTGCGGACGTGCTG
+>ds2020-267_856
+CAGCACGTCCGCAAGGACCATGGCATATTTAATTTAATTCTAAAGGAAAAGTGGCAAGAT
+GTGTGGCACTCTGCTGAGATGGAGAGTCTTGGTGATGATAATATCACAGGCTTACCGGAG
+TGGATGAAGCATATCACAGCCGAGGAGTTGGGGCAATCCGTGTTGGATATGACGGGGATA
+AATAGGCAGAGGTTGCGGACGTGCTG
+>ds2020-267_857
+CAGCACGTCCGCAAACACAGCACCCTAGCATAGCAAAAAATCCGCCACAGGGCAAAAGCT
+ATATGCAAAACTAAGTCTGTGCAATGGGCGAAGTCCCACTGACTAAGTGCGAGTTTTCGA
+CTTGATATTAATATTTCGCTAATGCTCCAAATTCCCACAAGTCAAAACCTCGGCAGGGGA
+TGGACAACACCTTGCGGACCGTGCTG
+>ds2020-267_858
+CAGCACGTCCGCAATAGACCCACCATTATAAATCCCCCCACCCAAACCAAAAAAATAAAA
+GCTTTTATATATATGAGTTTTTATATTTTCTGATCTGATTGAGAGTACTTGTTCTGTTTT
+CTCAGTAACTGCACTCTCTTTCCTCTTTTTCCCGCGCTTTAAAAATCCCAACTTTTTCTC
+ACCCCCCGCAATTTGCGGACGTGCTG
+>ds2020-267_859
+CAGCACGTCCGCAATCCCAGGTAGCTTGCTTACTTATTGCTTGCACTAAGGGCAAGCGGG
+CCTTGTCTAGGTTGGAGCTATGAAGCTTCCCTTATTATTATGAAAGGGTTGTTTACTTGC
+TTACTTGTTTTGTTAGAGTAAGGTAGCTTGCTTACTTAGTGCTTGCACTAAGGGGAAGGG
+GGGGGAGATACCTTGCGGACGTGCTT
+>ds2020-267_860
+GACGCACTGACCGTTCCGGAGTACCTAACAACGTATCTTCACAGACCAAGAACTACGAGA
+TCGCCCCTTTCATTCTGGGGTGACGGAGGGATCGTACCATTCGAGCCTTTTTTTTTCATG
+CTTTTCCCGGAGGTCTGGAGAAAGCTGCAATCAATAGGATTTTCCTAATCCTCCCTTCCC
+GGGGGGTGTTGTACGGTCAGTGCGTC
+>ds2020-267_861
+CAGCACGTCCGCAACCAAGATGCTATGTGCCCTTCCACTTTAAGGAGCTGTTTCCAGATG
+CGTGGTGTGCTTTGCAGTGAGAATTTGTTGGAATTTGAGGATTCTTCTGTTTCAGGGCTA
+TTGAAAACTCCATTGCCTTTTCGACACATCTCCTGTATGATATCATAATACCATGTGAGT
+ACGCGAGCACTGTTGCGGACGTGCTG
+>ds2020-267_862
+CAGCACGGCCGCAATCGAAGCCGGCTCCTTCGGTTGACGTGACCGGAGGCGCTAAGCCTC
+TGGTCATACAAGCGTATAGCTTCCTCAATGACACATCGATTTGTGTCGACAAGTACGGCA
+TGAGTCTTACCCATGCTGCAGAGGCGCTTGATGCGCTGAAACGAGACCCTGATGAGGGAA
+AAAGACTCGTGGATGCGGACGTGCTG
+>ds2020-267_863
+CAGCACGTCCGCAATGCCTACGCCCTCCACAGGTAACAGATTAAAATCGTTTTATCCCCG
+AATTTTTCACGACTTTCGTTACAAAAAATTTGACTGAAAACGGCATTAATTTTGTAACCC
+TAAAACAACTGTCTAAATATAGCCCATCGATTTTTGAGCAGTTGTTTGATGATGAAACCC
+AATAAACGGAGATTGCGGACGTGCTG
+>ds2020-267_864
+GGACGTTCGGGCTTAGGCTAACCGCTGGACTTCGGGCTTGAAGGTGTGACTGGACTTGGG
+CTTATTGGAGGCAACAAGCCCGAACGTCCTTACTTCCAGTCACGTCCGCAAACGGTTTGG
+GTTGGGACGTGCTGAGGGGCAGTATTTTGCGGAGGACATAATGCATATTGCGGACGTGCT
+GCCCTAAGCCTTTTGCGGACGTGCTG
+>ds2020-267_865
+GACGCACTGACCGTCTACAGCCTCCTTAACACGGTCAGTGCGTCAGTTAAGTCCGAACGG
+TCAGTGCGTCCCCGAGAAACACGGTCAGTGCGTAGCACGTCCGCAAAAGTGAAGTTGTGG
+ACGTGCTGAGGGATACACAGTTGCGGACGTGCTGAAGGCATAACAGTTGCGGACGTGCTG
+AGGCAATAATACTTGCGGACGTGCTG
+>ds2020-267_866
+GACGCACTGACCGTTTTCTACCCCATAGACAACGGTCAGTACGTCAGGCCTGAGATAACG
+GTCAGTGCGTCAGGGAATTACCTACGGTCAGTGCGTCAGGCATTATGCGACGGTCAGTGC
+GTCGCCTTAAGCGAGGAGCAGCACGTCCGCAAATAACGAGGGGTAGGTTGGGACGTGCTG
+AGACATGTGTCCTTGCGGACGTGCTG
+>ds2020-267_867
+CAGCACGTCCGCAACAGGGAACAGATTATTAAAAGTATTTAAAGCCAGTGAAGTAACACT
+CATTGCCTTTATGGGTGAAATAGCCGATTGTGTGGGTGATTATTCATCATTCCATAGCCT
+TATAACTGATGGGCTAGATGATGGCGAAATTCCTGTTACCAACTTACAGACCATTAACCA
+ACGCGCATTATTTTGCGGACGTGCTG
+>ds2020-267_868
+CAGCACGTCCGCAATGTCGTAATCGTCCCTTTCAGACCTTGCTGCAAACGCCACACTCGC
+AGCCGATATTGCTAACCCAAGCGAAGCGAGCTTTTATAATGTCAGCGAAGCGAGCTTTGC
+TAACGTCAGTGAAGAGAATTTGCTAAAAAACGCTGCTTAAACCAAGTTTCAGCCGATTGT
+CATTGGTAATCGTTGCGGACGTGCTG
+>ds2020-267_869
+CAGCACGTCCGCAAGTCTGCCCTCAGCACGTCGCAAGATAGGCGGGGTGGGTTGCTGCTA
+CCCGGTGTCCATTGCGGACGTGCTGCTCCTTAGATATCTAAGGAGCAGCACGTCCGCAAT
+ACCTGCCGTCTGTTGCGACGTGCTGAGGAAAGACGACTTGCGGACGTGCTGAGGTGTTTT
+GTTTGCGGACGTGTGCTCCTTAGATA
+>ds2020-267_870
+CAGCACGTCGCAACAGGTTCCGGATGTGCTGAGCCACTCCCAATTGCGGACGTGCTGCTC
+CTTAGATACGCACTGACCGTCTCTTGCCGACTCTCCCCTAGCTACTATCGTATAAAAGAT
+GAAAGGCATTAATCTTCAAAGGTTAGATGAAAGAATTGTGGTTGGCGATATGCCGTTAGA
+ATTACGTCCACTACGGTTAGTGCGTC
+>ds2020-267_871
+ATCTAAGGAGCAGCACGTCCGCAAATATTTTGTCCTCAGCACGTCCGCAAGTATCATCCC
+TTCAGCACGTCCGCAAGCCACCTCCTGTCAGCACGTCGCAAATCAACTGGCATGGCTTTG
+GGACGTGAGGAGCCGCCTATTGCGGACGTGCTGCTCATTAGATTAAGGACGTTCGGGCTT
+GGTTGCGGTTGAAAGCCCGAACGTCC
+>ds2020-267_872
+GGACGTTCGGGCTTGTGGGTCAAATTAAAGAAGCCAAAGAAGCCCAGGCCCGTGCCAACG
+CTGAAGCCTACAATGCGCAGGCAGCCTCAGAAGCCCGAACGTCCTTACTTCCAGACGTTA
+GGGTCATAGTTTTGCGGAGTGCTGAGGGAATTAGCTTGCGGACGTGCTGACGGATCTCGC
+ATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_873
+GAGTTTCGTTTTAGGTCGGGGAGTCCGCTGTCATTTATACTCGTACAGTGAGTTTTATCA
+TTGATTAACAGCTACACGTTAATGAAGAAGTTGGCTATACTATATTCTATTGATTGCCAA
+CATCCCACGGTCAGTGCGTCGCCTAAGCGTCCGCAAGTTGGCGCTGTTGCGGACGTGCTA
+GGGCTACCAGATTTGCGGACGTGCTG
+>ds2020-267_874
+CAGCACGTCCGCAATCTGGGAGGGTTGAGACCAAGCCAAGGGCAGGGGCCTAAAGTATCG
+AAAAGGCAAGGACTCCAAGAAGAAGCCAAGCCTGAGGCCAAGAAAAGCGAGTTCAAGATC
+AGGAGCCAAAGCGGGCCGAGAAGAAAGAAGGAAGGCTTCATCTGCTCCAAGCCCCTAAAG
+AGGCTCAGCGGGTAGCGGACGTGCTG
+>ds2020-267_875
+GGACGTTCGGGCTTAAATGTGGCGATGTGTTAAGCCCGAAGCCAGGGAAACAATAAAGCC
+CGAACGTCCAGGGGTTATTCCAAGCCCGAACGTCCTTACTTCCAGGGCACGTCCGCAATA
+TCCCCGACCTATTTGCGACGTGCTGAGGATTGAACGGTTGCGGACGTGCTGAGGTGGGCC
+CGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_876
+TATCTAAGGAGCAGCACGTCCGCAATACTCGCCTACTCAGCACGTCCGCAATGCCGTAGT
+TATCACACGTCCGCAAGCAAGAACGACATGTTGCGGACGTGTGATATCTAAGGAGCAGCA
+CGTCCGCAACAACAGGTCGGTTGTGCGGACGGCTGAGAGATTCATATTGCGGACGTGCTG
+AGCCAACACAGCTTGCGGACGTGCTG
+>ds2020-267_877
+GGACGTTCGGGCTTTGTTGAAACCCTGGACGTTCGGGCTTAATCATACCACTGGACGTTC
+GGCTTATCATATAGGTTACCAGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAGG
+TCGAATATATTGCCGTTGGTTTGCGGACGTGCTGAGGCAAACGTAATTGCGGACGTGCTG
+AGACGATAGGTATTGCGGACGTGCTG
+>ds2020-267_878
+TCTAAGGAGCAGCACGTCCGCAAATTCACAGGGCTCAGCACGTCCGCAACTTAATCCCTA
+TCAGCACGTCCCAATCTATCCCCCCTTACTTGCGGACGTGCTGCCGCTTAAGGCGACGCA
+CTGACCGTCCCCGAACCACTACGGTCAGTGCGTCAGGGGGAAAGATACGGTCAGTGCGTC
+AGGGGCAAAGCAACGGTCAGTGCGTC
+>ds2020-267_879
+GACGCACTGACCGTTTAGATTGCCCTGACGCACTGACCGTCTAATTATAGCTGACGCACT
+GACCGTAGATATGGACGTAAGGACGGTCAGTGCGTCGCCTTAAGCGTGGAGCAGCACGTC
+CGCAATCCCTAGCCCGTGATCATTGCGGACGTGTGCCCGGCCAAAGTTGCGGACGTGCTG
+AGGCATATTACTTTGCGGACGTGCTG
+>ds2020-267_880
+GACGCACTGACCGTACTCTTTATGCTGACGCACTGACCGTTTGTGTTTTCCTGACGCACT
+GACCGTAGTCCAGACATTACTAGACGGTCAGTGCGTCGCCTTAAGCGGATCTAAGAGCAG
+CACGTCCGCAAATGAGATCGATTGCGACGTGCTGAGTGGTTCGAACTTGCGGACGTGCTG
+AGTGGAATCGAATTGCGGACGTGCTG
+>ds2020-267_881
+GACGCACTGACCGTCATAGAGCAGTTAACGCACCCTCGTACGCCCCGTTCTACACGGTCA
+GTGCGTCAGTGGTTGTACAAGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACG
+TCCGCAAAAGAGGAGCGCTCAGCACGTCCGCAGTTGGTTCTCTCTCACACGTCCGCAAGC
+TAAATCCTCTGAGTTGCGACGTGCTG
+>ds2020-267_882
+GGACGTTCGGGCTTGCAAGGGCCCCTGGACGTTCGAGCTACCTCATGAAGCCCGAAGTCC
+AGGGTAGGTACTAAGCCCGAACGTCCAGGAGACAAGAAAGCCCGAACGTCCTTACTTCAA
+GCACGTCCGCAATGATACCGTCCCAGCACGTCCGCAATTTGTAATCCGTCAGCCGTCCCA
+ACTCTCATTTCGTTGCGGACGTGCTG
+>ds2020-267_883
+GGACGTTCGGGCTTTTGCAACCACCTGACAAGCCCGAAGTCCACGGAATGGCGTAAGCCC
+GAACGTCCAGGGATAGGACGAAGCCCGAACGTCCTTACTTCCAGACTAAGGAGCAGCACG
+TCCGCAACTGAACTCCCTCAGCACGTCCGCAAATGGCACCCCCCAGCACGTCCCAAATCC
+CCGGCTATTCCCTTGCGGACGTGCTG
+>ds2020-267_884
+CAGCACGTCCGCAACAAGTCATTTCTCTTGCGGACGTGCGAGAAACTGAACCTTGCGGAC
+GTGCTGCTCCTTAGATTATCTAAGGAGCAGCACGTCCGCAAACCTGTGTCCGTCAGCACG
+TCCGCAATTGAGTGGCCCCAGCACGTCCGCAAGGGGCAATCCATCAGCACGTCCCAATAC
+ACCCAGGATGCTTTGCGGACGTGCTG
+>ds2020-267_885
+CCGCAATAGAGTTGCACTCAGCACGTCCGCAATGCGATGTTACTCAGCACGTCCGCAATT
+GCTAACATCTTGCGGAGTGTGAGTGAGAGATCTTTGCGGACGACGCTTAAGGCGACGCAC
+TGACCGTCTACTTGGGGGTCTAGGTCAGTGCGTCAGGGTACTATCGACGGTCAGTACGTC
+AGCATCAGTATTACGGTCAGTGCGTC
+>ds2020-267_886
+CAGCACGTCCGCAATGCGCGGTCCCTCAGCACGTCCGCAATAAGGGTGGGGTCGTTGCGA
+CGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGCAAATCATCGGCTCTGTATTG
+GGACGTGCTGAGGTGTGTTGGTTGCGGACGTGCTGAGTGACGTAAAATTGCGGACGTGCT
+GCCTGATTCGATTTGCGGACGTGCTG
+>ds2020-267_887
+CAGCACGTCCGCAAACTCAAACCGGTATGATTGCGGACGTGTGAGGCGTACTGCTTTGGG
+ACGTGCTGGGGGTCTTCCTTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGT
+TCGGGCTTCCCTCATGCCCTGGACGTTCGGGCTTACACTCACCCGTGGCGTTCGGCTTCC
+AAGCAGTATACGAAGCCCGAACGTCC
+>ds2020-267_888
+GGACGTTCGGGCTTTCTTACCAACCTACAGAAGCCCAACGTCCAGGGGGGGAGTAAAGCC
+CGAACGTCCACCAATTCGTGGAAGCCCGAACGTCCTTACTTCCAGATAAGGAGCAGCACG
+TCCGCAATCACAGTACCCTCAGCACGTCCGCAACAACTGCCCCCTCAGCACGTCCCAACT
+ACCCTGCCTTTTTTGCGGACGTGCTG
+>ds2020-267_889
+CAGCACGTCCGCAATGACAAAGCCCTCAGCACGTCCGCAATCCTAGTCGCCTCAGCACGT
+CCGCAAAAATGCCGAGCTCGTTGCGGACTCGCTTAAGGCGACGCACTGACCGTTACCAGA
+GTCATAACGGTCAGGAGTGGCGCTTGGACGGTCAGTGCGTCCCCGAACGGTCAGTGCGTC
+AGGGGTATATCAACGGTCAGTGCGTC
+>ds2020-267_890
+CAGCACGTCCGCAATAAGACCCTATTGTTGCGGACGTGCTGAGCGAGGCGCCTTTGCGGA
+CGTGCTGCCCATAGCGTATTGCGGACGTGCTGCTCCTTAGACGCTTAAGGCGACGCACTG
+ACCGTTGGCGAGGGGTTATTACGGTCAGTGCATCAGCAAAACTGGAACGGTCAGTGCGTC
+AATTGGCCACTTACGGTCAGTGCGTC
+>ds2020-267_891
+GCAACTGCGTTACCCTCAGCACGTCCAATGGTACTCGACATCTGTTGCGGACGTGTATCT
+AAGGAGCAGCACGGCCGCAAGACTGATTCCCTCAGCACGTCGCAAAGCCGCTCAACTCAG
+CACGTCCGCAACTGCGTTACCCTCAGCACGTCCAATGGTACTCGACATCTGTTGCGGACG
+TG
+>ds2020-267_892
+TCAGCACGTCGCAATCTATCAGTGGTTCATTGCGGACGTGCTATCTAAGGAGCAGCACGT
+CGCAATCACTCCCCCCAGCACGTCCGCAACAGCATCTAGGTCAGCACGTCCGCAATCTGT
+AACCGGTCAGCACGTCGCAATCTATCAGTGGTTCATTGCGGACGTGCTATCTAAGGAGCA
+G
+>ds2020-267_893
+AGTGCGTCAGCGTACCCATCACGGTCAGTGCGTCAGCGGCTAAAACACGGTCAGTACGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCACTGACCGTGTCAATCCTGGTCTGTAC
+GGTCAGTGCGTCAGCGTACCCATCACGGTCAGTGCGTCAGCGGCTAAAACACGGTCAGT
+>ds2020-267_894
+TCTTCCGATCTATCTAAGAGCAGCACGTCCGCAATTATATCCAGGTATATTGCGGAAGTG
+CTGAGGTTGTCCGCCTTGCGGACGTGCTGACGGATTTAGGCTTGCGGACGTGCTGAGGCG
+TTATATGTTGCGGACGTGCTGCTCCTTAGATAGATGGGGA
+>ds2020-267_895
+CGATCTATCTAAGGAGCAGCACGTCCGCAAAACGCCATGTGTGACATTATTCGCCAACCA
+ACCATTGTACTTTGGTGCGCTGCTCCACACGCATTTGTGGGCTTTCAGGATGCTGAGGGG
+TCGGAACTTGCGGACGTGCTGCTCCTTAGATAGATCG
+>ds2020-267_896
+TACCTTTGCCGTGTTCACAGGGTTTCTGTGTCCTTTGCCGTGTTCACAGGGTTTCTGTGT
+CCTTGCCGTGTTCACAGGGTTTCTGTGTCCTTTACCTTACCTTTGCCGTGTTCACAGGGT
+TTCTGTGTCCTTTGCCGTGTTCACAGGGTTTC
+>ds2020-267_897
+ATCGAAGGAGCAGCACGTCCGCAACTGCTCTGCCCTGTCCGCAAAGACCATACGCTGAAA
+CTTGCGGACGTGCTGAGTCGGTACATATTGCGGACGTGCTGAGTGGCTCCTTTTTGCGGA
+CGTGCTGCTCCTTAGATAGATCGGAAAGAG
+>ds2020-267_898
+CAGCACGTCCGCAATTTTAATCGCCTCAGCACGTCCGAATGATTCGTCCCTCAGCACGTC
+CGCAACATGAACCCGGTGAGTCTTGCGGACGGGCTGAGGGACGAATCATTCGGACGTGCT
+GAGGCGATTAAAATTGCGGACGTGCTG
+>ds2020-267_899
+TATCTAAGGAGCAGCACGTCCGCAAACATATCGGCCTGACGTCCGCAATGCCTAACCTGT
+CTCATTTGCGGACGTGCTGAGCCGACACACTTGCGGACGTGCTACCCCATGACAATTGCG
+GACGTGCTCTCCTTAGATAGATCGGA
+>ds2020-267_900
+CAGCACGTCCGCAACAAGTGGCTCTTGAATTTTTGCTTACGCCAGTAACCTCAAAAACAG
+CATGAGATTACCAGAAAAAAAAGCCGGCCGACTGGCCGGCTTTTCGATTACATCACCAGG
+CGGCGAATGTCGCTCAGCATGT
+>ds2020-267_901
+GCAGCACGTCCGCAAATAGCCTTCCTTCACCTCTCAGAGGTAGTAACTGCATTGATCTTC
+AACCCCGTGATCGATTTGGTGTTGTCAGCGCCATTAGCTTGATTGCAAAAGCATCATGTT
+GGTGCCACACCCTGCCTTTCCA
+>ds2020-267_902
+TTATTGGGACGTGCTGAGGAAAGATAGATGCGGACGTGCTGACCGAGTCCCCCTTGCGGA
+CGTGCTGGGTACGTGCTGAGTCATTGATTATTGGGACGTGCTGAGGAAAGATAGATGCGG
+ACGTGCTGACCGAGTCCCCCTT
+>ds2020-267_903
+TATCTAAGGAGCAGCACGTCCGCAAAGGTCACGCCCCAGCACGTCCGCAATACATTTTCC
+CTCAGCACGTCGCAACAACCCCTCAACTCTTGCGGACGTGCTGCTCCTTAGATACGCTTA
+AGGCGACGCACTGACCGTCTCG
+>ds2020-267_904
+AGCAGCACGTCCGCAATCTCAATGCTCTCAAGTGCTAAGCTCTCAGCACGTCCGCCAGCA
+CGTCGCAATGGTTAGGGGATAGATGTTGCGGACGTGCTGAGAGCTTAGCACTTGAGAGCA
+TTGAGATTGCGGACGTGCTGCT
+>ds2020-267_905
+CAGCACGTCCGCAACGACCGTGGGCAGCACGTCCGCAACATATTACCGCTCACACGTCCG
+CAATCAGATAGCGTTTTATTTGCGGATGTGTGAGCGGTAATATGTTGCGGACGTGCTGCC
+CACGGTCGTTGCGGACGTGCTG
+>ds2020-267_906
+TCGCTCAGCACGTCCACAAAGTAACCACCTTACTATTGCGCAGCACGTCCGCAAGCTGCC
+GTTCCTCAGCACGTCGCAAATAAACTTCGCTCAGCACGTCCACAAAGTAACCACCTTACT
+ATTGCGCAGCACGTCCGCAAG
+>ds2020-267_907
+CAGCACGTCCGCAAGGAATAACCCGTCAGCACGTCCGCAAGGAGTGTCCGCTCACGTCCG
+CAACCAACCAGTCGTTTTTGCGGACGGTGAGCGGACACTCCTTGCGGACGTGCTGACGGG
+TTATTCCTTGCGGACGTGCTG
+>ds2020-267_908
+GCAGCACGTCCGCAAGGATTGTTCGGTCAGCACGTCCGCAAAGTATTACCCTCAGAACGT
+CCCAACCCCACGCCGTTGCGGACGTGCTGAGGGTAATACTTTGCGGACGTGCTGACCGAA
+CAATCCTTGCGGACGTGCTGC
+>ds2020-267_909
+CACAGTTATCTCAAATCCATCAACTGTTACAGAGTCAAAATAATTTTCATGTTCTCAGCA
+CGTCCGCAACCCGTCCCCACTCTTCACAGTTATCTCAAATCCATCAACTGTTACAGAGTC
+AAAATAATTTTCATGTTCT
+>ds2020-267_910
+TTTGCGGACGTGCTGCCGCAAGTGAATAGCTGTATCGTGGGACGGGACACCCCTAAGACA
+TTGCGACGTGCTGAGGGTGAACTCTTTGCGGACGTGCTGCCGCAAGTGAATAGCTGTATC
+GTGGGACGGGACACCCCTA
+>ds2020-267_911
+ATTCCCTCAGCACGTCCGCAATGTGTTCTCCCTCAGCACGTCGCAAAAGTCAAGGTTTGT
+TGCGCAGCACGTCCGCAAGGCGAATTCCCTCAGCACGTCCGCAATGTGTTCTCCCTCAGC
+ACGTCGCAAAAGTCAAGG
+>ds2020-267_912
+TGAATGTCCCTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAAAGTCG
+CTGAAGGTCATGGAACAGAGGATACCGAGATTGTGAAGGAGCTGAGTGTCGCCGAAGGTC
+ATTGCGGACGTGCTG
+>ds2020-267_913
+TCAGCACGTCCGCAAAAGAAATAGGCTCAGCACGTCCCAACCCATTAATTATTGCCAGCA
+CGTCCGCAAAACATATACCCTCAGCACGTCCGCAAAAGAAATAGGCTCAGCACGTCCCAA
+CCCATTAATTATTGC
+>ds2020-267_914
+ACTCCAGCCACTCAGCACGTCCCAATAGCCCACTTGAGTCAGCACGTCCGCAAGCTCATA
+TAACTCAGCACGTCCGCAAACTCCAGCCACTCAGCACGTCCCAATAGCCCACTTGAGTCA
+GCACGTCCGCAAGC
+>ds2020-267_915
+TGCGTCCGATTGGCCTATGAACGGCAGTGCGTCAGGTGGAATTGTACGGTCAGTGCGTCA
+GGCATCTAAGGACGGTCAGTGCGTCCGATTGGCCTATGAACGGCAGTGCGTCAGGTGGAA
+TTGTACGGTCAGTG
+>ds2020-267_916
+CCCTATCTAAAACTTCTATTTGAAAAACTAGATCACCCAGGTCTGCACGGTCAGTTGCGT
+CAGCAATTAAGTTTCTCACCCTATCTAAAACTTCTATTTGAAAAACTAGATCACCCAGGT
+CTGCACGGTCAGT
+>ds2020-267_917
+CTGAGGGAAATAGTCTTGCGGACGTGCTGAGGGCAGAATGATTGCGGACGTGCTGACCGG
+GAATACCTTGCGGACGTGCTGAGGGAAATAGTCTTGCGGACGTGCTGAGGGCAGAATGAT
+TGCGGACGTGCTG
+>ds2020-267_918
+CTTGGGACGTGCTGAGAGAAATGCCGTTGCGGACGTGCTGAGGGTATACAGGTTGCGGAC
+GTGCTGAGTGGACCGAACTTGGGACGTGCTGAGAGAAATGCCGTTGCGGACGTGCTGAGG
+GTATACAGGTTG
+>ds2020-267_919
+GCTGAGGGAGTGCCCTTTGGGACGTGCTGAGGTGTGATTCGTTGCGGACGTGCTGAGCAG
+ATGTAGGTTGGGACGTGCTGAGGGAGTGCCCTTTGGGACGTGCTGAGGTGTGATTCGTTG
+CGGACGTGCTG
+>ds2020-267_920
+TCAACACGGTCAGGCGTCAGACAAAGAGATACGGTCAGTGCGTCAGGTGATCCCCCACGG
+TCAGGCGTCAGAGCATTCAACACGGTCAGGCGTCAGACAAAGAGATACGGTCAGTGCGTC
+AGGTGATCCCC
+>ds2020-267_921
+GCAAGGTAACCCTCCTCACACGTCCGCAATTCTAGGAGCCTAGCACGTCCGCAAGACTGT
+ATCCCTCAGCACGTCCGCAAGGTAACCCTCCTCACACGTCCGCAATTCTAGGAGCCTAGC
+ACGTCCGCAAG
+>ds2020-267_922
+GACAGTGTAGGACTTGCGGACGTGGAGACCGGAACATTTGCGGACGTGCTGGACTAACTA
+CTCCTTGCGGACGGCTGACAGTGTAGGACTTGCGGACGTGGAGACCGGAACATTTGCGGA
+CGTGCTGGACT
+>ds2020-267_923
+GCAAATGCCTATCCCTCAGCACTCCGCAATCCCATTGACGCAGCACGTCCGCAAGATAAC
+CCACCTCAGCACGTCCGCAAATGCCTATCCCTCAGCACTCCGCAATCCCATTGACGCAGC
+ACGTCCGCAAG
+>ds2020-267_924
+AACAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCCTTA
+ACCCTCAGCACGTCCGCAAAGGTCTCCGGCTCAGCACGTCCCAACATCCGTTTGCTCTTG
+CGGACGTGCTG
+>ds2020-267_925
+CAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATATACTGCC
+TTTATATTGGGACGTGCTGAGGGAACACGTCTTGCGGACGTGCTGAGGGTATGCGTTTTG
+CGGACGTGCTG
+>ds2020-267_926
+GCCCTCAGCACGTCCCAATCATACATCTCTCAGCACCTCCGCAAAGCGCACTCTCCAGCA
+CGTCCGCAATGGTGAGCCCTCAGCACGTCCCAATCATACATCTCTCAGCACCTCCGCAAA
+GCGCACTCTC
+>ds2020-267_927
+ATTGCGGACGTGCTGACGGACTCTACATTGCGGACGTGCTGCCGTTTGTTTATTGGGACG
+TGTGAGTGTGGGCTTATTGCGGACGTGCTGACGGACTCTACATTGCGGACGTGCTGCCGT
+TTGTTTATTG
+>ds2020-267_928
+GCACGTCCGCAACAGATGTCCCCTCAGCACGTCTGCAAGAACGCCTCCAGCACGTCCGCA
+ACTTGCTAGACCTCAGCACGTCCGCAACAGATGTCCCCTCAGCACGTCTGCAAGAACGCC
+TCCAGCACGT
+>ds2020-267_929
+TTGAACTTGCGACGTGCTGAGGGCCTAGGATTTGGGACGTGCTGAGGGGGAATTCCTTGC
+GGACGTGCTAGGGGTTTGAACTTGCGACGTGCTGAGGGCCTAGGATTTGGGACGTGCTGA
+GGGGGAATTC
+>ds2020-267_930
+ATGGTCAATACATCACGGAAGGCGCCGTATTTGCGGACGTGCTGGCAGCGCGCATAGGTA
+GATTTTCCCAAACAAATGGTCAATACATCACGGAAGGCGCCGTATTTGCGGACGTGCTGG
+CAGCGCGCAT
+>ds2020-267_931
+CTTTTGCGGACGTGCTGCCCGCAATTCACTCCCAATTTATTGAGGTGTTGTCAATGGGAC
+GTGTGACGAGATTGCTTTTGCGGACGTGCTGCCCGCAATTCACTCCCAATTTATTGAGGT
+GTTGTCAAT
+>ds2020-267_932
+CTTGCGGACGTGCTGCCGGGTTCTGATTGGGACGTGTGAGGAGAGAAACTTTGGGACGTG
+CTGAGTGCCTTCCTCTTGCGGACGTGCTGCCGGGTTCTGATTGGGACGTGTGAGGAGAGA
+AACTTTGGG
+>ds2020-267_933
+CAATATACATTCCCTCAGCACGTCCCAATTAGACAGCCCAGCACGTCCGCAAAGTAGGGG
+TCCTCAGCACGTCCCAATATACATTCCCTCAGCACGTCCCAATTAGACAGCCCAGCACGT
+CCGCAAAGT
+>ds2020-267_934
+CTGAGTAGTCTGTCTTTGCGGACGTGCTGGGTCAATCTGTTGGGACGTGCTGAGGTAGAC
+TCAGTTGGGACGTGCTGAGTAGTCTGTCTTTGCGGACGTGCTGGGTCAATCTGTTGGGAC
+GTGCTGAGG
+>ds2020-267_935
+TCGGCAGCACGTCCGCAAAAAATCCACACTCAGCACGTCCGCAACTATTTTCGGGCAGCA
+GTCCGCAAGCTGATTCGGCAGCACGTCCGCAAAAAATCCACACTCAGCACGTCCGCAACT
+ATTTTCGGG
+>ds2020-267_936
+GATTAGAGCCCCTGTATTGCGGACGTGCTGCGCAAACACATCCTCCTAGCACGTCCGCAA
+CGATCAACCCTTATGATTAGAGCCCCTGTATTGCGGACGTGCTGCGCAAACACATCCTCC
+TAGCACGTC
+>ds2020-267_937
+CCACTTCCTCTCAGCACGTCCGAAACATATTGCAGTCAGCACGTCCCAATCATCCGGGGC
+AGCACGTCCGCAACCCACTTCCTCTCAGCACGTCCGAAACATATTGCAGTCAGCACGTCC
+CAATCATCC
+>ds2020-267_938
+TGGCCCCACTATTGCGACGTGCTGAGAGTTTATTAGTTGCGACGTGCTGAGGCGGGAACA
+CTTGCGGACGTGCTGGCCCCACTATTGCGACGTGCTGAGAGTTTATTAGTTGCGACGTGC
+TGAGGCGG
+>ds2020-267_939
+GGACGAAATACGGTCAGTGCGTCGGTCTACTACGGCAGTGCGTCAACAATGAGATCACGG
+TCAGTGCGTCAGCGGACGAAATACGGTCAGTGCGTCGGTCTACTACGGCAGTGCGTCAAC
+AATGAGAT
+>ds2020-267_940
+TAAGGGGTCACACTCCAACAGTGATTCGCTTGCGGACGTGCTGAGGCAATTTGGCCAGCA
+CGTCCGCAAATAATAAGGGGTCACACTCCAACAGTGATTCGCTTGCGGACGTGCTGAGGC
+AATTTGGC
+>ds2020-267_941
+GTGCTGGGCTTAAGTTGCGGACTGCTGAGTCGTAACAGATTGCGGACGTGCGAGAGAGTC
+TCCATTGCGGACGTGCTGGGCTTAAGTTGCGGACTGCTGAGTCGTAACAGATTGCGGACG
+TGCGAGA
+>ds2020-267_942
+GGACGTGCTGCCCATTGTTTTGCGGAGTGCTGAGGGTAACCGTTTGCGGAGTGCTGAGGG
+ATACAGCTTTGCGGACGTGCTGCCCATTGTTTTGCGGAGTGCTGAGGGTAACCGTTTGCG
+GAGTGCT
+>ds2020-267_943
+CGTCCCAAACATGAGCCAGCACGTCCGCAATTGGTAACCCCTCAGCACGTCCGCAAGTAT
+GAACCCTCAGCACGTCCCAAACATGAGCCAGCACGTCCGCAATTGGTAACCCCTCAGCAC
+GTCCGCA
+>ds2020-267_944
+ATTGCGGACGTGTGAGAAGTGCGTTCTTGCGGACGTGCTGAGTAGATGTTGGGACGTGCT
+GAGGAATGTCGTATTGCGGACGTGTGAGAAGTGCGTTCTTGCGGACGTGCTGAGTAGATG
+TTGGGAC
+>ds2020-267_945
+CAGCACGTCCGCAACCAGTTCCCCTCAGCACGTCCGCAATTTCTTGCCACTCAGCACGTC
+GCAACTATTCCCCAGCACGTCCGCAACCAGTTCCCCTCAGCACGTCCGCAATTTCTTGCC
+ACTCAGC
+>ds2020-267_946
+CCGTCATTTTGCGACGTGCTGAGGGATAACAATTTGCGGACGTGCTGAGTTATAACGGTT
+GCGGACGTGCTGCCGTCATTTTGCGACGTGCTGAGGGATAACAATTTGCGGACGTGCTGA
+GTTATAA
+>ds2020-267_947
+ACCGGTACTGACGCACTGACCGTTAACCTGACCCTGACGCCTGACCTACTTACATGACAC
+ACTGACCGTCGTACCGGTACTGACGCACTGACCGTTAACCTGACCCTGACGCCTGACCTA
+CTTACAT
+>ds2020-267_948
+GCCTTGCGGACGTGCTGGGTTTGTTTGGGACGTGCTGAGGGAGATCTGTTTGCGGACGTG
+CTGAGGAGATGAGCCTTGCGGACGTGCTGGGTTTGTTTGGGACGTGCTGAGGGAGATCTG
+TTTGCGG
+>ds2020-267_949
+GCAAAACCAGTTCACTCAGCATGTCCGCAACTAGGGCAGCACGTCCGCAATACCCAGTGG
+CTCAGCACGTCCGCAAAACCAGTTCACTCAGCATGTCCGCAACTAGGGCAGCACGTCCGC
+AATACCC
+>ds2020-267_950
+GGCTGAATATGACGGTCAGTGCGTCCCTGAATACGGCAGTGCGTCACGGAAGTCTGTACG
+GTCAGTGCGTCAGGCTGAATATGACGGTCAGTGCGTCCCTGAATACGGCAGTGCGTCACG
+GAAGTCT
+>ds2020-267_951
+TTCAGGGCTCACACGTCCCAATGGTTTCTCCCTCAGCACTCCGCAATCTGGAACCCAGCA
+CGTCCGCAATTTTTCAGGGCTCACACGTCCCAATGGTTTCTCCCTCAGCACTCCGCAATC
+TGGAACC
+>ds2020-267_952
+CGTCCCCACTCAGCACGTCCGCAATATGCTCTACCTCAGCACGTCCCAACTGACCCAGCA
+CGTCCGCAATACGTCCCCACTCAGCACGTCCGCAATATGCTCTACCTCAGCACGTCCCAA
+CTGACC
+>ds2020-267_953
+GTTATGGCCTCGCACGTCCGCAAAACTCCCTATCTCGCACGTCGCAATAATCTGGCAGCA
+CGTCCGCAATTGTTATGGCCTCGCACGTCCGCAAAACTCCCTATCTCGCACGTCGCAATA
+ATCTGG
+>ds2020-267_954
+GCAATCATAGAGCTATTGCGGAAGCGAGTCTGTCTTGCGGACGTGCGACGAGTGTGGAGT
+TGCGGACGTGGGCAATCATAGAGCTATTGCGGAAGCGAGTCTGTCTTGCGGACGTGCGAC
+GAGTGT
+>ds2020-267_955
+AGGGAGTTGCGACGTGCTGACGGAATTACGGTTGCGGACGTGCTGAGGAAAAGTACGTTG
+CGGACGTGCTGAGGGAGTTGCGACGTGCTGACGGAATTACGGTTGCGGACGTGCTGAGGA
+AAAGTA
+>ds2020-267_956
+ACATTCCCTCAGCACGTCCGCAAGATTGTACGCCTCAGCACGTCCCAAATTCGGCAGCAC
+GTCCGCAAGTTACATTCCCTCAGCACGTCCGCAAGATTGTACGCCTCAGCACGTCCCAAA
+TTCGGC
+>ds2020-267_957
+GCACGTCCGCAATGAGTTCACCTTCAGCACGTCCGCATTAAAGCAGCCTCAGCACGTCCC
+AATTTCCCCAGCACGTCCGCAATGAGTTCACCTTCAGCACGTCCGCATTAAAGCAGCCTC
+AGCAC
+>ds2020-267_958
+GGCAAATTGGACGTGCTGAGTGAATGTGACTTGCGGACGTGCTGAGGAGTAGTCTCTTGC
+GGACGTGCTGGGCAAATTGGACGTGCTGAGTGAATGTGACTTGCGGACGTGCTGAGGAGT
+AGTCT
+>ds2020-267_959
+ATTTCTTGCGGACGTGCGAGGCCGATATTATTGCGGACGTGCGGGTTTAGGTTGGGACGT
+GTGAGGGTGAATTTCTTGCGGACGTGCGAGGCCGATATTATTGCGGACGTGCGGGTTTAG
+GTTGG
+>ds2020-267_960
+CCAAGTTCTTTTTCCTCAGCACGTCCCAACCGGCTCAGCACGTCCGCAAGTTGGAGTCCC
+TCAGCACGTCCCAAGTTCTTTTTCCTCAGCACGTCCCAACCGGCTCAGCACGTCCGCAAG
+TTGGA
+>ds2020-267_961
+ACCGTAGACCTCAGCACGTCCCAACCACTAATCCCTCAGCACGTCCCAACAGGTGCAGCA
+CGTCCGCAACACCGTAGACCTCAGCACGTCCCAACCACTAATCCCTCAGCACGTCCCAAC
+AGGTG
+>ds2020-267_962
+TCAGAGGTACGGAATAAGGTCAGTGCGTCAGAGTGAAACCAACGGTCAGTGCGTCGCGGA
+TTATCTACGGTCAGAGGTACGGAATAAGGTCAGTGCGTCAGAGTGAAACCAACGGTCAGT
+GCGTC
+>ds2020-267_963
+CAATCTCCCACGTCCGCAATCTAGTACAAGTCAGCACGTCCACACCAACCACCTAGACGC
+AGCACGTCCGCAATCTCCCACGTCCGCAATCTAGTACAAGTCAGCACGTCCACACCAACC
+ACCTA
+>ds2020-267_964
+TCCAAAACATAAGCCCTCAGCACGTCGCAACCTCTATCAGCACGTCCGCAACGCCTTAAC
+CCTCAGCACGTCCAAAACATAAGCCCTCAGCACGTCGCAACCTCTATCAGCACGTCCGCA
+ACGCC
+>ds2020-267_965
+AGGGGATTGGGACGTGCTGAGGCTAAAATGATGCGGACGTGTGAAGGACATGTAGTTGCG
+GACGTGCTGAGGGGATTGGGACGTGCTGAGGCTAAAATGATGCGGACGTGTGAAGGACAT
+GTAG
+>ds2020-267_966
+GATTGCGGACGTGCTGCCCGATGTTGGACGGTGAGGACCTAAGATTTGCGGACGTGCTGA
+GTACAACACGATTGCGGACGTGCTGCCCGATGTTGGACGGTGAGGACCTAAGATTTGCGG
+ACGT
+>ds2020-267_967
+CAGCACGTCCGCAATCTCTATCCCCTCACACGTCCGCAATCTGTAACCCCTCACACGTCA
+AATTGAGGCCAGCACGTCCGCAATCTCTATCCCCTCACACGTCCGCAATCTGTAACCCCT
+CACA
+>ds2020-267_968
+ATGCGGACGGGAGATGGATTTGATTGGGACGTGCTGAGGCCTAACTCCTTGCGGACGTGC
+TGCCCCATTATGCGGACGGGAGATGGATTTGATTGGGACGTGCTGAGGCCTAACTCCTTG
+CGGA
+>ds2020-267_969
+ATCCTTCTGCACTCGCACGTCGCAACTCACCCAGCACGTCCGCAATGGTTGATTACTCAG
+CACGTCCCAATCCTTCTGCACTCGCACGTCGCAACTCACCCAGCACGTCCGCAATGGTTG
+ATTA
+>ds2020-267_970
+GCTGTCCGATTGGGACGTGCTGAGCGACACTGAATTGGGACGTGCTGAGGAGACTAAGGT
+TGCGGACGTGCTGTCCGATTGGGACGTGCTGAGCGACACTGAATTGGGACGTGCTGAGGA
+GACT
+>ds2020-267_971
+ACTAGTAGTTGCGGACGTGCTGGGGAGAAATTGCGGACGAGCTTGGATACGTTGCGGACG
+TGTGAGGTACTAGTAGTTGCGGACGTGCTGGGGAGAAATTGCGGACGAGCTTGGATACGT
+TGC
+>ds2020-267_972
+CTGACTGAATACTTGTTGGGACGTGTGAGTGTCGGGGTCTTGCGGACGTGCTGGGGGGAT
+TGGGACGGCTGACTGAATACTTGTTGGGACGTGTGAGTGTCGGGGTCTTGCGGACGTGCT
+GGG
+>ds2020-267_973
+GGGCATTGCGACGTGCTGAGGTAATCTCTGTTGCGGACGTCTGAGTTATGAAAAATTGCG
+GACGTGCTGGGCATTGCGACGTGCTGAGGTAATCTCTGTTGCGGACGTCTGAGTTATGAA
+AAA
+>ds2020-267_974
+ATTGCGGACGTGCTGGGGGTTTATGTTGCGGACGGTCGTGTTGTTGCGGACGGCTGAGTG
+GATGTATATTGCGGACGTGCTGGGGGTTTATGTTGCGGACGGTCGTGTTGTTGCGGACGG
+CT
+>ds2020-267_975
+AAATGTTGCGGACGTGCTGCCTCGATTTGGATGTGAGGGATGGGAACTTGCGGACGTGTG
+AGCCAGTAAATGTTGCGGACGTGCTGCCTCGATTTGGATGTGAGGGATGGGAACTTGCGG
+AC
+>ds2020-267_976
+GTCTGAGTGTATAAAGGTTGCGGACGTGTGGGGTTCTGTACTTGCGGACGTGCTGGGGCA
+CTGGGACGTCTGAGTGTATAAAGGTTGCGGACGTGTGGGGTTCTGTACTTGCGGACGTGC
+TG
+>ds2020-267_977
+AATAGCGTCTCCCTCCACGTCGCAAAGCTCCAGCACGTCCGCAAGAACCATTCCTCACAC
+GTCCGCAATAGCGTCTCCCTCCACGTCGCAAAGCTCCAGCACGTCCGCAAGAACCATTCC
+T
+>ds2020-267_978
+GGCTTCCCTCAGCACGTCCGCAATTACACTCCAGTTAATTGAGGGCTCGCGGCTTGCGAC
+GTGCTGGGCTTCCCTCAGCACGTCCGCAATTACACTCCAGTTAATTGAGGGCTCGCGGCT
+T
+>ds2020-267_979
+TGGCGTGTGACCTCCACCCAAACCTTAACCAATACAGATAAATCCAGTATCGCGGACGTT
+CGGGCTTGGCGTGTGACCTCCACCCAAACCTTAACCAATACAGATAAATCCAGTATCGCG
+G
+>ds2020-267_980
+CAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCCAGCAC
+GTCCGCAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCC
+>ds2020-267_981
+CAGCACGTCCGCAATACCGTACACTTGCGGAGCCGAAGGTTATTGCGGACGTGTGCCTAG
+GCAGTCAGCACGTCCGCAATACCGTACACTTGCGGAGCCGAAGGTTATTGCGGACGTGTG
+>ds2020-267_982
+GGCAGTTGGGACGTGCTGAGGAAATTCTGATACGTGTGAGGAGGATTACATTGCGGACGT
+GCTGGGCAGTTGGGACGTGCTGAGGAAATTCTGATACGTGTGAGGAGGATTACATTGCG
+>ds2020-267_983
+TATCTAAGGAGCAGCACGTCCGCAAGTAGCTGGCTGTCAGCACGTCCGCAAGGTTGGATC
+CTCAGCACGTCCCAACCTGTATTGCCTCATGTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_984
+TATATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTTGACCCT
+TAAGTGATTCCAATCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCA
+>ds2020-267_985
+TCCGCAATTCGATTACTCTCAGCACGTCGCAATCCTGAACCCATGTAACTTGCGGCAGCA
+CGTCCGCAATTCGATTACTCTCAGCACGTCGCAATCCTGAACCCATGTAACTTGCGG
+>ds2020-267_986
+CAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCCCGCCA
+AAATTTTGCTAATCTCTCCTAGACAGGAGGCCAATTGCGGACGTGCTGCTCGTTAG
+>ds2020-267_987
+TCTCCTGGTTACCTCTTCCTCCCACTCCAGATTCTTTGCGGCAGCACGTCCGCAATCGGT
+TTCTCCTGGTTACCTCTTCCTCCCACTCCAGATTCTTTGCGGCAGCACGTCCGCAA
+>ds2020-267_988
+CTCCGCCAGCACGTCCGCAAGATCTAGCCTCTCAGCACGTCCCAAGCTAACCCCGCTCAC
+ACTCCGCCAGCACGTCCGCAAGATCTAGCCTCTCAGCACGTCCCAAGCTAACCCCG
+>ds2020-267_989
+GTCCGCAATTGCGAATGCCTCAGCACGTCCCAATATGAGGCAGGTAAAGTTGCGGCAGCA
+CGTCCGCAATTGCGAATGCCTCAGCACGTCCCAATATGAGGCAGGTAAAGTTGCGG
+>ds2020-267_990
+TTGCGGACGTGAGCAAGGAGGTTTTGCGGACGTGCTGAGCGCTTCGTAATTGCGGACGTG
+CGGCTGCTTAGATAGGGGGGATGAGCAGCTGTTTGAAGTCTAGTCACTCCGGAGA
+>ds2020-267_991
+CAGCACGTCCGCAAGTGCAAATCACTCAGCACGTCCGCAACTCAGCGACCCTCAGCGTCC
+GCAAACATATTACACTCAGCACGTCCGCAATTCCTTCTCGGCACACGTCCGCAA
+>ds2020-267_992
+GCAACCATACTATGCTCAGCACGTCCGCAAGACTTATCCCTCAGCACGTCCGCAAAGGGA
+AAGGCATTGGGACGTGTGAGAGTAGCCAGATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_993
+CGTGCTGAGGGGTAGTTATTTGCGGACGTGCTGGGGCCTATTTGCGGACGTGCTGGGGAC
+GTGCTGAGGGGTAGTTATTTGCGGACGTGCTGGGGCCTATTTGCGGACGTGCTG
+>ds2020-267_994
+TTTGCGGACGTGCTGACGTGAGGGGAACCTGGTTGCGGACGTGCTGAGAGTGTCCTGTTT
+GCGGACGTGCTGACGTGAGGGGAACCTGGTTGCGGACGTGCTGAGAGTGTCC
+>ds2020-267_995
+CCGGAACCTGGTGACCTTTGGGACGTGCTGAGACCTTGAATATTGCGGACGTGCTGCCGG
+AACCTGGTGACCTTTGGGACGTGCTGAGACCTTGAATATTGCGGACGTGCT
+>ds2020-267_996
+GTATTTGGCAACGAAGTCGGTTTCAGTCATGTTGACCAGATCTTTCATCAAGTCCGAGAC
+GGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGA
+>ds2020-267_997
+TCTTCCGATCTCTAAGGAGCAGCACGTCCGCAACGAGTACGTCGTCAGCACGTCCGCAAG
+TGTTATAGCCTCAGCACTTCCGCAATCCCACCCGTCTCCACGTCCGCAA
+>ds2020-267_998
+TTGCGGACGTGTGAGGTGAAGACGGTTGCGGACGTGCTGAGGCTAAAGGCGTTGCGGACG
+TGCTGAGGCAGGAAATATTGCGGACGTGCTGAGTACCTGCTATTTGCGG
+>ds2020-267_999
+TAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACAAGTACGAAAGATTGGGACA
+TTGCAGCCAACTGTACAAGATGGGCGTACCAGTTTTTCAATACAACT
+>ds2020-267_1000
+GATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTTGTTATCCC
+TGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAA
+>ds2020-267_1001
+GTCAAAACGATTCTAACGGTCAGTGCGTCATCGCGGTTCTAACGGTCAGTGCGTCAAAAC
+GATTCTAACGGTCAGTGCGTCATCGCGGTTCTAACGGTCAGTGCGTC
+>ds2020-267_1002
+TGAATGTCCCTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAATGTCC
+CTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAA
+>ds2020-267_1003
+TAGGGGTGTCCCGTCCCACGATACAGCTATTCACTTGCGGCAGCACGTCCGCAAATGACC
+TCCCCTCAGCACGTCGCAACACTAAAACATTATTGCGGACGTGCTG
+>ds2020-267_1004
+TTGCGGACGTGCTGAGGGATAAGTCTTGCGGACGTGCTGAGCATAGTATGGTTGCGGACG
+TGCTGAGGGATAAGTCTTGCGGACGTGCTGAGCATAGTATGGTTGC
+>ds2020-267_1005
+TATCTAAGGAGCAGCACGTCCGCAAGCCGAAGCCCTCAGCACGTCCGCAAAGACAGCACC
+TCAGCACGTCCGCAAGATCGTTGGGGCACACGTCCGCAA
+>ds2020-267_1006
+TCTCAAAAAGCCTATCGTAGTCCGGATTGGGATGTGATGCTAATCTCAAAAAGCCTATCG
+TAGTCCGGATTGGGATGTGATGCTAATCTCAAAAAGCC
+>ds2020-267_1007
+CACAGTTATCTCAAATCCATCAACTGTTACAGAGTCAAAATAATTTTCATGTTCTTCAGG
+AGATAGGTCATAATCCTGGTGTTTTGCGGACGTGCTG
+>ds2020-267_1008
+AACCATCCCTGTGCCGTTCTGTCCCTATCTCAATCCTTGAGAACCATCCCTGTGCCGTTC
+TGTCCCTATCTCAATCCTTGAGAACCATCCCTGTGC
+>ds2020-267_1009
+GGACGTGCTGGGGAGAGGCTATGCGGACGTGCTGACCCTTAGGTAATTGCGGACGTGCTG
+AGGGGAGCCAGGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_1010
+CAGACGCCTGTTCGCGACAGCGGACTAAGGAGCAGCACGTCCGCAACCTCTATTCCGTCA
+GCACGTCCGCAAATCTCGCCCTTCAGCACGTCCGCA
+>ds2020-267_1011
+AGCACTTTAAGCAGGGAGGAGAGGCTAATGGTTAAGTAAAGCACTTTAAGCAGGGAGGAG
+AGGCTAATGGTTAAGTAAAGCACTTTAAGCAGGG
+>ds2020-267_1012
+TCGAAGGAGTAGCACGTCCGCAAACACTTACCCCTTTTTGCGGACGTGCTGAGGGAGAAG
+TTGTTGCGGACGTGCTGAGGGAGAAGTTGTTG
+>ds2020-267_1013
+CTAAGGAGCAGCACGTCCGCAAAAACATACGGCTCAGCACGTCCCAACCTTCTCAGCACG
+TCCGAAGGCCCGCTTCCCAGCACGTCCGCAA
+>ds2020-267_1014
+CAGCACGTCCGCAACGGTGATACGCTCAGCACGTCCGCAATGTCCACAGCCTCAGCACGT
+CCCAATACTCTTCAGGCAGCACGTCC
+>ds2020-267_1015
+CAGCACGTCCGCAACTGTTGTTGACTCACACGTCCGCAAGAGCATACCCTCAGCACGTCC
+CAATGTACTAACGCTCAGCACGTCC
+>ds2020-267_1016
+AGGAGAGGGTAACGAAGTAGCTCGACTGAAAGGAGAGGGTAACGAAGTAGCTCGACTGAA
+AGGAGAGGGTAACGAAGTAGCTCGA
+>ds2020-267_1017
+GGACGTGTGAGTGGTTAAAACATGGGACGTGGAGTGAATTTTTGTTGCGGACGTGTGAGG
+TATCGACCTTTGCGGACGTGCTG
+>ds2020-267_1018
+TTGCGGACGTGCTGAGGGTTTATTATTTGCGGACGTGCTACCCAGTGAGTATTGCGGACG
+TGCTGCTCCTTAGATATATCGG
+>ds2020-267_1019
+TTGCGGACGTGCTGAGGGAGAAGTTGTTGCGGACGTGCTGAGGGAGAAGTTGTTGCGGAC
+GTGCTGAGGGAGAAGTTGTTG
+>ds2020-267_1020
+GTCCGCAATTTAAGTCACCTCAGCACGTCCGCAATTTAAGTCACCTCAGCACGTCCGCAA
+TTTAAGTCACCTCAGCACGTC
+>ds2020-267_1021
+CAGCACGTCCGCAATGAGGTCCGGGCAGCACGTCCGCAAACATGGGACATTGCGGATCTG
+GAAGTAAGGACGTTCGGGCTT
+>ds2020-267_1022
+GTGCTGGCGGGGATCACTTGCGGACGTGCTGAGGGAATTGGGCTTGCGGACGTGCGAGGG
+AAGGTCCTTGCGGACGTGCTG
+>ds2020-267_1023
+CCGCAACCTCCACTATCCACACGTCCGCAACCTCCACTATCCACACGTCCGCAACCTCCA
+CTATCCACACGTCCGCAAC
+>ds2020-267_1024
+CAGCCGTTTCTCAGGCTCCCTCTCCAGCCGTTTCTCAGGCTCCCTCTCCAGCCGTTTCTC
+AGGCTCCCTCTCCAGCCGT
+>ds2020-267_1025
+TGGACTTCGGGCTTGTCCCTCCAGTGGACTTCGGGCTTGTCCCTCCAGTGGACTTCGGGC
+TTGTCCCTCCAGTGGACTT
+>ds2020-267_1026
+TTGCGGACGGCTGAGCGCGGTTAATTGCGGACGTGCTGAGCGAACGAGATTTGCGGACGT
+GCTGACCGGTGGGAATTTG
+>ds2020-267_1027
+TTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCT
+TCGGCCTTCACCTTTCC
+>ds2020-267_1028
+CAGCACGTCCGCAACAACTTCCCCCTGCTTAAAGTGCTTTACTTAACCATTAGCCTCTCC
+TCCCTGCTTAAAGTGCT
+>ds2020-267_1029
+ATTGCGGACGTCTGAGGGAGAAGACTTTGCGGACGTGCTGACGAGTGTAACTTTGCGGAC
+GTGCTGCTCCTTAGATA
+>ds2020-267_1030
+CCCTTATTCTGCCAAGCCCGTTCCCTTATTCTGCCAAGCCCGTTCCCTTATTCTGCCAAG
+CCCGTTCCCTTATTCTG
+>ds2020-267_1031
+CTAATGCCACCATCCAATCCGCTAATGCCACCATCCAATCCGCTAATGCCACCATCCAAT
+CCGCTAATGCCACCAT
+>ds2020-267_1032
+TTATGAAAGGGCCTCGCAGCTCTTCAGTAGATCGATCTCAGCGGGTAAGAGACCGTGGAG
+TTTGCGGACGTGCTGC
+>ds2020-267_1033
+ATCTAAGGAGCAGCACGTCCGCAACTACACTTTCCTCAGCACGTCCGCAAATGAGCTTCC
+CTCAGCACGTCCGCAA
+>ds2020-267_1034
+TTGCGGACGTGCTGAGGGAATAATACTTGCGGACGTGCTGAGGGATAATGTTTTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1035
+ATCTAAGGAGCAGCACGTCCGCAAAGTCAATCATGTCAGCACGTCCGCAAAGTTCATTCA
+CTCAGCACGTCCGCAA
+>ds2020-267_1036
+TTGCGGACGTGCTGAGCGAGTAGCCCTTGCGGACGTGCTGAGTATGTGTCGTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1037
+TTGCGGACGTGTGAGAGGAAACAATTTGCGGACGTGCTGACGGGTAGGACCTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1038
+ATTGCGGACATGCTGGGCGGAGTAATTTGCGGACGTGCTGCCGAGCGCTTATTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1039
+TTGCGGACGTGCTGATCGAATGGAATTGCGGACGTGCTGGACTCGGCTTGGATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1040
+TTGCGGACGTGTGAGATAACTCGGGTTGCGGACGTGCTGAGAACCGTCACCTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1041
+TTGCGGACGTCTGAGCCTCAAGAGATTGCGGACGTGCTGAGGTGCTTTTCATTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1042
+ATCTAAGGAGCAGCACGTCCGCAAGATGACGCCCGGTAGCACGTCCGCAAGTGGGAGCCA
+CTCAGCCGTCCGCAAT
+>ds2020-267_1043
+TTGCGGACGTGCTGAGTAACAGAGTCTTGCGGACGTGCTGAGCGGCACAACATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1044
+TTGCGGACGTGCTGAGAGGATTACCGTTGCGGACGTGCTGAGGGATAGAATCTTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1045
+TCCGCAACCGTATATACCTCAGCACGTCCGCAATCGTTACTCCTCAGCACGTCCGCAATG
+TTAAACGCCTCAGCAC
+>ds2020-267_1046
+TCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGCTGCC
+TTTGCGGACGTGCTG
+>ds2020-267_1047
+TTGCGGACGTGCGAGTGACAATGGATTGCGACGTGCTGAAGGAGTAGTCCTTGCGGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_1048
+TATCTATGGAGCAGCACGTCCGCAACATGAATATACTCAGCACGTCCCAAGATGTCTTCC
+GTCACACGTCCGCAA
+>ds2020-267_1049
+TTGCGGACGTGGAAGCGTAAATCCTTGCGGACGTGCTGAGAGACATGGTGTTGCGGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_1050
+TTGCGGACGTGTGGGGCCAGACTGTTGCGGACGTGTGCAGCCGGGAAATATTGCGGACGT
+GCTGCGCCTTAGATA
+>ds2020-267_1051
+ATCTAAGAGCAGCACGTCCGCAAACCCATTACCCTCAGCACGTCCGCAACATGCCATCCC
+TCAGCACGTCCGCAA
+>ds2020-267_1052
+TAGCAAGGAGCAGCACGTCCGCAAGTTATTCGGCCTCAGCACGTCCGCAAGCCCTTTATG
+CCAGCACGTCCGCAA
+>ds2020-267_1053
+TTGCGGACGTGTGAGGTGGCTGGCGTTGCGGACGTGCTGAGGGCTAGAGTTTTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1054
+TTGCGGACGTGCTGAGGAGTGCAGTGTTGCGGACGTGTGAGGTGCTTTTTATTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1055
+TTGCGGACGTGCTGAGGGAGAAGAGTTTGGACGTGCTGAGGGGTGTCGCCTTGCGGACGT
+GCTGCTCCTTAGACA
+>ds2020-267_1056
+TTGCGGACGTGCTGAGGGGTAGTTCATTGCGGACGTGGAGGAGTGTGGGTTTGCGGACGT
+GCTGCTCCTTAGAGA
+>ds2020-267_1057
+TTGCGGACGTGCTGAGGCCTAACCATTTGCGGACGTGCTGGGGGAATCGCATTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1058
+TAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACAAGTACGAAAGATTGAGGAC
+TTGCGGACGTGCTG
+>ds2020-267_1059
+TGCGGACGTGTGAGGGTAGACATATTGGGACGTGCTGACTAAGGCAAGCTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1060
+TTGCGGACGTGCTGAGCCGTTACAGATTGGGACGTGCTGGGAGAACATAATTGCGGACGT
+GCTGCTCCTTAGAT
+>ds2020-267_1061
+ATCTAAGGAGCAGCACGTCCGCAAAATGGTTATGCTCAGCACGTCCGCAAGATACTACCC
+TCACACGTCCGCAA
+>ds2020-267_1062
+TTTGCGGACGGAAGGATTCTCGGTTGCGGACGTGCTGACGGGGAATCTCTTGCGGACGTG
+CTGCTCCTGAGATA
+>ds2020-267_1063
+TTGCGGACGTGCGCCAGTCAGTTATTGCGGACGTGCGACTGATGTGGCTTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1064
+TTGCGGACGTGCGACAAATATTAAATTGGGACGTGCTGACCCAGTTGCTTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1065
+CGGACGTGCTGAGACGTGACCGTTTGCGGACGTGCTGAGTGGTATGGTCTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1066
+TTGCGGACGTGGACTCAATCATTATTGGGGACGTGCTGAGCGGTTGCGGATTGCGGACGT
+GCTGCTCTTAGATA
+>ds2020-267_1067
+TTGCGGACGTGTGAGGGATAGTGTTTGCGGACGTGTGAGGGTTGCTAGATTGCGGACATG
+CTGCTCCTTAGATA
+>ds2020-267_1068
+TTGCGGACGTGCTGGGGGTGAAAGATTGCGGACGTGCTACCAGGTACCTCTTGCGGACGT
+GCTGCTCCTTAGAT
+>ds2020-267_1069
+ATTGCGGACGTGGAGAAGTACTAATTGCGGACGTGCGGGGGCCTCGCGTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1070
+CCAGACTCTTACCTTCCTCCAGACTCTTACCTTCCTCCAGACTCTTACCTTCCTCCAGAC
+TCTTACCTTCCTC
+>ds2020-267_1071
+TTGCGGACGTGTGGGTGGCAGAGATTGCGGACGTGCTGACCCCTATGCATTTGCGGACGT
+GCTGCTCCTTAGA
+>ds2020-267_1072
+TATCTAAGGGCAGCACGTCCGCAACGCGATTGCACTCACACGTCCGCAAGCCTCTTCCTT
+CACACGTCCGCAA
+>ds2020-267_1073
+CTAAGGAGCAGCACGTCCGCAAATCGTTATCCCTCAGCACGTCCGCAAAATGCATTACCT
+CAGCCGTCCGCAA
+>ds2020-267_1074
+TTTGCGGACGTAGGGAGCCGTAATTGCGGACGTGCTGACGAAACCTCCCTTGCGGACGTG
+CTGCTCTTAGATA
+>ds2020-267_1075
+GGACGTGCTGAGGGCCAACACCTTGCGGACGTGCTGAGAATATTAGATTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1076
+TATCTAAGGAGCAGCACGTCCGCAAAGATGGCCACCTCAGCACGTCCGCAAGTGTTATGT
+CCTCAGCACGTCC
+>ds2020-267_1077
+GGACGTGCTGAGTAGTAATAGCTTGCGGACGTGCTGAGGTAACTCACTTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1078
+TTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCACTCT
+TGCGGACTTGCTG
+>ds2020-267_1079
+GGACGTGCTGAGTGGGACCGTATTGCGGACGTGCTGAGTGATCCTATTTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1080
+GGACGTGCTGAGGGTCTACGAATTGCGGACGTGCTGAGGGGTAAGTGCTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1081
+TTGCGGACGTGCTGAGGCTATGGGGCTTGCGGACGTGCTAAGCGAGTAGTCTTGCGGACG
+GCTGCCCTTAGAT
+>ds2020-267_1082
+TTGCGGACGTGTGAGGGATTCAGAGTTGCGACGTGCTGAGAGCGGACACGTTGCGACGTG
+CTGCTCTTAGATA
+>ds2020-267_1083
+TTGCGGACGTGCTGAGGAAGAGGCTTTTGCGGACGTGCTGGGGTGAATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1084
+GGACGTGCTGAGGGAAAGACATTGCGGACGTGCTGACCGGTTGCCTATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1085
+TTGCGGACGTGGGGGCCAACCCTTGCGGACGTGCTGCCCATGACAACTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1086
+GGACGTGCTGAGGAGAGCGACCTTGCGGACGTGCTGAGTGTGTAACCTTTGCGGACGTGC
+TGCTCCTTAGAT
+>ds2020-267_1087
+TATCTAAGGAGCAGCACGTCCGCAACTCTGTGCACTCAGCACGTCCGCAACACACTTACC
+CTCGCACGTCCG
+>ds2020-267_1088
+GACGTGCTGAGCGGAAGATCTTTGCGGACGTGCTGAGGGGAACCGGATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1089
+GGACGTGCTGAGGAACGAACGATTGCGGACGTGCTGCCCTGAACACCTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1090
+GGACGTGCTGAGGGCAAAGCTATTGCGGACGTGCTGGGGGAACTTGCTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1091
+TATCTAAGGAGCAGCACGTCCGCAAGTGTGACGGGGCAGCACGTCCGCAAGTTACTCGCC
+CTCAGCACGTCC
+>ds2020-267_1092
+CGGACGTGCTGAGGGATCACTCGTTGCGGACGTGCTGAGGGGGAAAGTTTTGCGGACTGC
+TGCTCCTTAGAT
+>ds2020-267_1093
+GGACGTGCTGAGGAAGCTCGGATTGCGGACGTGCTGAGACCATAATAATTGCGGACGTGC
+TGCTCCTTAGAT
+>ds2020-267_1094
+AGTTGTATTGAAAAACTGGTACGCCCATCTTGTACAGTTGGCTGCAATGTCCCAACCTTG
+CGGACGTGCTG
+>ds2020-267_1095
+ATCTAAGGAGCAGCACGTCCGCAACATCCCGGCAGCACGTCCGCAAAATGGAGGCTCTCA
+CACGTCCGCAA
+>ds2020-267_1096
+TATCTAAGGAGCAGCACGTCCGCAACGATACTAACCTCAGCACGTCCGCAAGTTCTCCAC
+CCCAGCACGTC
+>ds2020-267_1097
+TTGCGGACGTGGAGGGTTTGGTAGTTGGGACGTGCTGAGGCGTATGACTTGCGGACGTGC
+TGCTCCTTAGA
+>ds2020-267_1098
+TATCTAAGAGCAGCACGTCCGCAAGGTAAGCCTCGTCAGCACGTCGCAAAGTTAAGTGCC
+TCAGCACGTCC
+>ds2020-267_1099
+GGACGTGCTGAGGTATCGCGGTTTGCGGACGTGCTGAGTAATCTACGTTTGCGGACGTGC
+TGCTCCTTAGA
+>ds2020-267_1100
+GGACGTGCTGACGGACTACTCCTTGCGGACGTGCAGGCGATCGTCATTGCGGACGTGCTG
+CTCCTTAGGTA
+>ds2020-267_1101
+TATCTAAGGAGCAGCACGTCCGCAAATGTGACCGGGTAGCACGTCCGCAACGCCTATTGA
+CTCAGCACGTC
+>ds2020-267_1102
+ATCTAAGGAGCAGCACGTCCGCAAATGACACTTCCTCAGCACGTCCGCAATACAGATCCG
+TCAGCACGTCC
+>ds2020-267_1103
+TATCTAAGGAGCAGCACGTCCGCAAGTCAATGGCCCTCACACGTCCGCAATAAGATATGC
+CTCGCACGTCC
+>ds2020-267_1104
+GACGTGCTGAGGGCTCACGACTTGCGGACGTGCTGAGTGGTAAGGCTTTGCGGACGTGCT
+CTCCTTAGATA
+>ds2020-267_1105
+ATCTAAGGAGCAGCACGTCCGCAAGGCCTCCCCACTCAGCCGTCCGCAATGGTCCTACCC
+TCAGCACGTCC
+>ds2020-267_1106
+GACGTGCTGATGGTCTGGTGATTGCGGACGTGCTGAGGAGTTAGGCTTGCGGACGTGCTG
+CTCGTTAGATA
+>ds2020-267_1107
+TCCGATCTACCTAAGGAGCAGCACGTCCGCAAATTCTAACTCTTAGCACGTCGCAAGTGG
+GCAGCACGTCC
+>ds2020-267_1108
+GCGGACGTGCTGCCCGGTAAAGCTTGCGGACGTGCTGAGCGGTGTAAGCTTGCGGACGTG
+CTGCTCCTTAG
+>ds2020-267_1109
+TTGCGGACGTGCTGGCGGACGTGCTGAGGTGAACAAATTTGCGGACGTGCTGCTCCTTAG
+ATAGATCGGA
+>ds2020-267_1110
+TCCGATCTATCTAAGGAGCAGCAGTCCGCAAGAATCATAGACTCACACGTCCGCAACGAT
+CAGCACGTCC
+>ds2020-267_1111
+TCTAAGGAGCAGCACGTCCGCAATGGTTGCATCCTCAGCACGTCCGCAATCCAGTGTCCC
+TCAGCACGTC
+>ds2020-267_1112
+TCTAAGGAGCAGCACGTCCGCAATACGACCTGGGCAGCACGTCCCAAGCATACTCACCTC
+ACGTCCGCA
+>ds2020-267_1113
+TATCTAAGGGCGCACGTCCGCAAGGAGTTAGGGGTAGCACGTCGCAAGCTGCAGTCTCTC
+AGCACGTCC
+>ds2020-267_1114
+GGACGTGCTGCCCGCTAAAGGTTGGGACGTGCTGGGAGATTGCTATTGCGGACGTGCTGC
+TCCTTAGAT
+>ds2020-267_1115
+TATCTAAGGAGCAGCACGTCCGCAAAAAGTGGCCCCTCAGCACGTCCGCAAGCTAAACCC
+CCTCAGCAC
+>ds2020-267_1116
+TAAGGAGCACCGTCCGCAATCTATTATGCTTAGCACGTCCGCAACCTCTACCAGTCACAC
+GTCCGCAA
+>ds2020-267_1117
+TAAGGAGCAGCACGTCCGCAATGGTCAATACTTAGCACGTCCGCAAGTAAGTTGGCCTAC
+GTCCGCAA
+>ds2020-267_1118
+GCGTTGGGACGTGCTGAGTGAATATACCTTGCGGACGTGCTGAGTGGATAGCAATTGCGG
+ACGTGCTG
+>ds2020-267_1119
+CTATCTAAGGAGCAGCACGTCCGCAAAAGACGCCCGGTAGCACGTCCGCAAAGATTACCT
+TGTCAGC
+>ds2020-267_1120
+TAAGGAGCAGCACGTCCGCAACCATCTCTCCCGCACGTCCCAGCTAGATGGCATCACACG
+TCCGCAA
+>ds2020-267_1121
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTGGGCAGCACGTCCGCAATGCAAT
+CCACGTC
+>ds2020-267_1122
+TTGCGGACGTGTGCCGAAGGGCATTGCGGACGTGCTGACGGTTTTAAGCTTGCGGACGTG
+CTGCTCC
+>ds2020-267_1123
+CAGCACGTCCGCAACGTGGTACGCCTCAGCACGTCCGCAACAATAGACCGCTCAGCACGT
+CCGCAAT
+>ds2020-267_1124
+TCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTC
+GAGGTA
+>ds2020-267_1125
+GAGCAGCACGTCCGCAACACTCGTCAACTCAGCACGTCCGCAATGACCCTGCTCTCCCGT
+CCGCAA
+>ds2020-267_1126
+GAGCAGCACGTCCGCAAACAGATAGCCCTCAGCACGTCCGCAAACGATAACGGGCCACGT
+CCGCAA
+>ds2020-267_1127
+GAGCAGCACGTCCGCAACGACAGACCCTTAGCACGTCCGCAAAGAAACCCGACTCCACGT
+CCGCAA
+>ds2020-267_1128
+CAGCACGTCCGCAACATCGGTCCCCTCAGCACGTCCGCAACGCACCTTCTCTCAGCACGT
+CCGCAA
+>ds2020-267_1129
+CAGCACGTCCGCAAGCTCATCTCCCTCAGCACGCCCGCAATCGTACCTGACTCAGCACGT
+CCGCAA
+>ds2020-267_1130
+CAGCACGTCCGCAACAGCTAGCTCCTCAGCACGTCCGCAAATGACTTTCCCTCAGCACGT
+CCGCAA
+>ds2020-267_1131
+TTGCGGACGTGCTGAGCGAAGGATAATTGCGGACGTGCTGAGGGGGGGCAAGTTGCGGAC
+GTGCTT
+>ds2020-267_1132
+CAGCACGTCCGCAATATGTCGTGGCTCAGCACGTCCGCAAAAAGTCCTCCCTCAGCACGT
+CCGCAA
+>ds2020-267_1133
+TCTAAGGAGCAGCACGTCCGCAACAAATACGCCGTCAGCACGTCGCAAATACAGGGCAGC
+ACGTCC
+>ds2020-267_1134
+GTTGCGGACGTGTGACAGAAGACTATTTGCGGACGTGCTGACAGAAGGGAAATTGCGGAC
+GTGCTG
+>ds2020-267_1135
+TTGCGGACGTGCTGAGACAGTAACTGTTGCGGACGTGCTGAGTGTGTAACCTTTGCGGAC
+GTGCTG
+>ds2020-267_1136
+TTGCGGACGTACTGAGGGAAATCAACTTGCGGACGTGCTAGCGGAACGGGGTTGCGACGT
+GCTGGT
+>ds2020-267_1137
+CAGCACGTCCGCAAGGAATACTCCTCAGCACGTCCGCAACCGATCGCCCCTCAGCACGTC
+CGCAAT
+>ds2020-267_1138
+TTGCGGACGTGCTGAGTGAGGGGGGCTTGCGGACGTGCTGAGGGAGTCGACTTTGCGGAC
+GTGCTG
+>ds2020-267_1139
+TTGCGGACGTGCTGAGGGATGACCTGTTGCGGACGTGCTGAGTGCATCGGTATTGCGGAC
+GTGCTG
+>ds2020-267_1140
+TTGCGGACGTGCTGAGTGGTCTATTATTGCGGACGTGCTGAGGGGTTTTCGATTGCGGAC
+GTGCTG
+>ds2020-267_1141
+TTTGCGGACGTGCTAAGGGTACGGAATTGCGGACGTGCTGAGCCCGCGACGTTTGCGGAC
+GTGCTG
+>ds2020-267_1142
+TTGCGGACGTGCTGAGGGAGAAGCAATTGCGGACGTGCTGATAGTAGAAGTGTTGCGGAC
+GTGCTG
+>ds2020-267_1143
+GCAGCACGTCCGCAATTGTACGCTACTCAGCACGTCCGCAATGCTCCTGGCCCACACGTC
+CGCAA
+>ds2020-267_1144
+GCAGCACGTCCGCAACATAAACTCTGTCAGCACGTCCCAATACGGTACACCTCACACGTC
+CGCAA
+>ds2020-267_1145
+AGCAGCACGTCCGCAAAGAAAGTTCCCTCAGCACGTCCGCAATTAACTACGGGCACACGT
+CCGCA
+>ds2020-267_1146
+CAGCACGTCCGCAAATACACACTCCTCAGCACGTCCGCAAGGGGGATACTCTCAGACGTC
+CGCAA
+>ds2020-267_1147
+GCAGCACGTCCGCAACATACAGTCCCTCAGCACGTCCCAATGTGTTGAACCTCGCACGTC
+CGCAA
+>ds2020-267_1148
+TTGCGGAGTGCTGGGGCACAACAATTGCGGACGTGCTGAGCCCACCTAGATTGCGGACGT
+GCTGC
+>ds2020-267_1149
+CAGCACGTCCGCAAGTCTATTCTCCTCAGCACGTCCGCAAAGCATATCCCCCAGCACGTC
+CGCAA
+>ds2020-267_1150
+CAGCACGTCCGCAACGTTACTTCCCTCAGCACGTCCCAAGGCACTCATCTCAGCACGTCC
+GCAAA
+>ds2020-267_1151
+CAGCACGTCCGCAAGAGCACTCTTCTCAGCACGTCCGCAATTGGTATGGCTTCACACGTC
+CGCAA
+>ds2020-267_1152
+CAGCACGTCCGCAATTGGACCACCTCAGCACGTCCGCAACTATTATACTCTCAGCACGTC
+CGCAA
+>ds2020-267_1153
+TTGCGGACGTGTGAGCCAAGTAGAGTTGCGGACGTGCTGACTGCGACAAGGTTGCGGACG
+TGCTG
+>ds2020-267_1154
+TTGCGGACGTGCTGAGGACTTACGATTGCGGACGTGCTGACCGGACAAACATTGCGGACG
+TGCTG
+>ds2020-267_1155
+TTGCGGACGTGCTGAGGGAAATGTCTTGCGGACGTGCTGAGTGAATACGCGTTGCGGACG
+TGCTG
+>ds2020-267_1156
+AGTATTTACCTTGACTTCGGGCTTTAAAAACGGATTGGAAAGCCCGAACGTCCAGGGGTT
+GCCAA
+>ds2020-267_1157
+CAGCACGTCCGCAACAGGAGTAACCTCAGCACGTCCGCAAACCTGTGTGGGCACACGTCC
+GCAA
+>ds2020-267_1158
+CAGCACGTCCGCAATGTGTAGTCCCTCAGCACGTCCGCATATGGAACCCCCAGCACGTCC
+GCAA
+>ds2020-267_1159
+AGCAGCACGTCCGCAATGTCTTCTCACTCAGCACGTCCGCAATATAAATCCTTGCCGTCC
+GCAA
+>ds2020-267_1160
+CAGCACGTCCGCAAGCTACTAATACTCACACGTCCGCAACACTCGTGCCCTCGCACGTCC
+GCAA
+>ds2020-267_1161
+CAGCCGTCCGCAACTTGGACTACCTCGCACGTCCGCAATTCGTAAGCCGTCAGCACGTCC
+GCAA
+>ds2020-267_1162
+TTGCGGACGTGCGAGGCGCTGTGGATTGCGGACGTGCTGACACAGTATCGATTGCGGACT
+GCTG
+>ds2020-267_1163
+CAGCACGTCCGCAATGTCATAGCCCTAGCCGTCCGCAACACTGGTGCCCTCAGCACGTCC
+GCAA
+>ds2020-267_1164
+CAGCACGTCCGCAATGGTAGTCCCCTCAGCACGTCCGCAAGATGTTTGGGCTGCACGTCC
+GCAA
+>ds2020-267_1165
+TTGCGGACGTGCAACCATTAGATATTGCGGACGTGCTGAGGGGCCGATATTTGCGGACGT
+GCTG
+>ds2020-267_1166
+TTGCGGACGTGGACCGAGAGAGTATTGCGGACGTGCTGAGGAGTAATGGATTGCGGACGT
+GCTG
+>ds2020-267_1167
+CAGCACGTCCGCAAACGATGATGCCTCAGCACGTCCGCATCTGGAAGTAAGGACGTTCGG
+GCTT
+>ds2020-267_1168
+ATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGG
+TTG
+>ds2020-267_1169
+CAGCACGTCCGCAAACCGACACAGGTGGGCGAGATGAGTATTCTAAGGCGCTTGAGAGAA
+CTC
+>ds2020-267_1170
+CAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAAT
+TGG
+>ds2020-267_1171
+CAGCCGTCCGCAACGTTCATTCCCTCAGCACGTCCGCAACCGCTAGCTCTCGCACGTCCG
+CAA
+>ds2020-267_1172
+CAGCACGTCCGCAATCTGAGGTACCCAGCCGTCCGCAATGGCTCGTGTCTCGCACGTCCG
+CAA
+>ds2020-267_1173
+TTGCGGACGTGCTGAGTGAAGCAGGGTTGCGGACGTGTGGGAGAGTCTGGTTGCGGACTG
+CTG
+>ds2020-267_1174
+TTGCGGACGTGAGTATAGAATGGTTGCGGACGTGCTGAGTACGTTTTGCTTGCGGACGTG
+CTG
+>ds2020-267_1175
+GGACGTGCTGAGGGTTGACATCTTGCGGACGTGCTGAGCTGTCTCCTCTTGCGGACGTGC
+TGC
+>ds2020-267_1176
+CTGTCTAAGGAGCAGCACGTCCGCAACTGCCGCAGAGTCTTGGTTAACGTCAATGGGTTT
+TAG
+>ds2020-267_1177
+TCTTCCAATCTATCTAAGGAGCAGCACGTCCGCAAGCTACGGTCTCTCAGCACGTCCGCA
+ATT
+>ds2020-267_1178
+GCAGCACGTCCGCAAAACTAGATCGGCAGCACGTCCGCAAGGGCTAATGACTCAGCACGT
+CC
+>ds2020-267_1179
+CAGCACGTCCGCAAGGATAGGTCACTCAGCACGTCCGCAAACCACCTGCCCTCAGCACGT
+CC
+>ds2020-267_1180
+CAGCAGTCCGCAACAGATACCGACTAGCACGTCCGCAAACCCCCTACGCCAGACGTCCGC
+AA
+>ds2020-267_1181
+GGACGTGCTGAAGGAGATAACATTGCGGACGCGCTGAGGTCAGCTGGTTTGCGGACGTGC
+TG
+>ds2020-267_1182
+GGACGTGCTGAGGGACCGAGTATTGCGGACGTGCTGAGTGTGGCTTCATTGCGGCGTGCT
+GC
+>ds2020-267_1183
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACCTATTCGCCCTCAGCACGTCCGCA
+AT
+>ds2020-267_1184
+CTATTGCGGACGTGCTAAGGTCTATATTTTGCGGACGTGCTGCTCCTTAGATAGATCGGT
+AG
+>ds2020-267_1185
+CATATTTGGCATGGCGTTCGTCTTACACAGAAGAGTAAGCCCGAACGTCCAGCCAGTGAC
+GT
+>ds2020-267_1186
+TTGCGGACGTGCTGAGTGCTAGTTTCTTGCGGACGTGCTGCTCCTTAGATAGATCCGAAG
+AG
+>ds2020-267_1187
+TTGCGGACGTGCTGACCCTATACTAATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAT
+AG
+>ds2020-267_1188
+TCTTCCAATCTATCTAAGGAGCAGCACGTCCGCAAACTGCCCGCGCCCAGCACGTCCGCA
+AT
+>ds2020-267_1189
+AGCAGCACGTCCGCAAACAGAAGGCCTCGCACGTCCGCACTTTCCTCGTCTCAGCACGTC
+C
+>ds2020-267_1190
+CAGCACGTCCGCAATCTGGAACTACTCAGCACGTCCGCAAACTTCTCCGGCTCAGCACGT
+C
+>ds2020-267_1191
+CAGCAGTCCGCAAGTGATGACATCTCAGCACGTCCGCAATTGACGTCCACTCAGCACGTC
+C
+>ds2020-267_1192
+AAGCACGTCCGCAAAACATCGGGGCTCAGCACGTCCCAAAACTGCCCCACTCAGCACGTC
+C
+>ds2020-267_1193
+GACGTGCTGAGCGATTTTATGTTGCGGACGTGCTGAGGCTTGACTTTTTGCGGACGTGCT
+G
+>ds2020-267_1194
+CAGCACGTCCGCAAAACTTTGTCCCTCAGCACGTCCGAACCCTTAACTACTCAGCACGTC
+C
+>ds2020-267_1195
+GACGTGCTGACGGAACAGAACTTGCGGACGTGCTGAGTGGTGCCAGTTGCGGAGTGCTGC
+T
+>ds2020-267_1196
+TTTGCGGACGTGCTGACCCAGTCAACTTTGCGGACTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1197
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAAAGTCAATAGCCTCACACGTCCGCAAT
+C
+>ds2020-267_1198
+GTTGCGGACGTGCTGAGGGTACTCGATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1199
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCACATATCCCTCAGCACGTCCGCAA
+A
+>ds2020-267_1200
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAACCGGTCTGCCCTCAGCACGTCCGCAAA
+G
+>ds2020-267_1201
+TTGCGGACGTGCTGAGGGGATTGACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1202
+CTTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATAGCGTACATCTCAGCACGTCCGCA
+A
+>ds2020-267_1203
+TTTGCGGACGTGCTGACCCGGGATCCATTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+G
+>ds2020-267_1204
+TCGTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCGTTCGACCCTCAGCACGTCCGCA
+A
+>ds2020-267_1205
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGACCTCGCGCCTCAGCACGTCCGCA
+A
+>ds2020-267_1206
+TTGCGGACGTGCTGAGGACGCTTACTTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAA
+G
+>ds2020-267_1207
+CTTCCCGATCTATCTAAGGAGCAGCACGTCCGCAAGATATACGACATCAGCACGTCCGCA
+A
+>ds2020-267_1208
+TTGCGGACGTGCTGAAGGGCTACTTTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1209
+CTTGCGGACGTGCTGAGTACAATATCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+G
+>ds2020-267_1210
+TTGCGGACGTGCTGACCGGATCTAAGTTGCGGACGTGCTGCTCCTTAGATAGATCGTAAG
+A
+>ds2020-267_1211
+TTGCGGACGTGCTGAGGGGATTCGCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1212
+CAGCACGTCCGCAAACGATAGGCGTTAGCACGTCCGCAAGTTTATACGCCTCAGCACGTC
+>ds2020-267_1213
+CAGCACGTCCGCAATGCAGACCCTTTAGCACGTCCGCAATTCGGCACTCTCAGCACGTCC
+>ds2020-267_1214
+TTGCGGACGCGCTGGACGTGCTGATCAAGGCGCATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_1215
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTACACCCACCTCAGCACGTCCGCAA
+>ds2020-267_1216
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGTGATGATCTCTCAGCACGTCCGCAA
+>ds2020-267_1217
+GCAGCCGTCCGCAACCAACTGCTGCTCAGCACGTCGCAAGTCATATGGCCTCAGCACGTC
+>ds2020-267_1218
+GGACGTGCTGAGGACTGCTACATTGGGACGTGCTAAGCGAGCATGGTTGCGGACGTGCTG
+>ds2020-267_1219
+TTGCGGACGTGCTGAGGTATGGTAGATTGCGGACTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1220
+TTGCGGACGTGCTGAGGGATCCGCAGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1221
+TTGCGGACGTGCTGAGGGGCGTGCTATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1222
+TTGCGGACGTGCTGAGCCATGCACACTTGCGGACTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1223
+TTGCGGACGTGCTGAGTCCCGACCACTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1224
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAATCAAAGTACCTCAGCACGTCCGCAA
+>ds2020-267_1225
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAACGTAGGATCTGTCAGCACGTCCGCAA
+>ds2020-267_1226
+TTGCGGACGTGCTGAGGATTCCACATTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1227
+TTGCGGACGTGCTGAGGTAAGGAGCATTGCGGACGTGCTGCTCCTTAGATAGATCGGGAG
+>ds2020-267_1228
+CTCTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGCGTTATCCCTCAGCACGTCCGCAA
+>ds2020-267_1229
+TTGCGGACGTGCTGCCCGGATAACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1230
+TTGCGGACGTGCTGCCGAGATAACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1231
+TTGCGGACGTGCTGAGAGAATCAAGTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAAG
+>ds2020-267_1232
+TTGCGGACGTGCTACCCCGTGATACTTGCGGACGTGCTGCTCCTTAGATAGATCGAAAGA
+>ds2020-267_1233
+TTGCGGACGTGCTGAGGGGATCCTTATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1234
+TCCGATCTATCTAAGGAGCAGCACGTCCGCAACCTGCTATCCGTCAGCACGTCCGCAACT
+>ds2020-267_1235
+TGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGA
+>ds2020-267_1236
+CCACTGCCACTGCCACTGTTGAGACTATCCCCCAAGCCAAAGGTATTGCGGACGTGCTG
+>ds2020-267_1237
+TTGCGGACGTGCTGACTGAGAGGGCATTGCGGAAGTGATCACGTATTGCGGACGTGCTG
+>ds2020-267_1238
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAAATTCATTCTGGTCAGCACGTCCGCAA
+>ds2020-267_1239
+ATTGCGGACGTGCTGAGGCACTGTTCGTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_1240
+TTGCGGACGTGCTGATGGGTTTCGTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_1241
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACGTGCTATGCCTCACACGTCCGCAA
+>ds2020-267_1242
+TTGCGGACGTGCTGAGGGAACCGGCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_1243
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCCGATTGCCCTCAGCACGTCCGCAA
+>ds2020-267_1244
+CTTCGATCTATCTAAGGAGCAGCACGTCCGCAAGAGATTACTCCTCAGCACGTCCGCAA
+>ds2020-267_1245
+TTGCGGACGTGCTGGGGAGTATTGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAG
+>ds2020-267_1246
+TTAGAGGGACTATCGGCTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTCTGTGCTG
+>ds2020-267_1247
+TTGCGGACGTGCTGAGGCGATACCTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_1248
+GTAAAAGCTCACTGGTAACCGGTCCAAAACGAAACTCTTAAAACAGTGGATACCCTCC
+>ds2020-267_1249
+CGGACGTGCTGAGACAATGGCGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1250
+CCCGATCTATCTAAGGAGCAGCACGCCCGCAAATGTACACCGGTCAGCACGTCCGCAA
+>ds2020-267_1251
+TCCGATCTATCTAAGGAGCAGCACGTCCGCAAGGTAGACGCCCTCAGCACGTCCGCAA
+>ds2020-267_1252
+GTGCTGAGCCAGACTACTTGCGGACGTGCTGAGGGAGCCTAAATTGCGGACGTGCTG
+>ds2020-267_1253
+TTGCGGACGTGCTGAGTGTTTACAATTTGCGGACGTGCTGCTCCTTAGATAGATCGG
+>ds2020-267_1254
+TGCTGAGCGACTATAAATTGCGGACGTGCTGAGGGATTCACCGTTGCGGACGTGCTG
+>ds2020-267_1255
+TTGCGGACGTGCTGACGGACGACTATTTGCGGACGTGCTGCTCCTTAGATAGATCGG
+>ds2020-267_1256
+GGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG
+>ds2020-267_1257
+GCTGAGGGCAGTGGGCTTGCGGACGTGCTGACGGATACGTCATTGCGGGCGTGCTG
+>ds2020-267_1258
+CTCACTCCTCAGCACGTCCGCAAACTGCTTCGGGTTGGGACGTGCTGAGGAGTGAC
diff --git a/tools/virAnnot/test-data/otu_s1_rps.tab b/tools/virAnnot/test-data/otu_s1_rps.tab
new file mode 100755
index 00000000000..46d60b8d066
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s1_rps.tab
@@ -0,0 +1,109 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom no rank family genus
+"ds2020-267_100" "376" "pfam02823" "gnl|CDD|376940" "3.06167e-09" "228" "347" "-3" "pfam02823, ATP-synt_DE_N, ATP synthase, Delta/Epsilon chain, beta-sandwich domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. The subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213)." "Bacteria(0.97);Eukaryota(0.03);" "(1.00);" "Lactobacillaceae(0.05);Rhodobacteraceae(0.04);Streptococcaceae(0.03);Bacillaceae(0.03);Burkholderiaceae(0.02);" "Lactobacillus(0.04);Streptococcus(0.03);Bacillus(0.02);Mycoplasma(0.02);Synechococcus(0.01);"
+"ds2020-267_100" "376" "pfam00401" "gnl|CDD|366077" "8.90041e-05" "87" "218" "-3" "pfam00401, ATP-synt_DE, ATP synthase, Delta/Epsilon chain, long alpha-helix domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. This subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213)." "Bacteria(0.97);Eukaryota(0.03);" "(1.00);" "(0.06);Clostridiaceae(0.05);Lachnospiraceae(0.05);Bacillaceae(0.04);Peptococcaceae(0.04);" "(0.06);Clostridium(0.05);Lactobacillus(0.03);Bacillus(0.03);Eubacterium(0.02);"
+"ds2020-267_114" "347" "pfam00471" "gnl|CDD|376336" "8.05888e-12" "132" "302" "3" "pfam00471, Ribosomal_L33, Ribosomal protein L33. " "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "(0.07);Mycoplasmataceae(0.07);Clostridiaceae(0.06);Bacillaceae(0.03);Lactobacillaceae(0.03);" "Mycoplasma(0.06);Clostridium(0.05);(0.04);Lactobacillus(0.02);Bacillus(0.02);"
+"ds2020-267_117" "344" "pfam00252" "gnl|CDD|376306" "7.27175e-23" "107" "295" "2" "pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. " "Bacteria(0.58);Eukaryota(0.29);Archaea(0.13);" "(1.00);" "(0.08);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);" "(0.04);Clostridium(0.03);Mycoplasma(0.02);"
+"ds2020-267_118" "343" "pfam00421" "gnl|CDD|366090" "7.68219e-41" "92" "337" "-1" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_120" "339" "pfam16639" "gnl|CDD|374695" "2.20279e-25" "197" "325" "-3" "pfam16639, Apocytochr_F_N, Apocytochrome F, N-terminal. This is the N-terminal domain of cytochrome f. It is a soluble lumen-side domain." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "Synechococcaceae(0.25);Gloeobacteraceae(0.07);Prochloraceae(0.07);Aphanothecaceae(0.07);(0.07);" "Synechococcus(0.21);Prochlorococcus(0.07);Gloeobacter(0.07);Oscillatoria(0.04);Aureococcus(0.04);"
+"ds2020-267_130" "330" "pfam00680" "gnl|CDD|366242" "7.64962e-05" "124" "282" "1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_139" "320" "pfam05860" "gnl|CDD|368641" "1.34887e-13" "167" "298" "2" "pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins." "Bacteria(1.00);" "(1.00);" "Nostocaceae(0.36);Burkholderiaceae(0.14);Pasteurellaceae(0.14);Pseudomonadaceae(0.12);Neisseriaceae(0.07);" "Nostoc(0.36);Ralstonia(0.14);Pseudomonas(0.12);Haemophilus(0.10);Neisseria(0.07);"
+"ds2020-267_145" "315" "pfam02626" "gnl|CDD|376868" "3.97676e-05" "140" "256" "-3" "pfam02626, CT_A_B, Carboxyltransferase domain, subdomain A and B. Urea carboxylase (UC) catalyzes a two-step, ATP- and biotin-dependent carboxylation reaction of urea. It is composed of biotin carboxylase (BC), carboxyltransferase (CT), and biotin carboxyl carrier protein (BCCP) domains. The CT domain of UC consists of four subdomains, named A, B, C and D. This domain covers the A and B subdomains of the CT domain. This domain covers the whole length of KipA (kinase A) from Bacillus subtilis. It can also be found in S. cerevisiae urea amidolyase Dur1,2, which is a multifunctional biotin-dependent enzyme with domains for urea carboxylase and allophanate (urea carboxylate) hydrolase activity." "Bacteria(0.86);Eukaryota(0.13);Archaea(0.01);" "(1.00);" "Bacillaceae(0.03);Pseudonocardiaceae(0.03);Clostridiaceae(0.03);Corynebacteriaceae(0.03);Streptomycetaceae(0.03);" "Clostridium(0.03);Corynebacterium(0.03);Pseudomonas(0.02);Streptomyces(0.02);Bacillus(0.02);"
+"ds2020-267_16" "1165" "pfam02123" "gnl|CDD|280316" "1.58664e-38" "536" "1078" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_168" no_hit
+"ds2020-267_176" "291" "pfam01235" "gnl|CDD|376500" "1.13408e-29" "115" "243" "1" "pfam01235, Na_Ala_symp, Sodium:alanine symporter family. " "Bacteria(1.00);" "(1.00);" "Bacillaceae(0.10);Lachnospiraceae(0.07);Clostridiaceae(0.06);(0.06);Corynebacteriaceae(0.03);" "Bacillus(0.06);Clostridium(0.06);(0.06);Corynebacterium(0.03);Blautia(0.03);"
+"ds2020-267_187" "287" "pfam02673" "gnl|CDD|376891" "3.59766e-13" "7" "156" "1" "pfam02673, BacA, Bacitracin resistance protein BacA. Bacitracin resistance protein (BacA) is a putative undecaprenol kinase. BacA confers resistance to bacitracin, probably by phosphorylation of undecaprenol. More recent studies show that BacA has undecaprenyl pyrophosphate phosphatase activity. Undecaprenyl phosphate is a key lipid intermediate involved in the synthesis of various bacterial cell wall polymers. Bacitracin, a mixture of related cyclic polypeptide antibiotics, is used to treat surface tissue infections. Its primary mode of action is the inhibition of bacterial cell wall synthesis through sequestration of the essential carrier lipid undecaprenyl pyrophosphate, C55-PP, resulting in the loss of cell integrity and lysis. The characteristic phosphatase sequence-motif in this family is likely to be the PGxSRSGG, compared with the PSGH of the PAP family of phosphatases." "Bacteria(0.97);Archaea(0.03);" "(1.00);" "Clostridiaceae(0.08);(0.06);Lachnospiraceae(0.03);Ruminococcaceae(0.02);Bacillaceae(0.02);" "Clostridium(0.08);(0.04);Bacillus(0.02);Eubacterium(0.02);Prevotella(0.01);"
+"ds2020-267_2" "2436" "pfam02123" "gnl|CDD|280316" "2.17343e-21" "184" "1476" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_20" "893" "pfam00006" "gnl|CDD|376291" "4.59259e-49" "498" "866" "3" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-267_20" "893" "pfam02874" "gnl|CDD|367225" "7.30466e-19" "126" "329" "3" "pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella." "Bacteria(0.60);Eukaryota(0.28);Archaea(0.13);" "(1.00);" "Spirochaetaceae(0.04);Bacillaceae(0.04);Schizosaccharomycetaceae(0.03);Chlamydomonadaceae(0.03);Sulfolobaceae(0.03);" "Treponema(0.04);Schizosaccharomyces(0.03);Chlamydomonas(0.03);Bacillus(0.03);Thermotoga(0.02);"
+"ds2020-267_203" "281" "pfam03040" "gnl|CDD|367312" "1.76794e-22" "121" "231" "-3" "pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally." "Bacteria(0.77);Eukaryota(0.23);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.08);Microcoleaceae(0.06);Chlorellaceae(0.04);Merismopediaceae(0.04);" "Synechococcus(0.13);Oscillatoria(0.04);Physcomitrella(0.04);Microcystis(0.04);Synechocystis(0.04);"
+"ds2020-267_206" "279" "pfam03947" "gnl|CDD|377170" "2.63457e-16" "155" "265" "2" "pfam03947, Ribosomal_L2_C, Ribosomal Proteins L2, C-terminal domain. " "Bacteria(0.62);Eukaryota(0.27);Archaea(0.11);" "(1.00);" "(0.09);Mycoplasmataceae(0.03);Clostridiaceae(0.02);Spirochaetaceae(0.01);Ruminococcaceae(0.01);" "(0.05);Mycoplasma(0.02);Clostridium(0.02);"
+"ds2020-267_21" "858" "pfam00680" "gnl|CDD|366242" "8.36679e-11" "295" "729" "-1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_210" "276" "pfam17917" "gnl|CDD|375428" "1.59337e-13" "52" "240" "1" "pfam17917, RT_RNaseH, RNase H-like domain found in reverse transcriptase. DNA polymerase and ribonuclease H (RNase H) activities allow reverse transcriptases to convert the single-stranded retroviral RNA genome into double-stranded DNA, which is integrated into the host chromosome during infection. This entry represents the RNase H like domain." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_214" "276" "pfam07992" "gnl|CDD|369639" "2.55939e-07" "129" "254" "3" "pfam07992, Pyr_redox_2, Pyridine nucleotide-disulphide oxidoreductase. This family includes both class I and class II oxidoreductases and also NADH oxidases and peroxidases. This domain is actually a small NADH binding domain within a larger FAD binding domain." "Bacteria(0.82);Eukaryota(0.09);Archaea(0.09);" "(1.00);" "Pseudomonadaceae(0.12);Nocardiaceae(0.07);Thermococcaceae(0.05);Enterobacteriaceae(0.05);Merismopediaceae(0.05);" "Pseudomonas(0.12);Rhodococcus(0.07);Synechocystis(0.05);Pyrococcus(0.05);Streptococcus(0.04);"
+"ds2020-267_218" "274" "pfam01348" "gnl|CDD|279664" "1.66328e-05" "51" "257" "3" "pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.40);Brassicaceae(0.20);Schizosaccharomycetaceae(0.20);Poaceae(0.20);" "Saccharomyces(0.40);Hordeum(0.20);Schizosaccharomyces(0.20);Baimashania(0.20);"
+"ds2020-267_227" "272" "pfam00873" "gnl|CDD|334294" "2.32215e-15" "36" "245" "-1" "pfam00873, ACR_tran, AcrB/AcrD/AcrF family. Members of this family are integral membrane proteins. Some are involved in drug resistance. AcrB cooperates with a membrane fusion protein, AcrA, and an outer membrane channel TolC. The structure shows the AcrB forms a homotrimer." "Bacteria(1.00);" "(1.00);" "Enterobacteriaceae(0.40);Merismopediaceae(0.20);Pseudomonadaceae(0.13);Helicobacteraceae(0.13);Burkholderiaceae(0.07);" "Escherichia(0.40);Synechocystis(0.20);Pseudomonas(0.13);Helicobacter(0.13);Cupriavidus(0.07);"
+"ds2020-267_230" "268" "pfam00115" "gnl|CDD|376293" "1.95663e-15" "81" "236" "-3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-267_261" "260" "pfam01051" "gnl|CDD|376444" "1.77523e-19" "26" "217" "-2" "pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene." "Bacteria(0.97);(0.02);" "(0.99);" "Streptococcaceae(0.08);Enterobacteriaceae(0.07);Campylobacteraceae(0.07);Lactobacillaceae(0.07);Pasteurellaceae(0.06);" "Lactococcus(0.07);Campylobacter(0.07);Lactobacillus(0.06);Acinetobacter(0.04);Escherichia(0.04);"
+"ds2020-267_268" "259" "pfam02123" "gnl|CDD|280316" "3.22949e-21" "18" "251" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_274" "258" "pfam03713" "gnl|CDD|367619" "2.00811e-09" "24" "185" "-2" "pfam03713, DUF305, Domain of unknown function (DUF305). Domain found in small family of bacterial secreted proteins with no known function. Also found in Paramecium bursaria chlorella virus 1. This domain is short and found in one or two copies. The domain has a conserved HH motif that may be functionally important. This domain belongs to the ferritin superfamily. It contains two sequence similar repeats each of which is composed of two alpha helices." "Bacteria(1.00);" "(1.00);" "Nocardiaceae(0.13);Mycobacteriaceae(0.13);Pseudonocardiaceae(0.10);Kineosporiaceae(0.08);Micromonosporaceae(0.08);" "Nocardia(0.13);Mycolicibacterium(0.13);Saccharopolyspora(0.10);Kineococcus(0.08);Streptomyces(0.08);"
+"ds2020-267_278" "258" "pfam00012" "gnl|CDD|365808" "4.1355e-19" "50" "232" "2" "pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region." "Eukaryota(0.54);Bacteria(0.38);Archaea(0.08);" "(1.00);" "Saccharomycetaceae(0.12);Schizosaccharomycetaceae(0.08);Enterobacteriaceae(0.08);Hominidae(0.08);Plasmodiidae(0.04);" "Homo(0.08);Schizosaccharomyces(0.08);Escherichia(0.08);Saccharomyces(0.08);Synechocystis(0.04);"
+"ds2020-267_280" "257" "pfam01788" "gnl|CDD|366811" "2.47901e-09" "132" "224" "-1" "pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Microcoleaceae(0.12);Prochloraceae(0.08);Oscillatoriaceae(0.08);Synechococcaceae(0.08);Chroococcaceae(0.08);" "Oscillatoria(0.08);Prochlorococcus(0.08);Synechococcus(0.08);Ectocarpus(0.04);Arenga(0.04);"
+"ds2020-267_283" "257" "pfam13041" "gnl|CDD|372443" "3.148e-06" "13" "114" "1" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-267_287" "256" "pfam00115" "gnl|CDD|376293" "2.8946e-26" "13" "237" "1" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-267_312" "252" "pfam00585" "gnl|CDD|278982" "1.52007e-05" "29" "166" "2" "pfam00585, Thr_dehydrat_C, C-terminal regulatory domain of Threonine dehydratase. Threonine dehydratases pfam00291 all contain a carboxy terminal region. This region may have a regulatory role. Some members contain two copies of this region. This family is homologous to the pfam01842 domain." "Bacteria(0.69);Eukaryota(0.31);" "(1.00);" "Solanaceae(0.23);Enterobacteriaceae(0.15);Pasteurellaceae(0.15);Bacillaceae(0.08);Burkholderiaceae(0.08);" "Solanum(0.23);Haemophilus(0.15);Salmonella(0.15);Mycobacterium(0.08);Saccharomyces(0.08);"
+"ds2020-267_315" "251" "pfam00989" "gnl|CDD|366402" "1.61999e-05" "32" "241" "2" "pfam00989, PAS, PAS fold. The PAS fold corresponds to the structural domain that has previously been defined as PAS and PAC motifs. The PAS fold appears in archaea, eubacteria and eukarya." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Bacillaceae(0.14);Enterobacteriaceae(0.14);Bradyrhizobiaceae(0.12);Brassicaceae(0.08);Drosophilidae(0.06);" "Bacillus(0.14);Bradyrhizobium(0.12);Escherichia(0.10);Arabidopsis(0.08);Drosophila(0.06);"
+"ds2020-267_316" "251" "pfam02123" "gnl|CDD|280316" "3.50628e-08" "28" "228" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_318" "251" "pfam00252" "gnl|CDD|376306" "5.63854e-12" "78" "206" "-1" "pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. " "Bacteria(0.58);Eukaryota(0.29);Archaea(0.13);" "(1.00);" "(0.08);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);" "(0.04);Clostridium(0.03);Mycoplasma(0.02);"
+"ds2020-267_323" "250" "pfam00227" "gnl|CDD|365960" "5.8155e-09" "10" "150" "-2" "pfam00227, Proteasome, Proteasome subunit. The proteasome is a multisubunit structure that degrades proteins. Protein degradation is an essential component of regulation because proteins can become misfolded, damaged, or unnecessary. Proteasomes and their homologs vary greatly in complexity: from HslV (heat shock locus v), which is encoded by 1 gene in bacteria, to the eukaryotic 20S proteasome, which is encoded by more than 14 genes. Recently evidence of two novel groups of bacterial proteasomes was proposed. The first is Anbu, which is sparsely distributed among cyanobacteria and proteobacteria. The second is call beta-proteobacteria proteasome homolog (BPH)." "Eukaryota(0.68);Archaea(0.21);Bacteria(0.11);" "(1.00);" "Drosophilidae(0.11);Rhabditidae(0.07);Schizosaccharomycetaceae(0.07);Unikaryonidae(0.07);Saccharomycetaceae(0.07);" "Drosophila(0.11);Schizosaccharomyces(0.07);Caenorhabditis(0.07);Saccharomyces(0.07);Encephalitozoon(0.07);"
+"ds2020-267_329" "249" "pfam13173" "gnl|CDD|379049" "4.80752e-08" "106" "249" "1" "pfam13173, AAA_14, AAA domain. This family of domains contain a P-loop motif that is characteristic of the AAA superfamily." "Bacteria(0.78);Archaea(0.22);" "(1.00);" "Bacteroidaceae(0.12);Coxiellaceae(0.09);Mycoplasmataceae(0.09);Sulfolobaceae(0.08);Prevotellaceae(0.05);" "Bacteroides(0.12);Coxiella(0.09);Mycoplasma(0.09);Prevotella(0.05);Sulfurisphaera(0.04);"
+"ds2020-267_33" "680" "pfam04157" "gnl|CDD|367847" "4.86455e-13" "342" "494" "-1" "pfam04157, EAP30, EAP30/Vps36 family. This family includes EAP30 as well as the Vps36 protein. Vps36 is involved in Golgi to endosome trafficking. EAP30 is a subunit of the ELL complex. The ELL is an 80-kDa RNA polymerase II transcription factor. ELL interacts with three other proteins to form the complex known as ELL complex. The ELL complex is capable of increasing that catalytic rate of transcription elongation, but is unable to repress initiation of transcription by RNA polymerase II as is the case of ELL. EAP30 is thought to lead to the derepression of ELL's transcriptional inhibitory activity." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.06);Debaryomycetaceae(0.05);(0.03);Schizosaccharomycetaceae(0.02);Mamiellaceae(0.02);" "Candida(0.02);Schizosaccharomyces(0.02);Micromonas(0.02);Leishmania(0.01);Naumovozyma(0.01);"
+"ds2020-267_336" "248" "pfam00113" "gnl|CDD|365883" "4.23282e-13" "15" "116" "-1" "pfam00113, Enolase_C, Enolase, C-terminal TIM barrel domain. " "Eukaryota(0.67);Bacteria(0.33);" "(1.00);" "Pleosporaceae(0.11);Bacillaceae(0.11);Anatidae(0.11);Schizosaccharomycetaceae(0.11);Debaryomycetaceae(0.11);" "Shigella(0.11);Anas(0.11);Bipolaris(0.11);Zea(0.11);Bacillus(0.11);"
+"ds2020-267_352" "245" "pfam00946" "gnl|CDD|366381" "3.23548e-05" "1" "141" "1" "pfam00946, Mononeg_RNA_pol, Mononegavirales RNA dependent RNA polymerase. Members of the Mononegavirales including the Paramyxoviridae, like other non-segmented negative strand RNA viruses, have an RNA-dependent RNA polymerase composed of two subunits, a large protein L and a phosphoprotein P. This is a protein family of the L protein. The L protein confers the RNA polymerase activity on the complex. The P protein acts as a transcription factor." "Viruses(1.00);" "Riboviria(1.00);" "Paramyxoviridae(0.44);Rhabdoviridae(0.31);Pneumoviridae(0.12);Filoviridae(0.12);" "Lyssavirus(0.12);Aquaparamyxovirus(0.06);Rubulavirus(0.06);Respirovirus(0.06);Avulavirus(0.06);"
+"ds2020-267_363" "243" "pfam00416" "gnl|CDD|366086" "2.02528e-05" "15" "134" "-2" "pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes." "Eukaryota(0.55);Bacteria(0.27);Archaea(0.18);" "(1.00);" "Brassicaceae(0.18);Muridae(0.09);Poaceae(0.09);Drosophilidae(0.09);Mycobacteriaceae(0.09);" "Arabidopsis(0.18);Geobacillus(0.09);Rattus(0.09);Haloarcula(0.09);Shigella(0.09);"
+"ds2020-267_364" "243" "pfam00216" "gnl|CDD|365952" "1.5507e-10" "134" "241" "-3" "pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein. " "Bacteria(0.95);Eukaryota(0.02);Viruses(0.01);Archaea(0.01);" "(0.99);Caudovirales(0.01);" "Tannerellaceae(0.09);Mycoplasmataceae(0.06);Pseudomonadaceae(0.05);Aquificaceae(0.05);Bacteroidaceae(0.05);" "Parabacteroides(0.09);Mycoplasma(0.05);Pseudomonas(0.05);Bacteroides(0.05);Desulfovibrio(0.04);"
+"ds2020-267_365" no_hit
+"ds2020-267_369" "243" "pfam12137" "gnl|CDD|378818" "6.51052e-05" "137" "217" "-3" "pfam12137, RapA_C, RNA polymerase recycling family C-terminal. This domain is found in bacteria. This domain is about 360 amino acids in length. This domain is found associated with pfam00271, pfam00176. The function of this domain is not known, but structurally it forms an alpha-beta fold in nature with a central beta-sheet flanked by helices and loops, the beta-sheet being mainly antiparallel and flanked by four alpha helices, among which the two longer helices exhibit a coiled-coil arrangement." "Bacteria(1.00);" "(1.00);" "Pasteurellaceae(0.14);Alteromonadaceae(0.07);Morganellaceae(0.05);Methylococcaceae(0.05);Shewanellaceae(0.04);" "(0.04);Marinobacter(0.04);Shewanella(0.04);Pseudomonas(0.03);Psychromonas(0.03);"
+"ds2020-267_370" "242" "pfam00146" "gnl|CDD|376297" "2.41391e-10" "22" "111" "1" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-267_374" "242" "pfam00124" "gnl|CDD|365890" "5.09126e-07" "21" "125" "3" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-267_388" "241" "pfam02123" "gnl|CDD|280316" "6.16383e-08" "35" "214" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_4" "2297" "pfam02123" "gnl|CDD|280316" "1.96254e-52" "824" "1858" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_402" no_hit
+"ds2020-267_404" "239" "pfam00361" "gnl|CDD|366050" "3.50341e-05" "70" "219" "1" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-267_407" "239" "pfam00177" "gnl|CDD|365924" "1.14399e-06" "28" "126" "1" "pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes." "Bacteria(0.79);Archaea(0.11);Eukaryota(0.10);" "(1.00);" "(0.09);Clostridiaceae(0.04);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Ruminococcaceae(0.01);" "(0.04);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);Desulfovibrio(0.01);"
+"ds2020-267_42" "575" "pfam00284" "gnl|CDD|366000" "1.02897e-21" "187" "300" "1" "pfam00284, Cytochrom_B559a, Lumenal portion of Cytochrome b559, alpha (gene psbE) subunit. This family is the lumenal portion of cytochrome b559 alpha chain, matches to this family should be accompanied by a match to the pfam00283 family also. The Prosite pattern pattern matches the transmembrane region of the cytochrome b559 alpha and beta subunits." "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "Synechococcaceae(0.17);Microcoleaceae(0.09);Aphanothecaceae(0.09);Prochloraceae(0.06);Phaeodactylaceae(0.03);" "Synechococcus(0.17);Prochlorococcus(0.06);Stanieria(0.03);Acaryochloris(0.03);Selaginella(0.03);"
+"ds2020-267_42" "575" "pfam00283" "gnl|CDD|365999" "1.54942e-08" "79" "165" "1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-267_42" "575" "pfam00283" "gnl|CDD|365999" "2.95472e-07" "325" "411" "1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-267_427" no_hit
+"ds2020-267_428" "235" "pfam00164" "gnl|CDD|333891" "1.04166e-24" "3" "182" "3" "pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes." "Bacteria(0.45);Eukaryota(0.27);Archaea(0.27);" "(1.00);" "Thermococcaceae(0.09);Micrococcaceae(0.09);Enterobacteriaceae(0.09);Thermaceae(0.09);Muridae(0.09);" "Thermococcus(0.09);Saccharomyces(0.09);Rickettsia(0.09);Synechococcus(0.09);Thermus(0.09);"
+"ds2020-267_436" no_hit
+"ds2020-267_438" no_hit
+"ds2020-267_444" no_hit
+"ds2020-267_457" no_hit
+"ds2020-267_466" "230" "pfam00072" "gnl|CDD|333815" "5.42419e-08" "50" "208" "2" "pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain." "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "Enterobacteriaceae(0.38);Bacillaceae(0.13);Pseudomonadaceae(0.10);Rhodobacteraceae(0.08);Saccharomycetaceae(0.04);" "Escherichia(0.21);Bacillus(0.13);Salmonella(0.12);Pseudomonas(0.10);Rhodobacter(0.06);"
+"ds2020-267_471" "230" "pfam00201" "gnl|CDD|278624" "3.12575e-07" "46" "210" "1" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-267_486" "228" "pfam17035" "gnl|CDD|374956" "5.12677e-09" "108" "203" "3" "pfam17035, BET, Bromodomain extra-terminal - transcription regulation. The BET, or bromodomain extra-terminal domain, is found on bromodomain proteins that play key roles in development, cancer progression and virus-host pathogenesis. It interacts with NSD3, JMJD6, CHD4, GLTSCR1, and ATAD5 all of which are shown to impart a pTEFb-independent transcriptional activation function on the bromodomain proteins." "Eukaryota(1.00);" "(1.00);" "(0.06);Poaceae(0.05);Brassicaceae(0.05);Saccharomycetaceae(0.05);Musaceae(0.05);" "Musa(0.05);Glycine(0.03);Populus(0.03);Ichthyophthirius(0.03);Arabidopsis(0.03);"
+"ds2020-267_5" no_hit
+"ds2020-267_504" no_hit
+"ds2020-267_506" "226" "pfam05173" "gnl|CDD|377479" "2.45773e-17" "93" "215" "-3" "pfam05173, DapB_C, Dihydrodipicolinate reductase, C-terminus. Dihydrodipicolinate reductase (DapB) reduces the alpha,beta-unsaturated cyclic imine, dihydro-dipicolinate. This reaction is the second committed step in the biosynthesis of L-lysine and its precursor meso-diaminopimelate, which are critical for both protein and cell wall biosynthesis. The C-terminal domain of DapB has been proposed to be the substrate- binding domain." "Bacteria(0.89);Archaea(0.07);Eukaryota(0.04);" "(1.00);" "Clostridiaceae(0.07);(0.06);Flavobacteriaceae(0.04);Lachnospiraceae(0.03);Ruminococcaceae(0.03);" "Clostridium(0.06);(0.04);Prevotella(0.02);Eubacterium(0.02);Ruminococcus(0.01);"
+"ds2020-267_516" no_hit
+"ds2020-267_529" "224" "pfam00510" "gnl|CDD|366140" "6.14777e-23" "35" "211" "2" "pfam00510, COX3, Cytochrome c oxidase subunit III. " "Eukaryota(1.00);" "(1.00);" "Culicidae(0.14);Phasianidae(0.14);Rhabditidae(0.14);Schizosaccharomycetaceae(0.14);Saccharomycetaceae(0.14);" "Anopheles(0.14);Schizosaccharomyces(0.14);Caenorhabditis(0.14);Gallus(0.14);Neurospora(0.14);"
+"ds2020-267_550" no_hit
+"ds2020-267_555" "222" "pfam00124" "gnl|CDD|365890" "7.71427e-08" "48" "203" "3" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-267_557" "222" "pfam00421" "gnl|CDD|366090" "3.32623e-20" "12" "200" "-2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_558" "222" "pfam03737" "gnl|CDD|377116" "4.93695e-13" "57" "179" "-2" "pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions." "Bacteria(0.81);Archaea(0.09);Eukaryota(0.09);" "(1.00);" "(0.05);Alcaligenaceae(0.03);Burkholderiaceae(0.03);Saccharomycetaceae(0.03);Streptomycetaceae(0.03);" "Bacillus(0.03);Corynebacterium(0.03);Streptomyces(0.03);(0.03);Advenella(0.02);"
+"ds2020-267_565" "222" "pfam03950" "gnl|CDD|377172" "9.52435e-10" "53" "184" "-3" "pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln)." "Bacteria(0.37);Archaea(0.36);Eukaryota(0.27);" "(1.00);" "(0.07);Thermoproteaceae(0.04);Sulfolobaceae(0.04);Methanobacteriaceae(0.04);Desulfurococcaceae(0.04);" "(0.07);Geobacter(0.02);Caenorhabditis(0.02);Encephalitozoon(0.02);Dictyostelium(0.02);"
+"ds2020-267_571" "221" "pfam00501" "gnl|CDD|366135" "2.61467e-07" "34" "201" "1" "pfam00501, AMP-binding, AMP-binding enzyme. " "Bacteria(0.56);Eukaryota(0.35);Archaea(0.09);" "(1.00);" "Bacillaceae(0.12);Streptomycetaceae(0.10);Mycobacteriaceae(0.09);Rhabditidae(0.09);Brassicaceae(0.07);" "Bacillus(0.12);Streptomyces(0.10);Caenorhabditis(0.09);Mycobacterium(0.07);Archaeoglobus(0.07);"
+"ds2020-267_58" "476" "pfam03641" "gnl|CDD|367590" "7.19579e-14" "142" "315" "-3" "pfam03641, Lysine_decarbox, Possible lysine decarboxylase. The members of this family share a highly conserved motif PGGXGTXXE that is probably functionally important. This family includes proteins annotated as lysine decarboxylases, although the evidence for this is not clear." "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Brassicaceae(0.17);Pseudomonadaceae(0.12);Mycobacteriaceae(0.08);Caulobacteraceae(0.08);Streptomycetaceae(0.08);" "Arabidopsis(0.17);Pseudomonas(0.12);Mesorhizobium(0.08);Caulobacter(0.08);Mycobacterium(0.08);"
+"ds2020-267_589" no_hit
+"ds2020-267_595" "219" "pfam02123" "gnl|CDD|280316" "5.90575e-11" "13" "210" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_597" "219" "pfam00421" "gnl|CDD|366090" "8.10522e-27" "22" "207" "1" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_599" "219" "pfam05717" "gnl|CDD|377551" "3.2952e-06" "28" "147" "1" "pfam05717, TnpB_IS66, IS66 Orf2 like protein. This protein is found in insertion sequences related to IS66. The function of these proteins is uncertain, but they are probably essential for transposition." "Bacteria(0.99);" "(1.00);" "(0.07);Burkholderiaceae(0.06);Lachnospiraceae(0.05);Rhizobiaceae(0.05);Bacteroidaceae(0.04);" "(0.06);Bacteroides(0.04);Burkholderia(0.02);Bradyrhizobium(0.02);Sinorhizobium(0.02);"
+"ds2020-267_6" "1860" "pfam02123" "gnl|CDD|280316" "1.35634e-17" "1147" "1764" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_610" "218" "pfam17759" "gnl|CDD|380005" "1.47034e-13" "25" "195" "1" "pfam17759, tRNA_synthFbeta, Phenylalanyl tRNA synthetase beta chain CLM domain. This domain corresponds to the catalytic like domain (CLM) in the beta chain of phe tRNA synthetase." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_622" "217" "pfam16363" "gnl|CDD|379835" "2.10592e-11" "29" "157" "2" "pfam16363, GDP_Man_Dehyd, GDP-mannose 4,6 dehydratase. " "Bacteria(0.76);Eukaryota(0.19);Archaea(0.05);" "(1.00);" "(0.05);Flavobacteriaceae(0.05);Paenibacillaceae(0.02);Spirochaetaceae(0.02);Nocardioidaceae(0.02);" "Flavobacterium(0.02);Leptospira(0.01);Paenibacillus(0.01);Plasmodium(0.01);Methylobacterium(0.01);"
+"ds2020-267_636" "217" "pfam13041" "gnl|CDD|372443" "7.94482e-18" "64" "195" "-2" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-267_637" "217" "pfam07026" "gnl|CDD|284449" "1.36077e-13" "47" "172" "2" "pfam07026, DUF1317, Protein of unknown function (DUF1317). This family consists of several hypothetical bacterial and phage proteins of around 60 residues in length. The function of this family is unknown." "Viruses(0.50);Bacteria(0.50);" "Caudovirales(0.50);(0.50);" "Siphoviridae(0.50);Morganellaceae(0.50);" "Photorhabdus(0.50);Lambdavirus(0.50);"
+"ds2020-267_639" "216" "pfam13631" "gnl|CDD|379304" "4.98182e-07" "2" "214" "2" "pfam13631, Cytochrom_B_N_2, Cytochrome b(N-terminal)/b6/petB. " "Bacteria(0.65);Archaea(0.25);Eukaryota(0.10);" "(1.00);" "Mycobacteriaceae(0.15);Thermomonosporaceae(0.10);Sulfolobaceae(0.10);Thermoplasmataceae(0.10);Drosophilidae(0.05);" "Thermomonospora(0.10);Mycobacterium(0.10);Saccharolobus(0.10);Thermoplasma(0.10);Streptomyces(0.05);"
+"ds2020-267_641" "216" "pfam00804" "gnl|CDD|366315" "9.72957e-23" "23" "187" "-3" "pfam00804, Syntaxin, Syntaxin. Syntaxins are the prototype family of SNARE proteins. They usually consist of three main regions - a C-terminal transmembrane region, a central SNARE domain which is characteristic of and conserved in all syntaxins (pfam05739), and an N-terminal domain that is featured in this entry. This domain varies between syntaxin isoforms; in syntaxin 1A it is found as three alpha-helices with a left-handed twist. It may fold back on the SNARE domain to allow the molecule to adopt a 'closed' configuration that prevents formation of the core fusion complex - it thus has an auto-inhibitory role. The function of syntaxins is determined by their localization. They are involved in neuronal exocytosis, ER-Golgi transport and Golgi-endosome transport, for example. They also interact with other proteins as well as those involved in SNARE complexes. These include vesicle coat proteins, Rab GTPases, and tethering factors." "Eukaryota(1.00);" "(1.00);" "Adrianichthyidae(0.08);Tetraodontidae(0.08);Brassicaceae(0.08);Poaceae(0.06);Funariaceae(0.06);" "Oryzias(0.08);Physcomitrella(0.06);Oreochromis(0.06);Selaginella(0.06);Arabidopsis(0.05);"
+"ds2020-267_642" no_hit
+"ds2020-267_643" no_hit
+"ds2020-267_65" "462" "pfam13406" "gnl|CDD|372592" "4.82338e-27" "145" "360" "-1" "pfam13406, SLT_2, Transglycosylase SLT domain. This family is related to the SLT domain pfam01464." "Bacteria(1.00);" "(1.00);" "Rhizobiaceae(0.23);Phyllobacteriaceae(0.08);Chromobacteriaceae(0.08);Methylococcaceae(0.08);Legionellaceae(0.08);" "Sinorhizobium(0.23);Piscirickettsia(0.08);Acinetobacter(0.08);Desulfotalea(0.08);Ruegeria(0.08);"
+"ds2020-267_669" "215" "pfam17862" "gnl|CDD|380037" "4.46873e-06" "33" "122" "-1" "pfam17862, AAA_lid_3, AAA+ lid domain. This entry represents the alpha helical AAA+ lid domain that is found to the C-terminus of AAA domains." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_685" "214" "pfam09334" "gnl|CDD|370442" "1.80219e-14" "16" "117" "-2" "pfam09334, tRNA-synt_1g, tRNA synthetases class I (M). This family includes methionyl tRNA synthetases." "Bacteria(0.57);Archaea(0.26);Eukaryota(0.17);" "(1.00);" "Erwiniaceae(0.09);Methanocaldococcaceae(0.04);Thermoproteaceae(0.04);Streptomycetaceae(0.04);Methanosarcinaceae(0.04);" "Saccharolobus(0.04);Leptospira(0.04);Wigglesworthia(0.04);Borreliella(0.04);Saccharomyces(0.04);"
+"ds2020-267_692" "214" "pfam00680" "gnl|CDD|366242" "4.79875e-05" "70" "180" "1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_697" "214" "pfam00378" "gnl|CDD|334046" "5.08319e-08" "45" "170" "-3" "pfam00378, ECH_1, Enoyl-CoA hydratase/isomerase. This family contains a diverse set of enzymes including: enoyl-CoA hydratase, napthoate synthase, carnitate racemase, 3-hydroxybutyryl-CoA dehydratase and dodecanoyl-CoA delta-isomerase." "Bacteria(0.56);Eukaryota(0.44);" "(1.00);" "Bacillaceae(0.33);Hominidae(0.22);Enterobacteriaceae(0.11);Rhabditidae(0.11);Rhodobacteraceae(0.11);" "Bacillus(0.33);Homo(0.22);Rhodobacter(0.11);Escherichia(0.11);Mus(0.11);"
+"ds2020-267_710" no_hit
+"ds2020-267_719" "213" "pfam00072" "gnl|CDD|333815" "9.1657e-13" "45" "185" "-2" "pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain." "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "Enterobacteriaceae(0.38);Bacillaceae(0.13);Pseudomonadaceae(0.10);Rhodobacteraceae(0.08);Saccharomycetaceae(0.04);" "Escherichia(0.21);Bacillus(0.13);Salmonella(0.12);Pseudomonas(0.10);Rhodobacter(0.06);"
+"ds2020-267_729" "212" "pfam01405" "gnl|CDD|279713" "5.43744e-05" "19" "99" "-3" "pfam01405, PsbT, Photosystem II reaction centre T protein. The exact function of this protein is unknown. It probably consists of a single transmembrane spanning helix. The Chlamydomonas reinhardtii psbT protein appears to be (i) a novel photosystem II subunit and (ii) required for maintaining optimal photosystem II activity under adverse growth conditions." "Bacteria(0.73);Eukaryota(0.27);" "(1.00);" "Synechococcaceae(0.33);Prochloraceae(0.13);Aphanothecaceae(0.07);Chlamydomonadaceae(0.07);Chamaesiphonaceae(0.07);" "Synechococcus(0.33);Prochlorococcus(0.13);Aureococcus(0.07);Geitlerinema(0.07);Rippkaea(0.07);"
+"ds2020-267_746" no_hit
+"ds2020-267_75" "425" "pfam00005" "gnl|CDD|365804" "4.26261e-07" "129" "275" "-1" "pfam00005, ABC_tran, ABC transporter. ABC transporters for a large family of proteins responsible for translocation of a variety of compounds across biological membranes. ABC transporters are the largest family of proteins in many completely sequenced bacteria. ABC transporters are composed of two copies of this domain and two copies of a transmembrane domain pfam00664. These four domains may belong to a single polypeptide as in CFTR, or belong in different polypeptide chains." "Bacteria(0.74);Eukaryota(0.26);" "(1.00);" "Enterobacteriaceae(0.41);Saccharomycetaceae(0.13);Pseudomonadaceae(0.07);Streptococcaceae(0.06);Bacillaceae(0.04);" "Escherichia(0.37);Saccharomyces(0.13);Pseudomonas(0.07);Bacillus(0.04);Lactococcus(0.04);"
+"ds2020-267_750" "211" "pfam02391" "gnl|CDD|376774" "1.24642e-05" "28" "114" "-2" "pfam02391, MoaE, MoaE protein. This family contains the MoaE protein that is involved in biosynthesis of molybdopterin. Molybdopterin, the universal component of the pterin molybdenum cofactors, contains a dithiolene group serving to bind Mo. Addition of the dithiolene sulfurs to a molybdopterin precursor requires the activity of the converting factor. Converting factor contains the MoaE and MoaD proteins." "Bacteria(0.72);Eukaryota(0.21);Archaea(0.07);" "(1.00);" "(0.04);Bacillaceae(0.03);Mycobacteriaceae(0.02);Burkholderiaceae(0.02);Paenibacillaceae(0.02);" "Bacillus(0.02);(0.01);Drosophila(0.01);Paenibacillus(0.01);Mycobacterium(0.01);"
+"ds2020-267_763" no_hit
+"ds2020-267_773" "210" "pfam01641" "gnl|CDD|376583" "5.23903e-34" "16" "174" "1" "pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity." "Bacteria(0.79);Eukaryota(0.16);Archaea(0.05);" "(1.00);" "Flavobacteriaceae(0.05);(0.04);Saccharomycetaceae(0.02);Vibrionaceae(0.01);Spirochaetaceae(0.01);" "(0.02);Mycoplasma(0.01);Vibrio(0.01);Corynebacterium(0.01);"
+"ds2020-267_8" "1703" "pfam00680" "gnl|CDD|366242" "2.85682e-13" "685" "1458" "-3" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_811" "208" "pfam07991" "gnl|CDD|285265" "1.80927e-08" "20" "190" "-1" "pfam07991, IlvN, Acetohydroxy acid isomeroreductase, NADPH-binding domain. Acetohydroxy acid isomeroreductase catalyzes the conversion of acetohydroxy acids into dihydroxy valerates. This reaction is the second in the synthetic pathway of the essential branched side chain amino acids valine and isoleucine. This N-terminal region of the enzyme carries the binding-site for NADPH. The active-site for enzymatic activity lies in the C-terminal part, IlvC, pfam01450." "Bacteria(0.76);Archaea(0.24);" "(1.00);" "Bacillaceae(0.07);Helicobacteraceae(0.05);Sulfolobaceae(0.05);Bartonellaceae(0.02);Leptospiraceae(0.02);" "Bacillus(0.07);Thermus(0.02);Tropheryma(0.02);Corynebacterium(0.02);Pyrococcus(0.02);"
+"ds2020-267_817" "208" "pfam05656" "gnl|CDD|377540" "3.45664e-06" "86" "190" "-1" "pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function." "Bacteria(1.00);" "(1.00);" "Veillonellaceae(0.07);Sutterellaceae(0.06);Sphingomonadaceae(0.05);Rhodobacteraceae(0.04);Caulobacteraceae(0.04);" "Veillonella(0.04);Sphingomonas(0.04);Asticcacaulis(0.03);Dakarella(0.03);Prevotella(0.03);"
+"ds2020-267_837" "207" "pfam04061" "gnl|CDD|367791" "2.43363e-18" "1" "159" "1" "pfam04061, ORMDL, ORMDL family. Evidence form suggests that ORMDLs are involved in protein folding in the ER. Orm proteins have been identified as negative regulators of sphingolipid synthesis that form a conserved complex with serine palmitoyltransferase, the first and rate-limiting enzyme in sphingolipid production. This novel and conserved protein complex, has been termed the SPOTS complex (serine palmitoyltransferase, Orm1/2, Tsc3, and Sac1)." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.15);Nosematidae(0.04);(0.04);Phaffomycetaceae(0.03);Salpingoecidae(0.03);" "Kazachstania(0.04);Thalassiosira(0.03);Trichomonas(0.03);Nosema(0.03);Nakaseomyces(0.03);"
+"ds2020-267_94" no_hit
+"ds2020-267_97" "380" "pfam04879" "gnl|CDD|368171" "1.9903e-08" "125" "274" "-2" "pfam04879, Molybdop_Fe4S4, Molybdopterin oxidoreductase Fe4S4 domain. This domain is found in formate dehydrogenase H for which the structure is known. This first domain (residues 1 to 60) of Structure 1aa6 is an Fe4S4 cluster just below the protein surface." "Bacteria(0.75);Archaea(0.25);" "(1.00);" "Enterobacteriaceae(0.11);Bacillaceae(0.09);Pseudomonadaceae(0.08);Methanobacteriaceae(0.06);Phyllobacteriaceae(0.06);" "Bacillus(0.09);Escherichia(0.09);Pseudomonas(0.08);Mesorhizobium(0.06);Synechococcus(0.06);"
+"ds2020-267_98" "379" "pfam16203" "gnl|CDD|374428" "1.33948e-30" "131" "280" "-1" "pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases." "Eukaryota(1.00);" "(1.00);" "Cryptosporidiidae(0.06);Vahlkampfiidae(0.06);(0.03);Opisthorchiidae(0.03);Chaetomiaceae(0.03);" "Naegleria(0.06);Cryptosporidium(0.06);Micromonas(0.03);Batrachochytrium(0.03);Caenorhabditis(0.03);"
diff --git a/tools/virAnnot/test-data/otu_s1_tblastx.tab b/tools/virAnnot/test-data/otu_s1_tblastx.tab
new file mode 100755
index 00000000000..330d4ca8e23
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s1_tblastx.tab
@@ -0,0 +1,57 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-267_392 26 240 NC_005979 Helminthosporium victoriae 145S virus Helminthosporium victoriae 145S virus 40.0 1 100 6.0 1.12512e-11 66.1329 164750 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Chrysovirus;Helminthosporium victoriae 145S virus CAGCACGTCCGCAAGTTGTCCGGCTTAAATCTTTAGCCCCTAACTTAAGTGCCGCTACAGCTCCATTTTCTATTACTTTTTTTGTTCTATCACATAACCACATTCCTTCGAAGACTGATAGTTGTGAAATTTCATATATGTTGTCTTCATCTAAGTAATATAGAAATTTGAAACTTGGTGTTGCGTCCGTTAAACGTAGATCAGTGAAGTACGCACCCATTCGTAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_268 14 259 NC_001963 Sphaeropsis sapinea RNA virus 1, complete genome Sphaeropsis sapinea RNA virus 1 62.0 1 100 5.0 1.78772e-31 132.115 73497 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Sphaeropsis sapinea RNA virus 1 CAGCACGTCCGCAATGCATGGCCTCTGAGTTTGTGGAAACGAACCCTCTGCCAACCTGGGACGGCACGACCCACGTCTCTAAGTCTGCCAAGTTAGAACACGGGAAGACCCGCGCAATATTCGCCTGCGACACCCGGTCGTATTTTGGGTTTTCGTGGATCCTAGATGCGACCCAACAGGCCTGGAAGAACGAACGGGTTGTCATGGATCCGGGCAAAGGTGGGAAGTGTGGGATGACGCAACGATTGCGGACGTGCTG
+TBLASTX ds2020-267_4 1434 2297 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 44.3 8 100 64.0 1.9240409540575e-07 928.6219 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTCAGCTACTCTCAGCACGTCCGCAATACTAACAGCTCAGCGCGTCCGCAACACGACTGGGGCACACGTCCGCAACGTCCACGACTTATCACTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGTTCGGGCTTCCTATTCCGCTTTATTAAGGTACACTAAGTAACTATTCCTATTAACTCCATCGGGTCCTTAGATCCTTTGAGTAGGTGTAGTAGTGGGCCGCTTTTATTGGTCCCATTCAACACGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCTTCTTTGTGTACCTTGAATAACGCTCGCAAAATCTCGTACCGCTTGATGTTACCATTCCTTGAAACGTTTATGTTCCTTTCTTTTGGTATCACCGCGTCGTATGTTGCGCGCATTATTCGTGAAATGAAATCCTGCAAAGGTCTTTCAAGTTGTAGTGATGCTTTCACCATCCTGGAGTAGTCCACCACTCCCGGTAACACGCCTATCTGCGTGGCACCCTTCCTGAAGCCCGACGACCGTATCATCCACTTTACGTCCGATCTCTTGTCTTCACTTATGCCCCCCACACACCTGTGGGAGGTCTTTATTTTATAACAGTCTGAAACTGTCATGTGCAATCGCTCACATTGTCTCGAGTAGTATTTGTTCCTCAATGACGCCGCTAACCACATTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGATCTACGCGTAGAAACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTTGTGGAGGCTGTTTTGCGATTGTACCACGTCAGGTACTATCAGTTGAGTGTAAATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTGCTCCATTCATACTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTCGCGCCACGAGTCCATATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAGGTATAT
GTCTTTGAATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATGCTGCCGGCCGCACTCCACTGCCACCTACTCTGCCAGTACTCCCGCCAATCAAACTTCCTCGGTCTCTTACCCGCTGAGATCGATCTACTGAAGAGCTGCGAGGCCCTTTCATAAACCAATCCCTCCGGCATCTCGGCCAAGTTAGGGGACACCCTGTTCTTGTGCTCCTCCTCCCAGTTGACCAGTCTTGATTTGCGGACGTGCTGCTCCTTAGATANNNNNNNNNNGGACGTTCGGGCTTTGCGCTGGCAATGGAGAACAGTCCTGACCCTCTAGCGAGCTGCATCTCCTCGGGGGTGAGACCAGCTGCCCACAGTGCCACGCCCGTAAGGAATGAGTTAGTAGCTTCTCTGGTTATTGATAAGGCCAGAGCTACGCTGTCAGAGTTGACTCCCAAAATGTCTACCACCTCCTTGAACGAAAAGTGAACATGATGCGACGCCGTTATCTTGGTGTGTTTTGCCGACATTGCTTCATGTAACTGCCACCCTCTGCCTTGCTGTCCATTTACTTTCCTCAATAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATCGTAAAGACCTGAGGTGTGCCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCAAGATCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_18 840 1037 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 27.1 2 100 15.0 2.0868e-13 98.9223 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAAAGTGAAGCCGGTAAGAGGTCAGGCGACGTTGGCCAGAGCAAGGCTATGGCTGCAGGTGACATAGGGAGAGTTGACGCAATGGTGATTGCGTCACAGACAAGCTGGTGGCACCCTGGCGTGACTATGTGGATTGCAGCCTACAAGCTAGCCGTAGCAATACTGGCTAGCGCCAAAACTCTGATGATGACCGAGAAGGAGATAGAGGCTCTTATCAACTACACGTTCACAAGGACCACGTACAGGAAACTAGTAGCCAGCAACGCGCTAATGGATTCTACGAGAGACATAGCAGCCAGTGAGGTGACCCAAGCAGCATCAACCCCAGTCAGGTGGGAGAGGCAGGTGCACCCAATAGTCCTAGTACTAGACGATGCAGAGTACTCGATTACAAGAAAGACAGCTAGTGCAGAAATCACTAGCGTGTACGACAAAGTGCACTCGCACATGGCGCTAAGCCTTGGGTCTCTCTACGGTGACATGGCGCACACTAGGATGAAGCAGCCAAATAGGATTGGCACTGGTTTGTTGGCAAAATCAGGCAGGGCACAAAGGGCAAGTCCAGTTTTTGCCAAACTGAGATTGACTGATAACACAGTGACAGTTACGGCGTGCCCTACATCAGACTCAGACGCAGTACTGATGTCGATAAGCAAAGGCATTGAAAAGGCTGGCCTACACAACGTTACGCTGGGAAATGAAGTGGTGAAAGTTGTGAGGAAGCCTGAGTACGGCATGACACTGACGTACCTGATACCTTCGACAATCAGTGGGAAAGGTGCTGACAAGTCATATGTCTATTTGGCTGGCATGCACTTCAGGGAGGACGATCTAACGTACTCTTTGCCTACGCTAGAGTTCTTGTCGCAGTTCACGACAGAATATGAACCGGTCAAGCCTGACAAGCGGCAAAAGATGTTTCGCCTGCTAGTAGACCCAGTGACGACAAGGGTCCACCACAGGCACATGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGGCACTTGCGGACGTGCTG
+TBLASTX ds2020-267_699 10 214 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 61.5 1 100 7.0 1.87612e-16 81.712 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACTTGTCTCCTAAATTAGCAAGATCGCGCGTTCACCCTTTTGTTTCAAGCAGGTTGCTTAGTTATGGTGATAACCAAATTGTTAGCGAAGAGTTGTTTGTATCCGTCGGGTTACGCTATGACCCGGAAAAACATGCACAGCATCTGGCCAGATTTGGTATGACCCTAAAAATTGACGAAACTGAAGTGACTATATATTGCGGACGTGCTG
+TBLASTX ds2020-267_595 10 219 NC_038928 Aspergillus foetidus slow virus 1 CP gene and RdRp gene, genomic RNA Aspergillus foetidus slow virus 1 51.2 2 100 7.0 1.97993e-05 142.3464 1087070 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Aspergillus foetidus slow virus 1 CAGCACGTCCGCAACAATGCGTATCTGAGGGCGGCCGTAGGGAAGACCTGGTACGAGGGTGCGCTATCGCTGCACACAGGCGACGATGTCTTTATCAGGGCGAACACCCTCGCCGACTGTTCCGTCATTCTCAGTGATGCGGTTGCCTTCGGATGCCGTATGAACCCAACCAAACAGTCAATCGGATTCTACAATCGACTAGCCTTGCGGACGTGCTGA
+TBLASTX ds2020-267_512 12 225
+TBLASTX ds2020-267_10 16208 1619 NC_038825 Flammulina velutipes browning virus CP1 gene for coat protein, complete cds Flammulina velutipes browning virus 35.1 2 100 30.0 3.63103e-21 125.3928 568090 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Flammulina velutipes browning virus CAGCACGTCCGCAATTTGGGTGGTCTGTTGAGACCATTAGATTGTTTCATTGCGTGTTGAACGCATTGCGACAGAAACAGTTGAGTGGGGCTTAAAGTAGAAAAAAAGCAAACAACAATGGAAGGTCGTTCAGTAAAAAGAAATTAGAAAACAGAAAAAGAGAAAAACTCGGGGGTGTCGCGAGAATTTGCGCTTCTCTATTCAAATCTGAGTGCGGAGGGGGTGTGGTAGTAGCCGGAAATCAACGGTGCAATGGTGTTGCTGACGTTGTATTGCGAAGTTCGACGACTATCGGGAATACTGAAGATTGGTCCGACGTGGGTTGACTTAAAGTCAGGGCCAGAAGTGTCGGTGACATCTTTGTTGATGTCAGTCCAATCGGAGTTGAGCTGAGTGAGGATGCCGGCCTGTTCAGTGACTAGGTCGAGAAACTCTTCAGAGTGGAGGTGGATCGTAGTGATTCCAGTAAATTCTGGAATATCATACCGGAGCGTGGAACCGGTCTGATAACGGACTTTGCGCGTGGTAACGGCATGAACAAGAATGTTCTTGTTTTGCCTAGTAGCCACGTACTTTGTACGTACATAGGAGATCCCAGTGCCAGTAGTGGTCACGGAGCCAAGGGAAACAGTGTCCTTGAAGAAATCACTGTAAGGCTGCATGACGCGGATGACTTGAGCAAACCAACCGTAAGGTCGGTCAGCATGATTGCCGATGCCGCGAAAACCGAAGACCTGGTCGAGGTCGAGGGTATCGTCGTCGTCGGAGATGACATATTGACTGTCACCGTCATTGGCGAAGGGGAGGGTGTTGCGCCACACGTTGGATGAGGTGGCGAGGCCGTTGAGGAGACCAACAGTGGTCTGGAAGTCGGACCGAGCACTAGGCGTAAGCATAGCAAAACGGGTCGCTTCGTCCTTGGAGGCGGGGGCGCCGAAGATCGTCGTATAGACGGTATCCGTGTGGGAAGCATTGGCTTGGACTGGGCCAGAGTTGACAGGCGAGATCAGGGAGATCAATCGCATGAACTGATCAAGAATGAAGATCACATTCGGGAGAATGGTGTGAACTTTGTCTTGCCAGAGGAAACTGGTGCAGTTGATGTCATGGGCATTGGGTATGCCAAAGACAAGATTGCCAAAATTTTCGTTGGGGCCAGCGTTGGCGGCGAGAGACTGGAAGAAGATGGCGACAGGGCCAGGGATCTTCAAGTGTTCGGCCTTGAATTGGCTGTCGAGAAACTCGACAAACAAACGTTGATCGTTGGTGATCATACCACCGTGAGATTGGTTCTTGAGAACCTGGTAGTAGAACAACACAGCGATGTAAAGCTGGGAGACGAAAGGGTGCCAGTCAGGGTTGGCGTCGGTGAAACGCTTGGTTCTGACCATCTGCGTGTCCATGATAGACAGGACGTAGAAGAGCTGAGTGGTGTCAGGCACGACATAGGATATGTCATTGTGCTTGATGCCGAAGAAGGGGAGGTCGGAGACGCCTGATAGCATCATTGAGAGACCCGGGTTCTTGGGGCCAGCGGAGCTTGCAGTGGGTTCGCGAGGGGCGAAACTCTTCTGCTTCTTGGCAGGAACCGAGTATTGCGGACGTGCTGCTCCTTAGAT
+TBLASTX ds2020-267_29 426 726
+TBLASTX ds2020-267_235 16 267
+TBLASTX ds2020-267_177 50 290 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 90.4 3 100 13.0 5.317733333334419e-40 575.046 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F AAGCCCACTATTTCAAACTTTGCTTTTGCTACACTTCTTTGCTCTCTTGACCATCTGTGTTTATTCCCAATGGCTTTTCCCCTGTTTGTTGATACCTATGAGCATGTTGCAAAACATGACAAGAAATATTATGGATCTTTCCCAGCCACCTTCACTTTGGTTGCTGGAGGTGGGGTGATTGATCTTGAGAAAATGTTTTCTGGAGTCCGCAAACTAAAGCGCCATTTGACGCTACACCGAATGTTTGCGGGCTGTGTTCTGGGCACAGAAGCTGCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_444 10 233 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 68.5 1 100 7.0 1.4637e-19 92.2508 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACGTCCGCAATGTGGCAACCGTGTACGACGTTTCCGATGACACCCTGTCTATCAAGTGCCCCAGTATCAGCATATTATTGGCGTTTGTGTTGATAAGGGACGTGTAATAGGAACCACTCGGCATCGTCCCAAAAAGGTTGACAAGGTACCCCGAAGGATGCTCAAGAAGCTTCTTGAGAAGCTGGCGCTTTGACACAGATGACATAGCCTAACGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_441 2 234 NC_006961 Pleurotus ostreatus virus 1 RNA-1, complete genome Pleurotus ostreatus virus 1 36.2 1 100 9.0 6.11518e-09 56.9688 674983 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Betapartitivirus;Pleurotus ostreatus virus 1 CAGCACGTCCGCAAGTTGAGTTCAGTGGTGTAAACGAGTTGTCCAGTGTGGTAACGGTAAGGGAGTACAGTAATGCCAGGTTGTGGAAATCTGTTGTTTGGAAGTTCGTTGTCGTCTAAGTGACGATAAAATTCGAAGGGTTCGTTACGGTCAATGTTCGCTTGAGTGTAGCGTTCATATGTTTGAGAGAAGGTGTGTTCGTATTCTGATGTGCGATGACTTGCGGACGTTCTG
+TBLASTX ds2020-267_7 1414 1772 NC_033486 Wuhan fly virus 5 strain fly34516 segment Seg 2 hypothetical protein gene, complete cds Wuhan fly virus 5 28.4 1 100 15.0 9.16869e-08 56.9688 1923699 Viruses;Wuhan fly virus 5 CAGCACGTCCGCAAAGTTCGCTCTCTTCATTGAGCTAATTGGTTAAAAGTCTACTTGTTAAGTAGCATTCACATCAAGGAAAGAATTTCGTCAAAATGGCATACCAAAAGCCCGACAAATCGACCGTCTCCGGCACGACTCTTACGCCAGATGACTCAGCCTCACAAGCTGGTCCACAAAATGATACCCCCAATCCTGCGAAGTCCGGACGCCCAAAGCGTTCATCAAAGATTTCAAAGGGCAAAGATCTACCTCCGGGTGCGATCAAGGTACCAAAAGGTGGCGCCAACATGACGGGGAAAGCATCTCCCGTACAGTCTGCAACCATTCCATTTCGGGATGGGGAGAAATAGACCTCAACTCTCATAGAAATGAGATTGAGCCGGTCTTCACAGTCGACGCTCAGCCGTATGACGACCTTGTCAACGTGGTGTACTCATCACTTCAGTCGCGATACTCAAATGCGGCGAAGCACATCCCGTTTGGCCTCTTCCGCTACTACTGCATGCAATTGTGGTGGTATCGGGTTCTTTTTCTGCATCGCACGAACGGCAATGCTCTCACATCTGACGAACGTCAGTTCATGAGCATCATGGAGACTGGACAAGAGTTCCAAATCCCCTCCCAAATAGCACAGTATCTTGCCAACCTTGGCAATTTCATGCAAGGAGGAGAGAACTTCTTTTTCCGCCTGCCCCCACACGCCTTCGCCGAAGCAACAGGCACTATCCACTCAGGATGGTTTGCCTCTGGTCTTCCCACCGCCAAGGTGGACACAACTTCCTTCTGGAAGTACGCTCAACTTCCGAGTCCGGGCGTTTTCGTGTCCTATATGTGCAACGAAGCACATTACAACACCCCTGGCCACCAGCCCAATCGTCTCTTCGATCTCTCAGAGATCGCCCCCACCATTTCCGACGACAGTTATTCAGTTCCGACTGATAACATCGTTGGTTGGAGTAACGGCATTTACACTGCCACGCACGCCTCCTGGCGTTCGACATACTCCAATCTTGGCTGGTCAATCGACGGTTGTGCCCTTGACTCTCAGACAACATTCATGCTCTCGACATCGACCATGCGTGCCGTGTCTGACCGTATTGCGTCCGTCACCGGACTCAAAGTGAACACGTCAACACAGTTGACACTCTCTGTGCAAGGCAATCCCCTGGATTGCTACTACCTTGCAACTGTGGACTACGCCTCCAACCGCTCTCAGTGGCCAAAGGCACCTGGTCCTCATCAACAACAGAAAGTGAACGGCTGTTTGCACACAGAACTCGCCCTCCACTCCCGCTACGCCATGGACTCAAAAGTCCTATCACCCGCGTTCTCGTTCGGATATCGCCTAGAGCGATCGCTCATCTGGAACGGTACATACGATACCGACAGACGTCCGGTCCACGCTCAGGCCAGCAACTATCAGCCCTGGCTGATACAGTCTGAAGCCGACGACAAATACCGCGATCCTGGCCCCGCATGGATGGCCCATATGAACGATTCGTTCAATTTTGGTTCTTCATTGAACTTGAATTTACGACGATTTTCGACTCATGGCCTCATTCGTTCTGTCGCGCTTGACGCGTCCGTTGTCCTCAGTGACACCAAGTAGAAACTTCTTCTTCTACTACAGCAACTCTCTCTCTTGGTAAAGCTCACTGGTAACCGGTCCAAAACGAAACTCTTAAAACAGTGGATACCCTCCGGGGCGCACGTCCGCAAGGGTCCGGCAGTTGCGGACGTGCTACCCAAAGACCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_692 5 214 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 67.4 3 100 9.0 7.700429233333334e-12 283.7636 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F GACGCACTGACCGTCTATGGGGCTGGGTGTAATGAAATTGTTGGGGAGTGGAAAGATGCCTCTCCACATTTCACATTTGAAGATGCCACTTTGGATGAGGCTATTAATGGTGTTGAAGACTTGGATTACTTTGACTCCCTTGTGATCGGAACTTCGGAAGGCTATCCCTATGTTCTTGAGAGGGAGACAAATCAGAAAGGTAAGTCGCGATATT
+TBLASTX ds2020-267_496 273 227 NC_038824 Carrot cryptic virus segment RNA 1 RNA-dependent RNA polymerase gene, complete cds Carrot cryptic virus 47.8 1 100 10.0 1.27723e-14 75.7553 589918 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Carrot cryptic virus CAGCAGGTCCGCAACGTCGGTTTTGTGTCCGTATCGGCGGTGCCAATCGGTTGCGAGGGGTGTGTAGAGCGATTCGAGTCGGTCAAACACTGCGCGGAAGGTTGTTCGATTCGCTAAGAAATAGGAATCGGTGGCGAAGGGGGCTTCAGCGTTCACGTGCCATTTATATGGGTAGTGGGGCTGCACATCATAGATGTGGGCAGGTCGTCAATTTTGCGGACGTGCTG
+TBLASTX ds2020-267_40 385 586 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 38.7 1 100 7.0 9.86751e-21 98.2075 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B TCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCTCGCTACCTGTACTTGCAAGCCCCTACTGCTGGTTGGCTGAATGAGAATGATATAGTTTCCCCTTCCATCGTAAGCACGTGCGGTAAGGGGAAAGATCGTCCAGTTCGTTCCTCAGAATCACATACCCTGACGGCAGCCCCCGGAATAACAGTGTCAAATACTGACTCGGGTGCGATTATACATTCTCTCACGTTACAGTAGGGCGTAAAAAGACCCCTTGAACTTAGGTCTTCGAACACCACTTCGTGCCCGAAGACTCTGTAAGCGTTTGCTAGTCGCAAGGCATCTCTAGGCTCCATGACGAAATCATCACCAATAGGTATAGACTGCATCCCTGTCAAATGTGAAATCCCGTCGTACCCATCAACCACACAACCCGCTAACAATGCTCCCGAGACGTAAACAGGTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCGGTATCCCTCAGCACGTCCGCAACTGATAGCTACTCAGCACGTCCCAACAGTCAACCCCTTGCGGACGTGCTG
+TBLASTX ds2020-267_526 4 225
+TBLASTX ds2020-267_305 14 253
+TBLASTX ds2020-267_204 13 279 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 35.8 1 100 8.0 1.7348e-05 45.9718 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACGTCCGCAATTGGATACCGGTCATTCACTGAATTCGTTGATAGAGTAGGCGGTGTGTCAAGGTACGGAGCACATTTTTACGTCGATCACCACGTGTTTGCATCTTCATTTGAGGAGGGCCACGTCCTTGGCGATGTTGTAGAAGAAGAGGACTATAACGCAGCAACCATTTGCGGACGTTACGCGTCGGACATAACCTTTTCCTGCGAGTCAGAAACGCCAGATTTTGAATTGGTAGCAAGATTTCTGTCGTCGGAAGCTGCGGACGTGCTGAG
+TBLASTX ds2020-267_419 16 236
+TBLASTX ds2020-267_130 45 330 NC_006937 Fusarium graminearum dsRNA mycovirus-1, complete genome Little cherry virus 2 52.4 2 100 8.0 1.496345e-12 249.1092 154339 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Closteroviridae;Ampelovirus;Little cherry virus 2 CAGCACGTCCGCAACTGCAAATGGATAGACTCCAAGGTCCGAACTGTAATTGGTTCTCCTATAACCCAGTATATAATGAGCACCATATGGAATTATGGTCCCAATCACAACTTTGCTTGGGAGACCACACCCATCAAAGTGGGCATGCCACTAAATGGGTTTTGGCTGTCCAAGTTGTTCTCTAAACATGCCAGGTGCCAAATGCACATTGAGGGTGACTTTGAAGCTTTTGACTCAACCATCTCCGGGTCCGTTGTTGACCTTATTAAGGATGTGAGGAAGAAAGGGTATGAAATGCATAGAGACAGGGCTTCAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_27 60 729 NC_006937 Fusarium graminearum dsRNA mycovirus-1, complete genome Little cherry virus 2 47.7 3 100 5.0 1.29455e-22 141.58100000000002 154339 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Closteroviridae;Ampelovirus;Little cherry virus 2 ACAGCACGTCCGCAATTGATGCAGTTTCAACCTCGGCCCAGGCCTTTGTAGGGTTTGGTGGAGGCTTTGCCTCTTGAGTTTCATTGTGTTTTACATGCCGACGCAGTTTTTGATGCCTGTGGTGGAGTTTTTGATACAGGTCTTTGCCACCCTTACTACTCGAGGGTTCTGGCCTGACCATAATGACTCTGGTGGGTCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGTTGCCTTCATTGATGAGTTGGGATTGCCTCACTATCTACGATCCTACACCCCTGTGGAAATGACTAAACAGGCCCTGGACAAGTCTCTGTCTCTAATGGCTGAAGTCGGGTGGCCAGTGAATGTGGCCACGGATGAGAGGGTTGATCCCATTGCGGAACGCATGGGATTCAAAGAGTGGGTCCTTTGTGGACGTGCTGNNNNNNNNNNCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTG
+TBLASTX ds2020-267_51 94 500 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 54.8 1 100 5.0 4.95153e-19 92.2508 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A CAGCACGTCCGCAAGGAATTCCCCCTCAGCACGTCCGCAACGTATGCCCATCAGCACGTCCCAAACCCAACCCAATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCGAGAAGCAACTAACTCGTTCCTAACGGGTGTGGCGCTGTGGGCGGCTGGCCTCACTGATGACGAGATGATGCTTGCTAGGGGGTCAGGGCTGTTCTCCCTCGCAAGCGTCAAGGATTACAAGCGCGAAGCTAAGCGCATAAGCGTGGAAGCAAAATCTCTACAAAACTTGGTAGATGTGGACTTGAGAAAGTTCTTCGAACTAGAGGTGCTAGTCAATAGGGGACACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAAGACCTGAGTTTATTGCGACGTGCTGAGGGACTCGAGTTTGCGGACGTGCTGAGACGTAAACATTGCGGACGTGCTGCGCCTTAGATAGAGCGGA
+TBLASTX ds2020-267_9 1360 1660 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 33.7 6 100 35.0 5.95825e-14 361.9737 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 TATCTAAGGAGCAGCACGTCCGCAAGCCACGTACGGTGAAAAGAGAGCAGTCGCGCCTGGCGACTTGGGCTTGGTGGACTCGCTTGTGGTGAAGTCACAGATTGATTGGTGGCATTGCAATGTCACTATGTGGGTGGCCGCTTACAAGTTGTCTGTGACGCTAGCTGCATCGTGTGGTGACATGAACTTCAGTGGTGAGGAAGTTAATGAGATCATACAGTACACGTTCAGCCGCTCAACATACAGGAAGCTCGTAGCGAGCGACGCGGTGATGGACTCGACTAGAGACATTGCAGCAAGTGAGGTGACGCAGGCAGCGTCAACGCCAGTCAGGTGGGCTAGGCAAGTGAACCCAATCGTGCTGGTGCTCGACGATGTCGAGTACGCCATCACACGCAACGAAGTTAATGATGTCTTGACAAAGGTATACGATAAGGTACACGCTGCAATCATGAAACAAGCTGGAAAAGGTTACGGTGACTACAACAGTACTGGGCTTGAGCTGGTCTACAGCGAGGAGACAGGGCTATCAGCAGGTGAAACTCCGAGAGGGGTTTTGAACCCGGTTTTTGGTTACGCAAAGCTGGCAAATGGCGCAATAACTGTGGAGCCATGCAAGTGCGCAGACTCAAACGCCGTACTCATGACGATGAGTGAAGGTGAGCAAAAACCAGGGCTGAGTGAGGTGTCAATCGGCAGCGAATCAGTCAAGGTAGTTAAACGAAACAGAGGCGGAAGGACTTTGACCTATCTGATGCCAGAGACGATAAGCGGCATGGGGGCAGACAGGTCATATGTCTATCTTGCGGGGATGCACTTCAGAGAGGATGAGCTCAAGTACTCACTGCCAACCCTGGAGTTCCTGTCACAGTTCACAACAAAGTACAAACCACTACAGCCGTCAGAAAGGTTGAGCAAGCTACGAGTGCTAACCGATCCAACTTCAACGCGAGTGCACCACAGGCACATGTCTATGTTGACCGTGATGGCGACTTGCTGTCATGCGTGGGCTCCGTGCATGGACACAGTGTTAGATTGGCCTGACATCACGAACACGTTTATGTCAGCGCTAATGCTAACGATGGCTGCAGTGCCACCTGAACTGTATGTGCTCATGTGTGAATGGAACGGGTGGGCCAGCTGCAAAAGCATGGCAGAGTACGTAGTGACTGCGAAAGAACTTACAACAAAGATGAAAGCTCTAGACAACCAGGTGGCAATCGGCGATTTTGAGCTGGACCTGTCGCCACTGTTTGAGTGGGAGGTGTTGAATCACAGAGCTGTGACAAAAGGCATCTACGACAAGGAGCTAATCGAAAGACGTGATGCAATGCAAAGCATTAAGCTCACGCCAGAGCAGCTCAGGCCGCACATCGATAGTGTATTCAGGGACATCAGTGCGATACTAGACAAGCGCACAAAGCATGGTGAGAAGTCGCCGATTTTTGCAAATTGGGACGATTGGTATGCTGATAGGGTGCAGGCAACACCTGCGGGATCAGCATTCACAGTCGAGGAGTCTCTTTTGCAGGCAAGACAAGTCTTAAAAGATAACGGCGTGCAGAACCTGACAAAGACACAAGTCATGGCGCAAATGCAGGATGGATTAAAACTGGATACTCTACTCAGTCATGAGCCAGACATCATTGCGGACGTGCTG
+TBLASTX ds2020-267_615 4 218 NC_039078 Prunus virus F isolate 8816-s1 segment RNA2 polyprotein 2 gene, complete cds Prunus virus F 66.3 3 100 15.0 1.3506373333333334e-12 273.5446 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F CAGCACGTCCGCAAGTTCATCGGGATGTGTATAGTGATAGGATCACTCGATTCATGCGTCTTGGTTGGCAGGGGCTGGTTGGAAACACAGCAACAACCACACGCATCGAGAATGCAGAATTGACCACACTTGGTGGTAATCATGTCGTTGACGTTCCCGTTCCTTTTTTATGAACGGAAGCTACGACTACAAACCCAGTTGGAATTGCGGACGTGCTG
+TBLASTX ds2020-267_482 16 228
+TBLASTX ds2020-267_184 26 288
+TBLASTX ds2020-267_8 3373 1703 NC_028469 Penicillium aurantiogriseum partiti-like virus 66 kDa protein gene, complete cds Penicillium aurantiogriseum partiti-like virus 47.7 7 100 100 1.2504600000000032e-13 1057.2269000000001 1755781 Viruses;Penicillium aurantiogriseum partiti-like virus CAGCACGTCCGCAAACTGGGGTGTCTGGTATGGTAACTTCTGTTTTTTGTTACTGATATGTCAATCAGTAAAGAACGCTTCCTCGAGGTGGAGTTCCGAATAGAGGGGCCGTGTTTCTTGATATTTTTCGAAATCAGAAAAAGAACGTTGGCGTAGTGCTCTGTTGGAATAAGCCTCGGGTATGAACGCGTACTCGGGTAGGTTTCTATCTCTTCTTGAGATGAATTTCCGTGGCGAGGGTTGAGGTAGTAGCGCAGGGAAGAAAAATCCGCCGAAAGGATCGGTTTGTCGGATGGGAAGTGTGATTTCCTTCATCTCGAGACCGAGAGTGGAGAGATATTTGAATGCCTTTGAAGGCTTCTCTGCCACGTAGGCGTTGAGGGTTTTCTCTTGTATGCCGTTGGTGCTCATGATGTGTTTGATCGCATCATAGAATACATTGCATAGTTTTGGATCCATGCAGGAGTAGAGCTGTCCAAGTAGGCGTGCGCATGACTCGAGTGGTGAGTCAACTGGGCGTTCCGGGTAGATGGTGGAAGCGAAGATGAAGTCGTATGACCTTCGCGGTCCGGTAACTCGGTGGAAGTATCCGAGCCAGTGTATATTCTCAGGGTTATTACTGAGAATCGTCTTGTCCAGGTTAAGAATGCCATTGAAAACATCCTTTAAAACAACACCAAGTTCGACGAGATCAATCGGTCTATCTAGAAAGATGGACGAATCATCTCCGTAGTAGTAGTCCTTAACGGGTAAGGCTCCAGTGACTCGGTAGATGGCAGTACGCATTTGCACTGCGTTGACGATTGTGTCGAGAAGGTTGGTCCACATTGAACCAGATGGGATGCCAGTGCTCTTTTGTACTCGGAGACCGCGGGGTGTGCGTATCTTCGTGTTGATGAAGTAAGAGACCATGGCTTTCCATCGTCGTGCTGTTTGGTCTGAACGGACGTTCCATACTATCCCTTCAGAATCTCTGACTTTTGAAAAGTCAAACCAATCAGAAATGAACGAGAATGTGTCTCGTATTATCCAATGGGTAACATTGGCGTCGAAGCGTGAAAAGTCGGTGGTGAGGGAAACGATATTGTCGATCATGCTCCTCGCAAGATGCGAGTGGCCTGACTTCATTGTTTCCATTCCGATGCCGTAGCACGCGTCCTCTCTGTTGCAGAGTTCCTTCAATTCTGAGAAAAGAGGAATGAAGAAGCGGGCCTCTTCAAGGATGACATCAGTTGGGTAACCCCAAACTGGACGTACTTTGACATTCGGTTGCTCACTTGCGACAACCCTGTTGAAAGCAAGGCAGTCGGGCAGCGACCATGGGATTCCTCTTCCGATACTATCCCAAGCCCGATGTATCTTTCCGGTGGCAACTGGGTCTGCGAAGACCTCAGCTTTTGTCTTGTATCCTTGGTTGACCCAAGGGAAGCCGGGAGATGTCGTGGTGGGCATTGCGGAGTGCTTGGCAGCAGCTCCGAGGGTTAGCGGTATGATACGGTTAGCGGGGCGAAGTTCATCGAGTGTTTTCTTGATAATCGCAAGATAGTCACCATCAACACACCGGGTGGTGGGTCGTTGGTCGTAATCCATGAGATTATCTTCGAGAACCGACTGGTCCGCGGACGGACGGTGCCATGTCGATGAGATGTTGCTAATGAAGTCACAGAGATCCGGAGAACCTGTCAATAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_316 18 251 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 63.2 1 100 5.0 2.97582e-26 114.703 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GACGCACTGACCTTTGTCACCACGTTTGTGATCAACGCGTAGAAACTCAGCTATTGCACCGAATGCGCACTTAGAGGGCTGCGTTCGTATGCAAAGCCTTTGTCCTCTCTGGAGTGTGAAACGAGTTATTTCCAGTGACGTCGTCCCTAGAAGCACATCGTCACCGTTGTGCAGTGAAGAGCCGACTTCTTTCATCGGACCCAACATGAAGTCGGTGTAAACGGCATTTCGGACGAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_14 1984 1335 NC_033486 Wuhan fly virus 5 strain fly34516 segment Seg 2 hypothetical protein gene, complete cds Wuhan fly virus 5 28.4 1 100 15.0 2.39383e-07 55.1359 1923699 Viruses;Wuhan fly virus 5 CAGCACGTCCGCAACCGGGTATCCACTGTTTTAAGAGTTTCGTTTTGGACCGGTTACCAGTGAGCTTTTACCAAGAGAGAGCGTTGTAGTAGAAAAGAAGTATTGATCTACTTGGTGTCACTGAGGACGACAGATGCGTCAAGCGCGACAGAACGAATTAGGCCATGAGTCGAGAAACGTCGAAGATTCAGGTTCAAAGAAGAACCGAAATTGAACGAGTCGTTCATGTGTGCCATCCATTCGATGCCAGGATCACGATATGTATTGTCGGCGTCAGACTGTATCAGCCAGGGCTGATAATTGCTGGCCTGAGCAAAGACCGGTGATCTATCTGGATTGTATGTTCCAGACCAGATGAGCGATCGCTCAAGGCGGTAGCCGAACGAATACGCTGGTGACAGGACTTTGGAGTCCATGGCGTATCGAGAATGAAGGGCGAGTTCTGTGTGCAAACACGCGTTGACCTTCTGATTTTGATGAGGACCTGGTGCCTTTGGCCACTGGGAGCGGTTGGAGGCGTAGTCCTCTGTTGCAAGGAAGTAACAATCCAGGGGATTGCCTCGCACAGAAAGAGTCAACTGTGTTGACGAATTCACCTTGAGTCCTGTGACGGACGCAATTCGGTCAGACACGGCGCGCATGGTCGATGTGGAGAGCATGAACGTTGTCTGAGAGTCAAGGGCGCAACCATCTATGGACCAACCAAGATTAGAGTATGTCGCACGCCAGGAGGCGTGAGTGGCAGTGTAAGTGCCATTACTCCATCCAACGATGTTCTCGGTCGGAACCGAGTAACTGTCATCAGAAACGGAAGGTGAGATCTCAGAGAGATCAAAAAGACGATTGGGCTGGGAGCCAGGGGTGCAAGAATGTGCTTCATTGCACAGGTAAGACACGAAAACACCCGGACTCGGAAGTTGGGCGTACTTCCAGAAGGAAGTAGTGTCTACCCTAGCGTCGGGAAGACCAGAGGCGAACCATCCGGAGTGGATAGTGCCTGTTGCTTCGGCAAAGGTGTGGGGAGGTAGGCGAAAGAAGAAGTTTTCTCCTCCTTGCATGAAATTGCCTAAATTGGCAAGATACTGAGCAATTTGGGAGGGTATTTGAAACTCCTGCCCCATCTCCATCACGTTCATGAACTGACGTTCGTCAGAATTCAAGACGTTACCGTTTGCGCGATGCAGGTAAAGAACCCGGTACCACCACAATTGCATGCAGTAGTAGCGGAAGAGGCCGAATGGGATGTGCTTCGCCGCATTTGAGTAGCGCGACTGAAGTGATGTGTACACCACATTGACCAGGTCGTCATATGGCTGTGCAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_588 38 219 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 35.4 1 100 7.0 1.82953e-09 58.494 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus CAGCACGTCCGCAAGAGCCTTTCCCTGATAACTTCTCGTTCGCCAGGCGACAATATATCCTTTTCCATCTCTACACCATTTACCCTTGTTTTAAGTGATACATTGCGCCTTGATTCTACATTAAATACAAATTTTTTGTTATGGTTGTGAGAATCTGCCATGCCATTCATGTAATCCACGACTCTTGCTGCTGATGCCATTTTGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_272 4 259 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 90.4 3 100 9.0 3.231256727625802e-20 349.6072 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F GGACGTTCGGGCTTTTCGTGGTGTTTGGGTTGCAATCCGCAATACTCAATGACGCTGCAGTCTTGCTTGGTCAGGATTTGCCCTCTTGGCTCAAGGAATGTGATGCTATGGTTGACTATATGCACTTGTTTGCTGTAGCTCCGCGAGATGTCATTGATCGTATGCAAAAGCCTCTCAGCCTTGGGAGGCAACTCAGAATTATCTACAGAAAATTGTGCAATAGATATCGAGCTTAGTTCCCGGGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_355 78 244 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 69.8 1 100 8.0 5.21666e-22 100.499 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAAACCCCCCTCTTAATAATCCCCGTAACCCCCGAGAGGAGCACGGGCCACTTTGGCGTTAGGCCACGCCTTGCGATAATCCTCTCGCCCCAAGAGGACTAAATCGCGCCACTGCTCAAATGTCAGCCGCTTGGGAATTGGCACCTCAACACCCACATTGCTATAGTCCCGCGATACCATGCGTTTGAAGTTCGGGGGCCAATCGAGGGGCGGGGTCATTTGCGGACGTGCTG
+TBLASTX ds2020-267_856 16 206 NC_010985 Curvularia thermal tolerance virus RNA1, complete sequence Curvularia thermal tolerance virus 37.2 1 100 6.0 0.000320058 40.9315 421976 Viruses;Curvularia thermal tolerance virus CAGCACGTCCGCAAGGACCATGGCATATTTAATTTAATTCTAAAGGAAAAGTGGCAAGATGTGTGGCACTCTGCTGAGATGGAGAGTCTTGGTGATGATAATATCACAGGCTTACCGGAGTGGATGAAGCATATCACAGCCGAGGAGTTGGGGCAATCCGTGTTGGATATGACGGGGATAAATAGGCAGAGGTTGCGGACGTGCTG
+TBLASTX ds2020-267_61 32 465 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 72.3 6 100 11.0 5.1484708137e-16 421.9992 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F CAGCACGTCCGCAAGGATGCACTCTCAGCACGTCCGCAATAAAGGGGCATGTGTTGCGGACGTCGCTTAAGGCGACGCACTGACCGTCTTTTCGCCCTTGGGACACTCGATTCCCACCAGTTCTGGTACCTGATTGGCACATTCTTCATAGAGTGAGGAAACATCCTTAGCAACTTTTGAATTGGGTTGTATTCTCAGGCTTCCAACCTCACCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTGAAGTCAACATGTTCTGTGCCAAGCAAACGAGGATCATTCTTCGTGATAACGCTGGGTATCTTTTCACAGGGAGTTTCCAGGTGCCACTCGAGTGGTGTTTCCACCAAACTGGAGGGCCACGAACACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGTAAGATTCCTTCGCACGTCCGCAATAGAGCTGTCTTTATTTGCGGACGTGCTG
+TBLASTX ds2020-267_21 912 858 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 58.3 4 100 63.0 1.336125e-15 550.4540000000001 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAAATCCCGCTTGTTTCGTGAGTTGGCCATATTCCGGATAGAGCAGGCGCAGGTAGGTCTCCTCCGCTGGGCGGTAGGGAAGGGGGAGCTGAATGACCCCATCCACCACTGGGTAGTCGGCTAGGAACCAATACTTTCCCAAGAACTGAATCCCTTGAAACTCCCCCTCAATGGCATCCAGTAGACGGGTGGTGGAGAAGGACTTCTTTCCCCACCAATCGATGGCCACCATCCTCTGGACACACTCCGCAATCGTCTCCGTCGTGAGGTGGGCCAACCTGAGGGAGACCGCCATGATATTGTCGTCCCCCAATGACTCCATCCATGCGTGCTCGTCAATGTTGTCGATGGTGAGCCCCCCGTCCAGTTCGAAAAGCGCCGCATATCCGATGAGTAGGGTGATGATGGACTGCAGGAGCGTGTTGTGGGAATGGCCACTTGTCGTGCCCACATACTTCTGCATGCGGACCCCATCATCGCGATAGATTGGAGCCCGCAGCAGGCTTTCTGCCACAAAGGCCCAATAGGTGTCGTAATCGGGATTGTCCCCATCGTAATACTGCTTGCGACAGATGTTAATGGCGATGGTGACCATCCATTCATTGATGCTGGAGTCGAACTTCTTGGCGTCGAAGCAGAAGAACTTGTCGAAAGGCGCCATCCTGTCGATGAACTCCTGTGACCCCCCGTGGTACCATGATTGACCCACCGCGATTGGATAGTTAGGGGCGGACCAGGCCTTCGTTAACTGGTTCTCTGTGACCCCACACAACTTCAAGTCACGGTGGCTCATCATGAGGATCAGACGCCCCACGGGGGGGATCTTGGATTCCTTGCGGACGTGCTG
+TBLASTX ds2020-267_2 7516 2436 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 41.5 7 100 53.0 5.655557142857142e-05 679.2049 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAACAGTTGGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGGCGCCTTGCATGGACAAAGTTCTGCAGTGGCCTGACATAACGAACACGTTTATGTCATCACTACTACTTGCCATGGCTGCACTACCACCAGAGTTATATGTACTAATGGTGGAGTGGAACGGCTGGGCAAAGTGTGGCTCTATGGCAGAGTACATCGTAGAGGCAAAAAACCTGACGACTAAGATGAAGGCACTGGACAACCAGGTAACATTGGGTGACTTCGAACTCGACTTATCGCCTTTATTCGAGTGGGAAGTGCTAAATCACAGAGCGGTCTTGAAAGGCATCTATGACAAGGAAGTCACAGAGCGTAGAGATCAGAAACAGAGCATCAAGCTATCTGCTGCCGATCTGGAGGAAGAAATAGACAGCGTGTTTCAGGACGTGGGTTCCGTTCTAGACGCCAGGACAAAAGAGGGTGAAAAATCACCTCTGTATGCAACGTGGGATGATTGGTACGTTGACAGGGTGCAAACCACACCAGCTGGGTCTGCATTCACAGTCAACAAGGACATGATGGAGGCAAGAAACATGCTGAAAGCCAATGGGGTCCAAAATCTGACCAAGACGCAAGTGATGGCGCAGATGAGGGACAAGCTCCCGCTGGCGTCTATCTTGGGTAGCGAGCCAATGATATTGGCCCAGATGTCATGGAAGTTGGAATGGTCAAAACTGAGGGCACTATTTGCTGCTAGCATGGAGCACTGGATGCCATCGGCATTCGCCCTGGGGCAGATAGAAGAGTATCTACCCAGTGACTGCCCCATAGGTAAAGCTGCCGATGCGCACAACGTGTGCAGGCGCGTGATGGAAATGTCAACGCAAGGAGTGGTAGCATGCATAGATGCAAAGAACTTCAACATCTTGCACACCCACGAGATAATGTCAGCAATACTGAAATCCGCATCAAAGATGCTAGGAGATAGGCTGTCTAGTGAGCAACATGACTGCCTAAAGTGGCTGGCGAAAGCGGAGCTGAACCAGAAAGTGCTGGTCAAGACAGGTGAAGTAACTGAACAGTTGCTCCAGGTCGGCAGGAGAGACGGGTGGATTAACAAGCTAACTAAAGGTGACGGCACAGTGGTAGAAGCGGCTGACGTGACGGTTGGAATGTTTTCAGGTACTAGGTTCACGATGCTGTACAACACAGTGCTAAACAGGGCGTACTACAAAGTGGCGGAGAAACGTGCGAAGATAAAGACTTTATCACTTCATTCGGGTGATGACGTGTATGCTGTTTTCGCTAACTATATAGACGTGTACAAGATGAAGCGTGAGATGGCGTTAATCGGCTACACACTGCAGTTAGGCAAGTGCTTCTTGCAGGGAGTCCGAGAATTCTTGAGAATATCTCATAAGAATGCAAACACTTCTCAATACCTAGCGAGGTCCGCAGCAACGGCAATACATGGAAGAATAGAGGCAGATGAGCCTTCTGATTTCGTGGCTTTTGTGGGGTCAATAATGAGAAGAGGTGCAGAGATGGTGGTCAGGCACGCGGCAAGAGCAGTGTTGCTAGATGTCATGAAGATACAGATAGCAGGAGCTTGCGCAAGGTGGGCGATTACAGCTATGGCGTGGGACTCATTCTTAATGTTGCCAAAAACAATGGGCGGT
TGTGCTGCAAAAGCACGCCTGATGGAACAATGGAGTGGTTTTTCTATAGAAAGAACTGCAAGCGCCAGAGGTGGCATCGTAGACTATTTGGCTGAACAACCAGGTACCAAAACAGCGGCGAGGAGGCTGGTTGAGAAGTTGCAAATAATGAAGTACCACAAGAGAGTTGCACAAGCCGTTGCTGCGGCGATAGCACCTAAAGGAGTTTTGAAAAACTACGGTATGATAGTAAGGTGGATGAACAAAGATGACATGGCACATATGTCGAGAGTGGCAGGGACACTAGGGCGAATAAGACAATCGAGAGAGTACATATTATCAAAAGCAGCAGGATTATTCAATACGCTAGCAATAAATGACAACTTCTGGGGTGATGTGAGCGGTGTGTTCAGAGGCATACCGTCAGCGTGGCACGGCAGAGCACTGACGTTCGCACTGTCTGAGAGGAGTGAGTCAGAAGCGCTGTTTGCAAATAAAATGTACAAGCTACACTATAAAATGACAGAGTGGGCAAGAGCTGCAACAGAGAATAGACTGATAAGAATGCAGCTAGATATGCCACCGGGGTAATGCTGGTGGTAATAAGTACGATAGAACTTGCCATCCACTAGGGAAGTGGACACAAGCGGAGTAGGCGACCGGTGGCAAGTATAACAAGCCAGGCTGAACGGCCGTACGTGGCTCCCAGACGTACAAACATTGGCGCTATCAACTAGCGCCTACACAATATAAAATATGCGTTTAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_56 95 478 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 32.4 1 100 7.0 2.87431e-13 73.0061 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B ACTCTGTATGCGTTCGCCAAACGCAACGCATCCCTAGGCTCCATGACGAAATCGTCGCCAATGGGTATCGATTGCATCCCAGATAGGTGTGACACACCGTCATACTCATCGACTACGCAGCCAGCCAATAGTGCTCCTGAGACGTAAGCGGGTATGCAAGTCAGGCGCTTTGATAAGGGATAGCCCTCCTCTATCAGCCTGGTCGCCTTGACTTCTTGGACTTCGGCAAGGTGTCCAAATTCGAAGGCCAGCCAACACGAGTCGTTCGCGACAGTAGGAACCTCTTTCCCGAAAGGGACAGAGCACATTGCGGCTCTGCCTATTGGGGACATCATCATCCGGATTGCTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGTCTTAACCCTCAGCACGTCCCAATACATTTTCCGTCAGCACGTCCGAAAATCTACCACTTGCGGACGTGCTGCTCCTTA
+TBLASTX ds2020-267_393 23 240
+TBLASTX ds2020-267_50 128 510 NC_038928 Aspergillus foetidus slow virus 1 CP gene and RdRp gene, genomic RNA Aspergillus foetidus slow virus 1 45.9 2 100 8.0 2.41899e-28 142.8046 1087070 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Aspergillus foetidus slow virus 1 CAGCACGTCCGCAACGCCACCGAAGCCTACCTCGCCGACCATGTCTCGAATGTCGAAGCTACCGCCCTGGAGATGGTGCGGGTGGATATAGTGGGTTTAATGGTTACTTCTTCTTACCGGAAGGGGTTGAACCAGACCCACTCAATACCGCCACAGCCCCTGATCCTAAGGAAGCTACCCCCAAGACGTTTGAGATCTTTCGTCGACGCCACTACCCTCATGAAGAGTCCAGTTAGACATGGGTGCCTCACACAGTATCCCATCCTACAGCTCTTCGCCTCACGGCTCTCTGAAGCAGAACTCCGCACCCTCGTAACCGAAGTGGGCGGAGATTCGACTGCAAGAGATATCCGGAGGGAGGCATTTGGCGCCGAATCCGTCACGAGGAACATCGTAGGTTTCATCCCGCTCGCCGACGCATCCTCGCTAGCGTCCAGAACGGACTATGACAACATCATGGTCCAATACCAAGTTTATCTATAATAGCCTGCTACATTTGCGGACGTGCTG
+TBLASTX ds2020-267_266 2 260
+TBLASTX ds2020-267_119 45 342
+TBLASTX ds2020-267_388 10 241
+TBLASTX ds2020-267_6 1161 1860 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 41.9 5 100 39.0 1.1597159999999999e-05 494.24539999999996 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 TGAGGCTATTGTGCTGTTCTTCTGACAGCCTGGAACCTATCATCACTGACGCTGATTCCAATAGTGCTATTGCTAGTGTGTTGTTTTACTTGCCTGGGAGCCGCAAGCGGCTTGCAAAGCCTGGCGTTAATTGTACGTGCACCGGTTGCCTACACCGACGTTGACGGCGCTAGCTCTCCCTCAGCTAACGGGTCGTTAGTGACCAATTCTTTTGCGCCCATTTCGTGCTTGCTTGTCTGGGAGCCACAAGCGGCATTTGCAGCCTGGCGAGTTATTTGATACGTGTACCGAGTGCCTACCCCGACATTGACGGCGCCAACCTTCCCTAGGTTGACGGGAGCCACAAGTGTTTCACACTCATGGCTCTAATTACAGTGGCCTTTGGCCCAAGTTGAGCCTATGTCTCGTTTGCGAGTAGTTCGTCGCCACTCCTATCCACCCCATCACTGTGGTATGTAGCTTGAACCTCCTGTTATCGAACAGTGCTTTCTCCTCGCCTCTTTTCGCCAGCGCGAACGTTAGTGCTCTGGCGTGCCACGCTGACGGTATGCCTCTAAAGACTCCCGTCACGTCGCCCCAAAAGTGGTCGTTGATGGCCAGCGTGTTGAACAAGCCAGCTGCTTTGGATAAGATGTACTCACGTGACTGTCTTATCCTTTCCAGTTGACCCGTCACGGTCGCTAAATGCTCAAGATCGTCCTTGTTCATCCACCTGACTATCATTCCATAGTTCTTGAGGACACCTTTTGGTGCTATGGCTGCTGCCACGGCTTGCGCAACTCTTTTGTGGTACCGCCGTATGCCTAGTGCCTCTACTAACTGTCTCGCAGCAGTCTTGACTCCTGGTTGCTGCGCCAGGTAGTCGACTATACCACCACGTGCGCTGGCAGTTCGCTCGATAGAGTACCCACTCCACTCGTCTGCCTTTCGTGGTCGCGCAGCACACCCACCCATGACGTTTGGCAACACCAGAAATGCGTCCCAAGTCATGGCCGAAATTGCCCAGCGTGCACAAGCCCCTGCAATTTGCAGCTTCATCACGTCGAGCAACACGGTTCTCGTTGCATGTCTGACAACCATTTCTGCACCACGTCTCATGATGGAACCCACGAATGCCACAAAGTCTGATGGTTCATCAGCCTCAATTCTACCATGTATTGCAGTAGCTGCAGACCTCGCCAGATACTGTGACGTGTTTGCGTTCTTGTGTGAGATCCTTAAAAACTCTCTCACACCCTGCAAGAAGCACTTCGCTAGTTGCAGTGTGTACCCAATGAACGCCATCGCTTTCTTCATTTTGTACACGTCAATGTAGCTGGCAAACGCAGAGTATACATCATCGCCAGAGTGTAGTGACAGTGTTTTGATCCCGGCGAGTTCTTCGGCCACCTTGTAGTATGCCCTGTTGAGTATCGTGTTATACAACATCGTGAACCTCGTTCCTGAAAACATGCCAACCGTGACCGTCGCTGCTTCCACCATGGTGCCGTCACCCTTCATCATTTGGTTTATCCACCCTTCTTGTCTCCCTGCCGACAGCAGTTCCTCTGTGACCTCACCTTTCTTCACTAGTACCTTCTGGTTCAACTCAGCTTTGGACAGCCATTTGAGGCACTTGTGCTGTTCTTCTGACAGCCTGGAACCTAGCATCACTGACGCTGATTCC
AATATAGATGCCATCACCTCCTGGGTGTGCAAGATGTTAAAGTTCCTCGCATCTATGCATGCAACTACTCCCTGAGTAGACATCTCCATGACTCGTCGGCACACCCTGTGTGCATCGGCTGCCTTGCCGATGGGGCAGTCAGCTGGCAAGTACTCTTCAATCTGCCCAAGCGCTAAGCCGTTGCGGACGTGCTG
+TBLASTX ds2020-267_16 824 1165 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 50.8 1 100 25.0 1.27294e-121 434.533 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B CGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCCTCTTTGTGTACCTTGAATAGCGCGCGCAAAATCTCGTACCGCTTGATATTACCATTTTTTGAAACGTTTATGTTCCTTTCTTTTGGTATTACCGCGTCGTATGTTGCGCGCATTATCCTTGAAATGAAATCCTGCAAAGGTTTTTCAAGTTGTAATGATGCTTTCACCATTCTGGAGTAGTCCACCACTCCCGGTAACACGCCTATTTGCGTGGCACCCTTCCTGAAGCCTGATGACCGTATCATCCACTTTACGTCCGATCTCCTGTCTTCACTTATGCCCCCCACACACCTATGAGAAGTTTTTATTTTGTAACAGTCTGAAACTGTCATGTGCAATCGCTCACACTGTCTCGAGTAGTATTTGTTCCTCAGTGATGCTGCTAGCCACGTGGGCATGCCTCTCGACACCGAGTCGTCGAGGCGTGATTCCAACGCCTCTAGAAGGTCCCTCATGTCACTCGAAGGTTTTGATTCTATCCTCGAGTGTACTAAGGTCGCCATGGCCCTTGATAAATATTGTCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGTGCCCGAAGGTGTCTCTGTACGCATCTATCACTGCTTTCATTGACTGTACACTATGTTGACTGTTGAAGTCTTCAAAGTCTACGCAGTATTGAGTTCTACCCTCGAGAACCGCCCTCACTCTGCTACGAACGTTCTCATCATTCGCAGCCTTGCCTACCGGGAATGGTGAAGGTAACACGTCTTCACAGTTGTACAATTGCGGACGTGCTGG
+TBLASTX ds2020-267_101 84 375 NC_016758 Rosellinia necatrix quadrivirus 1 segment 4, complete genome Rosellinia necatrix quadrivirus 1 22.3 1 100 8.0 0.000188849 43.2225 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAATCAGTGTGTCCTCTGCTCATTGTCACGTGCACCTGACTGCTTCATGTGCTGTAGCCAACCAAACAGGCTAGTCAGCGCGACTGTACCTGCCATTTTAGCTGCACTGACACTGTTGAGCTCGATTCTTGTCATAGCAGCTATCTCTTGTTCATCCAACTGCATGCCGGGAGCAGCTACACCAGCGACTGCCTTGCCGTTAAGTAAGTGCGCCATGACTGCATTTTCACTGACGCTGATTCCTTCTGCCTCAGCCATGATCGGCAGCTCACCGATCACTCTGATCTGGTGCGGCTGAAACACAGTGATGATCTCACTTGTCAGCGTCTTGTCAGAAGACTTGGCCATGGTTGCGGACGTGCTG
+TBLASTX ds2020-267_236 66 266
+TBLASTX ds2020-267_443 18 233
+TBLASTX ds2020-267_450 2 233 NC_006642 Cotesia congregata virus complete genome, segment Circle10 Cotesia congregata bracovirus 41.1 4 100 5.0 0.00020802475 172.0095 39640 Viruses;Polydnaviridae;Bracovirus;Cotesia congregata bracovirus CAGAACGTCAGCAATCGGCGTACCCTAGCGCGTCCGCAAGGAACAATCCTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGAGTCGTACCCCAGCACGTCCGCAAGTAACAATCCTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGCGCCGTACCCCAGCACGTCCGCAAGTAACAATCCTTCAGCACGTCCCAACTATCGGGGCATTGCGGACGTGCTG
+TBLASTX ds2020-267_644 8 216
+TBLASTX ds2020-267_36 424 651 NC_016758 Rosellinia necatrix quadrivirus 1 segment 4, complete genome Rosellinia necatrix quadrivirus 1 28.0 2 100 13.0 3.23046e-12 88.7361 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAACTACGACACGTTTTTGTAGCGCTCCCTGGCCGTGTCTGCGTTCTGCATTGCTCGCGGCAAACACAGCAGGTTGTGTGCATGATCAAGTTGCAGACGCGTAACGTCCTCATCTTTTAGACACATTTGTGACCGCTGTGCCACGTGCACCTCTGCCATCGCTCTACCGCTGCCCAACATCTGGATGCTCGAGCAGATCATGCTGACCATCTCATCACCGTTGATTGACGAATTCTCACTGATCTTGTTAAACTGAGGGCTGTTAGATGATGAAAACAGCCTGTCAACCGTTGGCTCGCAAAAGGGTTGTACCACTTTGTACACCCCTGCGTAAAACACGTCAGCATAGTCGTGGTGGGACAAGGCTGCAGGCTGGTAGGTAGACGCCACAGCTAGCGACGCCATTAACATCACGTTTTTAGAAGCCATGAAGTGCCTGGTCGTGACGTGTCCAATGAGGTCCAACATGTCGTTGATCGAGAAACCAACACTGTTGAACCAGTCTCTGTCGAGGTGGGGCGCTGACGACCCTACACCTGCAATGAAGGACACATTGCACTCACTTGCCACCGCCATCAACTTCTGATGCCCCACAGCAGCCTCAATGGAAGGCGAGAACCCCGTATTTGCGGACGTGCTG
+TBLASTX ds2020-267_5 37987 2029 NC_023684 Rhizoctonia solani dsRNA virus 2 segment 1, complete sequence Rhizoctonia solani dsRNA virus 2 47.6 8 100 100 3.1306275000000004e-37 1379.9565000000002 1411681 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Rhizoctonia solani dsRNA virus 2 ATCGCACATGATAAAGCCCGATATCTAAGGAGCAGCACGTCCGCAACCCTCTGCCTCCAACAATAAAGCAGATTTCTTTGCTCTTCTAACAGCTATTACTTACCACAATGGACCACCTCACTTCCCTTTTCGAGCTTTTTGCTATCACACCGAAAACACAAAACAATCTACAGTTTGTTGGGATCTACCACAGACCTCCACACTCCGTTCGAGCAAACCTCCGCAACGTTGAAAAACACAAAATCACAGTCGCTCACGCCATGCACAAGTACCTTTACCCGCATGAAATCGACTTTGTTATCAACCAAATGCGACGCTCAGACGTCACTGAAGATGCCATACTTGCTGACTTTTTCGACAACAACGTCGAACCACTTGAACCTGTTCTTGACGAACACTTCGAACGTGGACTCTCCGCAATGCTGGACGCTTTTCGCCCTCCGCAGAAATGCCTACCTGCCCACATCTATGATGTGCAGCACCACTACCCATATAAATGGCAAGTGAACGCTGAAGCCCCCTTCTCCACCGATTCCTATTTCTTAGCGAATCGACCAACCTTCCGCGCAGTGTTTGAACGACTCGAATCGCTCTACACACACCTCGCAACCGATTGGCACCGCCGATACGGAAACAAAACCGACAATGATGATTTTATGAATGATCATGTCCCTGCGAAATTTGGCCCTATGAAAGAAACAGTCTTCTCATGGACTCACCGATGGCACCACGTCATCAAATCCAACTTCACCGACACAGCTGGATTGTCTAAAGACTATTACTTCAAAAACCGATACATCTTCCCAATGCTACTTCACACGAAGACAGCGATTGTCAAGAAAGACGACCCGAATAAGATGCGAACCATCTGGGGCTGTTCAAAGCCTTGGATCATCGCAGACACCATGCTATGGTGGGAATACGTCGCGTACGCTAAGTTACAACCTGGAGCCACACCAATGCTCTGGAGTTACGAAACCTTCACAGGTGGCTGGCTTAGACTCAACCACGCACTTTTCTCTTCATACATACGGCACTCGTACATCACACTCGACTGGAAACGCTTCGACAAGAAAGCGTATTTCTGCATCATCGACAAAATTTTCGATGGCGTTGAAACATTCCTCGACTTTGACAACGGCTATTTGCCTACGAAAGATTATCCCGATACCAAATCGACTTGGACACAAGAACGTTCCACCCGCCTCAAACGCCTGTTTGACTGGACAAAAGAGAACTTCTACCATGCACCAATTGTCCTACCCAATGGGCACATGTACGTCCGAAAATTCGCTGGAATACCCTCTGGCCTATTTATCACTCAACTGATCGATTCCTGGTACAACTACACCATGCTCGCAACCATCCTATCCGCGATGGGCTTCGACCCTCGGTCCTGTATTATTAAAGTCCAAGGTGATGACTCAATCATCCGCCTCAGTGCACTCATCCCTCCGGATGCTCACGATTCTTTTTTAACTAAGGTCCAAGAACTCGCCGACTACTACTTTCAATCAGTAGTCTCCGTGAACAAGTCTGAAGTACGCAACGAGCTCAACGGATGCGAAGTTTTATCGTACCGACACAGACACGGTTTACCATACCGCGATGAACTAGCTATGCTAGCTCAACTGTATCACACGAAAGCACGCAACCCAAGTCCCGAAATCACAATGGCACAATC
CATCGGCTTCGCCTACGCTTCCTTCGGAAATCATGAAAGAGTACGTCTCGTACTACATGATATCTACGAATATTACAAGCATCAAGGCTACACACCCAACCGAGCCGGACTCAGCCTCGTCTTCGGAAACTCTCCTGACCTCATGATCCCGCACTACACACTTGATCACTTTCCCTCAATCAGGGAAATAAAAATGTTCCTGACTAATGCAAAATATGCCAATGAAGAAACCAACTCACGAACGTGGCCTTTAACCCACTTTCTCCATCTTCCTTGTCATCGCACTTAGTATTTGAGCAATTGCAATTACAACATAATTACAAAAAAAGGATTGCGGACGTGCTG
+TBLASTX ds2020-267_43 465 563 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 57.9 2 100 21.0 5.04473e-43 192.2912 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAACTACTCTCCCTTGCATCAGGCGGTGAAATGCGCTCTCTGCGTCGGCTTGTGCCAGGGGATTCGCCTCTTCCCTGGTCTTAAGTCCCATTGTAGCGTACTCAATGCCGGCGAACTTCTTGGGGTAGAACTTAACGGTGGCGAGATCTTCCACTGCCGGGAAGAAGAGGAAGTCGGGAAGGTCGAGTAACTTTGCCACTACATAGGCGGCCTTCTCTATGGAGTCGGTGTAGCGGGGGTCAGGGGTGTGATTTGGCCGATCGAAGTGGCGAAGGTGTGCCATCTCAACTGGGGTGCAGGCCTTGACGAATGTGAATTCCTCCGGCTTGAAATTGTTGATGGGGGGGGGATGGAGGAGGGTGTAGGCGACAACTTCGGGGTCGGGTGGCGCAATGTCGAGTTCCTTGTTTAGCTTCCCATAGGCTTCAACCCTACCGAGGATTCGTATATGTTGGAACATGTTGGTGAGTTCCATCACTTCGCGGGTCGCGGCCTCTTTGGACCTCATGGATCGCATACGCGTCCTACGCTTGATAGATTGCGGACGTGCTG
+TBLASTX ds2020-267_453 17 232
+TBLASTX ds2020-267_352 4 245
diff --git a/tools/virAnnot/test-data/otu_s2.fa b/tools/virAnnot/test-data/otu_s2.fa
new file mode 100755
index 00000000000..1ed4abb883c
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s2.fa
@@ -0,0 +1,6446 @@
+>ds2020-328_1
+GGTCGGGATAGACGTTGGAGCGCGGTCAGCCGAGACCCCTGACAGAGGAAAGAGTCTTGA
+GGAGTCCAACGTTCGGCCAGGCATAATAATTCGTGCCCACTAATCGAATCGGTTTACTCG
+CCCACCATGTCAGCGCCTTCGGGTTAGTTCTTTATGGAGTTATTTCTTGTTCTTTCTGTC
+ATAACAATTCTCCTTATGGAAGTCCCCCACAAGATTAAGAATGCTTGTTGCCGCGGCTGT
+CTTGGTTCTTCGTTTAGCTTTCTGGCATATTCTACGGAGCTTTCCACTCTGGAGCTGGCT
+TTCAGAAAAACCTTCATTCACTAGATGTGAAGCACCCCTATGGGGGAACCCTCTTACCCG
+CTTTCCTCCCCCCCCGATATGGGGGGCCTCGCTGTCGCCTTTGGCTCGAGCTACTTTTTC
+TCCTGGAACGGATAGCTTTCTGTCCAAGTCTATCTCCCAAAAGTCAGCCATGTAATTGAC
+TTCTAACGTCTAATTTTCTTTTTCACCGGGGGTCCCTGATCCCCGTTGAATATTCCTTCC
+TTCTGAAAAAGCTGTGACTCCTAAATTCTTTGATTGAATGAAATGTGGACTTGGTCACGG
+GGCAATCTTCTTTTTTAGACCCCGCTTCTCTCGGTGTTACCTTTTTCGCCTTCTCGTCTC
+GCTTCGCGTCGTCNNNNNNNNNNGGTCGGGATAGACGCGCCGCTTCCGTCTGTTTTACCT
+TGTTAGAATTCTCGGCGCGCTTGGCGTCGTCTTTAGAGTCAATTCTATTGGAATCTCCTT
+TCCCCTTCTTTTCTTCCCCCACGATGAAAAAAATAAATATTGCAAAAAGAACAATATTTC
+CCCCCGTGGTCATCATAGTGGTTCCTTCTGATCCTAGAAAACGATTAAAAAGAAGGCAAA
+AAAAACAAAGGAGGATCTGCTTTTTCATATTAAAGCGCTTTCTTTCTTTTAAAAATACAT
+CATAGTAAAGCGCTTCCTTTTAAAAAAGCATCTGGTTCCATCTTTCTTTCGTTAGTTAAC
+CCACCTTTTTCTAAAAGGGATTGTAGTAATTCTGGTTTTACACTATTTAGAATGGCTCTC
+TCATATTGAGAGATTCTGTCTAGTGGCATTCGATCACAGAATCCATTGACAGCTGCATAA
+ATGACTAGAATTTGTTTTTCAATTGGAAGTGGTGCATATTGTGGTTGTTTCAGTACTTCT
+GTAAGCCTTGCACCTCTATTGAGTAATGCCTGAGTCGCAGCATCAAGGTCTGACCCAAAT
+TGAGCAAAGGCCGCCACTTCGCGATACTGTGCCAATTCCAGTTTTAAACTACCGCAGACC
+TGTTTCATAATTTTCAACTGAGCGGCAGACCCGACGCGACTGACAGATAAGCCGACGTTA
+ATAGCAGGTCTAATTCCGCGATAAAAGAGCTCTGTTTCCAAACAGATTTGTCCATCAGTA
+ATGGAGATTACATTGGTTGGAATATAGGCCGATACGTCTCCAGCTTGTGTTTCAATGACG
+GGTAAGGCGGTCAAGCTACCTGCACCTGTCTGGTCCGATCGTTTAGCGGCTCTTTCTAAG
+AGACGGGAATGTAAATAGAAAACATCGCCTGGGAAAGCCTCACGGCCTGGTGGTCGGCGT
+AACAATAATGACATTTGTCGATATGCCACCGCCTGTTTACTAAGATCATCATAGATTATT
+AATGCGTGCATTCCATTATCGCGGAAATATTCCCCCATGGCACACCCAGAATATGGGGCC
+AGAAATTGCAGAGGAGCTGGATCCGAAGCGGTGGCTGCTACAAGAATGGAATATTCCAAA
+GCATTCGCTTCTGAAAGAATTTGAACTAATTGTGCCACAGTCGAGCGTTTCTGTCCAATT
+GCTACATAGACACAATACAATGTCTCACTCTCAGAGGTGGCCCTTGAGTTCAGTTGCTTT
+TGGTTTAATATGGTATCGATAGCAATAGCTGTTTTTCCAGTTTGTCGGTCCCCGATTATA
+AGTTCTCGTTGACCACGGCCTATAGGAACCAGGCTATCTACCGCTTTTAACCCTGTTTGC
+ATAGGCTCGTGCACAGATTTACGTTCAATAATCCCAGGGGCTTTCACTTCGACACGTCTT
+CGCTCGTGATCGCTTAGAGCCCCTCTTCCATCAATAGGAACTCCCAACCCGTCGACCACG
+CGCCCTAGCATAGCCTTTCCCGCAGGAACATCCACAATGGATCCAGTGCGCTTGACAAGA
+TCTCCTTCTTTAATAGCGGTATCACTACCAAAGACAACAATCCCTACATTCTCATTCTCA
+AGATTCAACGCTATTCCTTTCACACCGCTGGCAAATTCAACCATTTCCCCAGCTTGAATC
+TCGTTCAATCCATAAACACGTGCAATCCCATCTCCAACTGAGACCACTCGACCGATCTCA
+TCCACTTGAAAATTCGTGTAAAAGTTGGTAATTCTACTTTCTAATAGAGTTGTTAGTTCC
+GCAGCTCTGGTAGAGAATTCCATAATTTTTTCTTTTAAAGAAAGTCAAGGGAGAATTCCG
+CTTATTGTTTTTGGCTCGAAATAAAGCTAGGGTCCTGATCGAGCAACTAGTAGTCCTATC
+TATCCACCTCTCCAGAAGGGCTATTTGGGGTCTAATTTTCTTTCTATCTGACAGGACAAA
+CAAAGAGGAAGGGGTGGTTCTTTCATTGCATTGATAGAAGTCTAACTAGAAAAAGATCTC
+TCTATTACTTTGAGAAGAGAATCGTTGGTTTGACCGACGAACTACGTGGGAAATATGAGT
+TGAGAGGACAAGAGGATTCGATCTCCACGAAAGGCTAAAGGAACATAAAAAAAGCTAGAA
+TTTGTTGCAAACAGTGACCGAGATGCCAGGGAAAAACTGTTGTTTCACATTTCCGGAAAG
+ACCACCTATTTGTTCGTTTACCAGGTTCGGTACGAAATCATAAATAAGCTCTACCCCGGG
+CCATCGCCTTATGGCCTAGGGGCGTCTATCCCGCC
+>ds2020-328_2
+CCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCTTCCC
+TACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTT
+TCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACT
+CCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTT
+CCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTT
+CCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTT
+GTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAA
+CTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCT
+TTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCT
+GGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTT
+TCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTT
+CCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACA
+TCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTC
+CTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCA
+ACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGT
+TTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATG
+TTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTC
+TCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTG
+ATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAG
+GTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCAT
+ATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATG
+CCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCAT
+CGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGG
+CAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTG
+GTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACG
+CTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTT
+CCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTA
+GTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTT
+GTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGTA
+TTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGCTAACC
+CTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAA
+TATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCC
+ACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCC
+ATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTG
+ATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCC
+GTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTT
+TCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGG
+TTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGT
+AACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCC
+GGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAG
+TGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGC
+TCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCG
+GCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCC
+CCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTG
+>ds2020-328_3
+TTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTT
+CGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTC
+CCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCC
+TTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAA
+TTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCC
+TATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCT
+TTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAAT
+TTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCC
+CTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCT
+TTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGC
+CATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTC
+AAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATAT
+TTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGG
+GTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTG
+ACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTT
+GTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGC
+TCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTAT
+GTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTAT
+TTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCT
+TGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGC
+AAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAA
+CTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGC
+ACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGT
+GCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTG
+ACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCT
+TGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATC
+TTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTT
+CTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTT
+GAGTATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGC
+TAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTT
+TAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCC
+ATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTC
+ATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTAT
+GACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTT
+TTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTT
+TAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCG
+CTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTG
+GATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCC
+CCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAG
+GGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGT
+AGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGT
+TGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTG
+AAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCAT
+AAAAAAGGG
+>ds2020-328_4
+CTGAAGTGCGGGGGCGGGATAGACGGGAAAGAGGAATAGAAAGGGGGGGGGACAGGTTGG
+TTCGAGGACTCGTTGGTCAAAGGAAAGATGGAAACAGGGGAGTTGGCTGATAAAGATGGA
+CAGTAACGATCGCGTAATATCAATTTATCGGCCTCGTCATTGAAAGCGGCTTCCAATTGC
+TCGGAAATTCTAAGCTATATGGGGGGCTTGGATGGTGAGCAAAAACAATTGATCAAGAAG
+TTGGTCAACTTTCGCATGAAAGAAGGTAAAAGAACGAGAGTTCGTGCTATTGTTTATCAA
+ACTTTTCATCGCCTAGCTCAAACCGAACGCGATGTAATCAAACTTATGGTTGACGCCGTA
+GAGAATATAAAGCCCATATGCGAAGTGGAAAAGGTAGGAGTAGCAGGTACTATTTATGAT
+GTCCCTGGGATTGTAGCCAGGGATCGTCAACAAACCTTAGCTATTCGTTGGATCCTTGAA
+GCAGCTTTCAAACGACGTATAAGCTACAGGATAAGCTTAGAGAAATGTTCATTTGCTGAG
+ATACTGGATGCTTACCGAAAGAGGGGAATTGCACGTAAGAAAAGAGAGAATCTTCATAGA
+CTGGCTTCCACCAATCGAAGTTTCGCGCATTTCAGATGGTGGTAAAGTGAGACCACATAA
+AGAGCTCTTCCTCATTCAGTCTGATTATTCAGTAAGATATGGTTTGACCCTTTTTCTTTT
+TGTTTGAATCTTCATATAGAAAGCCGGCCTTCCTCATACTCCTCCCTTCATTCATTGAGT
+TGGAGGAATCCATAGGGGCCCGCCCGTTATGCATTCCATGAAATAACCCTTCTTTGTATG
+ACTTCTCTTTTGCCTCAGGTCGAATGAATCCGAAAGGGAGATCAATCAAAAAAGAGGCCA
+TGAATGAAGAAGTAGTGGGCCTTTCACCCTCTTTCTAGTGACTCGGGGAGCTGATCTGAT
+AAATGCACTTCAAAGGGAGGGAAGCTAGGTTTCCCATGTTGGTATGGCCGGGCATAAAAG
+ATTTTGAAGTTAGGTCAAAAAGAAGAGGTAGAGAGAGAGAACAGAACGGAACCGATAGCC
+CCGAATTATGTCAGGGCAAGAGAAAGAAAAGAAAAGTAAGGACTCTCGTTTTCCGCATAC
+GCATATAGGCTGTGAAAAAGAAGTCCACTTTTCCAATAGAGAAAGAGAGTGATTCGTCTA
+CTTTGTTAATAAGGTAACGGAACGAACTTCAAGTACTTCGTAGGACGCCGCCGTTTGCTA
+AGATGTGCTTCCACATCGTGAGCTTTAGTGCACAAGTCGTCGAATCCCTTAAAGGTTTGG
+GGCAGGGGACGACAAGTCGTGCCTGAAGTTGTTCATGCACATCTTGAGGAGCTCTTGCGG
+AGTAAACTTCTGGGGACAGGCAAAAGTAGGGGCTCGCCACCTTGCAATGAACTCCGTGAC
+AGGTTCATGCTTGGTCTTGAGTTGTTCGGGCACTCCAACCCTTCTTTGTGTGTTGCTGAA
+CTGCTTCCTGAACTCCGAGACCCTTGCTTCCCAAGTCGGGATCGACTCTTCAGAGAGGTG
+GGCGTACCGTGTAAAGGCGGGCCCCTCCAATGATTGTACGAAAAGCCTAAGGCACAGTGC
+CCCATTCTGCGCTACCGGCCCACATCTTACCAGGAAATGCGCTAGATGCTGGTGCGGGTC
+TCCCCGTTCCGTCGAACTTTAGTCTGGCTGAGAGAACCCTGGCGTATACGGCACGGAATC
+TATCCAAGCCGGATAAGGTTTGGTGATCATGTGGTTATCCTCCTCCTTTTCCTTGGCCTC
+TTTTACTCTTTTCTTGACCAACTGATTCATTGTTGCGAGGAGGGTTGTCAAGCTTGTATA
+AAAAAAGACGTATAATAAATCGTTGATTGCTATTCTTGAACCTCTTCACCATGCTAATAA
+GATTCAGGAATTCTCCAACAGAATGGGTTTCCACTTTTCATTGGCAAATCAAGAGGCAGA
+TGATAAAATATGGCTCTGTTGGAATCATGAAGTGAATGTAGTGCTTGTCGACGCGTTTGA
+ACAGTGTATCACAGTCGACCTTAATTCTGATCTGGTAAGGCTTACCATTGTTTATGCAAA
+GTGCTCCATTCAGGAGAGACGGCTTCTTTGGGAAAAACTTCAATTACTGTCCTAAGACAT
+ACAAGGTCCATGGATGGTTGCGGGTGATTTTAACGCAATTTCATATGTGTCTGAAAAACT
+TGGTGGCAGACCTCCAAATCTTTATCTTTAGAGGAATTCAAATGAAAAATTCACGGACTC
+GCCATTTCTGTGAGAGATCCGATCCCAGTTGGTTTCAACTTTTTCTTCCCTCTCAATTCC
+ATCCATATCCCGCCTTCAATCTGAATGATCTGGAATTCATTTCCAATTCCTTATATCAAC
+TAATGGGGATACCGGGAGGGAGGAGAGAAAGCACCCCGCTAACTTTTTCTTTCTTCTACC
+AATGATCAGTAGATTGAGCACTAACGGAATATCGAGAAAGAAAGAGCGGAGCAACTAAAT
+CAAAAAAGTGCGTCTATCCCGACCA
+>ds2020-328_5
+GGTCGGGATAGACGAAAATCGCCTGTCAAAAAAGGAAACGAACGAACAGCTTTTGCGCGC
+GGAATAGGGAGAGACCTCTTTTTATAACGACAGCCGACCCCTTCTAGAAAGATTTTTGGG
+TAACCCCCCTGAAAATAAGGAAATGGATGTCGATTAACCCCACTTGGAGAAAAAGGGAGG
+CCAACGCAAGAGTCACCCACTCCGTGTGTGAATGGGCGAGGATAAGGCAGCCAATCAGGC
+TAAAATAAATGACGTGCACCTTATCCTTTGCCTCAAGAATGAGGTGGTTCAAATTTGCCG
+CAGCTTGTGAGCCCCCTGCTTCGTCTATCCCGACCNNNNNNNNNNGTGGAGGGAAAAAGA
+ATACAAGTGATCCTTACCTTTTTTCGCAATATAGAGAAAGAAAATGGCGCAAGCGCCCGA
+GAGGGGGAACAGCTGGTACTTTATTATTATGATAAAGTCTTGTGGGGCCAAAAAGATGCC
+TAGGGAGGCCAAGAGACTGACGACGCAAAGATAGAGAATGGCTAAATAAAGGGAGAAGGC
+CGGATGGATGCGAAGTCCCTCTTTCCAGAGAAAAAGGAAAAAGATTTGAATTAATAGGGC
+GATTCCCCCTTCGAAGGCGAAACACCGCCCTATTAATAATAATAGGAAGACCCAATCCCT
+CGGTAAGAGGAGAAGGGTTATCAACGCCGCAATGGGGTAAAGAGGGTCTGTAAGTAGAAA
+GCCGAAAAGGCTACTACTCAAAAAAGATGTAAAACTCAATTTACGTTGGAAGGGAGTCGT
+CGCCATAGTGGCGTAGAAAATACCCGAGCTTCCGCCCAGGACTTGTATTACTTGGATTAT
+TTTTTCCCATGGCAAAGGGGCCAAAAGGACCTTTATTGTATAAATAATAATTACAAAACA
+GATAATAATAATATCATCTGTATCATGGAAAAAATCCGTCAATAAATGACGAACCCCATT
+ACACAGATGATAGGACAGGGCTAAGGCTGCGATCTCGACAGAGATGGGGATTAACTTTGA
+TGAATAAAAGAGGAATTGGTAGAAATTCTCATGGTGCCCGCTATTCAGTGATGGTGAGCT
+GGTCAAGTAAGGAGAATCGGAATAATCGAGCTAATCGGTATCAGTCTTGGAGCAGGGTAG
+CGGATCAAAAAGTACCCCAAAAGAGTAGCAATAAGGTACCTATTACTCCATTCGTCAAAG
+CACGCTGAACACCGGCTCTTGATCCAGGGGTTTTTCATGTAAGTGGCTTAGAGTGAGATT
+CTTGTGACCGACCACCTCACTCCGGAATAGAGATTCTCAATAAAGTAAGAAAGAGAAAGA
+AGGAATACTAAGAGATTGAAGGCTTTTAGATTCAAGAAAGAATGCGAAGAGGACGCTAAG
+CAGGATGCAGAGAGCAAGCTTGGCTTATCCGTATCCGTCTTTTCCTCGGTTTTACTTTTT
+ATCTTTCTTAATGGAAGGCAAGGTACAGGTACTCTCAAGTGCGCGAGAGGAAAGCGAGCT
+TGATAGAAAAAGTCGCGTTTAAGCCGCTTGATATGAGTCAAAGAGCAATAAGCATTTCTT
+CTTGGTGAAGGGGCAAATTGATAAAGAAAGTTGTTTAAGCCCTTTGCTTTGAGAAAGGTA
+GGTAAGCCCCTTGATCGATCGTTTAAGGCGAGGGATCAGATCGGTGTGCCACAGAATATT
+ATTGTATTCTACCTTGGGATATTTTTTCCTGACCAATTGCCAAGCTGATTTGAACGAGAA
+ATCCCCTTCCGTAGATAACGTCCATACCACCCTGTCAGGCAAAGGTACTGGGGAAAGATC
+CAATGCCCTAATCTCCTGCCATATGTCCTCCAGAAAAAAATTTATGGCTGTAGGAAGAAC
+CCACCTCTGATTACCAATAAGGTCCGAAACGCGGTTCTGGCCTACGAGAGAAATTAACTT
+TACATACTGATATCGCATACCGAAGGGAAGGCCTAATTGCACCACTCCTCCTTATCTTCC
+GCCTGCCGTCTCCCTCCTCTTTGCTTTGCTAGCATCCTTTGATAAGCAAGTTGAATGAGC
+CTTCAAAAAGAACCCACCCATATATGTACCCCTTTAGGCTCTCCGAGCAAGCAAGTGAGT
+GAGCTAGTAAGCAAGCCAAAGATACCAATCCGCTGTTTTGGATTCCCGTAGGAGTTAGCG
+ATAGAAGTTGTGTCGTAAGTCCTGCCCCTTGGGGCAGAACCGCCAGCGATTTGCTTCCAT
+CAATGACAGCCGTCTTGTACTGATCCGCTTATCTTTTGATTGACGATCAAGTAGCTTTCG
+CCTAGTCTCATACACCCTCAGAATGGTTACTGGACAAGTTTGGTCCTTTGCTGATACAGA
+AATAGGGCAGCTCACCTGTTATAACACTTCGGCCCTAGCGTGGTCTTTCCACGGATAAAA
+CCTGTTCTGTATCAAGGACCCGGAACGAACGTCTATCCCGACC
+>ds2020-328_6
+AACACCAAGAAGTATCCATTCTTAACACAATGAAACCGCCGGCTTTTTAAAAATATTTCC
+TCTTCAATTATGCACGATTTACTGTACTGGGGTTGTCTTCCTTTCTTGGGAGTAAAGTGA
+GGAGTCAATGAAGGTTTGCTTGTGGTTTTAATTGATAGGTGTTTGCAATGGGCTTTCGTC
+TCAGGCTCAGGTAGTTCAGTCTCCGGTGAAGTAGGGTTAGATCAGTCTCAGGGTCCGAAG
+GAGATAGAGTTATGGCATTTCTAGGGTTCGAAGACGGTACTATTGATTTCATCAATACCA
+AGCGGGACTTGCTTAATGGGACATTCGAGAAGGAGCTGGACAGAGGAATTCGATCTTCAG
+CTAAAGGTACTTGAGGGTAAGGAAAGCCGTATAGTGAGTCAAGCTCAATTGTAGTTCCCT
+TTCCCCTATATGTGCGATTAGATTACCTTTCTCATTTGCTTAGTCCCGCTCCGTCTGTCC
+TTTCTTCCGTCTCTATGTCTATTTCTCAATAGGCAGTGAATGAACAACTTCTTATATAAG
+GATTTCTCGTAAGCGAAGAAACTTCTTTTCTAACTGGGTGTGTTCGTCTATCCCGACCNN
+NNNNNNNNGGTCGGGATAGACGCGTATTATGGGTGAGGGTACGACACTACAAGGCAACGA
+AGTTAAGAATAAGTTCTTCTGGTAATCAAGGAGCAGCCAAAGGAAGGTACTCTCGGGAAA
+ATCCATGTGAATAAGGAATGAGATCCGCGGAAGGGAGGAATTTAATCTTCTTCTTGAAAG
+CTGAAGGAAGTGTAAACTGTTCGAACGGCCGGTACTTAGCAACGGAAGTAGGAGGAGATC
+GAGCTAATCAGTCTATGTTGCTCCCGCTCAGGAAAGAAGACAGGGGCAAGTCGATGAAAG
+TCAGGTTTTTAACCGATTCAGGATCAACTTCGAATCCAATAGAAGGACTTCTAGGTTCAG
+ACAAGGTTGCTCTGCTTCGCAACCAGTGTTTCAAGTGCCAATCCCAAGCTCTCCAACGGC
+AGCATTCCAAGCAACCCTAACCAGCAGCAAAGCGCTTCCTCGAAGGCAAAGTAAGCACCG
+TAGATAGACATAATGTAACCAATCAAAGGTGCACCGCGTCTACCCCGACCNNNNNNNNNN
+ATGGGTTCAACTATTTCTTCTACGTACAGGATTCTATCCCTTCAAACCTGCCAGTGCTCA
+AGTCAAGTAGAAATAGGGTGGTTAGGGAGGGTCGATCCATCAACGGATCCAACAACAGAT
+CAATCCTCAAGTAATCCACGGAGAAATAAAATAGTATATGACTAAGATCTGTCTTTTGAT
+GCGGGAAAATGAGGCAAAGAAGTCAGTGCAGGCTCTTATGATTAGTAAGAGGAAGGTAAG
+TTTACGCTCTTACGACCGGAAGCGAAAGATGACTTGACCTTTAGACTTTATCAGAGGAAT
+TATTATCGCTTAGCGCTTGCGCGGAGGAAGGAAAACGAAAGCTCCGAGGAAGACAGAGTA
+ATTCGATCTTTTGGGAATGGGGGATTCAGGTAAGAGTTCATTCCGGCATAACTTGGCGCA
+AGGAATTTGCTCGTTCCGAGCGAGGTTCGACGTTAGTTGAAGTTGACATTGAGTCGCGCA
+CTTCCTGGAGTGGGGAGTGAATTCATGCGTACCTCAACGCAAGGATTGAATTAGCTCATC
+TCGAGTTACGTGAGTGAACTTTCGCTTCTTCTTACTTTGGTCGATCAGTCAACCTCCCCT
+TTATCAGTCTTAAGCGAACTCTTTCCCGACTGGCATCTTAGAATAAAGGAATATAAACTC
+TTCCAGATCCGGAATTTGCAACATCAAGAATAGAAGTAGAAGCATGCTATGCTAGCATAG
+AATAGAAGTCCCGAGTGAAAACGACTTTCCTTAGGATGAGCTTTTAGGGCACAGTAGAAA
+GAGCTTATTCGTCGATAACAAGCCTTTCTTCATATCATAAAGGAATAGAACCGGAAAGCT
+TTGATGCGAGAAAAGTAAGTCCATCCGCACTAGGTCCACGGATGAGTTCGACTACTAGGT
+CCACGGCNNNNNNNNNNACCCAATGCAAGACAGAGGGATCCTATAATAAGACTGACTCCT
+TCTATTCTCTTCACTTACACCTTACACTTCCGCTGAGTCTAACGAGGCTCAGGTGCGGAG
+CCTTCCACTGTGGACCGAGACTACACAAAGGTAGAACACTATAGAAACTTCGCTGACTTT
+ATCATAAACCTCGATTTCGCTACGCTCAATAAGAACCCGGAATAGCGGAAATAGGTTCGT
+GTTCCGCTTCCAAAGTAAGTCGTCTTTGCCCAAGTGTGAACCGCAGGCGAC
+>ds2020-328_7
+GGTCGGGATAGACGTCACCACATCCTCCTTAAAGGGGCATCCTCACCTTACGGTGAGGGC
+ATCTACAAATTTGTAGGCAATAAAAAGTGTCATCCATTCAGGATACAATGGGCATTTTTA
+TCTTAACTTTTAACGCACGCAGTGCAAGTTAACCAAAAGGATTTAACATTCAGTGACAAA
+ATCTGAATGGTGGATTCTATTGCAAAAGCAGCATCTCCAGCTACGAATATTCCTAGGAAT
+ACTCATAGTGGAGGTACAATCAAACAACGGATCATATAGTCATCCACTGACTATTTTATC
+CATTGCATCCATGAGAGCGGTATCCCGTTCAGCGTATAACACTGAATCAGGGATCTCGAC
+TCTCTTGGGCATCGAGTGTTGTAGGTACTGAGTACAGAACCATACCGGAACGCCGGGCTG
+AAAAGCATTGTCATATTTTATGACAAACCAGAGATCATCTGGTATATCCCCGACGGTCAT
+ACCAGTAGGAGCAAGAATTTGCACCCCACTGGCTTGTTTCGCTGTGAACTTCCTACGTTG
+TAGGGGATTAGGCGCCACTGGCGCATTCACATCGAAACCTTTAATGAGTCCGTAGACACC
+ATTAGAAACATCAAGGCAGTAACGAAAAACAATTCCGTATACCTTGGTATCAGCAGAAAA
+GTCCTTGAAAAGTTCTCGGACTTTCATGGTGTAGTAAACACCGGAAGCGGTCGAATTGAC
+CGTCAAATTCTCGGTACGAGATATCATACCGGAAAAATTTTTTACGGGCACATTTGGCCC
+GTGAAGCATCCACTCGGAAACAGACTTCGAGCTTCCACCCGGGAATTGTTTCTTAACAAA
+ACCAGCAGGGGGGGTAGTATTATTATTCTTCCGAGCTAAAGCAAAGCTTTGTGATCGGGT
+AGTAGGCTTTCCAGATTTAGTGGCTTTCCCAGACATTATGAGAGTATAAACAAACGAGAA
+TTGGAAGAAATTGGTAAACAAAACGAGCTATTAACTCACAAAGTGAGTTAACCAATCGTT
+ACACCAAAAGCTTCCTTGTCGGACTTCTCTTTTTTTAGAGGAACAGACTCGGCTTCCTTG
+AAACTGTCAAGGGAAGATTTACCCTTTACGGGTACAGCAATATTCTTAAAATCCACTGTT
+AAAGCCTTCTTTGACTCGTCAGACTTAATTTCAATAAGTCTGGGATTGATATCAACCTTT
+CCACTACTCCCAATTACCAAACGTGATTTGGCGAATGTTTGGAGTATCTTTACATTGTCC
+ACAGCAGCAAGGGCTTCCGATTTCTCAATCGGGAATCTCAAAGTTGGGTACATTTTCTCA
+TATGGTTTCTTCTTGTGCAATGAGTCATCCCAGAAGGGGTAAACAGTTCCAACAATCGAC
+GCGTGTTTAGCGTCTACACTTACAGCTGATGCTAGTAAACATATACCATCTCCGTCATCA
+GCATGAACTGCTCTTGGCCATCTCGCTACGAAAATAGCCGCTTCATTCAATGGTGAATCT
+GTATCTATATCAATAGATTCACCTGTATTCACATTGAAAAGTTTCAATGTCAATACCCCA
+CTAGTTGTTTCCAGAATGGTCGGAATGTACAACAAGTAAATTATACTATGATGCACGTAC
+ACATGACCTTTTGCTTTAGCGGATAATCTTGCCAAAGCGCTTCGGGATTCTTTGGATTGC
+AACTTCATGGGTTGAATTGGAACACCATTCTTCAACTGTAAAGAAAAACATTTCTTAGTT
+GGAAGATTCTTCATCATAGTTTGGGAATAAAAGTCATCCACTTCGCTGAGTATTGTATTC
+CAATCTTCAGCGGAAACTTCAAATGCCGAACTGGTACTGGCTTCGGACGTCTGTCCGGTA
+ATGGTCCTGGATACACCAGAGAAAGCCATATTCAATTCAGGAGATAAATCTACAACCGAA
+TTGTTTCACTCAATAAAATAAAGAGGTTAATGAATAGGAACAAGTCCGATTAGTGAGATA
+AATCTCAAACGTCACAAACTTGTCTTCTTCACACTTTGCAAGAAACCTTGCAGTAACTCA
+ATTTCTTGAGGGTTTATAGAGAACCGCACGTCTGTCAACTTCCACAGCTTAGCACAACCA
+CGCGTCTATCCCGCCC
+>ds2020-328_8
+GGGCGGGATAGACGCTAAGACGTCATGGAGATCTTGGTCTAGATCCGGTGGTTCGCAGAA
+TTCGGGACCTAACGATGTTCGGTTCGTCACATGAACGGGAGCGGACGATTCCCTCGTCTC
+TCCCTTTTCGGGGAATGGCTGCAATCACAAGCAAGTTATTGAATGGGTGGGGGGCTCCGA
+AAGCACATGCGGGATAAGCAGGTGTTTCAGGAGACGGTCTAAAAATGGGCCCGGTCTAGA
+ATAGAAAGAAAAGAGAACTCTCAACAAGCTGAAACTAATCAAGATCAATAGGAAGGCTAG
+TAATTTATTGACAAAGTTCATGCGACGACGATCTATATGGAAGGGCTGTTTTGTTGATGC
+ATTCCTGTTGAGAAAGTGTTTTTTTTATTCTCCAACTCCGGATGAGTTTGAGGCCTCCGG
+CGCCTTTTTTGAAGACTTTTTGTTGCGCCCCTATCTCTAAAGGGCGAGGGTGGCGGCCTT
+GATTTGGTGCCCCTCCAAGATCCCCCCGGTAAACTCGGGCTCGGGGGGCCTTTGCCTTCA
+TTTCTTGAAGAGCACGAGGTCACCTCTTCATCAATAGAAAGGAACGTCAGAAAAAAATGT
+TGTGAACTCCCCCCGGAATCCAAGAAAAAATAGCGGTAAGTCATGAGAGGGCGGCTTTCT
+TGTGGTAGTAATTTCGAACTAATTATATTTTTGGAGGATTCGTCCCCTATTCCTGCGGCT
+GAGAAGCCTCAAGCTCCGCCACCCTTACTCTCTCTCTATAAAAAAGCCCTTTCCCCTTAG
+TGCAAGTACTAAGTAAGCAAGCTACCTCTCCCTACCTTTGGTCGAGCAAGTAAACTACCT
+TTTCATAATAATAAGGCAAGCTCCAGAACCGGCGGAATTGCCCAATCCTATCTTTCCTTG
+AAGTAAGTCCGGAGCGGGAGCAACTTCTACAGCTAATTCAGACTAAACTCGATCACTTGG
+CAGGGGGGTCTTTTTGAGCGCATGTTTCTCATATCGATAAAGCAGGTTTCGTCTCATTTT
+CCGGAAAGCCTGTCATACTATTCCACTTTAGCTAAGCTAATGATGAAACAGGATCTGGAT
+TTGTCTGCAGATGATGATGTCCACTCCTGGCTCGAAGCGCTTAACGAAAGGGAACTCTCT
+AGATTAAGAAAGAATTTCCTTCATAATTAAGCAGCATCCTTTAAGTGAGTAGGGGTGCGC
+CGGACCGCCGACGAATAATAGGTACCCCACCTATCGTTGTGAAATAAGAGCACTCGATCG
+AAGACAATGTCAATTGGCCAAGCCATAAGCAAAGCAAGGAAGAGGCATCCAGTCCAATCT
+GCTCTTAATGTTCGAGTAGCCGGTGCCGCTTTTTATGGTCTTTTCCACGTAACCGCAGTT
+GGTTTTATATCCATTGTTCAAATAGCCGTAAGCGGTGGTTCAGGAAATGTTTTAGAATCG
+GTTGTTACAGAATACGCTGTGGGACGTCGAGGAAGAGCAGTGGGCCCCAGGTGCGGAGGT
+CTCGTTTGCAAGTGGAATCCGAAGGGGTTGTGCACAGTTAAGAAGAAGAAGTTGTTTTCA
+ATTTCATAAGACCTATGAAGGTACGAATGGGATTGAAGGACAGATGATCTTCCTTTTCTA
+AAGATAAAGAATCCCTGATCTGACTCAATAGGAACTACACTGAAACCTTTTCTGGTATGG
+TGGAGCTGAGACCACAGGTAATCGTCTTTTGATGCTTAAATTTAAATATAGGGAGTTTCA
+GAGAGAAGAGAGAGAGGGAGGGGAAGGTCAAAAGAGTCTACCTCGATTTACGGTTAATGC
+AAAACTGAGTTAGAATTCGGTCTCTTAAGACAGAAATCCCCTTAAACTGTCTCAGATAGC
+CCGATTTTTTCTTGGAGGACCTCTTTTTGTTATTTATTATGATTACTTT
+>ds2020-328_9
+GGTCGGGATAGACGCTGGGTGGGTTTGTTTATCCTTCCAGTTTCGAGTGTCTTCTCGGAT
+AGTTATAGCGGCCCATAGGCGCAAGATGTACCTTGTGGGGGGGCGGCGGTCCCCTGGACA
+TAGTCCTTTCAGGCAGTGGCCGTTTAGTCCATGGTCCATTGGATGGTCGGTGCAAGGCCA
+GAAATTGGAACACATTGATTCCGCTCGTTCCCGTCCTTCGCTTCAGGGCCTGCCCCTCGG
+TTTGGTCAGTACTCCATACTGTCGGGCAGCGAAGCTTACACTTGTTCACTAATTATGACG
+GTTCGCCAGGGCCTCTTTCCTCCTCCCTTTTCTGCTCACTCGTAGGGGTCCGGACCCCCA
+CAAAGGGGAAGGGAGTCGACTGAACATCTCAGCCATTGGCGGGAATTTCGCCCGCATCCG
+ATCCCCAATTCTTGTTCACCCCGGATGATCGTGTTGGGTGAATTGTGACCTCGTACGATC
+GTGTCGGGTGAGCAACAGCCGCTTCGTCACAGTACTTACTTATGGGCTAACGGGTCACAC
+TTTGGCCAAGTATCCTACAAAGAGACTCCCGAGAGCCAGAAGTATTGAAGGAATGGCCAT
+AGGAATGGGCGCATCATGACATCGTAAGATGTCTCGCCCGAATGAATTAGTTGGTACTAG
+AAATGTTAAAAAAAGTAAACGAAAAGAGTAATAAGAAGTGAAAAGGACAGAGACACTTCC
+CAACCAGAAAGCAAAGTTCCCACTGATGGTATACTTAGTGTAAGCGAGCTCTAAGATCAC
+ATCTTTGGAATAAAATCCAGTTAGAAAAGGAAATCCTATTAGAGATAAGCTGCCCATGAG
+CATCATGGCATAGGTAAAAGGGAACGAGGAGGCAAGCCCCCCCATCTTCCGCATATCTTG
+CTCATCCGACATGGCATGAATCACCGAACCTGCACTCAGGAATAGTAATGCTTTGAAAAA
+CGCGTGATTCATTAAGTGAAAGACGCTAACCGAATAGTTAGAGATGCCGCAAGCAAAGAT
+CATATAGCCTAATTGACTGCAAGTTGAATAAGCTATGACCCTCTTTAGATCGTTCTGTAA
+TATTCCAGTGGTTGCCGCTAGGAATGACGTCGTAGCTCCTGCAGAAGTAATAACAATCAA
+AGCCGTAGGTGGGTATTCAAATAAAGGGGAGCACCTTGCTATCATGAAAACGCCAGCTGT
+TACCATAGTAGCTGCATGAATCGAAGCGGATACTGGAGTGGGACCCTCCATAGCATCGGG
+TGACCAAGTATGCAATCCTATCTGTGCCGATTTCCCAACAGCACCAATAAAAAGTAAAAT
+ACAAATAAGAGTTATGGCATTAAATCTCATATTGCAAGAAATCCAAGAATTTCTGGGGGC
+ACTAGCACGAGCAAAAATGGTTGAAAAGTCTACTGTTTGAAAGAGAGTAAAACGGCCCGA
+AATCCCAGGAGCTAATCCAAAATCACCTACGCCCGTCTATCCCGACC
+>ds2020-328_10
+GGTCGGGATAGACGTCTTCTCTTCGTCTACCGCAAATAGAATAGCCTCGCCCGGGAAATT
+AGTCCCCTTACTAAAAAAATCAAGCTTATAGTCAGGCACGGGATGGGATGATCCGCAGGT
+GGTCTGCTATTGCCTGCCTCTTGCCTTTCTCATTTAGGGCTTCCGGGTGACGTACACAAT
+ATAGAACTCTGAGAGTAACATCTGCCACCTTGCTGTACGGCCCGTGAGGGCTGGCTTTTC
+AAAGAGATACTTCAGCGGGTCCACCCTTGCAATCAGCATGGTCGTATAGTTCAACATGTA
+GTGGCGTAGGCGTTGCGAGGCCCGTGTAAGAGCACAACAGGTCTTTTCTAGAACCGTATA
+CCTTGTCTCATAATCAGTGAACTTCTTGCTGAGATAGTATACGGCTCTTTCCTTCCTACC
+CGTTTCATCGTGCTGACCAAGGACACAACTCATGGATGCTTCCATTACTGACAGATACAT
+CAGGAGAGGTCGACAGGCGTTGGCGGTGCCTGGATGGGAGGATTGAGTAGATATTTCTTA
+ACTTTGTCAAACGCCTTTTGGCAATCCTCGTTCCTTGTGTCTATCTTTTCTGAAAGGCGG
+GGTATTCTTTCTGAGCAGTTTAAAGATCGGCTCACAGATGGGTGTGAGCTGGGCAATGAA
+CCTGCTGATGTATTGTAGCCTGCCCCAAAAAGCCCTGATTTCTTTCTCTGTCTTTGGTAC
+CGGCATGTCGATAATTGCTTTGCCTTTTGCAGGTCGACTTCGATTTCTCTTTTGCTGACA
+ATGAACCCGAGTAGCTTACCTGACAAAGCACCAAACCCCCCTCCCGGCTTTCTTTTTCGG
+ATGAAGACGAAGACTGTATTTCCGAAATCTGTCAAACACTTTCTTCAAATTCACCGTCTT
+CTTAAGCCCAAGACTTGGCGATCATGTCATCGACATAGACCTCCATTTCCTTGTGAATCA
+TATCATGAAACAGCGCAGTCATGGCTCGCTGGTACGTCGCCCCGGTATTCTTTAGACCAA
+ACGGCATCACCTTGTAACAGAACGTGCCCTCCTATCCGATATTGTGATAAACGCTCTGTC
+TTCCTCGGCCATCTTGATCTGGTTATATCAAGAGAAAGCATCCATAAAGGACAGCATCCC
+ATGTCCAGCGGTGTTGTCCACCAGAACATCGATGTGAGGAAGAGGAAAAAAAGATTTTCG
+GCTTGCCTTGTTTAGGGTCTTTTGACTCACGGAACCAGCTTTCTGAGGGAAAAACCGTTC
+TCGAAAAGCGTGACCATCCAGTTGAATCTCGTTACCCTCCCGTGTGGTTATGGGGGCGCG
+CCCACTTTCCACTATTATGGAGCCGGGCCGCAAGCAAGTGAATGTGACCCCGCCCTCCAT
+CAGCCGTTGTGTGTGAGCTTCGCTCCTTATAACTCTCCACCGTCTATCCCGACC
+>ds2020-328_11
+GGTCGGGATAGACGTTGTGGTCTGATTGTTTTTGTCTGGGTTGGGAAGCTCCCCCTTGTT
+AAAAGAGTCCTCTATCTGCACACTAACCTGGGAGACTTTCACCCTGTTTTTCTGCTTCTA
+AGCCGCTTTGAATTGGCCTGTGCCCGTTGATGAATCATCAATCCATTCAGCCGTCACGTC
+AGCCGAGAAGACGGACTTGCTGGTATCGTCAAATAGAGTATAGAAGGCTTCTTCCGCTCT
+AGTGGCGGGTTTATCTTTTCATTAAGTAGCCCCTCACCTCGTACACTGAGTCAAGCGACT
+TCTCCTTTTCTGTCATGAAGAGGAAGTGAGATGATGACAATGCGGCTGGGAAAAATCCAT
+ATCAATCCATTTCTTCTATATATAAGAGAATTGGATCCCGACCCAGACCTAATAAATTTA
+ATTATATGCTGATTTCATTCCACTAGTACCCGTAGCTTCTTTTGTTGGGTTGGTTGGAGT
+GCTTTAATCAAACACTTGACCGAGTAGATCATGTTGGGATCTTCACCATGAATGATCCTC
+CGGGCGAACATCTCATGGCACACCATTGATCAATAAGACAGGATAAATAGAATATACGGG
+GATAACCCCCATTCCTATCAGCGTGAAATGAAATTCATTCAATCAGTCCTCTCCTCCGCT
+CTCTCTGTCCCTGGCTTCTACTTTAACATACATACCTTCTGGCCTCAGTCGTTGACTTTG
+ACCCTTCCGCTCCTCCATTTAACAAGCAATTTCATTTAGTGGTTGTTCGCTCCTGAACGA
+AGCTATTGGGACAGCGGCTTTGATAGCGCTTTCTCAATGAGATAAATCATATCGTGGTAG
+AGCTCCTATCTGTGCTTTGACAAATCCCTCTCTGGCGTCATCTACTGGCTGACTGCACAC
+TGCCTTCTGCCTGACTATGGCTTTTATTAGAAAGCAAGATCCCTCCGTTTATCACTCTAT
+AGAAAGAACATCCCATACAGAGTCTTTCAACTAAGCTATTCGAGCCTTCACCTAAGCTCT
+CATCGATAGACCCCCTTTCTTTTTGGTTGTAGTCAGACACCTAACCGTTCAACCTCGTAG
+GCATCTTTCTATTAACCAAATCTGATACCGTCAGGTACGGAATGAAATAAAAGGACTTCT
+TCGGCCCCTGCGCCTAGTGGTGCTTTCGGCTTGAAAAACCACGTGAGTGCTCTTATTGGA
+CCAGAGCTTTGGCTACTCCCTGTTGTCTTTGAAAGAAATTTACTGAAACCTGATGCGCAG
+AACCCTTCGTACAAAAATGAAAGATCAATCTCAGGCCCAATTGACTCATCTTAGAAAGGA
+TTTGATGAGCCAGTAAGCTGAGCTATCAATGCCCAACTATCGTCTATCCCGACC
+>ds2020-328_12
+ACCGGCGTCATTTCCATCACTTGATCCGGTTTCTTAGGAAAAGCCATAGTTATGCTGCCG
+AAGTCAGCCATCGTTTGCGGAGATCCTCCTGGGTGTACCAACGCTGAGCTTACGCTTTCT
+CTCCCCACTTCGGTAGCTCGCTGCATCGCCATCTCCCTGTTGGCCATAACAGTCCTTATG
+CTGCTTCCTGACTTCTCCTGAGACATTTCTTCGCCTTCGTCTTCTTCATCGCTTGCATCT
+TCTACCAACACTCGTTCCATTTCTCTTGGCTCCGTATGCTTCTTATCTCCATCTTCAACT
+TTCGTCTTCTGGGCTTCGTTCTCCTGCTTTTCTTCCACTTGCTTCCCTTCTCTAGACTTG
+TCGCGCTTCTCGCCCTCTTCTTCAAGGCTCGGGTTTTCTTCTGCTGCGTCTCGATTCCTT
+TCCCCTGCTGTTTTCCTGTCTACATCGCTTTCGCGGCTTTCATCTCTTACGTCATCTTTA
+TCCTTCACCACTTCAGCATATGTGGGTTTGCTTGATTCGACACTTCTATTCGTTCCAGAA
+TCCCTCGACTGCTCTTTGGGCTCTCCGTCGTTTCCTTCGCATGTCGGCTCATTCTCTTCC
+GCGCCCATCTCACTCACCGCTTCATTTTCCACTAATCTAAGCGATGCTTTCTCACGCCTT
+CCTTTAGCCTCTGGCATGCGAGGGTGCTCCTCGGCGTTTTTGAATTTTCTAAACTTATTC
+AACACTCTTTTCCCAGCCAGCTTGGCTCTATCTGCGACCTTCTGGCATTTAATTTCAAAA
+TCAGCAGTCATTTTCTCATCGGCCTTTACTTTATCTCCTACAGAAGATAGCTCCTCGACC
+ATCGCTTCTGCGGTTTTGAAAGAAATATCTCCGACGTTAGCGCTCTCCAGAAGCTTCGTC
+ATGCAATTCATTGACATCTTCGTTACAAATGCGCTATCTTCATCTTCTGTACTCCATAAA
+TTAGATGAATTACGGCGGTCGGGATAGACGAAAGCGGGCCATCGCATTAGTGTCCGTTAT
+ATTCGCTAAACCTGCTTCAGTTATGAACTTACCTATGTGCGCTTCACACACATCATCTAC
+TAGAGCCATCCTCTCCGTCAAATCTCTGAGTGACGTCATCCCGAGGAGCATGATTAAAGC
+TTCCTCTTCCGGCACTCCAAAAGCCGCCGCCATCACCATCGTCTTGACGTCTTCTTCTTC
+CCATACTATATCTCTGGTTAGATTATACATCAGCCAACCCGAAGGGAAGATCCGCCTCGA
+TCTGAACCTACCTCCTCTCATCCCGTTCAAAGCCGACATCAGAGGCATGAACGCGTAAGT
+AACGTCCATCGGCTCCCCTTCCGTTTTCAGCATCTCGTGACGTCTATCCCGACC
+>ds2020-328_13
+GGTCGGGATAGACGACACTTTGCCATGGTTGTTGTGAAAGAAGAAACTCTTGGAGGAAAT
+GCCTTCTTAGCAATTGAATCAACTCCTGGTGATGAAGAAGAAGAAGGAGCTGTGAGGAAG
+GGAATGATTGCACTAGTCCCACACCCACGGACAGAAGGAATAGAATACGCTCTTTGAAGG
+ACGTTAATCAATAGGAGAAGATAGCCACGCACAGAAGTAGCNNNNNNNNNNATCGTAAAC
+GCTCTTCTTCCAATAGGAGTGATTCTTTGCCTTGACGCTGTGAGAGCTTCCGGTCCTTGA
+GTATGAGTACTCCTATCCGCTCTTGGGTTCATAACCGGTCCTATTGAATACGGTCTTCTC
+GGCTTTCCCTTTCCTCCTTGGCTTTGACTCTTTCGATCTCTGGTCTGCCTGTCTGTAACC
+AATGCCTGGATGACTGTCTTGGCTTTCTGTCTCGACTCTCTTCCTTCCTGGTGAAGACTG
+TGGTAGTGGTATCGGTTCTTTGCTTGGTTGATTGAATATCTCTTTCCTTGCCTACCTTAG
+TCTTAATCCGCCTTTAGGGAGTGAAGTGAACCGGGGGTGATCTAATAAGTTGTGAAAGAA
+TCGGTTTAGAACGTATCCGCTGTTTTAGCCATATCCGCTGCGCTCGTCCTTTCTTCCTAG
+ATGCTTTGAATATCCCCGCCATATTCAACAATTTTGCTTTCCAACCGGAGAGTCTTCCTT
+GCACTTTCTCTAAAAAATCTGCATAAGTTCTCCGAGAAACCCTTTCATGAATTAGTGGCA
+CGCCAAGATACTTCCCCGAGTTCTTTGTGACAGGCATCCCTACAATTCACTTTATTTAAC
+ACATCTCGAGAGGTATTCGGAGACACAAATACCTGGGAGTCTTTGGGCATCTCACAGTAA
+TGCAACGATCAAATCTTAATAAGATGTTGACCCGTTTTTCTTTTCTTTGCTGATTCCTCT
+CAATGAAATTTGCCATGTTGCACTAAGTTACTTACGGATGTATGCATGCAATCCGGGAAC
+ACTTTGGGGTGAACACCCATCCGAACAAGTAGGGTCAATAGTTCAGCATTTAGGCCGTAA
+CATTTAGCAAAAAAAATCTTTAACCCAACAAGTGCTCTCCGAACCAAGCTAGATAGTCTC
+CTATCACTAGGCTCACCAACCAACCTGGACTTTGATTTTTATTATTCCTACCGGATACCA
+AAACCATAAGGATTGTTTCCAGCCATGAGTTCCCATATGACATGACATAAGCGCTCTTGG
+GTGGGCTGGGCCATTCCATCAAATCTTTGAGAAGGGGCCCTTGCGTCTATCCCGACC
+>ds2020-328_14
+AACCGAATTACGGCGGTCGGGATAGACGGCGCCCCACCATCTGTTCTCAACGTTTGTAAG
+AGCAACCACTTAAGTGACTCCCTCTTTAAAGCCTAGTCCGTCAGCGACTTACTCCCTCAA
+TAGAGCCTAGTCCGTCAGCGACTTACTCCCTTCGAAGACTGCACCATTTCGGTCTTGAGC
+TCCCACCAGTTTTCTCCCCGAACAAGGTCCCGCACCTTTTGTCCAACATCGTCACCAACT
+CCCTTGCGCATATGCGCTTTTGCCACACCTCATGGCATTTGTGGGTCTCCCCCACTTATC
+TCGTCGACGCACCCTCACGTCAACGTGCCTCTGAAGCTGAGCTCTCTAACACTTTCGGCC
+TTCACAATTCACCAAGGTTCAATGCCATCCCTACTACGAGTAGAACATACTTCCGTAGCA
+TCCCCAAGGGAACAAGCACGACATCCTCCCCCAAGTTACTTCCTCTTTGGCCTTCCACCA
+AGTGCGGACTTAACACGTCCTCAGCCCCCATCTCACACAAAAGACTCCGGGATCAACCTT
+TGGAACACTCCCGCATTCCGCATTTTAGCTAGCAACCTTGTGTCAAACATTGTACTCCAC
+CCACACATTCTCCACAATTGCAAGAGCAACCACTTGAGTGACTCCTTCATTGAAGCCTAG
+TCCGTCAGCAACTTACTCCCTCAATGGAGCCAAGTTCGTCGGCGACTTACTCCCTGTCGA
+AGACTGCACTAATTCGGTCTTCAGCCCCCACAACTCTTCCCTGAACAAGGGTCTTGCACC
+ATCTGCTCAACTTGTTGCCAACAGAGTTTTTCTCAACCTTCACGGCATGCCACGGTTCGA
+GTGCTAGTTCATCTTCAACACTCTCACCAAACTCGCGCTCCCATTCTCCCCACATCCTGA
+ACTAAACAAGCAACATCACTTCGTCGCAAGTCAGAACCCCTGCCTACCCGACTTCCGGGC
+GCTTGGTGCACGGACTAGAAAACTAGGCAACCGAGCAGCACAACCAGCCATCATCCCACA
+TCTTAGAGTCATCCTGCTTGATGTCTTCACAAAACTTCAAGGCAAACTTTTGGCTACCTT
+CACCCTTCCATAGGATCCAGCACCAAGACGGGTTTCCATCAACCGTCACAACCTGATTCC
+AACTATCATCCACAGTGACGTTGGGTTCTTCAACCAACTTTGCAAATCCATTACCCAACA
+CCGTCAACCTGACCGTCTATCCCGACC
+>ds2020-328_15
+GGTCGGGATAGACGAAACTTCGGGCTGGTAAGGTCGGGACCGTGGTCGTCCGTCTCCGGT
+TTGCCGGCCGATAAGATCTCTGAGATTGACCAGCCAGCTGGGTTGGTTTGGCTATTCCTT
+TCTATTGAAAAGGAGTCAGCTGTCTGCGCGAGTCACCTTCTTCTAGGCTCCGCTGGACGA
+CACGGCATTCTCGTTTAAATATAGGCCGGCCGTACTTGTGATGGTTCCCAAGGATCCAAT
+ATGACCACTTAGGTCTACGTTGCCACGATATTGTTCTATGGAAGCGGGCGGGCTGTTAGT
+TAGAAGTTCGGCCCGGTTTTTTTGGTGTCGTAGGGAAGGGATTGACCTTTCTAACGCATA
+TTCAGTCGTACCGGCATGGCCCCACTGATTTGTTTTCGATCGGAGCATCAAGCAACGCAA
+CCCGGTTCTACTTGACTAAGCCCCGTGCTCGTCCAAGGAGGGAGTTTGCTTTACCCAACT
+CCCTTTTTGATAACAAGGCAGAAACCCCCGACCCGACATTCATTAGTTTCAAATGAAGAA
+TGAAGAGTACCCTGCCCCAGAAAGCACCAAATTACGTCTATCCCGACCNNNNNNNNNNGG
+TCGGGATAGACGAATGCGCCTACTCCTATAAAAAAAAAGCGTGACTTTACTAAACAAGCA
+AGAAAAGCCCTTTCTATGTTATTAGTAAAGCGCTAACGAGCAAGAAAACGGATGCGCGTT
+AGCGCAACGGCTTTCGCGCAGCTCAATCCCTTGCTTTGTTCTATAGTTAGGGGCCTTTTC
+AATAAGGCTCGCGTAGGGGCGCTCACGTTTTTTGGCTTCCCTAAAATCTAATTTTAAGTT
+GGTAAAGACCCACCCCTTGTTTCAGTCAGAATGAGTCCCCGGGACCCCGGGACATTGGCT
+TCCGCCAACAGTGGACTATTAAGGATCGCATCCCGCGCATATTCTACATTATAGCCTGCA
+ACTGATTCAGCTTCCGCTTCTGGGAGATCAAACGGAGCTCGATTAGTTTCTGCTAGACGA
+GAAATGAAGAACATAACCAATACAGGGAACAGGGGAATACCGGACCATATCTGCTTTTGC
+GCCATGACAATCTCACTCCAAATGCCCGTCTATCCCGACC
+>ds2020-328_16
+CTACCCGGTTATTTTACCAGACATAGCGGGTTAGTATCCGTAAGCTATAACTCCCGCCCG
+TTGCCAGAGGCCGTTTAGTCCGGTAGACCTTTTAAAGTTGTTTTCTCTGTGTTTTTGTTT
+TTTTTAAAAAATAAACCTCACATACAGCAACTGGTTGCCAGCCGATGTCACTCGGCCGAC
+TACATCCCGTCCCTGTCCAAGGTTTTTAATACTGTGTTTTTGAAATTTGTAGTTTTAAAG
+ACGTTGTTAGGAAGTTGAGGGCTAAGCGCTACTACCTTCCACACTACGTCACGTCCCCCG
+ACTTGCTCTTAACAAGTCAAGCCGACGGACAGTAATCCGTCAACCGTTTAGTGATTCCAA
+TCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCATCATTTTCACACGTAA
+TAGTTGTATCACTAGGGGATATCCATATGGTAAGCGTACCGTCAGTCGAGGTATAGATTG
+TTTCTCCTTCGCAGTCAGGCGTGTATGTGAAGGCCTTGTTACAGAACGTTGAAAACGTGT
+CTGCGCCTGCATAACCGCCTGCCGCGACTATAGCATATGTAACTATGTGACAGTCTACGT
+TGTTCTGATTACACGCCAAGTTGTCTACGATATAAGTTGCGGCGCCAGATGACCCTGCGA
+TGATCGAAGCTACACTCGGGCAAACGAAGGCGGCTAGTCTGCTCTGTGATCCTAATCCGA
+TAGTAAGACCGTTTCCCAGAGACCGGCAGCTATTGGTATCACGCTTACTGTGAGGCGCGG
+TATCAGTCGGGTCAGTACCCATGAGCATGTTGTGGACGTATTTGTGCTCCTCCTCATTAC
+TCGTGTCCACAATTATCACCTGTCTGCTCGTGTTGTTGAGGTCGGGCACCATCCACCTCA
+TCTCCCACATTGAATCGCTGCCCTTCGTCAGTGCGCCAGCGCTGTCTACGTATAAAAAAG
+CCCTGGCGCCCATTAGTCCGAGTGACCAGGCCAGCAGGAACAGCCCCATGTTGAACATTG
+TTATCTCAGACGTGTATCACTCAATGGTAGTGGCGGCCGTTGCTGTGGATTATCCCGACC
+AAGGCGCACTCCGTCTATCCCGACC
+>ds2020-328_17
+GGTCGGGATAGACGGCTTCGAACCTTCTACCGGCGATACGCTCCTGGCCTTAATTGGCCG
+GGTCGTGCCTCCGGTGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCT
+CTGGATACATTAGCATGGGATAACATCATAGGATTTCGGTCCTATTCTGTTGGCCTTCGG
+GATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGA
+AATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATT
+AATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCTAGTCTCAACCATA
+AACGATGCCGACCAGGGATCGGCGGATGTTACTTTTAGGACTCCGCCGGCACCTTATGAG
+AAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATT
+GACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAAC
+TTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGG
+TGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAACGA
+ACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGATCCCTCCGCGGCCAGCTTCTTAGA
+GGGACTATGGCCGCTTAGGCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTA
+GATGTTCTGGGCCGCACGCGCGCTACACTGAGGTATTCAACGCGTCTATCCCGACCCCCA
+ACGAAATCGTCTATCCCACCNNNNNNNNNNGGTCGGGATAGACGCTAGCGCCTGCTATAT
+TCAACGAGTCTATAGCCTTGGCCGACAGGCCCGGTTAATCTTTGAAATTTCATCGTGATG
+GGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATC
+AGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCAGCTCGCGTCTATCCCGAC
+CGCCGTAATTCAGATCGGAAG
+>ds2020-328_18
+GGTCGGGATAGACGATGACCCTCACTGCAGGACCGTAGAGTGTCCATCGGCTAGACCTAC
+TGAGCGGTAATTTTGCATAAACAATTGCAAACAGCCCGTCAGTGACTACACTTAGGGATA
+AGTGAAGTGATTTTGAATTAGAGCTACGTTAATTCCATCATTTGTAATATAAATACTAGG
+AAGGCACAATCCTAAATAAAGAAATGAAACTAATAAAACATCAAATTAGTTTCATAATTT
+TAGCGGTCTCTTCAGTGTGCAGTGTGTTGTGCGAACAAACATGTGATGCAGGCTGCAACC
+AAGCATACCAAAACTGCTTAATAACACGCGAAAGGTGTCAACAAGCGTGCAACCCTAACA
+GAATATACTGTGGGAATAACGCACCCGGCACATCGCAGACCTGTGATAATTTAATAGCCT
+GCGAAAACGGCTGTAGCCCTTGTGAAGAGATTTATAGGTCATGTGCTAATGGATGTGACA
+TTTGTGAAGGCAGCGCGGAAATGAAAAAACGTAGTCTTAACTATGACGTGTGCTACACAT
+ACACAAACTGTAAAGTAGTTAAAGTTGCGTGCAATCAAAAATGTAACGGCAACCAACAAG
+CACTTCAAGTGTGCAAGCAGTGCGTTAGCAGATGCCTAATAGCAGAAAAGTGTCGGGACT
+GTGTTTCAAAACAAATCCTTGGGTCCGACCCCGACCCAAAACAGACATGCATAACAGCAA
+AGCAGTGCAGTAAGGCAGTAATAGCAGCCGCAGGTATATAGGCACCAGGGGCAGCTATAC
+ACGAAAGAAGAAACTATGCGGCGACGGCTATAAACTCAGATCTTAGGAGATGAAATAAAG
+AACAGGCGTTCTAACCGTGAAACGAGTAGGACAATCCAGAAATGCAATAGGGGCAACGTT
+AGACTTAAATCTTCGGAAATAGGGTAATGGCGATACAAGCGCTCCACCGTGAAAATCGGG
+AATCCACTAAAAAACATGCAAGGGGACTATACGTCTATCCCGACC
+>ds2020-328_19
+GGTCGGGATAGACGAAGGTTCCGGGTGTCTTCCAGTGGTCTTCTAGCGTTAGAAGAAGTC
+GTGTCCGTCCCGGACATCTGCAATGTCCTCCCACGCTTTTTTTTAATATAGGACAAACTG
+AAGGAAAAGACTGACCCATTCGGTTACTTTCGCGGTCGCCCTCACTGAACCGACTTGAAT
+CTGAACTACGATTCAGATCAAGTCTTACCGACATCGGATTTCCTTTTCGTGCCATATGCG
+CTTTTACTTTACTTTACTTTACCCCTTTTGATTCCCGGTCCAATATTTGTTCTCGAAAGT
+CTTCGTTTTCGTTGCTCTAAGGTACACCCGAGCACCTTTTGGTGATGCGATGGTTTGATC
+CTATCCTCTCTCTCGCTTAAAGCCTTCAAACAAAGAAAGCTACTCCGCTATATATACTAA
+AAATTTTTCATATACGAGATTTCTGTTCCATTCCCCTCCTGCAGCCAAAGTGTTAGCGGC
+TGTAGCATCCACCGATAATGTGTGGAAGAGGGTAAGCTTTCTATGTGGATAGGACGTATC
+AACACCTTTTGCATCTTTTAAAGGAAATATATAAGAATGAATAATATTGTGTTGGGTCCT
+GAGGATCAGGATGGCCGAAGATCAAAACCTAAATGTGCCAGGGGTTGATCATCGAAGCCA
+GGGACGATGAAGGAATTTGAGCGCTGATGTAGCTAACAGCCACCTTCATAGTCGATTCAT
+TAGGGTCGCCACTCGTCTATCCCGACCNNNNNNNNNNGGGCTGTTAAGCCTCACAGCTAT
+GGGACTTCCTAAAGAAAACCGCAATCGTAGTTTATCAACCACTCACAAGACCACCGAGAT
+CTTCGGCTTAGCTCCCAAAGGTAATCCACCCGGCCCTTGCCCAACCTATACAAGGGGAGC
+GGAAGATAACGAAAGGGAGACAAAGTCCTAACTAAATCATAACACAAGAACCTCCGTCTA
+TATCATAACACAAGCTACCCATTAGCCTCGTCTATCCCGACC
+>ds2020-328_20
+GGTCGGGATAGACGTTAACATTGGCTACTTAAGCAATATTGGACACCAAGCACTTCGTGA
+AGGAATTTCCAATTAGGGATGAGGAAGAGGAAAGTAGCTCGACCAAAGGGAGAGGAAGAG
+CAGTGGTTGACAATCATTTGCCGACTCTTGCCCAGTTCAACTGATAAGGAAATTGAAGTC
+AAGAGGGGCTTGCCACCTGGTGAGATAGTAGTAGTGCCTATGCATGCAACTATTGGAGAC
+CNNNNNNNNNNAACGGCCGCCACTAATGTGTTTTTGTTCAGCGTGTGAGGTTTTGGAATT
+GGAATTGGAATTCGAGGAGTGCGCTGAGGGATACTTCTTTTATCACAGAGTGGTTTGTGG
+TTATCGGAATCGAAGGCTTGGATGAAATGGAGGATATGGAAGTACTTTTTGGAGTAGTTT
+TTTCGGGAGCAGGAGTTGGTGTGAGTGGAAGTGGGATAGATTTAGACACGCCTTTGAGGT
+ACGAAGGTGGATCTGATACTTGGATGGTGAGATGTGAGTGTGGTGCTAGAGATGACGATG
+GGGAGTTAAAGAGGTTAGCTCAAGACTTTTCCAGGAAAACCGAGACCAAGTTTGATTTCC
+ATAAAGAAAACGTTTAAAATTCACCAAATGAAAAAGTCTCTTGTTCTTTACTATAAACTC
+AAAGCATTAAAATAATTGATCTTGTTTGGAAGTTTTTACTTTAAAAAGCAATGATAAGAC
+CCCGTATTTGCGTCTATCCCGACCNNNNNNNNNNTTGCAAAACTTGCTTTAAGATAACTA
+GAAAGCTAGACCTACAGGTGCTCTGAATTCCCACAAAATTTGCTGTACATCTGCCAAATC
+ACATCTCGGTCTCTCCTCTTTCTTGTTAGTCCTTGGCTCGGGCTGGCCCTTTCGGATTAG
+CTTGTCTTCCTAGCTGCCTTTCTTTCCCCTGCCTTATGACTCTCGTACATAGAAGAATGA
+GTGGCAAAGCACTCGACCCGTCTATCGCGACC
+>ds2020-328_21
+GGTCGGGATAGACGAATATCAGCCCTGTAGATTCGTTCCCATGGTTCGATCCTTCCCAGT
+AAAACGCGGCGTGTTCGAATTCTGATCGCTTTTACGCGAGAAAGGGGGACCACCCTCTAA
+GCCTAAGTATTCCTCAATGACCGATAGCGTACAAGTACCGTGAGGGAAAGGTGAAAAGAA
+CCCTATTTAGGGAGTGCAATAGAGAACCTGAGATCCGATGCGAACAATCAGTCGAAGGAG
+CGGAGCTTAGAGCCTTTACTTTATATTAGTAAAGCGCGCTCACTCTAACGGCGTACCTTT
+TGCATGATGGGTCAGCGAGAAAATGGGAACAGCGGCTTAAGCCATTAGGTGTAGGCGCTT
+TCCAGAGGTGGAATCTTCTAGTTCTTCCTATTTGACCCGAAACCGATCGATCTAGCCATG
+AGCAGGTTGAAGAGAGCTCTAACAGGCCTTGGAGGACCGAACCCACGTATGTGGCAAAAT
+ACGGGGATGACTTGTGGCTAGGGGTGAAAGGCCAACCAAGATCGGATATAGCTGGTTTTC
+CGCGAAATCTATTTCAGTAGAGCGTATGATGTCGATGGCCCGAGGTAGAGCACTCAATGG
+GCTAGGGTGGCCCCATTTCGCCTTACCAACCCCAGGGAAACTCCGAATACAGGCCTAGAT
+CGTTTGTACAGACAGACTTTTGGGGTGCTAAGATCCAAAGTCGAGAGGGAAACAGCCCAG
+ATCGTACGCTAAGGTCCCTAAGCAATCACTTAGTGGAAAAGGAAGTGATCGAGCGATGAC
+AACCAGGAGGTGGGCTTGGAAGCAGCCATCCTTTGAAGAAAGCGTAATAGCTCACTGGTC
+TAGCTCCATGGCACCGAAAATGTATCAGGGCTCAAGTGATTCACCGAAGCGACGAGACCT
+TGAAAGCTTCTTTTTCAAGTGTCAGTAGCGGAACGTTCTGTCAATGGGGAAATGTTTTTG
+GTGACAACACGTGGAGATATCAGAAGT
+>ds2020-328_22
+GGTCGGGATAGACGTGCGTTCTCCTTATTGAAAGCGCTAACGCGCATCCGTTTTCTTGCT
+CGTTAGCGCTTTCAATAAGGACTTTTTTTAGGCTTATAACATAGAAAGGGCTTTTCCCAA
+CCAACCTAGGTTATGGGCTAGCGCGGCTCGCTTCGCTTTTGTTGCGGAGCTCGCTGCTTT
+TCATTTTGTTAGGAGTAGGTGCTTGCCCTTTGTTGGGTTTGGGTTGGGGGAAGAGGTCAT
+TTCCATCGCGAAGGATTCAATCCAGCCACAGGTTCCCCTACGGCTACCTTGTTACGACTT
+CACCCCAGTCGAAGACCCCACCGTGGTATGCGCCAATAAGACCACCAAAAGCCTTTGTGG
+CACTAGTGGTACACAGAAGTCATGGGTGATCATTGGTCCGATGCTTCGGGCGAAACCAAT
+TCCCAGGGTGTGACGGGCGGTGTGTACAGGGCCCGGGTACATATTCACCGCGGCATGCTG
+ATCCGCGATTACTAGCGATTCCAACTTCATGTTCCCGAGTTGCAGAGAACAATCCGAACT
+GAGGCAATCTTTCCGGATTCGCTCCGCCTTACAGCCTTGCTTCCCATTGTAATTGCCATT
+GTAGCACGTGTGTGGCCCAGCCCATAAGGGCCATGCGGACTTGACATCATCCCCCTACGT
+CTATCCCGACCNNNNNNNNNNGGTCGGGATAGACGACTCTAGCCCCTATCTCCGTCTATC
+CCGACCAGTGAGGTGATACGTCATCCCCACCTTCCTCCAGTATATCACTGGCAGTCCCTC
+GTGAGTGCGGCACGCACCTTTTTGTTTGTTTCGGAGCCGTTTTGGCGGGGTGTACTAAAC
+TCACTACGTACCACACCACCGGGCGGCTCGCCTGAATGCCTCGTACTTCGACTCAGCCAA
+CCCCGGCGTCTATCCCGACC
+>ds2020-328_23
+TGAATTACGGCGGTCGGGATAGACGGGAGCTACTACTCATGCAGCGGCAAGGACCCGCAA
+CTCTCGAGGGGGCCACCAACCGCCCGAATAACTCCTTTACTCAATGGATAGCGCTTATCC
+TCTTTCAATCAACAAAATGAGAAATGGGGGAGAAAGAAAGAGAGAAAGAGGTCTTTATTG
+AAGAGGCTTTGCACCTGAAATAGGACTAATGAAGATCCAGAAGAATGGGTCTGGGCTTTC
+GAAAAGATGAAGATGCAAAGGGTAAAGAGAAAAAGTCTTTTGAACAACCAACCTGACATA
+AGGATTATAGCTCGCCCACTTAGAGCAGATGGTGATTCTCGGACGGGGAAAAGCGGCACT
+CGAAATCTATTAAACAACACCAAGAACAAAGCCATACCATGCCCTCGGGATAAACTAGTG
+ATGATTGCCATGAATGCTGCCCTCGAGGATGTGTACAAGAGGGTCTTTGCCGATTCCTAT
+CAACATGGTGCACCTCTCAAGGGTGAGACTTTAACCGAATGAATGGGGATCAATTGATAG
+ACATTTTGATTGAGGAAGAGAATCCAATCCAGGATGAATGCTTTTTTCGTTCGCTATGTG
+CTGACTAGATGCGTACTCGCGCGATCGATCGATGCACGGGGGAATTGCGTGAATGACGAG
+ACCGGCCTAACCTAAAGTAAAGGCTCTTCCCTCTCTTCATGGCGAATCTTGATTGACTGA
+CACTAGGAGCCGACTCGGAGAAACAAGAAGCATGGCATGAGATTCGCGGCGGAATTAATT
+CCGATAGCGAATTACTTGATTCGATGGATGGAGGGAGAGCCCTCCAACTCAAGCACAAAA
+TCAATGTTGAATCAACAATCATCGAGAGCGAGAAGGGCCCCATGACGTCTCTCCCGACC
+>ds2020-328_24
+GGTCGGGATAGACGCCCCGGTTGAGTTTGAGAGCCGTGTGATGGGTGACTATCCTGCACG
+GTTCGGGGAGCACTTTTTGTCTGCGTTGGTGAATGGAAGCCCCCACTATCAAGCAAGAAA
+GAAGCGGCTCTTCCCACGGCGGAGTCCCCATTGACTCTATTTATTATTATGGTAAATCAG
+TGTATCAAGATGTCAATCTGAGATCTTATTTCGGTTCAATACGTCCACCTACGAGACTGA
+CCTTTGGCTTTCGTCTCGGTACGTGTATTATAATAAATTTTCCCAAAAGAACATTCATTC
+ATTTCTTTCTTCCCCGTCGACCACGACGACTGAAACGACACGAAAAATCCAGACCCGGAA
+AGGGAACGGCCGGTGGGGGGCAGTCGGGAAATGCGGGNNNNNNNNNNGGTCGGGATAGAC
+GGTGGTGGGCATTTGGTAAAGTCGGGCCGATCGGGTGTCTTCATTCAAGCGACGATACAG
+AAGAAGAACGAAACGAAGTGAGAGGCCGGGGGGCAGGGAAAAGAGTCGAGTCGATCAGGC
+TCGACGACCGGGAGAAGCAAAACGAAATTAGGATTTGGCCGAAAAAGAAGCAACGCTATG
+GATACCATGACCGATCACCATCGATAAAGAAGAATCTTTCTAAATCACTTCGGGTCAGCA
+GGGCCTTCAAGCACCCGAAATACGCCGGGGTTGTAAATGACATAGCGTTCCTGATAGAAA
+ATGACGACTCCTTCAGAAAAACTAAGTTATTCAAGTTCTTTTTGCCAAAGAAGTCCCGCT
+CCGACGGCCCGACGAGTCATCTACTTAAAAGGACCCTCCCTGCAGTGCGCCCCTCCTTCA
+ATTATTTGGTCATGCAATACTTATTGAATACAAAGAACGGGCATCGTCTATCCCCACC
+>ds2020-328_25
+ACTCCACCTAGACTCTTAATCTTAGACAATCTGTCACCGACCTTAACATAAAAGGATGAG
+CCCGGCCTGTCTATTTATATGCATTGGCTTAACTCATTCCTATACACTGCAAAGAACACA
+AAATTAAAACAGCCTGGTAAGGGCTGTACAAGGGAACGAAAAGGGAGTTTGTTTGATAAG
+AAAGAGTTTGTGCTTAGTTAACAAACATCGAGTTTGGAGTCGGGGCAGCGTGGATACGAG
+ACTATTGAAGTTAAGTTTGGAATCATTTTGGTTTTCTATCTTCAGATTACCAAATTGGAG
+AATCACCAAGGCCTTTCAGCGATTCGACGCGCCCCCCTAAGCTAGACGCTTCACCTACCC
+AGAGAATAGAATGAGTCGCCCGCCTAGTCTTACTAAGAGTTTGAATTGCTCCGGGCGAAT
+GAATCGCATTAGTGTGATTTGGCTAGCAGAATCGCCCTTATATTATATATATTTTTCAAC
+CAGGTCAACGCATCGCCACTACGGAAACGAAATTTCCTTAGTCCTTTTTCTGTGAAACAA
+AGCCAAGTCTTTTCCGCCTTCCATCCCGCGTTTCCCTGCTTGAGACTGCTTTTTATTAGC
+CCAGTCATGAACCACCCCGGTTGGAGCCATGGTCTACCCGGCAGTGCTTCATAGCCCCCT
+TGCTCTTTGTCTAATCTTAGACTAAAGGTACGGCATCCTTTTTTGTTGTTTTTCTTTTGG
+CCGTAGGTTGTACGCCAGCCATATGTAGCTTGAACTGTGATGGCCACAATGCTTAGCTAC
+CCAAGATGCCTTTGGTTGAATGTTCACACCCGTCTGCACTTCCTACATTCATTCCCGGAA
+ATTGAAACAAAACAGGAAAACTGGAATTGTAACCCCCCGGCGCGTCTATCCCGACC
+>ds2020-328_26
+GGTCGGGATAGACGATAAACTGGGCTTCTCAGCTTGAGTATGCGTAACATACACAGCGGA
+GGCATCCACCTCAACTTGAGACAGAGCATTTATAGGTTTCACTTTAATAGACCTAAGAAT
+ATGTCTTTTTGTCTTAACAGGAGTCTTCTTTCTATAGAAGAACTTAGACAAAGCATATAC
+CGTATCAGCAGGATTTCGGTATGTAATCGTTTGTTTCACATGATCACCTTTCAAAACATG
+GTGCTTCAGGAGAAACATATCATTCCTGGAAATAAACGGTATTTGTTCAGTGTCACCAAA
+GGCTATAACCTCTGATAAACCGGCAATTGCGTCTATCCCGACCNNNNNNNNNNGCGGTCG
+GATAGACGCAGCCCCCTCACCTCTTCTTCAACCTCATCTCCCTCTTTTGTTTCCAGCACC
+GGCAATTGTGGCAGCAGCATATATGCACCCAGCATGTTGCATGAAACACTCATCAAACAA
+CATCTTCTTTGCCTTGGGAGCATTGTTTGTCATCAGATAGGAATCGCAAGTTCGAATGAA
+CCTGCTTTTAACTAACTGGGATCCCTCAACAGCTTCTTTCAACTCAATTGCAGAAGATCT
+GTTGGAAGTCAAGAGTAGGTCTATATCATCTCCAACCATGGAGGCAATAGACTTGATCTT
+GGTAGTTTTTCCACAACCAGCAACACCGTCCATGATTGTGATTGAAAAATCACAATTCAT
+CTTCAAAGCCTTTTCCAGTGAAGGTATAACCTTCTCCACTGATGAGAATACACAAGAGTC
+ATCAACAATGACAATTTCGTATTCTCCGACAGATCGTACGCAGGCAGCGGACACATTTCC
+GGCATCATCCCACCATTCCGTCTATCCCGACC
+>ds2020-328_27
+AACGGCCGCCACTATACGAATACCATAGGGGGTAGAGCACTGTTTCGGCTAGGGGGTCAT
+CCCGACTTACCAAACCGATGCAAACTCCGAATACCTATGAGTACTATCCGGGAGACAGAC
+TGCGGGTGCTAACGTCCGTAGTCAAGAGGAAAACAATCCAGACCGCCAGCTAAGGCCCCA
+AAATCATAGTTAAGTGGGAAACGATGTGGGAAGGCATAGACAGCTAGGAGGTTGGCTTAG
+AAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTCACTAGTCGAGTCGGCCTGCGCGGAAG
+ATGTAACGGGGCTAAAACTATGTGCCGAAGCTGCGGATTTGACATTAGTCAAGTGGTAGG
+GGAGCGTTCTGTAAGCCGATGAAGGTGTATTGAGAAGTATGCTGGAGGTATCAGAAGTGC
+GAATGCTGACGTGAGTAACGACAAAACGGGTGAAAAACCCGTTCGCCGAAAGACCAAGGG
+TTCCAGTCCAACGTTAATCGGGGCTGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCG
+TAGTCGATGGGAAATCGGTTAATATTCCGATACTTGTTTATAATGCGATGGAGGGACGGA
+GAAGGTTATGCCAACCGCGCGTCTATCCCGACCNNNNNNNNNNGGTCGGGATAGACGGAT
+GAGAAGGTTAAGTCAGCCTGGCGTTGGTTGTCCAGGTGGAAGGATGTAGGTATGTATCTT
+AGGCAAATCCGGGGTACTCTATACTGAGATCCGATAGCAAGCTGTACTTGTACAGTGAAG
+TGGCTGATACCATGCTTCCAGGAAAAGTCTCTAAGCTTCAGTTACACAGGAATCGTACCC
+GACTATACCGTCTATCCCGACC
+>ds2020-328_28
+GGGAGGGATAGACGAACAGTATGAGCCAATGGACCTATCAGATGCTAGTAGCGACGAGAC
+GGTTGGATGAAGGTTATAGATCAGAATACATAAGCGCAATGATCGTAGAAGCAGTTAAGC
+AAAACAGAATAAGAACCGTGAAGACTTTAGAGATAATCTCGGGGGCTCGAATGACAGAAG
+AAGAAAATGAAGTTTTCGGAAATTTGGCGGAAGCTGAGAGAAAATTAGAAGAAGATAAAA
+GAAGCTTTAGGAAGGTAGCTGGAATGATGGTGAAGAAGGTGGGAATGGTGATAGGATTGC
+CTTTCGTGATATCAGATTTCTGCATGGCTGCTTAGCGTCTATCCCGACCNNNNNNNNNNA
+GGTCGGGATAGACGACGCTTGGGTTTCTGGTTCGTAAGGACAGTGTCTTCAGCTCGAGAA
+AAGATATCAAGGACGGCGTCAGCTGCAGCTGCGTGGACATTAGACAAAATTGGAAAAATC
+AAGTCTTCGCAGGTTAAAATATTAGGAAATGTGTCGTCGCTACTCAGAAGGGCGTTGGAA
+TTGATGTCCGTGATCTCAAAAATATATGACATAGAAGTGAGAGAAGAATTTAAATTAGGC
+AGCAAGATCGGCGAAGCCGGAAAGGTTCAGACGTCCATGCTGAGTAACATGGTAAACAAG
+ATAACCAGCTCCGTAGTGAGGGAATTGGCTGACAAAATAATAAGCCAGAAATCATTGCAA
+GATTCGGGGAAGAAGATGGAGGAAGAGAAGAAAAAAGAAACTGAAATTAGAGAGAAAAGA
+AGCGCATATGCCATGCTGTCTAACAAATCGTGCCAAATAGAAACGGATGCAGAAGCTGAA
+GTTTGGAGAAA
+>ds2020-328_29
+GGTCGGGATAGACGGTGCAGTCGATTAGAACGGAAATGGAGTTGGAAGCAGCCCCTTTCT
+ACATGCTTGATATCTTAAAGCTCGCCAAAAGGAGCCCAGCCCATATTCCCATAGCTGTCA
+AGTTGAGATTCTTTTGCACAAACAAACAATATCGCAGAATATTCTGCGTGTATCACAGGC
+GCTTCGCGCCCTCGAGTTGAGAATCAAGGAGATTGATGTATATGGAGATTCGTCACTTAT
+CATCTTTCAGACAACTGGTGATTGGAAAACCAAAGATCAGAAGCTCATTCCCTACCATCA
+GTATCTGGAAGATATCAGCCTAAAGTTCAGACGGATTACCTTCAATTATATGTCGAGGAC
+GAAGAATAAGTTTGCTGACGCATTGGCCACACTAGCTTCCATGATCAGTAGACGGTATTG
+ATATCCGGCCAATAGAATAGAGTCGACGAATCGGATTGAAATCAGTGTGAAGAAGAGTCA
+TGCGAGGACTAATCAAGCACAGCTAAATAGTAGTCATATCCACAAAGAAAGGAAAAAAGA
+TCGTCAACGCTTCTAACGTCCGTAGGAACTAAGTAGGAGGGCCGGAACTTGAGGCACTCG
+TCTATCCCGACCNNNNNNNNNNTGAGACCCCATTTCCTGTCTACCTCTCTGAATCCTGAG
+TTTTCGGAGCAGTAGAGACTCGCGCTTTAGCCGCTTCATCTGAAGTGAAGGAGGGCTTAC
+AGAAGTCACAGCACCAGAAAGTGACAATAGGCAAATCAACATAAATGCAAGAAAAAGAGG
+AAACTGTACATCAAGCCCTGTATAGCGAGACAGAGAAAAGAAATGGTACCTGGCGTCTAT
+CCCGACC
+>ds2020-328_30
+TTCTTCGATGATGCGCAAATTGAAGCTTCGGTACCCTTGTTTTTTCCAATCGCCCTTTTC
+TCTTCTTTCTTCTTTTCTTCACTTCCTTCCTGCTTTAATTCTTCATCAGACCCTCCTTTC
+TTCCTCGCTGCTGCTTTAGCCGACTTCCCGCTGTTTTCATCGGTTTTTTCTTCTGTCTCA
+TTCTTCTTTGCTACCGGGTATTTAGCCGCGTTTCTTCCTATCAGCAAGTCCCACGTCCTT
+CTCATTGTCCGCGACGCCTTCCTCACTATTCTCACTGCTTTGTCTTTCAATTCCACAGCC
+CTTCTGACGATAGTCCTGTTTAGAAGTCTTCGCACGCCTACGATTTTCCTGCTTATCCAC
+CTTATCACCGTCGCCAGCTTACTGCCAACCGCTCCGTTCGCGTCGTTTATTTTCAGCTTC
+AGTGCCCAGAACCACCCTTGGTCCATTTCTGTGACTTTCAAAGCTTCTCCGGTGAGCACT
+TCCTCCTTAGACAGCATCGTCGATGCTATGGATGGGTTCTTCATCCTGTCCGTCAACTTA
+CTTATTATGGTGCTTGGGTCCATCATGTAGCTGCATCCTCTTGTCCGACAATCTGCTAGC
+CTTTTGAATAACTCATCTCGGCCCACGTCTTCTCCTGCTATTCTATTCTTCCTTTTCATC
+TTTATTCTTTCGGGATTTTCTATTCCCATTGGTGCCCTAGGGCTGAACTCGCTTGAATAC
+AAATATGCTATCTTGAATCTGTCATTCAAATCATTTAGAACCGCAGCCATTCTCAACGCG
+TCCGTTAACAACTCAGTTTCGCAACCAAGACACCACGTCTATCCCGACC
+>ds2020-328_31
+GGGCGATTGGAAAAAACAAGGGTACCGAAGCTTCAATTTGCGCATCATCGAAGAAGATCA
+GCTGGGCGGATCAATGCGAAGGAGAGGAAGCCGTCTATCCCGACCNNNNNNNNNNGGTCG
+GGATAGACGAACACACGGGATAGTGGCTAGATCGGTGATGACAGCTATAAGGACAGGAGT
+GAAACTGGCGCTAATTGGTCCTAAAATAGCATTATTTGCTGTAGGAAAGGTGTTGAGTGA
+TTGCAGGTCTAAAGTCACAGAAAGTCTGTCCAGAGCGACCCAAGTTATGAGGTTGGGACT
+TAAAATGCTGCAGAAATTAAGGTCCCAAGTAAGGAGTCGAGTCGGCGAGAAGATCCTATC
+GAAAGCGAAGAGTGTGGCTTGCGCCAAGGCTGGAAAGAAAAACACGGCGAAGGAAGAAGG
+CGAGGCAATCAAAAAGAACAGAAACGGACCGATGGAACAAGTGGCAAGGGCGGCTTTAGA
+TGAAATGAAAAAAGGAGCAAGAAAGTTCGTGTCGAGGATGTTCAGTGAGTTAAGGAGGCT
+AGCATCAAGTGCGGAAGAGAGAATTGAGAAGTTTTTTAGCTCGATTAGCAGAGCATGGAG
+TAGGCTAAGCAAAGAAGTGAAAGATTTATATTTCCAAACAAACCTTTTAGTGCGCGCGAT
+GATGGGCAAAAAAATGGACGTTGGCAAGCACTTTTGCTTATTCAGGAAAGGGGAAACAAG
+CTCAGCTGATTTGATAATTTCCGTAAGCAGAGCGATCATGGGGTTGTTGGGGAGAATAGT
+GATATTCTGTGTGTCGACTGATTCCCCACGTCTATCCCGACC
+>ds2020-328_32
+GGTCGGGATAGACGTTCCCCCCCCCCTTTCTATTCCTCGCGAGCATATTCCCACATAAGG
+GAGTACAATCGATTTTTCCCCCTGGAACTTGTGAATGAAAAGGGAATATGCTCGCCATTA
+TTGTAGTGCTCCCGCTGAAGCGACTCCACTCTCCCTAGCAGAGCTTTACAAAATCCAACC
+TCAGCCTTATCCAGCGCTAACGATTCGATGTACTTGTAAAAGGTTCTGTCGGGAAGGGTG
+CGCTTCCTTCCAGAAAAAAAAGTGGTTCTTACCTTCCTGTACGAGTAGTGAAGAACTATA
+GTGAGTTGTGGTTGGTTGTTGACCAACGGAAAGCGTGGGAGAAAGAAGGAGTCATCGACG
+GGGCGGGGATCACGCAATAGATCTCCGGGGGTGGGGGGGTACCTTACTTAAGTATGGATG
+TGATTTTGACCCCGTTCCACCCCAGCTCAAAATCCATTGGGATGCCCCAATTGTTGAATA
+TGATTAAAGCCATAAGGAATGTGTGGGAGGCTGTATAAAGAAGTAGAAACAAAAATAGAG
+ATTTCGATAGTCCATGAAGAAAAGGAAGGATTTGTTGATATGTAGCAGCTCCGGCACCTA
+TTGATTTTGCACCCTCTAACATCTCCGAGTTAAGAATTCTCGTCACGCTTTTTCATTCAC
+GATTTTATGTTATTGATTCCTCGTCGATTCTGCCCCCCCCAAAAAAAATGAAGAAAGACT
+TGTCGGAAATCGCCGGTTGGGTTTACCAACCAAGAAAGACATGGGAATTTTAGGCGTCAG
+ATTCTTTTTCTTCAGGGCTTGGCGACGTCTATCCGACCGC
+>ds2020-328_33
+TGGTCGGGATAGACGAGTTGGGGCCGAGTCCCGTAGATACTACATAAGAAATTTTTTCAT
+TGATGGATGGGAAGGTGTATAAAAAAAGGTAAAAGCGCTTATGGGGCATCCCACCTCCCG
+AGAAGGTTGAAGGGATAGAGGAGCTTTTTAGCCCTTTTGAGGAATTGGTTGGAAAAGCGC
+TACCACCCTGGCCGGAAATCCTATGTCCAAGCGCTTCAGAGGTCAAGGGAGTTCGATCCG
+GCTACAACTCTCCTCCTTCCACGCACGGACAAGGATCGGTTGTTGAAACAAATTCATCTA
+GAAACAAATAAGTTCTTGTTTGATCCGCCGCTGTTGTAACACCACAATATTCGTCCTTTT
+CCTTTTGAGGTTAATCCTCTCAATGGTGAATCGAGCACTCGAAAAATTTCTTCGACGGAA
+TGGAAGAAAGGTAAGGAAACCCGCGATGGCTACTGAATACCCGCCCTTTACTTTCTTAAT
+AAAAAAGCCCCTTACCTTTGTATTCGTTCGCCAAATCTTGTTCAGTTCCATCCAAGCTCG
+GTTTTGTCTGAATCTTCGCGGAAGAAGAAGAAGCGGTTCACCAGCCACTACATCTGTGGA
+TCCCACCAAATTTTTAAACCTGGCGGCTGCTCGCTCTTTGATCAGTGATTCACCGGCCAC
+TACATCGATGAAGAATCTCTCCAAAATCTGCTCTTTGATCAGTGATTCACCGGCCACTAC
+ATCCAGGGATCCCACCTTATTCTCAAACCTGGAGTGCAAGTCTATCACGACC
+>ds2020-328_34
+GGTCGGGATAGACGCTTACCGGGATTGGGGAAGACGGGTGGATTATAGAGCTAGGGGCGG
+ATCGAAGGTTTGCCCGTTGGGATTGGGCATGGACGAGCCTCGACTGGGCCAGCGTTGATG
+AAAAAATGAAAAAAAAACTTCTCCCATCGCATCATTAACCGGTGTAGGATTAAAGATCAG
+GTCCAGGATTCGAGGCAAATCAACCTCCCCTCTCATCTCAGGGTGAGGCAAGGAATTCAA
+TGTTCGTTGTTCAATATCTCGGCTGCTCAAGAAGTTGGACTAGCAGCTCCTCCGACCCGG
+AGTGGATTCTAGGGGAAGGGCAGAGCCTCACCTTGCAGTAGGAAGGTGGTCGTTGCTGGG
+ACGGGTTCAAACAGGACTGAAGGGAGGATAAATTCAATACTCCGATCTTACTGGGGATTC
+ATCACTGGCTAGGGCTTTCGAATCAAAGCATGGGCATCCGCAACTAAGAGGGAGCAGTAG
+ATCGTCGATTGAAGAGCCAGGTCAGTAAACTTCTATTGATTATTGATTCGACTAGAGGGA
+CTCCTAGCAACAAACTTGTATGAAGGGCCCCCCGTGGAGATGCAGGAGCCGCCAGCCGGA
+TCGACCAATAAATGATAGGCCAGAGGGATGGGCTCATTCGACTAATTAGTGATCCCTGGC
+CCTACCTAACAAGGGGTATGTGTCGTCTATCCCGACC
+>ds2020-328_35
+GGTCGGGATAGACGTTGACTTTCGCTTTCTCCCTTGTAGCCGTTACCCGAATTCGCGCAA
+GTGTGTCCACACCCCCCAAACTGACTTGACGAGGAATCCATTCTCGCGAACAAACACAAC
+CCCTACACACACCTAGGAGCACCCCTTCCTGCATATCCATACAAGACCCGAGTAGGCGGG
+TCGAGGTCCTACGAGGTACCCACTACTCGGAGTACCCTCCCAAAAGGAAAAAGATGTGTC
+TGTCAGGTTCGGTTCTTCTTAGTTGGGTTGGGCGGGTTCGACCAGAAATGCTATGCTTAC
+ACACAAGACTACCCCTCTTCCCGAAAGCTTCGCGGGGACTACTTTACGACGACGGACGAC
+CGCCCGTAGGGGGTTTACTGCACAAGGCCCCTGCAGAGGAAAGGCTTTATCCCAGCGAAT
+AGAAGATGCTCAGCTCCGCACAACATAGGGATTAGCACGCTTTCGGAAAGAACATAGAAT
+AGTAAAGGATCCAGCATGCGGAACACGGCGATCATTAGAAATTCACGAATTAGAGATGCT
+GTAATATACTCTTTCCCATAACTTCTCATACCAGACCAACCCACTGAAATGCAAATAGGG
+ATCAGAAATGTGGTCAATATCACGAAGAATAAAGAGATACCGTCTATACCCAAATAAAAA
+TTTATGTTTTATCGTCTATCCCGACC
+>ds2020-328_36
+GTACAGCTTTGGCTAGCAACTTCGGAGCCGCTACTTCGGGATGCGTACCCGGTGACGGAT
+ATGCTCACTACGGAGGTTCAGCGTGGTTGAACTGCCGCGCGCTGCAAGAGTGCCAGAACG
+AGGGTAACGATGTAGTTAAGAGATCTGAACTCAATGTCACTAGCTCCGACGTCCGTGGAG
+CTATGTCTGGTGGTGTTGTGATGCCGGACTTTCTGTACGCGTACGGCACCACCTACTTTA
+TCCACGGACAAAACAAGTCCGGGGGTCACGTTGACGCTAAGATTTTTGACAACACTGAAT
+CTGAGGACTTGATGAAAGATCTGGTCAACATGACTGAAACCGACTTCGTTGCCAAATACG
+CGCACCTTGGTGTAGACGGCGACTTGTTCGGTGCTGCATAAGTCGTTGAATGATGACCAA
+AGGTGGATGAGTTGACTTGTTAAGCCCTATGGCAGGTCGACAGGGGCAATTGGTGGAAAA
+TGCAACCGGGCGCAAAATGTAAATCAGCGGAAAAACACGGGTAAAACAATAAATTAATTA
+CAAAATAATGTGAGAAGGGCATATCGTCTGATATGGGGCGACTGGAAGGCGATCTCAATA
+AACTGGTCTCAACAACCAGGGAGCGCAGAACAAAAAAAACACACATAAGAAAATAACTCA
+TATAGTGGCGGCCGTTGCTGTGTATT
+>ds2020-328_37
+GGTCGGGATAGACGCACGCTCACACTGGTCGGGATAGACGGTACCAAGGGCTTTCGGTAG
+ACTTCTTTCATTTCCGAATTAGCTTGCGAAAAGTCCTAGCATTAGTATGAGTTCGTTGAC
+CGCGTAAGGGCGATCCATCTTGATGACGAATTCCACGATAACGAGAAATAGAAATTAATC
+GTTCGATGTCTGCTCGCTCTCCCCTCTTCAATTCCCAATGAACAACATGATCTTGACCTA
+TCATTTGTTCAATTTGGTCGATCTGATACTTAGTTAACTCTTTTATCTTTATGTTCCCAC
+TGATACCTAATCGATAACGAACCTGAATGGCTTTTTTAGGTCCAATTCCATCAATTTTTG
+TTGAGGCAATTCTTACTTGTTCATCGGCAACTGATCTAGCTCCTGAAATATATGACATTC
+TTGATCCTTTCCTTTACTAGTCTTCTCGGCTGGAATCAAAAATGGGCTGTCTCCTCTCTG
+ATGATCTTTTCTATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATTTCTTT
+CTTAAAAAAAAAGAAAAAAAGGACATTCGACCCAATACCTTAACCATGTAATTTCTCCGA
+CATTATTTTCTATCGCCACATCAAGGTGACAGGATTCGAACCTATGGCCCTCTGTACCCA
+AAACAGACGTCTATCCCGACC
+>ds2020-328_38
+GGTCGGGATAGACGAATCATGATTTTACTACGAAGGAAGGAACTCGAAGTGAGACGGCAC
+TGTCTTGTCCAACGCAACGATATGGCCCTCTATCATCTTCTATCCGGTAGACTTGGTAAA
+AGGGCCCCGACTTTTTTCCAGAATTAGAGTTCGACCGCGGCTGCCCCCTTTTTTGGGGGG
+TTGGTCAGAAGTCAGTCTTGTTTGGTAAGACGGAATTGGACAAAGAAAAGAGAGTGCTCG
+ACCGGAGCAACGGCCAACAAAGACCGTAATTACATAGATAACCGCTCCTCCCCTTCTCCG
+TCTTTAAGGCTTTAAGGCGAACCGTATGGCGGCTGGAAAGAAAGACGACCTCACCTTCTC
+GTAGATGGTGTTAGTGAGAGCAACTTTAGTATCCCCCGTTGACCTTCTTTTGCAGATAGA
+ATCTTCAATGAGTGGAAACAAGCAACCTTACTAATAAAGGTGCTTGTTGAGTAAGGCCGG
+CGCCCAAGCCCCTTGTATAGGTTGGGTGCTTGAGCGCATGTTTCTCATATCGATCAAGGC
+TTTCCTTGAGTTTTCAATAAGGGGCGCGTTAGCACTCCTGCAAGAAAACGGCCTAGCTAA
+CGCGCGCCCTTACGTTTTCTTCGCTTGCTCTGCCTGCAGTACGAGCCTCATACAGAGCGC
+GCCCCATCGTCTATCCCGACC
+>ds2020-328_39
+GGTCGGGATAGACGACGGATCCCAGTCAGCCTTCTTCCTCTTCAGGACATACCTGACTCT
+CACAACTCCGCGAGAGGTTCACCTTCGGCGTCGTCCTCCACTGGACAACGAGTCACATTA
+CCTTGTGACAACACAATCACTCCGCATCCGGCAACGAACCCTCGACGCCCATACATCAAG
+CGTTGCATAAGACACGTCAACTGCATCGACCACGTCGCATGCTTCACTCATGGCTCGCTC
+ATGTCCAAGTCAAGACATAGCGATCCAACACACCATCGGTTTACCCACACTTCTGTCGGT
+CATTCCTTTAGCATCCACGATAGCCCACTTCCTCAAGCTATACACGCAAGCAGTCCTACT
+TGCATGTCGCCCAAGCCTTGGCGACATATATATTCCGAATGTCCCACATAACCGTCTATG
+CATTGCATGGGGTCGCAACCCATGCGTACCGGCATCCGAATATCTTCCTTCCAACATTAG
+ACAAGGCCGAACCCCAACCAAGTCTATCGAGTCTTGCCACATGCCTCGCTAGCCGATGGC
+ATAGCGAATGCCATTCCGTGACCTCACTCTTTCCGACAATGCCCAATACGAACGGCCCGA
+CGTGTTCGTACTGTCCTCGGGAAATCCTTTCCCTCGGAGACACAGATCATCCTCATTCAG
+CGTCTATCCCGACC
+>ds2020-328_40
+AACGGCCGCCACTACTTTTTGCCTTTATTGATATGATATAAAACAAGCTTACTTACTAAT
+AAAGCGGCAACAAGCACCTTCTTTCTCAAAAAGTAAAGTTTCGCGCTTGTTGCTTTAGAA
+AAATGGCAGCGTTAGCGCTTTACTAATACTTATATATAATATATCAAGTAAAGGCTCTTC
+TCCTTTTCTACTAATCTACAACTCTCTTTACTGAGCGAGACTCCATCCATATCCCTACTA
+GTGGTTCTTTTTTTTTCTATTCTATCATTTGTTTGACAGCTTAAACCAGGCTCCATTTTA
+GAGAGTTTTCGGTCTTAATCAAGATAGGTCAGGGGCGCGTCAGAACGGTCGGTGGCTGCT
+TAGTCTCATCCGAGAATCTCTTTGTACTGCTTTTTTTCAAAGAAAAAAAAAGAAAGAAGG
+GGTTCGATTTAGGCTCCTTCCCTTACAGAGCATAGCTGCGCTAGCAGGTACTACGAGCCC
+TCTGTCCCGCGCATCTAACCAGCTCGCGTGGTTCACCGGTTCCACCGAAAACTCTCATTT
+GTTGAAGCGGAGCATAGTGCGCTTTAGGCGCCGAGCGAGAAACGTCTCTTCTTTCGTTTC
+GATTTATTCACTGATCTGAAACTTTGCACTTGTTTTCTTATTGATTCCAGGGGCGGCGGC
+GTCTATCCCGACC
+>ds2020-328_41
+GCCGTGGACCTAGTTGCCTACCCCCTAAACCACTAGATCCACGGCTGGTACTTATTTACT
+AGGTCCACGGCGGTCGGGATAGACGACGAGAGCCCGTTCTAGTGCCTGAACTACTCCGAT
+TATTATAGGCCTCAAACTCGTGTCCTGCAGCTCTAATTCTTTTGCTATTTCTTCCAACTC
+TCTTTCTCTATCAACTTCCGCTTCTTCTTCGACTATCTCTTCTTCCGTCTCAGCCAGCAG
+CCTTTTCCTCAATTTCATTTCTTCGTGAGCCGCTTTGCATAACTTAGCGTCCTCAGAATT
+AGATGCTGCTATAGCCCCTCCGCACAGCAATGTCTCAGCTGCCACATCTCAGCTACGTCT
+ATCCCGACCNNNNNNNNNNGGTCGGGATAGACGTGTACTGCTTCTTTATCGGATAAAATC
+TGGCCATCTCTCTCGCAGCCGCGCACAGTCTTATTGCCTCTTTCGTAGTAAACTCTTTCT
+TTCCGAATGACTCTGTTTTCTCTACTATAGCTTTCATCCATTCTTTTTGCCCTTCGACTT
+CTTCTCTATTCAGGAGGTCTATTGAGCTATATCGGTCCCAATTATCGAACCTCCAGTACC
+TTTGCTCACCCTCTTTCTCTTCCGAAGCTCCCTCAACCATCGATTTGTTCGCGTCGTCTA
+ACCCGACC
+>ds2020-328_42
+GGTCGGGATATACGAGGCACTGGACTGGAGTGCTTTCATCAAATGATGCATGTGGGCTGG
+GCCATTCCCATCCCAAAGGGCGGCCCGATTCGGCCTGGCCTGGTCGGGAAGAGATTCACA
+TAGAGACTATCGCTATCCGGGAATCTATTTCTTTCTATGTTAGCTAGCGGGGGCGGGCTT
+TCCTATGGTAGTCCCGCTGCGGCCTCTGACCGTCCGTCCCGTCTCATCTTGATTTGGCTA
+TACTTGTATGTAGCCACCCTCCACATGATAGCCTTTTTCTAAAGGCTAAAAAGGCACTCA
+TCAGTCAGCTCGGCCCCTTTCCTATTAAGCTTTGCCACCTTACCTTAAGAGAATAGGTCC
+CGTTCAAGCGCCCCGCCTTTATTCATCTATACCAACTGCCACGCACGACCCAATATGAAC
+GATTTCAGCGCCTCTCTCTAGATAAGAAGCGGAACGCGCCATCACCTACAGCCCTTTCCT
+CTGCCGGGGACTTCCACGAAATGAAAACGGGCGGCATCGTCGTATGCTCGACATTTGTTG
+CCCGGGGTTATCTCCCGGAGTACTCCTATGGCCGATCTGTCACCCAACCAACTTAAACAA
+CCTCAATCGCTTGGCCCCGACCCGTTTGGAGAATGACCCTTATCGCACGGCTACGTCTAT
+CCCGACC
+>ds2020-328_43
+GGTCGGGATAGACGCGCGGGGGGTGTGCCACGACGAAACAAGGGAATTTAAGGCCACTTT
+GCGTTGGATGCTCTTTACCCTCCCCACAATGACGGCTCTGTTGTCTTGGGGAGCGTTGAA
+GCTTGCTTCTTCTCCAGAGTTTTCTTGGTCATCAATATGACCTGTCCTTAATAGAACCAA
+TCTGATTCTCTGAACAATCGGAATTTCGTACTTCTGTCGGATCCTCCCTATCTCCTGATC
+GAGCTTGTGTAGGTAGATGTTGCCTAGTAGGGCCGATAGTAGTACACTGTGTGGGACGGA
+ATAAGGGCCCTTCTCACCTCCTACGAGTCGTCCGGCGGAAAAGACTTTCTGAATGGGGTA
+AAAGAACTTGGGATCGTCGATCTCTTCCTTAAAGATTGGGATGAGTCGATGTCGGTCGAT
+GGTGTGAAAACACTTCCTGATGTCGAATTCCAAAAACCAGCGAGAGGTTCCCCACTCTTC
+TTTGATCCGTCTTAGGGCCGAGTGGCGGCCTCGACCCGAGCGGAAGTGCGATGTGTCTGG
+AAACTCGGGATCGTAAATGAATTCGAGTACCATTCTGATCGCCTCTTTCATGATCTTTTC
+TATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATT
+>ds2020-328_44
+GGTCGGGATAGACGTGGGTGCTGGGTCGATTTATTCTATGGCGAAGCATCCGAAGCATAA
+CTGCACACTCACACGATCTTTGCCGAGAGATAGGAGCATTCGGTGGAACCGGTGAACTAC
+ACTTGCTTCTGGATAGATGTGTGGGACAGAGGGCTCGTGGTACCTGCTGCCCACCCTTCC
+TCCTCTGCTTTGAGAACCGTGTGAACGGAGAGTGGGCAGAAGGGAAGGAGGTCCTCATAC
+GGAGTCGCACACTTACTTGAGCAGTGCGGGAGACTGGGGAATGGGTCGAGCAAACTCCCC
+CTGGGCCGAAAAATTACAGACGAAGCTTTACTTAGATAGGGCTTTGATTTGATTGGTATT
+GATTTTTTCTTAGTGATTGGAAAGGAGGGCGCCGGGGTATGTTATAGAAAGGGAAGGCGG
+AGGTAGTACTTCGAATGGCGAAGAGCGGCGGCTCGGCAGGGAAGGAATGGGAAATCGTCA
+AGGATGACTTCTTTGTTGGCGAAACGAAGGGCTAAATAGCGCCAGTGATTCTCTGAGCCG
+GTCTGGATTTCCAACGCCTCGGGAAACTGGTCGAGATAGATGACAGCACCCTTTTCCTCT
+CTTCCTTACTCTAACAAGTAAGCAAGTAAACTACCT
+>ds2020-328_45
+GGTCGGGATAGACGTATATAAGCCCTGTATAGCGAGACAGAGAAAAGAAATGGTACCCCT
+CCGCCCCTTGCTATTAAGAAAATGACCAGACGTACCTGGTTGCGATCAGATGTAGGAGAG
+AAGTGCGTTTAGGAGCCACCGCATACGTTTACTCTTGAATTAATTCGTGAGATTTGCGAT
+CCCCTCGCAGGTCCTCCAAACCCCCTTGAGTATTCAAAGAAAAATTGTTTGATCATTCAA
+TGGATCAAGCAAGGTGTTGATTTCTCTTTTCAAATCAAGGTCTTCTTCGAAAGAACCAGA
+GTTAGCCGAGGAGCTCGAGCAGGAGTTTCTTAAAAGCTGAAAAACGGAAGACTGGGGCCT
+TTTTACAAAAAGTATGGGAAACCGGAAACGGAATACCTAGGTCGCAGGGCAAGGGAGGAC
+GGAACCCCACTTCGACTCACCAAGGAGAAGGTAAGTACTTTTATATCGTTTCTTCTGAAG
+TGATATAGAGCAATGCCTGGACTGGGGGGGGGGCGTCGGCCCACGGGAAACCATTTGCAG
+ATGCGACCATGAATCGAACCAGATCGAAACATTCAGCTTCGACGGACAAACCGAACCGTC
+GATCGCAAACGAAGAATGGCCGTCTATCCCGACC
+>ds2020-328_46
+GGTCGGGATAGACGCCCCTTAGCCCTGAATGGTAGCATAGTAGGGGAAACGGGTTTGGTC
+GGTTTCTCAGTCATATGAGCAGCAACACTCTACCTCAAAAAGGGCTCTGCTTAGGGAGAT
+CGGGTCGACGTCATTTCTCCGCTATACAACCAGACCAAATGAGAATGATGGCTCTAGAGT
+GCCCTACCAACAATAAGGCGGTTGACGTGACTCGCCAGTTATGTCGAACAGCGAAAAGTG
+GACTTGAATGAGATGCTTCTTAATGGAGGGTGAGTCGGAACCCTGGAACCGGGGAATACT
+GCGATTCGCAGATTCTATTCATCACTTTCCATGAGTCCCCAACCCTCCTGCGCGTATAGT
+CGCGAGAGTAAGCAACCCACTAAGCTCCTCCGTCTATCCCGACCCCGTATCAACCAGCAT
+TTCGACATTTCGGGTAAGATGGAACCCTTTTCTATACCCTTAACCTGCCACGGGTGTGAG
+TGGACCTTTCTCCTCAAGCGCTTCCCAACTCCCCCTATTCCAATCGCTCGTCGCCCATTC
+TCTAAGGGGGCTCTCTCCTGCTCCGTCAGCGTGGCACTCTTCTGCTCGGTCAACCGGGAC
+TGATTCCCCGTTGACGTCTATCCCGACC
+>ds2020-328_47
+GGTCGGGATAGACGCTTGTCCCCCCTCAGCTCACCCTAGCCCCGGGCCTTTTGCTCTTCT
+AACGTAAGCTCCAAGGCTTCACACCAAGTCTTCACTGACATAATATGCATGCTTAAGTAG
+GGTCAGGCAGAACCGCTGTTGCCCGATGGGAACTTCCCCCATATTGCTATCAATGTCTTC
+ATGTCGCACGACCTCTTAACATTACACCACTGAATCCCCAATCCTTTGCTTGCTGTGCAG
+TGACAGTACCAATATCCACTAATCGTTGTTTCCAGATACGGTTGCCGGTTGACATCTCTT
+CTAATTCGTCGATACGAGAAGCAAATTGTTGTGTGGAGGAATCAATATCTCGACATAAGC
+CAAGAGGCAAATCTTGGGCCACTCCACCTGGTCGTATGAAACTGGCATGCATCCTGGCTC
+CGGAGACTCTTTCATAGAATTCCAACAATTTCTCCCGCTCCTCAAAAGCCCACAGGAACG
+GAGTTGATGCTCCCACATCCATAGCATGAGTAGTTAAAGCAAGTGAATGATTTGAAATTC
+GAGTTATTTCACGGAATAACACTCGTATATATTGAGCTCGTAATGGTACCTCGCAATTCA
+AAAGTCTCTCTACGGCTGAAGAA
+>ds2020-328_48
+GGTCGGGATAGACGATGCATATGGGTAGCAAGAGGGCGCTTATGCCCCGACGGTGGGGCC
+TTATGGGGAAGGGCCCAGCCAAATAGGGACAGCACACCCCCCACTTCAAGCGCATCTCTG
+TATCGACTGAATCACTCTAAGAGTCTAGTCGGTGGAACCGGTGAACCACGCGAGCTGGTT
+AGATGCGTGGGGCAGAGGGCTCGTAGTACCCCCTTTTCTTGATCCAGCCTTTTCTTCACT
+TCGGTAGTGAATCACCTACTAAAAAAAGAGGCAGGCCTGCGCGCCCTATTTGAGACTACT
+AAGGCAGGCGGTGGACTCTTTCATTAGGGAAGGGAAGAAGGGGCCTAAGCACGGCAGATG
+CCGTACACTTGAGTGGCAAAGGAAAGCGAGATCGTACCAGTTTTTCCAGGCCTGTTCGGA
+CATATGGTTCCCGCGGAAGATCAAGTTGGTGAGCCGTGTGATGGGAAACCTTCCCGCACG
+GTTCGGAGAGCACTGAATTAGAATGAGAGGTTCACCACCACATCATTGCATGCAAGGGGA
+GCTCGCTCGATTCGCAAATTGGTCCGACTCGTAATTCACTTCTGACCCCGTGTCCCGTCT
+ATCCGACCGCCGTAATTCTCTCA
+>ds2020-328_49
+GGTCGGGATAGACGTTGGTACCCCCTTCATTCAGCTGACGTTAAGAAAACAACAACAGTT
+TGCACCCTCGAACATGCCTAGTGCTCCAAGAAACACCGCTGCCTTTGTGGCCTCATTCGA
+ATCGAACCAAGTTCGCCCTGAACCTGGCCGTTTCGTCCCGACCTTCCGTCCGATGTTTGG
+AATTGATGGACCCGTCCTCGATACCGTCTCCTTGACAAAGAACATCTTGTCTATCGTCTC
+TGACGTAGCCTCTGGAAGCCCCGGAAAAGCCGCTTTCTATGCCGCCGGTACCCTCTTGAA
+TCTCTCGGTCGTTTTCACCTCTACGAGCCAATCCCTGTCTGACGACGATATCTCAAACAT
+GGTCAACCTTCCAACTGCCCTCCAGCAATTGGTAATTGGATACTCTAGAGCGAAGTGTTC
+TCAGGAAAAAGTGGTTCTATTTGACTCTCGAACCGAGGTTTCCCGTCTGTTATGGACTTT
+CGATCAGATCGCAACAACTGGCCAAGTTATGGCTTTGTCTGCCCTGTCCGTCCCCATGAC
+TCCGTCTACCTCTCTTCCCGCTGCAGTCCTTCTCCACAACTTCCTTCGTCTATCCCGACC
+GCCGTAATTCAGATCGGAACA
+>ds2020-328_50
+GGGCGGGATAGACGCGACGGTCCGTTCTAGTGACAGCATTCCTACTTTTATTATAGCTTC
+CGGTACTGGCGGGGGCAATTACCATGTTATTAACCGATAGAAACTTTAATACAACCTTTT
+CTGATCCCGCTGGAGGGGGAGACCCCATATTATACCAGCATCTCTTTCGGTTCTTCGGTC
+ATCCAGAGGTGTATATTCTCATTCTGCCTGGATCCGGTATCATAAGTCATATCGTTTCGA
+CTTTTTCGGGAAAACCGGTCTTCGGGTATCTAGGCATGGTTTATGCCATGATCAGTACAG
+GTGTTCTTGGATTTCTTGTTTGGGCTCATCATATGTTTACTGTGGGCTTAGACGTTGATA
+CCCGTGCCTACTTTACCGCAGCTACCATGATCATAGCTGTCCCCACTGGAATCAAAATCT
+TTAGTTGGATCGCTACCATGTGGGGGGGTTCGATACAATACAAAACACCCATGTTATTTG
+CTGTAGGGTTCATCTTTTTGTTCTCCATAGGAGCACTCACTGGAATAATCCTGGCAAATT
+CTGGGCTGGCCACGGCCCACTTCTCCCTCCGGTGCGCACTCCAATCCATAATACAACCAG
+ATTGAGCGTCTATCCCGACC
+>ds2020-328_51
+ATTGCAAAAGAAAGGGCTTGCTGATAGAGCGGGGCGGGGAGGCGATACTAGTTATCAGGT
+CAGAGAGACGCCTGGCCCGTAAGCCGGCCCCCTTAAAACCCCATTACTTAATAAGGATTT
+GTTACGCGCGATATGCCGACGACTTACTACTGGGAATCGTGGGTGCCGTAGAGCTTCTCA
+TAGAAATACAAAAACGTATCGCCCACTTCCTACAATCCGGCCTGAACCTTTGGGTAGGCT
+CTGCAGGATCAACAACAATAGCTGCACGGAGTACGGTAGAATTCCCCGGTACGGTCATTC
+GGGAAGTCCCTCCGAGGACGACTCCCATACAATTCTTGCGAGAGCTGGAGAAGCGTCTAC
+GGGTAAAGCACCGTATCCATATAACTGCTTGCCATCTACGCTCCGCCATCAATTCCAAGT
+TTAGGAACCTAGGTAATAGTATCCCGATCAAACAGCTGACGAAGGGGATGAGCGAAACAG
+GGAGTCTACTAGACGGGGTTCAACTAGCGGACACTCTTGGAACGGCCGGAGTAAGAAGTC
+CCCAAGTGAGCGTATTATGGGGGACCGTCAAGCACATCCGGCAAGAATCAAAGGGGTATC
+TTACGTCTATCCCGACC
+>ds2020-328_52
+GGTCGGGATAGACGTTTGATCTACATGATACTTATTATGTGGTTGCACATTTCCATTATG
+TACTTTCTATGGGAGCCGTTTTTGCTTTATTTGCAGGATTTTACTATTGGGTGGGTAAAA
+TCTTTGGTCGGATATACCCTGAAACTTTAGGGCAAATACATTTTTGGATCACTTTTTTCG
+GGGTTAATCTGACCTTCTTTCCAATGCATTTCTTAGGGTTATCGTGTCTGCCACGGCGCA
+TTCCAGATTATCCAGATTCTTACGCTGGGTGGAATGCCATTAGCAGTTTTGGCTCTTATA
+TATCCGTAGTTGGGATTCGTCGTTTCTTCGTGGTCGTAACAATCACTTCAAGCAGTGGAA
+ATAACAAAAGATGTGCTCCAAGTCCTTGGGCTCTTGAACAGAATTCAACCACACTGGAAT
+GGATGGTACAAAGTCCTCCAGCTTTTCATACTTTTGGAGAACTTCCAGCTATCAAGGAAA
+CCGTGAAGTAAAAGAAGAAAAGGTAGACCACTAATACTAAGAACCTAACAGAACAAGCAA
+TGCCCCATGCCTTTCTTGGTTGGACCAGCCCAACCGGCGAATTACGTCTATCCCGACC
+>ds2020-328_53
+GGTCGGGATAGACGGGGCAGGTGCATGCGTCGCTTCTAGCCGGATTCTGACTTAGAGGCG
+TTCAGTCATAATCCAGCGCACGGTAGCTTCGCGCCACTGGCTTTTCAACCAAGCGCGATG
+ACCAATTGTGCGAATCAACGGTTCCTCTCGTACTAGGTTGAATTACTATTGCGACACTGT
+CATCAGTAGGGTAAAACTAACCTGTCTCACGACGGTCTAAACCCAGCTCACGTTCCCTAT
+TGGTGGGTGAACAATCCAACACTTGGTGAATTCTGCTTCACAATGATAGGAAGAGCCGAC
+ATCGAAGGATCAAAAAGCAACGTCGCTATGAACGCTTGGCTGCCACAAGCCAGTTATCCC
+TGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAAAGGATCGATAGGC
+CACGCTTTCACGGTTCGTATTCGTACTGGAAATCAGAATCAAACGAGCTTTTACCCTTTT
+GTTCCACACGAGATTTCTGTTCTCGTTGAGCTCATCTTAGGACACCTGCGTTATCTTTTA
+ACAGATGTGCCGCCCCAGCCAAACTCCCCACCAAACAACGTCGTCTATCCCGACC
+>ds2020-328_54
+GGTCGCGAAAGCCGCTCCGTGCTCTTTCATTAACTGATATAAATATCGGCTAGTCTACCA
+TATTTTTTATTGACAGAAAGATAAAAGGATGGCTCCATGTGCTCTGATTCATTATGTGGA
+TTCATCCAGGAGCACTACCAAAGTGTTTCAAAGAAGGGTTATCCTGACGTAGGTCTGCTT
+CTGGCCTAGATCAACTTAAGTTAAATGGAGTTTCTATCGCCCTGCTTGAATCAAATATGA
+AACTTCATACACCTTAAAGTTCATAAGATAGGACGAAAAGAGAGTTTTTTTGAGGTCCTT
+ATACTCATTATGCCTGGCATTGAATAGACAGGTAATTCGCCTTATCAATATCTCAAATCA
+ATGATGGGTTCTATATTGGCACCTAAATGGGAAACCGAATCGGACCAAACCCTTTGTCAG
+GCTATTGTTCTCTTGTTTTGTTCCCTAAAAGTCATAGAGTAAGACATCGATTTATCAATA
+AGATCAAATATTTTTTTGATTACATGATGGACTCCTCTGAAAAACATTGGCGCGCGTGTA
+AACGAGGTGCTCTACCTAACTGACCTATGGCGTCTATCCCGACC
+>ds2020-328_55
+ATCTAATACACAGCAACGGCCGCCACTATGCCTTTCGCCTACCTTTTCACCGTCCGGTTT
+CTCCTAAAGCTAGAATTACGGCTGCCAGGTTTGAACCACAGCGTCTGCCGACTAGCCTAT
+CACGAGATCTGCCTTATAGTGTCCAGTTCGGGTGGGATTTTTGTTGTTTTAAAATGTTTT
+TGTGTTTTTCTGGTTTTTTAAATGTTTTTGATTAAAAATTAATATCCACATGGTGGTTGA
+GGGTCAACCGTATAGCCACTGCCTGTTAACGTCAAGCTCATATCTACATCATCACCATCA
+TCAAATGCTATTGTTGAACAGAAATAGGTAGTGGCGGCCGTTGCTGTGTATTANNNNNNN
+NNNTCCGCTATTACTCCAGCTACCTGATCAGCCAAACTGTCGGTATATCCACTTTCCCAG
+GTGAAAGCCGATGCTTCAGAGAACTCTGCTTCTAGCTCAGTAGCAGTATAATCTTCCTAC
+CTCTAACTGTTAGTGGCGGCCGTTGCTGTGTATTAGGGATAGACGGAAAATACTCCTGGT
+CCGTCTATCCCGACCAGGGCCTGATGACGTCTATCCCGGCC
+>ds2020-328_56
+GGTCGGGATAGACGACCAGGTCTGGTGATGTTCAGGTTTGTCATAAATTACAGAATTTGC
+AATAGTTTCTGGTTAAATTTGGATATCGGGTGTGTGTTTATGTTGCTGTCATTTATAATA
+CTTATTGATCATGATCATGATGGTGCGTGGAGATATATACTATAATATGTATGCAATTAT
+AAAACCACTGGCTAGGAGACGTGTATTTAAGATGATCAAAGAATCTTTNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNGGTCGGGATAGACGTATTTGAGGTATTTATGTTCATGT
+CTTTTATAGTTCTATTATGATTGCCTCAATTTTGTTTGTATTTGCAGTGGGATGACTGTA
+GTTACATCAAAAGAAAGAAAATTGAAAGATGAAGACCTGTCTAGCCCAAAAAAGAATGTT
+ATTTCCACACCAAAGAAGGATAAGGATAGACTTGCTAGGCGAAGAAAAGTAAACAAGTGG
+AGCTCTTTGGAAGAGGACACCTTGAGGGCTGGTATAGAGCAGTATGGAGTAGGACGTTAG
+AAGTTAATCTTGACTAGCAACCAGGACCGTCTATCCCGACC
+>ds2020-328_57
+GGTCGGGATAGACGACGATGGACCATGAGGAAGAACGGAACCCTTTTTATTTTACTTTTT
+ATTTTGTTTACCTCTTTACTGTTCAAAGATCAAAGAGAAAACCATTCTGTTATTCTGTTA
+TTCTGTTATTACATTACGTGGATACACATTTTCTATGGGAAACAACATAGACATTGTAGT
+TGTCCAACGAGATACTGCACATACTAAAATATTGTCTTGGCTAGTCATGCGCACTTACCC
+GTTGTTTTATTATTTTAGAAATTTTATTTATGTTCTGCTTGTTTTATTGAACCCATTTCA
+TATCATGGTTCAAACGTTAAAAATCGACTCCGAAGAAGTTCCCGTGGATCATTTGTCAAC
+TGCTCAATCAATGACTTCTATAATGGGTATAATAAAATAATCTTTTTGTTAGCATTCCGA
+CGAAGAAGTCATCGATTCTTTTGATCGGGATTCATATTGAAAATAATCAGAAATCTAGGA
+ATTATAATCGCTTTTAATCGCTTTCGATTATTTAAAATTAATTGAAATCAACACAAATAG
+ATAAAGCAAAGCTCTCCATCTATCCCGACC
+>ds2020-328_58
+TGGTCTGGATAGACGCCCGCTGCAAGTTATATGAGAACTGAGCAACATCCATCAACTTTG
+CCCAATTCCGCTGGTTGGCACTCACATAGTGCCTCAAGTAAAGCTCCAACAAGGCATTCA
+CCCGTTCCGTCTGACCATCTGTCTGAGGGTGAAAGCTAGTTGAGAAGTTCAACTGTGAGC
+CAAGTAGCTTGAAGAGCTCCGTCCACAGCTTCCCTGTGAAGCGTCTATCCCGCCCNNNNN
+NNNNNGGTCGGGATGACGGTAGCATACTTGGTGAACCTGTCAACCACCACCAAAATTGAG
+CCACACCCTTCCGACTTGGGTAGACTCACAATGAAGTCCATGGATAAACTCTCCCATGGT
+CTGGTTGGAACTGGAAGTGGCTCTAGCAACCCGCCTGGCTGCTTCTGCAATGTCTTGTCT
+TGTTGGCATACAAGACAAGTCCGCACGAACGAGTCTACATCTTCCCGCATCTGTGGCCAA
+TAATAAGCTTCACTCATCAAGGCTAATGTGCGATGAGTGAAGCTTATTATTGGCCACAGA
+TGGCCACCGTCTATCCCGACC
+>ds2020-328_59
+GGTCGGGATAGACGCTAGGGGGGAGTGCTACTACTTCACTTTCTTGATTTGAGACCCAGA
+TCATAGAGGAAAATGGGCTGTTTGACGGAAGGCATAGCGCTAGTCCTCTTACGGATAGAT
+GGGACTAGGACCGATATCATGCTATTCTAGAGATAGATAGGCGAACAACGACAAGGAAAT
+CCCAAGCTATGAATGTTCTAATGTTTGCGTCTTTGAAGCTTGTTCCTTTCCCACCCACCC
+TCCATCTTTACTTCTTTGAGTGTGAAGCACATGTTGGCATTCCAAGCTCCTTAAAACTCT
+ATGACCTACTAAATTTTTCTTCTTTCACTCTTTATCTTATAGTTCACCTTAAATTAAAGC
+ACTTCCAGTAAAATAAGGAAGACTCACTTGGGCTCTTATAATCATTGCAGGGTTCGCTCG
+AGTAGAATCATATCCAATCTTCCTGCTAAGCCAATCCCCAGTACAAGCAACTAAATCCAG
+TTCATTCCCAAGGAAAAGGGCTAACTGAATTCCCCTTCTCGAGCGAGAGTTCGGGACTTG
+AGTAGTGGCGGCCGTT
+>ds2020-328_60
+GGTCGGGATAGACGAGAGGGCTGGCTCATCAATATAGTACGGTCCGTGTGCCCTTTTTTC
+TCTTAGTCGCTAATAGAAGAGAGCTGCACAATCATTGGAGTGCCCGGGCATATCAACATC
+CAATTCCTATTCATAAAGCTGGACAGATTCTCTGAAAGTGATCGGACGGGTAGCTAAAGT
+AGAACGAGAGAGATCGGTAAACATAGGGGTTCCAGATCGGTAGACGAGAGGACTTTGACA
+CAAGCTTTTGAAAGCGATTGTGAAAGAAGATTTTTGCCTTCCTTCCAGCTGCAAAGATGG
+CTTTGAAAGCTTCGGCAGGGTCTTTTGATCTGTGCGGAGAATCAACCATTCTTAAACCAT
+TGGTTCTTATTAGGTAAAGAATAAACTGCCTCACCTTGACTTGAATGGAAGGTTCCGCCA
+TCCTCTTACTGAATATGGTCTGTCGAGCAAGAAAGATTCTATAACCCCGAGCTCGTATCA
+AAGCCCGACCACATTGCGTACCCCGAACTAAAGAGGGGACTCCCTGTCAAAGAATGGACC
+TCGTCTTCCCGACC
+>ds2020-328_61
+GGTCGGGATAGACGGTCAGCACCAGTGATTTCATATCCAGTCAAAATTTTGGCTAATTGA
+TCGAAGTGGGTAGCTCCAGTAGACCCATAGATCATGGAACAAATAGGGTGGGTAGGCCCA
+ACCACCACACTACACGTATAGACGCGAACCCCCCTCGTTACCGTACGTGCGACTCTCACC
+GCATACGGCTCGCACAAAGACTCCTAAATCCATCCCGAGCCTTTTCTTCCACCTCTCCTC
+TCCAATCCTCGATCAAACTTGCGTTCCCCAGGCGCTATGAAATGGGGGGGTCTTTCCTTC
+GCCTATCATATGTATCGGCTTGGCTTCGTCCAGAACCAAGGAGGCATTCCGGCGGGCGCG
+TGCGTGTAGGAAGGCCGACCACTACATAAGCTAAAAGACTACGACTACAAGCCAAGCCGG
+AAGCGACTCGCTTCTATTCTCGTTGGGATTGAATATAGATGGGGAATCTATAGATCGTAG
+TAGTTCGCCAACCTCTCTAACTAACATACGATACAATTTCACTTCAGTGCACGGTGTCGT
+CTATCCCGACC
+>ds2020-328_62
+GGTCGGGATAGACGTGAAGATCAGGTATACGCAGCTTTATGGACAGCAGAATCTGTGGGT
+AGACAGGTAATACACGATAATGTAGGTACAAAACAAACTTACCTAGCTAAAGATACACTA
+CTATCAGGATGGCGCCTAACCACGTTCATGAACAGCGTTCTTAACTATATATACTCTAAA
+GCCATAAGTCAAAATATGCTTAAAAGAGGAAACAGTCTTCATAATGGAGATGATGTTCTA
+ATAGGGACGAAGAACTTTGAAGCGGTGCGGAGGGGTCTAGAAATGGCTAACAGGCCTATG
+ACCTCTATCCCGACCNNNNNNNNNNTGAATTAGGCGGTCGGGATAGACGACTGTTTGCGC
+TGGTCGGGATAGACGCAGCTCACCCCTGGTCGGGATAGACGCGACACAGGGGTCTAGAAA
+TGGCTAAGAGGCTAAACGTAAGGGTGCAAAGCACTAAATGTGCCTTTGCTGGAATAGCTG
+AATTTTTAAGAGTAGACCATAAACGGGGCAGCAAGGGCCAGTATCAACAAGAAACTGCGT
+CTATCCCGACC
+>ds2020-328_63
+TTGGGGCGGATTAATCGAAGAGTCAAACTTCTCGTCTCGGCCCTATTAGGGTAAGGCCAA
+TGCACCAGCCAGCCGGGGTGGTGGCGAACACGATCTGCTGTAAGCTAAGCTGTTCACCTT
+GTAGACGGAGGAGATATAGAAAGTGTGCCGTGCGTGATTCATAAGATTATATAGTAACAC
+CAGTATATTATTATATTTCACTTAGCCTGCCTCTCCCATGACTTTCCGGACCAACCAACC
+CGGATCTGCCCTCGCAAGTCTCTCCGCGTTTTGGGAGCAGAGCCTGCAAAATCGAGCAAT
+GGGTCTGAGAAGAATTAAATTTTGAACGGCATGACTCTTTCTATTTTTGCGCCGGCATTT
+GAGTTGTCTCCCCTCCTCTTTCAATCGACACACTCCACACAGATAGCTCCCGTGGCCCCG
+GCTTCTGCCTCTATCAGGCGGCGACAGCCCCTACCTTCCCCAAGAACCCTTTTTTAAGGA
+TTCGGCAGGCCCGTAAAAAAAAATTGGGATACTTCCCCCGAAAAACCGCGGTTCGGCGTC
+TATCCCGACC
+>ds2020-328_64
+GGTCGGGATAGACGTTCAGTGCCCATCTTAACGGTACAAGTAAATTTTATTGATAATAAA
+AAAATAGACGGGGGGACATGCAGTTTCATCTTGATAGTAACTTCTTGATGAGACTCGACT
+CTTACAGTTTCATCTTCAATTCCTTGAGGTTGAGAAGGAGGTTGCTCCTCACAAATTGGA
+GGAGACAGAGAAGGACCCGAAGGCATGCTAGTTGATGATTCATCATTGTTTCTCTTAAAA
+AAATCTTGAATGGTCCTTGATCTCTTAACATTACGATGTTGACCCGACATTATAAAGTAT
+AACCTATTGAATAATATATAGAAGATGTAAACATATACACCCACAAAAATTTCAAAAGAA
+AAGAAGATGAAGAATGGAAGATTACCTTAGGTTGCTTTAATTAAGTCCAAGGACATGCAC
+AATTTTCCTTCTTGTCGAAGAGCAAGAGTTAGGCGCTAGAGGATGCAATAGAGAAAATTC
+TTTTTCTGTCTTTCCTTTTTTTTTCGGTAAAGGAGAGTGACGTCTATCCCGACC
+>ds2020-328_65
+GGTCGGGATAGACGCAGCCGCCTCATCCCTAAACCAAGGAAAGGACCGCGGTCATACTTT
+CTTTTAAACTATATAGGCCTTACACCTGGGGCGATTGATCGATTCTGCCGTTGACTCGAA
+TTCTTCGGGAACGAAGGATACCAGTACCAGACTAATAGAATAGAATCGTCGAGCACTATA
+ATCCGACGGACCGACCTAGTGATAGGAAGAGAAGGAGTAGCTCGCAACTGGCGAGCGATC
+GATTGGGGATTGATTTAGTGCCCTATTACAGAAGGCCGATGGGTAGACCCAATATCTATC
+AGTACTCGTGATCTGGGGAGTACCTAGGGAACTTATAAGGCCTCTACATTGAGGGAAACC
+CTGCTCTACGTGAAAAAGGAGAAGTTAACTTTTGCATAACCTCTGTTTTCATTGGGCATT
+GGAACAATCACAAGTGCAGGAAAGAACTTGTTGATATAAGAAGATCTCTTACCATATGGT
+CTTAAGTTGAGTATAGTACTCAGCAACAGGCATATCCCCCGTCTATCCCGACC
+>ds2020-328_66
+GGTCGGGATAGACGCACGCTTGCCATTTTTATTCATACAGTGAATGTTATTTTCTTTACT
+ATGCTACATGATTGACGGTCAGTTGCCCCCTTGAACTATCATTGTCATAGAAGGGCGCGC
+TACCACATTTTTTACATCCGTGGTTTGTGATCTGTCCTATCAGATTACATGCTCTAGCCC
+CATTTATAGTTTCTCCGGTGTTTGCTGTAAATGCAGTTAGATGCCCTACCGTTGCAATGT
+GCTGTCCTGGCGCGTAGTTCCCGTTGTACCCGTCACGGCATATTTTATCAACTAGACTAC
+CCAAATCATTGGGTCCAACACCACCACTACACAATGCGCTTCCTCTGCAATTTATGCCTA
+ATGCCCGAGTACTAACGTCTGCCACTGGCGTACCCCGCGACTCAATGGGGTTTGCCATAG
+CACACACTACTACAGCAACTAGGGAAGCCCCTAACAATCTCATATTAACAGTTAACATTT
+CTATGGGAATTTCCAGAGGATCTCTCAAAGTAATGTCCCGTCTATCCCGACC
+>ds2020-328_67
+TGAATTACGGCGGTCGGGATAGACGTCATTCAATGGTGGGGTGCTCATAGAAAAGAAGGC
+GTCGCCCAACAAGTGGCGGATTTTGATGGAGTCTCGCTTTGACGCTGGGGAGATCCATAG
+ATCTGGATAGAGTCTCGCCCATAGATAGAGGAAGAGTACGCGCGCTACGGCTTACGCAGT
+TGATCGGATCAGATAGCCCTTCGGGCAACCAACCAAACCCGGCACATCAAATGCCGATCA
+ACAACTGGGAGGTATGGCTGAGTGGCTTAAGGCATTGGTTTGCTAAATCGACATACAAGA
+AGATTGTATCATGGGTTCGAATCCCATTTCCTCCGGCACGGAAGTGGAACGGGCGGGCGA
+AATTACGTGAGAGAAAGAACCTCTTGGTGGAGTCCCCCGGAGGACAGAATAGCACTATTT
+AGTGACTAGGAGCGGAGAGCCCGTTGCGCGTTGTTTTTGTTTGACCGACCTATCTTCTTT
+CTATAAGCAAGCTCCCGCTGGCAATCCCTGTGTCCGTCTATCCCGACCA
+>ds2020-328_68
+GGTCGGGATAGACGAACGCCAACGGTTATCCCGACCAGGAGTACGTCGCGTCTATCCCGA
+CCAGGGCTGTTGACCGTCTATCCCGACCGCCGTAATTCATACACAGCAACGGCCGCCACT
+AACACGGAAACAGACAATGATTTGACTTTATCAACATGGAATAGTGAATTTTCTAAGGAT
+TATCCAGCGACCGGATCGACCAGTTTCGATGTCCTAAACCCTCTCTCAGACGGCTCGGAA
+TTAGAATTGGAAGTGTTAGTGTCATCTGGAAATATCTTTGGAAACTATCCGGTTGAAGAT
+TGGGCAACTATCACCAATTGGATCGTAGATACCATCTATGTCACCGAATTCAGTCCAGGA
+TACTTGACCGTACTTGTACATGATGAACAGGCAAACCGTGACATATGTGTCGTATCGTTC
+TATTGGATTGATGGTTAAAATATATGGCGGAACTTTAAAAACATGCAATAATAGTGGCGG
+CCGTTGCTGCGTATTACGATCTAAGGTGTTTTTCCGTCTAGCCCGACC
+>ds2020-328_69
+GGTCGGGATAGACGCCCATTGACATTAGGTTTGTACTGTCGGAATGAAGCCTCACACACT
+CTGGATAGAACCTTCGTGTCAACCAGTATGTGTCTTCTGGACACCGCTTCTAAAGAAGGG
+TGTACTACTGACGTAATATCAGTAGCCATGACCAAAGTTTTTGACTTCAGTTTGGTCAAC
+CAGGCACAGGATCTTCCTGCATTCAACTCAATTCCAGGTTTATACCCGGAGCAATAGGTG
+ATATCGATAATCATGACTCCATGAAAATCGGTTTTCCGCTCGACACGAAAGGCGGCATCA
+CCTAGATCAACAGCATTGTAATGCAAATACTCCATAAGTGTAGAATACTTATGGTCATAC
+CCCAAACAGGGTGCATCGACAAAGTCAAAATAAATTCTGTCTTTGTCCTTGTCCACATGC
+CAATCCACATTGAAATGATCTATGTGACCCCTGTCCTTAATGTACATCTCGGGATCGATC
+ATAACAGAACAAATGAATTTCATCACGCTTATTTCGTCTATCCCGACC
+>ds2020-328_70
+GGTCGGATAGACGGTTATGATTGGTTGAGGAGGACAACAAAGATCCGGCGGGGAGACCAT
+GATCCCCATCTGAGCGGAGGTGCCATATGTGCTTGAGCAAAGCTGCATGATTCAAAGATT
+CCATTTTGGAGATTCCTAGGCAATCTAGAAAGACAGACCGTAGCCCAAGCAACCTTGGCC
+CTTCTATGGTCAAGATCACTTCTAGAGAAAGGCATGGAGAATATGCTAAACCCGCTGGAT
+TACTCCTTGAGGAAGGAATAAAAGAGAAGACCAGGATGGCGAAAAGGATAGAGTTAACTA
+ACTGTAACCTGCCCGCGAAAGAAAGAGCCTTACTAGCCCAACAACTGATGCCTTTCCGAC
+CGGACTATAGATAGGCCTTACGCCCAGACTGAACTACACGATTGAAAGCCGTTACGTTAG
+CCCGCAACCAGAACTTCTTGCTTACTTCCCTCCGTAGCCAAGACTTTTCTTACCTTTTCC
+ACTCGGGTAGCTCACTCTATATGGCTTGTTTTTTGGGAGGTAAGCT
+>ds2020-328_71
+GGTCGGGATAGACGGAGACTAAGAGTGGGCAGAAAGTCGAATGACGGGGGGCAATACCTA
+CCGAGAGCTATAGCGACGTTAGTGCACTCGCGGATAGAGAGCGGACCAGCAACTTCATTA
+GCTGATGCACTGAGATCAAACGAAATACGTCTGTATGAAGCAATAGAGCGGGGTATGGAC
+GCCGAAATAGCATTGAAACTACGGTCGTTGTATATATCACGAGTGGCGCCTTTGTACGGT
+AATAACAGGCAAGAAGCTATGGAGCTATTAGAGGCGTCGTCTGTAGTAGGAGGACTGAGT
+ATGGACAGGGAGGCCAGAGTAGACAAAACATTTACGGAAACTGAGCCAACGTCGAAGGAG
+TCTGACGAAATAATGAACTTGGCGGGACACAGAAAATGGAGGGGAGTGTCAGACATGGCC
+AACGTGGTACTAGAAAAAATATCTGAACAAGGAGGAAGTGCCATAACGATAAAAAACATA
+ACGAAGCGAATTTATAATTATAAGCTGAGTGCGTTGTCTATAAAAA
+>ds2020-328_72
+GGTCGGGATAGACGTTGCCCTCCCCTTTCTCTCCAGCCCGAACCTACCTCTCTCCCTATT
+CAATGGTGCCGCCTTAACTTCCGTCTTCTTGATGCGAGGAGCGTAGTAGTTGATGCGGGT
+CTGTATAACACGGTCCGCCTCTGCTATACGCTCAGTTAGGGCGTTCATCTCCTTCTTGTA
+TTCCTGAACGATGTAGGCTTGCTCCCCTTGAATACGGCGGGCGGTTTGATACTCCGCCAA
+CTCTGCCGCGCTCAACGTTGAATCGTCCACCGTCATATTGCGTCTGGCCGATACAATCTT
+GTAAAAAGCCATTATACATGGTACGGCCACGCTGGCGTGCTTAGCATACCAGACGGCATT
+CTCCGGAAGAATGTCCTGAGTTTGGTACATCTCCCTCAACCCCACTGTCCAGCGCTCCAA
+GGACTTTTCGTTGCCATTGAAGCTAGCACGTGGTTCCCTAGACTTTGCTGGGTCGAAGTC
+TTGGATGCGGGCCCACTCCATCCACACGTCTATCCCGACC
+>ds2020-328_73
+GGTCGGGATAGACGCGCGGCACTGCTATTGGCATAACAACCGGTACACCATAGGTTGGCC
+CAACCCAGTCCTCTCGTACTAGGGTTGGCTCCTCGCAGTTCTCCCTTTAACACCAACGGT
+AGATAGGAACCGAACTGTCTCACGACGTTCTAAACCCAACTCACGTACCACTTGAATCGG
+CGAACAACCGAACCCTTGGGACCTTCTTCAACCCCAGGATGTGATGAGTCGACATCGAGG
+TGCCAAACGACTCCGTCGATAAGAGCTCTTGGGAGTCATCAGCCTGTTATCCCCGGCGTA
+CCTTTGATCCGTCGAGCGAGAGCCCTTCCACACGGGACTCCCGGATCACTATGGCCGACT
+TTCGTCTCTGTTCGACCAGTAGGTCTCACAGTCAGGCAGGCTTATACCATTACGCTCAAC
+AGCAGAATCTTAGCTTGAGCCTACCTTCGCACACCTCCGTTACTCTTTAGGAGGCATCCG
+CCCCAGATAAACTACCCACTACACGCGTCCATCCCGCCC
+>ds2020-328_74
+GGTCGGGATAGACGAACAACTACCATCTCGCTCTTTCCTTTTTTCGGTGCTACCTTTTTC
+TTTCTAAGGGATGGGATTGGGATGTATAATAACCTTTTTTTTGAGGATGCCCGGGAACAA
+CTCCTAGGTCAATTAAGGATCAAATGTTGGAACCTCATGGGTAAGGATAAGGTAATGGAA
+TTGATAGAGAAATTCATAGACCTAGGTAGGATAGGAGAATTGATAAGGGGAATAGAGATG
+ATGATAGAGATCATACTGAGAAACAGAATAATCCCGTACGGGTACAACTCTTATTTGAAC
+GAAGTGAAAAAAATGCGATCTTTGTTGTCTAATAGAACAAACACTAATACCTTAATTGAG
+TCGGTCAAGATCAAATCTGTTTATCAAAGTGCTTCTCCGATTGCTCAAGACATCTCTTTT
+CAACTGAGAAACAAAACAAGATCATTTCGTTCCATTTTTAGTAAAATAGTGAAGGATATT
+CCATTAGTAATGAAAAAAGTGTTTCGTCTATCCCGACC
+>ds2020-328_75
+GATCTGAATTACGGCGGTCGGGATAGACGAAATGCCCTTGTTTCTATCCGACCTAAAGGT
+TGGGCATCCCCAAGACAAGAGAAATATCAGTCGGTGAGGTTCGGATCGATCGGATCAACG
+GGAGCGAAAGCTGCTCGGAGAGAAAAAGAAAGTATGGCGTCTTTGGTCTTCTATGGAAGT
+CTTGGCTGAATCACTTGATCCAGTTAATCAAGAATCTTCTGACGAATAAGGATTGGAATT
+CACATCTGAGCAGTAAGGGAGGTGGAAGGACAGCAAGGTGGAGTAGTGGCGGCCGTTNNN
+NNNNNNNAAAAGTAGTAGGATTCAGAGAAAACCCAACGGCGGAAAACCGCTCCCCTTTCA
+GTCGAGCAAGTAGATTCAGCGATTATTGCTATTCTTTAACGCCCCCCGAAGATTCATTAA
+CATTAAGTAGCGTACGCCTGGTTCACCGCTAAATACACGAAAGAAGAACGGCTCTCCCGT
+TTGATGACTAAGGGGAAAAAATCGTCTATCCCGACC
+>ds2020-328_76
+GGTCGGGATAGACGAACTCACCGCTTCTATAGCCCACAATCTTTGCTGTGCATCGTAAGA
+TGAGTGGTCCAATGACACCCTCCAAGCTTTAACTTTGTTATGTCTCTCTCTCTCCTCTGC
+TATCGCGGCCATTTGCACTACATCATCTTCCGCAAATTCGCCGAAGTGGTTTATTCCTAA
+GCTCATGTTATTTCTGAATCTCGTCATTTTCAACATCTTATCCATCACCGAGAATAGGCT
+CAGCTCCACGTCTATCCCGACCNNNNNNNNNNGGTCGGGATAGACAGTTGTTTGCCCTGT
+TAATCTGCTTGTCTTCTTCTTTTCTACTCTTCTTTTAGCGAAAACGTTGGCAGCGACCTC
+TCCTCCTTTGGCTTTGCCGTCTATGAGCATGTCTCTTACTGCCTTCACTCTTCTGATCTT
+TCTTGGCAGATAACTAGCTATCAGTGGCAGTCCTGATCTGTGTCTGTCTATTATTCCTGA
+TGTCGCTTTGTTATTCGCGTACGTCTATCCCGACC
+>ds2020-328_77
+GGTCGGGATAGACGCTCGTTCTCTCTCTCTCTCTCTCTCTAGTTTTGCTCGGCTGAGAAC
+CAGCCAGCTCTCTCCTCCTCTCCTAAAGCCCTCTTCTCTTTATTTACAAAGGCTCTCAAG
+CCTACCTCAATGTAATACAACTCTCTATACATATATACAAACACAACAACCAGTGGATGT
+AGCCCGAATTCATGGGTGAACCACTCTATCTCTTCGTTTTACTTGTATGATTGTGATATT
+ACGGCTATCCCGATTTTATGGGTTCAACATTTGGCGCCGTCTGTGGGAACCCGCACGAAA
+GGCATGTGTTCTCATTTCTCTTAAAACACCTCATCTCTACCAAAAACAACTATCCTCATG
+GTCCCAGCACTCTTAGCCAACCAAGACAAGCAGAAAAGGTCACGTTCTCCACACTCCAAA
+ATCTGCTCAAGACACCCATGTGTCTCCTTGGCTCATTCTCTCCCTCGCGCAGCTCTCATC
+CACTTCAACATCCCCTGCGCACGTCTATCCCGACC
+>ds2020-328_78
+GGTCGGGATAGACGGTGACCTCTCGGGAAAAAAAAACAACGCAAAATCGAAAGTCCAATA
+TAGATATACAACGCCCCTTACGAACAAGAAAATCAAGTGGCCTTTGTTGAAGGCTTCTAG
+AGTGAGGAAAGGTTCTTAGCCACCGGTGACCGGCTTTCAAAAAAGCACCTTTGGGCGGAG
+GTTTCTCGATAAACTATCAGGGGCTTGCAACGTCTATCCCGACCNNNNNNNNNNTTTATA
+TAAAAAATTTTCAGGCCAGTCCTTTGCTTTGTACCAGAAGAGTGCGGCAAGGAGGAGATA
+CTAAGCAATCAAAGGGATGCAAGCAAGGAATTCGGCCTATTGGATTAAAGCAAGGAAGCA
+AGAAAAGAGATAAGCGTTAGAAGGAGGTAGGAAGCTCTTGCTATGCCGCACTCTCATACT
+TTTGAGTAAGGAATTCCCTGCAGGGCGGTTAACGGCTGTCGGATAGGGCATCGGGAAGAA
+CATATGGAAAAGTAGCGTCTATCCCGACC
+>ds2020-328_79
+GGTCGGGATAGACGATTTGCTGGCCTATGAATGTGGTTTCGATCCTTTCGGTGATGCCAG
+AAGTCGTTTCGATATACGATTTTATCTTGTTTCAATTTTATTTATTATCCTTGATCCGGA
+AGTAACCTTTTCCTTTCCTTGGGCAGTACCTCTCAACAAGATTGATCCGTTTGGATCTTG
+GTCCATGATGGCCTTTTTATTGATTTTGACGATTGGATCTCTCTATGAATGGAAAAGGGG
+TGCTTCGGATCGGGAGTAATCACTAGTGATAGGGCAAAAATAGGGGGGAAGGACAAAGGA
+AAGAGCGATGCCCACATTAAATCAATTGATTCGTCATGGTAGAGAAGAAAAACGGCGCAC
+GGACCGTACTCGAGCTTCGGATCAATGTCCCCAGAAGCAAGGAGTATGCCCGCGTGTTTC
+AACGAGAACACCGAAAAAACCAAATTCAGCTCCACGTAAGATAGCCAAAGTACGTTTGAG
+CAGGGACCGGTTTCGTCTATCCCGACC
+>ds2020-328_80
+GGTCGGGATAGACGCGCATCCCCCTGGTCGGGATAGACGTACATTGGGGCTGGTCGGGAT
+AGACGTCTAGGGGCCATCATAGAAACATAGATAGGGTCAACGACGGAACGAACAACGAAA
+CTTTACGACAGCTTTTTCGTACACGTTCACTTGCATCACATACACAAGTGCTCTCTGAAC
+CGTGCAATAAGGTTACCCATAACACGGCTCTCCCACTTGAGTTACCTTAGCCCCAGGCCA
+TGCTATTCAATGATATTGGAAAAATGGCAGCGTAACGTAACAACTAGTATTGAAAGCAGG
+TCGCCTTTTGAGGGATGGAAAGCGTTTCAATAGGAGCCCAGCTTCCCTCTTTGCTTTGCG
+ACCTCATCACTTCAATTCAAGCGCAAACCAATTTCTTTCTTAGTCACCGGGCGGGAGGTG
+AAGGCCATAAGAGAAGATTGCCCTCCCGGTAAGGTAGTTTACTTGCTTACTTGTTAGAGT
+AAGGAAGAGAGGAAAAGGGTGCTGTC
+>ds2020-328_81
+GGTCGGGATAGACGAAACTTCCAATTTGTAAACGTTGTTTGTATTCTGTTAGATGCTCTG
+ATATTGCCCTGTTAGGATTCGGTATTTTGAGGCCGGAGGCCATGGGTTGTTAACACTATG
+CTTGTGTATTGTATGCTGGCTGTTGGGTTGTAAATATCTGTGTTTTTGACAGGTTTAAAT
+TTTGGGATTTGTCCTGTTTACAGGGGAGACTGCCAAATTTTTGGTAGGAAGTCTCGGTTA
+TTAGTAAGTGGGCCCGGCATCTAAATAGTGGCGGCCGTTNNNNNNNNNNATTCCGGGGCG
+GGTCCTGTCAGCTTGGTATCAGAGCATTAGGTTCTTTTCCTGTGACTTCCATGCTTTCTT
+TGCATGTTATTACTGAAGATTTTGTGGTTCCTTTTGTTTAGAATCATGCATCGCCGAGGT
+GCTCGGTTAAGAGGTCGTGTTCCAAGATACGGACCGAATCCTCCACCTCCATCTCCGCCA
+ACCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_82
+GGTCGGGCTTGACGTACGGAAGCCATATCCGAAGCTAAAAAGATATTAGCGAGACTTAAC
+CAAAAAATAAGTAAGAAGAGGTTGGTGGAGGCGCTGGCCGGCGGCGAAATCGCTGTGGTG
+GCGCTAAGCGAACTGATGTCAACTCTAGGAATGATACCCATAGACGAGGCGCTGACTGCC
+GAAGCTTGCGGGTCAACAAGCCCAATCGAGTGGGGAAAAGAAGGAAGAGAAAGAATAATG
+AGCGAAAGAATAGAAACGTTACGTGAAGCTGCGTCTGAGCCTTCGGCGAGAACGACGACG
+CTATTTGTAGAAGAAAGGTGACAAGAAGAAAACATAGGAAGTACGCGGCTGGGTGCCAGC
+GAAAGAACGGAAGGATAAGCAAACAGAGGAGAAGAAGTGGATGGTGAAAAGAAAGAAAAG
+AGAAGACAGACAGCGGTCAGTTGAATTGGACCAGAGGATCGGAAAAGAAAGGGAGGTGTG
+TCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_83
+AACTGCTACATGCACTACCATGTAACAGCTCAGGCACTGTGGACACATTGAAGCAAACCG
+GCTCGGACGGGTGGCTAGGACCTACGTGTTTCACCGAAAATAGGCAAGGTCTGGAAAGGA
+TGGCTGGCATGATCAGAGTAACGAGAGAGCTACACTTAACCGATAGGAAGTTGGCAATGT
+TGAGAAGAAAAGTAGATGTTCTAAAAGATACTGCATGCCAGGAGTGGTTGCAGATGCATC
+TCAGCGGGTTGTTTCGTCTATCCCGACCNNNNNNNNNNGATGCAAGGATGGTATGGTGTG
+GTGCTATCACTACTATGTTGTGTAATGATACAGGGAAAAATCTACACATGTGGAGAAGGT
+CATATATAAGCTGTATTGAAGAGATAATAACTAATGCTGCAGTGTGCTTCGAGGCTGCCA
+ATAATGGTGTGTCAGCATCCATTTTAATAACTCGGGGAGCTAGTGCATCATGCCATACCA
+CAATTAAACGTCTATCCCGACC
+>ds2020-328_84
+TCGGCGGTCGGGATAGACGGGTAGTTCGGGTTTGATTGTGTCATAGCTCTATGATTCGGA
+TTAGGTTTATCGTTGGATGAACTGCATTGCTGATATTGACCCTAAAAAAGAAACGGTAGG
+TACAGCTAGTCCGTGAACAGCCAACCATCGCACTGTAAAAATTGGATAGGTTCTATCTAT
+AGTCATTGGGGCCTCCTAAAAAGATCTACTAAATTCATCGAGTTGTTCCAAAGAATCAAA
+ACGGCCAGTTATTAATGGAATTCCTTGTCGGCTTTCTGTAAAATACTCGTTTGGACGAGG
+GCTTCCAAATACATCGTAAGCTAAACCCGTGCTGACGAATAACCAACCCGCAATAAATAA
+GGAAGGTATAGTAATGCTATGAATGACCCAGTATCGAATACTGGTAATAATATCAGCAAA
+AGAACGTTCTCCTGTGCTTCCAGACATGTTGAGCTCCGCATATTCTTGTACAGTCAGGGG
+AGGGGGTCGTCTATCCCGACC
+>ds2020-328_85
+GGTCGGGATAGACGAATTCACCTCCTGATTTCTGGTTACTATCCACCTCCTTTCTCCCAC
+GGCTAACACTAAGCAGTCTACTATCAGCCTGATCTCCAGCCCTCCAGCCTTAAACAAAAT
+AGCTCCGCATTCTTTGATCTCCTCAGTCCTGAATTCTTCCAGCCCTCTTACTATTTCCAC
+CACCGCTTTTCCTTTCGCGCTCACTAATACGTCTGTCGATTCATCGACGATCACTATTTT
+TTCCGGCTCAGTTTCCGGATAAAACAGCATGTTAGCCCATTTAAACATGGACCATGGTTC
+GTATGTTATGCTGCTTTCAGCTATCTCGATTTCCACTTGTCCTTGAGCCTTTATTAGTTC
+GTCTATCACTTCTATCTCGAGGAACACCGACTTCTTCAATATAGCATTCCCTATCCATTT
+GTTCATTCGCATCAGCGGAACTCTCTCATTCCTCGCCATTCTGGGGAACATTTCTAGTAT
+GTTGTGGACCATCA
+>ds2020-328_86
+AACGGCCGCCACTACTATTCTTCATTTAGTACTTAAACCGGGAAAGTCCTTCCTTTCCTT
+CTCTTTACGAAGCCTAATCCGCTGAATAAGGGGAATTTGCTTTCTCCTGCTAGTTTACCA
+AAGCGGATCATATGGCTTTATTTTTCCCCAGCTGCTACTCTGAAAGTGCCCTTTCAACCT
+TCAATTGCTTCCTGTGCTAGCGGTTGATGTGCTTTCCTTCCAGACGGCTACGAACTTGCT
+TAGCCCTCTTCTTATTCCCAGAATCCTTAGCCTCTTCCTAAATAAGGCCCCTCCCTAGTC
+CTTATTCTCTATTCCTTATAAAATGAAAGATTCATTCTTTAGCCAGATCAACATCCTTCT
+TCCTATTACCTATCTCCAGATCAAGATCCTAACATGATTTAAGCCATAACTCTACTATGG
+AAGTACTTAGTAATCCTACTTCCTATTCACTATCTACTTCCTTCGTCAGCCTTCCTGCTC
+GTCTATCCCGACC
+>ds2020-328_87
+GGTCGGGATAGACGTTCCTTGTTGCTTTTCTTACCATTATCTACAGTCCCTACAGCACCA
+CTTTCATTTTTATCACTATTTCCAGTCATATTCATTCTGTTACTGTTAATCCCCATTGTT
+ATTTTCCACTGCTCTGCCGTTGTCTCACTGTCCCATCGAAATCTTTGTGCTGCTCTTTCG
+AAACTCTTCTTCCATAACGCCTGTACTTTGCTCGTCTTCACTCCTCTCCTTTCTAAGACT
+GCCAGATTGGAGTATATTTCATGTAGTTTACTGTCAAATCCAACCACTCTGTCTGTTTCC
+CAGTTACCACAGACAAAAGTAGCACATGATCTAGCCAAGCACCCTCTGAGTTTGCCGTCT
+TTACACCCTAGAACACGTAGGTATTCATGGTAAGACTGATCCGTAAGCAACTTGACTTCT
+TGCCCCTTAAGATTACATTTAGTGGCAACTTCATTCCAAGCTAAAGCGCAATGCCGTCTA
+TCCCGACC
+>ds2020-328_88
+GGTCGGGATAGACGGGGTGCTCCTCTGTTTCTCTCACCATGAATTTCATCGACTCTTTTA
+TCATTCTCTCTGTTATTTTATCGAATTCTTTCTCGCTTGCCACTTTCCCAGTTGAAACCA
+TCATGCTTATTGAGCTCGGCGCACAGTCTTCGTTGTCTAGAGCTATTAGATTGACTGCCT
+CCACCATTGCCAACGGCCATAGATACGCCGCGATTCTAATCAGCGCATGTGCTATTGATA
+TAANNNNNNNNNNGGTCGGGATAGACGAGCCGCTAATATCCAATCTATTAGTACCAGCGA
+GCTTACACCGACGCTCGCCAATATGGACATAGTTGTGGCGCAATAAGCTGCATAAGACGC
+AACCCCTATTGCGCTGGCTCTCAGTGCTATATTGTATGCCTCTCTATTCTCCATGTACAC
+ATTTATGTTATCTGCTGTGTGTTTTCTCTCTGACAACACTCCTATTCCACGTCTATCCCG
+ACC
+>ds2020-328_89
+GGTCGGGATAGACGCATGGGTTGCATAGCGCAGCCTGGAGGGAGGTGCTGCTTCAGCACC
+TTAGACATGGGCCAGATGTCTGTAAGCTACAGTGGCTACACAGGCACTGACATCAAGACG
+GTATCTGTGTATGATTCTGACCCGCAGTATGGGTGTGGTACTGAAACATCATCAAAGTAT
+GGCACTGCAACGTCAGGTTGCGTGCCCGGCGATGGGTACGCTCACTACGGAGGTTCTGCA
+TGGATAGATTGCAAGACCATAATGGCGTGTCAAGAGTATTACGACGACATAGCAAAGCGT
+GACGCAGGAGATGTATCATCAAATCGAGGTACCAACGTCACTGTTGTCAACGAGAGTCCA
+GCAGGATTCATGTTTGTGTACGACCTGTTGATGTTCATCAACGGGCAGCCCAGACCTCAA
+GGTCACGAGAAAGCCTACTTGTTCTCAGTACCAGAGACCACGGACCCGTCTATCCCGACC
+>ds2020-328_90
+GGTCGGGATAGACGGGTCCGATGCCTGCTGCTTCATCTGGGAGAAAAGAATCATAGATAT
+GCCGGTCATTAGAAGGAAGAACCGCCATAAAAAGATTCCTCGTGTATCATCTGTAGCAAA
+ACTATGAACGGAAGCTAGCAATCCGGACCGTATTGAAAAGGTTCCTGAGACACAGCATGG
+AAGAGTCACAATATTAAGAAACGAGGTCCAAGAATGAAGAAGGGGTAGAATTACTGAATG
+AATACGAGCTGTGGCTAATACCCGAGGCATAAAAGAAGCATTTTCTACGGGATCCCGAAA
+CCACCAGCCACCCCGACCTAATTCATGATGAGCCCACCAACTTCCTGGCAAGATGCCTAC
+GGTTAAAAACCACCGACATGTCAAGATCCAAATTCGAATTGGTTCCTGGTTTTGGTCAGA
+GACCACTGTGTTCGCGCCGGCAGTCCAACAATGAGGCAGCTTCGTCTATCCCGACC
+>ds2020-328_91
+TCCGATCTAATTACGGCGGTCGGGATAGACGGCTCGGAGCCCTCAGAATGTCAAATACCA
+AACCTGGTTCATAGATAAACCAGGCCTCAGTCCAGTTTTCGTGGGTCAGCTTGCAGGCAT
+CAGTTCAGCTATTTACACAAGTCAGATGAGTCGACACCCTTGATAGAAGTTGTTCCAATG
+GGTGTCTACTATAACATATCCAAATTTCAGCCCAATTGGATAAGTCTGGAGCCCTCAGCA
+TGTCAAATACCGAACCTGGTTCACAGACAAACCATGTGAGCTCACAGCAAAGCATGAGCT
+GCCACACATGGAGGCAAAGCATGAGCAGCTGTTGAGCCATGTGCTTAAAGCAGCCACACA
+TGGAGGCAAAGCATGTATCAGCTGCAAAGAGAGGTGTTGTGACCTAAGATGAGCTGCCAT
+GCATAGGAGACAAAGCATGAGCTGCCAAGGGGGAAAAATCGTCTATCCCGACC
+>ds2020-328_92
+CGTCATTGAGGAACAAATACTACTCGAGACAATGCGAGCGATTGCACATGACAGTTTCGG
+ACTGTTATAAAATAAAGACCTCCCACAGGTGTGTGGGGGGCATAAGTGAAGACAAGAGAT
+CGGACGTAAAGTGGATGATACGGTCGTCGGGCTTCAGGAAGGGTGCCACGCAGATAGGCG
+TGTTACCGGGAGTGGTGGACTACTCCAGGATGGTGAAAGCATCACTACAACTTGAAAGAC
+CTTTGCAGGATTTCATTTCACGAATAATGCGCGCAACATACGACGCGGTGATACCAAAAG
+AAAGGAACATAAACGTTTCAAGGAATGGTAACATCAAGCGGTACGAGATTTTGCGAGCGT
+TATTCAAGGTACACAAAGAAGAAACAGACATAGTCAATTACGGAAAAGCCAAAATGACCG
+GCTTCCTGATGGACGTGTTGAATGGGACCAATTATTCATAGTGGCGGCCGTT
+>ds2020-328_93
+GGTCGGGATAGACGAATTTTCTGGTGAGTTTATAACGCTTCCTTTCGTTATCGATCGGTT
+AAGAATGACATTCGATTTGGAGGATGATTATTCATTCTCTATGGGTGATTGTTCATACGA
+TCTGGAACTCACTGATGCTCAACTTGATTATGTTGAAGTTCTTCAACAACAGAAAGATTT
+CTTTTCAGAAAGTCTTGGTAAGGTTGTTGTCGATTATGATTTTTCCCTTGATAGTGAAGA
+TCCTTCCATCAAGGATGCTGTGAAAATACCCGATGAAATTCCGGAAGATTTCCCTCAGGA
+AAGTATACCAGCTGAAGTTGTAGCTGATGTTCCACAATCTGTTAGTGATGTCGTCGAAGA
+GCAAGTCGTGGCTGGAGAGTTGATACCTAGCTGCGAAACTGTCAATGAGAATGTTTGTGT
+GGAAGTTAAATACCCCACAAGCCTTATCCCTAGATTCCGTCTATCCCGACC
+>ds2020-328_94
+AGAAGTGGGGAAAAAGTAAAAAAAAATCTCTTCAAACCTGAGCTTTTCGGTTCGCCCCCC
+CTATGTGGTCGGTCTTCTTACCAGTCTGCCTCCTTTCTCTTGATGGAATATAAAAAAGCC
+CGAGCTCCTGCTTTGCTTGCGCTCTTCACTGGCGCTCGCCAGATGTATCACTCATCCCGC
+TCCAAAGGCAAGGAGTCTTCTGTATGTTAGAATCTTTACGGGAATGAATCGCATATGTTG
+GTTGAGAATTGCTCGGGAATTCATTTATAGTTATTTTGCCAGGTTCTAGGGTTGGGCTAC
+TCTTCTTTTTTGTCGATCGAGCCGCTTTCCCTCATTCCACTCGTCCAGCCTTCTTCACGA
+ACTTGTACAATCGATGCCACAAAGATAGACAACTCTATTATCGACGAAATAAGGAAACGG
+GGGACGGTTTGGCACCAGATATCCAGGGTAACCGTCTATCCCGACC
+>ds2020-328_95
+GGTCGGGATAGACGGGACTTGTTCCCACTTCAACACAGCGCTCTATAGGTAGGCAATTTT
+TTTGAGAATTTTGGTCCTAAAAGTAGCCGAGCTCTCACAAATAGAATTGGAGTACCACGG
+AGAAAAGCTAGCTGGATAAACAAGACAGGGATCGCCCGCTCGGCAATGCTGCCTTGGGGA
+GGAAACAACAAAACACTTTAATATAACAATTAAAAACTCATATTCAAAAGCTTTTCGATA
+TATGAACAAGATTACTATAAAAGAGTTGGTGAACATTGTTCTGACTCATAGCTCTAAGAT
+GACTAGCATGAATAAGCCAGCTTCAACACCACCTATACTCTTAATCATAGACAGACTTGC
+ACCGACCTCAACATAAAAGGATGAGAACGGCCTGTCTATTTATATGCCTTGGCTTAACTC
+ATTCCTATACACTGCAAAGAACACAAAATTAAAACAGCCTGG
+>ds2020-328_96
+GGTCGGGATAGACGTTTAAGGGGCCTGCACAAGCGGTGGAGCATGTGGTTTAATTCGATA
+CAACGCGCAAAACCTTACCAGCCCTTGACATATGAACAACAAAACCTGTCCTTAACGGGA
+TGGTACTTACTTTCATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTT
+GGTCAAGTCCTATAACGAGCGAAACCCTCGTTTTGTGTTGCTGAGACATGCGCCTAAGGA
+GAAAGTCTTTGCAACCGAAGTGAGCCGAGGAGCCGAGTGACGTGCCAGCGCTACTAATTG
+AGTGCCAGCACGTAGCAGTGCTGTCAGTAAGAAGGGAGCCGGCGCTTTTCTCGCTTGTTT
+AGTAAAGTCAAGTTTTTGGCCTTATCTTGCAGGTGACGACGACGTCGAGTTGGCGGCGGG
+GAAAGACTCGGCATACAGGCGAGTATCGTCTATCCCGACCG
+>ds2020-328_97
+AACGGCCGCCACTAAATTGTCCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCC
+GCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTT
+CGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTA
+TGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTC
+AGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTA
+TACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTC
+CATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGGGCCTGAAGGTGTCTCTGTACGCA
+TCTATCACTGTTTTCATTGACTGTACACTATGTTGACTGTT
+>ds2020-328_98
+AACGGCCGCCACTCTTGGGTGTCTATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGT
+CGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCG
+TGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGA
+GTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACA
+CTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACT
+GACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAG
+GGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCT
+GTCCCGTAGATAGCGCGGAGTTTACGTCTATCCCGACC
+>ds2020-328_99
+GGGCGGGATAGACGCTTGGTGATACTTACTTCACTTCGTGAGGAGGTGAAGGACGTAAAG
+GGAGACTGGGCCTTATGCAAGGAAGCTGTCTTGAACAAGACCCGGACTCCGAAGGAACCC
+AAAGTGCTGGATTCTTTCAAACCCAAATCCTATAATGGGAAGAGGGAGGCGAAGGAGCTA
+GACACGTTTTTGTGGAATATCGAAAGATATTTCAAGTATCTGAAGCTCGAGGAGGACGAG
+CCGAAGATCAACACGGCAACATTGTTTCTCACCGACAATGCTCTCATGTGGTGGCGACGT
+CGATCCATGGAAATCGACCAAGGTACGTTTGTACTAGACACTTGGGATGCATTTAAAAAG
+GATATTATGCTGCATTTCTATCCAGAGAATGCCAAGTATGAGGCAAAAGAGAAGCTGAGA
+TGGCTAAAGCAGACGGGGATGTTCCGTCTATCCCGACC
+>ds2020-328_100
+GGTCGGGGTAGACGGCGAAGAGAGCTACGCCACAATGAATGGTAACAGATGAATTGAAAC
+TAAAGCGACGGGTGTCAATTACCAAAAACGACTCGACCACTAACTCAGTCCCGCGGGTAA
+CACAAGGCCGAAGATGGATGCGAAGAATATTTGAAACCGCTCTCGAACCATCACACGGAT
+TCCGATCCAACTGCCCATGATATGGTAAGAACGAAATGGAAAGGCAAAAAAACGATTCTA
+TGCGCAGACGTGAAAGCTCTATCGATAGAAGCATTCTAGCCTATTTTGATTTAGAGAGGA
+GCGATTCCCTCGTCTGAGAACCGCCATTCCCGCACTATTCCTCCCCACTAAAAAGATTGA
+TAATCTCGATAACCAAAACAAAAATGCAGAAGTGAGCGTACCCCACTCCTCTCTCCCCCC
+TTTTTAGCCAACCCCAAATAACGTCTATCCCGACC
+>ds2020-328_101
+GGTCGGGATAGACGGTCGGCTGGCTTGAGAAGGAGGTCGGGATTTTCCATTATCAGAATA
+ACAGAGCTTTTTTTGTTTGTGACAATCTGGAGGAAGCTAAATGGTGTGCTAGGGTGGGAA
+AGGTAACGATGGAAGGTTCTTGTGACTTGCTCCTGTTCGCTTGGAAACAAAGTCTGGAAA
+ATAATATGAGGAAGGTGGTGAGTTATGGGGGATGGATTGCAATTACTGGGCTGCCGCTTC
+ATTGGTGGTCCCTAAAATTTTTCAGCCGAATTGGTGAGGCATGTGGAGGGTTAATCGAAG
+TTGATTTGAGGACTTCAAATTTGGAGTATTTGATCGACGCAAAATTAAGAGTCAGACCTA
+ATGAAATCGGTCTTTTACCTGGTGACTTGAGAATTGCTGATAATGGGGAGGTTCACGTCG
+TCCAAATAAGGCCTTGTCGACGTCTATCCCGACC
+>ds2020-328_102
+GGTCGGGATAGACGAGAAGGTGGTTTATCATTGGGTCAATAATGCTAATCCCTCTTTTTG
+TGCTACTCCTAGGGCGAGAAGAAGATAAGAAAACGCAAAGCGTTCTCTCCCAACCTGTTT
+ATTTCTAAAGGCTACCCTCTCTCGGCTGGATGTTGGTCCAGCCTACTACGAAGATCCCGT
+ATCCAACAACCCAACCTAAAAAAAGGGCATAAAAGCGCCTTGTCTAGGTTNNNNNNNNNN
+GTTTCACGCCCCAACGTAGCTAGGGTTTGTGTAGAAATCGGTCTTCCCTTATTATTATGA
+AAAGGTTGTTTACTTGCTTACTTATTTTGTTAGAGTAAGGTAGCTTGCTTACTTAGTGCT
+TGCACTAAGGGGAAGGGGCTTTATCGGCTAGTGCGCAGGAGCGCACTTCCGTTTTCCCTT
+TACTAGTAGGGGTTCCGCGCGTCTATCCCGACC
+>ds2020-328_103
+GGTCGGGATAGACGTGCGTTGGATATATTATTTATTCAATGTTTGAAATTGGTATTTTTA
+TGATGCATTGGCATTATTTGGGGATTTTGATATATTTGAGTATCTTGAGTATGCATACAT
+GGATTTTGGAGATTGCCTATATGTTATTGGTTATGTGTGGGGTACTTGGGTTGTTGAGTT
+GAGATTGTAGAAAGGTTTGAGTATAGAATGTCAGTTTGGAGTGCTTTAAGCGCTACCCTA
+TGTACCTCCCCGGATTTGGAACTTGAGATACTTGGAATTGTTAAGACTTGGGGCAACCTT
+AACGGGTTGTAGCCGAGGACCCTGCGGGGTGGTAGTCTGCGCGCGTAGGACTGTTCGCAG
+ACGTACAAGCTTTGATTTGGTATCGGCTGTACGTGCTGGCTGAGAGTTGGTCCCTCGTCG
+TCTATCCCGACCGCCGTAATTCTGATCGGAAG
+>ds2020-328_104
+GGTCGGGATAGACGTGGTAAGTTGCTAAAACAAACGGGAGGGGAGGATCGACCCGTTCAG
+TATAATTCCGAAGAAAGACTGTTGGCAGCAGGTGTTGACATTTATTTTGCTCCCTTCAAA
+AGGAAATGCGGGCGGGGTTAAGCTCGGCAGAGGGTTAATGGGGTAGGGTCCTGCCCTTAA
+GATTCAGATAAGAAAAGAGTTCCAAACCTTTATGCATGCACCTCCGTATAAGTGCTGCGT
+ACAAGTTCCGGCTAGGATAATTGGGAAAGATCAAACCAATTTGAAGCGCTCACATCACAC
+ACAGTAGTAGTAGCGTAAAGGCCGTAAGTCGGGGGCGGCCATAACATAAAGTTATTACTT
+TCACATCTCTCTCTAGATATCTTTAGATAAAAAGAGAGAGAGAGAGAGATCCGCTGCGTG
+AGCAACCCGAACTAGCGTCTATCCCGACC
+>ds2020-328_105
+TCTGAATTACGGCGGTCGGGATAGACGCGCACCCCAACTCTATCTTCCTTATCAGTGAAC
+CGGAAATAGTGCGTAGGTACTCTTCAATGCAAGCGGGGACGAGACGACGTGACATACTAC
+GATGACGTACAGAAGTGCTGCCCTTCGGCTCGGCAATATGGAACCTCTCAACAGCTCCCG
+TTCCTTTATGAGGTCCTATCGGGATAGGTAGGCCCAATCCTTTCCCCTCCCCCTCCCTCT
+CCCTTTGGTCGAGCTAGTTTACTCCCTCTATAAGACCCTATTTATCTTTCCCCCTCGAGA
+AAGAGAAAGAAGAGAATCACTCCTTTCTTTCTTCTCTTCTTTCATGTTGTGAACGGCCCC
+TTCTTGTATCGAAAGGTTTTTCGTGCTATACACCACGTTGAGAAAGACACTTGATCGTCT
+ATCCCGACCGCCGTAATTCAGATCGGA
+>ds2020-328_106
+GGTCGGGATAGACGCGGTGGAGTACTTTGGGATTATATTCCGCGCCGAGGATTTGTGCTT
+GTGGGCTAGGGTGAATATTGCAGACCAGCGGATCTGGTGGTCGACAATCGTTCGGACTTG
+GTAAAGGTTATCGCGGCACCTGTAGTAGGACAGAGGATTTATTGCGATGCCCGCGAACCA
+ATTTACGATGTCTCCGTCGCTGACGTTCGTCAAGCAGGCCACGTGGATTGGCCAGGGTCT
+TCTTCGGCTAATGATACCTCGATCCCGAAGCCTTCGGAGTATCTTTTTGATAGGCGCCTC
+TATCTGTATGGGGAATTCGCTGCTGATAGATCCCGCCCAGTGTCCTCCTCCTTCCCCCGC
+CGCCTTCCGACCCGCGGGAGTATACAATGACAACTTCCGGACACTCATGCCCGATCGTGA
+GACTGCCGGTTCACGTCTATCCGACC
+>ds2020-328_107
+ATGAATCCTTTGTTACATCTGGCACGAGATGATAAAGAGAGAGCTTCGTCTATCAATGAA
+CATCTGATTGACGGAGCTCTTGGCATTGCTTTGTTTTTCTCTCCTTTCCTATCAGCGAGT
+TCCGATCCTTTTGTTCGAAATTTCTTCGTTCGTACCGAACCGCTTGCAGAATCAAATCCT
+GTTCCACAAGATCCTATATCAGCTATACATCCTCCTTGCANNNNNNNNNNGGTCGGGATC
+GACGTCCGCCAGTGCTATGGGCTTTGGCTTATGTAGATCAAAAATGATGAATGGGATTGC
+GGCACTCCACTCGACGCCAATGCGGAAGGATGCCGTCGAAAAGAATGGAACGCTGCTTCG
+CTCTGCTGGATGCGTCGGATCCCGTACAACAAGCGAGCTTTTTACCGTCAAATTCAAACA
+TGTGGGGGCAGCGTCTATCCCGACC
+>ds2020-328_108
+TGAATTACGGCGGTCGGGATAGACGTAGAGGGGCTTTCTCGAGCATGCATACCCTTGAAG
+CTAGCGGTTTGACATAGGTTATACTAGCATTGACGTTTGAATCCCCCTCTTTGATTACCG
+CCTTACCACACTGAGATTCAGTTTGAGAGTTCTCTAGCTCTATTTCTTCCAATAAGCATC
+TGTATTTATTTGGTATGAGTATATGCCAGTGTTGGTCTTCCAACNNNNNNNNNNAGCGTA
+TGAGTGTCCAACCTAATCCCACCATCACCAACAGTCCTACGTATGGCGTCTAAAGTCATC
+TTTTCTAACCTTTGAAGTCTCAGAGATAGTTGTACCGCTTTCCAAGCACAATCACCATTA
+CTAGTAACATGACCCTGGTTCCTGAGAACAAGGGATGGACTACTCTCCAACCCACACTGG
+CGTCTATCCCGACCGCCGAATTCA
+>ds2020-328_109
+TGAATTACGGCGGTCGGGATAGACGCACATACCCCCTCTTGATATTATCTCATCAAACCT
+GTTATTCATAGATCGTATCAACTCTCTGTAGTCGTTTGCTGGTGCCATCTCTACCCTGCC
+ATGTACCGCTGTTGACACAGCTCTTGCCAGGTACTGCGAACTCGTTTTGTAACTCGCCCT
+CGTGTCCACCCGTAAGAACTCACCTATGGTCCCAATATTTGTCTTTGCTAATTGTGCTCT
+TATCCCTGCGTCCTTTGCTCTTTTAGCCAGCTTCACTGCCTGTGCTACGTTTTGCGTTGT
+AGCGTACATGTCATCTCCGTTGTGCAGTGCATAGTTCACGCTACTATCTAAGCCAACGCT
+AACGAGATAAACTCTGTTGAGTATGGTGTTTATGAAAGATGTCAATCTCCACCCACTCAG
+CAATGTTCCGTCTATCCCGACC
+>ds2020-328_110
+GGTCGGGATAGACGCCTGTTCCCCATTGTTTGTTGTGGGTCGCGCCTCACCGCAAGCACT
+GAATGAAATGAGTGGAGATCTTCCTTCCCCCTTGTTAATTACCAAGAACTTCGTTGCCAC
+TAGTGGCGAAGAATAATCCTACCATCCTACCCCAAAACAACTCTGAGCCTAAAGAGAAGA
+GAGTTCAGTCTACAAGAAGCTGGCAGAGCTTTAGCCATTGGACTACATCCATCCATCCTA
+CCTAAACAGTAACCTTTTTTTGTTCGTTCTTCGCATGGCGCGAGTGTAGAGAAATTCCTT
+CCGGCTAATGAAGAGGCTACTCCAATCTTCCCATTCATTCCCAGTGGATCCTTCTTCTCC
+CTAAGAATTGAACGAACCAAGTTCACCTATACGAGAGTGAGGAATAAAAACCAACAATCA
+ACCCGCTACGTCTATCCCGACC
+>ds2020-328_111
+GGTCGGGATAGACGCTCGGAACTGGTATATGGATCTCTCCATGTAGTGGTCGGCCTTCTA
+GAAGCTTCGCCAGAAGCGACTAGTCGCTTCCCGAATGCCTCTTTACTTTAGTATGGTCTA
+GTCTTTCCAATGCCTCCTTCCTTGCCGCCAACGTACGCTACTAGGAGAGTAAGCAAGCTA
+CCTTGCTTGCATTCTAGAAACGGTAGCTTCCGCGCCCTTCCTGCCTGCTGAAATTGATGT
+GAATGATCGTGACAGCTCTTCAAATCCTATTCAGTCTGATTAGATATGTCACTGAAACAA
+TCCGTTCTGTCTCTGTTTTATTTTCGGATTCCGAGGATGAGCCGGCCGATCCTAACATCA
+TTTATGAGGAGCCGGACGACGAAGCCTCCTCCTCAGATAAAGATGTCTCCGTAACGTCTA
+TCCCGACCGCCGTAATTCA
+>ds2020-328_112
+GGTCGGATAGACGCCTACCCCCTCTGCTCGTCTATCCCGACCACTGAGCATGCACGTCTA
+TCCCGACCGCCGACTTCGGATGATCGGAAACACAGGACCGCGAGTTGCTTCGTCGCGCTC
+GGCTTCTAGCAAAAGCATAAAAATGCCGCATTTCGATGCACGCTCTGAAATGAGTACCTC
+TATTCGTATGAGCAGGCTGTGGATGAGGTTAAATCAGCCGGATTTTTTTTGAACGCGTCG
+ATAGGCCATTGCGTCGACGAGGTGGTATACGTTGGGGTTACTCTCTCGCAAGGAGAGTCC
+CATCGGGAAGAAAGCGCAGTAACGCCGTATTAACGCCATGGCATATCTTGGGAGTTTACA
+CCAAGTTATTGTTTTCCGCCTTCCGCTTATAATTTCCCTTTGCATAAGTCACTGGGTTTA
+GTTAGTGGCGTCCGTT
+>ds2020-328_113
+GGTCGGGATAGACGCCGATAGCGGGTTTCTTGATTGCCTCTACATCGGGTAAATTTGGTT
+AATTCTTTATTTTATGTGGTGTATCCGCAATAATATCATACCGTTTCTTTCGATGGAGAA
+GGGATCTACCTTCTTATATTTTTACATCTAGGATCGGACTTGTATCATTGGTACTAATAG
+GAATTGAACCCTTATGGCAAGAAAAAGTTTGATTCAGCGGGAGAAGAAGAGACAAAAATT
+GGAAAAAAAATATCATTTGATTCGTCGATCCTCAAAAAAAGAAATAAGCAAAGTTCCCTC
+GTTGAGCGAGAAATGGGAAATTCATGGAAAGTTACAATCCCCACCACGTAATAGTGCACC
+TACACGCCTTCATCGACGTTGTTTTTCGACCGGAAGACCGAGAAACTATCGAGATCTTTC
+GTCTATCCCGACC
+>ds2020-328_114
+GGGCGGGATAGACCCGCGGGCGGCCGTAAAATTGTGCTAACATCTGGTGTGGAGTAGTAC
+GTAGATTTCTGAGGGTATAGTTTATTTAATTGAGTGAAATTCCGCCAGTAGTCGTGATAG
+TTGAGAACTGTGATTATTCGCTCGATCAACTCTTTGCCATCACGCTCTTTTTCTTTAGCA
+TCTGCCGAGCACATCTAAGCGCAAAATAGAAAAAAGAACCCGGTTTTAAATTGGATATCC
+TTATTCCCTGTTCCGGGTACAAGTCAAGTTGAATTTTCAAATTTGAATTCAGTGTTATAA
+TTATTCAAATCCATAAATTCACTACGAAACAAGGCCAGAACCAAGCCCTAAATTTGAGAC
+TTTGAAAAACTGCAAGTAAACTTAAACTATTAATCATATTAATATTACACCCTGAAAACG
+TCTATCCCGACC
+>ds2020-328_115
+GGTCGGGATAGACGTAAGCACTGGTTCCTCCATAAGTGCCTTCTTCAACTCATTGAAGGC
+ATGCTGGCATCGGGGCGTCCACTCCCACGCCTTGTTCTTCTTTAGCAAATCCGTCAAGGG
+GGCCGCAATGGCTGAATATCCCTTGATGAACCTGCGGTAGTAGTTAACCAATCCAAGGAA
+TGACCGCAACTCAGGTACCTTGGTTGGTGGCTCCCATTCTTGAATGGCTCGCACCTTGCC
+CTCCTCCATGAGCAACTGTCCACCCCGTATCTTGTGACCAAGGAACTCCACCTCATTTTG
+GGCAAACGAGCATTTCTCCTTCTTCACATATAGGTTGTTCTCCCTCAGAACTTTGAACAC
+CTGATGCAAGTGCTCGAGGTGCTCCTCTAGAGAATTGCTAAACACGCACCAACGTCTATC
+CCGACC
+>ds2020-328_116
+GGGTCGGGATAGACGTTCCACACCCTTTCCCCCATATGACCGCTATCAAAGAGAAGCTTT
+TTCCTATACTATAGTTGCAAGTCTATTGTTGTGTTTTGGAATTAGGGGAAGCAAAGCTTC
+AACAAGTAGAAGCTTCCTGGCAAAGCTTCAAACAAAGAGGTTGGGCTGTTCACTTCATTG
+ATTTTACTTAACTTTGCTTAAGATTAAAGATAGGGGCCGGGCGGGCAGTGAAGGCTCGTT
+TAGTAGACAGCACGGCTTTGACGAGCAGCAAGCACCTACTCCTAACAAAATGAAAAGCAG
+CAAGCGGAGCGGAGCTTGAAGAAGCGAGCCCCTTTCAGAGAAAGCCATTGCGCGCTAGCC
+CCCTGTATGGGGTTCCAAACCTGCGCACCCCTAAACTACAACCAGCGAAGATCGTCTATC
+CCGACC
+>ds2020-328_117
+CGGTCGGGATAGACGCCTTCCCCCACTTCCGCAAAAGGGTGACCCATAGAACGATGGATT
+AGCGGGCTAGGGTAGGGATGGTACTTCATTTAAACAGTGACATTGCTCATGGATTTGAAC
+AGCAATCCTAGATCACACCTATATGAAGCCTTGCTGCATCTCTAACTTCCTGCCTCGTCA
+TCCCAGGCCACCCACCCTAACCTAATGGAGAAGATTACTGGGCCACTCTCTGCAGGTTAA
+CTCTGGTTGGCCAGTCAAAAGACACACGCTACCATAACAGAACACTTAATTAACATCAAC
+TTGGGCAGCTTCACCCCGGAAAAGCATTGGAGTCTTTCTTTTTTGATGATCCCCGACCCG
+ACTCCGAAGTCTTCTGCGTGCATTATTCTGCCCTCAACAACTCTTTTCCTCGTCTATCCC
+GACC
+>ds2020-328_118
+GGGTCGGGATAGACGTGTGCGAAGATTGCATATTTGGAAAACAGAAGAGGGTCAGCTTTC
+AGACAAGTGGCAGAACCCCAAAGAAGGAAAGGCTAGAGCTTGTTCACTCTGATGTTTGGG
+GACCAACGACCATTTCATCCATTGGTGGGAAACACTACTTCGTGACTTTCATCGATGATC
+ACTCTCGGAAGGTATGGGTTTACTTTCTAAAGCATAAGTCTGAAGTGTTTGAGGTTTTCA
+AGAGATGGAAAGCTATGGTTGAAAATGAGACAGGTCTGAAGATTAAAAGGCTCAGAACCG
+ACAATGGTGGTGAATATGAAGACACCAGATTCAAGAAGTTCTGCTATGAGCAAGGAATCA
+GAATGGAGAGAACCGTACCAGGTACGCCTCAACATAATGGTGTAGCTGAGCGTCTATCCC
+GACC
+>ds2020-328_119
+GGTCGGGATAGACGGAAGCTGCCCCTGAGTGGACGAGAAAGAAAGGATTTCTCGGAGCAA
+CCCCCCAGGTTCCAGACCCAGGAGTCAACTTTCCCGTATGAGCATTCGGTACATGTATCA
+GTCCGTGGAAGAGTGAAAGGGTCACCACTACTGAGGATCTCCCCCCTAATCTTAGATAGG
+TCGTCTGAGGGTTCGCCGCGGTTCATTGCTGTGCTTACACACTAGGCTACCCTTCTCCGA
+AAGCTCCGCGGGACCACCTACCACTAGTCTTCGGCCGGAGGGGTTTATTGCACAAAAACG
+CCGGGACGCAGGCTCCCGAAGAGGGAAGCCCAACGAATGTCAGATGCAAAGCTCCGCACC
+TCATTAAGATCATATTGGCATACTCTCCCAAAAAAAAAGAGCAGGCCCCCGTCTATCCCG
+ACC
+>ds2020-328_120
+GGTCGGGATAGACGCGTTGGCTGCCTTCGAGACTATAAAATATAACCCAAGTGGTCTAAC
+CCCCCGGGGCGGACCCCAACCGAAAGGCGCTAGACGGACTAACGGCAAGCGAGATAAAGA
+AAGCAGCTGGCCCTATGGAACGGAACTGGTTGCTTATTTACTTTTAGTAAGACCACTTTG
+GTAAGCAAAATTAGATTATATAGGCATGGTTGCTTACAAGACAAAAGATCTGTTCTTTGC
+CTGAACATATAGAGGAAACAACCTTCTATCTGGCCTCTGTACCAGTAGTGGAGTGGCTTG
+CTACTTTCAATCAGAAAAGGAAAATTGAGCAAGGCAAGGGAGAAAGAAGTTGTCCCATCT
+TCTCTGGTAACCCGCCACCGCATATGTCGAAAAAGAGGGAGCCGTGTCGTCTATCCCGAC
+C
+>ds2020-328_121
+GGTTGGGATAGACGACCGGTTGGGCTGCAATCTCCGACAGAATTGCCATTCTCTAACTGC
+TGACCATTATCCCTGTTTGTCAGGCCGTACATAGCTAAGTCTGTCGACATGTATCTGTGC
+TTTCCATTGAAGTCTACAAATACGTGGTCTATAAACGGTATGATATGCGTATCGTTGTTG
+AATACCGCATGGTAGCCGTCTGAAGCGTGCCTGTCCAAACTGATGTGACCTGTTAAAAAC
+GGAACGTTCATGCCATGTAAGACATCCCAGTTTGCCTGTTCTATCCAGTTCGGCATTGGT
+GCCTCATTGAGCCTAGCGACTCCAGAGGTATTTTGCCAATTGTCAACCGATGGCTTAATA
+ATCCCACCGCCGTCAATATCAGGGTCTTCTCTGGCGAAATCGGTCCCAAGCGCGACCGGT
+>ds2020-328_122
+GGTCGGGATAGACGCCCGCGACTTCTCTCTTTATGAACGGTGGGGCAATTCCTGGAACCT
+TTTTAAGGGTTTTTTATCAGGAGATATGGAAGTCGAAGGGTTTCTTGTTTCTGATCCACA
+ATTCTTCGTTCCACTTACTGGAGTTCTTCATATGAAGAAATTGATAAGTGATGCTGGGAA
+GGTCCTTAGTGTTAAGGATTTACTCGAAGAACAGCGCGCTCTTGTTGCTTTAAAAATGCG
+CGAACAGATTGCTGAAAGGGAGAAAGCTGAAAAGAGTCGCCGAGAATATGAGAAGGCGAT
+TATTCAACTTGCTGCTTGGACTAAAGCACATCCAGATGCTAAGGTTCCAAAAGGGCTTTC
+CGTGGAAGAACCACTGATGCCGGACGTTGTCAAGAAAGTGACGACGTCTATCCCGACC
+>ds2020-328_123
+GGTCGGGATAGACGTCCACTCGCCCTAGCACACTCTCAACTTGTAGATGCGAAAATCCCC
+CCTTCCCACAACAGAACAGAAAAACCAACAGAACACGAACACCAGCACGTATGAAAGCAG
+ACCTAAGGAGCGGGCAACTATCCAATCTTCACTCAAATGGACTTATTTCCCTTCGTTAAC
+TACTTCAAACGGTGTAGCTACCTCGGCTCCATGTTGGGACAAAGAGCAATAACCGTGCTT
+ATCCTTCTAATAAAGAAACAAAAACTTGCCTAAGAAACCGATTCACTCATTACTCCTACT
+ACTAGTATAGAAGAAGATCTATTAACGCGCATGGCTACCTATATAACAGGGGGCCTCTGA
+CCTCTGTCTCACAACCGAAAATAGAACCTGTAGCTCGCACCAGCGTCTATCCCGACC
+>ds2020-328_124
+GGTCGGGATAGACGAGAAGTAAGGATTCGAGAGTCCAGGCTGAAAATACATGCATAGATA
+GTGGTCTAATGACAAAGGCCGACGACGGAAGCTCGGGACGGAGCCGTATGATGCGGAAGT
+CTCACGTACGGTTCCCTGAGAAGGGAGTGGCTACCTACTGGAGCTTCGACCAACCACCAC
+CGGTCAATTCCGCTTTGGGGCCACCCCTTACTCTACCATTATTATAGGGGTATGGGGTTC
+GAGACAAAGAAAGATCAAGGCAGCATATCAGTTTTTCCTTTATACTTTACTTGGATCTGT
+TTTTATGCTATTAGCTATTCTGTTGATTCTTCTCCAAACAGGAACCACCGATTTACAAAT
+ATCATTAACCACAGAATTTAGCGAGCGGGCGCGTCTATCCCGACCA
+>ds2020-328_125
+TGATCGCCCCCTCGGATTCGTTCTAGAACTTTCTATGCCCCCTTGTATAGGTTGGGCGAA
+TCCACCGACTCACGTCGAATACGAACGCCTCTCTCGACAAACTAGCCCACGTCTTTCTAT
+CGGACTAGACCGATAGAAGTAGCTTGGGTCGGGATAGACGCCCCACTACGCTGCCACCAT
+GTGAGAGTCGGTGCGTAATGGATCTACGCCTGCCTTCGAAAGCTCCACTCCTGTTTACCA
+GGATCCTGGAACCATTCCTTGATTGATTGAAAATCACGAGTCGAATTTTTCTCTACCTAT
+TCGACTATCAAGCTCTTGACACCCTGTTTAGCCTAGCGCCCTCCTCCTCTTTTGTTCGCT
+TCGCTCTCCTCCCTCAACCAGGCAAGTAACCCGTCTATCCCGACC
+>ds2020-328_126
+GGTCGGGATAGACGTATTGGCATGTTGCTTTTTATAGACGCCCAGCCTATGATCGTAAAA
+GTGCGGTCACCATCAATCATGAGTTTGAGACAGTTGGATGTCTTGGTGGTGCCGTATGAG
+CTCCCTGTGGTGAACTCAGGTTGCTTCTGAGCAAGCTTTCCCCCAGGTTATGTCATACCC
+ATATAAACAAGGTAAGAAGGGAAAGGAAGACTTTGACTACTAGGGTAGCTGGGCCAACCG
+CTAATAGATCAAATTAAGAGGGAGTGAACGACATATAATATAATCCGAATGGGAAGTTTT
+GAGCAATCGATTCTTTCTCATGTACGGCTAAACCTTGCAGTTGCAGGTAATTTGAGTCTG
+GACCCCCGAGTGATGGTAAATCGCCGTCTATCCCGACC
+>ds2020-328_127
+GGTCGGGATAGACGGGGGGTTTGTCTACGCCGGAACGAGTCTGTCTTCGGACGGGCTCGT
+TTTTGTAAAGGAAAAGGAGTGTTGAAACCGGACGCGGCATGTCTTCTAGACGATCGCGTT
+GAAGATGTGGAGAATAAGAGCTACAATTGCGTTCCTCCCCCTGCATGTTTGATGTAGGGG
+AGCTGAGTAACTATGTGACCAGCTTCGCGTATGTAAGGTTCATCCAAGTACAAAGCAATG
+GGAGACTTCGGTCGACCGCCTTCGGGTTACCATTGTGGATTATCAGTTCGGCTGGGTCCG
+TGCGTCATAGGGACGAAAGTATTGCGGTGTGTTGTCTTCGGACATTAATGGCGGATACAC
+TTCAACGGTGCTATCAAGGACAAGTAGTGGCGGCCGTT
+>ds2020-328_128
+TACAAACGGCGTAGTCGATGGACAACGGGTAAATAGTCCCGTACTGAAATTGATTGGTGC
+AGAGGGACGGAGAAGGCGGACATCAGCCGGATGTTGGTTACCGGTTCAACTGTGTGAGGT
+GATGAGAGGCGGAGAAAACGCTTTGAGCCGAGCCAGGNNNNNNNNNNCGAGTCCCTACGG
+GGGCGAAGTGGTGAAGTCATGCTTCCAAGAAAAGCTCTAAACACCATAAATCAATTTTAC
+CTGTACCCAAAACCGACACAGGTAGGGAGGTTGAGAATACCAAGGGGCGCGAGATAACTC
+TCTCTAAGGAACTCGGCAAAATGGCCCCGTAACTTCGGAAGAAGGGGTGCCCACAGCAAT
+GTGGGTCGCAGTGAAGAGATCCAAAA
+>ds2020-328_129
+GGTCGGGATAGACGCCCTTCTTGCCTGACTCCTGTTTTGTTTGCTTGTTTTTAGTGTTCA
+TCTGAACACCGCTTGTCGACAGGCCTATAACTTACTAGAATGCACCACTGCACACTCGCG
+TAATTAGCTTGCCCTCCTTTACACCCAAGTCAGTGCGTAGGATCACTCTTACACTGAAAC
+GCATTTCGCTCAACCTGAGGTCATAATTCAGGTGTCATGACTAGTGCGATAGTTACACGG
+AGTACGAAATGTTACAGTACATTTCGTAGGGCCAGATTTTTGTCACGCCAGGCTGGCCAA
+ACCCCGACGTCTTAGCTTCTACTATAGGTTTTTATCGCCGCCACTGCTGATAGCACATCG
+CCGCACAAACCGCGTCTATCCCGACT
+>ds2020-328_130
+GGTCGGGATAGACGAGCGCTACCGGTATAGCACCGAGAGGATCATTTGTAGGCATATACG
+GGTCATGCGGAGTCACGGTCATAAATAATGACGAAGAAAGAGAGGCAACTGTACCATACA
+ACAGTTTTGCAGCCGACAGTCTAATAACATCAAATTTCGTAGGAAGTTATTCGCTTGGAG
+GTGGGGGTGAAGAGCAGGCTCCTGAGCTCAGGTGTACACAGTATTTGATGGGTGAACCGG
+ACAGAATAGCGCCAAACTCAGCAGCTATAGAAGGCTGTATAGCACATGCCAATCACAATG
+TGGGAGGGTGCTTATAATGCATCTAACCCGCTCATTGATTAATTAATTGATGAAGCCAGT
+GCTCCGTTTCGTCTATCCCGACC
+>ds2020-328_131
+GGTCGGGATAGACGCGACGGTTCAATCACCCTAGAGCTAGAGGGGAGGCGATCTCAATAC
+CCGCTTTTTCCATGCCACAGTTATTAGGCATTAGGCGTCGGGCTCGAAATAGAATCGTGT
+TGGATTTCACACTCTATTTATCTGGGAGAAGAGGCGGTCTAATCTTAATTAGCCTTCGCA
+TTCGCTTCTGAACTCAACTATAAGTAATCAGTACAGTTAGGCTTTCCTACCGCCGGATCC
+TACCACCGCTTTCTTCTAAGATTTCATCTTGCCTATAACAACCAGGGTGTACTTGATTGG
+CTCTTTCTCGGCTTGACTAAACCAATCTATCAACCTTAATGCCCTGCCTTTCCGTAGTCC
+ACCGTACCGTCTATCCCGACC
+>ds2020-328_132
+GGTCGGGATAGACGACGCACCACCATCAAAGAAACCTTACCACTACTCATCTCCTCCTCC
+TCCTCCTCCACACAAGAAGCCGTACCACCCAGTGCATTCACCACCACCACCAAATAAACC
+TTACCACTACAAGTCTCCCCCACCACCCACACCCTCACCACCTAAGCATCCTTACCACTA
+CAAATCTCCACCACCACCCTCACCATCACCCCCTAAGCACCCTTACCACTACAAGTCTCC
+CCCACCACCATCACCTTCACCACCCAAGCACCCCTACCACTACAAGTCTCCTCCACCACC
+CTCACCATCACCACCCAAGCATCCTTACCACTACAAGTCTCCTCCACCACCCTCACCATC
+ACCACCCAAGCATCCTTACC
+>ds2020-328_133
+GGTCGGGATAGACGAAGCTCTCTCTTTATCATCTCGTGCCAGATGTAACAAAGGATTCAT
+CCTTTTTCCTTCTCGCGAACCACGGGAGCGCCTAGTGCCCAGAGGAGCAAAGCAAATTTT
+CCTTTCGGGGTAAAGCGGCGCATAAAAAAGGGCTGGCCCGTCAAAAGCCCGGTTCCTTCG
+CGAACGAAGTTCAGAATCAACAAGGGTTCGTAGAACGAAGGGGGTGTACAACTGGCGGTG
+TACAACACCACCACTTTTTTGTTCGTAACGAGGGAGAGATAGAATGGAGTTCTTCACGAA
+GTTCGAGACAAAGGAATAAAAAAGAGTTTCTCTATGGCCTCCTCGTTTTGAGACAGTCTG
+TTGGCGTCTATCCCGACC
+>ds2020-328_134
+GGTCGGGATAGACGTCCGTCAGGGATAAGCGTTTAGGGGAAGCCGGCTATTCCGGTAAGC
+GAGTAGTCCGTTATGGACCCCCCCTTACCCCACTTTTTTGTTCTTGACCCTTTCCGGCTG
+TGTGCCCTTAATCTATCTTAGCTGGGCCTTCCCGACTTTCCTTACCAAATCCCCTTTTCA
+AATCTTTTCCCCAAGTGATGGCTAGCCCGAGAATATCCCCATTTGCTTTATTTTATTGCC
+CCGGATCCTTATTCTTCCCGAAGGAACCCTATCAAACCTACTGGTAAAGGGAAATGGCCC
+TAAGCGTCTATAAGGAAATTGTCTTTACATACCTAATACCTAATATGACTTAGGGATCGA
+TCGTCTATCCCGACC
+>ds2020-328_135
+CGGTCGGGATAGACGGGACCGCCCCCTACTACCCAATTCCTGTCTTCGGAACTACGAAGA
+TAGGTTACTTTCTGCGATGGCCCTCCACCTCGTTGGGAAAAGTAAAAAGAAATAACAAGC
+CCTAAACTAAATATCAACTAGCAGCTTATCAACCACCGAACACAGACTCATGTTGGCGAT
+GCCATGGTCAAGTAAGAGGACGACCCATTCACCTCAAAAGAAAAATCTCGCCTCTCAAGT
+AAGCCAAACGATTGACGTCAAAGAGAAGGACCACCCACCCAGCAAAGAGCGAGGTCTTTC
+AGCAATGAACTTCACAAAAAGAGTGGAAGGCGAGAAAGACACTTAGACAACATTAGAGGA
+TCTTTTGTTTTTA
+>ds2020-328_136
+GGTCGGGATAGACGTCAGACGGTTCTTCAGCGTCTATCCAGACCGCCGTTATTCTAGCAA
+CGGCCGGCACGTTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTC
+CAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGC
+CATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGGTCTACGCGTAGAAACTC
+TGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATT
+TTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTA
+GTGGCGGCCGTT
+>ds2020-328_137
+GGTCGGGATAGACGAAAAATGAACCTCTCGGTGCTATACCGGTAGCTTTTTCAATCCTCC
+TTTTAGCATTATAAGTAGCATCTTCCACCAACACGGAACAGTCTGCATAATCCATTGTAT
+TTCCACAGTTTAGACCGCATCCTGCATAAACATGTATGTATCCTGGTGTAATATTACTAC
+CGCTAGAATCGCTAGTATTATTTGGTACGTTTATTGCATTCGTGTCCATGCCTTTCTTAG
+TAATTGGCCTATTATGTATCCTCATGTTCCCTGACCTGCCGTGATCAATACAACTCTTAA
+ACTTTCCCATGGCATCTCCTCTAATGTCAGATAACACCTCAATACTGGATGGATACGTCT
+ATCCCGACC
+>ds2020-328_138
+AACGGCCGCCACTACTAATTCTGCCTACTCGCCGGGGCGTAAATTTTGCCCCGGCGGGGG
+GGTATAAGTAACACGCTTGAGCGCCATCCATTTTCAGGGCTAGTTCATTCGGCAGGTGAG
+TTGTTACACATTCCTTAGCGGATTCCGACTTCCATGGCCACCGTCCTGCTGTCTAGATGA
+ACCAACACCTTTTGTGGTGTCTGATGAGCGTGTATTCCGGCACTTTAACCCCCCGTTCGG
+TTCATCCCGCATCGCCAGTTCTGCTTACCAAAAATGGCCCACTATAAACGTTTCATTCAC
+CTGTCCACGTTCAATTAAGTAACAAGGACTTCTTACATATTTAAAGTTTGAAAATAGTGG
+CGGCCGTT
+>ds2020-328_139
+GCCGTGGACCTAGTTTGTAAGGGGGTCTAGACTAGGTCCAGCAGAAATGTCACTAGGTCC
+ACGGCTCTCTGTCCGTGAATACGGCGGTCGGGATAGACGTGCCATGGCCATATCAGCAGT
+AATGTAATTCATGGATATGACTTTGTCTTTTAAATTGTACTTACTGTATCCTAAACCGAT
+GGCGTAAGTCACCAATTCCTCATATGTGCATTTTCCGGTGCTTGCTCGAATCAACAATAA
+TTTCAAAAATTCTTTTTCTATTGGTACCTCCTTCCACTCAATGACATTGCTTGCCACTTG
+GCTCAGCAGGGTTTTCCACACTGGCACAGGCATTAAAACTCTTTGCTGTGAGCCCTTTGC
+GATCGGTT
+>ds2020-328_140
+GGTCGGGATAGACGCCGCGCCTCCGTTTGACTGCCGCTCGGGGATGTAGTTGTAGATACT
+TTAGTCTTAGTGGGTCGTTGGCTCCACCTGTTATCTCCTTCTACGACATGCTGTTGTCGT
+CGCCATATTCCATATGTCACTTAGTCATCTCTGCCTCGCTGCGGGTCAGCACCTCCGAAA
+GAAACGGAGGACTTCATTCAGTGACTCCGCGATCGCCCTCTGAACGATCAGAATAAGGTA
+AAGCTTGAAGATAAGTTTTGTACTCTATTAATTTCTCAGTCCCTCTAGTCGGGTGGGCGC
+CGGCCGGTCTTTCGACCAGATATCCCCCTAAAAACCGTACGTGCGGGTCCGACCGTCTAT
+CCCGACC
+>ds2020-328_141
+CGCCGGGATAGACGGAGCCTCACGGTACTTGTTCACTATCGGTCGATTACGAGTATTTAG
+CCTTGGAGGATGGTCCCCCCATCTTCAGACAGGATTTCTCGTGTCCCGCCCTACTTATCG
+TCCACTCAGTTCCACACCAAACTTTTCTCATACGGGGCTATCACCCGCTATGGCCGGACT
+TTCCATTCCGTTCTGCTAGCAATACTGCTAAAGAGTACAAGGCTGATCCCATTTCGCTCG
+CCACTACTTTGGGAATCTCGGTTGATTTCTGTTCCTACAGCTACTTAGATGTTTCAGTTC
+GCTGCGTTCGCTTCCCTTGCCTATGTACTCAGCAAGGGATGACCCATCCATGCCGTCTAT
+CCCGACC
+>ds2020-328_142
+GATCTGAATTACGGCGGTCGGGATAGACGTTGATTTGAGGTGGTGGCGGGGGTTGGAATT
+TCGATAGATTTGGAGGGCATAATTGGGATGAGTCGTCGTCTTCTTCGCCGTCGGATCCTG
+CGTTTGATTTCGTGTACGAGGTGATGTGTTGGATTGCGCTTTCGAATTGCGTGCACTTCG
+CCTTCAAGAGGGTTATTCGTATCGTGGCGGATGGGTTGGGCGATGCGGAGAGAGCGAAGG
+TGCCGATGAGATTGACTTCGGTCTGCTGATGCGGTACCGTTTCGTTCTCAATGCTTAACG
+TATCAAAAAGGGGATACAAATCTGGTTTTAATTTATGTGTTGGTTGGGTTTGCGTCTATC
+CCGACC
+>ds2020-328_143
+GGTCGGGATAGACGGATCGAATTCGTTACGCTCCTTAGCTCGGTAGGGGGTACAAGAGTT
+AGCTCGTTTGGATCGGAGTGAACCGAAAAGGGAATGTATTCAATATGCGAGTAAGAAGAT
+TCATTTATAGGCTTGAAACCTAACTTGTCTGGAGAGCGAAATTAAACAATCAATTAAAAG
+CACATTAATTAGTTAATGCTTAACACTACAGCTAAGGGAAAAAGAAGTTCATCCATACAC
+TTAAAAAAGGAGGTTAATATTCTCATCTTTTATCCTCTTTGGCTAAAAACAGACTGCTAG
+CTTTCAAGATTCCAGTTTTCAAACTTGCCTAAGCTCTCCATAGCTTTACGTCTATCCCGA
+CC
+>ds2020-328_144
+GGTCGGGATAGACGAATTCGAGGTTTGTTCGGCGGCACGATTCGTTAAAATAATTTTTTT
+TTGCGTCGATCTATACGATCGACCCCGGACGTACCCATTCGCCGCGTGGGGAACCGGGTA
+ACCAAAGTCACGATCAGAATAAAAAAGGAAGTTCGCTGGGGAAGTCCGGGGTGCTGGTTC
+AAATCAAGTTCGTGACATGGTAATCTCGATGAGAATAAGAGCGGCCGGTATTGGACGAAG
+GGGAAGCTGCCCCAACCACTACAACATAGGGGGCTCGGAAGGCAAATTTGTTCACTGTCC
+TAGATTCAGAGGGGGCCGTGGAAGAGGGGCGCGGGCCGTCTATCCCGACCGCCGTAATTC
+AG
+>ds2020-328_145
+AACGGCCGCCACTAGTTCGTATTTCTCGGTTGTGAAGAATCACACGAGGGAGCAGTTTGG
+GGGTGGGTCTAAGGTATCGAATCCGAATGAGCGCTTTGGTTCTATTAGGACGAGGTGCTT
+ACTTCCCCAGCTGCGCTATTTACCTCCGTTTGGTGACGATATTACCTGCTGTAGTTCGTG
+AGTTCTCGGGTTAGTATGCGACCCCGTAACCGTTTGGCGTTTAGCTGCTTCACAAAAGCT
+ATTGTCTCGCTTCTACAGTGCCTAGCTGGCGTGCCCTCGCTTAGCACTTGAACGTGTAGT
+TAGGCCGACTTCGGATGATCGGAAACACAGGACCGCGAGTTGCTTCGTCTATCCCGAC
+>ds2020-328_146
+GGTCGGGATAGACGACCAGTTGCTTTGCCGGCGGGCCCACTTAGGTTAGGGGGGGCATTG
+TCCCTCAGTTCTTACCAACCTCCGGTGTGTAATCGACATGTTGCTAGCTTCAACTCGGTT
+GAATAAGAATCATTGATTCCCTATGCTGTCCATTTCTTATTCATTCAGGGCGCTCGGCCG
+GTGCTCCTTTAAAAAACCAAAACCACTCTGAACGTAAGGGAAGATAAGGGAAGACCGCCT
+GAGCGAACCGACCGAAAGGACTTTTGACTTATTTGAACCGAACGATAGCGGCTTAAAGCT
+AAGCCTATCACGAGCAGCGTCGCTGCTTGATCAGCGGTGAGGAGCGTCTATCCCGACC
+>ds2020-328_147
+AACGGCCGCCACTAAATGGAACAGGTACCTGCAGAGACTGTAGAATAGAAAATTACAAGC
+CCTCTACACAGGTATCGCCGACTAGACACTTCTATACGCCAGTAGGAGGTTCCGGTTATG
+ATTGGCATGGCGTAGAACTGGCCACGGCGAACGCATCAGCGTTAAGGTCAAGTAATTACG
+TCAGGCTGCGATTGAGGCCAAACCAGGCGCCGGCGTCAATCGTAGTACTAAGAGCGTCAG
+GCAGAACTGAGAACGCATTAAAGTTAGTAGCAGTCGAGGACAGTACTCACTTGTTTATGG
+GAATGGTTGATGGCGTTTTTGAGGGTGATATTAATGTTTGCGCTTAGTGGCGGCCGTT
+>ds2020-328_148
+GGTCGGGATAGACGTATAAAGCAGCAATGTCACTCCCCCTCAAATCCGACGACGTATGAG
+AGTCGAGATTTGGAGAAAGCAACACCGGTAATGACAATAAAGTTGCAGCACCCAAATAAA
+GTTGCATCTATCTCCCCCTCAAATCTGACACTGGTAGAGGGTCGAGATTTGGAAGAAGAG
+AAAATGAAATAATAGTAAAGAGACTCAAACATGCCAGTCTCGTGGTAGAAACAAATGCAA
+GGAAATGTGGAATGGAGATGGGCATCCGACAACTGGAGAAAAGGAATAAAAGATGGAAAA
+GAGTCTGCAACCCAAACAAAAAGGAGGAAAGTGTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_149
+GGTCGGGATAGGCGGTGTTGTAGCATGTAGCACTGGGACCTGAGGAACAACATTTGTGTG
+CTGAGGTTGGCGAAAGAAGATTAAATGACGTATCATTTTGGGTTAATGATAGCTTGGGTG
+GAAGGGAGGATGAAAATGAAGTAATTGGTTCCAGCCTAATAAATACAGATTACCCAGGAA
+CAAAATGCGCCATGGTATACAGCTATGTAGAGGACAAATGGGTAGAAATGAGTAATAAAA
+ATTACGGTGAGTATACAAGGAAAAGCTTCCATGGCGATGTGAGACCTAGTGTACCTTTAA
+GGCGAACAATGGAAAAAGAACCTGCACCTGTAACTTGGTGCGTCGTCTATCCCGACC
+>ds2020-328_150
+GGTCGGGATAGACGAAGCCTACTCCTAACAAGTTGCTGGCTTTTCAGCCGTTGCGCGCTA
+GCGTTTTACCTTACTAGTAAAGGGGCTGCTGGTTGTAGCGCGCAGTGTGCTAGTGAATAG
+GAAAAGCGGATTGAGATTACTAATGACGGATGGAGACACCGAAGGTGATAGAACATGTTC
+GGTGCCTCGCTCTTGTCTCCTTCGCCGGAGACTGCAAATGATGGGAATCCTATCGATAAA
+GAAGAGGCATAGGCATCGCCTCTCGATCCAATCCGCCTTCCCCGGCCTCCCCAACACACT
+CTTGATACGAAAAAAACCATCACCATCGTCTATCCCGACCGCCGTAATTCAGATC
+>ds2020-328_151
+TGAATTACGGCGGTCGGATAGACGGACGCGCGAGGTTAAGGTGCCGGAATACACGCTCAT
+CAGACACCACAAAAGGTGTTAGTTCATCTAGACAGCAGGACGGTGGCCATGGAAGTCGGA
+ATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATGAACTAGCCCTGAAAATGGATGG
+CGCTTAAGCGTGTTACCTATACCTCACCGTCAGTGTTAGAGCGATGCGCTGACGAGTAGG
+CAGGCGTGGAGGTTGTATCGAAGCCTAGGCAGTGATGCTGGGTGGAACAGCCTCTAGTGC
+AGATCTTGGTGGTAGTAGCAAATATTCAAGTGGAGAACGTTAGTGGCGGCCGTT
+>ds2020-328_152
+GGTCGGGATAGACGAAAGCTCTGCCTGTGTTCTACCTGAGTTGATTTTAATACACAATGG
+TATCATCCCCTGCCTTAACCTGTATTCTTTCCGATTTTTAGTCGGTTTTTCACTCTCAGC
+CACACTTATGAAGCCAAGAGAGAAAGTGTAATCTTGTCCGTAACCCGTTGTTTCGTAATC
+AATAAATTTGCTGTCCGTGTTAGGTGCCGGTATGGGCATCTTATAATTCTCTATTCTGCA
+ATTTCTACAGGAGGAACTTCCGCACCTTCTACTCCCCGCGCATCCACTAGTTGATCTTGC
+GTTTGGCTGGCGTCTAACTGTCTGCTCATTGGGACCGGTCGTCTATCCCGACC
+>ds2020-328_153
+GGTCGGGATAGACGGCGGTTTGCCTTTTTTACTATTAAATTGATTACTCTGAATATCACC
+GACCACGATTAGGGCATTGTCTTTGACTAATTGGGTGGTAAATTTGTGTATCAGGTCTTG
+CCGTGTGTTTTTGATTTTGGCATGGATAGCCTTGATACGTTTTTTGTTGTTTGAGCGTTG
+GGCTATAGCTAATTGTTTTGCATATTTTAGCGTTTGCTTAATGGTTAGCTTGTCACCGTT
+TGAGGCGGTAGCACTGTCTTTAAGTCCTAAGTCAATACCTACACTACCTGTTCCGCATGA
+TTGTTTGGGATAGTCTTTGACTGTGATACAGGCATACCAACGATTACGGCTGT
+>ds2020-328_154
+GGTCGGGATAGACGATCCTCAGCCCTGTAAGCCCACACCTGTGTAGAGTGGATCGTTCAA
+CACCTGCGGCACAAACCCATTTTTGACCTATTGGTCCTAGTATCATAGGCGACCGAACGG
+CCGCCCCCTAATTACTAGACCAACCTGCTATAATAATTCCATAAACACCTAGCGAAGATA
+TGGCAAACAAATAAAGTAGCCCTATGTTCGAATCTGACAATACCATACCATAATCAAAAG
+GTACAACGGCCCGAGCAACCAGACTTAACATAAATGTAGTCACTGGAGCCATTCTAAAAA
+GGGAGAAATTAGCACTACTTGGTGAAATAGGTTTGAACGTCTATCCCGACC
+>ds2020-328_155
+GGTCGGGATAGACGATCCAGTTTCCTTTGATGGGGCCCTTCCTGCAGCAGATTCGTTCAC
+AGACGATTCAATAGCAACCCCTTCTTTTCTTGCAGCAAGAGGGTATTCGAGAACAAGCTC
+CTCTAGAGATGAATGTGCAGCTGATTCAATAGGAGCTTCTACGATCACAGTAAGAGCCTC
+TATGCCAACAGCGGCAACTCTCACAGCAGATAGGCAACGGTTACTGAAACAGTTAGCCAA
+AGAAGAAGACCGGTAACGAAAGCAACGGATATTCCAACAACAATAGGTATTGTAACAATA
+GGATTCTAAACCTTCTCGTCTTCTGAAGACCACTCGACGTCTATCCCGACC
+>ds2020-328_156
+GGTCGGGATAGACGGTATTGATCGCTTCTTCAAAAGCCAACCCACCCCCAACGTGTTCGA
+GTGGCCCACGATTCGCTAGCTTCTTCATGAACTCCGCCGAAAGCCATCCTCGACGTACTC
+GTGCATTGAGAAGGTTTGGTGGCCGTACTCCCAACACAAAAGCATAACCGAAGACAACCC
+CAAGCTAAAGTTCACCCAAAGCCCACTCATCATCACCACGTGTGTTCGTGTGGCCAACAA
+TTGACTAGCTTCTTCATCAACCCCGCCGAAAGCCATCCCCGACGTACCCGTGCATTGAGA
+AGGTTTGGTGGCCGTACTCCCAACACAAAAGCAATACGTCTATCCCGACC
+>ds2020-328_157
+GGTCGGGATAGACGGGGGGGCGGAGTGTTCTTCGGAATGACTAGGCGTAAAGGGCACGTA
+GGCGGTGAATCGGGTTGAAAGCGAAAGTCGCCAAAAACTGGTGGAATGCTCTCGAAACCA
+ATTCACTTGAGTGAGACAGAGGAGAGTGGAATTTCGTGTGTAGGGGTGAAATCCTAAGAT
+CTACGAAGGAACGCCAAAAGCGAAGGCAGCTCTCTGGGTCCCTACCGACGCTGGAGTGCG
+AAAGCATGGGGAGCGAACGGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTG
+TTCGCCCTTGGTCTACGCAGATCAGGGGCCCATTTCGTCTATCCCGACC
+>ds2020-328_158
+GGTCGGGATAGACGCCCCTGCCCCATCATTTTAAAATAATTCAATTATTTGAGTTCCACT
+CCTTATCCCCAATGATTTTGCTTATTAGCCTATCATTGGGTCGTACCCATTATTTTTTAC
+CTTCGAATAATCCGTAGTATTTTCGCATATTTTCCATCATCCATTTCTCCAACCTGAACT
+TACCAGTTATTGTTTTTAAGTAATCCTGATCAATGATGCTCCTAGGAACACTCGCTGCCA
+ATACAATTAATTTACTGTCCTCCTCATTTGCTTTCCTAGGTCCAAAGCTTGCTGGCGCTT
+TTAGAAATTCCAGCGTTCTTGGTACCCCCTCACACCGTCTATCCCGACC
+>ds2020-328_159
+GGGTCGGGATAGACGGCAGATACCACTCGAACGTGGTTGTTCGTATTTTAAATCAATCAT
+GACTTCTTCCGAGATCACTGCTGCCAATGTCCATGAACTTTTGGTTAAAGTTCTGGAAAA
+GCAATGCGCTGACGAGACCACTACCGTCGGTAAGGCTTTCTCTGAGAAAGCAAAACAGTC
+TTTGAATAAGACATTCGGACTAAATGACGAGTCCAAGCAACTGAAGATTTCTTTTGATTT
+GACGGCTGAACAGCAGGCGTTACTCAAGAGACATTTTCCGGGTCGATCGGTGATTTTTTC
+AAATTCATCGAGTTCCTCACACAGTTATGCAGCGCGTCTATCCCGACC
+>ds2020-328_160
+GGTCGGGATAGACGTCGACCACAATTTCCCAAGTAAGAAAGAGATAGAATTTCACTAATT
+GGATTGGAAGGAAAAGGAGGGCTTCGATCCATTGTGATTAGGATCCTTGGTGTGGAGAGA
+TCCCTGCCAAAAATCAAAGAGCGACGTAATTCCCCATTCATCCGAAGTAGTATTTTAGTA
+TAGAACAGAGGCTTTCTGAGCCGACTACTACGACTACATGCGCATCTAGTGCAGTGGCTT
+GGAAGCAAGCTACCTTGACCATCTTCCGAAGTTCTAAATAATCTACTGATCAAACGCTGT
+AGGGGCAGACTGCTCTACATTCAACCACACATTGCGTCTATCCCGACC
+>ds2020-328_161
+GGTCGGGATAGACGAAGCGAACTCATCCACATGATCCCGATCTTTTGGGACCATAGAAAG
+GCACTTAGTCGGTTACTAAGTCGCGCTACATGTAGGTAATCATCCTACAGGTAGAACGTG
+TGGAAACACACACCATATCAATAGTGACTACTAATCACTATCAACCGATATGTGTGCCAC
+GGGCACATGCTAACCGGGGCGATCAGCACGAGGGTGGAACCACCACCATCCAAGGAAAAT
+CCTCGGCGCCAAGTAAGAAGTTTTGTTTCGCTAGTTTTACTGTTTCTCTTCCCGCGAAAT
+CTCTAGCGTTTCTCTCCCCAATAACCCCTAGTTAAGTCTATCCCGACC
+>ds2020-328_162
+GGTCGGGATAGACGCTTCCTCAATCTCCAATTCAGTGAGGATCCTTCTGAACCCAAAAAC
+CCAGCTGAGAGGGAGCCCATCCGATCCCATAAAGGAGGCAATGTTGTGGTTATGCTTGCT
+GGATAGGTTGAAGAGTCTAGGGAATACCTCTTTCAGGACCCCACCCTTGTTCCAATCATC
+CTCCCAAAATCTGACCCTAACTCCACAACCTACCACGAAAACGCAGCCTTGAAGGAACAA
+ATTGTAGCCACTAGAAATGTCTCTCCAAGGGCTACGACACGATCCTCGACTCACAGGATT
+AGCAAAATCATACGAAAAGAAAAAGGGGGGGGCGCCGTCTATCCCGAC
+>ds2020-328_163
+GGTCGGGATAGACGCATAGGGGGGCTGTTCACTACAAGCTATCAGTGCTGTCTTAGATTG
+AACGGCAATAAGATAAGTCGACGTTCAATCTCTAGGGCGGGTTTCCGCTGAGAACGGAAT
+AGTGTTCGTGTCCAAAGGCGAACAACGCCCTAGCTTCTAGAGTTCGCTGCTTTTCCCAGG
+CCGGAGAAGGTCTTATACCGCTCGCCTTTGTTTGATATGTTCATTCAGTACCAATACAAA
+CTACAACTACACAAAAAAAAGGAAGGGCCGCTATAGAAGCTAAAAGTAGCCTATAGTAGA
+GTAGTCGGCCTAACAAAAGCGTCACGGCAACATAAAATTCCCCTCTCT
+>ds2020-328_164
+GGTCGGGATAGACGGTGTGACTGGCTGGAGCGGCAGCTGAGATTATGACAGGGACCGGAA
+ACAAGGTGGTAAAAAAGAGGCCGTGGAAGATACAGGCCGAGCACAACCTGGGACGAGGGC
+TGGTTGCTCATGAAAAGCAAGCCTTGGGGCATGTGCTGGAGAAGGTTACACGGGAAAGTG
+ACATGGAAGCTGCGTTAAAGAGGTTCATAGTGAGGCCAGAGTCTACTGCTTGTAGACGGC
+TACTGTGGCACATCCACTGTAAAGGAAACGTGGAAAAGAGTAAACTTGAGGCATGGGCTA
+ACAATTTCAAGTTAGAGTGGCATGTGGCTCTCACGTCTATCCCGACC
+>ds2020-328_165
+GGTCGGGATAGACGCTAGTTCAAGGTTAGAAGAAGAAGGAATAAACTGGTGGGGTTGAGC
+AATGAGGTGGGTGAATGGATCACTGATAAGGAGGAGTTGAAAGCTGTGGCTGTGAAGTAT
+TTGAAAGATTTGTTTGATAGGAGTGATGCGGGATTCTGATTTGCCTAATCTTTTCCCAGC
+TTTAGATCCCAGGTTGTATGCTGACCTGGGTAGAAGTGTGAGTGACCAGGAAATTAAGGA
+TAGTCTCTTTGCTATTGGCCCTTACAAAGCTCCTGGTCCGGATGGTTTCTCTGCTTGCTT
+TTATCAGGGATGTCTGTGCCTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_166
+GGGTCGGGATAGACGTTAACTGCCCATACCAACCATGTTTGCTAGCCTTGCAACGTCAGC
+TATTTCCTGCCAAGTGTCGACAGCTGCCTCATCTCGCAGCCTATTGTATATCACTGCCTC
+ATCTGCGGTTGTGCAATAACCACGTATACGTAAGTTCTGCACTAATGCATGTATTCCACA
+AGTACCATCTCCTTTTGTGTTAACTTCTGTCACTATTATTTTGTCCTCCTCTACTGGCAT
+TGGCTCATCTTTGACCAACTTTGACTCTGTGCCTTTGTCTTTCAGTTCATATGAACTACC
+TAGCATTTCCTCACCATTTACGCCTTTGACATAAACTGGCGATGGT
+>ds2020-328_167
+TTTTTGCAAGTATGATACTCCATTAGAGAAACACCCCAGTGCATTTTTGGGTATATTTCT
+TGCTGCTATACGACTCCATATTTCTGATTCTTCCAAACCTAGTATGCATGGTCTAACACC
+ACCTCGACTCTCCTGCATTACTATAACACCGTCCTTATCACATATTAGCGCACAAACCAT
+AAAACCTTTGAAGCATTCTATAACTCTTATGCTCCAGTCTACACCTGATAGACCCGACTC
+CACATCACAGCTAAGCATTGATGCTATTGCATGACTTAAATCTTGGCCAGTAGACCTGGC
+TTCTAATAATTTTACTGCCATAACGACCACCCGTCTATCCCGACC
+>ds2020-328_168
+GGTCGGGATAGACGCAATCCCCCGCTGCTGCCTCCCGTAGGAGTCTGGACAGTGTCTCAG
+TTCCAGTGTGACTGATCATCCTCTCAGACCAGCTAGGGATCGTCGCCTAGGTGAGCCGTT
+ACCCCACCTACTAGCTAATCCCATCTGGGCACATCTGATGGCAAGAGGCCCGAAGGTCCC
+CCTCTTTGGTCTTGCGACGTTATGCGGTATTAGCTACCGTTTCCAGTAGTTATCCCCCTC
+CATCAGGCAGTTTCCCAGACATTACTCACCCGTCCGCCACTCGTCAGCGAAACAGCAAGC
+TGTTTCCTGTTACCGTTCGACTTGCATGTGGTAGTGGCGGCCGTT
+>ds2020-328_169
+CGACCATAGGAGAGGGAGTGAAACTTGCTTAGAGTGAAACGCTAAGAGAGGAGCCCTCTT
+ACCTATCAATGGAAAGATCTACGTGCGTGGCGTGATAAGGAATCCTAGAAAAGATCTCAT
+GAGACCCGCCCACTATTACTACGAAAAAAGTACTGCCCTTTTCCGTCGCTGCTAGGAGAG
+TCAGCTACTTCTATTAGCGCCGGACCTTGAGTCGAATTGATCGTGTCATGTGCAACGTCC
+ATCAATGATGGTTCATTAATGTCCATTGATTTAGACTCCTTCCCCCCTCCCAACTACGAA
+TAAGATCGAGAGGAGCCCGAAAGTACCCATACGTCTATCCCGACC
+>ds2020-328_170
+GGTCGGGAAAGACGGTGCGTGTGGGTATTATCTAGGTTGTTCCCAATTGGTGAAGCAGCG
+ACGGACGAGAATGTCAGACCTACGGTACGCTAAGTTCTACGTAACGGGCAGCCATTTTGT
+TTCGATTATGAAGATTTCAATTCACAGCATAGCAACAGTTCGATGCAAGCGGTACTTGAC
+GCCTATCTCTTGGTTTTTAAAGACTATTTAAGCGAGGAGCAGGTGGAAGCTATGTCATGG
+TCAGTGAATAGTCTTAATGATGTTAAGATAAAGCAGCCTAATGGCGACTGGTATGAGGCA
+CGAGGGACACTATTATCAGGCTGGAGAGCCGTCTATCCCGACC
+>ds2020-328_171
+GGTCGGGATCGCGTTTATACAGTACGCGTGTTGCGATACTGATAGTAGTGAGCGGGGGGA
+CTTGGGATAAATTTCCTGAGCCAGGGAAGAATCGATTGGCGATTTCGGCGGCGGCGAGGA
+GGTGTTTCATCCAGTCAAAACTTGCATCATCGGAAAATCCGAGGAAAGCCGGGAGAGTAC
+GGAGGTCAGCGTTGCCCGGGATGTCTGGGATGTTCCAGCGGCGGATACGCGAATGCTTCG
+CTGTTTCTTCAAAACTACCAATTTTGTCACCTGTTTCAGCAGGGGCAAGCCAGGCCAGGT
+TGTAGGCGAGGGATTGGAATGAGGCAGTAGTGGCGGCCGTT
+>ds2020-328_172
+ATTACGGCGGTCGGGATAGACGGAGGGCGTCCTTCTAGCACCCCCGACACGCGAGCGCTG
+ACATTTGCGTCATTGGCGTCTCTCCCGACTGGGAATCTGTTTGGGAGCACGTTTTCACAA
+TTGTAAAACGCAAAGTTGGCAAGGACGTAACTCGTTGTATCTGTTCCATAGATTGCACGG
+AGCTTGCCCCATTCATACTTTGTTGATGCCCAAGCGTGTATTTCGGGGTTGCGTGATGTG
+AAGTATTCGATGTCAAAAGATGGCATGTTCGATATCATTATGAACTTGTTTTTGAGAGCG
+CGGTCAGTTCTGATGAGAACATCTCGTCTATCCCGACC
+>ds2020-328_173
+GGTCGGGATAGACGGAGGGAGTCCATCAATAAATGGACCATTTGTTACGGAGACACAAGA
+AAAACCTAGAAAGCATTTTTTCTGCAAGTCATCTCGAGGCTTTCAAACGCATCCAAGCAA
+TTGGTATGGTATCCGATTGATAGAAACCATAGATTCGCGTCGCCTACTTGCTGAAAGCAC
+AAATAGAATTGCCGATCATTCATTGTATGAAGTTTTTAAGACCTCACTAATCGGCCTTAC
+ATTTTTTAGTTCATAATGAATGAAATGACCCCCGGATGAAGAAAAAATCTCCCTTCCTTT
+TTACTAAACCATGGGGAGCCCTCGTCTATCCCGACC
+>ds2020-328_174
+GGTAAACGGACTTCTGGAGCAATCGACTCCCAGGGTGTGACGGGCGGTGTGTACAAGGCC
+CGGGAACGTATTCACCGTGGCATTCTGATCCACGATTACTAGCGATTCCGACTTCATGGA
+GTCGAGTTGCAGACTCCAATCCGGACTACGACGCACTTTATGAGGTCCGCTTGCTCTCGC
+GAGGTCGCTTCTCTTTGTATGCGCCATTGTAGCACGTGTGTAGCCCTGGTCGTAAGGGCC
+ATGATGACTTGACGTCATCCCCACCTTCCTCCAGTTTATCACTGGCAGTCTCCTTTGAGT
+TCCCGGCCGGACCGCTGGCAACACAGGCTAAGGGTT
+>ds2020-328_175
+GGTCGGGATAGACGGCAGACTTGAGTACCGAACTGGGACCAAGACCAACGGCTCCACCAA
+AGGTGCCTCCTATTCCCGTCATCAAGAGTCGCTCCAGCCCCGAAGGCGAGGACAAAGAGC
+ATGCTAAGAAACCTGAGAATGGTAATGGTCGTGAGAATGGAGGTGTTGTGAAACCCAGCC
+ATGAAGGAGCTAACGGTGGTGGCAGCAGTCATAATCGGAAGCATTCTGAAGGTGGCAGTG
+GTCCTAATAATGGGAAGCCGAATGGTGGAGTTTGCTGGTGATGAAGGAGGAAACGATGCT
+GATGCGATGAAGGGGTGCTATACGTCTATCCCGACC
+>ds2020-328_176
+GTAATACCCGATCCGATAGTTTACGATATAGATAGATATATATTTAACAACAACATTCTA
+AGAAAGGATATTTTTAGATATCGGTAGTTGTCCGGTCGTACCCAAACAGTAATATTCCAG
+AGGGAAATGCACCTAAGATCAAATATTTCGAGCCGGCTTCCGTGGAAAATTCATACGTTC
+TTTTTGATGCTGCGATCACATAAAAACATAAACTTTGAGGTTCAATAGCTAAATACATGG
+CAATTGAATCATGAGCCGAGATCATAAAGAGCATACTGCGAGTAGGAAGTGGAATTAATA
+CAATGAATTCAAAAGCAATGGTCGTCTATCCCGACC
+>ds2020-328_177
+TCTAGATAGAAAGCCCTATGATTGGAAACTACCACGTTAGGTTTGGAGAGAGACGGGACC
+GGTTATATAATAGGGGGAGCAGATGCAAGCTTTTTCTTTCAATAGCCGGCCAAATGACTA
+CAGGATCATCGGTCTACTCTACCTCAATTCACCATTTCGAACCTTATACAGAAGGTTTTT
+CCGTACCAGCTTCTTCTACCTATACCGCAGTTGAAGCACCTAAAGGAGAATTTGGTGTCT
+TTCTGGTCAGTAATGGAAGCAATCGTCCCTACCGTCGTAAAATAAGAGCACCTGGCTTTG
+CCCATTTACAAGGACCCTGTTCGTCTATCCCGACC
+>ds2020-328_178
+GAAACAAGGGATCAAAGCGTCGAGGCGCGAAGTCTTTAAGATCGGATGCAATTCCGAAGC
+TGGTACATGCTGCACTGGTCCATGTTTCTGGCAGGCCTGGAATCTCTTAGCATATTAAAA
+GAAATCGGACAAGATGGTTGGCCTGTAATGGCCATGCCTTCTGATCAGCCAACGCATTTT
+ATGCCCTGCTTGATGTGATCCACATACTATACTCCATCATGGACTTGAAACAGAATTTTT
+TCGGCTTCTTGCTCACTCACACACCTGAGGAGCAGTCCGTCCTTTCCACGCCGAACCAAT
+ATCCCGACCACGGACCAAAACCGTCTATCCCGCCC
+>ds2020-328_179
+GGTCGGGATAGACGTGATTCTTGCCTATGTATGCTCTTTCCTGCCCACATTGCTTGCCCT
+ACTGTTCTGGTTGAACTACGGCTTTGGCTGAACTACCACCTGACACCAGTATTCTTAGTT
+TACTGTCTGCTTCCTGCCTGATCGGTGCTGACTGCCTGTTCTTGCTTGTCTTGGGCCTGC
+ACTTCTGGCTTACCGGCTTGCTTGTTTGCCCGACTACCTGACTATCTGACTACTACGACT
+ATTCCGCTTGGCTATCGGACTACTTAACATCGGGATTCTTGTCTGTGCTGCTTACTCCCC
+TTCTTCTTACCTGAACAAAACGTCTATCCCGACC
+>ds2020-328_180
+GGTCGGGATAGACGGTGGGTGGTGGTTGATCTCAATGCTAATGGTTATCCCCAAGGTTCA
+ACGAATGAATGGGGCTATGATTGTACCCGGATAGAGATGACGGTCTTCCTCTGATGTCTC
+CAAGCCGGCCATAATAGAATAGATAGGCGAAGCAGCCAATAGCAGTCTGTTCTCGCCTAT
+CGATAGATAGTAGGTTGCTTCCAAGCTCAAACCATTTGAAACTGAATTGCTACTTTATTC
+TTGTTATTGATAGAGTGGTATTCTCCGCCCCTGTCAAATAAAGTAGAGGGAGAGAACTGG
+AAGAGAGAAGGGAAGAGTGGCGTCTATCCCGACC
+>ds2020-328_181
+GGTCGGGATAGACGCTGTTCCCCAATAACCAAAGGCCATGCACCACCTGTTCCTCCAAGA
+TTTCTGCGTGGAAGGCTTATGACCAATAAAATAACCTCTCTCTTTTGCCTTTCGGCAATT
+AGCTTGTACCCAGCCAAAAGTTCCCTGTTGCTTTGAAATTGAGTACAAGTACATGAACTG
+CTCGAATGTTGGCTCTCCCAACCCAACCAACCACCAAGCAATGTATACTCCATGAAGCAG
+AAGCCAGAAGTTGGGATTATACTGCCCCGGCGCATACCCCAGCTTGGCCAACATCATCTG
+CACCCAAAGATGAAGCGGCGTCTATCCCGACC
+>ds2020-328_182
+GCATTAGGCTATTGAATCTCGCGACTAGAATTACGGCGTCGGGATAGACGCTTTCTCCCG
+GTCGAGGTTCAGTACATCCGGGTTCTCAGCTCGATTTTCTCTCTGTATCCACCTTTAGTC
+GGTATTCAGGGTTCCATTCTTGATGTATCTACTATTTAAGTTCCTTCTGATCTATCTACT
+GTAGGTTCAATCCCCGGTCATTCTATCTTTAGTGAGGGGACGAGTCATCTTGCTCGACAT
+CATGGGATCGCGCTTTCATTAACGGGCTGCTTACTCCGAATTGGGATATATAATTAGCCC
+AAGCATGACAAGGCTCCGTCTATCCCGACC
+>ds2020-328_183
+GGTCGGGATAGACGCCGGGTTCCGCTTTCCGGCTAAGCAAGTGATAAAGGAGTAGCGGAT
+CCCTTTGTCTGTCGCATGATACCGGGGAGGCCTTCTTTTAGCACCGGTAGCTATGAGTCA
+GTCGGGGTAGTCACTCCCAAGAGAAGGTAAAGATGGGATCGTTTGTATGCGCCATACCTA
+TAAGAGGGGAGAGAAGGTCGAACGCTAATTCCTGACTGAAGGGCTGAGAATGAACACAAG
+ACTTTGAAGACCAGACTCAGGAAAGCGGACGGGAACAACAACGACGTAGTGACGTTGACT
+AAATCCGAGGGGCCAACGTCTATCCCGACC
+>ds2020-328_184
+AGGATATTCGAAAAAAACGCAAGTAGGACAAAATGACTGAGGTCAAATGGCACGCGGTAG
+TCATTCAAACAAAAGACGCTGAGGAACCTCCATCGAGCCACGTGATCCGCTACAACTCAC
+ACAAAGACTAGGTTCGGCTTCTAAAAAGAAAAGGGGGGGGGGAGAAAAGAGGACAGGGGC
+GCTCCCCGCTAACCGAAGTCTTGGATTTTTCTTTCAAAGGAAAGACAAGCAGTGGTTTCC
+CAGTTATCTTCAATTACTTAGTGAGAGCTTATCGAATTGATGTAAGGCGGGGATACCATG
+TAGGAGGCCTGCCCTGCGTCTATCCCGACC
+>ds2020-328_185
+GCGTGGACAAGGGCGGTCTTGCTTGGCGCGAAGGCTGCTGGTTCGGGGGTAGGGTACGGT
+ACTAAAGGTCCTCGGACTTCCAGGCGGTTTTTCTTTTGGGCAGCTGTTCACCGTTGGATC
+TCGCCAATACAGCCCCCTATAGTTTTCGTTACCGAGATATCTTTTTTTTTCATTGTTCCC
+AGGGATCTTTTGGGTAATCCGCTCCCATGCTGCAAACAGTCAAATCTGAACTAAACCTTG
+TTGCTCTTCTTTCTTTCCTCGCGGGCAGGAAGCACACCAGCAGCGTGCGTTGCGTGGAAA
+GAAGGAAGAGGCAACGTCTATCCCGACC
+>ds2020-328_186
+GGTCGGGATAGACGGCTACTCCCCCTTTTCTTCCTTCTTTTCCGTGTCTTTTTCTTCTTT
+CTTCTTTCCTTTGTGTCTTTTTCTCCTTTCTCCCTTTCCGTGTGTCTTCTCCTTTCTTTC
+CCTTTCCTTATTGGTTTGTCTTTTTCTTCTTTTTCCTTTTTCATTTCTTCTTCCTCTCGT
+TCTTCTTTTCTGCTCTTCTTCTCCCCACTCAATAGACTCCATCAGCCTAGCCACCAGGGA
+TCAAGGAGGAGGTATCTGGGTCAATCCACAGAGGGTGATTGTGATTCTAGAGGTCCACGG
+ACCCCCGTTCTAACTAGGTCCACGGC
+>ds2020-328_187
+GGTCGGGATAGACGCTGTGTCCCCCTGGAGGGGGAGATTGTTGGATCCAGCCCATAATGA
+AGAGACACCATGATGATGTCTATTGGTGAAATGTTTTTCCCTTGCCATCATGACTCTTAC
+TTTTGGAATTTGGTTTTGGCCGGTTTCTTCGGCATGAGGTGACTTTGTTTCTTTTGGAAT
+TTGGCTTTAGCATGCAGCGGGTTCTTCGGCAAGAAACATGGTGGTAGAAAGTGGAGGTAA
+TGATGGGTGAGAGACCAACATCATTATGTTTTCTTCTTTTCGCATGTGGTTGTTTTTTGG
+CGCGTTCTTGCACGTCTATCCCGACC
+>ds2020-328_188
+GGTCGGGATAGACGAGGGGTAAAGGTAGATTGGGAAAAAGAACTCGGTAATAAAGCAACG
+CCACCAGATGAAGTAGTAGGCTATGCAAATGGAGTTTTTAGTAGACATGCTGCTGATGAA
+ATTATCGGTCAGGCTATAAAAGATGTTGTTACCACAGCTTTTCCACACGCAGTACCAGCT
+AAGTTCAGTGATTTTATGGACGATGCATATGAGTGGTTGGTTTCTGGATCATCAGCTGGT
+ATACCGAGAGCACTTAAGAATTCGTCAATGAGGACTTATATCCTAAAAGACTTGGGTCTA
+CATACCAAGGGCGTCTATCCCGACC
+>ds2020-328_189
+GGTCGGGATAGACGAAATTGGCGGATGGTGCTAAAGGAGTTGGGAGAAGAGTCCACCTAT
+AGTTATAGTAGTTAGAAGCCCAGCTTCAATCGTCAGCAGGTGAGTCAGCAAAGTTCTCTA
+GGAAGTCAGCCCATTGCTTTGACTTTTAGCTGCCACTGCTTCATCGCATCGGATGTTGCC
+CTTGAATTTCTTTCTGTAGCCGCATCGGAGGATGTAATAGCAAAGTATGCCACCGCTCCT
+TCGGAGGTCTCCTCCCCCCTTTTGGACCTATAGATTGGTACCACACGAAACCGGACCCAA
+CGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_190
+AGTAAACTGGTGGCTTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTAAGGCT
+TCTTTGGTGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAAGGATGCTTGGGTGGTGAGT
+AGACCGGAGGAGTAGGAGAAGGTGGTGGTGGTGGAGACTTGTAATGGTAAGGCTTCTTGG
+GTGGTGATGGTGGTGGGGGAGACTTGTAGTGGTATGGGTGCTTAGGTGGTGAAGGTGATG
+GTGGTGGTGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGTG
+GAGACTTGTAGTGGTAGGGGT
+>ds2020-328_191
+GTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGATGGTG
+AGGGTGGTGGAGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTG
+GGGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGTGGAGACT
+TGTAGTGGTAGGGGTGCTTGGGTGGTGATGGTGAGGGTGGTGGAGGAGACTTGTAGTGGT
+ATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGGGGAGACTTGTAGTGGTAGGGGTGCT
+TGGGTGGTGAAGGTGATGGTG
+>ds2020-328_192
+CGGCGGTCGGGATAGACGCGTGTGATTGGTGCGCCTGTTTGGAGTTGGACTTCTAATCAA
+ACGATTGTGGCCGAGAGAGGAACTTATCTCGGCCGTTAGGTTAACGGCCTGAGCTACAAG
+GCCATTTAGTGGTGGTGTTGGTGGTGGATTTTGGGCGGTGCTCCGGCGCGTTGCTCAGAG
+AGCGACGGTCGTATGATATATGGGGTGAATGAGGCGATAACAGGGATGATGCTCCGGCGC
+CTTAAAAAATCAAGGGTCGTATGATATATTGATGAATGAATTTTCCTTACAATCTACCAC
+TACTCTTAGGAAAGCATGTAA
+>ds2020-328_193
+GGTCGGATAGACGGAGGAACGAGGTGCGCTCAGTAAAAATTAAAAAATTAACAGACGAAA
+AAATTGCAAAAAAGAAAGTATTAATTTCACTTCTAAATCTTTAATCAATATTCTTTTTGC
+CTTGGTGGATCTCTCTCTCATTTAATAAAAGTCTGGAATCTTGGGTTACTAATTGGTGGA
+ATACTAGGCAATCCGAAATCTTTTTGAATGATATTCAAGAAAAGAGTATTTTAAAAAAAT
+TCATAGACTTAGAGGAACTCCTACATTTGGACGAAATGTTAAAGGAATACCCGGAAGCAC
+AATAGAGCGTCTATCCCGACC
+>ds2020-328_194
+GGTCGGGATAGACGTTGGGGTTCGGTGCTTGGCTGTGGTTGGCTATTGATCAAGTAGTAA
+TCCGTTGACTACATTTGTGCGAGTGATGTAACTGGTGGGTTTGTGCTTGTACCATCGTCC
+GCGTGCGGAGTTGCGATGGGAGGTTCGCCGTGTAATTGCACTTGCCTATTGTAAGTGGGC
+TATCTTTCCGTTCGTTTGTAGAAAAGGCGGTAGTGGCAGTGACCTTGCTGTGGCATGGAC
+AGGTGGGTAGCTACACTTAGGATGCTGCTGTATCTGTGGTTTGGTTTCTGGGTTGCTTTC
+GGGTGTAGCTGGCGGCCGTT
+>ds2020-328_195
+GCCGTGGACCTAGTCTCAGTCCCCTGGTGGCGGATCAGCCTCTCAGACCCGCTACAGATA
+GTCGCCATGGTAGGCCTTTACCCCACCAATTAGCTAATCCGACTTAGGCTCATCTATTAG
+CGCAAGGTCCGAAGATCCCCTGCTTTCTCCCGTAGGACGTATGCGGTATTAGCATTCCTT
+TCGAAATGTTGTCCCCCACTAATAGGCAGATTCCTAAGCATTACTCACCCGTCCGCCGCT
+AAGATCAGTAGCAAGCTACCTCTCTCCGCTCGACTTGCATGTGTTAAGCCTGGCGGAGCG
+TCTATCCCGACCGCCGTA
+>ds2020-328_196
+GGTCGGGATAGACGTTTAGCAGCCTTAAACTCTTCATCTTCAGGGTATTGTGAGTGATAT
+GCTCCCGTAGGTGCCCACTGCCACCTCTTATTCCAATAACTTTTCCACTTTATGTTATCT
+GGTTTACTCCCGAGGTTTTTCAATCTAGTGAACATTTCTCCACTAGCCCTGTATATCTGC
+TCTCTAGTGAAAGAAGCGACGTTGGGTTTGGTTCTGTGCTCTTTCTCGGCTTTCCAATCC
+ACTTCTCCTATACCTCTGTTGACTAAAACTTCCATTTCAAAGAATGGTTTTAAGTTGAGC
+GGTGCGTCTATCCCGACC
+>ds2020-328_197
+GGTCGGGATAGACGCCTCGAACAACTCCCTCTCTCTGTCCCCTCCTCTCTCTGTCTCTTT
+CTCTCTCCCTTTCTGTCACTCTCCCTCTCTTTCTCTGTCTCTCTCTTGCCCTCTCTCTCC
+TTGTGTATCTTCCCCACCATCTCTCTTTCTCTCTCTTTGTTAGGCTCTGTTTCTCCATCT
+CTCTCTGCCTCTCTCTCTCTCTCCATCTCTTCCCTCTCCCCCCTCCTCTCTCTGTCTCTG
+TCTGTGTCTCTTTCTCCTTTTCTCTCTCTCCCTCTATCTCTGTCTGTCTCTCACCCCATG
+TCCTCGTCTATCCCGACC
+>ds2020-328_198
+TAATACCCATTAGATTAGACGTTACCTGCAGAATAAGCACCGGCTAACTCTGTGCCAGCA
+GCCGCGGTAATACAGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGAGTGTA
+GGTGGCTCATTAAGTCACATGTGAAATCCCCGGGCTTAACCTGGGAACTGCATGTGATAC
+TGGTGGTGCTAGAATATGTGAGAGGGAAGTAGAATTCCAGGTGTAGCGGTGAGATGCGTA
+GAGATCTGGAGGAATACCGATGGCGAAGGCGCATCTCTAGCCAAAGACCGACATACCAGC
+ATTTCGTCTATCCCGACC
+>ds2020-328_199
+GGTCGGGATAGACGGAGAAGGCTACTCCCTTCCAAGTGGCAATGTGTAGCTCCACACCAC
+GAGCTACTCCATCAATCGGTTTGGCAGTTGAATTCACCGTCTTCATACTGCCTGCTTCCT
+TTGAGACCCGACACCCAAGTCTCTTTGCTTCCTGCACGGACATGAAGTTGTGTAAAGCAC
+CCGTATCCACCAGACAACGGGTTGTCTTGCCATTCACCATGACATCGACGAACATCACGC
+CTTTTGCTTGAACCTGTGGTTGAGCTCCCTTGGCCTGTAAGGCATTGAAGCGGTTAATGG
+CCCCTATTCCTGCTTC
+>ds2020-328_200
+TACTTCCTTCGTCAGCCTTCCTCCATAGCTACCTTTGAAGGGAAAGCTGGCTAGACCAAG
+CCTAGTAATTAATTGAATAAGAAGGAAAAAGGCCACTCAGGTCTATATCTAGAAAGGAGG
+CTGGATTGGAAGATTGAGAGACCCGGGACAGTGCAGGTTTGCAGAGAGGCTAGAGCATTC
+CCTTCACTAAAATAGAATAGTAGGTAAGATTCACTAGCTAGAAGTTTACTGAGAAGGGTA
+GAGTTTGCAGTAATCGATGAGAGAATGGTAATGCTAAAGGTAGGAAGAAAGAAGGGCAAA
+GACTAGGTCCACGGC
+>ds2020-328_201
+AGACTTCGGTGCCCCTCGGTTTTCTCTTATTTCTCTATCATCTTCCTGCTCTCTTTTCTC
+TAGGAACGTCATTCTTCCTACGTATCTCATCTGATTTTTGAACAGAAATTCCAACGCTCC
+CAGACTTCGGTGCCCCTCGGTTTTCTCTTCTTCCGTTTTCGATATCCCTATATCCTGACC
+TCTGTATGATAGTATCATATTCCTGTCCTCATGATTTAACTTCCATTTCCTATCCACTAT
+GAAGTCTTCTATTTCATGTTCTATCATTAATTTCTTTCTACTAGCCTTCACAACTTCGGC
+GCGTCTATCCCGACC
+>ds2020-328_202
+GGTCGGGATAGACGAAGAAGCGAACGTCATCGTCAGTAGCCTCGGACCAGTCAAGGCGTG
+GCATACGGAGCGCAGGGAGGTACCTAATTTCCCTCCAGTGGAATCGTTGCTGAGCAACGA
+TGCACACGGCGAGAAACGGGGGGAAGAAAGCCGTTTCAGACACGACGGTGTCATCAACAA
+AGAAATCATCCCCACTGACATCAGCAGCGTTGACTACGAGGAGGGCCCCAGACAACGCGA
+ACTGCGAAAGTGGTCGGTACTCCATAACGTCCCGTGAAAACAAAGCCACAAGGAAGCTTA
+TCGTCTATCCCGCCC
+>ds2020-328_203
+GGTCGGGATAGACGGCGGCGAAGATTTAACACCTCCTAAGGGCTGGGTGAGAGAAAGCGT
+CCTTTGTTGATACCTAGTGTACACCGCAACCTACTGAAATGGATTAATAAACGTTGCTTT
+CTATTGCTTGTAGCGGCGTTGCTTCCTTTTGTTCACCGCGAATAATTCAATCTTGAGAAA
+GAAGGCCTTGTGGGGCATCTCCAACAGCGCCAAAGAAGGAAGATGTTAAGTATTCTTTGT
+AGACTCGCACCGCTCACTTACGGTTTTATACAGAGGGGGGTTGTATTGAAGGGCCTTGTG
+ACGTCTATCCCGACC
+>ds2020-328_204
+GGTCGGGATAGACGAAGAGAGAGAATATGGCTGCTTAGCAGCGGAAGCTGGGGATCGAGA
+AGCGGAGGGAGAGCTTAGGCTTGAAATGGAGCTAGGATACCGGTATTTTTCCCTACCTGG
+ATCCGAGTCTTTCTCTTCTCCTGGACCGAGCACCGAGACCGAGGAACGAGAGGCTGGATA
+CGAGTCTGATGAGATCAGAGCCAGTGAAGAGAAGAGGGAAGGCTGACTCTGCTAGGCTGG
+CTTGCTTGTTCGACTAGAGCACATAAATAAGGTAGCTTGCTTACTTAGAGCGAAACGAGA
+CGTCTATCCCGACC
+>ds2020-328_205
+GGTCGGGATAGACGTTAACTTGAAATCATAATCAGTCATTAAGTGGGTCTTGTATGTCTT
+GTTTTCATATGTAGATGTTTTGTAGTATTTAACCATAATCATCTCTATGTCTTCTGTTCC
+TGACCCCTCGGCATCCCATGTTGGTGCTATCTGAGCAACCACGTCCATACGAGTCCATGT
+GTAAACAGTATTATATGTTATCAGCCTGTCATAAGGGGTACCAAACTGGTGTTCTCTGGG
+CAAAACTCGTTCAAGAGTGTATGAGGTAGCTTCGTCTAAGGTGGCCAGGTCGTCTATCCC
+GACCGCCGAATTCA
+>ds2020-328_206
+AACGGCCGCCACTAGATTATCCGTGTCCACTTGCCTAGTTATATCATCCAGGACAGTGTA
+CCAATCGTTCTCGGAGAGGTAGGTGATAGGTGTTCCACTCAGCAATGTAATCTCTATGAT
+TATATTACCGGATCCAGTATCATATGTTATGCTAGGACCAGGGCCATTGGCATCACGTGC
+ATCAGCTACAGCTTCTTGAATCTCTCCGTTGGCAGTTTCAAGGTCATCTTCGTCATAAGG
+AGGATCGTCTTGGTTCTCTTGAACTTGAACGCTAGACAACACAGTTACTCCAAGATCTGG
+TAGTGGCGGCCGTT
+>ds2020-328_207
+AACGGCCGCCACTAATCCGTCTTGGTTGATGTAGACTTAAGAAAGTTCTTTGAGCTGGAA
+GTTCTTGTCAACAGAGTGGATGGACTGGTCAACTGGGAGGAGGAGCACAAGAACAGGGTG
+TCCCCTAACTTGGCCGAGATGCCGGAGGGATTGGTTTATGAAAGGGCCTCGCAGCTCTTC
+AGTAGATCGATCTCAGCGGGTAAGAGACCGAGGAAGTTTGATTGGCGGGAGTACTGGCAG
+AGTAGGTGGCAGTGGAGTGCGGCCGGCAGCATACACTCGCAATATTCAGAAAACGAAAGT
+AGTGGCGGCCGTT
+>ds2020-328_208
+GGTCGGGATAGACGTCAAGAATCCCGCACGGGTTCGATTCCCGTAAGGGATAGGTACTCA
+TTCCCGGCCGCTTTCAGTTAGTGTTCATTGCTGAGTGATCGCTCGCTATTTGGCTGGAAA
+GGGTGGTCTGGAAGCTTCCTCTCTCCCAGCAAGCAAGACGAGATCACCGCTTCTCTCAGT
+AATGGACTTCCTTGAATTCTTCCTTATCCTGATTCCAAAGTTTTTATTTATTCTTTACTT
+TTAAGTGAAAAGGGGGAGTTGGATCATAAAGAAGAGTTTGTTCCTTAACTAGTAATCAAC
+GTCTATCCCTACC
+>ds2020-328_209
+GGTCGGGATAGACGTTCTTTAGGTGGGGAGGATAAGTTTCAAGTGCGGATACTTCATTTC
+AAATGGGTGAGAAATTTTTGATTGAGACAACATCATCCATTGTGATGCTAACCATCCCCA
+AGTGGGATTGGGTTTTTTTACCAAGTGCCCCAAGAAGTGAGTCGATAATGGTTACCTGAT
+AGGGGACCTAGGCTTGTTGATTGGTAAACTTCACTGAGTTCCTCGGCCAACCCTTTCATT
+CCCGAATGGAAATAGGGTACAATTGCTACAGACGATCCTTTAAGGATGTAAATGATGCGT
+CTATCCCGACC
+>ds2020-328_210
+GGTCGGGATAGACGGGGTGCGCCCTTGGATTGCTGTTGCATATTCAGCTCCTGTTGCAGC
+TGCTACTGCTGTTTTCTTGATATATCCAATTGGTCAAGGAAGCTTTTCTGACGGTATGCC
+CCTAGGAATCTCCGGTACTTTCAACTTCATGATTGTATTCCAAGCTGAGCACAACATCCT
+TATGCACCCATTTCACATGTTAGGCGTAGCTGGTGTATTCGGCGGCTCCCTATTCAGTGC
+TATGCATGGGTCCTTGGTAACCTCTAGTTTGATCAGGGAACAGATATAGTGGCGGGCGTT
+GCTGTGTATTA
+>ds2020-328_211
+GGTCGGGATAGACGAGTCTGTGTTCTGCGGTTCGGCGGGTAGAGGAGATCACTATGAAGA
+ATAAAAGGCATCGGAAGAGGGCTTTAGCCCAAGAGGTAGCATTTGGGAACGATCCATATC
+AATTGGTATGAAAGCCTACAGCAAGAAAGAAGGAAAGAACGAATGATAGGAATGTAGCGG
+AAGAAAAAAGTTCTTTGAAGGGGGCCCACCGCCCTCCATTTGGGAACTCTTTTCTATCCT
+TGTCCCTTGCCGGCTAGAGCCACGGAGCTAAAGGCGGATTCTTTAGTCGCTTATGCCGTC
+TATCCCGACC
+>ds2020-328_212
+GGTCGGGATAGACGTTGGAGCGGGCTGGGGATCCTATCAACTTGTTCCGACCTAGGATAA
+TAAGCTCATGAGCTTAGTCTTACTTCACCGTCGAGAAACGAAAGAAGACTTCCATCTCCA
+AGTTTAACTCAGACGTAGCTCGCTTCTTTTTGGGTGTGAAGCAGTGTCAAACCAAAATAC
+CCAACAAGCATTAGCTCTCCCTGAAAAGGAGGTGATCCAGCCGCACCTTCCAGTACGGCT
+ACCTTGTTACGACTTCACTCCAGTCACTAGCCCTGCCTTCGGCATCCCCGTGTATCGTCT
+ATCCCGACC
+>ds2020-328_213
+GGTCGGATAGACGGTCATCTGGCCTCGAATACGGTTCCCTTCTTTTATTCTATAGCTTTT
+ATTCAATTAGGGCGAATACCTTGTAACCGAATTTCTTTCTTGAAAGATATGCTACTTCCC
+GGTCGAGCTGTCTTGTAACGGTCTCTAGGGTCTTCAGTCGAATTTTTCTTCTTTCCTGTA
+GTAGTTCATCTGATGAGTTCATCGCGCAATTTGAGTTTAAGCATCGGGCTTCTCAAAGCT
+ATCTTCTGTAGGGATCGGAGATCGCCTTGTATAACTATCGATCAATGGTATAGAATAGTG
+GCGGCCGTT
+>ds2020-328_214
+GGTCGGGATAGACGGCATTAATATGTTAGGGTTATAAACCTTCACGTTAGAATATGTCAA
+TTTTCCATTGTTAAATAACGCATACGTCTTTGGATTAACTTTAACTTTGATATCCAACTG
+CCTACCGGACTGTATTATTTCTATCCAATTCTTAGCCCTCTTTATTAAAGTGTGCATTGG
+CATTACAAACAGGTTTGCTGCTCCAGTCCCTGGTATATCTGGCATTACATGACCATTTGC
+ATTTGCAGCCCAATTTTTGTATTTCTTACCAGTCATCGCATCATACACCGTAGACGTCTA
+TCCCGACC
+>ds2020-328_215
+GGTCGGGATAGACGAACGAGATGGCTAAAGCAGACGGGGAGCGTGAAAGACTATGTCACC
+ACGTTCACCAACCTATTGTTCGAGGTGCCTAGCATGACGGACGAGGACAAGCTCATGTAC
+TTCATGAGTGGCCTACAGAATTGGGCCAAGCTGGAGTTACAACGGAGGCACGTCCAAACC
+TTGTCAGAGGCATTGCTGCAGCCGAGTCTCTTGTGGAGTTCAAGAGAAGTGATCAAAGCG
+ACTCTAAGTTCAAAGGAAGGAAAGATGGCAGCGGATCCAGTGAGGGAAACTGGGCGTCTA
+TCCCGACC
+>ds2020-328_216
+GGTCGGGATAGACGCGGGGTTTCTGTGTGAAGGGGTCGTGATCCAAGTGGTCCAGGTGCT
+TGATTAGCTTGTGGAGGTTGGGAAGGACGATAAGACAGTGGTTTGTCTCGCTTATTGGTT
+GAGAGGATCTCAGGAGTGTGAGCGTCCGGGAGTCGACCATTTAAGTCTTCTTCTTTGAAG
+GTGGTATTAGACATTCTGTGTTAACAGAGGGGTAAGGGGTAGATGAGGTTTGGGTGTGTT
+AGTTTTCGTAGGAAAAGTTCAAAAGTTTGAGTGGGAAGGAGGGATATTTACCCCGTCTAT
+CCCGACC
+>ds2020-328_217
+GAATTACGGCGCTCATGTCTCGCCCCCCCCGTCTAGTGACCGGTTCCATGTTTCCCCCGA
+ATTTCATCAGTTCCAGGCTCAAGTGCCTGCTCATCCATCTTCATTCCAAAGGCGAACATT
+TCCTTGAGTGACTGTAACTGCTATGGTTTACAGTCAATAGTTCTTAACCAACCCTTTCTC
+TTAGAGCTTTATAAAGCTTTAAGAGAGAATAGGGAGTAAGGGGGAGCTTCGCTTCATTAT
+AAAATTTACCCGGACCTTCTTTCTACTCCTGCGGAGCCCTGCGAAAGTAACCTCGTCTAG
+CCCGACC
+>ds2020-328_218
+TGAATTACGGCGGTCGGGATAGACGAAAATGGGTGGTTGTGGTAGTTGAGGGCTTTTCGG
+GGTGTCAGGTTCCGATTCGGAGCTGGTGGTGGAGGCTGGTGGGTTGGTAGTAACGGAAAC
+TGCATCTGATATCGATGGTTGCTTGGTAGGTGTTGGTCTTGGTCTAAGAGACATGTTGGA
+CTGTGGCGGCTGAGGTGGCGGTGGTGGTGGTGTTGGCGGTGGCAATTGTGGTGGCTTTGA
+GAATTGTTAGTATTTAGAGGAGACACTTGGCTCTTGGCGTACGGGGGGAGACCGTCTATC
+CCGACC
+>ds2020-328_219
+GGGGCGGGATAGACGGCACCTGGACCTATAGCTTTTAAAGTAGCAACAGTGGTCGGCGTT
+ACACTTCTGGAAACCTTCCTTGTGCATGAAACCGTCAAACTTTTTGTACCACTGTCTTGG
+AGCTTGTTTCAGGCCATACAAACTCTTCTTAAGTTTGCACACCATGTTCTTATTCCCTCT
+TTCTGAGAAACCTTCTGGCTGGTGCATGTATATCTCCTCATCCAAGTCTCCGTGAAGAAA
+TGCGGTCTTCACGTCTAACTGTTCAAGATAAAGATCTTCAATGGCAGTGTCGCGTCTATC
+CCGACC
+>ds2020-328_220
+GGTCGGGATAGACGTGCCCTTGGAGTGCGCTCTTTGCCCGCGATTGTTCTTCTCAACCTG
+TCATAGAGCTCGACATCCTCCAATACGACCTGCTTGTCCGCGCTATGGTACACGTACCAC
+TCAAACCCAAGGCACCTGTACACTGTTACGTCTCCGCGGACATAGACTTCCCTATCTTTT
+TTGATCATTTCCCAGGGGTCGACAATTTTATTACACTTGTCGACTCCACACAACACGAAC
+TTGATATGGTATGTATCCCCAGCAAGTTTGTTTATATCCCAAAGCACTAATCCGTCTATC
+CCGACC
+>ds2020-328_221
+GGTCGGGATAGACGGGCAATACTCTTCATTCTTCGTAACCTTTATTTTTTGTATTTTTAA
+AATTCTTCCATGACTTAACCTCCAAATATCTCATGAAGCTTTTCCAAAAGCTTCTCAAGA
+ATTCCACATTCTCCACCACCTCCTCCTCCTCCAGTACACTCACCTCCTCCACCAAAGGCG
+CCTTACCACTACAAATCCCCACCACCACCACCCAAGAAGCCTTACCACTACAAATCTCCC
+CCACCACCACCAAAGAAACCTTACCACTACTCATCTCCTCCTCCTCCTCCTCCACACAAG
+AAGCC
+>ds2020-328_222
+GGTCGGGATAGACGGGCTTTCGTTCTATTTCTTTATCTCCCCATGAATCGTATGTTTGTA
+ACAACAGGGACAGAATTTTCTCAATTCCAATCGACCAGGCGTATTGTGTCGATTCTTTTG
+AGTAATATATCTGGAAATGCCCCTTGATTCCTTATTAACACGATTTCGAAGACAACTGGT
+ACATTCCAAAATAACTGTTACTCGGACATCTTTACCCTTGGCCATGAACCTCCTTTGGTT
+TATGATTCACTCAATTCTTTAATTTTCCGATCCGAAGCAGGGCATGTGTTCGTCTATCCC
+GACC
+>ds2020-328_223
+GGTCGGGATAGACGTTTCTTTACTATAGATAGATTGTCTCACCGCGCTTTCGATCTCGTT
+ATGGCTGAATGATGCGTCAGCAGTGAAAGGAACAGGTAGATCTCATACCTTTATTTATAT
+AGAATAAGCTTTTCTTTTCAAGTAGTTTTAGCTTCTCGCCCTATAGTATAGGTAGGGAAT
+GGACTGAAAGCCAACTCCTGCTGATGAACATATACGCTACTTCCCGCCCCGGAAGAACCT
+ACTTCCATTCAACTACCTGAACAAAATAGAATAAGAAAGGGGGGAGGTTCGTCTATCCCG
+ACC
+>ds2020-328_224
+GGTCGGGATAGACGCCTATTTGCATTTGTTATTGGAAAATGAGGAGGAAGCCATCTGTCA
+TGGAGAGGCAATCCTCAAATACGTACTTTGACCTGACGGCTTACCGTTCTTAGCTTCTGA
+TGGGAATTCCAAGTCGTATTGTCCATCGGAACCATCAATCATAAGATTAGCCAGTCAGAA
+AGTCTTCGCTCTTCCAAAGCCTCATTAGCACGCCAGTCAGTCAGCTTGACCAAGAAGACC
+CGAAAAGGCACACAATAAGGAAAGGAAGAAAAAAAGTACCGTTCCATGCGTCTAGCCCGA
+CC
+>ds2020-328_225
+GGTCGGGATAGACGAGGAGATGCGATTCATCAACAAAGGGATAAGGAACTTTTAAGCCAC
+TCTTCTAATTGGCTATTTCCGATCGGATCTTGCCGGGAGTTAGTGTATTGATGCCGAGAA
+TACGCTCTTTGATAGAATAAGCTCTTGTCTCAATATACGCTGTTTTAGCATTCTCCGAGC
+AGGAGAACATGAAGCTTGTTTGCTCTTTTGATTGAGTTCACGAAGGCTTTATTGAAAAGA
+CTTTCTGATTTTAAATAGAAAGAAAGTCCAGACCAACGGCTGCCGGCGTCTATCCCGACC
+>ds2020-328_226
+GGTCGGGATAGACGCTATCGAGATAAATTTATTCTTCAACCTTATATCTGATTTATGTAT
+AAATTGTTCGTCAGTTTTATATTGTGAATGGATACTCCCAGAAGCACTCCACTGCCATCT
+GTTGGTCCAAAATTTTTCCCAAGACATCACCATAGGAGTTCTCCCGCTAACTGCTGCACT
+CGCGAAGATTTTAAGTGCTTCATTCTGGATATAATCAGCACTTAGCTTGACTGTTGACGC
+TTTTGTTCTATGTGTGAACTCAGCTTCCCAATCGAGCGCGCCGTAACGTCTATCCCGACC
+>ds2020-328_227
+GGTCGGGATAGACGAAAAGAGCCTCTGGGGAAGGGATTTCGAGCGGCGAACCAGGAAGCC
+GCTGCCCGACTCCCTGAGAAGGCTGCGAATTTATTTCTTCCCCCGGTTCAGCGGTCCCTC
+TAATCCAACCTGAAAGCCCCTCAAAAAAGGAAGAGGAAGAATGGTCATCCCCCCGGGGCC
+CAGATGCATCCATCATCATACCTGATGAGGTAATTGCCCCTACGGCAATCAAGCGCACTC
+CCCAATCTCCGTCTGTCACGACAACTAAAATATTTAAAAAACATAAAAACCGTTGAACG
+>ds2020-328_228
+GGTCGGGATAGACGCCCTTGCTCCATAGCGTTTCTTTGATGTTGCAGCTCCCTTCGTTGC
+TGCGTTCGTTATCGTTTGGTATTGATATATTCAGTACCTACGTGATGCGACGACACACAA
+AACGTTTCGTCCATCAGGACTCTTCAGGGCACATGTTTACTGTATATCTAATCGCCTCCC
+AAGCACTGCCGTCTTCGCTGAACACCCAACTGTGTCAAGCTTATTTTCCTGCTCTGCTGC
+TCGTGTCTGTACAATTCGTGCACACAGAAGTGTATCGCATCTAGACGTCTACCCCGACC
+>ds2020-328_229
+GTTACATGCATTGGACTCGCGACTTGAATTACGGCGGTCGGGATAGACGTTGTTCGCGGA
+TGGAGAGGTACAACATGGATAAATTCTACTTTAAATTTTTGCTATGTGGCTATTGCACTC
+CAAAATATGGAACGTATACATGGTGTAAGTTGTGTATTATATGTAGATCATGGCGGAGAT
+GATATAGATTTAGGATTAAGTGAACCTGCCATGCTGCCATTGTTCCTAGAAATAATGGAT
+AGCATGCTGTTCAAGGCGAATAAATGGAAACAAATGTCCGATCCACGTCTATCCCGACC
+>ds2020-328_230
+GGTCGGGATAGACGATTTGGACGCCTGGTCGGGATAGACTTCACGTACGCGTCTATCCGA
+CCGCCGTAATTCACAGCAACGGCCGCCACTATGACCTTGCTGTCCATTTACTTTCCTCAA
+TAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATCGTAAAGACCTGAGGTGTG
+CCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCATGAATTACGGCGGTCGGGATA
+GACGCCTATGTTGAGTGTTACGTTATCCCGACCCCCCGCAAATCCGTCTATCCCGACC
+>ds2020-328_231
+GGTCGGGATAGACGTACCTGGTGGCTTGTTTGCTTTCCTCTTTCGGGGAGCAGGACAGAT
+AGCCTAAGGGACGCGGAAAGACTACGGGAAGGCTTGTTTGCCGGCGATTAATGCTTTCCT
+ATCTTGAGTTATTCCCTGTGATCCATCTATGAGATCGCTTGCACCGGAAGAAGTCTTTCA
+GATCCTCCAAACTAAAGCCGTCGAAACAGAACTCAACCGAAGCCCTTTCCCGTAACAACC
+TAACCTACAAGAAGGACCAAAGGGGGGGTTCGTCTATCCCGACCGCCGTAATTCAGAT
+>ds2020-328_232
+GGTCGGGATAGACGTTTTTGGGCCGGCCTTAACAGATGACTTACATTGTAGAGAAAGGTT
+TATCTAACTAGTGTGGGAGTTTGGCTGACCACCCTGCTTTCTGACGCTTTCTCGACGGTA
+GGCACCCAACGTCGCCAAACAAATTAGCCTCTCCTTCTTCCTCAATAGCTGCCTTAGTTT
+AGTCTTTGGTTGGTGTGCGACTATGAGCTTCTGGGCCTGTACGATTTCCTGTCCGAAAAG
+GCAATCCTCTACAGGAAGGGCCAATGGCTACGTCCCGCCGGTTCGTCTATCCCGACC
+>ds2020-328_233
+GGTCGGGATAGACGCTGTTTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGC
+CGGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAA
+GACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCT
+GCCGAATCAACTAGCCCCGAAAATGGATGGCGCTGAAGCGCGCAACCTATACTCGGCCGT
+CGGAGCAATTGCCTGGCTCCGATGAGTAGGAAGACAAAACAGTAGTGGCGGCCGTT
+>ds2020-328_234
+CGGTCGGGATAGACGGGTCGGCATACTTGTAGACTAGTTTTCTATGGGGGTACCCGGAAT
+CTATAGTGGCATGTGATATATGTGAAATATGGCATCACAGTCGCTGAAGTGGCATTGAGG
+ATGCGGAAGCTCTGCCACCTGTTTGTTCACACAGGGCGATTTCGGGGGCCTTTGCTTCGA
+AAGGGGCGTAGCGGAAAGAAGTAGCGGAATCAGGCGACTTGCCACACACCAGGAAGAATT
+CCTTCTTAGGCGTATCTAACTCTTTTGACAAATGCCCAGAGGACGTCTATCCGGCC
+>ds2020-328_235
+GGTCGGGATAGACGTAAGAGGGGGGTGTATCCGTATTTGGCGGAGTAGGTGAGCGTACTC
+GTGAAGGAAATGATCTTTACTTGGAAATGAAAGAATCTGGAGTAATTAATGAACAAAATA
+TTGCAGAATCAAAAGTGGCTCTAGTCTACGGTCAGATGAATGAACCGCGAGGAGCTCGTA
+TGAGAGTTGGTTTAACCGCCCTAACTATGGCGGAATATTTCCGAGATGTTAATGAACAAG
+ACGTACTTCTATTTATCGACCATATTATCCTTTTTATGCAAGCAGCGTTTGTTCT
+>ds2020-328_236
+GGTCGGGATAGACGTATCTTATTCCTTATGTTTAAGTACCAGCATGTCCAGCCAGAAGGA
+TAATGCATCACTCCTCTCATCTGCATACCTTTTCTTGTGTTTCATCCTTCCGTCTTTGAC
+ATTCCATCTGGTTATCATCTCTTTGGCTAGTCTCTTACTAACATTGTTCTTTGTGGCTAG
+CGCTAAAGTCTCTATGTCTTGCACCATCCTGCAATACACCACCTCATTTTAGTCCTGTCC
+TGCTCTGACTTAGCAATTTCCCCTCGCTCAGCATCATTAGCCGTCTATCCCGACC
+>ds2020-328_237
+GGTCGGGATAGACGTAATGCGCCACTTGCGTCTACCCGACCATGAGACGTCGGCGTCTAT
+CCCGACCAGGGGGATGGACCGTCTATCCCGACCGCCGTAATTCCCGGACAGAGGCCGTGG
+ACCTAGTCGTTCTGCCCCTGCCGTGGACCTCGTGAGTAGCGGGGTGATTACTAGGTCCTC
+GGCTCTCTGTCCGGCGGACAGAGAGCCGTGGACCTAGTAGTATTGTGAGTATAACTAGGT
+GAATTACGGCGGTCGGGATAGACGTAATTAGGGGGTTCGGTCGTCTATCCCGACC
+>ds2020-328_238
+GCCGTGGACCTAGTTATTTAGAGGGTTTCTGACTAGGTCCACGGCAGACCCAGGAGGACT
+AGGTCCACGGCTCTCTGTGAATTCGGCGGTCGGGATAGACGGCTTGGATTGCTGCAAGCT
+CTGACGAACATGTATTTTTAATCTCCAACTGCGTGATGTCTATTTCCATTGATTCCCCTG
+TGTTATTGAACATTTGCCCCTGCAACATGCGCTTATGCATTTCTCCATCTGGCTGACTTG
+CCATGTACTCCACCACGGATTTGAATTGTAGTCCTGACATTTTGTTTATTTTCG
+>ds2020-328_239
+GCCGTTGACCTAGTCTTTCGATGGCGCTTAGGGGTCGTTTTGGTATAAGAGGACATAATG
+AGATCACGGTTTTAGTAAATGATGCAGAGAAGGGTAGTGATATTGACCCACAAGAAGCGC
+AACAAACTCTTGAAATAGCGGAAGCTAACTTGAGGAAAGCTGAAGGCAAGAGACAAACAA
+TTGAGGCAAATTTAGCTCTCAGACGAGCTAGGACACGAGTAGAGGCTATCAATGTGATGT
+CGTAACTAGTCTAGTTGGTCCGTCCGAACCGGGGCGTGACGTCTATCCCGACC
+>ds2020-328_240
+GGTCGGGATAGACGTTCAATGGCGATGTGGTGGTGGAGGACAAGGAGGTGGTGGTTTAGG
+ATAGTCATGGTGATGTGGGGGTGTAGGAGAAGGAGGTGGAGGTTTAGGATAGTCATGATG
+GTGCGGTGGTGGTGGTGACGCAGTTGGTGGCTTTGGATAGTCATGGTGGTGTGGGGGTGG
+AGGTGGTGGAGAAGGTGAGGGAAGTGGTGGCTTTGGATAGTCATGGTGGTGGTGTGGTGG
+TGACGGAGTTGGTGGCTTCGGATAATCATGGTGGTGGTGCGTCTATCCCGACC
+>ds2020-328_241
+GGTCGGGTAGACGGCGGAGTGTACTTGATACCTTTCGAATTCACGGGGTAGATTTTGTCG
+GCATATTCGTCTGGCTCGGGCAAAGGAATGGTAGGAAATTCTTTCGGCTGCGAAATTAAA
+GTGGCGTCAGAAGTATATGACAAAGGGAGTTTCTCACGACGTCTGTACCTGTAGAGGTAC
+TGGTCCCAGACCTGATAGCCGGTTGATGACATGTCTGTCGTCCAGCACATCACCGAATCG
+AATTCTGGATGCTCAACTCGGGCAGTGTAACAAACATCATCAGCGAACCGGCC
+>ds2020-328_242
+GGTCGGGATAGACGGGGCACAATTCTAAGAGTACATAGAACAACATACTTCAATTTGGAA
+ACGATCCTACGGTCGGAACCTATCAAACCCGGATAACGCATAATATGCGATAATCCGTTC
+GATAGTCAAACGACCTCCGAATCGAGATCCGCGAAATCCTACACGCTCGTGACAACCTAA
+GGATCTCATTGGGACAAAATGCAGCTTCACCACTTCTGCCCTTGCGCGTGGGTTGCTTGA
+GTAAATTCCGGCGACCGTAAAAACTTCAAATCGCCACCTCGTCTATCCCGACC
+>ds2020-328_243
+AACGGCCGCCACTATTTGTCATTTTTATTTCATGCTACCGTAACCTCACAAAACTTAGAG
+CCTCCGTGTGGAGCATAAGCGATATATGACATACGGTAGCATGAAATAAAAATACAAAAA
+CAGTATAAAAATATAAAATCCTACCCGAACCGGACACTATAAGGTAGATCTTATGATAGA
+TTAGTTGGCAGGAGCTGTGGTTAAAACCTGGAAGCCGTAATTCTGATCTTAGGAGAAACC
+GGACGGTGATAAGGCTAACTAACTAAACAATGCGGAATTAGTGGCGGCCGTT
+>ds2020-328_244
+GGTCGCAATAGACGCCGGCGGTAGATTGGAGGATTAGAAACATGACTATTACTCTCCGAT
+TGGCTGTTTTTGCATTAATTGCTACTTCATTAATCTTATTGATTAGTGTACCTGTTGTAT
+TTGCTTCTCCTGAGGGTTGGTCGGGTAACAAAAATGTTGTATTTTCCGGTACATCATTAT
+GGATTGGATTAGTCTTTCTGGTGGGTATCCTTAATTCTCTCATCTCTTGAACCTATTCGT
+TCTAGATCCAAAAATGACATTACCCCTCCCTCCGAATTCCTTCAGGTGGTGA
+>ds2020-328_245
+GGCGGGATAGACGCGCGCCTTTTCTACTTGATTATCTTTTGGGTTAATATCGCAATAATG
+GGACTTGTTGTTACTGCCTTCAAGAGACAGACTTAAACCCCCCTTTACCATTTCAAAGAG
+GGTGGATGCCGATGCCAAGAGAGAGATTCCGTAGGGGAGAGATTCGATTACAATTTCTTT
+TTTTTTACTAGCATTTTTTTCCGTTCGCCCTACTACGAAAGTTACTAACCGCAATTTATT
+ACTTGGCAGCTTCTATGAGTTGAAGAAAAAGACAGCCCCGTCTATCCCGACC
+>ds2020-328_246
+AACGGCCGCCACTATTTGCTGTCCTTCCACCTTCCTTAACAATCTTTTCGGAGACACAGG
+GTCCTCGAAGTCTATCGAATCGTAGAGGCCCGAGGTGTGCCTGGTCATTTGAGAAAGAAT
+TTCCTTCCGCATTCCCCAAGTCCTCTGACTGACGTCGTAGTAGACTGCCGATCTGTTGCC
+CGGCATAGGCGATACGTACGCCTTAATTAAATTACCGTAAGCACAAACATTGATATCGCC
+TTCAAAAACGCCATTAACCATTCCCATAAACAAATGAGTACTATCCCGACC
+>ds2020-328_247
+GGTCGGGATAGACGGACGAAAGTGGTTAGTTAAGTAAGGTTTTCGGAGTATGAAGGTTAG
+TTAAGGCCTTCACCATATGTATTTCCCAAAGGGAAAGGGGAAGACCCTAATTCTGCAGTC
+AATTATATGGCAAAGGTAGCTCTTTGCTTTATTTCAGCAACCTCGATTGAAGCTGTAGGT
+TTAGGGCGAGCTATCAGAGCAGCAAGTGGTAGGCTGTAAGCCGAATGAGAGAGCTATCCA
+GTTTTCAGGTAAGAAGAAGGGGAGTAAGCAGCCCATACGTCTATCCCGACC
+>ds2020-328_248
+AACGGCCGCCACTAGTTTCGGTCCCTAAATATTGCTAAGTGGGAAACGAAGTGGGAAGGC
+TAAAACAGTCAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTCA
+CTGATCGAGTCGTCCTGCGCGGAAGATGTAACGAGGCTGGTTAGTGGCGGCCGTTGCTGT
+GAATTACGGCGGTCGGGATAGACGATTACGAGGGCTGGTCGGGATAGACGATAATGACCG
+CTGGGAAGACGCATGATCAGCAAGTTGCGTCTATCCCGACCGCCGAATTCA
+>ds2020-328_249
+GGTCGGGATAGACGATCGCTCACGCTTTTTTAATGATCTTTTTTATGGTTATGCCGGCGA
+TGATAGGTGGATCTGGTAATTGGTCTGTTCCGATTCTAATAGGTGCACCTGACATGGCAT
+TTCCACGATTAAATAATATTTCATTCTGGTTGTTGCCACCAAGTCTCTTGCTCCTATTAA
+GCTCAGCCTTAGTAGAAGTGGGTAGCGGCACTGGGTGGACGGTCTATCCGCCCTTAAGTG
+GTATTACTAGCCAGTCTGGGGGAGCGGTGGCTTTAGCAATTTATAGGCTT
+>ds2020-328_250
+GGTCGGGATAGACGCATTCGCCATCTAGAGATATCTTTCCAAATGGTATAAATTTCCTTC
+TTTGCTCAGTGAGGCCACCCTGAATGTAAGTGACCTGTTCGAGGTACTGGCTTGTGGGTA
+TCGCCCTCCCTATCATTGCTCCATACATAGCATCGGCTCTATCAGATGCCTTGAGAACCA
+TGTCTGTATCCAGATATTGACGTTCTAAAATAGTTTGTAAATTGGGCGCGTTATGTATTA
+ATAAATATTATCCCCAGTACCAACAAGTATTCGCCCCCGTCTATCCGCCC
+>ds2020-328_251
+GGTCGGGATAGACGCAGACCCCCCGTTATGAGTGCTAACCACCGGGTCATCTCTTGTAGA
+AATTTCAGTATACACAAAGTTGAGTACCGTGTTCATAAATGTAGTCAGTCTCCAGCCTGA
+TAATAGAGTTACCGCACAGCGGTAAGTAGATCCGTCTCCTCTTCTAACTTCTGTCTTATC
+CAAGGCATCAATGGTCCAAGCTATACTAGCTAGCTGTTCCGGTTCAAGATATGTCTTAAA
+TACCGCACCGTACGCCTGCAAAACTGCCTGTTACCGTCTATCCCGACC
+>ds2020-328_252
+GGTCGGGATAGACGCCCGTTTGCCCTTAGTTGTCTCGAAGTTAGCTGCTTGGCATGAGTA
+GCTTGGGCAGTCTTAGTGAGTAGCTTGGCTTGCTCATGCGGGGCTTTGGAAAGAAAGTAA
+CCAGGGAATTCATATACTAATCTTCTAATCAGAAGTTTTTTTGTTTAAAAGTAGATCGGG
+AGTTCAAGCAGATGTTAAATTAAGGTGAGGTTTACTATTCTAGTCTACAGGCCATTTAGC
+TAAAAAAAATCCTGAGTATCGACTGTCATGATCCGTCTATCCCGACC
+>ds2020-328_253
+GGTCGGGATAGACGCCCTTGTCGTTGTTGGTTTAGGCTATTTCTAGTCTGAAATCATTAT
+TTGCTAATAAGAAGAAATGCAAGGACTTCTTATTTCCTGGGTTAAGAGATAAAAACTCAG
+ATTTGCCCATGAGTATGGGTGCCCCTTTAAATATACGGGATGTTACCTCTAAAAGAATTA
+GAGGTAAAAAGAAGATGAAAGAGAATTCTCATGTTCATATAGATGGTAAGGTCGGTGGAT
+GACCATACTATCTATTATTGTATACCTCCATATCGTCTACCCCGACC
+>ds2020-328_254
+GGTCGGGATAGACGGCAGCGACACTTGATCGATTTCAGACGCATGAGTCGCCACGTCACG
+GGACTAGGTTGAGCGGGGTCGTGGTCCGACAACGACATCTGTTTGTCGTATTATCGACAA
+TAATGGAAGGACAAAATCGAGGTGTTTGATGTCCAAGATGAATGTATCCTTGGTTCCTCT
+CAAGAGAAACCTTTTCCAAGGGTACATGGGGAAGAAGTTAGGAGTTGAAATCGGCGGTAT
+CGCTAAGGCAAGGAATGGTCATGGGGAGTCCTCGTCTATCCCGACC
+>ds2020-328_255
+GGTCGGGATAGACAAATATGTTCCCTGGTCGGGATAGACGTATCATGAACCTGGTCGGGA
+TAGACGCACGCTAGGTCTGTCGGTGTCTGAGCCGTTACTACCATGGGAAGTGTAGCCAAT
+GCCATCATAGTGGCAGATAGTTTTTTGATGTTCATAGAAATGGTTATTAATAGATTTGGG
+TAGATATACTATTTTTGTTCGGGAAGAAGGTAGGGCTGTGTTTTCTCTGTCACATTTCCT
+TGCAAGGATACCACAGCGGTACCCACGCAGCCCGTCTATCCCGACC
+>ds2020-328_256
+GAGAGGGAAGAGTTTTCAAGGAACCAGCTCCTGGGGACTTCTATTAAGAACGGCTTTTGG
+TCTTAGTATGTGGTACAGCATATAGAGTCGTGAGACGCTCTACTTCCTCTTGTTCAGTTA
+TCGATTCGCTGGCTGTTTCCGGGGGGCCCAGATGCTTTGCGAGACTGAAAGCTTCATTTT
+GTGTTCGGTTGCGTTATCTACCGCAAAGAGGGACTCCCCCTTTCTATTAGAACAGTGTTA
+GTTCGCTATTACTGCCGGTCAGGCCCTGGGTACGTCTATCCCGACC
+>ds2020-328_257
+TCCTGTTTGTCAATGCTCTCCCACCTCCTTTATCACTTAGTGCCAATTTTGGGGCCTTAG
+CTGGTGGTCTGGGCTGTTTCCCTCTTGACAATGGAGCTTATCCCCCACTGTCTCACTGGT
+TGTGTGTGCATCTGGTATTCTGAGTTTGTCTCGATTTGGTACCGCGTTAGCAGCCCGCAC
+CGAAACAGTGCTTTACCCCCAGACTATATTCACAACCGCTGGTCGGGATAGACGATGTTA
+GGTCCTGGTCGGATAGACGAATATGAGGACCCCGTCTATCCCGACC
+>ds2020-328_258
+GGTCGGGATAGACGAAACTAGAATTCTAACCTGGTGCCGTTAACCGGCATCGGAACAGTT
+TCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAAGGTAACGGAGGCGCGCAAAGG
+TTCCCTCAGCACGGTTGGAAATCGTGCAAAGAGTGTAAAAGCATTAAGGGAGCTTGACTG
+CAAGAGCAACAACTCGAGCAGGGACGAAAGTCGGCTTTAGTGATCCGACGGCACTGCGTG
+GAAGGGCCGTCGCTCAACGGATAAAAGTTACTCTAGGGATCGTCTT
+>ds2020-328_259
+CTTTTTTTTTCGGTATAGGAGAGATGGAATGTCTATACCTAGTGGGAGTCTAATTTTTTT
+CACGTGGGGTGTGGGGTTTAGTTCTTTTTATTTATTTGTTGGTCAGCCTAGTTCTAGTGG
+GATTAGTTAATAATATTTTAAAAAAGATAGCCTAGTCCTAATGGGAATAGTTAATAATAC
+TTATTTGGATGAAGGTTTGTTTGAAATTGAAAGTAATTATGATAAAATTGGTTGCCATTT
+GCAGCCATTGATTGACGGCAAAGAACCCATACGTCTACCCCGACC
+>ds2020-328_260
+GGTCGGGATAGACGGGGCTTAGTGGTCGAGATATGCTTCCCCGTATCCAAGAGGGGTGGG
+CTGCCCGATCTCCCTATTCAAGAGAGGTGGGCGAACTGCCTATATAGCTGTCATTGGTTC
+CCCACTCCAAGGAAGGAGCCTTGAAAGGTTGAGAGTCAACCCGAAGGCAAATACAGACAC
+AGATCTCTCAATAGATCAAGGGATTGGTTTTTTCAAAAACTTAATAACCGATGCTTTCCG
+TACAATGTTTCTTCCAGTTAGGGCTTAGAATCGTCTATCCCGACC
+>ds2020-328_261
+GGTCGGGATAGGCGCCAGCCCAGGCGGTGTAAGCTCATCGGCAATCTCACGAAGAACACC
+GTCCGCTAACTGCAATCCAATCGCAGTGAGTGCCCGATTCAAGACCTCATCCTTTTCCAT
+CGTTGGAACACATTGTTGGCCATGCTTAGATACCCTTTAGTGCCTTTTGAGCAGCCCCTG
+TTGCACTAACAAGGCTCTCATCTTCAACACCAAAGTCTGGAATTTTTCTCCCGTCAAAAT
+AATTTCATATTTTCTCAACACGTCCCTGCTTCGTCTATCCCGACC
+>ds2020-328_262
+GGTCGGGATAGACGCAAACACCAACTACCCCATCAACACCGCCCGCAGGAAACTCTCAGC
+AACAGTCAGCTTACACCCCTCTACCCATTACTCCTAGCGAAGCTGTACAAGATGCAGGAG
+GGGTATTACCATCTTGTACACCCACTGGCGCACGTGGAGCACTCACAAATCTAGACGCCA
+TCTCTCTAGAAATGGAGGAGTGGATACCTGAAGAGATGGACGCTAAGACCCGAAGGGGTA
+TACTATTGAGTGCCGAGCATAGGGAGGTGACGTCTATCCCGACC
+>ds2020-328_263
+GGTCGGGATAGACGGAGCATGCTGTTGCTCTTGCATGGGCGGATAGCGTTGGGAAGGAAG
+AAACCGTAATCCGCACCTTGAACAAAAGGGGAACGATGAAGTTAGCCTAGCTTCGGTCTC
+TCTTCCCTTTCGTCTGCTATTCCTACGCCTTCCTGCCTTTACTTTTATGCTTGCCTGGAA
+GGAATGGGCAGACAGCAAGAAAGAAGGATTGATAATCAAAGAATAGAAGAAAGGCGCATC
+TCTAGCCAAAGACCGACATACCAGCATTTCGTCTATCCCGACC
+>ds2020-328_264
+GGTCGGGATAGACGTGTTTCAATCTTACAATGATTTTGTGCTCCGCCTCATTTCGGCCCC
+TTACTAACAATATGATCGGATGTCCATAATTAGATCTGCCAAATAAGATATGAGACTTTG
+ACAATTCTTTACCCCAATCTGGAGGTGTAACGTTAAGATACTCTTCATCCCAGTGTTCAC
+ATAATTTAAGATAACTAGGTTCAAGCTCCCTTTCTCCCCCCTTGAACTCGAGAGCCAATC
+TTGATAGCAAGAGCCACAGCCCCCGTCGTCGTCTATCCCGACC
+>ds2020-328_265
+GGTCGGGATAGACGAGCCTCTGCCCTGCTGTCCCATCTATTTGCAAGACCTGCCTTATAG
+TCGCCGGAGGGAATCCCGTAATCTCACTCAATAAATCGAATGTTGAGTACCCTGCTGGCA
+GCTTAATTGTTGACAGTAGTATATGGTAGGCTTTTATATGGTTCCTGATCCTCCAATCTG
+ATTTCGTATCATCTATATCAAGTGCCACCCTGTCGTACCCCCCTACCTGCCCTGAACTCA
+TCGCGTCCTCTTGTTCCAACACCCATGGTCGTCTATCCCGACC
+>ds2020-328_266
+GGTCGGGATAGACGATCAGACACGATACTCGCCTGGGCCCTCGTCGAGACCAACTCACTT
+CTCTCTCCTTAACGTCTGGTACCATTGCCCCGCCACTCTGCCTGTCTTCTTGTGGCCGGG
+TCGGGTCATTCTTCACTCCTGTTACAAGGGAGACCCCTCTTCGCATACCGACCCTCCAGT
+TAGTTCCACTTCTGGGGAGAAGCTGAGAACTCAGGGCATAAGGGCCTGCGGTGATTATTA
+ACATGCTTTTCCAGCCCATATTACTAGGTCCACGGCCCCACAT
+>ds2020-328_267
+TCTTCCGATCTGAATTACGGCGGTCGGGATAGACGTGATTTGTTCTTCCTCTTCCTGAGT
+TCACTCCTCTCTCCTCTCTCCTCTTTCTTTTTTTATTCTTCTTTTTTCTTTCCTTTCCTT
+CTCTCCTCTCTCCCCTCTCCCTTTCCTTCTCTCTCTTTTTTCCTTCTTTCTCTCCTCCAG
+TTTTCTTCTCTCTTGTCATCTGGCGATTTTTTTTTCCTTCTTCTCTCTTCTGGCTAGTTG
+GCTCTTTTTTTTCCTTTATCTCCTGCAACACTAGGTCCACGGC
+>ds2020-328_268
+GAATTACGGCGGTCGGGATAGACGCGGGTGAGAACATAGACTCAAGGAAATCGACGAAGG
+CAACCCTACGGAAACAAAGGGCAAAGGGTGAACCAAAAGTTAAGCCCGTGTCTGAACTGA
+CTACCCCAGCTACTGAAGTACCAGATGAGAAACCAGCAGTTGAACAGACACAACAAGTCA
+GTGACGTAACCGAGCCGAAGGAATTGATAAGGGAGAAAACAGAGCAGAAGGTTGACGTCA
+AGATTGAAGAACCGACAAGTAGCCACACACGTCTAGCCCGACC
+>ds2020-328_269
+GGTCGGGTTAGAAGCAAAAAGGACGTGGCCTACTCATCACCTTGCTCTTATGAAAGAGGA
+CATTCGTGAACAACCCCTAGATTCGGATTAGTGAAAATCGAAAACGCTAGATTAACGAAC
+AGCGGTTATTAGCCTAAGAGCGCTTACTGTAAGACCGTTTCACAGCAGCGGATGTGGTTA
+TTCCTCGAACAGCGCTTATTGCAAAGAGCCAAAGAGCCTTTTCTTCCTAAGGAGATATTC
+ATTAAACCATTAACAGTCGAACCGGCCGGAGAGAGATTGCTTC
+>ds2020-328_270
+AACCGATGAAGCAGGATTTTCGCAGTGGCGATTTGACCCATGCCCCCGGGCAAACAAGGC
+CAGAAGCTCGTGCCCAGAATGTAGAGGATCAGGACAATCAACCGACTGCGGAAGATGTAG
+GGTAGAGAACGTGAAGCCGAACCTGCCGGGAAGCAGAGACTGGATTAACTACATGACGCC
+TAAAGGAAAATCACTCAAATGGAACGGTATACAACTTATGACTGTGTCTGACACCAAGGA
+CAGAAGAGCTAATAACAGAAGACGGCTACGTCTATCCCGACC
+>ds2020-328_271
+AACGGCCGCCACTATATGATTTAGCTTTTTCCTACCCGGTTATTTTACCAGACATAGCGG
+GTTAGTATCCGTAAGCTATAACTCCCACCCTTAGCTTGTTTGGTTTGGACCCTTACGTTC
+GGTACACTCGTTAGGAAGCGAAGGGCTATAAAAAGGACTGCTTTCCAACTCACTAGCTTT
+AAAGTAAGGCTCTCCTAATGGCTCTGATCCACCTCCTCCCTCGCCCGGAACTACCACTCA
+AACTAGATCGCTGACAGAAGGAAGGTGCGTCTATCCCGACC
+>ds2020-328_272
+GGTCGGGATAGACGGGGCCCAACCGGAGATTGCTCGCGGCTCAATATGAATTGAGACGAA
+AGCTTTATAAAGCCTTTTGTAAAGATCCCGATTTCCTAGTGATATGCGGGACAAACATCG
+TTATAAGTTGTCCAAGTTGCCAAGAAAGAGTTCCTTTGCACGAGTAAGAAACCGATGTAT
+TTCCACGGGCCGCCCTCGTTCCGTATATGAGTTCTTTCGAATTTCTCGTATCGTTTTTCG
+TGGATTAGCATTTCGATGGGCTGTTAACGTCTATCCCGACC
+>ds2020-328_273
+GGTCGGGAGAGACGGCACCCACCCACTCTTTCCCCTTCCCCCTCTCACTCATATGCCCGA
+TACACATATGCCATAACTGGGTAGAAGCAGCATCTGAATCTACTGTAGATGACACATTAG
+CACTACCAAGAATAGTGCTTCCCTGAAGATGGTAGAGACCGTTAATCAACTTCCCTTTTA
+TCACAACCAGGGCACCCCGAAAAACCTTCAAAACTCCACCTCCACCCGACCCCATAGTAT
+CCGTCTATCCCGACCAAGGACTCTCTCCGTCTATCCCACC
+>ds2020-328_274
+GGTCGGGATAGACGAAAGCTTGGTGTTGCATTGCAATTTCAAATTTGATTTTATGATTTT
+ATTGATTTTGGTTGTTTCTTACAAGCTGTTGGCATGAAAGTTTTGGTTTTTAAGTTGTTG
+ATTTGGTTGGTTTAGGTCTCTCCTTACTAGTTGTTGTTATGTAGTTGGTTTTTAGTTGTT
+TTAGGATGTTGCTTACTAGGTGGTGTAGTTGGTGCAGTTGTGCCTCCTCCAATTAGGAAG
+AGACCAGCTTTAAGACTGCCAATGAACGTCTATCCCGACC
+>ds2020-328_275
+GGTCGGGATAGACGTGTAGAAATGGTTATTTACAGATATACCAGCTCTAATATTTCCAGA
+TATATTCGCCCCCACCGTAGCCATTATCTTAGGTGTTCTTATCGTAACAAAATCCAGTCT
+CACATATCTTAGTAACATTCCCTTCACACATACTTCTATCCCGCACGAGGACTCATTTAA
+ATAACCTATATACATTGGTGTCATTATCTTCCCATCCCTACTCGTCGGTTCCCAAGATCT
+GCAAACCTCTATTAATAGCCTATCCCGTCTATCCCGACC
+>ds2020-328_276
+GGTCGGCATAGACGATGGTTGGGGCTAACCAGGTGTTTCATTAGAGGTCTTAACCTGCCA
+ACCAAGATTTTAGTGAGAACCTTATAAAAAGTATTACACAGGCTAATCGGTCTCAGCTGC
+ATCATAGTCAAAGGGTTCTCAACTTTAGGAACCAAAGTTATTAGAGTTCTATTGAGGACA
+GCAGGCACTTCACAGGATCGGAAAATTCCCCTAACAAGGGAATACATATCAGCAGCACCG
+ACATCCCTGCTAAAAGCGATCAGAGCGTCTATCCCGACC
+>ds2020-328_277
+GGTCGGGATAGACGCCAACCCTTCCTGTTTTCCACATCGTTATTTCCTCCATCGATATCA
+AATTTCTCTTGCCATTTATTTTTTTGGGTCTTTATTGATTTATATACTCATCATCCCGCC
+GCTCCTACCAACGCTTACTTACTTATTCAAAGGGGTTCTAAATAAAATAATCAGCCCTTT
+GAATAAGCGAGGCTTTCCCGATAGAAATAGTTGCATGCGAAAGAGATCCCAATTCCGTGT
+ATCCGGTTAAGCAAGCCCTTCCTACGTCTATCCCGACC
+>ds2020-328_278
+GGTCGGGATAGACGTAGACTGTTTCCTTTACCAGTTGTACTTACGAGGAGACGTTTGTTC
+GCTATGTTGCAGGCGACTTTTATGACCTCGCTACCATATGTGGGCGTTATAGCGATGACA
+AGTGCTATTCTTGGTCAGGAATGTCTTCCGATGTCCTCCGCCGTGTCGCCTCTTACACTC
+TTCATTCGTCGCCGTCAATGGTCCAGTGCTGGGAAATGTTCCACTATCGCCTTGACCTCC
+CACCAGCGACCACCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_279
+GGTCGGGCTATACGGCGTCTGCCCTTGAAATCTTCGAGATAAGATGAAACTTCATCTACA
+TCCCCATTCGCACACTTGATAACCAATCGTAAGTCGTCACGCTGCACGAGCTGCTTCAGT
+AAACCGAAGGTAATGACTCTTAGCATTGTGCACTGATGCTGACTTGCATCTAGCACTATG
+ACTGAGTAGAGCTGTAAAACCCTCATGTCAGACAAATCCTATTATCAGTCATATATTCGA
+CATCATCCTCACAGCCCCATGTTTCGTCTATCCCGACC
+>ds2020-328_280
+GGTCGGGATAGACGCTAGTCCGCCATGTATTCAGCCTCCGTAGTCGACAGAGAAACTGTA
+GATTGTAGAATCGACCTCCAACTCACTGGACCTCCAGCAATACTGAATACAAAACCTGTA
+GTGGACCTACGCTTGTCCAAATCACCTGCGTAATCAGAATCCACATATCCAACAACACAT
+TGACCAGTAACTTTATCCTGCTGAAACAATAAACCAACATCCACAGTACCCCAAATAAGC
+GTCTATCCCGACCAGTGGGCATTGTCGTCTATCCGACC
+>ds2020-328_281
+GGTCGGGATAGACGTCAACGGGTACTCAAAATGATTTGAAGTGTAATGCGAAAGGGATAG
+ATAAGATAGATGAATTGAATGAAAGCTCGAAGACAAAGAGAACCGGGCTTTCCCAAAGAA
+TTACTGAAGCTTTCCCACTTCCTAATAGGATCATGAAGAGGAGACATGCTCTGGTAAAAA
+AAGTTCCCTTTCTTTTCATAGGTTCTATCGTTTTGCTTTTCTATCTTATTAGTCTTCTTT
+TTTCCTGCCAAACCCGATCTCGCCGTCTATCCCGACC
+>ds2020-328_282
+AACGGCCGCCACTATTGTTTTTTCCTCATCTCATTAAGTTCTCTGATACAACACGTAAAC
+GCTCTAATTTTAATGATTATTTTATGATCCTATCTTTTCTTTTAACTTTGACTTTTTATT
+ACGACCAATTTTATTGTTTTATTGTTCGACAAAAGGTTCATTTATATACAATAATCGGAT
+TGTAGCGGGTATAGTTTAGTGGTAAAAGTGTCGTTCGTTCTATCATCCCTTAGTAGTTAA
+GGGATTATAGAGCATCACACCCACGTCTATCCCGACC
+>ds2020-328_283
+GGTCGGGATAGACGCCGTGACTCCCCCCCCTATTTTTAAAGTACCCCTCTTCCTATTTAG
+GGGGTTGAGGCGAGAAATGGCTTGATGAACCGTTCCGTTCGCCACGCACCGGCCCCATTC
+ACTTGCTTATCGTAGAGGCTGTAAGTACACAGTGCTCCACAACTATTCATAGTATAGTGG
+GGTTGAAACACGAGAGTGCCCGCCCTTTCTTTCAAGCAGGCCACTCTTTCCGGACCGCCG
+TCCGCGGTAACCCCGACCTAACGTCTATCCCGCCC
+>ds2020-328_284
+GGTCGGGATAGACGTCACATCCTCATAATCCGTCTATCCCGACCAGGCAACTCTCACGTC
+ATCCCGACCGCCGTAATTCACCCCTAACCACACCTCATCCGCTGATTTTTCAACATCAGT
+CGGTTCGGACCTCCACTTGGTGTTACCCAAGCTTCATCCTGGACATGGTTAGATCACCCG
+GGTTCGGGTCTATAAACAGTGACGAACGCCCTCTTCAGACTCGCTTTCGCTTTGGCTTCA
+GCACAACTATGCTTTAACCTGCCACTGCCAACTAA
+>ds2020-328_285
+GGTCGGGATAGACGAAGAGACGGTGTTGGCGGGATTCGTGAGCTCAATTTTCCTTTCGCA
+TCCACTATCTTTGATTCCACCGACGGATTCTTTAAACCCAGGTGGGCATACACAGTATGA
+AGAACTCGAACCATCGCTGACACATATGGCATTAGGCCCGCACATGCCGTGAACTCTGCA
+CAATTCGTACCCTGCTTGCCAACCGACGGTCAATTCTCTAGGGCTCTGATCGAAACTGTA
+AATTCTGAGATCCCCGCGCGTCGTCTATCCCGACC
+>ds2020-328_286
+TAATACACAGCAACGGCCGCCACTATAACACTTGTCTTCCTATCTTTCTGCCTATCTGTC
+TTTCCTCTTTCTGCTTTGTCTTTCTCGCTGTCGGTAGAGATTAGTATTTCCTAAGTTGTC
+TGAGGCTGAGCTTCCCTACTTCTGTACTTGGTTGCCTGTCTCTAAGCTGTACTTCCTTGC
+CTGTATCTAAGTAGGTACGTCTCGCTTCGCTCCTCATTTCCTTGCCGTCTTTCAATTCTG
+ACTATTGAGAAATATCCATGAGTCTGTCCCGACC
+>ds2020-328_287
+GGTCGGGATAGACGGTTCGGTTTCCTCTCCCGTCGATTGGGGGCATTGAGTAAAAGGGGA
+ATGGGTGATCGATGAAAGAAATCTACTCCTCAGTCTGATAGCGGTCAGGTCTTATGGCTG
+TCGGGCAATCGCTCCTAGGCCGTTGAGCATGCCGGTAGTCAATTAAGAGTTCGGAACGAC
+ACTAACACATCGGAAAGTTAGCCGTACCGGCTCTTCCCGGCTTCCTAGCTTAGTTGGTAG
+CTGACCTAACCTACGCGCAACGTCTATCCCGACC
+>ds2020-328_288
+CGTAAAGCCGGTAGGAGTAGTGAAGAACTATAGATAACTTTTGTTGGTTGTTAACCAACG
+GAAAGCATGGGAGTGGAGCTCGCCTTAGCGAGCGAAACACGCGACATAACATAAAGGAGA
+GTATGAAAGTGAAAGCGGAGATCCTGGATAGCTGCCCTGTTTATAAAGGATCTACAAGGA
+GAGATCTATATAGAATTAGGGTTCCACTTTCCCTATCTCGGAGCCAACCCTAGGGCTAGG
+GTGAGGCTGGGAGGTTTGCGAAACACTCCGCCGA
+>ds2020-328_289
+GGGCGGGATAGACGATAGATAGGTGTTGAAGGAAATAGTCTCTGCTTCTCAGGGTGCTTT
+CGTGAAAAATAGGCAGATTTTGGATGCCGTCTTAGTTGCTAACGAGGTTGTTCAGGAAGC
+CGTGAAGCGGAATAAGGCGGGTCTGGTCTTTAAGATTGATTTTGACCATGCTTATGATCA
+TGTAGAATGGGATATGGTCGATGAGGTTTTGGTTAGGAAGGGTTTCGGAGGAAGATGGAG
+GAGATGGATCAGGGACCACCGTCTATCCCGACC
+>ds2020-328_290
+GGTCGGGATAGACGATACTCTGGGGTCAGCTTCCAAAGCCAACAACGATGGCTCATACCA
+CTCCAGAGTGGGATCATACCGCGTGGTCATGTAAACATCGAAGCAAACACCGGGAATGTA
+ATCGGAACCGTATAACATAGACTTAGCAGCCTCCACACCGCGAACGAAAACCTTACGAGT
+AGCATTAACAACGTAATCGGTCATGAACCAAGCCAACCTCTCAATGCTGCATGACTAGGT
+CCACGGCACAGCGAAAGAAACTAGGTCCACGGC
+>ds2020-328_291
+GGTCGGATAGACGCTGCTAACCTCTGGTCGGGATAGACGATACGAAGGGGTGCGGTCCGT
+CTATCCTCGGACAGAGAGCCGTGGACCTAGTGTTGCCGTTGTTTGTGTTGTGGGAGTGTT
+TGGAGCTTCTGGACTTTGGAGAACGAAGAAGGCCAATTTCCCCAAACGAAAAACTGAAAC
+AGAGAGAGAGCCATGGAATCCAACGAATATGAACGTCTGAAACGTAATTGATTTTAGAGG
+TAAAGAGAGGGCACCTAGGACTAGGTCCACGGC
+>ds2020-328_292
+GAGAAACTTATGAGGAATTTCTTATGGGAAGGTTTGGATGGAAAAAAGAACCACGCTGTG
+TGGTGGGAGGTTGTAGGCAAAGGAAAACTTTTCGGAGGGTTGGGAGTAGGTTCGCTGAGG
+ACAAGGTGTGCGGCTCTACGAGCCAAATGGCTATGGCGCTTTCCGATCGAGCCCCACGCT
+CTATGGCATAAAGTGATTAGAAGCATCTATGGATTGGATACAAATGGGTGGGATGCTAAT
+CCTGTAAGTCGAGAACCGCGTCGATCCCGACC
+>ds2020-328_293
+GGTCGGGATAGACGCCTCGCAGGAATTCAGCTATAGCTCCGAATGCACATTTAGAGGGTT
+GTGTCCGTATACAAAGCCTCTGTCCTCTCTGTAGTGTGAAGCGGGTTATCTCAAGTGATG
+TCGTTCCCAGAAGTACATCGTCACCGTTGTGTAGTGAAGAGCCAACCTCTTTCATCGGAC
+CTAACATGAAGTCAGTGTAGACGGCATTCAGGACGGAGTTAAGGAACGTAGTAAGTCGGT
+AACCTGACAGCAGAATCCCGTCTATCCCGACC
+>ds2020-328_294
+GGTCGGGATAGACGGGTAATCTCCCTCTTGTTGCTTAGGCAACTTAAACCCTCAACATAG
+TGAGGTGTGGGGCGAAAGGGGCCACCATTCTCTTTCTTTCTTCAATCGTTCCGATCAGCA
+CAAGTGGGTTGGTTCGTTTCGTCCTTCTATCTACGCAATTCTCTGTCTTCGTTCGTGATC
+ATGTTGGGCGAAAGGTAGTTGTAGAGGAGCGGCTGTGAAACGGTGATTCCCCCTTTCCAT
+TGAAGTAGGGGGGTCCCGCGTCTATCCCGACC
+>ds2020-328_295
+CGGTCGGGATAGACGGCGGAGGAAACGAGGAAGTTGCTGAGGGTGGCCCAGTTGGAGGCT
+GTGAAATCGAAGCTTCGAGAAGTCCAGAAAAGCTGGGTATCGTATCCGGAGTTTGTTCGG
+ATATGCAAGGAGGGTTGTTCGGATCCGGATCTGGGTCTCGGGTTCGCCAAATCGTTAGAC
+GAAAACGGGTCCGTTATCGTGTTGGGAAACGCCGTTTGCTTGAGGCCTGAGCAGGTAGCT
+AAAGCCATCCAGGTTCATCGTCTATCCCGACC
+>ds2020-328_296
+GGTCGGGATAGACGGTTGGTACCTATCTGCCGTGGGCGTTGGAAGTTTGAAGGGGGCTGC
+TCCTAGTACGAGAGGACCGGAGTGGACGAACCTCTGGCGTACCGGTTGTCACGCCAGTGG
+CATTGCCGGGTAGCTATGTTCGGAAGGGATAACCGCTGAAAGCATCTAAGCGGGAAACTC
+GCCTTAAGATGAGACTTCCCAGAGACTAGATCTCTTTAAAGGGTCGTTCGAGACCAGGAC
+GTTGATAGGCTGGGTGAACGTCTATCCCGACC
+>ds2020-328_297
+GAGAGCCGTGGACCTAGTTTCGGTCGTCCTGCCGTGGACCTAGTTAAGTTGCGCCTGCCG
+TGGACCTACTCGGTTCATGACTAGGTCCACGGCTCTCTGTCCGTATTACGGCGGTCGGGA
+TAGACGAGATGGGTGTGTATCCCGACCAGAGCAATTATACGTCTATCCCGACCAGGGGTA
+TGCTCCGTCTATCCCGACCAGGATTAAGATGCGTCTATCCCGACCAGGGAATTCGTACGT
+CTATCCCGACCGCCGTAATTCAACGTCACAGC
+>ds2020-328_298
+GGTCGGGATAGACGCGATACCTCCCTTACCTTACTTTTAGTGCTTTTAGTCTCGCCAATG
+CCTTCAGTCGAGTTAAACTTTCCAGCTACTCCGTACTCTTCTCTTACAGATGAAGTTAGA
+GATTTCGCTTTACCAAACCTTCTTCCAGAAGTCAAAGATTTTACAACCCTAGTTAGATTG
+TTATATTGGAATACAATATACTTAGCTAGCTGTGTTTTAGTCCCTCCTAAACCCTTCACT
+CCTCTAAACTTACTCCTCGTCTATCCCGACC
+>ds2020-328_299
+GGTCGGGATAGACGGGGTACAAGAGTTGAGGGACTGCGGTCTTTGGCATCGCGAGCTTTT
+CTACCTTGAACAGGTTGATGAGCCCGATTTGCCCTTTTGGTCTTTTGCCGAGATCAAGAG
+CAATAATCTTCCAACTGGTTGGACTCGGGTGTCACCTCGGTGGTATCCCGATGAGGTAGT
+CCGCGGATGGCAGTTTAGACTGTCACACGAGACGATCAAGCTTGCTTGGTCTCAACCAGT
+TATTAAGGATTCTGCTACGTCTATCCCGACC
+>ds2020-328_300
+GGTCGGGATAGACGACGAATTTCTATTCTTATGGACTGAATGTCTTTCATAAGGAATCGG
+AGGAATATTCGACGATTTTTTCCAGGAAATCCCCAACGAAAAATACACACTACGCCCTCT
+TTTATATCGAATCGATCATAACCACTACCTACATTCCACGAAATTGTGCACCACAAATAA
+GAGCTAATAAAAAGACCTGCGATCCCATGAAAACACATCACGATCCCTTGTGGGAAAAAA
+AATTATTTGCCGAGAAGGAAATAAAGATATA
+>ds2020-328_301
+GGTCGGGATAGACGGGAAATGGTGATGATGGAACAGAGAAGAAAAATGATGAGGAAAAGG
+TTGATGAGATTAAAAAAGAAGGGAAGAAGAAGAAAGATGTGGAGGAGAAAAAGAAGAAAC
+ACAAGGGTGATGATGATGAGAAGGAGAAGAAAAAGGATGAGGAAAAAGACAATGAAAGCA
+AAAAAGAAGGGAAGAAGAAGAAAGACAAAGATGATAAAAAGAAGAAACACAAGGGTGAAG
+ATGATAGGAACTTAGGACGTCTATCCCGACC
+>ds2020-328_302
+GGTCGGGATAGACGGGGGGCATGCGTCTATGGCTCATAGGGAAACTTCGGTTAATAATTT
+ACTTACTGCAAGCCATACATTAGAAATCCAACAAGCAGTACAAGGTTTAGAAGATGCTGT
+TGCGACAGGTATGGAAAAAGCTCAGAGTAAAAGTTCAACAGCTGTAGTAGATTTAATGGA
+TATAACTAAAGTATACCAAGGTGTGTTAGCAGAACATGGTATTTTAAATTATGGGCTAGT
+TGGGGAGAGCAGCGAGGCGTCTATCCCGACC
+>ds2020-328_303
+CAGTTACCTTTCACAAATGTAGCTATCGATCGGGCTAAACATCCTCTGAGAGTACCATCT
+TTTGTACCCATAACCCTAAGGTATTCATGGTAGGTTTCGTCCACTAGTAATTTTGACTCC
+TGTCCTTTAAGCCTTGCTTTTGCAGCCACCTCGTTCCACGATATTGCACCTGAATAAGTA
+CTATGTATGCTGATAACGTCATCGCCGTGGCACAAACGCATTTCAAGCCCTGATTCGACG
+CCCATATTAGCCTGAGACGTCTATCCCGACC
+>ds2020-328_304
+GGTCGGGATAGACGCCTCATCGGTATGCTCCCAGGTACCTGTAATTGTGATCCGTTTGCC
+AGAACTAAGGGGTCTTTCTGTGGAAACCTTCACGAACAATCGTCGTTTTTTGATGGTTTT
+TCCGCTTCTCACAGCTGCTCTTTCTACACCCCCGGATATCTGGTGCCAAACCGTCGCCCG
+TTTCCTTATTTCTTCGATAATAGAGTTGTCTAGCTTTGTGGCATACATTTTACAAGTTCG
+TGAAGAAGGCAGGACGAGTGGATTGAGGGAA
+>ds2020-328_305
+GGTCGGGATAGACGACGAGTCTTCTGCCGCTGTTGCTGTAGTTTAGTCCGGGAAGAGGAA
+ATTCATTAAGTGTCACAGCTTGATAGTGAGAAACTATCTAATTCATCTATATCTTACAAT
+CGATGGACACTGCTCTATCCCTACCTGAGCTAGCTGCAAGACAAGCGAACTGCCCTTCCA
+CTTCAAGAGACAGCCTGCCTCCATTTCACTTAAATAGTAATTAATCAGCAAACGGGGCTT
+AGTCAAGAGAAAGGCTGCGTCTATCCCGACC
+>ds2020-328_306
+GGTCGGGATAGACGTTGGACTCCACTAGCGTTAATAACACGTTAAGTGGCAGGACTAAGA
+TTAAACAACGGTCGAAGTCTGAACATCATATGTAAACTGCATTATGGAAATATAATTGTG
+GAGAAATTAGGGTGTATATGAGACTATAAATACACGAAGCAATGACTAAAGTTAAATAGC
+AATGCGACATGTGTTATAACCTCAACAAACATTAGAAGAATGGTTTAGTGGCGGCCGTTG
+CTGTGGTATTACTCTTTCGTCTATCCCGACC
+>ds2020-328_307
+TGAATTACGGCGGTCGGGATAGACGAATTTGCTCCCTATAACGTCTCTCTCTCTTCATCT
+CCACATACCACTCAAACCTCCCCTTCCCATTCACCTCATTCCTCCTCTTTCCTCCCTCGA
+TCGCACTCTCCAAAATTACCAAACTCTCCTTCCCGTTCAAATGATTCCCCTCCATGCCCT
+CCACCTGCATGCTTACCTCCCTCACGTGCAGCTCCCCGCCTTCGCTCCAATTGCATGTGA
+CCACCATACCGCACTTCCGTCTATCCCGACC
+>ds2020-328_308
+GGTCGGGATAGACGATTATTGTTCCTCTGTGCATCTCTGTGATGGGTAAATCCCCATGAA
+AAAGGGGCAACTTTCGTGTAGTTTGTGATTGGATGTAACTGTTAAGATTTTTTCTCGGAT
+AAATCTTTCTCTTAATAGATCTCTTCTTGTTCCTCAATCTTCGGAGAATGCGGCGTTGTA
+TTATTGTAAGTTCTCTGTTCCGAACATTTCCTGAAAGTAGACGACAAGTTTTAAATCTTA
+ATGCAGACAAGGGCAGTAGTGGCGGCCGTT
+>ds2020-328_309
+GGTCGGTGTAGTCAACTCCTTCCTTCTGCTGGAATCCTTTGACAACTAGTCGGGCTTTGT
+ATCTCTTAGAACCATCATGTTCTTCTTTCACTCGGTACACCCATTTGTTGTGAAGTGCCT
+TCTTCCCCACGGGTAACTCAGCTAGTTCCCATGTCTGGTTGGAGATCAGAGACCTCATCT
+CGTCTTTCATGGCAAGCTCCCACTTGCTAGCATCTCCAGTCTGACAAGCTTCATCATAGC
+ATTCAGGCTCACCCTTCGTCTATCCCGACC
+>ds2020-328_310
+GGTCGGGATAGACGTCCGAAGGGTCTACATCTATTACGTCTGGCCTCATTCTGTGTTCAC
+GTTCTTTAACCCAGTCTACTTGACCGTAGCCTCGATTAACAAGTGTATTTAACTCAAACA
+TATCCGTCAGATCAAGTAAGTCCCTAGAGTGTAATGCCTTCAGTGTCACTGATACGTCCA
+TCAGTTGTTCAAGCATTGCGTAGGTGTTTTCACACCACACTTTGTCTGAGTGGGTCAACA
+ATAGAGCACCACAGACCGTCTATCCCGACC
+>ds2020-328_311
+GGTCGGGATAAACGAGCCTCACGCTTCAATGAGAGCCACTCTGTGGCCGCTGCAGACTTA
+GATGACAAGAGGTAGACCCCGAGTGATCTGTCCAGCTGGCGTAGTCGCTTCAAAGTCACA
+CGCGAGTCAAGGCAGGAAACTTCCCGTGCTATAACCACTGTCGGATGTAATGCTCTGTGG
+TCACTCACAAAGACATCCTATCGAAGGACGCCTTTATGTTTCCATTCACCCTTGGATCTG
+TAAGAGCTACCTGTCACGTCTATCCCGACC
+>ds2020-328_312
+GGTCGGGATAGACGATGTACACACCACCCACTTTCCTCTCATCACAATAATCCAACAACA
+CAACTCCAATGTAATCTGTTCTCCAAGCCTCTTAAGTGATGTCCTAACAACATGCACCTG
+CCAGCAGAAAACGAAACCTTTAGAATGCAATCTCTAATGGAAATTGGATCGATTAGTAAG
+ATACTAAGATATGTGAAGATTGACAGTTCCCAGAAGTGAGTTATTGCAATGAAAATTTGG
+ACAAACAAGAAAAACACGTCTATCCCGACC
+>ds2020-328_313
+GGTCGGGATAGACGGACATATTAGGTGGGTTGAGGCCTTTGAGTTGCCCATAGTGTTTGC
+CCTTTGCACTCTGATGGAAATCAACTGTATTGTGTTAATTGGTGCGGTTGAAACAGCATC
+AATTGCTATGAGGTCTGCGGATGGCGGAAAGTCCTTTGTTCTGTCATCCCGTCCAAAATT
+GCAGTCCAGCACGTCTGCCTTTAGCATGGCCAAGGTTGCAACATCGGCCGCGTCATTTGG
+AGGAACGGGGCAAGAACGTCTATCCCGACC
+>ds2020-328_314
+TGAATTCGGCGGTCGGGATAGACGTGGATGAGTCATATGGAGAAGGATTGGGAGCAGAGG
+AGTATGATGAAGGATTGGGATTTGACTAAGACTGTGTATTTGTGTTTTGGCACCTATGGC
+CGGAGTGCTGCTGTTTTTTGCAATATTGAATCCTTGGAATTTTCGTCTTCTGGTGTTTGG
+TCGATGAAGGTATATTCAGTTGGCACAGCGCTCAACGGTATGGGTATAGGTGCCAAAACA
+CAAATACCGCACTTTCGTCTATCCCGACC
+>ds2020-328_315
+GGTCGGGATAGACGCAACCATCCCCTTATCGATGAATACGGAAGGGCGAATCCGGAGATT
+ATCCGTACGTCGTCCAACCAACCCTATAGCTGGAAACCTTTTCTTCGGGGTCGATTGACT
+GAAGGATCTCCCTCCTCCAACTATTTCAACTCTCTGTTATTAGTATGGCGAGCCGAACTA
+AAGGCGGTTCTCTTCTCAAATGAATTGCAGTTTGACCCAATAGTGAGTAGCCTTTCTTCT
+TTCTACTAGGTCCACGGCTCTCTGTCCGA
+>ds2020-328_316
+GGTCGGGAAGACGGGGTGGACGTATGTCCGGAGGTGATAACAGGAGACTCATGTTATGTG
+GGTTGGTGAGGGTCGAGGACAGTGGTACCCGCGGACCGGTGTCGCGGTACGCGCTGACAC
+CGACAGGTACGGAAACGGACAGACTTCAGGAACAATATGCCTTATACGGCTTAAAATTTA
+TTCAAAAACAGTATTAAAAGAAGTATAAAATCGGATAAAACAATATAATCTTAATAATTG
+ACAGTGACACAGTGTCTTAAACGTGCTAA
+>ds2020-328_317
+GGGCGGGATAGACGAATCGTCTCTCGTCCCCAAAGTAGTCTGCCTTTTGTGTCATCATTT
+AAGTATGTTGCTTGTAGTGTCCAAATGAACATGTTTTCTGCTTGTAATAGAAGCTTGGTA
+GCTCCGAATACTGCTCGAATTTTGTCAGGTTCATCAGATGCGACAACATGTGAGCGTGCG
+TGTAACGTGCTCCAATAGTATGGCACTGGCTGACCATCTTTCCAGAATGGAGTTAATCCA
+TCCTTAATAAAGTGGATGAGTGATCGGTT
+>ds2020-328_318
+GGTCGGGATAGACGATTTTCCTTTCTTGGCTGGGCCAACCGATATCACCTCTGTTTTAGA
+AACTATCTTCCTCAATTTAATCGCTATTAGCGCTGAATCCAACTGTTAGCTTTTGGTTCC
+TGCTGCAATTTCAGAATATCTGACATTTTCCTGTCCAATTCAACTTGTGTGTCACGGATT
+TCCTTATTCAAAAGCAAGATGGCCTTCACATCCTCTTTTAGCTGCAGCTTCAATCTCTTT
+AACAGTATTACCCCCCGTCTATCCCGACC
+>ds2020-328_319
+GGTCGGGATAGACGATATTGCCCTCTTTTCTTCCTAGACTATACTAATTCAAAATCTCTC
+TTATTAGCATACTGTTGGGCTTTTGCGGTAACCGCGTGCATTGAGACCCTTCATACCTTA
+CGCACTGGGAGGAACACTACGCTTTCACCCAAGAGTGTAAGCCAGCGTCTCAGCCATGTT
+CAAAAGCGTACCACAGGTTATCGCTCAGCCAAGACTCAAGCACTCATATGGATGAAGGGG
+ATACATCTAGCTGACGTCTATCCCGACC
+>ds2020-328_320
+GGTCGGGATAGACGGGTAGGTCGGCTACTGAGATCAACACCACGGTTGGGAAATCGAACT
+GGAGTTGGGTGGTGGCCTGTGAGAGTCAAGTACTTCATCAATCTTGGGATGTTATCAGGT
+CGGCCCTATCATGCTGGTTAGATAAAGAAGTTGAGCTATTTCCATATCAGGTTAACAGGG
+CTTTCTTTGTTTGTGAAAGTAAAGAGGAGGCTCTGAGAGTAAGCAGCGCTGGTAAGCTCG
+TGATGGAGGTTGTTCGTCTATCCCGACC
+>ds2020-328_321
+GGGCGGGATGGACGGCCGGGGGCTCTGGCGAAGTCGGAAGAGGATTGCAGTCATCTTGGG
+GTGGGCTTACTACTTAGATGCTTTCAGCAGTTATCCGCTCCGCACTTGGCTACCCAGCGT
+TTACCGTGGGCACGATAACTGGTACACCAGAGGTGCGTCCTTCCCGGTCCTCTCGTACTA
+GGGAAAGGTCCTCTCAATGCTCTAACGCCCTACCGGAGGCTCTGGGGAAGTCGGAATAGG
+AGAGCACTGTCGTACGTCTATCCCGACC
+>ds2020-328_322
+GGTCGGGATAGACGACGGTCGGGTTATTTCAAGAATATGCAGGTTATCCAACATCTTATG
+GATGCCAAGCATTTAAACGTACGTGCCATATTGCAGATCATAATGCAGAAATTGTAAACC
+GTTGGGAAAACACAGGCATTTTAACTTTTTGGCGTACCAATACTCCTGAGTTTGGTATCA
+AAGGCATTACAGAATCATATGCTTGTGGAGCTTGTCATAATCCTTGGAATTTAAAACATA
+ACAGTGGTTGTTAACGTCTATCCCGACC
+>ds2020-328_323
+GGTCGGGATAGACGGGGGTGAATAATCTGAAGAAGGCTATTCCGAATCCGAGGGAAACTG
+TGAAGAAGAAGACTACGAAGAAGGAAACCGATGCCTAGGCCAAGGCTGGTACCTAATTTT
+AAGTTGAATCTAAAGCTGAAGTTAGGGCTGGAGCCTGAGTTGGTGTTGATGTCCTAGAGT
+AGCGAAACTACAAGTGAAGGGGCGCTATCCGGAACCCTTAAGGTCGGGGACAATCTGCTT
+CGATTGGGACTTGCCGTCTATCCCGCCC
+>ds2020-328_324
+GCCGTGGACCTAGTTACTTACTATCTCCTCTCAATATTCTCTATGTTTTGACATGGTATC
+AGAGCAGCGATCTTGCTGACTCTAGTCTTGAATTGTTGTTACCATCATGGGAGAAGATGA
+TTTTTCCCCTGTTGGGAGTAGCACCACCGATCCTACTACTTTCACCGAATTTGCTGCTCA
+AATGGCTGAGTTGATGAAGATACAAGCATCAACATCAAATACAACCCCGACCCCGACTAT
+TACCGACGAAATGGCATCAAATACGACC
+>ds2020-328_325
+GGTCGGGATAGACGGACGGCTGTATAGGGGGATGAAGGGAGTGAAGCAATGGTTAGGTGA
+AGAATGGAAGCCAAAACTGAAGTCGGCGAAGTATGGCTGTGTAAAATAGTCGAAGCCTCC
+AGATGTAGACATCGAAGAACCAACAGCTCTCCCATTTTACCCCTGAAGCTCTCCAAACAG
+CTAGTTGAAATCCAACCAGACGCCTCTCAACCCTAAACATCCGCTAGTTACATCCCAAGG
+AAAGAAAGGGCCAACGTCTATCCCGACC
+>ds2020-328_326
+GGTCGGGGTAGACGACGGCCGGGCGTCAGGGGGGTCGAGGGCATGATGGCCAAGCGAGAA
+GTGCGACGCAAGGGTGTACCGAGGTACTTTGAGTATTTTGTCAAATGGAAGGGCCTGCCA
+GAGTCCGAAGGCAATTGGGAGAAAGAGGAGTCCTTATGGCAGTACAAGGACTACATCGAA
+GCATTCGAACGAGACGGATCAACCTCGACGACGAGGACGTCGCCGAAGTAGGTGGGGGAG
+GATGTCCCCGGCATGTCTATCCCGACC
+>ds2020-328_327
+GGTCGGGATAGACGTGCGGGGTGTTTGATGCACCAGTCCAGCGTCAACAGTTTCCTATCT
+ACAAGGTAGTAAGCCATGGGGTGTGCATTGAGTTTACAGACAAACGCATGAATGCTTCCA
+AGGTTTACAAGGAAGCACCTAAGCCAAAATCTATGTGGAAAATTGCCAATCGGCACGGTA
+CTTCAGTAGAAAAGATCTACGAAGAAATTATCTGATCTTCTATAACGGTTGCGAACTCTG
+CACCGGGCAATCGCGTCTATCCCGACC
+>ds2020-328_328
+GTCTAGTACTACATCCATATTTGAGAGCCACGTCCGCCAACATTGCGAGTTTGCCACATA
+TGACAGACTGTTATTAGGTAAACTTTCTACATTCCCAAACCATGAACTTTTCAATTTTCT
+GGCTCTACCAAATTCACTTATCTCTTCACTTTCGTTCCAACGTTCTATATTAAGATTTAC
+CCGTTTTGTAAATTTGTTATTACCGTTTAACATGCTCACTTTTTCCAGACCGCATGTCTC
+TAAATTTGATGTTATAGCTTCTACATT
+>ds2020-328_329
+GGTCGGGATAGACGGGGGGATAGCTTAAACATCATCTCCTCCTATCCCGGTGGGAGTACT
+GAAAGAGGGTGTTACGGGCTTCTTCTTATAAGAAGGAGGGCTTTAGGGCTTAACTAAGTA
+AGAGGGAGGGCTTTAGGGCTTAACGAAGTAAGAAGGAGGGCTTTAGGGCTTAACTAAGTA
+TTAGTTAAGGGCTCGGAACTTCTAGTAAGTGAAGGTCAGCGGGAGCTGCTATCGGTAGCG
+GAAAGGGCCTTGTCGTCTATCCCGACC
+>ds2020-328_330
+AGTCGATAGCCATTGTAGTCTCGCGACAGAATTACGGCGGTCGGGATAGACGTGCGCCGT
+GGATAAAGACATAAAAAAAAATTACTGTAATAGTGGATTCGGAATTGTGGTGTAACCTCC
+CATTGCTCTATCTCCGATAGCATGCAGCCGATAATGAGGACAGATATATAGAAAGTGTGC
+AGTGAGGGATCTTTATAGGTAACCAGTCTTTACTTATCTCGACTCAAGCTTTACTTAGCC
+CAAGCAATGGGTGCGTCATCCCGACC
+>ds2020-328_331
+GGTCGGGATAGACGACGTCTGGGAATCTAAAGTGACCGGAGCGGCTTTTCTGTATGGATC
+GACGTCTGGCCCCCCATTTCTCGTGTTTTTTGGCTTAACATTTATTCGCTATGAAACTGA
+CAGAGATGTAAAGGCAGAAGCCTTGTGGTGCTCTTTGATGGCAAGGATGCTTTAACTTGC
+ACGCGGTAACCCGTATTCCGTATTCCTGTTGAAACAAATCCATTCTTCCAGAACCTGTTG
+GAAAAGCTCACTACTTCGTAGCCTTT
+>ds2020-328_332
+GCCGTGGACCTAGTCGGTGTTGGGCTGAATGGAGGCAGCAGAATATGCGACGACGATCAT
+AGTAGAACAGGTCAGGGCGGCAGTGAGGTCAGCATTTCCGGCCGCCAAACCGAGCACATT
+CGACGACTTCATGGACGATGCTTACGAGTGGCTGGTCTCGGGATCTTCTGCAGGGATGCC
+AAGTGTATTAAAAAACACAACTGACCCTGTAAGGGATTTTATACTCAAAGATTTGGGATT
+AGCACCGAACAACGTCTATCCCGCCC
+>ds2020-328_333
+GGTCGGTATAGACGGTCGCTGGTGGTGCGAGCTGGGAAATGGGGTGTGCTGGTGAGTGAT
+GTGGAATCGGCGGAAAAAGAAGTGCTGAATGTTTCATCCAAGGAAGTAAGGCAGATAGAG
+AAATCTATGGCATCAACAAGAGAGATGAAGAAATATGTGATAGGTAGGAAGTAAATAGCT
+TAATAGCTGTCACTTGACTAGAGGTTTGAGTCTAGGTCAGGGACGAGAGTTCATAAGGGG
+GCTTAAAACGCGCGTCTATCCCGACA
+>ds2020-328_334
+GGTCGGGATAGACGAGACAGTTGCATCTATACTATTGAGTTGAGAGAAAGAGAAGATGGG
+ACTAGTTTGCTACTCCCGCGGGCCCTACTTACGTAAAGCTTATCTCCTCCAGGAGGCAAG
+GGATTGCTGCTTCCACAGCTGTCTCCACTCGGTCAAATGCGTCCTGCCTTGAACGAAGAT
+GAACAGAGACTCCTTGGGACGTAAAGTTCGGATCTTGGCCTTTCCTATCTGCCAACAAAC
+ACCTTGCGCGTGCGTCTATCCCGACC
+>ds2020-328_335
+GGTCGGGATAGACGGATCGGAGGCATTAAGTAAAGAACAGTCTATGTCACTAGATTGGAC
+AATTGAGTCAATCTCAGACCAAGTGGTAAGGTTTAATGAGTTAGGAAAAACAGAAAGAAT
+AAATGGAACCTTATTAAGCGGATGGCGTCTGACCTCGTTTATCAATACTGTATTAAATAG
+AGTGTACTTGTTAAACTCAGGACTAAGTACGTGTGTGAACTATGCGTTACACAACGGTGA
+TGAGATGTATGCGTCTATCCCGACCC
+>ds2020-328_336
+GGTCGGATAGACGTGTTGGCTGCTTCAGCAAGAAGCTTGCTGTCTGCCCAAGGAATTCGC
+TTCGACTTCCTACTATTTCAAGGGATCACCTTTCTAGTTGTTGGCCTTGGTTTGATAGGA
+GAGCAGGTGAGCTGACCTCCTCAGAGTAATGCTTTCAAGCGGTGTTGAGTGCTTTCCCGG
+AATGTACCATGGGGCGGGTACTTTGATCAGAGCTTTGAAATCCATATCGGCGCGCCGATG
+ACAGAGCTGTCCCGTCTATCCCGACC
+>ds2020-328_337
+GGTCGGGATAGACGAATGTGCGGCATGATAGGTGGCGTAAGCACGGTGTAGCTAACAATG
+TTAGTGACGAAGAATGGTCGCAACTGTTATATATGCAGTCACTATATGGCAGAGGTGGTG
+TGGTAGTCGACTGGCAGAAGGAGTTCGAGGGTAAAGCGAGGGAGCCTGAGAATATTTTGG
+CGTTCAATGGTTCAGTGTGGTCAGCAGAATATGCGACGACGATCATAGTAGAACAGGTCA
+GGACTGGCAGGCGTCTATCCCGACC
+>ds2020-328_338
+GGTCGGGATAGACGTATCAATACACTGGTCGGGATAGACGTACAAGGGGGTTGTTGGCCC
+ACGCTACCGTGGAAGGAATGAAGAAGGGGATGTTGGTCCAGGGTAAGGATCTGAGTGCGG
+AGGAGCTGGCGGAGTATCAAACTTGCCGCAAGATCATTGCCACCGCGGCGTTCCGAGTGG
+CGGAGATCAAGAAAATGATCAATGAGTACACGGGTACTGTTGATAAAGCTATCAAGAACA
+TACAGGGGGTACGTCTATCCCGACC
+>ds2020-328_339
+GGTCGGGATAGACGCCTGTATCCATTATGCTCTCTTCTTCATTGCTAAGAAAGAAAAGAA
+GAACCTATCTATATAGTATAAATAAACTCTTGTTTTGCATCCGGGTCGATAGCTCTCCAA
+AGTTCCGACTCTCTCTTTCTATATGCAATAATTTGAATCACCTACTTGGTACGCCCCTTC
+TGGCACAACACACATCCCCACTCACAAGAGCACACCTGAAATTCGGATAGAGCACCTCAC
+CTCGTCTATCCCGACCGCCGAATTC
+>ds2020-328_340
+GGTCGGGATAGACGAACGACCGTGCTGAATGAAAAAGTTTCCCCCATTCAATTTGTAGGG
+ACAACCCCTACCTCCTCTCTTCTAGAATGCTTTTAGGCGTTCTGGTTTTGCTTCTCATTA
+AGAAGCACACCGGGCTGCTTAGTCGGGGTAGGCAAGCGGTGTGCTTTAAGAGTAAAATAA
+TTCATATCAGAATGAAACGTAAGCTTTCTATTTTTCAGTACGGATCACAGTTTGATCCAA
+CCGGTCCCCCACGTCTATCCCGACC
+>ds2020-328_341
+GGTCGGGATAGACGAGAGTAGTTGGTGTCCGGAAGTAAGATAGAGAAAGTGATCGATCAA
+ATTGAAGGGAGTGGTATGGTACAATTACAAAATGATCCAACTGAAATTGAAGATCCATGT
+GAAGTATTTGAACCCGCACAGCCTGAAGTTGGATTGAGTGTGCAGGGAACAAGGGATGTA
+AAGGAGACATTGGATCCGCCCGTCTATCCCGACCACCCGAAGATTTCGTCTATCCCGACC
+AGAGAGCATGTACGTCATCCCGACC
+>ds2020-328_342
+GGTCGGATAGACGCTTGATTCGCCTACTTCAATCAGATCTGCACCAATGGCAAAAGCAGC
+TACAAGATAGGAGGAGTTAGAAGGTTCCGTTGTGGGATTGATCAGAAGATTAGGGAGTAA
+CTCACTTAGTGCTCTTATGCCAAGGAGTCGCTTCTAGTACATATCTCTTCCAAACCTTGA
+TACGAAATAGCCCCCTCTTCTCTAACAAGTCTTTTTCGGGAGAACTGCATGCTCCACGAA
+GGGCGTATGGACGTCTATCCCGACC
+>ds2020-328_343
+GGTCGGGATAGACGAAAAAGCCCCCTGGTATGTGCCGCTTTCCTAATCAAAAGATAGGAG
+AGCACCCCTTCTCCCGAAGTTACGGGGTCATTTTGCCGAGTTCCTTCGACATGGTTCTCT
+CAAGCGCCCTAGTATACTCTACTTGTTCACCTGTGTCGGTTTGGGGTACGGTCAGTTCAC
+CGGGAGGATCGCCCTCCCAATTCGAAGTTTTTTCCTGGAAGTTTCAACCTTGTTGACTAT
+GACAACGACGCGTCTATCCCGACC
+>ds2020-328_344
+GGTCGGGATAGACGTCTACTACCCCTCTTCTTATGGTGTATCATCCGCTTAAATATGAAT
+GGTAAAAGGAAGAGCTACCTCTCCCATATGCGTCTCAATTTCTTTCATCTTTCCCTCACC
+CACCGGTCGAATCTAAGGTGCTTATAGCGCCTGGTCAACTACCTACTTCTCTCTCGATTT
+GGTTGATCGCAAGCAAGCTACCTTAGCGCAGCGCTCACACCTGAACCCCCCGTCTATCCC
+GACCGCCGTAATTCAGATCGGAAG
+>ds2020-328_345
+GGTCGGGATAGACGATATAGAGCGTTAATGGCTTGCGTTGTCAAAGGACTGTCCGATTGA
+GACAATGTTAACCATGCTGGGTAAAAAGGCAAGGATTGATAAAATTGTAGCGTTGAGTCA
+GTATCTTGAATGAGTAAAGGCTTAACTTGACTCTCTTTGGCACGTATTTGACCGGCAACC
+TGTTCAACTTTGTCTTTGGGTACCCCAAAGTAAGCTTGACCGACCAAATTAAGCGGACAC
+CACACTGACCGTCTATCCCGACC
+>ds2020-328_346
+TGAATTACGGCGGTCGGGATAGACGGTCACTTTGGGTTGTGCAAGGGGGCCATGGAGACT
+AGGTTGCTGTTTAGTGTGGCTTTTGGTAGTATTTGGTTTGGGAGGTTGGGATACACGTTT
+CTACGTGGAAGTTATGGGGTGTCGAGAGGTACCTACACAACCGTTATTGAGTACCTTGGG
+TCTTTTTCGTTGACTGAAGTTGAAGAAATTGTAGGAAAATACAAGAAAATGTGCATTACT
+CCCCCTACGCGTCTATCCCGACC
+>ds2020-328_347
+GGTCGGGATAGACGGTGCCCTAGGATGAACGAAGGAGAATGGTAGTCCCTACTAAGACTG
+TGCCTCTTGTGCACCTATTATGCTATTCATACAGGTGATCATGAACGACAGGCTCAGGTC
+AACGAAACCGCTTCTGCGCCTCTAGTCCACCATCAAATAAGGTCTTCATTGGTTCTATCC
+TGCCGCTCCATCATCGGTCAATTTCGCCAACCACAGCCCGCCATACGCAACCAAAGCACG
+ACGACGCGTCTATCCGACCGCCG
+>ds2020-328_348
+CTGAATTGCGGCGGTCGGGATAGACGGCTCAAGGGTTTCTATACAAAGCCCTTCTCTTCT
+TCACTCAAAGGGGCAATGCACTCTTTGAATGGTACTTGATTCATAAAGAATGAATCTTTT
+GGTTAGAAGTTATACGGACTTTATAAAAGTAAATGCCACGTTCCGCGTGTCACGAGATAT
+GGGGCGTTCTAATCGAAGGGTCGTACTCCTCGTCTCGGCCCTATTAGGGTAAGGCCAATG
+CACCAGCCAGCCGGGGTGGTGG
+>ds2020-328_349
+GGTCGGGATAGACGCTCACCTACCCTCAAAGGCACGGTTTTACGTGATGTAGTTTCTACA
+CAACATGGGGGTATCCTACTCAGACTGTGAGGGAAGCCAAATTGGGACTTACTCCCCCTC
+CAGGGTACCAGCGTTGGGGTGGCCTCTTGCCCCAAAGCAAAAAGGTACGACACCGGGTTC
+GTGATCAAGACATCACAAACTCATCCACATGATCCCGATCTTTTGGGACCATAGAAAGGC
+ACACGGTCCGTCTATCCCGGCC
+>ds2020-328_350
+GGTCGGGATAGACGCGAGGTGGAGGTCCTAGTTCTAACTAGGACTGTCATAGGAGCTAAA
+AGAAACTCAAGATAGAGGAGCGGGTTTCCACTGTTAACCGTTGCACACGAAAGAGGATCG
+GAGGCTCCCCCAACCTCTTAATCAAGGGGTTTTGAGCCCCATCTACATCCATGTCAGCAG
+CATCACCCGGGATTATATCCATTGACTATTCATACCAGGTCAAAGGAAAATCGAAAAGAC
+CAACGCCTCGTCTATCCCGACC
+>ds2020-328_351
+GGTCGGGATAGACGACGAGGGGCAGTATTGGGACGAACAGTTGCCGAGGTAGTGAACTAC
+TTTGACAACAAATGTTCGAATGCACTTGAGGTTATGGCAGACGATAAATTTAGTGTATCC
+TATCATACTTACTATGACGTAGATAGGCCAGCTGTGTTGGGTTTGAATACAATGACTGTG
+AACGTACCGGTATATTGGACGAAGTTACCAGTAAAAATACAGCCTTACACATCAGAGCTT
+ACCAGGGCGTCTATCCCGACC
+>ds2020-328_352
+GGTCGGGATAGACGAGCGGAAGGTGTTCAGTGTACCTTAGTACAAGATCGAAAAGAATGC
+ATTGGATGGATGCCCGGGCATTGAGAAGGAAGGACGCTTTCAGAGGCGAAAGGCCATGGG
+GAGATACCGTCTGTGATCCATGGATCTCCGATCGGGAAACCGTATCCAAGCTCCGCGGCT
+AGTCTGCGCTCTTTGGACTTTTAAAACTTAGCGAACTGAAACATCTGAGTAGCTAAAGGA
+AGGCGTTCGTCTATCCCGACC
+>ds2020-328_353
+GGTCGGGATCGACGAACAATCCCCGTAAAATCCTTTGTTCCTCTCATTTATACTTTGGTT
+TATATTCTCCGCTTATTTATCTTTTGTTTTGATTCTATTCAAATATAAAACTATTGATTC
+GTTCTATATCATACCGTTTGAATTTGGATTGAAAAAACAAATAAATAAAGAAGAGTTAAG
+TAAAATCAAATAGTCTTCTTCACAATATACTATGACCAGTAATGCGGTATAAGTAATTCC
+CGAAATCCGTCTATCCCGCCC
+>ds2020-328_354
+CTAACTCTAAATCTCTTACTTGAGTCGTATTTTTGCCCTTTATGAAGTCTCGTTCGACTC
+CTGTAGAGGGAGTCTCACTCTCTTTCAGCATTCCTTCATGGATGTTTAAGTTTACCTGTT
+GCTTAAGGAATCCCGTACAAACAAGATAATGAAACCAAACCCCTTTATACCGTTCGACTC
+CTTTCCTAGTCCTAGCGCTGGATAAATCAACTTACAATCGTGCTTGTTCCTTTACAGTAG
+ACCGATGCGTCTACCCGAACC
+>ds2020-328_355
+GGTCGGTATCGACGTATGGGGCTAGCTTGCTTCTACTGGTGGCGGGCGGGCGAAGGGTCC
+AAAGGACACGTAGCCGGGGGCGAGTCACAAAATCCAATAGTTCCTCCTTAGCGCAAGCAC
+TAAGTAAGCAAGCTACCTCCCCCTATGGTCGAGCAAGTAAACTACCTTCTTGTTCATCAA
+TCGGAAATCAAGACAAACCGGGCACTACGGTGAGACGTGAAAACACCCGATCCCCTTCCG
+ACCTCGATATGTGGAATCACC
+>ds2020-328_356
+GGTCGGGATAGACGTAATTGGCCTTTCTTCTATTCTAGTCCGGATATCTGCATACCATGC
+CGGCTGATCGGAAGCTACATTCTTCCATCGTACAGCAACAGTAGTTCCTTAGCTGCCATC
+CATAGCTACATTATTCGACTAGACTAGTAAATTCAACTAGCTACCCCATGTTCTAACATG
+AAGTCTGCAATGGCTGTATCCATGCCTTTAACGGGAACATGCGGATACATTAGCAACTGG
+AGGAGTGCGTCTATCCCGACC
+>ds2020-328_357
+GGTCGGGATAGACGTGTGCCCTCTCTCCTCTGTTTATGGGATTGCGGCAGCGTATTGGTA
+TGTGGGAAGATTTGGGCAATGGTGTACAATCTCAAAGTTGGAACATGCCACTCGATCAAA
+GTCACTTCGATTGGCATGTGTCATTGCGCATGCTGTCTGTAGCTTTGGACGCTATCGCCA
+AGCTCATCCGAAGACGCGCAAGTGACAAAGTGAGACGGGACTTGCTATCTGTGTTACGCG
+GTGTCCCCGTCTATCCCGACC
+>ds2020-328_358
+GGTCGGGATAGACGTCGTAGATACCTTATCAGATAGAGGGGGGCTCAAACCTCTTCCTGA
+CGGAAATACCACCATTGAGGGAAATTCAGACTCACTCTTGGTATCGATTCTGAGAAGACT
+TTTGCCCCACCGGCAAAGGTTACTTTTGTACGGGCTTGCAGTTGTTGCCACGGTCAGAAA
+GTAGTCTTTGTTCCGGGAATGCTTTTCAGAAAGGAAAACTACGGTTAAAAACTAATGCAG
+AGCCGCCGTCTATCCCGACC
+>ds2020-328_359
+AGGGTATTGAGGTTGTGCGACACTAGGCCTGGCGTCCGCCTAATTAGTGGGGAGACATTG
+ATGTACGCGGTCAGCGGGGTAAAAGATCACCAGAGATACCTTCAAAAGTAAGTGACCAAC
+CGGGAAGTCGCTGCCGTTTCTAGCTTTGCGGCTAACGAATGTGGGAATGAGTTCGCCCCT
+ATGGGCGAGACTCCCATCCATCGGGTCTCCAAGCAATGATCACTCAACTTTATCAACTCT
+GCTCGACGTCTATCCCGACC
+>ds2020-328_360
+GGTCGGGATAGACGATGATGGCCGCTGGTCGGGATAGACGGTGAGACCCCTGGTCGGATA
+GACGTCCCCGCGCCCTGGTCGGGATAGACGATGCACTGGGGGTCGGGATAGACACAAGGC
+GCAATCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCGGATAATTAGTAGGTCCACG
+GCAAGGCTACACTGACTAGGTCCACGGCAGGCGGCTACAAACTAGGTCCACGGCAGGTAG
+TTCGCAACTAGGTCCACGGC
+>ds2020-328_361
+GGTCGGGATAGACGTTTTTGGCACCTGAGATCATTAAGGGCGAAGGTCATGGAAGTGCTG
+TTGATTGGTGGACTTTTGGAATCTTTTTATATGAGCTGTTGTTTGGTAAAACTCCTTTTA
+AGGGTTCTGGGAATCGTGCAACATTGTTCAACGTTGTTGGTCAGCCTCTCCGGTTTCCAG
+AATCACCAGTCGTCGGTTTTGCAGCAAGAGATCTCATAAGGGGATTGCTTGTAAAGGACC
+CCGCCGCGTCTATCGCGACC
+>ds2020-328_362
+TGGTGGGATAGACGTCCTCCCTTAGTGTTACCCAACCTTCAACCTGCCCATGGCTAGATC
+ACCGGGTTTCGGGTCTATACCCTGCAACTTAACGCCCAGTTAAGACTCGGTTTCCCTTCG
+GCTCCCCTATTCGGTTAACCTTGCTACAGAATATAAGTCGCTGACCCATTATACAAAAGG
+TACGCAGTCACACAGATTGCTCTGTGCTCCCACTGCTTGTACGTACACGGTTTCAGGTTC
+TTTTTCGTCTATCCCGACC
+>ds2020-328_363
+AATTACGGCGGTCGGGTAGACGGGGCAGAGAAGTAAGGGAAGCATTAAGTAAGTAGAGCG
+TGAAGGTAGGGCATGAAGGAAGCATGAAGCTTGCGGACCGAACTCTCACTCGAGAAGGGG
+AAGAAGCACGGCAGTCTTTTGGAGAAGCTTCACCGATCCGACAGCAGCTCTAGCTCTTCG
+AGCGATGAAGAGGGAGGTGAAGGAGAAGAGAAAAAGAAGAAGAAGAAAGAATCAGTAGTG
+GCGGCCGTTGCTGTGTATT
+>ds2020-328_364
+GGTCGGGATAGACGCTGGCGCGCCATCGATCAGGCTGAATTAATGGCGGATTGCCAGATT
+TCTTCTGTCTATCTGGCCCTTTCTGGCAAGCACATCAGCTGCCAGAACGAAATCGGTATG
+GTGCCGATTTCCGAAGAAGAAGTGACGCAGGAAGACGTTGAAAACGTGGTGCATACGGCG
+AAGTCCGTGCGCGTGCGCGATGAACATCGTGTACTGCACGTGATCCCGCAGGAACCCGGA
+TACATCGTCTATCCCGACC
+>ds2020-328_365
+GGTCGGGATAGACGTTGGTCGGCAATCTGCAGGCGTAGGCTTGCTTGCTTGCTTGACTCG
+GCGGTCACTTTGTCGGTCATCTGCGGTATCTTGATGAAGGCGCTTTTCACGAAATTAATG
+CCGGATCGGTCCAAATCGAGGAGATAGTGTCCACGTGGGACTCTCTGGAAGACAGTTTCT
+TTGCCAGATATCATTTCGAAGGTGGGTCTGTCGACTTTTGGTGCATGCTTACAAAGGGGC
+AAGTAGCGTCTATCCGACC
+>ds2020-328_366
+GGTCGGGATAGACGGAAGAAGCCTTTTTCTTCCTTTCCGTCTTTAAACCAACTGCGAAAT
+GCCTTTCTAATTAAGTTGCAAAAGCACTAGAAACCATCTGGAGCTATGTATATTAATGTA
+GGTACGCTTAGCGCTTGGTAGGTCAGGAGCAGAGCTTGTAGTATAGTAGTTCCAAATCCA
+ACTTCTAGGGCATAGGTTTTCCTAACCAAACTAACAACTCTAGTTTATACTGAGGCCATC
+TACCCGTCTATCCGGACC
+>ds2020-328_367
+GGTCGGGATAGACGCCAAGATCTACTTCGGAACAGATACCTTTCCACCTACCTCTCTCTA
+ACAATTACTTGTAGAGACGTATGCTAGGATATTCCATGTTTCCATGGAAAAGATCAATGG
+TCTTCCGACCACTTGAATTGACTCTCTATAGTTGTCTAAGCTATAGAGAACCCTTTCTTG
+ATGTCACCATCAAGAAAAGATTCCGTTTCGAAGGCATTTCAGCCTTCTCATCAGTGAGTT
+CCATCGTCTATCCCGACC
+>ds2020-328_368
+GGTCGGGATAGACGATGCGCACCTGTCTTTGAAGAATGCTGCGAACCCGGCCTAAACGCT
+TCCTGAGACTCAACCCTACTTCGTCTTCGCCCTCCAGCCTTTCCAGTAGTGGATTCAGCT
+CATATTATAAATTCTTACTTCACGAGAGAGATACTCACTATTGAAGGGTATACCCACGGG
+AGAGATACCGAAACTAGAAGCTTTGTTGCACCGCGCTCATTGACTTTCTATCAGAGGGGT
+TGACCGTCTATCCCGACC
+>ds2020-328_369
+GGTCGGGATAGACGTTGTCCGGTAGTGGTTCTGGTTCCAACATCTCTAATTGTGATGTCT
+GTGTAGGTTTTGTCAACGACGTGCCAGCGGTCAGTCTTTCCACGTGAAAACCCGGCGCTA
+GTAAGTCAAACTTGACGGACAGCCTAGCCAACACATCTTTCACCATGTCACTAGCCTGGG
+TGTATGATCTAGGAGTAGGCATAGTGAAGTCATCATATGATGCAACTGCAGCACACCAGC
+TCATCGTCTATCCCGACC
+>ds2020-328_370
+GGTCGGGATAGACGGTGTGGTGGCTTTCATAGTTGCTATTGGGAGGCAGCTTTCGAGTAT
+ATTCAATTGATTTTTGGTATTATTTAGTTTAGGTCAAATGTTCTTTAATTGTACTTCTTT
+TTTCTATGCCCGCGGGCCACCACATATCGTATCAAACTATTGCCCTGTTTGCATTAATGA
+TGGCCTTTTTTATCTCATTCGTATTCCGATCGAGTTTTTTTATGAAACTTGAAAACGTCT
+CTCTCGTCTATCCCGACC
+>ds2020-328_371
+GGTCGGGATAGACGTGGGAACCGGTTGTATGATATCATATTTGAATTGTAACAGGATATT
+AAGTAGACTACTGAGTCATAGCCCGTTGTTCATGTCGGGGAGAGTTAAATTGGAATATAG
+ATTATATATTGTGAGGTGCCTTTTTTATAGCAGCAACCAAGCTTGAAGGCATTTTGTTGC
+TATGCAATTTAGGCGATGGTGGAGCATATGTTATTCTGGACGCTCTGGCTATACTTGCGA
+TTGGCGTCTATCCCGGCC
+>ds2020-328_372
+GGTCGGGATAGACGCAGCCTACTTCTCCAGTGTCTTCAACATCAAACCTGTCCCGGTTCT
+GTATCGCGGCGAGTTCGACCTGAAGACACTGGAGAAGTTGGCTGAGACTATTGACCCCGT
+CTCGAAGGAAGGCTTCGTTGTTCGTGTCACCGACCGAGTTGCCTACGATGAGTTTGACCT
+GAAGTTCTCCAAGTGGGTGCGGAAGGGTCACGTCCACACCGACAAGCACTGGATGTCTCA
+CATACGTCTATCCCGACC
+>ds2020-328_373
+GGTCGGGATAGACGCCGCAAATCCCAATAGAACGAAGAACTTACCCTATTATTATATTAC
+CCAAACGAGGAGATAGACTATCAGCTTACCACTTACTTAGATACGGCTGAAGCAGAGCCG
+GGGAACGAGACGGGTTGAGGTTGAACCAGGAAAACAAGCCACAAAGACGGTGTTTGAGCC
+CGCTGCCCCTTTCTATTACAATTTCTTTCCCTACTCCTTAACCTTGGAGCTCTAGATAAG
+ATCTACCCTTCAGTGAG
+>ds2020-328_374
+GGACGGGATAGACGACGGGCTCGGTTGCTCCAGGTAATTTCCTCCTTCGTAACAAAGTCA
+GTATATGCCAGACGATGTAAACTTTGTATTCGACAACGACCTCCCGGACGATGATGTGTT
+GGTTCATCCAGACATCACGGCGTTGGGCTCTCCGTCTTTAAAGACGAGACAACGTCAGTT
+CCGATCCGGAGCGTTATTTTCTGGTCCCGGTCTCAAAGAGATCGCTCGATATGGTGGTTA
+CTCCGTCTATCCCGACC
+>ds2020-328_375
+AAAACCCCCCTCAGCAGCCGCGGTAATACGGAGGATGCAAGCGTTATCCGGAATGATTGG
+GCGTAAAGGGTCCGCAGGTGGCACATCAAGTCTGCTGTTAAAGGACAGGGCTTAACCCTG
+TAAATGCAGTGGAAACTGAAGAGCTAGAGTGTGGTAGGGGCAGAGGGAATTCCTGGTGAA
+TTACGGCGGTCGGGATAGACGACACAGCTCCCTGGTCGGGATAGACTATATACCTGCCTT
+TTACGTCTATCCCGACC
+>ds2020-328_376
+GCCGTGGACCTAGTTTACATTTATCTGCCTGGACCTAGTTAATTTAGCGGTAATAGGTCC
+ACGGCACTGTACCGACTACTAGGTCCACGGCAGGCAAAAGGCGACTAGGTCCACGGCGGG
+ATGCGATAACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGACT
+TTTGCTGCTGGTCGGGATAGACGCGCTTATACCCTGGTGGGATAGACGGCCAGTGCGCTA
+TTCCGTCTATCCCGACC
+>ds2020-328_377
+GAATTTCACCTCTAGCATGTAAGTACTCATGCCCCCGACTGCCCCTATTAATCATTACGG
+CGATTCCAAAAACCAACAAAATAGAACCGCACGTCCTATTCTATTATTCCATGCTAATGT
+ATTCGAGCAAAGGCCTGCTTTGAACACTCTAATTTTTTCAAAGTAAAAGTCCTGTTTCCC
+CAGCACGCCCAGTGGAGGGCATGAGGTTCTTCAGAAGGCAGGCCCGGCCGGACGAGTGCT
+TCGTAGTGGCGGCCGTT
+>ds2020-328_378
+GGTCGGGATAGACGCGGCATGCACCTCCAGTTAAACCATAACTCACCAACAAATTCTCTG
+TCTGCCAGTATCATCTCAATATTGTCTTTACCAAACTGCTTGATAAAGCGTTCAATGAGT
+TCGGCTTGCTCAAGATGGTTTGTGTTACCCCGTTTGTCTAGCATGTCCCAGTACAGTGGT
+ATGGCAATGCCCTTATAGACCACCCCTAGCCCAGTTAAACCATAACTCACCAACACGTTC
+CCACGTCTATCCCGACC
+>ds2020-328_379
+GGTCGGGATAGACTCCCCTACCCCCTACTCTAGTCAGCTTTCTATCTCTTTCTCCAACCT
+TCGATGATCCTCCTGCGGGCAAATCATCGAAGTCAAGAAGAAGTGATGGGCCTGATCTTC
+CGATATCGATATCAGATCCATAAGCTAGCTCTTGGTTAAGAAAATCCTGAATATGCTGAC
+CCGGGTGCAGTAAACGAACTTATATTCTCTTCCCTCCCCTCTATCCCGACCAGGGTGTTG
+ATCGTCTATCCCGACC
+>ds2020-328_380
+GGTCGGGATAGACGAGAAACCCTCCTGATGTATTTTAGTATAAATGTCCGCCATCTTCAC
+ATCAATTCTAATTTTTACAGTAAAATTGCTTTGCAGTAATGGAGGTAAATTTGCCAATCT
+CGGACTGACGGAATCAGTGATCTGATCATAAGTAGAATGAATTATACCTCACCGTTGCAT
+TATTGCAAAATCGTGATATGACATTTCAACTACATCGTAATATCTTTTGAAAACCGAATG
+TAGCGTCTATCCGACC
+>ds2020-328_381
+GGTCGGGATAGACGCGCCAGCTGATGTATCAGTTCGAAGATACTGACCTACTTCGTGCCA
+ATCACACGGTTCTTCACGGTGACTAAGGGTGAACCTCTCACGTGTAGCAGAGACCGCCTT
+GCGCAGCAAGGTTGATTCGCGTTCAGTTAGATCAGACCAACGTTTGTGTTGGCCTTCAAA
+CTTCATCAAAGAGTTATACAGTCCGGGTAAACCGGCACCTCTTCGGGTAAAACCACAATT
+TTCGTCTATCCCGACC
+>ds2020-328_382
+GGTCGGGATAGACGTTAGAGCCGAATGGAGCTCAAGAGGTCTCTTGAATTGCTCATAAAG
+AAGACGGAGGATGAAGGAGCAATAGTCATTTCCAATCCAGAAAATCATTGTAATAGAGTG
+TATCTCAAAAAAAGGGAGTAAGGGAAGCAGTTTTAGTATTTCCTCACAACTCCGAATTCT
+CAAAGAAATCTCTAAGAAGCCTCATCGTCATCGGAGTTGACCTCCACCCAACGCACACCA
+CCGTCTATCCCGACC
+>ds2020-328_383
+GGTCGGGATAGACGCGTAGCCCCCCTGAAGAAAGATGGTATCGTAAAGTAGAGTGGATTC
+GACGGTATGCCAGTTGCGTATAGAAAGAAGTTCTACGATTTCATGATGCAGCACGGAGTA
+TAAAATCTCCGTTAGTTCAGTTTCTGCTTTTTCCCTTATTTCCCACTCCTTATGTCAGGC
+AAAACCTGACCACGCGGACTTGAAAGAAAAAGCTTCGATGCATGAGAAGAGGACCGGGCA
+GCGTCTATCCCGACC
+>ds2020-328_384
+GGTCGGGATAGACGACGTGTCCACTGGTCGGGATAGACGACACATTTCCCTGGTCGGGAT
+AGACGTAACAGGGGATCAGATCGTCTATCCCGACCGCCGTAATTCATAGGCAAGTGGACA
+CGGAAATTCAACCATTCGAATTCGTAACGGAGATTGATCAACAAGGTACAGGTACTCCAT
+TATTCCAATATCACTTGACGTTTGCAGCTTACTAAGGAGGGGACTACCAATATATGCGTA
+ATAGTGGCGGCCGTT
+>ds2020-328_385
+AAAGAAGAGCAGCAGCTAGCCATTGGGGTGAAGGATAGACGGAAGAAATGACAATAATGG
+AAAAACAAATACTTAAATGGACTGTAGAAAAAGCAACAGGCCAAAAAACACAGAAGGATA
+AAACAGTAGAATTTATGTCGGAACTAAGAAAAATAAGACAGGCTGACGGTGGGTTAGGCA
+CAGCAAAAACTATATACAAGGGAAAAATACCTATGAGAAATGGGTTGCCAGACTTAGCGG
+ACGTCTATCCCGACC
+>ds2020-328_386
+GGTCGGGATAGACGTTTAGTTGGGATGTTCTTGTTGCTGGTCTTTTTAAACTTCATTTTT
+GATGAAAAAGAAGTGATGTGGTTTGAATGGCTAGAGCATAAATTGGCACGATTTGGCAAG
+GTCGATGCCATGAGCGTGTTTGTCGCCTTGGTACTACTAATGACCAGCAACAAGAACATC
+CCAACTAAACGTCTATCCCGACCAGGGGAAGCTACCGTCTATCCCGACCAGGAGTCTTCT
+TCGTCTATCCCGACC
+>ds2020-328_387
+GGTCGGGATAGACGTATCGTGTGCCTAGACGACTACAACTATCAAGTCAAGTGCTTAATT
+GAAGCTATTAAAACTGGACCTAGTGCTTGTGGTACTAGTATAAATGATAAAGGTGTATAT
+GATATCTTAGAAAATCTAATCAGGTGGACAAGGTCTCAGAGTGCTGATACATCAGATGAC
+AAGAATAAATTCTTTGAATTTGCTACCAACGTATGGCACTGCTATAGTTATGATGATGAC
+CCGTCTATCCCGACC
+>ds2020-328_388
+ATAGTACGATAAAACATCTTTCTGAAAACGGATCGGTAAACGATCTGTAGCAGAGGATAA
+ATCAAAGCTGTGGAATTGGTGGTCACCCAACATGCCTAATAACTTTTTATTTAGAAGAGA
+AATCAAAGGGGCACCTTGATTAAAGGTACCATCCTGTTGAATTCTTCTTAAAATAGAGAA
+GATATAATCATGAAGGGGCTTTAATATGGATTGTGTTACACAATCAGTAATAGCAAAGGA
+GTAGTGGCGGCCGTT
+>ds2020-328_389
+GGTCGGGATAGACGAGGGGTGGATATGGGGGAGAAGGTGGAGAGTCTGTGACGGGAGATT
+TAGAAGGAGCAGTCGAGGGTGGAGTGCCCGCAGGAGAAGGTGAAGCAGCTGGGGTAGGCT
+CTGGTGGTAGTGGAGGTGGTGGAGGAGGAGCCGATTTTGGTGGTGGAGGAGGAGCCGATT
+GCGGTGATGGAGGAGGGGCTGATTTCGGTGGTGGAGGAGGAGGAGGAGGAGGTGATTGAG
+GTAGTGGCGGCCGTT
+>ds2020-328_390
+GGTCGGATAGACGTACGTTTGACATAATCGATGATCCAATCCCATAATATTTCAGGCTTG
+TGAAACGGTATGTTCTCTGTGTCAATGCGGATTGCTGAATCGTGTGCGTTAACTCTATCT
+ACCGCTGCGTCTGCGATTTGAAAGGTTGGGATCGGAATGTCAAAATTTAAAGCGCTAGTT
+TGGTCTCGTCCGCATGCATGATATAGGTAGAAGGTTTCTTTTGCAGGAGTGGAGGCGTCA
+TAGTGCATAACGTA
+>ds2020-328_391
+AACGGCCGCCACTAAACCATTCTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTC
+GCGCCACGAGTCCATATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAG
+GTATATGTCTTTGAATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATAGTGGCGGC
+CGTTGCTGTGTACTTCGGGATAGACGCGGTGTGGCCTTCTATCCCGACCAGGGTGTTGTA
+CGTCTATCCCGACC
+>ds2020-328_392
+GGTCGGGATAGACGAAGACTCACTTTCTATTTGTTTGGCAATGCTGCTCTCCGCTATGAT
+GTTGCGACAGATGTTTGCTGATGAACCCATCCATTATGTTGGTCTGAATGCACAATTATT
+TTGTCTAAATTACATAGTTGGTGATACCATAAGTAACATCCCAGGTGATGGTGAAATATT
+CATACGGCAGATGATGACTGCAAAGTGCGCATCAATTGCCAAACAAATAGAAGGTGAGGC
+GGAAAACCGTTATC
+>ds2020-328_393
+GCCGTGGACCTAGTTTGCAATGGGGTAAGACTAGGTCCACGGCAGGGGGGTCAGGACTAG
+GTCCACGGCAGGAAGGCAGTACTAGGTCCACGGCTCTCTGTCCGTGAATTCGGCGGTCGG
+GATAGACGTTTGTGCGCCCTGGTCGGGATAGACACGGACAGAGAGCCGTGGACCTAGTGA
+CATTGCAACTCCTAGTAATCTAGGCGGTGAGGGACTAGGTCCACGGCAGTGGATAGGGAC
+TAGGTCCACGGCTC
+>ds2020-328_394
+GGTCGGGATAGACGTTAGAATGCCATCATCCCATTTAATTTTACTTCAACCGCACATATC
+TCTATTTCTTTTACTATAAGAATAACATTATGAATATCAGTAGTACTATTTGGATGAGTA
+AATAACTTTAAAAAAATAATAACACACCTAACGCCAACAGGAACCCCTAATAGACTAATA
+AATTTCATAGGATTAAGCGAACTAGTGAGCATAATGATTCGACCTATCACCCAATCTACT
+CGTCTATCCCGACC
+>ds2020-328_395
+GGTCGGATAGACGGTCTGCCCCCTTCTGTGGTCAACTCTCAAGAACTCTGCTATGGCCCC
+AAATGCACATTTCGAGCTCTGCAACCTCACACCAAACTTGTGCGCGTTTGCCTGACATGC
+TTGAGCACATGCTAGGTTATTTGTTCCTATGAGTACGTCGTCCCCGTTGTGCAAGCTTGA
+GCCTGGTGTTCTCCACTCTTTTGCTATCTTCGATGTGTAGACGAAGTTCAGCACGCTGTT
+ACGTCTATCCCACC
+>ds2020-328_396
+GGTCGGGATAGACGCTGCGTGCCAGTCGATCCGCCCATTGACGAATAAAACCTTGTTTGA
+ATGATTTGATAGAAAAAGATACGCAATTGTCGGGGTCAAAGTGAGATTAGCTGAGTCGAT
+GATGTCCTTCCACTCTTTGGAGCCCAAAGTAAAGATGGCAAGTTTGAAATCGAGAACACT
+AAGCCATGTCATTTTCCTATTGAACGGACGACTCCATTGCGTCTATCCCGACCGCCGTAA
+TTCAGATCGGAAG
+>ds2020-328_397
+GGTCGGGATAGACGTGGGATAGGCGTATGGATCAAGACGGACGATAAGAGCAGGAGGAAG
+AACCAAGGGACTAACAATGTACACAGCTTAGTCAGGCTGCTCCCATCTGGAAAAAAACAG
+ATGAAAGATTTGACTGATGTGGACGCCAAAGTGTTCGTGCTGACTACTGAAGTTCACTCG
+ACGTACATGCATAAGCTTAGAGAGGAATTCGCAAGCGAACACTCGATATCGGTGATGAGC
+GTCTATCCCGACC
+>ds2020-328_398
+GGTCGGGATAGACGAGGGGTCCATTTGGGTACCTAAAAATAGGAAAATCCATCATCTGTG
+ACATAAGTTTTGTAGCTGACATTTTTACGTAGTTTAAAATAACCTAACCAAGTTTTCTGA
+ATTTTTGGACAGAGATCTCATGATGTGAATCTTGGCCAGCGTGTGGCTCCACTTGAGGCG
+GCTCCATTGCCCCTCACCTTCCACTGCAGTCACAGGTGCATTTTGCGTCTATCCCGACCG
+CCGTAATTCAGAT
+>ds2020-328_399
+TGGTCGGGATAGACGGCCCGTTTCTTCTCCTACGGGTACTGAGATGTTTCACTTCCCCGC
+GTCAACCCCCACACAGACTATGAATTCACCTGCGGGTAACACCACACAACTGGTGCTGGG
+TTTCCCCATTCGGACATCCTCGGATCAACGCTTTGTTGGCAACTCCCCGAGGCATAACGC
+AGCCTCACACGTCCTTCATCGGCTCAGCATGCCAAGGCATCCACCATACGCCCGCAACCC
+GTCTATCCCGACC
+>ds2020-328_400
+GGTCGGGATAGACGGCACGGCTTACTCACAAGTGAATATTATGATGTAATCTTACATGGA
+CCAAATGCTTGGTTATGTAACGATATTCTTGCATTTTTAGATCTGGTAAACTATGTCTTT
+TAGTTCCGGAAATGTGAAACAACAGTTTTTCCCTGGCATCTCGGTCACTTAGTCAGTGCA
+CAGTGTCAGATTTGATATTCAGTAAGTAACGCAGTGAGTGTTTTCTAGGGAGGGCTTGAC
+GTCTATCCCGACC
+>ds2020-328_401
+TGGTCGGGATAGACATTGCGCGTCCCTGATTGTCATGCACTAGCACTCTGTCCAGCGATA
+GTCTGGTCCACTCCACAGCTGCCAGCTGCTCTTGAGTTAAGAAGTGACCAAACGTGTCCC
+TGTAGGCATCTATTACGGCCTTCATAGATTCCACACTGTGTTGACTGTTGAAATCTTCAA
+AGTCTACACAGTACTGAGTTCTGCCTTCTAAAACTGACCTCACTCTGATACGAACGTCTC
+GTCTATCCCGACC
+>ds2020-328_402
+GGTCGGGATAGACGGTTAGATCCCCTCAGGAAGGTGGCCTCACGTCGTCGGCAAGCTCTA
+GAACGGGGAAGGAGACCTGGACGTTAGTAGAGCTCTGCCGACGACGATGGAATGGCTGAC
+TAGACTGCAAGAGGAAGGCATCGACGGCCTCGGGGGAATGGAGACTGACATTCTGTCGGA
+AGTGATTAAAGGGTGCTTATGGGACTCCAATAATCCAAGAAGCGTTGAGTGCGCTTACTC
+GTCTATCCCGACC
+>ds2020-328_403
+GGTCGGGATAGACGCTTTCGGCCCATGCTACGCGGTTACTCATCTAACACGACGTCCGCC
+ACTGGTTAACAAGTCAACTCAGCGACGGTGTTCGTCGTAAGACGCTAGCACTGCGTTTAG
+AACCCATAGGGGTTTCCAAGTACCGCCTTGTCAGAATATTTATTTACAAAGTCTGTTTCT
+GCCATACTTAGGTAGTCATTCTCCATGGTCCTGGTCTCTGGTACTTAGAACAAGTAGGCT
+TTCTCGTGACCT
+>ds2020-328_404
+GGTCGGGATAGACGCAAACTACCACTAATAAAGAGGTGACCGGCTACGAAATACCTTTAC
+TTCACCCTTAGGGCGGAGCTTGAGAACAATTGGCTTCTTGTAAAAGGTAGTTAAACGGGA
+TTAGATTAATCACAAACAAACAAAAAAAAATCCTAGCATCGCGCTATGCGCTAGCACTTG
+TTGGGGAGGAGTGTGTGCCATAGCTTTGTGAGAGGCAGAGAGGCAGAGGGTTGAAGAATA
+GTGGCGGCCGTT
+>ds2020-328_405
+CACCCCCGCCACTACTACAACAGCTGCCAGCGCGTGCTCCACTCTATTGAGCCTGACGTA
+GTCAATGATCCATTCCCAAAGTGTCTCTGCCTTGTCCCAGGGAATTGATTCATAATCCTG
+TGACATAAACTGGGTGCCCCCAACACAGTCGACTAGAACCTGAGCGCAGTCCACGCCAGG
+TATGTTTATGTCGACGTTAAGTTCACTTTGCTTATTTCGGCCAGACAGATGTTCGTATTA
+GTGGCGGCCGTT
+>ds2020-328_406
+GGTCGGGATAGACGTTCCCCTCGGGTGCTTCTACTTTTTTCCATCCTCTTAGAGAGCTAA
+TAGGTAAAGTATGTATCTGTAGTCCAGGAAGTCAGACATGAAGGAGTACTACACCCATTC
+GCAAAGAAGACGGATAATACCTAGTGAGTTCTCATAAATTGCCGTTGGAAGCTACTTGTT
+GGCTTTGACCGAAGAAGACCTTTCTCTACTTAGTTGGGTAGTACCTATAACCGGCTTCCG
+TCTATCCCGACC
+>ds2020-328_407
+GGTCGGGATAGACAACGCTGAGGGGTATTTTGGGTATTTCGGAAGGATACGGGAGGAACC
+TGAAGAAACTCAGAACACGAAAGTTGTTCGTAATGACAAGATACACGCTATGCAACTGAC
+GGTTTGCCATTCGGAGTTCGTATGAAGAAGTTATGCCCAATTATGACTCCTCGTGCATAG
+GTGATGTTCCCTCCTGGCACAAGGCTAAATGCATAAAATGCTATATAGGGGGTGACAGCG
+TCTATCCCGACC
+>ds2020-328_408
+GGTCGGGATAGACGACAACTTACAATGGATGTATTAGCTATTCTTGCAGTGAATGTATCT
+ATGAGGCAGCACAGCTGCGCAAGGTCTTATTAAGGGTTGTTGGTGACTGGTGTACCATTT
+TTCTTCCTTTTTTTGGCTTCAAAACAGATGAACATACATCCTCTCAAAGACAACCAATAG
+ACCAAGATCGAGGATGGAGAAAACGGCAGTACGATGAAATGGCTGAAGGGCGACTCCACG
+TCTATCCCGACC
+>ds2020-328_409
+ACAGAGGTCTTTCTCGAACGTAAAGCTGCCTAAGGTTGTATCAGGCTACGATCTAATGGT
+GCCAGCATTTATGCACACAAACTCACAACTAGACAAACCAATACTGTCAATGCAAATGGC
+CAAATAGATTGGTAGGTTGCATCAAATGCTACTATTCATGAATGTTAAAGACATTCTAAC
+AGCTGCTGAACTAAGCACACATTGAACTTTTGATCGTATTGATAGTAGTAGGTTGATTCG
+TCTATTCCGACC
+>ds2020-328_410
+GGGCGGGATAGACGGCTATTGTGGTTGTTCGTATTTTAAAATGGATTCCCTACTTGAGTT
+TTTGCTACCTTCACATGAAGATGCGATCGAATTGGTTGATGCCAATTCGGTTAAGACTAG
+CTTCAGCTTGCCTGATTCTAGTGGGGATGTTTCCCCACTTTGTAGGTCGTTGTGTCAGTT
+CTTCGGATTTCTTATGATCCGAGATACTGTTGTCAGACCTGACAAATTTTCTGGTTTCGT
+CTATCCCGACC
+>ds2020-328_411
+GGTCGGGATAGACGTCCGCCAGCCATATGTACTGAGATTGTTCGGGAGACATGGTCCAAG
+CCCGGTATGGCATAGGAATAGAAGAGTCATTCTTTAATAACTGTATTTTAATTAAAAAGA
+ACACTACCATGTTAGGTTTGGAGTGCGGTGCATCTTTCTTTCTCCTGTCGTTATTATGTT
+TAAAAAGTCTTGTTCCTCGCCCTCAGATAGATGTTCTTACCAGCAACTGGTGCTATGCGT
+CTATCCCGACC
+>ds2020-328_412
+TGAATTCGGCGGTCGGGATAGACGTATTTGGCTCCTAGTTGCGTAGTCAAATGTACTACA
+CTGAACCGCTTCTGACAAGGCTAGACTGTGTAATATTATCCTATTCGGGGTACTTCTCCA
+GTTATAATAAGTATCCCAAGCAGCACTATTCACTACGAAAGGAACACCAGCCATAGTGGT
+GGACTGACACCCTCTCAAGCTGCACACTTCTGGCATGAGCATTATGTCGTCTTTCGTGTT
+CCAGATCATTG
+>ds2020-328_413
+AACGGCCGCCACTACTCGTCTGATATGGGGCGACTGGAAGGCGAGCTCAACGTGGACATC
+AACATACCTGGAGTAGACTGCGCGCAAGTTCTCGTCGACTGTGTTGGCGGAACACAGTTC
+ATGTCTCAGGACTATGAGTCCATTCCTTGGGACAAGGCTGAGACACTCTGGGAATGGATC
+ATCGACTACGTAAGGCTCAACAGAGTGGCACGTCTATCCCACCCCCGCAGTGTCCGTCTA
+TCCCGACCGCC
+>ds2020-328_414
+GGTCGGGATAGACGAGGCTACGTGGTAAACAGAGTAGCGGGGGTTTTGAAAGACAGATTA
+CCATATTGTCTAGACTTTGAGGATTTCAACAGCCAGCACAGTCTATCAAGTATGCAAGCG
+GTCATAGATGCGTACTATGAAGTATTCGGGCCGAATATGTCGGAAGGGCAGAGACAGGCA
+GTACTTTGGACAAGAGAATCACTGTCTAATAACGTGGTACATGATAATATGGGTACACGT
+CTATCCCGACC
+>ds2020-328_415
+GGTCGGGATAGACGGAACACCCCCCTGTAATTGTACATGCTCCCATAGAAATAACGTATT
+TTGGTTCAGGCATTTGTTCATATAATCTCACTAAAGAAGGAGCCATTTTCATTGTTACTG
+TGCCTGCTGTTAAAATTAGGTCTGCCTGTCTAGGACTAGATCGTGGCACCAGTCCATAAC
+GATCAAAGACGAATCGTGAGCCTATTAATGAACCAAATTCAATGAAGCAACATTTCTCGT
+CTATCCCGACC
+>ds2020-328_416
+GGTCGGGATAGACGAGCGAGGTTGGTGCAGAGGACGAGATTGAGGTGAAGATGGGCTCTG
+AGGATAGAGGCATGGACAGTTTAAGGGGACAAAAGGGTGTGGCTTTGCTTTATCAGTGAT
+ATGCATGTCATGTGCTTGGATTTTGTAATTCTAAGGGGTTTGTGAAATACGATCAATTAG
+GAAGATTGGGGTTGTTGGGGTTTTTGCTTCTGCATCAGACAGACTAGTGCAACGTTTCGT
+CTATCCCGACC
+>ds2020-328_417
+GGTCGGGATAGACGATTCCGCACCCTCTGTTGTCTCTGAAAAATCTCGTCGTACCGTTAG
+TCCCGTCCTGCGCTTGCCCGACGTTGACTATTCCTGTTCTTGGCTTGCTGTTATCTCTTG
+GGGAGCGTCGTGGATTTCCACTTCTGCGTGTTGAAAACCCTGCATGGGTTCGTGGGCTGC
+AATAGCAGGCCTTGTGACTTGCACCTTCTCTACGTGCATGCCCGTAGCAACACGCCCCGT
+CTATCCCGCCC
+>ds2020-328_418
+AGGTCGGGAAAAGCGATTGGCTTTAGGCGGCGCGAGGGACGGAACATCTTCTCGATAACA
+CGAAGAGCTCTTTTGTAGTGGAAATCCCTTGGAACGTCGTGGTAAGGGAGGTCAGTCTTA
+AGGAAGTCTTCTTCTCCGGCGGCGGGGTTAGTTGCAGAACGGCGGTAGCCATTGATTGCT
+TCGTTTGCCAAATCGGGGGGACAGCACTTATAGATTGCCTTCTGACGTCTATCCCGACCG
+CCGTAATTCA
+>ds2020-328_419
+GGTCGGGATAGACGACAGATACCGATCCTCTAAAATGCGTTCACGTCCCATCAATTCGAT
+AAAGCCGTCCAATTTTCGGTGTCACCGACAATTTGAATGGTATAAACATTGGGCGTGATA
+TCAACAATACTTGCAGGGAAGATATCCGCACAGCGCTTGACTTCTTCGCGGTTGCTACAC
+GTGGCGCGTACTTTGATCAGCATGAGTTCGCGCTCAATATGTACACCTCCGATCAGCGTC
+TATCCCGACC
+>ds2020-328_420
+TGAATTACGGCGGTCGGATAGACGCGAACTCCACGTTAGAAGAAAAGGCGTTAGCAAACG
+CTAAGCGAAAGGCCAAACAAAAGGAAGAGGAAAAACTAAAATTGCAGCGTCAGTTAGAAG
+ACGAGCGTTTGCAGGCGTATATGCAGCAGCAACAAGAACGTCAGCGACGACAAGCGGTGG
+AAGCAAGGAGCTTGATGCCGATTTATGGTGAGACCCCAATGACTCGTCTATCCCGACCGC
+CGTAATTCA
+>ds2020-328_421
+GGTCGGGATAGACGGTTCAGCAGCGTGGACTAAAGTAAAGTGGGATATTGAGAGGTTGTC
+TCGCTAGAGCTTGTGCTACCTTTGTTAACGTCAATTGGGAAACAGATAGAATCATAGGGT
+TTGACAACAAACTGCATGAAATATTTTCCTCGGTGGCTGTGTTAGAAAGAAGAGGTGCTT
+CGACTAAATCATGCCAGAAAATCTGGAAAGCTGCTTTCTTGCGATCAGCAAAGAATTATG
+GTTGGGATC
+>ds2020-328_422
+GGTCGGGATTGTTGAGGGGAATGAGGGAAGTGGGTTGGCTGGCAATGGAGGGAGCACCGT
+AGGCAATGTGGATTTTGGCAAAGATGGGATTTGGGGTTGGAAGGTTGGCAATGGGGGCAG
+AGTAGTTGGGAGAGTAGGCAATTGGGTAGACGGCAACGGTGGCAACGTGGCCGGCTTTGG
+CAAAGTTGGAGCAGTTGGAAGCGTAGGCAATGGGGTGGTGTAGTGGCGGCCGTTGCTGTG
+TATTAGATC
+>ds2020-328_423
+GGTCGGGATAGACGATCTTCGCCCCTTGAGTCACGGTACTTTGGTTTAGTCAGGATCACC
+CTGTAAAACTAGCTTAATAGAGGTCGAAATAAAAGAGTTTTGGGGTTCAATCTTCAAGTA
+AGGAGGAGTAAAGAAGAGGAATCGCGAACATACTCAATAGATATCTTTCTTCGACGAGGC
+GGTGCCTATTAAAGAGTTATTATTTCAGGGACGCCACCCTACCACCGATGTCATGCGTCT
+ATCCCGACC
+>ds2020-328_424
+GGTCGGGATAGACGATACAGTCCCCTCACTCACTATGTAGCGCAAGGAAGTGTGCGAGCT
+TGCTAGGAGTGTAATGATTAGCAGCTTTCCCTTTAGGCTGTTAGATGCTAGAGACAGGAA
+GAAAGGAAGAACTTTCCTTCCGCTCATGCTCTTTTCGAGAGAGCGTTCACTTACTATAAG
+AGCAAGGAAGTTATGGAGCTAGGAGTTAAGTAATGTTAAAACAACTGGAACACTCGTCTA
+TCCCGACC
+>ds2020-328_425
+GGTCGGGATAGACGAGGGATCACACTGTTCTACTACGTACCTTTCATATGCATACGATAT
+TTCTTGTACAATAGCTCTCTCATCGTTAATATTAGAAATTATTTCAAACGTTTAGGAGGA
+CCAAATATGATGAGAAGTATTTACATAAATTGTTGAAGGAAAAACTAGGAGACAAACATT
+TGCACGACACATTTACTAACGTTGTAATCCCAACTTTTGATATTAAGCAGCAACGTCTAT
+CCCGACCG
+>ds2020-328_426
+GGTCGGGATAGACGTATGGACACAGTGTCTCGACAGGGCCGCAACGGAACAACGGAAGTT
+CACTGGGTAACTCTAATCTAAGGGGTACGGGGACGTAGGTTCGAATCCTATTTGCGGCTA
+ATACCACCAATGGTGTGCTCAAAAGGTTCTTGTTCGTAGTCCAATGGCAGGTAAATTCTC
+CTTTTTCACTCCCGAGTTGTTTAGATTCAAGCAAAGCCCAAAAAGGAACGTTCCCGTCTA
+TCCCGACC
+>ds2020-328_427
+TGGTCGGGATAGACGCTGAAACCACCTTATATAAGCTCGTCACCAAACTTATAGGCCTAA
+AATCCCTAAGTCTGGCAGATTCTATCTTTTGGGAATCAGGCAGATTAGGGTTTCATTAGT
+TACTGCGTTGATAATTCCGGAGTTATAGAAATCATCCATTACCTTCATGAGATCACCTTT
+AATAGTATCCCAGCAAGATTGGAAGAAGAATAAAGTGAACCCAGGGAGGATGTACGTCTA
+TCCCGACC
+>ds2020-328_428
+GAAGAGCTGTCGGGAGTGGAACAAGTTGTGGGATAGTAGGGGGCAGTGGGGTGCTGCGGG
+AAGCACGCATTCGCAGTACCAGGAGGACATGGCTTACGTCCTCAAGGACGACATAAGGCT
+CAAGAATAAGTTCATTACCATATCGAACATGCCGCGCTTTCCCATGACAAGATTTACAAA
+CAGACCGCAGGAGATACAGGCTTGGGCGTCCACTAAGTACGAATGGGGCGGGGTCGTCTA
+TCCCGACC
+>ds2020-328_429
+GGTCGGGATAGACGGCGAACAAAATGTAAAACATATCAGAGATGTAGTATTTTAAGAAAG
+AGGGGGGAAGGGGAAAGTCAAGGCCAAAGAACAAAGGCCAAATAAGGGCTACACAAGACG
+AAAAACCAGAGGCAGCGCTAAGGCGCGAGGGGGATGTGAAAACAACAACAGTTCCACATG
+AAGGTCCTTGGAATGGAAGAAGGATCGGTAAAGTCGAGAAGCAGTGAGAGGCCACGTCTA
+TCCCGACC
+>ds2020-328_430
+GGTCGGGATAGACGTTGACATTCCGTGAATGCTTTTCTGCATAACAACTTCCAACTGTCC
+TCTTGGCTTCGAAATCGCAGTTCATGGGGAAGGCTTTGGGCATCTGCATGCAGAGCAACA
+TTGTTGTTGCGAGTTGTAAGCAATAATTTATTGCCACTGCCATCACTTGGGAAGGCCTTT
+GCAAGACTGTCAAAAGCGGTGGTACTCCATGTATCATCTAAAACAGCCAAAATGCGTCTA
+TCCCGACC
+>ds2020-328_431
+GGTCGGGATAGACGACTGTGGCCGATACTACTGGAAGGATTCCTCTTTGGATAATAGGTA
+CTGTAGCGGGTATTCTTGTGATCGGTTTAATCGGTATTTTCTTTTATGGTTCCTATTCTG
+GATTAGGTTCATCCCTGTAATAATCGGATGAACTGAGTTGTAGACATGAAAGCATAAGAA
+CTCAACGGGATCCCCCTCGAATCAGACAAGGAAAAAGGGGGGGGGGGTTCATGCGTCTAT
+CCCGACC
+>ds2020-328_432
+GGTCGGGATAGACGTTCCTCAGGTGTCAAATGTGATGCTGTACCTGGTCGTTTAAATCAG
+ATCTCTACTTCGGTACAACGAGAAGGAGTTTACTATGGTCAGTGCAGTGAGATTTGTGGA
+ACTAATCATGCCTTTATGCCTATCGTCGTAGAAGCAGTTCCTAGGAAAGATTATGGTTCT
+CGGGTATCCAATCAATTAATCCCCCAAACGGGGGAAGCTTAAGCGGTGGCATTCGTCTAT
+CCCGACC
+>ds2020-328_433
+GGTCGGGATAGACGACAAAGGCCTGTTCGCATCGCAACTAATAGAAAAAAACAACTACTA
+GACTAGACTAGTAGTTGAGTGCTCCTTGTTGTTCGGATCTTGACCGGGTCCGAGCTTCCC
+CAGCTCTATGCTGTTGGGGAACTCTGCAAGGGTCTTACCACCTTCTTGATTTACTATAAT
+TGAGTCTTTGGAGTACTTTAGGATTATATTCCGCGCCGAGGATTTGTGCTTGACGTCTAT
+CCCGACC
+>ds2020-328_434
+GGTCGGGATAGACGGGATGCTTTTGTTGAAGGGAGGAAGATTAAAGATAATGTCCTTGGA
+ACGGGTCTAAACGAAACTTCCGAGCCCCTATGTTGTAATGGTTGGGGCTGCTAATATAAA
+GACTTTTTTGGGTCATACGACACCTGCAAAACGAAAAAGCCCTAATTTCAGCCCCGAGCG
+GATAGCCCATGAAATACCTGTCACTTTGAGCCCGTGGAGGCATATGCTGCAAAGACAACC
+TCGTACC
+>ds2020-328_435
+ATAGGGCCCTATCTGGCTTTAATAGGGGGGCAGCGCCAGTTGTTTGTTTTCAAGTCAAGC
+CCCGTATCCCTATCTCTTTTTAGGTTGGCATAACAAAGAAAGAGAGTGCCAAGAAACAAC
+ACATACCCCCCCGCTTTTGGAAGGTTCGGGATCGTCAGGGAGCCCCTATAGACGTAAAGA
+CTTGACTTCACTGAACCGGCACTACTATTTGTCGGCTCCTACCACTCGCCTCCGTCTATC
+CCGACCG
+>ds2020-328_436
+GGTCGGGATAGACGTTTGGCAGCGTTATGGCTTTCCCCTCGGAGATTGCATCGGACTGTT
+TCAGCAATCTCTGGAACATCCTGTGACCAATTGAGATCATTTCCTTGTCATTCCGCTTGC
+GAATGCCATAGAAAATCTTATAGTCATTGGAGTTGCCAGGGTTGCACCTCTCCTCGATTT
+CATTGGGGCCATATTCTGAAATTGGGACGGCGTCGACAAACACCCCGTTCTTGCGTCTAT
+CCCGACC
+>ds2020-328_437
+GGTCGGGATAGACGCCGTGTACCGCTGGTCGGGATAGACGATACGAACTAGGGATGGGAT
+CCCGCCAAAGAGAGTCGAGAGCCTCTATTCCATGCTTTCGCCAAGCTAGTCTGCGAGTTG
+TCCGCCTAACTCACGACAGTTGGTACATTAGTGAAAGATGCAGTTCGCTTACCTATTCGT
+TTTAGATATTTTAGCTTTAGCTAGAATCAACCCCCAATATTAGCACCCAATGCCGTCTAT
+CCCGACC
+>ds2020-328_438
+GGTCGGGATAGACGGACAACGGCATTAAAAGAAGAGAAGGCCAGTCCTTGAGCCAGAGGT
+CATAGTGATCCTGTCCTTTCAATAGTTAAAGGCACACAAGAGAATCGCTTGGGAAAGAAG
+GGCTAAATAGCGCCAGAGGGAGCTGCTAGAGAATCAGCCCCCACTCTCTTTCATTTCCTC
+CCTCTCTAGTTAGCGCGTAGTGGGAATAGCCCTTCATCGACCCGGGTCAAGAGCGTCTAT
+CCCGACC
+>ds2020-328_439
+GGTCGGGATAGACGGGGGTGCAGTATGTCTATCCCGACCAGCGCGAGTACACGTCTATCC
+CGACCAGTATAAGCAAACGTCTTCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGAC
+CTAGTAATTGGAACCGTGCCGTGACCTAGTTTTACTGCTCGTGCCGGGACCTAGTGACTA
+ATGGGGCCTAGTCGTCAGGGGGTTAATGACTAGGTCCACGGAGGGGAAAGCGGACTAGGT
+CCACGGC
+>ds2020-328_440
+GGTCGGGATAGACGATATACGCCGCTAACCCTAGCACTGCTCAAACATACTGATATAAAG
+CATATCCGCCATGTGATTGGCTCACACCAAGACCCTGATATCATTGCGTCATTGCCGCGT
+TGGTTATTGCATACCCAAGCCAATATCGTCATCTCAAGGTTGTGGGAGCGTATTTTACCG
+CATCTTAACTCCGCGTTTACTACTGACCGTCTGCAAGAAGGGGGGGAATCGTCCGTCTAT
+CCCGACC
+>ds2020-328_441
+GGTCGGGATAGACGTGCCCAGCTACTTCAAGAGTTAGATCCTTTGGCAGACATACGTCAC
+TTCTACCACTAGCAGTTTACAAACATAACACCGAAACTAGCTATGTAATTGCGAAACCAG
+AAATATCAATAGTCAAACTGGGTCAGAGAAACGTAAGAGTGAATCATGCACAACTAGTGC
+ATGGTAAGAAAAAAGATGTTATGTTTCATGTAGTTGGCAGTGCCGTCTATCCCGACCGCC
+GTAATTC
+>ds2020-328_442
+GGTCGGGATAGACGAGTCAGGGCTCTCAAAACCAAGTCAGTTAAAGACAAGATGGATTTG
+CAACCGCCAAAGGCCAAAGGAGGGCAGAGCCCCCCTCATACTCGACCTTGGCAACAAGCC
+TTAGCCGACAGGGGCTGATTCCTGCTCTGCAAAGTCTTTTGAGTGTTCATCCGGTTCTGC
+TGATTCCTGCTCTCCCAAGTCTTCTGAGCCTCGAATTCATAACCTGCATGTCACGTCTAT
+CCCGACC
+>ds2020-328_443
+GGTCGGGATAGACGTTGCAGCATGGTAAAATAACTGATCCTTCCGGGCAAGTACACACAT
+TGTATTATGGTGGTACTGCAGGGGGTGGAATTGAACATTTTGGGGGTACATTCACATTAA
+ATTGTGGAACTCATTATTATTACGGAGATGCCAACCATAACACGAAGGCGCCTTATGACT
+GTTAATACTGATGTCACCCAGCACTCACTGTATGAGTATAAATGGCAGCCGGCGTCTATC
+CCTACA
+>ds2020-328_444
+GGGTCAATCCAGAGAGGGTGATTGTGCTTCTTGAGTTGTTTGTTTTGGTTCTCTCATTTA
+ATTTTCAATTTTCTTTCTTCCTCAATTTATGTAGTTGTTGGGTTTTTAAGATATGTATGA
+GAGATATATATATATATATTGTTTGTGGTGAGAAGAATGAAATGAAGAAGGAAAGAGGGA
+AAGAGGGAAGAACAGTTAGGGTTGGGGTTTGGGGGAAAAAAGACAGGGATGACGTCTATC
+CCGACC
+>ds2020-328_445
+GGTCGGGATAGACGTAAGTGGCTTTTCCCAAGTCGACCTGACCGTGAAGTTCGTGGTAGT
+CGATGTATCGTTGTACTACATTTGATATTCTTGCAAACTTCGGGTAGTAGTTTGTTCTCC
+CCCCAGCCAGTGTTGGCCAGTGCGATCGCTTTCGGTTGGCAGGAACTATCTTGTACATTG
+CTGTTGATGCAAGCCTATATTTCATGGGTCTAGGCTTGTGATTCGCCTGTATCGTCTATC
+CCGACC
+>ds2020-328_446
+GGTCGGGATAGAGATAAGGGTTCTGGCTTGAATACCACGACTTGATCATGACCATAGTCG
+GCTTGGTGGTCGAAATCTCTGAGGGTTTGGAGGTTTTGAGGTGGGTAGAGAAAAGGGTTG
+GCGTTGATGTCGTGAATGGAGGTGGGATTTATGGGGAAATTAATGGAGGAGGGCTGTGGA
+TCCAAGTAATTGAGATGGTTGCGGAAGGTGGAGGCTGAGGAAGAGGAAGAATACTAGGTC
+CACGGC
+>ds2020-328_447
+GGTCGGGATAGACGCCGAGCCTGCTTTCGTGCCTTCTCTCTCTCTCTTCTTCTGCGTAGA
+AGCATCAGTTTGATCATTCAGTTCTGCACTTTTTGCCTTTCTTGCAGGGACTCTTCCTTT
+GGTCGTCTCCTTGAGATAGTTTGCCCTCTCCTTTCAGTCGAGCTACTTCGTTACCCTCTC
+CTCTCCTCTCTTGTGTCGATTGTTCTGCTAGCTCCTCTTTGTACCGCCATCAGCAAGGAA
+TCGGGT
+>ds2020-328_448
+GGTCGGATAGACGGATATGTTCCTTGGTCGGGATAGACGACCAGGCGTTGTTTTCGTCTA
+TCCCGACCGCCGGACAGAGAGCCGTGGACCTAGTCTGACTTCCCTTGCCATGGACCTAGT
+CTTCATTCTCCTGCCGTGGACCTAGTCTGTTTATACCTGCCGTGGACCTAGTCATCACCT
+CCCTGCCGTGGACCTAGTGCTAAGTCGGGTGCCGTGGACCAAATCTATTCCCACTAGGTC
+CACGGC
+>ds2020-328_449
+GGTCGGGATAGACGTGTGGAACTCAACGTGCCCACCGCAAGCTTCAACTGCTCCTGTTAG
+TGTATAAATCAGAAGGATAGGTAAACCGAGAACTTTGATGCAGAGGCAACCTGGCACTGT
+TGACGAGCCGTAGTTTACTACGATAGCGGTGGGAATTGAAGCCCACTGTAATCTCCCAAC
+ATCTAGGCCCATCAGGGTAAAGTGTGAGAATGAAATTCAAAATGCCCCACTTCGTCTATC
+CCGACC
+>ds2020-328_450
+GGTCGGGATAGACGTAGATGAACGGTATCTGGGGAATAAGCATCGGCTAACTCTGTGCCA
+GCAGCCGCGGTAATACAGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCT
+GTAGGTGGCTTTTTAAGTCCGCCGTCAAATCCCAGGGCTCAACCCTGGACAGGCGGTGGA
+AACTACCAAGCTGGAGTACGGTAGGGGGCGTCTATCCCGACCGCCGTAATTCAGATCGGA
+GGGCA
+>ds2020-328_451
+GGTCGGGATAGACGCGCCCACAATATCAAGCCTACAAAGAAGGCCTCGTGCATGTCACCC
+TTTTTGTGTAAATCCTTAATAACGTTAAACATGAACCCTGCCTTACTAATAATTGTTTGG
+AAATCAATAGCCGCTAATTCCCTCACAGTAATGTGTCTCAGGTGACTGGCAGACACCTTC
+AGCACGGGTAGGTCAACCACCCCTGAAAAAATATTCTCAATAAATTTCACGCTGGCCAAG
+CTTGG
+>ds2020-328_452
+GGTCGGGATAGACGGCCATTCCGTTTTTTTTTAATCCAATTGTTGACGAGGAAGAAGCAG
+ATAGAGCAAAGGTCTCCTCTTTCCGTCCGCTCTTCCCGAAGTGAGCGAATTGCATGTAGA
+GATCCGTAGGGGCTTATAGTTTAATTGGTTGAAACGTACCGCTCATAACGGTTATATTGT
+AGGTTCGAGCCCTACTAAGCCTACCACCCCCTTCTCTGCACCCGACCCCGTCGTCTATCC
+CGACC
+>ds2020-328_453
+GGTCGGGATAGACGAATTCGTGCGGTCTTTCTATTTTGAGGCAATGTTGTAAGCATCTTG
+TTCAGATGGACTGCTCATTGTTATGTACGTTGGATTTCGGAGTCCAACATGGATTGGTTC
+GAGCGTGGACCGTGGTTCCTTTCCATCTATGATAATCTCTGTAGGCATTCCTGGTTACTC
+CCGTTTAGCGTGGATACTGGGTTCATTGGTAGGTGAGTACCCAGGATGACCCGTCTATCC
+CGACC
+>ds2020-328_454
+GGTCGGGATAGACGGATAGGCCCAATTATCGTCTATCCCGACCGCCGTAATTCATACCAT
+GACGTATCTGTAATAGTAATCATGAGTAAAACAAAAATACTTGTACAAACTGGCAAAGTA
+ACCCCATCCCCAACGGTCCAAAGATTCAAATCTTTGTAATATTCTGAACCATTCATAAAC
+ATCACAGCAAATACGATTAAAACATTTATAGCTCCCACGAGAGGGGTCGCATAGTGGCGG
+CCGTT
+>ds2020-328_455
+GGTCGGGATAGACGAGCTCTCCGCATATCCAATAAAAACAAAGCGTGCTGCTTCAACGAG
+CTCTCCTTCTGATGGTGGTGGATCAATAACTGAGTTTAATGTAGTTCTTCCCTCCGGAAA
+CTTGGTTTTAAGCTATTTTTCGCTCCCAGAGCTAGTTGAAGAAGACTCACTACCCTACTT
+CACTGATAAGAGTGGAGTCCCAAGCCACGCAAGAGACGGATTCATAGTCAACGTCTATCC
+CGACC
+>ds2020-328_456
+GGTCGGGATAGACGTTGTGGGTGGATAAAAGTTGTGCATTTTAAAGGGTAGTTTTGAGGA
+ATGTGCGATTTTATATTATATAGGAAAACTGTTTGAATTATTACTTTAAGCTAGAAAAGG
+AGATTTCCTACATCCCAAGCTGCTAATTCTTAAAACAATTCAATTATTACGGTAGTAAAG
+TAAGAAATTTGTTATCCTTCTGTCCTTAAAACCACATTTTAAATTAAATTATTGGTAGCA
+GTTTA
+>ds2020-328_457
+GGTCGGGATAGACGGTCTAATGAGGTGGTGGAGGAAAGTCGAAGGCTTAACAAGTCTGGG
+ATGTTGTTCAAAATTGATTTTGAGAAAGCCTATGATCATGTGGAATGGAGATTTGTTGAT
+GAGGTTATGATTAGGAAGGGTTTTGGGGAAAGGTGGAGAAGATGGATTTGTGGATGCCTC
+AAGACGGCTAATTTTTCTGTGATGATTAATGGAAGACCAAGGGAGGTGGGCGTCTATCCC
+GACC
+>ds2020-328_458
+GGTCGGGATAGACGGAAGGTAGCATTGATAGGCAGAAGGATTTGGTGACGGTGAAGGGCT
+CAATGGACATGAAGGAATTGGCTGAGACTTTGAAGGAGAAGCTCAAGAGGCCTGTTGACA
+TTGTGCCGCCAAAGAAGGAGAAGGAGAAGGAGAAAGCCGAAAACAACGGCGGCGGCGGTG
+GCGGTGGAGATAAGAAGAAAAAGGAGGAAGAGGGGCATATAGTGGCGGCCGTTGCTGTGT
+ATTA
+>ds2020-328_459
+GGTCGGGATAGACGAGGCCGTCACCTATGGTTTTTGTCTCACTGTACGGGACCAGTCTAC
+AAATATGGAGATGTACAAGCATTGGGAAAATAAGAATCCTTGGTCGATAGAGAGCCGTTA
+GCTAGCAGCCGAAGACGAAGGAACAGACCAGTAAGTGTGGAGATGAGCCTGCTAGACGCA
+GAGCTGGATCTGCTATATGCGGTAGTTCTTCCTTCCGAAACGCCTTACCTCGTCTATCCC
+GACC
+>ds2020-328_460
+GGTCGGGATAGACGTGGTAATGGTATGGTTGTGTGGAAAGACTTGAGGAAAGAACTACGT
+GTGGCTTGATCCCTCAAAAAGGGTACGCAGGCAGCCTGAAGTTACTAGGCGCGGCCGCGG
+ATTAGGCACCACTTAAGTGGTTTTGTTGATGGGTTCGGACCTCGTGGTTGGTTCCGAAAT
+TTGGTTGAATTTGAGGTTCGCTAGGTGAGTTGAGTGTAAGTGTGGTTCACCGTCTATCCC
+GACC
+>ds2020-328_461
+GGTCGGGATAGACGGAAGGAGGTCGTGTAATAGGAAGGTAAGGTGTAAGCCTCGAAAGCC
+TTTGGTACTTCGGTAGGGCGAGCAGCCCTTAAACCAAAAAGGTTTGGAACCCTTCCCCTA
+TTTCTGCATTTCATTCTCTAGCCTCAAACAAAATTAGAAAAAAGGAGAGGCCTTCGCATT
+CCTAATCCGGTGGGGGGCCGGACGGCTTTGTTTGCCCCAGCTTGGCGAATCGTCTATCCC
+GACC
+>ds2020-328_462
+GGTCGGGATAGACGGGAGCAATATATGGGGTGGATTTAACTTCGGCAACAGTAGCACACT
+TTGCCATGTTTAATTGTGAAGAAGCCTTGAAGCATAGGTTCCCGGTAGGTGAAGATGCGG
+AAGCCGGGCGTGTGCATAAGCGGCTAAAAGCTATGTTAGAAGGATGTGACTCGTACTGCT
+ATGATTTCGATGATTTCAACGCTCAGCACTCGACGTCGAGTATGGTCGCTGTGATAAAGG
+CGTA
+>ds2020-328_463
+GGTCGGGATAGACGATTGCCGTTGCTGAAAATGACGGGCATCAATTGGTTGGGGGATAAG
+AGCTTTGGTACCACAATTCTGGAAGATGACGAAGGATGTGGGCACCACCTCAGGTCACAG
+TTTCAACACGTTGATCCAATCTATTTGTACCTTGATGGTGGGCTATGCCGCACTCTTCGA
+CCTGGTTCCTGATGAAGACTGGGATCGGCTCTGGCAGGAGGCGTAGCTCGCGTCTATCCC
+GACC
+>ds2020-328_464
+GCCGTGGACCTAGTGGTGTCCCTGTTGCCGTGGACCTAGTGTAATGGAGCCTGCCGTGGA
+CCTAGCAACTCACTAGGATAGGCGGTATTATTGAACCAAACAAAGCAACAAGCAATAAAA
+CCAAAAACAGATAAAGCAGCTAAACTATAAGACAGGTAAGCCTCTCCATACCATACAAGT
+GCACGGCGAGCCCATGCAAAAGGTTTGGTTAAGATATGCCAGATTCCACCAAGTATACAA
+ATGG
+>ds2020-328_465
+GGTCGGGATAGACGTCGACCCCGCTTCTTCCACTTCTCTTTCTTGTGGTAGTCGTTCTCT
+TCCTTGTGGTAGTCGAATGAGGAAGTATGTTGCGGCAACTAAAGAGTTATCGAGACTGAC
+CGCAATTGCAGTAAGAGTTTGACTTTCTTTCAGTTATGTAAAGTTGTTTAGTACGAGATC
+GCTTCACACCTCGCGGTGCTTACACCTCTCCCCACTCAATAGACTCCATAACTAGGTCCA
+CGGC
+>ds2020-328_466
+ACTGCTGCAGAAGCGGAATCGAAGGGGTTGGTTGAAAGGTAAGGATAGCGTGATTGGCCG
+ATTGGTTGGAAGGTAAGGATAGCATGATTGACTGGTTGCGGGTCCTTTGGATCATGGGCC
+ACAGCTACTTGGGTAGAGACCGCTGAACATCATTTGGACAGGCCGAGGCTATATGTGCTT
+AGGCCTTTTGATGGCTGTCATTTTCTGGGCTATTTGGAAGGGTTAATGTCGTCTATCCCG
+ACC
+>ds2020-328_467
+GGTCGGGATAGACGGTCAGTCCCCCTTTGAAATCAAGCACCTCTAACCTCAGCTTGTTCC
+CCGTTATTATACCTACCATTTCGGCTCTAGTTACGGAGTTGCCATTACGTGTGACATAAG
+CCGCATATTCCGTATACTTGTCGCATATGCCTTTCAATTTCTCGGCTTCTTCATCCACTT
+CTTTATTGAACATCACATCTTCTAAACCACTACACTCACGTGGCTCCGTCGTCTATCCCG
+ACC
+>ds2020-328_468
+GGGCGGGATAGACGAAGGAGATGCATTTCTGGTACTGGTGATACTGGACAAGCTCTCAGG
+GAATAATCTCTTTCTTATTTCTGCCTTTCTTTCCCATGACGACTAGGAACGGGCAAATCA
+AAAATTTCACTTTGAATTCCGGACCTCAACATCCTGCTGCTCATGGTGTTTCACGATCGG
+TATTGGAAATGAACGGAGAAGTGGTGGAACGTGCGGAACCACGCCGGACGTCTATCCCGA
+CCA
+>ds2020-328_469
+GGTCGGGATAGACGAAGAATGGCTCTTACCTAGCTATTGCCCTGATCCTATTCGATCGTA
+TAGAACGCTACTATAGACCCTAGCTATTCCGCCCTATCAAAGCCCAGAGCAAAGAAGGAT
+GGAGGGACAACAACCCCTGAGGGAAAGGCAGAAGCATAAGCACTGACACGAGATGTCCTT
+ATCATCACTCTTTCTCGATCGAAGGCTTTAGCATTCCAATCTCCGCGGCCGTCTATCCCG
+ACC
+>ds2020-328_470
+GGCGGAAGACGAAGCGGGAGGAGATTCTTCATCACCAGATGAATGGAGTGCTTCGGGGGC
+ACTTCTTCCCAAGTCGGAAGACGATTGAGTCAGACCGGGCTCACTTTTCTAGTTAGTTCT
+AGACAAAGACTTCAGTGAAGGAACGGAGCTTTGTTGAAGCTATTACTCAGACTCTTTTTC
+GTACTATTGGCAGTGGAAGAAAGATCTTAGAATAAGTATCCGATTCAGACGTCTATCCCG
+ACC
+>ds2020-328_471
+GCCGTGGACCTAGTATTCGACCCCCTAGCCATAACAGTGCTCTACCCCCGACGGTGATAC
+GAGAGGCACTACCTAAATAGTTTTCGGAGAGAACCAGCTATTTCCAAGTTTGTTTAGCCT
+TTCACCCCTACCCACAGCTCATCCCCTAATTTTTCAACATTAGTGGGTTCGGTCCTCCAG
+TGCGTGTTACCGCACCTTCAACCTGGCCATGGGTAGATCACTTGGTTTCGGGTCTACACC
+CAG
+>ds2020-328_472
+TTCGTATCGATAGTTTTTATTTGTGACAACTTTCGTCACTAATAAAACCTACTTCAACTG
+AAGGGTGATAAATCAGCCGTACTCTTTCCCAATCCATGCTATCTATGGCGTGTAGAAATA
+CACCAGCTGTAACCGACCAATACCTACAAATGCATCTCAAGTAATTTGAGTTATTTTATT
+AGGCGGGGACAGGATTCGAACCTGCAGTCTTCAGGTCATGAGCCATATTCGTCTATCCCG
+ACC
+>ds2020-328_473
+GGTCGGGATAGACGTATGATATGGGTCCGTGCAGCATTTCCACGATATCGTTATGATCAA
+TTAATGGGACTTGGCCGGAAAGTGTTCTTGCCTCTATCATTAGCTCGGGTAGTCCCCGTT
+TCTGGTGTTTCAGTCACCTTTCAATGGCTCCCTTAATTATGCGCGAGGAATTTTCCTCTG
+GAAGCGGGCTAGTCCCCGAAAATGCGCGTTAAAGTTGGGGCTAAAAGATGGACAGAAAAA
+CGT
+>ds2020-328_474
+GGTCGGGATAGACGCGTGAGGACTCTTTCTCCGCCGGGTCAATCCTAATATGGGTGAGGG
+GGAAATCGAACTCTGTTATTCATTGCCGCAGAGACGCAAATTGGAGATTTCATCCCCTCC
+GCTCTAATCGGAACCCTTTTTGCGATACGTAATGCGTGAATTGGAACCTTTCTTTCGGAA
+CGGGATACGCTAGAACCAGTTGCTGGTAAGAACATCTATCTGAGGGCGACGTCTATCCCG
+ACC
+>ds2020-328_475
+GGTCGGGATAGACGATTTCTGAGAGTAGACCACAAACGAGGCTCAAAAGGACAGTATCTG
+GCGAGGGCAACGTCAACATTGGTACACTCACGAATAGAGTCTAAGCCGTCAAGTGACATA
+AGAGACCTAGTTGAATCACTAGAGTTCAGGTTTGATGACTGCTTATCTAGAGGGATGGAT
+AGCAGCGTGATAGTAGCGCTACGTCAGACATATTATAAGAGACCTGACACGTCTATCCCG
+ACC
+>ds2020-328_476
+GGTCGGGATAGACGATGAGTGGCCATCTATGGTACTGACGTGTCAAGTTACATCATGTCG
+CAGTTCGCATTCTACAACTGTGAGGAAGTACTGCCGGCTCAATTCCCAGTGGGGCCTGAT
+GCGAACGACAGAAACGTTACGGCAAAAGTGCAAGGAGTGTTGGAAGGGAAGGAAGCTTTC
+TGCCTCGACTACGAAGACTTCAACAGTCAGCACTCAGATGAGGCAAAGGCGTCTATCCCG
+ACC
+>ds2020-328_477
+GGTCGGGATAGACGTTGTTGGGTAGTGTGGAAAGGATTTTTGATAAAACGATATACTATA
+TTTCACACAATACAACAACTACCAACACATTACTAACATATTTTACACGCACATTTCACA
+GCATGCCGCTCACCAGTGAACAGAAGCTGGCATCTCGCCAAGCCAGAAAGCACCACCAAC
+ACGGTCTGGTAGAGCTGGCAGCGTATAAGCCCTCCCTCTCGTCTATCCCGACCGCCGTAA
+TTC
+>ds2020-328_478
+GGTCGGGATAGACGGCAGGTCGTGGTTATTTTCTAGCTAACTATAGCTTACATCCCTGCT
+CGGGAACCGCGGTAGTTGCCTATCCGGGAAAAGCACGTTATGACGTCTTGCTAACTCATC
+ACCATTAATCACCCCTCGCTGGTAGTCTCGTTGGGCACAGTCAAGCATAGTTTTCGCTGA
+CGCCAAATTGGGCACTAATTCGTGGTCACGCTCTAATATGCCATCGAATCGTCTATCCCG
+ACC
+>ds2020-328_479
+TGAATTACGGCGGTCGGGATAGACGGCGTCGGACGGTGGTTCGTGGATGATAGTGTGAAT
+GTCAAGGTTGTCAGGGATAACGATGCGTTTTTGTCGTTTAGGATGAGTCGGCTTTTTGGA
+TTGAATGTCTGTGCTATCGTTGTGTGTGTTAATCGGTTTGCTAGCAGGCAGTTTGGCTCG
+CTCGTCATCGCTAAGCTTGGCTAAGAAGTTATCATGAGGGGAATCTATCGTCTATCCCGA
+CC
+>ds2020-328_480
+GGTCGGGATAGACGTCGCAGCTCCTTGGTCGGGATAGACGTGAAGGTAAGGTAACGCTGT
+GATTCCTGCTCAAAAAGCAGACCGAACGCGTTCGAGTTATTGGCTCGTCCAACACGGCTG
+CATTCATGAATCGCTCGTTCAACTGTCCCTCGGAGACACGGTCGAGAAGTACCATGTACG
+GTTGCCCCCCGTCCTTTCTTTATCTCGGTCCCACCCAGCAGCTGCGTCTATCCGACCGCC
+GT
+>ds2020-328_481
+GGTCGGGATAGACGAGTAGAAGGGGTAAGACTGGCTCTCGTGGTATAAATCGTTCTACGA
+TTAGAAGAGCGGGGTATGCTTGGGAGTTATCTCTTGCTTTTAGGCTAACCAAGCGAAAGG
+TGGTTATTGGAGCGTAGGTGTTAAATGTAGCCGTCTCCCTACATTGATCACAGCTATCTG
+CCGGCGCAGGCAGGGGTATTCTACTTGACACTCTTCATTAGGATCTTACGTCTATCCCGA
+CC
+>ds2020-328_482
+TTATGATACGAACACTAAGCCAAACATTTATATGGATTCCTAAAAAATGAAATAATAGAC
+TATCATGTCATAATATATGACAGAAGCATCACTCTGTCTGTTGGATGCCCTTCTTCACTG
+CAAACATTTATGTGTTGCCCTTTCTTTAGATTGAAGATCGAACTGACAACCATCATCCTA
+TCTTATTCCTATTTTTACTTTACAGGCACAAGAAGGAGTACTATTATACGTCTATCCCGA
+CC
+>ds2020-328_483
+GGTCGGGATAGACGGAATTAACCCATGTAATGGCACAATCGAAGGCTCTAGCCGTGGCCG
+TTGCACGGATAACGAGAGGGAAGGGGCGGCACGACGCATCTGTAGAAGATTTCATCTTCT
+ACATAGCCTCAAACGGGCGTGCCGTCTCCGCTTCGGATATACCATCCGGAGTCCATAGCT
+TGGCTTGCGGTCCTCGTGACCATGTGGAACCCTCTGAGCGTTTACCAGCGTCTATCCCGA
+CC
+>ds2020-328_484
+GGTCGGGATAGACGATATATCTGCCTGGTCGGGATAGACGTGGACATCCCTTGGTCGGGA
+TAGACGCAAACGGTCTATGTCGTCTATCCCGGAATCCACAGCAACGGCCGCCACTATCTC
+CCTTGCATAGTATTTGTTGCGCAGCGAAGCTGCTAGCCACATAGGCATTCCTCTTGACAC
+TGAGTCATCTAACCGCGACTCAAGCGCTTCCAGGAGGTCCCGCATGTCGCTAGAAGGCTT
+CG
+>ds2020-328_485
+GGTCGGGATAGACGTGAGGGCGGCTATTTTAGGTAGTGTTATAAATGCACTGGCTAAACC
+TATTGATGGTCGGGGCGAAATTTCATCTTCTGAATCTCGATTAATTGAATCTCCTGCTCC
+TGGTATTATTTCGAGACGTTCCGTATACGAGCCTCTTCAAACCGGACTTATTGCTATTGA
+TTCTATGAGCCCTATAGGGCGTGGTCAGCAAGAATTAATTATTGGGTCCCGTCTTCCCGA
+CC
+>ds2020-328_486
+GGTCGGGATAGACGTTTTTGTGCCATGCGTTGCCTCGTGCCGCGTTTTAGGAACGTCAAG
+TTTTATTCTTTACGTGTTTTTTTGGGTTTATTTATTTTATAGTGTTTTTAATACCACTTT
+CACAAGTGAGTTTTTAGTTTTATCGCATCGTGCGATGCCGCTGTCAGCTCACAGCTGATC
+GATGTCCCGTAGTCTCTAGACCTACAGACCCATGCTACGCGGTGTACTCGTCTATCCCGA
+CC
+>ds2020-328_487
+GGTCGGGATAGACGATGCCAAGTAATATATCATCAGATGCAATATCGGGTCTAGCAGAAG
+ACCTAAAATGGAGAGTGGAGCCTGGGAGTGTGAGTGAAAGAGAGGTCAACATTGAAGATA
+GCAGATGGCTAATATTAGCAGCAATGGCACCAAAAGCAAACTTTGACGTAGAACAATTAA
+AGTTGCTTTGTAAGCACTTTAATGTACCTATAGACATGCGAACGGTGCGTCTATCCCGAC
+C
+>ds2020-328_488
+ACGGCGGTCGGGATAGACGTCATGTGGTCCTCCTATTCAACTACTTCAACCATTTTCGAA
+CACCTCATAGCATTTTCCGAACGTTCGAGGCTTCTATCATTTATGTATTATTTGATTTCT
+CGTACACTGTCCCTTCTTTTGAATGGGTTTCGAATAGAAAAATAATTTATTGGTCTGTAA
+CCCGACCTAGTTTAATCCATGGACTCAATTCGGTTATACCGGAACCACGTCTATCCCGAC
+C
+>ds2020-328_489
+TGAATTACGGCGGTCGGGATAGACGTAGTCAAGTAATTAAGTGCATGTGGTGGATGCCTT
+GGCAGTCAGAGGCGATGAAAGACGTGATAGCCTGCGAAAAGCTCCGGGGAGGCGGCAAAT
+ATCCTTTGATCCGGAGATTTCTGAATGGGGGAACCCACCTACTTTAAGGTAGGTATTGCA
+ACATGAATACATAGTGTTGCAAGGCGAACGAGGGGAAGTGAAACATCTCAGTACCCTTAG
+G
+>ds2020-328_490
+TGCCGAAGCGATTTATAAAGCACAGGCTGAAACAGGTGAAATCAAAGGGCATTACTTGAA
+CGCTACTGCAGGTACAGTAGACGAGATGATGAAAAGAGCTGCATTTGCCAGAGAATTGGG
+GGTTTCTAGTGGCGGCCGTTGCTGACGGCGGTCGGGATAGACGAGAATACCGGGTGTCGG
+GATAGACGAAGAAGCGCCCTGGTGGGATAGACGATACCCATCACGAGCGTCTATCCCGAC
+C
+>ds2020-328_491
+TGTATATACCTGCCATGTGCTCGTGGCTGTGCCTACTATTGAAGTCGGGATAGACGTAGG
+AGCTGAATACCGACGACACTCTGCATTTATCACTTCGCATCATCATCATCTCAAAGAACT
+TTTTATTATTCAAGTTGATGTCTATACTTGGGTGGTTCAGATGTTTCTCCACTGGTGCCA
+TGATCCAATTTGAGTAAATATAATGCCAGATTGATACGCCACCTACCCGTCTATCCCGAC
+C
+>ds2020-328_492
+GGTCGGGATAGACGTCATGTGAGACTCGCTGCCCACAGTGCCACGCCCGTGAGGAATGAA
+TTAGTTGCCTCCTTGGTTATTGACAGCGCCAGAGATACACTGTCTGAATTAACGCCTAAG
+ATGTCAACTACTTCCTTAAACGAAAAGTGGACGTGGTGCGACGCCGTTATCTTAGTGTGT
+TTGGCTGAAATTGCTTCGTGTAACAGCCAACCTTTACTTAGCTTTCCCGTCTATCCCGAC
+C
+>ds2020-328_493
+GCCGTGGACCTAGTGAATTTGGCTCTGCCGTGGACCTAGTGTTGGCACATCTGCCGTGGA
+CCTAGTGTGTCTACGCCTGCCGTGGACCTAGTTTTAACAGGCTTGCCGTGGACCTAGTAA
+CACTTAACCTGCCGTGGACCAAGTGGTACAAAACTAGGTCCACGGAGAATTACGGCGGTC
+GGGATAGACGGATCGGGGGGGGTCGGGATAGACGTTATCTATTTTGCGCGTCTATCCGAC
+C
+>ds2020-328_494
+GGTCGGGATAGACGGATGGTGCCCCTATACCCAAATTTGACGATCGATTTGCACGTCAGA
+ACCGCTGCGAGCCTCCACCAGAGTTTCCTCTGGCTTCACCCTATTCAGGCATAGTTCACC
+ATCTTTCGGGTCCCAACAGCTATGCTCTTACTCAAATCCATCCGAAGACATCAGGATCGG
+TCGATGATGCACCTTGCGGTTCTCACCTCCGTTCACTTTCATTACGCGTCTATCCCGACC
+>ds2020-328_495
+CCCCAGGTCCTCTGACTGACGTCGTAATAGACTGCAGACTTGTTGCCTGGCATCGGGGCT
+ACATACGCTTTCACTAAATTGCCGTACGCACAGACATTTATATCACCTTCAAAAACGCCG
+TTCACCATTCCCATAAACAAATGAGTACTATCCTCGACTGCTACTAACTTTAACTCGTTC
+ACAGTTCTGCCTGACGCTCTTAATACTACGATTGATGCCGGCATATCGTCTATCCCGACC
+>ds2020-328_496
+GGTCGGGATAGACGATGGAGAAAGCCCTCGTCGCGAAAAAAAAGATGTTCGGATAACTCT
+TGGAGATTTACTTCTGCGGGTAGGTTCACGTTCCCATCCGGAGTAGTATCTCTATAGACT
+CTAAAAATTATTGAGAGTTGTTCCACTATTTTTTCTTTAATAACATTCATGGTTACATCA
+GTAACCTTTGTTTCTATATTCATACTATCCATTAGATGGAGCATGGCCGTCTATCCGACC
+>ds2020-328_497
+TGAATTACGGCGGTCGGGATAGACGACACCACCCCCTTGGAAAGGTGTGGTTGGCCTGGC
+TAAGGGCCTTAGGAAGACCAAATCTGCATACCCGCTTGTGGTGGCCGTCCTGCCTGATGT
+TCCTGAGGAGCACCTCCAGATTCTTGAATCTCAAGGATGCATTGTGCGCCAGATTGAGCC
+TGTCTACCCTACTGAAAACCAAACCCAATTTGCCATGGCCTCTTCGTGTCTATCCCGACC
+>ds2020-328_498
+AACTGCCTCCACTATTTTTCGTAGCTATTCTTTTATTATTTTCATTTTAGTGAGTTTAAA
+GTTATTTTCTAAGTTAGATGTAAGGCTTAAGGAGGTTAATTTTTTAATTTATTTAGTGGC
+TCCTATTTTTATGCTTTTGCTTTCTATTTTTTTATGGTTTATTTTCCCTTTTGGTGGTTT
+TCTCTATTATTCTAGCTATTCTTTTATTATTTTCATTTTAGTGAGATAGTGGCGGCCGTT
+>ds2020-328_499
+GGTCGGGATAGACGGGCAGGTCATATGGAAGCGGCATATCTAGTTGGACTACTTGGCATG
+TGCGGAATTGGTCAGTCAAAAGAGGATGCATTAGAATTCTTGTGTTCTTTGAATCAACGT
+AACAACATTGATATGAAAGGAACCAGGGATGCTTTGAGACGAAGATTACGCGGAATTTTC
+TCTGTTGGAAGACATATCGTAGATATGTTCGACCATGGGAGGGTGCCGTCTATCCCGACC
+>ds2020-328_500
+AACGGCCGCCACTATTGTAATCTTCTATTTGAAGTGTTGGTTTGCAGAGAATGCTTTATG
+TATTGTGAGTTGTGATCACTAGTAATCGATGAATTTCATTCCACAAAGAGCCTCCTTCTT
+GTTTCTTGTTCCCTTCATCTAGTTTGGTTTTCTTTAACACAATCCCTCAAGACACTGAAT
+GAGAAGCCCTTTGACTGGTTTGGGCGCCAAGGGAATGGAAGCGACGTAGTGGCGGCCGTT
+>ds2020-328_501
+GGTCGGGATAGACGACGTCCGTAGCTTTGAGGTCGTAGTAGTTGGAAGATGAATTACAGT
+CGTCGAACACTACCTGATGGTGAGGATGATGATTTTGAGTTTGTGGAGGAGGCGGGCTCA
+GTGATTTGCTCATCTGTTGATCTCGGAAATCGATGGAGGTGATGGTGGAGGACTCGGCCG
+GAGCTAAGAACGAGTCGTCGCCGAGTTGGACTTGTTGCTGCTGATTAGGAAGCGGTACA
+>ds2020-328_502
+TGAATTACGGCGGTCGGGATAGACGTAAGGTGTCGGTTGTGGTTGGGGTCATGTCAGGTA
+TGGGGAATGCTGGTGGTGGTAGCAGTGGCAGCTGTAGAGGCAGCGCTATTGGTTCCGGTA
+GTGGTTGGTTTTAGTGTTGAAGGTGGCAGTTATGGTGGTGGTGGGGCCCTTTGGGGGTGG
+TCACAACAGCATGTAGGTGGAAGGGTTGTGACCAACTCCCCAGGGCGTCTATCCCGACC
+>ds2020-328_503
+GGTCGGGATAGACGACGAGTGCTATTTAGTGGGAGTTGTTGGTGAAGTGCACTAGCCAAA
+AGATGAGTTTTTAATTACAAGTGCTATTGGCATAAACCATATTCAATTCAAATATTCCCC
+TTCCATTCTCCCTATAAATAGCACTCCAATTCTAAACACAAGGGCATTCACAATTCATCT
+CATTCACTTCATCCTTCCACAAACACTCCATTCATCCACCTGTACCGTCTATCCCGACC
+>ds2020-328_504
+AGTGGGTAGAGACGAGTGTGGGCTGTGCGTGTTGTGCGCTTGTTTGACACTTTAAGATAA
+TATGTTAGTCTTGTGTGCGATAGGATGTCCTGTGCCCGAGACGCACAAGGTATACTGGTT
+TCTGAAAGGCCTAGGCCCAAACTAACAGACTTTCGTCATCACCATCATGGCAAAACATCT
+GATACCCTCTCTCAAGGAGATTATTCCCCAATTTCCGAGTAACACTTCTTCAGTCCTAC
+>ds2020-328_505
+AGTGGACGATGTGGGTGTGTTAGAACAAGATTGCTCTGCCGTTGCGCAATAGAATTCTTT
+CTCCGATATGTACCTTCCATCCGGGAGTACCTGTTTATCAGTGATCTCTTGGAAACCAAC
+ATAGTCCAGTGTACCAAATAGTGGTCGGATCCTAGATTTAAAAGAGTCATTCTCCCTGAT
+CGAGCGGGAGTAAGAAGAAGAAGGAGCACTTTCATCTTCCGGGCTTACACGACGAGACC
+>ds2020-328_506
+GGTCTAGATAGACGCTTATGACTGATTTATTTAATGATGCTGTTCTGGGAAACAGGGGGA
+AGGCTGTTAGCCTATCTCAATCTGGTTCCACAGTCTACCATCTTTGCTTTGCTGATGACT
+TGCTTCTATTTGCTAATGCTAGTACCAGGATCATGAAGGATTGTTTGGATAAATTTTGTC
+TTGCCTCTGGCCGCTTTGAGAAGTCAATGATCTACTGCTCCCCTAATGTGGACTCGGTT
+>ds2020-328_507
+CGGTCGGGATAGACGGTTACACACCCAGAGCGGCTTCATGCTAAGACTGATCGGTAGTCT
+GAGCTGCTGGAAAGAGAGTAGTCTGACCAGTATGGCTAACGCGTTAAAGAAATCAGTGCG
+AGCAGCGAAGCTTCTGCAGAACAATACAGCGTTAGATCTTCTGCCGATATTCGAGGCGGA
+GGTGTTAATTAACAGGGGAATAGGTGCAGTGGACTGGGGCAAAACGTCTATCCCGACC
+>ds2020-328_508
+TGAATTACGGCGGTCGGGATAGACGCAAATTTCCTCTTCATTAAAACATCATCATACACC
+GTCCACAAATCTTTATTTAGATCCGTTCTCTTTCGACCTCTCGCGCCACACCTCATCTGC
+AACATGAAAGATAATAAATCTCTCATGCACTCTAGGGGAGTAAGGCACATCTTCTTATAT
+TTTCCTACAATTTCTTCAACTTCAGTCAACAAAAGAGACCCCGGCGTCTATCCCGACC
+>ds2020-328_509
+GAATTACGGCGGTCGGGATAGACGATTCGTGGGTCTAGACGATGGACACTCTACGGTCCT
+GCGGTGAGGGGCTTCGTATTGTGGAAGGTCCAATGATTTCGAAATTATTTCTATATAATT
+CTCAATTTGAATATTATTGAAGCTAGTAAAACGTGAAAACCTAGCAGGATAGATACTAAG
+ACTGGTTAGTGAACAAGTTTAGTTTCTTTTTCAGGGCTGCGTCTCGTCTATCCCGACC
+>ds2020-328_510
+GGTCGGGATAGACGTCCATTCCCCCTCGTTACACCAGGTCGGTATCTACCAGACATCTTC
+ATCATTTCATTCAACATATTTTCATCGATAGACCCGTATTCGTTGATTGTCTTTGCATTG
+AAACCATCGAAGCTGGCAGTATCATTTACAACTTTTACATCGAGTCTCCCGAAAGGTGAC
+ATTACGTTAGAAAACAACGCTCCACGTCTTTCATGTTCTCTATGCGTCTATCCCGGCC
+>ds2020-328_511
+GAACAACTGATCTGTTATTGTTTGTGATAATATGGAGGAAGCTCAATGGTGTGCTAGAGC
+GGGAAAGATAACGATGGATGGATCTGGTGATTTGCTTCTGTATTCCTGGAAACAAAAGTC
+TGGGAAATAATTCGAGGAAGGTGGTGAGTTACGCGGGATGGATTGCAATATTTGGGTTGC
+CGGTCCCTAAATGTCCCGACCCGACTCCCCTAGCACCCACTGTCCGTCTATCCCGACC
+>ds2020-328_512
+GGTCGGGATAGACGAGTAGGGGCCATCAAGGAGAAGAACGCCAGGGAAACCATCAAACTT
+TGGCAACGCAGTTGAGATTGAATGGACGTTAATGTCATCGGTTGCCGGGATACGTTTGAC
+TCCACGTGCGTTGATGGGAATGAGCTGATCGGCTGTGGCGTCAAACTGCATTGGTGGGCC
+GATATCAATTGTCGCTGGCTGGGGGAGTTTCGTGGTACTTATGACGCCGCGGCTGGTT
+>ds2020-328_513
+GGTCGGGATAGACGCCAGACACATCCATTTGCATCAGGGACACCCAATCCACCTTGACTT
+TCCAGCCCACGAATAACCTCACGCGGCAGATCTAGCCATTCTTCGTCTATTTTGACCCGG
+CACCAGTGGCTCAGAGCACCTATAACACATCCGCGCGCTATATCTTGATCGAAGCCTCTG
+CGCTCTAGTTTGTGCATTTGATCTCGGATACCAGCAACTCAGATCGTCTATCCCGACC
+>ds2020-328_514
+GGTCGGGATAGACGACCTTCCCCCTTGCTCTCACGTTCGAGTGTTTGCTCGTCGTTTAGG
+CCGGTGAGTGAGATTTCTGCTCATTGCAGTCACCTCCGGGGTTCTTCGCACCTGGATAGT
+ACCAGGACCCTTGTGCCCCGGCCCTTGATCAGATAAAGCTGCCCGCCCTATGACCCACAA
+CTAAAAATGAGCCTTGCGACGAGACGCGGGCAATCCACATGCTGCGTCTATCCCGACC
+>ds2020-328_515
+GGTCGGGATAGACGGATTTCTCCAATGTCTTTATTGGTTGGTAAACCCAACTCGAAATTT
+CCGTCTTCCTGAATTGGGAGAAAGCAGAAGTCTCTCTCTTTTTTGGGGGGAGCAGAGCTA
+GCTATTGAACAAAAAGCCCTTTGCAATGAACAACAGGAATTCCTTGATACTTTATGGGGA
+TCCCACATCCGCTGATCTACGATTTATGCATAGTGACCCGTTTCGTCTATCCCGACC
+>ds2020-328_516
+GGTCGGGATAGACGATCGCCCTTGGTTGGTGACACATGGAGGAGAGCTAACTAAAATAAA
+ATGCGACATGGAGGACGTGGTAAGGCTGCACGAGATGACTGCGAAGACAGCGGCGTCGAA
+ATTCAAAGGATGGAGAATCAGCATGGGAGTTGATGAACTAGAGATGATGAGAAAAACAGC
+TTTGATGGTCCACAACATACTAGAAATGTTCCCCAGAATGGCGAGGAATGAGAGAGA
+>ds2020-328_517
+GGTCGGGATAGACGGGAGATAACTCTCTTCAATTATTCCTGGGATGGGAGGGAGTAGGTC
+TTGCTTCATATTTGTTAATTCATTTCTGGTTTACACGACTTCAGGCAGATAAAGCAGCTA
+CAAAAGCTATGCTTGTCAATCGAGTAGGTGATTTTGGATTAGCTCCTGGGATTTCGGGCC
+GTTTTACCCTCTTTCAAACAGTAGACTTTTCAGCCATTTCTCTCGTCTATCCCGACC
+>ds2020-328_518
+GGTCGGGATAGACGGCTTCTCTACTTGCTTTGTAGTCTGGTACTACGACTTTGTACCACT
+CTTCGTTCACTTCTGGAACCTTGTCTTTCAATTTCCAAACCATGTTATCTACATCGGGCA
+CTCCTAGCCCGTTGTCTTCAACGCGCCCATGTATTATTGTCTGAGGCAAGTTAAGCCATT
+TTTCGCCATCTTTTACTCTGCACCAGTGACTTATGCACTGTAGCGTCTATCCCCACC
+>ds2020-328_519
+TGAATTACGGCGGTCGGGATAGACGAAGAGATACTGTCTGGCATAGGACACTTCCGTGTC
+GGTAACTATTCGGTACCTGTGACTGAAATATGTGGCGGTGGGGTCCGTGCTCTGTATTTA
+GATGTCATGTATCCTGTGCCCTTGCTGCCCCCCCTCGTGAAACAACGTATTGCGGCCATG
+TACTCCATGGTGGCCTCTTACGACTACGGGGGCGTCGACGGCACGTCTATCCCGATC
+>ds2020-328_520
+GGTCGGGATAGACGTGGACACGTATTTCACCTCTGACTATGAAATACGAATGCCCCCGAC
+AGTCCCTATTAATCATTACTCCGGTCCCGAAGGCCAACACAATAGGACCAGACTCCTATC
+ACGTTATTCCATGCTAATGTATTCAGAGCATAAGCTTGCTTTGAGCACTCTAATTTTTTC
+AAAGTAACAGCGCCGGAACCGCGACCCAGCCAATTAAGACCAGTAGTGGCGGCCGTT
+>ds2020-328_521
+GGTCGGGATAGACGTACACCGCTGCTATCATCACTATTATCATCAGCCGTTACCACTACT
+TTGAGTCCCGAGTCTTCGCCTTTGTTCTTGCGGGTATTGGCAAACCGTGTTTCGAGAATG
+CGCATGCTTCGACGCTTCGGGATCACGGGAACTTCCTTACCCTTGCCTTTATTTTGGGAA
+GTACCTGTAAAATAAAATAAAATGTATACTTACTGTAACACCCCGTCTATCCCGACC
+>ds2020-328_522
+GGTCGGGATTGACGGCAGAAGTTGCTCTCCTTCATGAACACGAGCGAGCTTAGAGAATCC
+CCTCAAAATGTGATCCTCCGAGACATCGTGCACGATCCCGGCGTCTACGAGTTGTGGGAA
+CCTTCTAAAAATACCAGAAGGCGACATAACTTGGCAGGAGAGTTTGTTCTCTCGGAAGGT
+TTGAGCGAAATCGCCCGTTATGGTGGATACCAGAGTAAGACCTCGTCTATCCCGACC
+>ds2020-328_523
+GGCGGTCGGATAGACGTCTCCTCCATGTGGCACCAACCAAGGGAGATTGTCCTTTATTTT
+CTTTATTGATTTGGGTCCCAGCTTGCTCACTCTCTTTATTGTGGCCATTGCTGCGAAGAA
+TGCTACAACGCAGTACACCACCACATCTCCGAAGGCCCCGTACATGTACGTGAAACTCAA
+AGCTTTCGACGCCAGTAAGCTAGCCTGGCTTACTTGTTCGACACGTCTATCCCGACC
+>ds2020-328_524
+GTCGGGATAGACGCAAGAGATCGCTCTTCTCTAGACATGAATCAGGCGAGTCCGAATGCC
+TTTCTCTTTTGTCAGCGGCTCCTACCACATTTCATAGAAAGCCTATATCTTATATTATAG
+CGCGTACAAGAACTAGTGGTGGGCAATCTTCTCTGCGCTCTTTGATCTACCATAGATCCT
+TAGTGGTGGACCGATCTCAAGCCCTATCGTAAAAGACACACCTCGTCTATCCCGACC
+>ds2020-328_525
+GGTCGGGATAGACGAAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGCAGAACAACAACGAT
+AGACTCAGCGAAACAAGACGCTGAATCATATTGAATTGGATTTATAGAGATAAGGTGATT
+CCGATTCCAATTCCGATTCCGAGTCTGGTTCAGTTTTTCTCTCTTCTAAGAGAAAGAGAG
+AGAGAGAAAAGAGGGGAAGCTCAAAAGAGAGAAAGTAAGTATTTAGTGGCGGCCGTT
+>ds2020-328_526
+GGTCGGGATAGACGCCTCCTCTTTGCGATGATAAATGACCTACTTAACTCAGTGGTTAGA
+GTATTGCTTTCATCCGGCGAGAGTCATTGGTTCAAATCCAATAGTAGGTAAAACTTATTA
+GATACCAGTAGATACCAGAGTCAATTGTATCTAATAAGTTTTTCTACTTATCTTTTTTAT
+ATTAGTTTTTTATCTTTTTCGTCCTACCTTCAGGGGGTATTGTCGTCTATCCCGACC
+>ds2020-328_527
+GGTCGGGATAGACGGCTGTTAGTTCTTTCCGCGAAATCTCTAGCGTTTCTCTCCCCAATA
+ACCCCTTTGGGAATTTCCCCTACGTATGGAGCCATCGTCGCTTTCGCTTCGCTGCCATTT
+CATTATGAACTTGTCCGGGTACACCTCCACAGTCATAGATGAAATGACGGTTAACCGCAG
+CCGCTCGGTCCATATCCGCCTTACGAGTTAACCAATGCCCGACGTCTATCCCGACC
+>ds2020-328_528
+GGTCGGGATAGACGCACCGCCGGCTTGTTGAAGAGGGAAAGATCACTCCTAAATGCAGCC
+GTGATCTTATATACGATACCATCAGACGCGCCTCTCGCAGTCAAAACTCTCCTCGCCAGT
+AGTGGGACCAGCCGGGCCGGAAGCCTCGTTTCCTTCAACTAACTCAAGCGATTCGGTCAG
+TAGGAAAGTCATCTCACTGAACATTGGATTATATACAGGAACCGTCTATCCCGACC
+>ds2020-328_529
+GGTCGGGAGAGACGAATCGCCCCATTCGTATTTAGTCATTGCCTTGGCCCTTAATTGTGG
+GATTCTAGAGTTAAAGTGTTCAAATTCTTTCTTTCCCATTGCACACAAACTAAATATCTT
+ATTGCGTAATGTTGATTCTCTAGCTCTAAATTGGTCATCTTCTTCAAACTGGCTATAGTA
+ACTACCAGCAGGAGCCCACTTCCACCGAGTACTCCAAAAATTCGTCTATCCCGACC
+>ds2020-328_530
+GGTCGGGATAGACGATACTTGTGGTTCGGATGGAAATGATACTGAAACCGCTTCCAAAGA
+CTCAGCGATAGGGTAGGGCGTAGTGACTACTCAGATGAAAGCTTCGGAGGAAGCATGGTG
+TTAAACGAGGTTAGAAGCGGGTTCTTTGCTTCATATTCATTCTCGCCCACTTCGTATTCT
+TTATGGTTGAGTTTGTTCCACCTTCTTATACTGTGGAGCCACCGTCTCTCCCGACC
+>ds2020-328_531
+GGTCGGGATAGACGACTCGCCCCATTCGTATTTGGTTGATGCCCATGCCTGTATTTCTTC
+TGGTCTTGAAAGGAAGTACTCTAATGGTAGCTCTGGCATGTTGGATATCATTATAAATTT
+GTTTTTAAGGTTTCGATCAGTCCTCACTACATGCCGCTCGTCATCGTGATACTGCGAATG
+GACGCTGCCGGCAGCACTCCATTGCCATCTAGACCGCAAGCACGTCTATCCCTCCC
+>ds2020-328_532
+GTTGGGTGTAGCGGGTATCTCGATGTCAAGGCAGGGAATGGAATGTTTTGAGGCTAATAG
+GGCCTTTGGTGCCTTGCGAAGAGAAAGACCTTGAGTCTAAAACCATAGTATGGAAGGGGT
+CCAACGATCTTCTTTGGTTTGGCGCCTAGAGATGGGTTTGGGTGGGTTGTCGTCTATCCC
+GACCAGGACAAGACCCCGTCTATCCCGACCATGTCATTATGCCGTCTATCCCGACC
+>ds2020-328_533
+GGTCGGGATAGACGAACCCGTCCCCTGGTCGGGATAGACGCCGAGTGTGGATGAACGTCT
+ATCGAGAGTCGATCTCAAACCATTTGCACTTCGTGTACATTCTTTATGACGTTTGTCCGG
+GAAGAAATTCCTGGTCTTATATCTAAAAGATTGTCACCTCGTGTTAATGAAGTTTGTAGC
+CGGGGATCCTATTCAGGTTATACCTAATAGACCTCTGAAACATAGTGGCGGCCGTT
+>ds2020-328_534
+GGTCGGGATAGACGACACACTCCGGTGGTCGGGATAGACGCTTCCATCTGGTGGTCGGGA
+TAGACCATGGGTGTGCTCCGTCTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGG
+ACCTAGTCACCGCTGCCCTGCCGTGGACCTAGTGCTTGATCCCTTGCCGTGGACCTAGTC
+TTATCTCTGCTGCCGTGGACCTAGTTGCGCAAGGGGTATCATACTAGGTCCACGGC
+>ds2020-328_535
+GGTCGGGATAGACGCAGGTTCACCCTGACCAAAACATCCAGTAATAAGTCTTATCACCAT
+TAGCGTATACGTCAATTCGCTTCCTGTCGTTGACTTGTACTTCGTATTTGGATTGCCACT
+CGTCTGATATGGGTATTACGTTCATACCCTGCTGATAACAGGTCGCATCGCATTGAGGGT
+CTCCTTGATACATTCTTTGTGCCCTGAAGCAATATCTTTGCCCGTCTATCCCGACC
+>ds2020-328_536
+TGAATTACGGCGGTCGGGATAGACGTAGACAAAAGAGAGATTTTCGTCGTTTGTGGATCA
+CTCGTATAAATGCAGTAATTCGCGAGAATAAAGTATACTTCAGTTATAGCAAATTAATAC
+ACAATCTGTACAAGAGACAGTTGCTTCTTAATCGTAAAATACTTGCACAAATAGCTATAT
+TAAATAAGAGTTGTCTTTATATGATTTCCAATGAGATCACGGCGTCCATCCCGACC
+>ds2020-328_537
+GGTCGGGATAGACGTTAGCACGGGTTGGAGTAGAGATTCAGTTAGGCAGATAGGTGACGA
+TATGATGCAAACGCTCAGGGTATTGCTTGAGACGGCAGTTGTGGGACAAGAGAAGTTGTG
+TAGATTAGTTAAAGGGTACCTTTGGCTTCTAGAATGTATGGAAAGAGGTACTATAGATGT
+TACCGTGGATAGCCAGAATTGTGTAATTTATGGGCCAAATGCGTCTATCCCGACC
+>ds2020-328_538
+GGTCGGGATAGACGGTGTTCTTCCTTTCGTGTTATCTGGCTAGCTGTCCCTCACTCTGGC
+GCTTGGTCTATTAGTTGACCTTTTCAGCCGCTGACTTGCCCTCCTATAGCTTACGCTCAT
+ACGTTGTTCCGTGTTATACTGCGCTTAGTTACCGTTAGTCCTCGGAAATTCTCGCTTTCT
+CGGGGCTCTTGCTACTTGCCTTCTAGTGTACCTCCGGCCTGCGTCTAGCCCGACC
+>ds2020-328_539
+CCGATCTGAATTACGGCGGTCGGGATAGACGAACACTGGGGCTTGGGGCTGCGAAGTTGG
+GGCTTGGCCTATGTCGTATTTGGGTCTCCCCTTAGGAGGGAACCCCAGAGCGATCAAATT
+CTGGGATCCCGTCGTGGAAAAGGTGGAGAATAGATTACAAAAATGGAAGAAAGCATGCTT
+ATCCAAAGGGGGAAGACTAACAATGATTCAGGCAGAAACAACGTCTATCCCGACC
+>ds2020-328_540
+GGTCGGGATAGACGGTCGCTGCACATATCCTTTTTTATTCTCGGTTTTTGATACCCTTGT
+TTGTTTTAATAAAACAGGATTTGGCTCAGGATCGCCCATTTTTAATTCCAGGGTTTCTCT
+GAATTTGAAAGTTCTCACTTGGTAGGTTTCCATACCAAGGCTCAATCCAATATGTAGACG
+CCCCATCGCTGTCGAACGTCTAGCCCGACCAGACTGGTGGCTCGTCATCCCGACC
+>ds2020-328_541
+TGGATTCGGCGGTCGGGATAGACGCAAGGTGGCAATGTGTCTAGTATCAGTTTGTGTTTC
+ACTTGGGGTTGCCCTTGTTGGTTATGTGTCCTTACATTGTAGACTCTTACTGCATTTGGG
+TCTAACAGAGTTATGTCTATTTCGGTCTTGTCTGTCTGAGTGACAGGTTCAAGCCAATTA
+TATCTTAACAGACCAACGCTCGTCTGCCAAGGTGCTTTTCCCGTCTATCCCGACC
+>ds2020-328_542
+GGTCGGGATAGACGAAGTACGGACCTGGTCGGGATAGACGTATATAAGCCCTGGTCGGGA
+TAGACGCATGCATACGGTGGTCGGGATAGACGTCGCATGTATATGGTCGGGATAGAAGGC
+TGCCGGTTACGTCTATCCCGGACAGAGAGCCGTGGACCTAGTACGACATACTTGGTCCAC
+GGCAGAGAGACGATGACTAGGTCCACGGCAGGGAGAACTATACTAGGTCCACGGC
+>ds2020-328_543
+GGTCGGGATAGACGTGTCATACGGCTCCGTCCCGGAATCGGGACCTTTCTTTCAGAACCT
+TTGACCAACGGGTCCTCGAACCAACCTGTCCTCCCCCTCGGTAAGCGGTTTCTTTTCATT
+CATTCATTGATTGATTCAAGGTAGCTGTAGCTTGCTTCCAAGTCCAAGTGCTAGCGGTAG
+AAGCTAGTCGCCAGAAGCGAACTTCCGGGCCGGGAAGGAGCCAAAAAACGTGAGC
+>ds2020-328_544
+GCCGTGGACCTAGTCGTTCACTTACGAGGCCACGGCAGGAGCATCCTCACTAGGTCCACG
+GCAGGGGATGTGGCGCAATTACTAGGTCCACGGCTCTCTGTCCGTGTCGGGATAGACGCA
+CTAGCAGACTGGTCGGGATAGACGTGGGAAAGTACTGGTCGGGATAGACGGTACCCCCCC
+CTTATCGTCTATCCCGACCAGGGAGGTTTATCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_545
+GCCGTGGACCTAGTTTAGATGGCCTGCCGTGGACCTAGTGCTCGCTTCGCTGCCGTGGAC
+CTAGTTAGCAGGCAGGTGACTAGGTTGAATTCGGCGGTCGGGATAGACGGGTTCCGGGGA
+TGCGCATAGCGGGAACAGAACTTGAAGCTTTAGCCAAGTCTGGGGCAACTAACGACTCGC
+ATGAGTCATACATACTAAATAGGTTAATATCGTGGTTTATCGCTAAGATGTATCA
+>ds2020-328_546
+GGTCGGGATAGACGGAGGCTTCTGCTTGTTTATTGTCAAACCAATCCCCCGCCCCCTGAA
+CACACTGTTAATTGTTATGAGAATTATAGTACAACAACCCTTATATGAATGGGTTTTGGT
+CAATTGGCTATGAATGGTTCGATGCAACAGTCCATCAGTGGGTACTATCACTCTATCAAC
+CAAATCCATATCCTTCACTGCCTGCTTTACTTGTTCTGACCGTCTATCCCGACC
+>ds2020-328_547
+CTATTCTGACCACTTACTATGGCTCTTCTCTCATTTGATTTTGGAATCTTATTTAAGCCA
+AGATTAGGCTATCGATTGGAGGAAGAAAGCATGCCTTTGTTGGTCACCATCACCACCATC
+GTTAACATCGGTACACTCCTAAATAAGGCCTACCTCCCTTCCATTCAACCAGAGCAGCGA
+TGAAAACAGAGACTCAATTAGCTAAGCAATGCATCAAACTCGTCTATCCCGACC
+>ds2020-328_548
+GGGTCGGATAGACGGGGTGTAAGTTTAGGAGACGTTCTGTTAATGCGGTAGAGCCGGCAG
+TTCCAGAATATCTAAAATGGTCAGAGGTGCCGATTACTTGGAGCAGGGAGGATCACCCGC
+CCAGAGTTGATAATCCGGGTCATCTGGCACTTGTGGTAGCACCCCAAGTTGGAGGATATG
+CTCTCACTAAGGTTCTGATGGATGGTGGAGGACATCGACTCGTCTATCCCGACC
+>ds2020-328_549
+ATTACGGCGGTCGGGATAGACGTGCATCCTCACTTAAAGTGCTTTACAACCATAAGGCCT
+TCTTCACACACGCGGCATGGCTGGATCAGGCTTTCGCCCATTGTCCAATATTCCCCACTG
+CTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAGTGTGACTGATCATCCTCTCAG
+ACCAGTTACTGATCGTCGCCTTGGTAAGCCCTTACCCCACCAACTAGCTAATCT
+>ds2020-328_550
+GGGCGGGATAGACGAATTCAGAGTGTCTTTCTTTGGAGGCCCCCAATGCCTAACCTAATA
+GGGGATTCCCCATAGATGGATCAAGAAAGTAGGGCTCTTATCTTTCAACGCCTTTCGTGG
+TTTGGGAGGAAATCTCAAGAGTCCGCCCGAAGAGATGAAGGAATGAATGCGTAAAGTCGA
+GAGTACGCCGTCTGGAAGCGGGGCTATTAGGGGCCACGCACGTCTATCCCGACC
+>ds2020-328_551
+GGTCGGGATAGACGCACTCAAGCCCTCAAGTCCGCTGGTGCCATATCCGCGAAGACATGG
+TTACCCCAGTTGGCAGCTGGAGCATTACGCTTGGGCAATTTTATATTGTTTTACAGTGTT
+TTTGTTATTGAATTTTGTCGTATTTGTTTGCCACCCGATCTGCCCGATAACCCAGTAGCG
+GTGGTTCGTCGCCGCGCCTACTTCCAAAACGTCCGCACACCGTCTATCCCGACC
+>ds2020-328_552
+TGATTTAGGCGGTCGGGATAGACGACAAGTATCCCTAGGTCGGGATAGACGCCCATTTAC
+CCTGGTCGGGATAGACGCCTTGAGCCTGTGAATTCGTCTATCCCGACCGCCCGGACAAGA
+GCCGTGGACCTAGTGTCCTCACGCCTGCCGTGGACCTAGTATCTAGTCACCTGCCGTGGA
+CCTAGTGTCTCGCGTCCTGCCGTGGACCAAATCTTGATCAACTAGGTCCACGGC
+>ds2020-328_553
+GGTCGGGATAGACGTATCAGCCACTTAATTCGGCCAGACAGATGTGAGTAGTAGAACTCG
+GCTTGCCCTTTTGACGAAGCAGAATGGTAAAAGACGTATGGCTTTGCGAAGTAGTTTTCT
+TTGTTGCGAAGTTCCAGTCTGTTAGCCTCAATCGTGAGTTCCTCTTCGTCTCTGGGGAAT
+CCGATCTCGATCTTGACGTTTCCCTCAGACTTGTTTCTCGTAGTGGCGGCCGTT
+>ds2020-328_554
+GGTCGGGATAGACGCTTGCAACCCCTAACAATTTCCCTTTCTGATTTCAAGACACTCAAA
+AACTGACAAGATCCGAAAGGTGGATGCTGCCTGCCAAAACTGAAAGAGGGTGAAATATCA
+CTCAATCTGGCCCGCACAACCAAAACACCACCCAGCATCCTCAGACAACTCAAATTCCCC
+AACCCCGCTCCCTCCTCCCCCCCGCCCAACACAACGCGAACCAAAACGGCTGTA
+>ds2020-328_555
+GCCGTGGACCTAGTAGCAATCTGGATAGGTCCACGGCAGAGGTACTTCGACTAGGTCCAC
+CGCACGGGAGTCCGTACTAGGTCCACGGCGGGGGAGTCAAACTAGGTCCACGGCTCTCTG
+TCCGTGAATTACGGCGGTCGGGATAGACGATTGTTATGTATCTAGACGCTTAACCCCAGT
+AAACGTCTATCCCGACCAGGCAGCGCAACCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_556
+TGAATTCGGCGGTCGGATAGACGGGCGAAAATCGTCTATCCCAACCAGGCCGCTGTTCCG
+TCTATCCCGACCAGGGAGCTCGATCGTCTATCCCGACCGCCGTAATCCACGGACAGATAG
+CCGTGGACCTAGTGCGTCGGGTTCTAGGTCCACGGCAGTGAATGCTATACTAGGTCCACG
+GCAAGAGGTACGAAACTAGGTCCACGGCAGCGAATGTGACACTAGGTCCACGGC
+>ds2020-328_557
+GCCGTGGACCTAGTATAATTGGGGGGAGAAGAAAAGAAAGGGATGGGAGGGAGGGAGCCT
+ATCACCGCTTATGGCCCGCTTCCTATTTTTTAATCAATTCCTGGTTCACAGGCGAATAAA
+GCAGCTATCAAGGCTATGCTTGTCAATCTAGTAGGCTCCTTAGTGCTTGCGCTAAGGTAG
+TTTACTTGCTTACTTGTTAAGGAACAAACTCTTCTTTTTACGGCTATCCCGACC
+>ds2020-328_558
+GGTCGGGATAGACGCACTACGCCCCTACATGCGCTGAAAAGCGCATATCCATGATTTGTA
+TATGTTCTGAGCTATAGCTCATGTAAGTTCCTCAGTCCTATTGAGTGGGTTATGGTTTTG
+CATAAATGCATTTGAATCAGTTAAATACCCTCCAAATTTTTCATAGAATTTTTGTTTAAA
+GCAGTAATACAACATGGCCGTTTTTTCAGGCAACAGATTCGTCTATCCCGACC
+>ds2020-328_559
+GGTCGGGATAAACGACACCCATTACTATCATCCCATAATTCCCCTTTTGTTAGTCATCTT
+GTCTAACTCCCTTTCGCCAGTCCCGAATCACCCAATAAAAACCATGTGCACTGGGATCCC
+TGAGACCTGGTACCTGCCAAGAGTTTAGACTCAACTACACAAAAGACTATATCCATTACC
+CTCTTTTCCACTATCATCTCCTCCACCCAACTACTCCAGCGTCTAGCCCGACC
+>ds2020-328_560
+GGTGGGGATACACGAGGGGGGGTTATTCAGAGCGGGCTCAATGGACAACGGGGATGGAAT
+AGCTGTTGGGTGGTTAGGACATCCTATCTTTAGAGATAAAGAGGGGCGCGAACTTTTTGT
+ACGTCGTATGCCTACTTTTTTTGAAACATTTCCGGTTGTTTTGGTAGACGGAGACGGAAT
+TGTTAGAGCCGATGTTCCTTTTAGAAGGGCAGAATCAAAATATAGTGTCGAAC
+>ds2020-328_561
+GGTCGGGATAGACGTGGATTCGCCCTACTAGCTCACTCAATCTGCTGTAATATTCAGGTT
+CCGATGTACATTGAGCAGCCAACTGCCTCCCGATCTTCCGCTCAACCAATGTCCACACCT
+TGCTTTGCTTGAAGTTGTCTCTTTGGCTGTTCGGTCCTTGTTTTTTAACCATTTAGATGT
+ATCGTTTTTTGTTCTCTTTTTTCGCTCGCCCTACAATGGCGTCGATCACGCCC
+>ds2020-328_562
+GGTCGGGATAGACGCCGGGCTGTGGTGTCTTGGTGTGACCAATTGAGGGTGTTGTGCCAT
+GATTCTATTGGTGGGTTTTGGTCACATTGTGGTTGGAATTCAACCCTAGAAGCTGTTTAT
+GCTGGTGTTCCAATTCTCACTTACCCTATATTAGGGGATCAAATGCTCAACGCTGAGAAA
+ATTGTGGAAGATTGGAAGATTGGATACAGGGTGCTGACTCGTCTATCCCGACC
+>ds2020-328_563
+GGTCGGGATAGACGTGTAAAGGGGCTGCTTTCGAGATGCTTTCAACCATTGCGCTGCAAC
+CTAAGCCATCATTTCAAGAGGGGGTGGTATGGCAAGAGACATCGCTTCAAGTCAATTTAG
+CACGTTTTACACCAACGAGAGCCAGAGTTCCCGCTAACTTGGAAGGAGATGCTTACCGCT
+TAGAAAGCGAGTCAACAAATTCAATCAAACAACATAAGACCGTCTTCCCGACC
+>ds2020-328_564
+AGAAACATGAGCTTGTGATATAGCTACACCTAATTCCGGACCGGTTAATGCAAGAACTAT
+AAATAAAGGACCAGGATCTCCTATAAAAAATAAAAGATCATTCATACATAGCATAGTCCA
+AGCGAACCCACTTAAAATCTTTACTGAACTATGACCGGCCATCATATTAGCAAATAAACG
+TATTCCTGAGCTTAATGCGCGAAAACAATGAAGCGCATCGTCTATCCCGACC
+>ds2020-328_565
+GGTCGGGATAGACGGGCGGTTCCTAGTCCGCTTTGGCTCCTGATCTTGAGCTCGCTTTTG
+TTCAATTATAAATAAAAAACCGCTTTGATGGAGATTTGTAGCATCATTCAAGTAAATACA
+GATTAAGATCGTAAAAACATAAGCTTGTAATATAGCCACACCTAATTCCGGACCGGTTAA
+TGCAAGCGCTACGTGCCCTTTTTTAAAAGTGCTACCAGCGTCTATCCCGACC
+>ds2020-328_566
+GGTCGGGATAGACGTCGAGGCTGTATCATGTAACAAAACGATACAAATAGAAGGAATGGA
+AAAAGAGGAAATCGGAGAGATATTCAGGAGCTCACTGGGACCTGAGAACATAGTTAAACC
+GACAGATGGTGATGGCACAGCAGAAGTTAAAGCAGTGCAAAAAGGAAGAAAGAAAGATCA
+GGGACATAAAGAACGGAGTGGTGAAGAGCCTATGGTCAAATTTCAAGATAGT
+>ds2020-328_567
+TGAATTACGGCGGTCGGGATAGACGCATGGTGTGCTTGGTCACCGGTGGAAGTGGCTTGG
+TCACCGGTGGAAGTGGCTTGGTCACCGGTGTAGGTGGCGGTGCATGTATAATAGGAGGCT
+GAGTGCTTGGTGGTTTGCCATAAGGTGAAGATGGTGGTGGCCTCACCACTCTAGGAGGCA
+GAGTTGGTGGTTTGGGTTTGGGCACTATTGGTTAGGGCCGTCTATCCCGACC
+>ds2020-328_568
+AATACACAGCAACGGCCGCCACTACTGTACCTTGTATAGTCCAAGCTCTTCCAAAGTTGA
+TCCATAAAAAGGTAATTTCTCTCCCTCCACCGTGATTTCTAATGGTATTGTCCTGGTTTT
+CTCTGTACTTGGATCTATGAAACCCTCTGCTGGTCCTTCAGGATCACCAGTTTGTACAAC
+AAAACCATCCGCTCTTTGGATTTCCATGCCATCATAAAAGTGTCTATCCACC
+>ds2020-328_569
+GGTCGGGATAGACGGTGATGGCCTTTTCACAAGAGAGATTGGAGAGGAAGAGGAACTTGT
+TCCACGTTCCTAAGAACAGTGGGACAGCAATCAACCGCGCGAAAAGGGATAGGAGCAACA
+TAAAATTGTGGGATGCATCTGAGGGTGGTTCCGTGGTGGAAGGAAAGGACATACGAGTAG
+GTGAATTGTCCGACATATCTAATCTGTTCACCAGCCGATACACTGGTGGTAT
+>ds2020-328_570
+GGTCGGGATAGACGTCTCCATGTGCTGCACGCAGTTAGCCGCTTAAGGCTCATGGATCAT
+AACAACAGTGTTAATCAGGGTGATCCGCAGGAGGGAATGACCAGTGATGTGGTCATGGAA
+ATATTTGAACGGCTCTTCCGCGCAACGGGGGGAGCCGCTTCGCATTGGGACGTTTTGAAG
+GGAGCGTCAAGTCTTAAATTCCTTCGAGAGGCTGGAATCGTCTATCCCGACC
+>ds2020-328_571
+GGTCGGGATAGACGAATCTGGCTATTTATGGGCCAAACCAAGTCTTAAACTCTTATCGTA
+GAGATGGACGAGCATATGTTTTCAATTCCAAACCCGAGTCGGTAGGGCATACGGCACTGT
+TATTCAAAATGTGCGAATCTTATCCTCCAAGAGAATTTAGGTCGCATGTAAGCATACCAT
+CGGACGGGGATGAGATATTTATGGTAGCACAACGTCTATCCCGACCGCCGT
+>ds2020-328_572
+GGTCGGTATAGACGAACACCCCGCCTATTGAGAGCGAACTTAAAGAAGTTGATACTAATC
+AACAAATTAGGCCAAATCCCAAAACGAAATATTTAAATAACGTAGAAATTTAAGGACCAG
+ATATGCATAACTCCTCAAGACATCCGCCAGTCTTATAAAAACCACATGGCTCATAGAATT
+ACAAAACATTAATGCGTCTATCCCGACCGCCGGAATTCGTCTATCCCGACC
+>ds2020-328_573
+GGTCGGGATAGACGCAGGTTTGCTCTGGACTCCACATAAGCAGTTGTCGATATGCCTTTA
+TAGTATGACACATAACCCTGGAATATCTTGCCTAGGTTTTTAAGCACACCGGTATCATTG
+ACTAACTGGAACTGCCTCCTATCCAATTTGGCCATAGCTAGCGCGCACTTACCTAATTCT
+AGATCGTTTACATCATAATGAACCACATCGCCAGTCCCGTCTATCCCGACC
+>ds2020-328_574
+TGCCCTTGTTTCCAGCTTGGGAATGAGAGTGAGTAAGTAATTCCATGCTAGTACCTGTAA
+GCAAGCGTTTTAGGCAAACCTGTATACCCTCTTACCAGGGCTATACATAGGTAGAGAACG
+GCTCCATCTACATCCAGAGAGCTGCCTTTCGCGGTTAGAAAAGGAGGTGAAACTGCTTTT
+CTAACACAGGACAGGATACGGCCCATCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_575
+GGTCGGGATAGACGTACGTCTGGCATGAGTATGGGTGTATTAATGAAATACCACACCATG
+GCGTCCCAAACATTCTTCCACTTTTGCTTCTCAACCTGATCTGTCACAGGTTTTCCATTG
+AAGGAAGAGAAGTTCACGTTCTGTTTCAACACGTCAAACGCGACGCGTATCAACCACGCT
+GGTACTTTCGTATCAAAAGCGGAAAAATCTATGACCACGTCTATCCCGACC
+>ds2020-328_576
+GGTCGGGATAGACGACCCATCCACCTCTGCATCTTTCATATCCTCCAGCACCTCCTCTTT
+CATATCCACCAGCACCTCTTTCATATCCTCCAGCACCTCCTCTTTCATACCCACCAGAAC
+CTCCTCCTCTTTCATACCCACCAGCACCATTTCCCCTTTCATACCCACCAGCACCATTTC
+CCCTTTCATACCCACCACCACCATTCCCTTTTACCGTCTATCCCGACCGCC
+>ds2020-328_577
+GGTCGGGATAGACGGAGTTGCGGCATGGACTTAGAGTGATTTGGTCATTGGACTACGCAG
+TCCAGTTCCAACTCCATTTCAAGCCAATCATGGTTTAGTGGTGTATCTATCTATTAAAAT
+GTTATGAGTTCCGGTGTGCACGATTGGGCTAAGCAATATGAATGCCCCTTACTAAATGCA
+TATTGGAAAATTGCTAAACCTATCCAGCATGACTGAACGTCTATCCCGACC
+>ds2020-328_578
+GGGCGGGATAGACGTTGACTTCTCATCGAGATTGGGTTGGTGCTTAGATCGATTCAAGCG
+GATCGAACTTTATCTTCTATAAGGGGATTGGTTCATATCAATCAGAAGTGCATTCAGTTA
+TCTCTTTTTTCTTTTTCTTCTCGTCAGTTAGCTCTGCCGAATGCCTAAAAGGATTCCATT
+CTTTCTGGCGGATCTAGTTCTTATAAGGCAGAGATGCGTCTATCCCGACC
+>ds2020-328_579
+GGTCGGGATAGACGTTTAACTGGCCTTGTGGTCATATGGATGAAGACATCCCTAACTTCT
+ATCACGGAAATGATTACATTCCACAATCACACGGTGACTACATAGATATATCGCCACTTA
+GCGACAAGGAATCAAGGTTCGTGTTGCTGATGCTTGGTAGGTGGAAAAGGACGACAAGAT
+ACATGTTGGACTTTGATTTACCGAAGTTAGCGACGGCGTCTATCCCGACC
+>ds2020-328_580
+AAGCAAGGCCTCTTTTAGATTGACTGTTGGCAGATCGAGATTGAACAACGAAGTGCTTTC
+ACCTCTTGTAGTAGATCCGTTCATCAAACGAGACTCGGAAAGAGTGGCGTTAAAGAGGAC
+TGGGGCGCCTCTCGAAGTCTCCGATCTCACAGATGGTTAGGCTGCAATTCCTTCGCTTGT
+GAAGAAGCTTGGCTAGTTCTCCTTACTTGGAAATTACGTCTATCCCGACC
+>ds2020-328_581
+GGTCGGGATAGACGAAATGGCTGGTTCTTCTTGATCTTGAGGTCATGGGCTAACTCGACC
+GTAGGGAGAGGGGTTCAAGATGCCCTCGTCTAAGTCTGTCTATTTCGTTCTTTGCTTTAG
+GAGCTCGTAGGTCTCAAGGGTTGTTTTCCAACTCGACCGGAGGACTTGAGATGTCGCTAA
+GGGAACGTCTTCCGGATCGATCGAAGGGGAGGTGATACTAGGTCCACGGC
+>ds2020-328_582
+GGTCGGGATAGACGCACAATCGGAGTTTCCTTAGGCAGCCACCGACCTACAGTTATCCTT
+AAACTTCCGTGCTTGGTGGAGAAGAAGCGAACAAAGGTACGCTCGCTTGCTGTCTTGTTC
+TCTGCCGCGAACTGGGATCGCTCGCCAGCTAGGTCAGATTGGAGCAACTTATTTTTTGAG
+AACATATTACCCATATTCGGGGACAAGGGGCGGACCCGTCTATCCCGACC
+>ds2020-328_583
+GGTCGGGATAGACGAGAGGTCCCCATCGGACGGCAGCCCTTTCGGGGGTTCCTTAGGGAC
+CGATTCACTCTGCGTAGATTGACTGAACGCAGAAAGCCTTCCACTGGCAGGCGATCGTGT
+TTTTCACAGGATTTATCGTTACTCATGTCAGCATTCTCACTTCTGATATCTCCAGGTGTT
+GTCACCAAAAACCTTCCCCGATTGACAGAACTTCCACGTCTATCCCTCCC
+>ds2020-328_584
+GGTCGGGATAGACGACCACTGTGCCTGCCAGACTCGTCATATTATGATAGGGATTATCGA
+TCGATTTATTTGGCTTTAAGTGACAAGGCCCCCTTTCTCCAAAAAAAACAACAAGCAGCC
+TCTTAGGCAATCCCCTCCCCCGAGGTAGCTGCTTGCCGATGGCATTGCGATAGATCGGTG
+GTTGACTTACTGGTTTGTGACTCCCACTGCACTCCCACGTCTATCCGACC
+>ds2020-328_585
+TGAATTCGGCGGTCGGGATAGACGCAGCTGGCCTCTGGTCGGGATAGACGAACCTGCCCC
+CTGGTCGGGATAGACGACCAAGTGCCATCATTCGTCTATTCGGACAGAGAGCCGTGGACC
+TAGTTTTAAACCCCTTTGCAACTAGGCCACGGCCCCCGAACATTACTAGGTCCACGGCAG
+ATGGTTGAGGACTAGGTCCGCGGCAGAGAAGGGCCCACTAGGTCCACGGC
+>ds2020-328_586
+GGTCGGGATAGACGACCCACAGGACTCGAAGTAAGGAGAGAGGGTAAAAAACAATAAGCG
+GTAAGTGAGCCAGCAAACAAAGCCGTAGAAAGTGTTAAACATTCAGAGAGGTTCTATGTG
+TCAATGCATGAAGCCGGCGAGTATGATATGGACATGAGAGATAATAAATACCAGACATCT
+ATACCAACATTCCTTGATGAAAACATGGCTACCTTTCGTCTATCCCGACC
+>ds2020-328_587
+GGTCGGGATAGACGTGGATGTGGGGCAGGAGAGGATAATCGAGTTAGTTACGCCGACGGA
+GAAATCCATGTTGGAAGTAGCTCCACAGATTGTAGTGTACTTAGCAGCATAGTCGCGAAG
+GAGGGTCTGATACCAGTCATTGGCACGGGTAGGGGTGCCAGTCATGTCAGGCATCTTTCC
+AACCATTAGGGTTGAAAGACCAGTAACTGACATTAGCGTCTATCCCGACC
+>ds2020-328_588
+GGTCGGGATAGACGCTACAATCCCCTGGTCGGGATAGACGAACATCATCTCTGGTCGGGA
+TAGACGTTTGAAGGGGTTGTTGACGTCTATCCCGACTCGGACAAGAGCCGTGGACCTAGT
+GATCATCGCCTGCCGTGGACCTAGTAAATCCTTGCCTGCGTGGACCTAGTTCAGTATCGG
+GTATCTACTAGGCCACGGAACGCTAATGAGACTAGGTCCACGGCCTCTGT
+>ds2020-328_589
+GGTCGGGATAGACGTGCTTGTTGGGTGAAGGGATTCAGAAGACCGAGTGAAGCGACTAAA
+GCGACGACCATACATAGAGCTGGAAGCTGCACTAGTGGACGAAGAAGTAACTAAAGCCTG
+AACTGGATGTGGAGACGAAACTGTACAGGAAGAAGAATCGCCCTACTTTATTACATTACG
+GCCTTTCCCTCTTGGAATGAGCATAGCACTATACACCGTCTATCCCGACC
+>ds2020-328_590
+GATCTAATACACAGCAACGGCCGCCACTACTGATCTTCATCGAGGAGGAATGTGGTGGTA
+GTGGAATAGAGAGCAGACCAGGACTTGAAGGGTCGATTGGGGTGTTGGTGAGCTGAGATG
+AAGTAGAGGGTGTCGTTTTTGAGGATGGGGCGGTCGTGGAAGAGGCTTCCGGGTTCGGAG
+TGTAAGAGTTTGGGGGTGGGGAGTTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_591
+GGTCGGGATAGACGCGAGGATGCAATTGGCTAAGGGGTCAGGGTTGTTCTCTCTAGCAAG
+CGTTAAGGATTACAAGAGGGAGGCTAAGCGTATAAGCGTCGAGGCAAAGTCTCTGCAAAA
+CCTGGTTGATGTGGATTTGAGGAAGTTCTTTGAATTGGAAGTGCTGGTAAATAGGGTGGA
+CGGTCTTGTCAATTGGGAAGAGGAGCACAAAACGGCGTCTATCCCGACC
+>ds2020-328_592
+GTGCACAGAATCCGAGCAGTACCTTAGGGGCAGGGTTTACCAGTATGAAATAATGCCGGT
+GGTCACACCAGAGGATATGCAGATACTTCTTGATCTGAAGCGCGTGCAAAATTGGGCGGG
+CTCTGTTTATATCGACCAGAGCATCGAGGAAAATAATGGTGTTATTTTGCGAATGGCAGC
+TGGAGCCGGAATCAATGTCTATGAGGGGCCAACGACGTCTATCCCGACC
+>ds2020-328_593
+GGGCGGGATAGACGATCACCTCCTTTCAGTGGGTGTAGTAACATTATTAATTCGGCCATC
+CCATCCTCTTGGTCAAACACTTTGTCAACGTAAGATATTACTTGTCTTCTTACACACTGT
+GACACTTCTACTGAGCCTCCTCTAGCTATTATTTCGTCAAATCTATTGTTCATTGATCTG
+ATCAATTCCCTATAATCGTTTGCAGGTGCCAGATACGTCTATCCCGACC
+>ds2020-328_594
+GGTCGGGGTAGACGCCAAGAAACACTTTGTCGGCTGAAATCTTATGTTAAACAATTCTGC
+ATTCTTCATTAGTAAATTGACTTGGCTCATAGACTGTACAGCTGCCAGGACGTCATCTCC
+GTTATGTAAACTAACAATAGTCTGGTTGGGTAAGCATTCTGAGATATAAATCTTATTTAA
+TAGAGTATTCATAAATGTAGTTAACCGCCTTCCTCCGTCTATCCCGACC
+>ds2020-328_595
+GGTCGGGATAGACGTTTCGCCAAGGTAATCATCTTTAACCATAAGTGGCCACGTCGAAGA
+TGATTCGTTAGGTGCGTAAGGTCGGGTCGCGTTTTCTAGCGCCATCGGGGTTTTAATTGT
+TAGGTCGTACCCACACAGCCTGCTAGCCCAGGCCCAGTGCCATAACTGATATGGCGTCGC
+TTTCCATCCTAATCTATTGCGTTGTAGCTTAGCTGCGTCTATCCCGACC
+>ds2020-328_596
+GGTCGGGATAGACGCTAGTACCTCTTTGCCCAAGGATTGCGAATATGCTTGACTGAGATT
+CCAAGCAAGCTACCTGGGCCTAAAAGACTGCTTCTTGAGCACATGAATATTCAATTGCTC
+CCGAGCCTTCGAGAAAGCCCATCCTCTTTCAATGCCATCTGACCCATCTGTTCAACCCCC
+ACTTCCGGATATTCTAATTCTGTATTTCCGCCCGACGTCTATCCCGACC
+>ds2020-328_597
+GTTCTGGATAGACGGTAGCTGCTTTATCTGTTTTTGGTTTTATTGTTTGTGGCTTTGTTT
+GTTTCTATAATATTGCCTTTCCTAGTGAGTTTTACGGGCCCACTGGACCAGAAGCTTCTC
+AAGCTCAAGCATTTACTTTTTTGGTTAGAGACCAACGTCTTGGGGCTAACGTAGGATCTG
+CTCAAGGACCTACCGGTTTAGGTAAATATCGAATGCGCCTATCCCGACC
+>ds2020-328_598
+GGTCGGATAGACGGGAGGGGGCGGTGAGGAAGGGTCTTTCGAATCTCGATCAAATAGCAT
+AGCACGGGACCGTGCCAAGCTGTAAGCATAGCGAGTTAGGTATGGGCTTTCTTTTAACTA
+CCAGAATCAGCAGTTGGCCTGTTGTTGATCAAAGTCTGGGTCGGCGGTCCCTAGTTATAG
+ATTGGCTTTCGCCTTCCTTTTTCCGTCCAACGCAACGTCTATCCCGACC
+>ds2020-328_599
+TGAATTACGGCGGTCGGGATAGACGTCTCACGGACCTGATAGACGAGCAGCACCAATACG
+CGTCTATCCCGACCAGCCCAAATACGTCTTGAAATAACTCCGGCTTAATCCCCAAAACAC
+CAAACCCAACACCAAATGGAACTCAAATTCACAAAACTATCCTTACATACGATCTGAAAT
+ACCAATGTGCTTGAATTCTCTGAACCAAAATCACACAAACCACATTTCT
+>ds2020-328_600
+GGTGGGGATAGACGTTTTGGTTCCTTCTAAAGGCCGCGCCCTCTCCCGCCCAATTGATGG
+TTCCCTGCTTGTTGAAGCGGGATACCCTACTGCTCATGCCTTGGCTGAGGATTTTGTTGG
+ACTTTCTAAGAAGTACACTAATTTCTATGCCACGTCCGAGTACGCGTCCCTGGCTGACCT
+GGTTGAACACCTCATCCATGGTTTAGCTCCAACCTCCGTATATCCCGAC
+>ds2020-328_601
+GGTCGGGATAGACGTTGGCGCTTAATTAGCTACCAAAACGCAGAAATTTCTCAAACCTAA
+CACAACCAGCAGCTAGAGCTCAAAGAGTAGATGAATTTACATACCTTATGCGTCCAAATC
+GGTTGAGAAACGAATGAGAACGAATGCTCCAAAGTTCTGTCAAAATCCGGCGAATTTTCT
+GCATTTTCCTGCGAATATCGAGGAGTCCAGTGGGCCGTCTATCCCGACC
+>ds2020-328_602
+TGTCGGGATAGACGCGTAGTTGCATTGACAATATATCTACTTTTCAATCCTTTCTCGTCC
+GGCTTTATAAATGCTTTCAAAACATCAGATTTGATTGTATCTAAACTAACCATCCTCAAA
+ACCTCCGCATCACTCAGCGTAATTGCAGCACCCAACTTTGTTCTCATCTTATCTCCGTCA
+ACCAACAACTTAGAGTGAGAGCTAGCACCCAGAGTCGTCTATCCCGACC
+>ds2020-328_603
+GGTCGGGATAGACGGGGACTCACTCTCTCCAATTTAGTGTCCTTTTTATGTGCCCTGCGT
+AAATGGCTGATAAGTATCCTACTACTTAACCTTAATATAATATTGTTAACTTAATAAAAT
+AAAAAACTGAAAAGCTAAAAATTGAAAAACACAAAAACACTAAATCATAGCAGCCACCAT
+TACCAAGTCCCTCCGCCCAGCCAACGCAAAACCCCCGTCTATCCCGACC
+>ds2020-328_604
+GGTCGGGATAGACGAGGGGAAGGGGTCAGATTTATCCCGACGGGAGCAAGAGTAACAATA
+ATGTTTATAATGCTACAGCAGCAGGTATAGTAAGCAAAATCATACGAAAAGAAAAAGGGG
+GGTACGAAATAACCATAGCGGGTGCATCGGATGGACGTCGAGTGGTTGATATTATCCCTA
+CAGCACCGGAACTTCTTGTTTCAGAGGGCGATTACGTCTATCCCGACC
+>ds2020-328_605
+GGTCGGGATAGACGCTCCTGGGTGCTTTTGGGAGTCCAATAATCCCAGAAGAGCGAAAGG
+CGTGATGTACTTCAGGAACGTCTGGGACTCAGCGAAGGCAAGAGCCCCCGGCGATAATAA
+CAGTCTGAAAAGGTGTTTAAATCATTGCACGCTGGCAGACTTTATAAATGTAGTGATAGA
+CATTTCGGTGGAGAACCTCAGGATCAGGTTACGGCGTCTATCCCGACC
+>ds2020-328_606
+GGTCGGGATAGACGGCCCAACGACCTCATTCTCCTTTTCCTTCATGACAACTTTCTCCTT
+CATGGCAGGAACAGCAGCAGCAACATTCTCCTTCTTAATAAACAGTACAATTATAAAACC
+CCAAGCTATCATAATCTCAATAATCATTTGAATTTATAAACCGAAAGTTTGAGATGAGAT
+AAAATGATGCATACATAAATTCAATAGATATAAGCGTCTATCCCGACC
+>ds2020-328_607
+GGTCGGGATAGACGGTAGCAGCGGGTTGAGCTGTCTCAGGATGCCCTTCAGGAGAGCGAC
+CCACATGGGGGTAGTTCACGGGCCGGCCGCTGAAAGTGATGAGAATTTCACGTTCTCATG
+TGTGATCATAAGCGCTGAAACGATAGTGACCGACTTTGTGAGAGGAGGGCGGCTGGTGAC
+ATATCGAAGAGACAGGACGTGCAAGGCAGTGGCGCGTCTATCCCGACC
+>ds2020-328_608
+GTTTGGACATCTAGCTTGATGCTATCCAGTGCGGAGTTGAGGGCTCCCTGGAATTGGCCT
+TGAAGTTCTTCCACCATAACTTCGAAGCCCCCCTTTGTAAGGACATCCTCCTCGAGTCTT
+TGATCGAACTCGATCACGGCTCTCTCCATCTTAGAAAGCCGATTCTCCATGGTTGCTGCA
+TCTCTAGATCGTTCCCTCTTTGATTTGCCGCCCACGTCTATCCCGACC
+>ds2020-328_609
+GGTCGGATAGACGTCAAAAGTGGCTCAGGTGGTGACTGCATTACTGGTGGTTGGTGTTAC
+GGATTACACTATTGTGAAGGCTGAAACGGCGGACTCCCCTGCTACATTACAATACCTTGC
+TCCTTATACAGGAGCAGCTCTGGCTGAATATTTTATGTATCGTGAACAACACACTTTAAT
+CATTTATGACGATCCCTCCAAACAAGCGCAGTTCCGTCTATCCCGACC
+>ds2020-328_610
+CAACTAGTGCTCCGACTGAAAGGTCGGGGGGTACAACACCGAAAGGCGTGCTAAACCTTA
+AGGTGGCGTTCATCATGGTAGAGCCTAGTCATGGTTAAGAAACCGAGGATTGGAACGGGT
+GGAAATTAGTGGCGGCCGTTGCTGTGTATTAGAATTACGGCGGTCGGGATAGACGTAATA
+GCACCTGGTCGGGATCGACGAGAGGGGGGCTTTCCGTCTATCCCGACC
+>ds2020-328_611
+GGTCGGGATAGACGCCCGGAGCCCAGGTATCATATACACCCCCAAAATAAAGCGCCTTGA
+ATACTAGAAGAAAAGCACCTATACCTAACAAGATTAAGTGAATACCCAAAATTGTAGTCA
+TTTTGTTTCTATCTTTCCAGACATAACCGAAGAATGGAAAAGATTCTTCAAGAGTCTCGG
+GTCCCAGAAGTGCATGATAAATCCCGCCTAGATACGTCTATCCCGACC
+>ds2020-328_612
+GGTCGGGATAGACGGTGCGGTGGGATGGGAGAACTCACTGGCATGAATGCCCCTGCTTCA
+TCGAGTGGGATACGACCCCCGTTTGATCTTAACATGGCTCCGGACCCGGAGCCGGAACCT
+TCCTCTTCACCCGGCCTAAAAAATAGAATTCTCGAGGCGGAGTTAGAAGAGGCCCAGAAA
+GAACTTCGCTTCTGGCAAGAGAAGGGAAGGCGTTCGTCTATCCCGACC
+>ds2020-328_613
+AACCGCCGCCACTACGTTTATCAATTGTTAAAGGCGATAACCCAGCCCACGCAGGACGCC
+CCCCAAGCTGGAAATTCATCATGGTTTCAGATAGGAGCGCACGGCTAATGTCTCCCATCA
+GTGGGGCAGTATGGGAGCCTGGCGCTCTAGTGGCGGCCGTTGCTGTTGATAGACGAACCA
+GCACCATGCGTCTATCCCGACCAGTGAATCTTTTCGTCTATCCCGACC
+>ds2020-328_614
+GGTCGGGATAGACGTCACCTCCCCATCCCGGTTCAGGAATTTTAACCCGATTCCCTTTCG
+AAGTTCGCGCGAGACGCGCTATCAGACGGGCTTCCCCCGTCTCTTAGGATCGACTAACCC
+ATGTGCAAGTGCCGTTCACATGGAACCTTTCCCCTCTTCGGCCTTCAAAGTTCTCATTTG
+AATATTTGCTACTACCACCATAGATCGTCTATCCGACCGCCGTATTC
+>ds2020-328_615
+GGTCGGGATGGACGAAGAAGGGCATTTTAAAAAAGAAAGAGATAGGTTCGTGCGTGCAGC
+CGTATACGAAAGTACGCTTCCTCTTCTTTCGAATGCTAATGTGTGGTTTTGTCCTACTTC
+CAAAGTCACAGAGGGAGCTGGAGCCGATTTTTTGTTTGACTACCCTCAATCGACGGATGG
+TGCTAAAGGAGTTGGGAGAAGAGTCCACAGGCGCGTCTATCCCGACC
+>ds2020-328_616
+GGTCGGGATAGAGGATGGCCGGCTTTGTTTCTCAGAATTAACTCACCCTCTACGCGCCTT
+AGCCATATGAGCTAAATGGGTTGCTCGGAAATCTTGCCTTTCCTTACTCTTAGGGCTTTC
+CTCCCTATCTTCAGGCAGCACACCGCCATCGGTTTCTGAATCAACGCTTACTATAGATCC
+TGACCTTTTCTCCGACGACACACCCACCTTAACCGTCTATCCCGACC
+>ds2020-328_617
+ATCTGCCTGGTTTCGGGTCTATACCCAGCAACTAAACGCCCTATTAAGACTCGATTTCTC
+TACGGCTCCCCTATACGGTTAACCTCGCTACTGAATATAAGTCGCTGACCCATTATACAA
+AAGGTACGCAGTCACACCACGAAGGTGCTACCACTGCTTGTATGCATGCGGTTTCAGGAT
+CTATTTCACTCCCCTCACAGGGGTTCTTTTCGCCTTTCCCTCACGGT
+>ds2020-328_618
+GCCGTGGACCTAGTTTTAACACTCTGCCGTGGACCTAGTATTCTATCTCGTGCCGTGGAC
+CTAGTCATTGAAAACTAGGTTCGGGATAGACGTAAAGGTCGCCTGGTCGGGATAGACGAG
+TTATAGGGGTGGTCGGGATAGACGTTATAACGCCCTGGTCGGGATAGACGCTGTACGCCT
+GGTCGGGATAAACAGGAATCCCCGTCTATCCCGACCGACGTAATTCA
+>ds2020-328_619
+GGTCGGGATAGACGCGTAACTGTCATCGATCTTTTCTTCTTTCTTCAATCGGTCATATCT
+GATCCGTAGCTGGTAGCGACATGAGGAAAAGGTCCAGAATAGTCTATTTTATTTGCTAAA
+TCGCGAGTTTAAGGGGTCGGATGGGTCAAGTATGGCCTCTAAAAACATGCGATAATCGGC
+TTTTTTAGTAGCATCTGTCCTACCCGCCCTGATCGTCTATCCCGACC
+>ds2020-328_620
+GGTCGGGATAGACGCTTGCCACTCCTGGTCGGGATAGACGTTGTTTTTCGCTGGTCGGGA
+TAGACTAGGTGATTGTTACGTCTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGG
+ACCTAGTTATATCGTACCTGCCGTGGACCTAGTTAGCCTGGTTGTGCCGTGGACCTAGTG
+AAGTCAATGCTGCCGTGGACCAACTTAGCCCCCACGAGCGCCACGGC
+>ds2020-328_621
+GAGAGCCGTGGACCTAGTGAGGTTGTTGCTGCGGTGGACCTAGTATCCGAGGGGGTTGAA
+AACTAGGTCCACGGCAGCGGGTTTGAGACTAGGTCCACGGCAGGCAGCAGATCACTAGGT
+CCACGGCTCTCTGTCCGTGGATAGACGACACCCCAATCTGTTCGTCTATCCCGACCAAGG
+GTAATCTCCGTCTATCCCGACCAGGCACATGTTACGTCTATCCGACC
+>ds2020-328_622
+GGTCGGGATAGACGGGACCCTCGAATCTCTGGGATTGGCATGTAATAGAAGGATTGGGAT
+ACTCGAAACAACGCGGCACTGTCATCGGTAAAATAACGTCTAATAGATAGACCTGGAAAT
+CGATGCTTTCTGGCTCCTCACTTCCGGTCGGTGTGCCTCCCCTTTTTGTTTTATTTGATT
+CACAAGCAGGAATTGAACCAGAATCTCCGGTTACGTCTATCCCGACC
+>ds2020-328_623
+GGTCGGGATAGACGGCGCCACCTGCTATCTCGCCTTTCTGATTATTATTATCAAGAACAT
+TGGCTTCTTCCTCATTTATAGCAGCATTAACTCGTTGCACTTCATGGTCATCCAGACTAG
+GCGCAACCGAAAACCTCCCAATCACACGCTGTTCTTGATTTTTTGTTTTGATCTGTTTGT
+GTGACTGGCTTTACACTCTCAGCAGCTTTCAACGTCTATCCCGACC
+>ds2020-328_624
+GGTCGGGATAGACGGTGAAATGTGCATTGGTTTTGTTGCATTTCATGTAACAGGATTGTA
+TGGTCCTGGAATATGGGTGTCCGATCCTTATGGACTAACGGGAAGGGTACAATCCGTAAA
+TCCAGCGTGGGGTGTGGAGGGTTTTGATCCTTTTGTTCCGGGAGGAATAGCCTCTCATCA
+TATTGCAGCAGGGACATAGCATAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_625
+GGTCGGGATAGACGGCCGCCCGCCATACTGAGCGTCTCATGCAGTACACTACCTACAAGA
+CTAGTAGACCTGATGAAGTTCATGAACCGAACTTTTGTGAAAACACATTCCAGGACTGCT
+CCTTGCAAGGTAAGTATGCCATGGCAATCCATTCCACTTCGGATTTACCCTTAGGTGAGC
+TCTGTGAGAGCTTAAGGAAGAAGGGAGTGATTCGTCTATCCCGACC
+>ds2020-328_626
+AGGAATACCTAGTGGTGGACGAAGAACCATTGGCTATAGTTCCTTTGGGGATAGACGTGG
+TTGATGATTATCCACACACAGACCCAATGGTCTGTATACCCTTGAACCTCGACTCCTGCA
+TTGTCCAGCCACACCCCCACCTACAAAGACCCTCTAGCCTCGTTGGAGATGTTGACTACA
+TGGTTCATTGGCAATACCCTAATTCCGCCGTTCGTCTATCCCGACC
+>ds2020-328_627
+GGTCGGGATAGACGCGTGCCCAGCCTCCGTTTCACGGAATAAGTAAAATAACGTTAAAAG
+TAGTGGTATTTCAATTTCGCCGAAGCTCCCACTTATACTACACCTCTCAAGTCATTTCAC
+AAAGTCGGACTAGAGTCAAGCTCAACAGGGTCTTCTTTCCCCGCTGATTCTGCCAAGCCC
+GTTCCCTTGGCTGTGGATTCGCTAGGTAGGTGCTAGGGACAGTGGG
+>ds2020-328_628
+GGTCGGGATAGACGTGTTGGGTCAGCATCTCCGAACCTTGGCGAGGAATCTTTCCTATCT
+GGCTCAAGATCCTCTTAGTCAATCCATTTGAAATGGAACTTCTAGCCACTGGGTCAACGT
+TAACTCCACAAAGATTTTCGAGTTAGCTTCTGCTTACCTGCATTAGAAGTAAAGTCTTGG
+TACCAGTTACATACTTTTCTACCGTACTGATTCGTCTATCCCGACC
+>ds2020-328_629
+GGCGCCCTTTTTGTAAGAATTTGGGCATGAGCGACTTAGTGGTTAGCCGAGCTAGTTACT
+CACTCCATGGCATGATGGGAAAAGCCCCCTTCTGATGGTTGAGCGGGTAAAGCCCTTATG
+AAAAGAGTGAACCGGGCGTAGCGTAGAGGCTGCTAAGAGAGCTTTAAACCTCTATCTTAC
+ACCTGGCAGGAGATGTAAATACTTACTTTCGGGTTATTGGCCTCTG
+>ds2020-328_630
+CTGCCGTGGACCTAGTACTAGCCCAGGTCCGTGGACCTAGTAACCCACATCTTACTAGAG
+CGGGCATACTACTAGGTCCACGGCAAGCGACGAAATACTAGGTCCACGGCAGGGGAAATG
+TAACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGATAGACGTTTTAGATGG
+TTGGCTCGTCTATCCCGACCAGTGTCAGTGGTCGTCTATCCCGACC
+>ds2020-328_631
+GGTCGGGATAGACGCTGCATGTGCCTCTTCAACGCTTAGCTGTCTGTTAACCTCCCGCTC
+AGGGTACCTATCACGGAATAAAGCTGAAGGCGAAGTCGGAATCTCAATGTCAACGCTTTC
+GTAAAGCCTATTGAAATGACGTGTCATGATCAGAATAGGTTCAGGTGCTAGCGAAACTAG
+ATATTGATCGATCTTTGCAAAAATGTAATCTCCGTCTATCCCGACC
+>ds2020-328_632
+GGTCGGGATAGACGGAAATCTGCCCTGATCGTTTTCGGAAAGCGCCTTCTCCTTTTTGGT
+TGGTTTAAGGGGCGAGAGGGGGCGTGGAACTACTACTACGATTCTCATTATTCTCATTTC
+GCTTTCTACTAAAAAGAGGAACACGGAAAAAAAGGTTAAAAAAAAAGTGCAAAGAGGCGA
+TTCATGACTCCAGCATAAAAAACAGCACGATCGTCTATCCCGACC
+>ds2020-328_633
+GGTCGGGATAGACGGTGTTCCGTTTTAAGCATGTAGGCGGAGGTTCCAGGTAAATCCGGT
+ACCTTTTAACGCTGAGGTGTGATGACGAGGCACTACGGTGCTGAAGCAACAAATGCCCTG
+CTTCCAGGAAAAGCCTCTAAGCATCAGGTAACATCAAATCGTACCCCAAACCGACACAGG
+TGGTCAGGTAGAGCATACCAAGGCACCCGGGCGTCTATCCCGACC
+>ds2020-328_634
+GGGCGGGATAGACGTCCCATTACTCTTTCTACTCCTTCAAAATCGTTTAAAGACGCAAAG
+CTCTGCATCCAGATGTTATACGTAAATGTGTCCAGAGGGATGTTCCTCTGCTTCATTTCT
+TGCACTAAAGGAGCCACTTTCTCTGGTTGCTGCTTTCTCATATGCATAGACATGAGATTG
+TTAAAGACCAAAGAAGAGGAGTCTAAGTCGCCGTCTATCCCGACC
+>ds2020-328_635
+GGTAGGGATAGACGCAAAACCTCTATCATTATCGGCGAACCGAGAAAAGAGTCGGCGAAT
+CGTTAACTGCTATGTCAGCGAATCACAAAAAGAAACAAACTAGCTAACAATCATTCTTGG
+CCTAGCCAGGCCCATCTTGTCCTCTTCTAAACTAATCAAAACATCTTCAGGAGGGGTCTC
+TAACTCATGCAAGCCCAGAATCCAGCATACCCGTCTATCCCGACC
+>ds2020-328_636
+CGATCTGAATTACGGCGGTCGGGATAGACGAACTGTGGCGGTCATTAGAGTCAATCGAAG
+AAAGGCTTGACAGGCTGAGAGTAATAAGGAAAGAGGATGGTGGACTAGGATGCGGAAAGG
+CATTGTTTCGTGGTACAATGGAAAAGAGAAACGGGCTATGGACAGGAAAAGGTGACATAA
+AAGTCGACAGGGGGAGCACACATGTACAAAAGCCAAAAGAAATTA
+>ds2020-328_637
+AGGTCGGGATTGAAGACCACTTTCCCTATTTTTTACTCTGAGTTAAGCCCTGTCTTTGTT
+TTGTCTACTTCAATTATTTTGTCTCAACAGAATGGACGTTCAGCAAGCATTTCTTAATAG
+CATAAGAAATGACTTCAATCAGAACTAGTCTCGTTGCACTGTTATGGGGGCATTTCTCAA
+TCGTTATAGTTTTTCTGGATCTCCTTTTGATCGTCGATCCCGACC
+>ds2020-328_638
+GTCGGGATAGACGTACCAGTCAACTTTTTGCAATTTTCTTCATACATCACATGGTATGAC
+TTGGTTTGCCCAAGTCCGCGATGTAGCCGCAGCCGAAGCCTCGTCTTTCGAAGGCTCAGG
+CACCCTGGCTGATTGTCCCCCATTCGGGATAACGTCAAACCAGGTAGTTGTTAACTACTT
+GGCCCCAGCCACACTGCCAACGTCCCCTATTCGTCTATCCCGACC
+>ds2020-328_639
+GGTCGGGATAGACGGCGTGGCCGGGTCTTGCGGCTGATGGGCCATTTGATAAGAGAGGAT
+TGCCTTTTTTTGATGTTCTTTGTAACAAAGCCCGGTAGGGGCGCGTCTGATAATATTGTT
+AAAAGGGCACATCAGCCGCAAGACCCGGCCACTTCGTCTATCAGGAAGAGGAACCGTCTA
+TCCCGACCAGGGGCTCTTCTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_640
+GGTCGGGATAGACGTTATTTGGTCTCGGGGAGACCGCCCATTTATCACATGGGAGGAGAA
+GACTAGTCAAACATTCGAGCTGTAAACTCGCAATATAGACTTGAAAAAAAGAAAGATATT
+GAGACGGAATATGAATGAAGGATTGAAGCATCTGACTGGGCTCCGGAGATGAATACCGAA
+AGAGCTTACCGGATGCACCATCGCACCACAACGTCTATCCCGACC
+>ds2020-328_641
+GGTCGGGATAGACGAAGGACCACCCTCCGCTTGGTAAAGCGACTCATAGGCGGATACCAC
+GTTGTTGTCAAGTGAGGTATAGATGAGCTGAACTTTACCTTGTAGACCACGAGCCGCTTG
+GGGAATATCGGTAGTGCGCTGTGCAGGTGCTGCAACGATGCTAATGCCCATAGGTTTAAA
+TTTTGTTTCAAGCGCTTTGAGTACCCCAGGTCGTCTATCCCGACC
+>ds2020-328_642
+GGTCGGGATGGACTTTGCGCCTTGTTAAAGCTTCACCTATTTCTAAAATTTCTGGAGAAC
+ATCACATACATTTCACAGCCGCGGAGGTGCTGCGCGCCATTCCTCGCGAAAAGAAGCTAC
+AGGCTCTACAAGCACTCCGTCTTCCTACGGATACCACTACCACCATGCTGGGGGGAGTCA
+TGTTATGGCTGGCCAGTCTAGACCCGTTTTCCGTCTATCCCGACC
+>ds2020-328_643
+GCCGTGGACCTAGTGCCGGATCGGGTGATGAACTAGGTCCACGGAGGTTACAGACAACAA
+AGTCCACCGCAGGGAGGAGTGAACTAGGTCCACGGCACCGTACTGTAAACTAGGTCCACG
+GCACGGGTCTAACAACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGCTCACAGGGCCT
+GTAGACGTCTATCCCGACCAGGGCTCCCGTTCGTCTATCCCGACC
+>ds2020-328_644
+GGTCGGGATAGACGTTTAAACCTCTTGTGCGTCTATCCGAGGGGCTCAAACCGTCTATCC
+CGACCAGGGAGAGCCACGTCTATCCCGACCAGGGCGATTGTGCGTCTATCCCGACCGCCG
+TGGACCTAGTATCAGGCTTCGTGCCGTGGACCTAGTTCAAGCTCACCTGCCGGGACCTAG
+TATTAATTGGTCTGCCGTGAACCAAGATTCGACTAGGTCCACGGC
+>ds2020-328_645
+GGTCGGATAGACGAAATGGACCAGTGAGCGTCTATCCCGACCAGCCATGGTGCCGTCTAT
+CCCGACCGCCGTATCGGACAGAGAGCCGTGGACCTAGTTTCCGCCCCCCTGCCGCGGACC
+TAGTACGTTCCTCCTTGCCGTGGACCTAGTTGTGGTGACCCTGCTGTGGACCTAGTAGAG
+TCTCGACTAGGTCCACGGCAGAATATGATTCACTAGGTCCACGGC
+>ds2020-328_646
+GGTCGGGATAGACGATAGCTGCCCATAGTGCCACGCCCGTAAGGAATGAGTTAGTAGCTT
+CTCTGGTTATCGATAAGGCCAGAGCTACGCTGTCAGAGTTGACTCCCAAGATGTCTACCA
+CCTCCTTGAACGAAAAGTGAACATGATGCGACGCCGTTATCTTGGTGTATTTTGCCGACA
+TTGCTTCATGTAACTGCCACCCTAGGACTGTAGTGGCGGCCGTT
+>ds2020-328_647
+GGTCGAGCTACTTCGTTACCCTCTCCTCTGAGATACGAGCTTGACAACCACATAGTAATA
+TCCTTTCAAGTACGCCTACAGGGATAGGATTTTCCTTCTTTTTTCGACAACCAGTATAGA
+AAGTATCTCGCCCCTCTGTAATTCTTATCCGTCCCCAGATGCTGAATGAGCTAATCCTGA
+TCTTTCTCTCATAGGGTGAGAACAACTCTGCGTCTATCCCGACC
+>ds2020-328_648
+GGTCGGGATAGACGGTGAAAACCCCTTTTAACCTGATATAAAGATTGTTTTAACCGTTTA
+GCCTGTCTGGCTAACTGCAGCCAAACCAGCATACAACAACAAATATGATTCCGCTGAATA
+CGAGCCTTACGACACTGATTAGCTTCAATACCAGTGAGTTGTTTAAGTTATCGGTGAAAC
+TGCTCAATCTTCCGGGGGAGGCCCAACGAACGTCTATCCCGACC
+>ds2020-328_649
+GGTCGGGATAGACGGAGTGGCTGTATTTCTGGGTGCAGTTGTTCTCAGCTTAGCTCTTTC
+CGAGTCTGTGTGTGTAGTAGGTTTCAGTGCTGTGTAGTCAGCAAGTTTATGTTGTTGTTG
+TGACTCTTCTTTCTTAATATTTTGACTATGGAAGCGGGCTATTCCCCTAAAATGTTCGTT
+AACGTTGGGATGTAGTTTAGGTAAGTGTAGCGTCTATCCCGACC
+>ds2020-328_650
+GGTCGGGATAGACGTTGGGATGGATTTCATTAACACCCATAGACCAGAAAAGGTGTTCGT
+AGGCATACCGCTTGCTGTTCAAGAATCGGTAGCGGTTTTAAGGGAGACTACCGAGCTCCA
+CGAGAAGCGCCTATCATCTCTATGCGAATTCTGACCTTAGCTTTTCGTCTTTTATTAGTA
+TTAGTGAAAGCTCGCTCGACTTAGATATCGCGTCTATCCCGACC
+>ds2020-328_651
+GGGCGGGATAGACGATAGTAGGCCATTAAAACTTCCCACGACGCCCCTGTTAAGTCTAAA
+CAATGCAGCCATAGCGCTACTGCAGCTACGAACTCCGCAGCTTGGTTTACATGGTCCTTA
+CACCAGGATAATACTAACACACTTTGTTGCCTAGAGCGACTGAGTCCACGAAGTTTATCC
+ACACCTGCCAAATTTTTAACTGACTTGCCACGTCTATCCCGACC
+>ds2020-328_652
+GGTCGGGTTAGACGACCAACGGGCGTAATAGAACTCAAGGCAAGTAAGAAGGGCAGTCCG
+CCTCGTAGATCGATTTCGGAGTCGTAAGTTAATGTTTCCTTCTCGGCCGTTGATGAAGGG
+GACCCTTCGGCAAGCCTGGCGGTTGCTGCCTTGAGCCGATATCTTCCCAGTCCAAGCATT
+AGAGAACGTGTGGGGATAAGGCCGACGCTGCGTCTATCCCGACC
+>ds2020-328_653
+GGCGGGATAGACGGTTTACCTCCTGGTCGGGATAGACGGTGTTTATGCCTGGTCGGGATA
+GACGGTCATAGGAGTTGGGGTCGTCTATCCCGTCGGACAGAGAGCCGTGGACCTAGTCTA
+TACCCCTTTGTGCACTAGGTCCACGGCACCGTAAGTCAACTAGGTCCACGGCAGGGCGTA
+GGCCACTAGGTCCACGGCAGGGAGCGACCAACTAGGTCCACGGC
+>ds2020-328_654
+GGTCGGGATAGACGGTTCGGATGGTTAAGAGATTATCTATGGATAAACTATTCATACCAA
+AAGGATTATATCCATTAATAAGTTGCGAAGAGTTTAACCATAGATAATCTCTTAACCATC
+CCATCAAATATGTGGAAGACTCATTAAACTGTGACACGTTACCCTGCCATAATGTGATGT
+GATTCCAATGACAATAAAAAGAGACCCCCTCGTCTATCCCGACC
+>ds2020-328_655
+GGTCGGGATAGACGAGAAAAGCAGCTCAAGTATGAGACTGTGATTAGCCCATCGGTCCGT
+TACTCTGCGCTGATGCAGACGCCATCAGTCATGTCCCCTGGCATGGCATCGGTTGAAAGA
+ATACCGATACAGGAGCGGATAGTGACTAATAAGCCTTACCACTCTTCATGTGTTTATCAC
+TAAGAAGTAAAACGAATAAAAGTCAAAATCGTCTATCCCGACC
+>ds2020-328_656
+GGTCGGGATAGACGTCTGCTGTTCGTCAGGACTTTGATGGATGCTACGTTAAGTATCTCA
+TACAGTGAGGCCACTATAGGTGCGGCTGAAATAGGGCGTGCTAAATCGGTGGTTAGGTCC
+GCTCTGCGGCTCAGGAAACCAAGGCACGATATGACATTTAAGGTTAAAGCTGCAAGCTCA
+GTATCGTATAGGCCTATAATGGGAGTGACCGTCTATCCCGACC
+>ds2020-328_657
+GGTCGGGATAGACGCAGATCTCTTTTCTGCTCCATACCTCCTCTGGTATTCTATGCTCCA
+ATGGAACCGATGGGCCTCGGTTGATCAAGTAAGCTACTGTGTTGACTGCTTCTGCCCAGA
+ACTGCTTCGGTAGACCTGACTGTATACGAATGCTTCTGGCTCTTTCTGTCAACGTTCGGT
+TCATACGCTCAGCTATACCATTATTTTGAGGCGTACCCGGTAC
+>ds2020-328_658
+GGTCGGGATAGACGGTCATAGCTTTTACTGATGCTTATGGATCACTTTCTGAATCGAACC
+CAAAAACGGATAGGTTTGATCGGCCTGGCCTCGGGTGGTGGATCGAATGAACACTCAACC
+GCGTCATCACGGAAGCGATGGATGCCCAACCTTTATATCACTTCCTTCTCAATAAAGGCG
+GGGATGGACTCTGAAATACTCCTCTCTGTCGTCTATCCCGACC
+>ds2020-328_659
+GGTCGGGATAGACGGACGCCACTCCTGCCACATCAATTAATGATAGTGGTAAGCATATAC
+CAAAAAGTAAGACGGGCGTGTGTCAATATAATGATAGCGGTAGCGATATAATGGCTTAGG
+GACAAAATCAATCCCATGCCCACCCCAAGGATGACAGCGCGCGATACGCTTGGCTGTTAA
+TAATCCACCCCCTGCACTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_660
+AACGGCCGCCACTACATTATGCACATCTGCGCCTCAACTACCGCCACAAAAGCCACCGCC
+ACCCACCACCACCACTTGAGGATGAAACTTTGAGCTCTTACTGCACATAGTCACCCAAAT
+GCAGGCACCCACCTCAATCTCTCCGCTGTAAAAACTCCCAATGCCCACATTGTGAAAAAA
+ACACCAAACCCATCCAAACCAATCCCAATTAGTGGCGGCCGTT
+>ds2020-328_661
+GGTCGGGATAGACGTTGGGATGAGTTTGGGTGATTGGTGATGGTAGAGAAAGATGAAATT
+CGTAGAGAATAGGAAGGGGGTTTTCTGGAGGTGTTTTGGTGATTTTGGACAGAATGGAGT
+GTTTGGGGAAGGATGGAAGTGTGAGAGGTTGGCTAGAGTGAATTGTAGTGGCTGAATGGA
+ATGAGATGTTGGGGATGTGAAGGATGGAGCGTCTATCCCGACC
+>ds2020-328_662
+GGTCGGGATAGACGCGGGAGTCAGTTCAAGTCTTACCTGAGACAATAGTATATAAAGTAG
+CTCAACCAATGGCAATTCCTCACGTATTCGAAGATCGGTAAATGCCTTAATCAACTAATT
+TAGGTTTTCTAGTGCGTGTAATTTCCATCCATTCATTACCAACGTAGTCTGGCTATAGCC
+CAGTTGTCCTGATCAGAAGAGGGGGTCCCCGTCTATCCCGACC
+>ds2020-328_663
+GGTCGGGATAGACGGAATAAGATACTTGTGGACGGATGACGTGGGAAGAAGTGGGGATCG
+GAGGTTGATGTGACGGTGGTTACAATGGTGTGGGCTGGTCATGTGGAGGACGAAGAACTG
+AACGCTTTGAGGAAACAATGGAGACAATGCGGCAAAATAGCCTCTCCTTTTCTTGGGTTG
+ATTGATGTTGTGTTCTTAGGAGAGTAGTGCGTCTATCCCGACC
+>ds2020-328_664
+AGAGCTTATCCCAATAGATCTAGCGGATCTAAGGGGTTTTTCCTCCTTTTCTTGGGAGAG
+TCTCTCCAGCTGGATCATAAGGGCACAAAACACCTTTGACTAGGTTCAAGCCTAGCCTAG
+GATACCCCGCTTCCGCATACACACCAGGGAATGAATTTGGAGAAGGATCAAAAGGAATTG
+GACTTGCTAACCCAATTGACGGGAATTAGTCGTCTATCCCGCC
+>ds2020-328_665
+GGTCGGGATAGACGAAGCTGCATCATGTCGGTGTTGACCATACCATAAAGCAAGAAAAAA
+GTAACTTGATCCAAACATATCCCAATAAATGCACAGATAAGGTAAGAGGACATGGACGCG
+CAGAAAGTAGTGACGAAGAGACTGACGAACAGGCAAAAAGCACAGATAAATAAGACGGCA
+AGTGCGCTAGAAAGAGAAGAAGCCGAATCCGTCTATCCCGACC
+>ds2020-328_666
+GGTCGGGATAGACGGGCGGTTTTGGTGAGTGAGAATGCGCTGCGATGGCTATCTTGCGCC
+CGGAGGTGTTGTGAAGCATTTGATTGCTGGAATGGCCACTCAATGAGCTGGCTGGATGGC
+GGAAGGTTGACCGAGATGCATGACGTGGCGCCGTCAGTTTTCCTTTATTTATTTATTTAT
+TTTTGTTTGGTTTTCGATAGTCAATCGAAGCGTCTATCCGACC
+>ds2020-328_667
+GGTCGGGATAGGCGGGAGTGTCGACTGGTCGGGATAGACGTAGAATGTATCTGTATCGTC
+TATCCCGAGACAGAGAGCCGTGGACCTAGTTCGCCGACTCTTGCCGTGGACCTAGTTCCT
+TAGCGGGTGAGTCACTAGGTCCACGGCAGGAAACTGGCACTAGGTCCACGGCAGAAAAAC
+GAGTACTAGGTCCACGGCAGAGATTATTAACTAGGTCCACGGC
+>ds2020-328_668
+GGTCGGGATAGACGTGGGATGTGGCTATGCCGAGTTCCGTGGACTGGTCCTATCCCACTA
+AAACGAGGCGTTCAACCCTCTCTCAGCAGTGGGCGCGTGTTTCAACGTCCTACGCAATGT
+TCTTCGAGATGTCGGCGGGTCTGTCGACCGGTCAATCTGCGCAAGGCAGTCATGCACAAA
+TGGTAGAAGTGACTATTATAGAGGGAGTACGTCTATCCCGACC
+>ds2020-328_669
+GGTCGGGATAGACGACGGCCGGCCATATACTTGCACATCAAAGAAGATTCCGACTGTCAG
+TCCCTGTTTGATACTTTCATCAGCTCAGACAACTACAAGTCAGAACTCAAAGCCTTCAAA
+GATGGCACTTATGATCAGAAGTACTCCGGCTCGACTACAATCGCCAGAAAAACGGTCCTC
+GCAAGTATCTTTTCAGACCAGTTCCCACATAAGGTCCACGGC
+>ds2020-328_670
+AATGACTCTAAGCCGAGGAATGATAAATTTGTCGGAATCCACCAGGGGTTTATTATCATG
+ACACCACTGTTCTAAGGAACAATCAACTTTGCGAGTGAACACCAATATATCTCCACTGCC
+AACTTCATGTACAAGCTTTGGTTCAAGAAAATATTTTGAACCGCACATTGCTGATAATCG
+ACGCCACCCATTTGCCACCTACCTCAAACGTCTATCCCGACC
+>ds2020-328_671
+CGTCGGGATAGACGGCTTTGGCTCTTGCCTCTTGCCCTACCGATCTATGCTACCTCGTAT
+GGTACTGTCTTTCTCGCTGCGTGCTTTTCTACAGGAAGCATCCCAACCAGCAGCTTAAGA
+AGGAGTTCCGGTGCCAATTTCATACCCTTTACCATAAAAGGGTAGTGCTCCTACCTTCCG
+GTCTACTGGTTATAGATCAATGGCTTACACCCCGTCCACGGC
+>ds2020-328_672
+AACGGCCGCCACTAATCAACTTTCTTTGGTGGGTCACAGTCGAAGGCTGATGAATCGGAC
+AGTTGGGTATCCAATAAGAGCTCTGTGTCGTCTGAGGGACGGAGATTCGGTGCTTCCGGT
+GGTGGGTTCGATCGGGAGAGGAAAGTGGGGTTCACATCTGATGGAGGTGCTGATTCTGAT
+AATTGGGGGAGGAAGAAAGAGGAGCGTACGTCTATCCCGACC
+>ds2020-328_673
+GGTCGGGATAGACGGCTTGCTGCCCTGCTTAATGGGTGGCTAGGCTTTGGCTACAAGCCC
+CAAAGGCCCAGACCCAGTTTCAATTTCAACTTAATTAATTGAAACAACAACAACAACAAT
+AACAATAATAACAAAATAATAGTCACAACAAATTGTAATAATCTTAATTCTTATATCAAC
+AATCAAGCAGCCGTCGAACTGTCCTCTGGGGCGGTCCACGGC
+>ds2020-328_674
+GGTCGGGATAGACGTACGGTTGCCCTGGGGGACTTGTTCTGTGATAAACAAATGACTCCA
+AACAAGAACCCCAGGGCAGCCAATCGTAAGAAAAGAGGTGAACCTGAGAAGAGCAGTAAG
+AGTAAGCGTTCAGGTGCTGGTGCTATGACCTTAAAGGCGGAAGATCCTCCCCTGGTTCTA
+ACCACCCTGAATGAAGAGAGGGCGCAGACGTCTATCCCGACC
+>ds2020-328_675
+GGTCGGGATAGACGTTCAGGTGCCATCTTTTTATCCGGTTTACTTGTAAGTTTTACTGGG
+TACGCCTTATATACTGCTTTTGGGCAACCCTCTCAACAACTAAGAGATCCATTCGAGGAA
+CACGGGGCTGATTACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGGCAAAAGGAAGTG
+TTCGTCTATCCCGACCAGGGCAGTTATACGTCTATCCCGACC
+>ds2020-328_676
+AACGGCCGCCACTAAAGAAGCATAATCAACACATCACACATCATCAACACCCACCATGGC
+CGCAAACGACTACTACACCTCCCATCCCATGGAGAATTCCACCCTCGCACCCCCAGACCT
+AACCTACTCCGCCTCCGCCACACAACACAACTACAACAACACATCACACATCATCAACAC
+CCACCATAGCACATCGACGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_677
+GGTCGGGATAGACGACTATCAGTGTTGAGGATAGGAGCGTTCATGTTCCTTTTTGTCACC
+GACCGTGCCACTTCTCTAAAGGTACTTTGCCTATTGGAAGTTTGACCTGTCATTAAGGTG
+GAATCCACTCCAGACTTTCCTTTATCCCATGAAACAAAATGGGATAAATCAAAAGAGCAG
+TCATCAAGTTCAACTGCAATATCATCCGGCGTCTATCCCACC
+>ds2020-328_678
+GGTCGGGATAGACGAGCAGGCCCCATTCCTTAACAATAGGTAGCCAAAACAGGAACCCGT
+TAACCCGCACAAGCCAATCTTGAAGCATCAATGACGAGGGGTATGAGACGACAGTTCGAT
+GCCAGAGCACAGAGCCTGCCGGTGCATACAACCCATTCACCACTCACACGCCGTTGCTTT
+GGCGAAGCCCAGCACCACCAAACCTGACCGTCTATCCCGACC
+>ds2020-328_679
+GGTCGGGATAGACGGACTTCAACGCTCTGATGCCCGCCCTTGTCGCTTTGGGCTATGACT
+AGGGCAACCATACCCGCCATTACCACAAGCCCGCCTTGTGCCATTGGTGAGCATTGCGGG
+CATGATGCCAAGCTTGTTCCTGTCATTGGTCAGTCAGTACCAGCTACCAGCCAAGCCGAT
+GCCAACCATTCACGATAACCACAACCAGCGTCTATCCCGACC
+>ds2020-328_680
+GGTCGGGATAGACGACGGACTCCGCTGAGAAGGATTCTCGTGCCAACTATTATGTTCAAA
+GACAGGCCTCAACGTGACTTTAAAGCGATTATTCTCGATTGAAATTTCCATAGATAGAAT
+AGAAATTAGGCCATCTCCTCAGAGGCGGCTTCGGCTGCGTCTTTGCCTATTCTCACCTGA
+GATAGCGTCTCATGACACCCATATTAACCGTCTATCCCGACC
+>ds2020-328_681
+GGTCGGGATAGACGTTTGCACTCGGTCCGGTACGACCATCAAACAATACTTGCTGACCTG
+AGGTTGGCATACCTGCTAATTCTAGCAAGCCTTTGATTTGCTGTTCTTTAGCGCCATCAA
+ATACTGCCGTACCCATTGGTACGCCTGCACGTAGATTTTTTGACATCGCAATGATTTCCT
+CATCACTGAGGCTGCCTAAGTCCTTTTCGCGTCTATCCGACC
+>ds2020-328_682
+GCCGTGGACCTAGTCGTCTATCCCATACAATATTAGGTCCACGGCAGGGGGAGCTCCACT
+AGGTCCACGGCCCCCCCGTGGACCTAGTTATGGAGGGAATACTAGGTCCACGGCAGGGTA
+GCAGGTACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGATAGACGCTGTCA
+ACGCCTGGTCGGGATAGACGTGACCAATCGTCTATCCCGACC
+>ds2020-328_683
+GGTCGGGATAGACGTGATACTAGCCTGGTCGGGATAGACGGACTACCCCCCTGGTCGGGA
+TAGACGCAGGTATGTTCGTCGTCTATCCCGTGTCATCAGATTCAAGCCTCAATAGAAGAG
+AAACCATAAAGAAAAGAATTTCTGAAGGAGAAAGTAGCTCTGCTGCTAGGGGGAAGAAGA
+TGAATGGGTCATCATCAACGGGAGCACAACTAGGTCCACGGC
+>ds2020-328_684
+GGTCGGGATAGACGATACCGCGGGGTACGCCGTCTATCCGACCAGGGTTTCAAAGCGTCT
+ATCCCGACCAGTGAATCGGGTCGTCTATCCCGACCAGGGTCCCTGATCGTCTATCCCGAC
+GGACAGAGAGCCGTGGACCTAGTTAGGCAGCAGGTACCGGACTAGGTCCAGAGGAGTTCA
+GTCACTAGGTCCCGGCAGAGGCCCGTCCACTAGGTCCACGGC
+>ds2020-328_685
+GGTCGGGATAGACGAGTGAATCGGTTTGCGCATTTTTGCACGTAACTTTGAGGTTGTAAT
+ACTGTGTCTGATAACCGTCGGTATACGCACTAAATGGCGCAACGTTATACGATGATGAGT
+CCTCGTTATAGTAGCTGCGTGCCCGCTTAGTTACTCCTTGCGTTGTTGATCCCTGGCCGT
+TGTCTTCCCCCACGTAGACAGCCCGACCGCGTCTATCCGACC
+>ds2020-328_686
+TAGTTAGAATTACGGGGTCGGGATAGACGTTTAATGTGCCTGGTCGGGATAGACGCATAT
+AACCGCTCGTTCCGTCACCACAACCACCACCACCGCCGACGACAATAACATCAACAAGAA
+CGATAACCACCGGAAAGACAACAACATCAACCAGAACGACAACAACATCAACCAGAACGA
+CAACAACAAGAGCGACAAGCAGGATAAGTAGTGGCGGCCGTT
+>ds2020-328_687
+GGTCGGGATAGACGGCGAGCCACCATGTGTGAAAAAGCACCCCACCGCCTCATTTGATAA
+AACTTCCAACTGAGGGCTCCATGCTACTATCAACCCTTTGCATTCACCACCATCTTCACT
+AGTACTAGTACTTCTCTCCAGCTCCAGCTCCTCTATGAAGTTGGGTGGCAGCTTCGCCTT
+TTCGGATTCCTTGACCACCCACGAACAGCGTCTATCCCGACC
+>ds2020-328_688
+GGTCGGGATAGACGGCGCGTTCGTATGAAGCAAGAGCAGGATTGCAGTCCGTAAGAGCAA
+TTCTTGAGCCAGCCATAGCGATTCTGCATGCGTGCAGGTACGATCCCGTGTTGCTCGCTT
+TCGTAGACAAATATGGTAGGAAAATGTACGACATTGCAGCTAGAACAAAACACGTGCTTG
+TTGCGTTTTCGTACGTCCATTGCAGAGGTTCCCAGCCCCCCT
+>ds2020-328_689
+GGTCGGGATAGACGGTACGTGGTCCTGGTCGGTGCCGCTATCGTCGGTACTGCAGGCTTG
+CCATCAACGCTGGCAGCGGCTAACGCGGGTAAAAAGATTTTGCTTGCTAATAAAGAAGCA
+TTATTGATGGCAGGTGAGCTGATGATTAAAGCCGTCAAGAAGTCAAATGACAAATTGCTG
+CCAATTAATAGCGAGCAGTGGTACTTGGCGTCTATCCCGACC
+>ds2020-328_690
+GGTTACCACGCGCTCAGGCGGAGAAGGGGCAGTTCGTGAGTTATGTGATTTGATATTAAA
+AGCCACCGGTCATTACAATGATATTTTGGCAAGCTATGTGGTTTAGTGACTGTAAGTTAG
+CTTGAGTAATTTTTTCTAAGTGGTTTAGTTTAAGTAATTTGTTTTAAGTGATTTGGCGTA
+TGCGGCTTGGTGTGGAGTGGGTATGCTCGTCTATCCCGACC
+>ds2020-328_691
+GGGCGGGATAGACGGGATTCTTGGGTCATCTCAATGGGTTCAGAAACCACACGTTTCTCT
+GGATCATCATAGCGTACTTCTACATATCCACTCAGAGGAAGGTCTTTTCGTAATGGATGA
+CCCTCGAAACCATAATCTGTTGATATACGGCGTAGATCCGGATGATTGATGGAAGAAACA
+CCAAACATATCCCAAACTAGTTCGCACCGTCTATCCCGACC
+>ds2020-328_692
+CCCCGCTTCCACACCCGCTCACTACTACTCCAAAGTGTATCAAATCTTTACGTCTGTCTT
+TAACCCAGCTTTGTTCCGCTCCTATCAACGCCGATCCGTTCTCGCCTCAATCGCTCTCGA
+CCCCGTCACCTACCCCGACCGTCACATGAACTTCTTCGATCTCGTTTTCTCCGCTTCCCG
+CTCCAATCTCGCCGAACTCCGCGCAAACGTCTATCCCGACC
+>ds2020-328_693
+GGTCGGGAGAGACGGAGGCCATGTGTCTTATATATCACACCTGAGGCGGTCTGGGATGGT
+ATACGCAAGGTTTTGGGATTAGCACCACGACCAACAAAGAGATCAGTTTCCGAGGCAATA
+ACCAGGGAACAAGTTGCTGCAATACTCAAAACGGAGCCGAAAGTAGTAGCCAAGGCCCAC
+ATGAAGTTAAATGAAACGGGGAGGTAGCGTCTATCCCGACC
+>ds2020-328_694
+GGTCGGGATTGGATGGAGATGATGGTGAAGATGAGATGGGTATTCTGGAAGCAATGTTGG
+CTGGCCGAAAGAGTAGGAAAAATGCAGCTTTGAGGGTTGAGCAAGAGGATTCCTTCGTGA
+CTGATATTCATGTGGAGAATGATGGCGATGAGGTGGAGTTCATGGAAAATGATAACCGGA
+AGAGCACAAGAAGGAAAGGATTAAAGATAGTGGCGGCCGTT
+>ds2020-328_695
+GCGGGATAGACGTTGAATCACCTTGGTCGGGATAGACGAGCATGGGGCCTTATCGTCTAT
+CACGGACAGAGAGCCGTGGACCTAGTGCGGCTCGGGCTGAAGAACTAGATCCACGGCAGG
+GATAAGTATACTAGGTCCACGGCAGGGACTGACGGACTAGGTCCACGGCAGGGGACTTAG
+AACTAGGTCCACGGCAGCCCTCGGTTTACTAGGTCCACGGC
+>ds2020-328_696
+GGTCGGGATAGACGGGGGAAGCTCCTGAGAAATGGAAGAGGGTGTTCCAAAGAGGTGGAT
+CCGGAAGTCTCACTGTATGAGTTCCGAGGACATGGGGTATGTCCGCACTCGATGGCAGAG
+GGCCTAAGTGTTGCGGGGCTTTGCTGTGGTTTACACCTTGAGGTGGGGGTGTGCCAACGA
+GACAAGTAGGGGGAGAACCTCGAAACTCGTCTATCCCGACC
+>ds2020-328_697
+TCATCCACCTGGTCGGGATAGCCGTGCCATCCCTAGTGTGCCGCTGGCTCTTAGGTTTCT
+GAATGTACCTCTGTGCTCCCGCCAGTTTCGTGCGCGATCTATGTTAAGATTATCAGTAAC
+TTGTACTGTTGCTCTCTTTATAGATAACGCCTTTAGCGTAGAGTTGTACACTCTTTTTGT
+TATGTTGTTTATTGTTATATCTCCCTTCCGTCTATCCGACC
+>ds2020-328_698
+GTCGGGATAGACGCCGGAATTGACTCAAAAAAGACCAGCTAACATATCCACTGTGCAAAG
+CATTGCAAACGACACTTCAGTCCAAATACCTACCGCTGAATATGTAGCAACAATAGTTAA
+AAGAAGCGGTATGAATTGGACAGGAAAAGAAGTCGGTTCTTTTTCAAAAATCATGGAAGA
+TGTTGGATTCGCCGAAGGCCGACAACCCGTCTATCCCGACC
+>ds2020-328_699
+GGTCGGGATAGACGAGAGGCACCACTGGTCGGGATAGACGACTGAAGCTCGTGGTCGGGA
+TAGACGACGAAGTGGGGTCAGCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTGCCAG
+TAACCGTGCCGTGGACCTAGTCCGCTTGTACGTGCCGTGGACCTAGTTTCTTCTGCCTTG
+CCTGGACCTAGTAGAAGCGACTGTCCAACTAGGTCCACGGC
+>ds2020-328_700
+GGTCGGGATAGACGATTACGCGCGCTGGTCGGGATAGACGATTATTTCCCCTGGTCGGGA
+TAGACGGCATACAACTCTGGTCGGGATAGACGAGAGCAGTGGATGTAGTCGTCTATCCCG
+GACAGAGAGCCGTGGACCTAGTCTACCAGACCCTGCCGTGGACCTAGTCCAGTTACTCCT
+GCCGTGGACCTAGTAATCGGGGTAAGTACTAGGTCCACGGC
+>ds2020-328_701
+GGTCGGGATAGACGTCACACCCTCTTCGAGGGTTTCCTTAGCATTTCTATGCCAGAGAAC
+TTTGCCGCACAATGGGATTAGTTTACTTTGAAGGGGACTCCTGACCTTGTTATCATAAAG
+CTCATGACGAGCCACTTCGCATTAAAGAACCAATACCATAATGGCAAGCCGTGACCCTAC
+CCTATAACCCCTGTACGAGAGAGCGGCGTCTATCCCGACC
+>ds2020-328_702
+GGTCGGGATAGACGCCTGTCGCAAGTGTAATACTTTTCGTTCTATGACTAATTTTTTTTA
+TTTGACAATATAATGTTGGGAACAATTTCTAGGATTCATTTTGCAAAGTCATATCAGGGT
+GAATTGGGTGAGAGAAGTTCTTATGTATTTCTTGATGGATAACTGTTGTTAATCGAGGTT
+GAGAAGACGTTGGAAGCTGTCAACTGCGTCTATCCCGACC
+>ds2020-328_703
+GGTCGGATAGACGCTATTATCCTCTGGTCGGGATAGACGCGCATGAACCTTGGTGGGTAG
+ACGTAAATCACTGGTTGACGTCTATCCCACGGACAAGAGCCGTGGACCTAGTCATCATTG
+CCGTGCCGTGGACCTAGTGGTAGTACCCGTGCCGTGGACCTAGTCTATACCCGAGGCCGT
+ACTAGGTCCACGGCAGGGTAGTGTTAACTAGGTCCACGGC
+>ds2020-328_704
+AACGGCCGCCACTATCCTCGTCTCTCACTCGGTCAACGACGCCGAATTTTGGCAAAAACG
+CTATGATGATGGCTATACTGGGTGGGATATCGGTCAAGTTTCGTCACCCCTGCAAGCCTA
+TATCGAGCATTTACTTGACAACGGCGTGAGTAAATCGGTACAGATTTTAATCCCTGGGGC
+GGGCAACGCTTATGAGTAGTGGCGGCCGTTGCTGTGTATT
+>ds2020-328_705
+GGTCGGGATAGACGTCCACGTGTGATGAGATACAGTATTTTCATATAAATTAAAATAGCA
+GTTTATAAGGCAAAAAGGGACTGAGGGAGAACCATACTCTAGCTAGTTAAATCAGGCCCG
+CCTGAACAAGTAGATAGAAGTCACGAACGTCGCATTGACGTGGCTGGCCTTGAGCTAAGT
+GATGACAGAGATCCAGGAGAGCGGATCGTCTATCCCGACC
+>ds2020-328_706
+GGTCGGGATAGACGAAATCATGTGCATTACTCAATGGGTTCTTGAAAACCAATCTTTTCT
+TGACTGCGCTCCAGAAAGTTAAATCATCATTAGCAAAATGTCTCGGGAAAACAGCTTCAG
+GGAGCATTGCGCAATTATCCTCCACCTGATCTTTCTGATTTGGCTCATCTTTGAACTGCT
+TGCTCCATCCGACACCAATCTCGACTAGGTCCACGGCTCT
+>ds2020-328_707
+GCCGTGGACCTAGTGATGACCGCCATGGAGAGGCAACGTGAGACTAGGTCCACGGCACCG
+ACCCCCCGACGAGGTCCACGGCAGGGCATGCTTAACTAGGTCCACGGCTCTCTGTCCGTG
+AATTACGGCGGTCGGGATAGACGTTTCACACCCCTGGTCGGGATAGACGGACTGAACCCC
+TGGTCGGGATAGACATAGGCGCCCACCGTCTATCCCGACC
+>ds2020-328_708
+GGTCGGGATAGACGCGCAACAACCTGGTCGGGATAGACGGAAATACCACCTGGTCGGGAT
+AGACGCATGGCCAATCAACGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTAACAACTG
+CTCTTGGCCGCTATGGAGCCCAATAAAGGACTAGGTCCACGGCAGGTGTTGATGAACTAG
+GTCCACGGCAGGGGATACAAAACTAGGTCCACGGCTCTCT
+>ds2020-328_709
+GGTCGGGATAGACGTTAATGTCGCCTGGTCGGGATAGACGTTATGACTACCTGGTCGGGA
+TAGACAGGCACCACCCTCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCGTTAATTC
+GCTGCCGTGGACCTAGTACCGATGTCCCTGCCGTGGACCTAGTTCTAAATTTCGTGCCGT
+GGACCTAGTTCTAAAGGGCTTGTGCCACTAGGTCCACGGC
+>ds2020-328_710
+GGTCGGGATAGACGTGCGAGTTCCCTGGTCGGGATAGACGCATCAGAATCCTGGTCGGGA
+TAGACGTAACCAGCACTTTAGAACGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTTAT
+ATTACGCTTGCCGTGGACCAGTGCCCCATGTCGTGCCGTGGACCTAGTTCGTCGACCCCT
+GCCGTTGACCTAGTACTTGCAGGGATACTAGGTCCACGGC
+>ds2020-328_711
+GGTCGGGATAGACGTAGATCGGTGGTGAGTCAGTACGAGGAAGAAATATACATAAAAAAG
+ATGTTACCCACAGATGCGAGAGATAAAGCAGGCTGGTTTTGTGCTTCTAAAATAAGTGAT
+CACAGTAAGTGGATGGAGCGACACCCAGAACTATATGCTTCAACACGCTTGAAGTACGAG
+TGGGGTAAAGTAAGAGCGCTACTAAACGTCTATCCCGCCC
+>ds2020-328_712
+GGTCGGGATAGACGAATCACTGTTATTCACTTCACCTGCTGGGCTTCTCGGGCTGCTGTT
+TAAACTGCAAAGAATTCGCGATGTGTATGGCAAGGATGTCAGTGAGTTCAAAGACTCGGA
+CACTGAGTTGTTCCTGCCCACTTTTGTCAACTCGGTTCCCGGCAGAGTCTTGCCTAGTGT
+GATTCTGGACAAAGAGGGCGCGGAGACGTCTAACCCGACC
+>ds2020-328_713
+TAATACACAGTAACGGCCGCCACTAAGTGATGCTTTTGCCATTGCACTTTAGGTACGATG
+TCCGACCGTACCAAGCGTACCTTCGAACTCCTCCGTTACACTTTGGGAGGAGACCGCCCC
+AGTCAAACTGCCTACCATGCACTGTCCCCGACCCGGATAGACGGGCCAAGTGCATGCATC
+GTCTATCCCGACCAGGCACCTGACTCGTCTATCCCGACC
+>ds2020-328_714
+TGAATTACGGCGGTCGGGATAGACGGTGGTGAGGAGTGTGTGTTGCATGTTGGGGGATAA
+GAGGGCTAGAGAGAGTGTGATGAGGAGCAATGGGGCGGCAAAGGTGTTGTTGGTGATGCA
+AAGTGGATATGGGGAGGGGAATTTTGTGAGGAGGATGTGTGGGGATTTGATTAAAGTTTT
+GAGTGTTGGGTTGAGGTGTGGGGTTCGTCTATCCCGACC
+>ds2020-328_715
+AAGGGACATTGTTTACAACTCAAAAGCACGGGATGTTAATATGTTAGGCTAAGGCACCTC
+TCATCACAGCACGTCGAAAGCATGCCATCAAATTCATTATTTAAAGCCTTAGAGCAGTAG
+CACGCACAGGGATAGAAAACCCTTCTGATCCCAAGGAATGCGCGTCTGGTGGTATCGAGA
+GAAAGGTTGCATTTAGGAGTGATTTCGTCTATCCCGACC
+>ds2020-328_716
+GGTCGGGATAGACGGCCGTAGCTTCTCTTTTTGGGAATAATTTTTATTGTAAAAATGATT
+ATTTCAGATAATCCCCGTCAGGGTTAGAAGACACGCGGACGGATTGACGAACGTACGTGC
+AAGAAAGTCACATCTATTGGATTACTCTAAATGGAACCTCGGACACTCACAAACCGCCTT
+GTCAGGATATCAGCGGCTGCGAATAGACGTGTGGAACTC
+>ds2020-328_717
+GGTCGGGATAGACGAAGGCCTAGAGTTGAATACATACGAACGATCACCGTGCCTAAAGGT
+ACCTACCACATCACGGGGATTGTACACAACATAGTCTTGAACGTCTAGATCTACATCTAT
+TGCTCCCCTGTCCATGCATTCTAGTAACATCCAGAAGCCTTTCACCAACCGAGTCAACTT
+AGATTGCCCAACAAAAACGCGCCAATGTCTATCCCGACC
+>ds2020-328_718
+GCCGTGGACCTAGTCTTATGTGTGGTCAGACTAGGTCACGGCAGGGAGGTGGGCACTAGG
+TCCACGGCACTGGAGTTTCGACTAGGTCCACGGCAGGGGATACGAACTAGGTCCACGGCT
+CTCTGTCCGGGTCGGGATAGACGGCTTGACCCCCTGGTCGGGATAGACGAGGAGCACCCC
+TGGGATAGAGCCGACACTAATTGGACGTCTATCCCGACC
+>ds2020-328_719
+TGAATTACGGCGGTCGGGATAGACGTAGTTTGCTAATGGCGGTGTTGGTGGGGTAGTTGG
+TGTTGGCGCCTGCCTGGATGTAACCGTGAGCTCCCTGGGTTTAGGAGGGGCAGATGATCC
+GTTGCTACGTAGTGGTTGTGGAGCTGTTGGTTTGCGACGGTCGTATGATATATGGGGTGA
+ATGAGGCGATAACAGGGATGCTGGCCGTCTATCCCGACC
+>ds2020-328_720
+GGTCGGGATAGACGATGGTAATGCATGGTCGGGATAGACGTAACCCTTCCTTGGTGGGTT
+GCGGGTGATTGTTGTGAAGGCCACTTTTGGAGGTCCAGTGCTGCAAAAACTGGCCTTTGT
+GTGCAAAAATGGGTCTTGGGACGAGGGCTGAAGGAGGGTTTGGTTGAGAAAATGGGGCGG
+TTAGTGCAGGCTGTTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_721
+GGTCGGGATAGACGCTTGGTCGCTTTTAGTTGTTTTCTTTGTTGCTGCCATTGACCCCTA
+TGCTGCATTCGATCCATCTGTCCCATCACCAGAGGCGGATATGTGCCCAGGCATCAGATG
+CCTTTCGGACCTGTAAGGGAAATCAGTCATAGGTAGGCCCCATAGCCATCTCCATTCATC
+AGAAACTATCAATTACGAGTCTGTGCCGTCTTCCCGACC
+>ds2020-328_722
+GGTCGGGATAGACGTAACTCATGGCTAACAACGTGTTTTGGGGCGGTAACCAGACTGTGG
+AATCAATCGATTCCGCGGTGAGTGCGGGCGACCTTACGGGTGATGTGGATACCCTAGTAA
+ACTCTAATGCCAAAAGGAGTGAACGGTACCAGAGCATGCTCAGCCGGTACCGTAGCGCGC
+CATCTGAACAAAAGGCAGGGTCCGTCTATCCCGACCGCC
+>ds2020-328_723
+GGTCGGGATGACGTACGCAAGCACTGGTCGGGATAGACGCACCATACCCCTGGTCGGGAT
+AGACGTTAGTGCGCTGTTTCGTCTATCCTGACAGAGAGCCGTGGACCTAGTCCTAGGGGC
+GTTATTTACTAGGTCCACGGCAGGTCAAGGTCCACTAGGTCCACGGCAGGAAAAATATAA
+CTAGGTCCACGGCACGGGGACTACGACTAGGTCCACAGC
+>ds2020-328_724
+TGCCTCTGGCCTTATATTCTCCCGTCCCACCTATGTTATCATGGACTATCATGTCGTCTA
+CTGACGATATTGTCCACGCCATAGCTTGCTTCTGCTCACCCGTCATCTCACCGCTGTACG
+TGTCGGCGAACGCTCGTAACACCGATTTCATGGATCCTGTGCTATGTTGGGAATTGAAAT
+CCTCGAAGTCAAAACATAACGCACCCGTCTATCCCGACC
+>ds2020-328_725
+GGTCGGGATAGACGAATATAACCCTTGGTCGGGATAGACGTTTTAGTACTGGTCGGGATA
+GACGCCCGTCCCCCCTGGTCGGGATAGATGGCACCTTTTCGTCTATCCCGACACGGACAG
+AGAGCCGTGGACCTAGTACTAGCGTGGGTGTATCACTAGGTCCACGGCAAGGGAGCTTGG
+ACTAGGTCCACGGCAGGGATGAGACACTAGGTCCACGGC
+>ds2020-328_726
+GGTCGGGATAGACGTAATGATCGGCTGGTCGGGATAGACGTTATAGTACCCTGTCGGGTA
+GACGACCCCTACAATGCGTCTATCCCACGGACAGAGAGCCGTGGACCTAGTGGGATGTTG
+GGTGCCGTGGACCTAGTAACTGGGCTCCTCAATAACTAGGTCCAGGCATGCTGGTAAGAA
+CTAGGTCTACGGCAGGCCGAGTATTACTAGGTCCACGGC
+>ds2020-328_727
+GGTGGGGCTGACGTGGCGAGGGCTTGCAGAGATAGGATGCATGAGGTGGTGGCGGAGGCA
+GTGGAACTGGAACGGATTTATAATAATAAGAAAGATCCGGTGGATTGGGATTGGGAGAGG
+GTGATGGAGGTGTGTTTTGGTAAAATGGATGAGGAGGTGAGTGGGATTGCGGCGGCCAGG
+AAGGTTGGGGGATACTAGGTCCACGGCTCTCTGTCCGA
+>ds2020-328_728
+GGTCGGGATAGACGTAGAGCTGCTGTTAGCCAAATAGGCATCCCCCTGGACACAGAGTCG
+TCCAAGCGTGACTCGAGTGCTTCGAGCAGGTCCCTCATGTCACTCGAGGGTTTCGACTCT
+ATTCTTGAGTGCACCAGAGTTGCCATTGCCCTCGCCAGATATTGCCCCTTAGATCGGCGC
+TAGTGATCTACACAAAGGGTTCAGCGTCTATCCCGACC
+>ds2020-328_729
+GGTCGGGATAGACGCGCTTTCGCCATTGGCTACTGTAACTTTTGTTTTGTACATCTTCGC
+CCACCTACTAATCGCCTCTTCACTATTCACTCCTTTTGGTCATATTATTTACATTCTGTT
+TTACTTCTGTGATCGTGTTAAGACGACGGTTTTGATGTTATGTGTAGTTGCTGTTGTATT
+GATACGGTTATCATTATATATGTAACCGATGGGGATTG
+>ds2020-328_730
+GGTCGGGATAGACGATCAGGCCCTCGAGAAAGACACTTAGACAACATTAGAGGATCTTTT
+TTTTTACTGTATGAGTGGCTCGGAAGAATAATCGCGCCTCCAGTCGATTCTACTTCATGT
+CTGACTAGATAAGTCACAAGGCCTGTCCTTCTTCAGGCCCCGGTCATCTAGTCGGGGTCG
+ACCAAACTTTCCCAAGTAAGAAACAAACAGAATTTCAC
+>ds2020-328_731
+GGTCGGATAGACGCCGGATGTCCTTGACGAAACCTTTGTACCTAGTGCTCGAAATCTGAG
+AATCAGCTTCCTTGAAGAAATCTCCACTCTCTGTTCTATACGCACAAGCGGTGGCATAGG
+CCGCAACGACAACGTTCACGAGCTCATCGGGGCGGTGTGAAAACCCCGACGAAAGCACGA
+TTCCGCTAAGCGAAATGGCGTTGACGTCTATCCCGACC
+>ds2020-328_732
+GGTCGGGATAGACGTTTCAAGCTCCTCTAGTCGTTCCTCAACTAGGTCGGACGCGGAAAG
+CGCTCCACCTGAGTTCGAGCGGTTATTTGATCGAATCTGTGATGAATACGCAGAGTGGGT
+GGGGAGAAGCGGGAGGCAATTACCTCCCGAATGGACGGTGCCCGACCTTGTTCGGGCAGT
+TATTACCGACAATCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_733
+GGTCGGGATAGACGACCCAATGCCCTGGTCGGGATAGACGGTCTACTCACCTGGTCGGGA
+TAGACGTCAGGGCTAAAATTCGTCTATCCCACGGACAGAGAGCCGTGGACCTAGTCCCAA
+ACACCCTGCCGTGGACCTAGTTCTCCTGTCTCTGCCGTGGACCTAGTCAGACCACAGCCG
+ACTAGGTCCCGGCCCCGAATCACAACTAGGTCCACGGC
+>ds2020-328_734
+GGTCGGGATAGACGGAGTGACCGGGGGTCGGGATAGACGCGCAACCCACTTGGTCGGGAT
+AGACGAATAACAATGCTCCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCAAATGTC
+CGCTGATACTAGGTCCACGGCAGGGATAAGTTGACTAGGTCCACGGCAGGTGCCCTTGAA
+CTAGGTCCACGGCAGGGATGTAGTACTAGGTCCACGGC
+>ds2020-328_735
+GGTCGGGATAGACGGCCTCGTACGCTGGTCGGGATAGACGCATACAGCCCCAATAGTCGT
+CTATCCCACGGACAGAGAGCCGTGGACCTAGTTATCAGCTACTTTGTCCACGGCAGCGCT
+CACGACACTAGGTCCACGGCAGTGAGCGAAAGACTAGGTCCACGGCAGGTGTAAAGTGAC
+TAGGTCCACGGCAGGGGTGTATCTACTAGGTCCACGGC
+>ds2020-328_736
+GGTCGGGATAGACGTATTAAGGCCTGGTCGGGATAGACGGTTCATATCCCTGGTCGGGAT
+AGACGGCCTATTTCCCTGGTCGGGATAGACGTATATGTAGCTTGGACGTCTATCCCGTGA
+CAGAGAGCCGTGGACCTAGTGCGGCAACCCCTGCCGTGGACCTAGTTACATTTTGCCTGC
+CGTGGACTAGTTATCCCCCCAATGACTAGGTCCACGGC
+>ds2020-328_737
+GGTCGGGATAGACGTTTGGGCAGTGTATCCCGACCAGCCACGCGTGTCGTCTATCCCGAC
+CAAGGCGTTCCACCGTCTATCCCGACCGGACAGAGAGCCGTGGACCTAGTACCCTGTTCC
+GTGCCGTGGACCTAGTAATTAGATCACTGCCGTGGACCTAGTCCCTTACTCCATACATGA
+ATAGGTCACGGCAACGGCATCTCAACTAGGTCCACGGC
+>ds2020-328_738
+GGTCGGGATAGACGGGTGCATACGCTGCGGGTCAGTTTCGGGGCGGGGGGGCAAATAGAG
+ACCAGAAGAATGATTCATTTGGATCGACGAGCTTTTTCAGCCCCAAAACTAAGAATCAAT
+GGAATGTCTGTCTATCCATGAATATCTATTCTATCTGTATATCTAGGGAATCACTTTATA
+CATATAAAATTATATTATGGCATGATATGATCGCCTA
+>ds2020-328_739
+GGTCGGGATAGACGAGGTTTGTACTTGACTAGCGATGGTTGAGTGCGACAAGAGACGGAG
+GTCTCGGCCCAAGATGAGGGAAAGGATACAACTTTGAAAGAGAAGTTGAAAAGGGTTAAG
+GCAGTGGTGCTTTGTGGTCCATGGAGCGAGGAGAAGAGAAATTCCTATATGGATTGTTAT
+GCAGCAGTGCAGTGGGGCCAATCCGTCTATCCCGACC
+>ds2020-328_740
+GGTCGGGATAGACGGGTGGTTGTTATTCTCTTACTAAATTGCCTGTAGACATGTGGGAAT
+TAATTAATTTGCATCATCTTGACGTGAGTGGAACCCAAATTGTAGAGATGCCAATGCAAA
+TGAGTACATTGAAAAGCTTGAGAACATTGTCCGCTTTTATTGTGGGCAAATCTACTGGGT
+CGACTATTGGAAGCGGGGGGAATCGTCTATCCCGACC
+>ds2020-328_741
+GCCGTGGACCTAGTATCTCTTACCCTGCCGTGGACCTAGTAATTGGGAGGGTGACTAGGT
+CCACGGCTCTCTGTCCGTGTCATAACCCCCTGTGACGTCTATCCCACCATCTATTGTACA
+CGTCTATCCCGACCAGGGGTCGCCGTCGTCTATCCCGACCAGCTATTTGGAACGTCTATC
+CCGACCCCCTTCACGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_742
+GGTCGGGATAGACGACGCCTCCCCGTCCTATGCCGTGAGCACAAATCTGAGCAACAACTA
+GCCCTGGGTTTGAGCCTAGCATTGCATACTTGGTCTGGATTCTTGTTTTAATGAAGTCGT
+TCCACACTTTGCTTTTCCTGATGTTTATATAATCTTGGGGTCTAAGTGTATCTAAATCAC
+CGTTGAACTTTACTCCCAAAGAACGTCTATCCCGACC
+>ds2020-328_743
+GGTCGGGATAGACGATTGCCACCACTCACTTTACTTTAGTCCACCCGGCATAACCGCATG
+TGAACCAACCGACTAACTTGCCTCTCCGGGATGAGAACCCATGATTTGATCTGCTAGCTT
+GAACGCCTGGATCATGCCGAGAAGAGAAAGTGAAGAAAAGACTGTCGGAACCGATCGGAG
+GAGTATTTCAGAGTCCATCCCCGCGTCTATCCCGACC
+>ds2020-328_744
+GGTCGGGATAGACGAAGAGAGGTCGTATTTCTTTGGGTTGGTAGTAATGGAATGGTTTCA
+TTATCTAAAATCAAGAACATTTCCCACCAAAGGATCAGTCCAATAATACCACTCACTGGT
+AAATAGCGCAATACTTCTTCGTGAATCTCCGCTATTTGAATATGGAACATCATAACAACG
+AATAGGAATGAAACGGCATAGGTCGTCTATCCCGACC
+>ds2020-328_745
+GGTCGGGATAGACGGATCGTATATATACTAGCAACACTCGAGGCAAGCTCTGGCTTTTTG
+GCGAGCGGTTGTCCTGTTTTTGGGTCAGTGACGACAACTTGCGGTGCTGCATGGGTCAGG
+CTTGTCACCTGTAGTACCGTCAATAACACTGCGCCGTTTGCCAAAGAGCCCACCAATTTT
+TTCATGCTTGTCACTTGTCCCCCCCGTCTATCCGACC
+>ds2020-328_746
+GGTCGGGATAGACGCGTCACCCCCATTATGTAAACTGTTTCCTCGCTTCAACGTGTCTTC
+AGATATCGCTTTTGTGTATATATAATTCAATATACTGTTCATGAATGTTGTCAGTCTCCA
+GCCTGACAGCAGTGTGTCTTTCGCCCTGTATGTACGCTTCGTACCAACATTGTCATGTAT
+TACCTGGTTGCCTACAGATTCAGCCGTCCATAAGGCC
+>ds2020-328_747
+GGTCGGGATAGACGGCGTGTTTTGGTATGTTGGGAGATATCATTATTGCCGAACCCAATG
+CTTACATTGCATTTGCGGGTAAAAGAGTAATTGAACAAACATTGAATAAGACAGTACCCG
+AGGATTCACAAGTGGCTGAATATTTATTCCATAAGGGCTTATTCGATCCAATCGTACCAC
+GTAATCCTTTACAGGGCGTATATCGTCTATCCCGACC
+>ds2020-328_748
+GGTCGGGATAGACGATTTGTGGGATTCATTACTGCAACCAAAGATGCTGCGTGATTTAAG
+TGAGGAAGTTGGCGATCGGATAATGGAAGGCCAAAGCGTTGACGAAGCATCGCTAATATG
+TGCCAGGCCATTAGGACAAGCAATCAGGTTGTTAAACCCACACGAAGACGTCATTCTAAT
+GGCGCAATCATATGGACTGTTAGAAAGTATAGGTGT
+>ds2020-328_749
+GGTCGGGATAGACGAACCCCACTGATCTAACTTTTGATGCGACGGATGTTGAGTTGAACG
+ATATTAAAATGCTAGTAACTGACTTCAAGTTTCAAGTTCAGTATGCTGTATCACAAAATG
+AGTAAGTTTTTTTTACAATTTTGTAACTCTTTTGATATTATCTGTTTCTTTTTGAAGTGC
+TTCCAGTTTCAGATTTGTACGGCGTCTATCCCGACC
+>ds2020-328_750
+GGTCGGGATAGACGTCGTCACCATTATGCACAGAGTCCACCACACCCGAGTGTGTGAATA
+CGCCTGCAATGTCCATGTATACATAGTTTAACACCGTATTGAGGAACGTAGTTAGCCTAG
+ACCCAGACAGCAAAGTGCCCGCAGGTCTGTAATTTTTCCCGTCTCCTGCATGAATCAGTA
+TGTCAGTGTAGCTATTTAGTATCCAGTCCATCGCGC
+>ds2020-328_751
+GCCGTGGACCTAGTATATTGTCACTTGGTCCACGGCAGGTAGAGGCACACTAGGTCCACG
+GCAGGAGCAAAGCAACTAGGTCCACGGCAAGCGGAACATTACTAGGTCCACGGCTCTCTG
+TCCGAGGGATAGACGAACGATGGGGCTTCACGTCTATCCCGACCACGGAGTGGTTACGTC
+TATCCCGACCACCACATTCTTTCGTCTATCCCGACC
+>ds2020-328_752
+GGTCGGGATAGACGATGGGGACAATTGTCAAACGATGTGCTCCGTTTGGAAGGCGGGGAC
+CGAGTCTCCATCCTTGTAAGGCCTGATGATGTTGATATTGTGAGAGTGAAGAAGACAGGG
+GTCCATCTAGAATGGGACAAAGTCATGAAGGAGAATAAATCGGATCGTCATTTGTATGAT
+TGGGAAATAAATGGGGATTTCGCGTCTATCCCGACC
+>ds2020-328_753
+GCCGTGGACCTAGTATTCATTACCCTGCCGTGGACCGTTATAGTTACGGCCGCCGTTTAC
+TGGGACTTCAATCAAGAGCTTGCACCCCATCATTTAATCTTCCAGCACCGGGCAGGCGTC
+ACACCCTATACGTCCACTTTCGTGTTTGCAGAGTGCTGTGTTTTTATTAAACAGTCGGGG
+GGGCCAGTTTATTGAACCCCTTCGTCTATCCCGACC
+>ds2020-328_754
+GGTCGGGATAGACGCGGGGTTGTTTTGTATTTAAGTCGGCAAAGCAACTCGTTATTGTGA
+CAGCTGCTCTTGTTTAAGATATACAGTTTGTCTGTTGAACGTTAGCTTTATTAATTGGTT
+ACTTGTTAGTTGGTTTACTTGATATTCACTTTCTCTACACTTTGTTACACGTGTTGGGAG
+ACGTACCATGACCCAGTGCCCTCGTCTATCCCGACC
+>ds2020-328_755
+GCCGTGGACCTAGTCAGACCTTCACTGCCGTGGACCTAGTCCATGCATGCGTGCCGTGGA
+CCCATGTATTTAGCCACTAGGTCCACGGCTCTCTGTCCGAGAATTAGGCGGTCGGGATAG
+ACGTGGGCCCCCACTGGTCGGGATAGACGGTACGCGGGACTGGTCTGGATAGACGGTTAT
+ATGCCCTTTGGTCGTCTATCCCGACCGCCGTAATTA
+>ds2020-328_756
+GGTCGGGATAGACGAAACCACGGCTGGTCGGGATAGACGTACTAAATCCCTGGTCGGGAT
+AGTCGGCGTTATCTCGTCTATCCAGACCAGGGGGAGGACACGTCTATCCCGACACGGACA
+GAGAGCCGTGGACCTAGTGATCGCATTCGTGACTAGGTCCCGGCAGGCAACTTATTACTA
+GGTCCACGGCAAGGGCAGAACAACTAGGTCCACGGC
+>ds2020-328_757
+GTCGGGATAGACGGCGATGTAGAATCGATTGAAGCCAAAGTGAATGAAGACTTTGTGCCG
+GCATGGCCTTGGCTGCCGATTGGGATTGGGATGAAAATATTGCCGCTTAAAGTTATGACC
+AAATTTTTATAAGCGCATATCTAAAAATTTTAAACTCTCAGCATCATCAACAGCGCCTTG
+GCAGCTGATGACGTTTATTATCCGTCTATCCCGACC
+>ds2020-328_758
+GGTCGGGATAGACGAGCAGCGGGGGTGTGAGAGCAGGCAGATAATGTGAGAGCTTGATTG
+CTTGATCGAGAAGAATGCCTTTTCTTGATTGCTTGATCGACTCACTCGTCTGATTGGCCC
+TACTATTCATTATGGCCTTCCCTCCCGACACGAGCATGAAGTCTTTCAATTCGAGTCTGT
+CATTAAGAAATAGTGGGTTAGCGTCTATCCCGACC
+>ds2020-328_759
+CGGTCGGATAGACGATGGTCCTGGTTTGACATGGTTTACGCGTTACTGGTTCCCGGAAGA
+GTTAATATCTCCATTAGCTAAACCCTTTCTTACCCTGCCCTTGGACTCGTATTTTGTTTG
+TACACAATCAACGGAGGCCTCCCCGACATATGTTGCAACGTCTTCAATAGCATGCGCTGT
+TTTCGTCTATCCCGACCGCCATAATTCAGATCGGA
+>ds2020-328_760
+GGTCGGGATAGACGGCAGATCGGGGTGTCCGGTGAGACGACGAGGAGGAGCTCCCAGGCG
+GGAAAGAGAATGGAAACGGTGGAGATGGCGGAGTGGTTGATGATGATGGAGGAGACGTGG
+AGAGCGCGATGAGTGGCGGGAAGCTGAGGGTGGTGATTGTCGTTGTAGAAGATTGCGTAG
+TTGGTGTGGATGTTGTCGATGGCGGTTGGTAAGTG
+>ds2020-328_761
+GGTCGGGATAGACGACTTTCCGCGCGCTTCTTCTTTAATATAGCAGTTATCTAATGAATA
+TAGTAACCACGGGAACACTCGTTGTTGTTCGAGGGACATCCTTTTACCAAACACTGCAAA
+ATATGCTTCCAACACAGCTTTCATCGAGCCCACGCTATGTTGCGAGTTAAAATCTTCAAA
+GTCAAAGCAGTAATGTACCCTGTCTATCCCGACCA
+>ds2020-328_762
+GGTCGGGATAGACGGAACTTCTTGCTCAGCAGGCGTAGCTTGGAGGGGGAGTGTAGCGGG
+GGTAAGGTAAGGAAGAGCCGCCAGAGAGGAAGCCAAACCGGCCTATTAAGCGCAGCTAAG
+CTAATATGCGCCGGAGAAAGCCAGGTGCCGGAGGTAAGCTCTATTCGGCCCGGAGCAAAA
+ATTCCCCATAACGAATGGACTCGACTGTCCCGACC
+>ds2020-328_763
+CGGTCGGGATAGACGGTGCTCTTCTCTCCAATTCATCCCCAAATACAAACCCATCTTCCT
+CTCTCTGCACCACAGCAATCGCCATCTCCATTTCCTTCACCAAAATACTCCTATTCATGT
+GCTGCTCTGCATAGAGCGGCCACGCCACCATCGACACCCCGGCGATCACCGCTTCAAGCA
+CCGAGTTCCAGCCACGTTTATCGTCTATCCCGACC
+>ds2020-328_764
+GGTCGGGTAGACGCATATGAGGTGTGCTATGTGCAACGCCAACGATATACAGCAGGGATA
+TCATTGGGCTGTAAGATTGGATAGATGTATGAGACAAATAATCGTGTCCCTATTATGTGC
+AGAAAAGAAAAGCACTAATGTAATAATAGAGTCCGGATTCCTCCATCAAGCGTCTGTGGT
+AAATGTAAACGAGCACGAAGACGTCTATCCCGTCC
+>ds2020-328_765
+GGTCGGGATAGACGTTAGCTGTCCATTTCTTGTATTTCTTACCAGTCATTGCATCATACA
+TGGTCGCATCATAGCCTCCTACTCTCAACGCTAACAGCATCTTGTTTGCAACTTTATTAT
+CATTAGTCGTGTACGATTTGGATCTGGCATCATAATCCATTCTAGCTTCGTATTGAAGAG
+AATTCATGTAGTACCTGTCGTCGTCTATCCCGACC
+>ds2020-328_766
+GGTCGGGATAGACGTGGCGTGGGTCTGAGAGTGTACGGACACACAGAGAAGAAAGGGGGA
+AGATAGAGAAATATGAAAAAAGCTTTGTGTTTGGATCAAACCCGCAACTTTTGGTATCTT
+TTTTTCCAACACAGAGAAGAGGTTCTCAGATATGAGAGAGAGAGAGAGAGAGAGAGAGAG
+AGAGAGGGGGGCGGCTGTTCGCGTCTATCCAGACC
+>ds2020-328_767
+GGTCGGGATAGACGACCAGCAGCATTACACAACACCCGATTTGCGGATGTTCAAGACACA
+GAGGACATGAGTACACACTACGAGCCAACGTTCGATGTGACCAGTGCGGCGGCTGAGGTA
+CAGAACACTGTACCTATCAGGTACGCGCCCACGGATGGTGCGAAGCATGACAAAGAGCCG
+CGTGCCCCTCAGCCCAGTAGTCCGTCTATCCGACC
+>ds2020-328_768
+GTCGGGATAGACGCTGGTAGATGGTAGCTGGGGTGTACAGTGGTAATAGGGATACTACAT
+TGATAAACACATTGTTGAACATAGCATACGCTAAGGTAGTTGACATTTCAGCTAACAACT
+TGAAAGTGAATATAGGGCTAGAAAGTAGATTGTGACATGGTGATGACATCATCAGTGTGC
+ATAGTACCTATACTGGCTCTGCGTCTATCCCGACC
+>ds2020-328_769
+GGTCGGGATAGACGCCGGGTTCACTTCTATCCCGACCAGCCCACGTAAACGTCTATCCCG
+ACCAGGAGGGTGAATCGTCTATCCCGACCCGGACAGAGAGCCGTGGACCTAGTGGGGTTG
+ACAATTAGGTCCACGGCAGGAGGTAATCTACTAGGTCCACGGCACTGGATAAATTACTAG
+GTCCACGGCAGGAATTATAATACTAGGTCCACGGC
+>ds2020-328_770
+GGTCGGGATAGACGCTCAAGGGCCATGTTCGTCTATCCCAGGATACTCGACCGTCTATCC
+CGACCAGGTGCATGTACCGTCTATCCCGACCGCCGTAATTCTAATACCAGCAACGGCCGC
+CACTAGTCGTGTGGGTTGATTATGATGAGAAGGAAATGGAACAACTCGATGAATTTAGTA
+GATCTTTTTAGGAGACCCAGGTAGTGGCGGCCGTT
+>ds2020-328_771
+GGTCGGGATAGACGCGCAGCCCCCTGGTCGGGATAGACGTTCCCTTGGTCTGGTCGGGAT
+AGACGAATAGGGTGGTTGTCCGTCTATCCCCCGGACAGAGAGCCGTGGACCTAGTCTACA
+ACTTGCTGCCGTGGACGTTTAGAATGCGCTGCCGTGGACCTAGTGGATGAAGGGGCCGTG
+GCCTAGTTCAACCCGCTAGAGACTAGGTCCACGGC
+>ds2020-328_772
+GGTCGGGATAGACGATCGTAAATCTCTGTAAGAGTTATCTTATCTTGTTATTTGCAATGG
+TGTACCCAGTTAACGCTGATACATTTGGGATACTGTGGAAATACATCAAGTAGTGATACA
+GTATTCTCGCACGAAGAGTAGCGAAAGTTCTTCGCTGTAGATGCATTTGCGATTGTCCTT
+GAAACACCTAAGGAGTATTTATAGTGGCGGCCGTT
+>ds2020-328_773
+GGTCGGGATAGACGAGGCAGCTTAATGGGAATGGTAAATGGAGTTTTTGAGGGTGACATC
+AATGTTTGTGTCTACGGTAATTTGATAAAGGCGTACGTGGCTCCGATGCCAGGGAACAGG
+TCAGCAGTCTACTATGACGTTAGTCAGCGAACTTGGGGAATACGTAAAGAAATACTCTCG
+CAGATGACGAGGCACAGCAACCGTCTATCCCGACC
+>ds2020-328_774
+TTTCTTATTATTTGACAGTGCAGAATGTTATTGATGACCATCAGCCATCATGCGCAAAAG
+CTTCACAAAGCCCCACTAAGAACATCATGATGACATCCTGAAAATGGTCCCAGCTACTAT
+TGCCGAAGGTCTGAACACCCGGCTCCTATTTTCAAACCAAGTCCTAGGTTCCAGCTACAA
+AAAAAGAGAGTAGGCAGCGTCGTCTATCCCGACC
+>ds2020-328_775
+CATGTTTTGGCCTTGTGTGTCCATAACTCAAAATAGGTGACCTAACGGCCGCCGCCCGAC
+TAAACATACCAATAGTCACCAGATTCATATGGGCTACTGAGGAGTAAGCAATGATCTTCT
+TAAGATCGATCTGTCTTGAAGTGGTCAAGGAAGTATATATTATAGCAATCGCGCTTGGAG
+TATAAATGAAAGAAGTCCCGCGTCTATCCCGACC
+>ds2020-328_776
+TATATTAGCGCTCTCCAAGTGTGCTTGTTCCTCCCTTCTTCCTTACCATGGCAAGTCTTT
+GTGAAATAACTCCGATGAGAAGAAAAAAGAAGGCGTTAAGAGACCCTCCTGGCCCAACCC
+TAGACACTCTAAGATCCTTTTTCAAACCTGCTCCCATTTCGAGTCAAGAGATAGATAAAT
+AGACACATCCCATTGCACTGACCGGGTTCGTTCG
+>ds2020-328_777
+TAACGGCCTATTTGCCAGATGAGACCACGCCAACAACAGCTTGTTTCTCAACGGTTCCTG
+ATGTTTCAGCCCATGATCCCTAAGTATACCATTGTACCTTGGGTCTGTGCGTACATCTGA
+CCCCTTAGTGCATGTACTGTCACCTAATCCGCCCGTTGCTTCAACAAGATTAGCAGCTTC
+CATCTTGTACAGCGAGCCGACGTCTATCCCGACC
+>ds2020-328_778
+GGTCGGGATAGACGATTTCGTACTCTGTATCTGAGCCGAACCGACTAGCGCCACAACTGA
+TAACCGATTATTATGGCGTCAACCACCGCATATCTACGGTAGACACGCACATAGCGGTAG
+CTGCAGAGGTTCGCAGGGTAAGGGGTTATATCCAACGAGCCCCGGCGGCTTTTCAATTTG
+TCGACACCATTCAGCCTGAGCGTCTAGCCCGCCC
+>ds2020-328_779
+GGTCGGGATAGACGAGGCTAAGGACTGGTCGGGATAGACGACATAACCACCTGGTCGGGA
+TAGACGAAAAACGCCGCTGCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTGCTCGG
+AGGGCTGCCGTGGACCTAGTCTTTCCCGCCCTGCCGTGGACCTAGTGTTAGGTGCTCTGC
+CTGGACCTAGTTAGTCTGCTACTAGGTCCACGGC
+>ds2020-328_780
+GGTCGGGATAGACGCTAACATCAGGTTTTCACGTCTATCCCGACCAGGGCCCGTATACGT
+CTATCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCCACCACCCACTATA
+ACACTAGGTCCACGGCAGGGCAGTTTTCACTAGGTCCACGGCAGGGCGAACTAAACTAGG
+TCCACGGCAGAGGGCGCATGACTAGGTCCACGGC
+>ds2020-328_781
+GGTCGGGATAGACGGTTCATTCGCCTGGTCGGGATAGACGATGACTCCTCTTGGTCGGGA
+TAGACAGGGATGATCCGTCTATCGGACAGAGAGCCGTGGACCTAGTTGTGTAGAGGGTGG
+ATGACTAGGTCACGGCAGACTGATAAGGACTAGGTCCACGGCAGGTGCTTTCTGACTAGG
+TCCACGGCAAGGCGATCGTCACTAGGTCCACGGC
+>ds2020-328_782
+GGTCGGGATAGACGACTGGTCGCCCTGGTCGGGATAGACGGATCTCCCCGCTGGTCGGGA
+TAGACGGTTATTGCGCCTGGTCGGGATAGACGAAGAGGTCCAGTACGTCTATCCCACGGA
+CAGAGAGCCGTGGACCTAGTCCATGCCCCGTTGCCGTGGACCTAGTTGGGTTGCTGCTGC
+CGTGGACCAAGTGCGTAAGTACTAGGTCCACGGC
+>ds2020-328_783
+GCCGTGGACCTAGTCAATGGCTCCCTGCCGTGGACCTAGTGCATACTTCCCTGCCGTGGA
+CCTAGTGCTGCAACGACTGCCGTGGCCTAGTGTATGGTCTGGAAAACTAGGTCCACGGCT
+CTCTGTCCGAATTACGGCGGTCGGGATAGACGTACAGAACTGGTGGTCGGGATAGACGGT
+TACACTCACTGGTGGGATAGACGCACTACCGACC
+>ds2020-328_784
+GGTCGGGATAGACGCCGCTTTGTGTTTCAGGGTATATACCCACCTGCAGCCAACCGTACG
+TTTGCCTCTTGGTAACGTGATCAGTTCCCAAGTGTCGTTCTTCTTTAGAGCCTCTATTTC
+TTCTATCATAGCTTTCTTCCCCTGAGGATGATTGAGGGCTTCTTCAAAATTGGGAGACCG
+TCTATCCCGACCGCCGTAATTCAGATCGGAAGA
+>ds2020-328_785
+GGTCGGGATAGACGGGCCGTAACAGCAGAAGCAAGGCTTAGATTACCAGATCGTGGACAC
+AATCTTCCTAGAGATGGAGAGCCCCCTGCCTCGCCTTTTCTAGCCTCTCCTTCTTGCTTG
+CTTACCTAGCTCTTGTCTTAGTGACTCTTCCTCTTTCTCATTATTCAGAACAGTGGAGCT
+TTCGATCATTTGGTTCGCGCGTCTATCCCGACC
+>ds2020-328_786
+GGTCGGGATAGACGTTTAGGGGCAATACAGTCAGGCAGCTATCTACCGATCCTCTCCTGC
+TTCTGCTTGATCTACGTCGTCTATTACCAGTCGCAGAGGCATACCCTGAGTCATCAGTAG
+TCCTCTGCTTATTGTGTCGCGTTAACGGCGGACGCTGGTCGCCTCTGCTCACTTCACTTG
+TGGAAGCACCTCCCATTCTCGTCTATCCCGACC
+>ds2020-328_787
+AATGGCACAGTCATTTCTCTTCTCGCTTTCTTTCCAGCACGGGGATTCGCCCGACGATCT
+TACCGCTAGCCAACATTTGATTTTTTATTAATAGGAATTTCTCTCTTCGTCTTGATGCCT
+GCTATCTTCCTAAACAGGATAGAAAGAAAGCCCCAACCTCTTCCTTCTTATACTAAGAGT
+ACACTTCAAAATAGCCCCCCCGCTATCCCGACC
+>ds2020-328_788
+GGTCGGGATAGACGGGGTTGGTACATTGCAGGCTGTGTATGAGGAGTCAAATTGTTTTCA
+TCTTGTGATGGAGTTGTGCTCTGGAGGGCGCCTGATTGATCAGATGGTTCAGGAGGTTCA
+GTATTCAGAGCACCGGGCTGCCAAGATATTCAAGGAAGTGATGCTAGTTATCAAGTATTG
+TCATGATATGGGACGGATGCGTCTATCCCGACC
+>ds2020-328_789
+GGTCGGGATAGACGCAGGATGGTATTTTCCCTAATTAGGAAAGATTGAATGTGTTATATC
+ATGTTCTTGGCTGCTGAAAGACGAGTTTTTTCAAAACCTGCTTCTCGCCCTGAGCTGAGC
+CCTACCACAAGAATACGTTTTAGGACTAGCAGATCGACTTGTTTAGCCCTTTTCTATTGG
+TTTAGTGAATCCCACCAATACGTCTTCCCGACC
+>ds2020-328_790
+GGTCGGGATAGACGAGTTATTTCCATGGTCGGGATAGACGCTATAGGGTGGTGCTTCGTC
+TATCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGACCTAGTCTGGGATGGGGGCCG
+TGGACCTAGTAAGCACCTACCTGCCGTGGACCTAGTGGTCCACCTCCTGCCGTGGACCTA
+GTTCGTTAGGGGGTCGGTCACTAGGTCCACGGC
+>ds2020-328_791
+GGTCGGGATAGACGTCGAACGGACTATCGCATATTGTGTGTTATCCGGGTTTGATAGGTT
+CCGACCGTTGGATCGTTTCCAAATTGAAGTAGGTTGTACTAGGTACTCTTAGAACCGTGT
+AGGTTTTTGCGGATCGTGAATCGGAGCCCCGGTTGTTCCGATTCATTAACTTAAAGTTTG
+GAGTTTTACGGTAACTGTACGTCTATCCCGACC
+>ds2020-328_792
+GGTCGGGATGACGGTTATATACGGTGGTCGGGATAGACGTGGATACCCCGTGGTCGGGAT
+AGACACTTGCGACCCTCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTGCTGCCGCC
+CCCGTGGACCTAGTGATGATTATCCTGCCGTGGACCTAGTGGCCACTCTCTGCCGTGGAC
+CAGTCACACCCCTGCACTCACTAGGTCCACGGC
+>ds2020-328_793
+GGTCGGGATAGACGCACGGTTACCTGGTCGGGATAGACGTCAGAGTGCCCTGGTCGGGAT
+AGACGAGTGTAAGTTTACGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTACCGGTCA
+CCTGCCGTGGACCTAGTCCTATCTCCGCTGCCTGGACCTAGTTCATCATCGGATTAGACA
+CTAGGTCAGGGGACGGAACACTAGGTCCACGGC
+>ds2020-328_794
+GCCGTGGACCTAGTAAATTCAACAATAGGTCAACGGCAGGGGGGGAATGACTAGGTCCAC
+GGCAGGTGAGGTTGGACTAGGTCCACGGCAGGAGCCAAGGAACTAGGTCCACGGCTCTCT
+GTCCGAGGATAGACGGGATTCACACTTATCGTCTATCCCGACCAGGGCGAATCAGCGTCT
+ATCCCACCAGGGGTACGTACGTCTATCCCGACC
+>ds2020-328_795
+GGTCGGGATAGACGCCACAAAGGGGTAAGGGGCAGGAAGGAGCCGCTTAACAAGGCACTT
+CCATTTCTCGCTCATCCGCTCGCAGCTAAAAAGCTATCCTTTGCTTTGATCCATTACTGG
+TTCCGCAGGCTCAAGCTTACTTCATTTTCCATCTCTCTATTTTTCTTTCTATTTTCTCGC
+CCAGCTAACAACAGCAACCGTCTATCCCGACC
+>ds2020-328_796
+TAAAGACAAAAAAAAGAACAAGTCAAAAATACAAATTTATTGAAGCAGAAGAGGCTCACC
+TGATACAAAAATTGAGCATAATTTCCAAGAAACAAAGGGTTGCCTGGATTTTCCTCAACC
+AGCTTCTTGTAATGCCCCTCAGCCCCATGGTTGTCTCCTCCATCATCACCAGATCCTTCC
+CAATTAACCTCTCCTACGCGTCTATCCCGACC
+>ds2020-328_797
+GGTCGGGATAGACGGTCGTCCTGCCTATTTAAAGTTTGAGAATAGGTCGAGGGCGATGCG
+CCCCCGAAGCCTCTAATCATTGGCTTTACCCGATAGAACTCGTACACGGGCTCCAGCTAT
+CCTGAGGGAAACTTCGGAGGGAACCAGCTACTAGACGGTTCGATTAGTCTTTCGCCCCTA
+TACCCAAGTCAGACGCGTCGTCTATCCCGACC
+>ds2020-328_798
+GGTCGGGATAGACGCTCAGATCACCTTCATCGGCTATGGCGAGGATGAATTTGGCTACCG
+CATTTGGGATAACGAAAACAAGAAGGTGATCCGCAGCAGAGATGTGATTTTTAATGAAAG
+AGTGATGTACAAGGACAGACATAAACACGACGCCAGCAACACAAAGCAGAGTGTGCCAAT
+ATTTGTAGATGCAATCTTCGTCTATCCCGCCC
+>ds2020-328_799
+GGTCGGGATAGACGTATGGGATGACTCCAGGTTCATATTAGGGAAAGGAGAGTGAGGGGA
+AGAGGGGGCAGCCCTCGGCCCGATCATCCAATTCGCTCCAACAGATAGGCATGGTTCTGT
+AGTCAAAGCAACTTCGTCACTTTCGTGTACCCATCGGACGGCAGCCCTTTCGGGGGTTCC
+TTAGGGACCGATTCACTGCGTCTATCCCGACC
+>ds2020-328_800
+ATCCACCACCTTCCTCCGGTTTGTCACCGGCAGTCTCTCTAAAGTGCCCATCTTACTGCT
+GGCAACTAGAAACGAGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGA
+GCTGACGACAGCCATGCACCACCTGTGTTCCGGCTCCCGAAGGCACTCATAGTGTCAAAA
+CCTCCCACTGGTGGTCCGCGTCTATCCCGACC
+>ds2020-328_801
+GGTCGGGATAGACGCTGACAGATCCTTTGTCTTTATTTGACCCCAAGAATGGATTGGATC
+GAAACGACTTTCCTGTCGAACCCCTTTTTGTCTGTATGAATTTCTGACCGCGCGGAATCT
+CCATAGCCAATTTTCCATTTTTGATTATGAAATCATAGGGTGCCTTTGGTAAAACTCTTA
+TTTCACACAATCCAGGAACTTCCATAACGTTG
+>ds2020-328_802
+GGTCGGGATAGACGGCTGGCGTCGCTTCCCGGCAAGTACCTTGCTTTTCCGGCGCTGGAA
+TCGATACCACTCGGTCTTCTACGGCGTCGTTTCATGGAGAGTTTCGGGTTCAGGGTCGTA
+GAGATTTTGGAGTGTCTTTGAGAACTAAAAGGTTTCGTGGGCAATCGAATTATGGATTTT
+GTGATGACGGGCATGATTCGTCTATCCCGACC
+>ds2020-328_803
+GGTCGGGATAGACGATACTAGCGCGTGGTCGGGATAGACGAACAGATTACCTGGTCGGGA
+TAGACGCAGGCCTAGTATTCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTGTACAA
+TCCCTGCCGTGGACCTAGTGTATAGTCCTTGCCGTGGACCTAGTTCTAATCCTCCTGCCG
+TGGACCAAGTCGACTTTTACTAGGTCCACGGC
+>ds2020-328_804
+GGTCGGGATAGACAGCAAGCCGAGTTGGCGTGTGGCAATTGATAACAGTGTATCAGTGGG
+TAGGGGGCAATAGGGTTATCCCTTTCTGTTGCTCCCCCCCACTGGGACACTGCCGATTGT
+TTGCGCGAATTCGCAAAAAGAAAAAGGCCAATGCGTTTGGTCGCTGGGTGTTAACATAAT
+TGCAAGATTGGGAGATTTCGTCTATCCCGACC
+>ds2020-328_805
+GGTCGGGATAGACGCATGGAGGAGCTGGAGAGGGAGAGGGGTAGAGCGAGAAAGATGAGA
+AAGGTCCATGGAAAGACTGTGATGAAGAAGAAGTAGTGGCTGGTGTTAAACAAGGACATG
+ATGGCTGGTTGGAAATGTTTAGAGAGAGCGAGCGAGAGAGAGCACGTAGCGGGTTTGTTT
+TTCGGGGGGGGAGGGCTTCGTCTATCCCGACC
+>ds2020-328_806
+GGTCGGGATAGACGACCTGAATCGGTGGTCGGGATAGGCGCCACACCTCAGCACATCGTC
+TATCCTCGGACAGAGAGCCGTGGACCTAGTTTGGTGCCGAGTGCCGTGGACCTAGTCGTA
+CTGCCTGTGCCGTGGACCTAGTGTGATCTCCCTGCCGTGGACCTAGTCGTAGATCCCCTG
+CCGTGGACTTAGCTTGATACTAGGTCCACGGC
+>ds2020-328_807
+TTAAAGGCACCTAAGGGTGTACTAAGTGGAAAAGGATGTGGGATCGCGAAGACAGCCAGG
+AGGTTGGCTTAATGTCAGCCAAACTCCGAATGCCATCAATTGTGTTGTGCGGCAGTGAGA
+CTGTGGGGGATAAGCTTCATAGTCGAGAGGGAAACAGCCCAGATCGCCGGTTAAGGCCCC
+TAAGGGTGTACTAAGTGGAAAAGGTGTGGTCT
+>ds2020-328_808
+GGTCGGGATAGACGTTATTGGGCCCTTCACGCCTTCCCTAGACCCCTCCAAGCTCACTCT
+GCAATCCTTCTTCCTCACTGAAAAGCTCACAACTTTAGCAATCTCCTCCAACTTCGATAT
+GATCGTCGAAACCGGGGCACCCGACACAAATCTCGCCTCCTCACCGCGCTCCTCAAACAA
+CCCACTAAGTCGTCTAACCCGACCGCCGAATT
+>ds2020-328_809
+GGTTGGATAGACGTTGGGAGGCAGTAGGAATGAAGGAGGCGGGAAGCTACCGCTTCTGGA
+ATGCAAGCTTATCCTTGACTTTTTTTTAGAGCGTACCGCTATAATAAATAAAGGTTTATG
+GATGAAGTAATCGGAGTGACAAATGGTTATGGTTGCGGAAACCAGAGAAAGTCGGTTACC
+CTTTGAATCAGATACCGACGTCTATCCCGACC
+>ds2020-328_810
+GGTCGGGATAGACGGGCGTGCGCCGTGGTCGGGATAGACGGTACCCGGACCTGGTCGGGA
+TAGACGAATCAATGGAGTGCTGGCGTCTATCCGGACAGAGAGCCGTGGACCTAGTTTGTC
+AGTTGGTCCACGGCAGTGTTGCCAGTACTAGGTCCACGGCAGGCACTTGGTTACTAGGTC
+CACGGCAGGCGATACGAGACTAGGTCCACGGC
+>ds2020-328_811
+GGTCGGGATAGACGGCCATATACCCTGGTCGGGATAGACGTTATTTGTGGGCATCGTCTA
+TCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTACGGCACGGGTGAATT
+AACTAGGTCCAGGCACGGGGAGAACAACTAGGTCCACGGCAGCAGGCTAGTAACTAGGTC
+CACGGCAGGCTGTATAGGACTAGGTCCACGGC
+>ds2020-328_812
+GGTCGGGATAGACGAGCAGCTCACCTGGTCGGGATAGACGGCCGTAGTGTGTTTCCTCGT
+CTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTGGGTAGAGATCTGC
+CGTGGACCTAGTTGCTTATGGGGGCCGTGGACCTAGTTTCTTTACTCCTGCCGGGACCTA
+GTATTAACGCTCCTGGACACTAGGTCCACGGC
+>ds2020-328_813
+GGTCGGGATAGACGTACTAGGTGCCTGGTCGGGATAGACGAATTCATTGGGTGGGCGCGT
+CTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCGTTACCCCCGTGC
+CGTGGACCTAGTCGCTTACTTGCTGCCGTGGACCTAGTAGTTTGGGGGATATAACTAGGT
+CCACGGAGCATAAATGGAACTAGGTCCACGGC
+>ds2020-328_814
+GGTCGGGATAGACGAACATTTTGGATCGCCGTCTATCCCGACCATACATCAATTACGTCT
+ATCCCCACCGCCGTAAATCAGGACCTAGTGAGGATTTAACTAGGTCCACGGCAGGATCGA
+TTATACTAGGTCCACGGCAGAGCAACTAAAACTAGGCACGGCACGGGCATATTACTAGGT
+CCACGGCCCCGGGTTACGACTAGGTCCACGGC
+>ds2020-328_815
+GGTCGGGATAGACGGTATTGATGGCTTTTTTGTAGTTGATGGCTTTTTGTAGTTGATGGC
+TTAGGGTCTCTAGGCCATTTAGCCTTTTGAAAACGCTTAGGCAACATGACGTGACTTCTT
+GTCTCTTTCAGCTGTTGTCTTCTCAGCCATACTCCTCCAGCCAACTTCTCTACAGCCAAC
+TCTTCATAGCCAACTTATGCGTCTATCCCGAC
+>ds2020-328_816
+GGTCGGGATAGACGGGCCATTACGATGAGGGGTTGTTGGTCGTTTCAAGGAGCGAGCTGA
+TCAGAAGCTATCGTTCGAGGTGGGGTCGTCACCGAACAGAGAAGAGCCGAGGATATGGTG
+AACCGACTGACAGTAATGTCGGAGACGGGAAGCTGGGGAAGCCGATCAATGAACTGGCGC
+GGGTGAGAGGAATTAGGCGTCTATCCCGACC
+>ds2020-328_817
+GAATTACGGCGGTCGGGATAGACGAAAAAAGGACATTATGCTGCATTTCTATCCAGAGAA
+TGCCAAGTATGAGGCGAAGGAGAAGCTAAGATGGCTAAAGTAAGTGGGGAGCGTGAAGGA
+CTATGTCACCACGTTCACCAACCTATTGTTCGAGGTGCCTAGCATGACGGATGAAGACAA
+ACTCATGTACTTCATGAGTGGCCTACAGAAT
+>ds2020-328_818
+GGTCGGGATAGACGCTGATTAGCACTCTAGGTCTCTTATCTTTGATCGCGATGTATCGAT
+GGCTTTCTTTCCGAAAGGTAAAGATGCCTAAAAGTTTCTTTCATCGCTTTTTATGTTTTT
+TAACTATTTTAGTGGTCGTGATAGTCAGAGATTGGGTAGTGCGCTTCATTGCCGTAGAGG
+CAATCTTCCCTATATCTCGTCTATCCCGACC
+>ds2020-328_819
+GAATAGTCAGACTAGCCAACCGGGGCTTCCTTCACAGGCCAACAAGCAATACCGCGCCAA
+CGAGAGAAAGCCGAAAGAATCTTTCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGGGC
+GGCGAAGGAATACACTAAGGCAGGTTTCAGAGCTCGATAAAGCAGACTAATACTTCTAGG
+TAACTAAGCGCTCATCGCGTCTATCCCGACC
+>ds2020-328_820
+GGTGGGGATAGACGGTCCGGCTCAGTAGCATAAAAGAAAACGGTAGCATAAAAGGAAATG
+GGGCGGCTAAGTGGGATAGCCGAGCCAGAAAAAAAAATAGATTTAGAAGATATAAATGAG
+TAGAAAAGAAAGGAATACTTTTAAAATATGACCTGATCCACCATACATATTAGGTTTGGT
+GGAATCAATTTTATTCCTACTTCAAGCATTG
+>ds2020-328_821
+GGTCGGGATAGACGATCGCCAGCTCTATCTGCTGCTTGGGCCAAGGCTCTCATGGTAGGA
+TATATGTTGGCAGTGACCACCGCCTGAATGTCTAACCACAGACCCTCTTCAAAACGTGTA
+CACTTGTCTTCCTCTGTGGTGACCAACTCAGGTGCAAACCTGGACAGCTCATTAAACTTG
+TGCTCATACTCCAACACCGTCTATCCCGACC
+>ds2020-328_822
+GGTCGGGATAGACGAGCTGCCTTCGAGCTTTCTACTACCATCCATTGTCCTTCTTCTGAG
+GAGAAGAGCCATTCATGAGCCCGAGTCTTAGGCACAATAAAAACCCCACAATGATATGCA
+AATGGACCAGATGATTCCTGGGCATCAAGAACTACAGCTCTGTAACTGAAACGGGAATCA
+CCACCCAAAGTAAGCTGAAAACGATGACCTG
+>ds2020-328_823
+GGTCGGGTAGACGGTCCCTCTGCTTGTTTGCCTCTGCATTAACGTTGTTAACTGCTATGC
+CGTGCGATAGCGCGAATGAGTTATATGCCGATGCTGGTCCTAGCGTAGCGCCATCAAAAG
+CCCCCGAGCAATGCATGCCATCGTACGTGGCATAGCCAACCACCAGGACATGCGGTGGTC
+CCAACACTGACCAACTCCGTCTATCCCGACC
+>ds2020-328_824
+CGGCGGTCGGGATAGACATCATAAGTGAGTGTGGTTGATGCAGTTGGGAGGAGGGGCTGT
+GCGAAGCGTGAGTTATTGAACTTGGAATCATCAAGTTCTGGTATTTCCAACTCGTCAAAC
+TTAACAAAACCTGCACCCTGTTTAGCTACTCTGAACGTCCAAGCATTCTTCCCAGTGATT
+AAGTCATCCGCATCAAACGTCTATCCCGACC
+>ds2020-328_825
+CTTACATCAATTGCCCAGCTGTTGTCTTTGACTTCAATAAGGGACTACCCTTGACAATAA
+TTAAGATTGGAAAGAACGCTAACGCAATCTCCGCTTGCAATCAAAGGCTTTTCAATAGGG
+AGGGGATAGACGGCATGCGTTCTTAACGTCTTCCCGACCAGGCGCCCGAGACGTCTATCC
+CGACCAGAGCTTACATGCGTCTATCCCGACC
+>ds2020-328_826
+GGTCGGGATAGACGTTTGGTTTGGTTATGACGAAGATAGACGGGTTTCCAGAGAAGCAAT
+GCTGATCATTCCGTGTTCATAAAAAGGAGAAAAGAGGAAACTACTGTTCTCCTAGTGTAC
+TCAGTTTAGAACTCTAAATTAACAAGTAAAATTTAGATATTAGTAAGATATGCAGCGAGT
+ACGCTCGGCGAGTACGGCGTCTCTCCCGACC
+>ds2020-328_827
+GGTCGGGATAGACGGGCCCCTCCCCTAATCTACTATCAAAACGTTTAACTATATATACGT
+AAAGAAACACATGCACAGACGATATAGCCAGTCACCGAACCTCTTCCCCGAATGAGTCGA
+AATTGCTACAGCCCTAAACCCGACAGAACTGAACCGGATGTGTGTCGACGACGAGTCTCA
+GGACGATGAGTGACATGCGTCTATCCCGACC
+>ds2020-328_828
+GGTCGGGATAGACGTTACCTAGCCCTGGAGTAATGTATTCTATGAATAATAAATAAAGGA
+GTAATGTATTCTATGAATAATAAATATGAAGAATACTCTTTCAATCAAAGAAATATTTCA
+ACTATTTCCGTGTTCGTATTTCGAAAGTAAAAAAACGTAATAGGAATACAAAAGATAGGA
+AATTTATTACAGATGAATTCTTCATAAATTT
+>ds2020-328_829
+GGTCGGGATGACGGCTTAGGGGACTAGGGACTGCCCTACGGCTCCCACTGAACCTGGAAT
+GCTCGGTCCTGATTCCACAAAAATTCACAAGTTCCCAACCCAGAAGTCACTTCTTGACAG
+CGAACTTGGGGGACTACTGTTTACACCATAATCAACCAAACATATCCAGCATCAAAACAA
+CTCGCACTGGCAAAATACGTCTATCCCGACC
+>ds2020-328_830
+GGTCGGGATAGACGCTTACCTTCCCATGGTGAGGTTAATTACTTTTCTGAGTACTTGAAA
+GGTAAAGCGATCGATGATGATGATCTATACGTTGATCCTATTTGTTTAGTTTCTATGGAT
+AAGTATAGACATATGATAAAATCCCAACTTACACCAGTTGAAGATAACAGTATGATGTTT
+GAGAGGCCTCTGGCAGCCGTCTATCCCGGCC
+>ds2020-328_831
+GCCGTGGACCTAGTCTGATATCCCCTGCCGTGACTAGTTTCCCACCGTCTTAGGCACTAG
+GTCCACGGCAGGACACGACGAACTAGGTCCACGGCAGAGTTCGCAGCACTAGGTCCACGG
+CTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGACATTCCTGCCTGGTCGGGATAGA
+CGTACAACCACCATGCTCGTCTATCCCGACC
+>ds2020-328_832
+GGTCGGGATAGACGAACTGTTCCACTGGTCGGGATAGACGTAAAGGTGGTTTGTCCGTCT
+ATCCCGACCGCCGTAATTCACGGACAAGAGCCGTGGACCTAGTCCGAACCCCCCTGCCGT
+GGACCTAGTTCTAAACTTCCTGCCGTGGACCTAGTTTTAGTGCACCTGCCGTGACCTAGT
+TCAGCACCGTCTTTGATACTAGGTCCACGGC
+>ds2020-328_833
+GGTCGGGATAGACGATACATACCCCTGGTCGGGATAGACGACACGATGGGGTGTTTGCGT
+CTATCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTCATAGAGCCGTGCC
+GTGGACCTAGTGTCTTTCCTGCTGCCGTGGACCTAGTGTCCACCACGGGCCGTGGCCTAG
+TTCCTATCGCACTTATAACTAGGTCCACGGC
+>ds2020-328_834
+GGTCGGATAGACGTACGGGCCTTGTCGGGATAGACGTGACGAATGCCTGGTCGGGATAGA
+CGGACTAGCCCCCGAACACGTCTATCCCGGACAGAGAGCCGTGGACCTAGTCATACATTA
+CTTGGTCCACGGCAGCCAGCTTGACACTAGGTCCACGGCAGGGGAAATGTCACTAGGTCC
+ACGGCAGGTCGAATGGCACTAGGTCCACGGC
+>ds2020-328_835
+GGTCGGGATAGACGGAGACCACGTATATCCCGACCAGGAACCACCAACGTCTATCCCGAC
+CAGGTGAGGCCGGCGTCTATCCCGACCCGGACAGAGAGCCGTGGACCTAGTGTGAGGGGT
+ATTAGGTCCACGGCAGAGAGTAGCAAACTAGGTCCACGGCAGGCTACATAGTACTAGGTC
+CACGGCCCCGCATGTTTACTAGGTCCACGGC
+>ds2020-328_836
+GGTCGGAAGACGGTCCATTTCGGTGGTCGGGATAGACGAGTTCGCTGCACCGTCTATCCT
+CGGACAGAGAGCCGTGGACCTAGTATTCTCTAACATGCCGTGGACCTAGTGCGCTCTCAC
+CTGCCGTGGACCTAGTTCCGTATCCTCTGCCGTGGACCTAGTGTTCTACCCCTGCCGTGG
+ACTAGAGGTCTTGAATTACTAGGTCCACGGC
+>ds2020-328_837
+GGTCGGGATAGACGCCCTCATCACCTCCACACGTCTATCCCGACCAGCGGTGTGTATCGT
+CTATCCCGACCGCCGAATTCCCGGACAGAGAGCCGTGGACCTAGTTAGTCCATACCTGCC
+GTGGACCTAGTACCCCCCCCCCTGCCGTGGACCTAGTCTTGAACCCCTGCCGTGGCCTAG
+TCTATACCAGTCTAGCCACTAGGTCCACGGC
+>ds2020-328_838
+GGTCGGGATAGACGCGCCGTGGTTGGTCAAGTGACATTACAAAGAGACACGGCCTCCTTC
+CGCCATCCTCCTTCTTTACGCAGCCCGCCGAGCGGACAGAGGTAGGGGCTTTGAAGGAAC
+TATCTTAGTAGCAGAACTATTAATAAGAATAACTGCTCACGCGGCAGATCGAAGTAGAAG
+CGTCAAAGGTCATAACTCGTCTATCCCGACC
+>ds2020-328_839
+GGTCGGGATAGACGGGGTCAAGTCCTTTTGAGTTGGCAACAGGACAACAACCTTTGACAC
+CGAACACAGTGGTGTCAGGCTACACGGGGAGTAGCCCAGCTGCATACAAGACAGCCAAGG
+AGTGGCAGGTGACTAATGAGCTGGCTCGGGCTCAATTGGAAAAGGCGACTAGGAAGATGA
+AGAAATGGGCTATAGACGTCTATCCCGACC
+>ds2020-328_840
+GGTCGGGATAGACGTCTGTTCCCACTCCACTTGTTTAGTGTATAATCCTCAGTAGCTCTT
+ACCAACGTTTCTCTTGTTAGCTTCGTCTTTGCCCTGTAATTATGATCGCTCTTAATGTTT
+ATTTTTCCTTTTCCATTCCATGGTTCCTTAGTCCTCTTATCACCTATTAGGCCAAGTCCG
+CCACAGCTTACCTTTATACAGTCTAGTTTT
+>ds2020-328_841
+GGTCGGGATAGACGATATCACTGGCTGCGTGCTACCCCGTGATCGCCAGCTGTTCCTGCC
+TGGGAGAGGAGACCTCATTGTCAGCCTTAAGGTAAATTCGATCGATCATGAAATGTTTTG
+TTATGTTCTTTTTGAACGGTTCCTTCTTTATACCAAAAATTATGCAAGCCCAGTTACCGT
+CTATCCCGACCGCCGTAATTCACACGGCAG
+>ds2020-328_842
+GATCTTAATTACGGCGGTCGGATAGACGACCCCCTCCCCTAGCTTTCGTCTCTCAGTGTC
+AGTGTCGGCCCAGCAGAGTGCTTTCGCCGTTGGTGTTCTTTCCGATCTCTACGCATTTCA
+CCGCTCCACCGGAAATTCCCTCTGCCCCCACCGTATTCGTGTCAGTACCCCTCCTGTCAG
+GCCCAAAGACAACAACCGTCTATCCCGACC
+>ds2020-328_843
+AATTACGGCGGTCGGATAGACGCCAGTTGCTTGTGAAGGGAGGGATCGGGTGGAAAGATG
+TGAAGTGTTTGGGAAGTGGCGGGCCCGCATGGGGATGGCGGGGTTCGAGTTGAGGCCCAT
+GAGCCAAAACATGACCGAGGTTTTGAAGCAGCGACTGAGTTCGGGTAATAACCGAGTCAA
+CTCGAGGGCTGTTAATCGTCTATCCCGACC
+>ds2020-328_844
+AACGGCCGCCACTAGATATGTTGGGTTTTTGGAAGTGAAGGAAACTGAGGAGAAGAGCAA
+GAGAATTAGGGTTGAGGAGGAGATGAGGGAGAGACTTGATGAGAAAGAGAATGAGCTTAG
+TTTGTTCAAGAAGAAAATTGAGGAATTGGAGTCGGTGACCACCAAGAACGGTGTTGAATA
+GTGGCGGCCGTTGCTGTGTATTAGATCGGA
+>ds2020-328_845
+GCCGTGGACCTAGTTAGGAGAGTAATTTCGGATGGTGTTCTTTACTGCTCTCTGATTTTC
+TGATAAGATTATCGCCGGCGTGGCTGCTACTCCCTCTGAAGCCTCTACTGCTGGCTTCGC
+AGTCAGGTGCAATAGATCCCTTGGATCTATCATATTCTCCCAGATATAATTTACAAGGCC
+CCTTCTTATCACGTTGTAATTCTTATACAC
+>ds2020-328_846
+GCCGTGGACCGAGTAGTTAGCCATTTGGTCCACGGCAGAGGCCAAAGAACTATGTCCAGG
+CAGGGGGAGATAACTAGGTCCACGGCAGTGTCTACCCGACTAGGTCCACGGCTCTCTGTC
+CGATCGGGATAGACGGTGTGCGTTGGTCTATCCCGACCAGGGCATTCTGACGTCTATCCC
+GACCAAGGGCCAATAACGTCTATCCCGACC
+>ds2020-328_847
+GGTCGGGATAGACGTGGGAGCCTAGTGTATCCTAGCTCCCTGTACGTTAAGAGAAAATGT
+ATTAATTACGTCCGCTCCGACTCTGCATGCGTTTACACCCTGCCACTCATCACTGTCTTC
+TTCGACGTGTATCAGGACGTGGGATGCTTGATGGCGGTCGACTGCATTAAGCCTAGCACC
+CCTACACGACTCATTTCGTCTATCCCGACC
+>ds2020-328_848
+GGTCGGGATAGACGGACCCTGTTGATTGGACTTTGAAAACTGAGTCTCAACCCGTATCTA
+TTCAACGTAGTTTAAATGATTTAGATTACATTCAGCAGTATTCTGATGGCACCGTTAAAA
+TTAATTTTGGTAATCAACCTAAGCCTCTCGTACAGCCTAAGTCTACTGTCCATTTGCCGC
+AGTTACCCACCCGCGGCGTCTATCCCGACC
+>ds2020-328_849
+GGTCGGGATAGACGATTATTATGTGTGGTTAGTGGCACTTGAATTGGTTGAGGGTAAGTT
+TGGATGATCAAGAATGGAAGAAGAGGATGGTGGTTGGTGAGAGACTTTGTGAGCAAAAGG
+CCTCAAAAGGTAAGAAGGAGGTGAAGGCCCCAAACCCAAACCCCCTCCTCCTCCTCCAGC
+TGATCTCATGAGGGCTCGTCTATCCCGACC
+>ds2020-328_850
+GGTCGGGATAGACGTCCCCCCGCTCTGTCTTTTCTCGCTTTGCTAATCTTCCCCTCTAAC
+GCGGGCCGGGCGCGGGAGTAAGAAACCTAAGAGAGGACGCTCTTCTCTTAGGTCCTTTTT
+TTCAGTGCAACACAGGAAAGCGCCCTCTTTTTGTTTTGTCAAACCTGCAGCTTTCCAGAT
+TTTGTATTGAACGCAGGCGTCTTCCCGACC
+>ds2020-328_851
+GGTCGGGATAGACGTTGCAAGCTCGTGGTCGGGATAGACGTTAACATTCACTGGTCGGGA
+TAAACGTTCGGCCCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTTCTTATCGTCCTG
+CCGTGGACCTAGTCCTCCTGCAGCTGCCGTGGACCTAGTACGCATCTACCTGCCGTGGAC
+CTAGACTCCCGACCCTACTAGGTCCACGGC
+>ds2020-328_852
+GGTCGGGATAGACGAAATAACTCCCTGGTCGGGATAGACGTATAGTGGCCCTTTCCGTCT
+ATCACGGACAGAGAGCCGTGGACCTAGTGCTTCCTCGCCTCTAGGGTAGTCAGAATGAGA
+CTAGGTCCACGGCAGGGAAAGACTACTAGGTCCACGGCAGTGATGGAGGTACTAGGTCCA
+CGGCAGGGGGCATGGGACTAGGTCCACGGC
+>ds2020-328_853
+GGTCGGGATAGACAGCACTTGCAGGTTATCGTCTATCCCGACCAGGAGTCCTTGTCGTCT
+ATCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGACCTAGTGTCCTGCTGCTGCCGT
+GGACCTAGTCAATTCTAAACTGCCGTGGACCTAGTGAGTCGCCCCCTGCCGTGACCTAGT
+ACACAAACCCATCCTGACTAGGTCCACGGC
+>ds2020-328_854
+GCCGTGGACCTAGTTCATATATTCCTGCCGTGGACCTAGTCAGCTAAGTACTGCCGTGGA
+CCTAGTCTTTCACCGCCTGCCGTGGCCTAGTGTTTACTGGTGTGCATACTAGGTCCACGG
+CTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGGCTGTGCCCAATCCGCGTCTATCC
+CACCAGGCCTGTCTTACGTCTATCCCGACC
+>ds2020-328_855
+GGTCGGGATAGACGAGTTGGTGCATTAGAGGCGACGCTAAACCATCGTCGTTTAATGAAT
+TCTCTAGAAACGGAGAATTATTTGTTAGTGGTGATTATGAATCCGCCACTGATAATCTAA
+ACTCTGAGGTCCAACTCGCCATTCTTGACGAGCTGCTGCAGCGCTCTACTTCGGTACCCA
+GGGGTATCCAGGGCACGCGTCATCCCGACC
+>ds2020-328_856
+GGTCGGGATAGACGAAAGTCCCATATTGCGTCTATCCGACCAGAGATGATCATCGTCTAT
+CCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCTATGGTGGCCTGCCGTG
+GACCTAGTACTTATTCCCCTGCCGTGGACCTAGTTCCTAAAACCCTGCCGTGACCTAGTC
+ACATAACTGCTACCGTACTAGGTCCACGGC
+>ds2020-328_857
+GGTCGGGATAGACGCATCCAGCTCATCGCACAACTCCTTTGCCATGCCTTCACCAACCAC
+TAGACGTCGACGCACCTTGCGACGCATGCGCTCGAATTCGAATGTGACGACAGAGATGGA
+CTCCCTTGTGTCAATGTTTAACAACATACAAATCCTTGGACGCATTGATTCATATCACAA
+GTTGGATCCTGATCTGCGCACTGCGGACCC
+>ds2020-328_858
+GGTCGGGATAGACGTCGAGAGTCCATCCTAGTAGTATAAACAAAATAACCTCACTATATG
+ATCCCATAGTAGTAAGAGCATTCCAAAATGCTTTCCAGCTTAAAAACGAGACTGATGCTG
+TTTGGATCATACAAAACAGAGCTAAATCTGCCGAATATGGTGATAATCATCTTGCTGTTC
+TAGTCAGGGCGGTCGTACGTCTATCCGACC
+>ds2020-328_859
+CAGCAAGCGGACTGGAATCAGAGTGATAGGGCGTACCCCAACCAAAGAAAGATGGAGGAA
+GTGAAAACAGAATTCCACGATTCATATGAAAGGCCGCTACAAGACAGGCAATTCAAGTTG
+CGGCTAGGGGAAACCTTGGATAAGGGGGAAACGTGGCAAACTGATGATTGACCGAAGCGG
+ACGAAGAGGCAGTTTCTAGTGGCGGCCGTT
+>ds2020-328_860
+GGTCGGGATAGACGACCTCCTCCAGGCGCTCAATCTTTCCCACAGCTTCAGGAAAGTGCT
+TTAAGCCTATTATAGTCTGCACGGAGCTCTTTAAGCGAGGAACAATGACCAATAGTATGA
+GGAATTTCTTCAATATCATTGGTTTCCACATTCAATATCTTGAGGCTAGCAAGGGACCCA
+ATTGAGTCAGGAAGCGCGTCTATCCCGACC
+>ds2020-328_861
+GGTCGGGATAGACACTCGTACCAATTGGGATAGATTCTGGGCATCTAGGTGGGGTTGGGC
+GCCTACAGGTGCTTATCACTCCCAGTACGTTGATGATGCTCAGTACAGAGCAAAGGAAGC
+CACTTTACGCAACAAGCCTTTTGCTGTATCAACCGTGACGGAACGCAATCGTGATTTTTT
+CACGACACCATCGCCCCGTCTATCCCGACC
+>ds2020-328_862
+TGATTGAATTACGGCGGTCGGGATAGACGATATTGACGGCTGTGTAGGTCCTGCCCTTGC
+TACACGTCGTTATGTACACACACAAATCTCACCTACTCTGTAGGTTCGAGACGGCATAAG
+GAACCCCAAATGCGGGGGTTCGACGTGTTGAGCCTTAGCTGCTCTCGCGTTGCCACGGCA
+GGCAGGGGACTGATTCGTCTATCCCGACC
+>ds2020-328_863
+GGGTAAACGCTTACTGAAGGACGTCTTGCTGGCAGGGAAGAACGCCAAGAAGCACAACAT
+ACGTCTGCAGATGAGCAAGTGTGCGTACGGAGCTATAGCTGAATTCCTTCGTGTAGATCA
+CAAGCGCGGATCTAAGGGGCAATATCTGTCGAGGGCAATGGCAACTCTGGTGCACTCAAG
+AATAGAGTCGAACAACGTCTATCCCGACC
+>ds2020-328_864
+GGTCGGGATAGACGGGTCATGGCCTTCTATTTAGTCGATGCTTGTTTTTCCGGATAAGTA
+GTATTTTATCTTCAAGTTCAAGGGAGTTGTTGGAGTGCTTTTGTAAGTCCTGTTGGCGTG
+CTATAAAATTTCATTTGAATGATAGGCCAATCTAAGTCTTCCATGTCGGTTCGAGGGGAA
+GGAAGGTGCAAACGTCTATCCCGCCGCCG
+>ds2020-328_865
+AATTACGGCGGTCGGGATAGACGCTTCAGTGTGGTATTCATTCTCGTTCGGCTCTTGGAA
+TCACATCCAGCAGTGGTTGGAACAGCTCGCAAAATCCAACCACTTTACCTACTTCATTGC
+CCCCAACCGTTTCTCGTACCTCTATTGAAACAGAATGGTTTCATGTTCCTTCATCGATTG
+GTTATTGCTCTACTTCGTCTATCCCGACC
+>ds2020-328_866
+GGTCGGGATAGACGGCATTATAGGGTTAATGCAATTTCATACCAGTACATTGCTTGCTAG
+CATTGTGCATAATTTAAAAACTGCCCTAGGCTTGAAACAAAAATATGGACTATCTTAGGA
+TTATTGTGTCTGTTGGTTGGCAAAACTAGCCAATAGACGTGAATTTACTGCAATTTAGGA
+GACAGGGACGTCATTCGTCTATCCCGACC
+>ds2020-328_867
+GGTCGGATAGACGTCTAGTAGCGCTTGCATCTGTTCTTTTGAAAACTTGTTTTTGAAGAC
+AGCACCGTATGCATCAATAACTGCCTGCATAGAAGATATTGAGTGCTGGCTGTTAAAGTC
+TTCAAAGTCAAGACAGTAAGGTAGTCGTCCTGCTAGCACCCCCGACACGCGAGCGCTGAC
+ATTTGCGTCATTGGCGTCTATCCCGACCC
+>ds2020-328_868
+GGTCGGGATAGACGCGTAATAACTGTACATGACGATGAAGAGAAGTCAGGTTACGTGCTG
+TTGAAGAATGGTCTTAATGACTACGCCAATTACGTGGTCGAGAGATTAGGGATAGAGTTT
+GATATCCCAAATAGAGAAGAAATGTTCAAACGATTAGTGAATTCACTAACAAAACCAAAG
+AGAACATAGAAGATAGTTATTGATATCGA
+>ds2020-328_869
+GGTCGGGATAGACGGACGATTTGGGTGCAGGTATTGGTAGGCGCCGCAGGGACTCATCAG
+GCTTTGGTGGGCCAAGTCAGGGCCCATCAAAGAGGGGTGGATCCAGTTCGAGTGCTGCTG
+GTTGGGATCTTTTTAAACTGTGAATTTTGAGCAGGTTGAAAGTTGGGAAATATTCAATTT
+ACAAGGGAGAAAATTCGTCTATCCCGACC
+>ds2020-328_870
+TACGGCGGTCGGGATAGACGTAGTAGGTGGATGGTCTGGTTAATTGGGAAGAGGAGCATA
+AAAACAGGGTGTCTCCCAATTTGGCGGAGATGCCGGAGGGTCTGGTTTACGAGCGAGCTT
+CACAACTTTTCAGCAGGTCAATATCAGCTGGTAAAAGGCCTAGAAAGTTCGACTGGCGTG
+AAAACTGGCATATACCGTCTATCCCGACC
+>ds2020-328_871
+GGTCGGGATAGACGAGGCGGGCAGATTAGCGTAGATTTCTGAAGCCGTGTAGTGTATGTG
+ATGTTCACCAGATATTGCCTCTTTCGGTAACTCATCCAATCTGTTAATGGGTGAGACGTC
+AGAGAATGACCAGTCTGGGTGGCGGTCTATTAAACTTTCAACAGAATAAGAAATGTTATC
+TAAAGAAGCAAGGTGCGTCTATCCTGACC
+>ds2020-328_872
+TGAATTACGGCGGTCGGGATAGACGTCAAGGGCTCCTGTCTTCAAAACGGTAACCCTTGG
+CAAGTGCATGTACAACATCGACAATCGCGCGTTCGGCATTGCCATATAGCAAAATATCAG
+CGCGGCTATCCATCAAAATGCTACGGCGCACTTTGTCTGACCAATAATCAGAATGGGCGA
+TACACCATGACATACCGTCTATCCCGACC
+>ds2020-328_873
+GGTCGGGATAGACGGGTTATCGGGGGGTCGGGGTAGACGGTCGCACGTGCTATATTCCCT
+AAAAGTGACTTGGTGCACACAACCTTCGCACCTTTGAGCCTAGCTCCCATCTCTACGGCG
+GTTTGCGCATCCGGCACAAGAAGCATTGATCTCCCTTTATGATTCTCGGCCACGTACCTA
+GCCAAGCCCACCAAGCGTCTATCCCGACC
+>ds2020-328_874
+GGTCGGGATAGACGGATCCCCCAACTAACAACTGATCCATCAACATTTCCTCGTCTCCTG
+TCATCATTTCTATTGTATTGTACTCAATGTCATTTCCCTTGTTAGTGTCAATTATATAAT
+AAGGCGATAGCAACCTGTTCACCATCTCCACTTCAATTAAATCTTCAGGAGCATCTGCTA
+TTAATGAGCCTCGGACGTCTATCCCGACC
+>ds2020-328_875
+GCCGTGGACCGAGTAGCCGCTCTCGTGCCGTGGACCTAGTCCCTTTCCCCTGCCGTGGAC
+CTAGTTTGACTCCCCTTGCCGTGGACCTAGTATATAGCTACATACTAGGAGGAGCCCGAT
+GACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGGTAATTTGGCCTATCGTCTATCCCG
+ACCACCGCATCTTCTCGTCTATCCCGACC
+>ds2020-328_876
+GGTCGGGATAGACGATTTTTGAACATGGCTGGGCTGACTGTAAGAGAGTGCAGCATAGCT
+GAATACATTATAACGGGGAACCAACGTACAACGCCGTTTTTAATAGACCAGACCTTCACC
+AATTACTCAAGTGGTAAAAAAATTGTTGCTTACAATTCTGCGGGCGCAACTAACAATCAA
+GCACAAGTAACCCAAACGTCTATCCGACC
+>ds2020-328_877
+GGTCGGGATAGACGTTGCTGGTCGGGATAGACGTCCCAGGACACTGGTCGGGATAGACGA
+TTGGGGGGTTCCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCAGCCGAGGGGTACT
+AGGTCAACGGCAGGTCGAGGGACACTAGGTCCACGGCACGACAGAGTAGACTAGGTCCAC
+GGCAGGCGAGGATGTACTAGGTCCACGGC
+>ds2020-328_878
+GGTCGGGATAGACGCTCTACACCCTTGGTCGGGATAGACGACAAGGAAGCCTGTCGGGAT
+AGACGCGAATCATCCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTGAGGAGTAGTGT
+GCATACTAGGTCAGGTGCACTATCACTAGGTCCACGGCAGACAAAGGACGACTAGGTCCA
+CGGCAGGAGCAAGGAACTAGGTCCACGGC
+>ds2020-328_879
+GGTCGGGATGACGGCGCTCATGCCTGGTCGGGATAGACGTTTCAAGGGTCTAATCTCGTC
+TATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTGCGACGTGTCCTGCC
+GTGGACCTAGTATTCCACTCCTGCCGTGGTCCTTGTGTCATTTTGCCTGCCGTGGCCTAG
+TGCATCAGGGTTTGAACTAGGTCCACGGC
+>ds2020-328_880
+GCCGTGGACCTAGTCTAAAGAACACTGCCGTGGACCTAGTGACTAATTTGCTTCCGTGGA
+CCTAGTCTGTACCCTCTACACAACTAGGTCCACGGCTCTCTGTCCGTAATTACGGCGGTC
+GGGATAGACGACAAGGCCAAATCTCCGTCTATCCCGACCAGGAGCTAGAGACGTCTATCC
+CGACCAGGAGGTTATTCGTCATCCCGACC
+>ds2020-328_881
+GGTCGGGATAGACGCATGTATCTTCTGGTTGCTTCTGGGTCTGGTCTAAGGTTGGTTCTA
+AGGCTGGTTTGGAACCCTTCCCTTGAACAGGAGCTTCAGCTTAAGTAGCCGCTGGTGTCG
+AAGCTGAAACTGCAGGATCTGTTGTAGACGCAGGAGCTTGTCTCGTCCGCTACTATCCCT
+CTGATGATCGATGTCCGTCTATCCGACC
+>ds2020-328_882
+GGTCGGGATAGACGATACTCGGTGGTATAATCTGGGTATACAAGGCGCTAACGATATGCA
+CCCATATAGAATTATTCTAGAATGCTGTTCTTTAAGGTTCGGTAAGCAATTCGATATAAA
+ATGGGACACTATAGCTGGACCAGACATAATGACAGAGCTAGCTACATCGGAAGTAGTCAA
+ACAACGAGATATTGAGATTGAAATTGTA
+>ds2020-328_883
+GGTCGGGATAGACGCTTTCGGGCCTTTTGATAACTAATTAGAGTTGACATGAAATGGATC
+GCGGAAGAAGACGTATCTGATGAATGAATGATTCAATCCCCTCCCACCCGCACGGTTCCT
+CTATTGAAGGGGTTCCACTTCATTCTATGTGAGGTGGGGCGTACGTAAGAGCGGAACCTA
+GATAGAACGCGGAGCGCCGGCCCCGGCC
+>ds2020-328_884
+GGTCGGGATAGACGGAGTTGCATCATAAGAAAGAAAATTGAAAGATGAAGACCTGTCCAG
+CCTAAAAAAGAATGCTATTTCCCCATTGAAGAGGACAAGGAGAGACTTGCTAGGAGAAGA
+AAAGTAAACAAGTGGAGCTCTTTGGAAGAGGACACCTTGAGGGCTGGTGTAGGGCAGTAT
+GGAGTGGGACTAATCGTCTATCCCGACC
+>ds2020-328_885
+GGTCGGGATAGACGGGGGGTCCTGCGGTCGGGATAGACGGAAAGGCCTAGTCTATCCGAC
+CAGGCAGATTTGGCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTTCCAATTGGCTG
+CCGTGGACCTAGTATTTTTGGCCTTGCCGTGGACCTAGTGCGGCCTCTCCTGCCGTGGAC
+CTACTCAATTATTCACTAGGTCCACGGC
+>ds2020-328_886
+GGTCGGGATAGACGAGAAGCCGGGGTGCGCTCTAAACAGGTCTCTTAGCCTGAAGGAAGC
+TGAATTGTTGGGGTACACAAAAATCACAGCGGCTCATCATGTACACTACACAGTGTCTGA
+GGCCGCGGCTTCTGTCCAAAAGGAAAAAAGATCTCTAATACCTAAGGCTCTCCGTCTACC
+ACACGATGCCACAGCGTCTATCCCGACC
+>ds2020-328_887
+GGTCGGGATAGACGTTCGTGCTCCTTCTATGCTCCGGCGGGCTCCGCTTCTGCTTTAGTT
+ATGGAAGCCCTATCTTGATTCTCACCCTTGGTTTGTTTAGTCCTTCTTTCCCGCTGTCGT
+TCTCGGATGAAAGATACGAAAGGTACGGAGTAACTCGACTGGCAAGAGATTTATGGGGTC
+TCCTTCTCTTCTTGGCCGATATTCCACT
+>ds2020-328_888
+GGTCGGGATAGACGTCGAGCAGCCCTCTTCAACGGAGAGTTTGATCCTGGCTCAGGATGA
+ACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGATGATCCCAGCTTGCTGGGGGATT
+AGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTAACTCTGGGATAAGCCTGGG
+AAACTGGGTCTAATACCGGATATGACTC
+>ds2020-328_889
+GGTCGGGATAGACGATTCTTGGTTCTGAAAGAAAGGTCCCGATTCCGGGACGGAGCCGTA
+TGACGCGAGAGTGTCACGTACGGTTTCTTTGAGAAGGGTGTGATACCACCACCTATCAGG
+CCCGACCAGCTGTCCACGGAGCTGCATCCCTACTCACCTGGTCCATGCACATCGCTCTCT
+CCAGCAGGGTTGACCGTCTATCCCGACC
+>ds2020-328_890
+GGTCGGGATAGACGCAGCCCAGTACTTGCTCCACTTCATGCACACAGGCTTCCTGCCTAT
+AAGGCTAGCCTGCCTGAATATCGATGATGATGCTTCAAACACTTCATCATAACTCAGATT
+CGCCAGCCTCGGTTCGGTCCTATTATCCTTCTCGAGTTGCCAGTCTACGTCTCCATCCAC
+ACGGTTGATTATCACGTCTATCCCGACC
+>ds2020-328_891
+GGTCGGGATAGACGATTTCGGGGGCTAGAAGATAGGGAAGGGCAAATGCATAAATTGTGG
+CGTGGCTTATATTCCGGGTGGCGAGGCACTACCTGGATAAACACTGTTCTAAATTTCTGC
+TATGTTCACATAGCGCTGGTGAACCTGGAAAGGATAACAGGGATAAGTGTTGTTTTAATG
+GTAGGCCACGGCGGCGTCTATCCCGACC
+>ds2020-328_892
+GGTCGGGATAGACGATCTCTTCGTCTCGGGTCTACACCCAGCGACTCGACGCCCTGTTCG
+GACTCGGTTTCCCTTCGCCTTCCCTATTCGGTTAAGCTTGCCACTGAATGTAAGTCGCTG
+ACCCATTATACAAAAGGTACGCCGTCACCCGTTTCCAGGCTCCGACTTTTTGTATGCATG
+CGGACCGGCGATTCCGTCTATCCCGACC
+>ds2020-328_893
+TGGTCGGGATAGACGCCAGCAAGCAGTAGGTATGCTTAAAAATGCCGATGCGATGAACGT
+GAGGGCGCAGCCGGCCAAATGTGCATTCGGCGCTGTAGCAGAGTTCCTAAGGGTAGACAG
+ACAGAATGGCGCTAACGCGCAATACCTGCCCAGGGCAATAGCGACTTTGGTCCATTCGAG
+AATAGAAAGCGGTACGTCTATCCCGACC
+>ds2020-328_894
+GCCGTGGACCTAGTCCTGGTTGGGCTAATATACTAGGTCCACGGCAGACAGAGACTCACT
+AGGTCCACGGCAAGAGCAACGCCACTAGGTCCACGGCTCTCTGTCCGGTCGGGATAGACG
+TCAGAAACCTCTGGTCGGGATAGACGCGAGCTTCCCCTGGTCGGGATAGAGTACTCCCCT
+GTTCCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_895
+GGTCGGGATAGACGTCGTCTGCACTGTCCAATCTGTAGGCTACTTTGACATATCCATCTA
+GGGTAGTGTAGTTGACGGGCCCCTCGTCCTCATAAACCATCGCTGCATTGTATACCGCCC
+CGTCTCCACCGACTACTTGTGTGTCGCCGTCGAAACAGATACTCTGATCAGCCGCTACGT
+CCATACAACCTGAGCGTCTATCCCGACC
+>ds2020-328_896
+GGTCGGGATAGACGGGGGGCCTTCTTTCACTCCACACCCCCCATGCACAGGCAACAAAGA
+AAAAGATGAGACTGGGAACATCGACGACCATCGGTGGAACTCTTTTCGGAGGTCCACTTA
+CCCCGGCGGCGGCTTGGGCCCACGACCAGACAAGGTCTACCTGGGCAAAGTACCTCAAAG
+AAACGGACGCCAGTCGTCTATCCCGACC
+>ds2020-328_897
+GGTCGGGATAGACGAATACTGCACCTGGTCGGGATAGACGAACCCAAGCGCTGGTCGGGA
+TAGACCACAGTACCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTAGCGTTGATTGT
+AGGTCCACGGCAGTGAATATCAAACTAGGTCCACGGCAGGTGAGTGGTACTAGGTCCACG
+GCAGGTGTCTAGGTACTAGGTCCACGGC
+>ds2020-328_898
+GGTCGGGATAGACGACCGAGGGCCATCAACGTCTATCCCGACCAGTAGAGTTAGACGTCT
+ATCCCGACCATGTGCTGGCAGCGTCTATCCCGACCGCGTAATTCACGGACAGAGAGCCGT
+GGACCTAGTCGCATCCCAGCTCAGACTAGGTCAGGCAGAGGATCACAGACTAGGTCCACG
+GCAGCGCATAAAGAACTAGGTCCACGGC
+>ds2020-328_899
+GGTCGGGATAGACGGAAAGACTGGGTCCCCGTCTTCCCGACCAGGTTAAAGATACGTCTA
+TCCCGACCATGGGGAAGGCGCGTCTATCCGACCGCCGAATTCACGGACAGAGAGCCGTGG
+ACCTAGTTCTAATCGGGGTATTACTAGGTCCACGGCAGCAAAATAGATACTAGGTCCACG
+GCAGGAGAGCATGTACTAGGTCCACGGC
+>ds2020-328_900
+GCCGTGGACCTAGTACTGTTTCCTGTTCAACGTTCATCGTAGCATGGTGAGTCGGCCCCT
+AAGGCGAGGCAGAGATGCGTAGCTGATGGGAAGCAGGTTAATATTCCTGCACCGTCGTAT
+GATGCGATGGGGGGACGGATCGCGGATGGTTGTCCAGCTGTTGGAATAGCTGGTTCTTGA
+CTCATAGAAGGCGCTTAGGCAAATCCGG
+>ds2020-328_901
+GGTCGGGATAGACGTAATTGAGCAGTAACTTTATCATGCTGAAACAATAAACCAACCTGC
+ACAGTACCCAGAATATACCGTAGAATCCATTTCACAGATTGCCAATGCCCTTTTCCTGGA
+TTATGCACATATCTACTGACAATACTAACAGCTTGTGAAATATCAGGCCTTGTACACACC
+ACAGAGTACAAACTCGTCTATCCCGACC
+>ds2020-328_902
+GGTCGGGATAGACGCTTAACCATGCTATCAATCTTTTTGACCTCCATTGTACCGTTCCCT
+TCCCCCAATATCACTGGTGAAAAGTGATTTTGGTCTCGCAATATTGTTACATTATTCTCT
+TGACTTCCATCATTATAATTAGTAACCCGTCCACTCTCTTTATCTAGCAATCTTAGGCCG
+AACCCCCCATGAGCGTCTATCCCGACC
+>ds2020-328_903
+GGTCGGGATAGACGGTAAAGGAGCGTAGACGAGCGAGTAGAGCCCAGGAAACAGGGAAGC
+CCGTCATAGAGCAGTCGACTAGAAGTAGAAGACTGCTGGCCTGAGAGAAGGCGGCCTCTC
+CCGGGAAACATGGCCCAATTTCTCTTCTTTCTTTTTTATTTCGGGTTTCTTTATTTTTTC
+AGGGGGGGCAGCCCGTCTATCCCGACC
+>ds2020-328_904
+GGTCGGGATAGACGGTTAATCGGTATGTATTTTTCAAATATTTGAGGGATATGATAGGTT
+AGATGCATTTTATGCAGCAATTGTCACCATAATCACTGTTGGTTATGGTGACAAAACTCC
+AAGTTCTAAAGTAGAGGATATACAGATAATTGAGATGGCTTCAAACATGCTTTCTAATTG
+TAGTTAGGTATTTCGTCTATCCCGACC
+>ds2020-328_905
+GGTCGGGATAGACGAACCCCCCCCCCATCTCGTACCGGAACCGAGTTCCAACTGCGAGAC
+GGACTTGCACACTACCCCATCGTATCGTATTTACTGTATTGATTTTCCTACAGACTCGAG
+ATCGTCGTAGTCTGCCGGTGGTCGTATCGTCCCACCGGATAAAATACCGTAAGCTCCTCT
+CACCACGTTTTTGCGTCTATCCCGACC
+>ds2020-328_906
+GGGCGGGATAGACGCCCGGCGGTGATTGCACACTAGCTGGCCCGTGGGGGTAAGAGAGTG
+TTCCGTTGGTGTTCTCAGTCTCAGTGCGACCTTGCTTGGTCAACAAGGGGATCAAAATGT
+CCCCCATCAATAAAGTGAGGGCTTTCCGGACCTTCTCCACCTCCCTTTTTCTTTTTTTTC
+CATGCTTTCCGTCCGTTTATCCCGACC
+>ds2020-328_907
+GGTCGGGATAGACGCCGGGTGAAGCTAACTTTGCAGCACAATTATCCTCATGCATACAGA
+ACTGTAGAAGCTTACAGAGGTACCAACTACCGGTAAAATGGTATACAGATTTATTTAGGA
+CGGTAGGATCCGCGGCTTGTGAGGCGATGTGCTATCAGCAGTGGCGGCGATAAAGACCTA
+TAGTGGAGGCAGCCGTCTATCCCGACC
+>ds2020-328_908
+GGTCGGGATAGACGATGTTAAGTGCTGGCTGTTGAAGTCCTCAAAGTCTAGACAATATGG
+CAACCTATTCTTCAAGACACCCGCCACTCTGTTTACTACATTTCTGTCGTTTGCGTCTTT
+ACCTACCGGGAATCTGTTCGGCAAGACGTTCTCGCAATTGTAGAACGCGAAGTTTGCAAG
+TACGTAACTCGTTCGTCTATCCCGACC
+>ds2020-328_909
+GGTCGGATAGACGGGCGGCTGGTATCGTCCATTCTTACACCCTCGACACCAACTAAGAGT
+TTTTCTTATACTTGCGAAAAACTCAAAGAATTTGAAAATTTCGGTGTTCCTTCCCATGTC
+AATCATCGTGGTACCAGTGTCAGATATGTTCCGTTCATTGAACAAATCACCTGGACCTAC
+TACTGCCCCCATGCGTCTATCCCGACC
+>ds2020-328_910
+GCCCGGGATAGACGAGGAGGTGATATTGACGCCGATGGATATAGGTTTCTTGGGAGAGTC
+AACGGTAGGTATAGAAGTAAAGCACGAAGAAATGAATTATAGGTATGTTAGATTGGATTT
+TGTGACAATAAGAACGCCAAAAATAATGGCAACTGTTGGTGCAAATATATCGGGTAATAT
+AAGGGCCAGGCGTCGTCTATCCAGACC
+>ds2020-328_911
+GGTCGGGATAGACGTTACACGTCACTCCGCTAATAGCAGCAACACCTGATAGTGCTTCAA
+TGCAAAACGGCAGCCCGAAGGCTGCCGTTTTTGTATCCATTTCTGATATTCGCTGAAGCG
+CTTTATCTCAACTCATCCCGTCAACTATGACCGCAATTTTTGCCTTCCACAAGGTAAATC
+TCATCTCTTCCTACCGTCTATCCCGCC
+>ds2020-328_912
+GGTCGGGATAGACGGTTACCACCCCTGGTCGGGATAGACGCCCACCGTGGCTGGTCGGGA
+TAGACGTCTATCCTCCCTGGTCGGGATAGCCAAATCTTACGTCTATCCCTCGGACAGAGA
+GCCGTGGACCTAGTTGGAGCTCACTTGGTCCACGGCAGTGTGTCACAGACTAGGTCCACG
+GCCCCAATTGCAGACTAGGTCCACGGC
+>ds2020-328_913
+GGTCGGGATAGACGCTTGCTCCCCTGGTCGGGATAGACGTACTTGCGGCCTGGTCGGGAT
+ATACGTTAAAGCCGTCTATCCCGTCGGACAGAGAGCCGTGGACCTAGTTCTAAGCGCCTG
+CCGTGGACCTGGTCGTGCGCTTCATGCCGTGGACCTAGTCAACAATCAGCTGCCGTGGAC
+CAAGTCATCAAGTACTAGGTCCACGGC
+>ds2020-328_914
+GGTCGGATAGACGATACATGTGGCTGCGTCTATCCCGACCAAGGGTTGGAGCCGTCTATC
+CCGACCGCCGTATTCACGGACAGAGAGCCGTGGACCTAGTATATAAACCCCTGAGATACT
+AGGTCCCGGCAGCATGTTACGTACTAGGTCCACGGCCCCCTACCTACACTAGGTCCACGG
+CAGGGGGCGTAGAACTAGGTCCACGGC
+>ds2020-328_915
+GGTCGGGATAGACGGATAGACGATGTCCAGGGGTGATTGTCGTCTATCCCGACCCCCGAA
+GTGATCGTCTATCCCGACCGCCACGGACAGAGAGCCGTGGACCTAGTAAGGATAGTACTA
+GGCCACGGCAGACTTAATTGCACTAGGTCCACGGCACGATAGCGGGAACTAGGTCCACGG
+CAGGCATTCAACGACTAGGTCCACGGC
+>ds2020-328_916
+GGTCGGGATAGACGAAACGCAATCATGTCTATCCCGACCAGGTGTTCTAACCGTCTATCC
+CGACCGCCGTAATTCCGGACAGAGAGCCGTGGACCTAGTCGCATTGTCTCTGCCGTGGAC
+CTAGTCACTCAAAGGGTTAATAACTAGGTCCACGGCAGGTCGGTGATACTAGGTCCACGG
+CACCCCCGACACAACTAGGTCCACGGC
+>ds2020-328_917
+GGTCGGGATAGACGATTTGGAGTTGTCTATCCCGACCAGGGAGATTCCTCGTCTATCCCG
+ACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTGGGTAGTGGCTGCCGTGGACC
+TAGTAACGCTCACCGTGCCGTGGACCTAGTGATCTGTGCGGTGCCGTGGACCTAGTCCTC
+CAGCAGCAGGCGAACTAGGTCCACGGC
+>ds2020-328_918
+GCCGTGGACCTAGTCTCCAACTGTCTGCCGTGGACCTAGTTCTCATACCCCTGCCGTGGA
+CCTAGTTTAGATTCCCTGCCGTGGACCTATTGAAATGGTGGTATTACTAGGTCCACGGCT
+CTCTGTCCGAGAATTACGGCGGTCGGATAGACGGTAACCCAACCTAACGTCTATCCCGAC
+CAGAGGGTGTTTTCGTCTATCCCGACC
+>ds2020-328_919
+GGTCGGGATAGACGCGCTTGGGTACTGGTCGGGATAGACGGTGTAGCCCCCTGTCGGGAT
+AGACATAGCTGCGTGTTTCGTCTATCCCGACCGCCGTAATTCCCGGACAGAGAGCCGTGG
+ACCTAGTTAAGACTACTCTGCCGTGGACTTAGTTTCTTCACGGGGCCGTGGACCTAGTAT
+CTCCCCTGCTACAACTAGGTCCACGGC
+>ds2020-328_920
+GGTCGGGATAGACGGGGGATTTAAATTTTAATTAGCATCAAGACGAACATTCCGAGGTCG
+CACCCCCCCGTCTTACTGTAGCAGGCATGGCAAACCTGACCCGTTTACGCACGCTTGTTA
+CGTCCGGTGAGCTCGAGGTGGTGTCAGCCGCAGCTGTTCTCTTCCACCTTTCTCGGAATC
+CAACCCTACATGACGTCTATCCCGACC
+>ds2020-328_921
+GGTCGGGATAGACGCCCACTCCGCATCTATCGTTCCAGAAATTTTCCCATGTATATATCT
+CCGGCCGCCCGCCCATACCCCTAAGTGTTTTGAAAAGCTGTTTTATGATTTCATACATCT
+GAGATTGGTCGACTTTTGCTAATTCTGGTTTTGTTCTGTTTATTTTTTCTTGATTCCAAT
+CTATGCCCCCGACTCCCCTATTAACT
+>ds2020-328_922
+GAGTGGCTGCCGTGGACCTAGTCAGTAAACCGGGCCGTGGACCTAGTCGCCGCTTACCTT
+ACATTGACCGAACCTTTACTGCACCTCGCACTCACTCTCACAATGCCCCCCTCGCCCCTC
+TTTCTTACCACACGGAAAGAACTCGCCCTAATCCACCCCCACCCTCCACGAGTACTTCTT
+AAACTACTCCCATCGACTTCCCGACC
+>ds2020-328_923
+GGTCGGGATAGACGACCGTTACCCCTGTTGAAGATCTCTATCGATAGAGCATCAGCACTG
+ATAGGATGCTCGGGCATCCTCATTAACCGTTTTCTTCGGAAAATGGAACGGAATTTTCAA
+TTCTTCTCTTTTAAGGGTATACACCCGCTCTTTGGAGTTCGAATTCCAAAGTTAAGATGT
+ATTCCTTCTGTGGAGTCTTCCAACAT
+>ds2020-328_924
+GGTCGGGATAGACGGGCCCCCCTACGCTGGCGAATGCCCCCTTTCTCTTCTCTGAAGTCT
+ACAACAAGTGGGCGAGGCAGGATTCGAACCTACGTAGAAAAACTTCAACAGATTTACAGT
+CTGTCGCTTTTGACCGCTCGGCCACTCTCCCCTTCCCGGGCTGAGGCCCCCTCACTGGGT
+TCTAAGAAGGGGGCGCCGCCCTGAAT
+>ds2020-328_925
+AACCTGATGCCGCATGGAAGTTTCACAGTAGGCTGGGTAAATGTAACCAAAACTGAAGAT
+GAGAGGATTAAAGTTGAGCAAAAAAGAATCTCAAAACACATAAGGTTAACGCATGATTGT
+AACAAAAAACCAGGGACTAATTTGAGATCAGGTAGACAGGAAAGATTTGGACCAGAGGAA
+AAGTCAAGTAACCGTCTATCCCGACA
+>ds2020-328_926
+GGTCGGGATCGACGTTAAGCACCCCTGCTCTTGCATATGCCCTGGTGGAGTCCATGTCCT
+TAGGCGGCACCGGTGGCATACTCACACTTACACTATTAGCTGCGTATATTTTATGTACCC
+CAGTTCGCAGCGGGTGTAAATATTTTAGATTATGCCCATTCCACCTCATAACTGTCCCCA
+AAGCCCACAAGTCGTCTATCCCGACC
+>ds2020-328_927
+GGTCGGGATAGACGTGTCATGATTTTATGAAAGTAGGTTTGAATGAATTCCGCTCTTTGA
+TTTTGGTCTTTCAACGGGCCCTACAAGCTCATGTGTCAATTCTTCGCATTTTAAACCAAT
+TTATAGTGACCAAGAAAGACCAAAATCAAAGAGCGGAATTCATTCAAGCCTACTTACTTT
+TTACCTAACCAACGTCTATCCCGACC
+>ds2020-328_928
+TGGCCGGGATAGACGTGGAGCCGCCCTTTACTTGGATCTGGATCCCATCCCTAGCTCGTA
+AAGCTTGATTCCAGTTCCGTGTAGTCAGGGTGGTGCTTTTGGCCTTTACGCTCTGGTTGG
+TAATCGCGGTTGCTGCCCCTAGCCACTGACTATTCTTATTTAAGTAAGCCTACCCAGTTT
+AATCCCCCCAGGCGTCTATCCCGACC
+>ds2020-328_929
+TGAATTACGGCGGTCGGGATAGACGCCCCTTTCGCCTGGTCGGGATAGACGATAAATTTG
+GGGGTCGGGATAGACGGGACTACCATTATTCGTCTATCCCTGTCCACTCCAACCTGCCGT
+GGACCTAGTTCGCTGTAGCCTGCCGTGGACCTAGTCAATGAGTCCCTGCCGTGACCTAGT
+AGATTGATCATTACTAGGTCCACGGC
+>ds2020-328_930
+GCCGTGGACCTAGTCTATACCCCCTGCCGTGGACCTAGTTCGATGGCCGCTGCCGTGGAC
+CTAGTGGAAGGGGGATGGGCACTAGGTCCACGGCTCTCTGTCCGAATACGGCGGTCGGGA
+TAGACGTATTGATTCCCTGGTCGGGATAGACGTGGTCTTTCACTGGTCGGGTAGACGATT
+ATCAGGGTTCGCCGTCTATCCCGACC
+>ds2020-328_931
+GGTCGGGATAGACGGAATCCCCTCGGTCGGGATAGACGTTAATTCGCATGGTCGGGATAG
+ACTGGTGAGCTGCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTGGTCAAACCCGTGC
+CGTGGACCTAGTTACTGAATTGCTGCCGTGGACCTAGTAGGTGAGATACTAGATCCACGG
+CAGGGATCACAGACTAGGTCCACGGC
+>ds2020-328_932
+GGTCGGGATAGACGTATCCGATCGGTCCTTGTAACACTTCAGTTTCAAATATATCTTTAA
+CGAAATAACCTTCTTTAGTTAAATTATCGTTTTCCCACCCTTTATTCTTGCGATATGAAT
+TGGGAATGAACTTCCAAATTCTCATTTTATGATGAAACCTGTTTTCCGTATTTGCATTTA
+AGCCTGTTGTGGCGTCTATCCCGACC
+>ds2020-328_933
+GGTCGGGATTAGTATTGAACCTAGATAAATGTTATCAGGTGCCTACATTGAGCATGAATA
+TGATTATATCATGTTCATTGCAACACGGTCATTCATTTAAGTTAGAGAATAATGGTTATT
+CTGTTTACATGAATGATACCTTTCATGGTCATGCACCCTATGTGAATGGTTCATTGAATC
+TCGGTCGTGGTAAGAGGTTTCGCATC
+>ds2020-328_934
+GGTCGGGCTAGACGATCGAGAGTAGTCTGATTATGGGAACCGAGGCCGGCTACTGTGACG
+CAGCTAATGGTACGCTTATCCAAAAGGCAGGGGTAGCCCGAGAATGCCGCTCCCCCTTGA
+CCGTAAGCTGGTTGTCCCGTGTTATCCATATTTTGGGAAAGGGTTCGATCCCCATCGTCG
+ATGGTAAGCACTCGTCTATCCCGACC
+>ds2020-328_935
+TTCCCCTCCCGTTTGCGGCACTTAACATGAATGTAGTGCTGATAGAGGTTTCGATGAAGT
+CTAAGAAGTCCACCATCGACGAACCAGTATAATCAGAATCCACATGATGATAAATCTCCT
+TCATGTAATCTTTCCACGAAGCAATTGCACCTTTAGTATTCCAAGGCCTGAACCATTCAA
+ACATAACAGAATCGTCTATCCCGACC
+>ds2020-328_936
+TTTTAACTGCAACAACTTAAATATACGCTATTGGAGCTGGAATTACCGCGGCTGCTGGCA
+CCAGACTTGCCCTCCAATGGATCCTCGTTAAGGGATTTAGATTGTACTCATTCCAATTAC
+CAGACTCGATGAGCCCAGTATTGTTATTTATTGTCACTACCTCCCCATGTCAGGATTGGG
+TAATTAGTGGCGGCCGTT
+>ds2020-328_937
+TTCCTCACCACACTCCAAGCTTCTCTCCTGCCTGTTCCTCACCACACTCCAAGCTCCTCT
+CCAAGCCTGTTCCTCACCACATAAGACCGTCTATCCCGACCAGGGAATATGCTCGTCTAT
+CCCGACCCCCGTCTATCGTCTATCCCGACCGCCGTAATTCAGATC
+>ds2020-328_938
+GGTCGGGATAGACGAACACATTCCCTGGTCGGGATAGACGTTGCAATACGCTGGTCGGGA
+TAGACACGACTTGTTCTCGTCTATCCCCACCAGCGTATTGCAACGTCTATCCCGACCAGG
+GAATGTGTTCGTCTATCCCGACC
+>ds2020-328_939
+TACTCTCAGTACAATCTGCTCTGATGCCGCATAGTTAAGCCAGCCCCGACACCCGGGTCG
+GGATAGACGAATCTTCGCCCTACTCTCAGTACAATCTGCTCTGATGCCGCATAGTTAAGC
+CAGCCCCGACACCCG
+>ds2020-328_940
+ACCACTCAATTTATCGTCTATCCCGAAGTGTGAAAACCCGTCTATCCCGACCAGTGTGCC
+ACGACGTCTATCCCGACCACCACTCAATTTATCGTCTATCCCGAAGTGTGAAAACCCGTC
+TATCCCGACCAGT
+>ds2020-328_941
+TTATTCCCGACCTGCCGTGGACCTAGTCACTCACCCGGTGCCTGACCTAATCCTCTCTGC
+ACTGCCGTGGACCTAGTTATTCCCGACCTGCCGTGGACCTAGTCACTCACCCGGTGCCTG
+ACCTAATCCTC
+>ds2020-328_942
+GAATGGAGGTACTGAATGACTAGGTCCCGGCAAGCATGATATCAACGGGGATGTTCCTAT
+ATTCATTAACATTGGTGAATGGAGGTACTGAATGACTAGGTCCCGGCAAGCATGATATCA
+ACGGGGATGTT
+>ds2020-328_943
+AGTAAACTGGTGGCTTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTAGGGGT
+GCTTGGGTGGTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTG
+GTGAAGGTGA
+>ds2020-328_944
+CGTTCCACTGGTCGGGATAGACGATGATGTTTGCTGGTCGGATAGACATTCACCGGGTCG
+GGATAGACGCTACGTTCCACTGGTCGGGATAGACGATGATGTTTGCTGGTCGGATAGACA
+TTCACCG
+>ds2020-328_945
+CTGACCCCTGCCGTGGACCTATTTGTCAATCGCTGCCTGGACCTAGATCTTGTCGGCCGT
+GGACCTAGTAACCTGACCCCTGCCGTGGACCTATTTGTCAATCGCTGCCTGGACCTAGAT
+CTTGTCG
+>ds2020-328_946
+TCCACGGCCGTCGAATTAGGCCACGGCAGGCGTTTAATGACTAGGTCCACGGCAGGGGAA
+TGTATACTAGGTCCACGGCCGTCGAATTAGGCCACGGCAGGCGTTTAATGACTAGGTCCA
+CGGCAG
+>ds2020-328_947
+CTCCTCCACCACCCTCACCATCACCACCCAAGCATCCTTACCACTACAAGTCTCCACCAC
+CACCCTCACCTTCACCACCCAAGCACCCCTACCACTACAAGTCTCCACCACCACCATCAC
+>ds2020-328_948
+GCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGATTCC
+CTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCC
+>ds2020-328_949
+CCCTGCCGTGGACCTAGTTCCTTTCCACCTGCCGTGGACCTAGTAGAGTTGCCCCTGCCG
+TGGACCTAGTTCCTTTCCACCTGCCGTGGACCTAGTAGAGTTGCCCC
+>ds2020-328_950
+TTCTTCGATGATGCGCAAATTGAAGCTTCGGTACCCTTGTTTTTTCCAATCGCCCAATTT
+CTCTTCTTTCTTTTTTATTTCGGGTTTCTTTATTTTTTCAGGGGGG
+>ds2020-328_951
+AACCAAGAGCGCTTTTTCTTTCCATTCGCCTGGGACAAGGCCTCCCATCACGCTTCCATT
+GAAGAGTTAATCCTTCAAGTAGCGGTGGTGCACCCTGCCTGTACT
+>ds2020-328_952
+TGGAGTGATGGTGGCTTGTATGGTTTCTTAGGTGGTAGGGGTGGTGAGTAAACTGGTGGC
+TTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTA
+>ds2020-328_953
+AGCTTGGAGTGTGGTGAGGAACAGGCAGGAGAGAAGCTTGGAGTGTGGTGAGGAACAGGC
+AGGAGAGAAGCTTGGAGTGTGGTGAGGAA
+>ds2020-328_954
+GCTTAGGTGGTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTATGGGTGCTTAGGTG
+GTGAAGGTGATGGTGGTGGTGGAG
+>ds2020-328_955
+GATTGATTTCTTGTTTATTGGCGTCAGTGGTGAGGTTTGACACCATGTGTTTGAAGGAGG
+GATCGTGTGCGTCTATCCCGACC
+>ds2020-328_956
+CGTCTATCCCGACCAGCGATTGTGACCGTCTATCCCGACCAGGGCACTGCCACGTCTATC
+CCGACCGCCGTAATTCAGATC
+>ds2020-328_957
+TCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGG
+GCTTGCTAAAGAGGCTCGAA
+>ds2020-328_958
+TGAATTACGGCGGTCGGGATAGACGAGCTAAACGCCTGGTCGGGATAGACGAACGTATTC
+TCTGGTCGGGATAGACG
+>ds2020-328_959
+GGAACACCAGTGGCGAAGGAAGGAACACCAGTGGCGAAGGAAGGAACACCAGTGGCGAAG
+GAAGGAACACCAGTGG
+>ds2020-328_960
+GAATTACGGCGGTCGGGATAGACGCGAAGCACCGGTGGTCGGGATAGACGGCCGACCCCC
+TTGGTCGGGATAGACG
+>ds2020-328_961
+TGGATTACGGCGGTCGGGATAGACGTTGACCGTGCCTGGTCGGGATAGACGAGTGAACCG
+CTGGTCGGGATAGACG
+>ds2020-328_962
+TGAATTACGGCGGTCGGGATAGACGCCAATCGCCCCTGGTCGGGATAGACGCAATACCAC
+CCTTCGGGATAGACG
+>ds2020-328_963
+CGTCTATCCCGACCAGGTCCCATTTTCGTCTATCCCGACCAAGGCTAAATGACGTCTATC
+CGCCGCCGTAATTCA
+>ds2020-328_964
+GAATTCGGCGGTCGGGATAGACGAAAGGAGCGGGGGTCGGGATAGACGATTGCTTGCCTT
+GGTCGGGATAGACG
+>ds2020-328_965
+TTAGACGTCTAGTGTCCCTGGTCGGGATAAACGGGGCAAATCGTCTATCCCGACCAGGGA
+CACTAGACGTCTAT
+>ds2020-328_966
+TCTATCCCGACCAGGGAAATACACCGTCTATCCCGACCAGGAGCGGGGTTCGTCTATCCG
+ACCGCCGAATTCA
+>ds2020-328_967
+AGGTAGTTTACTTGCTTACTTGTTAGAGTAAGGAAGAGAGGAAAAGGGTGCTGTCGTCTA
+TCCCGACCC
+>ds2020-328_968
+GTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGAAGGTGATGGTG
+GTGGTGGAG
+>ds2020-328_969
+CGTCTATCCCGACCAACGTCTATCCCGACCAGTGGTATTAATCGTCTATCCCGACCGCCG
+TAATTCA
+>ds2020-328_970
+GGTCGGGATAGACGCCGCGGTATCCTGGTCGGGATAGACGGTAATATTGCCTGGTCGGGA
+TAGACG
+>ds2020-328_971
+GGTCGGGATAGACGAGATAATTACCTGGTCGGGATAGACGTCATGAGTCCCTGGTCGGGA
+TAGACG
+>ds2020-328_972
+CGTCTATCCCGACCAGGCGGTGTATACGCCAATCCCGACCAGGGGGTTAGGGCGTCTATC
+CCGACC
+>ds2020-328_973
+GGTCGGGATAGACGGAACATGACGCTGGTCGGGATAGACGACATAGACCCCTGGTCGGGA
+TAGAC
+>ds2020-328_974
+TTCGAGCCTCTTTAGCAAGCCCCTCTTCGAGCCTCTTTAGCAAGCCCCTCTTCGAAAGAT
+TCTTT
+>ds2020-328_975
+GGTCGGGATAGACGATCACACCCTGGTCGGGATAGACGCACGAACAGGCTGGTCGGGATA
+GACG
+>ds2020-328_976
+AGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGAT
+GTCA
+>ds2020-328_977
+CGTCTATCCCGACCAGGGGCAAATTGCGTCTATCCCGACCAAATCCTTCGTCTATCCCGA
+CCG
+>ds2020-328_978
+GTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAG
+GTC
+>ds2020-328_979
+GGTCGGGATAGACGGATGGACTCGTGGTCGTGATAGACGTTTCCCAGTCTGTCGGGATAG
+ACG
+>ds2020-328_980
+TCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCAC
+TT
+>ds2020-328_981
+CATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATA
+CG
+>ds2020-328_982
+GGTCGGGATAGACGAACAAAGACACTGGTCGGGATAGACGCTCGATACTACTGGTCGGGA
+TA
+>ds2020-328_983
+TTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGG
+T
+>ds2020-328_984
+GTGGTGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGGGGAG
+>ds2020-328_985
+CATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCAT
+>ds2020-328_986
+TTCCGATCTGAATTACGGCGGTCGGGATAGACGATAGCCACCACTGGTCGGGATAGACG
+>ds2020-328_987
+GTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTG
+>ds2020-328_988
+GGTCGGGATAGACGCATGCATTGTCTGGTCGGGATAGACGGCGCGCTGCACTGTCGG
+>ds2020-328_989
+GGTCGGGATAGACGTTAGCACCCACTGGTCGGGATAGACGAGACAGTTAGCTGGTCG
+>ds2020-328_990
+GGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG
+>ds2020-328_991
+GGTCGGGATAGACGTAGACAGCCCCCGGTCGGGATAGACGTTAATTTCTGCTGGTC
+>ds2020-328_992
+GGTCGGGATAGACGATTATGCTCTCTGGTCGGGATAGACGTGTGACTCCCCTGGTC
diff --git a/tools/virAnnot/test-data/otu_s2_rps.tab b/tools/virAnnot/test-data/otu_s2_rps.tab
new file mode 100755
index 00000000000..a1e48c88fba
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s2_rps.tab
@@ -0,0 +1,149 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom no rank family genus
+"ds2020-328_1" "2975" "pfam00006" "gnl|CDD|376291" "6.25354e-106" "1359" "2033" "-1" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_1" "2975" "pfam00306" "gnl|CDD|366015" "1.33353e-53" "1008" "1340" "-1" "pfam00306, ATP-synt_ab_C, ATP synthase alpha/beta chain, C terminal domain. " "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "(0.08);Mycoplasmataceae(0.08);Clostridiaceae(0.06);Ruminococcaceae(0.03);Eubacteriaceae(0.02);" "Mycoplasma(0.07);(0.07);Clostridium(0.05);Eubacterium(0.02);Faecalibacterium(0.01);"
+"ds2020-328_1" "2975" "pfam02874" "gnl|CDD|367225" "8.80807e-19" "2202" "2405" "-1" "pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella." "Bacteria(0.60);Eukaryota(0.28);Archaea(0.13);" "(1.00);" "Spirochaetaceae(0.04);Bacillaceae(0.04);Schizosaccharomycetaceae(0.03);Chlamydomonadaceae(0.03);Sulfolobaceae(0.03);" "Treponema(0.04);Schizosaccharomyces(0.03);Chlamydomonas(0.03);Bacillus(0.03);Thermotoga(0.02);"
+"ds2020-328_10" "1434" "pfam17917" "gnl|CDD|375428" "1.68574e-20" "187" "453" "-1" "pfam17917, RT_RNaseH, RNase H-like domain found in reverse transcriptase. DNA polymerase and ribonuclease H (RNase H) activities allow reverse transcriptases to convert the single-stranded retroviral RNA genome into double-stranded DNA, which is integrated into the host chromosome during infection. This entry represents the RNase H like domain." "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_10" "1434" "pfam00078" "gnl|CDD|365856" "1.48081e-05" "920" "1051" "-3" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_101" "454" "pfam14111" "gnl|CDD|372914" "8.33283e-09" "213" "353" "3" "pfam14111, DUF4283, Domain of unknown function (DUF4283). This domain family is found in plants, and is approximately 100 amino acids in length. Considering the very diverse range of other domains it is associated with it is possible that this domain is a binding/guiding region. There are two highly conserved tryptophan residues." "Eukaryota(1.00);" "(1.00);" "Salicaceae(0.35);Brassicaceae(0.27);Poaceae(0.13);Vitaceae(0.08);Solanaceae(0.06);" "Populus(0.35);Brassica(0.13);Arabidopsis(0.11);Brachypodium(0.10);Vitis(0.08);"
+"ds2020-328_106" "446" "pfam01348" "gnl|CDD|279664" "1.08017e-09" "40" "303" "-3" "pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.40);Brassicaceae(0.20);Schizosaccharomycetaceae(0.20);Poaceae(0.20);" "Saccharomyces(0.40);Hordeum(0.20);Schizosaccharomyces(0.20);Baimashania(0.20);"
+"ds2020-328_109" "442" "pfam02123" "gnl|CDD|280316" "1.59804e-23" "115" "429" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_113" "433" "pfam00253" "gnl|CDD|376307" "1.11487e-07" "329" "415" "2" "pfam00253, Ribosomal_S14, Ribosomal protein S14p/S29e. This family includes both ribosomal S14 from prokaryotes and S29 from eukaryotes." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "(0.08);Clostridiaceae(0.02);Mycoplasmataceae(0.02);Lactobacillaceae(0.02);Saccharomycetaceae(0.02);" "(0.03);Clostridium(0.02);Lactobacillus(0.02);Mycoplasma(0.02);"
+"ds2020-328_115" "426" "pfam00078" "gnl|CDD|365856" "4.24722e-08" "268" "405" "-1" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_115" "426" "pfam17919" "gnl|CDD|375430" "4.69948e-06" "13" "81" "-1" "pfam17919, RT_RNaseH_2, RNase H-like domain found in reverse transcriptase. " "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_118" "424" "pfam00665" "gnl|CDD|366234" "6.81632e-21" "93" "413" "3" "pfam00665, rve, Integrase core domain. Integrase mediates integration of a DNA copy of the viral genome into the host chromosome. Integrase is composed of three domains. The amino-terminal domain is a zinc binding domain pfam02022. This domain is the central catalytic domain. The carboxyl terminal domain that is a non-specific DNA binding domain pfam00552. The catalytic domain acts as an endonuclease when two nucleotides are removed from the 3' ends of the blunt-ended viral DNA made by reverse transcription. This domain also catalyzes the DNA strand transfer reaction of the 3' ends of the viral DNA to the 5' ends of the integration site." "Bacteria(0.76);Viruses(0.14);Eukaryota(0.09);Archaea(0.01);" "(0.86);Ortervirales(0.12);Inoviridae(0.03);" "Retroviridae(0.12);Mycobacteriaceae(0.09);Streptococcaceae(0.08);Enterobacteriaceae(0.06);Burkholderiaceae(0.05);" "Mycobacterium(0.09);Streptomyces(0.05);Escherichia(0.05);Burkholderia(0.04);Sinorhizobium(0.04);"
+"ds2020-328_124" no_hit
+"ds2020-328_136" "372" "pfam02123" "gnl|CDD|280316" "8.1339e-10" "160" "363" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_15" "1120" "pfam00146" "gnl|CDD|376297" "8.26121e-18" "936" "1097" "-3" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_153" "353" "pfam01385" "gnl|CDD|366606" "1.33121e-13" "52" "330" "-3" "pfam01385, OrfB_IS605, Probable transposase. This family includes IS891, IS1136 and IS1341. DUF1225, pfam06774, has now been merged into this family." "Bacteria(0.57);Archaea(0.38);Viruses(0.05);" "(0.95);Bicaudaviridae(0.05);" "Sulfolobaceae(0.19);Mycobacteriaceae(0.10);Thermoproteaceae(0.10);Synergistaceae(0.05);Halorubraceae(0.05);" "Caldivirga(0.10);Mycobacterium(0.10);Saccharolobus(0.10);Sulfurisphaera(0.05);Synechocystis(0.05);"
+"ds2020-328_154" "351" "pfam00146" "gnl|CDD|376297" "1.33812e-16" "131" "331" "-3" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_170" "343" "pfam02123" "gnl|CDD|280316" "1.56034e-16" "85" "330" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_172" "338" "pfam02123" "gnl|CDD|280316" "9.08289e-09" "87" "305" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_176" "336" "pfam00361" "gnl|CDD|366050" "7.24395e-08" "101" "256" "-3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_177" "335" "pfam00346" "gnl|CDD|366043" "6.6413e-32" "147" "314" "3" "pfam00346, Complex1_49kDa, Respiratory-chain NADH dehydrogenase, 49 Kd subunit. " "Bacteria(0.80);Eukaryota(0.11);Archaea(0.09);" "(1.00);" "(0.06);Rhodobacteraceae(0.02);Acetobacteraceae(0.02);Campylobacteraceae(0.02);Rhodospirillaceae(0.02);" "(0.01);Geobacter(0.01);Campylobacter(0.01);Archaeoglobus(0.01);"
+"ds2020-328_188" no_hit
+"ds2020-328_193" "321" "pfam03040" "gnl|CDD|367312" "3.21306e-19" "69" "296" "3" "pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally." "Bacteria(0.77);Eukaryota(0.23);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.08);Microcoleaceae(0.06);Chlorellaceae(0.04);Merismopediaceae(0.04);" "Synechococcus(0.13);Oscillatoria(0.04);Physcomitrella(0.04);Microcystis(0.04);Synechocystis(0.04);"
+"ds2020-328_196" "318" "pfam02123" "gnl|CDD|280316" "1.94206e-07" "6" "284" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_197" "318" "pfam03154" "gnl|CDD|367360" "8.39525e-05" "24" "158" "-2" "pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity." "Eukaryota(1.00);" "(1.00);" "Muridae(0.20);Coelacanthidae(0.20);Characidae(0.20);Cyprinidae(0.20);Cichlidae(0.20);" "Rattus(0.20);Danio(0.20);Astyanax(0.20);Oreochromis(0.20);Latimeria(0.20);"
+"ds2020-328_199" "316" "pfam13650" "gnl|CDD|379313" "2.17852e-11" "2" "229" "-1" "pfam13650, Asp_protease_2, Aspartyl protease. This family consists of predicted aspartic proteases, typically from 180 to 230 amino acids in length, in MEROPS clan AA. This model describes the well-conserved 121-residue C-terminal region. The poorly conserved, variable length N-terminal region usually contains a predicted transmembrane helix." "Bacteria(0.81);Eukaryota(0.17);Archaea(0.02);" "(1.00);" "Flavobacteriaceae(0.06);Bacteroidaceae(0.06);Rhizobiaceae(0.05);Caulobacteraceae(0.05);Cytophagaceae(0.04);" "Bacteroides(0.06);Geobacter(0.02);Phenylobacterium(0.02);Agrobacterium(0.02);Spirosoma(0.02);"
+"ds2020-328_207" "313" "pfam02123" "gnl|CDD|280316" "1.55736e-08" "34" "306" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_210" "311" "pfam00124" "gnl|CDD|365890" "2.92409e-39" "14" "283" "2" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-328_219" "306" "pfam07727" "gnl|CDD|369488" "2.43458e-28" "22" "285" "-1" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_222" "304" "pfam00471" "gnl|CDD|376336" "2.61553e-13" "31" "201" "-2" "pfam00471, Ribosomal_L33, Ribosomal protein L33. " "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "(0.07);Mycoplasmataceae(0.07);Clostridiaceae(0.06);Bacillaceae(0.03);Lactobacillaceae(0.03);" "Mycoplasma(0.06);Clostridium(0.05);(0.04);Lactobacillus(0.02);Bacillus(0.02);"
+"ds2020-328_226" "300" "pfam02123" "gnl|CDD|280316" "5.93549e-06" "76" "276" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_229" "299" "pfam02123" "gnl|CDD|280316" "2.23217e-17" "58" "276" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_235" "295" "pfam00006" "gnl|CDD|376291" "7.80612e-20" "51" "284" "3" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_241" no_hit
+"ds2020-328_244" "292" "pfam01737" "gnl|CDD|366779" "1.98587e-12" "60" "224" "3" "pfam01737, Ycf9, YCF9. This family consists of the hypothetical protein product of the YCF9 gene from chloroplasts and cyanobacteria. These proteins have no known function." "Bacteria(0.76);Eukaryota(0.24);" "(1.00);" "Synechococcaceae(0.15);Prochloraceae(0.09);Phaeodactylaceae(0.06);Bathycoccaceae(0.03);Poaceae(0.03);" "Synechococcus(0.12);Prochlorococcus(0.09);Phaeodactylum(0.06);Stanieria(0.03);Acaryochloris(0.03);"
+"ds2020-328_249" "290" "pfam00115" "gnl|CDD|376293" "5.40542e-13" "18" "248" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_251" "288" "pfam02123" "gnl|CDD|280316" "1.42582e-09" "22" "270" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_26" "872" "pfam01443" "gnl|CDD|366646" "1.90681e-33" "10" "699" "-3" "pfam01443, Viral_helicase1, Viral (Superfamily 1) RNA helicase. Helicase activity for this family has been demonstrated and NTPase activity. This helicase has multiple roles at different stages of viral RNA replication, as dissected by mutational analysis." "Viruses(1.00);" "Riboviria(0.99);unclassified viruses(0.01);" "Alphaflexiviridae(0.36);Virgaviridae(0.24);Betaflexiviridae(0.15);Tymoviridae(0.10);Bromoviridae(0.07);" "Potexvirus(0.26);Allexivirus(0.10);Tymovirus(0.08);Carlavirus(0.08);Tobamovirus(0.08);"
+"ds2020-328_272" "281" "pfam00253" "gnl|CDD|376307" "1.57301e-14" "125" "256" "2" "pfam00253, Ribosomal_S14, Ribosomal protein S14p/S29e. This family includes both ribosomal S14 from prokaryotes and S29 from eukaryotes." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "(0.08);Clostridiaceae(0.02);Mycoplasmataceae(0.02);Lactobacillaceae(0.02);Saccharomycetaceae(0.02);" "(0.03);Clostridium(0.02);Lactobacillus(0.02);Mycoplasma(0.02);"
+"ds2020-328_273" "280" "pfam13976" "gnl|CDD|372857" "1.39388e-05" "38" "160" "-1" "pfam13976, gag_pre-integrs, GAG-pre-integrase domain. This domain is found associated with retroviral insertion elements and lies just upstream of the integrase region on the polyproteins." "Eukaryota(1.00);" "(1.00);" "Vitaceae(0.49);Poaceae(0.30);Brassicaceae(0.11);Trichocomaceae(0.02);Fabaceae(0.01);" "Vitis(0.49);Oryza(0.28);Arabidopsis(0.10);Talaromyces(0.02);Zea(0.02);"
+"ds2020-328_285" "275" "pfam00954" "gnl|CDD|366384" "3.5917e-06" "91" "264" "-3" "pfam00954, S_locus_glycop, S-locus glycoprotein domain. In Brassicaceae, self-incompatible plants have a self/non-self recognition system. This is sporophytically controlled by multiple alleles at a single locus (S). S-locus glycoproteins, as well as S-receptor kinases, are in linkage with the S-alleles. This region is inferred to be a domain due to it having other domains adjacent to it." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.96);Poaceae(0.04);" "Arabidopsis(0.89);Brassica(0.07);Sorghum(0.04);"
+"ds2020-328_29" "847" "pfam13456" "gnl|CDD|372609" "2.18686e-07" "176" "397" "2" "pfam13456, RVT_3, Reverse transcriptase-like. This domain is found in plants and appears to be part of a retrotransposon." "Eukaryota(0.85);Bacteria(0.15);" "(1.00);" "Euphorbiaceae(0.30);Brassicaceae(0.22);Poaceae(0.22);Aphanothecaceae(0.11);Peronosporaceae(0.04);" "Ricinus(0.30);Arabidopsis(0.22);Oryza(0.19);Gloeothece(0.07);Synechocystis(0.04);"
+"ds2020-328_293" "272" "pfam02123" "gnl|CDD|280316" "4.40145e-17" "17" "259" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_295" no_hit
+"ds2020-328_300" "271" "pfam02392" "gnl|CDD|308156" "2.01502e-45" "15" "239" "-3" "pfam02392, Ycf4, Ycf4. This family consists of hypothetical Ycf4 proteins from various chloroplast genomes. It has been suggested that Ycf4 is involved in the assembly and/or stability of the photosystem I complex in chloroplasts." "Bacteria(0.78);Eukaryota(0.22);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.09);Prochloraceae(0.07);Microcoleaceae(0.06);Oscillatoriaceae(0.04);" "Synechococcus(0.13);Prochlorococcus(0.07);Oscillatoria(0.04);Gloeobacter(0.04);Cyanobium(0.02);"
+"ds2020-328_303" "271" "pfam02123" "gnl|CDD|280316" "5.58457e-14" "3" "206" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_309" "270" "pfam07727" "gnl|CDD|369488" "1.02409e-13" "2" "157" "-3" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_312" no_hit
+"ds2020-328_319" "268" "pfam00112" "gnl|CDD|365882" "8.20186e-05" "73" "150" "1" "pfam00112, Peptidase_C1, Papain family cysteine protease. " "Eukaryota(0.96);Viruses(0.03);" "(0.97);Baculoviridae(0.03);" "Rhabditidae(0.10);Poaceae(0.07);Fabaceae(0.07);Haemonchidae(0.06);Brassicaceae(0.06);" "Caenorhabditis(0.10);Arabidopsis(0.05);Haemonchus(0.05);Homo(0.04);Entamoeba(0.03);"
+"ds2020-328_322" "268" "pfam01425" "gnl|CDD|366635" "5.34115e-12" "33" "248" "3" "pfam01425, Amidase, Amidase. " "Bacteria(0.58);Eukaryota(0.32);Archaea(0.10);" "(1.00);" "Mycobacteriaceae(0.19);Rhabditidae(0.10);Archaeoglobaceae(0.06);Aspergillaceae(0.06);Merismopediaceae(0.06);" "Mycobacterium(0.19);Caenorhabditis(0.10);Synechocystis(0.06);Aspergillus(0.06);Saccharomyces(0.06);"
+"ds2020-328_326" "267" "pfam00385" "gnl|CDD|366065" "3.90569e-05" "64" "192" "1" "pfam00385, Chromo, Chromo (CHRromatin Organisation MOdifier) domain. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.18);Drosophilidae(0.13);Schizosaccharomycetaceae(0.09);Rhabditidae(0.08);Brassicaceae(0.07);" "Homo(0.16);Drosophila(0.13);Schizosaccharomyces(0.09);Caenorhabditis(0.08);Arabidopsis(0.07);"
+"ds2020-328_335" "266" "pfam02123" "gnl|CDD|280316" "2.32783e-14" "26" "265" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_361" "260" "pfam00069" "gnl|CDD|365850" "2.38711e-21" "15" "242" "3" "pfam00069, Pkinase, Protein kinase domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.31);Hominidae(0.17);Muridae(0.14);Schizosaccharomycetaceae(0.11);Drosophilidae(0.06);" "Saccharomyces(0.31);Homo(0.17);Schizosaccharomyces(0.11);Rattus(0.08);Drosophila(0.06);"
+"ds2020-328_364" "259" "pfam02491" "gnl|CDD|376796" "1.8796e-18" "85" "249" "1" "pfam02491, SHS2_FTSA, SHS2 domain inserted in FTSA. FtsA is essential for bacterial cell division, and co-localizes to the septal ring with FtsZ. The SHS2 domain is inserted in to the RNAseH fold of FtsA, and is involved in protein-protein interaction." "Bacteria(1.00);" "(1.00);" "(0.07);Prevotellaceae(0.04);Spirochaetaceae(0.04);Flavobacteriaceae(0.03);Helicobacteraceae(0.02);" "(0.04);Prevotella(0.04);Clostridium(0.02);Helicobacter(0.02);Bacteroides(0.02);"
+"ds2020-328_37" "681" "pfam00416" "gnl|CDD|366086" "4.04787e-35" "92" "409" "-3" "pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes." "Eukaryota(0.55);Bacteria(0.27);Archaea(0.18);" "(1.00);" "Brassicaceae(0.18);Muridae(0.09);Poaceae(0.09);Drosophilidae(0.09);Mycobacteriaceae(0.09);" "Arabidopsis(0.18);Geobacillus(0.09);Rattus(0.09);Haloarcula(0.09);Shigella(0.09);"
+"ds2020-328_386" "255" "pfam04332" "gnl|CDD|367905" "1.67088e-13" "22" "162" "1" "pfam04332, DUF475, Protein of unknown function (DUF475). Predicted to be an integral membrane protein with multiple membrane spans." "Bacteria(1.00);" "(1.00);" "Mycobacteriaceae(0.29);Sphingomonadaceae(0.14);Streptococcaceae(0.14);Xanthomonadaceae(0.14);Deinococcaceae(0.14);" "Mycobacterium(0.29);Deinococcus(0.14);Streptomyces(0.14);Lactococcus(0.14);Xylella(0.14);"
+"ds2020-328_388" "255" "pfam05919" "gnl|CDD|253459" "2.68273e-30" "4" "237" "-1" "pfam05919, Mitovir_RNA_pol, Mitovirus RNA-dependent RNA polymerase. This family consists of several Mitovirus RNA-dependent RNA polymerase proteins. The family also contains fragment matches in the mitochondria of Arabidopsis thaliana." "Viruses(0.90);Eukaryota(0.10);" "Riboviria(0.90);(0.10);" "Narnaviridae(0.90);Ceratobasidiaceae(0.10);" "Mitovirus(0.90);Thanatephorus(0.10);"
+"ds2020-328_395" "254" "pfam02123" "gnl|CDD|280316" "3.0801e-11" "25" "240" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_4" "2545" "pfam00177" "gnl|CDD|365924" "1.11505e-28" "229" "618" "1" "pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes." "Bacteria(0.79);Archaea(0.11);Eukaryota(0.10);" "(1.00);" "(0.09);Clostridiaceae(0.04);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Ruminococcaceae(0.01);" "(0.04);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);Desulfovibrio(0.01);"
+"ds2020-328_401" "253" "pfam02123" "gnl|CDD|280316" "1.12879e-10" "29" "193" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_414" "251" "pfam02123" "gnl|CDD|280316" "1.26275e-09" "31" "234" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_415" "251" "pfam01058" "gnl|CDD|376447" "2.16687e-17" "20" "229" "-2" "pfam01058, Oxidored_q6, NADH ubiquinone oxidoreductase, 20 Kd subunit. " "Bacteria(0.70);Archaea(0.30);" "(1.00);" "(0.05);Syntrophobacteraceae(0.04);Aquificaceae(0.04);Methanosarcinaceae(0.04);Thermococcaceae(0.04);" "Methanosarcina(0.04);Syntrophobacter(0.04);Pyrococcus(0.03);Geobacter(0.03);Methanococcus(0.03);"
+"ds2020-328_419" "250" "pfam10369" "gnl|CDD|378420" "1.59899e-17" "75" "212" "-3" "pfam10369, ALS_ss_C, Small subunit of acetolactate synthase. ALS_ss_C is the C-terminal half of a family of proteins which are the small subunits of acetolactate synthase. Acetolactate synthase is a tetrameric enzyme, containing probably two large and two small subunits, which catalyzes the first step in branched-chain amino acid biosynthesis. This reaction is sensitive to certain herbicides." "Bacteria(0.90);Archaea(0.06);Eukaryota(0.04);" "(1.00);" "(0.07);Clostridiaceae(0.06);Lachnospiraceae(0.05);Ruminococcaceae(0.03);Peptococcaceae(0.03);" "Clostridium(0.06);(0.05);Eubacterium(0.03);Ruminococcus(0.02);Roseburia(0.02);"
+"ds2020-328_43" "644" "pfam00078" "gnl|CDD|365856" "2.15977e-08" "190" "636" "-3" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_430" "248" "pfam00931" "gnl|CDD|366375" "1.82192e-16" "27" "245" "-1" "pfam00931, NB-ARC, NB-ARC domain. " "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.75);Solanaceae(0.12);Hominidae(0.12);" "Arabidopsis(0.75);Solanum(0.12);Homo(0.12);"
+"ds2020-328_431" "247" "pfam01788" "gnl|CDD|366811" "4.75718e-09" "24" "116" "3" "pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Microcoleaceae(0.12);Prochloraceae(0.08);Oscillatoriaceae(0.08);Synechococcaceae(0.08);Chroococcaceae(0.08);" "Oscillatoria(0.08);Prochlorococcus(0.08);Synechococcus(0.08);Ectocarpus(0.04);Arenga(0.04);"
+"ds2020-328_432" "247" "pfam00116" "gnl|CDD|365885" "2.6628e-32" "16" "159" "1" "pfam00116, COX2, Cytochrome C oxidase subunit II, periplasmic domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.09);Sordariaceae(0.09);Phasianidae(0.09);Cercopithecidae(0.09);Schizosaccharomycetaceae(0.09);" "Gallus(0.09);Triticum(0.09);Sus(0.09);Neurospora(0.09);Oryzias(0.09);"
+"ds2020-328_452" no_hit
+"ds2020-328_457" no_hit
+"ds2020-328_462" "244" "pfam02123" "gnl|CDD|280316" "7.52004e-11" "18" "236" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_464" "244" "pfam00421" "gnl|CDD|366090" "1.67641e-26" "57" "242" "-3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_47" "623" "pfam00346" "gnl|CDD|366043" "7.39818e-56" "191" "496" "-2" "pfam00346, Complex1_49kDa, Respiratory-chain NADH dehydrogenase, 49 Kd subunit. " "Bacteria(0.80);Eukaryota(0.11);Archaea(0.09);" "(1.00);" "(0.06);Rhodobacteraceae(0.02);Acetobacteraceae(0.02);Campylobacteraceae(0.02);Rhodospirillaceae(0.02);" "(0.01);Geobacter(0.01);Campylobacter(0.01);Archaeoglobus(0.01);"
+"ds2020-328_473" "243" "pfam00146" "gnl|CDD|376297" "3.36196e-12" "16" "114" "1" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_476" "243" "pfam02123" "gnl|CDD|280316" "1.20816e-09" "22" "237" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_485" no_hit
+"ds2020-328_490" "241" "pfam00016" "gnl|CDD|365810" "1.89423e-13" "2" "121" "2" "pfam00016, RuBisCO_large, Ribulose bisphosphate carboxylase large chain, catalytic domain. The C-terminal domain of RuBisCO large chain is the catalytic domain adopting a TIM barrel fold." "Bacteria(0.89);Eukaryota(0.05);Archaea(0.05);" "(1.00);" "Rhodospirillaceae(0.11);Oceanospirillaceae(0.11);Rhodobacteraceae(0.11);Prochloraceae(0.05);Thalassiosiraceae(0.05);" "Marinomonas(0.11);Magnetospirillum(0.05);Saccharomonospora(0.05);Rhodospirillum(0.05);Paenibacillus(0.05);"
+"ds2020-328_491" "241" "pfam02123" "gnl|CDD|280316" "7.45437e-11" "2" "241" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_497" "240" "pfam01501" "gnl|CDD|279798" "4.58533e-06" "38" "202" "2" "pfam01501, Glyco_transf_8, Glycosyl transferase family 8. This family includes enzymes that transfer sugar residues to donor molecules. Members of this family are involved in lipopolysaccharide biosynthesis and glycogen synthesis. This family includes Lipopolysaccharide galactosyltransferase, lipopolysaccharide glucosyltransferase 1, and glycogenin glucosyltransferase." "Eukaryota(0.62);Bacteria(0.38);" "(1.00);" "Brassicaceae(0.54);Enterobacteriaceae(0.12);Pasteurellaceae(0.12);Helicobacteraceae(0.08);Bacillaceae(0.04);" "Arabidopsis(0.54);Haemophilus(0.08);Salmonella(0.08);Helicobacter(0.08);Bacillus(0.04);"
+"ds2020-328_50" "620" "pfam00115" "gnl|CDD|376293" "1.44178e-51" "78" "548" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_517" "237" "pfam00361" "gnl|CDD|366050" "5.54755e-11" "18" "224" "3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_52" "598" "pfam00115" "gnl|CDD|376293" "2.60011e-33" "21" "302" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_536" "236" "pfam00453" "gnl|CDD|376335" "3.91827e-17" "51" "188" "3" "pfam00453, Ribosomal_L20, Ribosomal protein L20. " "Bacteria(0.90);Eukaryota(0.10);" "(1.00);" "(0.10);Clostridiaceae(0.05);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Synergistaceae(0.02);" "(0.06);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);"
+"ds2020-328_560" "233" "pfam00421" "gnl|CDD|366090" "1.00705e-37" "17" "232" "2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_562" "233" "pfam00201" "gnl|CDD|278624" "3.71727e-13" "22" "195" "1" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-328_564" "232" "pfam00119" "gnl|CDD|376294" "2.43866e-07" "4" "201" "-2" "pfam00119, ATP-synt_A, ATP synthase A chain. " "Bacteria(0.92);Eukaryota(0.08);" "(1.00);" "(0.05);Flavobacteriaceae(0.03);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Bacillaceae(0.02);" "(0.03);Clostridium(0.03);Mycoplasma(0.02);Bacteroides(0.02);Prevotella(0.02);"
+"ds2020-328_565" "232" "pfam00119" "gnl|CDD|376294" "4.75161e-06" "106" "189" "-2" "pfam00119, ATP-synt_A, ATP synthase A chain. " "Bacteria(0.92);Eukaryota(0.08);" "(1.00);" "(0.05);Flavobacteriaceae(0.03);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Bacillaceae(0.02);" "(0.03);Clostridium(0.03);Mycoplasma(0.02);Bacteroides(0.02);Prevotella(0.02);"
+"ds2020-328_568" "232" "pfam00160" "gnl|CDD|365914" "7.47948e-06" "91" "231" "-2" "pfam00160, Pro_isomerase, Cyclophilin type peptidyl-prolyl cis-trans isomerase/CLD. The peptidyl-prolyl cis-trans isomerases, also known as cyclophilins, share this domain of about 109 amino acids. Cyclophilins have been found in all organisms studied so far and catalyze peptidyl-prolyl isomerisation during which the peptide bond preceding proline (the peptidyl-prolyl bond) is stabilized in the cis conformation. Mammalian cyclophilin A (CypA) is a major cellular target for the immunosuppressive drug cyclosporin A (CsA). Other roles for cyclophilins may include chaperone and cell signalling function." "Bacteria(0.57);Eukaryota(0.41);Archaea(0.02);" "(1.00);" "Flavobacteriaceae(0.09);Theileriidae(0.04);Babesiidae(0.04);Cryptococcaceae(0.04);Vibrionaceae(0.04);" "Cryptococcus(0.04);Vibrio(0.04);Gloeobacter(0.04);Babesia(0.04);Theileria(0.04);"
+"ds2020-328_579" "230" "pfam09220" "gnl|CDD|370369" "3.32926e-12" "15" "212" "3" "pfam09220, LA-virus_coat, L-A virus, major coat protein. Members of this family form the major coat protein of the Saccharomyces cerevisiae L-A virus." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(1.00);" "Debaryomyces(1.00);"
+"ds2020-328_58" "561" "pfam17921" "gnl|CDD|375431" "1.48639e-11" "411" "551" "-2" "pfam17921, Integrase_H2C2, Integrase zinc binding domain. This zinc binding domain is found in a wide variety of integrase proteins." "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_594" "229" "pfam02123" "gnl|CDD|280316" "5.55224e-12" "25" "213" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_597" "229" "pfam00421" "gnl|CDD|366090" "5.55907e-21" "15" "218" "3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_600" "229" "pfam05518" "gnl|CDD|253234" "1.13476e-09" "26" "229" "2" "pfam05518, Totivirus_coat, Totivirus coat protein. " "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(1.00);" "Victorivirus(0.57);Leishmaniavirus(0.29);(0.14);"
+"ds2020-328_604" "228" "pfam01333" "gnl|CDD|366578" "1.59517e-20" "54" "218" "3" "pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034." "Bacteria(0.82);Eukaryota(0.18);" "(1.00);" "Synechococcaceae(0.18);Prochloraceae(0.07);Aphanothecaceae(0.07);Nostocaceae(0.05);Microcoleaceae(0.05);" "Synechococcus(0.14);Prochlorococcus(0.07);Gloeobacter(0.04);Oscillatoria(0.04);Nostoc(0.04);"
+"ds2020-328_609" "228" "pfam00006" "gnl|CDD|376291" "1.76934e-18" "20" "211" "2" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_611" "228" "pfam00421" "gnl|CDD|366090" "2.00297e-10" "23" "226" "-3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_62" "551" "pfam02123" "gnl|CDD|280316" "7.88589e-16" "4" "294" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_624" "226" "pfam00421" "gnl|CDD|366090" "2.78889e-19" "14" "193" "2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_625" "226" "pfam01660" "gnl|CDD|366745" "1.80876e-05" "15" "209" "3" "pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily." "Viruses(1.00);" "Riboviria(1.00);" "Betaflexiviridae(0.23);Alphaflexiviridae(0.21);Virgaviridae(0.15);Tymoviridae(0.14);Bromoviridae(0.10);" "Potexvirus(0.16);Carlavirus(0.11);Tymovirus(0.08);Tobamovirus(0.07);Alphavirus(0.05);"
+"ds2020-328_634" "225" "pfam13041" "gnl|CDD|372443" "6.23279e-08" "54" "185" "-2" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-328_641" "225" "pfam04392" "gnl|CDD|367921" "7.39814e-09" "28" "177" "-1" "pfam04392, ABC_sub_bind, ABC transporter substrate binding protein. This family contains many hypothetical proteins and some ABC transporter substrate binding proteins." "Bacteria(1.00);" "(1.00);" "Streptococcaceae(0.33);Phyllobacteriaceae(0.17);Pseudomonadaceae(0.17);Rickettsiaceae(0.17);Aquificaceae(0.17);" "Streptococcus(0.33);Rickettsia(0.17);Pseudomonas(0.17);Mesorhizobium(0.17);Aquifex(0.17);"
+"ds2020-328_654" "224" "pfam00223" "gnl|CDD|365957" "8.28468e-21" "41" "205" "-2" "pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein. " "Bacteria(0.83);Eukaryota(0.17);" "(1.00);" "Prochloraceae(0.28);Synechococcaceae(0.11);Gloeobacteraceae(0.11);Acaryochloridaceae(0.11);Funariaceae(0.06);" "Prochlorococcus(0.28);Acaryochloris(0.11);Gloeobacter(0.11);(0.06);Selaginella(0.06);"
+"ds2020-328_657" no_hit
+"ds2020-328_659" "223" "pfam01809" "gnl|CDD|376620" "7.3686e-08" "121" "189" "-2" "pfam01809, Haemolytic, Haemolytic domain. This domain has haemolytic activity. It is found in short (73-103 amino acid) proteins and contains three conserved cysteine residues." "Bacteria(0.99);Eukaryota(0.01);" "(1.00);" "Clostridiaceae(0.07);(0.06);Ruminococcaceae(0.03);Flavobacteriaceae(0.02);Eubacteriaceae(0.02);" "Clostridium(0.07);(0.05);Eubacterium(0.02);Ruminococcus(0.02);Lactobacillus(0.01);"
+"ds2020-328_66" "532" "pfam09044" "gnl|CDD|370259" "2.02105e-23" "65" "373" "-1" "pfam09044, Kp4, Kp4. Members of this fungal family of toxins specifically inhibit voltage-gated calcium channels in mammalian cells. They adopt an alpha/beta-sandwich structure, comprising a five-stranded antiparallel beta-sheet with two antiparallel alpha-helices lying at approximately 45 degrees to these strands." "Eukaryota(1.00);" "(1.00);" "Hypocreaceae(0.29);Aspergillaceae(0.21);Nectriaceae(0.21);Glomerellaceae(0.14);Clavicipitaceae(0.07);" "Trichoderma(0.29);Aspergillus(0.21);Fusarium(0.21);Colletotrichum(0.14);Metarhizium(0.07);"
+"ds2020-328_675" "222" "pfam02468" "gnl|CDD|367094" "3.35789e-17" "22" "123" "1" "pfam02468, PsbN, Photosystem II reaction centre N protein (psbN). This is a family of small proteins encoded on the chloroplast genome. psbN is involved in photosystem II during photosynthesis, but its exact role is unknown." "Bacteria(0.88);Eukaryota(0.12);" "(1.00);" "Synechococcaceae(0.15);Nostocaceae(0.07);Prochloraceae(0.07);Aphanothecaceae(0.07);Microcoleaceae(0.05);" "Synechococcus(0.12);Prochlorococcus(0.07);Cyanobacterium(0.05);(0.03);Trichodesmium(0.03);"
+"ds2020-328_677" "222" "pfam00978" "gnl|CDD|250270" "1.73152e-12" "24" "206" "-2" "pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(0.35);Virgaviridae(0.32);Closteroviridae(0.16);Togaviridae(0.10);Betaflexiviridae(0.03);" "Tobamovirus(0.13);Ilarvirus(0.10);Alphavirus(0.10);Cucumovirus(0.10);Bromovirus(0.10);"
+"ds2020-328_681" "222" "pfam00562" "gnl|CDD|366167" "2.61251e-09" "26" "145" "-3" "pfam00562, RNA_pol_Rpb2_6, RNA polymerase Rpb2, domain 6. RNA polymerases catalyze the DNA dependent polymerization of RNA. Prokaryotes contain a single RNA polymerase compared to three in eukaryotes (not including mitochondrial. and chloroplast polymerases). This domain represents the hybrid binding domain and the wall domain. The hybrid binding domain binds the nascent RNA strand / template DNA strand in the Pol II transcription elongation complex. This domain contains the important structural motifs, switch 3 and the flap loop and binds an active site metal ion. This domain is also involved in binding to Rpb1 and Rpb3. Many of the bacterial members contain large insertions within this domain, as region known as dispensable region 2 (DRII)." "Bacteria(0.49);Eukaryota(0.34);Archaea(0.09);Viruses(0.08);" "(0.92);Iridoviridae(0.05);Mimiviridae(0.02);Asfarviridae(0.02);" "Iridoviridae(0.05);Hexamitidae(0.05);Trichomonadidae(0.03);Poaceae(0.03);Cryptosporidiidae(0.03);" "Giardia(0.05);Cryptosporidium(0.03);Trichomonas(0.03);Plasmodium(0.03);Rhodopirellula(0.02);"
+"ds2020-328_687" no_hit
+"ds2020-328_689" "222" "pfam02670" "gnl|CDD|335036" "5.85343e-14" "34" "135" "1" "pfam02670, DXP_reductoisom, 1-deoxy-D-xylulose 5-phosphate reductoisomerase. This is a family of 1-deoxy-D-xylulose 5-phosphate reductoisomerases. This enzyme catalyzes the formation of 2-C-methyl-D-erythritol 4-phosphate from 1-deoxy-D-xylulose-5-phosphate in the presence of NADPH. This reaction is part of the terpenoid biosynthesis pathway." "Bacteria(0.96);Eukaryota(0.04);" "(1.00);" "Bacillaceae(0.05);Vibrionaceae(0.05);Corynebacteriaceae(0.04);Pasteurellaceae(0.04);Pseudomonadaceae(0.04);" "Bacillus(0.05);Clostridium(0.04);Corynebacterium(0.04);Pseudomonas(0.04);Vibrio(0.04);"
+"ds2020-328_69" "528" "pfam01660" "gnl|CDD|366745" "2.23499e-10" "222" "500" "-2" "pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily." "Viruses(1.00);" "Riboviria(1.00);" "Betaflexiviridae(0.23);Alphaflexiviridae(0.21);Virgaviridae(0.15);Tymoviridae(0.14);Bromoviridae(0.10);" "Potexvirus(0.16);Carlavirus(0.11);Tymovirus(0.08);Tobamovirus(0.07);Alphavirus(0.05);"
+"ds2020-328_691" "221" "pfam00329" "gnl|CDD|376317" "1.3793e-18" "81" "197" "-1" "pfam00329, Complex1_30kDa, Respiratory-chain NADH dehydrogenase, 30 Kd subunit. " "Bacteria(0.79);Archaea(0.12);Eukaryota(0.09);" "(1.00);" "(0.05);Peptococcaceae(0.02);Bacteroidaceae(0.02);Desulfurococcaceae(0.02);Rhodobacteraceae(0.01);" "Bacteroides(0.02);(0.02);Prevotella(0.01);Geobacter(0.01);"
+"ds2020-328_7" "2116" "pfam01787" "gnl|CDD|366810" "1.27327e-63" "325" "936" "-2" "pfam01787, Ilar_coat, Ilarvirus coat protein. This family consists of various coat proteins from the ilarviruses part of the Bromoviridae, members include apple mosaic virus and prune dwarf virus. The ilarvirus coat protein is required to initiate replication of the viral genome in host plants. Members of the Bromoviridae have a positive stand ssRNA genome with no DNA stage in there replication." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(1.00);" "Ilarvirus(1.00);"
+"ds2020-328_7" "2116" "pfam01573" "gnl|CDD|279858" "6.78673e-46" "1134" "1835" "-3" "pfam01573, Bromo_MP, Bromovirus movement protein. " "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(1.00);" "Ilarvirus(0.50);Alfamovirus(0.50);"
+"ds2020-328_704" "220" "pfam05724" "gnl|CDD|368581" "5.77087e-08" "38" "196" "2" "pfam05724, TPMT, Thiopurine S-methyltransferase (TPMT). This family consists of thiopurine S-methyltransferase proteins from both eukaryotes and prokaryotes. Thiopurine S-methyltransferase (TPMT) is a cytosolic enzyme that catalyzes S-methylation of aromatic and heterocyclic sulfhydryl compounds, including anticancer and immunosuppressive thiopurines." "Bacteria(0.55);Eukaryota(0.45);" "(1.00);" "Pseudomonadaceae(0.27);Brassicaceae(0.18);Muridae(0.09);Vibrionaceae(0.09);Hominidae(0.09);" "Pseudomonas(0.27);Batis(0.09);Ralstonia(0.09);Arabidopsis(0.09);Brassica(0.09);"
+"ds2020-328_724" "219" "pfam02123" "gnl|CDD|280316" "1.52156e-13" "35" "199" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_746" "217" "pfam02123" "gnl|CDD|280316" "4.96199e-13" "13" "210" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_750" "216" "pfam02123" "gnl|CDD|280316" "7.51118e-17" "8" "214" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_761" "215" "pfam02123" "gnl|CDD|280316" "4.08427e-09" "37" "198" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_763" "215" "pfam00201" "gnl|CDD|278624" "6.35685e-07" "113" "193" "-2" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-328_768" "215" "pfam02123" "gnl|CDD|280316" "5.01402e-08" "33" "209" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_775" "214" "pfam00361" "gnl|CDD|366050" "1.62796e-10" "59" "196" "-1" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_784" "213" "pfam07727" "gnl|CDD|369488" "2.2825e-05" "25" "93" "-1" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_788" "213" "pfam00069" "gnl|CDD|365850" "1.68423e-10" "23" "193" "2" "pfam00069, Pkinase, Protein kinase domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.31);Hominidae(0.17);Muridae(0.14);Schizosaccharomycetaceae(0.11);Drosophilidae(0.06);" "Saccharomyces(0.31);Homo(0.17);Schizosaccharomyces(0.11);Rattus(0.08);Drosophila(0.06);"
+"ds2020-328_79" "507" "pfam00507" "gnl|CDD|376344" "3.59591e-31" "17" "244" "2" "pfam00507, Oxidored_q4, NADH-ubiquinone/plastoquinone oxidoreductase, chain 3. " "Bacteria(0.80);Eukaryota(0.13);Archaea(0.07);" "(1.00);" "(0.04);Prevotellaceae(0.02);Cytophagaceae(0.02);Sphingobacteriaceae(0.02);Desulfobulbaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.02);Geobacter(0.01);"
+"ds2020-328_79" "507" "pfam00164" "gnl|CDD|333891" "1.13503e-12" "341" "493" "2" "pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes." "Bacteria(0.45);Eukaryota(0.27);Archaea(0.27);" "(1.00);" "Thermococcaceae(0.09);Micrococcaceae(0.09);Enterobacteriaceae(0.09);Thermaceae(0.09);Muridae(0.09);" "Thermococcus(0.09);Saccharomyces(0.09);Rickettsia(0.09);Synechococcus(0.09);Thermus(0.09);"
+"ds2020-328_808" "212" "pfam03822" "gnl|CDD|367678" "6.58628e-13" "73" "189" "-3" "pfam03822, NAF, NAF domain. " "Eukaryota(1.00);" "(1.00);" "Poaceae(0.30);Brassicaceae(0.18);Solanaceae(0.12);Musaceae(0.09);Fabaceae(0.08);" "Solanum(0.11);Musa(0.09);Brassica(0.09);Glycine(0.08);Arabidopsis(0.07);"
+"ds2020-328_817" "211" "pfam03732" "gnl|CDD|367628" "2.37772e-05" "26" "208" "2" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
+"ds2020-328_821" "211" "pfam03732" "gnl|CDD|367628" "4.10271e-05" "96" "200" "-3" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
+"ds2020-328_825" no_hit
+"ds2020-328_830" "211" "pfam00978" "gnl|CDD|250270" "2.36362e-14" "16" "201" "1" "pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(0.35);Virgaviridae(0.32);Closteroviridae(0.16);Togaviridae(0.10);Betaflexiviridae(0.03);" "Tobamovirus(0.13);Ilarvirus(0.10);Alphavirus(0.10);Cucumovirus(0.10);Bromovirus(0.10);"
+"ds2020-328_84" "501" "pfam00284" "gnl|CDD|366000" "1.57316e-21" "211" "324" "-1" "pfam00284, Cytochrom_B559a, Lumenal portion of Cytochrome b559, alpha (gene psbE) subunit. This family is the lumenal portion of cytochrome b559 alpha chain, matches to this family should be accompanied by a match to the pfam00283 family also. The Prosite pattern pattern matches the transmembrane region of the cytochrome b559 alpha and beta subunits." "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "Synechococcaceae(0.17);Microcoleaceae(0.09);Aphanothecaceae(0.09);Prochloraceae(0.06);Phaeodactylaceae(0.03);" "Synechococcus(0.17);Prochlorococcus(0.06);Stanieria(0.03);Acaryochloris(0.03);Selaginella(0.03);"
+"ds2020-328_84" "501" "pfam00283" "gnl|CDD|365999" "1.14937e-08" "346" "432" "-1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-328_84" "501" "pfam00283" "gnl|CDD|365999" "2.11473e-07" "100" "186" "-1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-328_843" "210" "pfam03514" "gnl|CDD|335361" "1.72129e-13" "26" "130" "2" "pfam03514, GRAS, GRAS domain family. Proteins in the GRAS (GAI, RGA, SCR) family are known as major players in gibberellin (GA) signaling, which regulates various aspects of plant growth and development. Mutation of the SCARECROW (SCR) gene results in a radial pattern defect, loss of a ground tissue layer, in the root. The PAT1 protein is involved in phytochrome A signal transduction. A sequence, structure and evolutionary analysis showed that the GRAS family emerged in bacteria and belongs to the Rossmann-fold, AdoMET (SAM)-dependent methyltransferase superfamily. All bacterial, and a subset of plant GRAS proteins, are predicted to be active and function as small-molecule methylases. Several plant GRAS proteins lack one or more AdoMet (SAM)-binding residues while preserving their substrate-binding residues. Although GRAS proteins are implicated to function as transcriptional factors, the above analysis suggests that they instead might either modify or bind small molecules." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.80);Poaceae(0.13);Solanaceae(0.07);" "Arabidopsis(0.80);Oryza(0.07);Solanum(0.07);Zea(0.03);Triticum(0.03);"
+"ds2020-328_863" "209" "pfam02123" "gnl|CDD|280316" "7.16978e-05" "38" "181" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_867" "209" "pfam02123" "gnl|CDD|280316" "3.29677e-10" "13" "186" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_87" "488" "pfam02123" "gnl|CDD|280316" "1.40535e-08" "300" "467" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_872" "209" "pfam08497" "gnl|CDD|378013" "5.53746e-25" "38" "181" "-2" "pfam08497, Radical_SAM_N, Radical SAM N-terminal. This domain tends to occur to the N-terminus of the pfam04055 domain in hypothetical bacterial proteins." "Bacteria(0.94);Archaea(0.06);" "(1.00);" "Clostridiaceae(0.11);(0.10);Prevotellaceae(0.06);Lachnospiraceae(0.05);Ruminococcaceae(0.04);" "Clostridium(0.11);(0.08);Prevotella(0.05);Eubacterium(0.04);Ruminococcus(0.03);"
+"ds2020-328_891" "208" "pfam02123" "gnl|CDD|280316" "2.76435e-10" "31" "150" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_893" "208" "pfam02123" "gnl|CDD|280316" "1.90193e-07" "35" "181" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_9" "1487" "pfam00361" "gnl|CDD|366050" "2.3647e-49" "715" "1476" "-3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_90" "476" "pfam01578" "gnl|CDD|307628" "6.70073e-11" "145" "399" "-3" "pfam01578, Cytochrom_C_asm, Cytochrome C assembly protein. This family consists of various proteins involved in cytochrome c assembly from mitochondria and bacteria; CycK from Rhizobium, CcmC from E. coli and Paracoccus denitrificans and orf240 from wheat mitochondria. The members of this family are probably integral membrane proteins with six predicted transmembrane helices. It has been proposed that members of this family comprise a membrane component of an ABC (ATP binding cassette) transporter complex. It is also proposed that this transporter is necessary for transport of some component needed for cytochrome c assembly. One member CycK contains a putative heme-binding motif, orf240 also contains a putative heme-binding motif and is a proposed ABC transporter with c-type heme as its proposed substrate. However it seems unlikely that all members of this family transport heme nor c-type apocytochromes because CcmC in the putative CcmABC transporter transports neither. CcmF forms a working module with CcmH and CcmI, CcmFHI, and itself is unlikely to bind haem directly." "Bacteria(0.56);Eukaryota(0.38);Archaea(0.05);" "(1.00);" "Enterobacteriaceae(0.10);Pasteurellaceae(0.08);Histionidae(0.05);Marchantiaceae(0.05);Archaeoglobaceae(0.05);" "Escherichia(0.08);Reclinomonas(0.05);Archaeoglobus(0.05);Marchantia(0.05);Bradyrhizobium(0.05);"
+"ds2020-328_904" no_hit
+"ds2020-328_908" "207" "pfam02123" "gnl|CDD|280316" "5.3529e-06" "4" "207" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_921" no_hit
+"ds2020-328_97" "461" "pfam02123" "gnl|CDD|280316" "5.16988e-30" "39" "461" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_98" "458" "pfam02123" "gnl|CDD|280316" "1.94825e-26" "27" "443" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_99" "458" "pfam03732" "gnl|CDD|367628" "7.72961e-07" "256" "441" "1" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
diff --git a/tools/virAnnot/test-data/otu_s2_tblastx.tab b/tools/virAnnot/test-data/otu_s2_tblastx.tab
new file mode 100755
index 00000000000..4b49f3ddafd
--- /dev/null
+++ b/tools/virAnnot/test-data/otu_s2_tblastx.tab
@@ -0,0 +1,139 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-328_275 16 279
+TBLASTX ds2020-328_625 13 226 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 90.7 3 100 17.0 1.9242059400026399e-29 420.172 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGGCCGCCCGCCATACTGAGCGTCTCATGCAGTACACTACCTACAAGACTAGTAGACCTGATGAAGTTCATGAACCGAACTTTTGTGAAAACACATTCCAGGACTGCTCCTTGCAAGGTAAGTATGCCATGGCAATCCATTCCACTTCGGATTTACCCTTAGGTGAGCTCTGTGAGAGCTTAAGGAAGAAGGGAGTGATTCGTCTATCCCGACC
+TBLASTX ds2020-328_196 14 318 NC_033468 Wuhan insect virus 27 strain WHZM10130 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 27 45.3 1 100 6.0 2.90542e-27 118.644 1923731 Viruses;Wuhan insect virus 27 GGTCGGGATAGACGTTTAGCAGCCTTAAACTCTTCATCTTCAGGGTATTGTGAGTGATATGCTCCCGTAGGTGCCCACTGCCACCTCTTATTCCAATAACTTTTCCACTTTATGTTATCTGGTTTACTCCCGAGGTTTTTCAATCTAGTGAACATTTCTCCACTAGCCCTGTATATCTGCTCTCTAGTGAAAGAAGCGACGTTGGGTTTGGTTCTGTGCTCTTTCTCGGCTTTCCAATCCACTTCTCCTATACCTCTGTTGACTAAAACTTCCATTTCAAAGAATGGTTTTAAGTTGAGCGGTGCGTCTATCCCGACC
+TBLASTX ds2020-328_638 4 225 NC_030890 Arabidopsis halleri partitivirus 1 gene for capsid protein, complete cds Arabidopsis halleri partitivirus 1 48.2 1 100 10.0 1.45353e-08 55.5941 1849335 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Arabidopsis halleri partitivirus 1 GTCGGGATAGACGTACCAGTCAACTTTTTGCAATTTTCTTCATACATCACATGGTATGACTTGGTTTGCCCAAGTCCGCGATGTAGCCGCAGCCGAAGCCTCGTCTTTCGAAGGCTCAGGCACCCTGGCTGATTGTCCCCCATTCGGGATAACGTCAAACCAGGTAGTTGTTAACTACTTGGCCCCAGCCACACTGCCAACGTCCCCTATTCGTCTATCCCGACC
+TBLASTX ds2020-328_858 2 210
+TBLASTX ds2020-328_761 8 215
+TBLASTX ds2020-328_553 2 234
+TBLASTX ds2020-328_845 11 210 NC_003689 Cherry virus A, complete genome Cherry virus A 75.0 2 100 5.0 5.449000000000025e-19 225.74040000000002 42882 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Tymovirales;Betaflexiviridae;Capillovirus;Cherry virus A GCCGTGGACCTAGTTAGGAGAGTAATTTCGGATGGTGTTCTTTACTGCTCTCTGATTTTCTGATAAGATTATCGCCGGCGTGGCTGCTACTCCCTCTGAAGCCTCTACTGCTGGCTTCGCAGTCAGGTGCAATAGATCCCTTGGATCTATCATATTCTCCCAGATATAATTTACAAGGCCCCTTCTTATCACGTTGTAATTCTTATACAC
+TBLASTX ds2020-328_483 8 242 NC_033495 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA4 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 50.0 1 100 13.0 1.155e-07 52.8449 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGAATTAACCCATGTAATGGCACAATCGAAGGCTCTAGCCGTGGCCGTTGCACGGATAACGAGAGGGAAGGGGCGGCACGACGCATCTGTAGAAGATTTCATCTTCTACATAGCCTCAAACGGGCGTGCCGTCTCCGCTTCGGATATACCATCCGGAGTCCATAGCTTGGCTTGCGGTCCTCGTGACCATGTGGAACCCTCTGAGCGTTTACCAGCGTCTATCCCGACC
+TBLASTX ds2020-328_910 2 207
+TBLASTX ds2020-328_531 10 236
+TBLASTX ds2020-328_893 4 208
+TBLASTX ds2020-328_507 26 238
+TBLASTX ds2020-328_594 8 229
+TBLASTX ds2020-328_600 4 229 NC_014823 Tolypocladium cylindrosporum virus 1, complete genome Tolypocladium cylindrosporum virus 1 55.8 2 100 7.0 8.34655e-06 145.07119999999998 939923 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Tolypocladium cylindrosporum virus 1 GGTGGGGATAGACGTTTTGGTTCCTTCTAAAGGCCGCGCCCTCTCCCGCCCAATTGATGGTTCCCTGCTTGTTGAAGCGGGATACCCTACTGCTCATGCCTTGGCTGAGGATTTTGTTGGACTTTCTAAGAAGTACACTAATTTCTATGCCACGTCCGAGTACGCGTCCCTGGCTGACCTGGTTGAACACCTCATCCATGGTTTAGCTCCAACCTCCGTATATCCCGAC
+TBLASTX ds2020-328_765 8 215
+TBLASTX ds2020-328_575 4 231 NC_003710 Discula destructiva virus 2 segment 1, complete genome Discula destructiva virus 2 69.0 4 100 20.0 0.00012443 208.6303 160484 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Discula destructiva virus 2 GGTCGGGATAGACGTACGTCTGGCATGAGTATGGGTGTATTAATGAAATACCACACCATGGCGTCCCAAACATTCTTCCACTTTTGCTTCTCAACCTGATCTGTCACAGGTTTTCCATTGAAGGAAGAGAAGTTCACGTTCTGTTTCAACACGTCAAACGCGACGCGTATCAACCACGCTGGTACTTTCGTATCAAAAGCGGAAAAATCTATGACCACGTCTATCCCGACC
+TBLASTX ds2020-328_229 20 299 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 61.8 2 100 13.0 9.88605e-10 217.03480000000002 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GTTACATGCATTGGACTCGCGACTTGAATTACGGCGGTCGGGATAGACGTTGTTCGCGGATGGAGAGGTACAACATGGATAAATTCTACTTTAAATTTTTGCTATGTGGCTATTGCACTCCAAAATATGGAACGTATACATGGTGTAAGTTGTGTATTATATGTAGATCATGGCGGAGATGATATAGATTTAGGATTAAGTGAACCTGCCATGCTGCCATTGTTCCTAGAAATAATGGATAGCATGCTGTTCAAGGCGAATAAATGGAAACAAATGTCCGATCCACGTCTATCCCGACC
+TBLASTX ds2020-328_172 14 338 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 57.5 3 100 14.0 2.4114403333333332e-05 280.4185 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B ATTACGGCGGTCGGGATAGACGGAGGGCGTCCTTCTAGCACCCCCGACACGCGAGCGCTGACATTTGCGTCATTGGCGTCTCTCCCGACTGGGAATCTGTTTGGGAGCACGTTTTCACAATTGTAAAACGCAAAGTTGGCAAGGACGTAACTCGTTGTATCTGTTCCATAGATTGCACGGAGCTTGCCCCATTCATACTTTGTTGATGCCCAAGCGTGTATTTCGGGGTTGCGTGATGTGAAGTATTCGATGTCAAAAGATGGCATGTTCGATATCATTATGAACTTGTTTTTGAGAGCGCGGTCAGTTCTGATGAGAACATCTCGTCTATCCCGACC
+TBLASTX ds2020-328_293 15 272 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 67.1 1 100 5.0 8.1393e-29 123.409 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGCCTCGCAGGAATTCAGCTATAGCTCCGAATGCACATTTAGAGGGTTGTGTCCGTATACAAAGCCTCTGTCCTCTCTGTAGTGTGAAGCGGGTTATCTCAAGTGATGTCGTTCCCAGAAGTACATCGTCACCGTTGTGTAGTGAAGAGCCAACCTCTTTCATCGGACCTAACATGAAGTCAGTGTAGACGGCATTCAGGACGGAGTTAAGGAACGTAGTAAGTCGGTAACCTGACAGCAGAATCCCGTCTATCCCGACC
+TBLASTX ds2020-328_746 2 217 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 52.5 2 100 8.0 0.000128888 153.5807 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GGTCGGGATAGACGCGTCACCCCCATTATGTAAACTGTTTCCTCGCTTCAACGTGTCTTCAGATATCGCTTTTGTGTATATATAATTCAATATACTGTTCATGAATGTTGTCAGTCTCCAGCCTGACAGCAGTGTGTCTTTCGCCCTGTATGTACGCTTCGTACCAACATTGTCATGTATTACCTGGTTGCCTACAGATTCAGCCGTCCATAAGGCC
+TBLASTX ds2020-328_768 6 215
+TBLASTX ds2020-328_337 18 265
+TBLASTX ds2020-328_328 8 267 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 37.5 1 100 7.0 1.12376e-11 66.4405 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GTCTAGTACTACATCCATATTTGAGAGCCACGTCCGCCAACATTGCGAGTTTGCCACATATGACAGACTGTTATTAGGTAAACTTTCTACATTCCCAAACCATGAACTTTTCAATTTTCTGGCTCTACCAAATTCACTTATCTCTTCACTTTCGTTCCAACGTTCTATATTAAGATTTACCCGTTTTGTAAATTTGTTATTACCGTTTAACATGCTCACTTTTTCCAGACCGCATGTCTCTAAATTTGATGTTATAGCTTCTACATT
+TBLASTX ds2020-328_476 6 243
+TBLASTX ds2020-328_71 18 526 NC_033465 Wuhan insect virus 26 strain WHZM10161 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 26 47.4 1 100 6.0 1.70533e-19 93.8794 1923730 Viruses;Wuhan insect virus 26 GGTCGGGATAGACGGAGACTAAGAGTGGGCAGAAAGTCGAATGACGGGGGGCAATACCTACCGAGAGCTATAGCGACGTTAGTGCACTCGCGGATAGAGAGCGGACCAGCAACTTCATTAGCTGATGCACTGAGATCAAACGAAATACGTCTGTATGAAGCAATAGAGCGGGGTATGGACGCCGAAATAGCATTGAAACTACGGTCGTTGTATATATCACGAGTGGCGCCTTTGTACGGTAATAACAGGCAAGAAGCTATGGAGCTATTAGAGGCGTCGTCTGTAGTAGGAGGACTGAGTATGGACAGGGAGGCCAGAGTAGACAAAACATTTACGGAAACTGAGCCAACGTCGAAGGAGTCTGACGAAATAATGAACTTGGCGGGACACAGAAAATGGAGGGGAGTGTCAGACATGGCCAACGTGGTACTAGAAAAAATATCTGAACAAGGAGGAAGTGCCATAACGATAAAAAACATAACGAAGCGAATTTATAATTATAAGCTGAGTGCGTTGTCTATAAAAA
+TBLASTX ds2020-328_241 10 293 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 43.6 2 100 14.0 1.22557e-10 81.7433 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGTAGACGGCGGAGTGTACTTGATACCTTTCGAATTCACGGGGTAGATTTTGTCGGCATATTCGTCTGGCTCGGGCAAAGGAATGGTAGGAAATTCTTTCGGCTGCGAAATTAAAGTGGCGTCAGAAGTATATGACAAAGGGAGTTTCTCACGACGTCTGTACCTGTAGAGGTACTGGTCCCAGACCTGATAGCCGGTTGATGACATGTCTGTCGTCCAGCACATCACCGAATCGAATTCTGGATGCTCAACTCGGGCAGTGTAACAAACATCATCAGCGAACCGGCC
+TBLASTX ds2020-328_391 21 254
+TBLASTX ds2020-328_668 2 223 NC_005977 Penicillium stoloniferum virus S segment 2, complete genome Wuhan insect virus 27 48.5 1 100 13.0 1.11015e-17 85.8359 1923731 Viruses;Wuhan insect virus 27 GGTCGGGATAGACGTGGGATGTGGCTATGCCGAGTTCCGTGGACTGGTCCTATCCCACTAAAACGAGGCGTTCAACCCTCTCTCAGCAGTGGGCGCGTGTTTCAACGTCCTACGCAATGTTCTTCGAGATGTCGGCGGGTCTGTCGACCGGTCAATCTGCGCAAGGCAGTCATGCACAAATGGTAGAAGTGACTATTATAGAGGGAGTACGTCTATCCCGACC
+TBLASTX ds2020-328_920 2 207 NC_033477 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA2 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 50.0 1 100 5.0 2.52205e-05 44.5971 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGGGGATTTAAATTTTAATTAGCATCAAGACGAACATTCCGAGGTCGCACCCCCCCGTCTTACTGTAGCAGGCATGGCAAACCTGACCCGTTTACGCACGCTTGTTACGTCCGGTGAGCTCGAGGTGGTGTCAGCCGCAGCTGTTCTCTTCCACCTTTCTCGGAATCCAACCCTACATGACGTCTATCCCGACC
+TBLASTX ds2020-328_428 15 248 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 44.8 3 100 10.0 2.988626666666667e-05 175.03 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GAAGAGCTGTCGGGAGTGGAACAAGTTGTGGGATAGTAGGGGGCAGTGGGGTGCTGCGGGAAGCACGCATTCGCAGTACCAGGAGGACATGGCTTACGTCCTCAAGGACGACATAAGGCTCAAGAATAAGTTCATTACCATATCGAACATGCCGCGCTTTCCCATGACAAGATTTACAAACAGACCGCAGGAGATACAGGCTTGGGCGTCCACTAAGTACGAATGGGGCGGGGTCGTCTATCCCGACC
+TBLASTX ds2020-328_395 2 254 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 60.8 1 100 5.0 4.53232e-23 104.164 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGATAGACGGTCTGCCCCCTTCTGTGGTCAACTCTCAAGAACTCTGCTATGGCCCCAAATGCACATTTCGAGCTCTGCAACCTCACACCAAACTTGTGCGCGTTTGCCTGACATGCTTGAGCACATGCTAGGTTATTTGTTCCTATGAGTACGTCGTCCCCGTTGTGCAAGCTTGAGCCTGGTGTTCTCCACTCTTTTGCTATCTTCGATGTGTAGACGAAGTTCAGCACGCTGTTACGTCTATCCCACC
+TBLASTX ds2020-328_361 6 260
+TBLASTX ds2020-328_414 6 251 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 53.0 2 100 9.0 0.0001746225 154.7177 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGAGGCTACGTGGTAAACAGAGTAGCGGGGGTTTTGAAAGACAGATTACCATATTGTCTAGACTTTGAGGATTTCAACAGCCAGCACAGTCTATCAAGTATGCAAGCGGTCATAGATGCGTACTATGAAGTATTCGGGCCGAATATGTCGGAAGGGCAGAGACAGGCAGTACTTTGGACAAGAGAATCACTGTCTAATAACGTGGTACATGATAATATGGGTACACGTCTATCCCGACC
+TBLASTX ds2020-328_983 0 61 NC_036592 Pleurochrysis carterae circular virus isolate PcCV-1, complete genome Pleurochrysis carterae circular virus 100.0 8 100 21.0 0.0002522995 315.9968999999999 2057942 Viruses;Shotokuvirae;Cressdnaviricota;Arfiviricetes;Cirlivirales;Circoviridae;Pleurochrysis carterae circular virus TTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGT
+TBLASTX ds2020-328_492 7 241
+TBLASTX ds2020-328_381 4 256 NC_003710 Discula destructiva virus 2 segment 1, complete genome Discula destructiva virus 2 44.0 1 100 13.0 7.29476e-19 90.2231 160484 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Discula destructiva virus 2 GGTCGGGATAGACGCGCCAGCTGATGTATCAGTTCGAAGATACTGACCTACTTCGTGCCAATCACACGGTTCTTCACGGTGACTAAGGGTGAACCTCTCACGTGTAGCAGAGACCGCCTTGCGCAGCAAGGTTGATTCGCGTTCAGTTAGATCAGACCAACGTTTGTGTTGGCCTTCAAACTTCATCAAAGAGTTATACAGTCCGGGTAAACCGGCACCTCTTCGGGTAAAACCACAATTTTCGTCTATCCCGACC
+TBLASTX ds2020-328_886 8 208
+TBLASTX ds2020-328_902 13 207 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 38.6 1 100 6.0 9.22662e-09 55.9603 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGCTTAACCATGCTATCAATCTTTTTGACCTCCATTGTACCGTTCCCTTCCCCCAATATCACTGGTGAAAAGTGATTTTGGTCTCGCAATATTGTTACATTATTCTCTTGACTTCCATCATTATAATTAGTAACCCGTCCACTCTCTTTATCTAGCAATCTTAGGCCGAACCCCCCATGAGCGTCTATCCCGACC
+TBLASTX ds2020-328_512 10 238 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 43.5 1 100 11.0 2.01783e-13 71.9341 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGAGTAGGGGCCATCAAGGAGAAGAACGCCAGGGAAACCATCAAACTTTGGCAACGCAGTTGAGATTGAATGGACGTTAATGTCATCGGTTGCCGGGATACGTTTGACTCCACGTGCGTTGATGGGAATGAGCTGATCGGCTGTGGCGTCAAACTGCATTGGTGGGCCGATATCAATTGTCGCTGGCTGGGGGAGTTTCGTGGTACTTATGACGCCGCGGCTGGTT
+TBLASTX ds2020-328_677 9 222 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 84.3 3 100 21.0 3.5279036738626664e-25 366.104 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGACTATCAGTGTTGAGGATAGGAGCGTTCATGTTCCTTTTTGTCACCGACCGTGCCACTTCTCTAAAGGTACTTTGCCTATTGGAAGTTTGACCTGTCATTAAGGTGGAATCCACTCCAGACTTTCCTTTATCCCATGAAACAAAATGGGATAAATCAAAAGAGCAGTCATCAAGTTCAACTGCAATATCATCCGGCGTCTATCCCACC
+TBLASTX ds2020-328_571 10 231 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 50.0 1 100 6.0 2.90834e-16 81.2538 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGAATCTGGCTATTTATGGGCCAAACCAAGTCTTAAACTCTTATCGTAGAGATGGACGAGCATATGTTTTCAATTCCAAACCCGAGTCGGTAGGGCATACGGCACTGTTATTCAAAATGTGCGAATCTTATCCTCCAAGAGAATTTAGGTCGCATGTAAGCATACCATCGGACGGGGATGAGATATTTATGGTAGCACAACGTCTATCCCGACCGCCGT
+TBLASTX ds2020-328_777 4 214
+TBLASTX ds2020-328_870 9 209
+TBLASTX ds2020-328_10 760 1434 NC_038512 Trichoplusia ni TED virus strain mutant FP-D ORF A, ORF B, and ORF C genes, complete cds Trichoplusia ni TED virus 31.5 3 100 7.0 4.12604e-15 129.2094 2083181 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Errantivirus;Trichoplusia ni TED virus GGTCGGGATAGACGTCTTCTCTTCGTCTACCGCAAATAGAATAGCCTCGCCCGGGAAATTAGTCCCCTTACTAAAAAAATCAAGCTTATAGTCAGGCACGGGATGGGATGATCCGCAGGTGGTCTGCTATTGCCTGCCTCTTGCCTTTCTCATTTAGGGCTTCCGGGTGACGTACACAATATAGAACTCTGAGAGTAACATCTGCCACCTTGCTGTACGGCCCGTGAGGGCTGGCTTTTCAAAGAGATACTTCAGCGGGTCCACCCTTGCAATCAGCATGGTCGTATAGTTCAACATGTAGTGGCGTAGGCGTTGCGAGGCCCGTGTAAGAGCACAACAGGTCTTTTCTAGAACCGTATACCTTGTCTCATAATCAGTGAACTTCTTGCTGAGATAGTATACGGCTCTTTCCTTCCTACCCGTTTCATCGTGCTGACCAAGGACACAACTCATGGATGCTTCCATTACTGACAGATACATCAGGAGAGGTCGACAGGCGTTGGCGGTGCCTGGATGGGAGGATTGAGTAGATATTTCTTAACTTTGTCAAACGCCTTTTGGCAATCCTCGTTCCTTGTGTCTATCTTTTCTGAAAGGCGGGGTATTCTTTCTGAGCAGTTTAAAGATCGGCTCACAGATGGGTGTGAGCTGGGCAATGAACCTGCTGATGTATTGTAGCCTGCCCCAAAAAGCCCTGATTTCTTTCTCTGTCTTTGGTACCGGCATGTCGATAATTGCTTTGCCTTTTGCAGGTCGACTTCGATTTCTCTTTTGCTGACAATGAACCCGAGTAGCTTACCTGACAAAGCACCAAACCCCCCTCCCGGCTTTCTTTTTCGGATGAAGACGAAGACTGTATTTCCGAAATCTGTCAAACACTTTCTTCAAATTCACCGTCTTCTTAAGCCCAAGACTTGGCGATCATGTCATCGACATAGACCTCCATTTCCTTGTGAATCATATCATGAAACAGCGCAGTCATGGCTCGCTGGTACGTCGCCCCGGTATTCTTTAGACCAAACGGCATCACCTTGTAACAGAACGTGCCCTCCTATCCGATATTGTGATAAACGCTCTGTCTTCCTCGGCCATCTTGATCTGGTTATATCAAGAGAAAGCATCCATAAAGGACAGCATCCCATGTCCAGCGGTGTTGTCCACCAGAACATCGATGTGAGGAAGAGGAAAAAAAGATTTTCGGCTTGCCTTGTTTAGGGTCTTTTGACTCACGGAACCAGCTTTCTGAGGGAAAAACCGTTCTCGAAAAGCGTGACCATCCAGTTGAATCTCGTTACCCTCCCGTGTGGTTATGGGGGCGCGCCCACTTTCCACTATTATGGAGCCGGGCCGCAAGCAAGTGAATGTGACCCCGCCCTCCATCAGCCGTTGTGTGTGAGCTTCGCTCCTTATAACTCTCCACCGTCTATCCCGACC
+TBLASTX ds2020-328_3 8577 2589 NC_026260 Sewage-associated circular DNA virus-18 isolate SaCV-18_NZ-BS3994-2012, complete genome Sewage-associated circular DNA virus-18 35.3 1 100 9.0 0.000149016 46.8882 1592085 Viruses;Sewage-associated circular DNA virus-18 TTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGTATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTG
CTAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCATAAAAAAGGG
+TBLASTX ds2020-328_882 20 208
+TBLASTX ds2020-328_115 32 426 NC_043491 Cladosporium fulvum T-1 virus LTR-retrotransposon encoding homologues to retroviral gag, pol, and env genes Cladosporium fulvum T-1 virus 39.7 1 100 5.0 7.5847e-27 117.911 2052899 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Metavirus;Cladosporium fulvum T-1 virus GGTCGGGATAGACGTAAGCACTGGTTCCTCCATAAGTGCCTTCTTCAACTCATTGAAGGCATGCTGGCATCGGGGCGTCCACTCCCACGCCTTGTTCTTCTTTAGCAAATCCGTCAAGGGGGCCGCAATGGCTGAATATCCCTTGATGAACCTGCGGTAGTAGTTAACCAATCCAAGGAATGACCGCAACTCAGGTACCTTGGTTGGTGGCTCCCATTCTTGAATGGCTCGCACCTTGCCCTCCTCCATGAGCAACTGTCCACCCCGTATCTTGTGACCAAGGAACTCCACCTCATTTTGGGCAAACGAGCATTTCTCCTTCTTCACATATAGGTTGTTCTCCCTCAGAACTTTGAACACCTGATGCAAGTGCTCGAGGTGCTCCTCTAGAGAATTGCTAAACACGCACCAACGTCTATCCCGACC
+TBLASTX ds2020-328_513 8 238 NC_038784 Verticillium dahliae chrysovirus 1 segment 1, complete sequence Verticillium dahliae chrysovirus 1 57.1 1 100 6.0 1.6282e-24 108.746 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGCCAGACACATCCATTTGCATCAGGGACACCCAATCCACCTTGACTTTCCAGCCCACGAATAACCTCACGCGGCAGATCTAGCCATTCTTCGTCTATTTTGACCCGGCACCAGTGGCTCAGAGCACCTATAACACATCCGCGCGCTATATCTTGATCGAAGCCTCTGCGCTCTAGTTTGTGCATTTGATCTCGGATACCAGCAACTCAGATCGTCTATCCCGACC
+TBLASTX ds2020-328_72 40 520 NC_030891 Sclerotium hydrophilum virus 1 isolate ShR#77 hypothetical protein genes, complete cds Sclerotium hydrophilum virus 1 30.4 1 100 25.0 5.98328e-21 98.7021 1895000 Viruses;Sclerotium hydrophilum virus 1 GGTCGGGATAGACGTTGCCCTCCCCTTTCTCTCCAGCCCGAACCTACCTCTCTCCCTATTCAATGGTGCCGCCTTAACTTCCGTCTTCTTGATGCGAGGAGCGTAGTAGTTGATGCGGGTCTGTATAACACGGTCCGCCTCTGCTATACGCTCAGTTAGGGCGTTCATCTCCTTCTTGTATTCCTGAACGATGTAGGCTTGCTCCCCTTGAATACGGCGGGCGGTTTGATACTCCGCCAACTCTGCCGCGCTCAACGTTGAATCGTCCACCGTCATATTGCGTCTGGCCGATACAATCTTGTAAAAAGCCATTATACATGGTACGGCCACGCTGGCGTGCTTAGCATACCAGACGGCATTCTCCGGAAGAATGTCCTGAGTTTGGTACATCTCCCTCAACCCCACTGTCCAGCGCTCCAAGGACTTTTCGTTGCCATTGAAGCTAGCACGTGGTTCCCTAGACTTTGCTGGGTCGAAGTCTTGGATGCGGGCCCACTCCATCCACACGTCTATCCCGACC
+TBLASTX ds2020-328_449 2 246 NC_017990 Botrytis porri RNA virus 1 RNA 1, complete genome Botrytis porri botybirnavirus 1 75.7 5 100 10.0 1.7255383031988e-20 352.20029999999997 1918014 Viruses;Orthornavirae;Botybirnavirus;Botrytis porri botybirnavirus 1 GGTCGGGATAGACGTGTGGAACTCAACGTGCCCACCGCAAGCTTCAACTGCTCCTGTTAGTGTATAAATCAGAAGGATAGGTAAACCGAGAACTTTGATGCAGAGGCAACCTGGCACTGTTGACGAGCCGTAGTTTACTACGATAGCGGTGGGAATTGAAGCCCACTGTAATCTCCCAACATCTAGGCCCATCAGGGTAAAGTGTGAGAATGAAATTCAAAATGCCCCACTTCGTCTATCCCGACC
+TBLASTX ds2020-328_122 22 418 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 86.9 3 100 33.0 8.71734076908784e-59 720.298 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCGCGACTTCTCTCTTTATGAACGGTGGGGCAATTCCTGGAACCTTTTTAAGGGTTTTTTATCAGGAGATATGGAAGTCGAAGGGTTTCTTGTTTCTGATCCACAATTCTTCGTTCCACTTACTGGAGTTCTTCATATGAAGAAATTGATAAGTGATGCTGGGAAGGTCCTTAGTGTTAAGGATTTACTCGAAGAACAGCGCGCTCTTGTTGCTTTAAAAATGCGCGAACAGATTGCTGAAAGGGAGAAAGCTGAAAAGAGTCGCCGAGAATATGAGAAGGCGATTATTCAACTTGCTGCTTGGACTAAAGCACATCCAGATGCTAAGGTTCCAAAAGGGCTTTCCGTGGAAGAACCACTGATGCCGGACGTTGTCAAGAAAGTGACGACGTCTATCCCGACC
+TBLASTX ds2020-328_529 6 236
+TBLASTX ds2020-328_421 8 249
+TBLASTX ds2020-328_642 4 225
+TBLASTX ds2020-328_87 54 488 NC_003823 Ustilago maydis virus H1, complete genome Ustilago maydis virus H1 60.9 1 100 5.0 9.72556e-33 137.736 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGTTCCTTGTTGCTTTTCTTACCATTATCTACAGTCCCTACAGCACCACTTTCATTTTTATCACTATTTCCAGTCATATTCATTCTGTTACTGTTAATCCCCATTGTTATTTTCCACTGCTCTGCCGTTGTCTCACTGTCCCATCGAAATCTTTGTGCTGCTCTTTCGAAACTCTTCTTCCATAACGCCTGTACTTTGCTCGTCTTCACTCCTCTCCTTTCTAAGACTGCCAGATTGGAGTATATTTCATGTAGTTTACTGTCAAATCCAACCACTCTGTCTGTTTCCCAGTTACCACAGACAAAAGTAGCACATGATCTAGCCAAGCACCCTCTGAGTTTGCCGTCTTTACACCCTAGAACACGTAGGTATTCATGGTAAGACTGATCCGTAAGCAACTTGACTTCTTGCCCCTTAAGATTACATTTAGTGGCAACTTCATTCCAAGCTAAAGCGCAATGCCGTCTATCCCGACC
+TBLASTX ds2020-328_214 30 308 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 34.1 2 100 6.0 2.15313e-12 87.81970000000001 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L GGTCGGGATAGACGGCATTAATATGTTAGGGTTATAAACCTTCACGTTAGAATATGTCAATTTTCCATTGTTAAATAACGCATACGTCTTTGGATTAACTTTAACTTTGATATCCAACTGCCTACCGGACTGTATTATTTCTATCCAATTCTTAGCCCTCTTTATTAAAGTGTGCATTGGCATTACAAACAGGTTTGCTGCTCCAGTCCCTGGTATATCTGGCATTACATGACCATTTGCATTTGCAGCCCAATTTTTGTATTTCTTACCAGTCATCGCATCATACACCGTAGACGTCTATCCCGACC
+TBLASTX ds2020-328_717 8 219 NC_038782 Verticillium dahliae chrysovirus 1 segment 2, complete sequence Verticillium dahliae chrysovirus 1 37.1 1 100 6.0 8.08632e-06 46.43 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGAAGGCCTAGAGTTGAATACATACGAACGATCACCGTGCCTAAAGGTACCTACCACATCACGGGGATTGTACACAACATAGTCTTGAACGTCTAGATCTACATCTATTGCTCCCCTGTCCATGCATTCTAGTAACATCCAGAAGCCTTTCACCAACCGAGTCAACTTAGATTGCCCAACAAAAACGCGCCAATGTCTATCCCGACC
+TBLASTX ds2020-328_351 20 261 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 40.5 1 100 7.0 1.87072e-15 78.9628 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGACGAGGGGCAGTATTGGGACGAACAGTTGCCGAGGTAGTGAACTACTTTGACAACAAATGTTCGAATGCACTTGAGGTTATGGCAGACGATAAATTTAGTGTATCCTATCATACTTACTATGACGTAGATAGGCCAGCTGTGTTGGGTTTGAATACAATGACTGTGAACGTACCGGTATATTGGACGAAGTTACCAGTAAAAATACAGCCTTACACATCAGAGCTTACCAGGGCGTCTATCCCGACC
+TBLASTX ds2020-328_418 18 250 NC_038826 Flammulina velutipes browning virus RdRp gene for RNA-dependent RNA polymerase, complete cds Flammulina velutipes browning virus 40.3 1 100 11.0 1.21395e-11 66.1329 568090 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Flammulina velutipes browning virus AGGTCGGGAAAAGCGATTGGCTTTAGGCGGCGCGAGGGACGGAACATCTTCTCGATAACACGAAGAGCTCTTTTGTAGTGGAAATCCCTTGGAACGTCGTGGTAAGGGAGGTCAGTCTTAAGGAAGTCTTCTTCTCCGGCGGCGGGGTTAGTTGCAGAACGGCGGTAGCCATTGATTGCTTCGTTTGCCAAATCGGGGGGACAGCACTTATAGATTGCCTTCTGACGTCTATCCCGACCGCCGTAATTCA
+TBLASTX ds2020-328_149 24 357 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 44.1 1 100 7.0 3.29805e-16 82.1702 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGGCGGTGTTGTAGCATGTAGCACTGGGACCTGAGGAACAACATTTGTGTGCTGAGGTTGGCGAAAGAAGATTAAATGACGTATCATTTTGGGTTAATGATAGCTTGGGTGGAAGGGAGGATGAAAATGAAGTAATTGGTTCCAGCCTAATAAATACAGATTACCCAGGAACAAAATGCGCCATGGTATACAGCTATGTAGAGGACAAATGGGTAGAAATGAGTAATAAAAATTACGGTGAGTATACAAGGAAAAGCTTCCATGGCGATGTGAGACCTAGTGTACCTTTAAGGCGAACAATGGAAAAAGAACCTGCACCTGTAACTTGGTGCGTCGTCTATCCCGACC
+TBLASTX ds2020-328_591 22 229
+TBLASTX ds2020-328_579 14 230
+TBLASTX ds2020-328_462 6 244 NC_040551 Panax notoginseng virus B isolate YNSL1212, complete genome Panax notoginseng virus B 73.3 1 100 5.0 2.01042e-34 141.737 2248770 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Panax notoginseng virus A GGTCGGGATAGACGGGAGCAATATATGGGGTGGATTTAACTTCGGCAACAGTAGCACACTTTGCCATGTTTAATTGTGAAGAAGCCTTGAAGCATAGGTTCCCGGTAGGTGAAGATGCGGAAGCCGGGCGTGTGCATAAGCGGCTAAAAGCTATGTTAGAAGGATGTGACTCGTACTGCTATGATTTCGATGATTTCAACGCTCAGCACTCGACGTCGAGTATGGTCGCTGTGATAAAGGCGTA
+TBLASTX ds2020-328_867 11 209
+TBLASTX ds2020-328_908 8 207 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 68.4 2 100 8.0 3.53985e-06 185.418 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGATGTTAAGTGCTGGCTGTTGAAGTCCTCAAAGTCTAGACAATATGGCAACCTATTCTTCAAGACACCCGCCACTCTGTTTACTACATTTCTGTCGTTTGCGTCTTTACCTACCGGGAATCTGTTCGGCAAGACGTTCTCGCAATTGTAGAACGCGAAGTTTGCAAGTACGTAACTCGTTCGTCTATCCCGACC
+TBLASTX ds2020-328_7 1825 2116 NC_008038 Prune dwarf virus, complete genome Prune dwarf virus 88.5 19 100 100 0.0 3998.4456999999993 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGTCACCACATCCTCCTTAAAGGGGCATCCTCACCTTACGGTGAGGGCATCTACAAATTTGTAGGCAATAAAAAGTGTCATCCATTCAGGATACAATGGGCATTTTTATCTTAACTTTTAACGCACGCAGTGCAAGTTAACCAAAAGGATTTAACATTCAGTGACAAAATCTGAATGGTGGATTCTATTGCAAAAGCAGCATCTCCAGCTACGAATATTCCTAGGAATACTCATAGTGGAGGTACAATCAAACAACGGATCATATAGTCATCCACTGACTATTTTATCCATTGCATCCATGAGAGCGGTATCCCGTTCAGCGTATAACACTGAATCAGGGATCTCGACTCTCTTGGGCATCGAGTGTTGTAGGTACTGAGTACAGAACCATACCGGAACGCCGGGCTGAAAAGCATTGTCATATTTTATGACAAACCAGAGATCATCTGGTATATCCCCGACGGTCATACCAGTAGGAGCAAGAATTTGCACCCCACTGGCTTGTTTCGCTGTGAACTTCCTACGTTGTAGGGGATTAGGCGCCACTGGCGCATTCACATCGAAACCTTTAATGAGTCCGTAGACACCATTAGAAACATCAAGGCAGTAACGAAAAACAATTCCGTATACCTTGGTATCAGCAGAAAAGTCCTTGAAAAGTTCTCGGACTTTCATGGTGTAGTAAACACCGGAAGCGGTCGAATTGACCGTCAAATTCTCGGTACGAGATATCATACCGGAAAAATTTTTTACGGGCACATTTGGCCCGTGAAGCATCCACTCGGAAACAGACTTCGAGCTTCCACCCGGGAATTGTTTCTTAACAAAACCAGCAGGGGGGGTAGTATTATTATTCTTCCGAGCTAAAGCAAAGCTTTGTGATCGGGTAGTAGGCTTTCCAGATTTAGTGGCTTTCCCAGACATTATGAGAGTATAAACAAACGAGAATTGGAAGAAATTGGTAAACAAAACGAGCTATTAACTCACAAAGTGAGTTAACCAATCGTTACACCAAAAGCTTCCTTGTCGGACTTCTCTTTTTTTAGAGGAACAGACTCGGCTTCCTTGAAACTGTCAAGGGAAGATTTACCCTTTACGGGTACAGCAATATTCTTAAAATCCACTGTTAAAGCCTTCTTTGACTCGTCAGACTTAATTTCAATAAGTCTGGGATTGATATCAACCTTTCCACTACTCCCAATTACCAAACGTGATTTGGCGAATGTTTGGAGTATCTTTACATTGTCCACAGCAGCAAGGGCTTCCGATTTCTCAATCGGGAATCTCAAAGTTGGGTACATTTTCTCATATGGTTTCTTCTTGTGCAATGAGTCATCCCAGAAGGGGTAAACAGTTCCAACAATCGACGCGTGTTTAGCGTCTACACTTACAGCTGATGCTAGTAAACATATACCATCTCCGTCATCAGCATGAACTGCTCTTGGCCATCTCGCTACGAAAATAGCCGCTTCATTCAATGGTGAATCTGTATCTATATCAATAGATTCACCTGTATTCACATTGAAAAGTTTCAATGTCAATACCCCACTAGTTGTTTCCAGAATGGTCGGAATGTACAACAAGTAAATTATACTATGATGCACGTACACATGACCTTTTGCTTTAGCGGATAATCTTGCCAAAGCGCTTCGGGATTCTTTGGATTGCAACTTCATGGGTTGAATTGGAACACCATTCTTCAACTGTAAAGAAAAACATTTCTTAGTTGGAAGATTCTT
CATCATAGTTTGGGAATAAAAGTCATCCACTTCGCTGAGTATTGTATTCCAATCTTCAGCGGAAACTTCAAATGCCGAACTGGTACTGGCTTCGGACGTCTGTCCGGTAATGGTCCTGGATACACCAGAGAAAGCCATATTCAATTCAGGAGATAAATCTACAACCGAATTGTTTCACTCAATAAAATAAAGAGGTTAATGAATAGGAACAAGTCCGATTAGTGAGATAAATCTCAAACGTCACAAACTTGTCTTCTTCACACTTTGCAAGAAACCTTGCAGTAACTCAATTTCTTGAGGGTTTATAGAGAACCGCACGTCTGTCAACTTCCACAGCTTAGCACAACCACGCGTCTATCCCGCCC
+TBLASTX ds2020-328_563 2 233
+TBLASTX ds2020-328_410 21 251 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 78.6 6 100 24.0 7.989507454006384e-19 381.2186 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGGCGGGATAGACGGCTATTGTGGTTGTTCGTATTTTAAAATGGATTCCCTACTTGAGTTTTTGCTACCTTCACATGAAGATGCGATCGAATTGGTTGATGCCAATTCGGTTAAGACTAGCTTCAGCTTGCCTGATTCTAGTGGGGATGTTTCCCCACTTTGTAGGTCGTTGTGTCAGTTCTTCGGATTTCTTATGATCCGAGATACTGTTGTCAGACCTGACAAATTTTCTGGTTTCGTCTATCCCGACC
+TBLASTX ds2020-328_646 23 224
+TBLASTX ds2020-328_537 38 235 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 47.7 1 100 6.0 1.50506e-11 65.6747 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGTTAGCACGGGTTGGAGTAGAGATTCAGTTAGGCAGATAGGTGACGATATGATGCAAACGCTCAGGGTATTGCTTGAGACGGCAGTTGTGGGACAAGAGAAGTTGTGTAGATTAGTTAAAGGGTACCTTTGGCTTCTAGAATGTATGGAAAGAGGTACTATAGATGTTACCGTGGATAGCCAGAATTGTGTAATTTATGGGCCAAATGCGTCTATCCCGACC
+TBLASTX ds2020-328_26 164 872 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 89.0 8 100 65.0 4.21136e-103 1500.4649 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGATAAACTGGGCTTCTCAGCTTGAGTATGCGTAACATACACAGCGGAGGCATCCACCTCAACTTGAGACAGAGCATTTATAGGTTTCACTTTAATAGACCTAAGAATATGTCTTTTTGTCTTAACAGGAGTCTTCTTTCTATAGAAGAACTTAGACAAAGCATATACCGTATCAGCAGGATTTCGGTATGTAATCGTTTGTTTCACATGATCACCTTTCAAAACATGGTGCTTCAGGAGAAACATATCATTCCTGGAAATAAACGGTATTTGTTCAGTGTCACCAAAGGCTATAACCTCTGATAAACCGGCAATTGCGTCTATCCCGACCNNNNNNNNNNGCGGTCGGATAGACGCAGCCCCCTCACCTCTTCTTCAACCTCATCTCCCTCTTTTGTTTCCAGCACCGGCAATTGTGGCAGCAGCATATATGCACCCAGCATGTTGCATGAAACACTCATCAAACAACATCTTCTTTGCCTTGGGAGCATTGTTTGTCATCAGATAGGAATCGCAAGTTCGAATGAACCTGCTTTTAACTAACTGGGATCCCTCAACAGCTTCTTTCAACTCAATTGCAGAAGATCTGTTGGAAGTCAAGAGTAGGTCTATATCATCTCCAACCATGGAGGCAATAGACTTGATCTTGGTAGTTTTTCCACAACCAGCAACACCGTCCATGATTGTGATTGAAAAATCACAATTCATCTTCAAAGCCTTTTCCAGTGAAGGTATAACCTTCTCCACTGATGAGAATACACAAGAGTCATCAACAATGACAATTTCGTATTCTCCGACAGATCGTACGCAGGCAGCGGACACATTTCCGGCATCATCCCACCATTCCGTCTATCCCGACC
+TBLASTX ds2020-328_246 39 291
+TBLASTX ds2020-328_409 6 252 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 48.6 1 100 7.0 7.72171e-14 73.4643 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus ACAGAGGTCTTTCTCGAACGTAAAGCTGCCTAAGGTTGTATCAGGCTACGATCTAATGGTGCCAGCATTTATGCACACAAACTCACAACTAGACAAACCAATACTGTCAATGCAAATGGCCAAATAGATTGGTAGGTTGCATCAAATGCTACTATTCATGAATGTTAAAGACATTCTAACAGCTGCTGAACTAAGCACACATTGAACTTTTGATCGTATTGATAGTAGTAGGTTGATTCGTCTATTCCGACC
+TBLASTX ds2020-328_401 2 253 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 52.1 2 100 8.0 2.658960000000012e-05 135.9315 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B TGGTCGGGATAGACATTGCGCGTCCCTGATTGTCATGCACTAGCACTCTGTCCAGCGATAGTCTGGTCCACTCCACAGCTGCCAGCTGCTCTTGAGTTAAGAAGTGACCAAACGTGTCCCTGTAGGCATCTATTACGGCCTTCATAGATTCCACACTGTGTTGACTGTTGAAATCTTCAAAGTCTACACAGTACTGAGTTCTGCCTTCTAAAACTGACCTCACTCTGATACGAACGTCTCGTCTATCCCGACC
+TBLASTX ds2020-328_374 14 257 NC_003885 Mycovirus FusoV RNA 1, complete sequence Fusarium solani virus 1 45.0 1 100 7.0 3.96088e-05 44.5971 1511847 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Fusarium solani virus 1 GGACGGGATAGACGACGGGCTCGGTTGCTCCAGGTAATTTCCTCCTTCGTAACAAAGTCAGTATATGCCAGACGATGTAAACTTTGTATTCGACAACGACCTCCCGGACGATGATGTGTTGGTTCATCCAGACATCACGGCGTTGGGCTCTCCGTCTTTAAAGACGAGACAACGTCAGTTCCGATCCGGAGCGTTATTTTCTGGTCCCGGTCTCAAAGAGATCGCTCGATATGGTGGTTACTCCGTCTATCCCGACC
+TBLASTX ds2020-328_390 16 254
+TBLASTX ds2020-328_413 6 251
+TBLASTX ds2020-328_58 39 561 NC_043491 Cladosporium fulvum T-1 virus LTR-retrotransposon encoding homologues to retroviral gag, pol, and env genes Cladosporium fulvum T-1 virus 45.8 3 100 6.0 1.5431e-35 185.1108 2052899 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Metavirus;Cladosporium fulvum T-1 virus TGGTCTGGATAGACGCCCGCTGCAAGTTATATGAGAACTGAGCAACATCCATCAACTTTGCCCAATTCCGCTGGTTGGCACTCACATAGTGCCTCAAGTAAAGCTCCAACAAGGCATTCACCCGTTCCGTCTGACCATCTGTCTGAGGGTGAAAGCTAGTTGAGAAGTTCAACTGTGAGCCAAGTAGCTTGAAGAGCTCCGTCCACAGCTTCCCTGTGAAGCGTCTATCCCGCCCNNNNNNNNNNGGTCGGGATGACGGTAGCATACTTGGTGAACCTGTCAACCACCACCAAAATTGAGCCACACCCTTCCGACTTGGGTAGACTCACAATGAAGTCCATGGATAAACTCTCCCATGGTCTGGTTGGAACTGGAAGTGGCTCTAGCAACCCGCCTGGCTGCTTCTGCAATGTCTTGTCTTGTTGGCATACAAGACAAGTCCGCACGAACGAGTCTACATCTTCCCGCATCTGTGGCCAATAATAAGCTTCACTCATCAAGGCTAATGTGCGATGAGTGAAGCTTATTATTGGCCACAGATGGCCACCGTCTATCCCGACC
+TBLASTX ds2020-328_595 8 229
+TBLASTX ds2020-328_692 10 221 NC_038838 Crimson clover cryptic virus 2 isolate IPP_IncarnatSK segment RNA 2, complete sequence Crimson clover cryptic virus 2 53.4 1 100 7.0 1.40883e-16 82.1702 1323528 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Betapartitivirus;Crimson clover cryptic virus 2 CCCCGCTTCCACACCCGCTCACTACTACTCCAAAGTGTATCAAATCTTTACGTCTGTCTTTAACCCAGCTTTGTTCCGCTCCTATCAACGCCGATCCGTTCTCGCCTCAATCGCTCTCGACCCCGTCACCTACCCCGACCGTCACATGAACTTCTTCGATCTCGTTTTCTCCGCTTCCCGCTCCAATCTCGCCGAACTCCGCGCAAACGTCTATCCCGACC
+TBLASTX ds2020-328_51 130 617
+TBLASTX ds2020-328_484 7 242
+TBLASTX ds2020-328_467 20 243 NC_038784 Verticillium dahliae chrysovirus 1 segment 1, complete sequence Verticillium dahliae chrysovirus 1 32.4 1 100 6.0 6.62632e-05 43.6807 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGGTCAGTCCCCCTTTGAAATCAAGCACCTCTAACCTCAGCTTGTTCCCCGTTATTATACCTACCATTTCGGCTCTAGTTACGGAGTTGCCATTACGTGTGACATAAGCCGCATATTCCGTATACTTGTCGCATATGCCTTTCAATTTCTCGGCTTCTTCATCCACTTCTTTATTGAACATCACATCTTCTAAACCACTACACTCACGTGGCTCCGTCGTCTATCCCGACC
+TBLASTX ds2020-328_593 14 229
+TBLASTX ds2020-328_332 10 266
+TBLASTX ds2020-328_724 2 219
+TBLASTX ds2020-328_921 20 206
+TBLASTX ds2020-328_136 40 372 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 59.4 1 100 6.0 7.87159e-34 140.821 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGTCAGACGGTTCTTCAGCGTCTATCCAGACCGCCGTTATTCTAGCAACGGCCGGCACGTTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGGTCTACGCGTAGAAACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_303 4 271
+TBLASTX ds2020-328_706 4 220 NC_003689 Cherry virus A, complete genome Cherry virus A 79.4 3 100 8.0 4.376753333333334e-21 351.4408 42882 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Tymovirales;Betaflexiviridae;Capillovirus;Cherry virus A GGTCGGGATAGACGAAATCATGTGCATTACTCAATGGGTTCTTGAAAACCAATCTTTTCTTGACTGCGCTCCAGAAAGTTAAATCATCATTAGCAAAATGTCTCGGGAAAACAGCTTCAGGGAGCATTGCGCAATTATCCTCCACCTGATCTTTCTGATTTGGCTCATCTTTGAACTGCTTGCTCCATCCGACACCAATCTCGACTAGGTCCACGGCTCT
+TBLASTX ds2020-328_463 6 244 NC_010985 Curvularia thermal tolerance virus RNA1, complete sequence Curvularia thermal tolerance virus 50.0 1 100 7.0 2.06484e-10 62.0091 421976 Viruses;Curvularia thermal tolerance virus GGTCGGGATAGACGATTGCCGTTGCTGAAAATGACGGGCATCAATTGGTTGGGGGATAAGAGCTTTGGTACCACAATTCTGGAAGATGACGAAGGATGTGGGCACCACCTCAGGTCACAGTTTCAACACGTTGATCCAATCTATTTGTACCTTGATGGTGGGCTATGCCGCACTCTTCGACCTGGTTCCTGATGAAGACTGGGATCGGCTCTGGCAGGAGGCGTAGCTCGCGTCTATCCCGACC
+TBLASTX ds2020-328_69 43 528 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 93.7 5 100 42.0 9.0761104e-87 1082.5864000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCATTGACATTAGGTTTGTACTGTCGGAATGAAGCCTCACACACTCTGGATAGAACCTTCGTGTCAACCAGTATGTGTCTTCTGGACACCGCTTCTAAAGAAGGGTGTACTACTGACGTAATATCAGTAGCCATGACCAAAGTTTTTGACTTCAGTTTGGTCAACCAGGCACAGGATCTTCCTGCATTCAACTCAATTCCAGGTTTATACCCGGAGCAATAGGTGATATCGATAATCATGACTCCATGAAAATCGGTTTTCCGCTCGACACGAAAGGCGGCATCACCTAGATCAACAGCATTGTAATGCAAATACTCCATAAGTGTAGAATACTTATGGTCATACCCCAAACAGGGTGCATCGACAAAGTCAAAATAAATTCTGTCTTTGTCCTTGTCCACATGCCAATCCACATTGAAATGATCTATGTGACCCCTGTCCTTAATGTACATCTCGGGATCGATCATAACAGAACAAATGAATTTCATCACGCTTATTTCGTCTATCCCGACC
+TBLASTX ds2020-328_861 4 210
+TBLASTX ds2020-328_2 8845 2632 NC_026260 Sewage-associated circular DNA virus-18 isolate SaCV-18_NZ-BS3994-2012, complete genome Sewage-associated circular DNA virus-18 35.3 1 100 9.0 0.000151579 46.8882 1592085 Viruses;Sewage-associated circular DNA virus-18 CCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCTTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGT
ATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGCTAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTG
+TBLASTX ds2020-328_728 14 218
+TBLASTX ds2020-328_139 20 368
+TBLASTX ds2020-328_711 4 220
+TBLASTX ds2020-328_310 8 270 NC_009890 Black raspberry virus F, complete genome Black raspberry virus F 45.6 1 100 5.0 1.39013e-19 92.709 463392 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Black raspberry virus F GGTCGGGATAGACGTCCGAAGGGTCTACATCTATTACGTCTGGCCTCATTCTGTGTTCACGTTCTTTAACCCAGTCTACTTGACCGTAGCCTCGATTAACAAGTGTATTTAACTCAAACATATCCGTCAGATCAAGTAAGTCCCTAGAGTGTAATGCCTTCAGTGTCACTGATACGTCCATCAGTTGTTCAAGCATTGCGTAGGTGTTTTCACACCACACTTTGTCTGAGTGGGTCAACAATAGAGCACCACAGACCGTCTATCCCGACC
+TBLASTX ds2020-328_891 4 208 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 77.6 1 100 5.0 4.9233e-29 123.409 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGATTTCGGGGGCTAGAAGATAGGGAAGGGCAAATGCATAAATTGTGGCGTGGCTTATATTCCGGGTGGCGAGGCACTACCTGGATAAACACTGTTCTAAATTTCTGCTATGTTCACATAGCGCTGGTGAACCTGGAAAGGATAACAGGGATAAGTGTTGTTTTAATGGTAGGCCACGGCGGCGTCTATCCCGACC
+TBLASTX ds2020-328_317 8 269 NC_030889 Arabidopsis halleri partitivirus 1 gene for RNA dependent RNA polymerase, complete cds Arabidopsis halleri partitivirus 1 50.0 1 100 9.0 6.80502e-15 77.13 1849335 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Arabidopsis halleri partitivirus 1 GGGCGGGATAGACGAATCGTCTCTCGTCCCCAAAGTAGTCTGCCTTTTGTGTCATCATTTAAGTATGTTGCTTGTAGTGTCCAAATGAACATGTTTTCTGCTTGTAATAGAAGCTTGGTAGCTCCGAATACTGCTCGAATTTTGTCAGGTTCATCAGATGCGACAACATGTGAGCGTGCGTGTAACGTGCTCCAATAGTATGGCACTGGCTGACCATCTTTCCAGAATGGAGTTAATCCATCCTTAATAAAGTGGATGAGTGATCGGTT
+TBLASTX ds2020-328_871 4 209
+TBLASTX ds2020-328_518 12 237 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 70.3 1 100 6.0 3.59992e-34 140.821 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGGCTTCTCTACTTGCTTTGTAGTCTGGTACTACGACTTTGTACCACTCTTCGTTCACTTCTGGAACCTTGTCTTTCAATTTCCAAACCATGTTATCTACATCGGGCACTCCTAGCCCGTTGTCTTCAACGCGCCCATGTATTATTGTCTGAGGCAAGTTAAGCCATTTTTCGCCATCTTTTACTCTGCACCAGTGACTTATGCACTGTAGCGTCTATCCCCACC
+TBLASTX ds2020-328_475 6 243
+TBLASTX ds2020-328_693 12 221
+TBLASTX ds2020-328_855 4 210 NC_055143 Rhizoctonia solani ourmia-like virus 1 RNA 1 isolate RsAG2 RNA-dependent RNA polymerase gene, partial cds Ustilago maydis virus H1 64.2 2 100 6.0 1.27988e-11 84.154 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGAGTTGGTGCATTAGAGGCGACGCTAAACCATCGTCGTTTAATGAATTCTCTAGAAACGGAGAATTATTTGTTAGTGGTGATTATGAATCCGCCACTGATAATCTAAACTCTGAGGTCCAACTCGCCATTCTTGACGAGCTGCTGCAGCGCTCTACTTCGGTACCCAGGGGTATCCAGGGCACGCGTCATCCCGACC
+TBLASTX ds2020-328_335 8 266 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 54.7 1 100 5.0 1.69281e-22 102.36 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L GGTCGGGATAGACGGATCGGAGGCATTAAGTAAAGAACAGTCTATGTCACTAGATTGGACAATTGAGTCAATCTCAGACCAAGTGGTAAGGTTTAATGAGTTAGGAAAAACAGAAAGAATAAATGGAACCTTATTAAGCGGATGGCGTCTGACCTCGTTTATCAATACTGTATTAAATAGAGTGTACTTGTTAAACTCAGGACTAAGTACGTGTGTGAACTATGCGTTACACAACGGTGATGAGATGTATGCGTCTATCCCGACCC
+TBLASTX ds2020-328_890 8 208
+TBLASTX ds2020-328_863 22 209
+TBLASTX ds2020-328_109 77 442 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 59.1 1 100 9.0 5.79157e-51 198.097 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L TGAATTACGGCGGTCGGGATAGACGCACATACCCCCTCTTGATATTATCTCATCAAACCTGTTATTCATAGATCGTATCAACTCTCTGTAGTCGTTTGCTGGTGCCATCTCTACCCTGCCATGTACCGCTGTTGACACAGCTCTTGCCAGGTACTGCGAACTCGTTTTGTAACTCGCCCTCGTGTCCACCCGTAAGAACTCACCTATGGTCCCAATATTTGTCTTTGCTAATTGTGCTCTTATCCCTGCGTCCTTTGCTCTTTTAGCCAGCTTCACTGCCTGTGCTACGTTTTGCGTTGTAGCGTACATGTCATCTCCGTTGTGCAGTGCATAGTTCACGCTACTATCTAAGCCAACGCTAACGAGATAAACTCTGTTGAGTATGGTGTTTATGAAAGATGTCAATCTCCACCCACTCAGCAATGTTCCGTCTATCCCGACC
+TBLASTX ds2020-328_93 51 471 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 81.8 6 100 42.0 1.201325e-28 685.9264000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGAATTTTCTGGTGAGTTTATAACGCTTCCTTTCGTTATCGATCGGTTAAGAATGACATTCGATTTGGAGGATGATTATTCATTCTCTATGGGTGATTGTTCATACGATCTGGAACTCACTGATGCTCAACTTGATTATGTTGAAGTTCTTCAACAACAGAAAGATTTCTTTTCAGAAAGTCTTGGTAAGGTTGTTGTCGATTATGATTTTTCCCTTGATAGTGAAGATCCTTCCATCAAGGATGCTGTGAAAATACCCGATGAAATTCCGGAAGATTTCCCTCAGGAAAGTATACCAGCTGAAGTTGTAGCTGATGTTCCACAATCTGTTAGTGATGTCGTCGAAGAGCAAGTCGTGGCTGGAGAGTTGATACCTAGCTGCGAAACTGTCAATGAGAATGTTTGTGTGGAAGTTAAATACCCCACAAGCCTTATCCCTAGATTCCGTCTATCCCGACC
+TBLASTX ds2020-328_388 4 255 NC_004049 Ophiostoma mitovirus 3a, complete genome Ophiostoma mitovirus 3a 50.0 1 100 9.0 1.0261e-20 96.3747 198597 Viruses;Orthornavirae;Lenarviricota;Howeltoviricetes;Cryppavirales;Mitoviridae;Mitovirus;Ophiostoma mitovirus 3a ATAGTACGATAAAACATCTTTCTGAAAACGGATCGGTAAACGATCTGTAGCAGAGGATAAATCAAAGCTGTGGAATTGGTGGTCACCCAACATGCCTAATAACTTTTTATTTAGAAGAGAAATCAAAGGGGCACCTTGATTAAAGGTACCATCCTGTTGAATTCTTCTTAAAATAGAGAAGATATAATCATGAAGGGGCTTTAATATGGATTGTGTTACACAATCAGTAATAGCAAAGGAGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_533 4 236 NC_004049 Ophiostoma mitovirus 3a, complete genome Ophiostoma mitovirus 3a 37.3 1 100 7.0 2.62461e-06 48.2628 198597 Viruses;Orthornavirae;Lenarviricota;Howeltoviricetes;Cryppavirales;Mitoviridae;Mitovirus;Ophiostoma mitovirus 3a GGTCGGGATAGACGAACCCGTCCCCTGGTCGGGATAGACGCCGAGTGTGGATGAACGTCTATCGAGAGTCGATCTCAAACCATTTGCACTTCGTGTACATTCTTTATGACGTTTGTCCGGGAAGAAATTCCTGGTCTTATATCTAAAAGATTGTCACCTCGTGTTAATGAAGTTTGTAGCCGGGGATCCTATTCAGGTTATACCTAATAGACCTCTGAAACATAGTGGCGGCCGTT
+TBLASTX ds2020-328_830 7 211 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 74.4 3 100 21.0 1.2368933870666668e-13 289.1245 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCTTACCTTCCCATGGTGAGGTTAATTACTTTTCTGAGTACTTGAAAGGTAAAGCGATCGATGATGATGATCTATACGTTGATCCTATTTGTTTAGTTTCTATGGATAAGTATAGACATATGATAAAATCCCAACTTACACCAGTTGAAGATAACAGTATGATGTTTGAGAGGCCTCTGGCAGCCGTCTATCCCGGCC
+TBLASTX ds2020-328_62 44 551 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 58.1 2 100 8.0 1.13315e-41 187.709 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GGTCGGGATAGACGTGAAGATCAGGTATACGCAGCTTTATGGACAGCAGAATCTGTGGGTAGACAGGTAATACACGATAATGTAGGTACAAAACAAACTTACCTAGCTAAAGATACACTACTATCAGGATGGCGCCTAACCACGTTCATGAACAGCGTTCTTAACTATATATACTCTAAAGCCATAAGTCAAAATATGCTTAAAAGAGGAAACAGTCTTCATAATGGAGATGATGTTCTAATAGGGACGAAGAACTTTGAAGCGGTGCGGAGGGGTCTAGAAATGGCTAACAGGCCTATGACCTCTATCCCGACCNNNNNNNNNNTGAATTAGGCGGTCGGGATAGACGACTGTTTGCGCTGGTCGGGATAGACGCAGCTCACCCCTGGTCGGGATAGACGCGACACAGGGGTCTAGAAATGGCTAAGAGGCTAAACGTAAGGGTGCAAAGCACTAAATGTGCCTTTGCTGGAATAGCTGAATTTTTAAGAGTAGACCATAAACGGGGCAGCAAGGGCCAGTATCAACAAGAAACTGCGTCTATCCCGACC
+TBLASTX ds2020-328_631 4 226
+TBLASTX ds2020-328_253 7 287 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 79.7 3 100 27.0 2.2710920824666668e-33 432.08500000000004 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCTTGTCGTTGTTGGTTTAGGCTATTTCTAGTCTGAAATCATTATTTGCTAATAAGAAGAAATGCAAGGACTTCTTATTTCCTGGGTTAAGAGATAAAAACTCAGATTTGCCCATGAGTATGGGTGCCCCTTTAAATATACGGGATGTTACCTCTAAAAGAATTAGAGGTAAAAAGAAGATGAAAGAGAATTCTCATGTTCATATAGATGGTAAGGTCGGTGGATGACCATACTATCTATTATTGTATACCTCCATATCGTCTACCCCGACC
+TBLASTX ds2020-328_487 16 241 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 45.3 1 100 5.0 1.31892e-09 59.2598 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGATGCCAAGTAATATATCATCAGATGCAATATCGGGTCTAGCAGAAGACCTAAAATGGAGAGTGGAGCCTGGGAGTGTGAGTGAAAGAGAGGTCAACATTGAAGATAGCAGATGGCTAATATTAGCAGCAATGGCACCAAAAGCAAACTTTGACGTAGAACAATTAAAGTTGCTTTGTAAGCACTTTAATGTACCTATAGACATGCGAACGGTGCGTCTATCCCGACC
+TBLASTX ds2020-328_545 10 235
+TBLASTX ds2020-328_491 11 241
+TBLASTX ds2020-328_405 6 252
+TBLASTX ds2020-328_688 2 222 NC_024705 Cladosporium cladosporioides virus 1 segment RNA2 hypothetical protein gene, complete cds Cladosporium cladosporioides virus 1 46.4 1 100 9.0 1.78828e-11 65.2165 1529605 Viruses;Cladosporium cladosporioides virus 1 GGTCGGGATAGACGGCGCGTTCGTATGAAGCAAGAGCAGGATTGCAGTCCGTAAGAGCAATTCTTGAGCCAGCCATAGCGATTCTGCATGCGTGCAGGTACGATCCCGTGTTGCTCGCTTTCGTAGACAAATATGGTAGGAAAATGTACGACATTGCAGCTAGAACAAAACACGTGCTTGTTGCGTTTTCGTACGTCCATTGCAGAGGTTCCCAGCCCCCCT
+TBLASTX ds2020-328_207 36 313 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 48.9 1 100 6.0 6.03013e-30 127.533 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B AACGGCCGCCACTAATCCGTCTTGGTTGATGTAGACTTAAGAAAGTTCTTTGAGCTGGAAGTTCTTGTCAACAGAGTGGATGGACTGGTCAACTGGGAGGAGGAGCACAAGAACAGGGTGTCCCCTAACTTGGCCGAGATGCCGGAGGGATTGGTTTATGAAAGGGCCTCGCAGCTCTTCAGTAGATCGATCTCAGCGGGTAAGAGACCGAGGAAGTTTGATTGGCGGGAGTACTGGCAGAGTAGGTGGCAGTGGAGTGCGGCCGGCAGCATACACTCGCAATATTCAGAAAACGAAAGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_118 104 424
+TBLASTX ds2020-328_170 40 343 NC_038698 Tuber aestivum virus 1 capsid protein and RNA polymerase genes, complete cds Tuber aestivum virus 1 51.4 2 100 7.0 9.9289e-26 133.1825 927810 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Tuber aestivum virus 1 GGTCGGGAAAGACGGTGCGTGTGGGTATTATCTAGGTTGTTCCCAATTGGTGAAGCAGCGACGGACGAGAATGTCAGACCTACGGTACGCTAAGTTCTACGTAACGGGCAGCCATTTTGTTTCGATTATGAAGATTTCAATTCACAGCATAGCAACAGTTCGATGCAAGCGGTACTTGACGCCTATCTCTTGGTTTTTAAAGACTATTTAAGCGAGGAGCAGGTGGAAGCTATGTCATGGTCAGTGAATAGTCTTAATGATGTTAAGATAAAGCAGCCTAATGGCGACTGGTATGAGGCACGAGGGACACTATTATCAGGCTGGAGAGCCGTCTATCCCGACC
+TBLASTX ds2020-328_188 22 325 NC_003823 Ustilago maydis virus H1, complete genome Ustilago maydis virus H1 52.6 1 100 5.0 2.11696e-28 122.467 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGAGGGGTAAAGGTAGATTGGGAAAAAGAACTCGGTAATAAAGCAACGCCACCAGATGAAGTAGTAGGCTATGCAAATGGAGTTTTTAGTAGACATGCTGCTGATGAAATTATCGGTCAGGCTATAAAAGATGTTGTTACCACAGCTTTTCCACACGCAGTACCAGCTAAGTTCAGTGATTTTATGGACGATGCATATGAGTGGTTGGTTTCTGGATCATCAGCTGGTATACCGAGAGCACTTAAGAATTCGTCAATGAGGACTTATATCCTAAAAGACTTGGGTCTACATACCAAGGGCGTCTATCCCGACC
+TBLASTX ds2020-328_716 13 219 NC_017991 Botrytis porri RNA virus 1 RNA 2, complete genome Botrytis porri botybirnavirus 1 67.2 3 100 7.0 5.963458525815334e-08 193.8168 1918014 Viruses;Orthornavirae;Botybirnavirus;Botrytis porri botybirnavirus 1 GGTCGGGATAGACGGCCGTAGCTTCTCTTTTTGGGAATAATTTTTATTGTAAAAATGATTATTTCAGATAATCCCCGTCAGGGTTAGAAGACACGCGGACGGATTGACGAACGTACGTGCAAGAAAGTCACATCTATTGGATTACTCTAAATGGAACCTCGGACACTCACAAACCGCCTTGTCAGGATATCAGCGGCTGCGAATAGACGTGTGGAACTC
+TBLASTX ds2020-328_251 22 288
+TBLASTX ds2020-328_510 16 238
+TBLASTX ds2020-328_98 46 458 NC_033468 Wuhan insect virus 27 strain WHZM10130 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 27 63.2 1 100 9.0 1.2276e-59 226.964 1923731 Viruses;Wuhan insect virus 27 AACGGCCGCCACTCTTGGGTGTCTATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTACGTCTATCCCGACC
+TBLASTX ds2020-328_226 10 300 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 47.3 1 100 6.0 3.23633e-27 118.369 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGCTATCGAGATAAATTTATTCTTCAACCTTATATCTGATTTATGTATAAATTGTTCGTCAGTTTTATATTGTGAATGGATACTCCCAGAAGCACTCCACTGCCATCTGTTGGTCCAAAATTTTTCCCAAGACATCACCATAGGAGTTCTCCCGCTAACTGCTGCACTCGCGAAGATTTTAAGTGCTTCATTCTGGATATAATCAGCACTTAGCTTGACTGTTGACGCTTTTGTTCTATGTGTGAACTCAGCTTCCCAATCGAGCGCGCCGTAACGTCTATCCCGACC
+TBLASTX ds2020-328_159 47 348 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 97.0 3 100 27.0 2.5280226430549335e-55 668.0630000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGGTCGGGATAGACGGCAGATACCACTCGAACGTGGTTGTTCGTATTTTAAATCAATCATGACTTCTTCCGAGATCACTGCTGCCAATGTCCATGAACTTTTGGTTAAAGTTCTGGAAAAGCAATGCGCTGACGAGACCACTACCGTCGGTAAGGCTTTCTCTGAGAAAGCAAAACAGTCTTTGAATAAGACATTCGGACTAAATGACGAGTCCAAGCAACTGAAGATTTCTTTTGATTTGACGGCTGAACAGCAGGCGTTACTCAAGAGACATTTTCCGGGTCGATCGGTGATTTTTTCAAATTCATCGAGTTCCTCACACAGTTATGCAGCGCGTCTATCCCGACC
+TBLASTX ds2020-328_166 24 346 NC_005980 Helminthosporium victoriae 145S virus Helminthosporium victoriae 145S virus 26.8 1 100 8.0 1.12841e-07 53.7613 164750 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Chrysovirus;Helminthosporium victoriae 145S virus GGGTCGGGATAGACGTTAACTGCCCATACCAACCATGTTTGCTAGCCTTGCAACGTCAGCTATTTCCTGCCAAGTGTCGACAGCTGCCTCATCTCGCAGCCTATTGTATATCACTGCCTCATCTGCGGTTGTGCAATAACCACGTATACGTAAGTTCTGCACTAATGCATGTATTCCACAAGTACCATCTCCTTTTGTGTTAACTTCTGTCACTATTATTTTGTCCTCCTCTACTGGCATTGGCTCATCTTTGACCAACTTTGACTCTGTGCCTTTGTCTTTCAGTTCATATGAACTACCTAGCATTTCCTCACCATTTACGCCTTTGACATAAACTGGCGATGGT
+TBLASTX ds2020-328_97 31 461 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 52.1 2 100 14.0 1.888695e-05 241.7778 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A AACGGCCGCCACTAAATTGTCCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGGGCCTGAAGGTGTCTCTGTACGCATCTATCACTGTTTTCATTGACTGTACACTATGTTGACTGTT
+TBLASTX ds2020-328_750 10 216
+TBLASTX ds2020-328_92 33 472 NC_033465 Wuhan insect virus 26 strain WHZM10161 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 26 38.6 1 100 10.0 6.24209e-27 118.369 1923730 Viruses;Wuhan insect virus 26 CGTCATTGAGGAACAAATACTACTCGAGACAATGCGAGCGATTGCACATGACAGTTTCGGACTGTTATAAAATAAAGACCTCCCACAGGTGTGTGGGGGGCATAAGTGAAGACAAGAGATCGGACGTAAAGTGGATGATACGGTCGTCGGGCTTCAGGAAGGGTGCCACGCAGATAGGCGTGTTACCGGGAGTGGTGGACTACTCCAGGATGGTGAAAGCATCACTACAACTTGAAAGACCTTTGCAGGATTTCATTTCACGAATAATGCGCGCAACATACGACGCGGTGATACCAAAAGAAAGGAACATAAACGTTTCAAGGAATGGTAACATCAAGCGGTACGAGATTTTGCGAGCGTTATTCAAGGTACACAAAGAAGAAACAGACATAGTCAATTACGGAAAAGCCAAAATGACCGGCTTCCTGATGGACGTGTTGAATGGGACCAATTATTCATAGTGGCGGCCGTT
+TBLASTX ds2020-328_825 7 211
+TBLASTX ds2020-328_896 2 208 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 41.8 1 100 7.0 8.29721e-08 52.8449 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGGGGGCCTTCTTTCACTCCACACCCCCCATGCACAGGCAACAAAGAAAAAGATGAGACTGGGAACATCGACGACCATCGGTGGAACTCTTTTCGGAGGTCCACTTACCCCGGCGGCGGCTTGGGCCCACGACCAGACAAGGTCTACCTGGGCAAAGTACCTCAAAGAAACGGACGCCAGTCGTCTATCCCGACC
diff --git a/tools/virAnnot/test-data/rps_test.tab b/tools/virAnnot/test-data/rps_test.tab
new file mode 100644
index 00000000000..35049d94a7a
--- /dev/null
+++ b/tools/virAnnot/test-data/rps_test.tab
@@ -0,0 +1,105 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom
+ds2020-267_120 339 pfam01333 gnl|CDD|366578 0.000848733 197 325 -3 pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034. Eukaryota(19);Bacteria(1)
+ds2020-267_374 242 pfam00124 gnl|CDD|365890 5.09126e-07 21 125 3 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Bacteria(9);Eukaryota(6);Viruses(4);unclassified sequences(1)
+ds2020-267_471 230 pfam00201 gnl|CDD|278624 3.12575e-07 46 210 1 pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. Eukaryota(20)
+ds2020-267_710 213 pfam01127 gnl|CDD|366480 0.000723904 46 210 1 pfam01127, Sdh_cyt, Succinate dehydrogenase/Fumarate reductase transmembrane subunit. This family includes a transmembrane protein from both the Succinate dehydrogenase and Fumarate reductase complexes. Bacteria(20)
+ds2020-267_692 214 pfam00680 gnl|CDD|366242 4.79875e-05 70 180 1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_817 208 pfam05656 gnl|CDD|377540 3.45664e-06 86 190 -1 pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function. Bacteria(17);unclassified sequences(2);Archaea(1)
+ds2020-267_98 379 pfam16203 gnl|CDD|374428 1.33948e-30 131 280 -1 pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases. Bacteria(11);Eukaryota(6);Archaea(2);unclassified sequences(1)
+ds2020-267_21 858 pfam00680 gnl|CDD|366242 8.36679e-11 295 729 -1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_261 260 pfam01051 gnl|CDD|376444 1.77523e-19 26 217 -2 pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene. Bacteria(19);unclassified sequences(1)
+ds2020-267_773 210 pfam01641 gnl|CDD|376583 5.23903e-34 16 174 1 pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity. Bacteria(18);Archaea(1);unclassified sequences(1)
+ds2020-267_287 256 pfam00115 gnl|CDD|376293 2.8946e-26 13 237 1 pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. Eukaryota(18);Bacteria(2)
+ds2020-267_139 320 pfam05860 gnl|CDD|368641 1.34887e-13 167 298 2 pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins. Bacteria(20)
+ds2020-267_763 211 pfam00557 gnl|CDD|376349 0.000231782 167 298 2 pfam00557, Peptidase_M24, Metallopeptidase family M24. This family contains metallopeptidases. It also contains non-peptidase homologs such as the N terminal domain of Spt16 which is a histone H3-H4 binding module. Bacteria(18);Archaea(2)
+ds2020-267_571 221 pfam00501 gnl|CDD|366135 2.61467e-07 34 201 1 pfam00501, AMP-binding, AMP-binding enzyme. Bacteria(17);Eukaryota(2);unclassified sequences(1)
+ds2020-267_565 222 pfam03950 gnl|CDD|377172 9.52435e-10 53 184 -3 pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln). Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_427 235 pfam03154 gnl|CDD|367360 0.000552392 53 184 -3 pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity. Eukaryota(20)
+ds2020-267_4 2297 pfam00680 gnl|CDD|366242 4.43825e-05 995 1510 -2 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_16 1165 pfam00680 gnl|CDD|366242 8.1737e-06 707 1042 -1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_438 234 pfam00078 gnl|CDD|365856 0.000870142 707 1042 -1 pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. Eukaryota(16);Viruses(4)
+ds2020-267_370 242 pfam00146 gnl|CDD|376297 2.41391e-10 22 111 1 pfam00146, NADHdh, NADH dehydrogenase. Bacteria(14);Eukaryota(3);Archaea(2);unclassified sequences(1)
+ds2020-267_278 258 pfam00012 gnl|CDD|365808 4.1355e-19 50 232 2 pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region. Bacteria(15);Eukaryota(4);Viruses(1)
+ds2020-267_364 243 pfam00216 gnl|CDD|365952 1.5507e-10 134 241 -3 pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein. Bacteria(19);unclassified sequences(1)
+ds2020-267_558 222 pfam03737 gnl|CDD|377116 4.93695e-13 57 179 -2 pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions. Bacteria(19);unclassified sequences(1)
+ds2020-267_218 274 pfam01348 gnl|CDD|279664 1.66328e-05 51 257 3 pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X. Eukaryota(15);Bacteria(5)
+ds2020-267_363 243 pfam00416 gnl|CDD|366086 2.02528e-05 15 134 -2 pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes. Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_746 211 pfam01490 gnl|CDD|279788 0.000177299 15 134 -2 pfam01490, Aa_trans, Transmembrane amino acid transporter protein. This transmembrane region is found in many amino acid transporters including UNC-47 and MTR. UNC-47 encodes a vesicular amino butyric acid (GABA) transporter, (VGAT). UNC-47 is predicted to have 10 transmembrane domains. MTR is a N system amino acid transporter system protein involved in methyltryptophan resistance. Other members of this family include proline transporters and amino acid permeases. Eukaryota(20)
+ds2020-267_145 315 pfam02626 gnl|CDD|376868 3.97676e-05 140 256 -3 pfam02626, CT_A_B, Carboxyltransferase domain, subdomain A and B. Urea carboxylase (UC) catalyzes a two-step, ATP- and biotin-dependent carboxylation reaction of urea. It is composed of biotin carboxylase (BC), carboxyltransferase (CT), and biotin carboxyl carrier protein (BCCP) domains. The CT domain of UC consists of four subdomains, named A, B, C and D. This domain covers the A and B subdomains of the CT domain. This domain covers the whole length of KipA (kinase A) from Bacillus subtilis. It can also be found in S. cerevisiae urea amidolyase Dur1,2, which is a multifunctional biotin-dependent enzyme with domains for urea carboxylase and allophanate (urea carboxylate) hydrolase activity. Bacteria(19);unclassified sequences(1)
+ds2020-267_637 217 pfam07026 gnl|CDD|284449 1.36077e-13 47 172 2 pfam07026, DUF1317, Protein of unknown function (DUF1317). This family consists of several hypothetical bacterial and phage proteins of around 60 residues in length. The function of this family is unknown. Bacteria(20)
+ds2020-267_557 222 pfam00421 gnl|CDD|366090 3.32623e-20 12 200 -2 pfam00421, PSII, Photosystem II protein. Eukaryota(13);Bacteria(7)
+ds2020-267_117 344 pfam00252 gnl|CDD|376306 7.27175e-23 107 295 2 pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_352 245 pfam00946 gnl|CDD|366381 3.23548e-05 1 141 1 pfam00946, Mononeg_RNA_pol, Mononegavirales RNA dependent RNA polymerase. Members of the Mononegavirales including the Paramyxoviridae, like other non-segmented negative strand RNA viruses, have an RNA-dependent RNA polymerase composed of two subunits, a large protein L and a phosphoprotein P. This is a protein family of the L protein. The L protein confers the RNA polymerase activity on the complex. The P protein acts as a transcription factor. Viruses(20)
+ds2020-267_97 380 pfam04879 gnl|CDD|368171 1.9903e-08 125 274 -2 pfam04879, Molybdop_Fe4S4, Molybdopterin oxidoreductase Fe4S4 domain. This domain is found in formate dehydrogenase H for which the structure is known. This first domain (residues 1 to 60) of Structure 1aa6 is an Fe4S4 cluster just below the protein surface. Bacteria(19);unclassified sequences(1)
+ds2020-267_2 2436 pfam02123 gnl|CDD|280316 2.17343e-21 184 1476 1 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_595 219 pfam02123 gnl|CDD|280316 5.90575e-11 13 210 1 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_622 217 pfam01370 gnl|CDD|366597 1.5719e-08 50 172 2 pfam01370, Epimerase, NAD dependent epimerase/dehydratase family. This family of proteins utilize NAD as a cofactor. The proteins in this family use nucleotide-sugar substrates for a variety of chemical reactions. Bacteria(17);unclassified sequences(2);Archaea(1)
+ds2020-267_214 276 pfam00070 gnl|CDD|365851 1.70856e-05 135 254 3 pfam00070, Pyr_redox, Pyridine nucleotide-disulphide oxidoreductase. This family includes both class I and class II oxidoreductases and also NADH oxidases and peroxidases. This domain is actually a small NADH binding domain within a larger FAD binding domain. Eukaryota(12);Bacteria(5);unclassified sequences(2);Archaea(1)
+ds2020-267_610 218 pfam17759 gnl|CDD|380005 1.47034e-13 25 195 1 pfam17759, tRNA_synthFbeta, Phenylalanyl tRNA synthetase beta chain CLM domain. This domain corresponds to the catalytic like domain (CLM) in the beta chain of phe tRNA synthetase. Bacteria(17);Archaea(2);unclassified sequences(1)
+ds2020-267_94 386 pfam01347 gnl|CDD|366585 0.000224462 25 195 1 pfam01347, Vitellogenin_N, Lipoprotein amino terminal region. This family contains regions from: Vitellogenin, Microsomal triglyceride transfer protein and apolipoprotein B-100. These proteins are all involved in lipid transport. This family contains the LV1n chain from lipovitellin, that contains two structural domains. Eukaryota(20)
+ds2020-267_323 250 pfam00227 gnl|CDD|365960 5.8155e-09 10 150 -2 pfam00227, Proteasome, Proteasome subunit. The proteasome is a multisubunit structure that degrades proteins. Protein degradation is an essential component of regulation because proteins can become misfolded, damaged, or unnecessary. Proteasomes and their homologs vary greatly in complexity: from HslV (heat shock locus v), which is encoded by 1 gene in bacteria, to the eukaryotic 20S proteasome, which is encoded by more than 14 genes. Recently evidence of two novel groups of bacterial proteasomes was proposed. The first is Anbu, which is sparsely distributed among cyanobacteria and proteobacteria. The second is call beta-proteobacteria proteasome homolog (BPH). Eukaryota(8);Bacteria(7);Archaea(5)
+ds2020-267_168 298 pfam13546 gnl|CDD|379252 0.000766911 10 150 -2 pfam13546, DDE_5, DDE superfamily endonuclease. This family of proteins are related to pfam00665 and are probably endonucleases of the DDE superfamily. Transposase proteins are necessary for efficient DNA transposition. This domain is a member of the DDE superfamily, which contain three carboxylate residues that are believed to be responsible for coordinating metal ions needed for catalysis. The catalytic activity of this enzyme involves DNA cleavage at a specific site followed by a strand transfer reaction. Bacteria(18);unclassified sequences(2)
+ds2020-267_636 217 pfam13812 gnl|CDD|316342 0.000111468 16 123 -2 pfam13812, PPR_3, Pentatricopeptide repeat domain. This family matches additional variants of the PPR repeat that were not captured by the model for pfam01535. In the case of the Arabidopsis protein UniProtKB:Q66GI4, the repeated helices in this N-terminal region, of protein-only RNase P (PRORP) enzymes, form the pentatricopeptide repeat (PPR) domain which enhances pre-tRNA binding affinity. PROPRP enzymes process precursor tRNAs in human mitochondria and in all tRNA-using compartments of Arabidopsis thaliana. Eukaryota(20)
+ds2020-267_486 228 pfam17035 gnl|CDD|374956 5.12677e-09 108 203 3 pfam17035, BET, Bromodomain extra-terminal - transcription regulation. The BET, or bromodomain extra-terminal domain, is found on bromodomain proteins that play key roles in development, cancer progression and virus-host pathogenesis. It interacts with NSD3, JMJD6, CHD4, GLTSCR1, and ATAD5 all of which are shown to impart a pTEFb-independent transcriptional activation function on the bromodomain proteins. Eukaryota(20)
+ds2020-267_599 219 pfam05717 gnl|CDD|377551 3.2952e-06 28 147 1 pfam05717, TnpB_IS66, IS66 Orf2 like protein. This protein is found in insertion sequences related to IS66. The function of these proteins is uncertain, but they are probably essential for transposition. Bacteria(19);unclassified sequences(1)
+ds2020-267_837 207 pfam04061 gnl|CDD|367791 2.43363e-18 1 159 1 pfam04061, ORMDL, ORMDL family. Evidence form suggests that ORMDLs are involved in protein folding in the ER. Orm proteins have been identified as negative regulators of sphingolipid synthesis that form a conserved complex with serine palmitoyltransferase, the first and rate-limiting enzyme in sphingolipid production. This novel and conserved protein complex, has been termed the SPOTS complex (serine palmitoyltransferase, Orm1/2, Tsc3, and Sac1). Eukaryota(20)
+ds2020-267_516 225 pfam00115 gnl|CDD|376293 0.000272517 1 159 1 pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. Eukaryota(18);Bacteria(2)
+ds2020-267_529 224 pfam00510 gnl|CDD|366140 6.14777e-23 35 211 2 pfam00510, COX3, Cytochrome c oxidase subunit III. Bacteria(15);Eukaryota(3);unclassified sequences(1);Archaea(1)
+ds2020-267_230 268 pfam00115 gnl|CDD|376293 1.95663e-15 81 236 -3 pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. Eukaryota(18);Bacteria(2)
+ds2020-267_444 233 pfam00680 gnl|CDD|366242 0.00060937 81 236 -3 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_336 248 pfam00113 gnl|CDD|365883 4.23282e-13 15 116 -1 pfam00113, Enolase_C, Enolase, C-terminal TIM barrel domain. Bacteria(17);Archaea(2);unclassified sequences(1)
+ds2020-267_365 243 pfam13041 gnl|CDD|372443 0.000129396 15 116 -1 pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR. Eukaryota(20)
+ds2020-267_75 425 pfam00005 gnl|CDD|365804 4.26261e-07 129 275 -1 pfam00005, ABC_tran, ABC transporter. ABC transporters for a large family of proteins responsible for translocation of a variety of compounds across biological membranes. ABC transporters are the largest family of proteins in many completely sequenced bacteria. ABC transporters are composed of two copies of this domain and two copies of a transmembrane domain pfam00664. These four domains may belong to a single polypeptide as in CFTR, or belong in different polypeptide chains. Bacteria(19);unclassified sequences(1)
+ds2020-267_8 1703 pfam00680 gnl|CDD|366242 2.85682e-13 685 1458 -3 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_114 347 pfam00471 gnl|CDD|376336 8.05888e-12 132 302 3 pfam00471, Ribosomal_L33, Ribosomal protein L33. Bacteria(20)
+ds2020-267_589 219 pfam12161 gnl|CDD|378823 0.0004347 132 302 3 pfam12161, HsdM_N, HsdM N-terminal domain. This domain is found at the N-terminus of the methylase subunit of Type I DNA methyltransferases. This domain family is found in bacteria and archaea, and is typically between 123 and 138 amino acids in length. The family is found in association with pfam02384. Mutations in this region of EcoKI methyltransferase abolish the normally strong preference of this system for methylating hemimethylated substrate. The structure of this domain has been shown to be all alpha-helical. Bacteria(20)
+ds2020-267_206 279 pfam03947 gnl|CDD|377170 2.63457e-16 155 265 2 pfam03947, Ribosomal_L2_C, Ribosomal Proteins L2, C-terminal domain. Bacteria(15);Archaea(4);Eukaryota(1)
+ds2020-267_316 251 pfam02123 gnl|CDD|280316 3.50628e-08 28 228 -3 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_697 214 pfam00378 gnl|CDD|334046 5.08319e-08 45 170 -3 pfam00378, ECH_1, Enoyl-CoA hydratase/isomerase. This family contains a diverse set of enzymes including: enoyl-CoA hydratase, napthoate synthase, carnitate racemase, 3-hydroxybutyryl-CoA dehydratase and dodecanoyl-CoA delta-isomerase. Bacteria(17);unclassified sequences(2);Archaea(1)
+ds2020-267_318 251 pfam00252 gnl|CDD|376306 5.63854e-12 78 206 -1 pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_20 893 pfam02874 gnl|CDD|367225 7.30466e-19 126 329 3 pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella. Bacteria(17);Eukaryota(2);Archaea(1)
+ds2020-267_329 249 pfam13173 gnl|CDD|379049 4.80752e-08 106 249 1 pfam13173, AAA_14, AAA domain. This family of domains contain a P-loop motif that is characteristic of the AAA superfamily. Bacteria(19);Archaea(1)
+ds2020-267_130 330 pfam00680 gnl|CDD|366242 7.64962e-05 124 282 1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_280 257 pfam01788 gnl|CDD|366811 2.47901e-09 132 224 -1 pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain. Eukaryota(17);Bacteria(3)
+ds2020-267_100 376 pfam00401 gnl|CDD|366077 8.90041e-05 87 218 -3 pfam00401, ATP-synt_DE, ATP synthase, Delta/Epsilon chain, long alpha-helix domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. This subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213). Bacteria(18);unclassified sequences(2)
+ds2020-267_436 234 pfam00155 gnl|CDD|365910 0.000283584 87 218 -3 pfam00155, Aminotran_1_2, Aminotransferase class I and II. Bacteria(19);Archaea(1)
+ds2020-267_210 276 pfam17919 gnl|CDD|375430 6.42624e-11 52 237 1 pfam17919, RT_RNaseH_2, RNase H-like domain found in reverse transcriptase. Eukaryota(20)
+ds2020-267_58 476 pfam03641 gnl|CDD|367590 7.19579e-14 142 315 -3 pfam03641, Lysine_decarbox, Possible lysine decarboxylase. The members of this family share a highly conserved motif PGGXGTXXE that is probably functionally important. This family includes proteins annotated as lysine decarboxylases, although the evidence for this is not clear. Bacteria(17);Eukaryota(2);unclassified sequences(1)
+ds2020-267_466 230 pfam00072 gnl|CDD|333815 5.42419e-08 50 208 2 pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain. Bacteria(20)
+ds2020-267_118 343 pfam00421 gnl|CDD|366090 7.68219e-41 92 337 -1 pfam00421, PSII, Photosystem II protein. Eukaryota(13);Bacteria(7)
+ds2020-267_643 216 pfam00078 gnl|CDD|365856 0.000675747 92 337 -1 pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. Eukaryota(16);Viruses(4)
+ds2020-267_5 2029 pfam00680 gnl|CDD|366242 0.000288253 92 337 -1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(20)
+ds2020-267_506 226 pfam05173 gnl|CDD|377479 2.45773e-17 93 215 -3 pfam05173, DapB_C, Dihydrodipicolinate reductase, C-terminus. Dihydrodipicolinate reductase (DapB) reduces the alpha,beta-unsaturated cyclic imine, dihydro-dipicolinate. This reaction is the second committed step in the biosynthesis of L-lysine and its precursor meso-diaminopimelate, which are critical for both protein and cell wall biosynthesis. The C-terminal domain of DapB has been proposed to be the substrate- binding domain. Bacteria(19);unclassified sequences(1)
+ds2020-267_315 251 pfam13426 gnl|CDD|379177 0.000472059 32 241 2 pfam13426, PAS_9, PAS domain. Bacteria(19);unclassified sequences(1)
+ds2020-267_227 272 pfam00873 gnl|CDD|334294 2.32215e-15 36 245 -1 pfam00873, ACR_tran, AcrB/AcrD/AcrF family. Members of this family are integral membrane proteins. Some are involved in drug resistance. AcrB cooperates with a membrane fusion protein, AcrA, and an outer membrane channel TolC. The structure shows the AcrB forms a homotrimer. Bacteria(20)
+ds2020-267_639 216 pfam00033 gnl|CDD|306530 3.68894e-05 2 118 2 pfam00033, Cytochrome_B, Cytochrome b/b6/petB. Eukaryota(16);Bacteria(4)
+ds2020-267_407 239 pfam00177 gnl|CDD|365924 1.14399e-06 28 126 1 pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes. Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_457 231 pfam00481 gnl|CDD|366121 0.000499491 28 126 1 pfam00481, PP2C, Protein phosphatase 2C. Protein phosphatase 2C is a Mn++ or Mg++ dependent protein serine/threonine phosphatase. Eukaryota(20)
+ds2020-267_402 239 pfam06122 gnl|CDD|368759 0.000851192 28 126 1 pfam06122, TraH, Conjugative relaxosome accessory transposon protein. The TraH protein is thought to be a relaxosome accessory component, also necessary for transfer but not for H-pilus synthesis within the conjugative transposon. Bacteria(20)
+ds2020-267_369 243 pfam12137 gnl|CDD|378818 6.51052e-05 137 217 -3 pfam12137, RapA_C, RNA polymerase recycling family C-terminal. This domain is found in bacteria. This domain is about 360 amino acids in length. This domain is found associated with pfam00271, pfam00176. The function of this domain is not known, but structurally it forms an alpha-beta fold in nature with a central beta-sheet flanked by helices and loops, the beta-sheet being mainly antiparallel and flanked by four alpha helices, among which the two longer helices exhibit a coiled-coil arrangement. Bacteria(19);unclassified sequences(1)
+ds2020-267_750 211 pfam02391 gnl|CDD|376774 1.24642e-05 28 114 -2 pfam02391, MoaE, MoaE protein. This family contains the MoaE protein that is involved in biosynthesis of molybdopterin. Molybdopterin, the universal component of the pterin molybdenum cofactors, contains a dithiolene group serving to bind Mo. Addition of the dithiolene sulfurs to a molybdopterin precursor requires the activity of the converting factor. Converting factor contains the MoaE and MoaD proteins. Bacteria(17);Archaea(2);unclassified sequences(1)
+ds2020-267_428 235 pfam00164 gnl|CDD|333891 1.04166e-24 3 182 3 pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes. Bacteria(16);Archaea(3);Eukaryota(1)
+ds2020-267_203 281 pfam03040 gnl|CDD|367312 1.76794e-22 121 231 -3 pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally. Eukaryota(20)
+ds2020-267_33 680 pfam04157 gnl|CDD|367847 4.86455e-13 342 494 -1 pfam04157, EAP30, EAP30/Vps36 family. This family includes EAP30 as well as the Vps36 protein. Vps36 is involved in Golgi to endosome trafficking. EAP30 is a subunit of the ELL complex. The ELL is an 80-kDa RNA polymerase II transcription factor. ELL interacts with three other proteins to form the complex known as ELL complex. The ELL complex is capable of increasing that catalytic rate of transcription elongation, but is unable to repress initiation of transcription by RNA polymerase II as is the case of ELL. EAP30 is thought to lead to the derepression of ELL's transcriptional inhibitory activity. Eukaryota(17);Archaea(3)
+ds2020-267_6 1860 pfam02123 gnl|CDD|280316 1.35634e-17 1147 1764 -1 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_555 222 pfam00124 gnl|CDD|365890 7.71427e-08 48 203 3 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Bacteria(9);Eukaryota(6);Viruses(4);unclassified sequences(1)
+ds2020-267_550 223 pfam05694 gnl|CDD|377548 0.00097637 48 203 3 pfam05694, SBP56, 56kDa selenium binding protein (SBP56). This family consists of several eukaryotic selenium binding proteins as well as three sequences from archaea. The exact function of this protein is unknown although it is thought that SBP56 participates in late stages of intra-Golgi protein transport. The Lotus japonicus homolog of SBP56, LjSBP is thought to have more than one physiological role and can be implicated in controlling the oxidation/reduction status of target proteins, in vesicular Golgi transport. Bacteria(12);Eukaryota(8)
+ds2020-267_65 462 pfam13406 gnl|CDD|372592 4.82338e-27 145 360 -1 pfam13406, SLT_2, Transglycosylase SLT domain. This family is related to the SLT domain pfam01464. Bacteria(19);unclassified sequences(1)
+ds2020-267_729 212 pfam01405 gnl|CDD|279713 5.43744e-05 19 99 -3 pfam01405, PsbT, Photosystem II reaction centre T protein. The exact function of this protein is unknown. It probably consists of a single transmembrane spanning helix. The Chlamydomonas reinhardtii psbT protein appears to be (i) a novel photosystem II subunit and (ii) required for maintaining optimal photosystem II activity under adverse growth conditions. Eukaryota(17);Bacteria(3)
+ds2020-267_404 239 pfam00361 gnl|CDD|366050 3.50341e-05 70 219 1 pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla. Bacteria(16);Eukaryota(2);Archaea(1);unclassified sequences(1)
+ds2020-267_312 252 pfam00585 gnl|CDD|278982 1.52007e-05 29 166 2 pfam00585, Thr_dehydrat_C, C-terminal regulatory domain of Threonine dehydratase. Threonine dehydratases pfam00291 all contain a carboxy terminal region. This region may have a regulatory role. Some members contain two copies of this region. This family is homologous to the pfam01842 domain. Bacteria(19);unclassified sequences(1)
+ds2020-267_176 291 pfam01235 gnl|CDD|376500 1.13408e-29 115 243 1 pfam01235, Na_Ala_symp, Sodium:alanine symporter family. Bacteria(19);unclassified sequences(1)
+ds2020-267_388 241 pfam02123 gnl|CDD|280316 6.16383e-08 35 214 -1 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_669 215 pfam17862 gnl|CDD|380037 4.46873e-06 33 122 -1 pfam17862, AAA_lid_3, AAA+ lid domain. This entry represents the alpha helical AAA+ lid domain that is found to the C-terminus of AAA domains. Eukaryota(9);Bacteria(8);Archaea(3)
+ds2020-267_187 287 pfam02673 gnl|CDD|376891 3.59766e-13 7 156 1 pfam02673, BacA, Bacitracin resistance protein BacA. Bacitracin resistance protein (BacA) is a putative undecaprenol kinase. BacA confers resistance to bacitracin, probably by phosphorylation of undecaprenol. More recent studies show that BacA has undecaprenyl pyrophosphate phosphatase activity. Undecaprenyl phosphate is a key lipid intermediate involved in the synthesis of various bacterial cell wall polymers. Bacitracin, a mixture of related cyclic polypeptide antibiotics, is used to treat surface tissue infections. Its primary mode of action is the inhibition of bacterial cell wall synthesis through sequestration of the essential carrier lipid undecaprenyl pyrophosphate, C55-PP, resulting in the loss of cell integrity and lysis. The characteristic phosphatase sequence-motif in this family is likely to be the PGxSRSGG, compared with the PSGH of the PAP family of phosphatases. Bacteria(19);unclassified sequences(1)
+ds2020-267_641 216 pfam00804 gnl|CDD|366315 9.72957e-23 23 187 -3 pfam00804, Syntaxin, Syntaxin. Syntaxins are the prototype family of SNARE proteins. They usually consist of three main regions - a C-terminal transmembrane region, a central SNARE domain which is characteristic of and conserved in all syntaxins (pfam05739), and an N-terminal domain that is featured in this entry. This domain varies between syntaxin isoforms; in syntaxin 1A it is found as three alpha-helices with a left-handed twist. It may fold back on the SNARE domain to allow the molecule to adopt a 'closed' configuration that prevents formation of the core fusion complex - it thus has an auto-inhibitory role. The function of syntaxins is determined by their localization. They are involved in neuronal exocytosis, ER-Golgi transport and Golgi-endosome transport, for example. They also interact with other proteins as well as those involved in SNARE complexes. These include vesicle coat proteins, Rab GTPases, and tethering factors. Eukaryota(20)
+ds2020-267_597 219 pfam00421 gnl|CDD|366090 8.10522e-27 22 207 1 pfam00421, PSII, Photosystem II protein. Eukaryota(13);Bacteria(7)
+ds2020-267_268 259 pfam02123 gnl|CDD|280316 3.22949e-21 18 251 3 pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus. Viruses(19);unclassified sequences(1)
+ds2020-267_719 213 pfam00072 gnl|CDD|333815 9.1657e-13 45 185 -2 pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain. Bacteria(20)
+ds2020-267_811 208 pfam07991 gnl|CDD|285265 1.80927e-08 20 190 -1 pfam07991, IlvN, Acetohydroxy acid isomeroreductase, NADPH-binding domain. Acetohydroxy acid isomeroreductase catalyzes the conversion of acetohydroxy acids into dihydroxy valerates. This reaction is the second in the synthetic pathway of the essential branched side chain amino acids valine and isoleucine. This N-terminal region of the enzyme carries the binding-site for NADPH. The active-site for enzymatic activity lies in the C-terminal part, IlvC, pfam01450. Bacteria(16);Archaea(2);unclassified sequences(2)
+ds2020-267_642 216 pfam02874 gnl|CDD|367225 0.000376273 20 190 -1 pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella. Bacteria(17);Eukaryota(2);Archaea(1)
+ds2020-267_504 226 pfam01578 gnl|CDD|307628 0.000112784 20 190 -1 pfam01578, Cytochrom_C_asm, Cytochrome C assembly protein. This family consists of various proteins involved in cytochrome c assembly from mitochondria and bacteria; CycK from Rhizobium, CcmC from E. coli and Paracoccus denitrificans and orf240 from wheat mitochondria. The members of this family are probably integral membrane proteins with six predicted transmembrane helices. It has been proposed that members of this family comprise a membrane component of an ABC (ATP binding cassette) transporter complex. It is also proposed that this transporter is necessary for transport of some component needed for cytochrome c assembly. One member CycK contains a putative heme-binding motif, orf240 also contains a putative heme-binding motif and is a proposed ABC transporter with c-type heme as its proposed substrate. However it seems unlikely that all members of this family transport heme nor c-type apocytochromes because CcmC in the putative CcmABC transporter transports neither. CcmF forms a working module with CcmH and CcmI, CcmFHI, and itself is unlikely to bind haem directly. Bacteria(19);Archaea(1)
+ds2020-267_274 258 pfam03713 gnl|CDD|367619 9.45376e-09 24 173 -2 pfam03713, DUF305, Domain of unknown function (DUF305). Domain found in small family of bacterial secreted proteins with no known function. Also found in Paramecium bursaria chlorella virus 1. This domain is short and found in one or two copies. The domain has a conserved HH motif that may be functionally important. This domain belongs to the ferritin superfamily. It contains two sequence similar repeats each of which is composed of two alpha helices. Bacteria(18);unclassified sequences(2)
+ds2020-267_42 575 pfam00283 gnl|CDD|365999 2.95472e-07 325 411 1 pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. Eukaryota(18);Bacteria(2)
+ds2020-267_283 257 pfam13041 gnl|CDD|372443 3.148e-06 13 114 1 pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR. Eukaryota(20)
+ds2020-267_685 214 pfam09334 gnl|CDD|370442 1.80219e-14 16 117 -2 pfam09334, tRNA-synt_1g, tRNA synthetases class I (M). This family includes methionyl tRNA synthetases. Bacteria(17);Archaea(2);unclassified sequences(1)
diff --git a/tools/virAnnot/test-data/rps_test.xml b/tools/virAnnot/test-data/rps_test.xml
new file mode 100755
index 00000000000..ce70880923a
--- /dev/null
+++ b/tools/virAnnot/test-data/rps_test.xml
@@ -0,0 +1,21944 @@
+
+
+
+ rpstblastn
+ RPSTBLASTN 2.10.1+
+ Stephen F. Altschul, Thomas L. Madden, Alejandro A. Schäffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), "Gapped BLAST and PSI-BLAST: a new generation of protein database search programs", Nucleic Acids Res. 25:3389-3402.
+ /home/tcandresse/work/pfam/Pfam
+ ds2020-267_269
+ No definition line
+ 259
+
+
+ BLOSUM62
+ 0.001
+ 11
+ 1
+ F
+
+
+
+
+ 1
+ ds2020-267_269
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.050055168
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 2
+ ds2020-267_1242
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 3
+ ds2020-267_333
+ No definition line
+ 248
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 4
+ ds2020-267_1111
+ No definition line
+ 70
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 5
+ ds2020-267_560
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 6
+ ds2020-267_120
+ No definition line
+ 339
+
+
+ 1
+ gnl|CDD|374695
+ pfam16639, Apocytochr_F_N, Apocytochrome F, N-terminal. This is the N-terminal domain of cytochrome f. It is a soluble lumen-side domain.
+ 374695
+ 154
+
+
+ 1
+ 91.1926
+ 227
+ 2.20279e-25
+ 197
+ 325
+ 112
+ 154
+ -3
+ 0
+ 30
+ 37
+ 0
+ 43
+ MVIGPVPGQKYSEITFPILSPDPATKKDVHFLKYPIYVGGNRG
+ LIVGPLPGDQYQEIVFPVLSPDPATDKSVHFGKYPVYVGGNRG
+ +++GP+PG +Y EI FP+LSPDPAT K VHF KYP+YVGGNRG
+
+
+
+
+ 2
+ gnl|CDD|366578
+ pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034.
+ 366578
+ 115
+
+
+ 1
+ 34.0526
+ 79
+ 0.000848733
+ 116
+ 163
+ 1
+ 16
+ -3
+ 0
+ 10
+ 13
+ 0
+ 16
+ NNNVYNATAAGIVSKI
+ NNNVFTASAAGTISAI
+ NNNV+ A+AAG +S I
+
+
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 75261094
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 7
+ ds2020-267_374
+ No definition line
+ 242
+
+
+ 1
+ gnl|CDD|365890
+ pfam00124, Photo_RC, Photosynthetic reaction centre protein.
+ 365890
+ 260
+
+
+ 1
+ 42.9994
+ 102
+ 5.09126e-07
+ 21
+ 125
+ 91
+ 125
+ 3
+ 0
+ 12
+ 19
+ 0
+ 35
+ SVQLRPYNAIAFSGPIAVFVSVFLIYPLGQSGWFF
+ KLGMGPHVAWAFSAAIAAYLSLGLIRPILMGSWSE
+ + + P+ A AFS IA ++S+ LI P+ W
+
+
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 8
+ ds2020-267_470
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 9
+ ds2020-267_609
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 10
+ ds2020-267_128
+ No definition line
+ 332
+
+
+
+
+ 17919
+ 3004588
+ 68
+ 75016032
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 11
+ ds2020-267_870
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 12
+ ds2020-267_1236
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 13
+ ds2020-267_651
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 14
+ ds2020-267_648
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 15
+ ds2020-267_847
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 16
+ ds2020-267_978
+ No definition line
+ 121
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 17
+ ds2020-267_973
+ No definition line
+ 123
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 18
+ ds2020-267_456
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 19
+ ds2020-267_272
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 20
+ ds2020-267_1065
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 21
+ ds2020-267_888
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 22
+ ds2020-267_866
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 23
+ ds2020-267_1034
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 24
+ ds2020-267_393
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 25
+ ds2020-267_1084
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 26
+ ds2020-267_489
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 27
+ ds2020-267_471
+ No definition line
+ 230
+
+
+ 1
+ gnl|CDD|278624
+ pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase.
+ 278624
+ 499
+
+
+ 1
+ 43.5512
+ 103
+ 3.12575e-07
+ 46
+ 210
+ 353
+ 401
+ 1
+ 0
+ 14
+ 23
+ 10
+ 57
+ IL*ALTAGVPMICSPFFADQRTNCYYTCNEWGSGMEIDNTFGRAD--SMQSAEVLTA
+ VYEAICHGVPMVGMPLFGDQMDNAKHMEAKGA--------AVTLNVLTMTSEDLLNA
+ + A+ GVPM+ P F DQ N + + + +M S ++L A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 28
+ ds2020-267_367
+ No definition line
+ 243
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 29
+ ds2020-267_535
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 30
+ ds2020-267_1201
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 31
+ ds2020-267_710
+ No definition line
+ 213
+
+
+ 1
+ gnl|CDD|366480
+ pfam01127, Sdh_cyt, Succinate dehydrogenase/Fumarate reductase transmembrane subunit. This family includes a transmembrane protein from both the Succinate dehydrogenase and Fumarate reductase complexes.
+ 366480
+ 122
+
+
+ 1
+ 33.1145
+ 76
+ 0.000723904
+ 13
+ 126
+ 8
+ 45
+ 1
+ 0
+ 13
+ 19
+ 0
+ 38
+ NSDLLIYKPQLTSTFPISHRISGAFLVTIVLFFYLLCL
+ SPHLGLYRAHLGTWLSILHRITGVALFVLGLIHLLLWL
+ + L +Y+ L + I HRI+G L + L LL L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 32
+ ds2020-267_904
+ No definition line
+ 142
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 33
+ ds2020-267_692
+ No definition line
+ 214
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 37.3361
+ 87
+ 4.79875e-05
+ 70
+ 180
+ 82
+ 115
+ 1
+ 0
+ 16
+ 21
+ 3
+ 37
+ FTFEDATLDEAINGVEDLDYFDSLVIGTSEGYPYVLE
+ ADLGDLSVSEAINGA---EGFDALNKDTSPGLPYILE
+ D ++ EAING + FD+L TS G PY+LE
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 34
+ ds2020-267_1114
+ No definition line
+ 69
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 35
+ ds2020-267_813
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 36
+ ds2020-267_390
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 37
+ ds2020-267_217
+ No definition line
+ 275
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 38
+ ds2020-267_654
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 39
+ ds2020-267_956
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 40
+ ds2020-267_1228
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 41
+ ds2020-267_608
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 42
+ ds2020-267_412
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 43
+ ds2020-267_211
+ No definition line
+ 276
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 44
+ ds2020-267_419
+ No definition line
+ 236
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 45
+ ds2020-267_606
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 46
+ ds2020-267_817
+ No definition line
+ 208
+
+
+ 1
+ gnl|CDD|377540
+ pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function.
+ 377540
+ 108
+
+
+ 1
+ 39.1746
+ 92
+ 3.45664e-06
+ 86
+ 190
+ 72
+ 106
+ -1
+ 0
+ 15
+ 19
+ 0
+ 35
+ TGWLSLRMQIPALDLIFMIYLFAAKGTEGNNDYGP
+ SGWWLLLGLIPIIGLIVLLVLLCLPGTPGPNRYGP
+ +GW L IP + LI ++ L GT G N YGP
+
+
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 47
+ ds2020-267_1207
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 48
+ ds2020-267_98
+ No definition line
+ 379
+
+
+ 1
+ gnl|CDD|374428
+ pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases.
+ 374428
+ 247
+
+
+ 1
+ 107.677
+ 270
+ 1.33948e-30
+ 131
+ 280
+ 108
+ 157
+ -1
+ 0
+ 39
+ 42
+ 0
+ 50
+ NMAFLSKVGDNSIDILEANVIIQISSHAGSRRQEAQRLGRILRAKGKLQD
+ NTIFLSKVGDTSIDLPEANVLIQISSHFGSRRQEAQRLGRILRAKRRSND
+ N FLSKVGD SID+ EANV+IQISSH GSRRQEAQRLGRILRAK + D
+
+
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 82137200
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 49
+ ds2020-267_321
+ No definition line
+ 250
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 50
+ ds2020-267_940
+ No definition line
+ 128
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 51
+ ds2020-267_61
+ No definition line
+ 465
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 120763012
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 52
+ ds2020-267_21
+ No definition line
+ 858
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 60.0628
+ 146
+ 8.36679e-11
+ 295
+ 729
+ 205
+ 342
+ -1
+ 0
+ 33
+ 59
+ 13
+ 148
+ PIAVGQSWYHGGSQEFIDRMAPFDKFFCFDAKKFDSSINEWMVTIAINICRKQYYDGDNP---DYDTYWAFVAESLLRAPIYRDDGVRMQKYVGTTSGHSHNTLLQSIITLLIGYAALFELDGGLTIDNIDEHAWMESLGDDNIMAVS
+ GIAVGINPFSRDWERLGALIRKGSDVLDVDYSAFDSTLSPFVFDLVEDI-RSEFCGGLEPTRLALLEL--------LSNPIHILGGTIIKVEGGLPSGQPATSVINSILNNIYVLYALIKHTGESELD-DHETIRFISYGDDNLVAVN
+ IAVG + + + + D FDS+++ ++ + +I R ++ G P L PI+ G ++ G SG +++ SI+ + AL + G +D E S GDDN++AV+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 297776073
+ 0.066953256
+ 0.267
+ 0.14
+
+
+
+
+ 53
+ ds2020-267_1079
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 54
+ ds2020-267_1216
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 55
+ ds2020-267_1183
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 56
+ ds2020-267_1156
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 57
+ ds2020-267_225
+ No definition line
+ 272
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 73330632
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 58
+ ds2020-267_1022
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 59
+ ds2020-267_707
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 60
+ ds2020-267_264
+ No definition line
+ 260
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 61
+ ds2020-267_1059
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 62
+ ds2020-267_514
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 63
+ ds2020-267_718
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 64
+ ds2020-267_627
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 65
+ ds2020-267_533
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 66
+ ds2020-267_1025
+ No definition line
+ 79
+
+
+
+
+ 17919
+ 3004588
+ 1
+ 74666725
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 67
+ ds2020-267_267
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 68
+ ds2020-267_143
+ No definition line
+ 315
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 73594120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 69
+ ds2020-267_88
+ No definition line
+ 400
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 90990200
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 70
+ ds2020-267_954
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 71
+ ds2020-267_76
+ No definition line
+ 423
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 101235078
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 72
+ ds2020-267_241
+ No definition line
+ 266
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 73
+ ds2020-267_1158
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 74
+ ds2020-267_422
+ No definition line
+ 236
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 75
+ ds2020-267_361
+ No definition line
+ 243
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 76
+ ds2020-267_563
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 77
+ ds2020-267_1073
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 78
+ ds2020-267_1141
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 79
+ ds2020-267_212
+ No definition line
+ 276
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 80
+ ds2020-267_261
+ No definition line
+ 260
+
+
+ 1
+ gnl|CDD|376444
+ pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene.
+ 376444
+ 221
+
+
+ 1
+ 76.5582
+ 189
+ 1.77523e-19
+ 26
+ 217
+ 94
+ 157
+ -2
+ 0
+ 28
+ 42
+ 0
+ 64
+ RWVDKIGYIDDLGCVELVFASDVIPLITRLEQRFTEYDIDQVSNLQSKYAVRLYELLVQWRSTG
+ LWVGYIISAKGEGKVEIEFSPDLKPYLLELKKNFTKYELKEFLKLKSKYSIRLYELLKQYRSTG
+ WV I G VE+ F+ D+ P + L++ FT+Y++ + L+SKY++RLYELL Q+RSTG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 81
+ ds2020-267_689
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 82
+ ds2020-267_892
+ No definition line
+ 181
+
+
+
+
+ 17919
+ 3004588
+ 30
+ 74010540
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 83
+ ds2020-267_1243
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 84
+ ds2020-267_521
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 85
+ ds2020-267_773
+ No definition line
+ 210
+
+
+ 1
+ gnl|CDD|376583
+ pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity.
+ 376583
+ 120
+
+
+ 1
+ 110.138
+ 277
+ 5.23903e-34
+ 16
+ 174
+ 6
+ 58
+ 1
+ 0
+ 32
+ 36
+ 0
+ 53
+ LTDVQYYVTQQNGTERPFSHEYDHQFEPGIYVDIVSGEPLFSSSDKYDSGCGW
+ LTPEQYRVLREKGTERPFTGEYWDNKEPGIYVCAGCGTPLFSSDTKFDSGCGW
+ LT QY V ++ GTERPF+ EY EPGIYV G PLFSS K+DSGCGW
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 86
+ ds2020-267_619
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 87
+ ds2020-267_675
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 88
+ ds2020-267_974
+ No definition line
+ 122
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 89
+ ds2020-267_912
+ No definition line
+ 135
+
+
+
+
+ 17919
+ 3004588
+ 17
+ 75599020
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 90
+ ds2020-267_1054
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 91
+ ds2020-267_287
+ No definition line
+ 256
+
+
+ 1
+ gnl|CDD|376293
+ pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I.
+ 376293
+ 433
+
+
+ 1
+ 97.2464
+ 243
+ 2.8946e-26
+ 13
+ 237
+ 326
+ 400
+ 1
+ 0
+ 47
+ 57
+ 0
+ 75
+ NTPGLDIALHDTYYVVAHFHYVLSMGAVFALFAGFHYWVGKIFGRIYPETLGQIHFWITFFGVNLTFFPMHFLGL
+ ALPPVNYYVHDTYFVVAHFHYVLFGGVVFALFAGIYYWFPKLTGRMYSERLGKLHFWLLFIGFNLTFFPMHILGL
+ P ++ +HDTY+VVAHFHYVL G VFALFAG +YW K+ GR+Y E LG++HFW+ F G NLTFFPMH LGL
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 92
+ ds2020-267_139
+ No definition line
+ 320
+
+
+ 1
+ gnl|CDD|368641
+ pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins.
+ 368641
+ 118
+
+
+ 1
+ 59.967
+ 146
+ 1.34887e-13
+ 167
+ 298
+ 56
+ 99
+ 2
+ 0
+ 20
+ 26
+ 0
+ 44
+ GEAKIILGQVNSTSPSQLAGYTEIAGGKAELVIANPAGITCSGG
+ GAASNILNRVTGGNPSQIQGYIEVAGANANVFLANPNGIIFGGN
+ G A IL +V +PSQ+ GY E+AG A + +ANP GI G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 75433973
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 93
+ ds2020-267_763
+ No definition line
+ 211
+
+
+ 1
+ gnl|CDD|376349
+ pfam00557, Peptidase_M24, Metallopeptidase family M24. This family contains metallopeptidases. It also contains non-peptidase homologs such as the N terminal domain of Spt16 which is a histone H3-H4 binding module.
+ 376349
+ 206
+
+
+ 1
+ 34.896
+ 81
+ 0.000231782
+ 15
+ 74
+ 76
+ 95
+ -3
+ 0
+ 12
+ 14
+ 0
+ 20
+ FLIDAGASFHGYASDITRIY
+ VLIDVGAEYDGYCSDITRTF
+ LID GA + GY SDITR +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 94
+ ds2020-267_624
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 95
+ ds2020-267_70
+ No definition line
+ 445
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 109640103
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 96
+ ds2020-267_1209
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 97
+ ds2020-267_196
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 98
+ ds2020-267_1102
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 99
+ ds2020-267_346
+ No definition line
+ 246
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 100
+ ds2020-267_612
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 101
+ ds2020-267_607
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.04777374
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 102
+ ds2020-267_571
+ No definition line
+ 221
+
+
+ 1
+ gnl|CDD|366135
+ pfam00501, AMP-binding, AMP-binding enzyme.
+ 366135
+ 361
+
+
+ 1
+ 43.7436
+ 104
+ 2.61467e-07
+ 34
+ 201
+ 1
+ 56
+ 1
+ 0
+ 17
+ 29
+ 0
+ 56
+ LERSATVYGDCPSLIYNDTTYTWTQTHRRCIRVASSISSLVIKSRHVVSVLSPNTP
+ LERQAARTPDKTALVGEGRRLTYRELDERANRLAAGLRALGVKKGDRVAILLPNSP
+ LER A D +L+ T+ + R R+A+ + +L +K V++L PN+P
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 103
+ ds2020-267_592
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 104
+ ds2020-267_764
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 105
+ ds2020-267_1015
+ No definition line
+ 85
+
+
+
+
+ 17919
+ 3004588
+ 3
+ 73770775
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 106
+ ds2020-267_1151
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 107
+ ds2020-267_69
+ No definition line
+ 451
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 112818077
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 108
+ ds2020-267_167
+ No definition line
+ 298
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 75248472
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 109
+ ds2020-267_23
+ No definition line
+ 835
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 285924289
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 110
+ ds2020-267_872
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 111
+ ds2020-267_578
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 112
+ ds2020-267_611
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 113
+ ds2020-267_565
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|377172
+ pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln).
+ 377172
+ 174
+
+
+ 1
+ 49.5699
+ 119
+ 9.52435e-10
+ 53
+ 184
+ 63
+ 108
+ -3
+ 0
+ 16
+ 27
+ 2
+ 46
+ EIRLRNSYVLKIEEHITDDNGEVVGLTATIDPKTLGNN--PEGLVH
+ EVRLMDAYNIKVTEVVKDEDGNVTELHCTYDGDDLGGARKVKGIIH
+ E+RL ++Y +K+ E + D++G V L T D LG +G++H
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 114
+ ds2020-267_468
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 115
+ ds2020-267_202
+ No definition line
+ 281
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 116
+ ds2020-267_826
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 117
+ ds2020-267_503
+ No definition line
+ 226
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 118
+ ds2020-267_197
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 119
+ ds2020-267_307
+ No definition line
+ 253
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 120
+ ds2020-267_427
+ No definition line
+ 235
+
+
+ 1
+ gnl|CDD|367360
+ pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity.
+ 367360
+ 980
+
+
+ 1
+ 34.611
+ 79
+ 0.000552392
+ 40
+ 213
+ 578
+ 636
+ -2
+ 0
+ 19
+ 37
+ 1
+ 59
+ KEMEEGKHKSRKEGESK-RSHRDRQREKERNGERHRDKDKDKDKRDRDSRRSEREKSSD
+ KKREEALEKAKREAEQKAREEREREKEREKEREREREREREAERAAKASSSSHEGRMSD
+ K+ EE K+++E E K R R+R++E+E+ ER R+++++ ++ + S S + SD
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 121
+ ds2020-267_738
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 122
+ ds2020-267_1160
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 123
+ ds2020-267_1066
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 124
+ ds2020-267_7
+ No definition line
+ 1772
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 685605541
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 125
+ ds2020-267_786
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 126
+ ds2020-267_44
+ No definition line
+ 545
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 155314900
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 127
+ ds2020-267_475
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 128
+ ds2020-267_928
+ No definition line
+ 130
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 129
+ ds2020-267_752
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 130
+ ds2020-267_988
+ No definition line
+ 116
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 131
+ ds2020-267_265
+ No definition line
+ 260
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 132
+ ds2020-267_1219
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 133
+ ds2020-267_115
+ No definition line
+ 345
+
+
+
+
+ 17919
+ 3004588
+ 72
+ 73720060
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 134
+ ds2020-267_559
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 135
+ ds2020-267_51
+ No definition line
+ 500
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 135111848
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 136
+ ds2020-267_1185
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.061499328
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 137
+ ds2020-267_520
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 138
+ ds2020-267_1137
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 139
+ ds2020-267_1191
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 140
+ ds2020-267_548
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 141
+ ds2020-267_4
+ No definition line
+ 2297
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 187.283
+ 476
+ 1.96254e-52
+ 824
+ 1858
+ 121
+ 464
+ -2
+ 0
+ 94
+ 136
+ 19
+ 354
+ VRKSRLVNWEEEHKNRVSPNLAEMPEGLVYERASQLFSRSISAGKRPR-KFD-WREYWQSRWQWSAAGSIHSQYSEDDKYIFKDIYLKNKFISILAMPDMNMDSWRER----DPELHAWSSTKYEWSKLRAIYGTDVTSYVLAHFAFYNCEDVLPSPFPVGKAANDEN--VRSRVRSVLEGRTQYCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLDRVIVHDNQGLKMEYNAKGTLLSGWRLTTFMNSVLNYIYTQLIVPDVVQSQNSLHNGDDVLLGSNSLEDVLLAGKNAKKHNIRLQMSK-CAYGAIAEFLRVDHKRGSKGQYLSRAMATLVHSR
+ GRGVTNVDWEEEAKNRVDLAVVCRLVLLPMEELRAHIDAVLDELVVRRGLCDPIRLFVKNEPLWCVNGHPDHKLRE---GRLRLLSSVSLVDQLVRR--MLFEPQNNNEIAWWGSVPSKPSMKLEHGKSRAIYACDTRSYLAFEYLLAPVEKAWANKSVILNPGEGDISGFDWSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFERLR----RRLPDEPAEAADWLVCSMDSMYQLSD-GTLLAQRVPGTLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ R V+WEEE KNRV + L E + R D R + ++ W G + E + + + ++ M + + + S K E K RAIY D SY+ + E + + + V+ G +D++DFNSQHS +SM+AV + R L E A +W S+D + + G + GTL SG R TTF+NSVLN Y +L S+H GDDVL G + D + ++ SK IAEFLRV YL+RA+A+LV
+
+
+
+
+ 2
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 44.6549
+ 106
+ 4.43825e-05
+ 995
+ 1510
+ 166
+ 342
+ -2
+ 0
+ 44
+ 65
+ 31
+ 190
+ KYEWSKLRAIYGTDVTSYVLAHFAFYNCEDVLPSPFPVGKAANDENVRSRVRSVLEGRTQ-----YCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLDRVIVHDNQGLKMEYNAK-----GTLLSGWRLTTFMNSVLNYIYTQLIVPD-VVQSQNSLH-------NGDDVLLGSN
+ KVQAGKTRLFWGCPVEVNLVARAVFGPFCNKIYSNALKLGIAVGINPFSRDWERLGALIRKGSDVLDVDYSAFDSTLSPFVFDLVEDIRSEFCGGL---------EPTRLALLELLSNP----IHILGGTIIKVEGGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVN
+ K + K R +G V ++A F + + S A N SR L + VD+ F+S S V D + G E TRL+L ++ + G L SG T+ +NS+LN IY + +S+ H GDD L+ N
+
+
+
+
+
+
+ 17919
+ 3004588
+ 93
+ 899217312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 142
+ ds2020-267_573
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 143
+ ds2020-267_16
+ No definition line
+ 1165
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 141.829
+ 358
+ 1.58664e-38
+ 536
+ 1078
+ 288
+ 464
+ -1
+ 0
+ 62
+ 85
+ 6
+ 182
+ SRVRAVLEGRTQYCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLNRVIVHDNQGLKMEYSAKGTLLSGWRLTTFMNSVLNYIYTQLIVPDVVKSQNSLHNGDDVLLGSNSLGDVLLAGRNAKKHNIRLQMSK-CAYGAIAEFLRVDHKRGSKGQYLSRAMATLVHSR
+ WSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFERLR----RRLPDEPAEAADWLVCSMDSMYQLSD-GTLLAQRVPGTLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ V+ G +D++DFNSQHS +SM+AV + R L E A +W S++ + + G + GTL SG R TTF+NSVLN Y +L S+H GDDVL G + D + ++ SK IAEFLRV YL+RA+A+LV
+
+
+
+
+ 2
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 45.4253
+ 108
+ 8.1737e-06
+ 707
+ 1042
+ 231
+ 342
+ -1
+ 0
+ 30
+ 45
+ 16
+ 120
+ YCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLNRVIVHDNQGLKMEYSAKGTLLSGWRLTTFMNSVLNYIYTQLIVPD-VVKSQNSLH-------NGDDVLLGSN
+ LDVDYSAFDSTLSPFVFDLVEDIRS----EFCGGLEPTRLALLELLSNPIHILGGTIIKVE----GGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVN
+ VD+ F+S S V D F + + L N + + +K+E G L SG T+ +NS+LN IY + +S+ H GDD L+ N
+
+
+
+
+
+
+ 17919
+ 3004588
+ 88
+ 428314800
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 144
+ ds2020-267_753
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 145
+ ds2020-267_438
+ No definition line
+ 234
+
+
+ 1
+ gnl|CDD|365856
+ pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses.
+ 365856
+ 184
+
+
+ 1
+ 33.8002
+ 78
+ 0.000870142
+ 110
+ 220
+ 97
+ 136
+ -3
+ 0
+ 11
+ 17
+ 3
+ 40
+ VLPFGLKNDGAPYQRAMTALFHDMIHKE---MEVYVDDMI
+ GLPQGLVLSPALFQLFMNELLRPLRKRAGLTLVRYADDIL
+ LP GL A +Q M L + + + Y DD++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 146
+ ds2020-267_370
+ No definition line
+ 242
+
+
+ 1
+ gnl|CDD|376297
+ pfam00146, NADHdh, NADH dehydrogenase.
+ 376297
+ 301
+
+
+ 1
+ 52.4668
+ 127
+ 2.41391e-10
+ 22
+ 111
+ 269
+ 298
+ 1
+ 0
+ 20
+ 24
+ 0
+ 30
+ VRAAFPRYRYDQLMGLGRKVFLPLSLARVV
+ IRATLPRFRYDQLMRLGWKVLLPLSLANLL
+ +RA PR+RYDQLM LG KV LPLSLA ++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 147
+ ds2020-267_798
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 148
+ ds2020-267_278
+ No definition line
+ 258
+
+
+ 1
+ gnl|CDD|365808
+ pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region.
+ 365808
+ 598
+
+
+ 1
+ 77.6867
+ 192
+ 4.1355e-19
+ 50
+ 232
+ 417
+ 477
+ 2
+ 0
+ 27
+ 37
+ 0
+ 61
+ SQTFSTAEDGQSQILLHLYRGDSAMAKSAHSLGTFQITGIAPMPRGEPSVRVEFLADTGGI
+ SQIFSTAADNQTAVEIQVYQGEREMAPDNKLLGSFELDGIPPAPRGVPQIEVTFDIDANGI
+ SQ FSTA D Q+ + + +Y+G+ MA LG+F++ GI P PRG P + V F D GI
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 149
+ ds2020-267_314
+ No definition line
+ 252
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 150
+ ds2020-267_1251
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 151
+ ds2020-267_435
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 152
+ ds2020-267_1017
+ No definition line
+ 83
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 153
+ ds2020-267_1214
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 154
+ ds2020-267_960
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 155
+ ds2020-267_772
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 156
+ ds2020-267_937
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 157
+ ds2020-267_812
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 158
+ ds2020-267_66
+ No definition line
+ 460
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 117585038
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 159
+ ds2020-267_425
+ No definition line
+ 235
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 160
+ ds2020-267_1010
+ No definition line
+ 96
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 161
+ ds2020-267_727
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 162
+ ds2020-267_745
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 163
+ ds2020-267_512
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 164
+ ds2020-267_899
+ No definition line
+ 146
+
+
+
+
+ 17919
+ 3004588
+ 20
+ 74093824
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 165
+ ds2020-267_1020
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 166
+ ds2020-267_724
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 167
+ ds2020-267_1163
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 168
+ ds2020-267_62
+ No definition line
+ 464
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 119174025
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 169
+ ds2020-267_824
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 170
+ ds2020-267_495
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 171
+ ds2020-267_479
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 172
+ ds2020-267_437
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 173
+ ds2020-267_947
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.065298648
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 174
+ ds2020-267_531
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 175
+ ds2020-267_454
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 176
+ ds2020-267_931
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 177
+ ds2020-267_364
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|365952
+ pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein.
+ 365952
+ 88
+
+
+ 1
+ 50.2082
+ 121
+ 1.5507e-10
+ 134
+ 241
+ 53
+ 88
+ -3
+ 0
+ 23
+ 24
+ 0
+ 36
+ ARPQRKRRNPATGEAIQIPAKKAPIFKAGKALKDAV
+ KRAARTGRNPKTGEAITIPAKKVVKFKPGKELKEAV
+ R R RNP TGEAI IPAKK FK GK LK+AV
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 178
+ ds2020-267_790
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 179
+ ds2020-267_953
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 180
+ ds2020-267_340
+ No definition line
+ 247
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 181
+ ds2020-267_822
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 182
+ ds2020-267_1241
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 183
+ ds2020-267_558
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|377116
+ pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions.
+ 377116
+ 147
+
+
+ 1
+ 57.5038
+ 140
+ 4.93695e-13
+ 57
+ 179
+ 104
+ 147
+ -2
+ 0
+ 18
+ 28
+ 3
+ 44
+ VFA---IPRKSNRKGVGETDIEISFGGLTINSGMYVYADNNGII
+ VFALGTTPRGSPKKGGGEVNVPVTIGGVTVRPGDIVVADEDGVV
+ VFA PR S +KG GE ++ ++ GG+T+ G V AD +G++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 184
+ ds2020-267_43
+ No definition line
+ 563
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 164633794
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 185
+ ds2020-267_702
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 186
+ ds2020-267_1230
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 187
+ ds2020-267_1186
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 188
+ ds2020-267_925
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 189
+ ds2020-267_122
+ No definition line
+ 338
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 73510836
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 190
+ ds2020-267_770
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 191
+ ds2020-267_1078
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 192
+ ds2020-267_102
+ No definition line
+ 375
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 80494456
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 193
+ ds2020-267_713
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 194
+ ds2020-267_660
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 195
+ ds2020-267_1147
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 196
+ ds2020-267_760
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 197
+ ds2020-267_542
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 198
+ ds2020-267_11
+ No definition line
+ 1579
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 597672165
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 199
+ ds2020-267_209
+ No definition line
+ 277
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 200
+ ds2020-267_618
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 201
+ ds2020-267_1133
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 202
+ ds2020-267_939
+ No definition line
+ 128
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 203
+ ds2020-267_749
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 204
+ ds2020-267_1008
+ No definition line
+ 96
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 205
+ ds2020-267_135
+ No definition line
+ 323
+
+
+
+
+ 17919
+ 3004588
+ 66
+ 74699294
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 206
+ ds2020-267_218
+ No definition line
+ 274
+
+
+ 1
+ gnl|CDD|279664
+ pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X.
+ 279664
+ 140
+
+
+ 1
+ 38.6047
+ 90
+ 1.66328e-05
+ 51
+ 257
+ 32
+ 100
+ 3
+ 0
+ 21
+ 32
+ 0
+ 69
+ PIHVACLTNVSDGDIVNWSAGIAINPLSYYRCRDNLYQVRTIVDHQIRWSAIFTLAHKHKSSARNIILK
+ PRSVGRWTDLDDRDILLRYNAIIRGILNYYSFADNKKRLYTRIYYILRLSCAKTLARKLKLGTVRKVIK
+ P V T++ D DI+ I L+YY DN ++ T + + +R S TLA K K ++K
+
+
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 207
+ ds2020-267_777
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 208
+ ds2020-267_1105
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 209
+ ds2020-267_972
+ No definition line
+ 123
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 210
+ ds2020-267_1070
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 211
+ ds2020-267_835
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 212
+ ds2020-267_286
+ No definition line
+ 257
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 213
+ ds2020-267_820
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 214
+ ds2020-267_324
+ No definition line
+ 250
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 215
+ ds2020-267_363
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|366086
+ pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes.
+ 366086
+ 109
+
+
+ 1
+ 37.3005
+ 87
+ 2.02528e-05
+ 15
+ 134
+ 2
+ 41
+ -2
+ 0
+ 14
+ 21
+ 0
+ 40
+ ISGARSVADEQVRIASTKIDGIGPKKAIQVRYRLGISGDI
+ ILGTDIDGDKKVEIALTYIKGIGRRRANIILKKAGVDLDK
+ I G D++V IA T I GIG ++A + + G+ D
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 216
+ ds2020-267_674
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 217
+ ds2020-267_863
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.070739016
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 218
+ ds2020-267_1109
+ No definition line
+ 70
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 219
+ ds2020-267_45
+ No definition line
+ 540
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 153761751
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 220
+ ds2020-267_746
+ No definition line
+ 211
+
+
+ 1
+ gnl|CDD|279788
+ pfam01490, Aa_trans, Transmembrane amino acid transporter protein. This transmembrane region is found in many amino acid transporters including UNC-47 and MTR. UNC-47 encodes a vesicular amino butyric acid (GABA) transporter, (VGAT). UNC-47 is predicted to have 10 transmembrane domains. MTR is a N system amino acid transporter system protein involved in methyltryptophan resistance. Other members of this family include proline transporters and amino acid permeases.
+ 279788
+ 410
+
+
+ 1
+ 35.3596
+ 82
+ 0.000177299
+ 21
+ 176
+ 358
+ 410
+ 3
+ 0
+ 11
+ 21
+ 1
+ 53
+ WPLAIYFPVEMYFVQKKI-GSWTRKWIVLEAFSLVCFLVTVVGVIGSVQGLIS
+ APLSFILPPLFHLKLKKTKKKSQEKLWKPDILDVICIVIGLLLMAYGVAGLIL
+ PL+ P + KK K + ++C ++ ++ + V GLI
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 221
+ ds2020-267_403
+ No definition line
+ 239
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 222
+ ds2020-267_350
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 223
+ ds2020-267_144
+ No definition line
+ 315
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 73594120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 224
+ ds2020-267_1049
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 225
+ ds2020-267_499
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 226
+ ds2020-267_22
+ No definition line
+ 841
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 288887235
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 227
+ ds2020-267_862
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 228
+ ds2020-267_294
+ No definition line
+ 255
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 229
+ ds2020-267_31
+ No definition line
+ 712
+
+
+
+
+ 17919
+ 3004588
+ 84
+ 229406976
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 230
+ ds2020-267_1019
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 231
+ ds2020-267_747
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 232
+ ds2020-267_543
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 233
+ ds2020-267_1072
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 234
+ ds2020-267_784
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 235
+ ds2020-267_879
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 236
+ ds2020-267_1120
+ No definition line
+ 67
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 237
+ ds2020-267_1126
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 238
+ ds2020-267_1218
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 239
+ ds2020-267_915
+ No definition line
+ 134
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 76100752
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 240
+ ds2020-267_1026
+ No definition line
+ 79
+
+
+
+
+ 17919
+ 3004588
+ 1
+ 74666725
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 241
+ ds2020-267_845
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 242
+ ds2020-267_405
+ No definition line
+ 239
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 243
+ ds2020-267_1240
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 244
+ ds2020-267_145
+ No definition line
+ 315
+
+
+ 1
+ gnl|CDD|376868
+ pfam02626, CT_A_B, Carboxyltransferase domain, subdomain A and B. Urea carboxylase (UC) catalyzes a two-step, ATP- and biotin-dependent carboxylation reaction of urea. It is composed of biotin carboxylase (BC), carboxyltransferase (CT), and biotin carboxyl carrier protein (BCCP) domains. The CT domain of UC consists of four subdomains, named A, B, C and D. This domain covers the A and B subdomains of the CT domain. This domain covers the whole length of KipA (kinase A) from Bacillus subtilis. It can also be found in S. cerevisiae urea amidolyase Dur1,2, which is a multifunctional biotin-dependent enzyme with domains for urea carboxylase and allophanate (urea carboxylate) hydrolase activity.
+ 376868
+ 262
+
+
+ 1
+ 38.5476
+ 91
+ 3.97676e-05
+ 140
+ 256
+ 46
+ 78
+ -3
+ 0
+ 13
+ 17
+ 6
+ 39
+ VCLTGALYEAYVTDTAKQTRERVPNGWRIAIKAGQTLEL
+ IAVTGADMPATLDG------EPVPMWTPIAVKAGDVLSF
+ + +TGA A + E VP IA+KAG L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 73594120
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 245
+ ds2020-267_1107
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 246
+ ds2020-267_889
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 247
+ ds2020-267_154
+ No definition line
+ 309
+
+
+
+
+ 17919
+ 3004588
+ 63
+ 75027640
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 248
+ ds2020-267_391
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 249
+ ds2020-267_637
+ No definition line
+ 217
+
+
+ 1
+ gnl|CDD|284449
+ pfam07026, DUF1317, Protein of unknown function (DUF1317). This family consists of several hypothetical bacterial and phage proteins of around 60 residues in length. The function of this family is unknown.
+ 284449
+ 60
+
+
+ 1
+ 57.0614
+ 137
+ 1.36077e-13
+ 47
+ 172
+ 1
+ 44
+ 2
+ 0
+ 21
+ 28
+ 2
+ 44
+ MTHAHEDIRVGTLCLPF--FGNGWLMPWGEVVSNTLKAQRLAEE
+ MKHNHDDIQVGAITCPYSTFHRGWLFPGGKIIKNPFKAQNAAEE
+ M H H+DI+VG + P+ F GWL P G+++ N KAQ AEE
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 250
+ ds2020-267_614
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 251
+ ds2020-267_1198
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 252
+ ds2020-267_1252
+ No definition line
+ 57
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 253
+ ds2020-267_1135
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 254
+ ds2020-267_52
+ No definition line
+ 500
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 135111848
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 255
+ ds2020-267_705
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 256
+ ds2020-267_236
+ No definition line
+ 266
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 257
+ ds2020-267_41
+ No definition line
+ 583
+
+
+
+
+ 17919
+ 3004588
+ 82
+ 171945760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 258
+ ds2020-267_189
+ No definition line
+ 285
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 75361790
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 1
+ ds2020-267_1038
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.072287616
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 2
+ ds2020-267_986
+ No definition line
+ 116
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 3
+ ds2020-267_1033
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 4
+ ds2020-267_921
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 5
+ ds2020-267_494
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 6
+ ds2020-267_682
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 7
+ ds2020-267_964
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 8
+ ds2020-267_141
+ No definition line
+ 319
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 75433973
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 9
+ ds2020-267_517
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 10
+ ds2020-267_557
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|366090
+ pfam00421, PSII, Photosystem II protein.
+ 366090
+ 499
+
+
+ 1
+ 80.2474
+ 198
+ 3.32623e-20
+ 12
+ 200
+ 148
+ 214
+ -2
+ 0
+ 40
+ 41
+ 10
+ 70
+ ACFGFGAFHVTGLYGPGIWVSDP-------YGLTGRVQSVNPAWGVEGFDPFVPGGSASHPIAAGTLFIL
+ GCFGFGAFHFGGLG---TWVSDPTLDPGVIYGYTGHVQPVAPVWGAEGFSPFGPGGIVGHHIAAGILGII
+ CFGFGAFH GL WVSDP YG TG VQ V P WG EGF PF PGG H IAAG L I+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 11
+ ds2020-267_171
+ No definition line
+ 294
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 73319024
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 12
+ ds2020-267_282
+ No definition line
+ 257
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 13
+ ds2020-267_507
+ No definition line
+ 226
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 14
+ ds2020-267_117
+ No definition line
+ 344
+
+
+ 1
+ gnl|CDD|376306
+ pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e.
+ 376306
+ 124
+
+
+ 1
+ 84.0016
+ 209
+ 7.27175e-23
+ 107
+ 295
+ 53
+ 116
+ 2
+ 0
+ 32
+ 44
+ 1
+ 64
+ RAMSRRNSKIWVRVLADLPITRKPTEVRMGRGKGNPTGWIARVSTGQIPFEM-DGVSLSNARQA
+ RYLKKRGGKLWIRVFPDKPVTKKPGEDRMGKGKGKPEGWVARVKPGRILFEIRGGVHEEVAKEA
+ R + +R K+W+RV D P+T+KP E RMG+GKG P GW+ARV G+I FE+ GV A++A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 71
+ 74490577
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 15
+ ds2020-267_352
+ No definition line
+ 245
+
+
+ 1
+ gnl|CDD|366381
+ pfam00946, Mononeg_RNA_pol, Mononegavirales RNA dependent RNA polymerase. Members of the Mononegavirales including the Paramyxoviridae, like other non-segmented negative strand RNA viruses, have an RNA-dependent RNA polymerase composed of two subunits, a large protein L and a phosphoprotein P. This is a protein family of the L protein. The L protein confers the RNA polymerase activity on the complex. The P protein acts as a transcription factor.
+ 366381
+ 1015
+
+
+ 1
+ 38.0729
+ 89
+ 3.23548e-05
+ 1
+ 141
+ 690
+ 736
+ 1
+ 0
+ 13
+ 24
+ 0
+ 47
+ KKATEAIAQVSSRVGQIVKPTECIYSTCFLTYGKEMILRGAYLRTCS
+ RRIFKALRKVTSKLGLNLKLEETIISSDFFIYSKRIYYDGVILPQSL
+ ++ +A+ +V+S++G +K E I S+ F Y K + G L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 16
+ ds2020-267_659
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 17
+ ds2020-267_564
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 18
+ ds2020-267_1044
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 19
+ ds2020-267_298
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 20
+ ds2020-267_73
+ No definition line
+ 430
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 104448890
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 21
+ ds2020-267_137
+ No definition line
+ 322
+
+
+
+
+ 17919
+ 3004588
+ 66
+ 74699294
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 22
+ ds2020-267_695
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 23
+ ds2020-267_923
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 24
+ ds2020-267_1006
+ No definition line
+ 98
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 25
+ ds2020-267_980
+ No definition line
+ 120
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 26
+ ds2020-267_1144
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 27
+ ds2020-267_656
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 28
+ ds2020-267_80
+ No definition line
+ 417
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 98021266
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 29
+ ds2020-267_3
+ No definition line
+ 2407
+
+
+
+
+ 17919
+ 3004588
+ 94
+ 934703016
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 30
+ ds2020-267_930
+ No definition line
+ 130
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 31
+ ds2020-267_830
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 32
+ ds2020-267_1002
+ No definition line
+ 106
+
+
+
+
+ 17919
+ 3004588
+ 9
+ 73926242
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 33
+ ds2020-267_987
+ No definition line
+ 116
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 34
+ ds2020-267_1238
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 35
+ ds2020-267_443
+ No definition line
+ 233
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 36
+ ds2020-267_233
+ No definition line
+ 268
+
+
+
+
+ 17919
+ 3004588
+ 53
+ 73975716
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 37
+ ds2020-267_1092
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 38
+ ds2020-267_577
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 39
+ ds2020-267_55
+ No definition line
+ 484
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 127256508
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 40
+ ds2020-267_152
+ No definition line
+ 310
+
+
+
+
+ 17919
+ 3004588
+ 63
+ 75027640
+ 0.074731812
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 41
+ ds2020-267_257
+ No definition line
+ 261
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 42
+ ds2020-267_205
+ No definition line
+ 279
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 43
+ ds2020-267_604
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 44
+ ds2020-267_616
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 45
+ ds2020-267_1237
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 46
+ ds2020-267_97
+ No definition line
+ 380
+
+
+ 1
+ gnl|CDD|368171
+ pfam04879, Molybdop_Fe4S4, Molybdopterin oxidoreductase Fe4S4 domain. This domain is found in formate dehydrogenase H for which the structure is known. This first domain (residues 1 to 60) of Structure 1aa6 is an Fe4S4 cluster just below the protein surface.
+ 368171
+ 55
+
+
+ 1
+ 45.3437
+ 108
+ 1.9903e-08
+ 125
+ 274
+ 1
+ 50
+ -2
+ 0
+ 14
+ 23
+ 0
+ 50
+ MQYAPSICHGCSTGCNISAGERYGELRRIENRFNGEVKAYFLCDHGHFGY
+ MKVVKTICPYCGVGCGLLVHVKDGKIVKVEGDPDHPVNRGRLCVKGRFGL
+ M+ +IC C GC + + G++ ++E + V LC G FG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 82137200
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 47
+ ds2020-267_1167
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 48
+ ds2020-267_1028
+ No definition line
+ 77
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 49
+ ds2020-267_2
+ No definition line
+ 2436
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 95.9902
+ 239
+ 2.17343e-21
+ 184
+ 1476
+ 70
+ 464
+ 1
+ 0
+ 90
+ 155
+ 58
+ 442
+ WAKCGSMAEYIVEAK--NLTTKMKALDNQVT-LGDFELDLSP-LFEWEVLNHRAVLKGIYDKEVTERRDQKQ---SIKLSAADLEEEIDSVFQDVGSVLDARTKEGEKSPLYATWDDWYVDRVQTTPAG-SAFTVNKDMMEARNMLKANGVQNLTKTQVMAQMRDKLPLASILGSEPMILAQMSWKLEWSKLRALFAASMEHWMPSAFALGQIEEYLPSDCPIGKAA--DAHNVCRRVMEMSTQGVVACIDAKNFNILHTHEIMSAILKSASKMLGDRLSSEQHDCLKWLAKAELNQKVLVKTGEVTEQLLQVGRRDGWINKLTKGDGTVVEAADVTVGMFSGTRFTMLYNTVLNRAYYKVAEKRAKIKTLSLHSGDDVYAVFANYIDVYKMKREMALIGYTLQLGK-CFLQGVREFLRISHKNANTSQYLARSAATAIHGR
+ YAASKPGGYRLRRAAWANSSDFAKDLSDILKSLGLNASSPGPKLVEGNPLLGRGVTNVDWEEEAKNRVDLAVVCRLVLLPMEELRAHIDAVLDE----------LVVRRGLCDPIRLFVKNEPLWCVNGHPDHKL--REGRLRLLSSVSLVDQLVR-RMLFEPQNNNEIAWW----GSVPSKPSMKLEHGKSRAIYACDTRSYLAFEYLLAPVEKAWANKSVILNPGEGDISGFDWSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFER----LRRRLPDEPAEAADWL----------VCSMDSMYQLS----DGTLLAQRVPG------------TLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ +A + A N + K L + + LG P L E L R V +++E R D + L +L ID+V + + L + + G + R + + V L + +++ + ++ +A + ++ S KLE K RA++A ++ + L +E+ + I D V + GV +D +FN H+ E M A+ + L RL E + WL V + + QL + + G + SG R T N+VLN AY ++A S+H GDDV D + + A +G+ + K + EFLR++ + YLAR+ A+ + G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 94
+ 947905036
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 50
+ ds2020-267_595
+ No definition line
+ 219
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 54.0035
+ 130
+ 5.90575e-11
+ 13
+ 210
+ 377
+ 441
+ 1
+ 0
+ 24
+ 32
+ 1
+ 66
+ NNAYLRAAVGKTWYEGALSLHTGDDVFIRANTLADCSVILSDAVAFGCRMNPTKQSIGFYNRLALR
+ NCAYAEL-AGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLR
+ N AY G W + S+H GDDV T AD + +L G ++NP+KQS+G LR
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 51
+ ds2020-267_243
+ No definition line
+ 265
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 52
+ ds2020-267_400
+ No definition line
+ 239
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 53
+ ds2020-267_295
+ No definition line
+ 255
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 54
+ ds2020-267_854
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 55
+ ds2020-267_613
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 56
+ ds2020-267_585
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 57
+ ds2020-267_289
+ No definition line
+ 256
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 58
+ ds2020-267_762
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 59
+ ds2020-267_679
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 60
+ ds2020-267_1118
+ No definition line
+ 68
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 61
+ ds2020-267_574
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 62
+ ds2020-267_1087
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 63
+ ds2020-267_1171
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 64
+ ds2020-267_9
+ No definition line
+ 1660
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 634769058
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 65
+ ds2020-267_771
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 66
+ ds2020-267_50
+ No definition line
+ 510
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 141396120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 67
+ ds2020-267_251
+ No definition line
+ 262
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 68
+ ds2020-267_851
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 69
+ ds2020-267_959
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 70
+ ds2020-267_1075
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.081235584
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 71
+ ds2020-267_357
+ No definition line
+ 244
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 72
+ ds2020-267_781
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 73
+ ds2020-267_411
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 74
+ ds2020-267_219
+ No definition line
+ 273
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 75
+ ds2020-267_622
+ No definition line
+ 217
+
+
+ 1
+ gnl|CDD|379835
+ pfam16363, GDP_Man_Dehyd, GDP-mannose 4,6 dehydratase.
+ 379835
+ 330
+
+
+ 1
+ 55.2369
+ 134
+ 2.10592e-11
+ 29
+ 157
+ 47
+ 89
+ 2
+ 0
+ 12
+ 19
+ 0
+ 43
+ HVRKKLSFHKVDLRDKPALDKLFSSITFDAVIHFAGLKAVGES
+ HLNPNLVLHYGDLTDSSNLERLIAEVQPDEIYNLAAQSHVDVS
+ H+ L H DL D L++L + + D + + A V S
+
+
+
+
+ 2
+ gnl|CDD|366597
+ pfam01370, Epimerase, NAD dependent epimerase/dehydratase family. This family of proteins utilize NAD as a cofactor. The proteins in this family use nucleotide-sugar substrates for a variety of chemical reactions.
+ 366597
+ 234
+
+
+ 1
+ 46.8912
+ 112
+ 1.5719e-08
+ 50
+ 172
+ 43
+ 83
+ 2
+ 0
+ 19
+ 25
+ 0
+ 41
+ FHKVDLRDKPALDKLFSSITFDAVIHFAGLKAVGESAETIA
+ FVEGDLTDRDALEKLFADVQPDAVIHLAAVGGVGASIEDPE
+ F + DL D+ AL+KLF+ + DAVIH A + VG S E
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 76
+ ds2020-267_214
+ No definition line
+ 276
+
+
+ 1
+ gnl|CDD|369639
+ pfam07992, Pyr_redox_2, Pyridine nucleotide-disulphide oxidoreductase. This family includes both class I and class II oxidoreductases and also NADH oxidases and peroxidases. This domain is actually a small NADH binding domain within a larger FAD binding domain.
+ 369639
+ 298
+
+
+ 1
+ 44.2257
+ 105
+ 2.55939e-07
+ 129
+ 254
+ 164
+ 205
+ 3
+ 0
+ 14
+ 21
+ 0
+ 42
+ YCSVWRRLGSEVVVFEAKPEFLAAADKAVSKEAAKLLKAQGV
+ LAAALAKLGKEVTLVEARDRLLRAFDEEISAILEKALEKNGV
+ + +LG EV + EA+ L A D+ +S K L+ GV
+
+
+
+
+ 2
+ gnl|CDD|365851
+ pfam00070, Pyr_redox, Pyridine nucleotide-disulphide oxidoreductase. This family includes both class I and class II oxidoreductases and also NADH oxidases and peroxidases. This domain is actually a small NADH binding domain within a larger FAD binding domain.
+ 365851
+ 79
+
+
+ 1
+ 37.5344
+ 88
+ 1.70856e-05
+ 135
+ 254
+ 16
+ 55
+ 3
+ 0
+ 12
+ 20
+ 0
+ 40
+ SVWRRLGSEVVVFEAKPEFLAAADKAVSKEAAKLLKAQGV
+ GALARLGSKVTVVERRDRLLRGLDEEIAKILQERLEKNGI
+ RLGS+V V E + L D+ ++K + L+ G+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 77
+ ds2020-267_693
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 78
+ ds2020-267_245
+ No definition line
+ 264
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 79
+ ds2020-267_728
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 80
+ ds2020-267_598
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 81
+ ds2020-267_1221
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 82
+ ds2020-267_221
+ No definition line
+ 273
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 83
+ ds2020-267_353
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 84
+ ds2020-267_610
+ No definition line
+ 218
+
+
+ 1
+ gnl|CDD|380005
+ pfam17759, tRNA_synthFbeta, Phenylalanyl tRNA synthetase beta chain CLM domain. This domain corresponds to the catalytic like domain (CLM) in the beta chain of phe tRNA synthetase.
+ 380005
+ 212
+
+
+ 1
+ 60.2461
+ 147
+ 1.47034e-13
+ 25
+ 195
+ 77
+ 131
+ 1
+ 0
+ 23
+ 32
+ 2
+ 57
+ LWTGMLGTIVYNQNRQQNRVRIFESGLRFVPDNQANLGIRQDLLLAGAISGNRYEES
+ LLPGLLEVLAYNLNRGNPDVRLFEIGRVFLPDEEE--LPREERRLAGLLTGKRLPES
+ L G+L + YN NR VR+FE G F+PD + R++ LAG ++G R ES
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 85
+ ds2020-267_46
+ No definition line
+ 530
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 147549155
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 86
+ ds2020-267_549
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 87
+ ds2020-267_1089
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 88
+ ds2020-267_935
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 89
+ ds2020-267_825
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 90
+ ds2020-267_1097
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 91
+ ds2020-267_184
+ No definition line
+ 288
+
+
+
+
+ 17919
+ 3004588
+ 58
+ 74680868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 92
+ ds2020-267_94
+ No definition line
+ 386
+
+
+ 1
+ gnl|CDD|366585
+ pfam01347, Vitellogenin_N, Lipoprotein amino terminal region. This family contains regions from: Vitellogenin, Microsomal triglyceride transfer protein and apolipoprotein B-100. These proteins are all involved in lipid transport. This family contains the LV1n chain from lipovitellin, that contains two structural domains.
+ 366585
+ 582
+
+
+ 1
+ 37.639
+ 88
+ 0.000224462
+ 112
+ 363
+ 208
+ 294
+ 1
+ 0
+ 17
+ 29
+ 5
+ 88
+ PDHVLLKQAYLEGAVVVTPN--PRGHAMLANKQNLTLLSDSQILRSWGLDEAAVERYWNTV--SASP*ANLRSSTSQTSCPSTSASGI
+ LKGFLIQSAETTEKVQVSPFLENSQKAEVESRQNLTLEEVEKTPGLIPPPANPRHRG-SLVYEYETEQASLSQELLQSPSSLSSVPNA
+ L++ A V V+P A + ++QNLTL + R + V + A+L Q+ +S
+
+
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 82866075
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 93
+ ds2020-267_300
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 94
+ ds2020-267_1106
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 95
+ ds2020-267_447
+ No definition line
+ 233
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 96
+ ds2020-267_970
+ No definition line
+ 124
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 97
+ ds2020-267_1068
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 98
+ ds2020-267_663
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 99
+ ds2020-267_1203
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 100
+ ds2020-267_989
+ No definition line
+ 116
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 101
+ ds2020-267_1037
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 102
+ ds2020-267_828
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 103
+ ds2020-267_539
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 104
+ ds2020-267_744
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 105
+ ds2020-267_1188
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 106
+ ds2020-267_890
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 107
+ ds2020-267_708
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 108
+ ds2020-267_1143
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 109
+ ds2020-267_292
+ No definition line
+ 255
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 110
+ ds2020-267_602
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 111
+ ds2020-267_323
+ No definition line
+ 250
+
+
+ 1
+ gnl|CDD|365960
+ pfam00227, Proteasome, Proteasome subunit. The proteasome is a multisubunit structure that degrades proteins. Protein degradation is an essential component of regulation because proteins can become misfolded, damaged, or unnecessary. Proteasomes and their homologs vary greatly in complexity: from HslV (heat shock locus v), which is encoded by 1 gene in bacteria, to the eukaryotic 20S proteasome, which is encoded by more than 14 genes. Recently evidence of two novel groups of bacterial proteasomes was proposed. The first is Anbu, which is sparsely distributed among cyanobacteria and proteobacteria. The second is call beta-proteobacteria proteasome homolog (BPH).
+ 365960
+ 188
+
+
+ 1
+ 47.9435
+ 115
+ 5.8155e-09
+ 10
+ 150
+ 5
+ 51
+ -2
+ 0
+ 17
+ 29
+ 2
+ 48
+ TTIVSVRRNGHVVIAGDGQATLGNTV-MKGNVKKVRRLYNDKVIAGFA
+ TTIVGIKGKDGVVLAADKRATRGSKLLSKDTVEKIFKI-DDHIGMAFA
+ TTIV ++ VV+A D +AT G+ + K V+K+ ++ +D + FA
+
+
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 112
+ ds2020-267_372
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 113
+ ds2020-267_238
+ No definition line
+ 266
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 114
+ ds2020-267_596
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 115
+ ds2020-267_368
+ No definition line
+ 243
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 116
+ ds2020-267_945
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 117
+ ds2020-267_465
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 118
+ ds2020-267_1172
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 119
+ ds2020-267_1014
+ No definition line
+ 86
+
+
+
+
+ 17919
+ 3004588
+ 3
+ 73770775
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 120
+ ds2020-267_932
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 121
+ ds2020-267_168
+ No definition line
+ 298
+
+
+ 1
+ gnl|CDD|379252
+ pfam13546, DDE_5, DDE superfamily endonuclease. This family of proteins are related to pfam00665 and are probably endonucleases of the DDE superfamily. Transposase proteins are necessary for efficient DNA transposition. This domain is a member of the DDE superfamily, which contain three carboxylate residues that are believed to be responsible for coordinating metal ions needed for catalysis. The catalytic activity of this enzyme involves DNA cleavage at a specific site followed by a strand transfer reaction.
+ 379252
+ 266
+
+
+ 1
+ 34.9929
+ 81
+ 0.000766911
+ 54
+ 260
+ 40
+ 130
+ -3
+ 0
+ 22
+ 37
+ 22
+ 91
+ TDSQYRRLQRFIASAVIDYD----QLAILIYRLFGLSKVTITIDRTNW-KWGK----------------SNINIFM-LGVVYKGIAIPLYW
+ HDGSHQALQRFLSRSPWDDARLRRRLARLVLPAIAPEAPVLAIDDTGFPKDGKHSVGVARQYCGVLGKPDNCQVAVSLGLAYERVSAPLDW
+ D ++ LQRF++ + D +LA L+ + ID T + K GK N + + LG+ Y+ ++ PL W
+
+
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 75248472
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 122
+ ds2020-267_95
+ No definition line
+ 382
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 83779944
+ 0.050055168
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 123
+ ds2020-267_831
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 124
+ ds2020-267_200
+ No definition line
+ 281
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 125
+ ds2020-267_690
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 126
+ ds2020-267_105
+ No definition line
+ 370
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 77208968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 127
+ ds2020-267_818
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 128
+ ds2020-267_636
+ No definition line
+ 217
+
+
+ 1
+ gnl|CDD|372443
+ pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR.
+ 372443
+ 50
+
+
+ 1
+ 67.3836
+ 166
+ 7.94482e-18
+ 64
+ 195
+ 5
+ 48
+ -2
+ 0
+ 18
+ 32
+ 0
+ 44
+ TFNIMLKGYFRAGQIKEAWEFFLQMKKRKCEIDVVTYTTLVHGF
+ TYNTLINGYCKNGKVEEAFKLFNEMKKRGIKPNVYTYTILINGL
+ T+N ++ GY + G+++EA++ F +MKKR + +V TYT L++G
+
+
+ 2
+ 40.4196
+ 96
+ 2.82898e-07
+ 13
+ 99
+ 2
+ 30
+ -2
+ 0
+ 14
+ 23
+ 0
+ 29
+ DVVTYTTLVHGFGVVGEIKKARKVFDEMV
+ DVVTYNTLINGYCKNGKVEEAFKLFNEMK
+ DVVTY TL++G+ G++++A K+F+EM
+
+
+
+
+ 2
+ gnl|CDD|372345
+ pfam12854, PPR_1, PPR repeat. This family matches additional variants of the PPR repeat that were not captured by the model for pfam01535. The exact function is not known.
+ 372345
+ 32
+
+
+ 1
+ 46.161
+ 111
+ 1.10553e-09
+ 13
+ 108
+ 1
+ 32
+ -2
+ 0
+ 14
+ 20
+ 0
+ 32
+ CEIDVVTYTTLVHGFGVVGEIKKARKVFDEMV
+ LKPDVVTYNTLIDGLCRAGRVDEAFELFDEME
+ + DVVTY TL+ G G + +A ++FDEM
+
+
+ 2
+ 37.3014
+ 88
+ 4.32035e-06
+ 118
+ 204
+ 4
+ 32
+ -2
+ 0
+ 11
+ 20
+ 0
+ 29
+ NRTTFNIMLKGYFRAGQIKEAWEFFLQMK
+ DVVTYNTLIDGLCRAGRVDEAFELFDEME
+ + T+N ++ G RAG++ EA+E F +M+
+
+
+
+
+ 3
+ gnl|CDD|366695
+ pfam01535, PPR, PPR repeat. This repeat has no known function. It is about 35 amino acids long and found in up to 18 copies in some proteins. This family appears to be greatly expanded in plants. This repeat occurs in PET309 that may be involved in RNA stabilisation. This domain occurs in crp1 that is involved in RNA processing. This repeat is associated with a predicted plant protein that has a domain organisation similar to the human BRCA1 protein. The repeat has been called PPR.
+ 366695
+ 31
+
+
+ 1
+ 40.141
+ 95
+ 3.20398e-07
+ 106
+ 195
+ 2
+ 31
+ -2
+ 0
+ 11
+ 21
+ 0
+ 30
+ TFNIMLKGYFRAGQIKEAWEFFLQMKKRKC
+ TYNSLISGYCKNGKLEEALELFKEMKEKGI
+ T+N ++ GY + G+++EA E F +MK++
+
+
+ 2
+ 35.9038
+ 84
+ 1.47382e-05
+ 13
+ 93
+ 1
+ 27
+ -2
+ 0
+ 10
+ 19
+ 0
+ 27
+ VTYTTLVHGFGVVGEIKKARKVFDEMV
+ VTYNSLISGYCKNGKLEEALELFKEMK
+ VTY +L+ G+ G++++A ++F EM
+
+
+
+
+ 4
+ gnl|CDD|316342
+ pfam13812, PPR_3, Pentatricopeptide repeat domain. This family matches additional variants of the PPR repeat that were not captured by the model for pfam01535. In the case of the Arabidopsis protein UniProtKB:Q66GI4, the repeated helices in this N-terminal region, of protein-only RNase P (PRORP) enzymes, form the pentatricopeptide repeat (PPR) domain which enhances pre-tRNA binding affinity. PROPRP enzymes process precursor tRNAs in human mitochondria and in all tRNA-using compartments of Arabidopsis thaliana.
+ 316342
+ 63
+
+
+ 1
+ 36.1819
+ 84
+ 1.92367e-05
+ 16
+ 123
+ 6
+ 41
+ -2
+ 0
+ 13
+ 23
+ 0
+ 36
+ MKKRKCEIDVVTYTTLVHGFGVVGEIKKARKVFDEM
+ MVRDGIQLNVNTYTHLLHAYANVGNLKLALEIFERM
+ M + +++V TYT L+H + VG +K A ++F+ M
+
+
+ 2
+ 34.2559
+ 79
+ 0.000111468
+ 61
+ 195
+ 17
+ 61
+ -2
+ 0
+ 14
+ 23
+ 0
+ 45
+ TFNIMLKGYFRAGQIKEAWEFFLQMKKRKCEIDVVTYTTLVHGFG
+ TYTHLLHAYANVGNLKLALEIFERMKKKGIKPTLDTYNAILGVIG
+ T+ +L Y G +K A E F +MKK+ + + TY ++ G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 129
+ ds2020-267_358
+ No definition line
+ 244
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 130
+ ds2020-267_603
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 131
+ ds2020-267_1181
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 132
+ ds2020-267_486
+ No definition line
+ 228
+
+
+ 1
+ gnl|CDD|374956
+ pfam17035, BET, Bromodomain extra-terminal - transcription regulation. The BET, or bromodomain extra-terminal domain, is found on bromodomain proteins that play key roles in development, cancer progression and virus-host pathogenesis. It interacts with NSD3, JMJD6, CHD4, GLTSCR1, and ATAD5 all of which are shown to impart a pTEFb-independent transcriptional activation function on the bromodomain proteins.
+ 374956
+ 64
+
+
+ 1
+ 45.5577
+ 109
+ 5.12677e-09
+ 108
+ 203
+ 1
+ 32
+ 3
+ 0
+ 13
+ 21
+ 0
+ 32
+ EMSMEEKHKLGVGLQSLPKDKMEQVV*MIKKR
+ PMTYEEKRELSERINKLPGEKLGRVVEIIKER
+ M+ EEK +L + LP +K+ +VV +IK+R
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 133
+ ds2020-267_599
+ No definition line
+ 219
+
+
+ 1
+ gnl|CDD|377551
+ pfam05717, TnpB_IS66, IS66 Orf2 like protein. This protein is found in insertion sequences related to IS66. The function of these proteins is uncertain, but they are probably essential for transposition.
+ 377551
+ 100
+
+
+ 1
+ 38.9712
+ 92
+ 3.2952e-06
+ 28
+ 147
+ 9
+ 49
+ 1
+ 0
+ 13
+ 24
+ 3
+ 42
+ PMDMRSGSNKLLAFILEKHHGIKPHC--AYLFYNKTGTRLKV
+ PTDMRKGIDGLAA-LVQEVLGLDPFSGHLFVFRNRRRDRIKI
+ P DMR G + L A ++++ G+ P ++F N+ R+K+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 134
+ ds2020-267_1071
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 135
+ ds2020-267_906
+ No definition line
+ 141
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 136
+ ds2020-267_277
+ No definition line
+ 258
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 137
+ ds2020-267_359
+ No definition line
+ 244
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 138
+ ds2020-267_82
+ No definition line
+ 414
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 96414360
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 139
+ ds2020-267_704
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 140
+ ds2020-267_1023
+ No definition line
+ 79
+
+
+
+
+ 17919
+ 3004588
+ 1
+ 74666725
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 141
+ ds2020-267_35
+ No definition line
+ 657
+
+
+
+
+ 17919
+ 3004588
+ 83
+ 206354296
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 142
+ ds2020-267_635
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 143
+ ds2020-267_288
+ No definition line
+ 256
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 144
+ ds2020-267_99
+ No definition line
+ 378
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 82137200
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 145
+ ds2020-267_785
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 146
+ ds2020-267_837
+ No definition line
+ 207
+
+
+ 1
+ gnl|CDD|367791
+ pfam04061, ORMDL, ORMDL family. Evidence form suggests that ORMDLs are involved in protein folding in the ER. Orm proteins have been identified as negative regulators of sphingolipid synthesis that form a conserved complex with serine palmitoyltransferase, the first and rate-limiting enzyme in sphingolipid production. This novel and conserved protein complex, has been termed the SPOTS complex (serine palmitoyltransferase, Orm1/2, Tsc3, and Sac1).
+ 367791
+ 135
+
+
+ 1
+ 70.6546
+ 174
+ 2.43363e-18
+ 1
+ 159
+ 83
+ 135
+ 1
+ 0
+ 25
+ 37
+ 0
+ 53
+ QHVRNRKFLTVVPVVLYLIASHTTDYQHPMLFFNSLAVIVLVIAKFSNMHKVR
+ QYTPTRKFLTVVPIVLFLLSTHYTKYDLTLFIINFIALLVVVIPKLPFMHRVR
+ Q+ RKFLTVVP+VL+L+++H T Y + N +A++V+VI K MH+VR
+
+
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 147
+ ds2020-267_382
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 148
+ ds2020-267_263
+ No definition line
+ 260
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 149
+ ds2020-267_67
+ No definition line
+ 460
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 117585038
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 150
+ ds2020-267_979
+ No definition line
+ 121
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 151
+ ds2020-267_992
+ No definition line
+ 114
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 152
+ ds2020-267_883
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 153
+ ds2020-267_699
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 154
+ ds2020-267_516
+ No definition line
+ 225
+
+
+ 1
+ gnl|CDD|376293
+ pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I.
+ 376293
+ 433
+
+
+ 1
+ 35.2292
+ 82
+ 0.000272517
+ 21
+ 101
+ 1
+ 27
+ -2
+ 0
+ 11
+ 18
+ 0
+ 27
+ RVVRQFSVMAVVWGIVGMLVGVVIATQ
+ RIGLLYLVTALVWFLVGGLLGLLIRLQ
+ R+ + V A+VW +VG L+G++I Q
+
+
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 155
+ ds2020-267_192
+ No definition line
+ 284
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 156
+ ds2020-267_957
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 157
+ ds2020-267_572
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 158
+ ds2020-267_721
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 159
+ ds2020-267_469
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 160
+ ds2020-267_385
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 161
+ ds2020-267_48
+ No definition line
+ 525
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 145996006
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 162
+ ds2020-267_472
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 163
+ ds2020-267_40
+ No definition line
+ 586
+
+
+
+
+ 17919
+ 3004588
+ 82
+ 173480990
+ 0.050180004
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 164
+ ds2020-267_1101
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 165
+ ds2020-267_898
+ No definition line
+ 147
+
+
+
+
+ 17919
+ 3004588
+ 21
+ 73592092
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 166
+ ds2020-267_136
+ No definition line
+ 322
+
+
+
+
+ 17919
+ 3004588
+ 66
+ 74699294
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 167
+ ds2020-267_344
+ No definition line
+ 246
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 168
+ ds2020-267_1053
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 169
+ ds2020-267_806
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 170
+ ds2020-267_1179
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 171
+ ds2020-267_793
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 172
+ ds2020-267_1224
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 173
+ ds2020-267_1200
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 174
+ ds2020-267_124
+ No definition line
+ 337
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 73510836
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 175
+ ds2020-267_732
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 176
+ ds2020-267_529
+ No definition line
+ 224
+
+
+ 1
+ gnl|CDD|366140
+ pfam00510, COX3, Cytochrome c oxidase subunit III.
+ 366140
+ 258
+
+
+ 1
+ 85.9226
+ 213
+ 6.14777e-23
+ 35
+ 211
+ 127
+ 185
+ 2
+ 0
+ 30
+ 39
+ 0
+ 59
+ PFLNTPILLSSGAAVTWAHHAILAGKEKRAVYALVATVSLALVFTGFQGMEYYQAPVNI
+ PLLNTIILLSSGVTVTYAHHSLIEGNRKQALQGLFITILLGVYFTGLQAMEYTEASFTI
+ P LNT ILLSSG VT+AHH+++ G K+A+ L T+ L + FTG Q MEY +A I
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 177
+ ds2020-267_779
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 178
+ ds2020-267_160
+ No definition line
+ 304
+
+
+
+
+ 17919
+ 3004588
+ 62
+ 73850790
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 179
+ ds2020-267_230
+ No definition line
+ 268
+
+
+ 1
+ gnl|CDD|376293
+ pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I.
+ 376293
+ 433
+
+
+ 1
+ 67.586
+ 166
+ 1.95663e-15
+ 81
+ 236
+ 34
+ 84
+ -3
+ 0
+ 29
+ 35
+ 1
+ 52
+ QLYNVLITAHAFLMIFFMVMPAMIGGSGNWSVPILIGAPDMAFPRLNNISFW
+ LTYNQLRTLHGNLMIFWFATPFIFGF-GNYLVPLMIGARDMAFPRLNALSFW
+ YN L T H LMIF+ P + G GN+ VP++IGA DMAFPRLN +SFW
+
+
+
+
+
+
+ 17919
+ 3004588
+ 53
+ 73975716
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 180
+ ds2020-267_93
+ No definition line
+ 387
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 84490900
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 181
+ ds2020-267_49
+ No definition line
+ 517
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 144538256
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 182
+ ds2020-267_1082
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 183
+ ds2020-267_1063
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 184
+ ds2020-267_896
+ No definition line
+ 152
+
+
+
+
+ 17919
+ 3004588
+ 21
+ 76220381
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 185
+ ds2020-267_159
+ No definition line
+ 305
+
+
+
+
+ 17919
+ 3004588
+ 62
+ 73850790
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 186
+ ds2020-267_1047
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 187
+ ds2020-267_347
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 188
+ ds2020-267_444
+ No definition line
+ 233
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 34.2545
+ 79
+ 0.00060937
+ 51
+ 155
+ 281
+ 315
+ -1
+ 0
+ 14
+ 22
+ 0
+ 35
+ GYLVNLFGTMPSGSYYTSLINTNANNMLILGHLID
+ GTIIKVEGGLPSGQPATSVINSILNNIYVLYALIK
+ G ++ + G +PSG TS+IN+ NN+ +L LI
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 189
+ ds2020-267_814
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 190
+ ds2020-267_302
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 191
+ ds2020-267_169
+ No definition line
+ 298
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 75248472
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 192
+ ds2020-267_396
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 193
+ ds2020-267_942
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 194
+ ds2020-267_378
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 195
+ ds2020-267_308
+ No definition line
+ 253
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 196
+ ds2020-267_722
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 197
+ ds2020-267_156
+ No definition line
+ 307
+
+
+
+
+ 17919
+ 3004588
+ 62
+ 75744400
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 198
+ ds2020-267_336
+ No definition line
+ 248
+
+
+ 1
+ gnl|CDD|365883
+ pfam00113, Enolase_C, Enolase, C-terminal TIM barrel domain.
+ 365883
+ 296
+
+
+ 1
+ 60.1682
+ 146
+ 4.23282e-13
+ 15
+ 116
+ 187
+ 220
+ -1
+ 0
+ 21
+ 27
+ 0
+ 34
+ SNTKILKEGIDKKIANSILIKFNQIGTLTETLEA
+ TNPKRLKTAIEKKAANSLLLKVNQIGSLTESLAA
+ +N K LK I+KK ANS+L+K NQIG+LTE+L A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 199
+ ds2020-267_658
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 200
+ ds2020-267_1003
+ No definition line
+ 106
+
+
+
+
+ 17919
+ 3004588
+ 9
+ 73926242
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 201
+ ds2020-267_561
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 202
+ ds2020-267_712
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 203
+ ds2020-267_365
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|372443
+ pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR.
+ 372443
+ 50
+
+
+ 1
+ 34.2564
+ 80
+ 0.000129396
+ 49
+ 186
+ 5
+ 50
+ -1
+ 0
+ 8
+ 21
+ 0
+ 46
+ ICNNMIRAYTNSVFPIKAIHIYNYMQETNVRSDHFTYNFALKACAR
+ TYNTLINGYCKNGKVEEAFKLFNEMKKRGIKPNVYTYTILINGLCK
+ N +I Y + +A ++N M++ ++ + +TY + +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 204
+ ds2020-267_75
+ No definition line
+ 425
+
+
+ 1
+ gnl|CDD|365804
+ pfam00005, ABC_tran, ABC transporter. ABC transporters for a large family of proteins responsible for translocation of a variety of compounds across biological membranes. ABC transporters are the largest family of proteins in many completely sequenced bacteria. ABC transporters are composed of two copies of this domain and two copies of a transmembrane domain pfam00664. These four domains may belong to a single polypeptide as in CFTR, or belong in different polypeptide chains.
+ 365804
+ 150
+
+
+ 1
+ 44.5558
+ 106
+ 4.26261e-07
+ 129
+ 275
+ 19
+ 64
+ -1
+ 0
+ 13
+ 22
+ 3
+ 49
+ SNGEGKSTLFKVISGQVKADSGEFQISGNLKIAMLEQDIPETSGKVSDI
+ PNGAGKSTLLKLISGLLSPTEGTILLDGQ---DLTDDERKSLRKEIGYV
+ NG GKSTL K+ISG + G + G + + + ++ +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 101235078
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 205
+ ds2020-267_787
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 206
+ ds2020-267_140
+ No definition line
+ 319
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 75433973
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 207
+ ds2020-267_174
+ No definition line
+ 291
+
+
+
+
+ 17919
+ 3004588
+ 59
+ 73999946
+ 0.06226824
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 208
+ ds2020-267_237
+ No definition line
+ 266
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 209
+ ds2020-267_8
+ No definition line
+ 1703
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 70.078
+ 172
+ 2.85682e-13
+ 685
+ 1458
+ 100
+ 348
+ -3
+ 0
+ 54
+ 102
+ 41
+ 274
+ SAMPTTTSPGFPWVNQGYKTKAEVFADPVATGKIHR----AWDSIGRGIPW------SLPDCLAFNRVVASEQPNVKVRPVWGYPTDVILEEARFFIPLFSELKELCNREDACYGIGMETMKSGHSHLARSMIDNIVSLTTDFSRFDANVTHWIIRDTFSFISDWFDFSKVRDSEGIVWNVRSDQTARRWKAMVSYFINTKIRTPRGLRVQKSTGIPSGSMWTNLLDTIVNAVQMRTAIYRVTGALPVKDYY------YGDDSSIFLDRPIDLV
+ DALNKDTSPGLPYILEG-GKKRDLVKDEEADKVLLKAAYEALKLAENGEGLPGVYTTCLKDELRPLEKVQAG----KTRLFWGCPVEVNLVARAVFGPFCNKIYS--NALKLGIAVGINPFSRDWERLGALIRKGSDVLDVDYSAFDSTLSPFVFDLVEDIRSEFCGGLE---------------PTRLALLEL---LSNPIHILGGTIIKVEGGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVNPDVDSV
+ A+ TSPG P++ +G K ++ D A + + A G L D L V + K R WG P +V L F P +++ N +G+ L + L D+S FD+ ++ ++ S++ + R + ++ I G ++ G+PSG T+++++I+N + + A+ + TG + D+ YGDD+ + ++ +D V
+
+
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 654004484
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 210
+ ds2020-267_1074
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 211
+ ds2020-267_119
+ No definition line
+ 342
+
+
+
+
+ 17919
+ 3004588
+ 71
+ 74490577
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 212
+ ds2020-267_1098
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 213
+ ds2020-267_528
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 214
+ ds2020-267_326
+ No definition line
+ 250
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 215
+ ds2020-267_913
+ No definition line
+ 135
+
+
+
+
+ 17919
+ 3004588
+ 17
+ 75599020
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 216
+ ds2020-267_981
+ No definition line
+ 120
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 217
+ ds2020-267_1247
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 218
+ ds2020-267_894
+ No definition line
+ 160
+
+
+
+
+ 17919
+ 3004588
+ 24
+ 74661428
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 219
+ ds2020-267_335
+ No definition line
+ 248
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 220
+ ds2020-267_743
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 221
+ ds2020-267_547
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 222
+ ds2020-267_804
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 223
+ ds2020-267_414
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 224
+ ds2020-267_1039
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 225
+ ds2020-267_1142
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 226
+ ds2020-267_476
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 227
+ ds2020-267_1032
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 228
+ ds2020-267_114
+ No definition line
+ 347
+
+
+ 1
+ gnl|CDD|376336
+ pfam00471, Ribosomal_L33, Ribosomal protein L33.
+ 376336
+ 47
+
+
+ 1
+ 53.6312
+ 130
+ 8.05888e-12
+ 132
+ 302
+ 1
+ 47
+ 3
+ 0
+ 25
+ 31
+ 10
+ 57
+ VTVILECTSCLRNRVNKESTGISRYITQKNRHNTPGRLKLRKFCPCCYKHTIHGEIK
+ VKITLACTECKE----------RNYTTTKNKKNTPERLELKKYCPKCRKHTLHKETK
+ V + L CT C Y T KN+ NTP RL+L+K+CP C KHT+H E K
+
+
+
+
+
+
+ 17919
+ 3004588
+ 72
+ 73720060
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 229
+ ds2020-267_864
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 230
+ ds2020-267_1086
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 231
+ ds2020-267_1138
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 232
+ ds2020-267_897
+ No definition line
+ 150
+
+
+
+
+ 17919
+ 3004588
+ 21
+ 76220381
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 233
+ ds2020-267_1128
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 234
+ ds2020-267_737
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 235
+ ds2020-267_589
+ No definition line
+ 219
+
+
+ 1
+ gnl|CDD|378823
+ pfam12161, HsdM_N, HsdM N-terminal domain. This domain is found at the N-terminus of the methylase subunit of Type I DNA methyltransferases. This domain family is found in bacteria and archaea, and is typically between 123 and 138 amino acids in length. The family is found in association with pfam02384. Mutations in this region of EcoKI methyltransferase abolish the normally strong preference of this system for methylating hemimethylated substrate. The structure of this domain has been shown to be all alpha-helical.
+ 378823
+ 134
+
+
+ 1
+ 33.892
+ 78
+ 0.0004347
+ 11
+ 148
+ 58
+ 101
+ 2
+ 0
+ 10
+ 19
+ 2
+ 46
+ RKESGFVFYNTNKWTLKKLKESASNNQQLLLSNFEEYLNGFSAKSK
+ PLDAGFGFYIPSELRWSKLLNNDDGDE--LGENLNDAFPGLSELNP
+ ++GF FY ++ KL + ++ L N + G S +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 236
+ ds2020-267_259
+ No definition line
+ 261
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 237
+ ds2020-267_971
+ No definition line
+ 123
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 238
+ ds2020-267_477
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 239
+ ds2020-267_1000
+ No definition line
+ 107
+
+
+
+
+ 17919
+ 3004588
+ 9
+ 73926242
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 240
+ ds2020-267_96
+ No definition line
+ 382
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 83779944
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 241
+ ds2020-267_668
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 242
+ ds2020-267_30
+ No definition line
+ 721
+
+
+
+
+ 17919
+ 3004588
+ 84
+ 233905152
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 243
+ ds2020-267_646
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 244
+ ds2020-267_166
+ No definition line
+ 298
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 75248472
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 245
+ ds2020-267_206
+ No definition line
+ 279
+
+
+ 1
+ gnl|CDD|377170
+ pfam03947, Ribosomal_L2_C, Ribosomal Proteins L2, C-terminal domain.
+ 377170
+ 126
+
+
+ 1
+ 66.2303
+ 163
+ 2.63457e-16
+ 155
+ 265
+ 10
+ 46
+ 2
+ 0
+ 22
+ 29
+ 0
+ 37
+ DMPLGTAIHNIEITLGKSGQLARAAGAVAKLIAKEGK
+ NIPEGTIIHNIELKPGDGGQLARSAGTYAQIVAKEGK
+ ++P GT IHNIE+ G GQLAR+AG A+++AKEGK
+
+
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 246
+ ds2020-267_757
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 247
+ ds2020-267_1052
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 248
+ ds2020-267_591
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 249
+ ds2020-267_1056
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 250
+ ds2020-267_508
+ No definition line
+ 226
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.050180004
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 251
+ ds2020-267_1131
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 252
+ ds2020-267_320
+ No definition line
+ 250
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 253
+ ds2020-267_836
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 254
+ ds2020-267_661
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 255
+ ds2020-267_951
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 256
+ ds2020-267_944
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 257
+ ds2020-267_1206
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 258
+ ds2020-267_1197
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 259
+ ds2020-267_47
+ No definition line
+ 528
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 147549155
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 260
+ ds2020-267_193
+ No definition line
+ 284
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 261
+ ds2020-267_1184
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 262
+ ds2020-267_1043
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 263
+ ds2020-267_946
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 264
+ ds2020-267_673
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 265
+ ds2020-267_1164
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 266
+ ds2020-267_544
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 267
+ ds2020-267_634
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 268
+ ds2020-267_1189
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 269
+ ds2020-267_1132
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 270
+ ds2020-267_316
+ No definition line
+ 251
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 46.6847
+ 111
+ 3.50628e-08
+ 28
+ 228
+ 377
+ 444
+ -3
+ 0
+ 26
+ 34
+ 1
+ 68
+ NAVYTDFMLGPMKEVGSSLHNGDDVLLGTTSLEITRFTLQRGQRLCIRTQPSKCAFGA-IAEFLRVDH
+ NCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAF
+ N Y + P +V +S+H GDDVL G + L + RL + PSK + G IAEFLRV
+
+
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 271
+ ds2020-267_338
+ No definition line
+ 247
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 272
+ ds2020-267_85
+ No definition line
+ 411
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 97489500
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 273
+ ds2020-267_967
+ No definition line
+ 124
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 274
+ ds2020-267_783
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 275
+ ds2020-267_1239
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 276
+ ds2020-267_968
+ No definition line
+ 124
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 277
+ ds2020-267_109
+ No definition line
+ 357
+
+
+
+
+ 17919
+ 3004588
+ 74
+ 75536190
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 278
+ ds2020-267_1162
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 279
+ ds2020-267_1001
+ No definition line
+ 107
+
+
+
+
+ 17919
+ 3004588
+ 9
+ 73926242
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 280
+ ds2020-267_445
+ No definition line
+ 233
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 281
+ ds2020-267_739
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 282
+ ds2020-267_17
+ No definition line
+ 1094
+
+
+
+
+ 17919
+ 3004588
+ 88
+ 394049616
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 283
+ ds2020-267_1042
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 284
+ ds2020-267_706
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 285
+ ds2020-267_10
+ No definition line
+ 1619
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 615533632
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 286
+ ds2020-267_802
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 287
+ ds2020-267_1182
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 288
+ ds2020-267_730
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 289
+ ds2020-267_807
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 290
+ ds2020-267_1232
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 291
+ ds2020-267_467
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 292
+ ds2020-267_875
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 293
+ ds2020-267_880
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 294
+ ds2020-267_652
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.050180004
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 295
+ ds2020-267_481
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 296
+ ds2020-267_697
+ No definition line
+ 214
+
+
+ 1
+ gnl|CDD|334046
+ pfam00378, ECH_1, Enoyl-CoA hydratase/isomerase. This family contains a diverse set of enzymes including: enoyl-CoA hydratase, napthoate synthase, carnitate racemase, 3-hydroxybutyryl-CoA dehydratase and dodecanoyl-CoA delta-isomerase.
+ 334046
+ 251
+
+
+ 1
+ 45.4314
+ 108
+ 5.08319e-08
+ 45
+ 170
+ 89
+ 130
+ -3
+ 0
+ 17
+ 24
+ 0
+ 42
+ KPYVVAVQGLCFTAGIELMLNADIVIASDDSCFAQMEVKRGL
+ KPVIAAVNGYAIGGGCELALACDIIIAADNASFGLNEILIGI
+ KP + AV G G EL L DI+IA+D++ F E+ G+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 297
+ ds2020-267_398
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 298
+ ds2020-267_207
+ No definition line
+ 278
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 299
+ ds2020-267_655
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 300
+ ds2020-267_858
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 301
+ ds2020-267_686
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 302
+ ds2020-267_53
+ No definition line
+ 492
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 131969712
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 303
+ ds2020-267_666
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 304
+ ds2020-267_191
+ No definition line
+ 284
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 305
+ ds2020-267_1005
+ No definition line
+ 99
+
+
+
+
+ 17919
+ 3004588
+ 7
+ 74858030
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 306
+ ds2020-267_296
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 307
+ ds2020-267_146
+ No definition line
+ 313
+
+
+
+
+ 17919
+ 3004588
+ 64
+ 74310880
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 308
+ ds2020-267_318
+ No definition line
+ 251
+
+
+ 1
+ gnl|CDD|376306
+ pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e.
+ 376306
+ 124
+
+
+ 1
+ 54.7265
+ 133
+ 5.63854e-12
+ 78
+ 206
+ 81
+ 124
+ -1
+ 0
+ 23
+ 28
+ 1
+ 44
+ MGSGKGSPEYWVAVVKPCRIL-SAMSGVAENIARRAISIEASKM
+ MGKGKGKPEGWVARVKPGRILFEIRGGVHEEVAKEALRLAAHKL
+ MG GKG PE WVA VKP RIL GV E +A+ A+ + A K+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 309
+ ds2020-267_1050
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 310
+ ds2020-267_819
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 311
+ ds2020-267_809
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 312
+ ds2020-267_857
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 313
+ ds2020-267_725
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 314
+ ds2020-267_991
+ No definition line
+ 114
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 315
+ ds2020-267_20
+ No definition line
+ 893
+
+
+ 1
+ gnl|CDD|376291
+ pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho.
+ 376291
+ 212
+
+
+ 1
+ 160.19
+ 407
+ 4.59259e-49
+ 498
+ 866
+ 1
+ 113
+ 3
+ 0
+ 44
+ 69
+ 10
+ 123
+ GLKAVDSLVPIGRGQRELIIGDRQTGKTAIAIDTILNQKQLNSRATSESETLYCVYVAIGQKRSTVAQLVQILSEANALEYSILVAATASDPAPLQFLAPYSGCAMGEYFRDNGMHALITYDN
+ GIRAIDGLLPIGRGQRIGIFGGSGVGKTVLA-GMIARQASAD---------VVVVYALIGERGREVREFIEELLESGALKRTVVVVATSDEPPLARYLAPYTALTIAEYFRDQGKDVLLIMDS
+ G++A+D L+PIGRGQR I G GKT +A I Q + + VY IG++ V + ++ L E+ AL+ +++V AT+ +P ++LAPY+ + EYFRD G L+ D+
+
+
+
+
+ 2
+ gnl|CDD|367225
+ pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella.
+ 367225
+ 69
+
+
+ 1
+ 76.7994
+ 190
+ 7.30466e-19
+ 126
+ 329
+ 2
+ 69
+ 3
+ 0
+ 32
+ 39
+ 0
+ 68
+ VDEIGRVVSVGDGIARVYGLNEIQAGEMVEFASGVKGIALNLENENVGIVVFGSDTAIKEGDLVKRTG
+ VQVIGPVVDVEFGIGRLPGLLNALEVELVEFGTGVLGEVLNLGEDKVRVQVFGGTSGLSRGDEVKRTG
+ V IG VV V GI R+ GL E+VEF +GV G LNL + V + VFG + + GD VKRTG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 86
+ 308809894
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 316
+ ds2020-267_982
+ No definition line
+ 119
+
+
+
+
+ 17919
+ 3004588
+ 12
+ 75318120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 317
+ ds2020-267_215
+ No definition line
+ 275
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 318
+ ds2020-267_1139
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 319
+ ds2020-267_434
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 320
+ ds2020-267_86
+ No definition line
+ 408
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 95864675
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 321
+ ds2020-267_484
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 322
+ ds2020-267_1129
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 323
+ ds2020-267_551
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 324
+ ds2020-267_545
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 325
+ ds2020-267_900
+ No definition line
+ 142
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 326
+ ds2020-267_731
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 327
+ ds2020-267_394
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 328
+ ds2020-267_1069
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 329
+ ds2020-267_329
+ No definition line
+ 249
+
+
+ 1
+ gnl|CDD|379049
+ pfam13173, AAA_14, AAA domain. This family of domains contain a P-loop motif that is characteristic of the AAA superfamily.
+ 379049
+ 128
+
+
+ 1
+ 44.8626
+ 107
+ 4.80752e-08
+ 106
+ 249
+ 8
+ 51
+ 1
+ 0
+ 17
+ 24
+ 4
+ 48
+ TGVRRSGKSVLLMQYRDYLLSQQISAENIIYINFESFEYQWVKVADVL
+ TGPRQVGKTTLLKQLAKELLPP----ENILYINLDDPRLLELADFELL
+ TG R+ GK+ LL Q LL ENI+YIN + + ++L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 366
+ ds2020-267_74
+ No definition line
+ 425
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 101235078
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 367
+ ds2020-267_714
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 368
+ ds2020-267_130
+ No definition line
+ 330
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 38.1065
+ 89
+ 7.64962e-05
+ 124
+ 282
+ 203
+ 255
+ 1
+ 0
+ 18
+ 30
+ 2
+ 54
+ TTPIKVGM-PLNGFWLSKLFSKHARCQMHIEGDFEAFDSTISGSVVDLIKDVRK
+ KLGIAVGINPFSRDW-ERLGALIRKGSDVLDVDYSAFDSTLSPFVFDLVEDIRS
+ I VG+ P + W +L + + ++ D+ AFDST+S V DL++D+R
+
+
+
+
+
+
+ 17919
+ 3004588
+ 68
+ 75016032
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 369
+ ds2020-267_247
+ No definition line
+ 264
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 370
+ ds2020-267_1062
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 371
+ ds2020-267_183
+ No definition line
+ 288
+
+
+
+
+ 17919
+ 3004588
+ 58
+ 74680868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 372
+ ds2020-267_995
+ No definition line
+ 111
+
+
+
+
+ 17919
+ 3004588
+ 10
+ 76285746
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 373
+ ds2020-267_717
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 374
+ ds2020-267_720
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 375
+ ds2020-267_280
+ No definition line
+ 257
+
+
+ 1
+ gnl|CDD|366811
+ pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain.
+ 366811
+ 38
+
+
+ 1
+ 46.2086
+ 110
+ 2.47901e-09
+ 132
+ 224
+ 1
+ 31
+ -1
+ 0
+ 22
+ 27
+ 0
+ 31
+ DTTGRIPLWIIGTVAGILVIGLIGIFFYGSY
+ SGTGRIPLWLVATVAGLGVIGVVGIFFYGSY
+ TGRIPLW++ TVAG+ VIG++GIFFYGSY
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 408
+ ds2020-267_28
+ No definition line
+ 727
+
+
+
+
+ 17919
+ 3004588
+ 84
+ 236903936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 409
+ ds2020-267_696
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 410
+ ds2020-267_100
+ No definition line
+ 376
+
+
+ 1
+ gnl|CDD|376940
+ pfam02823, ATP-synt_DE_N, ATP synthase, Delta/Epsilon chain, beta-sandwich domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. The subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213).
+ 376940
+ 79
+
+
+ 1
+ 48.1873
+ 116
+ 3.06167e-09
+ 228
+ 347
+ 39
+ 79
+ -3
+ 0
+ 15
+ 26
+ 1
+ 41
+ TAVDIGILRIRL-NDQWLTMALMGGFARIGNNEITVLVNDA
+ TALKPGVLRIKTADGEEEYIAVSGGFLEVQPNEVTILADTA
+ TA+ G+LRI+ + + +A+ GGF + NE+T+L + A
+
+
+
+
+ 2
+ gnl|CDD|366077
+ pfam00401, ATP-synt_DE, ATP synthase, Delta/Epsilon chain, long alpha-helix domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. This subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213).
+ 366077
+ 45
+
+
+ 1
+ 35.8096
+ 84
+ 8.90041e-05
+ 87
+ 218
+ 1
+ 45
+ -3
+ 0
+ 16
+ 23
+ 1
+ 45
+ SDIDPQEAQQTLEIAEANLRKAEGKRQ-TIEANLALRRARTRVEA
+ EDIDEERAEEAKERAEERLAQAKQDDIDYARAQAALARALARLQA
+ DID + A++ E AE L +A+ A AL RA R++A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 80494456
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 430
+ ds2020-267_926
+ No definition line
+ 130
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 431
+ ds2020-267_436
+ No definition line
+ 234
+
+
+ 1
+ gnl|CDD|365910
+ pfam00155, Aminotran_1_2, Aminotransferase class I and II.
+ 365910
+ 356
+
+
+ 1
+ 35.3773
+ 82
+ 0.000283584
+ 12
+ 191
+ 276
+ 329
+ -2
+ 0
+ 13
+ 24
+ 6
+ 60
+ QQRNIAIERLNAIKGISCTMPQGAFYCFPKIDRDIYPIEDDMQFMMELLLQEKVLMVTGT
+ KRRDYLRDGLQAA-GLSVLPSQAGFFLLTGLDP-----ETAKELAQVLLEEVGVYVTPGS
+ ++R+ + L A G+S Q F+ +D E + LL + V + G+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 432
+ ds2020-267_158
+ No definition line
+ 305
+
+
+
+
+ 17919
+ 3004588
+ 62
+ 73850790
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 433
+ ds2020-267_996
+ No definition line
+ 109
+
+
+
+
+ 17919
+ 3004588
+ 10
+ 73460348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 434
+ ds2020-267_1076
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 435
+ ds2020-267_871
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 436
+ ds2020-267_748
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 437
+ ds2020-267_210
+ No definition line
+ 276
+
+
+ 1
+ gnl|CDD|375428
+ pfam17917, RT_RNaseH, RNase H-like domain found in reverse transcriptase. DNA polymerase and ribonuclease H (RNase H) activities allow reverse transcriptases to convert the single-stranded retroviral RNA genome into double-stranded DNA, which is integrated into the host chromosome during infection. This entry represents the RNase H like domain.
+ 375428
+ 103
+
+
+ 1
+ 58.6334
+ 143
+ 1.59337e-13
+ 52
+ 240
+ 12
+ 76
+ 1
+ 0
+ 25
+ 34
+ 4
+ 66
+ AS---MSCVLGQHDETGRKERALYYLSKKFTDYETRYTVLEKTCCALTRASQRLRHYMLNYTTMLI
+ ASDYGIGAVLSQEDEDG-KERPIAYASRKLTPAERNYSTTEKELLAIVWALKKFRHYLLGRKFTVY
+ AS + VL Q DE G KER + Y S+K T E Y+ EK A+ A ++ RHY+L +
+
+
+
+
+ 2
+ gnl|CDD|375430
+ pfam17919, RT_RNaseH_2, RNase H-like domain found in reverse transcriptase.
+ 375430
+ 100
+
+
+ 1
+ 51.7059
+ 125
+ 6.42624e-11
+ 52
+ 237
+ 37
+ 100
+ 1
+ 0
+ 21
+ 33
+ 4
+ 65
+ AS---MSCVLGQHDETGRKERALYYLSKKFTDYETRYTVLEKTCCALTRASQRLRHYMLNYTTML
+ ASDYGIGAVLSQEDD-GGGERPIAFASRKLSPAERNYSTTEKELLAIVWALKKFRHYLLGRKFTI
+ AS + VL Q D+ G ER + + S+K + E Y+ EK A+ A ++ RHY+L +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 438
+ ds2020-267_1223
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 439
+ ds2020-267_246
+ No definition line
+ 264
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 440
+ ds2020-267_856
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 441
+ ds2020-267_58
+ No definition line
+ 476
+
+
+ 1
+ gnl|CDD|367590
+ pfam03641, Lysine_decarbox, Possible lysine decarboxylase. The members of this family share a highly conserved motif PGGXGTXXE that is probably functionally important. This family includes proteins annotated as lysine decarboxylases, although the evidence for this is not clear.
+ 367590
+ 128
+
+
+ 1
+ 62.6055
+ 153
+ 7.19579e-14
+ 142
+ 315
+ 1
+ 58
+ -3
+ 0
+ 25
+ 35
+ 0
+ 58
+ VADGVIEKNGIAVGVIPEFMMDREVAHGGLTRLHLTDTMHTSKAIMAEYASAFITLPG
+ VADGALEAGGRVIGIIPNILLPEEIPNPNVTELIIVPDMHERKAKMAELADAFVALPG
+ VADG +E G +G+IP ++ E+ + +T L + MH KA MAE A AF+ LPG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 125529973
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 442
+ ds2020-267_903
+ No definition line
+ 142
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 443
+ ds2020-267_413
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 444
+ ds2020-267_733
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 445
+ ds2020-267_754
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 446
+ ds2020-267_299
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 447
+ ds2020-267_36
+ No definition line
+ 651
+
+
+
+
+ 17919
+ 3004588
+ 83
+ 203319674
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 448
+ ds2020-267_1166
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 449
+ ds2020-267_451
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 450
+ ds2020-267_466
+ No definition line
+ 230
+
+
+ 1
+ gnl|CDD|333815
+ pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain.
+ 333815
+ 111
+
+
+ 1
+ 44.0621
+ 105
+ 5.42419e-08
+ 50
+ 208
+ 1
+ 51
+ 2
+ 0
+ 19
+ 32
+ 2
+ 53
+ VLVVDDHDLVRMGIVRMLSDSPDIDMIGEATDGETAIIKTKQLNPDVVLLDVR
+ VLIVDDDPLIRELLRQLL-EKEGYV-VAEADDGKEALELLKEERPDLILLDIN
+ VL+VDD L+R + ++L + + EA DG+ A+ K+ PD++LLD+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 451
+ ds2020-267_1208
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 452
+ ds2020-267_327
+ No definition line
+ 249
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 453
+ ds2020-267_691
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 454
+ ds2020-267_775
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 455
+ ds2020-267_975
+ No definition line
+ 122
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 456
+ ds2020-267_1222
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 457
+ ds2020-267_483
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 458
+ ds2020-267_1159
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 459
+ ds2020-267_1048
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 460
+ ds2020-267_568
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 461
+ ds2020-267_12
+ No definition line
+ 1539
+
+
+
+
+ 17919
+ 3004588
+ 90
+ 588764394
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 462
+ ds2020-267_950
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.049250052
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 463
+ ds2020-267_861
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 464
+ ds2020-267_118
+ No definition line
+ 343
+
+
+ 1
+ gnl|CDD|366090
+ pfam00421, PSII, Photosystem II protein.
+ 366090
+ 499
+
+
+ 1
+ 138.798
+ 350
+ 7.68219e-41
+ 92
+ 337
+ 323
+ 404
+ -1
+ 0
+ 59
+ 64
+ 0
+ 82
+ LTVRGSMDNGDGIAVGWLGHPIFRDKEGRELFVRRMPTFFETFPVVLVDGDGIVRADVPFRRAESKYSVEQVGVTVEFYGGA
+ LFRVGPMDNGDGLMRSWLGHIIFGDETGRFLDVRRMPNFFETFPVVLVDKDGIVRADIPFRRGESGYSLEQTGVTVQFYGGE
+ L G MDNGDG+ WLGH IF D+ GR L VRRMP FFETFPVVLVD DGIVRAD+PFRR ES YS+EQ GVTV+FYGG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 71
+ 74490577
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 465
+ ds2020-267_703
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 466
+ ds2020-267_304
+ No definition line
+ 253
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 1
+ ds2020-267_962
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.06567078
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 2
+ ds2020-267_848
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 3
+ ds2020-267_643
+ No definition line
+ 216
+
+
+ 1
+ gnl|CDD|365856
+ pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses.
+ 365856
+ 184
+
+
+ 1
+ 33.8002
+ 78
+ 0.000675747
+ 76
+ 204
+ 41
+ 72
+ 1
+ 0
+ 12
+ 17
+ 11
+ 43
+ SHFRSGRGRHSALRRIKEEWGTSRWFLEFDIRKCFHTINRSSL
+ PGFRPGRSLKKA-----------KWFLKLDLKKAFDQVPLDEL
+ FR GR A +WFL+ D++K F + L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 4
+ ds2020-267_1196
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 5
+ ds2020-267_18
+ No definition line
+ 1037
+
+
+
+
+ 17919
+ 3004588
+ 87
+ 372973830
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 6
+ ds2020-267_623
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 7
+ ds2020-267_853
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 8
+ ds2020-267_626
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 9
+ ds2020-267_5
+ No definition line
+ 2029
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 41.5733
+ 98
+ 0.000288253
+ 840
+ 1661
+ 166
+ 417
+ 3
+ 0
+ 50
+ 85
+ 50
+ 288
+ KDDPNKMRTIWGCSKPWIIADTMLWWEYVAYAKLQPGATPMLWSYETFTGGWLRLNHALFSSYIRHSYITLDWKRFDKKAYFCIIDKIFDGVETFLDFDNGYLPTKD--YPDTKSTWTQERSTRLKRLFDWTKENFYHAPIVLPNGHMYVRKFAGIPSGLFITQLIDSWYN-YTMLATILSAMGF----DPRSCIIKVQGDDSIIRLSALIPPDAHDSFLTKVQELADYYFQSVVSVNKSE---VRNELNGCEVLSYR-HRHGLPYRDEL---AMLAQLYHTKARNPS
+ KVQAGKTRLFWGCPVEVNLVARAVFGPFCNKIYSNALKLGIAVGINPFSRDWERL-GALIRKG--SDVLDVDYSAFDSTLSPFVFDLVEDIRSEFCGG----LEPTRLALLELLSN-----------------------PIHILGG-TIIKVEGGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVNPDVDSVGDRLS----EHLKDLG-LTPTRADKTSEFSPIKPLEEVSFLKRTFSRTEGGVRPRLDRKSIERQLAWARAGNTS
+ K K R WGC + ++ + + F+ W RL AL + +D+ FD + D + D F L + S PI + G ++ G+PSG T +I+S N +L ++ G D + GDD+++ ++ + + L D + +K+ L L R R L ++ QL +A N S
+
+
+
+
+
+
+ 17919
+ 3004588
+ 92
+ 791927360
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 10
+ ds2020-267_501
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 11
+ ds2020-267_938
+ No definition line
+ 128
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 12
+ ds2020-267_177
+ No definition line
+ 290
+
+
+
+
+ 17919
+ 3004588
+ 58
+ 74680868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 13
+ ds2020-267_408
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 14
+ ds2020-267_416
+ No definition line
+ 237
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 15
+ ds2020-267_1225
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 16
+ ds2020-267_842
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 17
+ ds2020-267_796
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 18
+ ds2020-267_761
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 19
+ ds2020-267_628
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 20
+ ds2020-267_1192
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 21
+ ds2020-267_590
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 22
+ ds2020-267_506
+ No definition line
+ 226
+
+
+ 1
+ gnl|CDD|377479
+ pfam05173, DapB_C, Dihydrodipicolinate reductase, C-terminus. Dihydrodipicolinate reductase (DapB) reduces the alpha,beta-unsaturated cyclic imine, dihydro-dipicolinate. This reaction is the second committed step in the biosynthesis of L-lysine and its precursor meso-diaminopimelate, which are critical for both protein and cell wall biosynthesis. The C-terminal domain of DapB has been proposed to be the substrate- binding domain.
+ 377479
+ 132
+
+
+ 1
+ 68.2474
+ 168
+ 2.45773e-17
+ 93
+ 215
+ 15
+ 55
+ -3
+ 0
+ 25
+ 28
+ 0
+ 41
+ LYTGYDIEIIEAHHKHKADAPSGTALKMGEVIDEARGTFKP
+ LGDAYDVEIIEKHHNQKKDAPSGTALKLAEAIAEARGEYNA
+ L YD+EIIE HH K DAPSGTALK+ E I EARG +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 23
+ ds2020-267_297
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 24
+ ds2020-267_838
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 25
+ ds2020-267_965
+ No definition line
+ 124
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 26
+ ds2020-267_228
+ No definition line
+ 271
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 73330632
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 27
+ ds2020-267_1021
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 28
+ ds2020-267_1150
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 29
+ ds2020-267_1202
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 30
+ ds2020-267_1127
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 31
+ ds2020-267_57
+ No definition line
+ 477
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 127118960
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 32
+ ds2020-267_665
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 33
+ ds2020-267_846
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 34
+ ds2020-267_442
+ No definition line
+ 233
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 35
+ ds2020-267_142
+ No definition line
+ 318
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 75433973
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 36
+ ds2020-267_901
+ No definition line
+ 142
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 37
+ ds2020-267_1174
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 38
+ ds2020-267_584
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 39
+ ds2020-267_315
+ No definition line
+ 251
+
+
+ 1
+ gnl|CDD|366402
+ pfam00989, PAS, PAS fold. The PAS fold corresponds to the structural domain that has previously been defined as PAS and PAC motifs. The PAS fold appears in archaea, eubacteria and eukarya.
+ 366402
+ 112
+
+
+ 1
+ 37.783
+ 88
+ 1.61999e-05
+ 32
+ 241
+ 1
+ 72
+ 2
+ 0
+ 19
+ 34
+ 2
+ 72
+ KHYRQLVNHASEGIIVV-QNQKIVFANPQIYKLTARQPDSLLAFNFTDLIDEADRLIVQD-YEQRCLQGERC
+ EDLRAILESLPDGIFVVDEDGRILYVNAAAEELLGLSREEVIGKSLLDLIPEDDRAEVVELLRQALRQGEES
+ + R ++ +GI VV ++ +I++ N +L + ++ + DLI E DR V + Q QGE
+
+
+
+
+ 2
+ gnl|CDD|379059
+ pfam13188, PAS_8, PAS domain.
+ 379059
+ 65
+
+
+ 1
+ 33.6888
+ 77
+ 0.000292007
+ 32
+ 199
+ 1
+ 58
+ 2
+ 0
+ 15
+ 26
+ 2
+ 58
+ KHYRQLVNHASEGIIVV-QNQKIVFANPQIYKLT-ARQPDSLLAFNFTDLIDEADRLI
+ ERLRALFESSPDGILVLDDGGRIIYANPAALELLGYELLGELLGELLPDLDPLLEDLL
+ + R L + +GI+V+ +I++ANP +L LL DL + L+
+
+
+
+
+ 3
+ gnl|CDD|379177
+ pfam13426, PAS_9, PAS domain.
+ 379177
+ 102
+
+
+ 1
+ 33.9742
+ 78
+ 0.000472059
+ 62
+ 193
+ 1
+ 45
+ 2
+ 0
+ 12
+ 24
+ 1
+ 45
+ SEGIIVV-QNQKIVFANPQIYKLTARQPDSLLAFNFTDLIDEADR
+ PDGILITDEDGRIIYVNPAALRLLGYTREELLGKSITDLFTEPEA
+ +GI++ ++ +I++ NP +L + LL + TDL E +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 40
+ ds2020-267_227
+ No definition line
+ 272
+
+
+ 1
+ gnl|CDD|334294
+ pfam00873, ACR_tran, AcrB/AcrD/AcrF family. Members of this family are integral membrane proteins. Some are involved in drug resistance. AcrB cooperates with a membrane fusion protein, AcrA, and an outer membrane channel TolC. The structure shows the AcrB forms a homotrimer.
+ 334294
+ 1010
+
+
+ 1
+ 67.321
+ 165
+ 2.32215e-15
+ 36
+ 245
+ 179
+ 248
+ -1
+ 0
+ 18
+ 40
+ 0
+ 70
+ GRQRQIRVLLNPTQMNAYKVSVNQISNALRPQNVELPVGTITNQNQEMVIQVNGLVKTPNEFNQISVAQN
+ GSQYAMRIWLDPQKLASYGLTLTDVVSALKAQNVNIGAGQLEGQGLQALIRAQGRLQSAEDFEKIIVKNQ
+ G Q +R+ L+P ++ +Y +++ + +AL+ QNV + G + Q + +I+ G +++ +F +I V
+
+
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 73330632
+ 0.05830098
+ 0.267
+ 0.14
+
+
+
+
+ 41
+ ds2020-267_458
+ No definition line
+ 231
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 42
+ ds2020-267_170
+ No definition line
+ 295
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 73319024
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 72
+ ds2020-267_639
+ No definition line
+ 216
+
+
+ 1
+ gnl|CDD|379304
+ pfam13631, Cytochrom_B_N_2, Cytochrome b(N-terminal)/b6/petB.
+ 379304
+ 169
+
+
+ 1
+ 42.2222
+ 100
+ 4.98182e-07
+ 2
+ 214
+ 81
+ 152
+ 2
+ 0
+ 23
+ 35
+ 1
+ 72
+ GGYSVDSPTLTRFFTFHF-ILPFIIAALAALHLLFLHETGSNNPLGITSHSDKITFHPYYTIKDALGLLLFL
+ GGDFPGTATLPRFYALHVLLLPGLILALIVAHLLLVEKHGQFPPPGTEKNVVGVPFWPVFAVKMLLFFLVTV
+ GG + TL RF+ H +LP +I AL HLL + + G P G + + F P + +K L L+ +
+
+
+
+
+ 2
+ gnl|CDD|306530
+ pfam00033, Cytochrome_B, Cytochrome b/b6/petB.
+ 306530
+ 189
+
+
+ 1
+ 37.3615
+ 87
+ 3.68894e-05
+ 2
+ 118
+ 151
+ 189
+ 2
+ 0
+ 28
+ 32
+ 0
+ 39
+ GGYSVDSPTLTRFFTFHFILPFIIAALAALHLLFLHETG
+ GSFSVDQATLTRFFSLHFLLPFILAILMLLHLLFLHETG
+ G +SVD TLTRFF+ HF+LPFI+A L LHLLFLHETG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 73
+ ds2020-267_72
+ No definition line
+ 438
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 109269608
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 74
+ ds2020-267_865
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 99
+ ds2020-267_927
+ No definition line
+ 130
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 100
+ ds2020-267_116
+ No definition line
+ 345
+
+
+
+
+ 17919
+ 3004588
+ 72
+ 73720060
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 101
+ ds2020-267_407
+ No definition line
+ 239
+
+
+ 1
+ gnl|CDD|365924
+ pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes.
+ 365924
+ 143
+
+
+ 1
+ 41.2271
+ 98
+ 1.14399e-06
+ 28
+ 126
+ 111
+ 143
+ 1
+ 0
+ 15
+ 20
+ 0
+ 33
+ EKCLFAEILDAYRKRGIARKKRENLHRLASTNR
+ AERLANELIDAANGRGAAVKKKEETHRMAEANR
+ + L E++DA RG A KK+E HR+A NR
+
+
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 102
+ ds2020-267_687
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 103
+ ds2020-267_457
+ No definition line
+ 231
+
+
+ 1
+ gnl|CDD|366121
+ pfam00481, PP2C, Protein phosphatase 2C. Protein phosphatase 2C is a Mn++ or Mg++ dependent protein serine/threonine phosphatase.
+ 366121
+ 253
+
+
+ 1
+ 34.6201
+ 80
+ 0.000499491
+ 10
+ 111
+ 34
+ 67
+ 1
+ 0
+ 12
+ 18
+ 0
+ 34
+ RKAFGVYDGHGGAEVARACRDRMHELVAEAVELE
+ WSFFAVFDGHGGSEAAKYCGKHLHTILALRRSFL
+ F V+DGHGG+E A+ C +H ++A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 104
+ ds2020-267_601
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 105
+ ds2020-267_402
+ No definition line
+ 239
+
+
+ 1
+ gnl|CDD|368759
+ pfam06122, TraH, Conjugative relaxosome accessory transposon protein. The TraH protein is thought to be a relaxosome accessory component, also necessary for transfer but not for H-pilus synthesis within the conjugative transposon.
+ 368759
+ 357
+
+
+ 1
+ 33.8542
+ 78
+ 0.000851192
+ 65
+ 235
+ 191
+ 244
+ 2
+ 0
+ 16
+ 21
+ 7
+ 59
+ GNVTWQALSKVAGLREVDKRR--FMGLLGKVVFGENGKITPYFTSNDKVIEEVDPSCGR
+ GNLVWKALKKNGFFAGDTELAELLMSLVGTVIIGANAA-----DGGGKVDVRVIPPLAT
+ GN+ W+AL K + M L+G V+ G N KV V P
+
+
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 106
+ ds2020-267_1083
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 107
+ ds2020-267_914
+ No definition line
+ 134
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 76100752
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 108
+ ds2020-267_566
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 109
+ ds2020-267_518
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 110
+ ds2020-267_694
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 111
+ ds2020-267_369
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|378818
+ pfam12137, RapA_C, RNA polymerase recycling family C-terminal. This domain is found in bacteria. This domain is about 360 amino acids in length. This domain is found associated with pfam00271, pfam00176. The function of this domain is not known, but structurally it forms an alpha-beta fold in nature with a central beta-sheet flanked by helices and loops, the beta-sheet being mainly antiparallel and flanked by four alpha helices, among which the two longer helices exhibit a coiled-coil arrangement.
+ 378818
+ 360
+
+
+ 1
+ 37.1168
+ 87
+ 6.51052e-05
+ 137
+ 217
+ 135
+ 162
+ -3
+ 0
+ 14
+ 19
+ 1
+ 28
+ LHPSDEVQVQGL-AVPEDGMTLTFERDQ
+ LRPSDHMLVPDFPGLPEDGMTVTFDRET
+ L PSD + V +PEDGMT+TF+R+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 112
+ ds2020-267_735
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 113
+ ds2020-267_32
+ No definition line
+ 701
+
+
+
+
+ 17919
+ 3004588
+ 84
+ 223409408
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 114
+ ds2020-267_239
+ No definition line
+ 266
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 115
+ ds2020-267_795
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 116
+ ds2020-267_750
+ No definition line
+ 211
+
+
+ 1
+ gnl|CDD|376774
+ pfam02391, MoaE, MoaE protein. This family contains the MoaE protein that is involved in biosynthesis of molybdopterin. Molybdopterin, the universal component of the pterin molybdenum cofactors, contains a dithiolene group serving to bind Mo. Addition of the dithiolene sulfurs to a molybdopterin precursor requires the activity of the converting factor. Converting factor contains the MoaE and MoaD proteins.
+ 376774
+ 112
+
+
+ 1
+ 37.815
+ 89
+ 1.24642e-05
+ 28
+ 114
+ 61
+ 89
+ -2
+ 0
+ 8
+ 17
+ 0
+ 29
+ AKGQFDIENAIAIHRIGDLAIGEMAVWIG
+ ARERWPLLDVAIVHRVGRLPVGEAIVLVA
+ A+ ++ + + +HR+G L +GE V +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 117
+ ds2020-267_919
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 118
+ ds2020-267_148
+ No definition line
+ 313
+
+
+
+
+ 17919
+ 3004588
+ 64
+ 74310880
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 119
+ ds2020-267_581
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 120
+ ds2020-267_1157
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 121
+ ds2020-267_452
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 122
+ ds2020-267_1100
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 123
+ ds2020-267_816
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 124
+ ds2020-267_428
+ No definition line
+ 235
+
+
+ 1
+ gnl|CDD|333891
+ pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes.
+ 333891
+ 113
+
+
+ 1
+ 86.7373
+ 215
+ 1.04166e-24
+ 3
+ 182
+ 32
+ 100
+ 3
+ 0
+ 37
+ 45
+ 9
+ 69
+ KKPNSALRKMAKVRLS-NQHDTFAYIPGEG--HNLQEHSMVLIRGGR----VKDLPGVKFHCIR--GVK
+ KQPNSALRKCVRVRLIKNGKEVTAFIPGDGAIHFLQEHDEVLIRGGGGPHAVGDLPGVRYKVVRVAGVS
+ K+PNSALRK +VRL N + A+IPG+G H LQEH VLIRGG V DLPGV++ +R GV
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 125
+ ds2020-267_1199
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 126
+ ds2020-267_684
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 127
+ ds2020-267_1231
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 128
+ ds2020-267_199
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 129
+ ds2020-267_430
+ No definition line
+ 235
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 130
+ ds2020-267_997
+ No definition line
+ 109
+
+
+
+
+ 17919
+ 3004588
+ 10
+ 73460348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 131
+ ds2020-267_203
+ No definition line
+ 281
+
+
+ 1
+ gnl|CDD|367312
+ pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally.
+ 367312
+ 228
+
+
+ 1
+ 84.8795
+ 211
+ 1.76794e-22
+ 121
+ 231
+ 192
+ 228
+ -3
+ 0
+ 26
+ 32
+ 0
+ 37
+ LVSTFPVILDTIFKYWIFRYLNRVSPSLVVIYHSMND
+ FIATFPVILDTVFKYWIFRYLNRISPSAVATYRNMNE
+ ++TFPVILDT+FKYWIFRYLNR+SPS V Y +MN+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 132
+ ds2020-267_887
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 173
+ ds2020-267_1217
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 174
+ ds2020-267_536
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 175
+ ds2020-267_1177
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 176
+ ds2020-267_33
+ No definition line
+ 680
+
+
+ 1
+ gnl|CDD|367847
+ pfam04157, EAP30, EAP30/Vps36 family. This family includes EAP30 as well as the Vps36 protein. Vps36 is involved in Golgi to endosome trafficking. EAP30 is a subunit of the ELL complex. The ELL is an 80-kDa RNA polymerase II transcription factor. ELL interacts with three other proteins to form the complex known as ELL complex. The ELL complex is capable of increasing that catalytic rate of transcription elongation, but is unable to repress initiation of transcription by RNA polymerase II as is the case of ELL. EAP30 is thought to lead to the derepression of ELL's transcriptional inhibitory activity.
+ 367847
+ 216
+
+
+ 1
+ 63.8066
+ 156
+ 4.86455e-13
+ 342
+ 494
+ 1
+ 51
+ -1
+ 0
+ 21
+ 35
+ 0
+ 51
+ VGVSGILRKEQEMWESTDKSLQDAFQDLNALMSKAKEMVMLAEKMRQKLLS
+ VGIAAIERRQEQQREQYDELLSSAFEDLEALMSKFKELVEFAKKHKKEIKK
+ VG++ I R++++ E D+ L AF+DL ALMSK KE+V A+K ++++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 83
+ 216975473
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 197
+ ds2020-267_885
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 198
+ ds2020-267_6
+ No definition line
+ 1860
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 83.6639
+ 207
+ 1.35634e-17
+ 1147
+ 1764
+ 288
+ 464
+ -1
+ 0
+ 49
+ 81
+ 31
+ 207
+ RRVMEMSTQGVVACIDARNFNILHTQEVMASILESASVMLGSRLSEEQHKCLKWLSKAELNQKVLVKKGEVTEELLSAGRQEGWINQMMKGDGTMVEAATVTVGMFSGTRFTMLYNTILNRAYYKVAEELAGIKTLSLHSGDDVYSAFASYIDVYKMKKAMAFIGYTLQLAK-CFLQGVREFLRISHKNANTSQYLARSAATAIHGR
+ WSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFER----LRRRLPDEPAEAADWLVCS--------------------------MDSMYQLSDGTLLAQRVPGTLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ V + GV +D +FN H+ E M ++ E L RL +E + WL + ++ M + + A V + SG R T N++LN AY ++A S+H GDDV + D + A +G+ + +K + EFLR++ + YLAR+ A+ + G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 92
+ 715989120
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 199
+ ds2020-267_1246
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 200
+ ds2020-267_555
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|365890
+ pfam00124, Photo_RC, Photosynthetic reaction centre protein.
+ 365890
+ 260
+
+
+ 1
+ 44.9254
+ 107
+ 7.71427e-08
+ 48
+ 203
+ 20
+ 63
+ 3
+ 0
+ 17
+ 25
+ 8
+ 52
+ VFIIAFIAAPPVDIDGIREPVSGSLLYGNNIISGAMLPTSAAIGFHV*PISE
+ IIGIGFVAAPSVDW--------NPLLFGRNLWTLAIEPPSPSYGLSFAPLWE
+ + I F+AAP VD LL+G N+ + A+ P S + G P+ E
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 201
+ ds2020-267_525
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 202
+ ds2020-267_587
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 203
+ ds2020-267_1220
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 204
+ ds2020-267_87
+ No definition line
+ 403
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 92615025
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 205
+ ds2020-267_1176
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 206
+ ds2020-267_834
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 207
+ ds2020-267_909
+ No definition line
+ 139
+
+
+
+
+ 17919
+ 3004588
+ 18
+ 75097288
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 208
+ ds2020-267_911
+ No definition line
+ 138
+
+
+
+
+ 17919
+ 3004588
+ 18
+ 75097288
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 209
+ ds2020-267_594
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 210
+ ds2020-267_195
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 211
+ ds2020-267_640
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 212
+ ds2020-267_583
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 213
+ ds2020-267_1013
+ No definition line
+ 91
+
+
+
+
+ 17919
+ 3004588
+ 4
+ 76255712
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 214
+ ds2020-267_1250
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 215
+ ds2020-267_530
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 216
+ ds2020-267_751
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 217
+ ds2020-267_550
+ No definition line
+ 223
+
+
+ 1
+ gnl|CDD|377548
+ pfam05694, SBP56, 56kDa selenium binding protein (SBP56). This family consists of several eukaryotic selenium binding proteins as well as three sequences from archaea. The exact function of this protein is unknown although it is thought that SBP56 participates in late stages of intra-Golgi protein transport. The Lotus japonicus homolog of SBP56, LjSBP is thought to have more than one physiological role and can be implicated in controlling the oxidation/reduction status of target proteins, in vesicular Golgi transport.
+ 377548
+ 454
+
+
+ 1
+ 33.4244
+ 77
+ 0.00097637
+ 43
+ 216
+ 128
+ 182
+ -2
+ 0
+ 21
+ 27
+ 3
+ 58
+ GAARPQTHACGPCGRLRQYHLGRADQPRIADVLLLDSGSKDVRA*LQRWDKARSPTQL
+ GYSRPHTVHCLPDGEIYISALGDADGNGPGGFLLLDHETFEVKG---RWEKDRGPQLF
+ G +RP T C P G + LG AD LLLD + +V+ RW+K R P
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 218
+ ds2020-267_958
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 219
+ ds2020-267_554
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 220
+ ds2020-267_474
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 221
+ ds2020-267_127
+ No definition line
+ 334
+
+
+
+
+ 17919
+ 3004588
+ 69
+ 74263434
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 222
+ ds2020-267_65
+ No definition line
+ 462
+
+
+ 1
+ gnl|CDD|372592
+ pfam13406, SLT_2, Transglycosylase SLT domain. This family is related to the SLT domain pfam01464.
+ 372592
+ 292
+
+
+ 1
+ 100.321
+ 251
+ 4.82338e-27
+ 145
+ 360
+ 50
+ 121
+ -1
+ 0
+ 32
+ 50
+ 0
+ 72
+ PWEYIDGAASSSRVSGGQRNFASQSALLDRIENQYGVPASIVTAIWGMESSYGQGTGNSSLDNSLATLAYDG
+ WWDYLARFVTPARIARGRAFLQEHAALLARIEKRYGVPPEIIVAIWGVETNYGRYTGNFPVLDALATLAFDG
+ W+Y+ + +R++ G+ +ALL RIE +YGVP I+ AIWG+E++YG+ TGN + ++LATLA+DG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 119174025
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 223
+ ds2020-267_1168
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 224
+ ds2020-267_330
+ No definition line
+ 249
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 225
+ ds2020-267_678
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 226
+ ds2020-267_83
+ No definition line
+ 414
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 96414360
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 227
+ ds2020-267_985
+ No definition line
+ 117
+
+
+
+
+ 17919
+ 3004588
+ 12
+ 75318120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 228
+ ds2020-267_1067
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.07531314
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 229
+ ds2020-267_833
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 230
+ ds2020-267_432
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 231
+ ds2020-267_726
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 232
+ ds2020-267_734
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 233
+ ds2020-267_588
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 234
+ ds2020-267_924
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 235
+ ds2020-267_843
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 236
+ ds2020-267_672
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 237
+ ds2020-267_132
+ No definition line
+ 328
+
+
+
+
+ 17919
+ 3004588
+ 67
+ 75768630
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 238
+ ds2020-267_1029
+ No definition line
+ 77
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 239
+ ds2020-267_39
+ No definition line
+ 603
+
+
+
+
+ 17919
+ 3004588
+ 82
+ 182692370
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 240
+ ds2020-267_729
+ No definition line
+ 212
+
+
+ 1
+ gnl|CDD|279713
+ pfam01405, PsbT, Photosystem II reaction centre T protein. The exact function of this protein is unknown. It probably consists of a single transmembrane spanning helix. The Chlamydomonas reinhardtii psbT protein appears to be (i) a novel photosystem II subunit and (ii) required for maintaining optimal photosystem II activity under adverse growth conditions.
+ 279713
+ 29
+
+
+ 1
+ 34.2227
+ 79
+ 5.43744e-05
+ 19
+ 99
+ 1
+ 27
+ -3
+ 0
+ 22
+ 23
+ 0
+ 27
+ MEALVYTFLLVSTLGIIFFAIFFREPP
+ MEALVYTLLLALTLGTLFFAIFFREPP
+ MEALVYT LL TLG +FFAIFFREPP
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 241
+ ds2020-267_977
+ No definition line
+ 121
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 242
+ ds2020-267_19
+ No definition line
+ 1000
+
+
+
+
+ 17919
+ 3004588
+ 87
+ 355626210
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 243
+ ds2020-267_519
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 244
+ ds2020-267_532
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 245
+ ds2020-267_644
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 246
+ ds2020-267_496
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 247
+ ds2020-267_345
+ No definition line
+ 246
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 248
+ ds2020-267_213
+ No definition line
+ 276
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 249
+ ds2020-267_387
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 250
+ ds2020-267_404
+ No definition line
+ 239
+
+
+ 1
+ gnl|CDD|366050
+ pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla.
+ 366050
+ 291
+
+
+ 1
+ 37.675
+ 88
+ 3.50341e-05
+ 70
+ 219
+ 53
+ 98
+ 1
+ 0
+ 18
+ 24
+ 4
+ 50
+ CSMIYGSTGATHFDQLAKILTGYEITGARSSGIFMGILSIAVGFLFKITA
+ IFLMYNYTGTLSFTELSKALDF----GLNSWGLLLLFLLILVGFLFKSAQ
+ ++Y TG F +L+K L G S G+ + L I VGFLFK
+
+
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 251
+ ds2020-267_1229
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 252
+ ds2020-267_873
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 253
+ ds2020-267_850
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 254
+ ds2020-267_389
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 255
+ ds2020-267_961
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 256
+ ds2020-267_827
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 257
+ ds2020-267_485
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 258
+ ds2020-267_312
+ No definition line
+ 252
+
+
+ 1
+ gnl|CDD|278982
+ pfam00585, Thr_dehydrat_C, C-terminal regulatory domain of Threonine dehydratase. Threonine dehydratases pfam00291 all contain a carboxy terminal region. This region may have a regulatory role. Some members contain two copies of this region. This family is homologous to the pfam01842 domain.
+ 278982
+ 91
+
+
+ 1
+ 37.6361
+ 88
+ 1.52007e-05
+ 29
+ 166
+ 17
+ 62
+ 2
+ 0
+ 18
+ 24
+ 2
+ 47
+ IPERTGAFLDFCRSLKGRN-ITVFNYRINTNPKYDGQCVALSVSKEQ
+ FPEQPGALLTFLDLLGGRNNITLFEYR-KHGDKNGCVLVGVELSQAE
+ PE+ GA L F L GRN IT+F YR K V + +S+ +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 259
+ ds2020-267_1134
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 260
+ ds2020-267_121
+ No definition line
+ 339
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 75261094
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 261
+ ds2020-267_81
+ No definition line
+ 415
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 96414360
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 262
+ ds2020-267_176
+ No definition line
+ 291
+
+
+ 1
+ gnl|CDD|376500
+ pfam01235, Na_Ala_symp, Sodium:alanine symporter family.
+ 376500
+ 389
+
+
+ 1
+ 106.748
+ 268
+ 1.13408e-29
+ 115
+ 243
+ 5
+ 47
+ 1
+ 0
+ 34
+ 38
+ 0
+ 43
+ GVSSFQALAMSLAGRVGTGNIAGVATAITFGGPGALFWMWMVA
+ GISSFQALCTSLAARVGTGNIAGVATAIALGGPGAVFWMWVIA
+ G+SSFQAL SLA RVGTGNIAGVATAI GGPGA+FWMW++A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 59
+ 73999946
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 263
+ ds2020-267_244
+ No definition line
+ 265
+
+
+
+
+ 17919
+ 3004588
+ 52
+ 74620800
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 264
+ ds2020-267_740
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 265
+ ds2020-267_570
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 266
+ ds2020-267_388
+ No definition line
+ 241
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 45.9143
+ 109
+ 6.16383e-08
+ 35
+ 214
+ 369
+ 432
+ -1
+ 0
+ 30
+ 33
+ 8
+ 66
+ TTFINSVLNSIYTDKITKGAR--EVGDSLHNGDDVLIGTHSLKVARESL----RLGRKFNTRIQSA
+ TTFINSVLNCAYA--ELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSV
+ TTFINSVLN Y GA +V S+H GDDVL G + A L RLG K N QS
+
+
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 267
+ ds2020-267_527
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 268
+ ds2020-267_106
+ No definition line
+ 366
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 75566224
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 269
+ ds2020-267_253
+ No definition line
+ 262
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.080313
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 270
+ ds2020-267_759
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 271
+ ds2020-267_669
+ No definition line
+ 215
+
+
+ 1
+ gnl|CDD|380037
+ pfam17862, AAA_lid_3, AAA+ lid domain. This entry represents the alpha helical AAA+ lid domain that is found to the C-terminus of AAA domains.
+ 380037
+ 45
+
+
+ 1
+ 37.5358
+ 88
+ 4.46873e-06
+ 33
+ 122
+ 8
+ 37
+ -1
+ 0
+ 12
+ 20
+ 0
+ 30
+ AGLSEGYTGSDLLELCKKAAYFPIRDLLDE
+ AERTEGFSGADLEALCREAALAALRRGLEA
+ A +EG++G+DL LC++AA +R L+
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 272
+ ds2020-267_1094
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 273
+ ds2020-267_187
+ No definition line
+ 287
+
+
+ 1
+ gnl|CDD|376891
+ pfam02673, BacA, Bacitracin resistance protein BacA. Bacitracin resistance protein (BacA) is a putative undecaprenol kinase. BacA confers resistance to bacitracin, probably by phosphorylation of undecaprenol. More recent studies show that BacA has undecaprenyl pyrophosphate phosphatase activity. Undecaprenyl phosphate is a key lipid intermediate involved in the synthesis of various bacterial cell wall polymers. Bacitracin, a mixture of related cyclic polypeptide antibiotics, is used to treat surface tissue infections. Its primary mode of action is the inhibition of bacterial cell wall synthesis through sequestration of the essential carrier lipid undecaprenyl pyrophosphate, C55-PP, resulting in the loss of cell integrity and lysis. The characteristic phosphatase sequence-motif in this family is likely to be the PGxSRSGG, compared with the PSGH of the PAP family of phosphatases.
+ 376891
+ 259
+
+
+ 1
+ 60.5192
+ 148
+ 3.59766e-13
+ 7
+ 156
+ 10
+ 58
+ 1
+ 0
+ 24
+ 28
+ 1
+ 50
+ LTVFLPISSTGHLILADSLLNFWTKDKADLFIAVIQLGAISAVIYLYWGR
+ LTEFLPVSSSGHLILVPHLLGFSE-DGLAAFDVVIHLGTILAVLVYFRKD
+ LT FLP+SS+GHLIL LL F D F VI LG I AV+ +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 75361790
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 274
+ ds2020-267_852
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 275
+ ds2020-267_1036
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 276
+ ds2020-267_91
+ No definition line
+ 395
+
+
+
+
+ 17919
+ 3004588
+ 77
+ 87740550
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 277
+ ds2020-267_821
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 278
+ ds2020-267_810
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 279
+ ds2020-267_1112
+ No definition line
+ 69
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 280
+ ds2020-267_1146
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 281
+ ds2020-267_641
+ No definition line
+ 216
+
+
+ 1
+ gnl|CDD|366315
+ pfam00804, Syntaxin, Syntaxin. Syntaxins are the prototype family of SNARE proteins. They usually consist of three main regions - a C-terminal transmembrane region, a central SNARE domain which is characteristic of and conserved in all syntaxins (pfam05739), and an N-terminal domain that is featured in this entry. This domain varies between syntaxin isoforms; in syntaxin 1A it is found as three alpha-helices with a left-handed twist. It may fold back on the SNARE domain to allow the molecule to adopt a 'closed' configuration that prevents formation of the core fusion complex - it thus has an auto-inhibitory role. The function of syntaxins is determined by their localization. They are involved in neuronal exocytosis, ER-Golgi transport and Golgi-endosome transport, for example. They also interact with other proteins as well as those involved in SNARE complexes. These include vesicle coat proteins, Rab GTPases, and tethering factors.
+ 366315
+ 200
+
+
+ 1
+ 83.7113
+ 208
+ 9.72957e-23
+ 23
+ 187
+ 80
+ 133
+ -3
+ 0
+ 24
+ 36
+ 1
+ 55
+ GPGSSADRTRTSVVSGLGKKLKDMMDDFQGLRGRMTSEYKETIERRYFTITGEKA
+ GPGSAVDRIRKSQTAALRKKLKEVMFEYNELRERIREECKERIQRQ-LEVTGKEV
+ GPGS+ DR R S + L KKLK++M ++ LR R+ E KE I+R+ +TG++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 282
+ ds2020-267_71
+ No definition line
+ 444
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 109640103
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 283
+ ds2020-267_808
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 284
+ ds2020-267_832
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 285
+ ds2020-267_464
+ No definition line
+ 231
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 286
+ ds2020-267_360
+ No definition line
+ 244
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 287
+ ds2020-267_1248
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 288
+ ds2020-267_1031
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 289
+ ds2020-267_482
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 290
+ ds2020-267_190
+ No definition line
+ 285
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 75361790
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 291
+ ds2020-267_252
+ No definition line
+ 262
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 292
+ ds2020-267_305
+ No definition line
+ 253
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 293
+ ds2020-267_801
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 294
+ ds2020-267_650
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 295
+ ds2020-267_597
+ No definition line
+ 219
+
+
+ 1
+ gnl|CDD|366090
+ pfam00421, PSII, Photosystem II protein.
+ 366090
+ 499
+
+
+ 1
+ 98.737
+ 246
+ 8.10522e-27
+ 22
+ 207
+ 267
+ 324
+ 1
+ 0
+ 42
+ 46
+ 4
+ 62
+ PIELFGPTRYQWDQGYFQPEIYRRIGAGLAENQSLSEAWSKIPEKLAFYDYIGNNPAKGGSF
+ PSELFGPTRYQWDSGYFQQEIDRRVQAG----ASQAQAWTFIPRDLAFYDYIGNAPAKGGLF
+ P ELFGPTRYQWD GYFQ EI RR+ AG S ++AW+ IP LAFYDYIGN PAKGG F
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 296
+ ds2020-267_1254
+ No definition line
+ 57
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 297
+ ds2020-267_1211
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 298
+ ds2020-267_34
+ No definition line
+ 669
+
+
+
+
+ 17919
+ 3004588
+ 83
+ 212423540
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 299
+ ds2020-267_426
+ No definition line
+ 235
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 300
+ ds2020-267_649
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 301
+ ds2020-267_490
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 302
+ ds2020-267_179
+ No definition line
+ 290
+
+
+
+
+ 17919
+ 3004588
+ 58
+ 74680868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 303
+ ds2020-267_522
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 304
+ ds2020-267_147
+ No definition line
+ 313
+
+
+
+
+ 17919
+ 3004588
+ 64
+ 74310880
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 305
+ ds2020-267_502
+ No definition line
+ 226
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 306
+ ds2020-267_1081
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 307
+ ds2020-267_1007
+ No definition line
+ 97
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 308
+ ds2020-267_379
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 309
+ ds2020-267_328
+ No definition line
+ 249
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 310
+ ds2020-267_580
+ No definition line
+ 220
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 311
+ ds2020-267_262
+ No definition line
+ 260
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 312
+ ds2020-267_424
+ No definition line
+ 236
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 313
+ ds2020-267_371
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 314
+ ds2020-267_151
+ No definition line
+ 311
+
+
+
+
+ 17919
+ 3004588
+ 63
+ 75027640
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 315
+ ds2020-267_268
+ No definition line
+ 259
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 83.6639
+ 207
+ 3.22949e-21
+ 18
+ 251
+ 215
+ 291
+ 3
+ 0
+ 32
+ 47
+ 1
+ 78
+ MASEFVETNPLPTWDGTTHVSKSAKLEHGKTRAIFACDTRSYFGFSWILDATQQAWKNERVVMDPGKGGKCGMTQRLR
+ MLFEPQNNNEI-AWWGSVPSKPSMKLEHGKSRAIYACDTRSYLAFEYLLAPVEKAWANKSVILNPGEGDISGFDWSVQ
+ M E N + W G+ S KLEHGK+RAI+ACDTRSY F ++L ++AW N+ V+++PG+G G ++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.059998248
+ 0.267
+ 0.14
+
+
+
+
+ 316
+ ds2020-267_1170
+ No definition line
+ 63
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 317
+ ds2020-267_351
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 354
+ ds2020-267_1080
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 355
+ ds2020-267_418
+ No definition line
+ 237
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 356
+ ds2020-267_719
+ No definition line
+ 213
+
+
+ 1
+ gnl|CDD|333815
+ pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain.
+ 333815
+ 111
+
+
+ 1
+ 56.0033
+ 136
+ 9.1657e-13
+ 45
+ 185
+ 65
+ 111
+ -2
+ 0
+ 19
+ 28
+ 0
+ 47
+ RAAGKHTPVLFLTAKDDLSDRIKGIEIGGDDYLTKPFAFAELIVRIK
+ RRRDPTTPVIILTAHGDEDDAVEALEAGADDFLSKPFDPDELLAALR
+ R TPV+ LTA D D ++ +E G DD+L+KPF EL+ ++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 357
+ ds2020-267_893
+ No definition line
+ 179
+
+
+
+
+ 17919
+ 3004588
+ 29
+ 74548110
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 406
+ ds2020-267_811
+ No definition line
+ 208
+
+
+ 1
+ gnl|CDD|285265
+ pfam07991, IlvN, Acetohydroxy acid isomeroreductase, NADPH-binding domain. Acetohydroxy acid isomeroreductase catalyzes the conversion of acetohydroxy acids into dihydroxy valerates. This reaction is the second in the synthetic pathway of the essential branched side chain amino acids valine and isoleucine. This N-terminal region of the enzyme carries the binding-site for NADPH. The active-site for enzymatic activity lies in the C-terminal part, IlvC, pfam01450.
+ 285265
+ 165
+
+
+ 1
+ 45.9993
+ 110
+ 1.80927e-08
+ 20
+ 190
+ 79
+ 132
+ -1
+ 0
+ 20
+ 32
+ 3
+ 57
+ EKVFSHMKPNSILGLSHGFLLGHLQSVGLDFPKNISVIAVCPKGMGPSVRRLYVQGK
+ EEIAPNLKEGAALAFAHGF---NIHFGQIKPPKDVDVIMVAPKGPGHLVRREYEEGG
+ E++ ++K + L +HGF ++ + PK++ VI V PKG G VRR Y +G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 407
+ ds2020-267_917
+ No definition line
+ 133
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 76100752
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 408
+ ds2020-267_515
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 409
+ ds2020-267_1064
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 410
+ ds2020-267_776
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 411
+ ds2020-267_1110
+ No definition line
+ 70
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 412
+ ds2020-267_421
+ No definition line
+ 236
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 413
+ ds2020-267_1088
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 414
+ ds2020-267_279
+ No definition line
+ 258
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 415
+ ds2020-267_676
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 416
+ ds2020-267_381
+ No definition line
+ 242
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 417
+ ds2020-267_983
+ No definition line
+ 117
+
+
+
+
+ 17919
+ 3004588
+ 12
+ 75318120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 418
+ ds2020-267_1123
+ No definition line
+ 67
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 419
+ ds2020-267_462
+ No definition line
+ 231
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 420
+ ds2020-267_952
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 421
+ ds2020-267_907
+ No definition line
+ 141
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 422
+ ds2020-267_716
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 423
+ ds2020-267_487
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 424
+ ds2020-267_157
+ No definition line
+ 307
+
+
+
+
+ 17919
+ 3004588
+ 62
+ 75744400
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 425
+ ds2020-267_54
+ No definition line
+ 486
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 128827576
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 426
+ ds2020-267_642
+ No definition line
+ 216
+
+
+ 1
+ gnl|CDD|367225
+ pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella.
+ 367225
+ 69
+
+
+ 1
+ 32.8867
+ 76
+ 0.000376273
+ 2
+ 121
+ 27
+ 66
+ -3
+ 0
+ 16
+ 20
+ 0
+ 40
+ VVLVEFEEGTIGIALNLESNNVGVVLMGDGLMIQEGSSVK
+ VELVEFGTGVLGEVLNLGEDKVRVQVFGGTSGLSRGDEVK
+ V LVEF G +G LNL + V V + G + G VK
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 427
+ ds2020-267_849
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 428
+ ds2020-267_334
+ No definition line
+ 248
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 429
+ ds2020-267_936
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 430
+ ds2020-267_178
+ No definition line
+ 290
+
+
+
+
+ 17919
+ 3004588
+ 58
+ 74680868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 431
+ ds2020-267_629
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 432
+ ds2020-267_700
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 433
+ ds2020-267_216
+ No definition line
+ 275
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 434
+ ds2020-267_778
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 435
+ ds2020-267_633
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 436
+ ds2020-267_255
+ No definition line
+ 261
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 437
+ ds2020-267_79
+ No definition line
+ 421
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 99628172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 438
+ ds2020-267_538
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 439
+ ds2020-267_990
+ No definition line
+ 115
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 440
+ ds2020-267_504
+ No definition line
+ 226
+
+
+ 1
+ gnl|CDD|307628
+ pfam01578, Cytochrom_C_asm, Cytochrome C assembly protein. This family consists of various proteins involved in cytochrome c assembly from mitochondria and bacteria; CycK from Rhizobium, CcmC from E. coli and Paracoccus denitrificans and orf240 from wheat mitochondria. The members of this family are probably integral membrane proteins with six predicted transmembrane helices. It has been proposed that members of this family comprise a membrane component of an ABC (ATP binding cassette) transporter complex. It is also proposed that this transporter is necessary for transport of some component needed for cytochrome c assembly. One member CycK contains a putative heme-binding motif, orf240 also contains a putative heme-binding motif and is a proposed ABC transporter with c-type heme as its proposed substrate. However it seems unlikely that all members of this family transport heme nor c-type apocytochromes because CcmC in the putative CcmABC transporter transports neither. CcmF forms a working module with CcmH and CcmI, CcmFHI, and itself is unlikely to bind haem directly.
+ 307628
+ 211
+
+
+ 1
+ 36.1828
+ 84
+ 0.000112784
+ 28
+ 135
+ 63
+ 98
+ -2
+ 0
+ 10
+ 18
+ 0
+ 36
+ LPPLLQDPGLIFHPPMLYMGFVGAVVPFAFAMAALW
+ LNPGLQSPILMLHVPLALLSYATLIIAALLSIALLL
+ L P LQ P L+ H P+ + + ++ ++A L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 441
+ ds2020-267_441
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 442
+ ds2020-267_258
+ No definition line
+ 261
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 443
+ ds2020-267_500
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 444
+ ds2020-267_963
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.076703376
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 445
+ ds2020-267_399
+ No definition line
+ 239
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 446
+ ds2020-267_701
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 447
+ ds2020-267_204
+ No definition line
+ 279
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 448
+ ds2020-267_271
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 449
+ ds2020-267_1108
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 450
+ ds2020-267_625
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 451
+ ds2020-267_274
+ No definition line
+ 258
+
+
+ 1
+ gnl|CDD|367619
+ pfam03713, DUF305, Domain of unknown function (DUF305). Domain found in small family of bacterial secreted proteins with no known function. Also found in Paramecium bursaria chlorella virus 1. This domain is short and found in one or two copies. The domain has a conserved HH motif that may be functionally important. This domain belongs to the ferritin superfamily. It contains two sequence similar repeats each of which is composed of two alpha helices.
+ 367619
+ 151
+
+
+ 1
+ 48.8384
+ 117
+ 2.00811e-09
+ 24
+ 185
+ 98
+ 151
+ -2
+ 0
+ 18
+ 29
+ 0
+ 54
+ PDMIFVNTMLSHFDEIIALANIEQRYGKNPELLDLAQDIISSRQNESQILQNWL
+ FDRLFLELMIPHHQGAVEMARDALDRGTNPEVRALAQDIITAQQAEIAQMRQLL
+ D +F+ M+ H + +A G NPE+ LAQDII+++Q E ++ L
+
+
+ 2
+ 46.9124
+ 112
+ 9.45376e-09
+ 24
+ 173
+ 4
+ 53
+ -2
+ 0
+ 16
+ 29
+ 0
+ 50
+ FVNTMLSHFDEIIALANIEQRYGKNPELLDLAQDIISSRQNESQILQNWL
+ FAQDMIPHHQQAVEMAELALERAQDPEVRALAQDIIAAQQPEIGQMRGWL
+ F M+ H + + +A + ++PE+ LAQDII+++Q E ++ WL
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 452
+ ds2020-267_688
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 453
+ ds2020-267_934
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 454
+ ds2020-267_859
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 455
+ ds2020-267_301
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 456
+ ds2020-267_42
+ No definition line
+ 575
+
+
+ 1
+ gnl|CDD|366000
+ pfam00284, Cytochrom_B559a, Lumenal portion of Cytochrome b559, alpha (gene psbE) subunit. This family is the lumenal portion of cytochrome b559 alpha chain, matches to this family should be accompanied by a match to the pfam00283 family also. The Prosite pattern pattern matches the transmembrane region of the cytochrome b559 alpha and beta subunits.
+ 366000
+ 38
+
+
+ 1
+ 81.1398
+ 201
+ 1.02897e-21
+ 187
+ 300
+ 1
+ 38
+ 1
+ 0
+ 24
+ 34
+ 0
+ 38
+ LAYDVFGSPRPNEYFTESRQGIPLITGRFDSLEQLDEF
+ LAYDVFGTPRPNEYFTQERQELPIVSDRFEAKQQIDEF
+ LAYDVFG+PRPNEYFT+ RQ +P+++ RF++ +Q+DEF
+
+
+
+
+ 2
+ gnl|CDD|365999
+ pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits.
+ 365999
+ 29
+
+
+ 1
+ 46.6507
+ 111
+ 1.54942e-08
+ 79
+ 165
+ 1
+ 29
+ 1
+ 0
+ 12
+ 21
+ 0
+ 29
+ GERSFADIITSIRYWVIHSITIPSLFIAG
+ GERPFSYPIFTVRWLAIHALTVPTVFFLG
+ GER F+ I ++R+ IH++T+P++F G
+
+
+ 2
+ 43.1839
+ 102
+ 2.95472e-07
+ 325
+ 411
+ 1
+ 29
+ 1
+ 0
+ 19
+ 21
+ 0
+ 29
+ MTIDRTYPIFTVRWLAVHGLAVPTVSFLG
+ GERPFSYPIFTVRWLAIHALTVPTVFFLG
+ +YPIFTVRWLA+H L VPTV FLG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 82
+ 167340070
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 457
+ ds2020-267_260
+ No definition line
+ 261
+
+
+
+
+ 17919
+ 3004588
+ 51
+ 75265884
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 458
+ ds2020-267_788
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 459
+ ds2020-267_541
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 460
+ ds2020-267_317
+ No definition line
+ 251
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 461
+ ds2020-267_839
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 462
+ ds2020-267_1195
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 463
+ ds2020-267_303
+ No definition line
+ 254
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 464
+ ds2020-267_680
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 465
+ ds2020-267_632
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 466
+ ds2020-267_59
+ No definition line
+ 474
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 125529973
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 467
+ ds2020-267_354
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 468
+ ds2020-267_366
+ No definition line
+ 243
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 469
+ ds2020-267_523
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 470
+ ds2020-267_874
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 471
+ ds2020-267_24
+ No definition line
+ 827
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 281479870
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 472
+ ds2020-267_125
+ No definition line
+ 335
+
+
+
+
+ 17919
+ 3004588
+ 69
+ 74263434
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 473
+ ds2020-267_453
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 474
+ ds2020-267_537
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 475
+ ds2020-267_1012
+ No definition line
+ 92
+
+
+
+
+ 17919
+ 3004588
+ 4
+ 76255712
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 476
+ ds2020-267_711
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 477
+ ds2020-267_1041
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 478
+ ds2020-267_283
+ No definition line
+ 257
+
+
+ 1
+ gnl|CDD|372443
+ pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR.
+ 372443
+ 50
+
+
+ 1
+ 38.4936
+ 91
+ 3.148e-06
+ 13
+ 114
+ 15
+ 48
+ 1
+ 0
+ 13
+ 22
+ 0
+ 34
+ KLG*VEKSLEMFSEMKKCGVAPNEITFIGVLGAC
+ KNGKVEEAFKLFNEMKKRGIKPNVYTYTILINGL
+ K G VE++ ++F+EMKK G+ PN T+ ++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 479
+ ds2020-267_955
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 480
+ ds2020-267_224
+ No definition line
+ 272
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 73330632
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 481
+ ds2020-267_1161
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 482
+ ds2020-267_111
+ No definition line
+ 353
+
+
+
+
+ 17919
+ 3004588
+ 73
+ 74646044
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 483
+ ds2020-267_175
+ No definition line
+ 291
+
+
+
+
+ 17919
+ 3004588
+ 59
+ 73999946
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 484
+ ds2020-267_77
+ No definition line
+ 422
+
+
+
+
+ 17919
+ 3004588
+ 78
+ 99628172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 485
+ ds2020-267_342
+ No definition line
+ 246
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.073678116
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 486
+ ds2020-267_395
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 487
+ ds2020-267_805
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 488
+ ds2020-267_685
+ No definition line
+ 214
+
+
+ 1
+ gnl|CDD|370442
+ pfam09334, tRNA-synt_1g, tRNA synthetases class I (M). This family includes methionyl tRNA synthetases.
+ 370442
+ 391
+
+
+ 1
+ 63.8538
+ 156
+ 1.80219e-14
+ 16
+ 117
+ 124
+ 157
+ -2
+ 0
+ 18
+ 22
+ 0
+ 34
+ PKKGMFLSDRFIKGTCPKCKSEDQYGDSCEDIGT
+ PSDERFLPDRYVEGTCPHCGSEDARGDQCENCGR
+ P FL DR+++GTCP C SED GD CE+ G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 489
+ ds2020-267_60
+ No definition line
+ 471
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 123940986
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+
diff --git a/tools/virAnnot/virAnnot_blast2tsv.xml b/tools/virAnnot/virAnnot_blast2tsv.xml
new file mode 100755
index 00000000000..9df21d99c6d
--- /dev/null
+++ b/tools/virAnnot/virAnnot_blast2tsv.xml
@@ -0,0 +1,94 @@
+
+ convert XML blast results to tabular file with taxonomic informations
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+ BLASTX
+ BLASTP
+ TBLASTX
+ BLASTN
+ DIAMOND
+
+
+ 0
+ 0.1
+ 0.01
+ 0.001
+ 0.0001
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff --git a/tools/virAnnot/virAnnot_otu.xml b/tools/virAnnot/virAnnot_otu.xml
new file mode 100755
index 00000000000..f4991e028e0
--- /dev/null
+++ b/tools/virAnnot/virAnnot_otu.xml
@@ -0,0 +1,102 @@
+
+ create viral OTUs based on RPS and Blast annotations
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ 0.1
+ 0.2
+ 0.3
+ 0.4
+ 0.5
+
+
+ 50
+ 80
+ 100
+ 150
+ 200
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/tools/virAnnot/virAnnot_rps2tsv.xml b/tools/virAnnot/virAnnot_rps2tsv.xml
new file mode 100755
index 00000000000..839b5aa434d
--- /dev/null
+++ b/tools/virAnnot/virAnnot_rps2tsv.xml
@@ -0,0 +1,57 @@
+
+ Convert xml rpstblast results to tab file with taxonomic informations
+
+ macros.xml
+
+
+
+
+
+
+ 0
+ 0.1
+ 0.01
+ 0.001
+ 0.0001
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+