# HG changeset patch
# User iuc
# Date 1724245979 0
# Node ID b82ce29791e710c304ea3e5e36c95d5f581522ea
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/virAnnot commit ab5e1189217b6ed5f1c5d7c5ff6b79b6a4c18cff
diff -r 000000000000 -r b82ce29791e7 blast2tsv.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/blast2tsv.py Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,297 @@
+#!/usr/bin/env python3
+
+
+# Name: blast2tsv
+# Author(s): Sebastien Theil, Marie Lefebvre - INRAE
+# Aims: Convert blast xml output to tsv and add taxonomy
+
+
+import argparse
+import csv
+import logging as log
+import os
+
+from Bio import Entrez
+from Bio import SeqIO
+from Bio.Blast import NCBIXML
+from ete3 import NCBITaxa
+
+ncbi = NCBITaxa()
+
+
+def main():
+    """Parse the CLI options, configure logging, then convert the BLAST XML to TSV."""
+    opts = _set_options()
+    _set_log_level(opts.verbosity)
+    parsed_hits = _read_xml(opts)
+    _write_tsv(opts, parsed_hits)
+
+
+def _guess_database(accession):
+    """
+    Pick the Entrez database to query from the shape of an accession.
+
+    Purely numeric identifiers map to 'taxonomy'. Otherwise the first two
+    characters are matched against known prefixes; an unknown prefix falls
+    back to 'nuccore' and a warning is logged.
+    """
+    if accession.isdigit():
+        return 'taxonomy'
+    protein_prefixes = ('AP', 'NP', 'YP', 'XP', 'WP')
+    nucleotide_prefixes = ('AC', 'NC', 'NG', 'NT', 'NW', 'NZ', 'OX')
+    prefix = accession[0:2]
+    if prefix in protein_prefixes:
+        return 'protein'
+    if prefix in nucleotide_prefixes:
+        return 'nuccore'
+    log.warning("DB not found for " + accession + ". Set to nuccore.")
+    return 'nuccore'
+
+
+def _read_xml(options):
+ """
+ Parse the BLAST XML file at options.xml_file with NCBIXML.parse.
+
+ For each alignment, identities, alignment length, e-value and bit score
+ are accumulated over its HSPs. After the first HSP, an HSP is only added
+ when hit.frame[1] has the same sign as the first HSP's frame. The stored
+ e-value is the accumulated e-value divided by final_hit_count, which is
+ also stored as "num_hsps".
+ The TaxId of the accession is requested with Entrez.esummary and expanded
+ to a lineage with the module-level NCBITaxa instance; on any exception the
+ taxonomy fields are set to "" and a warning is logged.
+
+ Return a dict keyed by query id. The value is the hit dict when the
+ max_evalue / min_qov / min_hov / min_score thresholds are all met,
+ otherwise a one-element list holding the query length.
+ NOTE(review): the handle opened below is not closed in this function.
+ """
+ log.info("Read XML file.")
+ results = open(options.xml_file, 'r')
+ records = NCBIXML.parse(results)
+ xml_results = {}
+ for blast_record in records:
+ for aln in blast_record.alignments:
+ hit_count = 1
+ for hit in aln.hsps:
+ hsp = {}
+ if hit_count == 1:
+ first_hit_frame = hit.frame[1] if len(hit.frame) > 0 else 0 # strand
+ cumul_hit_identity = hit.identities if hit.identities else 0
+ cumul_hit_score = hit.bits # hit score
+ cumul_hit_evalue = hit.expect # evalue
+ cumul_hit_length = hit.align_length if hit.align_length is not None else 0
+ hit_count = hit_count + 1
+ else:
+ # all HSPs in different strand than 1st HSPs will be discarded.
+ if (first_hit_frame > 0 and hit.frame[1] > 0) or (first_hit_frame < 0 and hit.frame[1] < 0):
+ cumul_hit_identity = cumul_hit_identity + hit.identities
+ cumul_hit_length = cumul_hit_length + hit.align_length
+ cumul_hit_evalue = cumul_hit_evalue + hit.expect
+ cumul_hit_score = cumul_hit_score + hit.bits
+ hit_count = hit_count + 1
+ # hit_count starts at 1 and is incremented per accepted HSP, hence the "- 1".
+ if hit_count == 1:
+ final_hit_count = hit_count
+ elif hit_count > 1:
+ final_hit_count = hit_count - 1
+ hsp["evalue"] = cumul_hit_evalue / final_hit_count # The smaller the E-value, the better the match
+ hsp["query_id"] = blast_record.query # or query_id
+ hsp["query_length"] = blast_record.query_length # length of the query
+ hsp["accession"] = aln.accession.replace("ref|", "")
+ hsp["description"] = aln.hit_def
+ hsp["hit_length"] = aln.length # length of the hit
+ hsp["hsp_length"] = hit.align_length # length of the hsp alignment
+ hsp["queryOverlap"] = _get_overlap_value(options.algo, hsp, 'hsp', hsp["query_length"])[0]
+ if cumul_hit_length == 0:
+ hsp["percentIdentity"] = round(cumul_hit_identity, 1) # identity percentage
+ else:
+ hsp["percentIdentity"] = round(cumul_hit_identity / cumul_hit_length * 100, 1) # identity percentage
+ hsp["score"] = cumul_hit_score # The higher the bit-score, the better the sequence similarity
+ hsp["num_hsps"] = final_hit_count
+ hsp["hit_cumul_length"] = cumul_hit_length
+ hsp["hitOverlap"] = _get_overlap_value(options.algo, hsp, 'hit', hsp["query_length"])[1]
+ # Entrez database is chosen from the form of the accession.
+ db = _guess_database(hsp["accession"])
+ try:
+ handle = Entrez.esummary(db=db, id=hsp["accession"])
+ taxid = str(int(Entrez.read(handle)[0]['TaxId']))
+ handle.close()
+ log.info("Taxid found for " + hsp["accession"])
+ lineage = ncbi.get_lineage(taxid)
+ names = ncbi.get_taxid_translator(lineage)
+ ordered = [names[tid] for tid in lineage]
+ # The first lineage entry is left out of the taxonomy string.
+ taxonomy = ordered[1:]
+ hsp["tax_id"] = taxid
+ hsp["taxonomy"] = ';'.join(taxonomy)
+ hsp["organism"] = taxonomy[-1]
+ except RuntimeError:
+ hsp["tax_id"] = ""
+ hsp["taxonomy"] = ""
+ hsp["organism"] = ""
+ log.warning(f"RuntimeError - Taxid not found for {hsp['accession']}")
+ except Exception as err:
+ hsp["tax_id"] = ""
+ hsp["taxonomy"] = ""
+ hsp["organism"] = ""
+ log.warning(f"Taxid not found for {hsp['accession']}. The error is {err}")
+ # Keep the full hit only when every threshold passes; otherwise store just the query length.
+ if hsp["evalue"] <= options.max_evalue and hsp["queryOverlap"] >= options.min_qov and \
+ hsp["hitOverlap"] >= options.min_hov and hsp["score"] >= options.min_score:
+ xml_results[hsp["query_id"]] = hsp
+ else:
+ xml_results[hsp["query_id"]] = [hsp["query_length"]]
+
+ return xml_results
+
+
+def _get_overlap_value(algo, hsp, type, qlength):
+    """
+    Compute the query and hit overlap percentages for one alignment.
+
+    algo    -- BLAST flavour name; 'BLASTX', 'TBLASTN' and 'TBLASTX' apply a
+               factor 3 on one or both sides, any other value applies none
+    hsp     -- dict providing "hit_length" and "hsp_length", plus
+               "hit_cumul_length" when type is not 'hsp'
+    type    -- 'hsp' to use the HSP alignment length on the hit side,
+               anything else to use the cumulated hit length
+    qlength -- query length
+
+    Return [query_overlap, hit_overlap], each capped at 100 and rounded to
+    0 decimals. A side whose reference length is 0 or None yields 0; the
+    query side previously raised UnboundLocalError in that case.
+    """
+    h_align_len = hsp["hsp_length"] if type == 'hsp' else hsp["hit_cumul_length"]
+    q_align_len = qlength
+    hit_length = hsp["hit_length"]
+
+    # Defaults used when the corresponding reference length is missing or zero.
+    query_overlap = 0
+    hit_overlap = 0
+
+    if algo == 'BLASTX':
+        if q_align_len:
+            query_overlap = (q_align_len * 3 / q_align_len) * 100
+        if hit_length:
+            hit_overlap = (h_align_len / hit_length) * 100
+    elif algo == 'TBLASTN':
+        if q_align_len:
+            query_overlap = (q_align_len / q_align_len) * 100
+        if hit_length:
+            hit_overlap = (h_align_len * 3 / hit_length) * 100
+    elif algo == 'TBLASTX':
+        if q_align_len:
+            query_overlap = (q_align_len * 3 / hsp["hsp_length"]) * 100
+        if hit_length:
+            hit_overlap = (h_align_len * 3 / hit_length) * 100
+    else:
+        if q_align_len:
+            query_overlap = (q_align_len / q_align_len) * 100
+        if hit_length:
+            hit_overlap = (h_align_len / hit_length) * 100
+
+    # Percentages are capped at 100.
+    if query_overlap > 100:
+        query_overlap = 100
+    if hit_overlap > 100:
+        hit_overlap = 100
+
+    return [round(query_overlap, 0), round(hit_overlap, 0)]
+
+
+def _write_tsv(options, hits):
+    """
+    Write the hits to <options.output>/blast2tsv_output.tab and then build
+    the abundance files from that table.
+
+    options -- parsed arguments; reads rn_file, fasta_file, output and algo
+    hits    -- dict keyed by query id; each value is either a hit dict or a
+               one-element list (query length only) for queries without a
+               retained hit
+
+    When options.rn_file is given, every query id in hits must be present
+    in it (KeyError otherwise). Files are opened with context managers so
+    the handles are released even if a write fails.
+    """
+    # Optional read counts: first column is the contig id, the rest is kept as-is.
+    rn_list = {}
+    if options.rn_file is not None:
+        with open(options.rn_file) as rn:
+            rows = (line.split('\t') for line in rn)
+            rn_list = {row[0]: row[1:] for row in rows}
+    with open(options.fasta_file) as fasta_handle:
+        fasta = SeqIO.to_dict(SeqIO.parse(fasta_handle, 'fasta'))
+    headers = "#algo\tquery_id\tnb_reads\tquery_length\taccession\tdescription\torganism\tpercentIdentity\tnb_hsps\tqueryOverlap\thitOverlap\tevalue\tscore\ttax_id\ttaxonomy\tsequence\n"
+    if not os.path.exists(options.output):
+        os.mkdir(options.output)
+    tsv_file = options.output + "/blast2tsv_output.tab"
+    log.info("Write output file: " + tsv_file)
+    with open(tsv_file, "w+") as f:
+        f.write(headers)
+        for h, hit in hits.items():
+            if options.rn_file is not None:
+                read_nb = ''.join(rn_list[h]).replace("\n", "")
+            else:
+                read_nb = ''
+            if len(hit) > 1:
+                # Annotated query: one full 16-column row.
+                sequence = str(fasta[h].seq) if h in fasta else "\"\""
+                fields = [
+                    options.algo, h, read_nb, str(hit["query_length"]),
+                    hit["accession"], hit["description"],
+                    hit["organism"], str(hit["percentIdentity"]),
+                    str(hit["num_hsps"]), str(hit["queryOverlap"]),
+                    str(hit["hitOverlap"]), str(hit["evalue"]),
+                    str(hit["score"]), str(hit["tax_id"]),
+                    hit["taxonomy"], sequence,
+                ]
+                f.write("\t".join(fields) + "\n")
+            else:
+                # No retained hit: only the query length, stripped of the list brackets.
+                f.write(options.algo + "\t" + h + "\t" + read_nb + "\t" + str(hit)[1:-1] + "\t")
+                f.write("\n")
+    _create_abundance(options, tsv_file)
+
+
+def _create_abundance(options, tsv_file):
+    """
+    Aggregate the TSV table per taxonomy string and write two abundance files.
+
+    Rows with exactly 16 columns and a non-empty taxonomy (column 15) are
+    counted; an empty read number (column 3) counts as 0 reads. The totals
+    go to blast2tsv_reads.txt and blast2tsv_contigs.txt in options.output,
+    one line per taxonomy with the ';' separators turned into tabs.
+    """
+    log.info("Calculating abundance.")
+    abundance = {}
+    with open(tsv_file, 'r') as handle:
+        log.debug("Reading " + tsv_file)
+        reader = csv.reader(handle, delimiter='\t')
+        next(reader, None)  # header line
+        for row in reader:
+            if len(row) != 16 or row[14] == "":
+                log.debug("No annotations for contig " + row[1])
+                continue
+            if row[2] == "":
+                reads = 0
+                log.debug("No reads number for " + row[1])
+            else:
+                reads = int(row[2])
+            counts = abundance.setdefault(row[14], {"reads_nb": 0, "contigs_nb": 0})
+            counts["reads_nb"] += reads
+            counts["contigs_nb"] += 1
+    log.debug(abundance)
+    targets = (
+        ("reads_nb", options.output + "/blast2tsv_reads.txt"),
+        ("contigs_nb", options.output + "/blast2tsv_contigs.txt"),
+    )
+    for key, path in targets:
+        out = open(path, "w+")
+        for taxo, counts in abundance.items():
+            out.write(str(counts[key]))
+            out.write("\t")
+            out.write("\t".join(taxo.split(";")))
+            out.write("\n")
+        out.close()
+        log.info("Abundance file created " + path)
+
+
+def _set_options():
+    """Declare the blast2tsv command-line interface and return the parsed arguments."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument('-x', '--xml', dest='xml_file', required=True,
+                     help='XML files with results of blast')
+    cli.add_argument('-rn', '--read-count', dest='rn_file',
+                     help='Tab-delimited file associating seqID with read number.')
+    cli.add_argument('-c', '--contigs', dest='fasta_file', required=True,
+                     help='FASTA file with contigs sequence.')
+    cli.add_argument('-me', '--max_evalue', dest='max_evalue', type=float, default=0.0001,
+                     help='Max evalue')
+    cli.add_argument('-qov', '--min_query_overlap', dest='min_qov', type=int, default=5,
+                     help='Minimum query overlap')
+    cli.add_argument('-mhov', '--min_hit_overlap', dest='min_hov', type=int, default=5,
+                     help='Minimum hit overlap')
+    cli.add_argument('-s', '--min_score', dest='min_score', type=int, default=30,
+                     help='Minimum score')
+    cli.add_argument('-a', '--algo', dest='algo', type=str, default='BLASTX',
+                     help='Blast type detection (BLASTN|BLASTP|BLASTX|TBLASTX|TBLASTN|DIAMONDX).')
+    cli.add_argument('-o', '--out', dest='output', type=str, default='./blast2tsv',
+                     help='The output file (.csv).')
+    cli.add_argument('-v', '--verbosity', type=int, choices=[1, 2, 3, 4], default=1,
+                     help='Verbose level')
+    return cli.parse_args()
+
+
+def _set_log_level(verbosity):
+    """Configure logging for verbosity 1 (INFO) or 3 (DEBUG); other values configure nothing."""
+    presets = {
+        1: (log.INFO, '%(asctime)s %(levelname)-8s %(message)s'),
+        3: (log.DEBUG, '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s'),
+    }
+    if verbosity in presets:
+        level, log_format = presets[verbosity]
+        log.basicConfig(level=level, format=log_format)
+
+
+if __name__ == "__main__":
+ main()
diff -r 000000000000 -r b82ce29791e7 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,30 @@
+
+
+
+ virannot
+
+
+
+
+ biopython
+ ete3
+ clustalo
+ curl
+ r-base
+ pyaml
+ openpyxl
+ xlsxwriter
+ xlrd
+ pandas
+ krona
+ zip
+
+
+
+
+
+
+ 10.1094/PBIOMES-07-19-0037-A
+
+
+
diff -r 000000000000 -r b82ce29791e7 otu.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/otu.py Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,442 @@
+#!/usr/bin/env python3
+
+
+# Name: virAnnot_otu
+# Author: Marie Lefebvre - INRAE
+# Requirements: Ete3 toolkit and external apps
+# Aims: Create viral OTUs based on RPS and Blast annotations
+
+
+import argparse
+import csv
+import logging as log
+import os
+import random
+import re
+
+import pandas as pd
+import xlsxwriter
+from Bio import SeqIO
+from Bio.Align.Applications import ClustalOmegaCommandline
+from ete3 import NodeStyle, SeqGroup, SeqMotifFace, Tree, TreeStyle
+
+
+def main():
+    """
+    Run the OTU pipeline end to end:
+    1 - collect sequence, query_id and taxonomy from the RPS files
+    2 - align the protein sequences of each domain, compute the
+    distance matrix and generate the trees
+    3 - gather read-number statistics per OTU
+    4 - write the HTML report
+    """
+    opts = _set_options()
+    _set_log_level(opts.verbosity)
+    collection = _cut_sequence(opts)
+    for step in (_align_sequences, _get_stats, _create_html):
+        step(opts, collection)
+
+
+def _cut_sequence(options):
+ """
+ Retrieve viral hits and sequences from RPS files.
+
+ options.rps, options.fasta and options.blast are sorted and read by the
+ same index, taking element [0] of each entry as the file path.
+ Each RPS file is read as tab-delimited text; the first row is skipped as
+ a header and rows whose second column is "no_hit" are ignored. Columns
+ used: 0 query id, 2 cdd id, 5 query start, 6 query end, 7 frame,
+ 8 description, 9 superkingdom.
+ When the superkingdom contains "Viruses", the contig is fetched from the
+ FASTA file, cut to the hit coordinates, reverse-complemented for a
+ negative frame and translated; it is kept when the protein length is at
+ least options.min_protein_length. Read number and taxonomy come from the
+ blast table (columns 2 and 14 of rows whose column 1 equals the query id)
+ when one is given, otherwise they default to 0 and "Unknown".
+
+ Return a dict keyed by cdd id; each value maps query ids to their data
+ and also holds "short_description" and "full_description".
+ """
+ log.info("Cut sequences")
+ i = 0 # keep track of iterations over rps files to use the corresponding fasta file
+ collection = {}
+ options.rps.sort()
+ for rps_file in options.rps:
+ log.debug("Reading rps file " + str(rps_file))
+ with open(rps_file[0], 'r') as rps_current_file:
+ rps_reader = csv.reader(rps_current_file, delimiter='\t')
+ headers = 0
+ for row in rps_reader:
+ if headers == 0:
+ # headers
+ headers += 1
+ else:
+ if row[1] == "no_hit":
+ pass
+ else:
+ query_id = row[0]
+ cdd_id = row[2]
+ startQ = int(row[5])
+ endQ = int(row[6])
+ frame = float(row[7])
+ description = row[8]
+ superkingdom = row[9]
+ match = re.search("Viruses", superkingdom)
+ # if contig is viral then retrieve sequence
+ if match:
+ options.fasta.sort()
+ seq = _retrieve_fasta_seq(options.fasta[i][0], query_id)
+ seq_length = len(seq)
+ # Slice from the 1-based start; the end is bounded by the contig length.
+ if endQ < seq_length:
+ seq = seq[startQ - 1:endQ]
+ else:
+ seq = seq[startQ - 1:seq_length]
+ if frame < 0:
+ seq = seq.reverse_complement()
+ prot = seq.translate()
+ if len(prot) >= options.min_protein_length:
+ log.debug("Add " + query_id + " to collection")
+ if cdd_id not in collection:
+ collection[cdd_id] = {}
+ collection[cdd_id][query_id] = {}
+ collection[cdd_id][query_id]["nuccleotide"] = seq
+ collection[cdd_id][query_id]["protein"] = prot
+ collection[cdd_id][query_id]["full_description"] = description
+ if options.blast is not None:
+ options.blast.sort()
+ # The blast table is scanned in full for every retained contig.
+ with open(options.blast[i][0], 'r') as blast_current_file:
+ blast_reader = csv.reader(blast_current_file, delimiter='\t')
+ for b_query in blast_reader:
+ if b_query[1] == query_id:
+ collection[cdd_id][query_id]["nb"] = b_query[2]
+ if len(b_query) > 10:
+ collection[cdd_id][query_id]["taxonomy"] = b_query[14]
+ else:
+ collection[cdd_id][query_id]["taxonomy"] = "Unknown"
+ else:
+ if "nb" not in collection[cdd_id][query_id]:
+ collection[cdd_id][query_id]["nb"] = 0
+ if "taxonomy" not in collection[cdd_id][query_id]:
+ collection[cdd_id][query_id]["taxonomy"] = "Unknown"
+ else:
+ log.info("No blast file")
+ collection[cdd_id][query_id]["taxonomy"] = "Unknown"
+ collection[cdd_id][query_id]["nb"] = 0
+
+ collection[cdd_id]["short_description"] = description.split(",")[0] + description.split(",")[1] # keep pfamXXX and RdRp 1
+ collection[cdd_id]["full_description"] = description
+ # presumably advanced once per RPS file so the next FASTA/blast file is used - TODO confirm
+ i += 1
+ return collection
+
+
+def _retrieve_fasta_seq(fasta_file, query_id):
+    """
+    Return the sequence of the record `query_id` from a FASTA file.
+
+    The whole file is loaded with SeqIO.to_dict. When no record carries
+    that id, a message is printed and None is returned.
+    """
+    # Context manager so the handle is released as soon as parsing is done.
+    with open(fasta_file) as handle:
+        contigs_list = SeqIO.to_dict(SeqIO.parse(handle, 'fasta'))
+    try:
+        return contigs_list[query_id].seq
+    except KeyError:
+        print("KeyError for " + query_id + " file " + fasta_file)
+        return None
+
+
+def _create_tree(tree, fasta, out, color):
+ """
+ Render a phylogenetic tree image from a guide tree and its alignment.
+
+ tree  -- path of the tree file; if it cannot be opened, a message is
+          logged and the function returns without rendering
+ fasta -- path of the aligned FASTA file, loaded with SeqGroup
+ out   -- path passed to Tree.render
+ color -- path of the tab-delimited colour file read by _parse_color_file
+
+ Each leaf gets a SeqMotifFace built from its aligned sequence, and a
+ background colour when its name is listed in the colour file.
+ """
+ try:
+ f = open(tree, 'r')
+ except IOError:
+ log.info("Unknown file: " + tree + ". You may have less than 2 sequences to align.")
+ return
+
+ # The file content is accumulated in `line`, which is not used afterwards in this function.
+ line = ""
+ for word in f:
+ line += word.strip()
+
+ f.close()
+ seqs = SeqGroup(fasta, format="fasta")
+ t = Tree(tree)
+ ts = TreeStyle()
+ ts.show_branch_length = True
+ colors = _parse_color_file(color)
+ node_names = t.get_leaf_names()
+ for name in node_names:
+ seq = seqs.get_seq(name)
+ seqFace = SeqMotifFace(seq, seq_format="()")
+ node = t.get_leaves_by_name(name)
+ for i in range(0, len(node)):
+ if name in colors:
+ ns = NodeStyle()
+ ns['bgcolor'] = colors[name]
+ node[i].set_style(ns)
+ # presumably applied to every leaf, coloured or not - TODO confirm nesting
+ node[i].add_face(seqFace, 0, 'aligned')
+
+ t.render(out, tree_style=ts)
+
+
+def _parse_color_file(file):
+    """
+    Read a tab-delimited colour file into a dict.
+
+    file -- path of a file whose first column is a name and whose second
+            column is the colour assigned to it
+
+    Return {name: colour}. A row with fewer than two columns raises
+    IndexError. The file is closed before returning.
+    """
+    with open(file) as fh:
+        return {row[0]: row[1] for row in csv.reader(fh, delimiter="\t")}
+
+
+def _align_sequences(options, hits_collection):
+ """
+ Align hit sequences with pfam reference
+
+ For every cdd id a sub-directory of options.output is created, named
+ after the short description with spaces replaced by underscores. The
+ protein sequences are written to seq_to_align.fasta and a colour per
+ contig to color_config.txt; the colour is random and shared by all
+ contigs whose id has the same text before the first "_".
+ With more than one contig, Clustal Omega is run, the tree is drawn, the
+ pairwise identity matrix is computed and seek_otu.R is called through
+ os.system. Otherwise the FASTA file is copied as the alignment and a
+ single-OTU cluster file is written.
+ NOTE(review): the external commands are built by string concatenation
+ and run through the shell; paths containing spaces or shell
+ metacharacters would not be passed intact.
+ """
+ log.info("Align sequences")
+ if not os.path.exists(options.output):
+ os.mkdir(options.output)
+ color_by_sample = {}
+ for cdd_id in hits_collection:
+ cdd_output = options.output + "/" + hits_collection[cdd_id]["short_description"].replace(" ", "_")
+ if not os.path.exists(cdd_output):
+ os.mkdir(cdd_output)
+ # The FASTA file is opened in append mode below, so a previous one is removed first.
+ if os.path.exists(cdd_output + "/seq_to_align.fasta"):
+ os.remove(cdd_output + "/seq_to_align.fasta")
+ file_seq_to_align = cdd_output + "/seq_to_align.fasta"
+ file_color_config = cdd_output + "/color_config.txt"
+ f = open(file_seq_to_align, "a")
+ f_c = open(file_color_config, "w+")
+ log.info("Writing to " + file_seq_to_align)
+ count = 0 # count number of contig per domain
+ for query_id in hits_collection[cdd_id]:
+ # The two description keys live next to the query ids and are not contigs.
+ if query_id not in ["short_description", "full_description"]:
+ sample = query_id.split("_")[0] # get sample from SAMPLE_IdCONTIG
+ sample_color = "#" + ''.join([random.choice('ABCDEF0123456789') for i in range(6)])
+ # same color for each contig of the same sample
+ if sample not in color_by_sample.keys():
+ color_by_sample[sample] = sample_color
+ f.write(">" + query_id + "\n")
+ f.write(str(hits_collection[cdd_id][query_id]["protein"]) + "\n")
+ f_c.write(query_id + '\t' + color_by_sample[sample] + '\n')
+ count += 1
+ f.close()
+ f_c.close()
+ file_seq_aligned = cdd_output + '/seq_aligned.final_tree.fa'
+ tree_file = cdd_output + '/tree.dnd'
+ file_cluster = cdd_output + '/otu_cluster.csv'
+ # create alignment for domain with more than 1 contigs
+ if count > 1:
+ log.info("Run clustal omega...")
+ clustalo_cmd = ClustalOmegaCommandline("clustalo", infile=file_seq_to_align, outfile=file_seq_aligned,
+ guidetree_out=tree_file, seqtype="protein", force=True)
+ log.debug(clustalo_cmd)
+ stdout, stderr = clustalo_cmd()
+ log.debug(stdout + stderr)
+
+ # create tree plot with colors
+ file_matrix = cdd_output + "/identity_matrix.csv"
+ log.info("Create tree...")
+ _create_tree(tree_file, file_seq_aligned, tree_file + '.png', file_color_config)
+ _compute_pairwise_distance(options, file_seq_aligned, file_matrix, cdd_id)
+ log.info("Retrieve OTUs...")
+ # if os.path.exists(file_cluster):
+ # os.remove(file_cluster)
+ otu_cmd = os.path.join(options.tool_path, 'seek_otu.R') + ' ' + file_matrix + ' ' + file_cluster + ' ' + str(options.perc)
+ log.debug(otu_cmd)
+ os.system(otu_cmd)
+ # only one contig
+ else:
+ mv_cmd = 'cp ' + file_seq_to_align + ' ' + file_seq_aligned
+ log.debug(mv_cmd)
+ os.system(mv_cmd)
+
+ # Cluster file with a single OTU holding the first key of this cdd entry.
+ f = open(file_cluster, "w+")
+ f.write('OTU_1,1,' + list(hits_collection[cdd_id].keys())[0] + ',')
+ f.close()
+
+
+def _compute_pairwise_distance(options, file_seq_aligned, file_matrix, cdd_id):
+    """
+    Calculate the pairwise identity between aligned protein sequences of
+    one cdd_id and write it as a matrix.
+
+    options          -- unused
+    file_seq_aligned -- aligned FASTA file
+    file_matrix      -- output file; one line per sequence: its id, a
+                        comma, then the identities joined with ', '
+    cdd_id           -- only used in the log message
+
+    A position is skipped when either residue is 'X' or a gap. Identity is
+    identical / compared * 100, or 0 when fewer than 20 positions were
+    compared. The alignment is parsed once up front instead of once per
+    sequence.
+    """
+    log.info("Compute pairwise distance of " + cdd_id)
+    records = list(SeqIO.parse(file_seq_aligned, "fasta"))
+    sequences = [str(record.seq) for record in records]
+    matrix = {}
+    for k1, seq1 in zip(records, sequences):
+        row = []
+        for seq2 in sequences:
+            identic = 0
+            compared = 0
+            for pos, base in enumerate(seq1):
+                base2 = seq2[pos]
+                # ambiguous residue or gap on either side: position not compared
+                if base in ('X', '-') or base2 in ('X', '-'):
+                    continue
+                if base == base2:
+                    identic += 1
+                compared += 1
+            # set minimum overlap to 20
+            if compared < 20:
+                percentIdentity = 0
+            else:
+                percentIdentity = (identic / compared) * 100
+            row.append(percentIdentity)
+        matrix[k1.id] = row
+    log.debug("Write " + file_matrix)
+    with open(file_matrix, "w+") as f:
+        for seq_id, identities in matrix.items():
+            f.write(seq_id + ',' + ', '.join(map(str, identities)) + "\n")
+
+
+def _get_stats(options, hits_collection):
+ """
+ Retrieve annotation and number of read
+ for each OTUs
+
+ Writes <options.output>/otu_stats.xlsx with one worksheet per cdd id,
+ named after its short description. For each cdd id the otu_cluster.csv
+ file is read: column 0 is the OTU name and the contig ids start at
+ column 2, the last column being dropped. The sample of a contig is the
+ text before the first "_" of its id.
+ Worksheet layout: OTU name, one column of summed read numbers per
+ sample, taxonomy, comma-joined contig list.
+ Finally every sheet of the workbook is exported with pandas to
+ <options.output>/<sheet name with spaces as underscores>/cluster_nb_reads_files.tab.
+ """
+ file_xlsx = options.output + '/otu_stats.xlsx' # Create a workbook
+ workbook = xlsxwriter.Workbook(file_xlsx)
+ log.info("Writing stats to " + file_xlsx)
+ for cdd_id in hits_collection:
+ otu_collection = {}
+ cdd_output = options.output + "/" + hits_collection[cdd_id]["short_description"].replace(" ", "_")
+ worksheet = workbook.add_worksheet(hits_collection[cdd_id]["short_description"]) # add a worksheet
+ file_cluster = cdd_output + '/otu_cluster.csv'
+ with open(file_cluster, 'r') as clust:
+ otu_reader = csv.reader(clust, delimiter=',')
+ samples_list = []
+ for row in otu_reader:
+ contigs_list = row[2:len(row) - 1] # remove last empty column
+ otu_collection[row[0]] = {} # key -> otu number
+ otu_collection[row[0]]['contigs_list'] = contigs_list
+ for contig in contigs_list:
+ sample = contig.split('_')[0]
+ samples_list.append(sample) if sample not in samples_list else samples_list
+ # Both branches below store the same 'nb' and 'taxonomy' values for the contig.
+ if sample not in otu_collection[row[0]]:
+ otu_collection[row[0]][sample] = {}
+ otu_collection[row[0]][sample][contig] = {}
+ # add read number of the contig and annotation
+ if 'nb' in hits_collection[cdd_id][contig]:
+ otu_collection[row[0]][sample][contig]['nb'] = hits_collection[cdd_id][contig]["nb"]
+ else:
+ otu_collection[row[0]][sample][contig]['nb'] = 0
+ if 'taxonomy' in hits_collection[cdd_id][contig]:
+ otu_collection[row[0]][sample][contig]['taxonomy'] = hits_collection[cdd_id][contig]["taxonomy"]
+ else:
+ otu_collection[row[0]][sample][contig]['taxonomy'] = 'unknown'
+ else:
+ otu_collection[row[0]][sample][contig] = {}
+ # add read number of the contig and annotation
+ if 'nb' in hits_collection[cdd_id][contig]:
+ otu_collection[row[0]][sample][contig]['nb'] = hits_collection[cdd_id][contig]["nb"]
+ else:
+ otu_collection[row[0]][sample][contig]['nb'] = 0
+ if 'taxonomy' in hits_collection[cdd_id][contig]:
+ otu_collection[row[0]][sample][contig]['taxonomy'] = hits_collection[cdd_id][contig]["taxonomy"]
+ else:
+ otu_collection[row[0]][sample][contig]['taxonomy'] = 'unknown'
+ # The OTU-level taxonomy is overwritten by each contig, so the last one read is kept.
+ if 'taxonomy' in hits_collection[cdd_id][contig]:
+ otu_collection[row[0]]['global_taxonomy'] = hits_collection[cdd_id][contig]["taxonomy"]
+ else:
+ otu_collection[row[0]]['global_taxonomy'] = 'unknown'
+
+ # calculate total number of reads for each sample of each OTU
+ for otu in otu_collection:
+ for sample in otu_collection[otu]:
+ if sample not in ['contigs_list', 'global_taxonomy']:
+ total_nb_read = 0
+ for contig in otu_collection[otu][sample]:
+ total_nb_read += int(otu_collection[otu][sample][contig]['nb'])
+ otu_collection[otu][sample]['total_nb_read'] = total_nb_read
+ # Header row: OTU name, one column per sample, then taxonomy and contig list.
+ row = 0
+ column = 0
+ item = '#OTU_name'
+ worksheet.write(row, column, item)
+ for samp in samples_list:
+ column += 1
+ worksheet.write(row, column, samp)
+ worksheet.write(row, column + 1, 'taxonomy')
+ worksheet.write(row, column + 2, 'contigs_list')
+ row = 1
+ # column = 0
+ for otu in otu_collection:
+ if isinstance(otu_collection[otu], dict):
+ column = 0
+ worksheet.write(row, column, otu)
+ # prepare table with 0 in each cells
+ for sample in otu_collection[otu]:
+ column = 1
+ for samp in samples_list:
+ worksheet.write(row, column, 0)
+ column += 1
+ # fill in table with nb of read for each sample and each OTU
+ for sample in otu_collection[otu]:
+ column = 1
+ for samp in samples_list:
+ if samp == sample:
+ worksheet.write(row, column, otu_collection[otu][sample]['total_nb_read'])
+ column += 1
+ worksheet.write(row, len(samples_list) + 1, otu_collection[otu]['global_taxonomy'].replace(';', ' '))
+ worksheet.write(row, len(samples_list) + 2, ",".join(otu_collection[otu]['contigs_list']))
+ row += 1
+ workbook.close()
+ # Re-read the finished workbook and export each sheet as a tab-delimited file.
+ read_file = pd.ExcelFile(file_xlsx)
+ for sheet in read_file.sheet_names:
+ cluster_nb_reads_file = options.output + "/" + sheet.replace(" ", "_") + "/cluster_nb_reads_files.tab"
+ data_xls = pd.read_excel(file_xlsx, sheet, dtype=str, index_col=None)
+ data_xls.to_csv(cluster_nb_reads_file, encoding='utf-8', index=False, sep='\t')
+
+
+def _create_html(options, hits_collection):
+    """
+    Write the map file listing the result files of every cdd id, then call
+    rps2tree_html.py on it to produce the HTML report.
+    """
+    # mapping file gathering everything the HTML report needs
+    map_file_path = options.output + "/map.txt"
+    if os.path.exists(map_file_path):
+        os.remove(map_file_path)
+
+    column_names = ['#cdd_id', 'align_files', 'tree_files', 'cluster_files', 'cluster_nb_reads_files', 'pairwise_files', 'description', 'full_description\n']
+    map_file = open(map_file_path, "w+")
+    map_file.write("\t".join(column_names))
+    for cdd_id, cdd_hits in hits_collection.items():
+        # paths are relative to the output directory
+        folder = cdd_hits["short_description"].replace(" ", "_")
+        fields = [
+            cdd_id,
+            folder + '/seq_aligned.final_tree.fa',
+            folder + '/tree.dnd.png',
+            folder + '/otu_cluster.csv',
+            folder + "/cluster_nb_reads_files.tab",
+            folder + "/identity_matrix.csv",
+            folder,
+            cdd_hits["full_description"],
+        ]
+        map_file.write("\t".join(fields) + "\n")
+    map_file.close()
+    log.info("Writing HTML report")
+    html_cmd = os.path.join(options.tool_path, 'rps2tree_html.py') + ' -m ' + map_file_path + ' -o ' + options.output
+    log.debug(html_cmd)
+    os.system(html_cmd)
+
+
+def _set_options():
+    """Declare the virAnnot_otu command-line interface and return the parsed arguments."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument('-b', '--blast', dest='blast', action='append', nargs='+', required=False,
+                     help='TAB blast file from blast2ecsv module.')
+    cli.add_argument('-r', '--rps', dest='rps', action='append', nargs='+', required=True,
+                     help='TAB rpsblast file from rps2ecsv module.')
+    cli.add_argument('-f', '--fasta', dest='fasta', action='append', nargs='+', required=True,
+                     help='FASTA file with contigs')
+    cli.add_argument('-p', '--percentage', dest='perc', type=int, default=90,
+                     help='Percentage similarity threshold for OTUs cutoff.')
+    cli.add_argument('-vp', '--viral_portion', dest='viral_portion', type=float, default=0.3,
+                     help='Minimun portion of viral sequences in RPS domain to be included.')
+    cli.add_argument('-mpl', '--min_protein_length', dest='min_protein_length', type=int, default=100,
+                     help='Minimum query protein length.')
+    cli.add_argument('-tp', '--tool_path', dest='tool_path', type=str, default='./',
+                     help='Path to otu_seek.R')
+    cli.add_argument('-o', '--out', dest='output', type=str, default='./Rps2tree_OTU',
+                     help='The output directory')
+    cli.add_argument('-rgb', '--rgb-conf', dest='file_rgb', type=str, default='rgb.txt',
+                     help='Color palette for contigs coloration')
+    cli.add_argument('-v', '--verbosity', type=int, choices=[1, 2, 3, 4], default=1,
+                     help='Verbose level')
+    return cli.parse_args()
+
+
+def _set_log_level(verbosity):
+    """Configure logging for verbosity 1 (INFO) or 3 (DEBUG); other values configure nothing."""
+    if verbosity not in (1, 3):
+        return
+    if verbosity == 1:
+        level = log.INFO
+        log_format = '%(asctime)s %(levelname)-8s %(message)s'
+    else:
+        level = log.DEBUG
+        log_format = '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s'
+    log.basicConfig(level=level, format=log_format)
+
+
+if __name__ == "__main__":
+ main()
diff -r 000000000000 -r b82ce29791e7 rps2tree_html.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rps2tree_html.py Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,153 @@
+#!/usr/bin/env python3
+import argparse
+import csv
+import logging
+import sys
+
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+
+def main():
+    """Read the map file, build the HTML page and write it to <out>/index.html."""
+    opts = _set_options()
+    records, column_names = _read_map_file(opts.map)
+    page = _print_html(records, column_names, opts.out)
+    with open(opts.out + '/index.html', mode='w') as index_handle:
+        index_handle.write(page)
+
+
+def _get_google_script_headers(data, headers, out_dir):
+ # Return the markup placed in the page head; none of the three parameters is used.
+ # NOTE(review): both string literals are empty here, so only two newlines are
+ # returned - presumably they held <script> tags; confirm against the original file.
+ html = '' + "\n"
+ html += '' + "\n"
+ return html
+
+
+def _get_google_js(data, headers, out_dir):
+    """
+    Build one Google Charts table script per entry of the map data.
+
+    data    -- list of dicts with the keys 'cdd_id', 'description' and
+               'cluster_nb_reads_files' (path relative to out_dir)
+    headers -- unused
+    out_dir -- directory prefixed to each 'cluster_nb_reads_files' path
+
+    Return (chart_names, java_scripts), two lists in the order of data.
+    The first and the last two columns of each table row are emitted as
+    quoted strings, the columns in between as bare values. Cells that
+    _parse_csv returns as None are emitted as the JavaScript literal null;
+    they previously raised TypeError during string concatenation.
+    """
+    text_columns = ('#OTU_name', 'taxonomy', 'contigs_list', 'seq_list')
+
+    def _quoted(value):
+        # string cell, or null when the table cell was empty
+        return 'null' if value is None else '\'' + value + '\''
+
+    def _bare(value):
+        # numeric cell, or null when the table cell was empty
+        return 'null' if value is None else value
+
+    java_scripts = []
+    chart_names = []
+    for cdd in data:
+        chart_name = cdd['cdd_id'] + '_' + cdd['description']
+        chart_names.append(chart_name)
+        js = 'var data = new google.visualization.DataTable();' + "\n"
+        mat, head = _parse_csv(out_dir + '/' + cdd['cluster_nb_reads_files'])
+        for el in head:
+            col_type = 'string' if el in text_columns else 'number'
+            js += 'data.addColumn(\'' + col_type + '\', \'' + el + '\');' + "\n"
+        js += 'data.addRows([' + "\n"
+        last = len(mat) - 1
+        for j, record in enumerate(mat):
+            cells = [_quoted(record[head[0]])]
+            cells.extend(_bare(record[head[i]]) for i in range(1, len(head) - 2))
+            cells.append(_quoted(record[head[len(head) - 2]]))
+            cells.append(_quoted(record[head[len(head) - 1]]))
+            js += '[' + ','.join(cells) + ']'
+            if j != last:
+                js += ','
+            js += "\n"
+        js += ']);' + "\n"
+        js += 'var table = new google.visualization.Table(document.getElementById(\'' + chart_name.replace('-', '_') + '_div' + '\'));' + "\n"
+        js += 'table.draw(data, {showRowNumber: false, width: \'70%\', height: \'70%\'});' + "\n"
+        java_scripts.append(js)
+    return chart_names, java_scripts
+
+
+def _parse_csv(file):
+    """
+    Read a tab-delimited table with a header row.
+
+    file -- path of the table
+
+    Return (matrix, headers): headers is the first row, matrix is a list
+    with one dict per following row mapping header to cell. Cells equal to
+    '' or 'null' are stored as None. An empty file, or a row longer than
+    the header, raises IndexError. The file is closed before returning.
+    """
+    with open(file) as fh:
+        data = list(csv.reader(fh, delimiter="\t"))
+    headers = data[0]
+    matrix = []
+    for fields in data[1:]:
+        record = {}
+        for j, cell in enumerate(fields):
+            record[headers[j]] = None if cell in ('', 'null') else cell
+        matrix.append(record)
+    return matrix, headers
+
+
+def _print_html(data, headers, out_dir):
+ # Assemble the whole page as one string: the head fragment from
+ # _get_google_script_headers, then the per-domain sections from _print_data.
+ # NOTE(review): most literals below are empty and two are split across lines,
+ # presumably because the HTML tags were lost - confirm against the original file.
+ html = '' + "\n"
+ html += '
' + "\n"
+ html += '' + 'rps2tree' + ' '
+ html += _get_google_script_headers(data, headers, out_dir)
+ html += '' + "\n"
+ html += '' + "\n"
+ html += '
rps2tree ' + "\n"
+ html += '' + "\n"
+ html += _print_data(data, headers)
+ html += '' + "\n"
+ html += '' + "\n"
+ html += '' + "\n"
+ return html
+
+
+def _print_data(data, headers):
+ # Build one section per entry of data, using its 'cdd_id', 'description',
+ # 'full_description', 'align_files', 'cluster_files', 'cluster_nb_reads_files'
+ # and 'pairwise_files' values; headers is not used.
+ # NOTE(review): most literals below are empty and two are split across lines,
+ # presumably because the HTML tags were lost - confirm against the original file.
+ html = ''
+ for cdd in data:
+ html += '' + cdd['cdd_id'] + ' ' + cdd['description'] + ' ' + "\n"
+ html += '' + cdd['full_description'] + '' + '
' + "\n"
+ html += '
' + "\n"
+ html += '' + "\n"
+ html += '' + "\n"
+ html += ' ' + "\n"
+ html += '' + "\n"
+ html += '' + cdd['align_files'] + ' ' + "\n"
+ html += '' + "\n"
+ html += '' + cdd['cluster_files'] + ' ' + "\n"
+ html += '' + "\n"
+ html += '' + cdd['cluster_nb_reads_files'] + ' ' + "\n"
+ html += '' + "\n"
+ html += '' + cdd['pairwise_files'] + ' ' + "\n"
+ html += '' + "\n"
+ html += '' + "\n"
+ html += ' ' + "\n"
+ return html
+
+
+def _read_map_file(file):
+    """
+    Read the tab-delimited map file from an open file object.
+
+    The first row holds the column names; the leading character of the
+    first name is dropped. Return (records, headers) where records holds
+    one dict per data row. The program exits when a row does not have as
+    many fields as the header.
+    """
+    rows = list(csv.reader(file, delimiter="\t"))
+    headers = rows[0]
+    headers[0] = headers[0][1:]
+    map_obj = []
+    for fields in rows[1:]:
+        if len(fields) != len(headers):
+            sys.exit('line and headers not the same length.')
+        map_obj.append(dict(zip(headers, fields)))
+    return map_obj, headers
+
+
+def _set_options():
+    """Declare the rps2tree_html command-line interface and return the parsed arguments."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument('-m', '--map', type=argparse.FileType('r'), required=True,
+                     help='The map file produced by rps2tree.pl script.')
+    cli.add_argument('-o', '--out', type=str, default='./',
+                     help='The title for the HTML page.')
+    return cli.parse_args()
+
+
+if __name__ == "__main__":
+ main()
diff -r 000000000000 -r b82ce29791e7 rps2tsv.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rps2tsv.py Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,131 @@
+#!/usr/bin/env python3
+
+
+# Name: rps2tsv
+# Author: Marie Lefebvre - INRAE
+# Aims: Convert rpsblast xml output to tsv and add taxonomy
+
+
+import argparse
+import json
+import logging as log
+from urllib import request
+from urllib.error import HTTPError, URLError
+
+from Bio.Blast import NCBIXML
+from ete3 import NCBITaxa
+
+ncbi = NCBITaxa()  # module-level handle used below to translate NCBI taxids into names
+
+
+def main():
+    """Entry point: parse options, configure logging, convert XML hits to TSV."""
+    opts = _set_options()
+    _set_log_level(opts.verbosity)
+    _write_tsv(opts, _read_xml(opts))
+
+
+def _read_xml(options):
+    """
+    Parse the RPS-BLAST XML file and return {query_id: hsp dict}.
+    HSPs above options.max_evalue are skipped; the last kept HSP of a query wins.
+    Each dict carries a 'taxonomy' summary from InterPro ('' when unavailable).
+    """
+    log.info("Read XML file " + options.xml_file)
+    xml_results = {}
+    taxonomy_by_pfam = {}  # one InterPro request per distinct Pfam id
+    with open(options.xml_file, 'r') as xml:  # closed even if parsing raises
+        for blast_record in NCBIXML.parse(xml):
+            for aln in blast_record.alignments:
+                for hit in aln.hsps:
+                    if hit.expect > options.max_evalue:
+                        continue
+                    pfam_id = aln.hit_def.split(",")[0].replace("pfam", "PF")
+                    if pfam_id not in taxonomy_by_pfam:
+                        taxonomy_by_pfam[pfam_id] = _pfam_taxonomy(pfam_id)
+                    xml_results[blast_record.query_id] = {
+                        "frame": hit.frame[0],
+                        "evalue": hit.expect,
+                        "startQ": hit.query_start,
+                        "endQ": hit.query_end,
+                        "query_id": blast_record.query_id,
+                        "cdd_id": aln.hit_def.split(",")[0],
+                        "hit_id": aln.hit_id,
+                        "query_length": blast_record.query_length,  # length of the query
+                        "description": aln.hit_def,
+                        "accession": aln.accession,
+                        "pfam_id": pfam_id,
+                        "taxonomy": taxonomy_by_pfam[pfam_id],
+                    }
+    return xml_results
+
+
+def _pfam_taxonomy(pfam_id):
+    """Summarise the InterPro taxonomy of a Pfam entry as 'name(count);...'; return '' when the lookup fails."""
+    log.info("Requeting Interpro for " + pfam_id)
+    url = "https://www.ebi.ac.uk/interpro/api/taxonomy/uniprot/entry/pfam/" + pfam_id
+    try:
+        with request.urlopen(request.Request(url)) as response:
+            payload = json.loads(response.read().decode())
+    except HTTPError as e:  # must precede URLError, its base class
+        log.debug('Http error for interpro: %s', e.code)
+        return ""
+    except URLError as e:
+        log.debug('Url error for interpro: %s', e.reason)
+        return ""
+    except ValueError as e:  # empty or non-JSON body
+        log.debug('Invalid JSON from interpro: %s', e)
+        return ""
+    kingdoms = []
+    for item in payload["results"][:6]:
+        parent = item["metadata"]["parent"]
+        if parent is None:
+            continue
+        names = list(ncbi.get_taxid_translator([int(parent)]).values())
+        if names and names[0] == "root":
+            names = names[1:]  # remove 'root' at the beginning
+        if names:
+            kingdoms.append(names[0])
+    frequency = {kingdom: kingdoms.count(kingdom) for kingdom in kingdoms}  # e.g. {'Pseudomonadota': 9}
+    ranked = sorted(frequency.items(), key=lambda x: x[1], reverse=True)
+    return ";".join("{}({})".format(k, v) for k, v in ranked)
+
+
+def _write_tsv(options, hits):
+    """
+    Write one tab-separated line per query to options.output, after a '#'-prefixed header line.
+    """
+    log.info("Write output file " + options.output)
+    headers = "#query_id\tquery_length\tcdd_id\thit_id\tevalue\tstartQ\tendQ\tframe\tdescription\tsuperkingdom\n"
+    columns = ("query_length", "cdd_id", "hit_id", "evalue", "startQ", "endQ", "frame", "description")
+    # 'with' guarantees the file is closed even if a record is malformed.
+    with open(options.output, "w+") as f:
+        f.write(headers)
+        for query_id, hsp in hits.items():
+            fields = [query_id] + [str(hsp[name]) for name in columns]
+            # 'taxonomy' may be missing from a record; emit an empty cell instead of raising KeyError.
+            fields.append(hsp.get("taxonomy", ""))
+            f.write("\t".join(fields) + "\n")
+
+
+def _set_options():
+    """Parse the command line (-x/--xml required; -e, -o and -v have defaults) and return the namespace."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument('-x', '--xml', dest='xml_file', required=True, action='store', help='XML files with results of blast')
+    cli.add_argument('-e', '--max_evalue', dest='max_evalue', type=float, default=0.0001, action='store', help='Max evalue')
+    cli.add_argument('-o', '--out', dest='output', type=str, default='./rps2tsv_output.tab', action='store', help='The output file (.tab).')
+    cli.add_argument('-v', '--verbosity', type=int, choices=[1, 2, 3, 4], default=1, action='store', help='Verbose level')
+    return cli.parse_args()
+
+
+def _set_log_level(verbosity):
+    """Configure root logging: 1 -> INFO, 3 -> DEBUG with file:line prefix; any other value changes nothing."""
+    presets = {1: (log.INFO, '%(asctime)s %(levelname)-8s %(message)s'),
+               3: (log.DEBUG, '%(filename)s:%(lineno)s - %(asctime)s %(levelname)-8s %(message)s')}
+    if verbosity in presets:
+        level, log_format = presets[verbosity]
+        log.basicConfig(level=level, format=log_format)
+
+
+if __name__ == "__main__":  # call main() only when run as a script, not on import
+ main()
diff -r 000000000000 -r b82ce29791e7 seek_otu.R
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/seek_otu.R Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,48 @@
+#!/usr/bin/env Rscript
+
+## Redirect R error handling to stderr.
+options(show.error.messages = FALSE, error = function() {
+  cat(geterrmessage(), file = stderr())
+  q("no", 1, FALSE)
+})
+
+## Avoid crashing Galaxy with a UTF8 error on German LC settings
+loc <- Sys.setlocale("LC_MESSAGES", "en_US.UTF-8")
+
+## Arguments: 1) input matrix (csv), 2) output file, 3) identity threshold
+args <- commandArgs(trailingOnly = TRUE)
+if (length(args) < 3) {
+  stop("Arguments missing for Rscrpit", call. = FALSE)
+} else {
+  # identity threshold (third argument)
+  id_threshold <- as.numeric(args[3])
+  # get input data (matrix); the first column supplies the row names
+  data <- read.csv(args[1], header = FALSE, sep = ",", row.names = 1)
+  # number of columns; all of them are kept
+  data_length <- length(data)
+  # create matrix
+  mat <- as.matrix(data[, 1:data_length], fill = TRUE)
+  # turn 1 - value into a distance object
+  d <- as.dist(1 - mat)
+  # create tree
+  hc <- hclust(d, method = "single")
+  # assign otu by cutting the tree at height -id_threshold
+  otu <- cutree(hc, h = -id_threshold)
+  # group contigs by otu and append the results to the output file
+  output <- args[2]
+  # unique is used to know the number of different otu
+  for (i in unique(otu)) {
+    # retrieve contigs belonging to the same otu
+    clust <- which(otu == i)
+    # write otu number and number of contigs in this otu
+    cat(
+      paste("OTU_", i, ",", length(clust), ",", sep = ""),
+      file = output, append = TRUE
+    )
+    for (n in names(clust)) {
+      # write contigs name
+      cat(paste(gsub(" ", "", n), ",", sep = ""), file = output, append = TRUE)
+    }
+    cat("\n", sep = "", file = output, append = TRUE)
+  }
+}
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_contigs.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_contigs.fa Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,373 @@
+>NODE_1_length_506_cov_10.687361
+CTAACCTGTGTTGGGTGTGTTTGGTGTCTTGGGTCGGCATTAGCAACTAAATCAAAAGGC
+ATAAACCTTGTGAGTTGATGATTGGCAGGAATGTTGACCGGCGTTTCCGGAGCAGATGTC
+GCAGCGTAAATTACGTCGCGAGGAGCATGGGTAGCAGTAGCAGCAGCAGCGGGGCGTTGG
+AGAAAGCAAATGTCTTGAGCACGGGCTTCGTCAGTAACGAAGTTGAGGTGGGTAAAGGCA
+GCATAAAGGTTGGCTTTATTCGTTTCACGACCGGCAATCCATGTAGGAAGGGCGTAGGTT
+GAATAACCATGCTTTATGATCGCAGAACCAGAGGGATTTTCAATCAGCTGGAACAGAGTC
+ATGGTGGGGTTCGTAACGTCATTAGCAATAGCAGTGACGGCTTGAAGAACAACTTTAATT
+TCACGTAGGTTGCCAGGAGTAGCAGCAAACAACATGTCATAGGCGTTCACATGATTTGTA
+GCGAAGATAGGAGGCTGTAGTGACAG
+>NODE_2_length_429_cov_3.631016
+GTCTAACCTGTGTTGGGTGTGTTTGGTTAGTTGGCTGGAATTCATGCACCGTTGACACGG
+GTTGCTTAACATCTTGCCTCATCCTAGTTTTGGCTGCTTGGTAGAACGTCAAAACAACAT
+CCACCTTCTGCTTGGCTGCTATACTCTTGATGCTCTCTGGTTCGTACCTGTCCATATCCA
+CTAATATTACATCGGTATTGTAGTCACACTTGCTGGTAATGTTAACCCCCAATTGTGATA
+ACACCGCACATATTGAATGACCGTACCTGTAGGTCGTGGTCAACACCTCACGATTGTGCA
+CCAAATCCAACACATTACTCAGCACCCTCTCACCGTGGGCTGGGCTTGTGTCTATGCTTC
+CTACCTGATCCATGTCACCATAACATATTACATTTTTAAATGCCCAAACACACCCAACAC
+AGGTTAGAC
+>NODE_3_length_365_cov_1.074194
+GTCTAACCTGTGTTGGGTGTGTTTGGTGGTCCGTTGAGCTAGATTGGAAGAAATTTGATA
+GGGAGAGGCCAGCTGAGGACATTTCTTTCTGCATTGATGTATTTCTTTCATGTTTTGAGC
+CGCGGTCTGAAAGGGAGACAAGACTTTTGAGGGCATATGGCATTTGTATGAGAAGAGCAC
+TCGTGGAACGCCTGTTCGTGACGGATACGGGTTGCGTATTCGGTATCGACGGGATGGTTC
+CAAGTGGCTCTCTATGGACTGGCTTCCTTGATACCGCGCTCAATATTCTATATATTTCTG
+ATGTTCTTTTGGATATGGGTTTCTACCCCCCCCTGGCTTCCAAACACACCCAACACAGGT
+TAGAC
+>NODE_4_length_351_cov_1.547297
+GTCTAACCTGTGTTGGGTGTGTTTGGTTTCTAGGTGAATGATGTCAACAAGCGCCCTGGA
+CCGTCTGCTCATGCTGCCTCATGGAAAGAAGTTTCCTGGAAAACTAGCTTTGTATCCTTC
+CTACAAAGTCTGCCTGTTCCTGAATTTCTTGTACCGATACTTAAACAGTTCAGTCACTTT
+ACTACTGATCGAACTAAGAACGTATTCTTTATTCCATCTGCCGCTGGCTATGACCATAAC
+ATCTTCTTTGGTCGCGTATTTCCTTTGAACATGTTTGCTGCCATTCATGATTGCACCGCT
+ACACTGCCAAGCAATTCCTCAGAAGTTCCAAACACACCCAACACAGGTTAG
+>NODE_5_length_344_cov_3.273356
+CTAACCTGTGTTGGGTGTGTTTGGGCTGGGGGCGACCAACAAAACGGTTATTTCCTCTCA
+CAATGTTGCTTGAGTTTGTTGTGATGTGTGATTGATTTTGCGCTCATTCATGGACATGTT
+CTCCTATTTCTAATTAAGATTATCTCATGTAGTTTCCAGTCGTTATGAATCTCTTGTGGT
+ATACTAACGGTCTTTGTATCATTTTTAATAGTTCACTTATGTTTTGATTTAACTCAAATT
+CATTTATGTCATATTTTAGCTGAGTTGCATGTTTGCAACTCAGTACATCGTACCATGATC
+TTAAATCTAGCTCCGTACCCAAACACACCCAACACAGGTTAGAC
+>NODE_6_length_338_cov_1.314488
+GTCTAACCTGTGTTGGGTGTGTTTGGGTATCCTTGAGGCTCTCGGATTCCGTGTCACGAA
+CAAGTACTTCATCAAAGTTCTTGGCGATGACGTAATCTTCGGAATTTTAAAGCACATACC
+CATTTCGAAATGGGCTGACTTTTTGCAAGACTTCTCTACTGAAGCTAAGCGCCGATTCAA
+CGCTAAACTGAACCCCAATAAATGTGGCGCATCTGCAGGAATTCACGGTGCCCAAGTACT
+AAGCTACTTCAACTGGAACGGATTTCCCAAGCGCGAAACCACCCAATTGTTAGCACAACT
+ACTACACCGTACCCAAACACACCCAACACAGGTTAGAC
+>NODE_7_length_335_cov_1.714286
+GTCTAACCCGTGTTGGGTGTGTTTGGTGCCATCATGATTGCACCGCTACACTGCCAAGCA
+ATTCCTCCAGAATTCCAGTACTTCAAGACCTGTTCGCCCGCGTCCTGTATTCGATTACTG
+CTCCCGCTTTTACCTGCCTGATCCCCGATTTACTCGGTGCCTCCATTGATCAGACAACTA
+CTACGCATGTTAACTATATCAACTCCAAGTTGTTCCAAATATTTAACGCTGTTTTCAACC
+CAGTCCTGTTTCGTGACTATCAACGCCGCTCGTCTCTTGCTGCTCTGTCACTACAGCCTC
+CCGCCAATCCCAAACACACCCAACACAGGTTAGAC
+>NODE_8_length_331_cov_0.862319
+GTCTAACCTGTGTTGGGTGTGTTTGGGATTGGAGTGAAGAAAAATTAGAGATGAGAAATG
+ATAATAACGAAGAATGTGGCCCTTTCGTAGGAGCAGTAACCCCACCACGTGAGGAAGATT
+TAACGAACGCGAGTGGTAATATTCCTGTAGTGCCAAGACAAACGATCAGGAAGCTCTCTC
+AGAAGGAAATAGACGAAGGTCGTGACTTAGATGTTGACATGCCGCCATTGGAAGATGTCA
+CGGAATTGGATGAGCCAACCAATGAATTAACCAACAGATTCCCACAAGAACTGCACACTG
+AAGAGTATGCACCAGAAATAGAAGTGGAAAG
+>NODE_9_length_324_cov_2.141264
+GTCTAACCTGTGTTGGGTGTGTTTGGGGCCCCCTTTTTAAACCCCAGGGTGACTTTCAGT
+CACCCTGAACTATCTTTCTTCCCAATGTAACAATTTGTGTGCGAACACCTCATTGTCTCG
+CATCATTTTTACCAAAGATTTGACATGTTGGTCTGCTGAACCCATTGGCATTCCATGCTT
+CATTTCACTGGCCCTGAAACAACTACTCACATCATACCACAATGTGGGCTCCACAACCCA
+TTGTTTATCACGTATTAAATCCATCACTGGCTGAATCTTTCCTAGCATCATGCAGTAACT
+CATGCACCTGGCTTCCAAATTTTG
+>NODE_10_length_324_cov_1.371747
+GTCTAACCTGTGTTGGGTGTGTTTGGTTCGCAGTTGGGCTGTTACTCTAGCTGCAGGATC
+AGACTTTTGATCCTCCATTTGTTTCATGCTGTCGGTCTGCAACTTTAAGTATTCGTAGTA
+TTTTGATTTGGGCCCTTTCGCTGGTGGCTTTTTATTTATCAAACTTTTATTGTTTGTGAT
+TACCACCAGCTTTCTGTACTCTTCCACGTAACCTATGTCAGCCCACTCTAAATCATTGAT
+TGTAGATAACCACCATTTGTCAAAAACCTCGTTAAAACCGCCCATGTTTTCCTTTCCATA
+ACCAAACACACCCAACACAGGTTA
+>NODE_11_length_317_cov_1.125954
+CTAACCTGTGTTGGGTGTGTTTGGTGTCCTATTTCAACATTTTGTTGTTTCGCATCAAGG
+CCATCAAGACTGGTTTGGCTGGTAATCCGTCTAATCCACATAATTTGCAGTGGGCGGCCA
+AGCAATCCCATACGCAGTCATTAACGCCTAAAGCTTCGTGAATTGTATCAAACTCCACAT
+CTGAAACTTTGTACGTCATGTGATTCTCTAATTTTATTTCCTTTAACCAGTTTGGTCTGT
+CCATGGACCAGGATATTAATGTGGTAGCGCTGCTAGAGTCTACACCCATCGCCAAACACA
+CCCAACACAGGTTAGAC
+>NODE_12_length_311_cov_1.535156
+GTCTAACCTGTGTTGGGTGTGTTTGGACCTACATCGTTACTATGACAATACCCGTTATAA
+CCCTAGTAATGAGCTTAAATCCCTTGCCCTTAACAAGGAATACTCAATGTTAGTCCAAGC
+TTATCTTAATACTAATAAAGTGAAACACCAGCCTTATGAGCTTCACTGCCCTATCCCTGC
+TGATGCTGCCACTATCCCACCTTCAAGAGTCCCCGCTCCTGGAATAAAATTAGTTCCTCT
+CATGTACCATTATGGCCATGTAATTCGCGCTCACCCACTCAACTTCCAAACACACCCAAC
+ACAGGTTAGAC
+>NODE_13_length_295_cov_0.945833
+TGTGTTGGGTGTGTTTGGTTTCCGGTTACCATAATCGCTATTCTTTCAAACAGAAAGCGC
+ATGCTAAGTATTCTCACCCAGAGGAATATGCTGACAAGCCCTCCTCAAAAGGCTATTTTT
+ACAATGCCACCTATGAGAATGCACGAACTCTTATTCACTTCATTAAGCAATATGGATTGC
+CCTTCAATCCTGTTATTGCACCAGAAGATGCTGAACTAACTGATGAACAGATTCAATCTT
+ACATCAACACAGCAAACTCCTTCTTTAATGATTATCCGACGTTACTGTTCACCCG
+>NODE_14_length_294_cov_1.891213
+GTCTAACCTGTGTTGGGTGTGTTTGGTCGTCTCCCGTACTGAAGATTAGCGGTGCAAGTT
+ACACCCTTCAGATATAGTGGCCACATGACGTAGCCTTACCCCTGTTTCACTTTGTGGGAT
+CACAATTACAACTACCGTCTTTCTTATAGTAGCTGCTACACCCATTACAATACTCGTCTT
+GTTCAAGATGAAATCCGAGATCGTTTTTAGCAATCTGTTCAGTCTTTCCTAGTCCATTTT
+CAACCCCTTCAATGTGCACTCCAAGAACCCAAACACACCCAACACAGGTTAGAC
+>NODE_15_length_280_cov_1.413333
+GTCTAACCTGTGTTGGGTGTGTTTGGGGTCTGCGGATCACTCGGGAATGATTTGAAGTGG
+TTTTGCTTCCTGGGAGACGATGGTATATTAATTAGTGACCGAGATTTGGGAATGGCAGAA
+CTCAAAAAATACGGAAAAGCTTATTGCAACATGATACTGAAACCCAAGAGTAGTACCAGC
+AGTGCAACATTTTGCTGTTTTACAGTGTACAGAAACCAACTAGGACAAGCCAGGTTGGGA
+GCTGATCCCATCAGCCAAACACACCCAACACAGGTTAGAC
+>NODE_16_length_278_cov_0.901345
+GTCTAACCTGTGTTGGGTGTGTTTGGGCTGTAATCGAGGTATAGTGTCGAACAAGTCGGT
+GTCACTGTTGAATTCTATGGCGGCGAACTCAATGGAGTCAGTTATAGTGATCCTGCTACT
+GTGAAAAAATATGCTAGACGTGCTCAATTGGGTGAAATTTTTGAATTAGATCGTGCTACT
+TTAAAATCGGATGGTGTTTTTCGTAGCAGTCCAAGGGGTTGGTTTACTTTTGGACATGCG
+TCGTTTGCTCTGCTCTTCTTCCAAACACACCCAACACA
+>NODE_17_length_277_cov_1.540541
+GTCTAACCTGTGTTGGGTGTGTTTGGTGATTGATAGTTATTGTAGGCGAAACTACTTATG
+TAACTGATCCAGTTTTGGCAATCAACAACAATTTCCAACTACTAACAGTGGAAAAGTTGC
+AGGATTTGACATTTGAGGTTAGGATGAACACTCTACCATTCTGGATGATGCGTCCAGATC
+GTGGAGAGTTGATGAAGCAGCCAATGGGAGCCAGAGAAGCACTCAATTTCACAATGGATT
+GCCACAAAGCCCCCCAAACACACCCAACACAGGTTAG
+>NODE_18_length_274_cov_3.872146
+CTAACCTGTGTTGGGTGTGTTTGGCATTAGGTTGTAGCGTTTTGATGTTGATTTTATCGG
+GTCCCGGGCTCGCTCTGGAATGAACTTTGATTCTAGTCGTTGGCCCATAGTATGACACCC
+ACTCTCTTAGGTCTGTTTCCTCCCAAAGATCCATTATTCTAGCGTTGAGTTCACCAAATC
+TCAGGTTATTTGAACTTTCTTCTAATTCCCTCATGTTTACACCCAAATCACCACCTACTG
+ATACTCTACCAAACACACCCAACACAGGTTAGAC
+>NODE_19_length_271_cov_0.879630
+GTCTAACCTGTGTTGGGTGTGTTTGGTATGGAGGGAGGTGTATATGATACCTGGGCACCC
+GGAGGGGGAGATGTAAGAAAAATTACCAACTTGACCCTTAACCCAAGCGTGATATTTGGT
+TATTTACTAAAATCTCCTTTTGGGGGAGAAGGATGGATTGTTAGTGTGGACGATTTAGAA
+GATATAATTGGAGGACATGTCTGGTTAGGCTCCATTTGTATACTTGGTGGAATTTGGCAT
+ATCTTAACCAAACACACCCAACACAGGTTAG
+>NODE_20_length_267_cov_1.429245
+CTGTGTTGGGTGTGTTTGGACTTGGTATGTGAAGATACGTTGTTAGGTGCTCCGTTTTAT
+TTTCCCATTGAGGCCGAACCTAAACCTGTGCTCGAGAGATAGCTGTCCATATACTGATAA
+GGGATGTATGGATTCTCGAGAAGAGAGGAGCCATGGTGGTCCCTCCCGGACCGCCCGGAT
+CCCACGAGTGAATAGAAAGTTGGATCTACATTGGATCTCACCTGAATCGCCCCATAAACA
+ACCAAACACACCCAACACAGGTTAGAC
+>NODE_21_length_263_cov_1.177885
+GTCTAACCTGTGTTGGGTGTGTTTGGAGTGGGGGTATATTTAGACAATGAGATAGTAATG
+GTAATACAGCCATGCTATAACGCTGCCAACGACAGGGAGATACATTATGATCCAGATTAC
+CAAGAAGAACTAAGCTTACTTCTAAGACACTTAAATCTGATGAACGTGCTACAGCATTTT
+GATACGATTTTTTAACAGAAATCTATTTCAGAAAGTCAGAATTAGCCACACCCAACACCA
+AACACACCCAACACAGGTTAGAC
+>NODE_22_length_262_cov_1.053140
+GTCTAACCTGTGTTGGGTGTGTTTGGCTAGTCAGTAGCTTGTTATATGGGTCGTGAGTGG
+GAAGTTAGCTTCCGTCTGGGTATGCGCCCGTGGATTGCTGTTGCATATTCAGCTCCTGTT
+GCAGCTGCTACTGCTGTTTTCTTGATTTACCCAATTGGTCAAGGAAGTTTTTCTGATGGT
+ATGCCTCTAGGAATCTCTGGTACTTTCAACTTCATGATTGTATTCCAGGAGAGCACCCAA
+ACACACCCAACACAGGTTAGAC
+>NODE_23_length_260_cov_1.590244
+GTCTAACCTGTGTTGGGTGTGTTTGGGTTACCGTTGCTGTTCGGTGCTGGTTTGCTGGTG
+GATTGCTCTGACTCTTCTTGATCCGCGTGACCATAGAATAAGTTCTGAGCTTCCTCGGCT
+TGGGTTTTACCTGTTTCCACACCATTCTGGTTTAATTTGTCCTCTGAAGTTTCAATTAGT
+GGTATGTCGGTGTATAATTTAGCCAATTTCTTTAGCTCATGGGCCATCCTGCTTCCAAAC
+ACACCCAACACAGGTTAGAC
+>NODE_24_length_258_cov_0.935961
+GTGTTGGGTGTGTTTGGTTGGTGAACGCGCACCATTTAGTGGCAATCACGCGCGGGGAGG
+CTGAAAACTGCAAGCATAGATCTTTCGGCCCTTTCGAAGCTACCGCTTCCGAGAGCCTGG
+CTAAACTCTGCCCAGATTATCCGATCTGCTTGCCTGTACCTTACGACGTGATCAATAAAG
+TGTATAGGTATCTCAGAACGCTTAAGAAGCCTGATGTGCAGTCGCCCCACTACCAAACAC
+ACCCAACACAGGTTAGAC
+>NODE_25_length_256_cov_0.945274
+GTGTTGGGTGTGTTTGGCTGAAAAGCTTGGCGGACCTACTCCACCTAGATCCGTGACCAC
+CCTGATCAGATTGAACGATGGCGATGTCCAAACTTACACCAATCTCAACGTAATAACAAG
+GGATTTTGTAATGACTAGAACAAATTTGGTGGGTTGCAATACCGTGGCTAACGAGTCCGC
+TACAAAGTTGTTGATTTATGATTATGATGGTAGGGCACATCACAATTCCTCCAAACACAC
+CCAACACAGGTTAGAC
+>NODE_26_length_256_cov_0.895522
+GGTGCGCTCAATGTGGCACGTGCAACTTTATTTGGTTGCCCCACCATGAGGACAAGCTGA
+GCAACCAGCATTGTGGCATGTGCTTCTTTTCACTGGATTTGAAGCACATGGAAAATGATT
+GGTTCATTCCGGACATCATGGTCGAGGACATTAACCAATTGCACGTAGGGGCACTGCAAA
+AAGATATGTCGGAACTAATGAACCAACTGGATGGCGCAGAGGCTCACATACCAAACACAC
+CCAACACAGGTTAGAC
+>NODE_27_length_254_cov_0.793970
+CCTGTGTGGGGCCAACTGTCTGGAAATGATTCTAGGAAAGGTGGATTTGCCTTTCTTACG
+GCGTATAGCCAGCAGAGATAACATGTTCTCCAGCCAACATCTGGTGGATTATTTACATAT
+GCATGATCGAAATGCCGTGATTTTGATGAATGACGTTGCTGTGGCTCGAAGAATAAGAGA
+TGATTCCAATGCTTATTGCCGCATAGCGCATAGCAGCTACTTAGGCACCCAAACACACCC
+AACACAGGATAGAC
+>NODE_28_length_253_cov_1.313131
+GATCAACAGATCTTTTGAAATTAGAGGTAACTTTATTTGAAGGCAACTTAACAATTAAAG
+GTGATAACATCCAAGATCTGTTCAAATTAACCAAAATAGGTGGATCAAAATGGTTAACCA
+ACGATTCAACATTACTAGAGCATGATCCAAGGTGTGGCAGATTTTGCGTCAAAGTACAGG
+AATCTACAGAGTCACTCGTAGAAGAATTCTTAACGTCTTCATCCAAACCAAACACACCCA
+ACACAGGTTAGAC
+>NODE_29_length_250_cov_0.851282
+GTCTAACCTGTGTTGGGTGTGTTTGGGTTTCTTTGGAGCAACTCGATGAATTTAGTAAAT
+CCTTTTAGGAGGTTCCCAATGACCATAGATCGAACCTATCCAATTTTTACAGTGCGATGG
+TTGGCTGTTCACGGACTGGCTGTACCTACTGTTTCTTTTTTAGGGTCAATATCAGCAATG
+CAGTTCATCCAACGATAAACCTAATTCAAATTATAGAGCTAGCACACCAAACACACCCAA
+CACAGGTTAG
+>NODE_30_length_249_cov_1.298969
+GTGTTGGGTGTGTTTGGTTGATTTCTGACAAAATCACTTGCAAAAAGAAGCTTGCTTGGT
+TCTGTCTGCCCTAGAGATAACCGACTGCCAAACATTTGACTATGTTGATGCAGTGATGCC
+TGCGGGACTGGCCGAGCAGTGGTTACATGACACCATCCGGTTGCCAGGGTACGAGCTAGG
+GATGTTATTGGAACGAATTAGCATAGTTCCAGCTGCAATAGCCCCAAACACACCCAACAC
+AGGTTAGAC
+>NODE_31_length_249_cov_0.979381
+GTCTAACCTGTGTTGGGTGTGTTTGGCGAGTTGTGAGAGTGGAAAGCATGCAGTTTATGT
+CTTCTACAGCTTTGAATGAGAAATTCAAGCAGCTGATTGCAGAAGAAGGTATTGAAGGGA
+TGGAAGCGATGAATTCTGAATCAGTGGAACAGTTATTGGTGAATATAAGGGCCCATCCAG
+CCAGTTACCCTGAGGCAGCAGAGTTAACAAACATGCACAATTCACACAATAGTTTATGTT
+TGTGCGGGG
+>NODE_32_length_248_cov_0.979275
+GTCTAACCTGTGTTGGGTGTGTTTGGATATCGCTGTGCTTGTGATTGCTGACACTAGGGC
+GTCTGCTCTCCTATCTACGGGTAAGCTGTTATCTTCATAACCGCGCAACCTATATATTAT
+CTCGTGTGTATTCTTTGCATTAAATATAGACAGGTACTCTCCCCAATACCAACTAGTGTT
+AAACATGAAAGACTCAAGAGCTATTTGGTCACTCACTGTTTGTAGCTCAGCAACCACCAA
+ACACACCC
+>NODE_33_length_245_cov_1.000000
+TGTGTTGGGTGTGTTTGGGGCCTTGAGGAGTCATGGTTAGACGATTGGTAAATCATCCAT
+TCTCTTTTAACGCGAATCATACGTTCAGCAAGATAATTGCGGACGGCGTTGAACGGCATG
+GTGAGACGTTTTGGGTGAAAATTAAAACGAAGATTAATTTTCAAAATAATTTAGACGAAT
+GTGAATTCTAAATTTTAAAGCAAAAGGGGGGCCTTCCACCCAAACACACCCAACACAGGT
+TAGAC
+>NODE_34_length_245_cov_1.000000
+GTCTAACCTGTGTTGGGTGTGTTTGGATGGTGATCGGCAATTTAAAGGAATGTGTGCGAT
+ATTTTCACCAATATTCAAGGAGCTTAAAAATCGACTAAAAAGCGTGTTAGATATTAAATA
+CATGTATGCAGACGGATTGAGACCTGATCAGTTGTCGGAGCGCATGTCACAGATAGGTGC
+AGGTAAATATTTTATAGAGAATGATATGGAACAGCATCTCGCCAAACACACCCAACACAG
+GTTAG
+>NODE_35_length_242_cov_0.818182
+GTCTAACCTGTGTTGGGTGTGTTTGGGTGGGTAATGAAGTGTACATAATACCAGGTTGGT
+CCGACAGACCAAGCGTAACAGAAGTTTTAGACTACAAAGCTTGGACCAGAGCATATTATA
+TGATAAGCGATGGTTACATCTGTTGTATAGAACCACTGAGAATGGTTGACGACTTAGTGC
+TGAAGAAAATGACCTTAATAGGTAGGCAACCACAAGCCAAACACACCCAACACACCGTTG
+AC
+>NODE_36_length_240_cov_1.259459
+TCCGAATCAGTGTATTGGACACGGGCTATATCGGGATCGCGGTCGGACGATTGGTAAATC
+GACCATTCTCGTTTGACACGAATTAAGCGTTCAGCTAAATAATTTCGTACAGCGTTGAAG
+GGCATCGTAGGACGTTGGGTGAAAATTACAAATTGGGAGTTTGGATTTTCGAGAGAATTA
+GACGAATGTAAATTCTTGAATTAAAAAGGGGGGGGCGTCATCCCAAACACACCCAACACA
+>NODE_37_length_239_cov_1.032609
+TGTGTTGGGTGTGTTTGGCTTGGAGGGAAGGTACAACATTGGTGTCCCTCCTGCGGACAC
+TAACGTTCCTGCGGTGGTTTCTAACCCCAGGTGTAACTTTCTCCAATCAGTCAACTCTTG
+AATAAAAGGGGCATAAGTGAGTGCTCCAGATATGAAGTCCAGGAGGCCTTGTTTCTCACC
+CTTGACGTTGTAACCATTACTATACTCCCGCACCCAAACACACCCAACACAGGTTAGAC
+>NODE_38_length_239_cov_1.032609
+TTCATAATGTGGCAATATGCACATCTACGATGCCCTATACATTCTGCGTCAACACACACT
+ATTGTTAATTTCTTATCCACCATAGTAATATGGGGCACTCTGGTCCAATTTGTTTTCAAC
+ATCGCATATTGCATATCTTTTATGGTGCGTCCGAATTTTTTGATGATTTGCTGGATGGCC
+ATGTCTAGCAATTCAGGCAAACCTCCTTCCTCTACAGTCACCCAAACACACCCAACACA
+>NODE_39_length_238_cov_1.038251
+GTTGGGTGTGTTTGGGGGGCTTACGAGAAGAGAATGTGGCCAGATTGGCAGAAATAGAGA
+GAAAGAAGCTAGAAGATTTAAGGTTGGCTGAGATGGAAAGAATTGTGATAAAGGTGAGTG
+CTACAGTTCAGGGAAAGGAAATGGCATTTGCTAACAAAGGTGGGAATCCGATTTTTTTGA
+TAAGTGGAGTTGTAATTGATCCAGTGATCAAGCCAAACACACCCAACACAGGTTAGAC
+>NODE_40_length_238_cov_0.879781
+CCGTGTAAGATGCGCTGAAGGTTCAAGCTCCTGCACATTGCATGGTGCCGAATTGTTTGA
+AATGCCTTTGGGTTTCCAGGGGAGCCACAAGCATTCAGTGCGCGGTTGTACGGCGGGACG
+TTGCAGTGCCACTTTCAGGTGTTTGAAACGAGAATTAGAACCGCTTGATGAGCCCGAAGT
+GGTCCATGTGGAGGGCTGTACCGGATCTAGTGAAGAATCAGGCGGTGATGGGCAGGTT
+>NODE_41_length_236_cov_1.049724
+GTCTAACCTGTGTTGGGTGTGTTTGGACAAGGTGATTTGAGATACATAAGCAGAAAAACC
+ATCGCCAATCTATCTCGAGAAGATATTGAGATTGTGGAAGAACATGAAATAAGTGGTGAG
+GATCTCCTGTGTGGGGCCAACTGTCTGGAAATGATTCTAGGAAAGGTGGATTTGCCTTTG
+TTACGGCGTATAGCCAGCAGAGATAACATGTTTCTCCAGCCAAACACACCCAACAC
+>NODE_42_length_235_cov_1.855556
+TGTGTTGGGTGTGTTTGGGGATTGCTGTGGTGTGCATGTCCTCCAATGTGATTACGATCT
+TTTTGACCAATAATATGGTCAACTGCAATTGATTTTCACTAATTTGCTCTATTTGTTTGT
+GTTTCACTTTTGTGCTTATCAACCTGTGCAGATCATGTATCGTCATCTCTTGTATACTGA
+AACATTTGTTTTGATCTCCCTTCATCCCCCCAAACACACCCAACACAGGTTAGAC
+>NODE_43_length_234_cov_1.061453
+TGTGTTGGGTGTGTTTGGTTGAGTATTGGGTTATGGTGGAGTTTTTAACTGGTTTCATGT
+CATGATTTTGACTCCAAAAATTTACTAGAATTGGGTAGGTATCCCAAAGAGAAGAAGTAG
+TACTAATTCCTTGATTTTGTATGGGAAAATTTTCATATGTAATTCATCTACAAAGATAAG
+ACATTAATGATGAACCAAACCAAGCGGCCAAACACACCCAACACAGGTTAGACC
+>NODE_44_length_232_cov_1.073446
+TGTGTTGGGTGTGTTTGGAAGTAGTGGAGGGGAAAGCGCCTAATGAGGCAATGATAATAG
+ACGACGCAACACGCCCCGGGTCGGTAAACAGGTGGGCAGCTGCCGAATGTCTCAAAGTAG
+ATATACCCGATGTGCATTACAATGACTGCTACGTCATGTATAATAACACGGGAATAGAAA
+GGGATGACCACAGAGCCGTCAACGTGCCAAACACACCCAACACAGGTTAGAC
+>NODE_45_length_232_cov_1.073446
+TGTGTTGGGTGTGTTTGGGAGTCGTCGGGGTTCAATATTACATTTACTACACCTTATACC
+TAATGCTAGGCGTCATAGATGATGTCAGAGCGAGTGATAAGGGATCAAGCCTCGACTATT
+GTTGTTGTTGTCTATGGACAGACGGGACCACGTGTTCCGTTTTGTGATGTAGACTTCACG
+CTTATCTCTAATCGAGCCATCAACCTCCAAACACACCCAACACAGGTTAGAC
+>NODE_46_length_229_cov_1.091954
+TGTGTTGGGTGTGTTTGGTTGGATGCCTGGAATACAATCATGAAATTGAAAGTACCAGAT
+ATTCCTAAAGGCATGCCATCTGAAAAACTTCCTTGACCAATAGGGTAGATCAAGAAAACA
+GCTGTAGCAGCCGCGACAGGAGCTGAATATGCAACAGCAATCCAAGGACGCATACCCAGA
+CGGAAACTAAGCTCCCTCTCGCTCCAAACACACCCAACACAGGTTAGAC
+>NODE_47_length_229_cov_0.816092
+TTGGTAAATTGGCGGAAAGAGGAGGACTCAATGATTATTCGTTCGCCGGAACCAGAAGTA
+AAAATTTTGGTAGATAGGGATCACATAAAAACTTCTTTCGAGGAATGGGCCAGGCCGGGT
+CATTTCTCAAGAACACTAGCTAAAGGCCCTGACACTACCACTTGGATCTGGAACCTACAT
+GCTGATGCTCACGATCTTAATAGCCAAACACACCCAACACAGGTTAGAC
+>NODE_48_length_227_cov_1.273256
+GTCTAACCTGTGTTGGGTGTGTTTGGGAGACAGGAGTGTCAAAATTGATCAATTCAATCA
+AAAATTTGCCAAATCTTGAGGTGGTTAGATTAAGGCCAACTCGTAGATTAATCAAAGTGC
+AGCGTGATGGACCAACCGCCACCAGCAAAGCATCGAGAGATGACGTGCCGCCAACTCATG
+ACACGATGCACAACACAGGATCCGTGGCAACCAAACACACCCAACAC
+>NODE_49_length_227_cov_1.017442
+CTATCATGTGTAAGTAAGACATGCCTCCTGCCATTACTGGATTTGGCATTCCCATACTCA
+CGCCTATATCTGATAATTTTTCTTGTAAATTGTTACATTGCCTCATGTCGTGAATTTTGA
+CAAATTTAAGTTTTTCCATGGTCTTTAGCTCATCACTTACATAACTTGACACAGCTATAT
+AACTCCTGTTAGCATGTCCTCTCATCCATTGACTTAATTCATCTTTT
+>NODE_50_length_226_cov_2.269006
+GTCAACGGTGTGTTGGGTGTGTTTGGGAAAGGTCCTGGAATATGGGTGTCCGATCCTTAT
+GGACTAACCGGAACAGTGCAACCTGTAAATCCGGCGTGGGGCGTGGAAGGTTTTGATCCT
+TTTGTCCCGGGAGGAATAGCTTCTCATCATATTGCAGCAGGTACATTGGGCATATTAGCG
+GGCCTATTCCATCTTAGCGTACGGTCACCCCAGCCAAACACACCCA
+>NODE_51_length_225_cov_1.117647
+GTCTAACCTGTGTTGGGTGTGTTTGGTCGATCTGGCCGTTGTTAAGTATTTGCTCACGAT
+GTGCTTCAACCTTTGCTCGCCAAATTCTATAACATAAGTGGGTTGTCCATACTGTATCGT
+CAATCTTTTGACTTTGTTCCTTTCCATTATTTCTTGCGCTAATTCATTTGAAAAACTAAA
+CCCAACGGCCACCCATTTGCTTCGACCAAACACACCCAACACAGG
+>NODE_52_length_225_cov_0.917647
+GTCTAACCTGTGTTGGGTGTGTTTGGTTCCCTAGTGAGGCTGGTTTTCCCATGGTGTGAG
+AATAGCCGCTATTAACTTGATTACGCATCTCTGGTTCAACCCATTCCCCGCTAACATTCA
+CTTGGTCATGCGCGTAAGGACTATCGCTCGCGCTGAAACTTGGACCAGGTTGACCATCGT
+CTTCAATCTCATCACACTACCAAACACACCCAACACAGGTTAGAC
+>NODE_53_length_223_cov_3.303571
+TCTAACCTGTGTTGGGTGTGTTTGGTTCTCATGTCAATTTGTAATGTGTGGGCTCATCCC
+TTATTGGTATGTCATGGGTTTTCCACTTGGCACTGCTGGTCGGCAAATCTTTCCAAATCT
+CGCCACATATTTGTATATCTTGATCTTGCATGAATCTGCGCCCAAAGTAGTTAGGGATAC
+TTTGAGTTTTGAGCCGCATGCTATTAGCAATCATGGTTATTTC
+>NODE_54_length_223_cov_1.803571
+GTCTAACCTGTGTTGGGTGTGTTTGGTCGATTAATGGGAGTTCAACCAAATTCATAACTG
+TCTCGATGTCATCCTTTCCTTCCTTTTTATTTTGATTGTCTAAATATTCAGCTAAGACCA
+TTCCAACGCCCCCTTTCGCCATGCATAAACTGAACCCACAATTGGGATAAGCACGAAAAT
+GAAAGCCTCACGTTCACCCAAACACACCCAACACAGGTTAGAC
+>NODE_55_length_216_cov_1.596273
+GTTTTACCATCACTCTGTTACCTTGTCTTGTTATGAATAAATTTGTTTTAGGTTTACTGT
+TAACTAATACACTATACCCGAACGTGGAAATAAACAACTTGATGCAATTGTATAACAAAG
+TTCCTCCTAACCTTTCGTCAGATCCCTCTTTGTATCTATTGGAACTCATTTTGAGGCTGT
+CTGCTATTATTCTCACCTCCCAAACACACCCAACAC
+>NODE_56_length_216_cov_1.180124
+GTGTTGGGTGTGTTTGGGGTCTATGTGGTTTATTTGGTTCTACTGAACCAACATTAAATT
+TTGAAATATTAACTAATCAGTCCTATCCTGTGGCCTTGGAAATAATATTTTATATTGGAT
+TTTTTCTTGCTTTTGCTGTAAAATTACCAATCATACCCCTACATACATGGTTACCAGATA
+CCCACGAGAGCCAAACACACCCAACACAGGTTAGAC
+>NODE_57_length_216_cov_0.869565
+GTCTAACCTGTGTTGGGTGTGTTTGGATAGTTAGCGAGGTAGGTACTGAGCTGTTTACAT
+AGGGGGGGAGTTCGTGTGTTTAGCTTAGGTTTCTGCTAGTCTTGTTTTGATAAATATGAA
+TATAGTATTAGATACTCTTGTGAAGTATAAATTTGTAAGATTGAGTAGTAGTTTGACTAA
+GCCCATGATCGTGCCAAACACACCCAACACAGGTTA
+>NODE_58_length_215_cov_1.668750
+GTCTAACCTGTGTTGGGTGTGTTTGGGCACTGGGGTTCAATTTAAAGTTCATTGTGCACA
+TAGACCGCAAGCTGCCTCCAAATTTTTGTTTGATCAAGTCCATCATAAATTTGAGTGCCA
+CTGGATCTCGCGTTCCGTCTTCTTTCACTGCAGGTATCACTTCTGGCCTCATGGTCGTCC
+AATACGCCCTTGCTGCCCAAACACACCCAACACAG
+>NODE_59_length_215_cov_1.187500
+GTCTAACCTGTGTTGGGTGTGTTTGGGGGTGGTAGGACGGTAGGGGTCGCTAGGTCAGGA
+ACATCATCTTCAAAGTCATTGAAAAATTGGCGTTGAAAATAAAGGCTAGCGCGGGGGTCA
+GGCTTATAATCATCTCTGAAGATGTTGTAAACACCTTGGCAAAATGAGTGAAAGTATAAA
+TCTTGGCCGGCGGATGCATAGGCAATTCCGACAGC
+>NODE_60_length_215_cov_0.843750
+AAAGATCGAATTTTTAGTGGAGATGGCCACAACATGTACCAAGGGTCAACTGACACCCAC
+TTGCATATAAACCAATTTTCTGGTAACTTTTTATTAATCAATGCCACATATTTCTTATTC
+TGGCTGTTGATTTCATTCGGCCCAATCAGCACTTCATATATTCTTCCAATGGACAAGCGT
+GACTACTTACCCAAACACACCCAACACAGGTTAGA
+>NODE_61_length_214_cov_1.232704
+GTCTAACCTGTGTTGGGTGTGTTTGGTTGTAAGGATGCTTGATGCGCATGAGCAAGTGTT
+CTCGTCTGCTCTATATAATGTCCTGTCTGCCATTACTCATCGTGGGAGGCATAATCATGA
+AACAGGTTTTCGTAACACAACGGTTCGTGCCTCTTCGGACTGGGCTATGATGTGGGAGGA
+GGTCCACGCTGCGTATCCAAACACACCCAACACA
+>NODE_62_length_213_cov_0.936709
+GTCTAACCTGTGTTGGGTGTGTTTGGATCGAGTTGGGTTATGTTCATCAGGGACCATCCG
+GCAACAAAGTATCTCAAGCCCCTGCGTGGACTCAGAAAGCATACGGCATTGCACTGCATC
+AGTGATGAAGTAAGACCGAGGATCAGGTGCCTCCTGGGAGCATTAAACCCCCACCGCCGA
+TGACCATCCAAACACACCCAACACAGGTTAGAC
+>NODE_63_length_210_cov_1.225806
+TGTGTTGGGTGTGTTTGGCTTTCTGGCTCCATAGGTTTTAACCACTACTCTGTCAGTTGG
+ACCAACATTTTTGAGCAACCTTTCGGTTTTCCCGCTACCAGCAGGTCCTACAATGGCTTT
+CATTTGGGCAATCAATCTTTTCATAGTGTCCCATGATGCTATTCCCCTGTTCACCGCTCT
+TAGGCCAAACACACCCAACACAGGTTAGAC
+>NODE_64_length_208_cov_1.019608
+GTCTAACCTGTGTTGGGTGTGTTTGGTATGTTATTGCTCCTGATGTGCAAGGATACCCCC
+TTGATCCTCGTCTCTACAACATGATCACTACGAGGTACCCAGATTACCTGCCCATCATTA
+ACCTCTACTGCCGACCACTCGGAACCACCGAAGCTACCTTCGCTGATTTCAACAAAGAGC
+AGATTCCCTCTGATCCCATCTCAGATGA
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_contigs.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_contigs.txt Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,6 @@
+1 Viruses Monodnaviria Shotokuvirae Cossaviricota Papovaviricetes Zurhausenvirales Papillomaviridae Firstpapillomavirinae Upsilonpapillomavirus Upsilonpapillomavirus 2
+1 cellular organisms Bacteria Thermodesulfobacteriota Desulfovibrionia Desulfovibrionales Desulfovibrionaceae Desulfovibrio unclassified Desulfovibrio
+2 cellular organisms Eukaryota Opisthokonta Metazoa Eumetazoa Bilateria Protostomia Ecdysozoa Panarthropoda Arthropoda Mandibulata Pancrustacea Hexapoda Insecta Dicondylia Pterygota Neoptera Polyneoptera Dictyoptera Blattodea Blattoidea Termitoidae Rhinotermitidae Heterotermitinae Heterotermes unclassified Heterotermes
+1 cellular organisms Eukaryota Opisthokonta Metazoa Eumetazoa Bilateria Protostomia Spiralia Lophotrochozoa Nemertea Enopla Hoplonemertea Monostilifera Eumonostilifera Tetrastemmatidae Tetrastemma
+1 cellular organisms Archaea environmental samples
+1 cellular organisms Bacteria Terrabacteria group Actinomycetota Actinomycetes Mycobacteriales Nocardiaceae Nocardia unclassified Nocardia
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_input.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_input.xml Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,1665 @@
+
+
+
+ rpstblastn
+ RPSTBLASTN 2.14.1+
+ Stephen F. Altschul, Thomas L. Madden, Alejandro A. Schäffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), "Gapped BLAST and PSI-BLAST: a new generation of protein database search programs", Nucleic Acids Res. 25:3389-3402.
+ /data/db/databases/blast/2018-01-22/pfam/Pfam
+ Query_1
+ NODE_1_length_506_cov_10.687361
+ 506
+
+
+ BLOSUM62
+ 0.0001
+ 11
+ 1
+ F
+
+
+
+
+ 1
+ Query_1
+ NODE_1_length_506_cov_10.687361
+ 506
+
+
+
+
+ 16305
+ 2821655
+ 80
+ 133518440
+ 0.083353464
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 2
+ Query_2
+ NODE_2_length_429_cov_3.631016
+ 429
+
+
+
+
+ 16305
+ 2821655
+ 78
+ 100741225
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 3
+ Query_3
+ NODE_3_length_365_cov_1.074194
+ 365
+
+
+
+
+ 16305
+ 2821655
+ 75
+ 73543880
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 4
+ Query_4
+ NODE_4_length_351_cov_1.547297
+ 351
+
+
+
+
+ 16305
+ 2821655
+ 74
+ 69448655
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 5
+ Query_5
+ NODE_5_length_344_cov_3.273356
+ 344
+
+
+
+
+ 16305
+ 2821655
+ 72
+ 69203190
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 6
+ Query_6
+ NODE_6_length_338_cov_1.314488
+ 338
+
+
+
+
+ 16305
+ 2821655
+ 70
+ 70572810
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 7
+ Query_7
+ NODE_7_length_335_cov_1.714286
+ 335
+
+
+
+
+ 16305
+ 2821655
+ 70
+ 68892505
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 8
+ Query_8
+ NODE_8_length_331_cov_0.862319
+ 331
+
+
+
+
+ 16305
+ 2821655
+ 69
+ 69561010
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 9
+ Query_9
+ NODE_9_length_324_cov_2.141264
+ 324
+
+
+
+
+ 16305
+ 2821655
+ 67
+ 70898020
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 10
+ Query_10
+ NODE_10_length_324_cov_1.371747
+ 324
+
+
+
+
+ 16305
+ 2821655
+ 67
+ 70898020
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 11
+ Query_11
+ NODE_11_length_317_cov_1.125954
+ 317
+
+
+
+
+ 16305
+ 2821655
+ 65
+ 70473200
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 12
+ Query_12
+ NODE_12_length_311_cov_1.535156
+ 311
+
+
+
+
+ 16305
+ 2821655
+ 64
+ 69347265
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 13
+ Query_13
+ NODE_13_length_295_cov_0.945833
+ 295
+
+
+ 1
+ gnl|CDD|316155
+ pfam13603, tRNA-synt_1_2, Leucyl-tRNA synthetase, Domain 2. This is a family of the conserved region of Leucine-tRNA ligase or Leucyl-tRNA synthetase, EC:6.1.1.4.
+ 316155
+ 184
+
+
+ 1
+ 38.6378
+ 91
+ 2.277e-05
+ 159
+ 269
+ 128
+ 168
+ 3
+ 0
+ 17
+ 22
+ 4
+ 41
+ FIKQYGLPFNPVIAPEDAELTDEQIQSYINTA---NS-FFN
+ FAKKYNLPIKPVIKPEDGDLPDIMTEAYTEEGILVNSGEFD
+ F K+Y LP PVI PED +L D ++Y NS F+
+
+
+
+
+
+
+ 16305
+ 2821655
+ 60
+ 70047490
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 14
+ Query_14
+ NODE_14_length_294_cov_1.891213
+ 294
+
+
+
+
+ 16305
+ 2821655
+ 60
+ 70047490
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 15
+ Query_15
+ NODE_15_length_280_cov_1.413333
+ 280
+
+
+
+
+ 16305
+ 2821655
+ 56
+ 70617275
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 16
+ Query_16
+ NODE_16_length_278_cov_0.901345
+ 278
+
+
+ 1
+ gnl|CDD|306845
+ pfam00421, PSII, Photosystem II protein.
+ 306845
+ 500
+
+
+ 1
+ 132.634
+ 334
+ 7.65615e-39
+ 34
+ 270
+ 388
+ 466
+ 1
+ 0
+ 52
+ 61
+ 0
+ 79
+ SRYSVEQVGVTVEFYGGELNGVSYSDPATVKKYARRAQLGEIFELDRATLKSDGVFRSSPRGWFTFGHASFALLFFQTH
+ SGYSLEQTGVTVQFYGGELNGQTFTDPWQVKRYARHAQLGELNSVDRVTTESDGVFRVSPRGWLAFSHFCFALLFFFGH
+ S YS+EQ GVTV+FYGGELNG +++DP VK+YAR AQLGE+ +DR T +SDGVFR SPRGW F H FALLFF H
+
+
+
+
+
+
+ 16305
+ 2821655
+ 55
+ 71220560
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 17
+ Query_17
+ NODE_17_length_277_cov_1.540541
+ 277
+
+
+
+
+ 16305
+ 2821655
+ 55
+ 71220560
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 18
+ Query_18
+ NODE_18_length_274_cov_3.872146
+ 274
+
+
+
+
+ 16305
+ 2821655
+ 55
+ 69295680
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 19
+ Query_19
+ NODE_19_length_271_cov_0.879630
+ 271
+
+
+ 1
+ gnl|CDD|306845
+ pfam00421, PSII, Photosystem II protein.
+ 306845
+ 500
+
+
+ 1
+ 56.3644
+ 136
+ 1.69015e-11
+ 82
+ 252
+ 165
+ 224
+ 1
+ 0
+ 23
+ 34
+ 23
+ 70
+ ITNLTLNPSVIFGYL-------------LKSPFGGEGWIVSVDDLEDIIGGHVWLGSICILGGIWHILTK
+ VSDPTLDPGVIYGYTGHVQPVAPVWGAEGFSPFGPGG----------IVGHHIAAGILGIIGGIFHITTR
+ +++ TL+P VI+GY SPFG G I+G H+ G + I+GGI+HI T+
+
+
+
+
+
+
+ 16305
+ 2821655
+ 54
+ 69882660
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 20
+ Query_20
+ NODE_20_length_267_cov_1.429245
+ 267
+
+
+ 1
+ gnl|CDD|287774
+ pfam10839, DUF2647, Protein of unknown function (DUF2647). This eukaryotic family of proteins are annotated as ycf68 but have no known function.
+ 287774
+ 70
+
+
+ 1
+ 48.4966
+ 115
+ 7.70073e-10
+ 165
+ 233
+ 22
+ 44
+ -2
+ 0
+ 21
+ 22
+ 0
+ 23
+ GAIQVRSNVDPTFYSLVGSGRSG
+ GAIQVRSHVDLTFYSLVGSGRSG
+ GAIQVRS+VD TFYSLVGSGRSG
+
+
+ 2
+ 43.1038
+ 101
+ 7.90575e-08
+ 88
+ 222
+ 22
+ 70
+ -1
+ 0
+ 23
+ 27
+ 4
+ 49
+ GEIQCRSN----FLFTRGIRAVREGPPWLLSSRESIHPLSVYGQLSLEH
+ GAIQVRSHVDLTFYSLVGSGRSGGGPPALLFSREHIHLISVWGAISLAH
+ G IQ RS+ F G GPP LL SRE IH +SV+G +SL H
+
+
+ 3
+ 42.7186
+ 100
+ 1.07047e-07
+ 86
+ 175
+ 41
+ 70
+ -3
+ 0
+ 17
+ 18
+ 0
+ 30
+ GGPGGTTMAPLFSRIHTSLISIWTAISRAQ
+ GRSGGGPPALLFSREHIHLISVWGAISLAH
+ G GG A LFSR H LIS+W AIS A
+
+
+
+
+
+
+ 16305
+ 2821655
+ 53
+ 70469640
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 21
+ Query_21
+ NODE_21_length_263_cov_1.177885
+ 263
+
+
+
+
+ 16305
+ 2821655
+ 52
+ 69082825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 22
+ Query_22
+ NODE_22_length_262_cov_1.053140
+ 262
+
+
+ 1
+ gnl|CDD|306604
+ pfam00124, Photo_RC, Photosynthetic reaction centre protein.
+ 306604
+ 258
+
+
+ 1
+ 99.6256
+ 249
+ 4.94039e-28
+ 31
+ 228
+ 77
+ 142
+ 1
+ 0
+ 27
+ 41
+ 0
+ 66
+ SVACYMGREWEVSFRLGMRPWIAVAYSAPVAAATAVFLIYPIGQGSFSDGMPLGISGTFNFMIVFQ
+ AFISWWLREYEIARKLGMGPHIAWAFSAAIAAYLSLGLIRPILMGSWSEGFPLGIFPHLDWTSNFS
+ + + RE+E++ +LGM P IA A+SA +AA ++ LI PI GS+S+G PLGI ++ F
+
+
+
+
+
+
+ 16305
+ 2821655
+ 52
+ 69082825
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 23
+ Query_23
+ NODE_23_length_260_cov_1.590244
+ 260
+
+
+
+
+ 16305
+ 2821655
+ 51
+ 69653500
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 24
+ Query_24
+ NODE_24_length_258_cov_0.935961
+ 258
+
+
+ 1
+ gnl|CDD|307679
+ pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily.
+ 307679
+ 305
+
+
+ 1
+ 65.0021
+ 159
+ 8.38713e-15
+ 27
+ 230
+ 226
+ 296
+ 3
+ 0
+ 28
+ 38
+ 3
+ 71
+ AHHLVAITRGEA--ENCKHRSFGPFEATASESLAKL-CPDYPICLPVPYDVINKVYRYLRTLKKPDVQSPH
+ AHHLFKITRGDGLTLKPDSRTFGPFEAVLLPKIFVPRVLNYIRGKPIPLTVVNKLFSYLRSLKKRVVINGM
+ AHHL ITRG+ R+FGPFEA + +Y P+P V+NK++ YLR+LKK V +
+
+
+
+
+
+
+ 16305
+ 2821655
+ 51
+ 69653500
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 25
+ Query_25
+ NODE_25_length_256_cov_0.945274
+ 256
+
+
+
+
+ 16305
+ 2821655
+ 50
+ 70224175
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 26
+ Query_26
+ NODE_26_length_256_cov_0.895522
+ 256
+
+
+
+
+ 16305
+ 2821655
+ 50
+ 70224175
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 27
+ Query_27
+ NODE_27_length_254_cov_0.793970
+ 254
+
+
+
+
+ 16305
+ 2821655
+ 49
+ 70794850
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 28
+ Query_28
+ NODE_28_length_253_cov_1.313131
+ 253
+
+
+
+
+ 16305
+ 2821655
+ 49
+ 70794850
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 29
+ Query_29
+ NODE_29_length_250_cov_0.851282
+ 250
+
+
+ 1
+ gnl|CDD|278700
+ pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits.
+ 278700
+ 29
+
+
+ 1
+ 42.0012
+ 99
+ 7.31211e-08
+ 79
+ 165
+ 1
+ 29
+ 1
+ 0
+ 17
+ 19
+ 0
+ 29
+ MTIDRTYPIFTVRWLAVHGLAVPTVSFLG
+ GERPFSYPITTVRWWAIHALTVPTVFFLG
+ +YPI TVRW A+H L VPTV FLG
+
+
+
+
+
+
+ 16305
+ 2821655
+ 48
+ 71365525
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 30
+ Query_30
+ NODE_30_length_249_cov_1.298969
+ 249
+
+
+
+
+ 16305
+ 2821655
+ 48
+ 71365525
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 31
+ Query_31
+ NODE_31_length_249_cov_0.979381
+ 249
+
+
+
+
+ 16305
+ 2821655
+ 48
+ 71365525
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 32
+ Query_32
+ NODE_32_length_248_cov_0.979275
+ 248
+
+
+
+
+ 16305
+ 2821655
+ 48
+ 69326510
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 33
+ Query_33
+ NODE_33_length_245_cov_1.000000
+ 245
+
+
+
+
+ 16305
+ 2821655
+ 47
+ 69880880
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 34
+ Query_34
+ NODE_34_length_245_cov_1.000000
+ 245
+
+
+ 1
+ gnl|CDD|250270
+ pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses.
+ 250270
+ 441
+
+
+ 1
+ 45.7137
+ 109
+ 6.42106e-08
+ 44
+ 211
+ 164
+ 219
+ 2
+ 0
+ 21
+ 31
+ 0
+ 56
+ KGMCAIFSPIFKELKNRLKSVLDIKYMYADGLRPDQLSERMSQIGAGKYFIENDME
+ KLVTAYFSPIFRELFERLLYVLKPKVVFPTGMTSSLIAERFEFLDASEDFLEIDFS
+ K + A FSPIF+EL RL VL K ++ G+ ++ER + A + F+E D
+
+
+
+
+
+
+ 16305
+ 2821655
+ 47
+ 69880880
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 35
+ Query_35
+ NODE_35_length_242_cov_0.818182
+ 242
+
+
+
+
+ 16305
+ 2821655
+ 46
+ 70435250
+ 0.08832702
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 36
+ Query_36
+ NODE_36_length_240_cov_1.259459
+ 240
+
+
+
+
+ 16305
+ 2821655
+ 46
+ 70435250
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 37
+ Query_37
+ NODE_37_length_239_cov_1.032609
+ 239
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 70989620
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 38
+ Query_38
+ NODE_38_length_239_cov_1.032609
+ 239
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 70989620
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 39
+ Query_39
+ NODE_39_length_238_cov_1.038251
+ 238
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 70989620
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 40
+ Query_40
+ NODE_40_length_238_cov_0.879781
+ 238
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 70989620
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 41
+ Query_41
+ NODE_41_length_236_cov_1.049724
+ 236
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 68901690
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 42
+ Query_42
+ NODE_42_length_235_cov_1.855556
+ 235
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 68901690
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 43
+ Query_43
+ NODE_43_length_234_cov_1.061453
+ 234
+
+
+
+
+ 16305
+ 2821655
+ 45
+ 68901690
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 44
+ Query_44
+ NODE_44_length_232_cov_1.073446
+ 232
+
+
+
+
+ 16305
+ 2821655
+ 44
+ 69439755
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 45
+ Query_45
+ NODE_45_length_232_cov_1.073446
+ 232
+
+
+
+
+ 16305
+ 2821655
+ 44
+ 69439755
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 46
+ Query_46
+ NODE_46_length_229_cov_1.091954
+ 229
+
+
+ 1
+ gnl|CDD|306604
+ pfam00124, Photo_RC, Photosynthetic reaction centre protein.
+ 306604
+ 258
+
+
+ 1
+ 86.1436
+ 214
+ 4.26406e-23
+ 24
+ 194
+ 87
+ 143
+ -3
+ 0
+ 25
+ 36
+ 0
+ 57
+ ELSFRLGMRPWIAVAYSAPVAAATAVFLIYPIGQGSFSDGMPLGISGTFNFMIVFQA
+ EIARKLGMGPHIAWAFSAAIAAYLSLGLIRPILMGSWSEGFPLGIFPHLDWTSNFSY
+ E++ +LGM P IA A+SA +AA ++ LI PI GS+S+G PLGI ++ F
+
+
+
+
+
+
+ 16305
+ 2821655
+ 43
+ 69977820
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 47
+ Query_47
+ NODE_47_length_229_cov_0.816092
+ 229
+
+
+ 1
+ gnl|CDD|306687
+ pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein.
+ 306687
+ 717
+
+
+ 1
+ 61.3066
+ 149
+ 1.79906e-13
+ 124
+ 222
+ 1
+ 33
+ 1
+ 0
+ 22
+ 24
+ 0
+ 33
+ FSRTLAKGPDTTTWIWNLHADAHDLNSQTHPTQ
+ FSRDLAQGPKTTTWIWNLHATAHDFESHDGDTE
+ FSR LA+GP TTTWIWNLHA AHD S T+
+
+
+
+
+
+
+ 16305
+ 2821655
+ 43
+ 69977820
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 48
+ Query_48
+ NODE_48_length_227_cov_1.273256
+ 227
+
+
+
+
+ 16305
+ 2821655
+ 42
+ 70515885
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 49
+ Query_49
+ NODE_49_length_227_cov_1.017442
+ 227
+
+
+
+
+ 16305
+ 2821655
+ 42
+ 70515885
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 50
+ Query_50
+ NODE_50_length_226_cov_2.269006
+ 226
+
+
+ 1
+ gnl|CDD|306845
+ pfam00421, PSII, Photosystem II protein.
+ 306845
+ 500
+
+
+ 1
+ 89.1064
+ 221
+ 2.77182e-23
+ 31
+ 213
+ 160
+ 227
+ 1
+ 0
+ 41
+ 45
+ 7
+ 68
+ GPGIWVSDP-------YGLTGTVQPVNPAWGVEGFDPFVPGGIASHHIAAGTLGILAGLFHLSVRSPQ
+ GLGTWVSDPTLDPGVIYGYTGHVQPVAPVWGAEGFSPFGPGGIVGHHIAAGILGIIGGIFHITTRPPG
+ G G WVSDP YG TG VQPV P WG EGF PF PGGI HHIAAG LGI+ G+FH++ R P
+
+
+
+
+
+
+ 16305
+ 2821655
+ 42
+ 70515885
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 51
+ Query_51
+ NODE_51_length_225_cov_1.117647
+ 225
+
+
+
+
+ 16305
+ 2821655
+ 42
+ 70515885
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 52
+ Query_52
+ NODE_52_length_225_cov_0.917647
+ 225
+
+
+
+
+ 16305
+ 2821655
+ 42
+ 70515885
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 53
+ Query_53
+ NODE_53_length_223_cov_3.303571
+ 223
+
+
+
+
+ 16305
+ 2821655
+ 41
+ 71053950
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 54
+ Query_54
+ NODE_54_length_223_cov_1.803571
+ 223
+
+
+
+
+ 16305
+ 2821655
+ 41
+ 71053950
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 55
+ Query_55
+ NODE_55_length_216_cov_1.596273
+ 216
+
+
+
+
+ 16305
+ 2821655
+ 40
+ 69422560
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 56
+ Query_56
+ NODE_56_length_216_cov_1.180124
+ 216
+
+
+ 1
+ gnl|CDD|306795
+ pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla.
+ 306795
+ 291
+
+
+ 1
+ 42.6815
+ 101
+ 5.23486e-07
+ 18
+ 188
+ 52
+ 110
+ 3
+ 0
+ 16
+ 28
+ 4
+ 60
+ GLCGLFGSTEPTLNFEILTNQSYPVALEI---IFYIGFFLAFAVKLPIIPLHTWLPDTHE
+ GISLMYNYTG-TLSFTELSKALFNGLNSWGLLLLFLLILVGFLFKSAQVPFHTWLPDAYE
+ G+ ++ T TL+F L+ + + ++ + F K +P HTWLPD +E
+
+
+
+
+
+
+ 16305
+ 2821655
+ 40
+ 69422560
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 57
+ Query_57
+ NODE_57_length_216_cov_0.869565
+ 216
+
+
+
+
+ 16305
+ 2821655
+ 40
+ 69422560
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 58
+ Query_58
+ NODE_58_length_215_cov_1.668750
+ 215
+
+
+
+
+ 16305
+ 2821655
+ 39
+ 69944320
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 59
+ Query_59
+ NODE_59_length_215_cov_1.187500
+ 215
+
+
+
+
+ 16305
+ 2821655
+ 39
+ 69944320
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 60
+ Query_60
+ NODE_60_length_215_cov_0.843750
+ 215
+
+
+
+
+ 16305
+ 2821655
+ 39
+ 69944320
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 61
+ Query_61
+ NODE_61_length_214_cov_1.232704
+ 214
+
+
+
+
+ 16305
+ 2821655
+ 39
+ 69944320
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 62
+ Query_62
+ NODE_62_length_213_cov_0.936709
+ 213
+
+
+
+
+ 16305
+ 2821655
+ 39
+ 69944320
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 63
+ Query_63
+ NODE_63_length_210_cov_1.225806
+ 210
+
+
+
+
+ 16305
+ 2821655
+ 38
+ 70466080
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 64
+ Query_64
+ NODE_64_length_208_cov_1.019608
+ 208
+
+
+
+
+ 16305
+ 2821655
+ 37
+ 70987840
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+
+
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_output.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_output.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,13 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX NODE_13_length_295_cov_0.945833 295 316155 pfam13603, tRNA-synt_1_2, Leucyl-tRNA synthetase, Domain 2. This is a family of the conserved region of Leucine-tRNA ligase or Leucyl-tRNA synthetase, EC:6.1.1.4. Tursiops truncatus papillomavirus 2 41.5 1 100 67.0 2.277e-05 38.6378 316155 Viruses;Monodnaviria;Shotokuvirae;Cossaviricota;Papovaviricetes;Zurhausenvirales;Papillomaviridae;Firstpapillomavirinae;Upsilonpapillomavirus;Upsilonpapillomavirus 2;Tursiops truncatus papillomavirus 2 TGTGTTGGGTGTGTTTGGTTTCCGGTTACCATAATCGCTATTCTTTCAAACAGAAAGCGCATGCTAAGTATTCTCACCCAGAGGAATATGCTGACAAGCCCTCCTCAAAAGGCTATTTTTACAATGCCACCTATGAGAATGCACGAACTCTTATTCACTTCATTAAGCAATATGGATTGCCCTTCAATCCTGTTATTGCACCAGAAGATGCTGAACTAACTGATGAACAGATTCAATCTTACATCAACACAGCAAACTCCTTCTTTAATGATTATCCGACGTTACTGTTCACCCG
+TBLASTX NODE_16_length_278_cov_0.901345 278 306845 pfam00421, PSII, Photosystem II protein. 65.8 1 100 47.0 7.65615e-39 132.634 GTCTAACCTGTGTTGGGTGTGTTTGGGCTGTAATCGAGGTATAGTGTCGAACAAGTCGGTGTCACTGTTGAATTCTATGGCGGCGAACTCAATGGAGTCAGTTATAGTGATCCTGCTACTGTGAAAAAATATGCTAGACGTGCTCAATTGGGTGAAATTTTTGAATTAGATCGTGCTACTTTAAAATCGGATGGTGTTTTTCGTAGCAGTCCAAGGGGTTGGTTTACTTTTGGACATGCGTCGTTTGCTCTGCTCTTCTTCCAAACACACCCAACACA
+TBLASTX NODE_19_length_271_cov_0.879630 271 306845 pfam00421, PSII, Photosystem II protein. 32.9 1 100 42.0 1.69015e-11 56.3644 GTCTAACCTGTGTTGGGTGTGTTTGGTATGGAGGGAGGTGTATATGATACCTGGGCACCCGGAGGGGGAGATGTAAGAAAAATTACCAACTTGACCCTTAACCCAAGCGTGATATTTGGTTATTTACTAAAATCTCCTTTTGGGGGAGAAGGATGGATTGTTAGTGTGGACGATTTAGAAGATATAATTGGAGGACATGTCTGGTTAGGCTCCATTTGTATACTTGGTGGAATTTGGCATATCTTAACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_20_length_267_cov_1.429245 267 287774 pfam10839, DUF2647, Protein of unknown function (DUF2647). This eukaryotic family of proteins are annotated as ycf68 but have no known function. Desulfovibrio sp. G100IX 91.3 1 100 99.0 7.70073e-10 48.4966 287774 cellular organisms;Bacteria;Thermodesulfobacteriota;Desulfovibrionia;Desulfovibrionales;Desulfovibrionaceae;Desulfovibrio;unclassified Desulfovibrio;Desulfovibrio sp. G100IX CTGTGTTGGGTGTGTTTGGACTTGGTATGTGAAGATACGTTGTTAGGTGCTCCGTTTTATTTTCCCATTGAGGCCGAACCTAAACCTGTGCTCGAGAGATAGCTGTCCATATACTGATAAGGGATGTATGGATTCTCGAGAAGAGAGGAGCCATGGTGGTCCCTCCCGGACCGCCCGGATCCCACGAGTGAATAGAAAGTTGGATCTACATTGGATCTCACCTGAATCGCCCCATAAACAACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_22_length_262_cov_1.053140 262 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 40.9 1 100 77.0 4.94039e-28 99.6256 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j GTCTAACCTGTGTTGGGTGTGTTTGGCTAGTCAGTAGCTTGTTATATGGGTCGTGAGTGGGAAGTTAGCTTCCGTCTGGGTATGCGCCCGTGGATTGCTGTTGCATATTCAGCTCCTGTTGCAGCTGCTACTGCTGTTTTCTTGATTTACCCAATTGGTCAAGGAAGTTTTTCTGATGGTATGCCTCTAGGAATCTCTGGTACTTTCAACTTCATGATTGTATTCCAGGAGAGCACCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_24_length_258_cov_0.935961 258 307679 pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily. Tetrastemma peltatum 39.4 1 100 70.0 8.38713e-15 65.0021 307679 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Spiralia;Lophotrochozoa;Nemertea;Enopla;Hoplonemertea;Monostilifera;Eumonostilifera;Tetrastemmatidae;Tetrastemma;Tetrastemma peltatum GTGTTGGGTGTGTTTGGTTGGTGAACGCGCACCATTTAGTGGCAATCACGCGCGGGGAGGCTGAAAACTGCAAGCATAGATCTTTCGGCCCTTTCGAAGCTACCGCTTCCGAGAGCCTGGCTAAACTCTGCCCAGATTATCCGATCTGCTTGCCTGTACCTTACGACGTGATCAATAAAGTGTATAGGTATCTCAGAACGCTTAAGAAGCCTGATGTGCAGTCGCCCCACTACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_29_length_250_cov_0.851282 250 278700 pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. uncultured archaeon CRE-PA11a 58.6 1 100 100 7.31211e-08 42.0012 278700 cellular organisms;Archaea;environmental samples;uncultured archaeon CRE-PA11a GTCTAACCTGTGTTGGGTGTGTTTGGGTTTCTTTGGAGCAACTCGATGAATTTAGTAAATCCTTTTAGGAGGTTCCCAATGACCATAGATCGAACCTATCCAATTTTTACAGTGCGATGGTTGGCTGTTCACGGACTGGCTGTACCTACTGTTTCTTTTTTAGGGTCAATATCAGCAATGCAGTTCATCCAACGATAAACCTAATTCAAATTATAGAGCTAGCACACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_34_length_245_cov_1.000000 245 250270 pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses. Nocardia sp. 431D04 37.5 1 100 38.0 6.42106e-08 45.7137 250270 cellular organisms;Bacteria;Terrabacteria group;Actinomycetota;Actinomycetes;Mycobacteriales;Nocardiaceae;Nocardia;unclassified Nocardia;Nocardia sp. 431D04 GTCTAACCTGTGTTGGGTGTGTTTGGATGGTGATCGGCAATTTAAAGGAATGTGTGCGATATTTTCACCAATATTCAAGGAGCTTAAAAATCGACTAAAAAGCGTGTTAGATATTAAATACATGTATGCAGACGGATTGAGACCTGATCAGTTGTCGGAGCGCATGTCACAGATAGGTGCAGGTAAATATTTTATAGAGAATGATATGGAACAGCATCTCGCCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_46_length_229_cov_1.091954 229 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 43.9 1 100 66.0 4.26406e-23 86.1436 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j TGTGTTGGGTGTGTTTGGTTGGATGCCTGGAATACAATCATGAAATTGAAAGTACCAGATATTCCTAAAGGCATGCCATCTGAAAAACTTCCTTGACCAATAGGGTAGATCAAGAAAACAGCTGTAGCAGCCGCGACAGGAGCTGAATATGCAACAGCAATCCAAGGACGCATACCCAGACGGAAACTAAGCTCCCTCTCGCTCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_47_length_229_cov_0.816092 229 306687 pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein. 66.7 1 100 14.0 1.79906e-13 61.3066 TTGGTAAATTGGCGGAAAGAGGAGGACTCAATGATTATTCGTTCGCCGGAACCAGAAGTAAAAATTTTGGTAGATAGGGATCACATAAAAACTTCTTTCGAGGAATGGGCCAGGCCGGGTCATTTCTCAAGAACACTAGCTAAAGGCCCTGACACTACCACTTGGATCTGGAACCTACATGCTGATGCTCACGATCTTAATAGCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_50_length_226_cov_2.269006 226 306845 pfam00421, PSII, Photosystem II protein. 60.3 1 100 41.0 2.77182e-23 89.1064 GTCAACGGTGTGTTGGGTGTGTTTGGGAAAGGTCCTGGAATATGGGTGTCCGATCCTTATGGACTAACCGGAACAGTGCAACCTGTAAATCCGGCGTGGGGCGTGGAAGGTTTTGATCCTTTTGTCCCGGGAGGAATAGCTTCTCATCATATTGCAGCAGGTACATTGGGCATATTAGCGGGCCTATTCCATCTTAGCGTACGGTCACCCCAGCCAAACACACCCA
+TBLASTX NODE_56_length_216_cov_1.180124 216 306795 pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla. 26.7 1 100 62.0 5.23486e-07 42.6815 GTGTTGGGTGTGTTTGGGGTCTATGTGGTTTATTTGGTTCTACTGAACCAACATTAAATTTTGAAATATTAACTAATCAGTCCTATCCTGTGGCCTTGGAAATAATATTTTATATTGGATTTTTTCTTGCTTTTGCTGTAAAATTACCAATCATACCCCTACATACATGGTTACCAGATACCCACGAGAGCCAAACACACCCAACACAGGTTAGAC
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_output_with_rn.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_output_with_rn.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,13 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX NODE_13_length_295_cov_0.945833 264 295 316155 pfam13603, tRNA-synt_1_2, Leucyl-tRNA synthetase, Domain 2. This is a family of the conserved region of Leucine-tRNA ligase or Leucyl-tRNA synthetase, EC:6.1.1.4. Tursiops truncatus papillomavirus 2 41.5 1 100 67.0 2.277e-05 38.6378 316155 Viruses;Monodnaviria;Shotokuvirae;Cossaviricota;Papovaviricetes;Zurhausenvirales;Papillomaviridae;Firstpapillomavirinae;Upsilonpapillomavirus;Upsilonpapillomavirus 2;Tursiops truncatus papillomavirus 2 TGTGTTGGGTGTGTTTGGTTTCCGGTTACCATAATCGCTATTCTTTCAAACAGAAAGCGCATGCTAAGTATTCTCACCCAGAGGAATATGCTGACAAGCCCTCCTCAAAAGGCTATTTTTACAATGCCACCTATGAGAATGCACGAACTCTTATTCACTTCATTAAGCAATATGGATTGCCCTTCAATCCTGTTATTGCACCAGAAGATGCTGAACTAACTGATGAACAGATTCAATCTTACATCAACACAGCAAACTCCTTCTTTAATGATTATCCGACGTTACTGTTCACCCG
+TBLASTX NODE_16_length_278_cov_0.901345 377 278 306845 pfam00421, PSII, Photosystem II protein. 65.8 1 100 47.0 7.65615e-39 132.634 GTCTAACCTGTGTTGGGTGTGTTTGGGCTGTAATCGAGGTATAGTGTCGAACAAGTCGGTGTCACTGTTGAATTCTATGGCGGCGAACTCAATGGAGTCAGTTATAGTGATCCTGCTACTGTGAAAAAATATGCTAGACGTGCTCAATTGGGTGAAATTTTTGAATTAGATCGTGCTACTTTAAAATCGGATGGTGTTTTTCGTAGCAGTCCAAGGGGTTGGTTTACTTTTGGACATGCGTCGTTTGCTCTGCTCTTCTTCCAAACACACCCAACACA
+TBLASTX NODE_19_length_271_cov_0.879630 67 271 306845 pfam00421, PSII, Photosystem II protein. 32.9 1 100 42.0 1.69015e-11 56.3644 GTCTAACCTGTGTTGGGTGTGTTTGGTATGGAGGGAGGTGTATATGATACCTGGGCACCCGGAGGGGGAGATGTAAGAAAAATTACCAACTTGACCCTTAACCCAAGCGTGATATTTGGTTATTTACTAAAATCTCCTTTTGGGGGAGAAGGATGGATTGTTAGTGTGGACGATTTAGAAGATATAATTGGAGGACATGTCTGGTTAGGCTCCATTTGTATACTTGGTGGAATTTGGCATATCTTAACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_20_length_267_cov_1.429245 2 267 287774 pfam10839, DUF2647, Protein of unknown function (DUF2647). This eukaryotic family of proteins are annotated as ycf68 but have no known function. Desulfovibrio sp. G100IX 91.3 1 100 99.0 7.70073e-10 48.4966 287774 cellular organisms;Bacteria;Thermodesulfobacteriota;Desulfovibrionia;Desulfovibrionales;Desulfovibrionaceae;Desulfovibrio;unclassified Desulfovibrio;Desulfovibrio sp. G100IX CTGTGTTGGGTGTGTTTGGACTTGGTATGTGAAGATACGTTGTTAGGTGCTCCGTTTTATTTTCCCATTGAGGCCGAACCTAAACCTGTGCTCGAGAGATAGCTGTCCATATACTGATAAGGGATGTATGGATTCTCGAGAAGAGAGGAGCCATGGTGGTCCCTCCCGGACCGCCCGGATCCCACGAGTGAATAGAAAGTTGGATCTACATTGGATCTCACCTGAATCGCCCCATAAACAACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_22_length_262_cov_1.053140 262 262 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 40.9 1 100 77.0 4.94039e-28 99.6256 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j GTCTAACCTGTGTTGGGTGTGTTTGGCTAGTCAGTAGCTTGTTATATGGGTCGTGAGTGGGAAGTTAGCTTCCGTCTGGGTATGCGCCCGTGGATTGCTGTTGCATATTCAGCTCCTGTTGCAGCTGCTACTGCTGTTTTCTTGATTTACCCAATTGGTCAAGGAAGTTTTTCTGATGGTATGCCTCTAGGAATCTCTGGTACTTTCAACTTCATGATTGTATTCCAGGAGAGCACCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_24_length_258_cov_0.935961 101 258 307679 pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily. Tetrastemma peltatum 39.4 1 100 70.0 8.38713e-15 65.0021 307679 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Spiralia;Lophotrochozoa;Nemertea;Enopla;Hoplonemertea;Monostilifera;Eumonostilifera;Tetrastemmatidae;Tetrastemma;Tetrastemma peltatum GTGTTGGGTGTGTTTGGTTGGTGAACGCGCACCATTTAGTGGCAATCACGCGCGGGGAGGCTGAAAACTGCAAGCATAGATCTTTCGGCCCTTTCGAAGCTACCGCTTCCGAGAGCCTGGCTAAACTCTGCCCAGATTATCCGATCTGCTTGCCTGTACCTTACGACGTGATCAATAAAGTGTATAGGTATCTCAGAACGCTTAAGAAGCCTGATGTGCAGTCGCCCCACTACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_29_length_250_cov_0.851282 428 250 278700 pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. uncultured archaeon CRE-PA11a 58.6 1 100 100 7.31211e-08 42.0012 278700 cellular organisms;Archaea;environmental samples;uncultured archaeon CRE-PA11a GTCTAACCTGTGTTGGGTGTGTTTGGGTTTCTTTGGAGCAACTCGATGAATTTAGTAAATCCTTTTAGGAGGTTCCCAATGACCATAGATCGAACCTATCCAATTTTTACAGTGCGATGGTTGGCTGTTCACGGACTGGCTGTACCTACTGTTTCTTTTTTAGGGTCAATATCAGCAATGCAGTTCATCCAACGATAAACCTAATTCAAATTATAGAGCTAGCACACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_34_length_245_cov_1.000000 183 245 250270 pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses. Nocardia sp. 431D04 37.5 1 100 38.0 6.42106e-08 45.7137 250270 cellular organisms;Bacteria;Terrabacteria group;Actinomycetota;Actinomycetes;Mycobacteriales;Nocardiaceae;Nocardia;unclassified Nocardia;Nocardia sp. 431D04 GTCTAACCTGTGTTGGGTGTGTTTGGATGGTGATCGGCAATTTAAAGGAATGTGTGCGATATTTTCACCAATATTCAAGGAGCTTAAAAATCGACTAAAAAGCGTGTTAGATATTAAATACATGTATGCAGACGGATTGAGACCTGATCAGTTGTCGGAGCGCATGTCACAGATAGGTGCAGGTAAATATTTTATAGAGAATGATATGGAACAGCATCTCGCCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_46_length_229_cov_1.091954 471 229 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 43.9 1 100 66.0 4.26406e-23 86.1436 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j TGTGTTGGGTGTGTTTGGTTGGATGCCTGGAATACAATCATGAAATTGAAAGTACCAGATATTCCTAAAGGCATGCCATCTGAAAAACTTCCTTGACCAATAGGGTAGATCAAGAAAACAGCTGTAGCAGCCGCGACAGGAGCTGAATATGCAACAGCAATCCAAGGACGCATACCCAGACGGAAACTAAGCTCCCTCTCGCTCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_47_length_229_cov_0.816092 470 229 306687 pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein. 66.7 1 100 14.0 1.79906e-13 61.3066 TTGGTAAATTGGCGGAAAGAGGAGGACTCAATGATTATTCGTTCGCCGGAACCAGAAGTAAAAATTTTGGTAGATAGGGATCACATAAAAACTTCTTTCGAGGAATGGGCCAGGCCGGGTCATTTCTCAAGAACACTAGCTAAAGGCCCTGACACTACCACTTGGATCTGGAACCTACATGCTGATGCTCACGATCTTAATAGCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_50_length_226_cov_2.269006 315 226 306845 pfam00421, PSII, Photosystem II protein. 60.3 1 100 41.0 2.77182e-23 89.1064 GTCAACGGTGTGTTGGGTGTGTTTGGGAAAGGTCCTGGAATATGGGTGTCCGATCCTTATGGACTAACCGGAACAGTGCAACCTGTAAATCCGGCGTGGGGCGTGGAAGGTTTTGATCCTTTTGTCCCGGGAGGAATAGCTTCTCATCATATTGCAGCAGGTACATTGGGCATATTAGCGGGCCTATTCCATCTTAGCGTACGGTCACCCCAGCCAAACACACCCA
+TBLASTX NODE_56_length_216_cov_1.180124 166 216 306795 pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla. 26.7 1 100 62.0 5.23486e-07 42.6815 GTGTTGGGTGTGTTTGGGGTCTATGTGGTTTATTTGGTTCTACTGAACCAACATTAAATTTTGAAATATTAACTAATCAGTCCTATCCTGTGGCCTTGGAAATAATATTTTATATTGGATTTTTTCTTGCTTTTGCTGTAAAATTACCAATCATACCCCTACATACATGGTTACCAGATACCCACGAGAGCCAAACACACCCAACACAGGTTAGAC
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_read_nb.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_read_nb.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,64 @@
+NODE_1_length_506_cov_10.687361 56
+NODE_2_length_429_cov_3.631016 301
+NODE_3_length_365_cov_1.074194 23
+NODE_4_length_351_cov_1.547297 183
+NODE_5_length_344_cov_3.273356 220
+NODE_6_length_338_cov_1.314488 121
+NODE_7_length_335_cov_1.714286 6
+NODE_8_length_331_cov_0.862319 322
+NODE_9_length_324_cov_2.141264 153
+NODE_10_length_324_cov_1.371747 235
+NODE_11_length_317_cov_1.125954 136
+NODE_12_length_311_cov_1.535156 196
+NODE_13_length_295_cov_0.945833 264
+NODE_14_length_294_cov_1.891213 155
+NODE_15_length_280_cov_1.413333 348
+NODE_16_length_278_cov_0.901345 377
+NODE_17_length_277_cov_1.540541 160
+NODE_18_length_274_cov_3.872146 25
+NODE_19_length_271_cov_0.879630 67
+NODE_20_length_267_cov_1.429245 2
+NODE_21_length_263_cov_1.177885 361
+NODE_22_length_262_cov_1.053140 262
+NODE_23_length_260_cov_1.590244 316
+NODE_24_length_258_cov_0.935961 101
+NODE_25_length_256_cov_0.945274 46
+NODE_26_length_256_cov_0.895522 153
+NODE_27_length_254_cov_0.793970 127
+NODE_28_length_253_cov_1.313131 20
+NODE_29_length_250_cov_0.851282 428
+NODE_30_length_249_cov_1.298969 249
+NODE_31_length_249_cov_0.979381 445
+NODE_32_length_248_cov_0.979275 496
+NODE_33_length_245_cov_1.000000 281
+NODE_34_length_245_cov_1.000000 183
+NODE_35_length_242_cov_0.818182 222
+NODE_36_length_240_cov_1.259459 179
+NODE_37_length_239_cov_1.032609 98
+NODE_38_length_239_cov_1.032609 405
+NODE_39_length_238_cov_1.038251 426
+NODE_40_length_238_cov_0.879781 105
+NODE_41_length_236_cov_1.049724 225
+NODE_42_length_235_cov_1.855556 440
+NODE_43_length_234_cov_1.061453 106
+NODE_44_length_232_cov_1.073446 136
+NODE_45_length_232_cov_1.073446 430
+NODE_46_length_229_cov_1.091954 471
+NODE_47_length_229_cov_0.816092 470
+NODE_48_length_227_cov_1.273256 450
+NODE_49_length_227_cov_1.017442 190
+NODE_50_length_226_cov_2.269006 315
+NODE_51_length_225_cov_1.117647 384
+NODE_52_length_225_cov_0.917647 405
+NODE_53_length_223_cov_3.303571 414
+NODE_54_length_223_cov_1.803571 355
+NODE_55_length_216_cov_1.596273 317
+NODE_56_length_216_cov_1.180124 166
+NODE_57_length_216_cov_0.869565 247
+NODE_58_length_215_cov_1.668750 267
+NODE_59_length_215_cov_1.187500 163
+NODE_60_length_215_cov_0.843750 124
+NODE_61_length_214_cov_1.232704 103
+NODE_62_length_213_cov_0.936709 421
+NODE_63_length_210_cov_1.225806 290
+NODE_64_length_208_cov_1.019608 498
\ No newline at end of file
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_reads.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_reads.txt Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,6 @@
+0 Viruses Monodnaviria Shotokuvirae Cossaviricota Papovaviricetes Zurhausenvirales Papillomaviridae Firstpapillomavirinae Upsilonpapillomavirus Upsilonpapillomavirus 2
+0 cellular organisms Bacteria Thermodesulfobacteriota Desulfovibrionia Desulfovibrionales Desulfovibrionaceae Desulfovibrio unclassified Desulfovibrio
+0 cellular organisms Eukaryota Opisthokonta Metazoa Eumetazoa Bilateria Protostomia Ecdysozoa Panarthropoda Arthropoda Mandibulata Pancrustacea Hexapoda Insecta Dicondylia Pterygota Neoptera Polyneoptera Dictyoptera Blattodea Blattoidea Termitoidae Rhinotermitidae Heterotermitinae Heterotermes unclassified Heterotermes
+0 cellular organisms Eukaryota Opisthokonta Metazoa Eumetazoa Bilateria Protostomia Spiralia Lophotrochozoa Nemertea Enopla Hoplonemertea Monostilifera Eumonostilifera Tetrastemmatidae Tetrastemma
+0 cellular organisms Archaea environmental samples
+0 cellular organisms Bacteria Terrabacteria group Actinomycetota Actinomycetes Mycobacteriales Nocardiaceae Nocardia unclassified Nocardia
diff -r 000000000000 -r b82ce29791e7 test-data/blast2tsv_reads_with_rn.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast2tsv_reads_with_rn.txt Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,13 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX NODE_13_length_295_cov_0.945833 264 295 316155 pfam13603, tRNA-synt_1_2, Leucyl-tRNA synthetase, Domain 2. This is a family of the conserved region of Leucine-tRNA ligase or Leucyl-tRNA synthetase, EC:6.1.1.4. Tursiops truncatus papillomavirus 2 41.5 1 100 67.0 2.277e-05 38.6378 316155 Viruses;Monodnaviria;Shotokuvirae;Cossaviricota;Papovaviricetes;Zurhausenvirales;Papillomaviridae;Firstpapillomavirinae;Upsilonpapillomavirus;Upsilonpapillomavirus 2;Tursiops truncatus papillomavirus 2 TGTGTTGGGTGTGTTTGGTTTCCGGTTACCATAATCGCTATTCTTTCAAACAGAAAGCGCATGCTAAGTATTCTCACCCAGAGGAATATGCTGACAAGCCCTCCTCAAAAGGCTATTTTTACAATGCCACCTATGAGAATGCACGAACTCTTATTCACTTCATTAAGCAATATGGATTGCCCTTCAATCCTGTTATTGCACCAGAAGATGCTGAACTAACTGATGAACAGATTCAATCTTACATCAACACAGCAAACTCCTTCTTTAATGATTATCCGACGTTACTGTTCACCCG
+TBLASTX NODE_16_length_278_cov_0.901345 377 278 306845 pfam00421, PSII, Photosystem II protein. 65.8 1 100 47.0 7.65615e-39 132.634 GTCTAACCTGTGTTGGGTGTGTTTGGGCTGTAATCGAGGTATAGTGTCGAACAAGTCGGTGTCACTGTTGAATTCTATGGCGGCGAACTCAATGGAGTCAGTTATAGTGATCCTGCTACTGTGAAAAAATATGCTAGACGTGCTCAATTGGGTGAAATTTTTGAATTAGATCGTGCTACTTTAAAATCGGATGGTGTTTTTCGTAGCAGTCCAAGGGGTTGGTTTACTTTTGGACATGCGTCGTTTGCTCTGCTCTTCTTCCAAACACACCCAACACA
+TBLASTX NODE_19_length_271_cov_0.879630 67 271 306845 pfam00421, PSII, Photosystem II protein. 32.9 1 100 42.0 1.69015e-11 56.3644 GTCTAACCTGTGTTGGGTGTGTTTGGTATGGAGGGAGGTGTATATGATACCTGGGCACCCGGAGGGGGAGATGTAAGAAAAATTACCAACTTGACCCTTAACCCAAGCGTGATATTTGGTTATTTACTAAAATCTCCTTTTGGGGGAGAAGGATGGATTGTTAGTGTGGACGATTTAGAAGATATAATTGGAGGACATGTCTGGTTAGGCTCCATTTGTATACTTGGTGGAATTTGGCATATCTTAACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_20_length_267_cov_1.429245 2 267 287774 pfam10839, DUF2647, Protein of unknown function (DUF2647). This eukaryotic family of proteins are annotated as ycf68 but have no known function. Desulfovibrio sp. G100IX 91.3 1 100 99.0 7.70073e-10 48.4966 287774 cellular organisms;Bacteria;Thermodesulfobacteriota;Desulfovibrionia;Desulfovibrionales;Desulfovibrionaceae;Desulfovibrio;unclassified Desulfovibrio;Desulfovibrio sp. G100IX CTGTGTTGGGTGTGTTTGGACTTGGTATGTGAAGATACGTTGTTAGGTGCTCCGTTTTATTTTCCCATTGAGGCCGAACCTAAACCTGTGCTCGAGAGATAGCTGTCCATATACTGATAAGGGATGTATGGATTCTCGAGAAGAGAGGAGCCATGGTGGTCCCTCCCGGACCGCCCGGATCCCACGAGTGAATAGAAAGTTGGATCTACATTGGATCTCACCTGAATCGCCCCATAAACAACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_22_length_262_cov_1.053140 262 262 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 40.9 1 100 77.0 4.94039e-28 99.6256 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j GTCTAACCTGTGTTGGGTGTGTTTGGCTAGTCAGTAGCTTGTTATATGGGTCGTGAGTGGGAAGTTAGCTTCCGTCTGGGTATGCGCCCGTGGATTGCTGTTGCATATTCAGCTCCTGTTGCAGCTGCTACTGCTGTTTTCTTGATTTACCCAATTGGTCAAGGAAGTTTTTCTGATGGTATGCCTCTAGGAATCTCTGGTACTTTCAACTTCATGATTGTATTCCAGGAGAGCACCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_24_length_258_cov_0.935961 101 258 307679 pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily. Tetrastemma peltatum 39.4 1 100 70.0 8.38713e-15 65.0021 307679 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Spiralia;Lophotrochozoa;Nemertea;Enopla;Hoplonemertea;Monostilifera;Eumonostilifera;Tetrastemmatidae;Tetrastemma;Tetrastemma peltatum GTGTTGGGTGTGTTTGGTTGGTGAACGCGCACCATTTAGTGGCAATCACGCGCGGGGAGGCTGAAAACTGCAAGCATAGATCTTTCGGCCCTTTCGAAGCTACCGCTTCCGAGAGCCTGGCTAAACTCTGCCCAGATTATCCGATCTGCTTGCCTGTACCTTACGACGTGATCAATAAAGTGTATAGGTATCTCAGAACGCTTAAGAAGCCTGATGTGCAGTCGCCCCACTACCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_29_length_250_cov_0.851282 428 250 278700 pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. uncultured archaeon CRE-PA11a 58.6 1 100 100 7.31211e-08 42.0012 278700 cellular organisms;Archaea;environmental samples;uncultured archaeon CRE-PA11a GTCTAACCTGTGTTGGGTGTGTTTGGGTTTCTTTGGAGCAACTCGATGAATTTAGTAAATCCTTTTAGGAGGTTCCCAATGACCATAGATCGAACCTATCCAATTTTTACAGTGCGATGGTTGGCTGTTCACGGACTGGCTGTACCTACTGTTTCTTTTTTAGGGTCAATATCAGCAATGCAGTTCATCCAACGATAAACCTAATTCAAATTATAGAGCTAGCACACCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_34_length_245_cov_1.000000 183 245 250270 pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses. Nocardia sp. 431D04 37.5 1 100 38.0 6.42106e-08 45.7137 250270 cellular organisms;Bacteria;Terrabacteria group;Actinomycetota;Actinomycetes;Mycobacteriales;Nocardiaceae;Nocardia;unclassified Nocardia;Nocardia sp. 431D04 GTCTAACCTGTGTTGGGTGTGTTTGGATGGTGATCGGCAATTTAAAGGAATGTGTGCGATATTTTCACCAATATTCAAGGAGCTTAAAAATCGACTAAAAAGCGTGTTAGATATTAAATACATGTATGCAGACGGATTGAGACCTGATCAGTTGTCGGAGCGCATGTCACAGATAGGTGCAGGTAAATATTTTATAGAGAATGATATGGAACAGCATCTCGCCAAACACACCCAACACAGGTTAG
+TBLASTX NODE_46_length_229_cov_1.091954 471 229 306604 pfam00124, Photo_RC, Photosynthetic reaction centre protein. Heterotermes sp. TMJ-2004j 43.9 1 100 66.0 4.26406e-23 86.1436 306604 cellular organisms;Eukaryota;Opisthokonta;Metazoa;Eumetazoa;Bilateria;Protostomia;Ecdysozoa;Panarthropoda;Arthropoda;Mandibulata;Pancrustacea;Hexapoda;Insecta;Dicondylia;Pterygota;Neoptera;Polyneoptera;Dictyoptera;Blattodea;Blattoidea;Termitoidae;Rhinotermitidae;Heterotermitinae;Heterotermes;unclassified Heterotermes;Heterotermes sp. TMJ-2004j TGTGTTGGGTGTGTTTGGTTGGATGCCTGGAATACAATCATGAAATTGAAAGTACCAGATATTCCTAAAGGCATGCCATCTGAAAAACTTCCTTGACCAATAGGGTAGATCAAGAAAACAGCTGTAGCAGCCGCGACAGGAGCTGAATATGCAACAGCAATCCAAGGACGCATACCCAGACGGAAACTAAGCTCCCTCTCGCTCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_47_length_229_cov_0.816092 470 229 306687 pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein. 66.7 1 100 14.0 1.79906e-13 61.3066 TTGGTAAATTGGCGGAAAGAGGAGGACTCAATGATTATTCGTTCGCCGGAACCAGAAGTAAAAATTTTGGTAGATAGGGATCACATAAAAACTTCTTTCGAGGAATGGGCCAGGCCGGGTCATTTCTCAAGAACACTAGCTAAAGGCCCTGACACTACCACTTGGATCTGGAACCTACATGCTGATGCTCACGATCTTAATAGCCAAACACACCCAACACAGGTTAGAC
+TBLASTX NODE_50_length_226_cov_2.269006 315 226 306845 pfam00421, PSII, Photosystem II protein. 60.3 1 100 41.0 2.77182e-23 89.1064 GTCAACGGTGTGTTGGGTGTGTTTGGGAAAGGTCCTGGAATATGGGTGTCCGATCCTTATGGACTAACCGGAACAGTGCAACCTGTAAATCCGGCGTGGGGCGTGGAAGGTTTTGATCCTTTTGTCCCGGGAGGAATAGCTTCTCATCATATTGCAGCAGGTACATTGGGCATATTAGCGGGCCTATTCCATCTTAGCGTACGGTCACCCCAGCCAAACACACCCA
+TBLASTX NODE_56_length_216_cov_1.180124 166 216 306795 pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla. 26.7 1 100 62.0 5.23486e-07 42.6815 GTGTTGGGTGTGTTTGGGGTCTATGTGGTTTATTTGGTTCTACTGAACCAACATTAAATTTTGAAATATTAACTAATCAGTCCTATCCTGTGGCCTTGGAAATAATATTTTATATTGGATTTTTTCTTGCTTTTGCTGTAAAATTACCAATCATACCCCTACATACATGGTTACCAGATACCCACGAGAGCCAAACACACCCAACACAGGTTAGAC
diff -r 000000000000 -r b82ce29791e7 test-data/index.html
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/index.html Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,235 @@
+
+
+rps2tree
+
+
+
+
rps2tree
+
+
pfam02123 pfam02123_RdRP_4
+
pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+
+
+
+
+
+
pfam02123_RdRP_4/seq_aligned.final_tree.fa
+
+
pfam02123_RdRP_4/otu_cluster.csv
+
+
pfam02123_RdRP_4/cluster_nb_reads_files.tab
+
+
pfam02123_RdRP_4/identity_matrix.csv
+
+
+
+
pfam00680 pfam00680_RdRP_1
+
pfam00680, RdRP_1, RNA dependent RNA polymerase.
+
+
+
+
+
+
pfam00680_RdRP_1/seq_aligned.final_tree.fa
+
+
pfam00680_RdRP_1/otu_cluster.csv
+
+
pfam00680_RdRP_1/cluster_nb_reads_files.tab
+
+
pfam00680_RdRP_1/identity_matrix.csv
+
+
+
+
pfam00665 pfam00665_rve
+
pfam00665, rve, Integrase core domain. Integrase mediates integration of a DNA copy of the viral genome into the host chromosome. Integrase is composed of three domains. The amino-terminal domain is a zinc binding domain pfam02022. This domain is the central catalytic domain. The carboxyl terminal domain that is a non-specific DNA binding domain pfam00552. The catalytic domain acts as an endonuclease when two nucleotides are removed from the 3' ends of the blunt-ended viral DNA made by reverse transcription. This domain also catalyzes the DNA strand transfer reaction of the 3' ends of the viral DNA to the 5' ends of the integration site.
+
+
+
+
+
+
pfam00665_rve/seq_aligned.final_tree.fa
+
+
pfam00665_rve/otu_cluster.csv
+
+
pfam00665_rve/cluster_nb_reads_files.tab
+
+
pfam00665_rve/identity_matrix.csv
+
+
+
+
pfam01443 pfam01443_Viral_helicase1
+
pfam01443, Viral_helicase1, Viral (Superfamily 1) RNA helicase. Helicase activity for this family has been demonstrated and NTPase activity. This helicase has multiple roles at different stages of viral RNA replication, as dissected by mutational analysis.
+
+
+
+
+
+
pfam01443_Viral_helicase1/seq_aligned.final_tree.fa
+
+
pfam01443_Viral_helicase1/otu_cluster.csv
+
+
pfam01443_Viral_helicase1/cluster_nb_reads_files.tab
+
+
pfam01443_Viral_helicase1/identity_matrix.csv
+
+
+
+
pfam00078 pfam00078_RVT_1
+
pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses.
+
+
+
+
+
+
pfam00078_RVT_1/seq_aligned.final_tree.fa
+
+
pfam00078_RVT_1/otu_cluster.csv
+
+
pfam00078_RVT_1/cluster_nb_reads_files.tab
+
+
pfam00078_RVT_1/identity_matrix.csv
+
+
+
+
pfam01787 pfam01787_Ilar_coat
+
pfam01787, Ilar_coat, Ilarvirus coat protein. This family consists of various coat proteins from the ilarviruses part of the Bromoviridae, members include apple mosaic virus and prune dwarf virus. The ilarvirus coat protein is required to initiate replication of the viral genome in host plants. Members of the Bromoviridae have a positive stand ssRNA genome with no DNA stage in there replication.
+
+
+
+
+
+
pfam01787_Ilar_coat/seq_aligned.final_tree.fa
+
+
pfam01787_Ilar_coat/otu_cluster.csv
+
+
pfam01787_Ilar_coat/cluster_nb_reads_files.tab
+
+
pfam01787_Ilar_coat/identity_matrix.csv
+
+
+
+
pfam01573 pfam01573_Bromo_MP
+
pfam01573, Bromo_MP, Bromovirus movement protein.
+
+
+
+
+
+
pfam01573_Bromo_MP/seq_aligned.final_tree.fa
+
+
pfam01573_Bromo_MP/otu_cluster.csv
+
+
pfam01573_Bromo_MP/cluster_nb_reads_files.tab
+
+
pfam01573_Bromo_MP/identity_matrix.csv
+
+
+
+
+
+
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s1.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s1.fa Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,6856 @@
+>ds2020-267_1
+CAGCACGTCCGCAAAAGGTCCTCGCTCCAAAACTGTCTCATCATCTCTATCGTGCCCTGA
+CCCGTTTTCATCTTTGTACCTAGCTCTACTTCTTCTATCCTTGTTGGCACTTCTATCGCC
+ATTACCCTCGCTATGTTGCCACGTTGTCCGTTGACCATAGGCCGCCACATCCTATAATGC
+CTCATGTCTCCAACTACTGCCCCACTCATTGTTATCTCTGTGTATACTGGACATGTTTGC
+CCTCTGTCTGGCCACAGCAGATTGGCTGCGGCTATAAACTTGTACAGTTTCACCTCGTCG
+TCATGTGGTGTCAGCACTATGTTCTTATCTATCACGACTCTAGCTTCATGTGGAAAGCAG
+TTCTCCTGATCTACCGGTATTCTGTGTAGTGAACCATACCCTAGGTGGCAACAGGGCAAC
+GACATGTGCACCAAATTCACGTGCGTGACTAGAGGCCTCTTGAAGTACATCTTCGCACGG
+TATTCAAACTCCGTTTGCATCATCCTTCCTTTCACACCTGCCACAATTGGGTTCCTGATG
+TGAAATTCTCCATATTCTAGTGACATTTCTAGGTTCACTGGCGTCACCAGGAACCCCAGC
+ATGTTTGACAGCCACGGCACCACTGCGTTGAATGTTGATAGCTCTCCAAGGTGTTGGTGC
+AGCTCACCAAGTCTGCAGTTCCTGAAGGAGTGTGGCAGTCTAATATCCAACTCCCTCACT
+TCAGACAGCTCCCAATGCCATATAGGAAAGTCTATGAAACTGCCTCTAATTGTGTTCTTA
+TCTTTCGTCTGCTTGAAGGAAGTACATCCCAGGCACACACAGTACCTCGTCACATCTCTG
+AAAGTTGCCTGACCAGGTGCAAACGTGGGTGGAGGCTGTGGTATCTTTGGTTCAATCAAC
+CTTATTATTTCAGCAGGTGCTATCCTGGTGAACATGTCTGCCTGTTTTGCCAGTTTCAGC
+AAAGAGTGCTCATCACCCTGCTTCTTGAATAGGCAGAAATGCGGCCCTGTGACATTGTGT
+TTGTGCCCACAGCTCAGCTTCAGCTGGCTATTCTGTGTAGAGTTGCCAAACCAGTTTATC
+TTTTCGCCGTAGTACATCCACCTACTTGGGTGCATTTCTTCTTCGTTAAGTGGCATGCCT
+TTCACCATCCCTTGCATAACCTGGGCCTCGGTATTGATGCCGTGTTCGTGGTCAAAAATA
+GGGCACTTGCCCTCTGCACCGCATGACATCAACGGCATGCCTTGCCATTTCCCGGTCAGT
+TCCTGGCAATTTTCAGGTGTCGGTGGTACCAGTGAGGTTCCTCCGCGCTTGAAAGTGTCA
+TCGTCATCACTCTGCTCTTCCATTATGTGACGTCTTATCCTTCCTAGCTCCTCTCTCGCT
+CGCTCAGTTCTGTAAGCCTTTTCTTCTTTTCTGTTCATCCATGGCACGTCCCATGATCGT
+GCGTCTTTTTCCCTTTGTTCCGAACTCGTGTCTGTTTGTGAATCGACAAACTCTTTCGCC
+TGCCTCAATTTTTCAGCCACATCATCACACTCGATTCTCACTTCTGGCTCTAGCACGACA
+TGCCCCTCACCTATAAGCAGGTTCTTCATGGTGTCCGCCCCCTCTGTATCTGACTCTGAC
+GCTTCGTCCTGCGTCTTAACAGGGCTTGGTGTAGGGCCACCATCGAACGTGACGTCAGTT
+TCTTGCTCTACATCCACCTCAACACTCAGCTTCTTAGAGTGAGCGCTTTTCCGTTCAGTG
+AACTTGTAGACCAACATGTTTGCGTTGTACATGAGCTGTCCCCTTATGTCTTCCGATTTG
+TCGCTTGGCCTACGCTGTTTCTGATCGAGCGCCTCGTCAACGTATTCAATGTCTGCTACG
+TGCTCAGTGCTCATCATCTTGGCGTCTATTACGTCCTCGATTGACGGTGTCCTCTTTAGA
+GTCTTCACCTCTAGTGTTCCGTCAACCACGACACCTGCCTCTTCGATTGCCTGGTTGCAC
+AGCGCGCACGACACAAGCTGCTTGCACTTCCTGCACACATGCTGCATTTTTATGTATCCA
+CAGCAACTTGTTTGGCACGGTGAAGACATCCTGACACACTTCTTGTTCTTCACCCTCGTC
+TTGGGGGTGCTCATCACTTCATGGACAGACTTGATATTGCGTTGCCCTTTTTGACCGGTT
+TCAGCCACACATACTTGATACGTGTGCACCAGGCTCAAGTAGTTTGGCCAGTTTGCATCA
+GCTGCCACCACCAGTGACGCAACATACCTCACACGCGGTGAGTAGTTAGCAAACAAAGTG
+TGTACCTGCTCCAATCTAGCAGCAGGTGTCATCTCGGTGCTGTTGAGTTTCTCATCCTTG
+TATTTTAAACCCCTTTTGGTCAAAGTGAGGGCGTAACCGGTGCAGGCGTGCCATACTAGT
+CTTGAAAGTGACCGTTTTGCGTGCTTGGTCAGTGGCAAGTAATAAACTTGCTTCGCATGT
+TCGAAAGCCCTCTTACTATGCCAGGTGTACTCGAGTTCACTTTCTTCTGCCAGCAGTGCT
+GCTGCATCTAGCCATTCTTACATGTCAGACTGATCAACGTACTGGCCTCCTGTTGCGGAC
+GTGCTGNNNNNNNNNNATCTAAGGAGCAGCACGTCCGCAATGATGGCCCCATACAGTAGT
+GATTTCTTGTCGAAACCACCAAATTCGAACACTGGCCTGTTGATACTTGAGCTAGTGATC
+AACATCTTAGCGTTTTCTGTCTCTGCAGTGAAAACAGACCTGTACGTTGCAGCTCCAATA
+ATGAGCTGTTTCAAATCCATTTGCTTGTCGTGCCATTTGGTCGGTGACACACATATTCCT
+CTCTTGGTTCTGATGCACATTAGCGCTCTGTACAAGTTTACGACTGACGCTGCTCCTGTC
+ACGTCGTTGATTGCTGACGTCAGTGACGCAAGGAACATCGATTTTGACGCCTGAGTTCCT
+ATTGGCCTACCGCTTGACGTCACCGGAACTGCAATCCTGCAGTTGCTATTTGTGGTAACA
+GCNNNNNNNNNNCAGCACGTCCGCAATTGCCTTCCATTGGGTTGCCAACTCCCAGTACCT
+TTTCGTCACTCACCCTCAGTTCGAAGCCATATCGCCTGAGTTCTGGTGCGATAGCCATCA
+CTCTCGCTTCTGCTCCCATTAACTGACCATTTATGATGTTGACATCAGATCTGTCGTTGC
+CATCAGCAACGCAAGCGTCATCAACCCATGCCATCAGCGAGTTCAATGCTCCTGCCGTTG
+CCCTCGCTGCTGATACATTAGTCAGCAGCACGCCTGCCTCATTTTGAGGGCCTTGGACAT
+ACTCATCATGTTGCGATGTCACCGAACAAGCGTAGCTACCTTCAGACTGAACGTCAGTAG
+TGTACCTGGTGCGCACTGCGCTACCTAGCACACTATCTGAAGTCAAAGCGCTTCTCGAGC
+TCATTATGCCCGCCCGCATGAAAGGTTCATCTTTGTCAACCACTTCATAAACACCATGAC
+CCGTCGGAGTTACAACGCTCTCGTCATGCTGCTTGTGTTTGCCACCAAAACCAGCGTATC
+TGTTGGTGGCGATTATTGGCGTGACTCTTGCTGCGACTGATTTTTCAGCAGAGTTGTATT
+GAAAAACTGGTACGCCCATCTTGTACAGTTGGCTGCAATGTCCCAA
+>ds2020-267_2
+CAGCACGTCCGCAACAGTTGGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGG
+GCGCCTTGCATGGACAAAGTTCTGCAGTGGCCTGACATAACGAACACGTTTATGTCATCA
+CTACTACTTGCCATGGCTGCACTACCACCAGAGTTATATGTACTAATGGTGGAGTGGAAC
+GGCTGGGCAAAGTGTGGCTCTATGGCAGAGTACATCGTAGAGGCAAAAAACCTGACGACT
+AAGATGAAGGCACTGGACAACCAGGTAACATTGGGTGACTTCGAACTCGACTTATCGCCT
+TTATTCGAGTGGGAAGTGCTAAATCACAGAGCGGTCTTGAAAGGCATCTATGACAAGGAA
+GTCACAGAGCGTAGAGATCAGAAACAGAGCATCAAGCTATCTGCTGCCGATCTGGAGGAA
+GAAATAGACAGCGTGTTTCAGGACGTGGGTTCCGTTCTAGACGCCAGGACAAAAGAGGGT
+GAAAAATCACCTCTGTATGCAACGTGGGATGATTGGTACGTTGACAGGGTGCAAACCACA
+CCAGCTGGGTCTGCATTCACAGTCAACAAGGACATGATGGAGGCAAGAAACATGCTGAAA
+GCCAATGGGGTCCAAAATCTGACCAAGACGCAAGTGATGGCGCAGATGAGGGACAAGCTC
+CCGCTGGCGTCTATCTTGGGTAGCGAGCCAATGATATTGGCCCAGATGTCATGGAAGTTG
+GAATGGTCAAAACTGAGGGCACTATTTGCTGCTAGCATGGAGCACTGGATGCCATCGGCA
+TTCGCCCTGGGGCAGATAGAAGAGTATCTACCCAGTGACTGCCCCATAGGTAAAGCTGCC
+GATGCGCACAACGTGTGCAGGCGCGTGATGGAAATGTCAACGCAAGGAGTGGTAGCATGC
+ATAGATGCAAAGAACTTCAACATCTTGCACACCCACGAGATAATGTCAGCAATACTGAAA
+TCCGCATCAAAGATGCTAGGAGATAGGCTGTCTAGTGAGCAACATGACTGCCTAAAGTGG
+CTGGCGAAAGCGGAGCTGAACCAGAAAGTGCTGGTCAAGACAGGTGAAGTAACTGAACAG
+TTGCTCCAGGTCGGCAGGAGAGACGGGTGGATTAACAAGCTAACTAAAGGTGACGGCACA
+GTGGTAGAAGCGGCTGACGTGACGGTTGGAATGTTTTCAGGTACTAGGTTCACGATGCTG
+TACAACACAGTGCTAAACAGGGCGTACTACAAAGTGGCGGAGAAACGTGCGAAGATAAAG
+ACTTTATCACTTCATTCGGGTGATGACGTGTATGCTGTTTTCGCTAACTATATAGACGTG
+TACAAGATGAAGCGTGAGATGGCGTTAATCGGCTACACACTGCAGTTAGGCAAGTGCTTC
+TTGCAGGGAGTCCGAGAATTCTTGAGAATATCTCATAAGAATGCAAACACTTCTCAATAC
+CTAGCGAGGTCCGCAGCAACGGCAATACATGGAAGAATAGAGGCAGATGAGCCTTCTGAT
+TTCGTGGCTTTTGTGGGGTCAATAATGAGAAGAGGTGCAGAGATGGTGGTCAGGCACGCG
+GCAAGAGCAGTGTTGCTAGATGTCATGAAGATACAGATAGCAGGAGCTTGCGCAAGGTGG
+GCGATTACAGCTATGGCGTGGGACTCATTCTTAATGTTGCCAAAAACAATGGGCGGTTGT
+GCTGCAAAAGCACGCCTGATGGAACAATGGAGTGGTTTTTCTATAGAAAGAACTGCAAGC
+GCCAGAGGTGGCATCGTAGACTATTTGGCTGAACAACCAGGTACCAAAACAGCGGCGAGG
+AGGCTGGTTGAGAAGTTGCAAATAATGAAGTACCACAAGAGAGTTGCACAAGCCGTTGCT
+GCGGCGATAGCACCTAAAGGAGTTTTGAAAAACTACGGTATGATAGTAAGGTGGATGAAC
+AAAGATGACATGGCACATATGTCGAGAGTGGCAGGGACACTAGGGCGAATAAGACAATCG
+AGAGAGTACATATTATCAAAAGCAGCAGGATTATTCAATACGCTAGCAATAAATGACAAC
+TTCTGGGGTGATGTGAGCGGTGTGTTCAGAGGCATACCGTCAGCGTGGCACGGCAGAGCA
+CTGACGTTCGCACTGTCTGAGAGGAGTGAGTCAGAAGCGCTGTTTGCAAATAAAATGTAC
+AAGCTACACTATAAAATGACAGAGTGGGCAAGAGCTGCAACAGAGAATAGACTGATAAGA
+ATGCAGCTAGATATGCCACCGGGGTAATGCTGGTGGTAATAAGTACGATAGAACTTGCCA
+TCCACTAGGGAAGTGGACACAAGCGGAGTAGGCGACCGGTGGCAAGTATAACAAGCCAGG
+CTGAACGGCCGTACGTGGCTCCCAGACGTACAAACATTGGCGCTATCAACTAGCGCCTAC
+ACAATATAAAATATGCGTTTAGTTGCGGACGTGCTG
+>ds2020-267_3
+CAGCACGTCCGCAATCTGAAACGGCTGTCTGGCACGCCTGCACTGGCTTCATTCTCTTCG
+TGACCAAGGCATGTCTGGTGTACGATGGGGGTGAGAATTCAACATCTGAAGTCACACCGG
+CAGCTAGGCTTGACCAGGTACACCGAGTGTACGCGGCGTACAGTAGCAGGGTTAGGTACG
+TAGTGTCTCTTCTAGTCGGCGAGGATGCCAACTGGCCGAACCCAATCGGACTAGTTCACG
+TCTACCAGCTGGCAGTCACGCCCGGGCACCCGAAAGACATGTTGTCTTCGGATGACATTC
+ACTCAGTTTTGAGCACACCCACCGCGAGGGTGAAGAACGGCAGGTGCACAAGGATGGATG
+CACCATGTCAAGTCAGTTGCTTTGCCCGCCTTGATGATTTGCACGAGTGTAGGCGATGCA
+AGTGCCGGGTGACGTGCGCACTGTGCATCAAGGCATTGTGCCTAACAGGTTACGCGCATG
+ATGGGAGTAGAAAATCGAACAGCCAGGAAACTACGCCTGCTACCGGGGGCGATGTACTCC
+ACGCTAAGACGATGGGATCCGAATACGTCGGTGAATTGCACGACACTGAATCTATAGTGG
+GTGCAAAGCCGATTGACTTGGCACCTGTAAACGTCGATGTGCGTTCCGAGCTGGTTGAAC
+TCGCAAGCAATCTGCTCAAGATGAACGGTAGGCGACCTAGTGCCCAGGTTAAGAAACTGA
+GCGTGGGCGACACTGACGAGAACAGGAATGAACATGGCTTCGAAAGTTTGTCTGAGTCGG
+ATAACAACGCACAAGAGCTCGATGCAGAATCAAGCGGTGATGTCAGCATGGTAGGTGAGA
+TAAGCGAGCAGCAAGTTAGGGATGCAATCGCTCACTCGGAAGCGGAAAGTCGACTGTTCG
+ATGACACAGCTGACGTGGATGACAAATTGTTTGAAGCGTGTTCGTACGTACCGGGTGACG
+CAAGCGAGGTTGGGGTATCGGACGTGGACGTGACTCCTAAGAAGAGTGCGATACGACCAC
+CAATATCATCAAGACGCTCATCCACGCCCACGCCTACCACGTCACGGGGGCTGAAGTTCG
+ACGTTGATATCATTGCAGACATACTACACGAGCCACCGAAAATGTGGGACCAGTCGCGCG
+AATTCGTTGAACAAACGGAACCACCGGTTAGCTTAGAGCAATGCACGGCTCTGGTGCCGA
+TGCACGCCGGTTTTGCGATGCCAGTGTGCAGCAAATTGGGCTACTGTGACATACTAAGCG
+ACAAATCAGCGCTGCAAGACGAGCTCGTGGTGAACGACGAAATCATCAATTTCAAGGTGC
+CAGAGCAAGAAGAAGCCGAAATGTCGGCATCAATCTTTGCGGTTGAAAGGAGTGGTGAGT
+GGATCAAGTTATTGCCACAGCGGCAGAAGCTGAAGCTCAGCTGCGGGCGAGATCACTCCA
+TGACAGGGCCCCACTGGTGTGTACTGAAGAAACAAGATGGCAACTCGTCACTGCGGAAGA
+TAATCAGTGATGCAGGCATGACGGACAGACTAGTAAGGTCACAGTTGATACGCAAGATTG
+TCCCTGGGAGACCATCAACACTGTACCTACCAGGCAGTGCGATGTTCAGGGACATCACCA
+AAAACTGTGTGTGTGCAGGGTGCTCGTCCTTCAAGAGGACGAACGACCCAAACATGGTCA
+AACGCAGTGCTGTGGACTTCCCAATATGGCACTACGATCTGGGGGAGCTGCATTCATTGG
+ACATCAAGATACCGGAAGGCCAGCGCGATTCAATCGTCGGCGACCTGATGGAGAATAGGG
+GCGCAATGGAGCAGTTCTGTGCCATCAAACCCTGGCTGTCAAACATGCTCGGGTTCATGG
+TCAAACCAGGCACAGTGAACCAAGTCGGTGGGTACGGAGATTTTCACTTCAGCAACCCCA
+GGATAAACGTCAGCACGCACCCAATGAGCCATGAATCAAACTACAACTTGCCGCTATTCT
+ATCGCAAACCACTGGTAATGCACATCAACAAGATACATGCGTCGCTGCCATGTTGCTCAA
+TGGGTTACGGCGACATCCTGACGTTCCCTCCAGACCTGGAGAACGGGATGCCATTCGAGG
+CAAGGATGAGAATAGACAAATCGATTGTGCTGAACTCACACGATGATGAAACAAAAATGT
+TTCTCATAGCGGCGCTGGCGACATTACTGTGGCCTAGGCCAGGGGAAGAAGACCCACAAA
+GAGCAAGTCTGAGTTTTTCAGGCGTGATGCTCGGTGACATGAGGCATTACTCGATGAGAA
+GAGTAGTGCGTGATGGCAAACTGACGGATGACTCCGTGCTTCGCGCAGTAACGGTGTCTG
+ATCGAATGGACAAGGTGGAAAAACTGAGTAAAGTGAGAGTAAGCGAAAAGACATTGCGGA
+CGTGCTG
+>ds2020-267_4
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTCAGCTACTCTCAGCACGTCCGCAA
+TACTAACAGCTCAGCGCGTCCGCAACACGACTGGGGCACACGTCCGCAACGTCCACGACT
+TATCACTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGTTCGGGCTTCCTAT
+TCCGCTTTATTAAGGTACACTAAGTAACTATTCCTATTAACTCCATCGGGTCCTTAGATC
+CTTTGAGTAGGTGTAGTAGTGGGCCGCTTTTATTGGTCCCATTCAACACGTCCATCAGGA
+AGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCTTCTTTGTGTACCTTGA
+ATAACGCTCGCAAAATCTCGTACCGCTTGATGTTACCATTCCTTGAAACGTTTATGTTCC
+TTTCTTTTGGTATCACCGCGTCGTATGTTGCGCGCATTATTCGTGAAATGAAATCCTGCA
+AAGGTCTTTCAAGTTGTAGTGATGCTTTCACCATCCTGGAGTAGTCCACCACTCCCGGTA
+ACACGCCTATCTGCGTGGCACCCTTCCTGAAGCCCGACGACCGTATCATCCACTTTACGT
+CCGATCTCTTGTCTTCACTTATGCCCCCCACACACCTGTGGGAGGTCTTTATTTTATAAC
+AGTCTGAAACTGTCATGTGCAATCGCTCACATTGTCTCGAGTAGTATTTGTTCCTCAATG
+ACGCCGCTAACCACATTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCG
+CTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGG
+TTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGATCTACGCGTAGAA
+ACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGG
+CATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCAC
+CGTTGTGGAGGCTGTTTTGCGATTGTACCACGTCAGGTACTATCAGTTGAGTGTAAATGT
+AGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAG
+CGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCC
+GAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGT
+ACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAAT
+CTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCAT
+CGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGG
+CGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTGCTCC
+ATTCATACTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTCGCGCCACGAGTCCA
+TATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAGGTATATGTCTTTGA
+ATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATGCTGCCGGCCGCACTCCACTGCC
+ACCTACTCTGCCAGTACTCCCGCCAATCAAACTTCCTCGGTCTCTTACCCGCTGAGATCG
+ATCTACTGAAGAGCTGCGAGGCCCTTTCATAAACCAATCCCTCCGGCATCTCGGCCAAGT
+TAGGGGACACCCTGTTCTTGTGCTCCTCCTCCCAGTTGACCAGTCTTGATTTGCGGACGT
+GCTGCTCCTTAGATANNNNNNNNNNGGACGTTCGGGCTTTGCGCTGGCAATGGAGAACAG
+TCCTGACCCTCTAGCGAGCTGCATCTCCTCGGGGGTGAGACCAGCTGCCCACAGTGCCAC
+GCCCGTAAGGAATGAGTTAGTAGCTTCTCTGGTTATTGATAAGGCCAGAGCTACGCTGTC
+AGAGTTGACTCCCAAAATGTCTACCACCTCCTTGAACGAAAAGTGAACATGATGCGACGC
+CGTTATCTTGGTGTGTTTTGCCGACATTGCTTCATGTAACTGCCACCCTCTGCCTTGCTG
+TCCATTTACTTTCCTCAATAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATC
+GTAAAGACCTGAGGTGTGCCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCAAGA
+TCTTTGCGGACGTGCTG
+>ds2020-267_5
+ATCGCACATGATAAAGCCCGATATCTAAGGAGCAGCACGTCCGCAACCCTCTGCCTCCAA
+CAATAAAGCAGATTTCTTTGCTCTTCTAACAGCTATTACTTACCACAATGGACCACCTCA
+CTTCCCTTTTCGAGCTTTTTGCTATCACACCGAAAACACAAAACAATCTACAGTTTGTTG
+GGATCTACCACAGACCTCCACACTCCGTTCGAGCAAACCTCCGCAACGTTGAAAAACACA
+AAATCACAGTCGCTCACGCCATGCACAAGTACCTTTACCCGCATGAAATCGACTTTGTTA
+TCAACCAAATGCGACGCTCAGACGTCACTGAAGATGCCATACTTGCTGACTTTTTCGACA
+ACAACGTCGAACCACTTGAACCTGTTCTTGACGAACACTTCGAACGTGGACTCTCCGCAA
+TGCTGGACGCTTTTCGCCCTCCGCAGAAATGCCTACCTGCCCACATCTATGATGTGCAGC
+ACCACTACCCATATAAATGGCAAGTGAACGCTGAAGCCCCCTTCTCCACCGATTCCTATT
+TCTTAGCGAATCGACCAACCTTCCGCGCAGTGTTTGAACGACTCGAATCGCTCTACACAC
+ACCTCGCAACCGATTGGCACCGCCGATACGGAAACAAAACCGACAATGATGATTTTATGA
+ATGATCATGTCCCTGCGAAATTTGGCCCTATGAAAGAAACAGTCTTCTCATGGACTCACC
+GATGGCACCACGTCATCAAATCCAACTTCACCGACACAGCTGGATTGTCTAAAGACTATT
+ACTTCAAAAACCGATACATCTTCCCAATGCTACTTCACACGAAGACAGCGATTGTCAAGA
+AAGACGACCCGAATAAGATGCGAACCATCTGGGGCTGTTCAAAGCCTTGGATCATCGCAG
+ACACCATGCTATGGTGGGAATACGTCGCGTACGCTAAGTTACAACCTGGAGCCACACCAA
+TGCTCTGGAGTTACGAAACCTTCACAGGTGGCTGGCTTAGACTCAACCACGCACTTTTCT
+CTTCATACATACGGCACTCGTACATCACACTCGACTGGAAACGCTTCGACAAGAAAGCGT
+ATTTCTGCATCATCGACAAAATTTTCGATGGCGTTGAAACATTCCTCGACTTTGACAACG
+GCTATTTGCCTACGAAAGATTATCCCGATACCAAATCGACTTGGACACAAGAACGTTCCA
+CCCGCCTCAAACGCCTGTTTGACTGGACAAAAGAGAACTTCTACCATGCACCAATTGTCC
+TACCCAATGGGCACATGTACGTCCGAAAATTCGCTGGAATACCCTCTGGCCTATTTATCA
+CTCAACTGATCGATTCCTGGTACAACTACACCATGCTCGCAACCATCCTATCCGCGATGG
+GCTTCGACCCTCGGTCCTGTATTATTAAAGTCCAAGGTGATGACTCAATCATCCGCCTCA
+GTGCACTCATCCCTCCGGATGCTCACGATTCTTTTTTAACTAAGGTCCAAGAACTCGCCG
+ACTACTACTTTCAATCAGTAGTCTCCGTGAACAAGTCTGAAGTACGCAACGAGCTCAACG
+GATGCGAAGTTTTATCGTACCGACACAGACACGGTTTACCATACCGCGATGAACTAGCTA
+TGCTAGCTCAACTGTATCACACGAAAGCACGCAACCCAAGTCCCGAAATCACAATGGCAC
+AATCCATCGGCTTCGCCTACGCTTCCTTCGGAAATCATGAAAGAGTACGTCTCGTACTAC
+ATGATATCTACGAATATTACAAGCATCAAGGCTACACACCCAACCGAGCCGGACTCAGCC
+TCGTCTTCGGAAACTCTCCTGACCTCATGATCCCGCACTACACACTTGATCACTTTCCCT
+CAATCAGGGAAATAAAAATGTTCCTGACTAATGCAAAATATGCCAATGAAGAAACCAACT
+CACGAACGTGGCCTTTAACCCACTTTCTCCATCTTCCTTGTCATCGCACTTAGTATTTGA
+GCAATTGCAATTACAACATAATTACAAAAAAAGGATTGCGGACGTGCTG
+>ds2020-267_6
+TGAGGCTATTGTGCTGTTCTTCTGACAGCCTGGAACCTATCATCACTGACGCTGATTCCA
+ATAGTGCTATTGCTAGTGTGTTGTTTTACTTGCCTGGGAGCCGCAAGCGGCTTGCAAAGC
+CTGGCGTTAATTGTACGTGCACCGGTTGCCTACACCGACGTTGACGGCGCTAGCTCTCCC
+TCAGCTAACGGGTCGTTAGTGACCAATTCTTTTGCGCCCATTTCGTGCTTGCTTGTCTGG
+GAGCCACAAGCGGCATTTGCAGCCTGGCGAGTTATTTGATACGTGTACCGAGTGCCTACC
+CCGACATTGACGGCGCCAACCTTCCCTAGGTTGACGGGAGCCACAAGTGTTTCACACTCA
+TGGCTCTAATTACAGTGGCCTTTGGCCCAAGTTGAGCCTATGTCTCGTTTGCGAGTAGTT
+CGTCGCCACTCCTATCCACCCCATCACTGTGGTATGTAGCTTGAACCTCCTGTTATCGAA
+CAGTGCTTTCTCCTCGCCTCTTTTCGCCAGCGCGAACGTTAGTGCTCTGGCGTGCCACGC
+TGACGGTATGCCTCTAAAGACTCCCGTCACGTCGCCCCAAAAGTGGTCGTTGATGGCCAG
+CGTGTTGAACAAGCCAGCTGCTTTGGATAAGATGTACTCACGTGACTGTCTTATCCTTTC
+CAGTTGACCCGTCACGGTCGCTAAATGCTCAAGATCGTCCTTGTTCATCCACCTGACTAT
+CATTCCATAGTTCTTGAGGACACCTTTTGGTGCTATGGCTGCTGCCACGGCTTGCGCAAC
+TCTTTTGTGGTACCGCCGTATGCCTAGTGCCTCTACTAACTGTCTCGCAGCAGTCTTGAC
+TCCTGGTTGCTGCGCCAGGTAGTCGACTATACCACCACGTGCGCTGGCAGTTCGCTCGAT
+AGAGTACCCACTCCACTCGTCTGCCTTTCGTGGTCGCGCAGCACACCCACCCATGACGTT
+TGGCAACACCAGAAATGCGTCCCAAGTCATGGCCGAAATTGCCCAGCGTGCACAAGCCCC
+TGCAATTTGCAGCTTCATCACGTCGAGCAACACGGTTCTCGTTGCATGTCTGACAACCAT
+TTCTGCACCACGTCTCATGATGGAACCCACGAATGCCACAAAGTCTGATGGTTCATCAGC
+CTCAATTCTACCATGTATTGCAGTAGCTGCAGACCTCGCCAGATACTGTGACGTGTTTGC
+GTTCTTGTGTGAGATCCTTAAAAACTCTCTCACACCCTGCAAGAAGCACTTCGCTAGTTG
+CAGTGTGTACCCAATGAACGCCATCGCTTTCTTCATTTTGTACACGTCAATGTAGCTGGC
+AAACGCAGAGTATACATCATCGCCAGAGTGTAGTGACAGTGTTTTGATCCCGGCGAGTTC
+TTCGGCCACCTTGTAGTATGCCCTGTTGAGTATCGTGTTATACAACATCGTGAACCTCGT
+TCCTGAAAACATGCCAACCGTGACCGTCGCTGCTTCCACCATGGTGCCGTCACCCTTCAT
+CATTTGGTTTATCCACCCTTCTTGTCTCCCTGCCGACAGCAGTTCCTCTGTGACCTCACC
+TTTCTTCACTAGTACCTTCTGGTTCAACTCAGCTTTGGACAGCCATTTGAGGCACTTGTG
+CTGTTCTTCTGACAGCCTGGAACCTAGCATCACTGACGCTGATTCCAATATAGATGCCAT
+CACCTCCTGGGTGTGCAAGATGTTAAAGTTCCTCGCATCTATGCATGCAACTACTCCCTG
+AGTAGACATCTCCATGACTCGTCGGCACACCCTGTGTGCATCGGCTGCCTTGCCGATGGG
+GCAGTCAGCTGGCAAGTACTCTTCAATCTGCCCAAGCGCTAAGCCGTTGCGGACGTGCTG
+>ds2020-267_7
+CAGCACGTCCGCAAAGTTCGCTCTCTTCATTGAGCTAATTGGTTAAAAGTCTACTTGTTA
+AGTAGCATTCACATCAAGGAAAGAATTTCGTCAAAATGGCATACCAAAAGCCCGACAAAT
+CGACCGTCTCCGGCACGACTCTTACGCCAGATGACTCAGCCTCACAAGCTGGTCCACAAA
+ATGATACCCCCAATCCTGCGAAGTCCGGACGCCCAAAGCGTTCATCAAAGATTTCAAAGG
+GCAAAGATCTACCTCCGGGTGCGATCAAGGTACCAAAAGGTGGCGCCAACATGACGGGGA
+AAGCATCTCCCGTACAGTCTGCAACCATTCCATTTCGGGATGGGGAGAAATAGACCTCAA
+CTCTCATAGAAATGAGATTGAGCCGGTCTTCACAGTCGACGCTCAGCCGTATGACGACCT
+TGTCAACGTGGTGTACTCATCACTTCAGTCGCGATACTCAAATGCGGCGAAGCACATCCC
+GTTTGGCCTCTTCCGCTACTACTGCATGCAATTGTGGTGGTATCGGGTTCTTTTTCTGCA
+TCGCACGAACGGCAATGCTCTCACATCTGACGAACGTCAGTTCATGAGCATCATGGAGAC
+TGGACAAGAGTTCCAAATCCCCTCCCAAATAGCACAGTATCTTGCCAACCTTGGCAATTT
+CATGCAAGGAGGAGAGAACTTCTTTTTCCGCCTGCCCCCACACGCCTTCGCCGAAGCAAC
+AGGCACTATCCACTCAGGATGGTTTGCCTCTGGTCTTCCCACCGCCAAGGTGGACACAAC
+TTCCTTCTGGAAGTACGCTCAACTTCCGAGTCCGGGCGTTTTCGTGTCCTATATGTGCAA
+CGAAGCACATTACAACACCCCTGGCCACCAGCCCAATCGTCTCTTCGATCTCTCAGAGAT
+CGCCCCCACCATTTCCGACGACAGTTATTCAGTTCCGACTGATAACATCGTTGGTTGGAG
+TAACGGCATTTACACTGCCACGCACGCCTCCTGGCGTTCGACATACTCCAATCTTGGCTG
+GTCAATCGACGGTTGTGCCCTTGACTCTCAGACAACATTCATGCTCTCGACATCGACCAT
+GCGTGCCGTGTCTGACCGTATTGCGTCCGTCACCGGACTCAAAGTGAACACGTCAACACA
+GTTGACACTCTCTGTGCAAGGCAATCCCCTGGATTGCTACTACCTTGCAACTGTGGACTA
+CGCCTCCAACCGCTCTCAGTGGCCAAAGGCACCTGGTCCTCATCAACAACAGAAAGTGAA
+CGGCTGTTTGCACACAGAACTCGCCCTCCACTCCCGCTACGCCATGGACTCAAAAGTCCT
+ATCACCCGCGTTCTCGTTCGGATATCGCCTAGAGCGATCGCTCATCTGGAACGGTACATA
+CGATACCGACAGACGTCCGGTCCACGCTCAGGCCAGCAACTATCAGCCCTGGCTGATACA
+GTCTGAAGCCGACGACAAATACCGCGATCCTGGCCCCGCATGGATGGCCCATATGAACGA
+TTCGTTCAATTTTGGTTCTTCATTGAACTTGAATTTACGACGATTTTCGACTCATGGCCT
+CATTCGTTCTGTCGCGCTTGACGCGTCCGTTGTCCTCAGTGACACCAAGTAGAAACTTCT
+TCTTCTACTACAGCAACTCTCTCTCTTGGTAAAGCTCACTGGTAACCGGTCCAAAACGAA
+ACTCTTAAAACAGTGGATACCCTCCGGGGCGCACGTCCGCAAGGGTCCGGCAGTTGCGGA
+CGTGCTACCCAAAGACCTTTGCGGACGTGCTG
+>ds2020-267_8
+CAGCACGTCCGCAAACTGGGGTGTCTGGTATGGTAACTTCTGTTTTTTGTTACTGATATG
+TCAATCAGTAAAGAACGCTTCCTCGAGGTGGAGTTCCGAATAGAGGGGCCGTGTTTCTTG
+ATATTTTTCGAAATCAGAAAAAGAACGTTGGCGTAGTGCTCTGTTGGAATAAGCCTCGGG
+TATGAACGCGTACTCGGGTAGGTTTCTATCTCTTCTTGAGATGAATTTCCGTGGCGAGGG
+TTGAGGTAGTAGCGCAGGGAAGAAAAATCCGCCGAAAGGATCGGTTTGTCGGATGGGAAG
+TGTGATTTCCTTCATCTCGAGACCGAGAGTGGAGAGATATTTGAATGCCTTTGAAGGCTT
+CTCTGCCACGTAGGCGTTGAGGGTTTTCTCTTGTATGCCGTTGGTGCTCATGATGTGTTT
+GATCGCATCATAGAATACATTGCATAGTTTTGGATCCATGCAGGAGTAGAGCTGTCCAAG
+TAGGCGTGCGCATGACTCGAGTGGTGAGTCAACTGGGCGTTCCGGGTAGATGGTGGAAGC
+GAAGATGAAGTCGTATGACCTTCGCGGTCCGGTAACTCGGTGGAAGTATCCGAGCCAGTG
+TATATTCTCAGGGTTATTACTGAGAATCGTCTTGTCCAGGTTAAGAATGCCATTGAAAAC
+ATCCTTTAAAACAACACCAAGTTCGACGAGATCAATCGGTCTATCTAGAAAGATGGACGA
+ATCATCTCCGTAGTAGTAGTCCTTAACGGGTAAGGCTCCAGTGACTCGGTAGATGGCAGT
+ACGCATTTGCACTGCGTTGACGATTGTGTCGAGAAGGTTGGTCCACATTGAACCAGATGG
+GATGCCAGTGCTCTTTTGTACTCGGAGACCGCGGGGTGTGCGTATCTTCGTGTTGATGAA
+GTAAGAGACCATGGCTTTCCATCGTCGTGCTGTTTGGTCTGAACGGACGTTCCATACTAT
+CCCTTCAGAATCTCTGACTTTTGAAAAGTCAAACCAATCAGAAATGAACGAGAATGTGTC
+TCGTATTATCCAATGGGTAACATTGGCGTCGAAGCGTGAAAAGTCGGTGGTGAGGGAAAC
+GATATTGTCGATCATGCTCCTCGCAAGATGCGAGTGGCCTGACTTCATTGTTTCCATTCC
+GATGCCGTAGCACGCGTCCTCTCTGTTGCAGAGTTCCTTCAATTCTGAGAAAAGAGGAAT
+GAAGAAGCGGGCCTCTTCAAGGATGACATCAGTTGGGTAACCCCAAACTGGACGTACTTT
+GACATTCGGTTGCTCACTTGCGACAACCCTGTTGAAAGCAAGGCAGTCGGGCAGCGACCA
+TGGGATTCCTCTTCCGATACTATCCCAAGCCCGATGTATCTTTCCGGTGGCAACTGGGTC
+TGCGAAGACCTCAGCTTTTGTCTTGTATCCTTGGTTGACCCAAGGGAAGCCGGGAGATGT
+CGTGGTGGGCATTGCGGAGTGCTTGGCAGCAGCTCCGAGGGTTAGCGGTATGATACGGTT
+AGCGGGGCGAAGTTCATCGAGTGTTTTCTTGATAATCGCAAGATAGTCACCATCAACACA
+CCGGGTGGTGGGTCGTTGGTCGTAATCCATGAGATTATCTTCGAGAACCGACTGGTCCGC
+GGACGGACGGTGCCATGTCGATGAGATGTTGCTAATGAAGTCACAGAGATCCGGAGAACC
+TGTCAATAGTTGCGGACGTGCTG
+>ds2020-267_9
+TATCTAAGGAGCAGCACGTCCGCAAGCCACGTACGGTGAAAAGAGAGCAGTCGCGCCTGG
+CGACTTGGGCTTGGTGGACTCGCTTGTGGTGAAGTCACAGATTGATTGGTGGCATTGCAA
+TGTCACTATGTGGGTGGCCGCTTACAAGTTGTCTGTGACGCTAGCTGCATCGTGTGGTGA
+CATGAACTTCAGTGGTGAGGAAGTTAATGAGATCATACAGTACACGTTCAGCCGCTCAAC
+ATACAGGAAGCTCGTAGCGAGCGACGCGGTGATGGACTCGACTAGAGACATTGCAGCAAG
+TGAGGTGACGCAGGCAGCGTCAACGCCAGTCAGGTGGGCTAGGCAAGTGAACCCAATCGT
+GCTGGTGCTCGACGATGTCGAGTACGCCATCACACGCAACGAAGTTAATGATGTCTTGAC
+AAAGGTATACGATAAGGTACACGCTGCAATCATGAAACAAGCTGGAAAAGGTTACGGTGA
+CTACAACAGTACTGGGCTTGAGCTGGTCTACAGCGAGGAGACAGGGCTATCAGCAGGTGA
+AACTCCGAGAGGGGTTTTGAACCCGGTTTTTGGTTACGCAAAGCTGGCAAATGGCGCAAT
+AACTGTGGAGCCATGCAAGTGCGCAGACTCAAACGCCGTACTCATGACGATGAGTGAAGG
+TGAGCAAAAACCAGGGCTGAGTGAGGTGTCAATCGGCAGCGAATCAGTCAAGGTAGTTAA
+ACGAAACAGAGGCGGAAGGACTTTGACCTATCTGATGCCAGAGACGATAAGCGGCATGGG
+GGCAGACAGGTCATATGTCTATCTTGCGGGGATGCACTTCAGAGAGGATGAGCTCAAGTA
+CTCACTGCCAACCCTGGAGTTCCTGTCACAGTTCACAACAAAGTACAAACCACTACAGCC
+GTCAGAAAGGTTGAGCAAGCTACGAGTGCTAACCGATCCAACTTCAACGCGAGTGCACCA
+CAGGCACATGTCTATGTTGACCGTGATGGCGACTTGCTGTCATGCGTGGGCTCCGTGCAT
+GGACACAGTGTTAGATTGGCCTGACATCACGAACACGTTTATGTCAGCGCTAATGCTAAC
+GATGGCTGCAGTGCCACCTGAACTGTATGTGCTCATGTGTGAATGGAACGGGTGGGCCAG
+CTGCAAAAGCATGGCAGAGTACGTAGTGACTGCGAAAGAACTTACAACAAAGATGAAAGC
+TCTAGACAACCAGGTGGCAATCGGCGATTTTGAGCTGGACCTGTCGCCACTGTTTGAGTG
+GGAGGTGTTGAATCACAGAGCTGTGACAAAAGGCATCTACGACAAGGAGCTAATCGAAAG
+ACGTGATGCAATGCAAAGCATTAAGCTCACGCCAGAGCAGCTCAGGCCGCACATCGATAG
+TGTATTCAGGGACATCAGTGCGATACTAGACAAGCGCACAAAGCATGGTGAGAAGTCGCC
+GATTTTTGCAAATTGGGACGATTGGTATGCTGATAGGGTGCAGGCAACACCTGCGGGATC
+AGCATTCACAGTCGAGGAGTCTCTTTTGCAGGCAAGACAAGTCTTAAAAGATAACGGCGT
+GCAGAACCTGACAAAGACACAAGTCATGGCGCAAATGCAGGATGGATTAAAACTGGATAC
+TCTACTCAGTCATGAGCCAGACATCATTGCGGACGTGCTG
+>ds2020-267_10
+CAGCACGTCCGCAATTTGGGTGGTCTGTTGAGACCATTAGATTGTTTCATTGCGTGTTGA
+ACGCATTGCGACAGAAACAGTTGAGTGGGGCTTAAAGTAGAAAAAAAGCAAACAACAATG
+GAAGGTCGTTCAGTAAAAAGAAATTAGAAAACAGAAAAAGAGAAAAACTCGGGGGTGTCG
+CGAGAATTTGCGCTTCTCTATTCAAATCTGAGTGCGGAGGGGGTGTGGTAGTAGCCGGAA
+ATCAACGGTGCAATGGTGTTGCTGACGTTGTATTGCGAAGTTCGACGACTATCGGGAATA
+CTGAAGATTGGTCCGACGTGGGTTGACTTAAAGTCAGGGCCAGAAGTGTCGGTGACATCT
+TTGTTGATGTCAGTCCAATCGGAGTTGAGCTGAGTGAGGATGCCGGCCTGTTCAGTGACT
+AGGTCGAGAAACTCTTCAGAGTGGAGGTGGATCGTAGTGATTCCAGTAAATTCTGGAATA
+TCATACCGGAGCGTGGAACCGGTCTGATAACGGACTTTGCGCGTGGTAACGGCATGAACA
+AGAATGTTCTTGTTTTGCCTAGTAGCCACGTACTTTGTACGTACATAGGAGATCCCAGTG
+CCAGTAGTGGTCACGGAGCCAAGGGAAACAGTGTCCTTGAAGAAATCACTGTAAGGCTGC
+ATGACGCGGATGACTTGAGCAAACCAACCGTAAGGTCGGTCAGCATGATTGCCGATGCCG
+CGAAAACCGAAGACCTGGTCGAGGTCGAGGGTATCGTCGTCGTCGGAGATGACATATTGA
+CTGTCACCGTCATTGGCGAAGGGGAGGGTGTTGCGCCACACGTTGGATGAGGTGGCGAGG
+CCGTTGAGGAGACCAACAGTGGTCTGGAAGTCGGACCGAGCACTAGGCGTAAGCATAGCA
+AAACGGGTCGCTTCGTCCTTGGAGGCGGGGGCGCCGAAGATCGTCGTATAGACGGTATCC
+GTGTGGGAAGCATTGGCTTGGACTGGGCCAGAGTTGACAGGCGAGATCAGGGAGATCAAT
+CGCATGAACTGATCAAGAATGAAGATCACATTCGGGAGAATGGTGTGAACTTTGTCTTGC
+CAGAGGAAACTGGTGCAGTTGATGTCATGGGCATTGGGTATGCCAAAGACAAGATTGCCA
+AAATTTTCGTTGGGGCCAGCGTTGGCGGCGAGAGACTGGAAGAAGATGGCGACAGGGCCA
+GGGATCTTCAAGTGTTCGGCCTTGAATTGGCTGTCGAGAAACTCGACAAACAAACGTTGA
+TCGTTGGTGATCATACCACCGTGAGATTGGTTCTTGAGAACCTGGTAGTAGAACAACACA
+GCGATGTAAAGCTGGGAGACGAAAGGGTGCCAGTCAGGGTTGGCGTCGGTGAAACGCTTG
+GTTCTGACCATCTGCGTGTCCATGATAGACAGGACGTAGAAGAGCTGAGTGGTGTCAGGC
+ACGACATAGGATATGTCATTGTGCTTGATGCCGAAGAAGGGGAGGTCGGAGACGCCTGAT
+AGCATCATTGAGAGACCCGGGTTCTTGGGGCCAGCGGAGCTTGCAGTGGGTTCGCGAGGG
+GCGAAACTCTTCTGCTTCTTGGCAGGAACCGAGTATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_11
+ATCTAAGGAGCAGCACGTCCGCAATAGATGTTGGGTTCCGGGGCTTGGAAGAAGTGGTGA
+AGCAAGTCGCTAAGAATGAGACGGCTTCTGGTTCTGACGTAGAGGCAGTTCTGGCTGACT
+TGGAGGTCATGGTATACGAGCGAGCTCAATCTAAAGACCTTGCTTGCAAAGGCGAAAAGG
+CAGTCGCACTACCGAAAGATGTGCACGCCAGCTCATTCATCCACGGCGTCTCGACGGGGT
+TCAAGAAGCGTCAGTGGGCGGAGGTGACGCTTAACAGTGAGAGTTTTTTGCCTGTCGATG
+AGAGCTTTGACATTTTTGATGGCGTGATCACAGCTGGCGCGTACTCAACTGAAAAACTAC
+TGATCAGCGCACTGCCTTGTGAAGAACATGTGTCAAATGGGCACGCTTCAGTGAACACTT
+TCGTGGTCGCGCCGAGAAACGGCAAAGTCAATTTCAGGGACGTGATGTCAGCTGATTCGG
+AATACAAGAACATGGCAAAGAACATCCTGACGATGCTTACATTTGCCAGTCTGGATGCCG
+AATATGAGAACGCTGAGATTGAAGGCTTCGTTAAGGCGAGGCAAACCTTCCCATTGATAT
+CGACATCTCACATTGCCGAGTTTGGACACGGGTCAACAACGAAGAGAGAATATGACGTGT
+CAACTGCTTCAAGCAACACGCTGATCAACCTCAAGACTAAAATTGATGGTGACCAGATAG
+AACTTGCTGGGTGCTCTGTGACACTGAAATGTGCGATACTGATCGCATATCAAGTCCATC
+CGGCTCTTTGGAATGATTTTTTTGAAGGGCTCGTACCCCCGCCATTTAGTGGCCAGCTCC
+CGAGCATGCAGGGCATTATGCGGCGGGCGATTGCGGAGTTAGACATCCAGAATGATGAGC
+TGAGACTATTGATCGCCGAGACAGCCGCTACAACTGGTAGAGTTTACGGCATGTCAGATG
+AGTCCATGGTGGAGCAGCTCACGATCTCATACGCCAGGGCTGTCCCTTTTGGCGACACGT
+TGTTCCCGAGGGACGGAGACAAATTGCCTGCTGCCGATGTATCTAGCTGGCAAGTCAGAG
+GCGTGCTCACGCTGGAACTAGCGTTCACTAGGCTATTCAGCTTGTTTGCGCACCAGACAG
+ATCGAAACAAGTACGAGAGGAGCACACACTACGATCAGCTCAGCTCGGCTGGTTTTGCAC
+TTTTTGCGAAAGACGAAGAAGGCCAGTTTGTTTTGCCTATCGCGTCCATTATTTCGACGA
+ACGTCTTCAGGAAGTCTGCGACTTCAACTGGCACTGTGAAGAAACAGTTCAAAGCAAGAC
+CAGTCGGACACGTATTGCGCGAATTAGTTACCAGTGACTTGCCACTCATGCGTAAAGGGG
+TAGCTAGTGCAAGGGACGTGTTGATGGCTGATAACCTACTAGGTGCCAAAGCAAGGGGTA
+GATACGCAACCGACGTCAAATCAGAGGGCAGTTATGCATGCTCTGTTGCCACAGAGCCGA
+ATGAGTATGTCTGCGGGCCACGTGACACAGATGGCTCGATGCTCACCAATGTGATGGCCG
+CCATGTTGCGGACGTGCTG
+>ds2020-267_12
+AACGATTGCGGACGTGCTGCTCCTAGATAATCTAAGGAGCAGCACGTCCGCAAGCACCGC
+CCGGTGGGACAAGTGACTAAGTGCACATGGTGGATGCCTTGGCGATATCAGGCGATGAAG
+GACGTAGTAGCTTGCGATAAGCTGCGGGGAGTGAGCAAACACACATTGATCCGCAGATTT
+CCGAATGGGGAAACCCGGCCGAAAGGTCATCGTATTCTGAATACATAGGGATACGAAGCG
+AACGTGGCGAACTGAAACATCTAAGTAGCTACAGGAAAAGAAATCAACCGAGATTCCCAA
+AGTAGTGGCGAGCGAAATGGGAAGAGCCTGCATGATTTAGCATCTTTGATAATAGAACGG
+AATGGAAAGTCCGGCCATAGAGGGTGATAGCCCCGTATATAAAATCATCGGTGTGGAACT
+AAGTATGCGACAAGTAGGGCGGGACACGTGAAATCCTGTCTGAACATGGGGGGACCATCC
+TCCAAGGCTAAATACTCGATATCGACCGATAGTGAACCAGTACCGTGAGGGAAAGGCGAA
+AAGAACCCCGGAAGGGGAGTGAAATAGAACCTGAAACCGTGTGCATACAAACAGTAGGAG
+CAGACTTGTTCTGTGACTGCGTACCTTTTGTATAATGGGTCAGCGACTTACATTCAGTGG
+CAAGCTTAACCGCATAGGGAAGGCGCAGAGAAATCGAGTCCGAATAGGGCGAAATCAGTC
+GCTGGGTGTAGACCCGAAACCAAGTGATCTACCCATGGCCAGGTTGAAGGTGCGGTAACA
+CGCACTGGAGGACCGAACCCACTAATGTTGAAAAATTAGGGGATGAGCTGTGGGTAGGGG
+TGAAAGGCTAAACAAACTTGGAAATAGCTGGTTCTCTCCGAAAACTATTTAGGTAGTGCC
+TCTTGTATCACCGTCGGGGGTAGAGGCTCTATTGCGGACGTACTAAGGGGGAAAATTTGC
+GGACGTGCTGNNNNNNNNNNCAGCACGTCCGCAACTCCCGACCCATTGCAAACTCCGAAT
+ACCGACGAGTGCGAGCAAGGGAGACAGACATCGGGTGCTAACGTCCGGTGTCAAGAGGGA
+AACAACCCAGACCGCCAGCTAAGGTCCCAAAGTACAGCTAAGTGGAAAACGAAGTGGGAA
+GGCTAAAACAGTCAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGC
+TCACTGATCGAGTCGTCCTGCGCGGAAGATGTAACGGGGCTAAGCTGTACACCGAAGCTG
+CGGATATCCTTTTAGGATATGGTAGGAGAGCGTTCTGTAAGCCTGCGAAGGTGACTTGTA
+AAGGTTGCTGGAGGTATCAGAAGTGCGAATGCTGACATGAGTAGCGATAATGGGGGTGAA
+AAGCCCCCACGCCGTAAGCCCAAGGTTTCCTGTTCAACGTTCATCGGAGCAGGGTGAGTC
+GGCCCCTAAGGCGAGGCAGAGATGCGTAGCTGATGGGAAGCAGGTTAATATTCCTGCACC
+GTCGTATGATGCGATGGGGGGACGATTGCGGACGTGCTG
+>ds2020-267_13
+CAGCACGTCCGCAAGTGCCAGGGCCTCTTGGAGTGTTAGAGTCGTTGGCACAACACTCGG
+GTACGGATGCACAGGTCGTCAAGGTAATGTACTCTGACAACAACGACCAGGGAGAGTTCA
+CCGTCAGGCCACGTGAACTGAGCATGGCAATGAATGCACTGCTGCGTGGCTACGGAGTCA
+AGGCTGAGCAGTTCAACGCCGCCGTCGTGAAACTAGGCGAGACCGTTGCTCATGCGTTTC
+CCATGAGGTCAAAAACAGGATCTATCAGTGCGCCGGCTCTCGCGCTGAGATTGCNNNNNN
+NNNNCAGCACGTCCGCAAAAGATTGCCAATTGAGCACGTGTATGGGATCCAGGGGCAGCG
+TTCACTGAACGTGTTTGGAATGCAGAGCCCGCAAGACACAGGCATGTCGGAGAACATCAA
+TTATATGCCAAACTTGCTGGGTGCTTGCACATCGATGGCTGCTATGATGTGGCAGTCATC
+ACTCAAGACGAACAATGGTAGAATGCTGGTAGAAGATGGCTCTGATGTCATCGATGTGGC
+ATCAACGATGAGCGACACAGTGAAGACTTATGCTGATGGAGTAGAGGTGAGGAAAGATGA
+GTACTCTGCGATAGGTACTGGTGAATGGCGACAAGGTAGAGCAGCGGCAAGCTACTTCCA
+TGTGAGTGGCGTGAAGGAAACCAAGAGCATTGCTGACGCTGTCTCACGCTATGGAAGCAA
+TGCAATGGTAGAACATGCGGGTGTCAGAACAGCGGTAGGCACTGTCATCGATCAGGGTAT
+GGCTGGTGGCAGGGTAGCAACTGTCGCGGCCCACTCCAGAGAACTGACTTTCGATTTCGA
+TCGCGGTTCTGCGGTCAAGAAGTGGCACAGATTGCCACAAGTGCTGGATGAGCACCAAGT
+CACCCTTGACGGTGTTGGTGACGTGAGGGTGGTTACGGTAGCAGTGAATGTCGCTCACGT
+CCGTTTTGACACGTTCAGGGTGGCTGACGGTGAAGTTGGTGCAGCCGAGCTCAAGGTGAG
+GCGCACGCGTTATGGGATGGAATTGGGAACACTGGAGCACACGTTGATGCAGGCAATTGA
+CACGGCAAAGAAACCAATGACTGACACTGTCAACGTCGCCGCGACTGCAGGTATGAGCCC
+TCGCTCGGCATCTGACCTANNNNNNNNNNCAGCACGTCCGCAATTCAATGGCAGTGGCGA
+GTTCAACTCCAGGATACAGCATGTCATTGATCAAAGAAGCTGGTGCCAACGGGCCAGCAA
+AGATAACTCTCACTGGCAAAGTACCAGTGTGCACTGTTGGTGAGTTTGCGAAGCTGATGG
+GTAACATGACGATAGCGCCTGTTTCTGAAAAACCTGTCCCTTCCTCATTAGCCACATCTT
+GCGGACGTGCTGC
+>ds2020-267_14
+CAGCACGTCCGCAACCGGGTATCCACTGTTTTAAGAGTTTCGTTTTGGACCGGTTACCAG
+TGAGCTTTTACCAAGAGAGAGCGTTGTAGTAGAAAAGAAGTATTGATCTACTTGGTGTCA
+CTGAGGACGACAGATGCGTCAAGCGCGACAGAACGAATTAGGCCATGAGTCGAGAAACGT
+CGAAGATTCAGGTTCAAAGAAGAACCGAAATTGAACGAGTCGTTCATGTGTGCCATCCAT
+TCGATGCCAGGATCACGATATGTATTGTCGGCGTCAGACTGTATCAGCCAGGGCTGATAA
+TTGCTGGCCTGAGCAAAGACCGGTGATCTATCTGGATTGTATGTTCCAGACCAGATGAGC
+GATCGCTCAAGGCGGTAGCCGAACGAATACGCTGGTGACAGGACTTTGGAGTCCATGGCG
+TATCGAGAATGAAGGGCGAGTTCTGTGTGCAAACACGCGTTGACCTTCTGATTTTGATGA
+GGACCTGGTGCCTTTGGCCACTGGGAGCGGTTGGAGGCGTAGTCCTCTGTTGCAAGGAAG
+TAACAATCCAGGGGATTGCCTCGCACAGAAAGAGTCAACTGTGTTGACGAATTCACCTTG
+AGTCCTGTGACGGACGCAATTCGGTCAGACACGGCGCGCATGGTCGATGTGGAGAGCATG
+AACGTTGTCTGAGAGTCAAGGGCGCAACCATCTATGGACCAACCAAGATTAGAGTATGTC
+GCACGCCAGGAGGCGTGAGTGGCAGTGTAAGTGCCATTACTCCATCCAACGATGTTCTCG
+GTCGGAACCGAGTAACTGTCATCAGAAACGGAAGGTGAGATCTCAGAGAGATCAAAAAGA
+CGATTGGGCTGGGAGCCAGGGGTGCAAGAATGTGCTTCATTGCACAGGTAAGACACGAAA
+ACACCCGGACTCGGAAGTTGGGCGTACTTCCAGAAGGAAGTAGTGTCTACCCTAGCGTCG
+GGAAGACCAGAGGCGAACCATCCGGAGTGGATAGTGCCTGTTGCTTCGGCAAAGGTGTGG
+GGAGGTAGGCGAAAGAAGAAGTTTTCTCCTCCTTGCATGAAATTGCCTAAATTGGCAAGA
+TACTGAGCAATTTGGGAGGGTATTTGAAACTCCTGCCCCATCTCCATCACGTTCATGAAC
+TGACGTTCGTCAGAATTCAAGACGTTACCGTTTGCGCGATGCAGGTAAAGAACCCGGTAC
+CACCACAATTGCATGCAGTAGTAGCGGAAGAGGCCGAATGGGATGTGCTTCGCCGCATTT
+GAGTAGCGCGACTGAAGTGATGTGTACACCACATTGACCAGGTCGTCATATGGCTGTGCA
+GTTGCGGACGTGCTG
+>ds2020-267_15
+TATCTAAGGAGCAGCACGTCCGCAACCCAATGTGGCTCTAGGATGGTGGCACGGATCAAC
+GGTGAACGTGCTGGCGAGGTGGTACGCGGTGGACACCGATAACGAGTGGACACCTCTGAT
+CTCGAGGAGGTTCGCAGAAGATGCCAAGAGCACGGACGGGAGCTACGAGGAGACGCTAGC
+TTACTGCTTTACGTCACACATGTTGGCGGAAGGCGGAGCATATTTGACGATAGCTGCGGG
+GTCACAGTGGTCAACAGTAGGGGCTTCAATTGTGTCAGGGGCCGCCGTGCCAGTTGTGAC
+ACAAAAATGGGCTATAATGGATTGCTCCAGAAGCATAGACAATGGAAACAGCGACGGCGC
+TAGGCTAGGAGACCTGATGGCAAAGATGGTGCGAGAAGGCACGACAGCAATGGTCAAGAT
+TGATGCCGTGGTGCAGGTACGCAGCATGCCCACCGTGATGGAGGGTAATAGAGACACGAA
+TGCCCATGCCACGCAACACAGCAATGTGGTGACGTCAGCAATAAACCACCCCATGTTGGC
+GTTGACAACGTTGTACTACGTGCCTGGAGAGCAACAAGTAGTAGACTCTGTGATACTGCG
+AACAACGGACGACACCCACAGCTCCAAGATAAGAGGACAGAATGCTATGGGAGGCGCTGA
+GTTGGCTGAGATATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGANNNNNNNNNNCA
+GCACGTCCGCAATCTTCGGGGCCTTGGTGATCCTGCAACTGACCCAGATGCTGCAACCAC
+ATAGTATGAAAGTGCGGGTGGGAGGGTGGCAAGACATCAATGATGTCAAAACTACGTGCT
+TCATCGGGCACGTAGCTTTCTTTTGTTTTTCTTTTGTTTTGTTTTTGTTTATTCATGCGT
+CTTTATCTCATTTGTATCGTTTACCTCTGATTTTGCGTGAGTGTTCTTCAGTCTTGAACG
+TGTGCACATGGCAGACTGTGCCAAGCGATGGCTTCGTTGGCAAAGTATTCGCTGAAACAA
+AAACAAAAACAGAAGATACGGAACGAGTAACCGGCGTAGGTCAAATCAGCAAAACAGGCA
+GACGTGGCACCTGAGCTGGGAAATGGCACTTGAACAGGTGCACAACACGGCGAGTACCAG
+CCAAAGTACCGTTTTCACGAGGACGGTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_16
+CGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCCTCTT
+TGTGTACCTTGAATAGCGCGCGCAAAATCTCGTACCGCTTGATATTACCATTTTTTGAAA
+CGTTTATGTTCCTTTCTTTTGGTATTACCGCGTCGTATGTTGCGCGCATTATCCTTGAAA
+TGAAATCCTGCAAAGGTTTTTCAAGTTGTAATGATGCTTTCACCATTCTGGAGTAGTCCA
+CCACTCCCGGTAACACGCCTATTTGCGTGGCACCCTTCCTGAAGCCTGATGACCGTATCA
+TCCACTTTACGTCCGATCTCCTGTCTTCACTTATGCCCCCCACACACCTATGAGAAGTTT
+TTATTTTGTAACAGTCTGAAACTGTCATGTGCAATCGCTCACACTGTCTCGAGTAGTATT
+TGTTCCTCAGTGATGCTGCTAGCCACGTGGGCATGCCTCTCGACACCGAGTCGTCGAGGC
+GTGATTCCAACGCCTCTAGAAGGTCCCTCATGTCACTCGAAGGTTTTGATTCTATCCTCG
+AGTGTACTAAGGTCGCCATGGCCCTTGATAAATATTGTCCCTTAGATCCGCGCTTGTGAT
+CCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATAT
+TGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCA
+GCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATT
+GAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTA
+AAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGT
+TCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGTGCCCGA
+AGGTGTCTCTGTACGCATCTATCACTGCTTTCATTGACTGTACACTATGTTGACTGTTGA
+AGTCTTCAAAGTCTACGCAGTATTGAGTTCTACCCTCGAGAACCGCCCTCACTCTGCTAC
+GAACGTTCTCATCATTCGCAGCCTTGCCTACCGGGAATGGTGAAGGTAACACGTCTTCAC
+AGTTGTACAATTGCGGACGTGCTGG
+>ds2020-267_17
+CAGCACGTCCGCAAACCGACTTGGCTGACAGAACTGCCTACTTAGAGACCGTCAAGAGAA
+TCGTCAGTGATCGTGTGCTTGCTCGTGACAGGGCTCTGAAAAAGTACCAGCACTCGTGCG
+CACCGCAAGCAACTAGTGTCAATCCGGTGTTGGGAGCGCCAGCTCAGGGTTTTGGCGGCG
+TAGCAACTAATGACTACTACTTGACAGAGGGCAACTTGCTGCCCGTGGAAGAACATTTAG
+AAGCGTACGATGGAGTGTTGACTGCAGGCGCAATGTCGTCGGAGAGGATGGCGGTCGGTA
+AGGTGCCACTCAAAGCGCCAATGAGAGCAGGGTCTGTTACGGTCAACACTTTCGTGGTAA
+CGCCGAGGGCAGGAGAAGTGCGCATGGTGAACCTAAAAACTTCATTTAGAGAGACTCAGA
+ACATGAGTCGAAATGTGCTGACTGTTTTGACAGCAGCCAGTTTTGACGGCGAGTTTCTCA
+ACACCCCACTGGATGGCGTGATATCATTCAGAAGGCGGAGGCCGTTGATCTCGACTTCTC
+ACGTAGTCGAGACTGGGTCGGGCGTGGCCACGAGGCGAGAGTATGACGTGTCAATGGCAG
+AGTCGACGCAAATAATCAACATAAGGAAGAGTATGCGTGGCACGAAGATACGCTTTGCAC
+CTGGGACTCAACTTGTGCACTGCGCGCTGGTGCTAGCATATCATGTAGTACCACATGTTT
+GGAGCGCTGTCTTTGGGGACAAGGTGCCTGAACAGTACAGTGGGAAGACCCCGAATGCTG
+ACTACATGATTAGAGCTGCCATCGCACGTTTGGACTTCAAACCTAGTGAGCATCAGGTGT
+TAGTCGCCGAAGCGGCTGCAGCTTTGGCATGCGTGTATGGCATGTCTGACGAGTCCATGG
+TGGAATCGATCTCACCAGTTGTTTCTGTACTAGAGCCCACAGGTGACTTGGTGGTGTCCA
+ACATCTCGAGCACTGTTAGAGCCACGCAAGTGATCAAATGGCAGACTCAAGGCGTGCTAA
+CGTTCGAGCTCGCGCTAACTAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACA
+AGTACGAAAGATTG
+>ds2020-267_18
+CAGCACGTCCGCAAAGTGAAGCCGGTAAGAGGTCAGGCGACGTTGGCCAGAGCAAGGCTA
+TGGCTGCAGGTGACATAGGGAGAGTTGACGCAATGGTGATTGCGTCACAGACAAGCTGGT
+GGCACCCTGGCGTGACTATGTGGATTGCAGCCTACAAGCTAGCCGTAGCAATACTGGCTA
+GCGCCAAAACTCTGATGATGACCGAGAAGGAGATAGAGGCTCTTATCAACTACACGTTCA
+CAAGGACCACGTACAGGAAACTAGTAGCCAGCAACGCGCTAATGGATTCTACGAGAGACA
+TAGCAGCCAGTGAGGTGACCCAAGCAGCATCAACCCCAGTCAGGTGGGAGAGGCAGGTGC
+ACCCAATAGTCCTAGTACTAGACGATGCAGAGTACTCGATTACAAGAAAGACAGCTAGTG
+CAGAAATCACTAGCGTGTACGACAAAGTGCACTCGCACATGGCGCTAAGCCTTGGGTCTC
+TCTACGGTGACATGGCGCACACTAGGATGAAGCAGCCAAATAGGATTGGCACTGGTTTGT
+TGGCAAAATCAGGCAGGGCACAAAGGGCAAGTCCAGTTTTTGCCAAACTGAGATTGACTG
+ATAACACAGTGACAGTTACGGCGTGCCCTACATCAGACTCAGACGCAGTACTGATGTCGA
+TAAGCAAAGGCATTGAAAAGGCTGGCCTACACAACGTTACGCTGGGAAATGAAGTGGTGA
+AAGTTGTGAGGAAGCCTGAGTACGGCATGACACTGACGTACCTGATACCTTCGACAATCA
+GTGGGAAAGGTGCTGACAAGTCATATGTCTATTTGGCTGGCATGCACTTCAGGGAGGACG
+ATCTAACGTACTCTTTGCCTACGCTAGAGTTCTTGTCGCAGTTCACGACAGAATATGAAC
+CGGTCAAGCCTGACAAGCGGCAAAAGATGTTTCGCCTGCTAGTAGACCCAGTGACGACAA
+GGGTCCACCACAGGCACATGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGG
+CACTTGCGGACGTGCTG
+>ds2020-267_19
+CAGCACGTCCGCAATTCAACCTTCCTCGGTCTTCAGTCCATCAATGCCGTGGTGTGCCAT
+GCCGGCTTTCATACACCTTGCCATTAGTGACTGAATAGCACTTCTGTTCCTATCACAGAA
+ATTGGAGTACTCCCTCAGGTACCCATCCTCTGTAACAGAGTACTTGCTACTAATCGAGTC
+TACTTGGCTCACCACAGCGTGGTTTGAGCCAATTCTCGATTGTATCCTCATCGGCCTTAT
+TGACGCCCTGGATTCCATAGTGTGCAACAATACGGCATTCAGGATTATTTGGTCCTTGTC
+CGATTTGCCAGCTGCCTGTTGGTTCAGCAGTATCTGGCATGCATGTGCTGCGATGTCTGA
+AGTGACCGCTCTGGCCCCACCTAGCACTGCAATTGTCTTCAAGCTCTGCGGGGCGAAAGA
+CAGCATCATAGGGTCTTCATTTGGCAGGGGAGACATCATCGGATATACGCCCATTGCATA
+TTGCTTCTTCTGCACAATGGCTGACCCTACCCACTTCTTGAGATTCAAAGCTGCTTCCTG
+GTGGTCAATAAATCGTAGTTCATTATCACACACACAGTAGTTTGGATCCGCAAAAGCGTC
+TAGTGGGCTGGACCTCACGCCGGTTGACCTCAAGACCTTGATCATCTCCGGCTCTATGTT
+GACTTCGCTTGCAGAGCACATATCACTGATATCAGTTCGCGCAAGGTATCCTATGAAGTC
+TGCTAGCTTCTCATCAGGGTACATCACCCATGCACCTGGGTTCCCTCTTCCGCTTGCACC
+AGTTGGGCTGTTTGGTGCTCTTCTTGCTCGTTTGTGCTCCGGCAATTCTTCGCTGTCAAT
+GAATGGAGCGCCCTGATCATTCCTTTCTGACATATTCTCCATAAACATGTGGTGTGCCAT
+GTTTAGTTCTTATTTTCACTGTACTCCTTTGCAATTGAGTTCGTAAAGTAGTTTTGGTGT
+TTTATCGTCCAGCAGCTGAAAGATATTGCGGACGTGCTGC
+>ds2020-267_20
+CAGCACGTCCGCAAAGGCCCTCCCTTGACTTGATCTTAAATTGAATTATGGAATTCTCTC
+CCAGAGCTGCGGAACTAACGACTCTATTAGAAAGTAGAATTACCAACTTTTACACGAATT
+TTCAAGTGGATGAGATCGGTCGAGTGGTCTCAGTTGGAGATGGGATTGCACGTGTTTATG
+GATTGAACGAGATTCAAGCTGGGGAAATGGTTGAATTTGCCAGCGGTGTGAAAGGAATAG
+CGTTGAATCTTGAGAATGAGAATGTAGGGATTGTTGTCTTTGGTAGTGATACCGCTATTA
+AAGAAGGGGATCTTGTCAAGCGCACTGGATCCATTGTGGATGTTCCTGCGGGAAAGGCTA
+TGCTAGGGCGCGTGGTCGACGGGTTGGGAGTTCCTATTGATGGAAGAGGGGCTCTAAGCG
+ATCACGAGCGAAGACGTGTCGAAGTGAAAGCCCCTGGGATTATTGAACGTAAATCTGTGC
+ACGAGCCTATGCAAACAGGGTTAAAAGCGGTAGATAGCCTGGTTCCTATAGGCCGTGGTC
+AACGAGAACTTATAATCGGGGACCGACAAACTGGAAAAACAGCTATTGCTATCGATACCA
+TATTAAACCAAAAGCAACTGAACTCAAGGGCCACCTCTGAGAGTGAGACATTGTATTGTG
+TCTATGTAGCAATTGGACAGAAACGCTCAACTGTGGCACAATTAGTTCAAATTCTTTCAG
+AAGCGAATGCTTTGGAATATTCCATTCTTGTAGCAGCCACCGCTTCGGATCCAGCTCCTC
+TGCAATTTCTGGCCCCATATTCTGGGTGTGCCATGGGGGAATATTTCCGCGATAATGGAA
+TGCACGCATTAATAACCTATGATAATTGCGGACGTGCTGCTCCTTAGATAGAT
+>ds2020-267_21
+CAGCACGTCCGCAAATCCCGCTTGTTTCGTGAGTTGGCCATATTCCGGATAGAGCAGGCG
+CAGGTAGGTCTCCTCCGCTGGGCGGTAGGGAAGGGGGAGCTGAATGACCCCATCCACCAC
+TGGGTAGTCGGCTAGGAACCAATACTTTCCCAAGAACTGAATCCCTTGAAACTCCCCCTC
+AATGGCATCCAGTAGACGGGTGGTGGAGAAGGACTTCTTTCCCCACCAATCGATGGCCAC
+CATCCTCTGGACACACTCCGCAATCGTCTCCGTCGTGAGGTGGGCCAACCTGAGGGAGAC
+CGCCATGATATTGTCGTCCCCCAATGACTCCATCCATGCGTGCTCGTCAATGTTGTCGAT
+GGTGAGCCCCCCGTCCAGTTCGAAAAGCGCCGCATATCCGATGAGTAGGGTGATGATGGA
+CTGCAGGAGCGTGTTGTGGGAATGGCCACTTGTCGTGCCCACATACTTCTGCATGCGGAC
+CCCATCATCGCGATAGATTGGAGCCCGCAGCAGGCTTTCTGCCACAAAGGCCCAATAGGT
+GTCGTAATCGGGATTGTCCCCATCGTAATACTGCTTGCGACAGATGTTAATGGCGATGGT
+GACCATCCATTCATTGATGCTGGAGTCGAACTTCTTGGCGTCGAAGCAGAAGAACTTGTC
+GAAAGGCGCCATCCTGTCGATGAACTCCTGTGACCCCCCGTGGTACCATGATTGACCCAC
+CGCGATTGGATAGTTAGGGGCGGACCAGGCCTTCGTTAACTGGTTCTCTGTGACCCCACA
+CAACTTCAAGTCACGGTGGCTCATCATGAGGATCAGACGCCCCACGGGGGGGATCTTGGA
+TTCCTTGCGGACGTGCTG
+>ds2020-267_22
+CAGCACGTCCGCAATTGACTCTGGATCCGGCCTAACCGGAACACTGCCGAGTAGCAGTGT
+ATTTATAGCCCCGGCATAACCGGGACACCACCGCTGGCCAGCAGTGGTGAGAGCATCCTT
+TTCTAGGCTTAGCAAACCACATCTCCACTCCGAATACCAAGGTACTCAGAACGAAAATAT
+CGTTCGAAAGCTAACAAAAAGGAAAACTCTGGGATCAGGCATGACCGATGCTTGATTCAA
+GTAACCATCATTTCCCAAAGATGAATGGTCGCTGATTTGGGTGACGTGTCAGCACACGGG
+ACTACAGGTCAGACGTATGTTACGACCCTAACCAACTGCATTGCTAGCAGGATATAAAAG
+GTAAAGCTATCATTGGGATAGCTAGCCCTCCCCAACCGAATACATCAGCTAGCGAGAAAC
+GCGATACGGCTTACGACTGCAACGCCCTCACTATCGTAAGGCATACCGCTATCTCTACAC
+AAGATAATGCACCAGAAGGGGAAGTACTAGGTCTCCAGGACCCGGGTCGGGTCCGCTTCG
+TAAGGTAATACTTACGAAGAAACCGTTATGTGGTGGTTTTACGCCAGAGGTCATGAGATA
+TACGTATCTCTACAGACGGGCCTCGCTACTTCGTTGCCTGGGTGATAACGAGCACAAGGA
+CACCAGCCGATGGGGGGCAAAACCTCACCTCTCTCTACCCCCAAGAGAGGCCCAGCATGA
+CACTTGCTAGTGCCAGTTTGTGATCAGAGAGCCTCCTCCCCTTTGCTCGACTAAGTCGTA
+ACCTAAGAATGGAAGGTGGCGCTCCACTGATTTGCACAGGAGCTATGTTGCGGACGTGCT
+G
+>ds2020-267_23
+CAGCACGTCCGCAAGCCCACACTCAGCACGTCCGCAACGTCACAGGCATCAGCACGTCGC
+AACTTGGGCCTAATTGCGGACGTATCTAAGGAGCAGCACGTCCGCAAGCGCGGTATCACC
+GCACATCATAAGGGCGCTGAGGACGATGGGTGTTCAGGGGAATGAGCAAGGGGCTTTTTC
+CGACCCAAACTACTGCGTTCACGATAATCAGGTGCGGCGTATCGATAGGGTCAAGGCCGC
+AATGAACATGCGACGTTGGGTCGGGTCCGCTATCGTGCAGAGGAAAAAGACGTCTATGGG
+CACATACCCTGTTCTTTCACCGATACCAAATGACGACCCGATGATGATGAAATTTTCACC
+TTTCCCACTGCAATTAGAGCTTTACTTTGGTGGCAAGAGGGCAATGAACACAGACCAAGC
+AGCACAAGCGTGTCAAATAGTCATGAACCAGATGACAGAAGGCATGTCGTCTAAAGAGCA
+GGCGCTGATGCACACCGTACTGTTGCAGGGCTATCAGTCCAGGGGCTCAATTGCGCGCAT
+GGAGATCAAGTCGAGAATGGGGAAGATGAATCCCCCGATTGACTCAAACATGAGCATCAG
+CGATAAGTACTCGATGCATGAACCGGAGTATGAAGCGGCGTACGTACGCTTTTGCGACGC
+AAACGAAAACACTATAAGGGACTATATGGCCAGATGCATCAAGGTTGGCGTGGCTGCACA
+TGGCTTCGAGGGTACCAAGACTGAAGAAGCGGCTGCCATGGCGAAGCTGGCACGAAGGAA
+AGCAGGCACGTACGGTGAAAAGAGAGGCAATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_24
+AGTACCTTTTATCCGTTGAGCGATGGCCCTTCCATACAGAACCACCGGATCACTATGTCC
+TACTTTCGTACCTGCTCGACTTGTCAGTCTCGCAGTTAAGCACGCTTATGCCATTGCACT
+ATTAGCACGATGTCCGACCGTACCTAGCGTACCTTCGAACTCCTCCGTTACACTTTGGGA
+GGAGACCGCCCCAGTCAAACTGCCTACCATGCACTGTCCCCGACCCGGATTACGGGCCAA
+GGTTAGAACCTCAAATAAACCAGGGTGGTATTTCAAGGATGGCTCCACGCAAACTGGCGT
+CCACGCTTCTAAGCCTCCCACCTATCCTACACAGATCGATTCAAAGTCCAATGCAAAGCT
+ACAGTAAAGGTTCATGGGGTCTTTCCGTCTAGCCGCGGGTAGATTGCATCATCACAAACA
+CTTCAACTTCGCTGAGTCTCGGGAGGAGACAGTGTGGCCATCGTTACGCCATTCGTGCAG
+GTCGGAACTTACCCGACAAGGAATTTCGCTACCTTAGGACCGTTATTGTTACGGCCGCCG
+TTTACTGGGACTTCAATCAAGAGCTTGCACCCCATCATTTAATCTTCCAGCACCGGGCAG
+GCGTCACACCCTATACGTCCACTTTCGTGTTTGCAGAGTGCTGTGTTTTTATTAAACAGT
+CGCAGCCACCAGTTTATTGCAACCCCTTCGTCCTTCCCCCGCAGGGAGGTCAAACTACCA
+GGGCGTACCTTATCCCGAAGTTACGGTACCAATTTGCCGAGTTCCTTCTCCCGAGTTCTC
+TCAAGCGCCTTAGAATACTCATCTCGCCCACCTGTGTCGGTTTGCGG
+>ds2020-267_25
+AGTGATTCCAATCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCATCATT
+TTCACACGTAATAGTTGTATCACTAGGGGATATCCATATGGTAAGCGTACCGTCAGTCGA
+GGTATAGATTGTTTCTCCTTCGCAGTCAGGCGTGTATGTGAAGGCCTTGTTACAGAACGT
+TGAAAACGTGTCTGCGCCTGCATAACCGCCTGCCGCGACTATAGCATATGTAACTATGTG
+ACAGTCTACGTTGTTCTGATTACACGCCAAGTTGTCTACGATATAAGTTGCGGCGCCAGA
+TGACCCTGCGATGATCGAAGCTACACTCGGGCAAACGAAGGCGGCTAGTCTGCTCTGTGA
+TCCTAATCCGATAGTAAGACCGTTTCCCAGAGACCGGCAGCTATTGGTATCACGCTTACT
+GTGAGGCGCGGTATCAGTCGGGTCAGTACCCATGAGCATGTTGTGGACGTATTTGTGCTC
+CTCCTCATTACTCGTGTCCACAATTATCACCTGTCTGCTCGTGTTGTTGAGGTCGGGCAC
+CATCCACCTCATGTCCCACATTGAATCGCTGCCCTTCGTCAGTGCGCCAGCGCTGTCTAC
+GTATAAAAAAGCCCTGGCGCCCATTAGTCCGAGTGACCAGGCCAGCAGGAACAGCCCCAT
+GTTGAACATTGTTATCTCAGACGTGTATCACTCGATTGGTAGTTATCAAGTTGCAATCAC
+TTTAAAGCTATTATTTTCAGGGAGATGACAACGGTCAGTGCGTCGCCTTAAGCGTATCTA
+AGGAGCAGCACGTCCGCAATATA
+>ds2020-267_26
+CAGCACGTCCGCAAATCGCTCACAGTCTATGTTTGAACTTGTGGTGTCACTTTCAACCCG
+CGGTAGAGAGGTTGGAGAGCTTGGTTGGTGGACAAGAACAAAAGTCCGTCGATCATCATC
+TCCCCTTAAAGCCAAAGGAAGACAGTGATAGTAAACATATTACTAACTGCTAAGCACGTG
+CCCACCGCCGGGTGGGGGGGGTTATACCAGACATAGAGGAATACTATGTCAGAGGGAACC
+ACCCTGCTGCCTGAAGCCTTCGTGCAGCTTTTGAGGTGCTCTCGCTTTCTCCCGAGTTGA
+TGCATGTCAACAGGGAAGGGCCCGCACACCTCCCGTTCACGTTGAACGTTTCCCTTTTCC
+CACTGAAGGGACGGACGCTGGAGCTACGGTTGGTACTTTCGTACCGGTCGGCTCTGCTCG
+CCCGGAAAACGCTCTATGAACGGAAATGTCCTTGGAGGGTCGGTGGTTCGCCATAAGTCA
+GCAAACCACTACCAAGGACTAGTCGCTCATTCCATTAGCATTCTGGGTCTGGTTAGGACC
+CGCGCCCCAAGACACATAACCACGCTACCTATGTCTCCTGACTGGAATAACTAATGGACC
+GCGACGCATATCCGGGTGGTACCGTAATACCACTCTGGCAGACTGTGCATCGGTCTGTCC
+GGATATTGACTAGGAAGGGTTACAAGCTTGTAACCAGGAGCAGGACGTCAACCTGCCTTC
+CCCCATGCCCACCGTACTTACTTTGCGGACGTGCTG
+>ds2020-267_27
+ACAGCACGTCCGCAATTGATGCAGTTTCAACCTCGGCCCAGGCCTTTGTAGGGTTTGGTG
+GAGGCTTTGCCTCTTGAGTTTCATTGTGTTTTACATGCCGACGCAGTTTTTGATGCCTGT
+GGTGGAGTTTTTGATACAGGTCTTTGCCACCCTTACTACTCGAGGGTTCTGGCCTGACCA
+TAATGACTCTGGTGGGTCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGT
+CAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAA
+AATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGT
+TGCCTTCATTGATGAGTTGGGATTGCCTCACTATCTACGATCCTACACCCCTGTGGAAAT
+GACTAAACAGGCCCTGGACAAGTCTCTGTCTCTAATGGCTGAAGTCGGGTGGCCAGTGAA
+TGTGGCCACGGATGAGAGGGTTGATCCCATTGCGGAACGCATGGGATTCAAAGAGTGGGT
+CCTTTGTGGACGTGCTGNNNNNNNNNNCATTTGTAGAGTGGCTTGTCTGGAGATTCACTT
+GGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGC
+ACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCA
+TTCAGGGTG
+>ds2020-267_28
+TATCTAGGAGCAGCACGTCGCAATAATTTCCCCGTCAGCACATCCCAACACAGTAGCCTT
+GCGGACGTGCGCCCCAAGCAGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGAC
+GCACTGACCGTATAGCTGGTTCTCCCCGAAATGCATTTAGGTGCAGCGTTGCGTGGTTCT
+TGTTGGAGGTAGAGCACTGGATGGTCTAGGGGGCTTATCGGCTTACCGAAATCAGCCAAA
+CTCCGAATGCTGGCAAGTGTAGCGTGGCAGTGAGACGGCGGGGGATAAGCTTCGTCGTCG
+AGAGAGAAACTACAAAGCCCGAACGTCCTTACTTCCAGAGCACGTCCGCAAAGACCATCG
+CCTTTAAGTTGCGGACGTGCTGNNNNNNNNNNCAGCAGTCCGCAATCGAGTAGATCTCAG
+CACGTCCGCAAGGTGAGGCCCCTAAGGGTGTACTAAGTGGAAAAGGATGTGGGATCGCGA
+AGACAGCCAGGAGGTTGGCTTAGAAGCAGCCATCCTTGAAAGAGTGCGTAATAGCTCACT
+GGTCAAGTGATTCCGCGCCGATAATGTAGCGGGGCTTAAGTTATCCGCCGAAGCTGTGGC
+AACCTGTGTGGTTGGGAAGGGGGGGCGTACGGTCAGTGCGTCGCCTAGCGTATCTAAGGA
+GCAGCACGTCGCAAGGATGCATTCAGCACGTCCCAAGTTTAAGGCGGTGTTGGTTGCGGA
+CGTGCTG
+>ds2020-267_29
+CATGCGTAGGGGAAGTCCCCCTGCAGGAGGCCTTACGTCCGCAGAATTGGTTGAAGTTGT
+GTACCGCACACGCAAGTTGGGGTCCGTCGTAATGTCAACGATGACGATGCTGACTCCCCG
+TGCTGACATGCAAGTGAGTGCTCCCTGCATGATGTTTGAGGGGTTGAGCACTCCATCATC
+GAAAGCGCCCGGGTGAAAACCTCGAACCTGCTGTGAGAAGTTGTAAAACTCGCCGGCAAT
+AGGCCAAGACAACAGGGTCGCCGCCGTTGAGGCTTCATCAGGCCCTAACTTAATCAGCGT
+TCCTCCCGCGATTCGCTCTCTGACAGCCGTGTTGTGCATGTTCATGCGGGCCAAGAGCTT
+GAAGGCCCAGCCAGTCGGGTCAACATTGTCTCGGTACTGTGATCCCCTATTACCAGACGT
+CATCTTTGACGCCTCCTGAAGCTCGTGAACTGCAGCATTGCTCCGAACGGCGTCATTGTA
+CTGCTTGACATCCTCAGCTGCATCAGTGTTGACAATGTGGTGCAAGAGGACGTGAGCGCA
+AGATCGCAGCTTGTCAGCCGTCTTTGTCGTGACGGTAACGCCAACGTTTATGTTCCAGCC
+AACAACAATGGGGATGTTGTAGGACGTCTTGACAGGCACAGTGGCCTTCTTGTTGCTGTC
+TGTCATAGCAGCAGTGACATCGATGTGCTCGATCATGTTGAACGCGCTGACATTGCGGAC
+GTGCTG
+>ds2020-267_30
+CAGCACGTCCGCAAAATATTTCCCCTCAGCACGTCCGCAACAGGAGCCATGTCAGCACGT
+CGCAACTTACCTATTGATATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTGTCGACAACCTTGCAATCTCCATCCTATCCTCCTTGCTCTTCCTCTGCTCC
+TTCCTCGCCTTGACCTTCTTCCTCACCGACCCCTCAACTTGCCTGGAATGCCCCAAAATC
+CGATCCCCTGCATTCTCCTGGAACCTATGCTCGTACTCCTCTTGCCTTTCAATCTCCATC
+TCGTCCTCAGACACCATCTCCAAATCCTCCTCATTTACCTCGGGACCGCTTCCCTTGCTC
+CGNNNNNNNNNNAGCACGTCCGCAACAGCATTCTTATCTTTTTCTACCAATAACTCGCCA
+TTATCATCCTCTTCCTCCTCGGCAACGGCACTTAAGAATTCTTTCCTTCTGTGTTCTTGC
+TCTTCATCGTAGACCTTGGTGTTATTATCATCCTCCTTAAGTTCGGGGCCATCCTCGATC
+AAATGCTTAGCCACAGGGATACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCA
+CGTCCGCAAAAAGTCCCCGGTTCTATTGCGACGTGCTGGGCTATTGATCTTGCGGACGTG
+TGCCCGATAAGCATTGCGGACGTGCTGCCTCTCTCGACTTGCGGACGTGTGCTCCTTAGA
+T
+>ds2020-267_31
+CAGCACGTCCGCTATCTAAGGAGCAGCACGTCCGCAAGGGTTGGGCTTCGGCCACATACG
+TGCTTAGGATGCTGGCATAATGTCTTTAATCGACCCGTCTTGTAACACGGACCAAGGAGT
+CTAACATGCCCGCGAGTGTTTGGGTGGAAAACCCGAGCGCATAATGAAAGTGAAAGTTGA
+GACCTCTGTCGTGGAGGGCATCGACGCCCGGATCAGAACTTTTGGGACGATTCCGCGGTA
+GAGCGTGTATGTTGGGACCCGAAAGATGGTGAACTATGCCTGAATAGGGTGAAGCCAGAG
+GAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAATCGATCGTCGAATTTGGGTA
+TAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCTGCCGAAGTTTCCCTCAGG
+ATAGCAGAAACTCATGTCAGATTTATGTGGTAAAGCGAATGATTAGAGGCCTTGGGGTTG
+AAACAACCTTAACCTATTCTCAAACTTTAAATATGTAAGAACGAGCCGTCTCTTGATTGG
+ACCGCTCGGCGATTGAGAGTTTCTAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCG
+GGATGAACCGAACGCGAGGTTAAGGTGCCGGAATTCACGCTCATCAGACACCACAAAAGG
+TGTTAGTTCATCTAGACAGCAGGACGAAGGCCATGAGGTTGCGGACGTGCTG
+>ds2020-267_32
+CAGCCGTCCGCAATGAGTCACGGGCAGCACGTCCCAATGGGCCTTTGCTTGCGGACGTGC
+TGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTAGTTTATTACCTCTTTACTGTTC
+AAAGATCAAAGAGAAAACCATTCTGTTATTCTGTTATTACATTACGTGGATACACATTTT
+CTATGGGAAACAACATAGACATTGTAGTTGTCCAACGAGATACTGCACATACTAATGTCT
+TGGGCGAGTCATGCGCACTTACCGTTTGTTTTATTATTTTAGAAATTTTATTTATGTTGT
+GCTTGTTTTATTGAACCCATTTCATATCATGGTTCAAACGTTAAAAATCGACTCCGAAGA
+AGTTCCCGTGGATCATTTGTCAACTGCTCAATCAATGACTTCTATAATGGGTATAATAAA
+ATGGGTATAGTATAATAAAATAATCTTTTTGTTAGCATTCCGACGAAGAAGTCATTGATT
+CTTTTGATCGGGATTCATATTGAAAATAATCAGAAATCTAGGAATTATAATCGCTTTTAA
+TCGCTTTCGATTATTTAAAATTAATTGAAATCAACACAAATAGATAAAGCAAAGAAATAG
+AATTGGGACATTATATACATTATCACTATGTATATTCTATATGTATATATGTAATTGATT
+TCCCTATAAATAGGCCAGGAACCACAGACGGTCAGTGCGTC
+>ds2020-267_33
+CAGCACGCCGCAACTATTGATCGGTAGCACGTCCGCAACGTCATGTCCCTCACACGTCCC
+AAACCAAAACCATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACC
+GTTGGTCTGCCCCCCCCCAGATCTCTCAAGTGGAAGTCTGACAAAATCTGCTAACTGACG
+GGACAATTGTTGGTGATACATAGCACCAGCAGACTCCTTGGTAACAGGCGATATAATACC
+AACACTCAGNNNNNNNNNNCACACGTCCGCAACCAATCTTGCATCTCTTGTTTGGAACCC
+AATTCTTCATCATTTTCCGCACTGGGCTGAGAAGTCGAGCCAGATAAAAGTTTCTGCCTC
+ATTTTCTCTGCTAGCATCACCATCTCTTTAGCCTTACTCATGAGAGCATTCAAGTCCTGG
+AAAGCGTCTTGCAAGCTCTTATCAGTACTCTCCCACATCTCCTGCTCCTTCCTTAGAATC
+CCTGACACTCCAACCATCCTCACCGCCCCTTCCCTCGTATACATCCCAGAGCTCGACCCA
+GGACCCTCCAGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAA
+GTATTCAAGCCTCAGCACGTCCGCAAACTCCCGGGGCAGCACGTCCCAAGAATCACACCG
+TTCAATTTGCGGACGTGCTG
+>ds2020-267_34
+CAGCACGTCCGCAAGCCAGTCGCAGTGCCGATGTCTCCTGGTTGCGTGTACGTTAGGCAA
+AACAGCCACAGGTTGTCAAGCTACGTACAACGAGACCTGTCGTACGGCAGAGATCAAGTG
+GTGAGAATGCTAGGGCAGAGGGCAGGCTGCATTGCCACAGTAGATGGACACGAGGCTGTG
+ACAAGCCCACACGACTACCCTGCGTGCGTGGTTGATTGTACTGCATATGAAATAGGTTTG
+GTGAACACGAACGCGAGGGCGCTAGCACTCGAAAAACCATCTTTCTTCAGCCAAGCCATA
+ACGCTGTGTCGGGACACGTGGTCGTTCAGGAATGTCAGGGCGTTCTCGTATAACCCGGAG
+GAGGTGGAGTCAATGATAAGGGCGATCAGCAGGAGCGACGAGTATGCAACCATGTTGTAT
+GCTTCTATGAATGATGGCACTGCACCACAAGAGCAAGCAGTCACCCTGGAGGAATTGATC
+ACAAATGCGTGCAGAGACGAAGACATGACATCGATCAAAGCGGGAGCTGGCCAGCGAATG
+AGGCATGAGCACAGGCTGTTCATGACAATCGTGGCCGGTGTCGTGGATGATATCAGGGGA
+TTGGAATTGGGCATAACACCGGAGGTGCGGTACGCGGCCAAAGAGACAGTGGCATTTGCG
+GACGTGCTG
+>ds2020-267_35
+CAGCACGTCCGCAAAAGTTGCCATCTCAGCACGTCCGCAACAGGGTGACCTTGCGACCGG
+AGCCTAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCATA
+TTGGGCCTGAGTAAGCGGACGAATAAGGAGAAGAGGGATTGGAATTATGGTTAGGGTTTG
+CGGTAATTGTCGGTGGCAAAGTGGCATAACTGGGAGCCGATTGATTCTGATCGTATGGCG
+GATGATACGATTGCTGCTGAGGCGGCGGTTGATAGGGCGCATGGGGCTCAAATGCAGGGA
+CGTTGCGGACGCTCTGACCCAAAGCTTTTGCAGACGTGCTGACGGAANNNNNNNNNNCAG
+CACGTCCGCAATATAAGGGAGGGAAAGAAGGTGGTTGAGGTGTGGGATTGAAGGTTTGCA
+AATTAGGGCTGGAGATTGGAGGAGGGGTATAGGAAGGAGCGGTGGGAGGGGCAGGATCAG
+GATTCAGAGAATACGGAGGGTAAGATTGGGAATAAGGCGAGTAATCGGAGGTGCTACGGT
+CAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATAGATTATCAGTCAGC
+ACGTCCGCAAGCTTTTTTCCTCAGCACGTCCACAAGACCCTAGTTGCGGACGTGCTG
+>ds2020-267_36
+CAGCACGTCCGCAACTACGACACGTTTTTGTAGCGCTCCCTGGCCGTGTCTGCGTTCTGC
+ATTGCTCGCGGCAAACACAGCAGGTTGTGTGCATGATCAAGTTGCAGACGCGTAACGTCC
+TCATCTTTTAGACACATTTGTGACCGCTGTGCCACGTGCACCTCTGCCATCGCTCTACCG
+CTGCCCAACATCTGGATGCTCGAGCAGATCATGCTGACCATCTCATCACCGTTGATTGAC
+GAATTCTCACTGATCTTGTTAAACTGAGGGCTGTTAGATGATGAAAACAGCCTGTCAACC
+GTTGGCTCGCAAAAGGGTTGTACCACTTTGTACACCCCTGCGTAAAACACGTCAGCATAG
+TCGTGGTGGGACAAGGCTGCAGGCTGGTAGGTAGACGCCACAGCTAGCGACGCCATTAAC
+ATCACGTTTTTAGAAGCCATGAAGTGCCTGGTCGTGACGTGTCCAATGAGGTCCAACATG
+TCGTTGATCGAGAAACCAACACTGTTGAACCAGTCTCTGTCGAGGTGGGGCGCTGACGAC
+CCTACACCTGCAATGAAGGACACATTGCACTCACTTGCCACCGCCATCAACTTCTGATGC
+CCCACAGCAGCCTCAATGGAAGGCGAGAACCCCGTATTTGCGGACGTGCTG
+>ds2020-267_37
+CAGCACGTCCGCAACTGTAATCCCCCAGCACGTCCGCAACATGTCCGCCGTCGGCACGCC
+GCAAACCATAGCTGAATGATTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCA
+CTGACCGTTCCACTTTTGTTCTATTTCACTCCCCTCCCGGGGTTCTTTTCACCTTTCCCT
+CGCGGTACTCTTCTCTATCGGTCACACAGGAGTATTTAGCCTTACGAGGTGGTCCTCGTG
+GATTCAATCGGAATTTCTCGTGTTCCGACCTNNNNNNNNNNAACACCTCTCAAGTGTTTC
+GTCTAGCCGCTAGATTCCATATCGCTGTCCCACAACCCCAGCAGTAAAAACTACTGGTTT
+AGGCTCTTCCCGCTTCGCTCGCCGCTACTAAGGGAATCGAGTTTTCTTTCTCTTCCTGCA
+GCTACTTAGATGTTTCAGTTCACTGCGTTGGCTCATACCCACCTATTTATTCAGCGAGCT
+GTATTTAGGGTTGCCCCATTCGGAAATCTCTGGATCAATGCCTGCTTCCGGCTCCCCAAA
+GCGTATCATACGGTCAGTGCGTCGCCTAAGCGCGTCCGCAAATTTGAGCCCATGTAAATT
+GCGGACGTGCTGACTGATCAAATATTGCGGACGTGCTG
+>ds2020-267_38
+CAGCACGTCCGCAAATACAGTTGCATCTATCTCCCCCTCAAATCTGACACTGGTAGAGGG
+TCGAGATTTGGAAGAAGAGAAAATGAAATAATAGTAAAGAGACTCAAACATGCCAGTCTC
+GTGGTAGAAACAAATGCAAGGAAAGGTGGAATGGAGATGGGCATCCGACAACTGGAGAAA
+AGGAATAAAAGATGGAAAAGAGTCAAAACATTAGGCACAAATGTGATGTGCTGNNNNNNN
+NNNGACGTGTATGCACACATAGAGAGAAAGGGATGAATATTGTATAGATAGGGTAGGTGA
+CGTGGACAAGTGTAAGAGGTGTTGAAACGGAAGCCAAGTTATTGGCGTGGGTGTGCATGA
+GAACGAAGAGATGAGGAGAAAACACCCGTGGGTAACACAGAGAAAAGTGAAAGGCAACAA
+GGGAGAAGAAATATATCAGACAAAAATGGGATGGAAATAGAGTGGAAGAAATAATTTAAG
+GAAATAAAGGGGAATAAAGTAAGAAGTATGTGATAGGTGGTGAGAAAAGAAACCATAAAT
+AAGAAAACACAAGATGTTGGCGTGAGAGAGAGAAATAGTCAAACAGGATAGGAAACGGTC
+AGTGCGTC
+>ds2020-267_39
+CAGCACGTCCGCAAACACTAACCCATCAGCACGTCCGCAAATATCCGGGTCTTGTGGACG
+TGCTGAGGGCCGGGTCCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTCTGCCTGGAGTTGGCTAGCGATTTCCTCTGCATGGGTAGGTGATAGTTGTGAT
+TCTTGTGCGAGGGACGTTAGGGGAGTATCCGCAGGTACTAGACTGGCGTAGCAGTTATCT
+AGAGTTGGTCGTGGACGATGCTGGCAGTTACTCGTCATCCAAAGCAGGTGTGGTGGACGG
+ATGCGTGATTGCGGACGTGCTGNNNNNNNNNNCAGCACGTCCGCAAATCGAGGTGGGCAC
+ACGTCCGCAACCGTGACTGTCCTCCAGAATAGGACTAAGCCCTGTATCTTGTAACGCAGA
+ATGAAGTTCACGCGGAGTAACATCCGCAATAGCAACTGTGGGGGCGATGAGGCGTAAACC
+GCAGTTCTGTAATGCAGGTGATAAGGGCTCACCCACGGTCAGTGCGTCGCCTTAAGCGGT
+CCGCAAGCTTCACGGTCTTCGAATTGCGGACGTGCTGAGGGGAAGAAGGTTGCGGACGTG
+CTG
+>ds2020-267_40
+TCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCTCGCTACC
+TGTACTTGCAAGCCCCTACTGCTGGTTGGCTGAATGAGAATGATATAGTTTCCCCTTCCA
+TCGTAAGCACGTGCGGTAAGGGGAAAGATCGTCCAGTTCGTTCCTCAGAATCACATACCC
+TGACGGCAGCCCCCGGAATAACAGTGTCAAATACTGACTCGGGTGCGATTATACATTCTC
+TCACGTTACAGTAGGGCGTAAAAAGACCCCTTGAACTTAGGTCTTCGAACACCACTTCGT
+GCCCGAAGACTCTGTAAGCGTTTGCTAGTCGCAAGGCATCTCTAGGCTCCATGACGAAAT
+CATCACCAATAGGTATAGACTGCATCCCTGTCAAATGTGAAATCCCGTCGTACCCATCAA
+CCACACAACCCGCTAACAATGCTCCCGAGACGTAAACAGGTACGGTCAGTGCGTCGCCTT
+AAGCGTATCTAAGGAGCAGCACGTCCGCAATCCGGTATCCCTCAGCACGTCCGCAACTGA
+TAGCTACTCAGCACGTCCCAACAGTCAACCCCTTGCGGACGTGCTG
+>ds2020-267_41
+TATCTAAGGAGCAGCACGTCGCAATAGTGACCCCCTCAGCACGTCCGCAACAGGTCCTCC
+TCAGCACGTCGCAAGAGTGTGGGTTTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAG
+GCGACGCACTGACCGTTTCCTCATTGCTCCATGTTGGGCGCACAAACTTGACATTCTGGA
+TTATCATCTAATAAATCACATGTAATAAAATTTTGTAACGTCATGTCGCTCATCATCGTT
+CCTTAAGTCAATTGTTTTTGGGAAGGTTAGTTTCTAAACCGCGTCATCGCTAGCATTTCA
+CTGTTACTGATAACTTGGGTTTTTTGGGCAATATCGACACGATTAGCAGATTTTTCATAG
+GTATGTTTGACGTGCCAATTGTTGCTCACCAGCGCCATTGCCATCGTTACCCTATCGGCT
+AAAACACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTATGT
+CTCGTTCCACGTCCAAAACCTGGCTCCTCAGCCGTCCGCAATTGACATCAGTTCAGCACG
+TCGCAAATCCATGCCCTTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_42
+CAGCACGTCCGCAAATTAGGCCGCCCCCCCCCCCTGACTGTACAAGAATATGCGGAGCTC
+AACATGTCTGGAAGCACAGGAGAACGTTCTTTTGCTGATATTATTACCAGTATTCGATAC
+TGGGTCATTCATAGCATTACTATACCTTCCTTATTTATTGCGGGTTGGTTATTCGTCAGC
+ACGGGTTTAGCTTACGATGTATTTGGAAGCCCTCGTCCAAACGAGTATTTTACAGAAAGC
+CGACAAGGAATTCCATTAATAACTGGCCGTTTTGATTCTTTGGAACAACTCGATGAATTT
+AGTAGATCTTTTTAGGAGGCCCCAATGACTATAGATAGAACCTATCCGATTTTTACAGTG
+CGATGGTTGGCTGTTCACGGACTAGCTGTACCTACCGTTTCTTTTTTAGGGTCAATATCA
+GCAATGCAGTTCATCCAACGATAAACCTAATCCGAATCATAGAGCCATTTACGGTCAGTG
+CGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAAGGGATTCTGACTCACACGTCC
+GCAAAGTACACCACCTATAGTTTGCGGACGTGCTG
+>ds2020-267_43
+CAGCACGTCCGCAACTACTCTCCCTTGCATCAGGCGGTGAAATGCGCTCTCTGCGTCGGC
+TTGTGCCAGGGGATTCGCCTCTTCCCTGGTCTTAAGTCCCATTGTAGCGTACTCAATGCC
+GGCGAACTTCTTGGGGTAGAACTTAACGGTGGCGAGATCTTCCACTGCCGGGAAGAAGAG
+GAAGTCGGGAAGGTCGAGTAACTTTGCCACTACATAGGCGGCCTTCTCTATGGAGTCGGT
+GTAGCGGGGGTCAGGGGTGTGATTTGGCCGATCGAAGTGGCGAAGGTGTGCCATCTCAAC
+TGGGGTGCAGGCCTTGACGAATGTGAATTCCTCCGGCTTGAAATTGTTGATGGGGGGGGG
+ATGGAGGAGGGTGTAGGCGACAACTTCGGGGTCGGGTGGCGCAATGTCGAGTTCCTTGTT
+TAGCTTCCCATAGGCTTCAACCCTACCGAGGATTCGTATATGTTGGAACATGTTGGTGAG
+TTCCATCACTTCGCGGGTCGCGGCCTCTTTGGACCTCATGGATCGCATACGCGTCCTACG
+CTTGATAGATTGCGGACGTGCTG
+>ds2020-267_44
+CAGCACGTCCGCAACATGCCTTGCCTGGAGACCAACCGCAAGGGGGGGTAGCCCTTCTCT
+GTGTTCTGGAAAGAACCAGACGCAAGAGCTACCTTACTTGTAGGGCTGACGGAGTCGAAC
+CGCCGGTGGTCACACCCTATACTCTTCTTGAAGTAGGACCGTCCTACCAATATATCTAAC
+CTTTTAAGCACACTCACTGATATATAGTTTTACTAGTTTCAGAAAACGACACCTAACGCC
+ACGTCCCGAGCCGGAGCTGTTTACCCCCGCCCCTTCCGTTTACGTAGACGCTACCTCGAA
+AAAAAGGCATGAACGCTTGGCATCTATCATCCACTAGTCCGTGTGCCTGAACCTCCAACA
+GACAGGCGGAAGAACGCCTTACCCTCGGCTTGATCGCCCGTGAAATCACAGAGCTTCCAC
+ACTAAGTGGTGTACCTCAGAGTAAGAACGATTTACCTATTATGGCTAACCGTAAAGGCCA
+AAAGTGAAACATAATTAGAGATCTAAGAAAGTCATATAAATAGAGTGAGTGTTGCGGACG
+TGCTG
+>ds2020-267_45
+CTAAGGAGCAGCACGTCCGCAATATGCCCCGTTTCAGTGTGCGTTTGTCCGTGCTAGACA
+AGGGTTTTTGGTATAGTGCCCTTGCCGCGTTGTAGCCGTCTTGGCTTGCCCATGCGTACT
+CCAGTTCTTGGTCATCTGCAAGTGTAGCTGCGGCATCCATTGCCTCAGCCAAGCTCTCTT
+GGTCAACGAATTGCCCACATTGCATAGCCGCGTAGGTTGCTGAAGACACTCTGGTACCAA
+GNNNNNNNNNNTCAGCACGTCCGCAAGACACACATGCTTTGACACCGTACCGCATTGTCT
+TCTTGTTGAAGCCACCAAACTCGTTGATTGGTCTGTTGAGGCTTGAGCTGGTAACCACAA
+CCTGATCAATAGTGCTTCCGCCTGAGAAGCTCAAACCAAAAGTTGCCGTTCCGACGATGA
+CTTGGTTGTTGTCGATCCTAGCTTGATGCCAGAACCTTGGGTTCGTTACTACACCCTTTT
+TCAATTTGATGCAGTTCAATGCTCTGTACAGGCACAAGATGTAGGGTTGCGGACGTGCTG
+>ds2020-267_46
+CAGCACGTCCGCAAGATTGACCAGGTGAGTAAGGATGCAGCTCCGTGGACCGCTCGTCGG
+GCCTGATAGGTGGTGGTATCACACCCTTCTCAAAGAAACCGTACGTGACACTCTCGCGTC
+ATACGGCTCCGTCCCGGAATCGGGACCTTTCTTTCAGAACCTTTGACCAACGGGTCCTCG
+AACCAACCTGTCCTCCCCCTCGGTAAGCGGTTTCTTTTCATTCATTCATTGATTGATTCA
+AGGTAGCTGTAGCTTGCTTCCAAGTCCAAGTGCTAGCGGTAGAAGCTAGTCGCCAGAAGC
+GAACTTCCGGGCCGGGAAGGAGCCAAAAAACGTGAGCGCCCCTGCAATCTTTCTAAAGCA
+ACAAGCGAGAAACCTTACTTTGAGAAAGAAGCGCCTTCTATTATAATATTAGTAAAGGCG
+TCTTAGCCTATCTATAGTAAGGGGCCTTTTCTTGCTCGTTAGCGCTTTCAATAAGGACGT
+TTAGGCTTTACTAATAGAATATATAGGGCTCTGCGCTTGCGGACGTGCTG
+>ds2020-267_47
+CAGCACGTCCGCAAGTTAATGGTATTGGATTGCGACGTGCTGAGGTCTCTTAATTGCGGA
+CGTGCTGAGACAGTGTGCTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCA
+CTGACCGTGTGGCCTTTACTATAGTTTGGTATTGGTGTTCGGTGTGGCTTGTGTAGGATA
+GGTGGGAGACTCAAGCGGGCACGCCAGTGTTCGTGGAGTCGTCGTTGAAATACCACTCTG
+GTCACTCTGGATATNNNNNNNNNNCGGGCAGGGAGACAGTGTCAGGTGGGCAGTTTGACT
+GGGGCGGTTGCCTCCTAAAATGTAACGGAGGCGCCCAAAGGTTCCCTCAGCCTGGTTGGC
+AATCAGGTGTCGAGTGCAAGTGCACAAGGGAGCTTGACTGTGAGAGTGGCAACCGAGCAG
+GAACGGTCAGTGCGTCGCCTTAAGCGCGTCCGCAACATACTCCTCGTCATTTGCGGACGT
+GCTGAGGAGGAACCTATTGCGGACGTGCTGAGGGACCAACTGTTGCGG
+>ds2020-267_48
+CAGCACGTCCGCAATACATCGCATATATTGGTAGTCCCCTCCTTAGTAAGCTGCAAACGT
+CAAGTGATATTGGAATAATGGAGTACCTGTACCTTGTTGATCAATCTCCGTTACGAATTC
+GAATGGTTGAATTTCCGTGTCCACTTGCCTAGTTATATCATCCAGGACAGTGTACCAATC
+GTTCTCGGAGAGGTAGGTGATAGGTGTTCCACTCAGCAATGTAATCTCTATGATTATATT
+ACCGGATCCAGTATCATATGTTATGCTAGGACCAGGGCCATTGGCATCACGTGCATCAGC
+TACAGCTTCTTGAATCTCTCCGTTGGCAGTTTCAAGGTCATCTTCGTCATAAGGAGGATC
+GTCTTGGTTCTCTTGAACTTGAACGCTAGACAACACAGTTACTCCAAGATCTGGTAGATC
+AAAGTATTCTATGTCACCTACTTCCTTCTTAATCAGTTGATCCTGAGAGAGAGGATTCTT
+AGCTGTAGCTCTACAAGTTACGAAAGCAGGCACGGTCAGTGCGTC
+>ds2020-267_49
+CAGCACGTCCGCAATTTAGCATAGGTACACGTCCGCAACACCCACTGCTTGCGGACGGCT
+GCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTACTATTAAGCTTTTTCCTACCCGG
+TTATTTTACCAGACATAGCGGGTTAGTATCCGTAAGCTATAACTCCCGCCCGTTGCCAGA
+GGCCGTTTAGTCCGGTAGACCTTTTAAAGTTGTTTTCTCTGTGTTTTTGTTTTTTTTTAA
+AAAATAAACCTCACATACAGCAACTGGTTGCCAGCCGATGTCACTCGGCCGACTACATCC
+CGTCCCTGTCCAAGGTTTTTAATACTGTGTTTTTGAAATTTGTAGTTTTAAAGACGTTGT
+TAGGAAGTTGAGGGCTAAGCGCTACTACCTTCCACACTACGTCACGTCCCCCGACTTGCT
+CTTAACAAGTCAAGCCGACGGACAGTAATCCGTCAACCGTTTAGTGATTCCAATCTACCT
+TGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCA
+>ds2020-267_50
+CAGCACGTCCGCAACGCCACCGAAGCCTACCTCGCCGACCATGTCTCGAATGTCGAAGCT
+ACCGCCCTGGAGATGGTGCGGGTGGATATAGTGGGTTTAATGGTTACTTCTTCTTACCGG
+AAGGGGTTGAACCAGACCCACTCAATACCGCCACAGCCCCTGATCCTAAGGAAGCTACCC
+CCAAGACGTTTGAGATCTTTCGTCGACGCCACTACCCTCATGAAGAGTCCAGTTAGACAT
+GGGTGCCTCACACAGTATCCCATCCTACAGCTCTTCGCCTCACGGCTCTCTGAAGCAGAA
+CTCCGCACCCTCGTAACCGAAGTGGGCGGAGATTCGACTGCAAGAGATATCCGGAGGGAG
+GCATTTGGCGCCGAATCCGTCACGAGGAACATCGTAGGTTTCATCCCGCTCGCCGACGCA
+TCCTCGCTAGCGTCCAGAACGGACTATGACAACATCATGGTCCAATACCAAGTTTATCTA
+TAATAGCCTGCTACATTTGCGGACGTGCTG
+>ds2020-267_51
+CAGCACGTCCGCAAGGAATTCCCCCTCAGCACGTCCGCAACGTATGCCCATCAGCACGTC
+CCAAACCCAACCCAATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTG
+ACCGTCGAGAAGCAACTAACTCGTTCCTAACGGGTGTGGCGCTGTGGGCGGCTGGCCTCA
+CTGATGACGAGATGATGCTTGCTAGGGGGTCAGGGCTGTTCTCCCTCGCAAGCGTCAAGG
+ATTACAAGCGCGAAGCTAAGCGCATAAGCGTGGAAGCAAAATCTCTACAAAACTTGGTAG
+ATGTGGACTTGAGAAAGTTCTTCGAACTAGAGGTGCTAGTCAATAGGGGACACGACGGTC
+AGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAAGACCTGAGTTTATT
+GCGACGTGCTGAGGGACTCGAGTTTGCGGACGTGCTGAGACGTAAACATTGCGGACGTGC
+TGCGCCTTAGATAGAGCGGA
+>ds2020-267_52
+CAGCACGTCCGCAATCGTTGCAGACTACAATCCGGACTACGATACACTTTCTGGGATTAG
+CTCCCCCTCGCGGGTTGGCGGCCCTCTGTATGTACCATTGTATGACGTGTGAAGCCCTAC
+CCATAAGGGCCATGAGGACTTGACGTCATCCCCACCTTCCTCCGGTTTGTCACCGGCAGT
+CTCATTAGAGTGCCCTTTCGTAGCAACTAATGACAAGGGTTGCGCTCGTTGCGGGACTTA
+ACCCAACATCTAACGAGGGCATGACAATTGCGGACGTGCTGNNNNNNNNNNCAGCAGGTC
+CGCAATGGGTGCCGCTTGTGCGGGTCCCCGTCAATTCCTTTGAGTTTTAATCTTGCGACC
+GTACTCCCCAGGCGGTCTACTTCACGCGTTAGCTGCGTTACCAAGACAATTAAGTCCCGA
+CAACTAGTAGACATCGTTTAGGGCGTGGACTACCAGGGTATCTAATCCTGTTTGAGGGAC
+CTGATGTTGCGGACGTGCTG
+>ds2020-267_53
+CAGCACGTCCGCAATCCCTTTCCTCTTCCTAACTCCTCCCCGGGTAGTTCCCAATGTTTG
+GCACTTTCCATACTTCGTGGGTGCAACATCAACAAATTCGCTCATGATCAAGTTACAACC
+TAAGATCTATGACCATATTATGTTAACTGTTCGTATTTCGTTCATTCCATCGGTATGCTC
+CCAGGTACCTGTAATTGTGATCCGTTTGCCAGAACTAAGGGGTCTTTCTGTGGAAACCTT
+CACGAACAATCGTCGTTTTTTGATGGTTTTTCCGCTTCTCACAGCTGCTCTTTCTACACC
+CCCGGATATCTGGTGCCAAACCGTCGCCCGTTTCCTTATTTCTTCGATAATAGAGTTGTC
+TATCTTTGTGGCATCGATTGTACAAGTTCGTGAAGAAGGCTGGACGAGTGGAATGAGGGA
+AAGCGGCTCGATCGACAAAAAAGAAGAGTAGCCCAACCCAAGAACCTTGCGGACGTGCGC
+TCCTTAGATAGA
+>ds2020-267_54
+CAGCACGTCCGCAAGGGTCGTTTGGTCTTCCAAGGAATCTGATCCTGAGAGAGTGTCGTC
+ATTAAAGAGTAGGTTTTACTCTTTCTTGGTAGGTTATGGTCGCAAGAGAGCTTCTGTGTT
+CAGGAAGATCTTTCTTCGTGAGAACCTAAGCACGATTTATTCGTGTCGGCGGTCTTTAAC
+GAGAGGTATGGGGATGAAAGTGACGGAGGAGGAGTTGAGGGACTGCGGTCTCCNNNNNNN
+NNNATCTAAGAGCAGCACGTCCGCAACAGGGCGGTGGTGGACGGAAGCCAATTGGGGCTG
+TTCCACTTGGGGTTTAAGCGAGTTTGTCACCCCTAGGATGACTCGTCTTACTGGTCTGAC
+CAGACGCCTCTTGTGGAAGTGGGTTTGTCTACGCCGGAACGAATCTGTTTTCGGACGGGT
+TCGCTTTTGTAAAGGAAAAGGACATAATTGCGGACGTGCTGGGGGCTATATTTTGCGGAC
+GTGCTG
+>ds2020-267_55
+CAGCACGTCCGCAAAAAAATCAGGTCAGCACGTCCGCAAGGGAATAGCCGTCAGCACGTC
+CACAAGATCACAGTTGCGGACGTGCTCGCTTAAGGCGACGCACTGACCGTACATGTATTC
+GTGCGGTACACATTTTGCTAGCAACTTCGGAGCCGCTACTTCGGGATGCGTACCCGGTGA
+CGGATATGCTCACTACGGAGGTTCAGCGTGGTTGAACTGCCGCGCGCTGCAAGAGTGCCA
+GAACGAGGGTAACGATGTAGTTAAGAGATCTGAACTCAATGTCACTAGCTCCGACGTTCG
+TGGAGCTATGTCTGGTGGTGTGGTGATGCCGGACTTTCTGTACGCGTACGGCACCACCTA
+CTTTATCCACGGACAAAACAAGTCCGGGGGTCACGTTGACGCTAAGATTTTTGACAACAC
+TGAATCTGAGGACTTGATGAAAGATCTGGTCAACATGACTGAAACCGACTTCGTTGCCAA
+ATAC
+>ds2020-267_56
+ACTCTGTATGCGTTCGCCAAACGCAACGCATCCCTAGGCTCCATGACGAAATCGTCGCCA
+ATGGGTATCGATTGCATCCCAGATAGGTGTGACACACCGTCATACTCATCGACTACGCAG
+CCAGCCAATAGTGCTCCTGAGACGTAAGCGGGTATGCAAGTCAGGCGCTTTGATAAGGGA
+TAGCCCTCCTCTATCAGCCTGGTCGCCTTGACTTCTTGGACTTCGGCAAGGTGTCCAAAT
+TCGAAGGCCAGCCAACACGAGTCGTTCGCGACAGTAGGAACCTCTTTCCCGAAAGGGACA
+GAGCACATTGCGGCTCTGCCTATTGGGGACATCATCATCCGGATTGCTACGGTCAGTGCG
+TCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGTCTTAACCCTCAGCACGTCCC
+AATACATTTTCCGTCAGCACGTCCGAAAATCTACCACTTGCGGACGTGCTGCTCCTTA
+>ds2020-267_57
+CAGCACGTCCGCAATACGTGGTCCCTCAGCACGTCCGCAAAACCTAACCGCTCAGCACGT
+CCGCAATGTGTTGACCCCGCTTAAGGCGACGCACTGACCGTCCGTAATCCGCTCATCCAA
+GCGGTACTATTCTGGGTTGCTACGGCATTCTTAGCAGTCGGTCTATTCGTGACACCAATC
+TTGAACGGTGGTAAAGATCCTAAATACCAAAAATTGGGTGTGGACATCATGGCGATTCAT
+CAAATCATGCCTGACAACTTAAACTTCTGGTTTGGTCACCAAGGTTATGAATTTATTGAT
+ATCGGTCGTTTCTGGCAGATCTTAAAATGGGTTGGCGTATTATTAAGGCGGGTACGGTCA
+GTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATTCCTTCTTCCTCAGCAC
+GTCCCAATAGTCCGTCCCTCAGCACGTCGCAAATGGAGGTCTGTTGCGGACGTGCTG
+>ds2020-267_58
+CAGCACGTCCGCAAGACAATATGGCTCAGCACGTCCGCAAGTCGACGCCCCTCAGCACGT
+CGCAACCATACCGACTACTTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGGTTGATTCTCTCCTGGCAAGGTGATAAAGGCACTGGCGTACTCTGCCAT
+GATGGCTTTACTGGTATGCATGGTATCGGTCAAATGCAAACGCGTCAACCCGCCATGCGC
+CACTTCTCGATCCATCATAAACTCAGGAATCACACCCACGGCTATACCGTTTTTTTCAAT
+CACACCATCGGCAACCGCGCCCATGCATCCAATCACCGCACCGCCATACACCAGACCTAA
+CCCCGCTTCAACCAACCCCCAAATTACGGTCAGTGCGTCGCCTTAAGCGAACGTCCGCAA
+GTTTTGAGGGGTGGGATTGCGGACGTGCTGACTCAGTAGTATTTGCGGACGTGCTG
+>ds2020-267_59
+CAGCACGTCCGCAAGCACACTTAATTGGGACGTGCTGAGTTGATTAATTTGCGGACGTGC
+TGCCCGATAACAATTGCGGACGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGC
+AAATGGCCATTCCTCGTCTCTGGATACCTAGGCACCCAGAGACGAGGAAGGGCGTAGTAA
+GCGACGAAATGCTTCGGGGAGTTGAAAATAAGCGTAGATCCGGAGATTCCCGAATAGGTT
+AACCTTTCGAACTGCTGCTTAATCCATGGGCAGGCAAGAGACAACCTGGCGAACTGAAAC
+ATCTTAGTAGCCAGAGGAAAAGAAAGCAAAAGCGATTCCCGTAGTAGCGGCGAGCGAAAT
+GGGAGCAGCCTAAACCGTGAAAACGGGGTTGTGGGAGAGCAATACAAGCGTCGTGCTGCT
+AGGCGAAGCGGTGGAGTGCTGCACCCTAGAGGGCAAGCTATTGCGGACGTGCTG
+>ds2020-267_60
+CGGATCTCACGCCCGATCTATCTAAGGAGCAGCACGTCCGCAAGATTTTTGGAGTTGCGA
+CGGCTGGGCCATATTCATTGCGGACGTGTGAGTGTAATATCTTTGCGGACGTGCTGCTCC
+TTAGATACGCTTAAGGCGACGCACTGACCGTGTACTTGTTGTTTCCATTCGGGTTGTTCC
+ATTCCATTCCATTCCATTCCACTCCATTCCATTGCACTCGGGTTTATTCCATTCCATTCC
+ATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCATTCCTTTCC
+GTTCCATACCATTCCATTCCATTCCATTCCATTCCATTCCGTTCCGTTCCGTTCCATTCC
+ATCCTATTCCAAACGGTCAGTGCGTCGCCTTAAGCTATCTAAGGAGCAGCACGTCCGCAA
+CTCTATCCTTGTAACTGGACGTGCTGAGGTACGGGCTTTTGCGGACGTGCT
+>ds2020-267_61
+CAGCACGTCCGCAAGGATGCACTCTCAGCACGTCCGCAATAAAGGGGCATGTGTTGCGGA
+CGTCGCTTAAGGCGACGCACTGACCGTCTTTTCGCCCTTGGGACACTCGATTCCCACCAG
+TTCTGGTACCTGATTGGCACATTCTTCATAGAGTGAGGAAACATCCTTAGCAACTTTTGA
+ATTGGGTTGTATTCTCAGGCTTCCAACCTCACCNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNTGAAGTCAACATGTTCTGTGCCAAGCAAACGAGGATCATTCTTCGTGAT
+AACGCTGGGTATCTTTTCACAGGGAGTTTCCAGGTGCCACTCGAGTGGTGTTTCCACCAA
+ACTGGAGGGCCACGAACACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGTAAGATTC
+CTTCGCACGTCCGCAATAGAGCTGTCTTTATTTGCGGACGTGCTG
+>ds2020-267_62
+CAGCACGTCCGCAAGTCTAAGCCCCTAAATCATAGTTAAGTGGGAAACGATGTGGGAAGG
+CATAGACAGCTAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTC
+ACTAGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAAACTATGTGCCGAAGCTGC
+GGATTTGACATTAGTCAAGTGGTAGGGGAGCGTTCTGTAAGCCGATGAAGGTGTATTGAG
+AAGTATGCTGGAGGTATCAGAAGTGCGAATGCTGACGTGAGTAACGACAATGCGAGTGAA
+AAACTCGCACGCTGAAAGACCAAGGGTTCCAGTCCAACGTTAATCGGGGCTGGGTGAGTC
+GACCCCTAAGGCGAGGCCGAAAGGCGTAGTCGATGGGAAATCGGTTAATATTCCGATACT
+TGTTTATAATGCGATGGAGGGACGGTCTTTTGCGGACGTGCTGA
+>ds2020-267_63
+CAGCACGTCCGCAAACTTTTCATTGCGGACGTGACGCTTAAGGCGACGCACTGACCGTCT
+ATATGCACCTCTCTTGTCTCAGAACTGGGCCGTGGAGATTCAGGAACTATGGGAGTTTGG
+GAAGACATGGTTTGGAGGAACCCTTATCTGCGCATTCGGTGGCGCAAGGGACAATTCAAG
+GTTAAGATCATCAAGGTGAGTGCATGAGGATGCCATTGTTTTGTTTTTGGATTTTTTGAT
+GTTTTTCTCTGAATTTGCCTTACTTGCGGACGTGCTGNNNNNNNNNNGGGACACTGACCA
+CCAGCACCAACCTCCATCCCCCGGCACCTGCCTTTATCACCCATTTCCCAGGTGAGGACA
+GGTGCTCAAAGAGGGGCAGGGTTCCTCTGAGGTAACACAGCAGGGCGGCAACAACGGTCA
+GTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATC
+>ds2020-267_64
+CAGCACGTCCGCAATGATACGCCGATATTTGAGTACCTTTCCCGAGCAGATTCTGCATCT
+TGCGTCGACCTTGGTATCGTTAGCAGACTGTGTGCGTGGTCAAGCTGCAATCGCTCAACG
+TTGTTTTTGTTCAGGCACACAGTTGCGCGTTGTGCAACGTGCACCTCTGCTAGTGCTCTG
+CCAAAACACAGACTCTGTATGGTTGAGCACAACATGGCCAACATCGCGTCACCATTTTGA
+GGTGCTGCGCTATTTAGTCTCAGGGTCTCCTCCGTGTTGTGAGCCATCATCAGTCTGTCC
+ACCGCTGGCTCACAAAAGGGTTGGTTCACCCTGTACAACCCTGCATACAGCACGTCAGTA
+TAATCGTGGTGTGATGCCGCTGCTGACTGGAAAAGTGAAGCAATGGCGGCCGACGCTACT
+AGCATCACATTCTGCAATGCCAGAGACTTGCGGACGTGCTGC
+>ds2020-267_65
+CAGCACGTCCGCAAAGTGTACCCGATGTCTATTGCGGACGTGCTGACGGGTGCTCCTTTG
+CGGACGTGCTGAGGAGTCCTGATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGA
+CGCACTGACCGTCACCTTCGTGCTACCATCATATGCCAAGGTCGCCAAACTATTGTCCAG
+TGAAGAGTTACCTGTGCCTTGACCATAAGAAGATTCCATGCCCCAAATGGCAGTCACAAT
+AGAGGCCGGCACACCATACTGATTTTCAATGCGATCAAGTAGGGCGCTTTGGCTGGCAAA
+ATTGCGCTGACCCCCACTAACACGACTACTCGACGCGGCACCATCGATATATTCCCAAGG
+CATTTAGCAACGGTCAGTGCGTCGCCTTAAGCGTAGCAGCACGTCCGCAATAGTTGATGA
+GTCAGCACGTCGCAACAGACCCACTTCATTGCGGACGTGCTG
+>ds2020-267_66
+CAGCACGTCCGCAACTTTCCTCTTGTTGTCTCGCCACATCGATGAGGTGCTGCTTGACGA
+CCGAGAACCCAGTAGCTGCAAAATCCTTACGTCGCTCTTTCTCAGCATCACTGACATTAA
+CGGCGTCAGCGTGCTCCAATTTCTGAGTTCCTTTGACGCTCAAGAAGCTGTTGACTACCT
+CCGAGGCCACAGCATCGATTCTTTTTCCTTCCTCTTTCACCTCAGCCTTGTAAGCTGCTT
+CCTCCTTCGTCATCATTTCTCCGTTGATATCAATGGTCTCAGGGAGACCATTCGGGTTTG
+CCATGGCTCGCATCTTCTTCTCCGCGGTCTCGCGCGCTTTCTGGTTCTTCTGTCGGCGCG
+CCATCTTGTCTCTGTCCAGCGGCGATCTCTTCGAAAAAAGAAAAATTTGGTCGTAGTTGT
+TGCTTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_67
+TCTAAGGAGCAGCACGTCCGCAACGGCAGCAAAAGCGCCAGCCGAGGCAGCACTGAACCA
+TGAGCAGCGATTGTTTGTCACCATAATGGCAGGCATTGTGGACAAGGTCAGGGCGATTGA
+GCACGAAACATCTGAGGCTGCTCTGTATTCCATCAAGGAAGCAGTTGCCATCGGGTGGTG
+GAACGCGTCGACGGTTGCCTCATTGGCAAAGTGGTACGCCTTCGACTCAAAGAATGAGTG
+GGTGACGTTGACTTCAAAGAAGTTGGCCGGTGATGCGAGAGGGGCAATCGGCGAATACCA
+ACTGCCAATGGCCCACTGCTTCTTGTCTGCCCTATTAGCGCAGTCACAGACGTACATCGT
+GGTTGCATCACAGTCACAGTGGGCAACGATCGGATCGACTATCGTTGGTGGGGGCGCATC
+TCCTGTGATCACGCAGCCCAAGGAAATTGCGGACGTGCTG
+>ds2020-267_68
+AGCACGTCCGCAAGTAGTGGGGGATTGGGACGTGCTACTGGAAGTAAGGACGTTCGGGCT
+TGCGTTGTCTGCTATAAGATAGCTAGTTGGGGGCTTTCGACATAAAAAAGCCTATCCGGC
+TTGGCTTCGCTATGGCTCATGACTTGTATTGTAGTCGTAGTCTTGTAGTCGGCCCGGAAT
+GCCTTTGTAGTCTTTCTAATGCTAATGCCTTCTTCCTTAGCACAAGCGCTAAGCGATAAT
+AATTCCTTCATTCATTTTTTTTTAGTTGCGGTAGCTTCCGCGCCAGCAAGATACGGACGG
+CAAAGCCAAAGCAATACTAAACAAGCGAGAAAAGCCCTATATATTCTATTAGTAAAGCCC
+GAACGTCCTTACTTCCAGTAGCTAAGGAGCAGCACGTCCGCAAGGCGAGGCAAGTCAGCA
+CTCCGCAAATAAATTAGGTTGCGGACGTGCTG
+>ds2020-267_69
+CAGCACGTCCGCAAGCCATTGCCACTCAGCACGTCCGCAACGACGGCCACCCCACGTCCG
+CAACGTTGATCGAGTTAAAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTAAGCTCCCTGGTTGTTGAGACCAGTTTATTGAGATCGCCTTCCAGTCGCCC
+CATATCAGACGATATGCCCTTCTCACATTATTTTGTAATTAATTTATTGTTTTACCCGTG
+TTTTTCCGCTGATTTACATTTTGCGCCCGGTTGCATTTTCCACCAATTGCCCCTGTCGAC
+CTGCCATAGGGCTTAACAAGTCAACTCATCCACCTTTGGTCATCATTCAACGACTTATGC
+AGCACCGAACAAGTCGCCGTCTACACCAAGGTGCGCGTATTTGGCAACGAAGTCGGTTTC
+AGTCATGTTGACCAGATCTTTCATCAAGTCC
+>ds2020-267_70
+CAGCACGTCCGCAAACCTATTTTTGTGGACGTGCGAGGCACTGATAGTTGCGGACGTGCT
+GACGGATCACGCATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACC
+GTCATGATGTGGATGCGCTGCGTTGGCGCGCTGACACCAGTTCTAAATTACCATCTGCAC
+TTTCTGCAACTTACAGCACATCTGCCATGGCAGTAGTCAATAACTTAACTTCGCGATGGC
+CGAGGCTCTAAGCGCCACCAGATGAAACTTCAGTGGCAGGTCACCGAGAGGAAGAAATTA
+CCGGTACCAGCTAACACAGCAGAGCCCTGCTGACACGGTCAGTGCGTCAGGGGTTCGGAA
+ACGGTCAGTGCGTCGCCTTAAGCGTTCCGCAATCACTCGCCCTTGTTGCGGACGTGCTGA
+GGGACTTATTGTTGCGGACGTGCTG
+>ds2020-267_71
+CAGCACGTCCGCAACCTACTCCAATTGGGACGTGCTGAGGCTTGGGAGATTGCGGACGTG
+AGGGTCAAGCTTTTGCGGACGTGCTGAGGTCTTTCCCTCGTGTGCGGAACAACTAGCCGG
+TCTTTCGAGATAGAGTAGTCGCAGGTACAGAAAGCATGTTCAATTCCTCCCGTAACGGGG
+TGGGTCCCACGCAGGTTCGTGGTTCCCTTACTCGAGAGAGACTATTAGTACAAGAAGGCG
+GACGTTGGTTGATGGCAAGGCACATGGTGTGATTCTGCCATTAGTCGTCATCCCTGTATG
+CCTGTGGAGGTCAGCCCGGACAGATGCATATATATGACAGCGAAGCGAAAGCGACGGTGG
+CTCCATACCCTGGAAAGGTGGTTACTAACTTTGCGGACGTGCTGAGGGTGCGCTGCTTGC
+GGACGTGCTGAGGGGTGGAATCTT
+>ds2020-267_72
+CAGCACGTCCGCAAGCTCAGTACGGTGTTGGAATTGATGTCCGTGATCTCAAAAATATAT
+GACATAGAAGTGAGAGAAGAATTTAAATTAGGCAGCAAGATCGGCGAAGCCGGAAAGGTT
+CAGACGTCCATGCTGAGTAACATGGTAAACAAGATAACCAGCTCCGTAGTGAGGGAATTG
+GCTGACAAAATAATAAGCCAGAAATCATTGCAAGATTCGGGGAAGAAGATGGAGGAAGAG
+AAGAAAAAAGAAACTGAAATTAGAGAGAAAAGAAGCGCATATGCCATGCTGTCTAACAAA
+TCGTGCCAAATAGAAACGGATGCAGAAGCTGAAGTTTGGAGAAACGTGGAGTGCAAAGGT
+AGGGCGACATGTTTTGACAAAACGTAGGGGAGTAACGTTGCGGACGTGCTGCTCCTTAGA
+TACCTTGCGGACGTGCTG
+>ds2020-267_73
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTTCATCTGACTTGGGACGTGCTGAGC
+CAAGCATGTTGCGGACGTGCTGAGGTGTGATGCCTTGCGGACGTGCTGCTCCTTAGATAC
+GCTTAAGGCGACGCACTGACCGTATTGTACCCGCTGCGATGTCTTCGAATACTGCCAGTG
+CGGTTTCCAGTGCAGTGGCGCCAACTTCTACTGGCAGTGCCCTTGCCATGATAGATATTG
+AATTGGCAGACTAAACCTACGACTGAGATGAATTTATGAAACCGCACGCCTCACTGAGCC
+AATCCCTGCAAAAACTAACCACGCCTCTGGGAACGGAGCTTGAACGGTCAGTGCGTCGCC
+TTAAGCGTGTCCGCAACCGATGCCCAATAGCTTGCGGACGTGTGACATAAATACGATTGC
+GGACGTGCTG
+>ds2020-267_74
+ATCTAAGGAGCAGCACGTCCGCAAATTCGTGGGGTTGATCATGTCACCTCTCGTTGCGTA
+CTCTGTGTAAGTGAAAGCCAGGGTAGTCTCAGGTGAAGTTGGTGGCAGTGCGATAGTTGC
+ATGCTCAACCATGGTTGACATGACTCTGTTGGCTGTGTTCGCGAGCACTGCATCGTAAGA
+GAACAACCATCCCAGTATGGGCGCTGACAACACCTGCAGAGACAGTGGTGCCCTTCCTTG
+CACTCAGAAGGCTTTGACTTCCGTGATGGCTCTTTGCATCACTGACCCTGTGTGTGTCGT
+CATGATCGCGTCAGCGACATCTCCACCAAAACGCTCGCCTGATGCGCAAGCAAGGTCTGC
+CATGCCGATGGGGTGCGCGTATTTCTCAGACCCAGCCAGTATTGCGGACGTGCTGCTCCT
+TAGAT
+>ds2020-267_75
+CAGCACGTCCGCAACGGTTTGGGGGTATGGATGGGGTATGGCCGTTTGCACGTGCGAGTG
+TTACTCCTTTGCGGACGTGCTCGCTTAAGGCGACGCACTGACCGTGTGCTTCCCCGTCCT
+GCCATAACGATATCGCTGACTTTGCCCGAGGTTTCTGGAATGTCTTGCTCAAGCATGGCA
+ATTTTCAGATTGCCACTGATTTGGAATTCGCCACTGTCAGCCTTGACTTGACCGCTAATG
+ACTTTAAACAAAGTTGATTTGCCTTCACCATTGCTAAGACGGTCAGTGCGTCGCCTTAAG
+CAATCTAAGGAGCAGCACGTCCGCAAAGGCCAACTGGTCACACGTCCCAACTGGATCTTC
+TTGCGGACGTGCTGAGGGCTAATGCTTGCGGACGTGCTGAGGCTGATGGGCTTGCGGACG
+TGCTG
+>ds2020-267_76
+CAGCACGTCCGCAATAGAACTGGGGTTAGTTTGGGACGTGCTGACCCCCTCGGTTTGCGG
+ACGTGCTGAGTCGTGGCATCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTGGGGTTCCGGGTTGGAGGCAACACACTAGGAACGGGAGCAGGACAAATAAA
+CCCGAAAAAGGCAGCGCATCCCGGGCTCATCTATGACATCACAGTGGATGACTATATCAG
+CTTCTTGTGCAAGCAAGGCTACAACAGCACCAACATTGGCATACTTGTTGGAGGCAAAAA
+GAACATCTGACGGTCAGTGCGTCGCCTTAAGCGAAGCACGTCCGCAAGACTCAACATTTT
+CGGACGTGCTGAACGGAATCCGCTTGCGGACGTGCTGAGCCTCTGGTTATTGCGGACGTG
+CTG
+>ds2020-267_77
+TAAGGAGCAGCACGTCCGCAATGGTCACGGGGTGTTAATTCATCCCCCCACCCCCCCTCC
+ACCCGCGAGGGGGGGGAGAGTTCGACTGTTCTTCACCGAGCAGTTTGGGTGATTTTTGCC
+GACCAATGCGCGGGTACGTGTGATATACTGCATTAAGCGCACGGATTATTGGGAGCAAGT
+GGTGGGAGGAACCGGCATCTATCGGGTACAGGCAACGATGGCCACTCCGGGACCCACGCC
+TGGCAACAGGATACAAGAAAGGACGGTCAAGGTTTAGGATCTGTGGTCCCGCGAGGGAAA
+TCTCCTTTACCTCATAACAAGCCGTACACTGCGAATCCCTTGGCACCTCGGTGCTTTAAG
+AGTTCATGACCAGCCCAGTGCAGTGGGTGCCTTCTTAGGGGGTCTAGTTTGCGGACGTGC
+TG
+>ds2020-267_78
+CAGCACGTCCGCAATAGACTATGGGTAGCACGTCCGCAACAGGTACACCCTGAGGCTTGC
+GGACACGCTTAAGGCGACGCACTGACCGTACCCGCCCTGCTCCCCACTGACATTCACAGA
+AGCTTCTGTCTCGCGGTAACGGGCGGTGGCGGTATTGCTGCTGACTTGTGGACTGACGCT
+TTGCACATAAGGCTGTTCTGCAACTGCATTAGCATTCTCGTACGGTTAAAGTATTGGTGC
+CTAAGGAGCTGATATCATTGAGAATTTTTTGTTGAGAGCCTTGCCCTAGACCCACTACCG
+ATACCACAGAGGCAATACCGATAATCACCCCCTGCAGAGCACGGTCAGTGCCTCGCACTT
+AGCGTGCGGACGTGCTGACGGGGATCCTTTGCGGACGTGCTGAGGGGCATTGATTTGCGG
+AC
+>ds2020-267_79
+CAGCACGTCCGCAATTTAGGCCAATTACGTTGCGGACGTGCTGGACTGGTAAATTTGCGG
+ACGTGCTGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTGGGTGAGTTGAGTTTTGT
+GCTCAATTCACAACAAGTGGTATCAGAGCTGTGTTGGAGCAGCAAGTTGCTAGAGTGTTG
+AAGATGGCAGGTGACAAGGAAGCTGAAGGTGAAAGTAGCTCTATGCTGCAGAGGCTGCCA
+CAATCTGTCAACATGAAGGTGGAGTTAAAGCCCTTCACAGGGAAGGAGAACTTCACGCTT
+TGGCAAAGGAGGATGAAGTCAGCCCTTACACAACAACATCTCCATGTTGTGTTGGTGGGC
+AAGGAAAAGAAGCCAACAGGTATGTACACGGTCAGTGCGTCGCCTTAAGCGGGACGTGCT
+G
+>ds2020-267_80
+CAGCACGTCCGCAATCCTAGGTGAATCTTGCGGACGTGCTGACCATAATCACTTTGCGGA
+CGTGCTCGCTTAAGGCGACGCACTGACCGTGTCTGGTTCGTTGTGTGTGTTTTTTTTAAG
+GCTTATCCGGGGGCTGCTGCTCTGGGGCATCCAATTCTTCTTCTTTCTTTTGCTGCTGAT
+CTCACAGCGAGAGCAGCTCCTTCTTGTTCAGGGTCATAAGATGAGAGATCTTCCTCCGAT
+TCCGAGAAATCGGTCAAGCGGGGGGCTACCCTCGGCTCACCTCTCTATCTATAGAGGTCC
+CTCCCCAGAGAGGGGCACGCGGACGGTCAGTGCGTCGCCTAAGCGATCTAAGGAGCAGCA
+CGTCCGCAATGATATTCCCCTCAGCACGTCCACAAGATCGCCTTTGCGGACGTGCTG
+>ds2020-267_81
+CAGCACGTCCGCAAATTAGAACCCGTTCCAGAGCTAATACATGCAAACAACATGACACCG
+CCGGCTCGCCGGAGGCACATGTGCTTTTATTAGATTAAAACCATACCGCTCTTGGGCGGT
+TCACTTTAGACGAATCTGGATAATTTTGGCTGATCGTATGGTCTCGTACCGACGACACAT
+CATTCAAATGTCTGCCCTATCAACTATTGATGGTAGTATAGAGGACTACCATGGTTGCAA
+CGGGTAACGGGGAATCAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACAT
+CTAAGGAAGGCAGCAGGCGCGTAAATTACCCAATCCCGGCACGGGGAGGTAGTGACGAAA
+AATAACAATACAGGACTGGTGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_82
+GCAGCACGTCCGCAATTTCCACCCCATTAGTGTTACTACATTGAGCTCGGTTACGGCCTT
+AGAGGCGTTCAGGCATAATCCAACAGACGTAGCTTCATACCACTGTTCGATCGAACAAGT
+ATTGTACCAGAGGTCTGTACCAGCGGTTCCTCTCGTACAACGCTAGTATGCTCTTGTAAT
+AACGGTTCATCAGTAGGGTAAAACTAACCTGTCTCACGACGGTCTAATCCCAGCTCACGT
+TCCCTATTGGTGGGTGAACAATCCAACACTTGGTGAATTCTGCTTCACAATGATAGGAAG
+AGCCGACATCGAAGGATCAAAAAGCAACGTCGCTATGAACGCTTGGCTGCCACAAGCCAG
+TTATCCCTGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAA
+>ds2020-267_83
+CAGCACGTCCGCAACTTCATGGGCCTCTTATTGCGACGTGCTGAGTGTATTATATTTGCG
+GACGTGCTGACGGAAGTATAATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGAAACTCCCCCCATCGTCAGCTTTCTTGGCGTCTGCAAGTTGTTCTATTT
+TTTCCTGAGCAGTCTCTTTAAGCATGGCTGCTTTTTCTTGAGCTGTTTCTTTTAAGGTTT
+CAGTTGTTTGCATGACACTGTCAATCACGGTGCTTTTATCATTAGTGCTATCTTTCGCAA
+GGTCTTTGCGACGGTCAGTGCGTCGCCTAAGCGTCGCTTAAGGCGACGCACTGACCGTAG
+TACACTCGTTACCACACGGTCAGTGCGTCCCCGACTATTCACGGTCAGTGCGTC
+>ds2020-267_84
+CAGCACGTCCGCAATGACGTTGGGATCTCCGTAACCGTGAATGTTGACTGGCTGAGCGGC
+TACCCACTGATTGTAACTGCGTCTCTGTCTGTTGCTGGTGCAAACTGCCTTCATCTGCAT
+GACCCATCCGAACAGCGCAGCAAGCATTACTGTTCCTGCTGTCTTTGCCGCGCTAACGCT
+GCTTGGTTCTATCGTTCTGAGTGCCTGTATCTCATCTGCATCAAGCTGCAGCCCACTTGC
+CGTGACACCAGCCACTGCTTTGCCATTCAATAGCTGTGAGACCACAGCGTTCTCACTCAC
+ACTGATGCCCTCATCTTCTGCCAGCACAGGCATCTCACCGATGACTCGCATGCTCACAAC
+CTCGTATGTGTTAACGATGTGGTATTGCGGACGTGCTGTCCTTAGATAGATC
+>ds2020-267_85
+GCAGCACGTCCGCAACCGGTCATCAGTTTGCCACGTTTCCCCCTTATCCAAGGTTTCCCC
+TAGCCGCAACTTGAATTGCCTGTCTTGTAGCGGCCTTTCATATGAATCGTGGAATTCTGT
+TTTCACTTCCTTCATCTTTCTTTGGTTGGGGTACGCCCTATCACTCTGATTCCAGTCCGC
+TTGCTGATCGAGAGTCGGGTAAACCGTCAACTGTTGTTGCTCCACCTTCTGGACACCCGA
+AACCGTTAGTGGCAAGGCAGCGTAGTCACTGCAATTCTTTCAGAACCTTCTTTCTCCATA
+TCTTAAGCACTAAGGGCCTGTTTTGTTTCTTACAGAATATGGGTATGTCCCACGAATGCT
+GGTTCCCGTGTATCGGGTCTACCCAAGTGCTTGCGGTTTGCGGACGTGCTG
+>ds2020-267_86
+CAGCACGTCCGCAACTTCATACACGTCCTCATAATGAAGCTACCCTTCAACTCCAAGGGC
+ACAGAGGCCTACATAGCCTCCCTCGAAGCCTCTCCCGTATTGCCACGTGTCAACTTCATC
+ACCCTCCCAAAAGTCCCAGACCTAGACAAGCACCTCAGCTCCCACTCCTTCCGCAACCAG
+TTCGTCGAAAGCCACAAAACCCACGTCAAAAACGCGGTCGCCGAACTCACCGAGTCAAAG
+TCCGAGTCAAGGCCTCGGCTTGCTGGGTTCGTCATCGACATGTTTTGCACAACAATGATC
+GATGTGGCGGATGATTTTGGGGTTCCTACGTACATGTTCTTCACTTCACCTGCTGGGTTT
+CTCGGGCTGCTGTTTAACCTACAAAGGGCCAAAATTGCGGACGTGCTG
+>ds2020-267_87
+GCAGCACGTCCGCAATAATGCGCCGCTCAGCACGTCCGCAATTGCAACCCGATAAGACTG
+GGGAACACCGATTGCGGAGATAAGGAAAGAGGCAAGGAGGGCGGTGAAGAGTGGGGAGGT
+GGTGTCGGTGGCGAAGGCGAATGAGGTTTTGTTTGAAGAGGATGAGGTGGTTGAGGAGGA
+GAGGCAGAGAGAAAGGGAATTGCAAGAGAGGAGTGAGAGGGAGAAAGAGTTTGTGGTGCA
+CGTGCCGTTGCCGGACGATAAGGAGATTGAGAAGAGGGTGCACGAGAAGCCCGAACGTCC
+TTACTTCCAGGCACGTCCGCAAACTACTCTGGCTCGCACTCCGCAAGTAATACCCCATAC
+AGATTGCGGACGTGCTGAGGGCCCACATCTTGCGGACGTGCTG
+>ds2020-267_88
+CAGCACGTCCGCAATTTTGGCCCCCTATGTCTTTTCACAATGTCAAACTAGAGTCAAGCT
+CAACAGGGTCTTCTTTCCCCGCTGATTTTGCGAAGCCCGTTCCCTTCGCTGTGGTTTCGC
+TAGATAGTAGATAGGGACAGTGGGAATCTCGTTAATCCATTCATGCGCGTCACTAATTAG
+ATGACGAGGCATTTGGCTACCTTAAGAGAGTCATAGTTACTCCCGCCGTTTACCCGCGCT
+TGGTTGAATTTCTTCACTTTGACATTCAGAGCACTGGGCAGAAATCACATTGCGTCAACA
+CCATTTTCTGGCCATCGCAATGCTATGTTTTAATTAGACAGTCAGATTCCCCTTGTCCGT
+ACCAGTTCTAAGTTGGGTGTTAAGCCTTGCGGACGTGCTG
+>ds2020-267_89
+AGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAG
+GCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACCGGGC
+TCATAGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGA
+GGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTG
+TTGCAGTTAAAAAGCTCGTAGTCGGACAATAACGGTCAGTGCGTCGCCTTAAGCGTATCT
+AAGGAGCAGCACGTCCGCAAACGATTCTCCCTCACACGTCCGCAATTTTACCCTCCTGAT
+ATTGGACGTGCTGACCGGTTGCACATTGCGGACGTGCTG
+>ds2020-267_90
+CAGCACGTCCGCAAAGGGAAACCGGTTAATATTCCGGTACCTCGATGTGGATTATCCGCG
+GCAACGCAACTGAAGGTGGAGACGTCGGCGGGGGCCCCGGGAAGAGTTCTCTTTTCTTCT
+TAACTGTCTATCACCCTGAAATCGGTTTGTCCGGAGCTAGGGTTTAATGGCAGGTAGAGC
+AGCACACCTTTGTGCTGTCCGGTGCGCTCTCGACGACCCTTGAAAATCCGCCGGAAGGAA
+TGATTTTCACGCGAGGTCGTACTCATAACCGCAGCAGGTCTCCAAGGTGAACAGCCTCTA
+GTTGATAGAACAATGTAGATAAGGGAAGTCGGCAAAATAGATCCGTAACTTCGGGAAAAG
+GATTGGCTCTAGGGGTTGGGCATTGCGGACGTGCTG
+>ds2020-267_91
+CAGCACGTCCGCAATACCCGTATGATTGCGGACGTGTGAGGACATAGACCTTGCGGACGT
+GCTGCTCCTTAGATTCGCACTGACCGTCGATGTTGCCCTTTATGATTCGGATAAAATCAA
+TGACTCACTTGCATCAGCCATTAATATTCAAAGCTTAAATTCAGAGACATCCGATGATGA
+GGCGCGCGTTGAATTGACTTATAAAGACCAAACGCGCAATGCCAAATTGTATTACAACCA
+AGCCGATGAAGGCTTTACGCCAGCAACTTCACCTATTACTGCTGGGCGAGGACGGTCTCC
+ACGGTCAGTGCGTCGCCTATCTAAGGAGCAGCACGTCCGCAAAGTTTTGGCCCCAGCACG
+TCCCAACCCAACCCCGATTAATTGCGGACGTGCTG
+>ds2020-267_92
+CAGCACGTCCGCATGCTTCGCCGTCTTGCCATCACCATCAGTCATCATTCCACCGAAGTA
+AACATCGCTAACGTTCTTCAGCTTGTTGTTGACGTCCTCGTGCATAGCCTTCTTCGCCAC
+ACCGTATTCAGCCTCCTCTTTAGTCATCATGACGCCATCCGTCATGATGCCCTCAACCAG
+TCCATTGGGGTTCATCGCCTTCTTCACCCGCTCGGCCACCACCTCGTCTCGCTTAACTTG
+TTTCTTTGGTGCAGCCATCGTAACGTCCTTTCTCGCTTCTGGTGGTATCGTTGCAATTTG
+CGAAAAACAGTGATCTTTTGTGGGGTTCTTAGCAAAAGGTTGTGTTTGTTCGTAAGTGAA
+ATTCCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_93
+TATCTAAGGAGCAGCACGTCCGCAAATTCATTTCTCTCAGCACGTCCGCAAAGTGGTGGC
+CTCACACGTCCATCTATACTGGCTTTAAGTTGCGGACGTGCTGCTCCTTAGATACGCTTA
+AGGCGACGCACTGACCGTATTTGCAGGGGTATAAGAACAAAGTTCAATCATCTCTATCAG
+ATCACGATCTGATAAATTTTCACTCCCTATTTGAACTAGTCTGTTTAATAGTTCTAGATT
+AAATGCCTTAAATATATGAGTACCATCATAAGACCACAATTCAAATTCTAGATGAGTAAC
+ACGATTTCTCATGTTTTCTACGTCTAAGGCCCATTGATTGTACTAGGGTATGGAGGACGG
+TCAGTGCGTCGCCTAAGCGTATCTAAG
+>ds2020-267_94
+CAGCACGTCCGCAAATCGACCGGCGTACTGTTGGACGTGCTGAGTGATACCAGCTTGCGA
+CGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCATGAGGACCCTGACCAT
+GTATTGCTTAAGCAGGCTTATTTAGAGGGTGCTGTGGTAGTGACACCCAATCCCCGCGGA
+CATGCTATGTTGGCCAATAAGCAAAACCTGACATTGCTATCAGACTCCCAAATATTGCGC
+TCTTGGGGTCTGGATGAGGCTGCAGTGGAGAGGTACTGGAACACGGTCAGTGCGTCGCCT
+TAAGCGAATCTAAGGAGCAGCACGTCGCAAACTTCTTGCCCTAGCACGTCCGCAAGTGGG
+ATAGGGTGGATATTGCGGACGTGCCG
+>ds2020-267_95
+GGACGTTCGGGCTTGGGTGGAGTGATTTGTCTGCTTAATTGCGATAACGAACGAGACCTT
+AACCTGCTAAATAGCCAGGCCCGCTTTGGCGGGTCGCCGGCTTCTTAGAGGGACTATCGG
+CTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGC
+CGCACGCGCGCTACACTGACAGGGCCAGCGAGTTTATCACCTTGGCCGGAAGGTCTGGGT
+AATCTTGTGAAACCCTGTCGTGCTGGGGATAGAGCATTGCAATTATTGCTCTTCAACGAG
+GAATTCCTAGTAAGCGCATGTCATCAGCATGCGTTGATTACGTCCCTGCCCTTTGTACAC
+ACCGAGGAAAGCCCGAACGTCC
+>ds2020-267_96
+CAGCACGTCCGCAATCAGCCTGTTATCCCCAGAGTACCTTTTATCCGTTGAGCGATGGCC
+CTTCCATACAGAACCACCGGATCACTAAGACCTACTTTCGTACCTGCTCGACTTGTGGGT
+CTCGCAGTTAAGCGCGCTTTTGCCTTTATACTCTACGCGTGATTTCCGACCACGCTGAGC
+GCACCTTCGTACTCCTCCGTTACTCTTTAGGAGGAGACCGCCCCAGTCAAACTACCCACC
+AGACACGGTCCTCGTCCCGGATAACGGGACAGAGTTAGAACCTCAACATTACCAGGGTGG
+TATTTCAAGGACGGCTCCATTGGAACTAGCGTTCCAACTTCAAAGCCTCCCACCTATCCT
+ACACCCGTTGCGGACGTGCTGG
+>ds2020-267_97
+CAGGTATGTTTTCGGACGTGCTGACAATCAGGTCCTTGCGGACGTGCTGACCCCATACTA
+ATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCCTGGTCTCC
+CTCCATAGCCGAAATGACCATGGTCACACAGGAAGTAAGCCTTGACTTCCCCATTAAAAC
+GGTTTTCGATACGGCGCAATTCACCATAGCGCTCACCCGCTGAGATATTACAACCTGTCG
+AACAGCCATGACAAATGCTTGGTGCATATTGCATGTCCCAATCCACGGTCAGTGCGTCGC
+CTTTAGCGTATCTAAGGAGCAGCACGTCCGCAAACGAGATTTTGTGGACGTGCTGCCGGA
+TGAGCCTTGCGGACGTGCTG
+>ds2020-267_98
+CAGCACGTCCGCAACGTCCTTACACTCAGCACGTCCGCAAGACTATCAGCCTCAGCACGT
+CCCAACCGAGTCTCTTTTGCGGACGTGCTGCTCCTTAGAAAGGACGTTCGGGCTTTCCTG
+CTGCCATCCGATCCTGAAGTTTACCCTTTGCCCTTAGAATACGACCAAGGCGCTGCGCTT
+CTTGACGCCTTGAACCAGCATGTGACGATATCTGAATTATCACATTTGCCTCCAGAATGT
+CTATGGAATTATCACCTACCTTAGACAAAAATGCCATGTTAAGCCCGAACGTCCTTACTT
+CCAGTATCTAAGGAGCAGCACGTCCGCAATATTCACACTCTCAGCACGTCCGCAAAGGGA
+ATGGGATTGCGACGTGCTG
+>ds2020-267_99
+CAGCACGTCCGCAATGGGCATGGCATCGGTTTGAAACATCGGAATTGACGACTCTGGCCA
+TAAGATAATGTCCTGACCAAGGCGGATGAATTGCGGACGTGCTGCTCCTTAGATACGCTT
+AAGGCGACGCACTGACCGTAGCTCTGTCCCCCCCAGTCGAAAACTGGAGCTCTGATACCA
+CTTGTTGTGCGGAAGCGTCAACCAATTGCGAGTGAAAAATAAACAACAACTGGCAGGAGA
+TAAATGGAACCAAAACAAAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCAC
+GTCGCAATCCATCACGACTCAGCACGTCCCAATGTCTAGGCCCCAGCACGTACCCAATGA
+TTTCTTGCGGACGTGCTG
+>ds2020-267_100
+TCAATCGGCAGGAACAAAATTAGGTGTATAAACTTATTTTGCTTATTCGGACGGACCAAC
+TAGACTAGTTACGACATCACATTGATAGCCTCTACTCGTGTCCTAGCTCGTCTGAGAGCT
+AAATTTGCCTCAATTGTTTGTCTCTTGCCTTCAGCTTTCCTCAAGTTAGCTTCCGCTATT
+TCAAGAGTTTGTTGCGCTTCTTGTGGATCAATGTCACTACCCTTCTCTGCATCATTTACT
+AAAACCGTGATCTCATTATTGCCTATTCTAGCAAAACCACCCATCAGAGCCATCGTTAAC
+CATTGGTCGTTAAGGCGTATTCTCAAAATACCGATATCTACAGCTGTGGCAGGGCGTGAA
+CCTTGCGGACGTGCTG
+>ds2020-267_101
+CAGCACGTCCGCAATCAGTGTGTCCTCTGCTCATTGTCACGTGCACCTGACTGCTTCATG
+TGCTGTAGCCAACCAAACAGGCTAGTCAGCGCGACTGTACCTGCCATTTTAGCTGCACTG
+ACACTGTTGAGCTCGATTCTTGTCATAGCAGCTATCTCTTGTTCATCCAACTGCATGCCG
+GGAGCAGCTACACCAGCGACTGCCTTGCCGTTAAGTAAGTGCGCCATGACTGCATTTTCA
+CTGACGCTGATTCCTTCTGCCTCAGCCATGATCGGCAGCTCACCGATCACTCTGATCTGG
+TGCGGCTGAAACACAGTGATGATCTCACTTGTCAGCGTCTTGTCAGAAGACTTGGCCATG
+GTTGCGGACGTGCTG
+>ds2020-267_102
+GAGTTCTCTCAAGCGCCTTAGAATACTCATCTCGCCCACCTGTGTCGGTTTGCGGTACGG
+TCTCGTATGACTGAAGCTTAGAGGCTTTTCTTGGAACCACTTCCGATCGCTTCGTGAGCA
+TGCTCACTCGTCTCAACCCCTTGAATTCCGTGCCCGGATTTACCTAGACACCTTCTCCAA
+GTCAAGAACAGGCTCTTCCAACCGCCTGACGACCTTCCGCGATCCGTCCCCCCATCGCTC
+CATCGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATTGTTT
+AGTCCTCAGCACGTCCGCAAGATATTTTCCGTCAGCACGTCCCAAACTAAGGTAGGTGTA
+ATTGCGGACGTGCTG
+>ds2020-267_103
+TATCTAAGGAGCAGCACGTCCGCAACTACTTGGCTGTATTTGCGGACGTGTGAGGGAAAT
+ACCTTGCGGACGTGCTGAGGGTAAGCGTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTA
+AGGCGACGCACTGACCGTGGTTTGACTCCTAAAATGTCTACCACCTCCTTGAAGGAAAAG
+TGGACATGATGCGATGCTGTTATCTTGGTATGCTTTGCCGACATGGCTTCGTACAGCTGC
+AATCACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGCACCCA
+GCCCTCAGCACGTCCGCAAGATGATCTCACTCAGCACGTCGCAAAAGTTCCTGTATGGTT
+TGCGGACGTGCTG
+>ds2020-267_104
+CAGCACGTCCGCAACCTCTAGGCCCTCCTTGGGAACCATCACAAGTACGGCCGGCCTATA
+TTTAAACGAGAATGCCGTGTCGTCCAGCGGAGCCTAGAAGAAGGTGACTCGCGCAGACAG
+CGGACTCCTTTTCAATAGAAAGGAATAGCCAAACCAACCCAGCTGGCTGGTCAATCTCAG
+AGATCTTATCGGCCGGCAAACCGGAGACGGACGACCACGGTCCCGACCTTACCAGCACCG
+GAGGTGTACTAATCAATGAACCCCCGAAACCTACTTTCTTTTCTGACAAAATCAACCAAA
+GTACTCTTGCGGACGTGTGAGGTCTCTGAACTTGCGGACGTGCTGAGGGGGGCTATGTTG
+CGGACGTGCTG
+>ds2020-267_105
+CAGCACGTCCGCAATTTCTGATCCCTCAGCACGTCCGCAAGCCGCTGTCTCTCACACGTC
+CGCAACTACCAGGTTTTGCGGACGTGCTGCTCCTTAGATATAAGGCGACGCACTGACCGT
+CAAATGGTAGGTAGTTATTGCCAGCGTATGCCATGTGCTCTTCGCATTCAGCTAAGAGGA
+GTGCTGGCTCACTATGCATGGCCGCTGCAACACGTTGACCGAGCGATAACGGCACGGTCA
+GTGCGAATCTAAGGAGCAGCACGTCCGCAAATCAGTTTTCCTCAGCCGTCCGCAAATGTT
+CTCTCCTTGCGGACGTGCTGAGTAACTATGCATTGCGGACGTGCTGCTCTTAGATAGATC
+GGAAGACCAC
+>ds2020-267_106
+GCGACGCACTGACCGTCTATCCGTTCCTTCCTGCAATCTTGATTGAATGGTTTGAATCCA
+AGTAATCAACTTCAATAATTCTTCATCGGCAATGGCTTGCCAAGTCAGACAGCAGCTTTC
+ATCATAGTTTTTGCCGGGCGTATTCATCGCATCCGTAATGACCTCCGTGATAACATCTGT
+GATAACAGCATTGATAACATCAGCGTCGCCAGTTAAATTTTCGTCCAGTCGCATCGGGGC
+TGTTGGTTTGCTAGATGGGCAGTAACGGTCAGTGCGTCGCCTTAAGCGTCTAAGGAGCAG
+CACGTCCGCAAACGAGTAACGGTAGCGTTGCGGACGGCTGACAGCTTATTAATTGCGGAC
+GTGCTG
+>ds2020-267_107
+CAGCACGTCCGCAAATGTTACCCGATGGTCCTTGCGACGTGCTGAGGAGGTCTGAATTGC
+GGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGCATTCGCCGCTGCC
+ACCGAAGTTTTCTTTGCTTTCCCGACTTAGCTGCAATCAGCTGAGCCTTGAATTCTAGCA
+CAGATTTTGAAGATCTGTCAAACTTTTTGATCTCTTCTTTTGCTGCAATCGCTTTTTCAA
+AGCAACCACCGCAATCAGCGAAGCCTTAGATTGTACAACAGTTTTTACACCGCAATCAAC
+AAATTCCAAAACTTCTTCAACCAACCCCGATACAGACGGTCAGTGCGTCGCCTTAAGCGA
+ATCTA
+>ds2020-267_108
+CAGCACGTCCGCAATGGTCCGCCCTTCCTCTCCCTCTCCCTATGGTCGAGCTAGTTTAAC
+CTTCCTCCAAGACTTGAATCAGGAATATCTTTTCTGTACTATGCCCTGCGCCTGGTCTTT
+CTTCTTTATTGCCTTGGCCTTTCACCGGATCGATCCCTTCCACCATTCCTCCAACAGATG
+CGGATGAATTAGCTGCCGTTATTCTTTCAACATTTGCAGAGCTAACCCCTGAAGTGACTT
+CAGTCCCGTGTTAGAGCTAACTGCTGCTTCTTCTATAGCAAGTGCCGAGCGAGTGCATAT
+TGCGCTGAAGGCCCCCGCGTTGCGGACGTGCTGAGAGAAGGGATGTTGCGGACGTGCTG
+>ds2020-267_109
+CAGCACGTCCGCAAACATAGGGAGCCAATTGCGGACGTGCTGTCTGGAAGTAAGGACGTT
+CGGGCTTGTTCATACTACTCCCCATAGCGACACCATGTGCTACCGACGCAAGATTTGACG
+GTACGCAAAGACTTGCCATAGGCATGCCCTGTTTCAAAACCTGCGTTGATTAAGCGTTCC
+CAAATATCGGGCAATTGGTCAATACGTGCACCAAATAAATCCACACGTTACCCACCAGTA
+AAAGCCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAACATAGCGCCCCTCAGCAC
+GTCCCAAGTAGTGTGCCCTCAGCACGTCCACAATGTAGGTCTATTGCGGACGTGCTG
+>ds2020-267_110
+TATCTAAGGAGCAGCACGTCCGCAAGGTGCCCAGGGTGCCTTGCTTATGTCTTAAACGGT
+TAAGGGGATTAAAATGATTGCTGTTGTTATCATTGCTTTAGGTGTCATGATTTGCGGACG
+TGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTTGTAGTTTGCCTGTAGGTGC
+TGCAAATGCTCATTGAGCTGTTGCTGGTTATTTGTGAGTGCATGCTCTTCAAGTAATAAC
+TGCTGTAATTGGCGATTGATGTTATCAAGCCGTTGTTTGGCAATCGCTAATTGTTGCTCG
+GTATCATCGGGCGTGTAGGGCTGATGGGAGGCCAAATAACACGGTCAGTGCGTC
+>ds2020-267_111
+CAGCACGTCCGCAACGAGTAGCCACTCAGCACGTCCGCAACTCCCGGGACTTTGCGACGT
+GCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTAACAGCGTGGTTGGAACGCAA
+GAACTGTTTGTGCAGATCAGTTATTGTGTGTTCTGACTTACACGCCCGTGTCACTCCGGA
+TTTATCGGGATGGCGGTAAGTGCTTTGCCGTTGTCCACATAAAGACGGGGTGGACGTTTC
+ATTTACTCTTTTCCCAAATAAGAAGTGGAACGGACCTCGGTCAGTCCGACCTAAGTTTGC
+ATCGCAGAACATCCTGTATTGATTATAACGGTCCTTTACTTGCGGACGTGCTG
+>ds2020-267_112
+CAGCACGTCCGCAATCATTGGCTGGTGTTGCGGACGGGATGAAGAAGGATTTGCGGACGT
+GCTGCTCCTTAGATCCGCTTAAGGCGCGCACTGACCGTCCAGACTGGGATGGCGCATATT
+TGGCCGGTTAATATTTTCTATCTAAGCCTCCATGTTCCTAGGAACCTAGAGGATCCCCCC
+CCTCATCTTCCATTTCAGCAATCTCAACGTCGCGCAGCCACTTTGGCTTCCTGTTCGACC
+GTTTGTTCTTTCTCCTTCGGCTGTCGGAATTCGGGTACTTGACTCGATACGTGTTCTTAT
+CCATCATGACCAATCCATCAACGGTCAGTGCGTCGCCTTAAGCGAGATCG
+>ds2020-267_113
+CAGCACGTCCGCAACACATCCGTTCTTCACATCCAGGCACTCCAATGTCGCTTGTGAGTA
+GGGCTTCCCAGGCCCGAGTGAACGATGAGTTTGGTGAACGCATGTCTTGGGTAGACACGC
+TCGGTCCGCGGCCCCGTAAGAGGTACACCGGCGAGTGGCGGGTTCTCAATCGATGGAGTA
+GGGTTCCGTTGATCCCTGACATTGAGAATCACCTCACCAAACCGCCTCCCGTTTCTGCAC
+CCGTAACGTAAATGGATGCAAACACCGTCGGCTCGTTCCTTGCGAACGTGCTTGCGAGCC
+CTAGAGGGGGTCGCATTGACAAGAACGCCAACCGATTGCGGACGTGCTG
+>ds2020-267_114
+GACGCACTGACCGTGATCGGCTTTCTATTTTTTTTGTGTCCTTTATTCTTCCTTGCTTCG
+GATCGGAAAATTAAAGAATTGAGTGAATCATAAACCAAAGGAGGTTCATGGCCAAGGGTA
+AAGATGTCCGAGTAACAGTTATTTTGGAATGTACCAGTTGTCTTCGAAATCGTGTTAATA
+AGGAATCAACGGGCATTTCCAGATATATTACTCAAAAGAATCGACACAATACGCCTGGTC
+GATTGAAATTGAGAAAATTCTGTCCCTGTTGTTACAAACATACGATTCATGGGGAGATAA
+AGACATAGATCGACCCGACCGCAGCGCGCGATAGTGCGGACGTGCTG
+>ds2020-267_115
+CAGCACGTCCGCAAAGTGGTGGCGCTAAGCGAACTGATGTCAACTCTAGGAATGATACCC
+ATAGACGAGGCGCTGACTGCCGAAGCTTGCGGGTCAACAAGCCCAATCGAGTGGGGAAAA
+GAAGGAAGAGAAAGAATAATGAGCGAAAGAATAGAAACGTTACGTGAAGCTGCGTCTGAG
+CCTTCGGCGAGAACGACGACGCTATTTGTAGAAGAAAGGTGACAAGAAGAAAACATAGGA
+AGTACGCGGCTGGGTGCCAGCGAAAGAACGGAAGGATAAGCAAACAGAGGAGAAGAAGTG
+GATGGTGAAAAGAAAGAAAAGAGAAAGTTCATTGCGGACGTGCTG
+>ds2020-267_116
+CAGCACGTCCGCAGCGACGAGTTCATTGTAGCGCGCGTGCAGCCCAGGACATCTAAGGGC
+ATCACAGACCTGTTATTGCTCAATCTCGTTATTGCTAGACGCAATTTGTCCATTTAAGAA
+GCAAAGTGTCCTCTTAAGACAAACCAAACAGGTATGACTCCATCGCACGTGCCGAAGCAC
+ATGAAACTTCAACGCCATAGTCCTGCAGGCATCTATTTAAAAAAGTTTGAGTCTCGTTCG
+TTATCGGAATTAACCAGACAAATCACTCCACGAACTAAGAACGGCCATACACCACCACCC
+ATAGATTCGAGAAAGAGCTATGGGTTGCTAGTTGCGGACGTGCTG
+>ds2020-267_117
+ATCTAAGGAGCAGCACGTCCGCAACGCAAATGGCCTCAGCACGTCCGCAATTACCAACCC
+CCATTTGCGGACGTGCCTGGAAATAAGGACGTTCGGGCTTATTCCTCGTGCTATGAGCCG
+AAGAAATAGTAAGATATGGGTAAGAGTTCTCGCTGATCTCCCTATTACCCGGAAACCTAC
+AGAAGTAAGAATGGGAAGAGGAAAAGGAAATCCTACGGGTTGGATCGCTCGTGTGTCCAC
+GGGACAAATCCCATTTGAAATGGATGGTGTGAGTTTGTCAAATGCTCGACAAGCCGCTGT
+CAAAGTGTGGATTTCATTTTGTAAAAAATAAGGGGGACGTGCTG
+>ds2020-267_118
+CAGCACGTCCGCAAGGGTGCCCCACCCACACGTCCGCAATGAATCGTTTGTGGTTTGCGG
+ACGTGCTGCTCCTTAGATACGCACTGACCGTTGCGCCGCCATAGAACTCGACAGTTACAC
+CTACTTGTTCGACACTATATTTTGATTCTGCCCTTCTAAAAGGAACATCGGCTCTAACAA
+TTCCGTCTCCGTCTACCAAAACAACCGGAAACGTTTCAAAAAAGGTAGGCATACGACGTA
+CAAAAAGTTCGCGCCCCTCTTTATCTCTAAAGATAGGATGTCCTAACCACCCAACAGCTA
+TTCCATCCCCGTTGTCCATTGAGCCACGAACGGTCAGTGCGTC
+>ds2020-267_119
+ATCTAAGGAGCAGCACGTCCGCAAATGACCTGAAGTGAGAGACCCGAGAGTGGAAGTGGT
+GTCAGACGGACAGATAGAAGCAGAAATACCACTTGATGTTCAAACAGCCAATGAGATCAT
+GGAGTCGAAAGCAGTTTACAAGTTCAAAGGGTCCAGAGATTACGTCGAAGGGCTTGGAAG
+CACGTACGGAGTGACTTGGAAGCATGAAGGAAAGAAGAGGGCAGTGGCACTCATCGCTGC
+TGGGAACCTGATGGTGGGAGCAAGGCAGTCAACCGGGATGCACGATGAACTCAGCAGAGA
+CGTGGAGCTTTCCACAGGGGACGGAACTTGCGGACGTGCTGG
+>ds2020-267_120
+GACGCACTGACCGTAACCTTGACCTTGACGCACTGACCGTTCCCTTTCCCTTCGTATCTA
+TGGCACAACGGACGGTCAGTGCAGGAGCAGCACGTCCGCAACCCCGGCTTCGTATGATTT
+TGCTTACTATACCTGCTGCTGTAGCATTATAAACATTATTGTTACTCTTGCTCCCGTCGG
+GATAAATCTGACCCCTTCCCCTGTTCCCGCCTACGTATATGGGATATTTTAAGAAGTGAA
+CATCTTTCTTAGTAGCGGGGTCCGGGGAAAGAATAGGAAATGTGATTTCACTATATTTCT
+GACCAGGGACAGGACCTATCACCATTTGCGGACGTGCTG
+>ds2020-267_121
+GCAGCAGTGGGGACTCTTGGACAATGGGCGAAAGCCCGATCCAGCACTATCGCGTGAGTG
+AAGAAGGGCAACGCCGCTTGTAAAGCTCTTTCGTCGAGTGCGCGATCATGACAGGACTCG
+AGGAAGAAGCCCCGGCTAACTCCGTGCCAGCAGCTGCGGTAAGACGGGGGGGGCAAGTGT
+TCTTCGGAATGACTAGGCGTAAAGGGCACGTAGGCGGTGAATCGGGTTGAAAGCGAAAGT
+CGCCAAAAACTGGTGGAATGCTCTCGAAACCAATTCACTTGAGTGAGACAGAGGAGAGTG
+GAATTTCGTGTGTAGGGGTTACAGGTTGCGGACGTGCTG
+>ds2020-267_122
+ATCTAAGGAGCAGCACGTCCGCAATAAACTCCCGGTAGAAAGAGATTTCACTAATGAAAA
+AGCTTTCAATGCTGCCCGATATCCCTTCCTTTTCCAAATATTTTTACGAATCCGTTTTTT
+TGAAATAGAGGTGCGTTTTTTTGGAACTGCCATTAAAAAATTATATTATAATAGGTTCTT
+CGGTTGGATGTGAAAGACATCTATTGTTCAACTCTTCTCTATCTATTTATTCTCTAAATC
+ATACTCCCTTCATAAAAAAGGGGGGGGGGGTTGCGGACGTGCTGCTCCTTAGCTACGTTC
+GGGCTTGTTATAGGGGTTGGTTGAAAGCCCGAACGTCC
+>ds2020-267_123
+GACGCACTGACCGTCGCCCCCCGTGCTTCTGGCATGTTACATTCCTCTTCGTGCTGAGCC
+CCCCTTTCTCGTCGGTCCGCAGAGACAAAATGTAGGACTGGTGCCAACAGTTCATCACGG
+AAGAAAGGACTCGCTGAGCCGAGATCACTAACTAATACTAATCTAATACTAATGAAAATG
+CTAATATAATAGAAAAGAACTGTCTTTTCTGTATACTTTCCCCGGTTCCGTTGCTACCGC
+GGGCTTTACGCAATCGATCGGATCATATAGATATCCCTTCAACACAACCTAGTTCACTGC
+CAGGATCTCGGAGACACGCCACCAAGCCCGCACGTCCC
+>ds2020-267_124
+CAGCACGTCCGCAAATGTATCCTCCTGTGATTGGGACGTGCTGAGGGCCCATGAGTTGCG
+GACGTGCTGAGTGGCCTTGTGTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACG
+CACTGACCGTGGTTGTCACCCTACTCCATCCATACCACATATACTCTACATACACATCAT
+ATACACACATACCATACACACTGTCACACACACCGCATACACCACACACACCCACACATA
+CCACACACACATATACATCACAGACACCATACCCACTCACACACAGAAACATATACCCCG
+GCAAATACGGTCAGTGCGTCGCCTTAAGCGAGATCGG
+>ds2020-267_125
+CAGCACGTCCGCAATGTATCAGGGTTGGTTGCGGACGTGTGAGGGAGTGGCTATTGCGGA
+CGTGTGATGGGTATGAAGTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTCTTACTTGGCCTCTCGTCACATACCTTCATGTTGGGAGAGCTGTCTACGGCAT
+AGTCTAATTGCCATTCTTTAGGGGCTTCGCTGTCGCTTCTAAGAAAGATTTCAATAGCTC
+TTCTTATAATTTTGAACCGCTTTCCTGCGTCCACTTGTTCAACATGGTTGGTCGTGCCAT
+AGGATCTGGGTTGCGGACTTGCTGCTCCTTAGCTA
+>ds2020-267_126
+GACGCACTGACCGTGTTCCAGGCCCTCTCTTAACTGAGACAGAGATCCAATGCTTGAAGT
+AGGAATAAAATTGATTCCACCAAACCTAATATGTATGGTAGATCAGGTCATATTTTAAAA
+GTATTCCTTTCTTTTCTACTCATTTATATCTTCTAAATCTATTTTTTTTTCTGGCTCGGC
+TAAGTGGGATAGCCGAGCCATTTCCTTATTATGCTACCGATTCCTTTTATGCTACAGCCG
+GGACTACGGTCAGTGCGTCGCCTAAGCGCACGTCCGCAATCCAAGGAGCATGTAGTTGCG
+GACGTGCTGAGGGCATTAACATTGCGGACGTGCTG
+>ds2020-267_127
+CAGCACGTCCGCAATTTTCGCTACCTTAGGACAGTTAGAGTTACTGCCGCCGTTTACCGG
+GGCTTCCATTCAAAGCTTATAACACTTCTCCTTCCGACCTTCCAGCACCGGGCAGGTGTC
+AGACTCTATACATCGTGTTACCACTTAGCAGAGTCCTGTGTTTTTAATAAACAGTCGCTA
+CCCCCTGGTATGTGCCGCTTTCCTAATCAAAAGATAGGAGAGCACCCCTTCTCCCGAAGT
+TACGGGGTCATTTTGCCGAGTTCCTTCGACATGGTTCTCTCAAGCGCCCTAGTATACTCT
+ACTTGTTCACCCGTGTCAGTTTGCGGACGTGCTG
+>ds2020-267_128
+CAGCACGTCCGCAATATGGCTGAGCTTCCAGTACGTGGGGCGCAACGCCCACTCTCTACT
+GAGCATCCCGTCCGACATCAATTGCTGCTCGTCAGCAAAACGAGCCCCAGACTAGACTAT
+CTGGGGGAAGGTATACCGGGGTTTGTTAAGACCCGGATGCCCCATAGGAGGCCGTCATTA
+CACACTTGGGCGTTTGCTAAACGTTAACCCCAAGATTGCACCTATTGAGAGATCTCTCAT
+GCAGTGCTCCTGACTTACCTTCACCTTTTCCAAGACTTCCCCGCACGAGATGCCTATGCA
+TCACATACGTGGGCGGTGTTGCGGACGTGCTG
+>ds2020-267_129
+GGACGTTCGGGCTTCATCTAAGGGGTACCTCATGCTCTTCAAGGTCGAGGCTAGCGCTGG
+AGGTTCGAATGTGGATTTGATGGATCTGTCGACGCTTGACTTCGCTCTCATGGCCGAGTT
+TGATCAGCACATCCTCGAGTATATTCGGCAGCAAGTCATCGACGCCCTCGAGAAGGCTAA
+ACACGCCAGCGACGAGGCGATCGAGAAAGCCCTGAGGAAAGCCCGAACGTCCTTAATCTA
+AGGAGCAGCACGTCCGCAACCCGTATTCCCCGCACGTCCGCAACAATTAACTACTGATTG
+GGACAAGGCCACAGCATTGCGGACGTGCTG
+>ds2020-267_130
+CAGCACGTCCGCAACTGCAAATGGATAGACTCCAAGGTCCGAACTGTAATTGGTTCTCCT
+ATAACCCAGTATATAATGAGCACCATATGGAATTATGGTCCCAATCACAACTTTGCTTGG
+GAGACCACACCCATCAAAGTGGGCATGCCACTAAATGGGTTTTGGCTGTCCAAGTTGTTC
+TCTAAACATGCCAGGTGCCAAATGCACATTGAGGGTGACTTTGAAGCTTTTGACTCAACC
+ATCTCCGGGTCCGTTGTTGACCTTATTAAGGATGTGAGGAAGAAAGGGTATGAAATGCAT
+AGAGACAGGGCTTCAGTTGCGGACGTGCTG
+>ds2020-267_131
+CAGCACGTCCGCAATCCACGACCGCTAGCGAAGGTCCCAAAGTCATGGTTAAGTGGGAAA
+CGATGTGGGAAGGCCCAGACAGCCAGGATGTTGGCTTAGAAGCAGCCATCATTTAAAGAA
+AGCGTAATAGCTCACTGGTCGAGTCGGCCTGCGCGGAAGATGTAACGGGGCTAAACCATG
+CACCGAAGCTGCGGCAGCGACGCTTATGCGTTGTTGGGTAGGGGAGCGTTCTGTAAGCCT
+GTGAAGGTGTGCTGTGAGGCATGCTGGAGGTATCAGAAGTGCGAATGCTGACATATGAAC
+AATGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_132
+CAGCACGTCCGCAAGTGCTAACGATAGTAGGTTGGGACGTGCTGAGAGTAATTAGTTTGC
+GGACGTGCTGAGTGGTTAGACTTTGCGGACGTGCTGCTCCTTATCGCTTAAGGCGACGCA
+CTGACCGTCGTTCTGGTGCTCCCTGTGCTTGTCCCCATAACTGTCACTGTAGCTATCACT
+TGGGCTATGACTTGCATACTCATGCACTGCCGAGGGTGCACTGTTCGGGGGATAATCTTG
+GCTAGCAGAAGCAGGATAAACATCATCCGACACTAGATAATCTTCCAATCCTTCAGTTTC
+ATGGCGGGTAAAACGGTCAGTGCGTCAG
+>ds2020-267_133
+CAGCACGTCCGCAATCAGTTTGTGGCGGTCACTGATTACTTCCGGTGGGGTTGACTGGAG
+GGATTGGTGACCGGGGTTGAATGGCATCAGACAGCGTGGCCTGAGGAGAAGCATGCAGCA
+TCCGGACTCTTGAAGGATGAAGACGTCAATTACCGTTGAGAGGGACGGTTCATGTAGGGG
+TACGTTAGCGAGTAAAAGACTAAGCGTAGAAAAGGAGATGCCGTGACCGCCATATTGAGC
+CGTTTCCGTTTTGTTCTCCCATCTCACCATAGATGAAAAGCTGGTACTAGTTGGATCCAT
+CGACTAGGGGATTGCGGACGTGCTG
+>ds2020-267_134
+CAGCACGTGCGCTCGCTTAAGGCGACGCACTGACCGTAGTAATGAGGGTTCCAGTTATGT
+GTTTTAGATTCTTCATTCCAAGTATATTCACTATGAATATCATAAAGAAGTTCTTGATCT
+AAACAAGTATAAGCTTTACTCTCTTGTTGCCTAACAATTTCTTCAATGATTTCATTAGCA
+CGAACAGTATAACCTTTACCAAGTAACCAGAAAGCCAAAGACGGTCAGTGCGTCGCCTTA
+AGCGAATCTAAGGAGCAGCACGTCCGCAATTACATTGGGCTGAGGTTTGCGGACGTGCTG
+AGGGGATCAGTTGCGGACGTGCTG
+>ds2020-267_135
+CAGCACGTCCGCAATGTGTTGCCCTCAGCCGTCCCGCAACCGTCTAGACCTTGCGGACGT
+GCTGCCACCGCTTAAGGCGACGCACTGACCGTGAATCTACAGGGACGCACTGACCGTACC
+CTTCTTCCTGACGCACTGACCGTGACTTCAACACTGACGCACTGACCGTCCGAGTATGCG
+TGACGCACTGACCGTCGTTGGATACTGACGCCTGACCGTTACGAGATCTCATACGGTCAG
+TGCTATCTAAGGAGCAGCACGTCCGCAACCTACCCGGGGTATATTGCGGATGTGCTGAGT
+CATGCGTATTTGCGGACGTGCTG
+>ds2020-267_136
+CAGCACGTCCGCAAGTATGCCTGGTTTCAGGATCTATTTCACTCCCCTCACAGGGGTTCT
+TTTCGCCTTTCCCTCACGGTACTGGTTCACTATCGGTCAGTCAGGAGTATTTAGCCTTGG
+AGGATGGTCCCCCCATATTCAGACAGGATACGACGTGTCCCGCCCTACTCATCGAGCTCA
+CAGCATGTGCATTTTTGTGTACGGGGCTGTCACCCTGTATCGCGCGCCTTTCCAGACGCT
+TCCACTAACACACACACTGATTCAGGCTCTGGGCTCCTCCCCGTTCGCTCGCCGCTACTG
+GGGAAATCTTGCGGACGTGCTG
+>ds2020-267_137
+CAGCACGTCCGCAACGTATGCCCCCTCGCGGAGCTAAGTCTTCGTTGCCGTCTTAAGACA
+ATCCACCGGTAGTGTGGCGCATAACTTGGGTTCTGGGCTAAAGTCGAGCGCAACTGCATA
+AGAAGCGTGCGATCCGTTCGGACCACTTTGTGTGTCTTACTCTGAGGGCTTTGTCACGGG
+GCGGTGATATGTGAGGTAGGCCCCTTTGAGAAAGGGTCTTTAAAGCGTGCCGTAGGACGT
+GCGCGCCTCATGTTACCGGGTACCCAAGGTCATAGGAACTGGGACTGCCTTGCGGACGTG
+CTGCCCCTTAGATAGATCGGCA
+>ds2020-267_138
+CAGCACGTCCGCAACCGCGTTCATCTCAGCACGTCCGCAAGCGACCTCACGTCAGCACGT
+CCGCAATGGCCATATCGTTGCGACGTGCTGCTCCTTAGATATAGGCGACGCACTGACCGT
+ATCGTCGCCCCTGGTGGCATGGGCCTGTAGTCCCAGCTACTCAGGAGGCTGAGTCAGGAG
+AATTGCTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCCGAGATCATGCCATTGCACTCCA
+GACTGAGGTGTTCGCTCTTGGGACGTGCTGAGAGGAAGATGTTTGCGGACGTGCTGAGCC
+TTATCCTATTGCGGACGTGCTG
+>ds2020-267_139
+CAGCACGTCCGCAAACAGCCTATCCTCGCACGTCCGCAACATCGCTTAAGGCGACGCACT
+GACCGTTTGTTGCTGGGTAGTGACGGCGTTATCTTAAACAACAGCCGAAAAAAACACCCA
+GACCCAAACGGCTGGGTGGGTGGAAGGTAACCCGTGGCTTGGTAAAGGCGAAGCCAAAAT
+TATTTTGGGTCAGGTCAATTCAACCAGCCCCAGTCAATTGGCCGGTTATACCGAAATTGC
+CGGGGGCAAAGCCGAGCTGGTGATTGCTAACCCAGCAGGGATTACCTGTTCGGGAGGTCT
+AGTTGGACGGTCAGTGCGTC
+>ds2020-267_140
+CAGCACGTCCGCAATGAGTTTGGGCGCTTAAGGCGACGCACTGACCGTCAAAGCAGCCAT
+CCTTAAAAGAGTGCGTAATAGCTCACTGGTCAAGCGTTCCTGCGCCGAAAATGAATGGGA
+CTAAGCATTGCACCGAAGCTGTGGGTTTGTCTTTAATTAGACAAGCGGTAGAGGATGCTA
+AACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATGCATGTGGG
+GTCAGCCGTCCGCAATAAATCACCCCTGAGCCATGCACGTGCTGAGGAAGAGCGCGTTGC
+GGACGTGCTGCTCCTTAGA
+>ds2020-267_141
+CAGCACGTCCGCAACGTGGTCATTCTCAGCACGTCCCAACCTAGTATGCCTCAGCACGTC
+GCAAAGACCGGAACCTTTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTT
+CGGGCTTTGCGTCTCCCCTAGATCGCATCTTGCGTTGGGGTGATGCTAAAGCTTGGCATG
+TCAGCAAGTTCAGTGCCTGCAGGGATAGACACTGTAACCCCAGCAATCGCTTGTGCCACT
+GTCAGGGTTTGGGTTGTGCCATCAGCATTGGTGAGCACGATGCTAGCAATGTCAGCCGCG
+TAGTTAAGCCCGAACGTCC
+>ds2020-267_142
+CAGCACGTCCGCAAACATTCACGGGTCAGCACGTCCGCACGCTTAAGGCGACGCACTGAC
+CGTATTGAATGCCGTGACGCACTGACCGTCACTGCGACCTTGTTTGTGTTGGTCATAACT
+GACGGTAATATCGGTATTATCATTAATATCTTTTACCAAGGGGTGCCCTACGGTCAGTGC
+GTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAATGATTGAAATTGCGGCGTGCT
+GAGCTGGAGTCCTTGCGGACGTGCTGAGTTGTAACCCCTTGCGGACGTGCTGAGGGCATA
+AGTTTTGCGGACGTGCTG
+>ds2020-267_143
+CAGCACGTCCGCAAACAACTGCCCTTAAAATGGATGGCGCTTAAGTCGTCTGCCTATACA
+CCGCCGCTACGGCACAGGCGGTTGCGTACTTGTGCGCAGCCGCATTAGGCCGTAGTGAGT
+AGGAGGGTACAATGGTGTGCGTCGAAGCTTTGGACGTGAGTCCGAGTGGAGCCGCCATTG
+GCACAGATCTTGGTGGTAGTAGCAAATAATCGAATGAGACCTTGGATGACTGAAGTGGAG
+AAGGGTTCCGTGTGAACAGTGGTTGATCACGGGTTAGTCGGTCCTAAGCACCAAGCAGCC
+ATTGCGGACGTGCTG
+>ds2020-267_144
+CAGCACGTCGCAATCCTAGCGTAGTCACACTCCGCAGACCTCTCTTGTTGCGGACGTGCT
+GCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCCCTAATTGCTGGTGTGGTCGTA
+GTGCCAGCAGTTGATGTCGTCGACGCTTGTGTGCGGTTTGGGCTGTATGGTGTCATCAAA
+GATGAGGTGCCGATGGCATTGGGTGTGGCATTTTCATGCTGTCTTAGCATGGGTTTAATC
+AGTTGCCATTGTTCTTTGGCGGTGAGTGTTTCACTGTTTAGAAAGCGGGACAGCGAGATA
+TACGGTCAGTGCGTC
+>ds2020-267_145
+CAGCACGTCCGCAATCGGTGTATACTCAGCACGTCCGCAAAGTCTGTCAGTTCAGCACGT
+CCCAACACCCCCCCACTCTTGCGGACGTGCGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTGTAAGGATATCTCCAGTTCCAAAGTTTGCCCTGCCTTGATGGCAATTCGCCAAC
+CATTGGGTACTCGCTCTCGTGTTTGCTTGGCTGTATCAGTCACATAGGCTTCGTACAACG
+CCCCAGTTAAGCAGACACTAATCTCCCCTCTAGTCGCATCCACATCGCTATCACCAAATG
+AACGGTCAGTGAGTC
+>ds2020-267_146
+ACAGCACGTCCGCAAGTCTTTTCGGTTGGAATCAAAAATGGGCTGTCTCCTCTCTGATGA
+TCTTTTCTATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATTTCTTTCTTA
+AAAAAAAAGAAAAAAAGGACATTCGACCCAATACCTTAACCATGTAATTTCTCCGACATT
+ATTTTCTATCGCCACATCAAGGTGACAGGATTCGAACCTATGGCCCTCTGTACCCAAAAC
+AGATGCGCTGACCAGACTGCGCTACACCTCGCGTCTCACCCCCCCCCATTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_147
+GATCTCGCTTAAGGCGACGCACTGACCGTCAAGTCGCCTCTCCATCTTAAGCTAAACCAC
+TCGCAGGCTTATTTGCTACTCACCGACCAAGCGGCGCACAACCCAACGGGCGATTTTGCC
+TTAGAAAATGGCAAGGTTAAGGCAGATGGTACGCCAAAATATACCTTTGCAGGGATTAGT
+GTGATGTCACCAAGATTATTGGATACGGGAGCCAACGGTCAGTGCGTCGCCTAAGCGTAT
+CTAAGGAGCAGCACGTCGCAAATGTCTGGCCCTATTGCGGACGTGCTGAGAAGACTAACC
+TTGCGGACGTGCT
+>ds2020-267_148
+CAGCACGTCCGCAACCTGACTACTCTCAGCACGTCCGCAAGTCTGATACCCTCAAAGTTG
+CGGACTATCTAAGGAGCAGCACGTCCGCAACAGGTGAGTAGTACGGTACGGATATGGGTA
+TCAGTTTTGTATCTTGCGAATAGCTGAGTATGGATTTGGGTATCATTTATGTATCTTTCC
+AATAACTGAGTAGTATAGATATGGGCATCATATTCTGAATTTGAATGTGTATCATTTTTC
+TATCTTGATAATAGGTAAGAAATATAAATTTGGGTATCCGATTTTGTATCCGGAGATGAT
+TGCGGACGTGCTG
+>ds2020-267_149
+CAGCACGTCCGCAATATTCGCACCATTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCA
+GTTCCAGTGTGGCTGGTCGTCCTCTCAGACCAGCTACTGATCGTCGCCTTGGTAGGCTTT
+TACCCTACCAACTAGCTAATCAGATATCGGCCATTCCAATAGCACAAGGTCCGAAGATCC
+CCTGCTTTCATCCACAGATCGTATGCGGTATTAGCTATCCTTTCGGATAGTTATCCCCCA
+CTACTGGGTATGTTCCGATATATTACTCACCCGTTCGCCACTCGCCACCAGACCCATGTT
+GCGGACGTGCTG
+>ds2020-267_150
+CAGCACGTCCGCAATTCACCCGGCATCGATCGATCGCGCGAGTACGCATCTAGTCAGCAC
+ATAGCGAACGAAAAAAGCATTCATCCTGGATTGGATTCTCTTCCTCAATCAAAATGTCTA
+TCAATTGATCCCCATTCATTCGGTCAAAGTCTCACCCTTGAGAGGTGCACCATGTTGATA
+GGAATCGGCAAAGACCCTCTTGTACACATCCTCGAGGGCAGCATTCATGGCAATCATCAC
+TAGTTTATCCCGAGGGCATGGTATGGCTTTGTTCTTGGTGTTGTTTAATAGATTTCGATT
+GCGGACGTGCTG
+>ds2020-267_151
+CAGCACGTCCGCAATCCTTCGTTCTTGATTAATGAAAACATCCTTGGCAAATGCTTTCGC
+AGTAGTTAGTCTTCAATCAATCCAAGAATTTCACCTCTGACGATTGAATACTGATGCCCC
+CGACTATCCCTATTAATCATTACGGCGGTCCTAGAAACCAACAAAATAGAACCACACGTC
+CTATTCTATTATTCCATGCTAATGTATTCGAGCAAAGGCCTGCTTTGAACACTCTAATTT
+TTTCAAAGTAAACGTCCTGGTTCCCTACCACACCCGGAAAGCCCGAACGTCCTTACTTCC
+AGAGATCGGAA
+>ds2020-267_152
+CTTCCAATCTATCTAAGGAGCAGCACGTCCGCAATGTTCTAACCATAAACGATGCCAGCT
+AGCAATTGAATGTAGCTACTAATTTCGGTTCATTCAGTCGCTTTCCGGGAAACCAAAGCT
+TTTGGGCTCCGGGGGAAGTATGGTTGCAAAGCTGAAACTTAAAGGAATTGACGGAAGGGC
+ACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGAAAACTTACCAGGTCC
+GAACATAAATGAGTAAGACAGATTGATAGCTCTTTCTCGAATCTATGGGTGCTGGTTTGC
+GGACGTGCTG
+>ds2020-267_153
+TATCTAAGGAGCAGCACGTCCGCAATCAGCCAGCCCTTGACATATGAACAACAAAACCTG
+TCCTTAACGGGATGGTACTTACTTTCATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGT
+CGTGAGATGTTTGGTCAAGTCCTATAACGAGCGAAACCCTCGTTTTGTGTTGCTGAGACA
+TGCGCCTAAGGAGAAAGTCTTTGCAACCGAAGTGAGCCGAGGAGCCGAGTGACGTGCCAG
+CGCTACTAATTGAGTGCCAGCACGTAGCAGTGCTGTCAGTAAGAAAGGAGCCTGACTTGC
+GGACGTGCTG
+>ds2020-267_154
+CAGCACGTCCGCAATCTTGCAGCCCTGAGCTCTCCCTTGATCGTGGGATCGCCTTCTGAA
+AGTTCAGCAAGCACTTTCAAATGGTTACCTTTAAAGGTAGCCTGTTCCTCACGAAGTCTT
+TCGTTGAGGGTCCTAATGGGCTCTGTTCCCATTATGGCAATCTCTCGGCTTTTTGCATCG
+AGAGCCATCTTGACATCCAGTTCTGTCAAGACTAATCCGTCCTTTCTCAAGGCCGAGATG
+ACCGCTCCTTCGACAAAGGAGCTGGGATTGATCTCGGTCGCATAGGCCAAGTACCTTGCG
+GACGTGCTG
+>ds2020-267_155
+CCGCAGGTCCGCGAACTGAGGGGAATTGATAGCTCAGCTTACTGGCTCATCAAATCCTTT
+CTAAGATGAGTCAATTGGGCCTGAGATTGATCTTTCATTTTTGTACGAAGGGTTCTGCGC
+ATCAGGTTTCAGTAAATTTCTTTCAAAGACAACAGGGAGTAGCCAAAGCTCTGGTCCAAT
+AAGAGCACTCACGTGGTTTTTCAAGCCGAAAGCACCACTAGGCGCAGGGGCCGAAGAAGT
+CCTTTTATCTCATTCCGTACCTGACGGTATCACGGAGCGTAGATTGCGGACGTGCTGCTC
+CTTAGATA
+>ds2020-267_156
+CAGCACGTCCGCAAGAGTTCTTCCCTCAACCAAGCTGTCTCTCGACTGTTAGTTTGTCTT
+ACGCCTTCCTGAGACGCAGACTACTGCCTACTGTTGCAAATAGTACGCAGGCTCATCATT
+TATAACGCGCGAGTAGCACCGCGCATAGCTATCAACTTCGCCTTAGTAACGCAGCTCACC
+CAGCCTGTCCTTACCGACCTAGAGTCACTCCCAGCCTAACTAGCTATCTACGGCGAAATG
+AAAAGACTAGCTAACTGGAGACGAAAGCACAAATGAAACGAGGTTGCGGACGTGCTGCTC
+CTTAGAT
+>ds2020-267_157
+ACAGCACCTCCACAAAAGGGGGACAGTAGGTTTATGAGAAAGGGATGCTCTTATCATGTT
+CTTGCTGAAAAGAAAAACCGAATTCCTCTATTTGATGTCGATTCATCCACACTTCCATTC
+TTTGTAGAGGAAGGCTAACTGCTTGCTGGCTGGGAGCTGTATGAGCGGTAACGTCCACGT
+ACGGCTCCGTGAGAAGGTCGGTGGACAGAAATGGCCTTGTTGTACCTCACTCTCGTCTTC
+AATGGGGTCTGCTCTTTTTTTTGGGAGAGTATGCCAATATGATCTCAATAAGGTTGCGGA
+CGTGCTG
+>ds2020-267_158
+CAGCACGTCCGCAAAGTTTATCCCCTCAGCACGTCCGCAATTACGAGGAGATGGGGTTTG
+CGGACGTGCGCTTAAGGCGACGCACTGACCGTGTTTCTGGGGCTGACGCACTGACCGTAT
+AATGCACCCTGACGCACTGACCGTGCAAAGGGGAATTGGACGGTCAGTGCGTATCTAAGG
+AGCAGCACGTCCGCAAGTGATCTACCCTCAGCACGTCCCAAGGCCACACCATTGCGGACG
+TCTGAGTGATCGGAGTTTGCGGACGTGGATGGCTCCTGATTTGCGGACGTGCTGCTCCTT
+AGATA
+>ds2020-267_159
+ATCTAAGAGCAGCACGTCCGCAATCGGTCACCCTCAGCACGTCCGCAAACTCCCGCCTCG
+AGCACCATCAATGACTATCAAGAAGCGTATTTTACTGTCATCAAGCAGCCAAGCATCGAT
+GCGGCTGCAGCCAGTGACCCAAACACCCTCAATCAATTTGACTATATACCCATCAACTTA
+CGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATACTCATCGGGT
+TTGGTGGGACTGTAGCCCAATTGGCTTGCGGACGTGCTGAGTACCGGCATTTTGCGGACG
+TGCTG
+>ds2020-267_160
+CAGCACGTCCGCAAGGGTGGCGGAATTAGTAGTAACTTTAGCTGTTCATCAGCCTGGGTG
+CCGCTGACGGATCGCTAGTCCTGGCTAGTTTTACGTTTACTGAGAGCCTACCCCAGCATT
+GACGAGAACCGATGTTTACCCTTACACCGGGCGCTTCCACCACCCCAGCCCCTCCCTCCC
+ACCGCATGTAGAGAAGGGCGCTAATAGTTGGCAGTTGACAGCTCAATCGCTGTGGCAACG
+TCGACATTGTACGCTCTCGTACGCCCACCTATCACTTCATCGACTCTCTGTTGCGGACGT
+GCTG
+>ds2020-267_161
+GACGCACTGACCGTTACTTGCCGGATTATACCAGTGTTTACCTTTCTTACTACAGAACAC
+CAGCTTTCCACATTAGACTTTTCCTGCTTTACAGCCTTTACATCTTCTCTTCTCTTCTCT
+TGCCTCTTCATACAGCCAACTTCTTCCCCCTACTCAAAATTTAAGTTTCATGCCAACATT
+TCAGAGGGAGCGCCTATACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCA
+CGTCGCAAAGGATTCCCCTTTTGTTGCGGACGTGTGAGGCTCAGTCGTTTGCGGACGTGC
+TG
+>ds2020-267_162
+GATCTATCTAAGAGCAGCACGTCCGCAATGGGCCTCCCTTACCTACATTATTCTATCGAC
+TAGAGACTTTTAACCTTGGAGACCTGCTGCGGATATTGGTACGGTCTATTGAGAATGTTT
+ACGTGGCCCTGGCATAGATTTTCAAGGTTCGAGGAAGACGCACGCGACACAGCAATATAG
+GCCATGCTCTTCTAGTCCATCAACCATATCTCTCTTCGAAAGACTTCCATGGTTGTACGA
+CTATAAAACAGAAAAGAAAACTCTTTCGGTGCGCACCGACGATTTCTCTAAGCCAACAGA
+A
+>ds2020-267_163
+CAGCACGTCCGCAACATCGCCCACATTGCCAACGCCTGTCTGCGGATTCTGGAACAAGCA
+AGACAGGAAAGTCGTAAGCCATATCCTCCCATCCATCATACGCCTGACGAAGTATCTCAC
+GTTGTTTGCAGTCCGGTCTCCATCTTGCTTGAGTGGCAGCCCTGTCACCGGAGGCCTGAT
+GTTGGCTTCGTCATTCGTTGTCGTGTAAGTCACCGTGACGGCTGGTGCACTCACTATGTC
+AACTATGACGATCCTTTCACCTGAACGTGACATCACCCCGAACTTATTGCGGACGTGCTG
+>ds2020-267_164
+TATCTAAGGAGCAGCACGTCCGCAAGGTGGACCCCCTCAGCACGTCCGCAAGTACAATTC
+GGTCAGCACGTCCGAAAGTCTCTAAGTTGCGGACGTGCTGCTCCGTAGACGCTTAAGGCG
+ACGCACTGACCGTTTCCCTGCTGCTCCAATGTGCAGCGGATTATGGCGATTATGTGTGAG
+CTGGATGAATACGATGCTATTTATGAGATTATCAATACAAAAATTGACGGGCTAACCTTG
+GGGATGAGTGTGGGCGTGCATCCCTGCGAAGACAGTGCCATGGCTACGGTCAGTGCGTC
+>ds2020-267_165
+GGACGTTCGGGCTTCACGGCAACACTTCCCAAGCCCTCAAACACCTTGCCTACACTTCCA
+ACTGCCCCAACTCTGCCCAAGACCACATTGCCTCCACTTCCCTCAACCTCATTGCCTACG
+CTTCCAACTGCTCCAACTTTGCCAAAGCCGGCCACGTTGCCACCGTTGCCCTCTACCCAA
+TTGCCTACTAACCCAACAAAAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGAGCAGCA
+CGTCCGCAACACAATCTCGCTCGCACGTCCGCAACTATGGCTGAATTGCGACGTGCTG
+>ds2020-267_166
+CAGCACGTCCGCAAGGTGGAGCCTCCAGCACGTCCGCATATGGAACTCGTTGCGACGTGC
+TGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCGAAGCGACTTCTGTTGAAAAA
+GGAGCGGATGAGGTGTGGTTAGGGGTGAAATGCCAATCGAACCTGGAGCTAGCTGGTTCT
+CCTCGAAATGTGTTTAGGCGCAGCGGTATTGATTATAGCCGGGGGGTAAAGCACTGATTC
+GGTGCGGGCTGAGGAGGTCACTTTGCGGACGGAGAGGTCGGGTCTTGCGGACGTGCTG
+>ds2020-267_167
+ACGTGCTCGCTTAAGGCGACGCACTGACCGTATCTGGAGAGGTCAATAATAGTCGCCCAA
+AGTGTCGCACTGGCAATGCGGCTTTCTTGCTTGGTCGCGGCAAGATAGCCTAACGTCAAT
+GCGGTCAACATACCCCCAATACAGTAACCTGTAATAATGATGGTTTTTTCACCCGAGCTC
+TCATCCCACGGTCAGTGCGTCGCCTAAGCGTCGTCCGCAATTTCGGTTGGTTCTTGCGGA
+CGTGTGAGGGATTAAGAGTTGCGGACGTGCTGAGGGGTGTTCCGTTGCGGACGTGCTG
+>ds2020-267_168
+CAGCACGTCCGCAAAGTAAGGTGGTTTGTGTTACCCCGTTTGTCTAGCATGTCCCAGTAC
+AGTGGTATGGCAATGCCCTTATAGACCACCCCTAGCATAAATATGTTGATGTTGCTTTTC
+CCCCATTTCCAGTTGGTGCGGTCAATGGTAATGGTGACTTTGCTAAGTCCAAATAGCCGA
+TATATCAATATGGCTAGTTGGTCATAGTCTATGACAGCACTGGCGATAAATCGCTGTAGC
+CTGCGGTATTGACTGTCCGTCTTGCCACTTTTAGGTAAGTTTCCTTGCGGACGGGCTT
+>ds2020-267_169
+CAGCACGTCCGCAATCCCTTTATAGTTGCGGACGTGCTGAGTGTAACTCGATTGCGGACG
+TGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTCCTGGTGGGGGTACCTTTAA
+TAAGATAGAGCTATTAGAGGAATATCCAGATAAAGAATATAATGGAGAGGATGTAGTAAT
+TTATAGTCTCGGAGAAAGGTATTTTTTTAAGAATTCAAGGGAGAGAACCTTTGGAAATTT
+TAAGCAGACTAAACCTTTGCAGCTTGAAGAGAAGTGGGCGACTACGGTCAGTGCGTCG
+>ds2020-267_170
+GACGCACTGACCGTCGCCCAAAGACAGGTTGGAGAAGGCAGTGGCAGCTGCATGGGCTTT
+GGGTTTTACAGATCTGGAAGGCAGTCCTGGCTCAGTCCCTGTACCTTAAGGAAACTCAAA
+CAACTTATTTGGCCTTTCTGATCATAATATATATCATTTTTGAAATGGGAGAAAACGGTC
+AGTGCGTCGCCTAAGCGTCTAAGGAGCAGCACGTCCGCAACCCGAGTTACTTGCGGACGT
+GCTGAGGGCGCGAAACTTGCGGACGTGCTGCCCTGTGCAGATTGCGGACGTGCTG
+>ds2020-267_171
+CAGCGCTTAAGGCGACGCACTGACCGTGCTTCCCTCCCCCTGTAATTGATTCTTCCTGGG
+TCGATGCCCGAGCGGTTAATGGGGACGGACTGTAAATTCGTTGGCAATATGTCTACGCTG
+GTTCAAATCCAGCTCGGCCCAATAATTCGCCGATCCACCATGAAATAATATAACCCATAG
+TGTTACGGTCAGTGCGTCGCCTTAAGCGTCACGTCCGCAACCATCGTAGTTTCGGACGTG
+CTGAGGGGATCAATTTGCGGACGTGCTGGGGTCCCTGGTCTTGCGGACGTGCTG
+>ds2020-267_172
+CCAGCACGTCCGCAAGTGGCAGGCCCTAGTATGTTCCTCATTTAATGAGTTCAGACCGAC
+GGTTTCTAGAAGAGAAGTTAGGACGTGTTTCACCTCCCTTACTTCTCCTTTTTCGGAGAG
+ATACTGTAATAGATAATCATCTATTAGTTGTGTCTTCTTTAACTGCTTGGTTTTAGGATC
+CAATACTGGATTATTACCAAAGAAGCTATGATCCCTACGAAGAGCTCCAAGCGTAAGCTT
+GGGGTCATTCCGGAATTTAGATCGAACACGGATGGCTATTTGCGGACGTGCTG
+>ds2020-267_173
+CAGCACGTCCGCAAACAATGTCCTCTGCTGTTTTCCTGTCTACATCGCTTTCGCGGCTTT
+CATCTCTTACGTCATCTTTATCCTTCACCACTTCAGCATATGTGGGTTTGCTTGATTCGA
+CACTTCTATTCGTTCCAGAATCCCTCGACTGCTCTTTGGGCTCTCCGTCGTTTCCTTCGC
+ATGTCGGCTCATTCTCTTCCGCGCCCATCTCACTCACCGCTTCATTTTCCACTAATCTAA
+GCGATGCTTTCTCACGCCTTCCTTTAGCCTCCTGTCTTTGCGGACGTGCTG
+>ds2020-267_174
+CAGCACGTCCGCAATCCAACTGCTCAGACTCCGCAATCAACTCGTCGTCAATTCTAATGT
+ACCGCTGATCCATACTTACTATTGGCAGATTTTCGTATGTGTTGAATCTCATGTTTGTGT
+CTCTCGAACTGCCGGAGGATAGTGCATGTAGGGGTAGATCTGGTTCCTCCTCTTCTTCCT
+CATCCTCATCCCCAGCATTGCTAGGTGGAGCACGAGGTCTTTCATTCAACGCACCTCCAA
+AGCTCCGCAGCACTCTGGAGTCATCATTGCCCCTCATTTGCGGACGTGCTG
+>ds2020-267_175
+CAGCACGTCCGCAACCGAACTGCACTCAGCACGTCCGCAAATGAGACCCCATGTAGATTG
+CGGACGCACTGACCGTCATTCAGCGGTTCAGGTACGGTCAGTGCGTCCCGGATATTACGG
+TCAGTGCGTCAGGGAAGATCCCACGGTCAGTGCGTCACGCTAGAAAGCACGGTCAGTGCG
+TCGCCTTAAGCGTCCGCAAGATCTTAGGGGTTGGGACGTGCTGGGATGGGCTGATTGCGG
+ACGTGCTGCCGGCGACCTATTGCGGACGTGCTGAGGGGATGGACATTGCGG
+>ds2020-267_176
+CAGCACGTCCGCAAGCCAAAGCCCCTTCTATTGCGGACGTGCGAATGGTATCGTGTTGCG
+ACGTGCTGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTTCGCATTTCCCTGGGGTG
+TCTTCATTCCAAGCACTCGCTATGTCACTCGCAGGTCGTGTGGGTACAGGCAATATTGCC
+GGTGTGGCAACGGCGATTACCTTTGGTGGTCCTGGTGCATTATTCTGGATGTGGATGGTG
+GCAGACACGGTCAGTGCGTCGCCTTAAGCGGCGACGTGCTGCTCCTTAGAT
+>ds2020-267_177
+AAGCCCACTATTTCAAACTTTGCTTTTGCTACACTTCTTTGCTCTCTTGACCATCTGTGT
+TTATTCCCAATGGCTTTTCCCCTGTTTGTTGATACCTATGAGCATGTTGCAAAACATGAC
+AAGAAATATTATGGATCTTTCCCAGCCACCTTCACTTTGGTTGCTGGAGGTGGGGTGATT
+GATCTTGAGAAAATGTTTTCTGGAGTCCGCAAACTAAAGCGCCATTTGACGCTACACCGA
+ATGTTTGCGGGCTGTGTTCTGGGCACAGAAGCTGCTTTGCGGACGTGCTG
+>ds2020-267_178
+AAGGAGCGCACGTCCGCAACCTACCAGCCTTAGCACGTCCGCAACTCAGGGGATTGGGAC
+GTGCTGAGGGGCTAGTGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTTGTCGCTGCATTGTGTTAGTAAAGGAATCCTTACATCGAAACTTCCGAAAGGA
+TGAAGGATAAACCTATATGCATACGTATAGTACTGCAATACTATCTCCAAATGATTAATG
+ACGGCCCCGTAGACGGTCAGTGCGTCGCCTTAAGCGAGATCGGAAGAGCG
+>ds2020-267_179
+GCGACGCACTGACCGTCCAAATATGCTTAAGACGGAAGAATCCCACGAGGCGAGTAATCT
+CACCCCATGAACACGCCACCGCCATCATACCTAAGAAGGCTGTTAGGCTCACCATCAACA
+GCGATAACCCATCAATGGCCAGAGGGAAACTGACCCCCAATGAGGGCATCCAAGGTAAAC
+ATGGCAGAGCACGGTCAGTGCGTCGCCTAAGCGTAAGGAGCAGCACGTCCGCAACGTAAT
+GTCGGTCAGCACGTCCCAATGATGAGACCCTAGTTTTTGCGGACGTGCTG
+>ds2020-267_180
+CACTGACCGTGTGGTCGCTGATGTGGAAAGAAAGTGATCCTATCGCCATCAAAATGGGCT
+TAGCCTGGGCAGTCATCGGTCTAATTTACTTGGCATTTAAAACCGGTGGTTTTAAGCGTC
+ATCCACCTATGCACAATGAACATGAGAGGGGCTGCGAAACGGTCAGTGCGTCGCCTTAAG
+CGTATCTAAGGAGCAGCACGTCCGCAACTTGTATTCTCTCAGCACGTCCGCAAGGGGTAT
+TTCCTCAGCACGTCCGCAAGCTACAGGCCTTAGGAATTGCGGACGTGCTG
+>ds2020-267_181
+CAGCACGTCCGCAATCACTGGTACCTTTTGCGACGTGCTGACGGTAATGATATTGGGACG
+TGCTGAGGCAGTGGCACTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTTCATCCGGCCTCCAGCTTCCAAGCGGCTGCACCGGCAATCAGTCCGCGAAACA
+TATCATTCATAATTAACACTCCCCTTTTTCGAACTATGTGTATTGAAAGCAGTCAGAAAC
+CGCCGCTTTCACAACATTCGGCAATCAGCGTTCCAAAGATGTGTTCAAA
+>ds2020-267_182
+ACGGTGATAACCGAGAGCTGCGGAGAGAGGCTAGCTCTTTGCTTGCACGGGGGTCTGCGG
+ATGTCTGGAAGTAAGGGCGTTCGGGCTTTCGATTCTGGACGTTCGGGCTTTCGCTGGTGG
+GTATGAAGCCCGAACGCCAGGATTCAAGGAAGCCCGAACGTCCTTACTTCCAGACACGTC
+CGCAAAATACCTGTGGTCGATTGCGGACGTGTGAGGATTCGTGTCTTGCGGACGTGCTGG
+GGAATTTATCTTGCGGACGTGCTGAGGGCGAGGATCTTGCGGACGTGCT
+>ds2020-267_183
+CAGCACGTCCGCAACACCAGATCCCTGTGGTAACTTTTCTGACACCTCTTGCTAAAAACT
+CATTAATGCCAAAAGGATCGATAGACCGGGCTTTCGCCGTCTCTATGTTTACTGAACATC
+GAGATCAAGCCAGCATTTGCTCTTTTGCTCTACGTGTGGTTTCTGTCCGCACTGAGCTGG
+CCTTGGGACACCTCCGTTATTATTTTAGAGATGTACCGCCCCAGTCAAACTCCCCACCTG
+GCAGTGTCCCTGACTTGGATCGCGCCAGGTGGGATTGCGGACGTGCTG
+>ds2020-267_184
+CAGCACGTCCGCAATCTATTCCGAGTTTAGGAACCTAGGTAATAGTATCCCGATCAAACA
+GCTGACGAAGGGGATGAGCGAAACAGGGAGTCTACTAGACGGGGTTCAACTAGCGGACAC
+TCTTGGAACGGCCGGAGTAAGAAGTCCCCAAGTGAGCGTATTATGGGGGACCGTCAAGCA
+CATCCGGCAAGAATCAAAGGGGATCTCGTTGTTGCATAGCTCAGGTCGGAGCAAGGCGCC
+ATCGGACGTTCAACGGGCAACCTTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_185
+CAGCACGTCCGCAACCCAACTCCCATCAATTAACCTTCCGGCACCGGGCAGGCGTCACAC
+CCTATACGTCCACTTTCGTGTTTGCACAGTGCTGTGTTTTTAATAAACAGTTGCAGCCAG
+CTGGTATCTTCGACTGATTTCAGCTCCACGAGCAAGTCGCTTCACCTACATATCAGCGTG
+CCTTCTCCCGAAGTTACGGCACCATTTTGCCTAGTTCCTTCACCCGAGTTCTCTCAAGCG
+CCTTGGTATTCTCTACCTGACCACCTGTGTCGTTTTGCGGAGGTGCTG
+>ds2020-267_186
+CAGCACGTCCGCAAAAGTCACACCTTTTCAGGGAGAGCTAATGCTTGTTGGGTATTTTGG
+TTTGACACTGCTTCACACCCAAAAAGAAGCGAGCTACGTCTGAGTTAAACTTGGAGATGG
+AAGTCTTCTTTCGTTTCTCGACGGTGAAGTAAGACTAAGCTCATGAGCTTATTATCCTAG
+GTCGGAACAAGTTGATAGGATCCCCTTTTTTACGTCCCCATGTCCCTCCCGTGTGGCGAC
+GTGGGGGCGTAAAAAAGGAAAGAGAGGACAGGGGAAGCCCGAACGTCC
+>ds2020-267_187
+GACGCACTGACCGTTTTTTTACCGATTTCAAGTACTGGGCATTTAATTCTTGCCGACTCT
+CTGTTAAATTTTTGGACCAAAGACAAAGCCGACTTGTTTATCGCCGTCATTCAGCTGGGT
+GCGATTTCAGCGGTAATTTATTTGTACTGGGGGAGGACCAGTGTCACGGTCAGTGCGTCG
+CCTTAAGCGGTCTAAGGAGCAGCACGTCCGCAAGAGCCATTTCGTTGCGGACGTGGACCT
+GACCGTTTTGCGGACGTGCTGAGGACAGCTAGCTTGCGGACGTGCTG
+>ds2020-267_188
+CAGCACGTCCGCAATATCCCCGTATTCGACATCGGCCCACGATTTCACGTTGAGGGGCGC
+AGGGGCCCAAAACACCTCTTTTTCGGCCTCGTCAGGATTCTGAGCTGTGCCGCTTTTCGA
+GCTCTTGGAGGAACCCTTCTCGTCCTTCTTCTTCTTCTTCAAGCTCCCGAGCGCCGCAAA
+CACGTTGGTGCTATTCAGAACCACAGACTCGTCCTTTCTGTTCCCGCCTCCCACCATTTC
+TTAACCCAGCGTAAGTCTAGACTTACCGAGCTTTGCGGACGTGCTG
+>ds2020-267_189
+CAGCACGTCCGCAATCGATCCATCCCCCGTTTTTCTTTTCTTTGCTGATTCCTCTCAATG
+AAATTTGCCATGTTGCACTAAGTTACTTACGGATGTATGCATGCAATCCGGGAACACTTT
+GGGGTGAACACCCATCCGAACAAGTAGGGTCAATAGTTCAGCATTTAGGCCGTAACATTT
+AGCAAAAAAAATCTTTAACCCAACAAGTGCTCTCCGAACCAAGCTAGATAGTCTCCTATC
+ACTAGGCTCACCAACCAACCTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_190
+TATCTAAGAGCAGCACGTCCGCAAACGGTGGCCCCTCAGCACGTCCGCAAAGTGGTTGTA
+TTTTGGGAGGAGTCGCGTAGAATTGCGGACGTGTGAAGAGACCACCAAACAGGCTTTGTG
+TGAGCAATAAAGCTGTTTATTTCACCTGGGTGCAGGTGGGCTGAGTCTGAAGAGAGTCAG
+CAAAGGGTGGTGGATTATCATTAGTTCTTATAGGTTTTAGGATAGGTGGTGAAGTTAAGA
+GCAATGTTTTGCAGGCAGGAGTTCGCGATGCACGGTCAGTGCGTC
+>ds2020-267_191
+GCTCCTTTATGTAAGATGGATAAATTCCCAGATTAAGACATGAACGAAATAAAAAAAAAT
+TCCACCCATAACATCTATGTCAGCTTTTCTGTCTGAATGTATTCAGAACAACCCGCTTTC
+TAGACGATCCCTAATAGAAAAGAGGGGGGCTAGGGGTTATAGTCGACGTTGATTCATCAT
+TTTTAACGTCTCTAATTCAAAACTGAACGTGAAACTTTGGTTTCATTCGGCTCCTTTATG
+TAAGATGGATAAATTCCCAGATTAAGACATGAACGAAATAAAAA
+>ds2020-267_192
+CAGCACGTCCGCAAGGCCACCGACCTAAGTTCCTTGGAACAGGACGTCATAGAGGGTGAG
+AATCCCGTATGCGGTCGGAAAGGCGCTCTATACGTAGCTCCTTCGACGAGTCGAGTTGTT
+TGGGAATGCAGCTCTAAATGGGAGGTAAATTTCTTCTAAAGCTAAATATTGGCCAGAGAC
+CGATAGCGCACAAGTAGAGTGATCGAAAGATGAAAAGCACTTTGGAAAGAGAGTTAAAAA
+GCACGTGAAATTGTTAAAAGGAAAGGGAATTTGCGGACGTGCTG
+>ds2020-267_193
+GACGCACTGACCGTGGGCTTCCCCGTTCAGATATCGCCGGATCACAGGATATTGCCGCCT
+CCCCGACGCTTTTCGCAGGCTGTCACGTCTTTCATCGCCTCTGACTGCCAAGGCATCCAC
+CATGTGCACTTCATTACTTGACTATACAACAGGGCAACCGCGACGGTCAGTGCGTCGCCT
+AAGCGTATCTAAGGAGCAGCACGTCCGCAATTTGGGTCCCCTCAGCACGTCCGCAAGAAG
+CCTCACTCAGCACGTCCGAAAGTGTGCCTATTGCTGACGTGCTG
+>ds2020-267_194
+CAGCACGTCCGCAAGCACCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAA
+TGGGGGCAACCCTGATCCAGCAATGCCGCGTGAGTGAAGAAGGCCCTCGGGTTGTAAAGC
+TCTTTTGTCAGGGAAGAAACGGAGTTCTCTAATATAGGATTCTAATGACGGTACCTGAAG
+AATAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTAA
+TCGGAATTACTGGGCGTAAAGCGGCCCCATTGCGGACGTGCTG
+>ds2020-267_195
+CAGCACGTCCGCAATTCGGTTGCCCTAAGCGTCGCCAGTATCAACCTACTCAAAGAGGTC
+GGTGCATGGCAGCGTATCGAACAAAGCAAACGCAAAGCCGACTATACCCAAATGCAGGTA
+TGGCAAACCAATGGCGTGGGCGAGCTAAATTTTGGTGATGCTCAAACACCGCAATTATTG
+GGCAGTATGGTTGAGCCCTTTATCATCGAAAAAGCGCTGTATGACGGTTTTGACAATGAG
+AGCCTTGTCCATCAGGGAGACATGTGACTTTGCGGACGTGCTG
+>ds2020-267_196
+CAGCACGTCCGCAATGAGATGACGGTGAGCTGGATATCAAGAAATACTATGATATCATCC
+AAGAAGATCGAGTTTATATTTTCTTGGATGGTTTGGATGATCGACTTGACAAAGCCCGAA
+GTGATGTGCTCCAAATGAGTCTATTTCCTACAGTAGAGCAAGCCTATGCTCATGTTCGAC
+GAGAAGATATTCGACAAGCTGTGGTGTTAGGAGCTCCAACACCAACCGGAGTGGGGTTGC
+GGACGTGCTGGGGAGAATGAATTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_197
+CAGCACGTCCGCAAATGCCTACTCATCAGAAACCAACCATCGCCATCAGAACCTAACTAA
+AGTTCAACTCCAAAATATTACCCAAATCTTGAACTTCACTGCAAATAATCTTTGATTAAT
+CCTCTAAACGAAGTAACCTCAAGATGTCCTTAATCCACCTCCATTGGTCGAAAGCCCATC
+TGAGTAGAACTCATAGTTGACCAAAATCAGCTTAAGAATCACAAGCCGAAACCAGTAGAG
+ACACAGAACCCCTGGCCCGTTGCGGACGTGCTGCTCTTAGATA
+>ds2020-267_198
+CAGCACGTCCGCAAACCTTCCCACCTTTTGACATGCCTGGACCGCCAGAGAGATCTGGCT
+TTCTCTTCGGAGACTAGGACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGAT
+GTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTTTCCTTATTTGCCAGCGGGTTAAGCCG
+GGAACTTTAAGGATACTGCCAGTGACAAACTGGAGGAAGGCGGGGACGACGTCAAGTCAT
+CATGGCCACGGAGATCGAATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_199
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAAAGTATCCCCTCCCTCAGTGAAACT
+ATGAACCCGGGCCCAGGCTCAAATTAATATTAATATAATAATAGAGTGGAAATGAAAATG
+TGATGGTTGGGGCAACTATATCATACAAGATACTTAACTGAAAATACTGTACGGAAGGTC
+GATGGTAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAATTGA
+AACCAGTCACACTCGCAAAAACATAGGACTTGCGGACGTGCTG
+>ds2020-267_200
+TATCTAAGGAGCAGCACGTCCGCAAGGCATTACGCCTATTGCAAAGGCTATTGGCTTTTG
+ACCCGAAGGATCGACCAACTGCTGAAGAGGCACTAGCTGATCCTTACTTCAAAGGTCTAG
+CCAAAGTTGAGAGAGAACATTCTTGTCAGCCTATTTCAAAGCTGGAATTTGAATTTGAAA
+GGCGAAGAGTCACAAAGGAGGACATTAGGGAACTAATTTACCGGGAAATACTAGAATACC
+ATCCTCAGCTACTTAAGGACTACTTGATTGCGGACGTGCTG
+>ds2020-267_201
+CAGCACGTCCGCAAATGGAGTTGAGTTTTTCTTAATGGGTGGTGTGCTTTCTCTCACGGC
+TGGCTAAGTGGCGATTGACACCAAGAGAGGGTGAATATCAGCCATGAAAGTAGAGATCAA
+GTTCCCGGTTCTATGAAGTCGAACAAGGGCGTGAATTCGAGATCGCGGGCAGCGACTCAC
+GACTAAGTGGACACACAGGTCGCTGAACGTGGTGCACGACAAGGACAGTCGGTTCTCGTT
+GGTGACAAACGGATACAACGCCCTACATTGCGGACGTGCTG
+>ds2020-267_202
+CAGCACGTCCGGAAGCACTGATCGGTCAGAGGTCAACATAATGGCTGGCTGCGTCGTCGG
+GTCAGAGGCACGTGTTACCACGGTAGCTACTGAGCTGAAACGTTACGGTTTTGAACTAAG
+GGTTAGCGATAAGCTCGCTCTAGGCGTCGGCAACCCAAGGAAAGACTACGCGTTCACGAC
+CAACGCTCAGCAGACAGTTGCGGCAAGGATAGAGCGAACAAGCCGTCAAATCGGTAAGCG
+CGCTGCTACAAGCACGTTCATGTCGAAGCTGACCGTGGCGT
+>ds2020-267_203
+CAGCACGTCCGCAAAGGAACCGCCCTCTTTGGATGGGTAGAAAGAATAAGTACAATTTTG
+AATGTTTTGCTTATCCACAAAGTAACAAATATTATAATTGGATCGTTCAATCATTTTTCA
+GTCATTCATTGAATGATAAATCACTACAAGTGAAGGAGATACACGATTTAAATAACGAAA
+GATCCAATATTTAAAAATTGTATCTAAAATGACTGGAAAAGTAGAAACAAGACCGATACG
+GCTTGCGGACGTGCTACCCAGGTGTTCTTGCGGACGTGCTG
+>ds2020-267_204
+CAGCACGTCCGCAATTGGATACCGGTCATTCACTGAATTCGTTGATAGAGTAGGCGGTGT
+GTCAAGGTACGGAGCACATTTTTACGTCGATCACCACGTGTTTGCATCTTCATTTGAGGA
+GGGCCACGTCCTTGGCGATGTTGTAGAAGAAGAGGACTATAACGCAGCAACCATTTGCGG
+ACGTTACGCGTCGGACATAACCTTTTCCTGCGAGTCAGAAACGCCAGATTTTGAATTGGT
+AGCAAGATTTCTGTCGTCGGAAGCTGCGGACGTGCTGAG
+>ds2020-267_205
+GACGCACTGACCGTTCGGGTTTTTCTGTTCTGTTGTGGGAAGGGGGGATTTTCGCATCTA
+CAAGTTGAGAGTGTGCTGGGGCAAGTGGGCTAACCCGAACTCCCTGTAAGGGGCTTTTCC
+TTCAATAGGAATAAGGGTAATGTAACTCTTGTTTGAGAACTTTAGCTACGTACTTAGGTT
+AGTTAGCTCAGCTTCTCCTATGTCTATTTGGATTAAGGAAGTGGGGTAATGGGCAGACAA
+GGAGGTCCTAATAATGGTGGGTCGAAAGCCCGAACGTCC
+>ds2020-267_206
+CAGCACGTCCGCAAGAAGCCGCCCCTTGTTTCAAAGAGAGGAGGACGGGTTATTCACATT
+TCATTTGATGGTCAGAAGGCCGTATGCTTTGGAAGAAGCTTGTACAGTTTGGGAAGGGGT
+TTTGATTGATCAAAAAGAAGAATCTACTTCAACCGATATGCCCTTAGGCACGGCCATACA
+TAACATAGAAATCACACTTGGAAAGAGTGGACAATTAGCTAGAGCAGCAGGTGCTGTAGC
+GAAACTGATTGCAAAAGAAGGGAAATTGCGGACGTGCTG
+>ds2020-267_207
+TCTGGAAGTAAGGACGTTCGGGCTTCCCTATACCTTCTGCATAATGAATTAACTAGAAAT
+AACTTTGCAAGGAGAGCCAAAGCTAAGACCCCCGAAACCAGACGAGCTACCTAAGAACAG
+CTAAAAGAGCACACCCGTCTATGTAGCAAAATAGTGGGAAGATTTATAGGTAGAGGCGAC
+AAACCTACCGAGCCTGGTGATAGCTGGTTGTCCAAGATAGAATCTTAGTTCAACTTTAAA
+TTTGCCCACAGAACCCCCTCAACAAAGCCCGAACGTCC
+>ds2020-267_208
+CAGCACGTCCGCAATACCCATGCGCTACAATGGCGACTACAGAGGGTTAATCCTTAAAAG
+TCGTCTCAGTTCGGATTGTCCTCTGCAACTCGAGGGCATGAAGTTGGAATCGCTAGTAAT
+CGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACAC
+CATGGGAGTTTGTTGCACCAGAAGTAGCTAGCCTAACTGCAAAGAGGGCGGTTACCACGG
+TGTGGCCGATGACTGGGGTAGATTTGCGGACGTGCTA
+>ds2020-267_209
+CAGCACGTCCGCAATATACCACGCGTTACTGGTTCCCGGAAGAGTTAATATCTCCATTAG
+CTAAACCCTTTCTTACCCTTCCCTTGGACTCGTATTTTGTTTGTACACAATCAACGGAGG
+CCTCCCCGACATATGTTGCAACGTCTTCAATAGCATGCTCTTATTTCGTCTTTCCCTTAA
+TAAGTCATCAAATTTGGTGCTTTTTGATCCCCAGTTGCTATGGAGAACAAAGGACGAAAT
+AAGAGCATGCTATTGAAGACGGTTTGCGGACGTGCTG
+>ds2020-267_210
+CAGCACGTCCGCAACGGTCGACCTCTCCTGATGTATCTGTCAGTAATGGAAGCATCCATG
+AGTTGTGTCCTTGGTCAGCACGATGAAACGGGTAGGAAGGAAAGAGCCTTATACTATCTC
+AGCAAGAAGTTCACTGATTATGAGACAAGGTATACGGTTCTAGAAAAGACCTGTTGTGCT
+CTTACACGGGCCTCGCAACGCCTACGCCACTACATGTTGAACTATACGACCATGCTGATT
+GCAAGGGTGGACCCGGTGAAGATTGCGGACGTGCTG
+>ds2020-267_211
+CAGCACGTCCGCAACCACGGCCCCCTATCGAAACGACAGAGTTGTCGTCGTTTATAGCCT
+CATCGACGACGAGACGGTTCGGCGACTTCTTCCGCTCCAGAATCGCGGTCGAGAAGTCCT
+TCTTCTTCGAGTCGGACGATTCGGCTGGGTGAGCCATGGTGGAGATTTCAGAGATCAGGA
+AAGTACGGTAGACGAAAAGCAAACAGACCAAGAGAGAGAGAGAGAGAAAGAGAACATTGC
+GGACGTGCTGAGGCCCATATTTTTGCGGACGTGCTG
+>ds2020-267_212
+CAGCACGTCCGCAATCCGAGACCCCACCACGCGAAATGCTTTTCATCGTTGCCATGAAAA
+TTGCCATTTTTTATTTTGGTCCTTTGTGGTTTTTGCCGTCCCACGTTTAATCAATAATGC
+CACACAGGCGATTGGATAAAGTGGGGCGGTGGGGGTCAAGGGGAGGGCCTACCGACGGTC
+AGTGCGTCGCCTTAAGCGTATCTAAGAGCAGCACGTCGCAAGATGTTAACAGTAGCATTG
+CGGACGTCTGAGGACAGCGTGTTTGCGGACGTGCTG
+>ds2020-267_213
+GGACGTTCGGGCTTCCTAAAGCGGTTATCCCTTCCGAACATAGCTACCCGGCGATGCGAC
+TGACGTCACAACCGGTACACCAGAGGTTCGTCAACTCTGGTCCTCTCGTACTAGGAGCAG
+ATCCTCTCAAATTTCCAGCGCCCACGGTAGATAGGGACCAAGCCCGAACGTCCAATCTAA
+GGAGCAGCACGTCCGCAACAATCAGGCGTTATTGCGGACGGCTGACGGGCTGCAAATTGC
+GGACGTGCTGAGTGGATACCGTTTGCGGACGTGCTG
+>ds2020-267_214
+TCTAAGGAGCAGCACGTCCGCAAGGATCGGCCGCTTCCGCAAAGACCTAAGGGTTGCGGA
+CGTGCTAGGGTTGAGGTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTCTACTGTTCGGTATGGCGTCGTTTGGGTAGTGAAGTGGTAGTGTTTGAAGCCA
+AGCCAGAATTTTTGGCAGCGGCAGACAAAGCGGTGAGCAAAGAAGCGGCAAAACTACTAA
+AAGCCCAAGGAGTAATGTCAAAACGGTCAGTGCGTC
+>ds2020-267_215
+TATCTAAGGAGCAGCACGTCCGCAATGTTCTCGTCGTTTCTTCGTGGTCGTAACAATCAC
+TTCAAGCAGTGGAAATAACAAAAGATGTGCTCCAAGTCCTTGGGCTCTTGAACAGAATTC
+AACCACACTGGAATGGATGGTACAAAGTCCTCCAGCTTTTCATACTTTTGGAGAACTTCC
+AGCTATCAAGGAAACCGTGAAGTAAAAGAAGAAAAGGTAGACCACTAATACTAAGAACCT
+AACAGAACAAGCAATGCCCCGTTGCGGACGTGCTG
+>ds2020-267_216
+ATCTAAGGAGCAGCACGTCCGCAAAGACTTCCGACTACTTGGGACGTGTGACTCCTTCTG
+GGTTGCGGACGTGCTGAGTGGTTTTGTCTTGCGGACGTGCTGCTCCTTAGATTATCTAAG
+GAGCAGCACGTCCGCAAACTAAGTCAGCTCAGCACGTCGCAAAACCGCGGAATTGGGACG
+TGAGGGGCTACGCATTGCGGACGTGCTGCTCCTTAGATAATCTCAGGGTTCGTTTGTTGC
+GGACGTGTGTCCGATTTAGTATTGCGGACGTGCTG
+>ds2020-267_217
+TGTAAGGACGTTCGGGCTTCGCCCACCCGGTGACGTTCGGGCTTATTGGAGTGGGTGTTG
+GAATTTTGAGAGGATTTGTCCCTAGTACGAGAGGACCGGGATGAACGTACCTCTGGTGGA
+GCAGTTGTCGCGCCAGCGGCAGTGCTGCATAGCTATGTACGGACGGGATAACCGCTGAAA
+GCATCTAAGCGGGAAACCCACCTCAAAACGAGAATTCCCTTGAGAACCGTGGAAGACGAC
+CACGTTGATAGACCGCGGTGGAAGCCCGAACGTCC
+>ds2020-267_218
+GGACGTTCGGGCTTCGGGATCGAGGTATCATTAGCCGAAGAAGACCCTGGCCAATCCACG
+TGGCCTGCTTGACGAACGTCAGCGACGGAGACATCGTAAATTGGTCCGCGGGCATCGCAA
+TAAATCCTCTGTCCTACTACAGGTGCCGCGATAACCTTTACCAAGTCCGAACGATTGTCG
+ACCACCAGATCCGCTGGTCTGCAATATTCACCCTAGCCCACAAGCACAAATCCTCGGCGC
+GGAATATAATCCTAAAACCGTTGCGGACGTCCTG
+>ds2020-267_219
+CAGCACGTCCGCAACATGCTAGCTCTTAATTTTTTTTTAATTTTCCTTTTTCCTTGCATG
+AAATTTTGTTGCCAAAATTAAATTTCATATGATAGTTGATTTGCTACCAAGTTGGTGTGC
+CTTTCTTGTGGTTTTGGTCTAAATTATCTTAGCAAGGTGCTATATTGGCCTCTCCGTCCA
+AGGAGAAAAGTGAGAATTCACAGACCATTGGGAGGAACTGTTCTACTGGAATTACCAAAT
+ATGCCGAACGGATGAACTCTTGCGGACGTGCTG
+>ds2020-267_220
+TGTATTCATTATACCGGTCCTTTACTTGCTGTTGCGCTGCGATACGTGCCCTGGTTAGGT
+TTGTAGGCTTACAAACACAATCAGAGGTGATCTCTGTGTAGTCGTGTAGAACCAATTGTA
+GCTCAGCGAAGCTACGCTTGGTTGAGGGGGGTGTCGACGGTCAGTGCGTCGCCTTAAGCG
+ACGTCCGCAACACGCACCCCATAACACTTGCGGACGTGCTGACCGAACAAGCATTGCGGA
+CGTGCTGAGAGGGGGATAATTGCGGACGTGCTG
+>ds2020-267_221
+GACGCACTGACCGTCCTTTCCCTGGTATCCGATTCTGCCGCTACAAACAATAAGTGCTTG
+CTATTAATTAAGTTTAACCATTCCCCCCGTTCTTTGCCTGATAGCCCAACTGAAGACAGT
+ATTCTAAGTACAGCTTCTTCATCATTCTCTTGAGCATCTTTAGGTCTCCCGACTAAGAAT
+TCTTGATATTTTCTGTTTCTTTCCGCTATATTGCCTTCCTCTGCATCTTTGATAGCTGCA
+CCTATTAACTCTAGGCAGCACGGTCAGTGCGTC
+>ds2020-267_222
+CAGCACGTCCGCAAGTCTCACCTGGTCGCTCCTTCTTCTTCTTCTTCTAATATTCTGTCA
+ATCGCTTCCAAGTTCAGCCCATGGAGATGGAAATGGAGGTGGTACAACAACTACTAGTAC
+TATTACTAGGGCGGTTGTTGTTGGGGAGCAGCAGCCACCACTGCCAGCTACAAATTACCA
+TGTCAGTACTTTGCTTCACACAACTCGGAAGCTTAAGCTTGGGGTTCACATGAAAATAAC
+CCATACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_223
+ATCTAAGGAGCAGCACGTCCGCAAACTAAATCGACTTTTACTTCCTCTAAATAATCAAGT
+TCGGTCAGCTTCCGTGCGACAAACAAATTACCACGAGGGTATCATGTTGTACACGTCCAG
+AGACCTCACTAAACAAGGGGCAGCACGTCCGCAAAGCCTAATCGCTTGCGGACGTGCTGA
+GGAGGTTGAGTTTGCGGACGTGCTGATGCTTAGATAGATCGGAAGCGCACGCGTCTGGCT
+TCCGTTCACTCCTGAGCTTCCCGTATGCTGTG
+>ds2020-267_224
+AAGCACGTCCGCAACCTCTCTCGACTGCCCAATCTCGTTCCCTCCCCAGAGTGCCAGTTG
+CTGAGTACATGCAGGGAGAGCCAATCCACAGTAGGTTGCGCAAATTGACCACTTCTCTTG
+CGGGGACTCTCCCAACGCACAAACTTGCGTTCATAGCGGGCGGCATACAACATGCACTCG
+ATACCCCCGTGTCGGTGTGCGTGGACGGTGTAACCACGCACAACGCATTGATGGATGTAC
+ACACAGACGTTAATGCTCTTGCTGACGTGCTG
+>ds2020-267_225
+ATCTAAGGAGCAGCACGTCCGCAAAGTTGAGGGGATGAGTTGTGGATAGGGGTGAAAGGC
+CAATCAAACACCGTGATAGCTGGTTCTCCCCGAAATGCATACGGTGCAGCGTTGCGTGTT
+TCTTGCCGGAGGTAGAGCACTGGATAGCCGATGGGCCCTACAAGGTTACTGACGTTAGCC
+AAACTCCGAATGCCGGTAAGTGAGAGCGCAGCAGTGAGACTGCGGGGGATAAGCTCCGTA
+GTCGAGAGGGGAAAACGAAAGCCCGAACGTCC
+>ds2020-267_226
+GGACGTCCGGGCTTGGTTGCTCCCCTCTGCCTTTGCACTCGAGGGCCAATCTCCGTCTGG
+CCCGAGGAAACCTTTGCACGCCTCCGTTACCTTTTGGGAGGCCTACGCCCCATAGAAACT
+GTCTACCTGAGAATGTCCCTTGGCCCGTAGGTCCTGACACAAGGTTAGAATTCTAGCTCT
+TCCAGAGTGGTATCTCACTGATGGCTCGGGCCCCCCCGGAAGGGGGCCTTCTTCGCCTTC
+CACCTAAGCTGCGGGGAATTGCGGACGTGCTG
+>ds2020-267_227
+CAGCACGTCCGCAACTGGCAACCCGCGCTTTAACGATTTTGTGCGACACTGATTTGATTA
+AACTCATTGGGTGTTTTGACCAACCCGTTAACTTGAATCACCATTTCTTGGTTTTGATTG
+GTGATAGTACCGACAGGTAATTCGACGTTCTGTGGGCGTAGCGCATTGCTAATTTGATTG
+ACTGAGACTTTATAGGCATTCATTTGGGTGGGATTGAGCAGCACACGGATTTGACGCTGC
+CGACCCACCGGGCCCAGATTGCGGACGTGCTG
+>ds2020-267_228
+CAGCACGTCCGCAAGCTCACATGGGTTATCTCTCTGCTCATCCACTACTACCTAATTTGG
+AATTATCATTCTCATCATTTCACTAAAATCAATTAAATTAAATTAAATTCATCACCTCTA
+TCAATTGATCCTCCAGAAGGCTTTTTCACCACTGCTTCTGGAGCCTCTGTAAAACAGACC
+AAAAGAAACCAAATTTACCACAAACACTCTGTAAAGTTTTCATCTTTTTACTGTTTCACT
+GTGTGAGAGAGACGAAATTGCGGACGTGCTG
+>ds2020-267_229
+CAGCACGTCCGCAATCCGCTGGCTGTATTTGTTGCTTTAGGTTTGTTTAGTAGAAGGTGC
+ACTGGGGTAGGCTCTGGTGGTAGTGGAGGTGGTGGAGGAGGAGCCGATTTTGGTGGTGGA
+GGAGGAGCCGATTGCGGTGATGGAGGAGGGGCTGATTTCGGTGGTGGAGGAGGAGGAGGA
+GGAGGTGATTTCGGTGGTGGAGGAGGTGGTGGAGGAGGAGGAGGAGGAGATTTCGGTGGT
+GGAGAAGGGATAGTTTGCGGACGTGCTG
+>ds2020-267_230
+CAGCACGTCCGCAAATCAGTGCCGCTACCTACTTCTACTAAGGCGGAGCTTAATAGGAGC
+AAGAGACTTGGTGGCAACAACCAGAATGAAATATTATTTAATCGTGGAAATGCCATGTCA
+GGTGCACCTATTAGAATCGGAACAGACCAATTACCAGATCCACCTATCATCGCCGGCATA
+ACCATAAAAAAGATCATTAAAAAAGCGTGAGCCGTTATTAAAACATTATAAAGTTGATGA
+TTACCACCATTCGCTTGCGGACGTGCTG
+>ds2020-267_231
+CAGCACGTCCGCAATGTTACCGCCCTCCCCTTAGATGTCTATGCATCCTTTAGCATCTCC
+CGATTTTTTTTTATATCGTTATATCTGCCCTCTCTCCATTTTTTTGAGAGAGAGCAGATG
+GATCCTATCCCCTATATCGAACACTAAATCCTATCTATTGATAGAAAGATCTTCGTCAAA
+TACCGGACTTTGCCTTTTTTTAGGAATTCCTCATATCCAAGGCAGCTTACCACAAGCACC
+CCATACGATACTAGTTGCGGACGTGCTG
+>ds2020-267_232
+CAGCACGTCCGCAAAACTGATGCAATAATGGTGGCTGCCTCAGCATCAGAAATGGAGGCT
+TCTCTAACTCTCATTAGTATCTGCTGCTTAAATGCCCTCCTCTCTCTCTGCCTCAGCCCT
+TCACCCACCTCCAATTGCACAGCAAATCTCGCCACACAACTAGAAAACGGGTGGTTCTCG
+AAGAACCTATTTTCCCTGCACTCTCTTGTTGTCTTCTTCTCCTTAACCCCACCACCACCA
+CCGGCTACCCCAGCTTGCGGACGTGCTG
+>ds2020-267_233
+GACGCACTGACCGTACCATCGCACCTTCAATAATCGATGAGCCAATCGCCACATGAGATA
+GTTGCACCAAAGCAAAGCCTAACAGTAAGCTCGTCACCAATAAGCCTAAACCCAATTATT
+TGTGACGGGCAAACACCATGCCCATGCCAACTGCAAGCACCACGTGAGTGAACATAGGAC
+GGTCAGTGCGTCGCCTTAAGCGACAGCACGTCCGCAATAATATGCCTCCACGTCCGCAAA
+TAACTGGCTATCTTTTGCGGACGTGCTG
+>ds2020-267_234
+GACGCACTGACCGTGGGGGTCCTCGTAGGCAATCGCTGTATTGTCGTCAATAGGTTTATC
+GGTGACTGCTTGAACGGCAGGACCTTTTGGGATAACTTTTACTACAGGTACCACAACCGC
+AGGTTTGGGTTGAGCATTCATAGGTGCACTTGCGCAACAGATTTGTTAGTGCTTTTGAAA
+CGGTCAGTGCGTCGCCTAAGCGCACGTCCGCAACATGAATCTCCTAAGCTTGCGGACGTG
+CTGGCGGAGGAACCTTGCGGACGTGCTG
+>ds2020-267_235
+CAGCACGTCCGCAATTCTTGGCTAGTGACGAGGCACTTCAACGGGTTGTACGAGTCGATT
+TACTTTGATGCACCAACCGAGGTGGAAGCCATGTTTTATGACAGGCTGCCGAACATGCCA
+GTCCGGAAGCCAAAAACAGAAAAACAGATAGACGGTCTAGGCTACACGAAGATCACGTCG
+AATCACCACATCCATTTCACTCCGTCCGAAGTGAGAAAGGCGGTTAGGAATGAAGCACGC
+GACAAGCCGAAGTTTGCGGACGTGCTG
+>ds2020-267_236
+CAGCACGTCCGCAAAGAACTCCGACTTCTGGAAGGGATGCATTTATTAGATAAAAGGCTG
+ACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCACAGCCATC
+GTGCTGGCGACGCATCATTCAAATATCTGCCCTATCAACTTTCGATGGTAGGATAGTGGC
+CTACCATGGTGGTGACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAG
+AAACGGCTACCACATCCAAGGAAGGC
+>ds2020-267_237
+GTTATCCCTGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAAAGGAT
+CGATAGGCCACGCTTTCACGGTTCGTATTCGTACTGGAAATCAGAATCAAACGAGCTTTT
+ACCCTTTTGTTCCACACGAGATTTCTGTTCTCGTTGAGCTCATCTTAGGACACCTGCGTT
+ATCTTTTAACAGATGTGCCGCCCCAGCCAAACTCCCCACCTGGCAGTGTCCCTGACTTGG
+ATCGCGCCTAAGTTGCGGACGTGCTG
+>ds2020-267_238
+CAGCACGTCCGCAAACTTTGTCAACTGGTTGTTGGGAGGGTTTCTTCTCAGTAACGTAGC
+TAACGCGTGAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTGAAACTCAAAGGAATTG
+ACGGGGACCCGCACAAGCGGTGGATGATGTGGTTTAATTCGATGCAACGCGAAAAACCTT
+ACCTACCCTTGACATGTCTGGAATCCTGAAGAGATTTGGGAGTGCTCGAAAGAGAGCCAG
+AACTCCAGGTGCTTGCGGACGTGCTG
+>ds2020-267_239
+CGGAACTTCCGCAATCTCGGCCCTGGATAGAATTTCTTGGGTCTTCAACAAAAAAATTCT
+AAGTTTCAGTACAAATAATGATATATATTGTTAATTATTCAATTTAAATTTTAAATGGGG
+ATTCCTTGCTCAAAGATGTTCGTTTGTACGTGTATCAGATATATAACACATGAGGCTTGT
+GATAGGGCAGCACGTCCGCAAGACACAGACGGTATCTTGCGGACGTGCTGAGAGCGGCTA
+CCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_240
+GACGCACTGACCGTTTTTGGCAAGGTTTAAATCATGGCTAATCAAAAGCATCGCCATGCC
+CCGCTCGTTTTTTAGCCGATGCAGTAACCCCAAAATCTCATGGCGTAAAGTCACATCTAG
+GGCGGTGGAGGTGGGGTACTACGGTCAGTGCGTCGCCTTAAGCGATCTAAGGAGCAGCAC
+GTCCGCAACTCCTCATCCCTCAGCACGTCCGCAATCGATCGTTGGCCACGTCCGCAAGTG
+GGGTCAGGTACATTGCGGACGTGCTG
+>ds2020-267_241
+CAGTTCGTCCGCAACTCTACCCGGATGCCCTTGCGGACGTGCTGACGGGTAAACTATTGC
+GACGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGCCACCACATCCGCCTCAGC
+ACGTCTGCAACTCCGTAAATGTGCGACGTGGAGGTATAGGATCTTGCGGACGTGCTGCTC
+CTTAGATTATCTAAGGAGCAGCCGTCCGCAACACTGATGGCCTCAGCACGTCGCAATCCT
+ATCCCATTTAGTTTGCGGACGTGCTG
+>ds2020-267_242
+CAGCACGTCCGCGAATGCCTCGGCGCGTCCGGTGGCTGGGCCCGCGGCGCGGCCGCGGTG
+GGGGTGGCGCAGCCTGTGCGCCGCCGGGTGCGGGTGTGGTGCGGGCGTGGGGTGGGCCCG
+GGGTTGGGGGGGTGGGGGTGGGGAGGGGGGCGTGCCGATGGAGGTAAGGGGCGGGACGTG
+GGGGAGGGTCGAGGGTTGAGATTGCGAGGTGGTGAGGTCAGGGTCATTGCGGACGTGCTG
+AGAGGCTTTCAATTGCGGACGTGCTG
+>ds2020-267_243
+CAGCACGTCCGCAATTTCATCCTTTTTCAAACCTGCCCCCGATCAGTGCAATGGGATGTG
+TCTATTTATCTATCTCTTGACTCGAAATGGGAGCAGGTTTGAAAAAGGATCTTAGAGTGT
+CTAGGGTTGGGCCAGGAGGGTCTCTTAACGCCTTCTTTTTTCTTCTCATCGGAGTTATTT
+CACAAAGACTTGCCATGGTAAGGAAGAAGGGAGGAACAAGCACACTTGGAGAGCGCAGTA
+CAACGGGTCAAACGGTCAGTGCGTC
+>ds2020-267_244
+CAGCACGTCCGCAAGATGGACACCCTGTAGATTGCGGACGTGCGACAGATTATTCATTGC
+GGACGTGTGAGAGTCTATCTTTGCGGACGTGCTGCTCCTTAGATACAGGAAGTAGGACGT
+TCGGGCTTTCCAGCGGCACTTGCTGTCGCTTATAATAACACACACGTCCAGGTTTGAGAT
+TGACTATGGTGGCTTATCATATCATGTTGTTACATGTTAGTAACAAAGGTTCTTTTTGGT
+AGGGAGTGTATAAGCCCGAACGTCC
+>ds2020-267_245
+CAGCACGTCCGCAAAGCCTCCGCCCTGATTCTTGATTAATAAACATGCCCTAATAAAAGG
+AGATTGATTATCGGGAATGGGTTAGGAATCGTAATTCAACTTTCTAATTGAAACAAACAT
+TATATTTCAAGCTAATATTGATGATGATTGTTGTTGGAAACAAACATAATATTTCTAGCA
+GATATATATTATATCCAGCTCCTCCTATCCTATAACAGAAAGAAAGAAAGGAGGGATAAT
+GAAGATCGAGTTGCGGACGTGCTG
+>ds2020-267_246
+CAGCACGTCCGCAATACCTGACGCTTCACTTGTTTCCGAACAAAATCGTCTAGTCGCGCT
+CTTCACGAGCTAATTGGTAAAAAGTCTACTGTCTAGTAGCATATTCACATCAAGGAAAGA
+ATCTTCGTCAAAATGGCTTATCAAAAGTCAGACAAGTCAACTGTCTCCGGCACAACAATC
+ACGCCAGATGACTCAGCCTCGCAAGCTGGACCACACATCGACACCCCTACCAAGTATCAC
+ATGCACCGGAAAGCCCGAACGTCC
+>ds2020-267_247
+GACGCACTGACCGTGAAAACGCCTCTGACGCACTGACCGTCTGTCGTTGGCTGACGCACT
+GACCGTTGGGAACGCTCTGACGCACTACCGTTCTATAGGGGTGTGTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATATCATACCGTTGCGGACGGCTGAG
+GCTCGAGAATTGCGGACGTGCTGAGGTGTTTCTATTGCGGACGTGCTGAGCGCATATAGC
+TTGCGGACGGCTGCTCCTTAGATA
+>ds2020-267_248
+CAGCACGTCCGCAATACGTATCATCTTGCGACGTGCTGGGTGATTGACCTTGCGCACGTG
+CTGAGAGGAAGTGACTTGCCGACGTGCTGCTCCTTAGATAATCGAAGGGGCAGCACGTCC
+GCCAACTACTTTACCTCAGCCGTCCGCAAAACACCGAGCCATACTTGCGGACGTGCTGCT
+CCTTAGATTATCTAAGGAGCAGCACGTCGCATCAGTCACCGGTCAGCACGTCCGCAAAAG
+GGCCTCGGTATTGCGGACGTGCTG
+>ds2020-267_249
+TCAGCACGTCCGCAATCTGCGACCCCTGGAGTAATGTATTCTATGAATAATAAATAAATA
+TGAAGAATACTCTTTCAATCAAAGAAATATTTCAATTATTTTCGTGTTCGTATTTCGAAA
+GTAAAAAAACGTAAAAGGAATACAAAAGGTAGGAAATTTATTACAGCTGAATTCTTCATA
+AATTTTCTATTTCGATGAACTGACTCTTACAAAAGTTGTATATGGACCATGAGGAAGAAC
+AGACCCCCATTGCGGACGTGCTG
+>ds2020-267_250
+CAGCACGTCCGCAATACCCCACCACTATGAATGCTGGAAGCAACCCAACGCAAACTTGCA
+TAGGACATGCAAAGGGATATGATCAATACTCTCAACTCACCTGGGCACATAATGCACCAA
+TCGGTAGTTACAAGCAAAAGATCTTAAAACTCCTTCCTCTTTATTTTTCTCTCGATACTC
+TTCGACCCCTTTATCGCAATTAAAACTAAGCACAAAATTTATCTGCGCTGAAGAAAAAGG
+GCCACTCTATTGCGGACGTGCTG
+>ds2020-267_251
+CCGATCTATCTAAGGAGCAGCACGTCCGCAACAGGCAGTCTCACGATCGGGCATGAGCGT
+CCGGAAGTTGTCATTGTATACTCCCGCGGGTCGGAAGGCGGCGGGGGAAGGAGGAGGACA
+CTGGGCGGGATCTATCAGCAGCGAATTCCCCATACAGATAGAGGCGCCTATCAAAAAGAT
+ACTCCGAAGGCTTCGGGATCGAGGTATCATTAGCCGAAGAAGACCCTGGCCAATCCAACG
+GACCATACTTGCGGACGTGCTG
+>ds2020-267_252
+TCAGCACGTCCGCAATTCTATTTCACTCCATACCTAGCAAAAACAGGCTGGCTAAAAAAA
+TAAGACGACGTTTGAACAGGGGTCTTAGCTTGATGGCACTCACCAAGGTCAATTAAGCCC
+TATGTTAAATTAGTTAAATTGACGCCCAATAAATTTGACGGTTTCATCCTTGGCTTTTTT
+GACGGCAAGTTTGCGGTTTTGTCCTAGCAGTAATTTAATTTGCCACAGTTTTTCTTGATA
+CAAGGTTGTTGCGGACGTGCTG
+>ds2020-267_253
+GCGACGCACTGACCGTACTTTACCACAATTTATAGCTCGTGCAATTACCCAATCTCAAAC
+GGGTCATCTGGATTGATAGCCCAAAGTCCACTGAGGATTTTAGCTATATGCAAAAATTCT
+CAGCGTGGATTGCCTAAGGCGATGCCGATGATCCGGCAGTGGCGGAACGTGCCAAAAAGC
+TCAACCCCAATAACCCCCTCACTTTGCGGACGTGCTGAGGACATAGTAGTTGCGGACGTG
+CTGAGTATTATCTGGTTGCGGA
+>ds2020-267_254
+CAGCACGTCCGCAAAATGTCCTGGCTGGTTGGGACGTGCTGAGGCTCCTTACATTGCGGA
+CGTGCTGAGGCTAAAGTTGTTGCGACGTGCTGCTCCTTAGATCGCTTAGGCGACGCACTG
+ACCGTGGGCTTTGGGGTGTTTAAAGTGTAAAGCTGCAAAGGGTTGTTACCAATCGGTAAA
+TGTTGCTCGTGGGTCGCCCCTGCGGTGGGGAACGGTGTGGGAACGGTCAGTGCGTCAGGG
+TACTCCCAACGGTCAGTGCGTC
+>ds2020-267_255
+CAGCACGTCCGCAAACTGGCTGAGTTCTCTGTAGCTTTGCATACCACCAGTACCGCGGGA
+GAACAACTCAACGCTAAGTTCCCCCTGGACGACTTGAGGGGATACTGTTGCGGAGAAAGC
+AACTATGAGATGCTGGGTTTGGGTGGTGCTGTCGTCTACCACAGCTTGGTCAAGGATGCA
+GGTTGTCAGGCTCCAAGGTCAATTCTGAAAGGTTGCTGGAGCGAGGACGAGAAGGACGAA
+GAAGTCGTTGCGGACGGGCTG
+>ds2020-267_256
+CAGCAGTCCGCAATAGGCCCCGACTTCCGGGAGGGGTGTATTTATTAGATAAAAAACCAA
+CGCGGCTCGCCGCTCTTTTGGTGATTCATAATAACTTGTCGAATCGCATGGCCTTGCGCC
+GGCGATGCTTCATTCAAATATCTGCCCTATCAACTTTCGATGGTAGGATAGAGGCCTACC
+ATGGTTTCAACGGGTAACGGGGAATAAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACG
+GCTACCACATCCAAGGAAGGC
+>ds2020-267_257
+CAGCACGTCCGCAACAACCATCAATTAAATGTAGGAGCTATTCATGTTTTCACATGTAGA
+ACCGTATGCGGGTGACCCGATTTTGGGGCTGATGGACAAGCATAAACAAGACCCACGTGC
+CGACAAAGTTAATTTGGGTGTGGGTGTCTAATTTGATAATGAGGGTAAATTACCCGTCCT
+CAACTGTGTGCAAAAAGCTGAAGCACAAATCGCAAATCCACCAAAACCACGTCCCAGCCG
+GAATTCCTTGCGGACGTGCTG
+>ds2020-267_258
+CGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTCAAGTCGGATGTGAA
+ATCCCCGGGCTCAACCTGGGAACTGCATTCGAAACTGGCAGGCTAGAGTCTTGTAGAGGG
+GGGTAGAATTCCAGGTGTAGCCGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGA
+AGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGAT
+TGTAGTTTTGCGGACGTGCTG
+>ds2020-267_259
+CAGCACGTCCGCAACTCAAACGGGGCGCACGTCCGCAATAGATCCCTCTTTTTGCGACGT
+GCTGCTCCTTAGATTATCTAAGGAGCAGCACGTCAGCAAAATAGCCCCGTTAGCACGTCC
+GCAAACGAGATCGCTCAGCCGTCCGCAATTTATGGCCATGGATGTGCGGACGTGCTGCTC
+CTTAGATAATCTAAGGAGCAGCACGTCGCAAAACACCCGTCATGTTGCGGACGTGAGCGA
+AGGCCAGTTGCGGACGTGCTG
+>ds2020-267_260
+CGTCCGCAAGTCGGATTGGGTCAGCACGTCCGCAAGAAAGGAGCCCTCAGCACGTCCGCA
+ATATTTTCTCGGTCGCCGTCCGCAAGTCAGTGTTGGTTGCGGACGTGCTGCTCCTTAGAT
+ACGCTTAAGGCGACGCACTGACCGTCGTGGGGACGCACTGACCGTACTCTTTCCCCTGAC
+GCACTGACCTTCTCATCTGATTTGACGCACTGACCGTCGTTGTGGGACTTGGCGGAGGGG
+ACAAACTACGGTCTGTGCGTC
+>ds2020-267_261
+CAGCACGTCCGCAAGGGCATACTACTCCAGTGCTGCGCCATTGGACAAGCAGTTCATACA
+ATCTTACAGCGTATTTACTTTGTAGGTTACTTACTTGGTCAATATCATACTCAGTAAAAC
+GTTGCTCAAGCCTTGTGATTAGCGGTATTACATCACTAGCAAAGACCAGCTCAACACAGC
+CCAAGTCATCAATATAGCCAATTTTATCCACCCAACGGCTTTTGAAATGACCGAATTTGC
+GGACGTGCTGCTCCTTAGAT
+>ds2020-267_262
+CAGCACGTCCGCAACTTTACCCTCTTTTTGGATGACTCACAATTATATATACTATATATT
+TCTATACGATCAGATATCATGCAAACCCTTTCTATACTAATAGCATAGAACCTTACTCTA
+TATTAATCTAACAAATATTTCATCTAATACTAATAAAAGTTAAAATTTCTTTTTTTGAAA
+TTGAAGAAGTTCTATTTGCTCAATAAACTTACCTATATTTATTTTTGTTTGTCCAGGGGT
+AGCCGCTTGCGGACGTGCTG
+>ds2020-267_263
+TCAGCACGTCCGCAATCACATACCGCTCTCGCCATGCTGGCTTATCTAAATTATGATTTG
+ATGATTGGCAATTTGGAAATGGATGTGATGGATGGCGAGCTGCGCTTTAAGACGTCGCTT
+GATTTGGAAGTGACGGGGGTGAGCGAGCTCATTATGAGTTATTTGCTACAGAGTAATTTC
+TCGTTGTTTTCACGGCTGTATGACACCATTCGCGAGATGATTGAGCAGCCCAATACTACC
+ATGGATTTGCGGACGTGCTG
+>ds2020-267_264
+CAGCACGTCCGCAAGAATCGCTGGCTGATCCAAGGGAATTTCGTACATTGTATTCATTTG
+TCTTTGTCAAGCATCCTGACATAAAGGGAACCGTCTACTGGCAAGCGAAGTCATCTCGAC
+GATGTAGCACTCTACTAATACCATAATCTTTAGTCGGAATTTTGTGAAAGAAAGAAAGGG
+CGCTCCCACATACTACTAAAAGCTCCAGCTCGGGCAATAATCCTCTCCACTCAAAAAGAA
+AGGGTCTTGCGGACGTGCTG
+>ds2020-267_265
+CAGCACGTCCGCAACACCCTCTGCATGAAGTAAGTGTAATTCCTTAACGCGAAATAGAAT
+GGCTGAACATCACGTGAGTTTGCCCGCCTTGCAAACTCACAGAGGCAGTCCAATCCACAG
+AATCTACAAGATATGCTATTTCCATTTTTTTTCTTTTGTAATCAAGTTAGCCTACAAGTC
+AGTATCTCTGATACTGAGACTCTACAATAAGCAGCTCCCATGGAAGCCCACTAGAGGGCA
+TAGTGTTTGCGGACGTGCTG
+>ds2020-267_266
+CAGCACGTCCGCAAGTTGCCCGCCAGCGTTGGTATTTCCAGTCTGTATCCCGAAGCTGCG
+TTCGGGGTGATTGAGACTGACACGTCACTGTCTAAGCTCTCTGAGATGCCCCCCGCCACC
+CTGTGCACTCTTTTGATTGTGTAGAAGTCCTCCTTCTCCATTGAGCACACTAGTGCTTGC
+CTGACATAGGATATTTCCCTCACTAACGATATTGTGAGGAGGGAAATATACTATATCAGG
+CAAGCTTTGCGGACGTGCTG
+>ds2020-267_267
+CAGCACGTCCGCAACACCCATCCACTCTTTCAGCATCCTGCAAATCTTCTTCCTTCTTCT
+TCAGTGCTGCCAATGCAGCAAGAAGATCAGACTCCAGGATTTCAAGGTTAAACCCTAGCT
+GGATATCCTGAGGATGATGAGAATTTCGGTTCATCTGTTCTTCCAGTTTCTGAGTCTGTG
+CAAACAACCTCTCAAGAAGAATCCTTGCAGGTTCCGATGCTCCATTGTCACTAATGCTCG
+ACTTATTGCGGACGTGCTG
+>ds2020-267_268
+CAGCACGTCCGCAATGCATGGCCTCTGAGTTTGTGGAAACGAACCCTCTGCCAACCTGGG
+ACGGCACGACCCACGTCTCTAAGTCTGCCAAGTTAGAACACGGGAAGACCCGCGCAATAT
+TCGCCTGCGACACCCGGTCGTATTTTGGGTTTTCGTGGATCCTAGATGCGACCCAACAGG
+CCTGGAAGAACGAACGGGTTGTCATGGATCCGGGCAAAGGTGGGAAGTGTGGGATGACGC
+AACGATTGCGGACGTGCTG
+>ds2020-267_269
+GACGCACTGACCGTCAAGCTTTCCCTCCCGACAATTTCAAGCACTCTTTGACTCTCTTTT
+CAAAGTCCTTTTCATCTTTCCCTCGCGGTACTTGTTTGCTATCGGTCTCTCGCCCGTATT
+TAGCCTTGGACAGAATTTACCGCCCGATTGGGGCTGCATTCCCAAACAACCCGTCATTGC
+ACGGTCAGTGCGTCAGGGAAAGACGTGTGCCCCTAATAGCTTGCGGACGTGCTGCCACAG
+GAGCCTTGCGGACGTGCTG
+>ds2020-267_270
+CAGCACGTCCGCAACTTAGCCGTCCTCATCATCATGAACCAGAGTCATACAAAGTAGAAC
+AAGAGGAGGAGAAGGAGAAGAAGCACGGCAGTCTTTTGGAGAAGCTTCACCGATCCGACA
+GCAGCTCTAGCTCTTCGAGCGATGAAGAGGGAGGTGAAGGAGAAGAGAAAAAGAAGAAGA
+AGAAAGAAAAGAAGGGACTGAAGGATAAGATCTCTGGTCATCATGATCAGAAGGCGGTGG
+ACAAAGCCCGAACGTCCTT
+>ds2020-267_271
+GACGCACTGACCGTTTCGGTCTCGGGACGCACTGACCGTCGAATCGGGAATAAAACGAGG
+CATATCGACACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAATAAATCGGGGATC
+GGTTGGGACGTGCTGAGGGAACGCGTATTGCGGACGTGCTGGGGTATTACGGTTGCGGAC
+GTGCTGGGGGATCGGTTGGGACGTGCTGAGGGAATGCGTATTGCGGACGTGCTAGGGTAT
+TACGGTTGCGGACGTGCTG
+>ds2020-267_272
+GGACGTTCGGGCTTTTCGTGGTGTTTGGGTTGCAATCCGCAATACTCAATGACGCTGCAG
+TCTTGCTTGGTCAGGATTTGCCCTCTTGGCTCAAGGAATGTGATGCTATGGTTGACTATA
+TGCACTTGTTTGCTGTAGCTCCGCGAGATGTCATTGATCGTATGCAAAAGCCTCTCAGCC
+TTGGGAGGCAACTCAGAATTATCTACAGAAAATTGTGCAATAGATATCGAGCTTAGTTCC
+CGGGTTTGCGGACGTGCTG
+>ds2020-267_273
+CCGATCTATCTAAGGAGCAGCCGTCCGCAACAGGCGCAGTTTGCTCAGTTGCAGGGACAG
+CAGCAGTGCTCGTCGTAGAGCCGGTGGTCGCGGGTGCAGACATTTTGACGTGGTAGCGTA
+AATGTGTGGGATGTGGGGGGAGGTAATACCTGTTAGGAGAGCGTGGAATGAACTTTTATG
+TTGGAGGTGTCAGACTTTGAGATTTACGTTCCTCAGATAATTCAGGGCAAGTTCGTTGCG
+GACGTGCTGCTCCTTAGA
+>ds2020-267_274
+ATCTAAGGAGCAGCACGTCCGCAAAGCCAATTCTGTAATATTTGTGATTCATTTTGGCGT
+GAGCTAATAATGTCTTGGGCTAAGTCTAGCAGTTCAGGATTTTTGCCGTATCGCTGCTCA
+ATATTGGCAAGCGCGATGATTTCATCAAAATGACTCAGCATGGTATTGACAAAAATCATA
+TCCGGTGAGATGGGTATATAGTCAAATTGATTGAGGGCGTTTGGGTCACTGGAGTGCACA
+GTGATTGCGGACGTGCTG
+>ds2020-267_275
+CAGCACGTCCGCAAATTTGCCGCTCTTCTTATTCCCAGAATCCTTAGCCTCTTCCTAAAT
+AAGGCCCCTCCCTAGTCCTTATTCTCTATTCCTTATAAAATGAAAGATTCATTCTTTAGC
+CAGATCAACATCCTTCTTCCTATTACCTATCTCCAGATCAAGATCCTAACATGATTTAAG
+CCATAACTCTACTATGGAAGTACTTAGTAATCCTACTTCCTATTCACTATCTACTTCCTT
+CGTCAGCCTTCCTCCATA
+>ds2020-267_276
+TAAGGAGCAGCCGTCCGCAACAGAATCCCCCTCAATTCTCCAGCGCCCACGGCAGATAGG
+GACCGAACTGTCTCACGACGTTCTAAACCCAGCTCGCGTACCACTTTAAATGGCGAACAG
+CCATACCCTTGGGACCTACTTCAGCCCCAGGATGTGATGAGCCGACATCGAGGTGCCAAA
+CACCGCCGTCGATATGAACTCTTGGGCGGTATCAGCCTGTTATCCCCGGAGTAACTTTTA
+TCCGTTGCGGACGTGCTG
+>ds2020-267_277
+GTCGCAACGTGGAAGCCCCAGCACGTCCGCAATGGGACTCCAGTCAGCACGTCCGCAAAT
+TACAGGTGGTCGGGGAAGAGTGGAATTAGAGGAAATCGGAGGTGAATTGGGTCGGGGTGA
+GGTTCGATTGGAGATAATTACGGTTTGATTGCAGAGGTTGACATTTGGGGGTTAGGGTTT
+GGTAGAGAGGGCAAGAGAGAGAGAGAGAGATAGAGGCAGAAGCGCCGAGTCCAACTGTAG
+GAACTTGCGGACGTGCTG
+>ds2020-267_278
+CAGCACGTCCGCAATGTTGGCCCTGTGCTGCAAGATTCATTGTTCGCTTTCTCAGACCTT
+TAGCACTGCAGAGGATGGGCAGAGCCAGATTCTTCTTCACCTCTACCGTGGAGATTCAGC
+TATGGCCAAGTCAGCCCATTCTTTAGGCACCTTCCAGATCACTGGTATTGCTCCAATGCC
+ACGTGGAGAGCCCAGCGTTCGCGTAGAGTTCCTAGCTGACACTGGGGGCATCACTCTCAA
+AGCATTGCGGACGTGCTG
+>ds2020-267_279
+AGGACGTTCGGGCTTTTTCGGTCGAGTTGTTTTATAGACCGGGGTTGCCCAGGGCGGGGC
+CAGGCGGGAGAAAGATACTTCGGGGATAGAATTGGATAGAGAACCTGTACCAAGAGATGT
+GTCAATTGAATAACGCGAGAAAGCCTCAAATCCCGCCCAACTCTATTGAATGAATCAGTC
+CACCTGAACCCACAGGTCAAAGGGGAAAGCAACGAGGAATTTCAAAGTGGAAAGGTAAAC
+GCAAGCCCGAACGTCCTT
+>ds2020-267_280
+CAGCACGTCCGCAATAAGGGCCCCCCCCCCCTCCTTCCTTGTCTGATTCGAGGGGGATCC
+CGTTGAGTTCTTATGCTTTCATGTCTACAACTCAGTTCATCCGATTATTACAGGGATGAA
+CCTAATCCAGAATAGGAACCATAAAAGAAAATACCGATTAAACCGATCACAAGAATACCC
+GCTACAGTACCTATTATCCAAAGAGGAATCCTTCCAGTAGTATCGGCCTATCTTTGCGGA
+CGTGCTGCTCCTTAGAT
+>ds2020-267_281
+CAGCACGTCCGCAATGTCTAGCGCATGGAGGATCCGTTGAGAGTTTCTGTTGTCTCGGTA
+GGGAACTGTATGATCTTTTCCCCTATTGTATTGAATCAATAAAAAAAAGAGGTCAGTGCT
+ACGGCCCCCTATTGTTTGATCCAATATTGACCGGGGACGAGCCCCGACTTCCATAGGTCC
+TTGGTTTGACCTCCCGTAGTGGTCCTTGCTTTTAATAAAGTGGAGCGGGGAAATTTTCTC
+GACTTGCGGACGTGCTG
+>ds2020-267_282
+CAGCACGTCCGCAAGCCGGGTCCCCTGGAAAAGTGAAAGTAGAAAGGGAAGTGCATTTCG
+GTAGAGAAATCAAGTAGGGGTGCATTTCTGTAAATACTCGGGATTCTTTGGGCTAACATT
+TTCGGTTTAGGCGGTGAAAGAAAGTTTGGGAGGAGGTTAGGATGAAAAAAGGGTGAATGG
+AAATTCGCCCCTTCTTTTTTGATGGTTTAGGCCAGATTCAGTGTACTCAGCAGCGGAGTT
+CACTTGCGGACGTGCTG
+>ds2020-267_283
+CAGCACGTCCGCAAACTTGGGTAGGTGGAGAAGTCACTTGAAATGTTTTCAGAGATGAAA
+AAATGTGGCGTGGCACCTAATGAGATAACCTTTATTGGGGTTCTTGGGGCTTGTCGACAC
+ATGGGCTTAGTCGATGAGGGGCGCCGCCATTTTGATTCCATTGTCCAGGAACACAAGATA
+GAACCCAACGTTGATTTGAGATATTGATAAGGCGAATTACCTGCCTATTCAATGCCAAGC
+GAGAAGCCCGAACGTCC
+>ds2020-267_284
+CAGCACGTCCGCAATGAGGCTTGACTCACACGTCCGCAATGAATACCCACTTCTGTTTGC
+CACTGTTGTTTTCTTTCTTCTTTTCCTTCTTGGTTATGTCTTTCTCCTTCTTCTTTGATT
+TCTCCTCGTCTTTATCAATATGTTTCTCCTCATCCTTTTTATGTTTTGGCTTCTCTTTTA
+CCACTGACTTGGTCTTTAATTCAAGTTCCACCTCAGCCTTCTCCTTCTTTAAATCCCCTG
+GTCTTGCGGACGTGCTG
+>ds2020-267_285
+GACGCACTGACCGTGACTGCTCTCCTCCGTCAATGTGCGTTTGTCAGAAGACAAAGTGCT
+ATATACCATCAATCATGCCAAACCAAAAGCGCTACTGTTAAATTCAGAATTGTCACCGAT
+GATCAAAAGCCACACCCAAGATGCGCCATCAATCGAGCATTTGATTTGGTTGGATGATAA
+CAATACGCCAATACACCCATACAGACGGTCAGTGCGTCGCCTAAGCGGGAGAGCATACCA
+ACATTGCGGACGTGCTG
+>ds2020-267_286
+CGCACGTCCGCAAATTCATGGGGGTGTTTGGTAGTATTTAATTCGTAGTATTTAACCGGT
+GGCATATATATTTATAGTACTCAGTCCGAGACTCCGAGAGTGTCACATGTGTTGTTATTG
+CCAGTGGTTGCCGTTGTGAATGAGATAGAGCCGACTACTAGGGTTTCCATGAGCATGGCA
+AATATTAGCACAGTGAGGAACCTTGACGGCTGATTTCTGAAAAGACGTCGTAGTCTCTAA
+TTTTTGCGGACGTGCTG
+>ds2020-267_287
+CAGCACGTCCGCAATACTCCGGGGCTAGACATTGCTCTACATGATACTTATTATGTGGTT
+GCACATTTCCATTATGTACTTTCTATGGGAGCCGTTTTTGCTTTATTTGCAGGATTTCAC
+TATTGGGTGGGTAAAATCTTTGGTCGGATATACCCTGAAACTTTAGGGCAAATACATTTT
+TGGATCACTTTTTTCGGGGTTAATCTGACCTTCTTTCCAATGCATTTCTTAGGGCTATCG
+GTTTGCGGACGTGCTG
+>ds2020-267_288
+CAGCACGTCCGCAAGGGGTTTTTAGTTCCTGTGGAGGATGTATGGATCGAGACACGCAGC
+TTCGACAAGTCTTTCTACCGGATACTACTGGGAGAGGTCCAGCTCGCTTGTTTGCCACGA
+ATATAATTCCTTTTAACTCATTTTTTTTATGCTAGGTTGGATCTACGGCAGTGCAGTTCT
+ACTTGAGCTTAACGATCACCAAAGGTCAGGTGAAATAGGAACGGAAAGCCAATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_289
+GGACGTTCGGGCTTCTCATGTCCCCTTTCACCCGTAGGTCGTATGCGGTATTAATTCGAG
+TTTCCCCGAGCTATCCCCCACTACTAGGCAGATTCCTAAATGTTACTCACCCGTCCGCCA
+CTAATCATATCTAGCGAGCTAGATAATCATCGTTCGACTTGCCCTGTTAAGCCCGAACGT
+CCTTACTTCAGACGTCCGCAAGTAGCAGTAGGTAATCATTGCGGACGTGCTGAGGTGCTA
+ATTTGCGGACGTGCTG
+>ds2020-267_290
+CAGCACGTGCGCAAATATACTGATGTATTCAACGAGTCTATAGCCTTGGCCGACAGGCCC
+GGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAAC
+GAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTA
+CACACCGCCCGTCGCTCCTACCGATTGAATGGTCCGGTGAAGTGTTCGGATCGCGGCGAC
+ATTGCGGACGTGCTG
+>ds2020-267_291
+CAGCACGTCCGCAATCCTTCTCCCCTCACCGTCTGAACAAGGTCCGGCATGTTCCATTCC
+GGGGGTAATTGCTTATCGGACCTCGACACCCACTTGGTGTATTCCGAACAGAGCGCCTCA
+AATATTTGCTCACACTCAGGTGGAGCGCTTTGCGCGTCAGACCTAGTCGAAGAGGTACTT
+GACGAGAAAGACATACTCTCATCGTCCAGCATAAAATGTAAATCCCCGGGGGGCAGGATG
+CTTGCGGACGTGCTG
+>ds2020-267_292
+GACGCACTGACCGTGCATCCACGCCTGACGCACTGACCGTGGTTACACACCTGACGCACT
+GACCGTAAGTAGAGACCTGACGCACTGCCGTTAGTGAGACGGTGAATAACGGTCAGTGCG
+TCGCCTTAAGCGTCACGTCCGCAATACGTCAGGGATGGCCTTGCGGACAGTCCAACTCGC
+TTGCGGACGTGCTGAGGGAAGTTTGTTTGCGGACGTGCTGACGGGTAGGAGTTGCGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_293
+ATCTAAGAGCAGCACGTCCGCAAGTTGAGAACCCTCTTGACTACAGACGTTAGCACCCGC
+AGTCTGTCTCCCGGATATCACTCATCGGTATTCGGAGTTTGCATCGGTTTGGTAAGAGAG
+GCGGCTGGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCCGTCCGCAACCAA
+TTTCGGGTAGCACGTCCGCAACATCTGCTCCTCACACTCCGCAAATTAGACCCCATATCG
+TTTGCGGACGTGCTG
+>ds2020-267_294
+TCCGCAAGCATAATCCGCTCAGCACGTCCGCAAAGGCCTACCCCCAGCACGTCCGCAAGC
+TGGAAACGGTTGCTGTTGCGACGTGCTGGGCTTAAGACCTTGCGACGTGCTGAGTCATAT
+CTGCTTGCGGACGTGCTGCTCCTTAGATATCCGCAAGGCAACTGGAATTGCGGACGTGAG
+GAGAGGATAGTTGCGGACGTGCTGAGTGACCGTACTTTGCGGACGTGCTGCCTCGAGATG
+TTTGCGGACGTGCTG
+>ds2020-267_295
+CAGCACGTCCGCAAAAGCCCCACCCTGCTTGCAAAATGAAAGAAAAGCCCCTTTTTATAA
+GTTAAAAAGACTGTTATGAAAAAAAAGTGCTAGAATCTACATTTACACATTGATTCTTTT
+TTTTCGTGATTTTTGTTGAACCGTATGCATCAAAAGGTGCATGTACGGTTTCTAATGGAT
+ACAACTTTATCCCATTAAACCGACTTTATAGAGAAAGATTAATTTTTTGAGGACTGGGTA
+ATTGCGGACGTGCTG
+>ds2020-267_296
+CAGCACGTCCGCAAGCCGAGAGCGGTTAGTAACAGATTAAGTGGAGTATTCGTCACACAC
+GACGATACCGCACTTTTACAAGGGTTCAAGTTGTTTAGCTACACAAGGTGAGCAGAGGTT
+ATTAACATGGCATCTCACTCAAGCATGGCATAGCACACAAACATGGCAAGAGGTGAAGCA
+TAAATAAACTACCTAAGCTAGTCAATTTAAGTGGGGTGAAATCCTAGACATGGCAAACTA
+TTGCGGACGTGCTG
+>ds2020-267_297
+GACGCACTGACCGTGTCCTCCTCCCTATTACTCGTGTCCATGAAGAGACGAAATCTGCTC
+GCAACCGCGCTCCTTCGAGCTCCACACCGCTTTCGGGCGGATGAGAGGCACGAAAGAGCC
+GTCGTGAGAATCGAAGAAAGACGAATTTAAAGAACAATAAGCGGACGGTCAGTGCGTCGC
+CTTAAGCGACGTCCGCAAGGAACATCCGGTACTCATTGCGGACGTGCTGAGGAGTCCGTC
+TTGCGGACGTGCTG
+>ds2020-267_298
+GGACGTTCGGGCTTGACTACAGCAGTGAATGAGGACCTGCACAAGGAGTGGCAGGAATAC
+CTGGATGAGACCAAGCATCACGAGCAGGTGCTGACCCAGGTTTTTGAAGAACTGGGATTG
+GACACCGAAGAGATGAGTCCGGGCAGAGAGGTGGTGGCGCATAACGGCGCCTCCTTGGTG
+GCCGAGTATGCATAGATTAAAGCCCGAACGTCCTTATGCGGACGTGCTACCCGGAATCTG
+TTGCGGACGTGCTG
+>ds2020-267_299
+GACGCACTGACCGTTAACCACGCGCTTCAACCTGGCCATGGGTAGATCACTCCGCTTCGG
+GTCTAGGACACGCGACTCAATCGCCCTATTCAGACTCGCTTTCGCTACGGCTTCCCCACA
+CGGGTTAACCTCGCCACGTATCACTAACTCGCAGGCTCATTCTTCAAAAGGCACGCTGTC
+ACCCCACAAGGAGGCATACGGTCAGTGCGTCGCCTTAAGCGACGTGCTGGGGAGCGCTAG
+TTGCGGACGTGCTG
+>ds2020-267_300
+CAGCACGTCCGCAAATTAGTCTGCACTTTATTCCCTTCCCAAAAGCCATAACTCCTCCTG
+GGAACCTTCTCAATCCCCAGATAACTACTACAATCAAACTTCAGGACAGAAGAATTTCCA
+TCAGCATTGTGATGCCAAGTGAATTTTAGGTTAGATGACGTGTTGCTTAACTTATGGTTG
+TGAGCTCCCTTTTCTTCATTCTCCTGGATGTTGGAACCTGACTTGGGCAGGGACTCTGTA
+TTGCGGACGTGCTG
+>ds2020-267_301
+GGACGTTCGGGCTTTGTTTGGTCAATTGTCGCTTGAGTTCAATCCAACCTGCATCGTAAA
+CCGATTTGGCTAGTTTGCCTTTTTACTGTTAAATTGGGTTGTTCTAACGTAACCTACCAC
+GATTAGGAGGCGTGAACAAAAGCCCGAACGTCCTTAATCTAAGAGCAGCACGTCCGCAAG
+GCGTCACTAGTTGCGGACGTGTGAGGGGCTATGTATTGCGGACGTGCTAAGGCCCCCTAC
+TTGCGGACGTGCTG
+>ds2020-267_302
+GTCCGCAAAATTAACACCCTCAGCACGTCCGCAATACATTCCAGTCAGCACGTCGCAATC
+AGGCAAGTTTGCGAGGAGTGCTGTATGCTTGCGGACGTCTGCTCCTTAGATAAAGGACGT
+TCGGGCTTGACCAATCGCCTGGACGTTCGGGCTTGGTGATCCCCTGCCCGCTGTCCTTGA
+CTTGACCCAAGATAGTTCATCACAAAACTTACAAAACCTACCTAACCTATCAGAGCAGTG
+AAGCCCGAACGTCC
+>ds2020-267_303
+GGGGGGGTGTGTTTGGGTGTTGGTGTTGTGGGTGGTGGGTGGGGGTGGGGGGGGGGTTTT
+GGGTTTGTTTGGTGGTGGTGGTGGGGTTTGTGGGTTGGGTGTGCTGGTGGGTTTGGGGTT
+GGTTTTGGGGTGGTGGTGGGTTTTGGGGTGGGTGTGTGGGTGTTTTGTTGTGTGGGTTGT
+GTTGTTTATACGGTCAGTGCGTCAGGGTGGGATTAACGGTCAGTGCGTCAGGGGACGATC
+GACGGTCAGTGCGC
+>ds2020-267_304
+CAGCACGTCCGCAATGCATTTTCGGTCCCTGTTGAGAAAGGCAGATTCTCTCACCCGATC
+TGGGACTACTAATCTCTGCATAATCAAATGAGCACAAAATAAACTTACACTTTGTTTATA
+CCACTGTATTTGGGGTCTCTATTTCAGAAGCTCAGCCTGTGTCCTACTTATTCAACCCCT
+TAGAGGAATACAGCACTAATATAGAGGAAAAGGTAGTTTCCAGGTAAACTGGGGCCCATT
+TGCGGACGTGCTG
+>ds2020-267_305
+CAGCACGTCCGCAATGAGTTGGCACTGAGGGCCTTGAGGGCAACGGAAACGTTCTTTGCG
+ATAGCGGGATTGAGGATGTAGTGGCACGAAATATCCCAACCAACAGCACCGAACTGGTAG
+GAAAGAGAGTACCCATAAATCAATGCGTTGATAAAGGCATCTTCATGGAGTCTACCAGCA
+CAAAGGAAAATCATACCAATCAGTGGGCGGGCACAACCAATGCGGACAAGGGTTCAGTGT
+TGCGGACGTGCTG
+>ds2020-267_306
+CAGCACGTCCGCAATGGCATGGGGATTTAAGAGTTTCAAGAGGAGGATGGGAGGAAAAGC
+TTAAGGCTTGAAGGCTATGGTATTTATAGCTTGGAAGGGTATGAGGAGGACGGAAAATCT
+TGATTGTGATGGTTGATGAATAGCTGGGATGATTGCTGGAATGCTTGCTGCAGCCAAAGG
+GAGAAAGGAAAGTGGTTCGATGGTTGTTGGGGGCTTGAGCAACCAAGAGATGCTGGTGAT
+TGCGGACGTGCTG
+>ds2020-267_307
+CAGCACGTCCGCAAATGTCGTCCCCTCAGCACGTCCGCAAACACTCCGATATGGTTGCGA
+CGTGCTAAGACTTAGTACTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTGGTTCTTCCTATCACTCGTAACGCTCTCTCTCGCTCTCACTTTCCAACTCCTC
+CCATTCCCCTTTCCCAATCCAATGGCAGCAACCAAATCCAAAATCCTCTTCATCGGAGGC
+ACTGGCTACATCG
+>ds2020-267_308
+CAGCACGTCCGCAATCACCTCTGTATTTTCTTCAAACTCTGACCTACCGTCGGACGGTGA
+TTGGGATTCAAAGTTCTCCGGCTGGAGGTCATAGTTTGAAGCAAATAGCGAGAAGGAGAG
+GGAGAAAAGATAGGTCTGTATTTGAGGAAATAATTAATATTATTATTTCTTTTTTTGTAT
+TTAAAAAATGGGTTTTGGAATTTTTGAAAAAAATAAATTGCGAAGAGAAGGTTATAGAAT
+TGCGGACGTGCTG
+>ds2020-267_309
+CAGCACGTCCGCAACCTGGCGGCCATATAACTAAAAGTAAAGATAAAGTGAATTATTTTG
+TAAATGATATAAATTCATTGTTACATGTTATAATACCCATATTTGATTATGTAAATCTGA
+ATAGTTCAAAATATCATCACTTTGATATTTTTTATTTAAAAAAGGGGGTCGGTGTTATTA
+ACTAAAAATAAAAGTCATTTAACGGCTGAAGGTAAATTGGCAATAAAAGGTCAAGAACTT
+GCGGACGTGCTG
+>ds2020-267_310
+CAGCACGTCCGCAAACCTGGTGGGGTGCAACCTGTGCGGGTGGTCCGCAGCGGAGAAGCG
+GTATGGAATTTGTCCTCCGTTTCCTTAACCAGATGCTCGTCGTGTAGCCTGTTATTGGCG
+TGAGAGCACTTGATCTCGTCTTTGACGTGTTTAGTTCGTTGACTATCTCGGTCGCGACGT
+GAAACAAAGAGATATGACACCGCAAGGGGTCTATCGGGGTACCTCAACGGACTTATGCTT
+GCGGACGTGCTG
+>ds2020-267_311
+TATCTAAGGAGCAGCACGTCCGCAAATGTGTCCCGGTTGTTGTTCGATCAAATGCCAAGC
+CCGGATTTTTATTCGTGGAAGGTGATGCTGAGGTGGTACTTTATGCACAACTTGTATGCA
+GAGGTTATGGGGTTCTATACCCGTATGAGAATATGCGTCAGAGAACATGACAACGTTGTT
+TTCTCGATTGTTCTGAAGGCTTGTAGTGAATTGCGGGACTTCAATGAGGGGAGAACTATT
+GCGGACGTGCTG
+>ds2020-267_312
+GACGCACTGACCGTGGCGGTAGCCCTCCATTCCTGAGCGCACAGGCGCTTTCTTGGATTT
+TTGCCGCTCGCTCAAAGGCCGCAACATCACCGTATTTAACTACCGCATCAACACCAACCC
+CAAATACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAC
+CACTTCACTTGGGACGTGCTGAGGTGTGCAGCGTTGCGACGTGCTGAGCCCTAGTCGATT
+GCGGACGTGCTG
+>ds2020-267_313
+CAGCACGTCCGCAAGGACACACTCTCAGCACGTCCGCAAGATTTATCTCCTCACACGTCC
+GCAACAAGGGCCGATTATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACT
+GACCGTTCCTTTGATCCTTCTGCAGGTTCACCTACAGAAACCTTGTTACGACTTTTACTT
+CCTCTAAGTGACCAAGTTTGCCTAAGTTTTCAGCGGCCTGCTACCGTTGCCGGTACAAGC
+TGCCAATCCCAA
+>ds2020-267_314
+GACGCACTGACCGTGAAAGCCTCCCTGACGCACTGACCGTTTCGTATGCTCTGACGCACT
+GCCTTATATCCCCTATGGGGGATGGGACGGTCAGTGCGTCAGGGAAGTGTCAACGGTCAG
+TGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCATTACCCGTTAGCAGT
+TGGGACGTGCTGAGGTGGCGAAATTTGGGACGTGCTGAGGGAGGGCGTATTGCGACGTGC
+TGCTCCTTGATA
+>ds2020-267_315
+CAGCACGTCCGCAAGCAGCCATAGGTCTGAGAAGCATTACCGCCAACTGGTGAATCATGC
+GTCTGAAGGCATTATTGTTGTGCAGAATCAGAAAATTGTTTTTGCTAATCCTCAGATATA
+CAAACTCACGGCACGCCAACCGGATTCTTTACTGGCATTCAATTTTACTGATTTAATTGA
+CGAAGCTGATCGGCTGATCGTACAGGATTACGAGCAGCGTTGCTTACAGGGGGAACGTTG
+CGGACGTGCTG
+>ds2020-267_316
+GACGCACTGACCTTTGTCACCACGTTTGTGATCAACGCGTAGAAACTCAGCTATTGCACC
+GAATGCGCACTTAGAGGGCTGCGTTCGTATGCAAAGCCTTTGTCCTCTCTGGAGTGTGAA
+ACGAGTTATTTCCAGTGACGTCGTCCCTAGAAGCACATCGTCACCGTTGTGCAGTGAAGA
+GCCGACTTCTTTCATCGGACCCAACATGAAGTCGGTGTAAACGGCATTTCGGACGAGTTG
+CGGACGTGCTG
+>ds2020-267_317
+CAGCACGTCCGCAATCGACCGCCATTAGCTTGGGACGTGCTGAGGAGATGGAGCTTGCGG
+ACGTGCTGAGTGCAGAATAGTTGCGGACGTGCTGCTCCTTAGATAGGAAGTAAGGACGTT
+CGGGCTTAGAATTATCCCTGGCGTTCGGCTTCCTACAGCGAGTGGAAAGCCCGAACGTCC
+TTACTTCCAGAAGTGCGTCAGCGGGTCGCATACGGTCAGTGCGTCAAGGATGTTTCGACG
+GTCAGTGCGTC
+>ds2020-267_318
+CAGCACGTCCGCAATCTGGACCCCTTTCCTTTGTTTCTACATCCCTATCCCAAAAGACTG
+AATTGAGTTCGTATAGGCATTTTGGATGCCTCTATTGAAATTGCCCTTCTGGCTATATTT
+TCTGCTACTCCGCTCATTGCAGAAAGTATTCTACAGGGTTTAACAACAGCTACCCAATAT
+TCGGGAGATCCTTTACCCGAACCCATAAGTGTATCTGTAGTGCTGAGTGTAACGTGTTTG
+CGGACGTGCTG
+>ds2020-267_319
+CAGCACGTCCGCAAATGAGTCCCCCTAGCTTGCGGACGTGCTCTGGAAGTAAGGACGTTC
+GGGCTTTATGGGAGCTCTGAGCGCATTCTGTTTTTCAAGGGTAATTCCTAGCCTTTCCGG
+ACCAGAGTTGGGCGTAGTTCCTGGATTGAAGTCTGCCTGAGAAGCTTGTACAGCAAGGCT
+CTAAGGTTGCGGCGTGCTGACGTATAGGGGTTTGCGGAGTGCTGAACTCACCAATGTTGC
+GGACGTGCTG
+>ds2020-267_320
+GGAGGCAACTTTCCCGTATGAGCATTCGGTACATGTATCAGTCCGTGGAAGAGTGAAAGG
+GTCACCACTACTGAGGATCTCCCCCCTAATCTTAGATAGGTCGTCTGAGGGTTCGCCGCG
+GTTCATTGCTGTGCTTACACACTAGGCTACCCTTCTCCGAAAGCTCCGCGGGACCACCTA
+CCACTAGTCTTCGGCCGGAGGGGTTTATTGCACAAAAACGCCAGTCCGCAAGCCCGAACG
+TCCTTAATCT
+>ds2020-267_321
+GGACGTTCGGGCTTTTTCAGTTGGGTATGAAGCCCGAAGTCCAAGGAACCTTGTAAGCCC
+GAACGTCCTTACTTCCAGACACTGACCGTCGGGGGACAATTACGGTCAGTGCGTCAGGGA
+AACCTAAAGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCTT
+TATGGTTGGGACGTGCTGAGCGGTAGTGGTTTGCGGACGTGCTGAGGGAGCGCAAGTTGC
+GGACGTGCTG
+>ds2020-267_322
+GGACGTTCGGGCTTAACATTGACTCTGGGTAACTGATGTGTAGGATAGGTGGGAGCCTGT
+GATCCGGCGTCGCTAGGCGTCGGTTAGGCAACGTTGAAATACCACCCTTCAGTTGCTTGG
+AGCCTAATCCCCGAGGGGGAGACATTGTTTGGTGGGTAGTTTGACTGGGGTGGTATCTAA
+GGAGCAGCACGTCCGCAACAGCGCCAGAGTGATTGGGACGTGCTGCCCGTGTCATATTGC
+GGACGTGCTG
+>ds2020-267_323
+CAGCACGTCCGCAAAGCCCGCGATGACTTTGTCGTTGTACAGACGGCGGACCTTTTTCAC
+GTTGCCTTTCATTACGGTATTGCCCAACGTGGCCTGACCATCACCAGCGATGACCACATG
+GCCGTTACGGCGTACGCTTACTATAGTTGTCACGAGCTGACCCCTTGGTTACGAATACAG
+AGTACAAACCCCGTACAAAAGTACGGGGCATAATGCAATTATAGATGGCTGAGGTGTTGC
+GGACGTGCTG
+>ds2020-267_324
+TTTCGATCTAGCTAAGGAGGAGCAAGTCGGCAATGAAGCCGCTTTGTATGAGGCGCTTGT
+TTCACGTTTGGGTGGAGAATATCTTGATGTCGCCTTCGATGCTGTAGGAGGGCCACATAT
+TGAACAGATTGCAAAAGCGATGTCTGTGGGAGGACCCGAATGCAACCGGTCAGTGCGTCG
+CCTTAAGCGATCCGCAAGTAGGTAGGTATAGTTGCGGACGTGCTGAGTACAGGTCACTTG
+CGGCGTGCTG
+>ds2020-267_325
+CAGCACGTCCGCAAGCTGATTCTCCTCAGCACGTCGCAATATCATTAGCCTCAGCACGTC
+GCAATAATCGGCCTTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGA
+CCGTGCGCTTCGCGCTCCCCAATTGTTCGCGCCGAAATTTTCTGTAATCCAAAATGACCC
+GCTGAGATTCGTTGTCCAAATAGTCAAATTTGCGTGATTTGATGGCGTAATAAATGTCAA
+AAATAGACAA
+>ds2020-267_326
+CAGCACGTCCGCAAAGCGGCCCGCTAGCCGTCCGCAACTATCTTCCCCTCAGCACGTCCC
+AACTAGTTCCAGATTGCGGACGTGCTGCTCCTTAGATAAGCTGGAAGTAAGGACGTTCGG
+GCTTGTGGCTCCATCTTATTTAAGGAGCAGCACGTCCGCAAGTGCCAGCTCCTAACGTTT
+GGGACGTGCTGAGGGTACCTACATTGGGACGTGCTGAGGGCAGTGAGATTGCGGACGTGC
+TGCTCCTTAG
+>ds2020-267_327
+CAGCACGTCCGCAAGACATCACCTATTGCGACAAGTTAATGGACACTCCATACACTGCAT
+CCCCAATTGGCCGTTTAGAAGCCAATGGGCTAAGTGCTGGGCTTTTCCCGTTTCGCTCGC
+CGCTACTCAGGGAATCCTAGTTAGTTTCTTTTCCTCCCCTTATTAATATGCTTAAATTCA
+GGGGGTAGTCTCATATGAGTTGAGGTCGCAAGGGAATGGGTTTGCGGTCGTGCTGCTCCT
+TAGATAGAT
+>ds2020-267_328
+CAGCACGTCCGCAATGTTCACCATTTCCATAAACAAATGAGTACTATCCTCGACTGCTAC
+TAACTTTAGTGCGTTCTCAGTTCTGCCTGACGCTCTTAATATTACGATTGACGCCGGCGC
+CTGGTTTGGCCTCAATCGCAGCCTGACATAGTTATTTGACCTTAACGCTGAAGCGCTCGC
+CGTAGCCATCACTATGCCGTGCCAATCATAACCAGAACCTCCCACTGGCGGCGTATTGCG
+GACGTGCTG
+>ds2020-267_329
+CAGCACGTCCGCAATATAATATCTCTCAGCACGTCCACAACTTGATTCTTGCGGACCTGC
+TGCTCCTTAGATACGCTTAGGCGACGCACTGACCGTGTGTAAGCGACTGGGGTACGCCGT
+TCTGGCAAATCTGTTTTATTGATGCAATATCGAGATTATTTGCTGTCCCAACAAATTAGT
+GCAGAAAATATTATTTATATCAATTTTGAGAGTTTTGAGTACCAGTGGGTTAAAGTTGCG
+GACGTGCTG
+>ds2020-267_330
+GACGCGCACTGCCGGCAGCCCGGCCCTCTGCTCTGCCCACCCGCGAAATAACCAGCACGT
+CCGCAACCATGATCCCCTAGCACGTCCGCAAACTAATTGGACTCCACGTCCGCAACTGAT
+TGGTGCTTGCGGACGTGGAGTCCAATTAGTTTGCGGACGTGCTAGGGGATCATGGTTGCG
+ACGTGCTGACGAGATCTTAATTGGGACGTGCTGAGGGACTGCGACTTGCGGCGTGCTGCT
+CCTTAGATA
+>ds2020-267_331
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTTTCGTTCCTCAGCACGTCCGCAAAG
+ATCCAATCCTCAGCACGTCCCAACCGGCTATGGTTTGCGGACGTGCTGCTCCTTAGATCT
+GGAAGTAAGCCCGAACGTCCTTACTTCCAGATCTAAGGAGCAGCACGTCCGCAAACGACA
+CTGACTCAGCCGTCCGCAACCCCTTCCCCTTCAGCACGTCCCAACCTTCCAATACTTGCG
+GACGTGCTG
+>ds2020-267_332
+CAGCACGTCCGCAAATTTCTCTCTTTCCAAAGTTCTTTTCATCTTTCCCTCACGGTACTT
+GTTCGCTATCGGTCTCTCGCCTATATTTAGCTTTAGATGGAATTTACCACCCATTTTGAG
+CTGCATTCCCAAACAACTCGACTCTTCGAGAGCACACCACAATGCATCGGTAGTCCGTGT
+CATATACGGGATTCTCACCCTCTACGACGCTCCGTTCCAGGAGGGGGGTATGCGTTGCGG
+ACGTGCTG
+>ds2020-267_333
+CAGCACGTCCGCAAGAGCCCCGTCTTCCTTCTCCTATTTCAATTCTTGACAAAGCTGGAC
+GAGCACATCATGCAAGTGTTCATATAGAGGATGGTGGAATAGTTTGAGTCTTGGCTCTTG
+TTTCATGTTGACAGTATCAGGTTCTTGATTAAGTTCCTCTGATGTGCTAACAATTTCCTG
+ACTTCATTTTATATAATAGATAGTGGAATAGTAGAAGATACCATGCATGGCCTATTGCGG
+ACGTGCTG
+>ds2020-267_334
+CAGCACGTCCGCAAGATCATGGTCCTCTGCTTTAGACTCGTCCCAGCCCATGGTCACCAT
+GAACTTCAACGCTCGTTTGTTGTAAGGGACATTGACTGTGGCTGGCAATTCAATTGAACG
+TGAAACCCACAGGGCCCGGTCTTCGCCAACTTCACGGATTAGGTCAACCTCATCCCTAAT
+CCACGCAAGGACTACGGAATACAACTTGAAAGGAGCAAATCCAGCGAACTTGGATTGCGG
+ACGTGCTG
+>ds2020-267_335
+CAGCACGTCCGCAACGAACCTCGAGTAAGACAACCAACCCTGGAGGCCATGGCTTGGCTT
+TATCCCGTAGGTAGTAAGAACAGAGAGAGCCTTCTGTGCTAGCAATACAGAGAGGTGGGG
+ATTGAATGAGGCGAGCGCTGACTGCAGCAAGACCACCAGACCCTAAAAAGAATAATAACA
+ACGTTCAGCAAGCCGAAGCCAGCCAGACAGGCACCACCAGATACAGGGCTTGGATTGCGG
+ACGTGCTG
+>ds2020-267_336
+GGACGTTCGGGCTTGGCTTCTAGGGTTTCTGTCAGGGTGCCGATCTGGTTGAACTTGATC
+AGGATCGAGTTGGCGATCTTTTTGTCGATGCCTTCTTTCAGGATCTTGGTGTTGGAGGAT
+TCCCTGAAAGCCCGAACGTCCTTAATCTAAGGAGCAGCACGTCCGCAACCCTTACCCAGT
+GACACTTGCGGACGTGTGAGGATCCGGCCATTGCGACGTGCTGACCCAAACTCTGTTGCG
+GACGGCTG
+>ds2020-267_337
+CAGCACGTCCGCAACTTCAAGGGTGTGTTTTCTTTTGTACCTGCGGGTTATTTTGCTTGA
+TTACATACATATACATGGAATAAAGCAGTTTTACTATCTACTTTGTGACCTGCTGAAGTG
+TTTTTGGTATCATTTATATTGCATTTTTGCAGATAATAGGAAATACAAAGGAGTTTAAGC
+AGAAACTGAAAGATAGCATCAGAAGGAAATCTGATTTGTTTAAGAATGGTAATTTGCGGA
+CGTGCTG
+>ds2020-267_338
+CAGCACGTCCGCAAGCTTTTTGGGGTGTCGAGAGATACCTACACGTCCGCTATTGAGTCC
+CTTGGGTCTTTTTCGTTGACTGAGGTTGAAGAAATTGTAGAAAAATACAAGAAGATGTGT
+CTTACTCCCCTCGAGTGCATGAGGAATTTATTATCTTTCATGTTGCAGATGAGGTGTGGT
+GCGAGAGGCCAAAAAAGAATGGATCCAAATAAAGATTTGTAGCGGCATCATGGTTGCGGA
+CGTGCTG
+>ds2020-267_339
+CAGCACGTCCGCAATACGAGACCGCTCCCAATAGATATTTGAGCATATATTCATGCCCTT
+TACCTGATGAACCAAGCAAGTTTGAACGCCAAATAAACAGATTGCGTGGGAAGTTGGCAG
+GGTTATCTGGGCTTTCACAGGCAAAACTTAATGAGCCATTTTGTAGGCTTTCGACCACAT
+AATCTTCCACTTTCATGCCTTTTGCTTTGGCTTCATTGGCAAAGGAGAGTGAGTTGCGGA
+CGTGCTG
+>ds2020-267_340
+GGACGTTCGGGCTTCTCGCACTGGGTCTGGAGCTGGGTCACGTGCTATCCTTAGGTTAAT
+AATGTTAACAATAAGTCAGTAATTTTTAAAAAAACACAAACTGATAGCATAAAAAAAAAG
+AATGGCGCTAAACCATTCTTTTTTGAAAATGTTTAGTTTTTATATCCACACGCATCAAGT
+CAATTGACGATGATTGACTTTGTCTAATTTTAACGCTTCCAACTATATGCTTATTGCGGA
+CGTGCTG
+>ds2020-267_341
+GACGCACTGACCGTTATAGGGCCTATTACACGGTCAGTGCGTCGGAAAAATGGGAACGGT
+CAGTGCGTCAAGGGACGCCCTACGGTCAGTGCGTCGCCTTAAGCGCTTAAGGCGACGCAC
+TGACCGTAGTTTAATGCCTGACGCACTGACCGTAACCATCTGCCTGACGCACTGACCGTG
+AACCTACCCGTGACGCACTGACCATTTCCCCCCGGACGGTCAGTGCGTCGCCTTAAGCGA
+CGTGCTG
+>ds2020-267_342
+CAGCACGTCCGCAACCCTCTATTGTTATCCATGGATCCTTTATTTATACTTATTCATTTA
+GAACTTATCCATTTAGAATAGAAGTATTGATCCAATAAAAAAAATTATGTTTCGTAATCT
+CATAATCCAATTTTTCAACTTTTCATTGATTCTTGGATACAAATCACGAGAATGTATATT
+ATTCCTCGAATTTTTTATTGAGAGGTAAAGGATTAAATCCAGGGGGATGCGATTGCGGAC
+GTGCTG
+>ds2020-267_343
+CAGCACGTCCGCAAAGGACTAACCTTCAGCACGTCCGCAAGTCAATACCTCTAGTTTGCG
+GACGTGCTGGGGAATTCCGGGTTCATGTGAACAGTTACAGTCCACAATCCCAACCAAGAA
+GGTGGTTCAATGTTTACCCAGACCTCTCGGCCAAGGATAAAACACACTGATACCTTCATT
+GTAGCGCGCGTGCAGCCCAGGACATCTAAGGGCATCACAGAGAGGACACATTTTGCGGAC
+GTGCTG
+>ds2020-267_344
+AGCAGCACTGACCGTCTCTGTTGCCATGACGCACTGACCGTCCTCATGCGACTGACGCAC
+TGACCGTCATGCACCACCTGACGCACTGACCGTTAATTATTGCCTGACGCACTGAACGTG
+GATTGTACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAAATGGTAGGTAATTGGGACG
+TGCTGGGGTCTGGAACTTGCGGACGTGCTGGGGCCCTTCAGTTGCGGACGTGCTGCTCCT
+TAGATA
+>ds2020-267_345
+CAGCACGTCCGCAACTGATCACCACTCGAGGGTTTTGGCCTGGCCCTGCCCATTCTGGTG
+GGTCGTTCGTCGAGTGGCTCGTCTGGCGCTTCACTTGGATTGTTGTTAACGCAACTGCCG
+TCGCTGAGTCTGTCAATGCCGAAGTTCGGAAAAGGCATAGTGATAAAATATCACCAGACT
+CTGTCCGCCTTGCAGCAATATTCAGGAGTTTCTTTATTCAAGGTGTTGCTCTTTGCGGAC
+GTGCTG
+>ds2020-267_346
+GGACGTTCGGGCTTTGTGTTGCATGTTTATCAAAAACAAGCACAACAATTGAGCATCTTT
+GTAGAAACGCTACAACCGCCGCTACAATTATTAATTTTTGGCGCGGGGCAAGATTGTTTA
+CCCTTGATGACCATGGCAAAGGCTCGTTACTAAGCCCGAACGTCCTTACTCAGTATCTAA
+GGAGCAGCACGTCCGCAAAAGGAATATTGTGGACGTGCTGAGGGGCAGTAAATTGCGGAC
+GTGCTG
+>ds2020-267_347
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACAAAGAACGCCTCCCTTCTATAACCA
+TTTCTTTACAGAAGGCATCTATTACCCGATCATAAAGATGTTTTTGTGATTTCAACGTAC
+AATTCACAACGATTGTAAAGTTAATATTGTCTCGATGAACAGCGTCTCGGAAACCTTTAT
+TAACTTGATGTTGTAAGTATTGAGTGAAACCCGGATGTGCTTGCGGACGTGCTGCTCCTT
+AGATA
+>ds2020-267_348
+TCTGGAAGTAAGGACGTTCGGGCTTTTCGTAGTGGCTCGTTGGGAGAGGGTGGGTTGTCG
+TAGCTGAGGGCTTTTCAGGGTGTCAGGTTCCGATTCGGAGCTGGTGGTGGAGGTTGGTGG
+GTTGGTAGTAACGGAAACTGCATCTGATATCGATGGTTGCTTGGTAGGTGTTGGTCTTGG
+TCTAAGAGACATGTTGGACTGTGGCAGCGGAGGTGGCGGAGGCCGTGACTGTTGCGGACG
+TGCTG
+>ds2020-267_349
+CAGCACGTCCGCAATACTAACGCTGTCCCCCCTCAGCTCACCCTAGCCCCGGGCCTTTTG
+CTCTTCTAACGTAAGCTCCAAGGCTTCACACCAAGTCTTCACTGACATAATATGCATGCT
+TAAGTAGGGTCAGGCAGAACCGTTGTTGCCTGATGGGAACTTCCCCCATATTGCTATCAA
+TGTCTTCATGTCGCACGACCTCTTAACATTACACCACTGAAACCAAATCCTTTGCGGACG
+TGCTG
+>ds2020-267_350
+AGCAGCACGGCCGCAAGATCCATCTGATGATCGATGTTGGGTATTTTACAATTTGCTTTA
+TTACATTATCATTATATAGGCTCGCCCCAGTTCGCTATTCTTGTGATTCCGAATGCTAGC
+TGGTGGGCTTTCAAAGGTATGGGACGATCAGGATGGCTTGGTCCAGCTCCCTTTAATCTT
+TAGATCAATCATATGCCCTCCCCAACCTTTTCTATCTAGTAGGGCGATATGATGCGGACG
+TGCTG
+>ds2020-267_351
+GACGCACTGACCGTATAATGACCCATGGACGCACTGACCGTCTTCTTATGCCTGACGCAC
+TGACCGTGTGGTCACTCTTGACGCACTGACCGTTGAACTACTGTGACGCACTGACTATGT
+CGACCACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCGCAAACTTCGGCCCTTAGCACG
+TCCACAAGATCCCAACCGTGGACAATTGCGGACGTGCTGAGGGATACTGCCTTGCGGACG
+TGCTG
+>ds2020-267_352
+AAAAAGGCGACAGAGGCTATTGCCCAGGTAAGCTCCCGGGTGGGACAAATTGTGAAGCCT
+ACCGAGTGCATCTATTCGACTTGCTTCTTGACGTACGGAAAGGAGATGATCCTGAGAGGC
+GCCTACTTGCGGACGTGCTCTCCGTAGATAGATCGAGGCGACGCCCTGACCGCTCGCAGT
+CCTCGACGCACCGACCGCCCCTTCGCCCCTGACGCACTGATCGTGACATGTACGGTCAGT
+GCGTC
+>ds2020-267_353
+GACGCACTGACCGTTCTGCGCTGGCTTTTTCTGAATGAGAACACGCTGACGCCGGTTGAA
+CATACTTCCTGGAAATTAAGTGCGCTGCGTATTTTTCTGCTGTCCGGTTTTCTTCTGGAA
+GGCGGAATTGCGATTCACAGTTCATTGCATGCCTATGCACAAGGCACTTACCCTGTACTG
+TGGGCTTATTCTAGGCGGTGTATAAAGCCCGAACGCCAGGGTGTTCCGCAAGCCCGAACG
+TCCTT
+>ds2020-267_354
+GGACGTTCGGGCTTTGGATTTTTGGTTTTTTCCTCTTTCTCTATCCCTATCCCGTAGGTA
+CAGCGTTTGAATCAATAGAGAACCTTTTTTTCTGTATCTGTATAAATGTATCTAATCGAT
+ATTATTACATTCCAATTCCTTCCCGATACCTCCCAAGGAAAATTCCGAATTGTATCTCAA
+ATTGCGGACGTGTGAGCGAAAGCCTTTTGCGGACGTGCTGGGCCCATGTATTTGCGGACG
+TGCTG
+>ds2020-267_355
+CAGCACGTCCGCAAACCCCCCTCTTAATAATCCCCGTAACCCCCGAGAGGAGCACGGGCC
+ACTTTGGCGTTAGGCCACGCCTTGCGATAATCCTCTCGCCCCAAGAGGACTAAATCGCGC
+CACTGCTCAAATGTCAGCCGCTTGGGAATTGGCACCTCAACACCCACATTGCTATAGTCC
+CGCGATACCATGCGTTTGAAGTTCGGGGGCCAATCGAGGGGCGGGGTCATTTGCGGACGT
+GCTG
+>ds2020-267_356
+TATCTAAGGAGCAGCACGTCCGCAAGGGGTGCGTCGCTGGCGCGCGGATTAACAACGACC
+ATCAACAAACAATCGATTCAGAACTGGCACGGACCAGGGAAATCCGACTGTCTAATTAAA
+ACAAAGCATTGTGATGGCCCCAACGGGTGTTGACACAATGTGATTTCTGCCCAGTGCTCT
+GAATGTCAATGTGAAGAAATTCAAGAAAGCGCGGGTAAACGGCGGATCCATTGCGGACGT
+GCTG
+>ds2020-267_357
+ACAGCACGTCCGCAAAGGTCGCCAGAAAAGTCAGCATAATCAGCCTCCGAAATCATCAAG
+CATGATGTTCTCATCTTCCACGCCAAGATATTTTAGCATCTTAATCACGGCGGCGTTCAT
+CATTGGTGGACCACACATATAGAACTCGCAGTCTTCCGGTGCCGGGTGCTGTTTGAGGTA
+ATTTTCATACAGCACGTTGTGGATGAAGCCCGTATAGCAGGGGAGTTTCCTTGCGGACGT
+GCTG
+>ds2020-267_358
+CAGCACGTCCGCAAAGCTCACTTCGTTGCTCTGTCTCTGTCTCGATCCCGCTCCCGTTCC
+TTGTATCTTTCTCGATCCCGATCACTATCCCTTTCTCTTTCTCTTTCTCTTTCTCGATTC
+CGATCCCGGTCCCTTCCTCTGTCCCTGTCCCTGTCCCTGTCCGAATATTCTCTGTCAGAA
+TACTCACGGCTCTGGCTGCGATGGGTCCGTAGATCATCACTGCTGGCTGCTTGCGGACGT
+GCTG
+>ds2020-267_359
+AGATACGCTTAAGGCGACGCACTGACCGTGGAGTCTCCCCTGGGGAACATACGAAAGCTT
+TGGAATATTATTTTCGGGCCCTAGAGCGAAACCCATTCTTACCACAAGCTTTTAATAATA
+TGGCCGTGATCTGTCATTACGTGCGACTATCTCCACTATAGAAATAAAAAAAGGAAATAA
+AGAAAAAATCCGTTAACGTTAGTAAATACTAGAAACAAAGTGTAGGCTTAACGGTCAGTG
+CGTC
+>ds2020-267_360
+CGCACGTCCGCAACTTTGGAGGAAGAATTAGAAAGTGGCTGTTGAAAGTTGGTCTCTTTC
+AATGGTCCTGCCTCAATAACAGGCTTGTCAATAATTTGGATCTCACTACTCTGAACTGTG
+TGCTTCTCAGTCTCAAGATCAACTGCCGCTGGTTGAGGAGCTGATCTGATGGTAGATGCA
+TGGGGAGGCACTAGGTCAGATTGAACTCTAGGCGGCACAGAAAGATGCTGTTGCGGACGT
+GCTG
+>ds2020-267_361
+CAGCACGTCCGCAATTCGACCCGCTTTTGGATAACAAGAAGGCGAGCTGATCTGCTTTGA
+TCAAGGAAAAAGCCCAGTCAGCCACCAACTCGGTGCAGGTCACGTGACCTGCAGCTCGGC
+CTTCGCTTTTTGAGGCTTCCTCTACCCACATCTCTATGTGCCCGCAGCACTTCCATATGG
+AGAAAGATAGGCTTACCATGTTCCATCAATAGCACCTAACTAATGGAACTTGCGGACGTG
+CTG
+>ds2020-267_362
+CAGCACGTCCGCAACCACCCCCCACTTTCGTTCTTGATTAATGAAAACATCCTTGGCAAA
+TGCTTTCGCAGTTGTTCGTCTTTCATAAATCCAAGAATTTCACCTCTGACTATGAAATAC
+GAATGCCCCCGACTGTCCCTGTTAATCATTACTCCGATCCCGAAGGCCAACAGAATAGGA
+CCGAAATCCTATGATGTTATCCCATGCTAATGTATCCAGAGCGTAGGCCTTGCGGACGTG
+CTG
+>ds2020-267_363
+CAGCACGTCCGCAAAATGTCCCCACTGATACCTAATCGATAACGAACCTGAATGGCTTTT
+TTAGGTCCAATTCCATCAATTTTTGTTGAGGCAATTCTTACTTGTTCATCGGCAACTGAT
+CTAGCTCCTGAAATATATGACATTCTTGATCCTTTCCTTTACTAGTCTTCTCGGCTGGAA
+TCAAAAATGGGCTGTCTCCTCTCTGATGATCTTTTCTATAGGTAGAACATTGCGGACGTG
+CTG
+>ds2020-267_364
+CAGCACGTCCGCAACGGTCAAGGGGCAGCACGTCCGCAAGGTATCCGGGCCATCATTTTT
+CCTTATTTCACTTACAAAATAGGCGTATCACCAACGCAATACGCCTTTGTATAGGTTGAT
+TGATAGGTTAGTTCACTGCATCTTTTAACGCTTTACCTGCCTTGAAAATTGGGGCTTTTT
+TGGCAGGTATTTGGATGGCTTCGCCTGTAGCAGGGTTACGCCTTTTTCTTTGCGGACGTG
+CTG
+>ds2020-267_365
+CAGCACGTCCGCAACTTTCACCTCGTCTTCTTCCATACGTTTCATCACTCTAGCACAAGC
+CTTGAGAGCAAAATTGTATGTGAAATGATCAGACCTAACATTCGTTTCCTGCATATAGTT
+GTAAATATGTATAGCTTTGATGGGGAAGACGCTGTTGGTGTAAGCCCTGATCATGTTGTT
+GCAGATGAGAGGGTCGTCCATGGTGGTCTCTTCGAACAGGGCTTAAGATTTGCGGACGTG
+CTG
+>ds2020-267_366
+CAGCACGTCCGCAAGTGGTAATTCCTCCCTGCTTAAGAGCCACAGCATGTACAACAAAGT
+TTGAACTTCTCAGCAAGATCTAGAAAGCCTGTCCCAACCCGGCTGCAGCCTCCTCTTGGC
+AGCCTCACCTTCAGGCCTTTGCTCCTACAGTTCTCTCTGCTTTGCATGCCTCTCCCATCC
+GCTTGTCCAACTTTTGCTCAACCTTGAACTTTTGCCCATCATAACTCAATTGCGGACGTG
+CTG
+>ds2020-267_367
+TCCGCAATTGCCGTCCCCCAGCACGTCCGCAATAGCAGTCCACTCAGCACGTCCGCAATA
+CGATCTCCCTCAGCACGTCCGCAAAGGGTAGTCAAATTGGGACGTGCTGACCGATGTGAC
+GTTGCGGACGTGTCTGGAAGTAAGGACGTTCGGGCTTAAATTTGCTTATGATGATATGGG
+CTAGTAGCGCAGCGGTGGCAACGCTTTTATCGATGATAGTGATCACCAGAAGCCCGAACG
+TCC
+>ds2020-267_368
+CAGCACGTCCGCAAATATTCCTGGGCAGCATGTCCGCAATTCGTATCACCTCACACGTCC
+GCAACTATACCCTGTTAATTGCGGACGCGCTTAAGGCGACGCACTGACCGTGTCACAACC
+CCTATGGCGTTTACCCTTTGGTTCGCCCCATCATTTGAAGAAGTCAAACAACGTAGAGCG
+GAACTTGCTTTGATAGAACGTGAGACAGGGGCGTGGAAGTGCGGACGTGCTGCCCCTTAG
+ATA
+>ds2020-267_369
+CAGCACGTCCGCAACATTTTATCCATTGGACGTGCTGAGAAGAGGCTTTTGCGGACGTGC
+TGAGTGGGCGGACTTTGCGGACGTGCTGCTCCTTAGATACTGTAAGTAAGGACGTTCGGG
+CTTCCGCATACACCTCTTGGTCACGCTCAAAGGTCAAGGTCATACCATCTTCAGGGACTG
+CCAGTCCTTGCACTTGTACTTCATCGCTCGGATGTAGCATCAGTAATAAGCCCGAACGTC
+CTT
+>ds2020-267_370
+TCAGCACGTCCGCAATCTTCGGTCCGTGCAGCATTTCCACGATATCGTTATGATCAATTA
+ATGGGACTTGGCCGGAAAGTGTTCTTGCCTCTATCATTAGCTCGGGTAGTCCCCGTTTCT
+GGTGTTTCAGTCACCTTTCAATGGCTCCCTTAATTATGCGCGAGGAATTTTCCTCTGGAA
+GCGGGCTAGTCCCCGAAAATGCTCGTTAAAGTTGGGGGGGCAGTTTGTTTGCGGCCGTGC
+TG
+>ds2020-267_371
+CAGCCCGGTCTGACTCAATCGTCTTCCGACTTGGGAAGAAGTGCCCCCGAAGCACTCCAT
+TCATCTGGTGATGAAGAATCTCCTATCGCTTCATCTTCCGCTGCCCTTTCATTCTCTTCA
+GTTGTCTTCCTTCTTCCGTGTGGAGGAATGCCGATAGAACTGTGGATACCTCAGCTTTGG
+GAGAGACCTCCGTTTTGGTCTTCCTAGAAAGTGAGGAGGCGCCAGATTTTGCGGACGTGC
+TG
+>ds2020-267_372
+CAGCACGTCCGCAACCGCATGCGATCTACGGGTGAAAGGGGGCGCAAGCTCTTGCTATTA
+GATGAGCCTAAATCAGATTAGCTAGTTGGTGGGGTAAAGGCCCACCAAGGCGACGATCTG
+TAACTGGTCTGAGAGGATGATCAGTCACACCGGAACTGAGACACGGTCCGGACTCCTACG
+GGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAGTTTGCGGACGTGCTGCTCCTAGA
+TA
+>ds2020-267_373
+CAGCACGTCCGCAAGCTATACATGCTGCATATCTTTTCAAAGAGGCTGGAAACCAACAAG
+TGAATGGAATTGTACCACCGAAACCAAGTTCTGCTGGCGATTTTCCAATTGGACAGGAGC
+AACTAGTTTCAGTGACGAGGGATCATAATTTTCCCGCTCTGCAACAATATGGGGGGGTCA
+AAGGGCTGGGAGATTTATTAAAAACAAATCTAGACAAGGGATTACATGTTGCGGACGTGC
+TG
+>ds2020-267_374
+CAGCACGTCCGCAATGACTCTCTGTTCAATTGCGACCTTATAATGCAATTGCATTCTCCG
+GTCCAATTGCTGTTTTTGTTTCTGTATTCCTAATTTATCCGCTAGGTCAGTCTGGTTGGT
+TTTTTTGCGCCCAGTTTTGGTGTAGCAGCTATTTCGATTCATCCTCTTTTTCCAAGGGTT
+TCATAATTGGACATTGAACCCATTTCATATGATGGGAGGTGCTGTGTGTTGCGGACGTGC
+TG
+>ds2020-267_375
+TCAGGGTATGGAGCCACCGTCGCATCGGTATAGCATATCGAGTGGAAAAGGCTGATAGGG
+GTCACCACTCCCCGTCCTATTTCCAATGCGAAGAATCCCAGTTGAGTTAAGAAAACAGAT
+AGGTCGAACCTATCCCAAGCATTTATAGCCCTCGTGAATTCTATCTAAGGGGTATCCAAA
+CCACCAACCCCAACTAGATCCAACCAATGCCATTTGTAAAGCCCGAACGTCCTTACTTCC
+AG
+>ds2020-267_376
+GGACGTTCGGGCTTCATTGACTCTTGGACGTTCGGCTTATCGTCCCTACTAGAAAGCCCG
+AAGTCCAGGCCCCTAATTAAGCCCGAACGTCCTTATAAGGAGCAGCACGTCCGCAACTGC
+TGCGCCCTAGCACGTCCGCAAGACGCAACGCCTCAGCACGTCAGTGCGTCAGGATGTAAG
+TGACGGTCAGTGCGTCAGGGCAGAACAGACGGTCAGTGCGTCGCCTTAAGCGAGATCGGA
+AG
+>ds2020-267_377
+CTGGAAGTAAGGACGTTCGGGCTTACCGGATTGCCCCCATCAGCGAAGCCAAACGCTATG
+AGCAAGCATGGCTAGGCAAAATCAATGTCGTCATTAAGTTGCCAGCTATCACGTGGGGGC
+ACAGTGGTATAGTTGCTGTCTTTATCTAAGGAGCAGCACGTCCGCAACAACTGGGATTTT
+GCGGACGGCTGGAGGGCCTGCATTGCGGACGTGCTGAGTGTCAATGTGTTGCGGACGTGC
+TG
+>ds2020-267_378
+CAGCACGTCCGCAAATACAACGGATTACTGAGGTTCTTTCCAGTTCCACGCGTACTTATC
+TGAAACTATACCTATCTTCGGTGCTTTGGAGAGGGAGTACCCAAACAAAGATGAGTTAGT
+TGAGGAGATGACGGGGGGTTCTGGAGGGGTTGACTGATGAAGAAACTTTAAACTTACACC
+TACCCCGCAGATGAAAGGTTTCTTACCTCAGCGCTCAAAGGAAAATGCTTGCGGACGTGC
+TG
+>ds2020-267_379
+CAGCACGTCCGCAATCATATAGGGGTCTTTGCGGACGTGTGAGTCGGGTCAAGTTGGGAC
+GTGCTGAGGGGGTACTAGTTGCGGACGTGCTGCTCCTTAGATACGTTCGGGCTTGTGGAA
+AATCGTAGGCTAAATGATTGTTGTCGCTATTTAATAGCGGATAAAAACGCTGTCCTTCAT
+GCCCTTTTACCACCGCGGCATTGTCTTTATAGGCGGACCGTGTTCAGTAAGCCCGAACGT
+CC
+>ds2020-267_380
+GACGCACTGACCGTGGCATTTCCGATGTTGATTAAACAATCATTCCCAGATGTGAATCCG
+CTTAAAGTGGCGTTTTTAGGACCTTTGGTTGGTGCGTTATTCCGTCCGTTCGGTGGCTGG
+CTTGCTGACAAATTGGGCGGTGCAAAAGTCACCTTAATCAACTATGGCGTGATGGCTATT
+GGGACGTGCTGAGGTGGTGGATATTGCGGACGTGCTAAGTGGCTGGGCTTGCGGACGTGC
+TG
+>ds2020-267_381
+GGACGTTCGGGCTTTGATGACCTCCTCTCGTGTTACTGCCAGCTTGTCAATGTAAGCTTA
+TCAAGGTTAAAATGTTGTTTTTTAAGTTAAGCCCGCTACCTATTTGAGCCGTTTGTCAGT
+TCGTAGCCAGTTAGCGTATTACCCCACGAGATAAGCCCGAACGTCCTTATCTAAGGAGCA
+GCACGTCCGCAAAGTATATTCGCTCAGCACGTCCGCAATAGGTACAGCCTTGCGACGTGC
+TG
+>ds2020-267_382
+CAGCACGTCCGCAAGGTCTCATTCATCCGCCCTCATGATTGGGTGAGCCACGAGGGGGAG
+AGAGACAATGTGGAGGGGTCGGATGACGTGGACATGGTTGCGGCGGGGCGCTCTAACTCT
+GACTCCGAGGCAGCCGAGGAGGAATCCTCGGAGGATAGTGATGATGAGGCCACGAAAGTG
+GAGGAAAGGGGAGTGGGGGGGGCCAATCCCCCCTCCACGGTGATTTCATTGCGGACGTGC
+TG
+>ds2020-267_383
+GGAAGTAAGGACGTTCGGGCTTGTTGTCCCCTCGGACGTTCGGGCTTGATCTACGGGGGG
+ACGTTCGGGCTTGTTACGTAACCTGGACGTTCGGCTTAGAGACCACCGTAAAAGCCCGAA
+CGTCCTTACTTCCAGACTCTAAGGAGCAGCACGTCCGCAACTTCTAGGCCTTAGGGGTTG
+GGACGTGCTGAGTGTATGGTCCTTGCGGACGTGCTGAGGGTCGGCCAATTGCGGACGTGC
+TG
+>ds2020-267_384
+ATCTAAGGAGCAGCACGTCCGCAATGGCCACTCACTCGCTTGAAGATGCCGAATAACCGC
+CGGTTCTTTAGTACTTGGTTGGAATACCCAAGAGATCCCACTGGATAAGGCCTATTCCCT
+GCTCGTAAATTAACGGTTTAAGTTCATTTTTTCTTACTGTCGCAAGCCATTCTTCCACTC
+TATGATTATGATATGATTCACTTTCAAACGGAACAGGGCCTCTCATTTGCGGACGTGCTG
+A
+>ds2020-267_385
+CAGCACGTCCGCAAATCCAGGGTGGTGACTTGGCGATGGGCGGCGGCGTCTGGGAGCCTA
+AGCTTGACCTCAACCTCCATTAGAGGTTTGAGAATGTGAGACATAATACGGCGAGTTATA
+TTTTGGTGTTTGGGGTGCATAACTTTCAATTAGAAGGGACGGGCCTTTGCGGACGTGCTG
+AGCCTTAAATAATTGCGACGTGCTGAGTGCAATGAATTTGCGGACGTGCTGCTCCTTAGA
+T
+>ds2020-267_386
+CAGCACGTCCGCAAGCAGTCGCACCTTCTCCTTTGAGCACTCCACCCGCCGCCGCTCCTT
+CTCCTTTGAGCACTCCACCCGCTGCTTCACCTTCTCCTTTGAGTACCTCACCTTCTCCTT
+CGGGCACTCCACCCTCGGCTGCTCCTTCTACATCTCCGGTCGCAGACTCTCCACCTTCTC
+CCCCATCGTCTTCTCCTGAATCTCCAGCCAATTCCCCTTGCGGACGTGCTGCTCCTTAGA
+T
+>ds2020-267_387
+GCGCACTTCCGATCTATCTAAGTAGCAGCACGTCCGCAATTGAAGGGATCTCACACGTCC
+GCAAAGGTCGTTCAGTCAGACGTCCGCAATATGCCTGTCATTGGGACGTGCTGACGGGTC
+CGCCGTTGCGGACGCGCTTAAGGCGACGCACTGACCGTGTCTTTTTGGCTGACGCACTGA
+CCGTTGGTAAGTCCCTACGCACTGACCGTTGTCGACAGCCTGGTGGGACGGTCAGTGCGT
+C
+>ds2020-267_388
+CAGCACGTCCGCAATCATCCGCCCATGCACATTTAGCACTTTGGATCCTGGTGTTGAACT
+TCCGCCCCAGACGTAATGACTCCCTAGCCACTTTCAAGCTGTGTGTGCCGATAAGGACAT
+CGTCTCCGTTGTGCAGGCTGTCCCCTACTTCTCGTGCCCCTTTAGTGATCTTGTCCGTAT
+AGATGCTGTTCAATACTGAGTTGATGAAAGTGGTCACCCCCATCACCTTGCGGACGTGCT
+G
+>ds2020-267_389
+CAGCACGTCCGCACCTGGCATGAGATGGTTGGTACCTAAGAGGATGCAGGGGATTGGAGC
+AAGTGGTGCGGTTGACATGATACCAGATAAGCCAATGCTTGGAAGCGCGTGTACACTAAC
+AGAACTGCAAGAAATTGTTGACAAACTGCAAATCATCCACCCCCCACAAATCAACCACAA
+TGGAGCGGAAATGCTGGCCAATGTATTGGCTAATGATAGCGACCTACTTGCGGACGTGCT
+G
+>ds2020-267_390
+GACGCACTGACCGTAAATCAGCCCATGAACTACGGCAGTGCGTCAAGGTCAGTATTACGG
+TCAGTGCGTCACGGGGGCGCAACGGTCAGTGCGTCAGAGCGTTATACAGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAATGTTTACCACTCAGCACGTCCGCA
+ATATTTCCTCACTCAGCACGTCGCAACCCCCAAGCCTTGCGGACGTGCTGCTCCTTAGAT
+A
+>ds2020-267_391
+CAGCACGTCCGCAAATTTCTGGGGCAGCACGTCCGCAAGAAGGTTTAAACGTCCGCAAGA
+CTGTATGGTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTTCGGGCTTGTC
+CATACAGGTAGCGGAGTTGAAGAAAGGGGTCGGTTTAGGACCGGAATCAGCTTCACTTCC
+CTGGCCCGTTTCCGTACCCGTTCTCGGCGGCCGGGAGCGGGTCCAGTAAGCCCGAACGTC
+C
+>ds2020-267_392
+CAGCACGTCCGCAAGTTGTCCGGCTTAAATCTTTAGCCCCTAACTTAAGTGCCGCTACAG
+CTCCATTTTCTATTACTTTTTTTGTTCTATCACATAACCACATTCCTTCGAAGACTGATA
+GTTGTGAAATTTCATATATGTTGTCTTCATCTAAGTAATATAGAAATTTGAAACTTGGTG
+TTGCGTCCGTTAAACGTAGATCAGTGAAGTACGCACCCATTCGTAGTTGCGGACGTGCTG
+>ds2020-267_393
+CAGCACGTCCGCAAGATTTTCAGGTTAGGGTAATTGTAATCCACAATTTTGAAATATCGA
+GCAGTGGCCTCAAGTTCATTTTCTTCTGAAGCAAAGTTCTCAGCACGGCGGTATTCCAGA
+GCCATCTTGCGTAAGTCCTCCAGGTCTTCATCAACCATTATCTTCAGGTTTCGGATCCCT
+TGTTTAAAATCTGAACCACAAAGGACCCACTCTTTGAATCCCATGCGTTCAGCTATGGGA
+>ds2020-267_394
+GACGCACTGACCGTCCGCCCAAATGTACGTATTTGGCAATCACTTGCTGATGGATGGGGA
+AATTACCGAGCGTTGCCCCTGCTTTACGGTCAGCAAAATAATGTTGCAGGGAGCGTGATG
+GGCACGGTCAGTGCGGATCTAAGGAGCAGCACGTCCGCAATGCTACTTGTATATGCTTGG
+GACGTGCGAGTGTTACTCCCTTGCGGACGTGCTGACGAAACTAATGTTGCGGACGTGCTG
+>ds2020-267_395
+GACGCACTGACCGTTGGACCCCACCTAGTCCAACCGAACCGGATAAATCGGTGACACGGG
+ATGCTGAGCTATTAATGGTAGGCAAACACATCAACGCCAACGACTTGACGGTGATTGTTG
+CAGGTGATTTTAACGATGAGGCGACGGTCAGTGCGTCGCCTATCTAAGGAGCAGCACGTC
+CGCAAAGGTACCCCTCTTGGATTGCGACGTGCTGACGAACAGTATCTTGCGGACGTGCTG
+>ds2020-267_396
+CAAGCGCCTCCGCAGGCACTCTTGCAATAGGAGAATATGCTTTTCATTCACCACTCTAGT
+CGACGGAGACAACTACTATCGGATTCAGTTGAGCCAGCCTTATGAGGGCCTTAGTGCGCT
+AGGTGGTAGTTCAGCTGTAAGTGTCAACCAGTCGGAAGGAGAACTCATAGCAGGGGGGGA
+ACCAATTTCAAGGGGAGAGAAAGTGAGATAATGAAGGGACGGGGAGAAGCCCGAACGTCC
+>ds2020-267_397
+CAGCACGTCCGCAAATCATTCTCCGTTTGGGACGTGCTGAGGACGTAATATTTGCGGACG
+TGCTGAGGGATAACCGTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGTTC
+GGGCTTCACTCATGCATTGTACCAATATCAACCTTAGCCATGACCCTCTCCTCAAACTCA
+TTGAGCCTTCTCTCAAACATGCCCTCAAGTCTCTCAGGGGGTTAGTAAGCCCGAACGTCC
+>ds2020-267_398
+CAGCACGTCCGCAACGGGTAACTCGTATATTCTTCTCATCAAAGCCACCAAAGACTTTCC
+TGTTGCTTTATTCTCACACGTTTCCTCAATAATTTTTTCTCTCATGATTCTCACCGCCTC
+TATAGCCCACAATCTTTGCTGTGCATCGTAAGATGAGTGGTCCAATGACACCCTCCAAGC
+TTTAACTTTGTTATGTCTCTCTCTCTCCTCTGCTATCGCGGGCCCTTTGCGGACGTGCTG
+>ds2020-267_399
+CAGCACGTCCGCAACTTTCTTCGCCTCTTTTTTCGACAACCAGTATAGAAAGTATCTCGC
+CCCTCTGTAATTCTTATCCGTCCCCAGATGCTGAATGAGCTAATCCTGATCTTTCTCTCA
+TAGGGTGAGAACAAGCTCGACCACTCTTAAGCTAGCCCGAAGCTTGATCCCGCGGCCCCG
+ATGCTACACATCAGTTCTGAACTCTACACATAAGTTCCTTGGCATTGCGGACGTGCTGC
+>ds2020-267_400
+ATCGAAGGAGCAGCACGTCCGCAATCAGGGACCTCGTTTCTGAACAACTGACCCACGGTG
+AATATCCTGTGTCCTACTCTGAGTGCTGGCAACATCAATGCCTGGCTCATCGTTATGTCG
+GTAGGCACCACCAATCCATGTTTCTCCACGTTATCGCTCATCGTCGCTTTGTGGTTCACA
+GCCCCCATGAGGTCACCTACCGGCACGTTTCTCAGCATACCAGCCTTGCGGACGTGCTG
+>ds2020-267_401
+CAGCACGTCCGCAAGTCTTCCCTAGTACAAGCAACTAAATTCAGTTAGCCCTTTTCCTTG
+GGAATGAACTGGATTTAGTTGCTTGTACTGGGGATTGGCTTAGCAGGAAGATTGGATATG
+ATTCTACTCGAGCGAACCCTGCAATGATTATAAGAGCCCAAGTGAGTCTTCCTTATTTTA
+CTGGAAGTGCTTTAATTTAAGGTGAACTATAAGACGAAGAGTTAATTGCGGACGTGCTG
+>ds2020-267_402
+TATCTAAGGAGCAGCACGTCCGCAATGGCAAAACAATCCCGAAAGAGAGCAAGATTTACC
+AACAGGTAATGTAACGTGGCAAGCATTGAGCAAAGTTGCTGGACTAAGAGAAGTAGATAA
+ACGGCGTTTTATGGGATTATTGGGAAAAGTTGTATTTGGTGAGAATGGGAAGATCACACC
+GTATTTCACATCAAACGACAAAGTTATTGAGGAAGTGGACCCATCTTGCGGACGTGCTG
+>ds2020-267_403
+CAGCACGTCCGCAATGACCCTTACCCTAAACAATCTTATCCGGTAAAGCGAATGATTAGA
+GGCTTATTGGGGACGAAACGTTCTCAACCTATTCTCAAACTTTAAATGGGTAAGACCTAG
+ACTTTCTTGATTGAAGTCTTACAGGTTTAGATGTATGTTGTACTTAGTGGGCCACTTTTG
+GTAAGCAGAACTGGCGCTGTGGAATGAACAGAGCTTGCTGACGTGCTGCTCCTTAGATA
+>ds2020-267_404
+GCACGTACGGTAACGAGGGGGGTTCGCGTCTATACGTGTAGTGTGGTGGTTGGGCCTACC
+CACCCTATTTGTTCCATGATCTATGGGTCTACTGGAGCTACCCACTTCGATCAATTAGCC
+AAAATTTTGACTGGATATGAAATCACTGGTGCTCGATCTAGTGGTATTTTTATGGGGATT
+CTATCTATCGCTGTAGGATTCCTATTCAAGATCACTGCAGATCTTTTGCGGACGTGCTG
+>ds2020-267_405
+GACGCACTGACCGTTATTTCCGACCTGCACGAATGGAGTAACGATTTCCCTACTGTCTCC
+ACCATGAACTCGGTGAAATTGCATTACGAGTAAAGATGCTCGTTACGCGCAGCAGGACGG
+AAAGACCCCGTGACCTTTACTACAGCTTGGTATTGGTGTTCGGTGTGGCTTGTGTAGGAT
+AGGTGGGAGACTGTGAAGCTCAGACGCTAGTTCGGGTGGAGTCATTGTTGAAATACCAC
+>ds2020-267_406
+GGACGTTCGGGCTTCAGTTTTTTGGTGGTGGTGATGTTTGGATCGTTGATCTTGGTGTTG
+GGTTTTTGTTTTGATCGATCTTGATTCTTGCTAGAAAGTGATCAATTTAAGGCAGAGATA
+GATCACAAAGCTTCAGAAAAAGAAAAATGCTTGGAAATGGGGTGGTGGGGATTTTTTCAG
+AGTCAGTGAACAAGTGGGAGAGAAGAGCACCTTTGACTCCATCTCACTGTGCTAGGCTG
+>ds2020-267_407
+GGACGTTCGGGCTTCAGGATATGCTTAGAGAAATGTTTATTTGCTGAGATACTGGATGCT
+TACCGAAAGAGGGGAATTGCACGTAAGAAAAGAGAGAATCTTCATAGACTGGCTTCCACC
+AATCGAAGTTTCGCGCATTTCAGATGGTGGTAAAGTGAGACACATAAAGAGCTCTTCCTC
+ATTCAGTCTGATTATTCAGTAAGAGATGGTTTGACCCTTTTTCTTTTTGCGGCGTGCTG
+>ds2020-267_408
+CAGCACGTCCGCAACCCGTTTCGCTCCAAACCCTAAAAAATAGGGTAAGGCAAGGTAAAG
+AAAGTCAAGAGCAAAGGCAAGGTCAACGGGCGTGACACAGCGGAAACACACCAGCAAAGG
+CATAAGCAACAATATTGGCACCATAACAGGCAGGAGCAATACAAGGCACTGGCACCAACA
+AGAGTAATACAAGGCACTGGCACCAGCAAGTCAAGGTAGGGAAATTGCGGACGTGCTG
+>ds2020-267_409
+CAGCACGTCCGCAAGAGTTCCGCCCTCATCATCATCATCGAAGTCCTCAAACTCCATGTC
+AAACTGCTCTGCCAAAACCCTCCACAAGTGCTTCCACTTATACAAATCCCCATTGCTGCA
+ATTGAAAGCCTCATTCTTGGCATAAGGATCAACTGCTGCCCATATCTCATGCTCAGCAAT
+CAGATCAGCATCTGAGGCATCCCAGTACCCGTACCAAAATCCCGTTGCGGACGTGCTG
+>ds2020-267_410
+CAGCACGTCCGCAAGCACAAGATCCTCGGCGCGGAATATAATCCCAAAGTACTCCAAAGA
+CTCAATTATAGTAAATCAAGAAGGTGGTAAGACCCTTGCAGAGTTCCCCAACAGCATAGA
+GCTGGGGAAGCTCGGACCCGGTCAAGATCCGAACAACAAGGAGCACTCAACTACTAGTCT
+AGTCTAGTAGTTGTTTTTTTCTATTAGTTGCGACGCGAACCCAATTGCGGACGTGCTG
+>ds2020-267_411
+CAGCACGTCCGCAAAGTGAGGCCCCTTCTGACCCCTTCTTTATTGAGCCCCAGTCACTGG
+TGGATGGTTGAAGTCAGTCCTCCCCCTACACGGGGGCGAGAGTTTGGCACCTCTCGGACT
+GTTCTAGATCTCGGCATCAGAAATCATGTCGGACGTACCATCTTCGTTCCGATCTCAGCG
+AGCAATGTTTTCGCTTGTCTGATTGAAGGAATATGACTGCTTACTTGCGGACGTGCTG
+>ds2020-267_412
+CAGCACGTCCGCAAGCGTCTTTCCCCCCCTTTTTGTCTGTATGAATTTCTGACCGCGCGG
+AATCTCCATAGCCAATTTTCCATTTTTGATTATGAAATCATAGGGTGCCTTTGGTAAAAC
+TCTTATTTCACACGATCCAGGAACTTCCATAACGTTGGCGTGATTCAGTTTGAGCAACGG
+ATCCTGACGTGATACATCTTCGTAATGAAAATAGAGTGGAATGCTTGTGGACGTGCTG
+>ds2020-267_413
+CAGCACGTCCGCAATTTCTTCCTGATTGTAAAATTGAATTAGTGAGGTCCTTTGCGTGAA
+CCACATTAATTGCATATTTGCATCCTATGATAGCCAAGGAGGTTAGAACCTCCTTGCTCA
+TAATGTGATCTACATCCCAGTATTCTTCGCAAAAGAAGAATCGGTTATGGCTAAGTCCTG
+ATTTGCTAGCTTTCACTAGCATTGCCATGCTGACCTGGGCCAGATTGCGGACGTGCTG
+>ds2020-267_414
+GGACGTTCGGGCTTAAGGCTGGTGTTAATAGCGGAACTGACGGGGCGACAATATCAGCAT
+CAGTTAAGGGACAGGCAAGTAACCAATACTACTTGAATAATGGAACTCATATCCTACCAA
+ACTATTCGTCAGCAGACTTACTAATAGATGAATGGTTATCAATTTACGATAACACAGAAT
+TAGTTATAAAAGCGATGAGGACTACTTACGGAACATGAAGATGAAAGCCCGAACGTCC
+>ds2020-267_415
+CAGCACGTCCGCAAAAGTCTTCTCATGCGGGCGAAGGAGATGCATTTCTGGTACTGGTAG
+TACTGGACAAGCTCTCAGGGAATAATCTCTTTCTTATTTCTGCCTTTCTTTCCCATGACG
+ACTAGGAACGGGCAAATCAAAAATTTCACTTTGAATTCCGGACCTCAACATCCTGCTGCT
+CATGGTGTTTCACGATCAGTATTGGAAATGAACGGAGAAGCTCTTGCGGACGTGCTG
+>ds2020-267_416
+CAGCACGTCCGCAACGTTTTAGGGGTGTAATTTGCGGACGTGCTGACGGCTTGGTCTTGC
+GGACGTGCTGACACCATTACCTTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGAC
+GCACTGACCGTTGCATGAGATATAACACGGTCAGTGCGTCACGGAACGGAGTACGGTCTG
+TGCGTCAGGGATACGACCACGGTCAGTGCGTCAGCAGTATGAAACGGTCAGTGCGTC
+>ds2020-267_417
+TATCTAAGGAGCAGCACGTCCGCAACATTCATGCCCTCAGCACGTCGCAATATCGGCCCG
+GTCAGCACGTCCCAACTCTCCCACCACCACCAGTACCTTACCATGCTTCCCCACCTGATC
+ACTCTAAACATGATCTAGTGCCGCCATTACCTCCAAATCATTACTCGTATGCTTCACCAA
+CAAGAGAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAT
+>ds2020-267_418
+CAGCAGTCCGCAAGTATTACTCAGTGTACTCCATTTGGTCCTTGTCGCTGAACCTCTTTG
+ATTTAGATGGAGGGGGACTTCCTTGATAGTCATTATCATAAATACCTTCATAGTTTACCT
+CCGCTGCAACAGCATTGTAGTAGTCCTGCCTCTTGCACCGGAAAACTTCTACATACCTCC
+GCCCCATGTTCTGACGATCTCTATGAAGAGCAAACTCAACCTGTTGCGGACGTGCTG
+>ds2020-267_419
+CAGCACGTCCGCAACAGACGCAGAGTTGAAACTCTCAAATTGTTTGGTGACGATCTTCAA
+CCAACCTACGTTTATATCGACAAGTCGAAAAACTTTTTCATCGGGAATGCTGCTTCCGCG
+AAATACGAGACAAATCTTAAGACTAAATCAGATGATGGTTGGTTGTATAAAGATATAAAA
+CGTTGGGTAGGTGTGAACAAACACAACTTTACGGTGTAGCGTTTGCGGACGTGCTG
+>ds2020-267_420
+AATGATAAGGAAGTGGAAAGCACCTTTGGCAAATGGACCTTGAGCCAGGCATCTGAGACA
+GGCAATAATGATGAATGGGATGATAGTTTGCTAACTAAGGAGGAAGTGGAGGCAAGGTTG
+CAGAAGAAGGACGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAATTCCTAATCGG
+CACTAGGTCGGGATATTTGCGGACGTGCTGAGGAATCTGGCCTTGCGGACGTGCTG
+>ds2020-267_421
+GACGCACTGACCGTTTCCTAATCCCTGACGCACTGACCGTAAGGCTCCTCGTGACGCACT
+GACCGTAGAAGGCACCCTGACGCACTGACCGTAATTCACAGGTTCGGCGACGGTCAGTGC
+GTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCCAATGCCCTCGCACGTCCG
+CAAGTGACTCTCGCCACACGTCGCAACCATAAGGGGGTAACATTGCGGACGTGCTG
+>ds2020-267_422
+CAGCACGTCCGCAACACACCCATCGTGTAACGCTCTCTCTCTCCGACGCAGTCATCTTCC
+TCCCTCAGCCATCCAAGCTTAATCCCACAGTTCACATCCACGAGGTACTGTTCACGTTCC
+TTTTCTTAGAAATTTGGGGTTTTTGTGTATTTGGTTTATGGTGTATGGATTTGTATTAAA
+TTGGTTGAGGGGTTTCTTCCAAATTGGTTTAGGGTTTGCGGGTTGCGGACGTGCTG
+>ds2020-267_423
+GGACGTTCGGGCTTTTCGTCGTGCCTTTGGTATCATGCTACCGGCGTATGGCAATGAAGT
+GATTTTTATGCTCAAAGGCAGTGCGCTGGCATCGACCATCACTTTGATGGATATCACCGG
+TGAGGCAAAGACTGAAGCCCGAACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCGC
+AAAAAGGCCCCACGTTTCTTGCGGACGTGCTGGGGTATGTCCCTTGCGGACGTGCG
+>ds2020-267_424
+GGACGTTCGGGCTTGGTGTAGGCTGTGGTCGGCTTTGTTCTACTTGTCGTTGCTTTTCGA
+CTTCCAATTGTGCATGTTGCTCTGCAAAGCTTTTTCCGCTTTCCATTGCTCGTACTTACT
+CATGGCGGAACCCCTACTAGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCA
+CGTCCGCAATTCATTGAAGATTGGGACGTGAGTACGTACACTTTGCGGACGTGCTG
+>ds2020-267_425
+CAGCACGTCCGCAAGTGTGTCGAACTCCCCCTCCCCCCCGCCAATAAGTCTGTCTTACAT
+TTGTGCAGTAAATCATGCTCAAACGCCTTCAATGGCTTAGTGTAGGTCTCTTATGTACAA
+TTTAAAATCCTCAATAAATGTGCCTAACTGAAAGTTTTAGCTCTGTGCCTCCTCTCTCAT
+ATAATCTCTTATTTGATTACTGATGCTTAACCTGACGAGATTTGCGGACGTGCTG
+>ds2020-267_426
+CAGCACGTCCGCAAACAGCACCGCTCAGCACGTCCGCAAAATCCTCCGCTCAGCACGTCC
+CAATGCGATAAGGCTTGCGGACGTGCGCTTTAGGCGACGCACTGACCGTAATCCCTCCTT
+TCGAAAATCCTGCTTAGCCGGAGCTCTCACTGAGAAGGCTGGCCTATAGGAGACTGCATT
+ATTGGCAGATACTCTGAACTCCATTTCTTTACGAGGCTTCCTAACCCTAACGCTG
+>ds2020-267_427
+GGACGTTCGGGCTTCTTTAGCTTCATACCTATCCTCAGAATCAGAACTCTTTTCTCTCTC
+AGAGCGCCGACTATCACGGTCTCTCTTATCTTTATCTTTATCTTTATCCCTGTGTCTCTC
+TCCATTCCTCTCTTTTTCACGTTGCCGATCTCGATGACTCCTCTTGGATTCCCCCTCCTT
+CCTGGATTTATGCTTGCCCTCTTCCATTTCTTTCTTCCTGATACACGACGTGCTG
+>ds2020-267_428
+CGAAAAAACCAAATTCAGCTCTACGTAAGATGGCCAAAGTACGTTTGAGCAATCAACATG
+ATACATTTGCTTACATTCCAGGCGAAGGTCATAATTTGCAGGAACATTCTATGGTGTTAA
+TAAGAGGAGGTAGAGTGAAAGATTTGCCAGGTGTGAAATTCCATTGTATTCGAGGAGTCA
+AGGATTTGCTGGGAATTCCGGATCGAAGAAGAGGGGCTACAACGGTCAGTGCGTC
+>ds2020-267_429
+GGACGTTCGGGCGTCTATTTACGGATGGCAGCCCAAGGCGCAATCTTTCAGGATCATGCA
+CGTCCGATGTTTCCGCCATGGCCCGGGACCCGATGAAGAAAGCCCGAACGTCCTTACTTC
+CAGTAGGAGCAGCACGTCCGCAAATGTACTCCGCTCAGCACGTCCGCAACGTGTCACCAC
+TCAGCACGTCCCAAGTGTCCACTGGCTATAGATTGCGGACGTGCTGCTCCTAGAT
+>ds2020-267_430
+CAGCACGTCCGCAAACGCTCACGCTTCAGCACGTCGCAATGTTCGTCCGGTCAGCACGTC
+CACAAACCCTGAATTGCGGACGTGGCGCTTAAGGCGACGCACTGACCGTGCAGCCCCTGT
+TATATTGTCGGTGCAGGGCTACTTGACCAGTGAGCTATTACGCTTTCTTTAAAGGATTGC
+TGCTTCTAAGCAAACCTCCTGGCTGTCAGTGCTTCCCCACTTCCTTTTCCACTTA
+>ds2020-267_431
+GGACGTTCGGGCTTTCACTCCCAGATATAAGCCCGAACTCCAGGATGCCAGGCAAGCCCG
+AACGTCCAGACAGAAGAATAAGCCCGAAACGTCCACCGGAACGCACAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAAGTCACCCATCGTGCGGAGAGTGAAT
+TATAATTGCGGACGTGCTGAGGGCGGTTTTTTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_432
+CAGCACGTCCGCAACCTGCTTTCCCTCCGAATAAGCAAAATAAGTTTATACACCTAATTT
+TGTTCCTGCCGATTGAATAAGAATCAAATACAATCAAGTGGAATAAAATTCTAATGAAAT
+ACAAAAATTTTTAAAATTAAATTAACTAAAGAGAGAAGGTAGGAAGGGGGCAAATACGGT
+CAGTGCGTCGCCTTAAGCCCGAACGTCCAGCCCGCATGTCAAGCCCGAACGGCC
+>ds2020-267_433
+TATCTAAGGAGCAGCACGTCCGCAAACGCATGCACATTGGACAGCGATTGGTTGGGTTGC
+CCAAGGTACGGCTTTAATTGTGTGGGGAGTAACTGAGCGCTACCGTTTAAGCCGATATAT
+TGGTGTGGTTTTAGTTTTACTTAGTTCTATTGCGCTGTTTTATCAGGTGTGGGTAAACGA
+AGAGTTCCCAACGCTAAGCACAAGCATCACAGCCAAACGATTGCGGACGTGCTG
+>ds2020-267_434
+CTATCTAAGGAGCAGCACGTCCGCAACAATAATTCCTTATTGAAAAATTCGCTCACAGGG
+CTTCTGCAACTGGGTAATGCATGCTTGTGAGCGAATTTTTCAATAAGGAGCTCCCACAAT
+AAGAATGTGGGTCTGGGCTGCCAACCACAAGGTCACCAAAATCATTGTTTGTGTCAACCA
+ATGTTTCACGGGAATCCAGATATCTGTGAGACCAATTCGAAAGCCCGAACGTCC
+>ds2020-267_435
+CAGCACGTCCGCAATTTTGCAGCCATGTACGCCCTGGCCATGGCTGGTCTGTTCACGGTT
+TTGAGGTGTTCCGTTGCCTGCTCTTCAGCGGCCAATATCTCCTTGTATGACTTAGGCGGC
+TCACCGATGGCAAGCGTCGTTCCCAGCGCCTTTGCCATAAGGTTAGACAAATCCCCCGTC
+CTCACGATTTGAGACCCCCTGGCGGCGCCCACCCATGATGTTGCGGACGTGCTG
+>ds2020-267_436
+GACGCACTGACCGTACCTGTAACCATCAATACTTTTTCTTGCAGTAATAATTCCATCATA
+AACTGCATATCATCTTCGATTGGATAAATGTCACGGTCAATTTTTGGGAAACAATAAAAC
+GCCCCTTGTGGCATGGTGCACGAGATACCTTTAATGGCGTTTAGACGCTCGATAGCGATG
+TTGCGCTGCTGATACAGGAGCCAATACGGAACGGTCAGTGCGTCGCCTTAAGCG
+>ds2020-267_437
+GACGCACTGACCGTCGGACATTCCTTGACGCACTGACCGTTCCTGCGCTGGGACGCACTG
+ACCGTTATACCCCAAATCAACGCACTCTCGTACGAAGGCTAGCGATACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTACCAGGCTGTTGCGGACGTGGAG
+TAAGAGACATTGCGGACGTGCTGACCCCACCCCATTAAAATTGCGGACGTGCTG
+>ds2020-267_438
+CAGCACGTCCGCAACTGGCACCTTTTTCGGATGAAGACGAAGACTGTATTTCCGAAATCT
+GTCAAACACTTTCTTCAAATTCACCGTCTTCTTAAGCCCAAGACTTGGCGATCATGTCAT
+CGACATAGACCTCCATTTCCTTGTGAATCATATCATGAAACAGCGCAGTCATGGCTCGCT
+GGTACGGCGCCCCGTCATTCTTTAGACCAAACGGCAACACTGGCGGACGTGCTG
+>ds2020-267_439
+GACGCACAGACCGTCGATATGGCTCTAGCATAGGCAGTGCGTCCCGGGCACCTCACGGTC
+AGTGCGTCAGGAACATAATAACGGTCAGTGCGTCAGGGCATACTCTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGGACTATCTCTCAGCACGTCCGCA
+ACTTCTTTGTCGTCAGCACGTCCCAATAACTGGTGGATGCTTGCGGACGTGCTG
+>ds2020-267_440
+TCAGCACGTCCGCAAGCTAACCTTTGTAATTATTGTAATTTTTCTTTACTCTCTTTTCAT
+TTCAAATTTATTCAATTTTCTTTGAGCTTTCTCTCTCTAGCTCTTCCAATTTCGACGTTC
+TCTTTGTTTGAACACCTCCTTCTTTTCTTCCACCGACTTCCGTCATTTCCCGCGTCCCAG
+TTTTCTTCACTGATAATTCTTCCTCCTCCTCGTCGGATCCACGGTCAGTGCGTC
+>ds2020-267_441
+CAGCACGTCCGCAAGTTGAGTTCAGTGGTGTAAACGAGTTGTCCAGTGTGGTAACGGTAA
+GGGAGTACAGTAATGCCAGGTTGTGGAAATCTGTTGTTTGGAAGTTCGTTGTCGTCTAAG
+TGACGATAAAATTCGAAGGGTTCGTTACGGTCAATGTTCGCTTGAGTGTAGCGTTCATAT
+GTTTGAGAGAAGGTGTGTTCGTATTCTGATGTGCGATGACTTGCGGACGTTCTG
+>ds2020-267_442
+CAGCACGTCCGCAAACCACGCCTTTTATGAGCAGCTAAGTCAGCTGCAGATTTTGCAACA
+ACAGATTGCATCTTTGACCACTAGCACCACCAACTAAAAATTGCCCAGCAAACGCTACAA
+GCCGATATTCAGCAGCGTTTTGCGACATTGGGTTTTGTGGATGACGCCGATAATCGCGCT
+GCGGTGTTGGTTGATACCGAGCGAGAAAGGGTTGAACTATTGCGGACGTGCTG
+>ds2020-267_443
+AAGCAGGTATACGGGTCAGACGTTTAGATGCAGGGTAGCCCTCTTCTACTATCCTGGTTG
+CCTTGACTTCCTGAACTTCAGCCAGATGTCCAAATTCAAAGGCTAACCAACACGAATCAT
+TTGCGACGGTAGGCACTTCTTTTCCGAAAGGCACAGAACACATTGCAGCCCTACCTATTG
+GGGGGGGGAGGGCACGGTCAGTGCGTCGCCTAAGCGCTCTTGCGGACGTGCTG
+>ds2020-267_444
+CAGCACGTCCGCAATGTGGCAACCGTGTACGACGTTTCCGATGACACCCTGTCTATCAAG
+TGCCCCAGTATCAGCATATTATTGGCGTTTGTGTTGATAAGGGACGTGTAATAGGAACCA
+CTCGGCATCGTCCCAAAAAGGTTGACAAGGTACCCCGAAGGATGCTCAAGAAGCTTCTTG
+AGAAGCTGGCGCTTTGACACAGATGACATAGCCTAACGTTTGCGGACGTGCTG
+>ds2020-267_445
+CAGCACGTCCGCAAAGGGCCGGGGATTGCGGACGGCTGAGTAGAGGGTAGTTGTTATTTT
+TGCATGCAAGCTACTGACGTCTTTTTTTTTGAGTGTTCGATGGCTTTGGAGAAAGGTTTT
+TAGGATTAGTGCATCAGGGGAAGATGATGCATCTGATGAGCATAAAGGTATGGAGGTTGC
+GGACGTGGAGGTGTAGCTTCTTGCGGACGTGCTGAGGTCAGTCGGGTTGCGGA
+>ds2020-267_446
+GGACGTTCGGGCTTTTGAGTTTCCCTGGACTTCGGGCTTGTTTCTGCGGCTGGACTTCGG
+GCTTTGTCTCTGGGGGGACGTTCGGGCTTATCTACACCCTGGAAGTAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAACCGGCAAAACCTCAGCACGTCCGCA
+AGACGAACTACTCAGCCGTCCGCAAAGACCCCATCATTGCGGACGTGCTGCTC
+>ds2020-267_447
+GACGCACTGACCGTCGACGAGCCGATAGTACGGTCAGTGCGTCAGTTCTGTTCAGACGGT
+CAGTGCGTCAAGGTAGGGGCAACGGTCAGTGCGTCAGCGGAACTCGAACGGTCAGTGCGT
+CGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGTTATATACGGTCAGCACGTCCGC
+AATGCGGTCTCCCTCAGCATGTCCCAAACCCAGTGCGTGTTGCGGACGTGCTG
+>ds2020-267_448
+GACGCACTGACCGTAGCTGCCTGCTTCTTGACTTACATTCTTGGCCCCTTCCCTGGCGAC
+CACTACCATTATGCGATATAAAGTGAAATCCAACCTAAATTCCCAAACAACTTGAGGTTG
+CTGACTCATCATGTGGGTCAAAAACTGAACTAATTCCACATTTCCAGTGCAGTGAACTCC
+ACTTAATATAACCATTTTAGTGATTTAAGGTAAGTGTTTACGGTCAGTGCGTC
+>ds2020-267_449
+GACGCACTGACCGTTCTCTTCAGGATGACGCACTGACCGTTGCCCTTTCGATGACGCACT
+GACCGTCCTGAGACAGTTGACGCACTGACCGTTCCATTATCGCTGACGCACTGCACGTCT
+GACGGTCAGTGTATCTAAGGAGCAGCACGTCCGCAATAGAGTCCCCCTCAGCACGTCCGC
+AATAACTAGACGCTCCACGTCCCACGACCCTGGCTTATGTTGCGGACGTGCTG
+>ds2020-267_450
+CAGAACGTCAGCAATCGGCGTACCCTAGCGCGTCCGCAAGGAACAATCCTTCAGCACGTC
+CCAACTATCGTGCAGCACGTCCGCAAGAGTCGTACCCCAGCACGTCCGCAAGTAACAATC
+CTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGCGCCGTACCCCAGCACGTCCG
+CAAGTAACAATCCTTCAGCACGTCCCAACTATCGGGGCATTGCGGACGTGCTG
+>ds2020-267_451
+CAGCACGTCCGCAAACCCAAAGCTCTCACTGCATCTTCCATCTCCTTCCTCCTCCCCTGC
+ACCGAAACGACGCCGTACGTACCCCTTCCCAACATTTCCAAACTCTCACGACCACTCGTT
+TTCCGTCTCTCGTCTGATCCGGAACCGGAACTACTCGACAATACGATGTCGTTTTCTGTA
+GACGAAAATGACACAGATAAAACCTTAGCCGGAACACATTGCGGACGTGCTG
+>ds2020-267_452
+CAGCACGTCCGCAAAGCTCCGTTGGTTAGAGCACTGCCTTGATAAGGCAGGGGTCATAAG
+TTCAAGTCTTATTAGACTCACCATTAGATGAGCTTAGTAAGCGCAAGCGAACTTAGCGAA
+ACTTATGTACCGCTACTTAATTACTGTAGCTGGTTAAAGTCTTATGTATCTTTACTCAAT
+TAAGTAACGACTCAATTAAGTAGCGGAGTGCGACATGATTGCGGACGTGCTG
+>ds2020-267_453
+TTGACAGAGACGGCACTCACAGGAATTAGTCTAGCAGCATGGTAGAAAGTCTTAGCCCAC
+AATTGCTTAAGTGGGGCAAAGCCCCCTATGTCTGAAATGAAATGGGAGCGCTTATACTTC
+TGCCATGTGCGGACGGGATTAGTCATGAAAGCACCAAGCCCGTATTTCTTTTCCCATTTT
+CCTATGATGTAGTTGAACGGGACCAGATTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_454
+CAGCACGTCCGCCACTGATCCGCCATTGTGAGCGGGCTGGCCGACGCGCGACCAACTCCC
+ATCCTATTGAAGCTGCTGATGTCTGTACAGCGGTAAGTGGGGGTGTCTGAATGCGGTACT
+CGGAAGTGAAATTGCACAGGTGCCAGCGAGGTACATAGCGTCACAGCTGCTAACGTTGCA
+TCAGGATTACAAGCAAGCGGTGCCGGAGGAAAAACGGATTGCGGACGTGCTG
+>ds2020-267_455
+CAGCACGTCCGCAACCTCACGCCTCTCAGCACGTCCGCAACCTCCTCTTCCCCCCTGAGT
+GGGAGGGCTGTAAACTCCTCTTTGTCCTTACCGACAAGTCCCTTGTCAACGCATTCCACT
+TCCCCCTGATTCCCACTCAGCAGAACTCCATGCTACACAACGCTGCGGCTGAGGCTCTCA
+TGCATCTCAAGTGCACCATCCACCTCAGCCCCATCATCAAGCCCGAACGTCC
+>ds2020-267_456
+GGACGTTCGGGCTTTGCGTGAGGGGTGTTGTGGGGCCATGTTGGACTCTTCTGCCGGAGG
+GTCGCGCCGCATGATGCTGGGAGTTGAACAGTCTGGGAAGTCTGGTGTAGAAGCCCGAAC
+GTCCTTACTTCCTATCTAAGGAGCAGCACGTCCGCAAAATGACAAGGTGGTTGCGGACGT
+GGCCCAAGTGGAATTGCAACGTGCTGACGGGCTGGGGTTTGCGGACGTGCTG
+>ds2020-267_457
+CAGCACGTCCGCAAGGCCTTTGGGGTGTATGACGGGCACGGTGGGGCTGAGGTGGCGAGG
+GCTTGCAGAGATAGGATGCATGAGTTGGTGGCGGAGGCAGTGGAACTGGAAAGGATTAAT
+AATAGTAATAATAAGAAGAAGAAAGATCCGGTGGATTGGGATTGGGAGAGGGTGATGGAG
+GGGTGTTTTGGTAAAATGGATGAGGAGGTGAGCGGGATTGCGGACGTGCTG
+>ds2020-267_458
+CAGCACGTCCGCAATTCATAGCCCCTCACTATAGAAGCTCCCATTGGAACTATGAGTACC
+CCAAATGAATGGGTGGCACATAATAGACCCAACTTCAATCGGTTACGTTGTTCATCACGA
+ATCTCTCACGTCAGCAAACATGTAAAGAGAGAGATAGAGACAATGTTTTATACAACACAT
+TGCCCGGGAGTTCCTTCCAGATGAAGACTACGAAGAGGTTGCGGACGGCTG
+>ds2020-267_459
+GACGCACTGACCGTATTAATGCATGTTGTAACGGTCAGTGCGTCAGCGCGTCGGGAACGG
+TCAGTGCGTCAGCAAGAGTTATACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAGC
+ACGTCCGCAAAGACCACGGGGTCAGCACGTCCGCAAGTGAGGCCTACTCAGCACGTCCCA
+ACTTACATTCCCTCAGCACTCCGCAAAAGGGTTCAAGTTGCGGACGTGCTG
+>ds2020-267_460
+CAGCACGTCCGCAATGGTATTAGTCTGAGAGGAGCAGAGGTAAGCACGTTAGAGCGTTCT
+TTTTTCACCTTTGTTTCTCATATAGAAGTCAAACTGAATGCATCTAATTTTGCTTCTCAG
+GCAAAAATCTATGGCGCACTACAACAGTCGTCAATTCGGATGGTCGCGCGTGATGTTGCA
+ACGTGGCAGGACTTTGATGCCTGCTCTGCTTTGGGATTTGCGGACGTGCTG
+>ds2020-267_461
+CAGCACGTCCGCAAACACTTCTGGGCGCCGTCGCAAAATGGTCGTGATATTGGGACGTGC
+TGAGGAGCGAGCCATTGCGGACGTGCTGCTCCACGCTTAAGGCGACGCACTGACCGTCGG
+TATACCCTTGACGCACTGACCGTCCTCACACATCTGACGCACTGACCGTCGTAGCAAGGA
+TTTTACGGTCAGTGCGTCACGCGACCTGCTACGGTCAGTGCGTCGCCTTAA
+>ds2020-267_462
+GACGCACTGACCGTAGTCTGAACACTGACGCACTGACCGTGATTGCGGGGTTAGAACGGT
+CAGGCGTCAGGGTAACGTTAACGGTCAGTGCGTCAAGGCATAGATTACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCACAGGCCGGTCAGCACGTCCGCA
+ACGGCACTTTCCTCAGCACGTCCCAAGACCTAATCATTTGCGGACGTGCTG
+>ds2020-267_463
+CAGCACGTCCGCAACCCAGCCTTCCTCATTCACCACCACCACCGCCACATTCACCACCAC
+CACCAATTTATCCGTATCCATCACCTCCACCTCCCGTCCATTCCCCACCTCCCCCAGTGT
+ACCAGTCCCCTCCACCACCACCACCACTTTGTATGGAGCCACCCCCTCCACCTTCGCCAC
+CACCACCAGGTATTGAGTACTCACCGCCACCTACTCCTTGCGGACGTGCTG
+>ds2020-267_464
+CAGCACGTCCGCAAGCCGATACTTTTATAGCACCTTTAGCTGACTGGCTGTCACACTTTT
+TGCCACTCGGCCAATCGTTAGACCTTGAATTAAAATGGAAAATACCACAATCGCATAAGT
+CAACGTTAATAACAAATCTCGCTCGGCCCCGGCAGGTAATTGTAATACTAATGCCACTGA
+AATACCGCCTCGCAGTCCACCCACCAATCATGCTTTGCGGCCGTGCTGCTC
+>ds2020-267_465
+CAGCACGTCCGCAACTTGTCCCCTGTGCGCTTACCCAGGATCGTAGGTATACCCTCTGGT
+GTGGTGGACACGAGTGGGTCGTCTACTGGACAACCGCATAGGAAGTTCAGGATAGACAAC
+CTAATCGCTTTTGCATGGGCAATGCAAAACTTTAGGCCCCTTTTGTTATTAACTGATTCC
+AAGTAATCAGTTAGATCATCCAATACACGTGCTTTATTGCGGACGTGCTG
+>ds2020-267_466
+CAGCACGTCCGCAAAATATGCGCGGTGGAGATAAGAAATGATGATTAGAGTATTGGTCGT
+TGACGATCATGATTTAGTCCGAATGGGCATCGTACGGATGCTGTCAGATAGCCCTGACAT
+CGATATGATTGGTGAAGCTACTGATGGTGAAACCGCGATTATCAAAACCAAACAATTAAA
+CCCTGATGTGGTGTTACTTGATGTACGGAATGTACATTGCGGACGTGCTG
+>ds2020-267_467
+TTAGATTCGCTTAAGGCGACGCACTGACCGTTGTTATGCTGGTATACTATGTGTATATGT
+TTAATAGAACTACTTCTAACAACCTATGCATTCGGTTATCGTTTCCAATTGGATGATCCA
+TTAATGCAACTGACAGAGGATTATAAATGGATCAATTTTTTTGATTTTTACTGGAGATTG
+GGAATAGATGGAATTTCTATAGGAAGCCCTCAGCTTACGGTCAGTGCGTC
+>ds2020-267_468
+TAGCACGTCCGCAACATGCCGCCCATGATAAAGCACTGATACTAACCACCGCGGATGCAT
+TGGTGGTCTTCTTTGAAGTCTGGTGGTGTTGATGTCGTGGGGCCTGATGTGTGGTTCAAG
+TGATGGGGTGACGCAGTGAGGTAGCCGCGCCACTTAGTGGATTGGTGGTGTAAGCGTGTA
+GGCCGTGTGGTAGGTAAATCCGCCGCACTTTATGGTTGTGGCGTGGTGCG
+>ds2020-267_469
+CAGCACGTACGCAAGAAGCATGGGGTATTGAAACTTGGCAGGGGGGTGTGGAGCTTGAAG
+AAGTGATGCGGCCGGTACCTAAGGATGCGGCGGCTGGGTTACGTGGTTAGGAGGATGGGC
+CGGGCTGCGTTCGAGCTTGGTTTGAGAAGTGCGACTGGATTATGCCCGACCGGGTTTTTC
+AAATATAGCTTGGGCACGGCCAGGATACGGAGGTTTTTGCGGACGTGCTG
+>ds2020-267_470
+GGACGTTCGGGCTTCACTCCAATCCTAGCTTCACAACCACCACCACCCACAAGCCCTCCC
+ACTCCCTCTCTACCCCCACTTTTCTCAAATTCCCAACCGAATCCCCAAATCCAAGCCCGA
+ACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAATACACATGGGGTGCCCCGC
+AAAACCACATCGCTCACACGTCCGAAATGTATTCACTTGCGGACGTGCTG
+>ds2020-267_471
+GGACGTTCGGGCTTAGCGCACACCCTCTCAATCAGATTCCAGAAGATTCTTTGAGCTCTG
+ACTGCAGGAGTGCCTATGATCTGCTCGCCATTCTTTGCTGACCAGAGAACCAATTGTTAT
+TATACTTGCAATGAATGGGGCAGTGGCATGGAGATTGATAACACTTTCGGACGGGCTGAC
+AGTATGCAAAGTGCGGAAGTGCTGACAGCATAGTTATTGCGGACGTGCTG
+>ds2020-267_472
+CAGCACATACGCAATTGTCATCCCCTCAACACGTCCGCAACCTATACCCCCTTGACTTTG
+CGGACGTGCGCTTAGGCGACGCACTGACCGTGTATACCCCCCTCTGACACACTCTAGCCT
+TGCAGTCTCCAATGCAGTTCCCAGGTTGAGCCCGGGGATTTCACATCAGACTTACAAAAC
+CGCCTGCGCACGCTTTACGCCCAGTAATTCCGATTAACGCTTGCACCCT
+>ds2020-267_473
+CAGCACGTCCGAAAGTTATTCTTTATTGCGAAGTTCCAGTCTGTTAGCCTCAATCGTGAG
+TTCCTCCTCATCTCTGGGGAATCCGATCTCGATCTTGACGTTTCCCTCAGACTTGTTTCT
+GAAGTGGGGCATTTCAACGTGAGCGTCTTTGTAGCACCCAGATTTGAAGACCATAAAATC
+ATCTTCACCTTTGGTTGCCACATAGATCACTGACTTTGCGGACGTGCTG
+>ds2020-267_474
+CAGCACGTCCGCAACCGGTCTCGGCTGCTTACAGATAAATTATTGGCTTAGCATGAGAAG
+CTTGTGGCATGGGAGCAAAATCGACATGAGTTTAGCACCGAAGAGAAAATTGAGTGTTCT
+TGGGAGAAAAAGGGGTATTAAGGTAGGAGATGGAGAGTTTGCAAAGAGGTTTGGCTGAGA
+AAGGAGGGAAGGAAAGGAAAAGATGGCTTGGGCGATTGCGGACGTGCTG
+>ds2020-267_475
+CAGCACGTCCGCAATTCTGGGTCCTTGTACTGTAGCTTGACTTAAGCAAGCTATTTACTT
+AAAAAAAAACCGTCTTGATCTACGGCCATAACATCTAAAATCTTTTGTAATCGAGACCGA
+TACCGATACGCGCGAACTGGTTCTCGCCGTTCGGAAGGCATCGGTGGAGTCTATTCATTA
+CTTGTTTAAGCACCTCAATAACGACTAGGGCGGATTTGCGGACGTGCTG
+>ds2020-267_476
+CAGCACGTCCGCAATCTATAGGCCCTATACCCAAGTCAGACGAACGATTTGCACGTCAGT
+ATCGCTGCGGGCCTCCACCAGAGTTTCCTCTGGCTTCGCCCCGCTCAGGCATAGTTCACC
+ATCTTTCGGGTCCCGACAGGCATGCTCTCACTCGAACCCTTCTCAGAAGATCAAGGTCGG
+TCGGCGGTGCAACCCTCAAGAGGCATCATTAGTTGCGGACGTGCTGCTC
+>ds2020-267_477
+CAGCACGTCCGCAAACCAATATCGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGC
+CAAGGCAGGCAGATCACTTGAGGTAAGATGTTCGAGACCAGTCTGACCAACATAGAGAAA
+CCCCATCTCTACTAAAAACACAAAAAGCTTGGCATAGTGGCTCGCGCCTGTAATCCCAGT
+TACTCTGGAGGCTGATGCAGGAGAAGCCTATAGAATTGCGGACGTGCTG
+>ds2020-267_478
+CCGCAAGGTAATAAGTCTCAGCACGTCCGCAAAACCCCGGGCCTCAGCACGTCCGCAAAC
+CGTAATCCCCCACTCGAACGTATACCCATTAAGCCTTGCTCTACTCCTCTCCTTCCTCAC
+TTGTTCTCACATCAATCTCCAACCTTTTTATTGGATTTTCATCCTCTTTCACCTCCTTGC
+TCCTCATCCCCCAGATCCCCCCACTCCACCCAACAAGCCCGAACGTCCT
+>ds2020-267_479
+GGACGTTCGGGCTTGGAGCTTCCCATGGACTTCGGGCTTTGCCAAACCCCTGGCGTTCGG
+GCTTCAATTATAGCCTGGACTTCGGGCTTAGCTCACCGCTTTTAAAAAGCCCGAACGTCC
+TTACTTCCAGATCCGCAACCGTGTTAGGGTGGAGCAATTGCGGACATGCTGCCCCTAGTT
+TGCGGACGTGCTGAGGGATGTTATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_480
+GACGCACTGACCGTAGGTTCCCGACTGACGCACTGACCGTAGTTAATTCCCTGACGCACT
+GACCGTCTTCAGCGCCCCACACGTCCGCAATCTTTGGTCGGTGGCGTCTTGACCTAACTC
+GCATTGGTTACGGTTCAAAATCTGGTCTTCAATGGCGTTTCTAACGTATGGGTCGATATC
+GTAATACAACTCTAGCATGGCGGGGAGGATACCACTTGCGGACGTGCTG
+>ds2020-267_481
+CAGCACGTCCGCAATCGTACTTTCGTTCTTGATTAATGAAAACATCCTTGGCAAATGCTT
+TCGCTTAAGTTAGTCTTACGAGGGTCTACGAATTTCACCTCTCGCCTCGTAATACTAATG
+CCCCCAACTGCTTCTATTAATCATTACCTCTTGGTCTAAAAACCAATGAAAGTAGAACAG
+AGGTCCTGATTACTAGCAAGCTATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_482
+CAGCACGTCCGCAACGCACTCGGGTTCACTTCTTTACGGGTCGGTTACCTGCGAAGCGGA
+GGTTGCCAAACACCTACACCAGAGGGGGCAAGTAGCCACCGATGATTACGGGACTCTTGG
+CCCTGACCAGGCCCTGTTGCTTGCGAATGTATACAGGGTTTTCGGACACACGCTGGAGCT
+GCAACACTTTAAGACTCAGGAGAGATACGGACCTTTGCGGACGTGCTG
+>ds2020-267_483
+TAAGGACGTTCGGGCTTAGAGATGCGGGTGCTGATTCTGATAATTGGGGGAGGAAGAAGG
+AGGAGAGTAATGGTGGGTCTGGTTTTGATCGAGAAAGAAGAGTTGGGTTCGTGTCCAATG
+GTGGTGGTGCGGATTCTGAGGTTTGGGGGAAGAAGAAGGAGGAGAGTAATGGTGGTCCTC
+GGGGTTGTTTGCGGACGTGCTGAGGCGACTATAGTTGCGGACGTGCTG
+>ds2020-267_484
+CAGCACGTCCGCAAGCTTCCTCTAATAAAGCGGGAAATACCTCTTGGTGCTCATATGGCA
+GTGTTACATCTTTCATTGCATCTTTGTAGTTTTTCATGTGTTATGTCTTCTAACTATGTT
+ATCATGTTGAATATAGGGTTGGGATCCCTCCATTATGGATTCTGACATTTGCTATTTCTT
+ACAGGATTCTCCAATTCTTGGGATGCCAACAATTTTGCGGACGTGCTG
+>ds2020-267_485
+AGACGTTCGGGCTTTTTAGATCCCTTGGACTTCGGGCTTTTTCCCGTCCCTGGAGTTCGG
+GCTTAACTCAGGGGTTAAGCAAGCCCGAACGTCCTTACTTCCAGAAGCACGTCCGCAAGT
+AACAGAGGTTGGGACGTGCTGAGGTGAGCCCAATTGCGACGTGCTGAGAGATTTAGGGTT
+GCGGACGTGCGAGTGCATTTATTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_486
+CAGCACGTCCGCAATCGGAACCGGTTCGGAAGAATTCACAGGTAAGGGGCCCAGGTGTGA
+AGCCGTTGAAGCAACCGAAACCCAAGGCTAAGGACCCAAATAAGAGGGAGATGAGTATGG
+AGGAGAAGCACAAGTTGGGAGTTGGGTTGCAGAGTTTGCCGAAGGACAAGATGGAGCAGG
+TGGTGTAGATGATAAAGAAGAGGGGCGGAGTGCGGACGTGCTCTCCTT
+>ds2020-267_487
+GGACGTTCGGGCTTCTAAGGGAGTGTAGGTGGCTCATTAAGTCACATGTGAAATCCCCGG
+GCTTAACCTGGGAACTGCATGTGATACTGGAGAGATACAGCCAAGCCCGAACGTCCTTAC
+TTCCAGAGCAGCACGTCCGCAATCAGCCCGCCCTCAGCACGTCCGCAAGCCGTATTTCCT
+CAGCACGTCCACAATCCCCGCATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_488
+GGACGTTCGGGCTTCCATGCTGCAATGGCTGGTACAGAGAGTGGCGAGCCTGTGAGGGTG
+AGCGAATCTCGGAAAGCCAGTCTCAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAG
+TCGGAGTCGCTAGTAATCGCAGATCAGCAACGCTGCGGTGAATACGTTCCCGGGCCTTGT
+ACACACCGCCCGTCAAGTCATGAAAATAGGTAACAAGCCCGAACGTCC
+>ds2020-267_489
+GGACGTTCGGGCTTGAATTCGGCAGTGGACGTTCGGGCTTTTACATTACGTGGCGTTCGG
+GCTTAGAACCCTGGCTGGACGTTCGGCTTTCATTACCGGGTTATATAAGCCCGAACGTCC
+TTACTTCCAGTATCTAAGGAGCAGCACGTCCGCAATATTTCACAGCTCCCGTCCGCAATG
+CGCAGTTGCTTGGGACGTGCTGAGAAGAGTCCAGTTGCGGACGTGCTG
+>ds2020-267_490
+GGACGTTCGGGCTTTACCCCCCCACTCAATAATCCTACCGATATGTGTAAACAAATAATT
+CACAGCCTTATCTTGCGCGCAATTAAAGAGCATAGGGAAAGCATTTCGCTTACTGGAAGG
+GTCCTGCTCGGAGGCCAAGAACCGATCGATGATCTCCGGCGCGCTATCCAGCAATGTCTC
+CCCCGTGGTTTGCGGACGTGCTGAGGGAACAGCCTTTGCGACGTGCTG
+>ds2020-267_491
+GGACGTTCGGGCTTTCTGCCGCCCCTAAGGATCATATAAGAAACCATCTAGAATATGAAT
+CTTGAGAGTACACACGATGCTTGTAATGACCTAGCCATTCTACAATTAAAAGTTCGACTA
+GAACTGTAACCAAGGCACAGCTCGAAGCCCGAACGTCCTTATCTAAGGAGCACCACGTCC
+GCAAGACGTCTCACTTCCACGCAACTTAACTGCATTGCGGACGTGCTG
+>ds2020-267_492
+CAGCACGTCCGCAAAGTGTCTGGGATAGTCTTTGACTGTGATACAGGCATACCAACGGTT
+ACGGCTGTCTTGCACCAACTCGCAAGTGTTGATTTGATATAGGCTAAGGTTGTAGCTGTA
+CCATAGGTCAATGATTAGTTTCTGCCCTTTGGCTAAAGATAGTTGTAAGGTGGATTTTAA
+GCCCTTTTTGCCTGTTTGGTGAGGGATACCGCATTGCGGACGTGCTG
+>ds2020-267_493
+CAGTACGTCCGCAAGTGTCGGGTCTTGTTTTCTTTTGGGTTTGAGGTTGTGGAGGGAGTG
+AAAGGGGTGGTTGATGAAGATGAGGAAGGGGTGTGTTTGGGGATTTGGAGAAGAGAGAGG
+GCTTGGAGAGTGCAAGTGAGTGTGTTTGGGATTGATCTTCTGTGAATGGGTTTTCTGCTG
+AAGAAAATTGAGGTGGAGGAGGAAGAGGGGGGGTTGCGGACGTGCTG
+>ds2020-267_494
+GGACGTTCGGGCTTGACACCATTCCTGGACGTTCGGGCTTGGACGCGGGACTATAAGCCC
+AAGTCCAGATACGAATCGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAAGTTAC
+CGGGGTATGTTGCGACGTGGGGGAGAGGGAGATTGCGGACGTGCTGAGTATGAAAATTTT
+GCGGACGTGCTGCCCGCGAGCTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_495
+TCACTCCATCATAGTCTGATAGATCTTTTTAAGAATTGATTAATCGGACGAGAATAAAGA
+TAGGGTCCCATTATACATGTCAATATCGACAACAATGAAATTTATAGTAAGAGGAGGTCC
+AGATGGACGGTCAGTGCGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATACCG
+CGTCGATGTTGCGGACGTGCTGCCCAGAATCTCTTGCGGACGTGCTG
+>ds2020-267_496
+CAGCAGGTCCGCAACGTCGGTTTTGTGTCCGTATCGGCGGTGCCAATCGGTTGCGAGGGG
+TGTGTAGAGCGATTCGAGTCGGTCAAACACTGCGCGGAAGGTTGTTCGATTCGCTAAGAA
+ATAGGAATCGGTGGCGAAGGGGGCTTCAGCGTTCACGTGCCATTTATATGGGTAGTGGGG
+CTGCACATCATAGATGTGGGCAGGTCGTCAATTTTGCGGACGTGCTG
+>ds2020-267_497
+CAGCACGTCCGCAACTGAAGGTTCTTTCTATCTATGATCTTTCTATCTCTGTGCAGCTAC
+TTCACGCCATTCAAATAAATAGCTCATCCTCCAAATTCCAGACCCTTTTGGTTTCTGCAA
+AAATGTCGAGAGCTCAACCACACAGATGGCTCTCCCTACTCATCCTCTTCCTTGTACACC
+TTTCACACACATCTCACGCCGACGTGGACTCTGTTTCGGACGTGCTT
+>ds2020-267_498
+GACGGCACTGACCGTCTAAGTGTAGATAGTGTAGATGTATCGCAAGCTATGCCAACTATC
+GATGACGCATCTATGATGTTTGCCGCAGGCACAGGTGAGCTAGCGGATAAACACATCTCT
+GAGCCTATAACGGGTGTAGAGATGGCTGTACAGGACGCGGCTATTGGGACGTGCTGGCTG
+GGGTGACGTTGCGGACGTGTGACGCGTGCGTTGTTGCGGACGTGCTG
+>ds2020-267_499
+TAAGGAGCAGCACGTCCGCAACGAGTTAGGGGTCAGCACGTCCGCAAGTCGACTACGGTC
+AGCACGTCCCAAGTGGAGCCAATTTGCGGACGTGTCGCTTAGGCGACGCACTGACCGTTG
+GCGTATGGGGTACGCACTGACCGTGTGTCATCCCATTAGATACGGCCAGTGCGTCAGGTA
+AAAATCTACGGTCAGTGCGTCAGCCCCCCGAGAACGGTCAGTGCGTC
+>ds2020-267_500
+GACGCACTGACCGTGATTTATCCCCTGGACTACGGTCAGTGCGTCAGGCAACACTATACG
+GTCAGTGCGTCAACCCGTTCCTAACGGTCAGTGCGTCGCCTTAAGCGTGGCAGCACGTCC
+GCAACCAGATATCGATCATTGCGACGTGCTGACCGTACAATGATTGCGGACGTGGAGGCA
+GATGGACTTGCGGACGTGCTGAGCGAATTCCCTTTGCGGACGTGCTG
+>ds2020-267_501
+CAGCACGTCCGCAAGACTTCGCCCCTATTTCTATCCGTGTAATTTCGAATACTTGAACGG
+TCGATTCTTTTTTTTTCATCTTAGCTTTCACCTTTTCGAATGAAACCAGAGGAGTGTTTC
+ATTATGATCTGGATTACACTTTTATCTTTCATTTTATTCTTATCCTTTTCTTCGGGCAGA
+CCCTCTATAACATAACAAAAAAAAGGGGGCCTCTTGGGGACGTGCTG
+>ds2020-267_502
+CAGCACGTCCGCAACTTGTCCCCCGTTATGTTATAGAAGAACTGAACTTATTGCTGGGCT
+GGTTATTCAGAGCCAGCAATTGGCTGCCGGATTTCGTCCCGCAACTAGAAGAAGATCGCT
+TCGGGGGTCACTGTGGCGTGGCTGAATGTAGAGCAGTCTGCCCCTACAGCGTTTGATCAG
+TAGATTATTTAGAACTTCGGAGGGCCAGCCCATTGCGGACGTGCTG
+>ds2020-267_503
+GGGGAAACCTGGAATGTCCGGAGTAGTGTCCGGTGGCCCTGCCCTGAATGTATAGGGGTG
+TGGGTGGTAACGCGGGGAAGTGAAACATCTTAGTACCCGTAGGAAGAGAAAACAAGTGTG
+ATTCCGTGAGTAGTGGCGAGCGAAAGCGGAGGAGGCTAAACCGTGTGTGTTCAAGCCGGC
+AGGTGTTGGATGTGCGGGGTAGTGAGGGGACTTTGCGGACGTGCTG
+>ds2020-267_504
+ACATTACGTTCGCTTGCATCCGGCTGTCCATAAAGCTGCCATGGCAAAAGCAAACGGTAC
+CACCGCGCCCACAAAGCCCATATACAGCATCGGCGGGTGAAAAATTAACCCGGGGTCTTG
+CAGTAGTGGAGGGAGAGCCAGTTGCGGACGTGCTGCTCCTTAGATTGTCCGCAACTACGG
+CTTAATACTTGCGGACGTGCCAAGAGTGGTCCCTTGCGACGTGCTG
+>ds2020-267_505
+CAGCACGTCCGCAATAAAACCACTGGAAGTAAGGACGTTGGGGCTTCATTACGCTCGTTG
+GTAGTATCTACCTGACAACCTGTGTCGGTTTGGGGTACGATTTGATGTTACCTGATGCTT
+AGAGGCTTTTCCTGGAAGCAGGGCATTTGTTGCTTCAGCACCGTAGTGCCTCGTCATCGC
+GGACGTGCTGAGGTGCCGAATATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_506
+CAGCACGTCCGCAACTCCTACTGCCTAGCCCTTGGGACGTGCTGAGGGTCTCAATATTGC
+GGACGTGCTGCTCCTTAGATATAAGGACGTTCGGGCTTAAAGGTCCCTCTCGCCTCGTCA
+ATCACTTCGCCCATCTTCAGCGCCGTGCCCGAGGGGGCGTCCGCCTTGTGCTTGTGGTGC
+GCCTCGATGATCTCGATGTCATAGCCCGTATAAAGCCCGAACGTCC
+>ds2020-267_507
+CAGCACGTCCGCAAGAGCTTCCCGATCTCTTAGGATCGACTGACCCATGTCCAACTGCTG
+TTACCATGGAACCTTTCTCCACTTCAGTCTTCAAGGTTCTCACTTGAATATTTGCTACTA
+CCACCAAGATCTGCACTAGAGGCTGTTCCACCCAGCATCGCTGCCAAGGCTTCCACTCCC
+TCCTATAAGCCCGAACGTCCAGCATGTCAAATAAGCCCGAACGTCC
+>ds2020-267_508
+ATCTAAGGAGCAGCACGTCCGCAACGTACTACTGGTCAGCACGTCCGCAATTACCTGAGA
+CTCAGCACGTCCGCAATCAATTACGGGCCCGCAACTTCCCTGATTTGCGGACGTGCTGCT
+CCTTAGATATCTAAGGAGCAGCACGTCCGCAAAAACCTTTAAGTGGGACGTGCTGGGGGT
+TAATGATTGCGGACGTGCTGAGGGATGACGCCTTGCGGACGTGCTG
+>ds2020-267_509
+CAAGCTTTTAATAATATGGCCGTGATCTGTAATTACGTGCGACTATCTCCACTATAGAAA
+TAAAAAAAGGAGAGAAAGAAAAAATCCGTTAACGTTAATAAATACTAGAAACAAAGTGTA
+GGCTTAACGGTCAGTGCGTCGCCTTAAGCGAGGAGCAGCACGTCCGCAACTGGCGACCGG
+TGTAACATTGCGGACGTGTGAGTGTGATAATTTTGCGGACGTGCTG
+>ds2020-267_510
+GGACGTTCGGGCTTCTACTAAGGGCTGGACGTTCGGGCTTGCAAACTTCACTGGACGTTC
+GGCTTATAAACCCTACTAAGCCCGAACGTCCTTACTTCCAGAGCACGTCCGCAAGTTGTC
+TCGACTCAGCACGTCCCAACCTCGCACTTGTTGCGGACGTGCTGACCGAGTGACATTTGC
+GGACGTGCTGAGGTACGAATATTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_511
+CAGCACGTCCGCAAAGAATCCCCGCTTTGTGGCGGAAGAAGCTGGTGATGATGATTTCTG
+TGATGTGGGAAGTGTGAGAACAGCGGCTGCTCACCCCCATCACTCAGAAGAAGAGGAAGG
+AGATGGTCTTGAGGTTGAAGATGGTAGAGAAAGAGTGGAGAAGAAAGCAGTTCTTTATAT
+TTGGAAGTCTCAGAGGCAGAGCGAACGAGTATTGCGGACGTGCTG
+>ds2020-267_512
+CAGCACGTCCGCAAATTCGTTGGAATACCCTCTGGCCTATTTATCACTCAACTGTTCGAT
+TCCTGCTGATGGCGTGCCACGAAGTTCATTATGGAGCTCTACGGCCCGAAAGGCTTAGTG
+GGGTACTCCCTTGGGAGGGTTGGCCCGGTAATGAATGGACGGTCAAAAGACCATCAGTTC
+GGCTGGGTCCGTGCGTCATAGGAACGAAACTTTGCGGACGTGCTG
+>ds2020-267_513
+CAGCACGTCCGCAATTCAACACCAATCTTACCCTCAATGATCTCATGTTTCCCATCTTGG
+TCTTCTTCAAATTCATCCGAAGAACTCCCATTTTCTTCAACCCCTCCGTTCACACCAGCC
+ATAGCCATAGTAGCATCCGTCACCGCCTTTTTCTCCTTACTCGAAAAAGACTCCAACTTT
+TCAACACTACCCTAGGGAAGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_514
+CTAAGGAGCAGCACGTCCGCAAGGATCTCACCCCAGCACGTCCGCAACATCTCTCCCTTT
+GCTTTCGCTCCTCAGCGTCAGTTACTGCCCAGAGACCTGCCTTCGCCATCGGTGTTCCTC
+CTGATATCTGCGCATTTCACCGCTACACCAGGAATTCCAGTCTCCCCTACAGCACTCAAG
+TTATGCCCGTATCGCCTGCACGCCCAAATCGAAGCCCGAACGTCC
+>ds2020-267_515
+CAGCACGTCCGCAATTAGTCCTCCCCAGCACGTCCGCAAACTCTATACCCCCAGCACGTC
+CGCACTGCTCTCCGGCAGCACGTCCAGACAGTTACGTTTGCGGACGTGCTTCTGGAAGTA
+AGGACGTTCGGGCTTGGGGTGTGAGTTATTACCGCAAATTTTTTATCCTTTGGTCACAGG
+ACGCGCCAATGGTACAGGGAGGAGGTCTGTAAAGCCCGAACGTCC
+>ds2020-267_516
+CAGCACGTCCGCAAGGCAGGTTGGGTTGCAATCACCACGCCTACCAGCATGCCGACTATT
+CCCCAAACCACAGCCATGACAGAAAATTGGCGCACAACCCTATAGTTGTATGAGTTTTCT
+TTAGTTATCGTCATGATCTCACTCTGTTGTAAAAATACACTGAAAGAATAACAACCGCAC
+TGCACAACTACCATCACACACACCAATGATATTGCGGACGAGCTG
+>ds2020-267_517
+GACGCACTGACCGTCGCCATCCTCTTGACGCACTGACCGTAAGGGGACACCTGACGCCTG
+ACCGTTTCTATGCTGTTGGTCACGGTCAGTGCGTCGCCTTAAGCGTCGTCCGCAAATCCG
+CTGGGGTTGGGACGTGCTGAGATGGACCGGGTTGCGGACGTGCTGAGTGAATACTGTTTG
+CGGACGTGTGAGGAGTTATCGGTTGCGGACGTGCTGCCCTTAGAT
+>ds2020-267_518
+TATCTAAGGAGCAGCACGTCCGCAATACCAAGGGGCTGGAATTGCGACGTGCTGATGGGA
+TAAGTCTTGCGGACGTGCTGAGGGATTCGACCTTGCGGACGTGCTGTCTGGAAGTAAGGA
+CGTTCGGGCTTCCCGTGGCTTGTGGACGTGCAGTTAGCTATGTCGATGTTGTCAAGATCT
+GCCATGTTTTACTCATAGGAGCCTGCAAGTCAAGCCCGAACGTCC
+>ds2020-267_519
+CAGCACGTCCGCAAGCATCTAAGGCGGGTTGCGGACGTGCTGTCTGAAGTAAGGACGTTC
+GGGCTTGGATGCGCTTTGTGGAGGGCTGCACTATGATGCGGGAAACCCCAGTTTTGTCTC
+TGCCACTGTGGAGCAGCACGTCCGCAATGGAGATGGAGTGAGTTGCGGACGTCTGGGCCA
+ATAATGTTGCGGACGTGTGAGGGACGGCTGTTTGCGGACGTGCTG
+>ds2020-267_520
+CAGCACGTCCGCAAACTCAGTACTCTTGCAGTTGCCCTCAACTTCTCAACCTGCTCTCTG
+AACACCAACGCTTCTTCTTTCTTACCACGCAGTTGTTCGATTAGGTCCCCTACCTCCTCC
+TTCAACTTCACTCTTTCACCATTTGTTTCCGCAATCCAGTTCTTTGCAGTTTGAAGCTCC
+TTTGTTGTTCCTAGAATACACTTCTCGTACTTTGCGGACGTGCTG
+>ds2020-267_521
+TCTAAGGAGCAGCACGTCCGCAATTACAGCCCCCCAGCACGTCCGCAAGCAATTTAGGGC
+CTCACACGTCCCAAACCCCTATCTTTGCGGACGCGCTTAGGCGACGCACTGACCGTTTCC
+AAGCCCCTGACGCACTGACCGTGTCGCTGACTCTGACGCACTGACCGTCTTTATCCCCCT
+GACGCACTGACCGTGCGTTAGCGTGTCGGGTACGGTCAGTGCGTC
+>ds2020-267_522
+CAGCACGTCCGCAATAGTGGTCTCCTCAGCACGTCCCAATATATCTTAGGTCGCACGTCC
+GAAATCCCTCCCTCTTGCGGACGTGCTGCTCCTTAGACGCTTAAGGCGACGCACTGACCG
+TTATATTGGTGGTAGGTGAATCCGTGTTATAATTGGCAATATTTCAATGAAAGGAGCTAG
+GGTACTACGGTCAGTGCGTCACAGTGCGTTACACGGTCAGTGCGT
+>ds2020-267_523
+GACGCACTGACCGTACGAGTAGCCTGACGCACTGACCGTCCAGCGCTGTATGACGGTCAG
+GCGTCACACGAGAGATAACGGTCAGTGCGTCCCCCATGTGACACGGTCAGTGCGTCGCCT
+AAGCGTATCTAGGAGCAGCACGTCCGCAATGGACTACTCCTCAGCACGTCCGCAAACTAT
+GATCCCTCAGCACGTCCCAACCCAAGACCCTTTGCGGACGTGCTG
+>ds2020-267_524
+TCTAAGGAGCAGCACGTCCGCAACGTTAGACACGTCAGCACGTCCGCAAAGGATTTTCAC
+TCTCCGCAATTCCCCCTAACTTGCGGACGTGCTGCTCCTTAACGCTTAAGGCGACGCACT
+GACCGTTCGCAGGCCCCTGACGCACTGACCGTATCGTACATCCTGACGCACTGACCGTAT
+CATCAGCTGTGACCGTAATATCCCACCTCGCACGGTCAGTGCGTC
+>ds2020-267_525
+CTCCGGCGCGCCTGGACCCCAGCCGCGCGCACTACCCATCGCCCGAACGCGCCGCACGTC
+CGCAACTCCCAGGGGTCAGCACGTCCGCAACTTTTGCACACTCAGCACGTCCGCAATCGT
+AATGTGTTGGGACGTGCTGAGGGAATGACCCTTGCGGACGTGCTGAGTGCAATGTCTTGG
+GACGTGCTGAGGTGAGTGGAATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_526
+CAGCACGTCCGAAATCCCAGAAGTCTTCTGTTTTCCTTGCTCGCGGTTTCGTCAGTGCGG
+CTACACTGCTTAAACAGAAGCTCGAGCGTGGGTGTCTGTCACAGTATCCTATTATCCGCC
+TTTTTGGGAATCGCCTCGACCACAACAGTTTACGGCGACTTATCGTCCTCGCCGGCTGCA
+ATCCTGCTGCTCGTGATTTACGTGAAAAAGCTTGCGGACGTGCTG
+>ds2020-267_527
+CAGCACGTCCGCAAGGATGCCGGCATTGGGACGTGCTGAGAGTGTAAAGCCAGTCACACA
+AACAGATCAAAACGAAAAATCAAGAACAGCGTGTGATTGGGAGGTTTTCGGTTGCGCCTA
+GTCTGGATGACCATGAAGTGCAACGAGTTAATGCTGCTATAAATGAGGAAGAAGCCAATG
+TTCTTGATAATAATAATCAGAGACAGCGAATTGCGGACGTGCTG
+>ds2020-267_528
+CAGCACGTCCGCAATTTTCCGGCCCCCCAAAAGAACATTCATTCATTTCTTTCTTCCCCG
+TCGACCACGACGACTGAAACGACACGAAAAATCCAGACCCGGAAAGGAGAAGGGCCGGTG
+GTGGGCATTTGGGAAAGTCGGGCCGATCGGGTGTCTTCATTCAAGCGACGATACAGAAGA
+AGAACGAAACGAAGTGAGAGGCCAGGGTATTTGCGGACGTGCTG
+>ds2020-267_529
+ATCTAAGGAGCAGCACGTCCGCAAAGACTTCACCCCTTTTCTTAATACCCCTATTCTCCT
+TTCATCCGGAGCTGCCGTAACTTGGGCTCATCATGCTATACTCGCGGGGAAGGAAAAACG
+AGCTGTTTACGCTTTAGTAGCTACCGTTTCGCTGGCTCTAGTATTCACTGGCTTTCAAGG
+AATGGAATATTATCAAGCACCTGTCAACATTTGCGGGCGTGCTG
+>ds2020-267_530
+CGTCCGCAAGAGGCCATCACTCAGCACGTCCGCAAATTCTGGTGGCTGCCTCCTCGGGTA
+TTGAAGTCAGTTTGGTGCGCACAGACGCGGGACGGTTCATCTTAATTTCTTCTCTCACTC
+TCATTGCAATGCGCTCTACATCTCTATCGGACAGCGAACTGGTACGTGATGACCCCTCAT
+CCCGTGCAGAGCTAAGCGATTGCCTAGGCTTTGCGGACGTGCTG
+>ds2020-267_531
+CAGCACGTCCGCAAGATTCCGTGGGTTCCAAACTATATGCGGTCTCGCTATTCTTTGTTT
+GCATTCAAAGGTCTTGTGCCTGCGCTATCGAGTCACGTGCCTAACTTCCAAAGAATGAAT
+CATATGGTAGAGGAGCGAAAGTGGCCGGGGCGGCGGTGTAGAGCTATAAGGAGCGAAGCT
+CACACACACCGGCGTGAGGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_532
+CAGCACGTCCGCAATGATCGGCCTTTTTCCCATTTCTTTGAGCAATGATCTTCTCAATCT
+CTGAATCATAATCTGAATCTGAACTCTCACTGTCTTCATCCTCATCCTCACTCTCTTCAC
+TCTCAGCCACGTTTTTCCCATTCGTCCTACCCAGCTTCCTCTTCAACTTACTCAATTCAG
+ACGCAACATCAGCCTGAATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_533
+GATCTATCTAAGGAGCAGCACGTCCGCAATTGGCCAGGGCAGCACGTCCGCAAAACATAT
+TACCTCCACGTCCCAACCCAAAAACGACGCCAAAGAATTGTACGGTATCATCCCAACCTA
+ACCCGAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAGGAGT
+GAGGGATTGGGACGTGCTGCCCCCAAATGTTTGCGGACGTGCTG
+>ds2020-267_534
+GGACGTTCGGGCTTTCAGGCCACCCTGGAGTTCGGGCTTATCTTATTACCTGGACGTTCG
+GGCTTCTTGCACGGCCTGGACTCGGGCTTTAATTCGAAAGGGAAAGCCCGAACGTCCTTA
+GCACGTCCGCAAGATACACGGCATGTTGATTGCGGGTGCTGAGGGCGATAGGGTTGCGGA
+CGTGCTGAGTGGGCGTGAGTTGCGGACGTGCTGCTTCTTAGATA
+>ds2020-267_535
+TATCTAAGGAGCAGCACGTCCGCAAATCAAAGGAAATCCCTTGCGACGTGGCCCAAGGAA
+TATTGCGGACGTGCTGGGGGTGCACAATTGCGGACGTGCTGGGGAGGCATCCTTGCGGAC
+GTGCTGCTCCTTAGATAACGTCCGCAATCAGGGCCGGCTACTTGCGGACTGCTGAGGGTT
+CGAATCTTGCGGACGTGCTGCCCATACCCATTTGCGGACGTGCT
+>ds2020-267_536
+GGACGTTCGGGCTTACCAATACACCTCTTAAGCCCGAAGTCCAGGGGATCATTCAAGCCC
+GAACGTCCAGCGAGATGAGCAAGCCCGAACGTCCTTACTTCCAGTCTAAGGAGCAGCACG
+TCCGCAAGTAATACTCCTTAGCCGTCCGCAATGACATACCACTCAGCACGTCCGCAAATT
+GCACATTGTGGACGTGTGACCGACATAGGGTTGCGGACGTGCTG
+>ds2020-267_537
+CAGCACGTCCGCAAAGCATCACCCCTCACACATTGCGGACGTGTGAGAGCTATATCGTTG
+CGGACGTGCTAGGGCTGAATGTTTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGA
+CGTTCGGGCTTTATTAAATCCCTGCCACAACCCCATAAACAATACAAACCACACTAACAT
+ATCTAACAAAGTCATCGGAGTCGTAATTGTAAGCCCGAACGTCC
+>ds2020-267_538
+GGACGTTCGGGCTTCTGGTCATGGGTTAGAATTCTAGCTTCGCCAGAGTGGTATCTCACC
+GTTGGCTCCATACTCCCCACAAGGAATACTTCATCGCCTCCCACCTATCCTGCGCAAGCC
+AAGCCCGAACGTCCTTATTCCAGTATCTAAGGAGCAGCACGTCCGCAAACGGCTCTGACT
+CAGCACGTCCGCAAGCTGCATGCCTTTGAGATTGCGACGTGCTG
+>ds2020-267_539
+GACGCACTGACCGTGTCAGCTTCCGTCCATTTAACTAAAGAGCAGAAGGTTAGCTTACCC
+AGTAGCATTGAAGAGGTGTTATGCCGTGACTATTGATGGCAAATTCACGCCTGTTCATAA
+ATTAGATGTTTTTCGACTATTAATCAGACGGTCAGTGCGTCGCCTAAGCGTATCTAAGGA
+GCAGCACGTCCGCAAGAAAGGGGCCATCGATTGCGGACGTGCTG
+>ds2020-267_540
+GAAAGGAGTATGTCGCTGACGGACTAGGCTCTATTGAGGGAGTAAGTCGCTGACGGACTA
+GGCTTTAATGAAGGAGTCACTTAAGTGGTTGTTCCTACAATTGTTGAGAACAGAAGGGTG
+GACACAAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAAGTTTC
+TTAGTTTTGCGACGTGCTGCCCCTCAAGGGTTGCGGACGTGCTG
+>ds2020-267_541
+CAGCACGTCGCAATCATCCGGTGTTTGTTGCGGACGTGCGAGGAGTGCATAATTGCGGAC
+GTGCGCCCAGCGGTCATTGCGGACGTGCTGCTCCTTAGATATCTAAGGAGCAGCACGTCC
+GCAAGTTCTGACCCCTCACACGTCCGCAACCAGTGCACCATTGCGACGTGCTGAGGCTGA
+CGTATTGCGGACGTGCTGACAGGTGAATAATTGCGGACGTGCTG
+>ds2020-267_542
+TCCGCAAATATAACGGCCTCAGCACGTCCGCAAGTCGAGGCACCTCAGCACGTCCGCAAT
+CCGTGGGTCCTGTCCGCAACCTCCACCCGTATCGATTTGCGGACGTGCTGCTCCTAGATC
+GCTTAAGGCGACGCACTGACCGTATAACTAAGCCTGACGCACTGACCGTACCAACCGCCT
+GACGCACTGACTGTTCATAAGGGACTGCAAACGGTCAGTGCGTC
+>ds2020-267_543
+CAGCACGTCCGCAATGCCCCATGCCTTTTTTGGTTGGACCAGCCCAACCGGCGATTTCCG
+TCTTCCTGAATTGGGAGAGCAAGCACAAGTCTCTCTTCTTTTTTTCCTTTGAATTACTCA
+TATATATATCCTATGAATTTCATTTCGCACCGGAAACTATTCTAGGAGAAGTTCGAATCC
+GTTCCGTTCGGATATTGATCGGTCTTGATTTGCGGACGTGCTG
+>ds2020-267_544
+CAGCACGTCCGCAATTGCGTGGCCCTCCACCTCGTTGGGAAAAGTAAAAAGAAATAACAA
+GCCCTAAACTAAATATCAACTAGCAGCTTATCAACCACCGAACACAGACTCATGTTGGCG
+ATGCCATGGTCAAGTAAGAGGACGACCCATTCACCTCAAAAGAAAAATCTCGCCTCTCAA
+GTAAGCTATGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_545
+CAGCACGTCCGCAACTTGCCCGGCATGAATTTATCAGCCACCGTGTAATACAAATTATAT
+CAACGTAATTTTCACGTTTTGGACCATACAAATCCCATATATATAAAACCCAGAAACCAA
+AAACTACGAAAAAAAAGAAGAAGAAAAACGGTGTAATAATTAATACTCCGTTCCGTTCCC
+GTTCAATTGAATTGGCACCTGGTTAGCTTTGCGGACGTGCTGA
+>ds2020-267_546
+CAGCACGTCCGCAAGTTAGCCCGCCTCAGCCGTCCGCAACGCGATAACTCTCAGCAGTCC
+GCAACCAGATGGCTATACTTGCGGACGTGCAATCTAAGGAGCAGCACGTCCGCAATTTCG
+GGGTCTTGAGACGTGCTGCCGGACAATACTTGGGACGTGCTGAGGACTACGATTTGCGGA
+CGTGCTGGGCCATTAGGATTGCGGACGTGCTGCTCCTTAAGAT
+>ds2020-267_547
+GACGCACTGACCGTGGCTTTAGGGGTGAAAGGCTAATCAAATTCCGTGATAGCTCGTTCT
+CGTCGAAATATCTTTAGGGATAGCCTCGGATGAATCATTGTGGTGGTAGAGCACTGACTG
+GACTAGGGGCCTCACAAGGTTACCGAATTCAATCAAACTCCGAATGCCAATGAATTATGG
+TCGGCAGTCAGACTGCGAGTGCTATCAAGTTGCGGACGTGCTG
+>ds2020-267_548
+CAGCCCGTCCGCAAAACCGGTCTCCTCCGGCTAGTTTGTTGCCTTTACCTTTACCTTTAT
+CTTTATCTTTATCTTTTTTTCCTGTATCTGGCTCGATGTTTTCGGCATTTGGGGTCTGAC
+GCGGTGCGATACTATCAAAAATACTTGCCATCGATATATCAAAATTATATTTGAGCATGG
+CTTCACCACGGGCCTGGACTTGCGGACGTGCTGCTCCGTAGAT
+>ds2020-267_549
+GGACGTTCGGGCTTAAGATGGGGGGTGATAACGGGTCTGCTTGCAGACGAAGTGAGTGAT
+ACCCTGCTTCCAGGAAAAGCCACTAAGCTTCAGCTACACACGACCGTACCGCAAACCGGC
+ACTGAAGCCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAATTTCTGC
+CTATTGCGGACGTGCTGAGAAGGGGTGTGTTGCGGACGTGCTG
+>ds2020-267_550
+GGACGTTCGGGCTTACCTTGCTCCCTGGACGTTCGGGCTTCGTAATTGGGTTGGACTTCG
+GGCTTTATCCCACCGCTGTAACTAAGCCCGAACGTCCTTACTTCCAGAATCTAAGAGCAG
+CACGTCCGCAATACGGGGTTGGTCAGCACGTCCCAAGTGATATTGCCTCAGCCGTCCGCA
+AGGTCCACACGCGTGGGTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_551
+CAGGTCGTCCGCAATGGCGAATCCCTCGGGTCGTCCGGAAGCAGTCTTGAGTCTTTGAGG
+AGGGGGGGGGGGGTGGGGGGGGGGGGCGGGGGGGGGGCGGGGGGCGGGGGGGGGGGGGGG
+GGGGGGGGGCGGTGGGGGGGGGGGGGGGGGTGGGGCGGGGGGTGGGGGGGGGGGGGGGGG
+GGGGGGTGTGCGGGGGGGGGGGGGGGGGGGGGGGGGTGGGGGC
+>ds2020-267_552
+GGACGTTCAGGCTTACTGACTCCCCTGGAAAAGAAACTGACTAGGATTCCCTTAGTAACG
+GCGAGTGAACCGGGAAAAGCTCAAATTTAAAATCTGGCGTCTTTCAGGCGTCCGAGTTGT
+AACCTATATGGATAAGCCCGAACGTCCTTACTTCCAGTCAGCACGTCCGCAAGAGCTTAT
+CCCCAGACTCCGCAATCTATTGTTCCTGATTGCGGACGTGCTG
+>ds2020-267_553
+TATCTAAGGAGCAGCACGTCCGCAAGCATGCCGGCCTCAGCACGTCCGCAAACCGATCCC
+CTCAGCACGTCCGCAATCTAACTGCTTTATATTGGGACGTGCTGCAGCATGGTTAGATGT
+GTAGGGGAGACGGGGGAACTCCGGTGGCGGGGGGTGGTGGGGGGTGGCGTGTTGGGGGGG
+TGGTGGTGGGTGGTTGGGTGGGTGGGGGGGGGGGGGGGGGGGG
+>ds2020-267_554
+CAGCACGTCCGCAATCGGTATTTTGTCTTGTGGGAGATTAAAGCTTAGGAGGCATGGAAG
+ACAAGCTCTGGTGATCCACGTTTTGGGAAAGCAGCGAAAACGAAGAGGTTGGTTGCGGAA
+AACAGGGTTTTGGTAACGAAAGATTTACAAACGGAGAAACGGAGAAACGGAGAAAGAGAG
+AGGTTTTTTTTTGGGGGGGTACTCTCCCTTGCGGACGTGCTG
+>ds2020-267_555
+CAGCACGTCCGCAAAACACATCCCCTCAGCACGTCCGCAATTTACCTGTATTTATTATTG
+CTTTCATTGCTGCACCTCCAGTAGATATTGATGGTATTCGTGAACCTGTTTCTGGATCTT
+TACTTTATGGAAACAATATTATTTCTGGTGCAATGCTTCCTACCTCTGCAGCTATAGGGT
+TTCACGTTTAACCGATATCAGAAGCGCCTTGCGGACGTGCTG
+>ds2020-267_556
+CAGCACGTGCGCAATACTGCCCAATTTTTTGGTGGGTATCAAAGTTTTCTGTCTACCCAT
+ATATATATATGAAAATCTTTTCTTTGCTACCTCTTCTCTTTCACGCCAATAACTTGGCTT
+CCTTTTCCCTTTATTTTATTGGACTTGTTTTGCACCATATGCCTCTTCCGTTTCAACACC
+TCTTACACTTGTCCACATCACCTACCCTTTGCGGACGTGCTG
+>ds2020-267_557
+CAGCACGTCCGCAAGATGAACAAGGTACCGGCTGCAATAGGATGAGACGCGCTTCCTCCC
+GGCACAAAAGGATCAAAACCCTCCACACCCCACGCTGGATTTACGGATTGTACCCTTCCG
+GTTAGTCCATAAGGATCGGACACCCATATTCCAGGACCATACAATCCTGTTACATGAAAT
+GCACCAAAACCAAAGCAAGCCTGCGCCGTTGCGGACGTGCTG
+>ds2020-267_558
+GGACGTTCGGGCTTTCTGGTTACCCTTCCCTAGTCGATTAGTGATTTTTGACTAAGAATG
+ATACCGTTATTATCCGCATACACATACATGCCAGAGTTGATAGTTAGACCGCCAAAGCTG
+ATTTCGATATCCGTCTCGCCCACACCTTTGCGATTGGATTTTCGGGGGATAGCGAAAACC
+AGTTGCGGACGTGCTGACGGATATGCTCTTGCGGACGTGCTG
+>ds2020-267_559
+TCTAAGGAGCAGCACGTCCGCAACGTAGCCTGGGCAGCACGTCCGAACTCTCTACTCCTC
+AGCACGTCCGCAAGGGACAAGGTCTTGCGGACGTGTGAGGGACGGCTATTGCGGACGTGC
+TGCTCAATCTAAGGAGCAGCACGTCCGCAACGTAGCCTGGGCAGCACGTCCGAACTCTCT
+AGTCCTCAGCACGTCCACAGTGATTGGTTTGCGGACGTGCTG
+>ds2020-267_560
+CAGCACGTCCGCAAATACTGTGGCCTCAGCACGTCCGCAAATTCCCTTCCCTCACACGTC
+CGCAACAGGACAACCCTCAGCACGTCCGCAAATACTCTGGCCTCAGCACGTCCGCAAATT
+CCCTTCCCTCACACGTCCGCAACAGGACACCCCTCAGCACGTCCGCAAAATAAACTGCAT
+GCCCTTGGGACGTGTGAGCGAATCACTATTGCGGACGTGCTG
+>ds2020-267_561
+CACGTCCGCAATTGGTGTTGTGGGGCGGGGGGGGCGGGCGGGGGGGGGTGGGGGGGGGTG
+GGGGGGGGGGGGGTGGGGGGGGGGGGGGGGGGGTGGGTGGGGGTGGGGGGGGGGGGGGGG
+GGGGGGGGGTGGGGGGGGGGGGGGGGGTGGGGGGGGGTGGGGTGGGGGGGGGGGGGGGGT
+GGGGGGGGGGGGGTGGGGGGGGGGGGGGGGTGGGGGGGGGGG
+>ds2020-267_562
+CAGCACGTCCGCAAGTAGCGCAGCCTCAGCACGTCCGCAAGCAGAACTCCCTCACACGTC
+CGCAATTATTCTCCTTCTGTTGCGGACGCCGCTTAAGGCGACGCACTGACCGTTAGATCC
+CTCCTGACGCACTGACCGTATCTAATCCCCTGACGCACTGACCGTCGGACCGTCTCTGAC
+GCACTGACCGTCAACTAAGGACTGTAAAACGGTCAGTGCGTC
+>ds2020-267_563
+TCATGGCCTCAAGCTTGGCTCGGTACTACCATTATAGGCGACTGTGCATTATCGATACGC
+CGCTCATAGACTTCGCAGGTGTTACCATGAACTGGGGCCTCGTGGTCGTGTGGGAGCTGA
+TCTGGGAAGCCCGAACGTCCTTACTTCCAGTATCTAAGGAGAGCACGTCCGCAATAGGTT
+GGGAGTCAGCACGTCCGCAATGGTGCGCTTGCGGACGTGCTG
+>ds2020-267_564
+GACGCACTGACCGTTCTACAGCCATTGTCACACGGTAAGTGCGTCAGGAATCCGGCCACG
+GTCAGTGCGTCAGGCAGAATCTCACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCA
+ATGGCGCTAATATTGGGACGTGCTGAGCGCATAACCATTGCGGACGTGCTGGGGTATCGG
+CATTGCGGACGTGCTGAGGAAATACGTGTTGCGGACGTGCTG
+>ds2020-267_565
+AAGCCTGGTTCTTTGACGCACTGACCGTTGGAGGCCCACTGACGCACTGACCGTGAACGA
+GTCCTTCTGGATTGTTGCCCAACGTTTTTGGGTCAATAGTTGCTGTTAGCCCCACCACTT
+CGCCATTGTCATCGGTGATGTGCTCCTCAATCTTTAGCACATAACTATTGCGTAAGCGGA
+TTTCTGGGTTTTACGGAGGCATCAGTAGACGGTCAGTGCGTC
+>ds2020-267_566
+CAGCACGTCCGCAATTGGTCCCGGCAGCACGTCGCAACCAAATAGACATTGCGGACGTGC
+TGCTCCTTAGACGCTTAAGGCGACGCACTGACCGTATTTGTCCGAGTTTAATTTCAATTC
+AATTAAGAGAACTAACAGTAAGTAATTACTAGATTACAAAGTATCCATTGCTTGGAATTC
+AAATTGTATCCATTGCTTGGAATTCAAATTTGATCTCCTTC
+>ds2020-267_567
+CAGCACGTCCGCAATTCCTCGTGACTCAGCACGTCCGCAAAACCTTTAGCCTCAGCACGT
+CCGCAACGGGGCTCCACTCAGCACGTCCCAAGTTTACCGCCATTAATTTGCACGTGCTGA
+GGAGTTCGAAATTGCGGACGTCTGGAAGTAAGGACGTTCGGGCTTCAGTCCACCCCTGGC
+GTTCGGGCTTAACTCACGGATTAGCGCAAGCCCGAACGTCC
+>ds2020-267_568
+CAGCACGTCCGCAAGTTATGATCGCCCCGTCCCAACCTCATCCCGCTGATCTTGCGGACG
+TTGCTCCTTAGCTTGCTTAAGGCGACGCACTGACCGTTGGATTGAGCCTTGGTATGGAAA
+CCTACCAAGTGAGAACTTTCAAATTCAGAGAAACCCTGGAATTAAAAATGGGCGATCCTG
+AGCCAAATCCTGTGTTATTAAAACAAACAAGGGGTTAATAA
+>ds2020-267_569
+CAGCACGTCCGCAACAAGCAATGGTGCGAAGCTATCATCTGCTGGATAATGGCTGAACGC
+CTCTAAGCCAGAATCCGTGCTAGAAGCGATAACGTTGGTCCCGCACATGCCTAGTGTTGG
+AATAGAGCTTTGCTCGTACACCATACAAGCCGCGTGCAGCCGGAAGGGGTAGCGTGGTTG
+ATTGCAATGTAAACAAGCGCGGGGAGCTTGCGGACGTGCTG
+>ds2020-267_570
+TCAGCCCGTCCGCAATAACCCACGGCTCACCCGCCCGCAATAGTTCGGCCCCAGCCGTCC
+GCAACCTGGCGAGGTCCTGGCGGACGTCTGGGGCCTAACTATTGCGGACGTGTGAGCAGT
+GGGTTATTGCGGACGTGCTGAGTCCGCAATCTCTTACGCCTCAGCACGTCCCAAGGTTTT
+AAGGGTGCGACGTGGAAAGGATCCCGCTTGCGGACGTGCTG
+>ds2020-267_571
+CAGCACGTCCGCAATACACATCCCTGCAGCTTTCTAGAAAGATCAGCCACCGTCTACGGT
+GACTGCCCCTCTCTTATTTACAACGATACCACCTACACGTGGACGCAGACCCACCGTCGA
+TGCATCCGAGTCGCTTCCTCTATATCATCGCTCGTCATCAAGAGTCGCCACGTGGTGTCT
+GTTCTCTCTCCCAACACTCCCCCCATATTGCGGACGTGCTG
+>ds2020-267_572
+CAGCACGTCCGCAAGCCGCAAATGGTATTTTTTTAATAGCCCTTGGTACTATCTTTTTGG
+GTACGCGCTTGTATCTTTAAGCATATTTTTCGCTAAATCAAAGCCAAATCATGTTGATGG
+TAGTTGCCATCTTATTGTTAATTTTTTTCCCCTTTTTTCCCTATTATAGGTAGAGGGCCC
+GCCATCTAAAATGCCAACAGTGGAACCTTGCGGACGTGCTG
+>ds2020-267_573
+GACGCACTGACCGTGTGCCACCCCTGACGCACTGACCGTCATTATGGGGCTGTAGACGTC
+AGTGCGTCAGGACTATGTGCACGGTCAGTGCGTCACGGGGGCACCTACGGTCAGTGCGTC
+GCCTTAAGCGTAGCACGTCCGCAATTGGTATCGGTTTGGGACGTGCTGAGCCGAAAGACT
+TTGCGGACGTGCTGAGGGGAAGAGATATTGCGGACGTGCTG
+>ds2020-267_574
+GACGCACTGACCGTTGGATTTGGGTGACGCACTGACCGTACGTATACCTCTGACGCACTG
+ACCGTACATCAGACCCTAACACACGGTCAGTGCGTCAGGTCGTACTTGACGGTCAGTGCG
+TCGCCTTAAGCGTGTCCGCAAATCCCATGCATTGCTCTTTGCGGACGTGTGGGCCTACAT
+ACTTGCGACGTGCTGAGGATTTCGTCCTTGCGGACGTGCTG
+>ds2020-267_575
+GGACGTTCGGGCTTATTCTATGCATTGGACTTCGGGCTTGTGCTATCCCTGGACTTCGGG
+CTTGAGCCTAAACATGGACTTCGGGCTTACAAATGCTGCTAGAAGCCCGAACGTCCTTAC
+TTCCAGCCACGTCCGCAAGCTCCTTACGCTCAGCCGTCCCACAACATCTACCATTTGCGG
+ACGTGCTGGGGACACATATTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_576
+GGACGTTCGGGCTTTTACGGCCCCCCCCCTTCTCATATCAATAACTAAAATGAAAAAAAG
+GGGAATATCAACGAATCCGGAAAAAAACGATTGATCTCTATCAATAAATGTCACACTAAG
+CCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAATTCTCATGATCTAG
+GACTTGCGGACGTGTGAGGGGCCTTGTGTTGCGACGTGCTG
+>ds2020-267_577
+CAGCACGTCCGCAACGCCGATACTATTGCGACGTGCTGGGGGTTTGTTATTGCGGACGTG
+CTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCTTGGACGTTGTTCTGACGCACTGA
+CCGTACACTCTCGCCTGACGCACGACCGTAGTATATCCCCGACAGCACGGTCAGTGCGTC
+GCCTTAAGCGAATCTATATCCCCTGGTTTGCGGACGTGCTG
+>ds2020-267_578
+CAGCACGTCCGCAACCATGGTCCCTCCACACGTCCGCAACGGCTCCAATATTGGGACGTG
+CTGAGGCGACGCACTGACCGTATGTAGGCCTCTGGACGCACTGACCGTTCTTCTCAAACT
+GACGCACTGACCGTGGTTACTAGCCTGACGCACTGACCGTGTCATTCGAACTCGAGATTT
+CTGTTCTCGTTGAGCACATTCCTAGGGACGGTCTGTGCGTC
+>ds2020-267_579
+GGACGTTCGGGCTTAGGTTACGGAATACAAAGCCCGAACGCCAAAGGATGCGAAGCCCGA
+ACGTCCTTAATCTAAGGGCAGCACGTCCGCAAACTCCTCCTCCTAGAAAACCTTCTATCC
+TTCAAAGCAGCTCCATCTTTTCGGGTCTTGTTCAGAATCAATGCGCGTTCCCTTTCTTTC
+TTTCGCTTCTCCCTTTCCAATCGTTCTTCCCTCAATTCTT
+>ds2020-267_580
+CAGCACGTCCGCAAACTTCCGGGTCTTTTCATTGCATTCACTTACAACAAGAAACAACCA
+CCAGCGTTTGGTGCAGCACCTGCATTTTGGTGCATTCTTCTTTCTTTCCTTGGTCTTTCG
+TTCCGTCATATTCCTAATAACTTATCCAATTACAACGTATTAACCGCTAATGCACCTTTC
+TTTTATCAAATCTCAGGGACAGCCCGTTGCGGACGTGCTG
+>ds2020-267_581
+CAGCACGTCCGCAATAACAGGCTGGTGACATATCGAAGAGACAGGACGTGCAAGGCAGTA
+GTACTGATGAGACCGGACGGATTTAAGCCGGACGTCATAGCGACCGTTTATGGGTTCGCG
+TACGGTTTGACCGAAAACGTCTTGACGATACCTCGAGGAGCCAAAGACGAAGGGAGTCAG
+GCCGGTGGGACAGGCGTATGGATCAAGACGGACGATAAGA
+>ds2020-267_582
+CAGCACGTCCGCAAACGGCACTGTCTCCAGACCCAGTGCCAGACCCAAAGCTGTGTGTCG
+TAACGATGTCATTGTCATCTCTCTTATTGTGCCGGATGCGCGATATCACGCGTTTTATGC
+TCGCGAGGTAACATGACATGCTCGAATGACAGAAAAATAACTGTTTGTTTACAGATAAGT
+GACAGCCAGGCGTCAGAGGTCTGAGGTTGCGGACGTGCTG
+>ds2020-267_583
+CAGCACGTCCGCAAGTCTAGCTAAGTCCCATGCCACTCTCCATGATGAGAAGTGCAATCT
+TGGATCCCTTAACATAGCATCCCAATTGTCCCTTCCATGTCTCCTCACACCTATCCATAG
+AAAATCCAACTCCTCTTCAGACCACATGGTACTATATGGCTTATATTTGTCATGAAAACT
+ACTCCTTTCATTGAAAGCTCAGCGGCTTGCGGACGTGCTG
+>ds2020-267_584
+GACGCACTGACCGTCTACTACTCCCTGACGCACTGACCGTGTGGACCCCCATGACGCACT
+GACCGTAAGTTTTCCCTTGACGCACTGACCATTTCATCCCCTACGGTCAGTGCGTCGCAA
+ACTAAAGTCCCTCAGCACGTCCGCAATAGTTCTGGCCTCAGCACGTCGCAAGTCCTTGTC
+CGTCCACGTCCGCAATAGCCAATTGTTTGCGGACGTGCTG
+>ds2020-267_585
+GACGCACTGACCGTACCACCTCAAATAACACTCAGTGCGTCAGACAATAAACTACGGTCA
+GTGCGTCAGACTATACCTAACGGTCAGTGCGTCGCCTTAAGCGGAGCAGCACGTCCGCAA
+TCGGCGTTTACTCAGCACGTCCGCAACGATAGACCTCTCACACGTCCGCACTAGCCGGGA
+ATTGCGGACGTGCTACCCGGAATTACTTGCGGACGTGCTG
+>ds2020-267_586
+GACGCACTGACCGTTACGGGGGGGGTGGTGTGGGTAAAAAACTAATAAATATTTAATTTA
+TCAACAACAATGCAAAATCACATGGGGGTGTATCCGTATTTGGCGGAGTAGGTGAGCGTA
+CTCGTGAAGGAAATGATCTTTACATGGAAATGAAAGAATCTGGAGTAATTAACGAACAAA
+ATATTGCAGAATCAAAAGTGTCTCCCACGGTCAGTGCGTC
+>ds2020-267_587
+CTCAGCACGCCCGCAATAGAAAACGAGTGAGTGTGAACGGTGTGGCAGAAGGAACTGCAA
+GAGGTGGTGTGCCTTTAGGTAGAATTGCTGTTTACAAAGTGTGCGAGCCAGTGGGTTGCA
+ATGGTGAACGAATTTTGGCTGCGTTCGACGATGCTATAGCGGATGGGGTAGATGTTTTAC
+CCATTTCTCTTGGAGACTAGCTTAGGCTTGCGGACGTGCG
+>ds2020-267_588
+CAGCACGTCCGCAAGAGCCTTTCCCTGATAACTTCTCGTTCGCCAGGCGACAATATATCC
+TTTTCCATCTCTACACCATTTACCCTTGTTTTAAGTGATACATTGCGCCTTGATTCTACA
+TTAAATACAAATTTTTTGTTATGGTTGTGAGAATCTGCCATGCCATTCATGTAATCCACG
+ACTCTTGCTGCTGATGCCATTTTGTTTGCGGACGTGCTG
+>ds2020-267_589
+GCAGCACGTCCGCAAAGAGTCAGGTTTTGTATTTTACAATACTAACAAATGGACGCTCAA
+AAAACTCAAGGAATCAGCCAGCAATAATCAGCAATTGCTACTTTCCAACTTTGAGGAGTA
+TTTAAATGGCTTTAGTGCTAAGTCAAAGACATATTAGTGCGGTTTAAATTACTTGACCAA
+GTTCGCCATATGGAGATGAGATTGTTTGCGGACGTGCTG
+>ds2020-267_590
+CAGCACGTCCGCAAGTGTTTCGCCTTCTTTCCTAATATCGTTCGTGATAACTGTAATACA
+GTTAAGACTCACGACATTACCATAGGGTTTCCTCTTAAGATTTCTTTTCTTATCGACATT
+GGTAACATTGTCGGTAGATTAGTCTTCTTACAGAGGGATATCCCAAATGGTCTAGGAAGG
+TGTTGACCTCCTAAGGTTCTCGTAATTGCGGACGTGCTG
+>ds2020-267_591
+CAGCACGTCCGCAAATCGCCGAAGATTGAGGAACAAGAAGAGATCTATTAAGAGAAAGAT
+TTATCCGAGAAAAAATCTTAACAGTTACATCCAATCACAAACTACACGAAAGTTGCCCCT
+TTTTCATGGGGATTTACCCATCACAGAGATGCACAGAGGAACAGAGCGAACTTCATATAT
+CCCTTTTCCACTCAAACCAGGAAACTTGCGGACGTGCTG
+>ds2020-267_592
+CAGCACGTCCGCAATTGTCATATCGTCCGTCGATGCTTTCGAACTTCTTCGTCAGCTTGT
+TGAGGAAGCCGACGTCAAGAGTCCTAGAGCCGGTCGACGTATTCGTCGAAGCAATTGGAG
+CTTTCTTGCCATGTGTTTGTGCCTTCAGAAGAACGGAGGGGGAGCCCATGCGGACTCCCC
+CTCGTGTACTACGAACAATCGTGGTTTGCGGACGTGCTG
+>ds2020-267_593
+CAGCACGTACGCAAAGTACTCTCTGGTGGAACCATGAAGGGAATGTAGTGCTTGTCGACG
+CGTTTGAACAGTGTATCACAGTCGACCTTAATTCTGATCTGGTAAGGCTTACCATTGTTT
+ATGCAAAGTGCTCCATTCAGGAGAGACGGCTTCTTTGGGAAAAACGGAAATTACTGTCCT
+AAGACATACAAGATCCATACCTGGTTGCGGACGTGCTGC
+>ds2020-267_594
+CAGCACGTCCGCAACCGCCCGCCCGTAAACCTAAGGGTTCCTCCGCAAGGTTCGTCCACG
+GAGGGTGAGTCAGGGCCTAAGATCAGGCCGAAAGGCGTAGTCGATGGACAACAGGTGAAT
+ATTCCTGTACTACCCCTTGTTGGTCCCGAGGGACGGAGGAGGCTAGGTTAGCCGAAAGAT
+GGTTATCGGTTCAAGGCAGAATGAGTTGCGGACGTGCTG
+>ds2020-267_595
+CAGCACGTCCGCAACAATGCGTATCTGAGGGCGGCCGTAGGGAAGACCTGGTACGAGGGT
+GCGCTATCGCTGCACACAGGCGACGATGTCTTTATCAGGGCGAACACCCTCGCCGACTGT
+TCCGTCATTCTCAGTGATGCGGTTGCCTTCGGATGCCGTATGAACCCAACCAAACAGTCA
+ATCGGATTCTACAATCGACTAGCCTTGCGGACGTGCTGA
+>ds2020-267_596
+TATCTAAGGAGCAGCACGTCCGCAACTTTTACTCGGTCAGCACGTCCGCAATGTTCGCTG
+CCTCAGCACGTCGCAATATGTTACTCATCAGCACGTCCGCAAGAAGATGAGGGTTCATTT
+GCGGACGTGCAGTGAGTCACTATTGCGGACGTGCTGAGTGGTAGTCAATTGCGGACGTGC
+TGAGGAGGTTTAAGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_597
+CAGCACGTCCGCAACTATCCGCCGATTGAATTATTTGGTCCCACTCGTTATCAATGGGAT
+CAAGGATACTTCCAACCAGAAATATATCGCAGAATTGGTGCTGGGTTAGCTGAAAATCAA
+AGTTTATCTGAAGCTTGGTCTAAAATTCCTGAAAAACTGGCTTTTTATGATTACATCGGC
+AATAATCCGGCAAAGGGGGGAAGCTTTGCGGACGTGCTG
+>ds2020-267_598
+TATCTAAGGAGCAGCACGTCCGCAATCAAAGAGGGATGCCATTGGGACGTGCTGAGGGGT
+TTGGCGTTGCGGACGTGTGCCTCACCGGCATTGCGGACGTGCTGCTCCTTAGGCGCTTAG
+GCGACGCACTGACCGTCGTCTACTCCTTGACGCACTGACCGTTCCTATGCTGGTGGACGC
+ACTGACCGTAATGAGGGGGTTCGGCACGGTCAGTGCGTC
+>ds2020-267_599
+GACGCACTGACCGTTCGTTGCCACCTCCCCATGGACATGCGAAGTGGCAGCAACAAACTA
+CTCGCCTTTATTCTAGAAAAACACCATGGTATCAAGCCGCACTGTGCCTACCTATTTTAC
+AACAAAACTGGCACACGGTTAAAAGTGCAGGGACCTGCTATTGCGGACGTGCTGAGTGAC
+AAAATGTTGCGGACGTGCTGAGGGTAGGTAATTGCGGAC
+>ds2020-267_600
+TCCTCCGGAGTGCCTGAAGTTCAGACCTGTCCCCTTCCGATCTATCTACGGACCAGCACG
+TCCGCAAGTCATGACCCCTCAGCACGTCCCAAGGTTGCTCCCTCAGCCGTCCGCAATTAT
+GTCAGTTTGCGGACGTGCTGCTCCTTAGAGATAGGAAGAGCGTCGTGTAGGGAAAGAGTG
+TGCCTCTATGTGTAGATCTCGGAGGTCGCCGTATCATTA
+>ds2020-267_601
+GACGCACTGACCGTAGCCAATTCCCTGACGCACTGACCGTGTCGTATCGCTTGACGCACT
+GACCGTAGGCAATCTACTGACGCACTGCCGTATGAAAGCCGGTAAGGCGGTCAGTGCGTC
+GCCTTAAGCGTCAGCACGTCCGCAAGCATTCACGTCTCAGCACGTCGCAACCAACCATCG
+CCATTTGGGACTGAGGGGTGACATATTGCGGACGTGCTG
+>ds2020-267_602
+GGACGTTCGGGCTTATATTGGGGGATAGAAGCCGAACGTCCAGGGATAAAGTAAAGCCCG
+AACGTCCAGGGGGCGCCGCAAGCCCGAACGTCCTTACTTCCAGCACGTCCGCAATAGTCT
+CGGTGTGCATTGCGACGTGCTGACCCAGTTCTGTTGCGGACGTGCTGAGGGGCTGAGAAT
+TGCGGACGTGCTGAGGCTGACGAGCTTGCGGACGTGCTG
+>ds2020-267_603
+GACGCACTGACCGTCGGAGAACTGGTGACGCACTGACCGTCATTGCAGAGGTTACGGTCA
+GTGCGTCAGGGGACGCACTGACCGTAGGGATGACCTGATGCACTGACCGTTGTAATTCGC
+CTACGTACGGTCAGTGCACGTCCGCAATTGAACCTGCTCCACGTCCCACCTGGTCAACCT
+TGCGGACGTGCTGAGCGTACCAGCGTTGCGGACGTGCTG
+>ds2020-267_604
+GACGCACTGACCGTCGTACCCCGATTCCTAGCCTTTGGTAGTGTTGATAAACGTATTACC
+GCCAAACTATCACTAGGGCAAGGGCTTTACGCCAATAACTTTACAAGCTGGTCAAGATAC
+TATGGCACGACCAACGTAACAGGCGAAACCACCAAAAAACGGTCAGTGCGTCGCCTTAAG
+CGAGGACGTGCTGAGCTGGAGCTTCTTGCGGACGTGCTG
+>ds2020-267_605
+GACGCACTGACCGTGGCTTGGATTTTAAGACAAGGAAGAAGAGAACAGAGAGAAGGGAAT
+GTTTAAATAGGAGCTGGGATTTCGAAGGTGGAATGTAAAGTTTGGGTCTTTAGCTGTATT
+TCGCTTTGTGGGCAAGTAATGGTAATGGTAATGGAGGATACTTCGAGAGCAAGGTTATAG
+TTGTGGACGTGCTGGGCGAACTGGGTTGCGGACGTGCTG
+>ds2020-267_606
+GGACGTTCGGGCTTTGTGCTGCGGGTGATTTTACCTACGGGTGAGCAAATTGAAATTTGC
+GGGGGTGAGGCGAATACCACCAACAACCGCATGGAGCTGATGGGGAGGGGGCCAATCAAG
+CCCGAACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAACTCTTCGCTCCTCA
+GCACTTCCGCAATTAGTGAATGATGTTTGCGACGTGCTG
+>ds2020-267_607
+AGGAGCAGCACGTCCGCAAAGGATTCGTCATCAGCACGTCCGCAATCCCAAGCCCGTCTC
+TATGGCGGGTGCTGAGCATCGATTATTGCTGAGGTGCTGTTCCTTAGATCATCTAAAGCG
+CATCACGTCCGACATTATTGTATCCTCAGCACCGCCGAATAGCATCTTCCTCCTCGTCCC
+AATTAATGGGGATTGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_608
+CAGCACGTCCGCAACCAACGTACCCTCTGATTTCGATACAATCCAAACCCTAATCTAACC
+CTAATTCCAATTATTGCAATTTCTTTCTCTTTCGTAAACCCTACTTTCCTTGAGTTCTTC
+GACACAATTATTCATTTTTACTGGATTTGATTGATTCATGGGCCGTAACTCCCTCGCTCC
+CGGGTTCCGATTCCACCCGAGAACTTGCGGACGTGCTG
+>ds2020-267_609
+CAGCACGTCCGCAACTATCATGCTATGGTCACAGAGCTCTTGTAGCTCAACATACCTGCA
+GCTGATGCCATCCGCATTGATGCAAGGGATGTTGAAAGTGATGACGGCACAGGCGTTTCA
+GAAACCGGTGCCAGCGTCATGTTTCCACACAACTTGGCCAGTTCACTGACTGTCGCAACA
+GGCACCTTGCCCATCAAGGTGTCATTGCGGACGTGCTG
+>ds2020-267_610
+CAGCACGTCCGCAATGCCGTAGCCCTGTGGACCGGGATGCTGGGCACTATCGTTTACAAC
+CAGAATCGCCAGCAAAACCGCGTGCGAATTTTCGAAAGCGGTTTGCGCTTTGTACCGGAT
+AATCAGGCAAATTTAGGCATCCGTCAGGATCTCCTGCTGGCTGGTGCTATCAGTGGCAAC
+CGTTATGAAGAGAGTGCCCGGAGATTGCGGACGTGCTG
+>ds2020-267_611
+CAGCACGTCCGCAATCGCTCTTAGATCCTCGTACCGCCAGTCCCCTTCTATTAGTGTCAG
+CAGAAGCTCAGTGGACCTCCGTAATGCCTCGTCCCAAAGATCTCATGCTTCCTATTTTGT
+TTCCCCCAATTCCTTTGGTTACCCATCTTTTTCACCCCTGAACTCAAGATACCTGTCTGT
+TGCACACATTCCAAGCCCTAACAATTGCGGACGTGCTG
+>ds2020-267_612
+CAGCACGTCCGCAAAGGGCCCACCCTCAGCACGTCCGCAACGCACTATCCCTCAGCACGT
+CCCCAAGTATCTAAGGAGCAGCACGTCCGCAACGGTGACCCCTTAACCATTGGACGTGCT
+GAGGGTTCGATACTTGGGACGTGCTGAGCGGACAGTTCTTGCGGACGTGCTGACAGATTG
+CCGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_613
+GACGCACTGACCGTACCACGCCCCTGACGCACTGACCGTGACGTAAGCGCTGACGCACTG
+ACCGTAACACTACCTGTGACGCACTGACCGTCCCTATACGGCTGACGCACTGACGTATTA
+GATCTGGTCCAACGGTCAGTGCGTCGCCTTAAGCGATCCGCAAGATTATAGAGGTTGGAT
+TGCGGACGTGCTGCCCGGACTATCTTGCGGACGTGCTG
+>ds2020-267_614
+GGACGTTCGGGCTTTGGTGTCATGGTTTGGGGTGGGGGTGTGTTATCTCAACTTGGTTGG
+CAAAGTACCCAGTTGCTTACCATTACCACAATGGCTCTACCCACCGTGTGCCGGAAGCCC
+GAACGTCCTTACTTCCATATCTAAGGAGCAGCACGTCCGCAATGGTCAGACCCTGATATT
+TGCGGACGTTGCGGGCTAGTTGCTTTGCGGACGTGCTG
+>ds2020-267_615
+CAGCACGTCCGCAAGTTCATCGGGATGTGTATAGTGATAGGATCACTCGATTCATGCGTC
+TTGGTTGGCAGGGGCTGGTTGGAAACACAGCAACAACCACACGCATCGAGAATGCAGAAT
+TGACCACACTTGGTGGTAATCATGTCGTTGACGTTCCCGTTCCTTTTTTATGAACGGAAG
+CTACGACTACAAACCCAGTTGGAATTGCGGACGTGCTG
+>ds2020-267_616
+CAGCACGTCCGCAAGTCGTCCGCTATCAGCACGTCCGCAATGGTTTTGTCCTCAGCACGT
+CCCAATACCGGATCCCTTGCGGACGTGCTGCTCACGCTTAAGGCGACGCACTGACCGTAC
+TTGCACGCCTGACGCACTGACCGTGAGCACATGAGTGACGCACTGACCGTCCAGACTACT
+TTAAACGGTCAGAGGAGTGGAACGACGGTCAGTGCGTC
+>ds2020-267_617
+GACGCACTGACCGTGTCCTATTCGTTGACGCACTGACCGTCACTCTGTTTCTGACGCACT
+GACCGTTACTAGCGCCCTGACGCCTGACCGTATCTGCGAGAATACGGTCAGTGCGTCGCC
+TTAAGCGTCAGCACGTCCGCAAGAGGCACCGGGCACACGTCCGCAATAGTCACCCGGTGA
+TTGCGTCGTGCTAAGGCTATATAATTGCGGACGTGCTG
+>ds2020-267_618
+GACGCACTGACCGTTTTAGCTACGGTCAGTGCGTCAGCCATATAAACACGGTCAGTGCGT
+CAGGGGCACGGCGACGGTCAGTGCGTCGCCTTAAGCGACTAAGGAGCAGCACGTCCGCAA
+TCCGTCGGCACTTGGGACGTGCTGAGGGAAACATCATTGCGGACTGACCGGTAACCTCTT
+GCGGACGTGCTGAGGGATAAACAGTTGCGGACGTGCTG
+>ds2020-267_619
+CAGCACGTCCGCAAATCCTAATCCTAACCCTAGAGAGCACAACAGCAGCAGTAATAGCCA
+TGGAGTGCGAGAGAAGAGAGACATTGATGGATGGATAGGATGAGTTTTTCCTGGAGCAAC
+TCCAATTGATCAGAAATTTGGGTTGCAGGGAGGGAAAACCCGAACCCTAAATTTTGGGGA
+CGTGGAAACGGAGGAGTGTAACATTGCGGACGTGCTG
+>ds2020-267_620
+GCAGCACGTCCGCAACTTCGGCCCCCTCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTAT
+GGTTGTAAAGCACTTTAAGCGAGGAGGAGGCTACTTTAGATAATACCTAGAGATAGTGGA
+CGTTACTCGCAGAATAAGCACCGGCTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGG
+TGCGAGCGTTAATTGGGATACCATTGCGGACGTGCTG
+>ds2020-267_621
+CAGCACGTCCGCAACCATCTAGTTTTCCGAAACCGAACTGAATAGAATTGTGACTTTCCA
+AAAATGCTTGCTGAAAATCAAAGAAAGAAGGTCCATTTTCCCACGTAGTTCGTCGGTCAA
+ACCAACGATTCTCTTCTCAAAGTAATAGAGAGATCTTTTTCTAGTTAGACTTCTATCAAT
+GCAATGAAAGAACCATCCCTTATTTGCGGACGTGCTG
+>ds2020-267_622
+CAGCACGTCCGCAAAATCCATTGGGCAGCACGTCCGCAAAAAGCTCTCCTTTCACAAGGT
+GGACCTCCGGGACAAACCAGCACTGGATAAACTCTTTTCTTCAATAACATTTGATGCTGT
+CATACACTTTGCTGGACTCAAAGCAGTTGGTGAAAGTGCAGAAACCATTGCTGTATTATA
+ACAACAATTTAATCAGGACCGAATTGCGGACGTGCTG
+>ds2020-267_623
+CAGCACGTCCGCAACAATAGACCTCTGTGCTGCCATCTTCAAAGTTCGTATATCCACATT
+TCTAGGCTATAATCAAAATCTGATAAAAAGACGCCTCTAAAATCATCCCATGCTAGACAA
+GTGTGTTTCAATCACACAATCTTCCAACAAAAGATAGCCATCTTCAAAGTGCATATATGC
+ACATATATTGCATATCACAACCTATGTACACGTGCAA
+>ds2020-267_624
+CAGCACGTCCGCAAGCTAAAAGGTTTTGGTAGCCTCCTATCAACCAAACCCAATCGAAAT
+CAGTTAGGAAAGCCTCTCTAGCATGGTCCAAAGGGGCATTTGATGAAGTTGAATATTGAG
+GCACATTCCATTCGTTCCAAAATTTAGGGGTGTTTCGACATTTGCCCTTTTTTTTTATTT
+ATATAATTCCCACGGCTGCACGGTTGCGGCCGTGCTG
+>ds2020-267_625
+GCAGTTGACTCCTACATCCCTGCTCCACTGGGCTCGGGGCGATATAGCACAGTTGGTAGA
+GCTCCGCTCTTGCAATTGGGTCGTTGCGATTACGGGTTGGATGTCTAATTGTCCAGGCGG
+TAATGATAGTATCTTGTACCTGAACCGGTGGCTCACTTTTTCTAAGTAATGGGAGGGGGG
+CGCGTTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_626
+GACGCACTGACCGTCTTTCAGGTGATTAGATACGGTCAGTGCGTCAGTTAGCCATTAACG
+GTCAGTGCGTCAGGCCGCTTGGCACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAG
+CACGTCCGCAATCCATGGCCCCTTGCGACGTGCTGAGGACTAAATACTTGCGGACGTGCT
+GAGCAACAGCCCTTTGCGGACGGCTGCGCCTTAGATA
+>ds2020-267_627
+CAGCACGTCCGCAACTCCCTCACACTCAGCACGTCCGCAAGCATCTCCCCTCAGCACGTC
+CGCAACTCCCTCACACTCAGCACGTCCGCAACCAAGTAGAAGTGGACGTGGGGGAGCCAG
+ATTGCGGACGTGCTGAGCTGACTGGCCTTGCGGACGTGCTGATCCTTAGATAGATCGGAC
+GAGCGCACGCCTGAACGTGAAGCACTCCGGAGAAGAC
+>ds2020-267_628
+GGACGTTCGGGCTTGGATTACTCTGTGCGATCGGGAATCAGCAGTCGCTTCGCCATCTCT
+CGCAAGCTATCCGGGACAGCGATCTCGGAAAGCCCGAACGTCCTTTCTAAGGAGCAGCCG
+TCCGCAACAGGCATGGGGTAGCACGTCCGCAATCAAGTCTCCCTCAGCACGTCCCAACAT
+AACCCGGGTCTTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_629
+CAGCACGTCCACAAACCAGACTTTGCGGACGTGCTGAGGGCGGTTACCTTGCGGACTGCT
+GCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGTTTTGTTGATTGGTTTTAATGCC
+TTGGCGTATGTGTTGCCGCCCCTGCGTTCCAATACAGACAAAAAAGCGCTGCAAGAGGGC
+TTGCAAGATGGAGATATCCACCAACGGTCAGTGCGTC
+>ds2020-267_630
+GACGCACTGACCGTGTGAATACAGCTGACGCACTGACCGTGATTGTCTTGGGACGCACTG
+CCGTTGTGTGTACCCTGACGCCTGACCGTCGTCCAGTGGTATGATAACGGTCAGTGCGTA
+TCTAAGAGCAGCACGTCCGCAAGGGGCATCGAATTGCGGACGGCTGAGGGGAAGATGCTT
+GCGGACGTGTGAGCAGTTAGAGATTGCGGACGTGCTG
+>ds2020-267_631
+GACGCACTGACCGTAACCAGTACACTCCTTATTAACAGATGACCAATAAAAAAGGTTGGT
+AACTTACCAACCTTTTTTGGGTTTCTTTTTGACCTTTAAATACAAAAAATTTGATTACAG
+AAAATCAGTTTTTATAACTTTCATCTGCGGTCCGACGGTCAGTGCGTCGCCTTAAGCGTG
+CGGACGTGCTGAGGCGAGGGCCCTTGCGGACGTGCTG
+>ds2020-267_632
+CAGCACGTCCGCAACCATTGACCCGTTGCGACGTGCTGAGGGCTGGCCTATTGCGGACGT
+GCTGACCGAGACCAAGTTGCGGACGTAAGGACGTTCGGGCTTAGTGTGTCATCTGAGTTT
+GTGTCGGTTTGCTTACTTTCACTTAGGCATCCCTGGACGTTCGGCTTATGTGGGGGATGA
+AGCCCGAACGCAGGTCGCGAAGCAAGCCCGAACGTCC
+>ds2020-267_633
+GGACGTTCGGGCTTGAGTGGTAAGGTCTGCGAGGAGTGAGGCTTCAGCTGGATAAAGCTA
+ATTTCGAGCGGCTGAGCGGGGAGAAAAAGCCCGAACGTCCAGGCCTGAAATGAAGCCCGA
+ACGTCCTTACTTCCAGAATCTAAGGAGCAGCACGTCCGCAACGGATTTTTCCTCAGCACG
+TCCGCAAGGTCACCGGTATTTCTTTGCGGACGTGCTG
+>ds2020-267_634
+CTTACAATAAGATTAACTCCAGTCTCTCAGCTGGGCAATAGAAGGAATTGAGTCTCTAAT
+CCCCACCTAGGACAGTAACCATAGAACTTCACTTCTTAGCATTAGCAAGGTAGCAAAGCA
+GCCCGGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAGCTCCATACCGTATATGT
+TGCGGACGTGCGAGTGTACCGGTGTTGCGACGTGCTG
+>ds2020-267_635
+GGACGTTCGGGCTTTGTAGTTTGTTTTGTAGAAAGGGGCTTCTTAAAATATCCCATAAAT
+AAGTAGGGGCTTCAAAGCTTGTTGTAGTTTAGGGGTGCGCAGGTTTGGAACCCCATACAG
+GGGGCTAGCGCGCAATGGCTTTCTCTGAAAGGGGCTCGCTTCTTCAAGCTCCGCTCCGCT
+TGCTGCTTTTCATTTTGTTAGGAGTAGGTGCTTGCTG
+>ds2020-267_636
+CAGCACGTCCGCAACCATCTCATCAAAAACTTTTCGAGCTTTCTTAATCTCACCAACAAC
+ACCAAACCCATGAACCAAAGTCGTGTAAGTAACAACATCAATCTCACACTTCCTCTTCTT
+CATTTGCAAAAAGAACTCCCAAGCTTCCTTAATCTGGCCAGCTCTAAAATACCCTTTAAG
+CATTATGTTAAACGTGGTTCGGTTTGCGGACGTGCTG
+>ds2020-267_637
+CAGCACGTCCGCAAGTTGGCCTCGGTGGCGCTTCAAGGAGTGACTAATGACTCACGCTCA
+CGAAGACATCAGGGTTGGCACACTGTGCCTTCCCTTCTTTGGTAACGGCTGGCTAATGCC
+ATGGGGTGAAGTGGTCAGCAATACATTAAAGGCGCAGCGGCTCGCTGAGGAATATCGGGA
+AAGTCAGGAGGACTTGTATAGCCTTGCGGACGTGCTG
+>ds2020-267_638
+GTCCGCAACTCAGCGGCCTCAGCACGTCCGCAAATTAAAACGCCCAGCACGTCCGCAATA
+TATCCGCCGTCAGCACGTCCGCAAGGCCAACCTGATACAGTTTGCGGACGTGCTTAAGGC
+GACGCACTGACCGTCCTCCAACCCCTACAGCACGGTCAGTGCGTCAGAGTAAACCCCACG
+GTCAGTGCGTCAGGGAAGGGCACACGGTCAGTGCGTC
+>ds2020-267_639
+AGGAGGCTACTCAGTAGACAGTCCCACCCTCACACGATTCTTTACCTTTCACTTCATCTT
+GCCCTTCATTATTGCAGCCCTAGCAGCACTCCACCTCCTATTCTTGCACGAAACGGGATC
+AAACAACCCCCTAGGAATCACCTCCCATTCCGATAAAATCACCTTCCACCCTTACTACAC
+AATCAAAGACGCCCTCGGCTTACTTCTCTTCCTTCT
+>ds2020-267_640
+CAGCACGTCCGCAAACATTTTCTTCTTCTTTTTCTTTTTCTTCTTCCTTCTCTCCTGCCT
+TGCGACACTCGTCTTCCTGCCCTAACATGCATTTGGGACAATCTACTATCGTTTGATGAG
+GGAGGGAGACTAGAGGAGCTTCTTCTTCCATATTAATTCCTACTATGACGGAGGGCTTGC
+GGACGTGCTGAGGGGGAAGGTATTGCGGACGTGCTG
+>ds2020-267_641
+CAGCACGTCCGCAATTCCCCACTGCTTTCTCTCCGGTTATAGTAAAATACCTGCGTTCTA
+TTGTTTCTTTATATTCAGATGTCATTCTACCTCTCAATCCCTGAAAGTCATCCATCATGT
+CCTTGAGTTTCTTCCCCAAACCACTAACCACTGAGGTCCTGGTTCGATCTGCGGAGGAGC
+CAGGGCCACAACCAGGAAGGCTTTGCGGACGTGCTG
+>ds2020-267_642
+CTTTTACAGAACTCCCCTCTTGTATCATCAAACCGTCACCCATTAATACAACACCAACAT
+TATTTGATTCCAAATTCAGAGCAATGCCTATCGTACCCTCTTCAAATTCTACTAATACAA
+CCTACCACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGATAATCGACTTGATATTGC
+GGACGTGCTGATGGCATACGCTTTGCGGACGTGCTG
+>ds2020-267_643
+CAGCACGTCCGCAATATGGTACCCCTGATCAGAATGGTACTCGAATTCATTTACGATCCC
+GAGTTTCCAGACACATCGCACTTCCGCTCGGGTCGAGGCCGCCACTCGGCCCTAAGACGG
+ATCAAAGAAGAGTGGGGAACCTCTCGCTGGTTTTTGGAATTCGACATCCGGAAGTGTTTT
+CACACCATCAACCGATCATCGTTGAGGACGTGCTGC
+>ds2020-267_644
+CAGCACGTCCGCAACTCTGTCTTTAATGGCTGAAGTTGGGTGGCCAGTGAATGTGGCCAC
+AGATGAGAAGGTTGACCCCATTGCTGAGCGCATGGGATTCAAGGAGTGGGTCCTTTGTGG
+CTCAGACTTCAAACAAGGGATTCGAAATCTGAAAATGATGGTTGATGAGTACCTTGAGGA
+CTTGCGCAAAATGCCTTTGGAATTGAGGACGTGCTG
+>ds2020-267_645
+TCTAAGGAGCAGCACGTCCGCAACAAACCGGCCATTATTGGGACTGGACCCAATACGCGT
+TGCGGAAGGCCATTTCATTTGCGGACGTGCTGAGCGGTGTCAGGTTGCGGACGTGCTGCT
+CCTTAGATAGCACGTCCGCAACGAGAATTGCCTCACACGTCCCAACCTCGAACTATTTGC
+GGACGTGCTGACGATCGTTTCCTTGCGGACGTGCTG
+>ds2020-267_646
+CAGCACGTCCGCAACCACGACCGTCTTTCCTTGGCGAATGTCTTCAATGGCCTCTGGGAT
+GGAAGCAAATCCTTTTGTGGGGCAATCCAAATCAAATTCATCATTATCAACTGGAAAACC
+ACTAGTTGTTGGAACAGTATCTGCTGAAAGTGTTCCAAATGCTACTGCATCCGGCTGTAT
+CTCAATCCCAACTGACTAAGCATTGCGGACGTGCTG
+>ds2020-267_647
+GACGCACAGACCGTATACCCAGAATTGGACGGTCAGTGCGTCACACGGGATTATACGGTC
+AGTGCGTCAGGCCAACCAAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCAC
+GTCCGCAAAAGCTCGACGGTCAGCACGTCGCAACACCTTAGCTCTTGCGGAACAGGACCA
+TAATTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_648
+TATCTAAGGAGCAGCACGTCCGCAAATTCATGGCATTCGACTTGGACGTGCTGAGGGAGC
+GCGAATTGCGGACGTGCTGAGGGACTGATTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+AGAGCGTCGTGTAGGGAAAGAGTGTGCCTCTATGTGTAGATCTCGGTGGTCGCCGTATCA
+TTAAAAAAGTTTAATTGCGGACGGCGCTCCTTAGGT
+>ds2020-267_649
+CTAAGGAGCAGCACGTCCGCAAATGTTCTCGGGTAGCACGTCCGCAAGAGGTCCTGCCTC
+AGCACGTCCGCAACTCATTTAATAAACCTATTAAAACTATACAGGCTGCTAATATTATGG
+GAGCTATTCTGTTAGAAATAGATCCACCTATTGAAAAAACAAATGAAAAGACTTTAAATT
+TTACTTTAGAAGGGGGTCGGGGTTGCGGACGTGCTG
+>ds2020-267_650
+GGACGTTCGGGCTTAGGGGGTGCCCCTGATTTTTCAGGGTAAGAAGGGGTAGAGAAAATG
+CCTCGAGCCAATGTTCGAGTACCAGGCGCCACGGCGCTGAAGTAACCCATGCCATTCCCA
+CCTTAAAGCCCGAACGTCCTTAATCTAAGGAGCAGCACGTCCGCAATGGCCTAGTTATTT
+GCGGACGTGTGAGGGTTGACGACTTGCGACGTGCTG
+>ds2020-267_651
+CCCTGGACGTTCGGGCTTGATTTTGATGGTGATGAGGAGGAAGAGGTGGAGGAGAATATG
+ACGTCGTTTAAAGGAAGGGAAATGGGGTCGAATTTTTTAGAGGATATTGAATTTTCTGAG
+TTGCTGGGAGGGTTTGGTTCCATTGATGGGTATTTTTTGGAGGATATGTTGGTTGACTTG
+TGACAGTGGTGATGATGATGCTTTGCGGACGTGCTG
+>ds2020-267_652
+GGACGTTCGGGCTTTGGATCAGGGGTAGCGTGAAGCCCGAAGTCCAGGCAAATGGTTAAG
+CCCGAACGTCCAGGAGCAACGCTAAGCCCGAACGTCCTTACTTCCAGTCTAAGGAGCAGC
+ACGTCCGCAATTCCTCTAGTTTGCGACGTGCTGAGCCAGTTTCCCTTGCGGACGTGCTGA
+CGGAGTCCTCTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_653
+CTTCCGATCTATATAAGGAGCAGCACGTCCGCAAAGACATACCCCTCAGCACGTCCGCAA
+TTAGCCTCCCCTCAGCACGTCCGCAAAGATGTACCTGTCAGCACGTCGCAACTCAGCTCC
+ATTCGATTGCGGACGTGCTGCTCCTTAGATACGTCCGCAACCCCAACCCAATTCATTTGC
+GGACGTGCTGAGTGGGATGGCTTTGCGGACGTGCTG
+>ds2020-267_654
+GGACGTTCGGGCTTGGTTTTGGTATTTGAGCTAGTGACGCAACTGGGCGGCGAGGCCGGG
+CCGAGAGTACACGACAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAACTTTACACC
+GATAGGATAGAGGGTCTGTATTGCGGACGTGCTGAGGCTAGAAAGATTGCGGACGTGCTG
+AGCGGCCTATGATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_655
+TATCTAAGGAGCAGCACGTCCGCAATAAGTGTTCCCTCAGCACGTCCGCAACGTACATTC
+TCTCAGCACGTCGCAACTAGGAGGATCTCCTTGCGGACGTGCTGCTCCTTAGATTATCTA
+AGGAGCAGCACGTCCGCAACTCCTATTCCGTCAGCACGTCCGCCACTTCATAGGGCTCCA
+CGTCCCAATTAGATAGCGTATTTTGCGGACGTGCTG
+>ds2020-267_656
+GGACGTTCGGGCTTGTTCATCCCTTTTATAAAGCCCGAAGTCCAAGCCCGCCAAAAAGCC
+CGAACGTCCTTACTTCCAGACACGTCCGCAAATCGCTGTTGTTGGACGTGCTGAGGCAGC
+GCTGATTGCGGACGTGCTGAGGGGAACAAGGTTGCGGACGTGCTGCTCGTTAGATAGATC
+GGAAGAGCGCCCGTCGGAACTCCTGGCAGTCGGGGG
+>ds2020-267_657
+GACGCACTGACCGTGACACTTCCCCTGACGCACTGACCGTGCCCCTACCACCGACGCCTG
+ACCGTGTTATCCATGTTTATACGGTCAGTGCGTCGCCTTAAGCGACACGTCCGCAACGGT
+ACAGGACTTATGTTGCGACGTGCTGAAGCCCTTTAATTTGCGGACGTGCTGAGTGGGGAC
+TTATTGCGGACGTGCTGAGGCCAGCGATATTGCGGA
+>ds2020-267_658
+TCACAATTGCATGCAGTACTAGGGGTGAAATGCGTAGAGATGTGGAGGAACACCAGTGGC
+GAAGGCGACTCTCTGGTCTGTAACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGCGTAGG
+ATAAGCCCGAACGTCCTTACTTCCAGTGTCCGCAATTAGTTTCCCCTCGCACTCCCAAAA
+ATTCCGAAGTGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_659
+CAGGCGGAGTGCCGCCTACGAGGGTCTCCGGAGTGAATGGAGTGCGGACGTGTGCTCTTC
+CGATCTATCTAAGGGGCAGCACGTCCGCAACAAAGGGTCACTTGGGACGTGCTGAGAGCG
+GGGCGTTTGCGGACGTGCTGAGCTAATGTGAATTGCGGACGTGCTGCTCCTTAGATAGAT
+CGGAAGAGCGGCGTTCTGAACTTTAGTCACTGTGGA
+>ds2020-267_660
+GGACGTTCGGGCTTACCCGTCCACCCCCTCTCGAGTTTCCGGCTGTTTCCTAGATTGAAG
+TAGCCTTTCGTCACCCTACCAAACGAAAGAAGTCACTATCAAACAGCCCCCCCAACTAGT
+CGTATGGGGTGCTTGTGGTAAGCTGCCTTGGTTGTGGACGTGCTGGCGAGCAGGAATTGC
+GGACGTGTTGAGGAGCGTGGGTTTGCGGACGTGCTG
+>ds2020-267_661
+CAGCACGTCCGCAATATGCCGTGCATTCTCCCATTTCGTATACAATTTCATTATTGTTAT
+TTAAAATGATAGTAGAATCACTGCGATTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAG
+GCGACGCACTGACCGTGGGGTCTCTCCTGACGCACTGACTGTATTGTTGGCCCTGACGCA
+GTGACCTTTAAATGCCTCATGTACGGTCAGTGCGTC
+>ds2020-267_662
+GGACGTTCGGGCTTCCATTGGACGCTGAAAGCCGAACGTCCAGGGCCCAGGCCAAGCCCG
+AACGTCCAGGAGTGGTTGCAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAATACTT
+TGGATATTGGGACGTGCTGGAGGGGTCACGTTGCGGACGTGCTGAGTGTGAACTACTTGC
+GGACGTGCTGAGTGGTACGGATTTGCGGACGTGCTG
+>ds2020-267_663
+GGACGTTCGGGCTTTACCCCACCGATATGTTCTCCCCCCATTCCCCATGACCACCACGCA
+AGATCCAACCTTCAAACCCATACCACAACCACCCTCCACCCCAGAGGCAAACACAAGCCC
+GAACGTCCTTACTTCCAGTATCTAAGGAGCAGCACGTCGCAAGGTTCAGCCTCTCACACG
+TCCGAAATTCAACTCCCTGGGTTTGCGGACGTGCTG
+>ds2020-267_664
+GACGCACTGACCGTGGGGTGGACCCTGACGCACTGACCGTGTGATGTACCTTGACGCGCT
+GACCGTCTGATGTTTCCTGACGCACTGATAGTCCTTAGCACGGTCAGTGCGTCGCCTTAA
+GCGTGCACGTCCGCAATCCGAAACCCCTCTGCATTGGGACGTGCTGAGAGGGTAGTGGTT
+GCGACGTGCTGCCCGACACTGTTTGCGGACGTGCTG
+>ds2020-267_665
+GGACGTTCGGGCTTTTATCTCGGGCTGGAGGAGCTCCTAATGTGTCTGATGCAGATACCA
+TCAATGGTCAACCTGGTGATCTTTACAATTGCTCGGGCCAAGACACAATCATAGTTCCTA
+TAGACTTCGGTGAGACCACCCTTCTTGTCTCCCTGCCGACAGCAGTGCCTCTGTGACCTC
+ACCTTTCTTCACTAGTTATATGTTGCGGACGTGCTG
+>ds2020-267_666
+GGACGTTCGGGCTTCATGGTTGTGGTATTGATCTTACGGGGGGAACGAAATCAAAGAATA
+TATAGACTTGTAGAGACCCTCTATGTAGTTGTCTATCTAGGGCGATCGGTCTACATCTTT
+CCCCATAGCCCCGGGGCTGTGTTTCGATCTCCTACGTGCGAAATCTGAGGGTTCTTATTG
+CGGACGTGCGAGTTGATGCGGATTGCGGACGTGCTG
+>ds2020-267_667
+GTCCGCAATAACAGCAAGGTCAGCACGTCCGCAACTGCACACCCTCAGCACGTCCGCAAC
+AATCACTGGGTGAATCTTGCGGACGCGCTTAAGGCGGCGCACTGACCGGCCAGGTCCCCG
+TGACGCACTGACCGTGTCCATAGCCTTGACCCACTGACCTTATAGAATCACAGGACGCCT
+GCCTTTTCTTTGTCGGTACCGTACGGTCAGTGCGTC
+>ds2020-267_668
+CAGCACGTCCGCAAGCGAGTCCCCCCCCTAGTTCATATCTTTGTTTCGTGTGTTCCCGGG
+AGTAATTCGATCTCTTCAATCTCGGGATACCACCTAAATAACTGCGGCCAGAGAGTAAAA
+TAGGTCGGGAAGAAAGAGTCTGAGGTTGGGTCGGACGACATACATCTTGGAAGGAAGGTT
+CATTCTTTAAATCAGCGATGGTTGCGGACGTGCTG
+>ds2020-267_669
+CTTGGTGCAGAAGATCTTTTTCCACTCTTTTCTTCATCTAGTAGGTCTCTGATAGGGAAA
+TAAGCTGCTTTCTTGCAAAGCTCAAGTAGATCTGAACCTGTGTAACCCTCACTCAAGCCA
+GCTGATACGGTCAGTGCGTCGCCTTAAGCGTGTCCGCAACGTTTAACTGGTAAGATTTGC
+GGACGTGCGAGTGGCTTTCAGTTGCGGACGTGCTG
+>ds2020-267_670
+CAGCACGTCCGCAAGGGAGACATTCTCAGCACGTCCGCAAACTCTACTGGCTGGTTATTG
+CGGACACGCTTAGGCGACGCACTGACCGTAATTGCCACCTTATCTTTAGGGTTTTGTTGC
+CCTATCTGGGCTTTCTTTGCCATGCCTTGCCACCTTGCCTTTGCTTGGCCTTTATTTGCC
+TTACCTTGCCTTACCCTTTCTTTTTAGGGTTTGGT
+>ds2020-267_671
+TATCTAAGGAGCAGCACGTCCGCAAGTGCTTATCGGTGATATGTGCGACGTGCTGAAGTG
+GCTTCTCTTGCGGACGTGTGACACTACTGGTGTTGCGGACGTGCTGCTCCTTACGCTTAA
+GGCGACGCACTGACCGTCCGACTCACCCTACGGTCAGTGCGTCAGGGAGACATGAACGGT
+CAGTGCGTCAGGCGAGGACACACGGTCAGTGCGTC
+>ds2020-267_672
+GGACGTTCGGGCTTCAGAATGAGGATGGTTAAGCCCGAAGTCCCCAGGTGGGGCAAGCCC
+GAACGTCCTTACTTCCAGAAGCACGTCCGCAATAACACCACAGTCAGCACGTCCCAACCG
+CCCTCTCCTTGCGGAAGTAACATGGGATACATTGCGACGTGCTGACCGCGCCTCTATTGC
+GGACGTGCTGATGGGTAACCGTTGCGGACGTGCTG
+>ds2020-267_673
+CAGCACGTCCGCAAACCTGAACTGTTGCGACGTGCTGACCCCTTAACTCTTGCGGACGTG
+TGAGACCATACGCCTTGCGGACGTGCTGCTCCTTAGATTGAGCAGCACGTCCGCAAGGCG
+GCTTTCCTCAGCACGTCCGCAAAACGCGTCTCTCACACGTCCGCAATGGCCCATAGGTTG
+CGGACGTGTGAGAGACGCGTTTTGCGGACGTGCTG
+>ds2020-267_674
+GACGCACTGACCGTCTAAATTCCGTTGCTGCGATTCATGCAGGGCGCAAAGCGGAAAACC
+AAGACACCTTGACAATGCAAACGCTGGTGCCAACAGGGGATATAACACGGTCAGTGCGTC
+AGTAGTGGGATCACGGTCAGTGCGTCGCCTAAGCGTGTCCGCAACTCACAGCCTGTTGCG
+GACGTACTGAGTAACGTGACATTGCGGACGTGCTG
+>ds2020-267_675
+TTCTGGGCGTGTCTATGTAAGGAGCCGCCCTGCGTCAAGGGGATGGAGATTGGGACGTGC
+TGAGGTGCGGTGTATTGCGGACGTGCTGAGGGTTCGCGGGTTGCGGACGTGCTGAGTGAT
+TACGTTTTGCGGACGTGCTGCTCCTTAGATACACGTCCGCAAACAGTTAGGAGTATGTTG
+GGACGTGCTGCCCACCTAGGCTTGCGGACGTGCTG
+>ds2020-267_676
+ATCTAAGGAGCAGCACGTCCGCAATCTTCCCCCGCTCAGCACGTCCGCAATGCATTATAG
+CTCAGCACGTCCGCAATGGTTGCGGAAGTGCTGGAGAATCCAGGTTTTGCGGACGTGTAA
+GGACGTTCGGGCTTGAAGTACCCGCTGGACGTTCGGGCTTTCAACACCGCCTAGGACAAG
+CCGAACACCAGGGGATTGATAAAGCCCGAACGTCC
+>ds2020-267_677
+TATCTAAGAGCAGCACGTCCGCAAGCTAATCACCCTAGCACGTCCGCAAACCCCAGGCCC
+TCACACGTCCGCAATATAAAGCCGATAATGTTGCGGACGTGCTGCTCCTTAGATATCTAA
+GGAGCAGCACGTCCGCAAGATTGGTCCGCTCAGCACGTCCCAACTACATCGACATGTTCT
+TGCGGACGGAGTGGGTAAACTTTGCGGACGTGCTG
+>ds2020-267_678
+GACGCACTGACCGTTCCCCGCCGCCCCCTCTTTGACTCAGACGTTGCCGAGCGTCCGGCT
+ATTACCAATACAGAGGCTTTGTGGATAGACGCTTTTGATGATTTTCAAACGTCTGATAAC
+TTAGATGCAAGCTTTATCCCTTTTGGCGAGTATGATGTTGCAAGCTTTGGCGGATTTTCA
+CCCTTTGATAACATGGGCAATACGGTCAGTGCGTC
+>ds2020-267_679
+CAGCACGTCCGCAAAGACATACTCGTCCCTATTTTTAAGTCCTGTAACGCGGGAGGTTAT
+GCTCCGCTTTGTTTATAATTATAAAGATTTTGCACTTCCTAAAAATGCGGTGTTAAGCAC
+ATTTATACGCAGGTTAAACTATCCGTCTGATTAAATTTCATCATTCGGAGAAAACGTTCC
+TAATGTGCAAATGCCAGAAATTTGCGGACGTGCTG
+>ds2020-267_680
+GGACGTTCGGGCTTTAGAGGACCGGGGCGTTCGGCTTACAATACAGCCTTGAAGCCCGAA
+CGTCCACCAGAAAAGTTAAGCCCGAACGTCCAAAGGTGGACGGAAGCCCGAACGTCCTTA
+CTTCCAGGCACGTCCGCAATGGAGTCACAGGTAACACGTTGGGACGTGCTGAGGTGACCT
+CTATTGCGACGTGCTGACGGTTTGCGGACGTGCTG
+>ds2020-267_681
+GGACGTTCGGGCTTGTGATCTGCAGTATGGTTTGGATCTGTGTCCCCACACAAATCTCAT
+GTTCAGTTCCCAATGTTGGAGGGGGGGCTGGTGGGAAGAGATTGGATCATGGGGAGGTAA
+AATAAAAAGCCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAAGAGTTGGTCGATT
+GCGACGTGTGAGTATCGATGGCTTGCGGACGTGCT
+>ds2020-267_682
+TCCGCAAACTCATCTCCCTCAGCACGTCCGCAATACCAGCCCCCTCAGCACGTCCGCAAT
+AATGGGCCCTCACACGTCCGCAATTGAACCCTTCGTAATTTGCGGACGACGCTTAAGGCG
+ACGCACTGACCGTAGTGCTGACCGTGACGCACTGACCGTGTTGTTCCCCTTGACGCACTG
+ACCGTGTAGATGGGGTAACAAACGGTCTGTGCGTC
+>ds2020-267_683
+GCAATTGCATGTCCCTCGCACGTCCGCAAGCTCTTACCCATCAGCACGTCGCAAGAGCCA
+ACGCCTCAGCATGTCGCAAATTGGAGGTCGTTGCGGACGTGCTGCTCCTCGCTTAAGGCG
+ACGCACTGACCGTGACGGAACCGGTCATATAAGGTCAGGCGTCAGGCGAATAAAAACGGT
+CAGTGCGTCAGCCATACTCCAACGGTCAGTGCGTC
+>ds2020-267_684
+CAGCACGTCCGCAATTCCAATGCCTTCTGACCTGCTCCATTTAATATTTAATAATGAGAA
+TAAGCAGACTAACTTAGACCAGGGAGACCGCATTGCGGACGTGCTGCTACGCTTAAGGCG
+ACGCACTGACCGTATAATTTAGCCTGACGCACTGACCGTACAATTGAGTCTGACGCCTGA
+CCGTTCCCAACCTGATGAAGCACGGTCAGTGCGTC
+>ds2020-267_685
+CAGCACGTCCGCAAAGGTGCCGATATCCTCACATGAGTCGCCGTATTGATCTTCTGATTT
+ACATTTTGGGCATGTACCCTTAATGAAACGGTCAGACAAGAACATCCCTTTTTTGGGTCA
+AATAATTGAGTTACAGGACGAACTGCAATATTTCCAGCTTCACGGTTTTTAATATAGATA
+TCTGTTGAACGCGCTTTGATTTGCGGACGTGCTG
+>ds2020-267_686
+CAGCACGTCCGCAAGTGCAGAAGGGTGGGAAGGAAAAGGGGGAAGCTTTCATTCATCCTG
+TTTGTTTATCATCATTTAATTTCTTACAGATATATGGAATATAATTTTAGGAATTTCAAA
+ATATTTCAAGTGATGTATTTTGTGTATCTTCAATTCTACCTCGTAATTCAATCCAATCCT
+ATTCACAAAATGGCCCGAATTTGCGGACGTGCTG
+>ds2020-267_687
+CAGCACGTCCGCAACGAATGTGGATTCGTGTCGGAGGAGTTTTGAGCGTGAGCTACCACT
+CATGCAGCGGCAAGGACCCGCAACTCTCGAGGGGGCCACCAACCGCCCGAATAACTCCTT
+TACTCAATGGATAGCGCTTATCCTCTTTCAATCAACAAAATGAGAAATGGGGGAGAAAGA
+AAGAGAGAAAGAGGTTAGGATTGCGGACGTGCTG
+>ds2020-267_688
+CAGCACGTCCGCAATCGCTATGCCCTATCAAAGAAACTAGCGGACTGATCACTAAATAGA
+TACAAATAGGTGCAAATTCTGACATCACCACAGCCCACTTGGTTCTTTCGCTCCTTGCTC
+GCGGAGCGGCATAACGGAAAAAAGTCGGAATTCTACAATTTCGTGGTCCGCTGGGCGAAC
+GCCGGATATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_689
+CAGCACGTCCGCAATGGAACCCGCCTCAGCACGTCCGCAATAACAAACCGCTCAGCACGC
+CCCACATTATTCTTCTCACACGTCCGCAATCCCCAGCGCCTACACCTTGCGGACGTGTGA
+GAAGAATAATGTGGGACGTGCTGAGCGGTTTGTTATTGCGGACGTGCTGAGGCGGGTTCC
+GTTGCGGACGTGCGCTCCTTAGATAGATCGGAAG
+>ds2020-267_690
+CAGCACGTCCGCAAGACCCGGCAGGTGTTGATTCTGCAGGACGGGCAACAGGTGCCGGGG
+CTGCGGAGAATGTGGTCGGTACATTTTTACCTGCCGAAACGTCTTTCAGGCGCTTGTATT
+CAGTGAGCACACGGCTGCCATAGCCTGAGTCGTTTTCAAAGGCGCTGGCACCGACATACA
+TTTTCAATACGGCTTTCACTTTGCGGACGTGCTG
+>ds2020-267_691
+CAGCACGTCCGCAATTCGGCCTGGGCAGCACGTCCCAAATATTATTCGCTTGCGGACGTG
+CTGTCGCTTAAGGCGACGCACTGACCGTTTTCTCCTGGCTTTTAGCACTTCATTGTCATC
+AAGCAGCACGGGTAGCACGTCTGCAAACGACAAGGATGGGACGTGTGACTGAAATCAGAT
+TGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_692
+GACGCACTGACCGTCTATGGGGCTGGGTGTAATGAAATTGTTGGGGAGTGGAAAGATGCC
+TCTCCACATTTCACATTTGAAGATGCCACTTTGGATGAGGCTATTAATGGTGTTGAAGAC
+TTGGATTACTTTGACTCCCTTGTGATCGGAACTTCGGAAGGCTATCCCTATGTTCTTGAG
+AGGGAGACAAATCAGAAAGGTAAGTCGCGATATT
+>ds2020-267_693
+GACGCACTGACCGTGGGTTAAGGCATGGGATACGGTCAGTGCGGTCAGGGAGGAGCACAC
+GGTCAGTGCGTCAGGCAGAGACTGACGGTCAGTGCGTCAGGGTAAGATCTACGGTCAGTG
+CGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCTAGCCGAGTAGCATTCGG
+ACGTGCTGACCTAGACGCAATTGCGGACGTGCTG
+>ds2020-267_694
+GGACGTTCGGGCTTGGTTTTATCTCTGGACGTTCGGGCTTGGGCCGCATCCTGGCGTTCG
+GGCTTTTCCCACACCCTGGACGTTCGGCTTTACCGTAACCATTAAGCCCGAACGTCCTTA
+CTTCCAGACAGCACGTCCGCAACATATTCGGCTTCCGCAATTACTCATAACTCATTGCGG
+ACGTGCTGAAGAGTGAAAACTTGCGGACGTGCTG
+>ds2020-267_695
+CAGCACGTCCGCAACGTTTCTGGCTTTTAATCAAGTTCGGAACCCCACCGACGGAACTTC
+GTTGGTCTCCAGTACAGGGGCACGGTTCACCTGCCCCATTATTGAAATTGGATCATCATC
+TGAGAGCTCTGTTGCAGCCAGTCAGAATACTTATTTTGAAGATGGTTTAAGCAGTGTTCA
+TACAAGTAATCAGGGGCCGATTGCGGACGTGCTG
+>ds2020-267_696
+TCTAAGGAGCAGCACGTCCGCAACACTTATCCCCTCAGCACGTCCGCAACAATCAATACC
+TCAGCACGTCGCAATCGGGGGCAGCTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAA
+GGACGTTCGGGCTTTGTTTCTCCCCTGGACGTTCGTGCTTAGAGCACTCCCTGGCGTTCT
+GGCTTCTTACCTGCTATACAAACCCCGAACGTCC
+>ds2020-267_697
+GCGACGCACTGACCGTGCCCCGATACATCCCCACCAAACCGCAACAACCCTCGTTTCACC
+TCCATTTGGGCAAAGCAGCTGTCATCACTGGCAATCACAATGTCGGCATTGAGCATGAGC
+TCGATACCCGCGGTAAAACAAAGCCCTTGTACCGCAACAACGTAAGGTTTAGTACGCGGC
+ATACCTACCACGTCCCCAACGGTCAGTGCGTCGC
+>ds2020-267_698
+CAGCACGTCCGCGAACGCGTTCGCCTCAGCACGTCCGCAATTTACCCGCCTCAGCACGTC
+GCAACCATCAGGTATTTGCGGACGTGCTGGAAGTAAGGACGTTCGGGCTTACTTCCAGCA
+CGTCCGCAATCATAGCTGGGTCGTCGCAAAGAGGTCCCAGGGTTTGCGGACGTGCTGAGA
+GGTTTAGCCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_699
+CAGCACTTGTCTCCTAAATTAGCAAGATCGCGCGTTCACCCTTTTGTTTCAAGCAGGTTG
+CTTAGTTATGGTGATAACCAAATTGTTAGCGAAGAGTTGTTTGTATCCGTCGGGTTACGC
+TATGACCCGGAAAAACATGCACAGCATCTGGCCAGATTTGGTATGACCCTAAAAATTGAC
+GAAACTGAAGTGACTATATATTGCGGACGTGCTG
+>ds2020-267_700
+CAGCACGTCCGCAACATGCCCAGCACGTCCGCAAATGTAAGTACCTCCGTCCCAACCCCG
+CCAGTTCCATTCCCGAACTTTCTCGCCAAATCCACATCTGCAAGCCCCCCTCCCTCCCCA
+AAACACACCCCTCTCCGCAATAGATCATTTGTGGACGTGCTGAGGCTCTGGCACTTGCGG
+ACGTGCTGAGGGGAACAAGATTGCGGACGTGCTG
+>ds2020-267_701
+CTTCTTCTCTGCCGAAAGGAAAGACAAAGGCGAGGGGGTACGGTCAGTGCGTCGCCTTAA
+GCGTATCTAAGGAGCAGCACGTCCGCAACTTTCAACGCCTGGTAATTGCGGACGTGCTGA
+GGCAACAACGTTTGCGGACGTGCTGAGAGGGAGAATGTTGCGGACGTGCGCTCCTTAGAT
+AGATCGGACGAGCACCCGGCGGACCTCCCGTCAC
+>ds2020-267_702
+TAGACCCTATCGATACGCCGCACCAGAGTATCGTGAACGCAGTAGTTTGGGTCGGAAAAA
+GCCCCGGGCTCATTCCCCTGACCACCCATCGTCCTCAGCGCCCTTCTGCTGTGCGGTGAT
+CCCGCGCTTGCGGACGTGCTGCTCCTTAGATACGCTTAGGCACACGGGTCAGCGGTTGCG
+GACGTGCTCAGGGGTTAGGGTTGCGGCCGTGCTG
+>ds2020-267_703
+CAGCAGTCCGCAATCGGTGTCCCCTCAGCACGTCCGCAATGGACAACACCTCAGCACGTC
+CGCAATTATTCACCCTCACACGTCCCAACAAGTCGGCAGTTGCGGACGTGCTGCTCCTAT
+CTAAGGAGCAGCACGTCCGCAAGCGCTAATTCCTCAGCACGTCCCAAAGGGGGATCGGCA
+GCACGTCGCAATTGATAATCGTTGCGGACTGCTG
+>ds2020-267_704
+GGACGTTCGGGCTTTTGTGGTCGCCTATTTTGAAATTCCACCCTCCTTTATTCGAATAAG
+ATATATATGTATAATAATGCAAGTAATCTTTCCAACTCAACAAAACCCTTCAGCCCAGTT
+TTACAAATAAACTAGATGCTCCAACCGTAACCATTCTCGCACTCTAGTCCAAACACCTTC
+GTCCGCAACTTCTGCCGGGTTTGCGGACGTGCTG
+>ds2020-267_705
+CGTCCGCAGTGCCCAGCCCCTTGATCTTGCGGACGCGCTTAAGGCGACTCTCTGACCGTT
+TAAAGCACGATACCCGGTCAGTGCGTCAGGACATACTCCACGGTCAGTGCGTCAGGGGCA
+GGGCGACGGTCAGTGCGTCGCCTTAAGCGACACGTCCGCAACAACCTGGCCTTCATTGCG
+GACGTGCGAGCGCTAAAATATTGCGGACGTGCTG
+>ds2020-267_706
+CAGCACGTCCGCAACCCGATGATGCTCCCTGAGCAAGGGCTATTTATTAATGTGTTTATT
+CAAGAATGTGTTAAAGCTCAGTTTTATTGTGGTGGTAAGTTTATGCCTACTCATGTAGTT
+ATGGAAGTGTATGAGTATGTTCGTAATAGTTTTATTGCTAATCGTACTCCTGTTGTACAA
+GAACCTGCAGCTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_707
+AAGCACGTCCGCAAGATTCAGCCACTATTGTTAATGATGGTATTAGAGCACTCGGCAGAT
+TGGGAGGGATTTATGTCCATCCGACTAATATCCTCAGTCAGTTCTTCCAAGTTGGGTGCT
+AAAGTGGAATTTTCTGCAATTCAAACCATAAGACTTTAGATGATGATAAAAAGAAACAAA
+TACAATGAATAAGATAAGGTTGCGGACGTGCTG
+>ds2020-267_708
+TCGCTTAAGGCGACGCACTGACCGTACTTTTTAGGCTTGCCAGTACCGCAAACGGATTTT
+CTTTTTCCGCCACTGCCTGTGGCAACTCACCCACCTCAGTCACTGCCATTTCGCAGTCGT
+CATGCTTGGGCGCTAATGGCAAATCCACCAATAACTCATCTTCAACCACGGCAACTTGGA
+CGTGCTGAGGATCTGAACATTGCGGACGTGCTG
+>ds2020-267_709
+GGACGTTCGGGCTTAATACCTGCCCTGTTAAGCCCGAAGTCCCCGCTACAAGCCCGAACG
+TCCAGCGTAGTGAGCAAGCCCGAACGTCCTTACTTCCAGTAGGAGCAGCACGTCCGCAAT
+AATGATCCGGTGGTTGAGGAAAACGCGTTTGCGGACGTGTGACCCCGAATAAGTTGCGGA
+CGTGCTGAGGGGGTACAAATTGCGGACGTGCTG
+>ds2020-267_710
+CAGCACGTCCGCAACTCTGACCTTCTTATTTATAAGCCACAGCTCACTTCGACGTTTCCA
+ATTTCCCATAGAATCTCCGGGGCTTTCCTAGTCACTATAGTTTTGTTTTTTTATCTTCTT
+TGTCTGAAAATAGGTTTGATTTGCCCAGCACGTCCGCAAAAAGAAACCTATACTTGCGGA
+CGTGCTGACCCAGTTTCGGTTGCGGACGTGCTG
+>ds2020-267_711
+TATCTAGGAGCAGCACGTCCGCAATCTTCTGGTATTTGCGGACGGCTGAGGCCGACGTGC
+TTGCGGAGTGCTGAGGGTCCAACACTTGCGGACGTGCTGCCCTTAGATCCTGGAAGTAAG
+GACGTTCGGGCTTGTTCAGGGAGATAATAAGCCCGAAGTCCACCCTGAAAACGAAGCCTG
+AACGTCCAGGCGATTCTAGAAGCCCGAACGTCC
+>ds2020-267_712
+TATGTAGGGAGCAGCACGTCCGCAATGACCCCGCACTCAGCACGTCCAATCATGATGGTC
+TCAGCCGTCCGCAATACACTGGGAACCCTGGCCTGGTTAATTGCGATTCTGAGCGGCTTT
+GTTCCCATACTGATGGATGGAGGAGAGTTTGGTCAGAATGTATTCATTCTCACCGGATTT
+TCGCTGCTGGGATTGTCTTACGGTCAGTGCGTC
+>ds2020-267_713
+GACGCATGACCGTGAATAAGCCTGTTCTATTTTTATCGACATTGACAGGGATGCTATTGG
+GAATCGGATCGGTGATTAAGCCACCGATATCTGCAGGCATGGTAGGCAATGGCAAGGTAA
+TGGGTAAATTGCCAGTATTGTTATTGACTGCGTTGTCAATGGCATTGGCTAGGACCCCAC
+TAGCGACGGTCAGTGCGTCGCCTTAAGCGTATC
+>ds2020-267_714
+GGACGTTCGGGCTTACACACCGCCATAAAGCCAAGTCCAGGGAACCTATAAAGCCCGAAC
+GTCCAAGGGAACGCCTAAGCCCGAACGTCAGCACGTCCGCAAGACCGGGATACTTGCGAC
+GTGCTGAGCCATCACCACTTGCGGACGTGCTGAGGTGTGCCTGATTGCGGACGTGCTGAG
+AGATGTCCGATTGCGGCGTGCTGCTCCTTAGAT
+>ds2020-267_715
+TCCGCAACATAGGTCCGGTCAGCACGTCCGCAAACGGTCTCCCTCAGCACGTCCGCAAGA
+ATAGGGGGCAGCACGTCGCAAAGTAGATGGGATTTGCGGACGTGCTACGCTTAGGCGACG
+CACTGACCGTATAGGTACCCCTGACGCACTGACCGTCTTTATTTGCCTGACGCACTGACC
+GTTTAACAGGCCATAAGCGACGGTCAGTGCGTC
+>ds2020-267_716
+GACGCACTGACCGTTCTAAACACAGTCAGTGCGTCAAGGGGCCAGATACGGTCAGTGCGT
+CAGCGGATGTGATACGGTCAGTGCGTCGCCTTAAGCGATCTAAGAGCAGCACGTCCGCAA
+TAACCAACGGCTGACCTTTGGGACGTGCTGAGGAGTGTCGACTTGCGGACGTGCTGAGGG
+TGGGGCTCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_717
+GAGTCCGATGACGCAGAGCATGACGCACTTAGCCTAGATCGCACCGTTGACGAGACTCCG
+CCGATATTGATCCGCCACAGCACGTCCGCAAAGTTTCGTTCCTATGACGCACGGACCCAG
+TTTCCGTTGCGGACGTGTGTCCTTACATAGATGGGAGGGCCGTCCGGGCCGGCACCTGTG
+AGCCAGGATCGTTAGTGCACGGTGGGCGCCATA
+>ds2020-267_718
+ATCTAAGGAGCAGCACGTCCGCAATCGAATGTCGGTCAGCACGTCCCAATTCTAAGTGCC
+TCAGCACGTCCCAAAGCGTTTCGGTTGCGGCGTGCTGCTCCTTAGATACGCTTAAGGCGA
+CGCACTGACCGTTGTATTTGGCCTGACGCACTGACCGTGACACATGCCCTGACGCACTGC
+CGTGTTGTTGTGGGTCCATACGGTCAGTGCGTC
+>ds2020-267_719
+CAGCACGTCCGCAATTCCAATTCTATGCAAAATATATTCAGGCGTTTTATTCGGACAATT
+AGCTCGGCAAAAGCAAAAGGTTTGGTCAGATAATCATCGCCACCAATTTCAATGCCCTTA
+ATCCGATCGCTTAAATCATCTTTAGCGGTTAAAAATAAAACAGGCGTATGCTTTCCAGCA
+GCACGGTAGCCCACCAGCAAAGCCCGAACGTCC
+>ds2020-267_720
+GGACGTTCGGGCTTTAAGTTGGGGATAGAAGCCGAACGTCCAGGGGTGAAAGTAGGCCCG
+AACGTCCAGACCACTCAGCAAGCCCGAACGTCCTTACTTCCAGACTCTAAGGAGCAGCAC
+GTCCGCAAGATCGTGGGTGTTGGGACGTGCTGAGGTGAGCCAGCTTGGGACGTGCTGAGA
+GCCTGATAATTGCGGACGTGCTGCTCTTAGATA
+>ds2020-267_721
+GACGCACTGACCGTGCTCCTACCCCTGACGCACTGACCATCTTCACTCCAGTTACGGTCA
+GTGCGTCAGAGGCCCAGTAACGGTCAGTGCGTCAGAGGCCCAGTAACGGTCAGTGCGTCA
+GGCTGTTCAACGGAGACATTAACATACGGTCAGTGCACGTCCGCAAGATACCGGTTGTGG
+ACGTGCTGCCGAGGAACGCTTGCGGACGTGCTG
+>ds2020-267_722
+GGACGTTCGGGCTTGTGCCACCCACTCTCCGAGTACCTTTGTGACTATTTCGCTCAGCAT
+CTGGTTCCGAAACGGTATCAGGATGGTAAGGAAGGCCAAGTCGGTGGCGAGACGGAGCAA
+TGGGTTCGATACCGTTTCTTTATGTCCTTACTTCCAGCGTCCGCAACAACCGGTTTGTGG
+ACGTGCTGAGGGTATCACCTTGCGGACGTGCTG
+>ds2020-267_723
+CAGCACGTCCGCAATCCAGACACGCTCGCACGTCCGCAACGTCAGAAAGTAGGTAGAGTA
+TGCCGCTTCGCTTGCCCTTTCTCCTTCCTCTGCAATAGGAAGTGAAAGAACTGCCTGCCA
+TTTCTTAGGTTAGGCTGCTGTGTGATGCTTACTCCATCTCAACGGATAAGCTCAGCTGGC
+TTACTAATAGAAAGATACAAGCCCGAACGTCCT
+>ds2020-267_724
+GACGCACTGACCGTTGGATAGGTTGTTGGTGCGACAAGGGATAGTTTTATACTGAATGGC
+ATCGCCAGCGACTGGGGTAAAGTAAGGGAGGGGTAGCTCTACGGTCAGTGCGTCGCCTTA
+AGCGTCACGTCCGCAATATGCGACTCCTCAGCACCCGCAATGTACTCCCTGTACGTTGCG
+GACGTGCTACCCCATACTATTGCGGACGTGCTG
+>ds2020-267_725
+TCCGCAATAGGTCTCGTCTCAGCACGTCCGCAACTGACCCCCGCTCAGCACGTCGCAAGT
+GTCATACCATCACACGTCCGCAAGCCACACACCCAGAGCTTTGCGGATCGCTTAAGGCGA
+CGCACTGACCGTTCATACTGGCTGACGCACTGACCGTGGTTAATCCTCTGACGCACTGAC
+CGTACAAAGGCCACGGATGACGGTCAGTGCGTC
+>ds2020-267_726
+TATCTAAGGAGCAGCACGTCCGCAAATCAAGTCAGATGCGGTTGCGGCGTGCTGACCACC
+TAGCCTTGGGACGTGCTGAGGGGCCGCCAATTGCGGACGTGCTGCTCCTCTGGAAGTAAG
+GACGTTCGGGCTTAGGTCGCCCCCTCATTCTGCGTGTAAGGCAGACGCTCTACCAACTGA
+GTTAACGACCCCGATATACAAGCCCGAACGTCC
+>ds2020-267_727
+GACGCACTGACCGTATACCACCCCGTAACGAACGGTCAGTGCGTCAGGGCAACCTGGACG
+GTCAGTGCGTCAAGCGGAGTTCTACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAAAA
+CGAGTTATCTCACACCAGGGACCTGGGCTTGCGGACGTGCTGAGGGCAAGTAGTTTGCGG
+ACGTGCTAAGCTGATAAACTTGCGGACGTGCTG
+>ds2020-267_728
+CCGCAAAAAGAGCTCACTTACACGTCGTGCCGAGGGATTCTGGATTGCGGACGTGCTGAG
+GTCCTCCATCTTGCGGGCGTGCTGGCAAAAAGAGCTCACTTTTCGGACGTGCTGAGGGAT
+TCTGGATTGCGGACGTGCTGAGGACCTCTATATTGCGGACGTGCTGACCAAAAGAGCTCA
+CTTTTCGGACGTGCTGAGGGATTCTGGTTTTCG
+>ds2020-267_729
+CAGCAAGTCCGCAAAATTAGGCGGTTCTCGAAAAAAGATAGCGAAAAAAATTATTCCTAG
+AGTTGAGACTAAAAGGAATGTATAAACCAATGCTTCCATAGATTTGATCGTGGTTTACAA
+TTATAGCTTCCATACCTGTTTATTGGGGATCGTCTCCCGGATAAATAAAGAACAAGAGTC
+AAAGAAAAGGCGAATTATTGCGGACGTGCTGA
+>ds2020-267_730
+GGATCCTATAGACCAACATTCTCAGTTAGGGCACCGGCTAAACAGGATTTTCGAAAAGAC
+ACTTCGAACTATGCCCCGGGGCTGACCGCTGGCAGTGCCCGAGTGGCGGAGAGCACGGCA
+CTACAGGAACAGGTACCTGCAGAGATTGTAGAATAGAAAATTACAAGCCCTCTACACAGG
+TATCGCCGACTAGACACTTCTATACGCCAGTA
+>ds2020-267_731
+TCGCTTAGGCGACGCACTGACCGTGCTGGTACCCCTGATGGATTTAGAGTATGCTATTAA
+AGCTCTAGAAGAAATCTTAGACTAAACTTCTGACCCTACAGCTAACAGTATCGCTGCTGA
+CGCCTTAGAAAAAGTATCTCAAGGTGATTACTTTGAATGTGCGCGGTTTCCCTCTCTAGT
+AAGACAAGTGCCGAAACATTGCGGACGTGCTG
+>ds2020-267_732
+TCAGCCGTCCGCAATGGCCAGAAAGTGTATCCCTTGATGGATTTGAATTGTGTAATCCCA
+TTGGATTCCCAAAAGCAGAAGATCCTTTATGTATATTTTCCTTCATATATGATTTCTTGT
+CCTGGAGAACTTCAAATATAAGAACTTATATTTTAATGATGAACGTCATATTTTTGAAAA
+TGCATTAACAACCCTGGCTTGCGGACGTGCTG
+>ds2020-267_733
+TTCCCCCATTGCCACCCTCATCCACTCTGTAGGGGGGTGCGGTCAGTTCTCTCTTCGCCT
+GTTACGCCACCTACAGAGTGGAAGATTGTGGCAATGGGGGAATTTCTCGAATACAAGGAT
+TGCAGTGGACGAAGGCGAAGGAGCACACCCAACGCCCGAAGGGAATCGGCAGCACGTCGC
+AAAATCAGGGCCCGGTTATTGCGGACGTGCTG
+>ds2020-267_734
+CAGCACGTCCGCAATTGGTAGATCCTCAGCACGTCCGCAATACACCCTCGTTAGCTTGCG
+GACGCTTAAGGCGACGCACTGACCGTCGCGTGGGCCCTGTCATGGTAGGAATAGAATTTG
+CATCAACATCGATTGAGCGCTCAAATGAGCCTTCATCGACATTGTTGCCAATTTATCTAT
+CTCTCTGTCCTTTAAATACATCACAGCGTTCT
+>ds2020-267_735
+CAGCACGACCGCAATTTTCGTCACCTTGGGGTTTTACGGCTACGGATGATAAAGTAAATC
+ACTGTAATTGCTAAGTAGCATCAAGATTTTGCAGCCATGGTATCGCTTTATATTCAAACC
+GGATGATTAGTTGTCACCGTTCTGTCACGAATCAGTCAAGCCACTGTCACATATCCCCTC
+TAACATACTCTAGTAAGTGCGGACGTGCTGCT
+>ds2020-267_736
+CCCTCAGCACGTACGCAAATATGATTGGGTTCTATATTGGCACCTAAATGGGAAACCGAA
+TCGGACCAAACCCTTTGTCAGGCTATTGTTCTCTTGTTTTGTTCCCTAAAAGTCATAGAG
+TAAGACATCAATTTATCAATAAGATCAAATATTTTTTTGATTACATGATGGACTCCTCTG
+AAAAACATCGGCGCGCGTTTGCGGACGTGCTG
+>ds2020-267_737
+ATCGTCTGGACTTCGGGCTTCTAACAGCCCCTGAGAAAAGCCCGAACGTCCTTACTTCCA
+GAATCTAAGGAGCAGCACGTCCGCAATAGATCTACCTTTTATTGCGACGTGCTGAGGGCA
+ATGATGTTGCGGACGTGCTGAGGGTACTCCAATTGCGGACGTGCTGGGCCTTATCTCTTG
+TTGAAGGGCACACTCCGGAACTACAACCACCC
+>ds2020-267_738
+ATCTAAGGAGCAGCACGTCCGCAATTTGCTATCCCTCAGCACGTCGCAAGTCCCACTCCC
+TAATGTTTGCGGACGTGCTACCCTGTGTCCTTTGCGGACTGCTGCTCCTTAGACACGTCC
+GCAACCATCCCAGGCTAATTGCGGACGTGCGGGTCTATCCTCTTGCGGACGTGCTGAGGT
+GGCCAATCTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_739
+GGACGTTCGGGCTTATGGCTGCAGATGGTCGATTTATCCAAGAAATTGAACTGGTTAAAG
+GGTATAATCAGCTCGACAAGGGTCGATTAAAAGCCCGAACGTCCTTACTTCCAGAGGAGC
+AGCACGTCCGCAAACGATGAGGGATATATTGGGACGTGCTGAGGAGGTATCTGTTGCGGA
+CGTGCTGAGGCCAATATATTGCGGACGTGCTG
+>ds2020-267_740
+GACGCACTGACCGTTTGTCCGTCCCTGACGCACTGACCGTTCCTGACTCCTGACGCACTG
+ACCGTATACTAGCGGCCGGAAGACGGTCAGTGCTAGCACGTCCGCAAAGACCCTACCATA
+TTGCGGACATGCTGACCGTAAGATCGTTGCGGACGTGCTGATCCACTGCAGGTTGCGGAC
+GTGCTGAGGGAATGAAACTTGCGGACGTGCTG
+>ds2020-267_741
+GACGCACTGACCGTATCTACTTTCCTGACGCACTGACCGTAGGTATAGGCCTGACGCACT
+GACCGTATTTGCATCCGTGACGCACTGACCGTCCTTATCCGGGGTGAAACGGTCAGTGCG
+TCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGGGCAGGAGACTGTGATTGCGAC
+GTGCTGAGCTGATGTAAATTGCGGACGTGCTG
+>ds2020-267_742
+CAGCACGTCGCAATACAATCGATCTAGCTTGCGGACGTGCTGAGGTATGCTATTTTGCGG
+ACGTGCTGAGGGGATACTGGTTGCGGACGTGCTGCTCCTTAGATTATCTAAGGAGCAGCA
+CGTCCGCAATCATGACCGAGTTACTATTGCGGAAGTGCTGAGGGAGTGACACTTGCGGAC
+GTGCTGACACTGACCGACTTGCGGACGTGCTG
+>ds2020-267_743
+GACGCACTGACCGTCTTAGTTTCAATAACGGTCAGGCGTCAGGGGCTGGAACACGGTCAG
+TGCGTCACGGAGGTAACAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGAGCAGCACGT
+CCGCAACAACGCTGGGGTATTTGGGACGTGCTGAGGGGCTAAGCTTTGCGGACGTGCTGG
+GGGATAGGCCTTGCGGACGTGCTGCTCCTTAG
+>ds2020-267_744
+GTCCGCAATCCGATGGTCTCAGCACGTCCGCAATTCATTGGGCCTCAGCACGTCCGCAAG
+TGCCCTTCCTCAGCACGTCCGCAGATCGGCGTAATTGCGGACGTGCGCTTAAGGCGACGC
+ACTGACCGTACCCGAACCCTTAAATGACGGTCAGTGCGTCAGCGGAATGCATACGGTCAG
+TGCGTCAGGGATACCCCGACGGTCAGTGCGTC
+>ds2020-267_745
+CAGCACGTCCGCAAGGGGGCCCTTAGTCTTTTGATTAGAGTAGGGGTCGCGAGAGAGCAG
+AGCGTACCGCCCTGCCATAGTCGCGAGTCTGTTTATAGTCGCGACTGTTGTCATAGTCAA
+CAAGGTTGAAACTTCCAGGAAAAAACTTCGAATTGGGAGGGCGATCCTCCCGGTGAACTG
+ACCGTACCCCATTCATGTTGCGGACGTGCTG
+>ds2020-267_746
+CAGCACGTCCGCAAGTAAAATGGCCTTTGGCTATATATTTCCCTGTAGAAATGTACTTTG
+TACAAAAGAAAATTGGGTCCTGGACAAGAAAATGGATTGTTCTAGAGGCATTCAGTTTAG
+TTTGCTTTCTTGTCACAGTTGTGGGGGTTATTGGATCAGTTCAAGGACTTATAAGTGCCA
+AACTTAGCTAGGGAGTCTTGCGGACGTGCTG
+>ds2020-267_747
+CAGCACGTCCGCAACGAAATATTTATTCACGAGATCTGACGATTGATGATTTTATGAAAG
+TAGGTTTGAATGAATTCCGCTCTTTGATTTTGGTCTTTCTTGGTCACTATAAATTGGTTT
+AAAATGCGAAGAATTGACACATGAGCTTGTAGGGCCCGTTGAAGTCCCCGAATAAGGGGG
+AAAAAAGAGGATGCTACTTGCGGACGTGCTG
+>ds2020-267_748
+CAGCACGTCCGCAATTGACCAGTCCTCCATTGTCCCCTCAGCCATGGAAAGAGAATCCAT
+GGGGAGTTACCACTGAAGCCGTTCAGTTCCACCAGAATATTAATTCTCAAACTAACATAA
+ATGGCGTTGCTTGGGGAGCACATGTGTACCATGCAAATGATTCCACTTTATCTGTTGCTG
+CTTTCAGAGGAGAGAGCTTGCGGACGTGCTG
+>ds2020-267_749
+CAGCACGTCCGCAACAGCGCATCAGTCATTCCTGGTTACTAAGAAACTGTTCGACTATAG
+AACTGATTGTGAGAATTACCAACCTTTGCGCCTTACCTGTCCTGTGGACAGTGTTGCGGT
+ATGAATCCACTCTTCGCGGATCCCACTTTCGACTGACCGAAGATCGTCTCTTCCCGCACC
+ATGATGTACATGTCAGCTTGCGGACGTGCTG
+>ds2020-267_750
+CAGCACGTCCGCAAGGCGGATACGCTCCCCAATCCACACCGCCATCTCACCAATCGCAAG
+GTCGCCAATACGGTGGATGGCAATGGCGTTTTCGATGTCAAACTGGCCTTTGGCTTTCAA
+TCAGTTTTTTGCCTTGATTGACTGCCAGCTGCTCGTAGCCATAATAAGTGAGCTTGCTAA
+CAGGGAGGCGTAAGGTCACGGTCAGTGCGTC
+>ds2020-267_751
+GACGCACTGACCGTAAACTCTGCCCTGACGCACTGACCGTCTTTTCTGCCCTGACGCACT
+GACCGTAGTCTATGGGGTTATACACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAATC
+TCTATGGCCTAACACTTGCGACGTGCTGAGGAGACGGACGTTGCGGACGTGCTGAGGGAA
+AGGTACTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_752
+CCGCAACTGCGTGGACCTCAGCACGTCCGCAACCAACTGAGCCTCAGCACGTCCGCAAAC
+ATCGTGTAGTGCGACGGCTAGGGGTGTGGTCTTGCGGACGTGCTACGCTTAAGGCGACGC
+ACTGACCGTTCATTGGACCTTGACGCACTGACCGTAAGTGTTTCCGTGACGCACTGACCG
+TCAATACCTGGAGTCGCACGGTCAGTGCGTC
+>ds2020-267_753
+TCCGCAATCGGTTGGGTCTCAGCACGTCCGCAAGCCTTTTTCACTCAGCACGTCCGCAAC
+TGAACACCCCTCAGCACTCCGCAACCGGGGCCAATTTGCGGACGTGCTGCTCCTAGATCA
+CTGACCGTACCAAACACCGTGCCCCACGGTCAGTGCGTCAAGGCTAGCAAAACGGTCAGT
+GCGTCAGGCAAGAATAAACGGTCAGTGCGTC
+>ds2020-267_754
+GACGCACTGACCGTTTGTCTTGCCCTGACGCACTGACCGTAAATAGTTCGTTGACGCACT
+GACCGTTGTTACCCCTTTACACACGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAA
+GATCCAACCAGTGTAGATTGCGGAAGTGCTGAGGACGGACTACTGCGGACGTGCTGAGGG
+GTCACGGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_755
+GAGTGCCTGTAGTCGAAGGGGGTGTTGTTCGAATCTATGAAAGGTGCAGCACGTCCGCGT
+CCGCAAAGTGGTGGACTTGGGACGTGTGAGTGCCTTAGATTTGCGACGTGCTGACCGGTT
+GACTATTGCGGACGTGCTGCTCCTTAGATACGTCCGCAAGCCAACGGGGATGTAATTGCG
+GACGTGAGGGAAATAGTTTGCGGACGTGCTG
+>ds2020-267_756
+CAGCACGTCCGCAAACTTTCACAGCTCAGCACGTCCGCAAACCCCCGCGCTCAGCACGTC
+GCAATCACCCCTCATTGCGGACGCGCTTAAGGCGACGCACTGACCGTCAGCATCATCATG
+ACGGTCGTGCGTCAGGTGTCTTCGTACGGTCAGTGCGTCACGGGAGAAAACACGGTCAGT
+GCGTCAGGCGGCAAGACACGGTCAGTGCGTC
+>ds2020-267_757
+CTGGAAGTAAGGACGTTCGGGCTTTAGGTACCATGGTAAGCCCGAACGTCCAATCTAAGG
+AGCAGCACGTCCGCAAATTCAACGACCTCAGCACGTCCGCAAGGTATATTCCGTCAGCAC
+GTCCGCAACTGGCTCGGATTGCGGACGTGCTGAGTGTTACGTCTTTGCGGACGTGCTGAG
+GGGGCTAACGTTGCGGACGTGCTGCTCCTTA
+>ds2020-267_758
+TCTAAGGAGCAGCACGTCCGCAAGTCGGTGTCCCCAGCACGTCCGCAAGTGAGTGGCCTC
+AGCACGTCCGCAACTAAATTCGGGTCAGCACGTCACAAATATGCTCTTGCGGACGTGCTG
+CTCCTTGAATTCTGGAAGTAAGTACGTTCGGGCTTGCCAAGATCCTTGGAGTTCGGGCTT
+AGTACACCTGGAGTATGAAGCCCGAACGTCC
+>ds2020-267_759
+GGACGTTCGGGCTTTGGGGTGTGTATTTTACTTGTCTTTGGTGACTTTTGAAATTTTCTT
+TACGGTGGAGTTTCAAGAGTTTTCGTGGGTGTTCCTTGTGGGTAGTGTGTAGTTTGTTGC
+TTTGATTTTCTCTATGTACTTTGGGTAGCATTGTTTAAGGCTACATGGGTTTTGCGGACG
+TGCTGACATAGGCCCCGTTGCGGACGTGCTG
+>ds2020-267_760
+CAGCACGTCCGCAAGTACGTAACCGTCAGCACGTCGCAATGGGACACCTCTCCGCAAATG
+GGTGGTAGGTTGCGGACGTGCTGTCTGGAAGTAAGGACGTTCGGGCTTACTTAGGAGGGT
+ATGAAGCCCGAAGTCCAGGGAATTGATAAAGCCGACGTCCAGGGATGACAGCAAGCCCGA
+AGTCCAAGGCAAGAAACAAGCCCGAACGTCC
+>ds2020-267_761
+CAGCACGTCCGCAAAATTTGGGTTGTGGACGTGCTGAGCGGGATGTTTTGCGGACGTGCT
+GAGTGAGTGATAATTGCGGACGTGCGAGACGCTTAAGGCGACGCACTGACCGTCTTTGCT
+CGCCTGACGCACTGACCGTACCTTATCGCCTGACGCACTGACCGTCTTATTTTCCCTGAC
+GCCTGACCACGGTTGATACGGTCAGTGCGTC
+>ds2020-267_762
+GACGCACTGACCGTAACCTATACACTGACGCACAGACCGTAACCTATACACTGACGCACT
+GACCGTTAAACCGCGGCTCACTGACCGTTATGAAAGGCGTGACGACACGGTCAGTGCGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGCGCATTGCCCTCAGCACGTCCGCA
+AACCCCAGGCCTTAGAAATTGCGACGTGCTG
+>ds2020-267_763
+GGACGTTCGGGCTTGTAGATGCGGGTGATGTCGCTGGCATAGCCGTGGAAGCTGGCGCCG
+GCATCGATCAGGAAGCTGCGCAGCAGGTCGGGAGGTCATGGTAAAAGCCCGAACGTCCTT
+ACTAGTCCGCAAGATTCATCTGCTCACACGTCCGCAAACAAGACGTAATAGTTGCGGACG
+TGCTGAGGGACATTTCCTTGCGGACGTGCTG
+>ds2020-267_764
+GACGCACTGACCGTTTGAAACTGGGTGTTCTACGGTCAGTGCGTCAGCAGATCATTGACG
+GTCAGTGCGTCAGGGGAACCCCCACGGTCAGTGCGTCAGAATAGTTACTACGGTCAGTGC
+GTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATTGTATGTCCTTGGTTGCGACG
+TGCTGACCTGATAAAAGTTGCGGACGTGCTG
+>ds2020-267_765
+CAGCACGTCCGCAAAGGAACTTGGGTAGCACGTCCGCAAGGAGATACCAGTTAATTTGCG
+GACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTTGACGACGCTCTGACG
+CACTGACCGTTCTCTGACCCCTGACGCACTGACCGTTGCCACATCCCTGACGCACTGACC
+GTGATACCATTAGAGAGACGGTCAGTGCGTC
+>ds2020-267_766
+CAGCACGTCCGCAAGCGAGGTTGGATACCAATCCATGTCCCCTAACTGGTCTACCGTATG
+TCCAGGTCTGGGTTTGAACGGGGGGATGCCCCCCCACATAAATGGCATCATGACAATACA
+CCCCACGACATGCCAAGGCGCAGAGGGGTAGAGCGGCCGCTCGTTGATAAAACGGCCAAA
+CCACCAGGGGTAGGCGGTTGCGGACGTGCTG
+>ds2020-267_767
+CCGCAAAGTCAGATCCCTCAGCACGTCCGCAAGGACCCTTACCTCAGCACGTCCGCAAAT
+AACCTGGGCTGTTTTGCACGTGGAGTCGACTAAAGTTGCGGACGTGACTGGAAGTAAGGA
+CGTTCGGGCTTTTGTTAGGTGTTAGGTGAAGCCCGAAGTCCAGACGATGATATAAGCCCG
+AACGCCAGTGACGGGACAAGCCCGAACGTCC
+>ds2020-267_768
+CAGCACGTCCGCAAACTGAAGGGAGTGGGGCTTGGGTTGTGGCTGGAGGTGCGGGTGGTC
+TGAGTTTTATACAGCCCGTGTTTCTAAAATTGGTGTAATAGATTAGGGCCTTAGCATGCA
+CAGAAAGATTAATTGAATCTTTGTTTTGTCTTGCTAAAAGTGGAAGATGTTGGATTGAAG
+CAGAGATGTGGCAAAGGTTGCGGACGTGCTG
+>ds2020-267_769
+TAGCACGTCCGCAAGTGGGATTTGGTGGACACAGATGCGGCAAGGTTGCTCGAGTTGGTC
+CCTGAGTTCGTTTGTCAATGGCAAAATGCGGATTATGATGGGAATGACGAGGAAAGCAAT
+TTGGCGTTATGTAGTGCTCCGCCGAAATTCTGACGTTTTTGGCAGATGTCAGTTTTCGAG
+GGGGAAGGGTGCGGGCTTGCGGACGTGCTG
+>ds2020-267_770
+CAGCACGTCCGCAACGCTCTCCCCTCCGTACCGTAAGGTGCGTGGTTTTTTGCTTTGGGC
+GTTATTCCTCTCCTTGAAACTTTCTTACCTTCCTCTTGCAGACTCGACATTCAGGCCGGA
+TCTCGGTATTGTTAGCTGTCTGGATGTCTAAACGTTTATACGTATGCTTTGAGGATTCAA
+CGATATGGACGCTTCATTGCGGACGTGCTG
+>ds2020-267_771
+CAGCACGTCCGCAATCGCTTACCCCTCTACCATATAAGTATTCACCTACAGGAATATACA
+ATTTACTTTGACCCTACTCTAAGCATAACCAGTTATAACCTTCTGCTTCACCCAAGAATA
+ATTTTTGGATTACTTCAACAAGAAAATCACGATTACAAAAACTAGGAACACTATCTGCAG
+CATCACGGTCATCTATTTGCGGACGTGCTG
+>ds2020-267_772
+TACGAGGAATTGGAGCAAACGCACAGAAATGCTTTTCCTTCAGCCCAAATACCTAGATTT
+TTCCAAGATTTCAAGAGAGCTGAACTTAGTGATGAGGTTGGTAAGGGTAAAGAAAATAAG
+ATTAACCGCAATGATTTCGTGAAAATAGCAACCCACACGGGTGGCAAACAAAATACACTA
+CGAGACCGATATCCTCTTGCGGCCGTGCTG
+>ds2020-267_773
+CAGCACGTCCGCAATTTGACTGATGTGCAATATTATGTGACCCAGCAAAACGGCACTGAG
+CGTCCTTTTAGCCATGAATATGATCACCAATTTGAACCTGGAATTTATGTGGATATTGTG
+AGTGGTGAGCCGCTTTTTAGCTCATCGGACAAATATGACTCAGGTTGTGGTTGGAGAGGC
+ATTTTGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_774
+CAGCACGTCCGCAATGCACGCTTCCTCTTCTTTCGAATGCTAATGTGTGGTTTTGTCCTA
+CTTCCAAAGTCACAGAGGGAGCTGGAGCCGATTTTTTGTTTGACTACCTTCAATCGACGG
+ATGGTGCTAAAGGAGTTGGGAGAAGAGTCCACCTATAGTTATAGTAGTTAGAAGCCCAGC
+TTCAATCGCTCAGAGGTTGGGGACGTGCTG
+>ds2020-267_775
+GGACGTTCGGGCTTCACCTGCACCCTGGACGTTCGGCTTGTATCCACTCTGGACGTTCGG
+CTTTATAGTGCCCCTAAAGCCCGAACGTCCTTACTTCCAGAAGGAGCAGCACGTCCGCAA
+TCGGTCCGTCCTCAGCACGTCCGCAAGGAACTTTCCCTCAGCACGTCCCAAGGCACCCCA
+ATTTCGTTGCGACGTGCTGCTCCTTAGATA
+>ds2020-267_776
+GCAGCAAGTCCGCAAAAACGAGCAAATTGCAAGAGAGGAGCTCTACCAACTGATCTATAT
+CCCCCCGAGCCAAGTGGAGCATGCATGAAGGAGTCAAATGCTTCTTCTATTCTTTTCCTT
+GGCGCAGCTGGGCCATCCTGGACTTGAACCAGAGACCTCGCCCGTGAAGTAAATCATCGC
+ACCTACAGTACAACTATTGCGGACGTGCTG
+>ds2020-267_777
+GGACGTTCGGGCTTTACCCCATCCCTCAGAAAAGCCCAAACGTCCAACGCTACGGTGAAG
+CCCGAACGTCCACTGCATGATGCAAGCCCGAACGTCCTTACTTCCAGGGCACGTCCGCAA
+AACAAGCCAGGTTAGTTGGGACGTGCTGAGGGGGTCAAGTTGCGGACGTGCTGAGGGACG
+TAACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_778
+GGACGTTCGGGCTTTGGTCCTACGGTGGCGTTCGGGCTTCAGAGAGGTAGGCAAGCCCGA
+ACGTCCTTACTTCCAGGATCTAAGGAGCAGCACGTCCGCAATCTATCATCCCTCACACGT
+CCGCAAAGGTATGCATTTCGGACGGCTGAGCGTAATACGGTTGCGGACGTGCTGCCCAAT
+TACGCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_779
+GGACGTTCGGGCTTAGCCGGTCCCGCTTTTTATGGTCTTTTCCACGTAAACGCAGTTGGT
+TTTATATCCATTGTTCAAATAGCCGTAAGCGGTGGTTCAGGAAATGTTTTAGAATAGGTT
+GTTACAGAATACGCTGTGGGACGTCGAGGAGTATTAATTTGCGGACGTGCTGAGGCGGAA
+GTTTTTGCGGACGTGCTGCTCCTTAGATAG
+>ds2020-267_780
+CAGCACGTCCGCAATAGCATGTAGCTGGTTGAGTAAGATTATTTTCCTAATGCTTTTCTG
+AATATGTCAAGCAAAGAGAAAGGTGACCTTTCCATAAAGAAATTCATGTGCCTTTATATC
+ATGGGCATCTTTGATGAGAAGCTTATGTGCCCAAGTGTTGGGCAAGTCTTATTTATTTAT
+TTATTTCCTAGGACACTTGAGGACGTGCTG
+>ds2020-267_781
+GACGCACTGACCGTGCGAAAGGCCCTTAATTACGGTCAGTGCGTCAGGGAACTAGGAACG
+GTCAGTGCGTCAGGGCAATAGAGACGGTCAGTGCGTCGCCTTAAGCGCACGTCCGCAATC
+ATAGAGTATTGTTGTTGGGACGTGCTGAGGAAAAATTACTTGCGGACGTGCTGAGGATAA
+GTTGCTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_782
+GGAGTGGCTGGAATACAGACGTGGCCGGGGCAACTCGAGTTCAGAAGTGTCCTCTTCCGA
+TCTATATAAGGAGCAGCACGTCCGCAAAGATCCGGGAGTATTTGGGACGTGCTGAGCCAT
+AATGTATTGCGGACGTGCTGACTCGAGCCCTTTTGCGGACGTGCTGCTCCGTAGATACGC
+TTAAGGCGACGCACTGAGCGTGGGGGCTGG
+>ds2020-267_783
+GACGCACTGACCGTCATTTGATTTCTACCAGTTCAACTAATGAGGAAAGGGTAGGAAGCA
+ATGTGAAAACCAGGCCTAGAGTTTTCGATAGCAAAAAGAGGCTTATACGTTATTCTGGGA
+TGCTTCGAACCTGTGTTTTGCAAGGGTCTTTGAATGAGGGGAAGGCTATTCATGGGCAGG
+GAGTAGAAAACGGGAAACGGTCAGTGCGTC
+>ds2020-267_784
+GACGCACTGACCGTCTCCACGGCTTTTAACACGGTCAGTACGTCAGGCGTTTATATGCGG
+TCAGTGCGTCACGTCACCAGGTGCGGTCAGTGCGTCGCCTTAAGCGTAGCACGTCCGCAA
+GTTAAGGCAGTTAGGTTGGGACGTGCTGAGGGGTCTACCGTTGCGGACGTGCTGCCCCTG
+CAACGTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_785
+CAGCACGTCCGCAAGCGGATAACATTGGACGTGCTGACTGCTTGATAGTTGCGGACGTGC
+TGGGCCAAGGTTATTGCGGACGTGCTGCTCCTTAGATATCCCTTGACGCACATCTAAGGA
+GCAGCACGTCCGCAATTATTTGCACCTCAGCACGTCCGCAAATTACACTCGCTCAGCCGT
+CCCAAGCCGATTGTTGTTGCGGACGTGCTG
+>ds2020-267_786
+GGACGTTCGGGCTTCCTCCACTCGCTCAAAAAACATACTGCAAGCAAGGCCCAGTGGTCC
+GTGCGTCGATGCACTTGCTTGTATCCGCAAGCGTCTGACACCTTCATCACCTGCCACAAG
+CCCGAACGTCCTTTATCTAAGGAGCAGCACGTCCGCAAAGGGCAATACCTCAGCACGTCC
+GCAACAAGTGTGCCTCATTGCGACGTGCTG
+>ds2020-267_787
+GACGCACTGACCGTATTCAAATCCGTGACGCACTGACCGCTTGATGAGACCTACGCACTG
+ACCGTGTTAATCCATAGACACACGGTCAGTGCGTCGCCTTAAGCGATAAGGAGCAGCACG
+TCCGCAACCCAACCCCCCTAGCTAGGCGCCCTATCCGAATGCCATGAGATTTGCGGACGT
+GCTGAGGACATAGAACTTGCGGACGTGCTG
+>ds2020-267_788
+GGACGTTCGGGCTTCTGTCTCTCCTTGATAAATGGGCTTAGCCACCACGTTGTGAGTCAA
+GTTATTACCAAATCTTACCCCCATGATTAAGCCCGAACGTCCTTACTTCCAGAGGAGCAG
+CACGTCCGCAACACACTGGTCTTATGTTGGGACGTGCTGAGGGCGAATAACTTGCGGACG
+TGCTAGGGGTTAGGGGTTGCGGACGTGCTG
+>ds2020-267_789
+CAGCACGTCCGCAACCCGACTCCTATCACTTTTCAAAAATACAATCTTACTCCCCGAAAG
+CCGAAAAATATGAGTGAGAGGAGAGCCTACGAACCCCTACTTCATCACAAATATCTCAAA
+GCCTCCGCAGCTCACCCACACGAAGAAGACGGCAGATCCCTAAAAGCGGCGAAACACAGC
+ACACACCAAATCCATGTTGCGGACGTGCTG
+>ds2020-267_790
+CCGCAAAGATAATGGCCTCAGCACGTCCGCAAACATCATCACCTCAGCACGTCCGCAACT
+AACTCCGACTCAGCACGTCCACAATCATGTTTTTGCGGACGTGCTGCTCCTAGATACACT
+GACCGTAGCGTATGGGTTGAAAAGACGGTCAGTGCGTCAGGGGCGATCACACGGTCAGTG
+CGTCAGGGTGGATAGAACGGTCAGTGCGTC
+>ds2020-267_791
+CAGCACGTCCGCAAATGTTAACCCGTCAGCACGTCCGCAAGCCGCCCGCCCTCGCACGTC
+CGCAATCGTGTCTAGTGTTTTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCA
+CTGACCGTTTTCTTCTACCTGACGCACTGACCGTTCATCAACGCCTACGTGTCGGTCAGT
+GCGTCAAGGTAACCACACGGTCAGTGCGTC
+>ds2020-267_792
+GACGCACAGACCGTCGTTAAGGGGATCCTTACGGTCAGAGCGTCAATAGATAAATCACGG
+TCAGTGCGTCAGGGGATGGGCTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAG
+CACGTCCGCAAGATGGTGGCGGTATTTGGGGACGTGTGAGGGTCGTGGAGTTGCGGACGT
+GCTGAGCTAAAAGTACTTGCGGACGTGCTG
+>ds2020-267_793
+TCCGCAAAGAAAGCCCCCTCAGCACGTCCGCAATCGTCACACGCTCAGCACGTCCCAATC
+TATAGGCCCCAGCACCGTCCGCAATATCGAGTCTGTTGCGGACGTGCTCTGGAAGTAAGG
+ACGTTCGGGCTTATCACCCCAAATGAAGCCCGACGTCCAGGGAGAAATTAAAGCCCGAAC
+GTCCAGGGAGGTTAGGAAGCCCGAACGTCC
+>ds2020-267_794
+AAACTTCGCACCCTCAGCACGTCCGCAAATTCGGCCTCCTCAGCACGTCCGCAAGGGTTG
+TAACTTGCGGACTACGGCGACCACCGAGGTCTACACATAGAGGTACACTGTGTCGCTAGA
+CGAGGGTTTTCCGATCTGTCGGGGGAGCAGCACGTCGCAAGTGGAGTGTTATTGCGGACG
+TGCGAGACGTGCTGTGTGGGGGGCGTGGTG
+>ds2020-267_795
+CAGCACGTCCGCAAACTCCTTTTCCTCATCTCATTAAGTTCTCTGATACAACACGTAAAC
+GCTCTAATTTTAATGATTATTTTATGATCCTATCTTTTCTTTTAACTTTGACTTTTTATT
+ACGACCAATTTTATTGTTTTATTGTTCGACAAAAGGTTCATTTATATACAATAATCGGAT
+TGTAGCGGGTTTAGTTTGCGGACGTGCTG
+>ds2020-267_796
+CAGCACGTCCGCAAGCCTTGTTCATTTGTTTCATGATGAGGCGATAGATGAGCGTTAGCT
+CCTCAATCGGGATGCGAACTTTCTCGCGTCCAATGACCTCCCGGAATTTCTTTCTGGCAG
+GTTCTGCCACCCACCTAGGCAGGTAACCCATGTTTCTCGTTTGAGAGAAACCTCCCATGG
+TATAGACCCTGAAGATTGCGGACGTGCTG
+>ds2020-267_797
+CAGCACGTCCGCAATTAGCCCTCCTTTAGAAAGGAATCTCCCCTACCATATATATATTTT
+TTCCTCAAATAAAAAGGTGACATGACAAAAATAGAAATAAAAATAAAAAGGTGCCAAATG
+TGCATCCAATCAATTTCTCATTACTGACGAACAAAATCAAAGAAACTACAGATTTCATTT
+GAAACCCTGAATAGATTGCGGACGTGCTG
+>ds2020-267_798
+CAGCACGTCCGCAACCCGGTCTGGCTATCTCTATCAATATTATAAAGTTTCTTGGTGGTT
+CAGTGCCTCCAGTCCCAAGCGGGGCTGGCCGAGATTCATTTCAGCCGAATCTTTCACTTC
+GACTCGATACTTGGTGAAGGATAGTTGCGACGTGCTGAGGAACAGAGGTTTGCGGACGTG
+CTGACGGTGTGGTATTTGCGGACGTGCTG
+>ds2020-267_799
+CCGATCTATCTAGGAGCAGCACGTCCGCAATGGTATTCCCCTCAGCACGTCCGCAAAAGC
+AATCCCCTAGCACGTCCGCAACGTGCTGGTACTCAGCACGTCCCAAGTTTAAGCACCTCC
+GGACCTTTGCGGACGTGCTAGGGGATTGCTTTTGCGGACGTGCTGAGGGGGCGGATATTG
+CGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_800
+GGACGTTCGGGCTTTTTCCGACCCCTGGACGTTCGGACTTCGACACCCAAGCCCGAACGT
+CCTACTTCAGGGCACGTCCGCAAACATGTCCCTGTCATATTGCGGACGCTGAGGGGCTTT
+GGCTTGCGGACGTGCTACCTCGAAATCGTTGCGGACGTGCTGAGGCTAATCCAATTGCGG
+ACGTGCTGCTCCTTAGATAGATCGGGAGA
+>ds2020-267_801
+TATCTAAGGAGCAGCACGTCCGCAACGCGTTATACCTCAGCACGTCCGCAATTCTCACAC
+GCTTTCCCTTGGGACGTGGAGGGCGGAGTCATTGCGGACGTGCTGAGGCAGGTCCTTTTG
+CGGACGTGCTGGATGACCATATGCTTGGGACGTGCTGATGGAGATATTGTTGCGGACGTG
+CTGAGGCAGGTCCTTTTGCGGACGTGCTG
+>ds2020-267_802
+GACGCACTGACCGTAACACAGCGCCTAACGCACGGTCAGTGCGTCAGCAAATTTCATACG
+GTCAGTGCGTCAGGTGGTGATGTACGGTCAGTGCGTCAGGAGGTAACCTACGGTCAGTGC
+GTCGCCTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGACATGAGTTCTCCACGTCCCAA
+CACACCCTGAAACATTTGCGGACGTGCTG
+>ds2020-267_803
+GACGCACTGACCGTCAAGATGATCATTAAAACGGCAGTGCGTCAGGAGGCAATACACGGT
+CAGTGCGTCAGCTACAATCACACGGTCAGTGCGTCAGGGGTATCGCTACGGTCAGTGCGT
+CGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAACCCACGAGACTTGATTGGGACGTG
+CTGAGGAGTATGTCATTGCGGACGTGCTG
+>ds2020-267_804
+GACGCACTGACCGTTATGATTCTGCTGACGCACTGACCGTCCTCTCCCACATGACCACTG
+ACCTGTCTACACGCAAACGCACGGTCAGTGCGTCGCCTTAAGCGCGTCCGCAATCACACC
+TCTGTATTGCGCAGGAACTCACCTTGCGGACGTGCTGACTGAATGTTTGTTGCGGACGTG
+CTGAGAGGAAACGCGTTGCGGACGTGCTG
+>ds2020-267_805
+GGACGTTCGGGCTTGAAACTTTGGGTGAGTTGGTCTTTGTTAAAGAGTTTGGGGATATAT
+TTTAGAGCAGCAATGGCGTTAAGGGGTTGGTTGTACCATGACATAGGGTAGTCCTCAAAG
+CCCGAACGTCCTTACTTCCAGTGCACGTCCGCAATCTCTAGACTGTGGGGATTGGGACGT
+GCTGAGACCGTTATTTTGCGGACGTGCTG
+>ds2020-267_806
+GTCCGCAAAGCTTCCCCCTCAGCACGTCCGCAACCATCATGCCCTCAGCACGTCCGCAAA
+GAAGACGCCCTCAGCACGTCCGCAACTATAAACCCCTTTTTTTTTGCGGACGAATCTAAG
+GAGCAGCACGTCCGCAACGGTTTCAGCTTGGGACGTGCTGGGGCATTTTGTTTGCGGACG
+TGCTGGCCGGGATTATTGCGGACGTGCTG
+>ds2020-267_807
+CCGCAATGCATATTTCCTCAGCACGTCCGCAATTCAAACTCGCTCAGCACGTCCGCAAGT
+TTAATCCTCTCAGCACGTCCCAACGGATAGGCTTTGCGGACGTGCTAATCTAAGGAGCAG
+CACGTCCGCAAAGCTTTCCCGATCAGCACGTCCGCAAACCTCTTTCCCTCAGCACGTCGC
+AATACCCGTGGGCTCTTGCGGACGTGCTG
+>ds2020-267_808
+GTAAGGACGTTCGGGCTTCACACCACACTTGGCGTTCGGGCTTTCAAGATGGGGGGACTT
+CGGGCTTACAGGCGCGAGTAGAAGCCCGAACGTCCTTACTTCCAGTAGCACGTCCGCAAA
+CTAAGAACTGTTGGGACGTGCTGACGGAGAACATATTGCGACGTGCTGAGGGTTCTGTTA
+TTGCGGACGTGCTGAGTGAAAGGCCATTG
+>ds2020-267_809
+CAGCACGTCCGCAACTAACCACCCCTTTCTGTAACATAACTACACATCCAGTACCACATT
+GAATCAGCGTCCGTCCAGTCTATGTTCTCATCGCCTTCGTACAAGGCGTCGTTTCCGCTG
+GTAGTTCTGGTGCTTAAGTTTTGGAGCTGGACGCCTGGCACCTTGACGTCGAAGTTGAAC
+GAGGTGGTCGTATTTGCGGACGTGCTGC
+>ds2020-267_810
+CAGCACGTCCGCAATCTCTCCACTTCCCTCCTAGAATGGAAAGCCGCTTTCGGGGGAGAA
+CTCTTGCTCACAGGCTCCCCGAAACCAAGAGACGAGACAGAAGATGCATAAGATGCAGAG
+GATACTATGGATTCAGGGTGAGCCCCTATCCTATGTCTAGGAGTAGAGAAGAGAGCACCT
+TCACCCGGACTTCATTGCGGACGTGCTG
+>ds2020-267_811
+TTCCCGCACCATTTATCTCTTTTCCTTGGACATAAAGTCGCCTTACAGATGGACCCATCC
+CCTTCGGACATACAGCAATTACACTGATGTTCTTGGGGAAGTCAAGACCCACTGACTGCA
+AATGCCCTAAAAGGAAACCATGGGAAAGGCCCAGTATACTATTGGGCTTCATGTGTGAAA
+ATACTTTCTCATAATTGCGGACGTGCTG
+>ds2020-267_812
+CAGCACGTCCGCTATGTTTAACCACTCCTGTAATAATTGTTGAGCTATTTAGTCAATATT
+TGGCTTCTGTGCATAGTTACCCACATTACGCAGAGCCACTTTATGCCTCCAGTGATCATT
+TAGGACCACCACTCCTCCTTCTATTCCTCTAAGTTCAAATGTTGACCTCTGTACCGGGCT
+CAATCAGTATCATTGGCGGACGTGCTGC
+>ds2020-267_813
+GACGCACTGACCGTCGCCTATCTCCTTATCCACCCTATCCTTATCAAAGTTATTCTCAAG
+TGGTTTATTAAGACTACCTACGAGGGACAAAATGACGGTCAGTGCGTCAGGTAAGTGACT
+ACGGTCAGTGCGTCGCCTAAGCGTCAGCACGTCCGCAAGGTCCACTGGTTGCGGACGTGC
+TGAGGGCTACCTTATTGCGGACGTGCTG
+>ds2020-267_814
+CAGCACGTCCGCAAACCATTGTCTATTGCGGACGTGTGAGCTTTTGCCCATTGCGGACGT
+GCTGGGGACGAACAGTTGGGACGTGCTGAGAGCGATCGGATTGCGGACGTGCTGCTCCTT
+AGATATCCGCAACTATTCAGGGTTTGGGACGTGCTGAGGATGTGCAGGTTGCGGACGTGC
+TGAGGGCATGCTAATTGCGGACGTGCTG
+>ds2020-267_815
+CAGCACGTCCGCAAAGCCGAAGAAGTTATCATGGACGAGCCACATGCAGGGAAACTTGCA
+CGTGTGGTTCTGGCCGGGCTTTCCTGAGGTATCTAATAACCTTGCTTCTGCTCGCCGCTG
+GCGCACCTCTCCTAACTATTGCCCATTTATACTGGAATAATCTTTTTAGGAGGGACAATT
+TTACATATTTCTGCCAAATACTTCTATT
+>ds2020-267_816
+CAGCACGTCCGCAATTTGAATGCCCTCAGCACGTCCGCAACGTTTCCCGCCCAGCACGTC
+GCAAGCTATCACTCATGTTTTGCGGACGTGCTGCTCCTTAGGATTCGCTTAAGGCGACGC
+ACTGACCGTCGTTCATCTGGTGACGCACTGACCGTCCTTTTTGCCGTGACGCCTGACCGT
+GTACCCATCACATAACGGTCAGTGCGTC
+>ds2020-267_817
+CAGCACGTCCGCAATGTCCAGTAAGTGGCATTAGGACAATATAAATCCAGCCTAAAACAC
+GTTCCCAACCAGGGGTAGGGCGCTGTGGGCCGTAATCATTATTGCCTTCTGTACCTTTTG
+CCGCAAAGAGATAGATCATAAAAATCAGGTCTAAGGCGGGGATCTGCATACGTAAAGATA
+GCCACCCTGTATTCTTGCGGACGTGCTG
+>ds2020-267_818
+CGATCTATCTAAGGAGCAGCACGTCCGCAATGATGAAGCCGTACGTCTATGCCAAGCCAA
+CCGCAAGTTTTTAATCCCCAGTCTACCAATAAACCTGCCACCCATCATCAAGCCAACCGT
+AAAGACACGTCCGCAATCTTGATCTTGTGGACGTGCTGGGGGGGCTTCGTTGCGACGTGC
+TGACCGATCAACCTTTGCGGACGTGCTG
+>ds2020-267_819
+GGACGTTCGGGCTTGTATTGTGGGCTGGTTGAGCTGGGCAAGGGTAGGTTGTTTGGGGTT
+TTGCATCGGTGAGGTGCTACTAGCAACACTCGAGGCAAGCTCTGGCTGTTTGGCGAGCGG
+TTGTCCTGTTTTTGGGTCAGTGACGACAACTTGCGGTGCTGCATGGGTCAGGCTTGTCAC
+CTACCAGGAGCAGGAAGCCCGAACGTCC
+>ds2020-267_820
+CAGCACGTCCGCAAACAGACCGGTCTAGATTTGGGACGTGCTGAGCGACTGAGATTTGCG
+GACGTGCTGAGCGAGCCGCTATTGCGGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACG
+CACTGACCGTCGATGGGCATCTACGGTCAGTGCGTCAGCAGTAACAACACGGTCAGTGCG
+TCAAGGGTGCTCACACGGTCAGTGCGTC
+>ds2020-267_821
+AGACCGCAGACGGGAGTGTCCAGAGCGCATGGAGGCCAGACGCGTGCTCTTCCTATCTAT
+CTAAGGAGCAGCACGTCCGCAATCCGCGTCCCCTCAGCACGTCCGCAATCAAACACGCTC
+AGCACGTCCGCAAAGCTTTGATCCTCAGCACGTCGCAACATGAAGAGGGTGGACTTGCGG
+ACGTGTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_822
+CAGCACGTCCGCAAAGGATGGCACCTCAGCCCGTCCGCAAAATGTCTGGGTTATTGCGGA
+CGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTGAAGGCTCCCTTGACGCA
+CTGACCGTGTCCTGGACCTTGACGCACTGACCGTCTTGAAACCCCTGACGCCTGACCGTA
+ATACCCAAGCTTGTACGGTCAGTGCGTC
+>ds2020-267_823
+GGACGTTCGGGCTTTACATTGAGGTTGCGATTGTACTTGTGACTCATGGTTGGTGGATTG
+GTTAGCTAATGCTTGGGCGTTGGCTAGGGTTTGTGCTGGTCGATTTTCTTGTTTTACCAC
+CAAATAATTAATGCAGGTGTGTGGCCAAGCCCGAACGTCCTTACTTCCAGATGCGACGTG
+CGAGGGGAAGGCAGTTGCGGACGTGCTG
+>ds2020-267_824
+GACGCACTGACCGTTTCCTGACCCTTGACGCACTGACCGTATGTAGAGCACTGACGCACT
+GACCGTACCGTCACCCATGCTACGACGGTCAGTGCGTCGCCTTAAGCGTCTAAGGAGCAG
+CACGTCCGCAAGCTATCCGGGGTAGCACGTCCGCAATACACACTGGGCAACGTCCGCAAC
+ATACAGGATTTCGCTTGCGGACGTGCTG
+>ds2020-267_825
+GGACGTTCGGGCTTAGGTTACGGATTGAAGCCCGAAGTCCAGGGTGTCTGACAAGCCCGA
+AGTCCAGGGGAGGCTCAAGCCCGAACGTCCTTACTTCCAGCGTCCGCAATTCTACCAACC
+TCAGCACGTCGCAATGCTCGTTGGGTGATTGCGGACGTGCGAGGAGATGGGCATTGCGGA
+CGGGGGGTGACTTTTTGCGGACGTGCTG
+>ds2020-267_826
+GACGCACTGACCGTGTCACCCTTACTCAGACGGCAGTGCGTCAGGGAGCGATCTACGGTC
+AGTGCGTCAGCCAACAACATACGGTCAGTGCGTCGCCTTAAGCGCTGGAAGTAAGGACGT
+TCGGCTTACTGACCCCTATCGAGAAGCCCGAACGCCAGACCATACAAGTTGCGGACGTGC
+TGATTGTGATCAAGTTGCGGACGTGCTG
+>ds2020-267_827
+CAGCACGTCCGCAAACGTTTCCGGGTAGCACGTCCGCAACAGTAATCAATTGCGGACTGC
+TGAGTACTTTGGACTTGCGGACGCCTGGAAGTAAGGACGTTCGGGCTTGCCAGTCTGGGG
+GACGTTCGGGCTTACGAGTGGCTGTAAGCCCGAAGTCCAGGCCCAAGAGCAAGTCGAACG
+TCACCCCTAATTCTAAGCCCGAACGTCC
+>ds2020-267_828
+GACGCACTGACCGTACCTACCTGGCTGACGCACTGACCGTCTCGGGTCCTCTGACGCACT
+GACCGTATTAGGGGACGTCGCACGGTCAGTTCACGTCCGCAAACGTTATGCACTCAGCAC
+GTCCCAATGTTGACCTGGTGAGCCTTGCGGACGTGCTGCCCGTTATTGTTGCGGACGTGC
+TGACTAGGTCGATTTTGCGGACGTGCTG
+>ds2020-267_829
+CAACTGTTTTGGCCTCAGCACGTCCGCAATCAAATCCCCCTCAGCACGTCCGCATTCCAG
+TAAGCTCAGCACGTCCCAACCTCGGGATCTTGCGGACGTGCTGCTCCTTAGTCGCTTAAG
+GCGACGCACTGACCGTTTATACCTCCCTGACGCACTGACCGTATTGGTTTCTCTGACGCA
+CTAACCGATTCTGCACGGTCAGTGCGTC
+>ds2020-267_830
+GGACGTTCGGGCTTGATGGTTAAGGTAAAGCCCGAAGTCCAGGCAACTCGGAAGCCCGAA
+GTCCACCAGCCTATAGAAGCCCGAACGTCCTTACTTCCAGAGTCCGCAATCGGTTGGGCT
+TGCGGACGTGTGACCGGCTTGAAGTTGCGACGTGCTGAGTGAAAAAGGTTTGCGGACGTG
+CTGAGTGATTGGTATTGCGGACGTGCTG
+>ds2020-267_831
+CAGCACGTCCGCAAATATTAGGGGTTCATAGTTGCGGAGCTGAGGCGAAGGGTATTGCGG
+ACGTGTGAGACCATTGGCCTTGCGGACGTGCTGCTCTTAGATACGCTTAAGGCGACGCAC
+TGACCGTTCAGGTACCCCTGACGCACTGACCGTTAGCTTCTCGCTGACCACTGACCGTTT
+AGATAGCTATGTGCACGGTCAGTGCGTC
+>ds2020-267_832
+CAGCACGTCCGCAAACCCTTGCTTGTCCACGTACGCAAGTTAATTGGGTCAGCATTGGGA
+CGTGCTGAGGCGAGCCACATTGCGGACGTGCTGCTCCTTAGATACTGGAAGTAAGGACGT
+TCGGGCTTGCCTGCATCACTGGCGTCCGGGCTTTACATCTATCCTGGCGTTCGGGCTTCC
+ATAGTCCCATCTCAAAGCCCGAACGTCC
+>ds2020-267_833
+CAGCACGTCCGCAAATGAGGTTCGCTAATTTCTGCAGGAACAGGGAAGGTGGCTTAGAAA
+CCAGCCATTGAGAGAATAATGATACAACAAACAAACACTAATTGGACAATACTAGAAAAA
+ACCATGAATACGGAGCTCAAACCTGATTAAACTTTGAAAGCTGATCAACAGCATCATTTC
+CACCCAGTGCCGGTTGCGGACGTGCTG
+>ds2020-267_834
+CTCTCCCGATCTATCTAAGGAGCGCACGTGCGCAACAGGCCCCCCCTCGGAAAGAGAGGG
+ATTCGAACCCTCGGTACGAAAAACTCGTACAACGGATTAGCAATCCGACGCTTTAGTCCA
+CTCAGCCATCTCTCCCACGTCCGCAAATCCGGGTCGGTATTTGCGGACGTGCTGAGGGTC
+GTATAATTGCGGACGTGCTGCTCCTTA
+>ds2020-267_835
+CAGCACGTCCGCAATCGGCGCACACTCAGCACGTCCGCAAAGTGGTTTGGGTACAATCTA
+AAAAAAACGATTCCACATGAGGGAGAACCGGACAATTTCCCTCTTGAGTAATGGGAAATG
+GGAAGCGGGCTAGTCCCCGAAAATGCTCGTTAAAGTTGGGGGTTACAATTCACCCTGTGA
+CTAATTCCTTCGGTCGCGGACGTGCTG
+>ds2020-267_836
+GGACGTTCGGGCTTAACAACCCCCTTGGACTTCGGGCTTGCCTGTTCACCTGGACGTTGG
+GCTTTATTGTTGCGATGAAGCCCGAACGTCCTTACTTCCAGTATCTAGGAGCAGCACGTC
+CGCAAGTGAAGCCGACTGAAATTGCGACATGCTGAGGGCCAGTAGATTGCGGACGTGCTG
+AGGGCCCGGTGGTTTGCGGACGTGCTG
+>ds2020-267_837
+CAGCACGTCCGCAACAGGAAGTTCTTAACCGTTGTTCCTGTGGTGCTGTACTTGATAGCC
+TCACACACAACTGACTACCAGCACCCGATGCTCTTTTTCAACAGTCTTGCAGTCATTGTG
+CTAGTTATTGCCAAATTCTCCAATATGCACAAAGTCCGGATCTTCGGAATCAATGGAGAT
+AAGGAGTTGGGCCTTGCGGACGTGCTG
+>ds2020-267_838
+CAGCACGTCCGCAAAGACTTACCCCTCAGCACGTCCGCAAGAACCATGCCCTCAGCACTC
+CGCAATCTGATCTCGGTGTAAGCTATTGCCACGTGAACGTGTCGAGCGCTTGCTAGATGC
+CGGTACGCCATTTTTGGAAGTCTCACCGATGGCAGCGTATGGCATGTATGATGCCGATAT
+CACGGGTAACGGCTTGCGGACGTGCTG
+>ds2020-267_839
+GGACGTTCGGGCTTCGAACAACCCTTGGCGTTCGGCTTACAACCCTCCATGAAAGCCCGA
+ACGTCCTTAAGCACGTCCGCAAGACTTGACTACTTCCGCAAACCTTTGAGCCTCAGCACG
+TCCGCAACGTAACAGGGATACATTGGGACGTGCTGAGGCTCAAAGGTTTGCGGACGTGCT
+GAGGGCTCAGACCTTGCGGACGTGCTG
+>ds2020-267_840
+AATTTCTAGCCCCTCAGCACGTCCGCAAGTTGGCACACCTCAGCACGTCCGCAACCATAC
+CCAGTTCAATTTGCGGACGTGCTGAGCGGTGAGGATTTGCGGACGTGCTGAGACGTACAT
+GGTTGCGGACGTGCTGCCGGGTACCGTTTGCGGACGTGCTGAGCGGTGAGGATTTGCGGA
+CGGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_841
+CAGCACGTCCGCAATTTCCACTGGTTAGCACGTCCGCAAAAGATCTTACCTCACACGTCC
+GAAACCCCAGCACGTCCGCAATTTCCACTGGTCAGCACGTCCGCAAAAGATCTTACCTCA
+CACGTCCGCAACCCCAGCACGTCCGCAATTTCCACTGGTCAGCACGTCCGCAAAAGATAT
+GACTTCACACGTCCGGAACCCCTTGCA
+>ds2020-267_842
+GACGCACTGACCGTCGAAATGTGGATCAACACGGTCAGTGCGTCAGGAAAACAGCGACGG
+TCAGTGCGTCAGGGGTATAGTCACGGTCAGTGCGTCGCCTTAAGCGTACGTCCGCAACAG
+TATGCCCTTAGCGTTGGGACGTGCTGACGGAATTGTGGTTGCGGACGTGCTGAGGTAGGA
+CCGCTTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_843
+CTATCTAAGGAGCAGCACGTCCGCAACAAGACTACACTCGCACGTCCTCAAAAGTGTTAG
+GGTGTCCCAGCACGTCCGCAATAAGACTACACTCGCACGTCCGCAAAAGTGTGAGGGTGG
+CCCAGCACGTCCGCAATAGGACTACACTCGCACGTCCGCAAAAGTGTGAGGGTGGCCGAC
+TTGCGGACGTGCTGCTCCTTAGATAGA
+>ds2020-267_844
+TGCCGCAAGTACAGACGTATCCCCATCCGCTCTATCTAAGCATCAGCACGTCCGCAAAGA
+TTATGGCCTCAGCACGTCCGCAAGACACATTCCCTCACACGTCCGCAACGGATAGGCCAT
+CTAAATTGCGGACGTGCTGCTCCTTAGATACGCTTATGGCGACGCACTGACCGTTGAAGT
+CGAGGTATCGATTGTTTCTCCTTCGCA
+>ds2020-267_845
+GACGCACTGACCGTAGTATTGTCGCTCTGACCGTACTACAGGGCTTTTTACGGTCAGTGC
+GTCACGGGTCCAGTACGGTCAGTGCGTCAGGCCCAAACAGACGGTCAGTGCGTCGCCTTA
+AGCGGTCCGCAAATTGCTGCCTTTGGGACGTGCTGAGGGATCACTGATTGCGGACGTGCT
+GAGGGAGTTGCACTTGCGGACGTGCTG
+>ds2020-267_846
+TACGCACTGACCGTGTCATCATGGTTACGCCTGACCGTTGTATAGACCCTGACGCTGACG
+CACTGACCGTGTCATCATGGTGACGCCTGACCGTTGTATAGACCCTGACGCTGCCGTACA
+AGTTCGGGGCTACGGTCAGTGCGTCGCCTAAGCGTATCTAAGGAGCAGCACGTCGCAAGG
+CAGAATCGATTTATTGCGGACGTGCTG
+>ds2020-267_847
+GACGCACTGACCGTAGTTCCACCCCTACACACACGGTCAGTGCGTCAGGGCTAGAGGGAC
+GGTCAGGGCGTCAGGATAGGGCAAACGGTCAGTGCGTCAAGGGTAGCTAAACGGTCAGTG
+CGTCGCCTTAAGCGAATCTAAGGAGCAGCACGTCGCAAACTCAAGCCCCTCAGCCGTCCC
+AAATGTATACTGGTTGCGGACGTGCTG
+>ds2020-267_848
+TCCGCAATTCTCCCGGCTTAGCACGTCCGCAACTGTTGGTCACTCAGCACGTCCGCAATA
+TCGAGCACCTCAGCACGTCCCAACAGAGACCCAATTGCGGACGTGCTGGAAGTAAGGACG
+TTCGGGCTTTAGACTCCCCCTGGACGTTCGGGCTTCAGGCTCTCCTTGGACTTCGGGCTT
+AACTCTTCCCGGAAAGCCCGAACGTCC
+>ds2020-267_849
+GACGCACTGACCGTGACGTTACCCCTGACGCACTGACCGTGGAATTAGCCCTGACGCACT
+GACCGTAACAATGCCCTTGACGCACTGCCGTATTTACTGGACTAGCAACGGTCAGTGCGT
+CGCCTTAAGCGAATCTAAGGAGCAGCACGTCCGCAATTGCGAGTCCGTCAGCACGTCCGC
+AACTGGCCCATGATTGCGGACGTGCTG
+>ds2020-267_850
+GACGCACTGACCGTTTAACTCGTCCTGACGCACTGACCGTTATCGTGCCCCTGACGCACT
+GACCTTACAATAAGAGCGACGGTCAGTGCGTCGCCTTAAGCGTATCTAGGAGCAGCACGT
+CCGCAAACCATATGTCTTAGCAATTGGGACGTGCTGAGGAATGCAGGCTTGCGGACGTCT
+GACGGGCGAATATTTGCGGACGTGCTG
+>ds2020-267_851
+TCTAAGGAGCAGCACGTCCGCAAATAACTTGGGATTGGGACGGCTGACTGGGGGCGTTTG
+CGGACGTGCGAGTGATAATGTGTTGCGGACGTGCTGCCTTAGATACGCTTAAGGCGACGC
+ACTGACCGTTACTTTTCCCCTGACGCACTGACCGTTAAAAATCTTCTGACGCCTGACCGT
+CAAGAGGTCGGTGACGGTCAGTGCGTC
+>ds2020-267_852
+CAGCACGTCCGCAAATGCGTTTACCTCAGCACGTCCGCAATCTCATGGGTGTTGCTTCGC
+TTAAGGCGACGCACTGACCGGAGTTACAGCTTTAGGTATCAGCACTATGGCTTTCAACTT
+AAATGGTTTTAATTTCAATCAATCTGTAGTTGATAGTCAGGGTCGTGTAATTAATACTTG
+GGCTGATATTATTAACCGGGCTAACCT
+>ds2020-267_853
+CAGCACGTCCGCAAGGTTTAATTCCTGTTAGTTGCGACGTGCTGAGTGATGTTTAATTGC
+GGACGTGCTGCTCCTTAGATTCGCTTAAGGCGACGCACTGACCGTGCTTCTAGGGGTGAA
+TAACGGCAGAGAGGCAACGGGACGGTCAGTGCGTCAAGGGGCACCGAACGGTCAGTGCGT
+CAGTGGGGAATGGACGGTCAGTGCGTC
+>ds2020-267_854
+GGACGTTCGGGCTTACACTTTTCCCTGGACGTTCGGGCTTAGTGGACCCTTGGCGTTCGG
+CTTTCTATCGCCTGTAGCAAGCCCGAACGTCCTTACTTCCAGACGTCCGCAAGGCTTGAA
+CAGTCACGTCCAGGCGATTGGGGTAGATTTGCGGACGTGCTGAGGGTCAGGCCATTGCGG
+ACGTGCTGAGAGGGATACACTTGCGGA
+>ds2020-267_855
+TATCTAAGGAGCAGACGACTTAAGCGCCATCCATTTTAAGGGCTAGTTGTTTCGGCAGGT
+GAGTTGTTACACACTCCTTAGCGGTTTACAACTTCCATGTCCACCGTCCTGCTGTCTTAA
+ACAACCAACACCTAGGGCAGCACGTCCGCAAAACAGTTAGGCTGTATTGCGGACGTGCTG
+AGTGAGCCTCCCTTGCGGACGTGCTG
+>ds2020-267_856
+CAGCACGTCCGCAAGGACCATGGCATATTTAATTTAATTCTAAAGGAAAAGTGGCAAGAT
+GTGTGGCACTCTGCTGAGATGGAGAGTCTTGGTGATGATAATATCACAGGCTTACCGGAG
+TGGATGAAGCATATCACAGCCGAGGAGTTGGGGCAATCCGTGTTGGATATGACGGGGATA
+AATAGGCAGAGGTTGCGGACGTGCTG
+>ds2020-267_857
+CAGCACGTCCGCAAACACAGCACCCTAGCATAGCAAAAAATCCGCCACAGGGCAAAAGCT
+ATATGCAAAACTAAGTCTGTGCAATGGGCGAAGTCCCACTGACTAAGTGCGAGTTTTCGA
+CTTGATATTAATATTTCGCTAATGCTCCAAATTCCCACAAGTCAAAACCTCGGCAGGGGA
+TGGACAACACCTTGCGGACCGTGCTG
+>ds2020-267_858
+CAGCACGTCCGCAATAGACCCACCATTATAAATCCCCCCACCCAAACCAAAAAAATAAAA
+GCTTTTATATATATGAGTTTTTATATTTTCTGATCTGATTGAGAGTACTTGTTCTGTTTT
+CTCAGTAACTGCACTCTCTTTCCTCTTTTTCCCGCGCTTTAAAAATCCCAACTTTTTCTC
+ACCCCCCGCAATTTGCGGACGTGCTG
+>ds2020-267_859
+CAGCACGTCCGCAATCCCAGGTAGCTTGCTTACTTATTGCTTGCACTAAGGGCAAGCGGG
+CCTTGTCTAGGTTGGAGCTATGAAGCTTCCCTTATTATTATGAAAGGGTTGTTTACTTGC
+TTACTTGTTTTGTTAGAGTAAGGTAGCTTGCTTACTTAGTGCTTGCACTAAGGGGAAGGG
+GGGGGAGATACCTTGCGGACGTGCTT
+>ds2020-267_860
+GACGCACTGACCGTTCCGGAGTACCTAACAACGTATCTTCACAGACCAAGAACTACGAGA
+TCGCCCCTTTCATTCTGGGGTGACGGAGGGATCGTACCATTCGAGCCTTTTTTTTTCATG
+CTTTTCCCGGAGGTCTGGAGAAAGCTGCAATCAATAGGATTTTCCTAATCCTCCCTTCCC
+GGGGGGTGTTGTACGGTCAGTGCGTC
+>ds2020-267_861
+CAGCACGTCCGCAACCAAGATGCTATGTGCCCTTCCACTTTAAGGAGCTGTTTCCAGATG
+CGTGGTGTGCTTTGCAGTGAGAATTTGTTGGAATTTGAGGATTCTTCTGTTTCAGGGCTA
+TTGAAAACTCCATTGCCTTTTCGACACATCTCCTGTATGATATCATAATACCATGTGAGT
+ACGCGAGCACTGTTGCGGACGTGCTG
+>ds2020-267_862
+CAGCACGGCCGCAATCGAAGCCGGCTCCTTCGGTTGACGTGACCGGAGGCGCTAAGCCTC
+TGGTCATACAAGCGTATAGCTTCCTCAATGACACATCGATTTGTGTCGACAAGTACGGCA
+TGAGTCTTACCCATGCTGCAGAGGCGCTTGATGCGCTGAAACGAGACCCTGATGAGGGAA
+AAAGACTCGTGGATGCGGACGTGCTG
+>ds2020-267_863
+CAGCACGTCCGCAATGCCTACGCCCTCCACAGGTAACAGATTAAAATCGTTTTATCCCCG
+AATTTTTCACGACTTTCGTTACAAAAAATTTGACTGAAAACGGCATTAATTTTGTAACCC
+TAAAACAACTGTCTAAATATAGCCCATCGATTTTTGAGCAGTTGTTTGATGATGAAACCC
+AATAAACGGAGATTGCGGACGTGCTG
+>ds2020-267_864
+GGACGTTCGGGCTTAGGCTAACCGCTGGACTTCGGGCTTGAAGGTGTGACTGGACTTGGG
+CTTATTGGAGGCAACAAGCCCGAACGTCCTTACTTCCAGTCACGTCCGCAAACGGTTTGG
+GTTGGGACGTGCTGAGGGGCAGTATTTTGCGGAGGACATAATGCATATTGCGGACGTGCT
+GCCCTAAGCCTTTTGCGGACGTGCTG
+>ds2020-267_865
+GACGCACTGACCGTCTACAGCCTCCTTAACACGGTCAGTGCGTCAGTTAAGTCCGAACGG
+TCAGTGCGTCCCCGAGAAACACGGTCAGTGCGTAGCACGTCCGCAAAAGTGAAGTTGTGG
+ACGTGCTGAGGGATACACAGTTGCGGACGTGCTGAAGGCATAACAGTTGCGGACGTGCTG
+AGGCAATAATACTTGCGGACGTGCTG
+>ds2020-267_866
+GACGCACTGACCGTTTTCTACCCCATAGACAACGGTCAGTACGTCAGGCCTGAGATAACG
+GTCAGTGCGTCAGGGAATTACCTACGGTCAGTGCGTCAGGCATTATGCGACGGTCAGTGC
+GTCGCCTTAAGCGAGGAGCAGCACGTCCGCAAATAACGAGGGGTAGGTTGGGACGTGCTG
+AGACATGTGTCCTTGCGGACGTGCTG
+>ds2020-267_867
+CAGCACGTCCGCAACAGGGAACAGATTATTAAAAGTATTTAAAGCCAGTGAAGTAACACT
+CATTGCCTTTATGGGTGAAATAGCCGATTGTGTGGGTGATTATTCATCATTCCATAGCCT
+TATAACTGATGGGCTAGATGATGGCGAAATTCCTGTTACCAACTTACAGACCATTAACCA
+ACGCGCATTATTTTGCGGACGTGCTG
+>ds2020-267_868
+CAGCACGTCCGCAATGTCGTAATCGTCCCTTTCAGACCTTGCTGCAAACGCCACACTCGC
+AGCCGATATTGCTAACCCAAGCGAAGCGAGCTTTTATAATGTCAGCGAAGCGAGCTTTGC
+TAACGTCAGTGAAGAGAATTTGCTAAAAAACGCTGCTTAAACCAAGTTTCAGCCGATTGT
+CATTGGTAATCGTTGCGGACGTGCTG
+>ds2020-267_869
+CAGCACGTCCGCAAGTCTGCCCTCAGCACGTCGCAAGATAGGCGGGGTGGGTTGCTGCTA
+CCCGGTGTCCATTGCGGACGTGCTGCTCCTTAGATATCTAAGGAGCAGCACGTCCGCAAT
+ACCTGCCGTCTGTTGCGACGTGCTGAGGAAAGACGACTTGCGGACGTGCTGAGGTGTTTT
+GTTTGCGGACGTGTGCTCCTTAGATA
+>ds2020-267_870
+CAGCACGTCGCAACAGGTTCCGGATGTGCTGAGCCACTCCCAATTGCGGACGTGCTGCTC
+CTTAGATACGCACTGACCGTCTCTTGCCGACTCTCCCCTAGCTACTATCGTATAAAAGAT
+GAAAGGCATTAATCTTCAAAGGTTAGATGAAAGAATTGTGGTTGGCGATATGCCGTTAGA
+ATTACGTCCACTACGGTTAGTGCGTC
+>ds2020-267_871
+ATCTAAGGAGCAGCACGTCCGCAAATATTTTGTCCTCAGCACGTCCGCAAGTATCATCCC
+TTCAGCACGTCCGCAAGCCACCTCCTGTCAGCACGTCGCAAATCAACTGGCATGGCTTTG
+GGACGTGAGGAGCCGCCTATTGCGGACGTGCTGCTCATTAGATTAAGGACGTTCGGGCTT
+GGTTGCGGTTGAAAGCCCGAACGTCC
+>ds2020-267_872
+GGACGTTCGGGCTTGTGGGTCAAATTAAAGAAGCCAAAGAAGCCCAGGCCCGTGCCAACG
+CTGAAGCCTACAATGCGCAGGCAGCCTCAGAAGCCCGAACGTCCTTACTTCCAGACGTTA
+GGGTCATAGTTTTGCGGAGTGCTGAGGGAATTAGCTTGCGGACGTGCTGACGGATCTCGC
+ATTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_873
+GAGTTTCGTTTTAGGTCGGGGAGTCCGCTGTCATTTATACTCGTACAGTGAGTTTTATCA
+TTGATTAACAGCTACACGTTAATGAAGAAGTTGGCTATACTATATTCTATTGATTGCCAA
+CATCCCACGGTCAGTGCGTCGCCTAAGCGTCCGCAAGTTGGCGCTGTTGCGGACGTGCTA
+GGGCTACCAGATTTGCGGACGTGCTG
+>ds2020-267_874
+CAGCACGTCCGCAATCTGGGAGGGTTGAGACCAAGCCAAGGGCAGGGGCCTAAAGTATCG
+AAAAGGCAAGGACTCCAAGAAGAAGCCAAGCCTGAGGCCAAGAAAAGCGAGTTCAAGATC
+AGGAGCCAAAGCGGGCCGAGAAGAAAGAAGGAAGGCTTCATCTGCTCCAAGCCCCTAAAG
+AGGCTCAGCGGGTAGCGGACGTGCTG
+>ds2020-267_875
+GGACGTTCGGGCTTAAATGTGGCGATGTGTTAAGCCCGAAGCCAGGGAAACAATAAAGCC
+CGAACGTCCAGGGGTTATTCCAAGCCCGAACGTCCTTACTTCCAGGGCACGTCCGCAATA
+TCCCCGACCTATTTGCGACGTGCTGAGGATTGAACGGTTGCGGACGTGCTGAGGTGGGCC
+CGATTGCGGACGTGCTGCTCCTTAGA
+>ds2020-267_876
+TATCTAAGGAGCAGCACGTCCGCAATACTCGCCTACTCAGCACGTCCGCAATGCCGTAGT
+TATCACACGTCCGCAAGCAAGAACGACATGTTGCGGACGTGTGATATCTAAGGAGCAGCA
+CGTCCGCAACAACAGGTCGGTTGTGCGGACGGCTGAGAGATTCATATTGCGGACGTGCTG
+AGCCAACACAGCTTGCGGACGTGCTG
+>ds2020-267_877
+GGACGTTCGGGCTTTGTTGAAACCCTGGACGTTCGGGCTTAATCATACCACTGGACGTTC
+GGCTTATCATATAGGTTACCAGAAGCCCGAACGTCCTTACTTCCAGACACGTCCGCAAGG
+TCGAATATATTGCCGTTGGTTTGCGGACGTGCTGAGGCAAACGTAATTGCGGACGTGCTG
+AGACGATAGGTATTGCGGACGTGCTG
+>ds2020-267_878
+TCTAAGGAGCAGCACGTCCGCAAATTCACAGGGCTCAGCACGTCCGCAACTTAATCCCTA
+TCAGCACGTCCCAATCTATCCCCCCTTACTTGCGGACGTGCTGCCGCTTAAGGCGACGCA
+CTGACCGTCCCCGAACCACTACGGTCAGTGCGTCAGGGGGAAAGATACGGTCAGTGCGTC
+AGGGGCAAAGCAACGGTCAGTGCGTC
+>ds2020-267_879
+GACGCACTGACCGTTTAGATTGCCCTGACGCACTGACCGTCTAATTATAGCTGACGCACT
+GACCGTAGATATGGACGTAAGGACGGTCAGTGCGTCGCCTTAAGCGTGGAGCAGCACGTC
+CGCAATCCCTAGCCCGTGATCATTGCGGACGTGTGCCCGGCCAAAGTTGCGGACGTGCTG
+AGGCATATTACTTTGCGGACGTGCTG
+>ds2020-267_880
+GACGCACTGACCGTACTCTTTATGCTGACGCACTGACCGTTTGTGTTTTCCTGACGCACT
+GACCGTAGTCCAGACATTACTAGACGGTCAGTGCGTCGCCTTAAGCGGATCTAAGAGCAG
+CACGTCCGCAAATGAGATCGATTGCGACGTGCTGAGTGGTTCGAACTTGCGGACGTGCTG
+AGTGGAATCGAATTGCGGACGTGCTG
+>ds2020-267_881
+GACGCACTGACCGTCATAGAGCAGTTAACGCACCCTCGTACGCCCCGTTCTACACGGTCA
+GTGCGTCAGTGGTTGTACAAGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACG
+TCCGCAAAAGAGGAGCGCTCAGCACGTCCGCAGTTGGTTCTCTCTCACACGTCCGCAAGC
+TAAATCCTCTGAGTTGCGACGTGCTG
+>ds2020-267_882
+GGACGTTCGGGCTTGCAAGGGCCCCTGGACGTTCGAGCTACCTCATGAAGCCCGAAGTCC
+AGGGTAGGTACTAAGCCCGAACGTCCAGGAGACAAGAAAGCCCGAACGTCCTTACTTCAA
+GCACGTCCGCAATGATACCGTCCCAGCACGTCCGCAATTTGTAATCCGTCAGCCGTCCCA
+ACTCTCATTTCGTTGCGGACGTGCTG
+>ds2020-267_883
+GGACGTTCGGGCTTTTGCAACCACCTGACAAGCCCGAAGTCCACGGAATGGCGTAAGCCC
+GAACGTCCAGGGATAGGACGAAGCCCGAACGTCCTTACTTCCAGACTAAGGAGCAGCACG
+TCCGCAACTGAACTCCCTCAGCACGTCCGCAAATGGCACCCCCCAGCACGTCCCAAATCC
+CCGGCTATTCCCTTGCGGACGTGCTG
+>ds2020-267_884
+CAGCACGTCCGCAACAAGTCATTTCTCTTGCGGACGTGCGAGAAACTGAACCTTGCGGAC
+GTGCTGCTCCTTAGATTATCTAAGGAGCAGCACGTCCGCAAACCTGTGTCCGTCAGCACG
+TCCGCAATTGAGTGGCCCCAGCACGTCCGCAAGGGGCAATCCATCAGCACGTCCCAATAC
+ACCCAGGATGCTTTGCGGACGTGCTG
+>ds2020-267_885
+CCGCAATAGAGTTGCACTCAGCACGTCCGCAATGCGATGTTACTCAGCACGTCCGCAATT
+GCTAACATCTTGCGGAGTGTGAGTGAGAGATCTTTGCGGACGACGCTTAAGGCGACGCAC
+TGACCGTCTACTTGGGGGTCTAGGTCAGTGCGTCAGGGTACTATCGACGGTCAGTACGTC
+AGCATCAGTATTACGGTCAGTGCGTC
+>ds2020-267_886
+CAGCACGTCCGCAATGCGCGGTCCCTCAGCACGTCCGCAATAAGGGTGGGGTCGTTGCGA
+CGTGCTGCTCCTTAGATAATCTAAGGAGCAGCACGTCCGCAAATCATCGGCTCTGTATTG
+GGACGTGCTGAGGTGTGTTGGTTGCGGACGTGCTGAGTGACGTAAAATTGCGGACGTGCT
+GCCTGATTCGATTTGCGGACGTGCTG
+>ds2020-267_887
+CAGCACGTCCGCAAACTCAAACCGGTATGATTGCGGACGTGTGAGGCGTACTGCTTTGGG
+ACGTGCTGGGGGTCTTCCTTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGT
+TCGGGCTTCCCTCATGCCCTGGACGTTCGGGCTTACACTCACCCGTGGCGTTCGGCTTCC
+AAGCAGTATACGAAGCCCGAACGTCC
+>ds2020-267_888
+GGACGTTCGGGCTTTCTTACCAACCTACAGAAGCCCAACGTCCAGGGGGGGAGTAAAGCC
+CGAACGTCCACCAATTCGTGGAAGCCCGAACGTCCTTACTTCCAGATAAGGAGCAGCACG
+TCCGCAATCACAGTACCCTCAGCACGTCCGCAACAACTGCCCCCTCAGCACGTCCCAACT
+ACCCTGCCTTTTTTGCGGACGTGCTG
+>ds2020-267_889
+CAGCACGTCCGCAATGACAAAGCCCTCAGCACGTCCGCAATCCTAGTCGCCTCAGCACGT
+CCGCAAAAATGCCGAGCTCGTTGCGGACTCGCTTAAGGCGACGCACTGACCGTTACCAGA
+GTCATAACGGTCAGGAGTGGCGCTTGGACGGTCAGTGCGTCCCCGAACGGTCAGTGCGTC
+AGGGGTATATCAACGGTCAGTGCGTC
+>ds2020-267_890
+CAGCACGTCCGCAATAAGACCCTATTGTTGCGGACGTGCTGAGCGAGGCGCCTTTGCGGA
+CGTGCTGCCCATAGCGTATTGCGGACGTGCTGCTCCTTAGACGCTTAAGGCGACGCACTG
+ACCGTTGGCGAGGGGTTATTACGGTCAGTGCATCAGCAAAACTGGAACGGTCAGTGCGTC
+AATTGGCCACTTACGGTCAGTGCGTC
+>ds2020-267_891
+GCAACTGCGTTACCCTCAGCACGTCCAATGGTACTCGACATCTGTTGCGGACGTGTATCT
+AAGGAGCAGCACGGCCGCAAGACTGATTCCCTCAGCACGTCGCAAAGCCGCTCAACTCAG
+CACGTCCGCAACTGCGTTACCCTCAGCACGTCCAATGGTACTCGACATCTGTTGCGGACG
+TG
+>ds2020-267_892
+TCAGCACGTCGCAATCTATCAGTGGTTCATTGCGGACGTGCTATCTAAGGAGCAGCACGT
+CGCAATCACTCCCCCCAGCACGTCCGCAACAGCATCTAGGTCAGCACGTCCGCAATCTGT
+AACCGGTCAGCACGTCGCAATCTATCAGTGGTTCATTGCGGACGTGCTATCTAAGGAGCA
+G
+>ds2020-267_893
+AGTGCGTCAGCGTACCCATCACGGTCAGTGCGTCAGCGGCTAAAACACGGTCAGTACGTC
+GCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCACTGACCGTGTCAATCCTGGTCTGTAC
+GGTCAGTGCGTCAGCGTACCCATCACGGTCAGTGCGTCAGCGGCTAAAACACGGTCAGT
+>ds2020-267_894
+TCTTCCGATCTATCTAAGAGCAGCACGTCCGCAATTATATCCAGGTATATTGCGGAAGTG
+CTGAGGTTGTCCGCCTTGCGGACGTGCTGACGGATTTAGGCTTGCGGACGTGCTGAGGCG
+TTATATGTTGCGGACGTGCTGCTCCTTAGATAGATGGGGA
+>ds2020-267_895
+CGATCTATCTAAGGAGCAGCACGTCCGCAAAACGCCATGTGTGACATTATTCGCCAACCA
+ACCATTGTACTTTGGTGCGCTGCTCCACACGCATTTGTGGGCTTTCAGGATGCTGAGGGG
+TCGGAACTTGCGGACGTGCTGCTCCTTAGATAGATCG
+>ds2020-267_896
+TACCTTTGCCGTGTTCACAGGGTTTCTGTGTCCTTTGCCGTGTTCACAGGGTTTCTGTGT
+CCTTGCCGTGTTCACAGGGTTTCTGTGTCCTTTACCTTACCTTTGCCGTGTTCACAGGGT
+TTCTGTGTCCTTTGCCGTGTTCACAGGGTTTC
+>ds2020-267_897
+ATCGAAGGAGCAGCACGTCCGCAACTGCTCTGCCCTGTCCGCAAAGACCATACGCTGAAA
+CTTGCGGACGTGCTGAGTCGGTACATATTGCGGACGTGCTGAGTGGCTCCTTTTTGCGGA
+CGTGCTGCTCCTTAGATAGATCGGAAAGAG
+>ds2020-267_898
+CAGCACGTCCGCAATTTTAATCGCCTCAGCACGTCCGAATGATTCGTCCCTCAGCACGTC
+CGCAACATGAACCCGGTGAGTCTTGCGGACGGGCTGAGGGACGAATCATTCGGACGTGCT
+GAGGCGATTAAAATTGCGGACGTGCTG
+>ds2020-267_899
+TATCTAAGGAGCAGCACGTCCGCAAACATATCGGCCTGACGTCCGCAATGCCTAACCTGT
+CTCATTTGCGGACGTGCTGAGCCGACACACTTGCGGACGTGCTACCCCATGACAATTGCG
+GACGTGCTCTCCTTAGATAGATCGGA
+>ds2020-267_900
+CAGCACGTCCGCAACAAGTGGCTCTTGAATTTTTGCTTACGCCAGTAACCTCAAAAACAG
+CATGAGATTACCAGAAAAAAAAGCCGGCCGACTGGCCGGCTTTTCGATTACATCACCAGG
+CGGCGAATGTCGCTCAGCATGT
+>ds2020-267_901
+GCAGCACGTCCGCAAATAGCCTTCCTTCACCTCTCAGAGGTAGTAACTGCATTGATCTTC
+AACCCCGTGATCGATTTGGTGTTGTCAGCGCCATTAGCTTGATTGCAAAAGCATCATGTT
+GGTGCCACACCCTGCCTTTCCA
+>ds2020-267_902
+TTATTGGGACGTGCTGAGGAAAGATAGATGCGGACGTGCTGACCGAGTCCCCCTTGCGGA
+CGTGCTGGGTACGTGCTGAGTCATTGATTATTGGGACGTGCTGAGGAAAGATAGATGCGG
+ACGTGCTGACCGAGTCCCCCTT
+>ds2020-267_903
+TATCTAAGGAGCAGCACGTCCGCAAAGGTCACGCCCCAGCACGTCCGCAATACATTTTCC
+CTCAGCACGTCGCAACAACCCCTCAACTCTTGCGGACGTGCTGCTCCTTAGATACGCTTA
+AGGCGACGCACTGACCGTCTCG
+>ds2020-267_904
+AGCAGCACGTCCGCAATCTCAATGCTCTCAAGTGCTAAGCTCTCAGCACGTCCGCCAGCA
+CGTCGCAATGGTTAGGGGATAGATGTTGCGGACGTGCTGAGAGCTTAGCACTTGAGAGCA
+TTGAGATTGCGGACGTGCTGCT
+>ds2020-267_905
+CAGCACGTCCGCAACGACCGTGGGCAGCACGTCCGCAACATATTACCGCTCACACGTCCG
+CAATCAGATAGCGTTTTATTTGCGGATGTGTGAGCGGTAATATGTTGCGGACGTGCTGCC
+CACGGTCGTTGCGGACGTGCTG
+>ds2020-267_906
+TCGCTCAGCACGTCCACAAAGTAACCACCTTACTATTGCGCAGCACGTCCGCAAGCTGCC
+GTTCCTCAGCACGTCGCAAATAAACTTCGCTCAGCACGTCCACAAAGTAACCACCTTACT
+ATTGCGCAGCACGTCCGCAAG
+>ds2020-267_907
+CAGCACGTCCGCAAGGAATAACCCGTCAGCACGTCCGCAAGGAGTGTCCGCTCACGTCCG
+CAACCAACCAGTCGTTTTTGCGGACGGTGAGCGGACACTCCTTGCGGACGTGCTGACGGG
+TTATTCCTTGCGGACGTGCTG
+>ds2020-267_908
+GCAGCACGTCCGCAAGGATTGTTCGGTCAGCACGTCCGCAAAGTATTACCCTCAGAACGT
+CCCAACCCCACGCCGTTGCGGACGTGCTGAGGGTAATACTTTGCGGACGTGCTGACCGAA
+CAATCCTTGCGGACGTGCTGC
+>ds2020-267_909
+CACAGTTATCTCAAATCCATCAACTGTTACAGAGTCAAAATAATTTTCATGTTCTCAGCA
+CGTCCGCAACCCGTCCCCACTCTTCACAGTTATCTCAAATCCATCAACTGTTACAGAGTC
+AAAATAATTTTCATGTTCT
+>ds2020-267_910
+TTTGCGGACGTGCTGCCGCAAGTGAATAGCTGTATCGTGGGACGGGACACCCCTAAGACA
+TTGCGACGTGCTGAGGGTGAACTCTTTGCGGACGTGCTGCCGCAAGTGAATAGCTGTATC
+GTGGGACGGGACACCCCTA
+>ds2020-267_911
+ATTCCCTCAGCACGTCCGCAATGTGTTCTCCCTCAGCACGTCGCAAAAGTCAAGGTTTGT
+TGCGCAGCACGTCCGCAAGGCGAATTCCCTCAGCACGTCCGCAATGTGTTCTCCCTCAGC
+ACGTCGCAAAAGTCAAGG
+>ds2020-267_912
+TGAATGTCCCTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAAAGTCG
+CTGAAGGTCATGGAACAGAGGATACCGAGATTGTGAAGGAGCTGAGTGTCGCCGAAGGTC
+ATTGCGGACGTGCTG
+>ds2020-267_913
+TCAGCACGTCCGCAAAAGAAATAGGCTCAGCACGTCCCAACCCATTAATTATTGCCAGCA
+CGTCCGCAAAACATATACCCTCAGCACGTCCGCAAAAGAAATAGGCTCAGCACGTCCCAA
+CCCATTAATTATTGC
+>ds2020-267_914
+ACTCCAGCCACTCAGCACGTCCCAATAGCCCACTTGAGTCAGCACGTCCGCAAGCTCATA
+TAACTCAGCACGTCCGCAAACTCCAGCCACTCAGCACGTCCCAATAGCCCACTTGAGTCA
+GCACGTCCGCAAGC
+>ds2020-267_915
+TGCGTCCGATTGGCCTATGAACGGCAGTGCGTCAGGTGGAATTGTACGGTCAGTGCGTCA
+GGCATCTAAGGACGGTCAGTGCGTCCGATTGGCCTATGAACGGCAGTGCGTCAGGTGGAA
+TTGTACGGTCAGTG
+>ds2020-267_916
+CCCTATCTAAAACTTCTATTTGAAAAACTAGATCACCCAGGTCTGCACGGTCAGTTGCGT
+CAGCAATTAAGTTTCTCACCCTATCTAAAACTTCTATTTGAAAAACTAGATCACCCAGGT
+CTGCACGGTCAGT
+>ds2020-267_917
+CTGAGGGAAATAGTCTTGCGGACGTGCTGAGGGCAGAATGATTGCGGACGTGCTGACCGG
+GAATACCTTGCGGACGTGCTGAGGGAAATAGTCTTGCGGACGTGCTGAGGGCAGAATGAT
+TGCGGACGTGCTG
+>ds2020-267_918
+CTTGGGACGTGCTGAGAGAAATGCCGTTGCGGACGTGCTGAGGGTATACAGGTTGCGGAC
+GTGCTGAGTGGACCGAACTTGGGACGTGCTGAGAGAAATGCCGTTGCGGACGTGCTGAGG
+GTATACAGGTTG
+>ds2020-267_919
+GCTGAGGGAGTGCCCTTTGGGACGTGCTGAGGTGTGATTCGTTGCGGACGTGCTGAGCAG
+ATGTAGGTTGGGACGTGCTGAGGGAGTGCCCTTTGGGACGTGCTGAGGTGTGATTCGTTG
+CGGACGTGCTG
+>ds2020-267_920
+TCAACACGGTCAGGCGTCAGACAAAGAGATACGGTCAGTGCGTCAGGTGATCCCCCACGG
+TCAGGCGTCAGAGCATTCAACACGGTCAGGCGTCAGACAAAGAGATACGGTCAGTGCGTC
+AGGTGATCCCC
+>ds2020-267_921
+GCAAGGTAACCCTCCTCACACGTCCGCAATTCTAGGAGCCTAGCACGTCCGCAAGACTGT
+ATCCCTCAGCACGTCCGCAAGGTAACCCTCCTCACACGTCCGCAATTCTAGGAGCCTAGC
+ACGTCCGCAAG
+>ds2020-267_922
+GACAGTGTAGGACTTGCGGACGTGGAGACCGGAACATTTGCGGACGTGCTGGACTAACTA
+CTCCTTGCGGACGGCTGACAGTGTAGGACTTGCGGACGTGGAGACCGGAACATTTGCGGA
+CGTGCTGGACT
+>ds2020-267_923
+GCAAATGCCTATCCCTCAGCACTCCGCAATCCCATTGACGCAGCACGTCCGCAAGATAAC
+CCACCTCAGCACGTCCGCAAATGCCTATCCCTCAGCACTCCGCAATCCCATTGACGCAGC
+ACGTCCGCAAG
+>ds2020-267_924
+AACAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCCTTA
+ACCCTCAGCACGTCCGCAAAGGTCTCCGGCTCAGCACGTCCCAACATCCGTTTGCTCTTG
+CGGACGTGCTG
+>ds2020-267_925
+CAACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATATACTGCC
+TTTATATTGGGACGTGCTGAGGGAACACGTCTTGCGGACGTGCTGAGGGTATGCGTTTTG
+CGGACGTGCTG
+>ds2020-267_926
+GCCCTCAGCACGTCCCAATCATACATCTCTCAGCACCTCCGCAAAGCGCACTCTCCAGCA
+CGTCCGCAATGGTGAGCCCTCAGCACGTCCCAATCATACATCTCTCAGCACCTCCGCAAA
+GCGCACTCTC
+>ds2020-267_927
+ATTGCGGACGTGCTGACGGACTCTACATTGCGGACGTGCTGCCGTTTGTTTATTGGGACG
+TGTGAGTGTGGGCTTATTGCGGACGTGCTGACGGACTCTACATTGCGGACGTGCTGCCGT
+TTGTTTATTG
+>ds2020-267_928
+GCACGTCCGCAACAGATGTCCCCTCAGCACGTCTGCAAGAACGCCTCCAGCACGTCCGCA
+ACTTGCTAGACCTCAGCACGTCCGCAACAGATGTCCCCTCAGCACGTCTGCAAGAACGCC
+TCCAGCACGT
+>ds2020-267_929
+TTGAACTTGCGACGTGCTGAGGGCCTAGGATTTGGGACGTGCTGAGGGGGAATTCCTTGC
+GGACGTGCTAGGGGTTTGAACTTGCGACGTGCTGAGGGCCTAGGATTTGGGACGTGCTGA
+GGGGGAATTC
+>ds2020-267_930
+ATGGTCAATACATCACGGAAGGCGCCGTATTTGCGGACGTGCTGGCAGCGCGCATAGGTA
+GATTTTCCCAAACAAATGGTCAATACATCACGGAAGGCGCCGTATTTGCGGACGTGCTGG
+CAGCGCGCAT
+>ds2020-267_931
+CTTTTGCGGACGTGCTGCCCGCAATTCACTCCCAATTTATTGAGGTGTTGTCAATGGGAC
+GTGTGACGAGATTGCTTTTGCGGACGTGCTGCCCGCAATTCACTCCCAATTTATTGAGGT
+GTTGTCAAT
+>ds2020-267_932
+CTTGCGGACGTGCTGCCGGGTTCTGATTGGGACGTGTGAGGAGAGAAACTTTGGGACGTG
+CTGAGTGCCTTCCTCTTGCGGACGTGCTGCCGGGTTCTGATTGGGACGTGTGAGGAGAGA
+AACTTTGGG
+>ds2020-267_933
+CAATATACATTCCCTCAGCACGTCCCAATTAGACAGCCCAGCACGTCCGCAAAGTAGGGG
+TCCTCAGCACGTCCCAATATACATTCCCTCAGCACGTCCCAATTAGACAGCCCAGCACGT
+CCGCAAAGT
+>ds2020-267_934
+CTGAGTAGTCTGTCTTTGCGGACGTGCTGGGTCAATCTGTTGGGACGTGCTGAGGTAGAC
+TCAGTTGGGACGTGCTGAGTAGTCTGTCTTTGCGGACGTGCTGGGTCAATCTGTTGGGAC
+GTGCTGAGG
+>ds2020-267_935
+TCGGCAGCACGTCCGCAAAAAATCCACACTCAGCACGTCCGCAACTATTTTCGGGCAGCA
+GTCCGCAAGCTGATTCGGCAGCACGTCCGCAAAAAATCCACACTCAGCACGTCCGCAACT
+ATTTTCGGG
+>ds2020-267_936
+GATTAGAGCCCCTGTATTGCGGACGTGCTGCGCAAACACATCCTCCTAGCACGTCCGCAA
+CGATCAACCCTTATGATTAGAGCCCCTGTATTGCGGACGTGCTGCGCAAACACATCCTCC
+TAGCACGTC
+>ds2020-267_937
+CCACTTCCTCTCAGCACGTCCGAAACATATTGCAGTCAGCACGTCCCAATCATCCGGGGC
+AGCACGTCCGCAACCCACTTCCTCTCAGCACGTCCGAAACATATTGCAGTCAGCACGTCC
+CAATCATCC
+>ds2020-267_938
+TGGCCCCACTATTGCGACGTGCTGAGAGTTTATTAGTTGCGACGTGCTGAGGCGGGAACA
+CTTGCGGACGTGCTGGCCCCACTATTGCGACGTGCTGAGAGTTTATTAGTTGCGACGTGC
+TGAGGCGG
+>ds2020-267_939
+GGACGAAATACGGTCAGTGCGTCGGTCTACTACGGCAGTGCGTCAACAATGAGATCACGG
+TCAGTGCGTCAGCGGACGAAATACGGTCAGTGCGTCGGTCTACTACGGCAGTGCGTCAAC
+AATGAGAT
+>ds2020-267_940
+TAAGGGGTCACACTCCAACAGTGATTCGCTTGCGGACGTGCTGAGGCAATTTGGCCAGCA
+CGTCCGCAAATAATAAGGGGTCACACTCCAACAGTGATTCGCTTGCGGACGTGCTGAGGC
+AATTTGGC
+>ds2020-267_941
+GTGCTGGGCTTAAGTTGCGGACTGCTGAGTCGTAACAGATTGCGGACGTGCGAGAGAGTC
+TCCATTGCGGACGTGCTGGGCTTAAGTTGCGGACTGCTGAGTCGTAACAGATTGCGGACG
+TGCGAGA
+>ds2020-267_942
+GGACGTGCTGCCCATTGTTTTGCGGAGTGCTGAGGGTAACCGTTTGCGGAGTGCTGAGGG
+ATACAGCTTTGCGGACGTGCTGCCCATTGTTTTGCGGAGTGCTGAGGGTAACCGTTTGCG
+GAGTGCT
+>ds2020-267_943
+CGTCCCAAACATGAGCCAGCACGTCCGCAATTGGTAACCCCTCAGCACGTCCGCAAGTAT
+GAACCCTCAGCACGTCCCAAACATGAGCCAGCACGTCCGCAATTGGTAACCCCTCAGCAC
+GTCCGCA
+>ds2020-267_944
+ATTGCGGACGTGTGAGAAGTGCGTTCTTGCGGACGTGCTGAGTAGATGTTGGGACGTGCT
+GAGGAATGTCGTATTGCGGACGTGTGAGAAGTGCGTTCTTGCGGACGTGCTGAGTAGATG
+TTGGGAC
+>ds2020-267_945
+CAGCACGTCCGCAACCAGTTCCCCTCAGCACGTCCGCAATTTCTTGCCACTCAGCACGTC
+GCAACTATTCCCCAGCACGTCCGCAACCAGTTCCCCTCAGCACGTCCGCAATTTCTTGCC
+ACTCAGC
+>ds2020-267_946
+CCGTCATTTTGCGACGTGCTGAGGGATAACAATTTGCGGACGTGCTGAGTTATAACGGTT
+GCGGACGTGCTGCCGTCATTTTGCGACGTGCTGAGGGATAACAATTTGCGGACGTGCTGA
+GTTATAA
+>ds2020-267_947
+ACCGGTACTGACGCACTGACCGTTAACCTGACCCTGACGCCTGACCTACTTACATGACAC
+ACTGACCGTCGTACCGGTACTGACGCACTGACCGTTAACCTGACCCTGACGCCTGACCTA
+CTTACAT
+>ds2020-267_948
+GCCTTGCGGACGTGCTGGGTTTGTTTGGGACGTGCTGAGGGAGATCTGTTTGCGGACGTG
+CTGAGGAGATGAGCCTTGCGGACGTGCTGGGTTTGTTTGGGACGTGCTGAGGGAGATCTG
+TTTGCGG
+>ds2020-267_949
+GCAAAACCAGTTCACTCAGCATGTCCGCAACTAGGGCAGCACGTCCGCAATACCCAGTGG
+CTCAGCACGTCCGCAAAACCAGTTCACTCAGCATGTCCGCAACTAGGGCAGCACGTCCGC
+AATACCC
+>ds2020-267_950
+GGCTGAATATGACGGTCAGTGCGTCCCTGAATACGGCAGTGCGTCACGGAAGTCTGTACG
+GTCAGTGCGTCAGGCTGAATATGACGGTCAGTGCGTCCCTGAATACGGCAGTGCGTCACG
+GAAGTCT
+>ds2020-267_951
+TTCAGGGCTCACACGTCCCAATGGTTTCTCCCTCAGCACTCCGCAATCTGGAACCCAGCA
+CGTCCGCAATTTTTCAGGGCTCACACGTCCCAATGGTTTCTCCCTCAGCACTCCGCAATC
+TGGAACC
+>ds2020-267_952
+CGTCCCCACTCAGCACGTCCGCAATATGCTCTACCTCAGCACGTCCCAACTGACCCAGCA
+CGTCCGCAATACGTCCCCACTCAGCACGTCCGCAATATGCTCTACCTCAGCACGTCCCAA
+CTGACC
+>ds2020-267_953
+GTTATGGCCTCGCACGTCCGCAAAACTCCCTATCTCGCACGTCGCAATAATCTGGCAGCA
+CGTCCGCAATTGTTATGGCCTCGCACGTCCGCAAAACTCCCTATCTCGCACGTCGCAATA
+ATCTGG
+>ds2020-267_954
+GCAATCATAGAGCTATTGCGGAAGCGAGTCTGTCTTGCGGACGTGCGACGAGTGTGGAGT
+TGCGGACGTGGGCAATCATAGAGCTATTGCGGAAGCGAGTCTGTCTTGCGGACGTGCGAC
+GAGTGT
+>ds2020-267_955
+AGGGAGTTGCGACGTGCTGACGGAATTACGGTTGCGGACGTGCTGAGGAAAAGTACGTTG
+CGGACGTGCTGAGGGAGTTGCGACGTGCTGACGGAATTACGGTTGCGGACGTGCTGAGGA
+AAAGTA
+>ds2020-267_956
+ACATTCCCTCAGCACGTCCGCAAGATTGTACGCCTCAGCACGTCCCAAATTCGGCAGCAC
+GTCCGCAAGTTACATTCCCTCAGCACGTCCGCAAGATTGTACGCCTCAGCACGTCCCAAA
+TTCGGC
+>ds2020-267_957
+GCACGTCCGCAATGAGTTCACCTTCAGCACGTCCGCATTAAAGCAGCCTCAGCACGTCCC
+AATTTCCCCAGCACGTCCGCAATGAGTTCACCTTCAGCACGTCCGCATTAAAGCAGCCTC
+AGCAC
+>ds2020-267_958
+GGCAAATTGGACGTGCTGAGTGAATGTGACTTGCGGACGTGCTGAGGAGTAGTCTCTTGC
+GGACGTGCTGGGCAAATTGGACGTGCTGAGTGAATGTGACTTGCGGACGTGCTGAGGAGT
+AGTCT
+>ds2020-267_959
+ATTTCTTGCGGACGTGCGAGGCCGATATTATTGCGGACGTGCGGGTTTAGGTTGGGACGT
+GTGAGGGTGAATTTCTTGCGGACGTGCGAGGCCGATATTATTGCGGACGTGCGGGTTTAG
+GTTGG
+>ds2020-267_960
+CCAAGTTCTTTTTCCTCAGCACGTCCCAACCGGCTCAGCACGTCCGCAAGTTGGAGTCCC
+TCAGCACGTCCCAAGTTCTTTTTCCTCAGCACGTCCCAACCGGCTCAGCACGTCCGCAAG
+TTGGA
+>ds2020-267_961
+ACCGTAGACCTCAGCACGTCCCAACCACTAATCCCTCAGCACGTCCCAACAGGTGCAGCA
+CGTCCGCAACACCGTAGACCTCAGCACGTCCCAACCACTAATCCCTCAGCACGTCCCAAC
+AGGTG
+>ds2020-267_962
+TCAGAGGTACGGAATAAGGTCAGTGCGTCAGAGTGAAACCAACGGTCAGTGCGTCGCGGA
+TTATCTACGGTCAGAGGTACGGAATAAGGTCAGTGCGTCAGAGTGAAACCAACGGTCAGT
+GCGTC
+>ds2020-267_963
+CAATCTCCCACGTCCGCAATCTAGTACAAGTCAGCACGTCCACACCAACCACCTAGACGC
+AGCACGTCCGCAATCTCCCACGTCCGCAATCTAGTACAAGTCAGCACGTCCACACCAACC
+ACCTA
+>ds2020-267_964
+TCCAAAACATAAGCCCTCAGCACGTCGCAACCTCTATCAGCACGTCCGCAACGCCTTAAC
+CCTCAGCACGTCCAAAACATAAGCCCTCAGCACGTCGCAACCTCTATCAGCACGTCCGCA
+ACGCC
+>ds2020-267_965
+AGGGGATTGGGACGTGCTGAGGCTAAAATGATGCGGACGTGTGAAGGACATGTAGTTGCG
+GACGTGCTGAGGGGATTGGGACGTGCTGAGGCTAAAATGATGCGGACGTGTGAAGGACAT
+GTAG
+>ds2020-267_966
+GATTGCGGACGTGCTGCCCGATGTTGGACGGTGAGGACCTAAGATTTGCGGACGTGCTGA
+GTACAACACGATTGCGGACGTGCTGCCCGATGTTGGACGGTGAGGACCTAAGATTTGCGG
+ACGT
+>ds2020-267_967
+CAGCACGTCCGCAATCTCTATCCCCTCACACGTCCGCAATCTGTAACCCCTCACACGTCA
+AATTGAGGCCAGCACGTCCGCAATCTCTATCCCCTCACACGTCCGCAATCTGTAACCCCT
+CACA
+>ds2020-267_968
+ATGCGGACGGGAGATGGATTTGATTGGGACGTGCTGAGGCCTAACTCCTTGCGGACGTGC
+TGCCCCATTATGCGGACGGGAGATGGATTTGATTGGGACGTGCTGAGGCCTAACTCCTTG
+CGGA
+>ds2020-267_969
+ATCCTTCTGCACTCGCACGTCGCAACTCACCCAGCACGTCCGCAATGGTTGATTACTCAG
+CACGTCCCAATCCTTCTGCACTCGCACGTCGCAACTCACCCAGCACGTCCGCAATGGTTG
+ATTA
+>ds2020-267_970
+GCTGTCCGATTGGGACGTGCTGAGCGACACTGAATTGGGACGTGCTGAGGAGACTAAGGT
+TGCGGACGTGCTGTCCGATTGGGACGTGCTGAGCGACACTGAATTGGGACGTGCTGAGGA
+GACT
+>ds2020-267_971
+ACTAGTAGTTGCGGACGTGCTGGGGAGAAATTGCGGACGAGCTTGGATACGTTGCGGACG
+TGTGAGGTACTAGTAGTTGCGGACGTGCTGGGGAGAAATTGCGGACGAGCTTGGATACGT
+TGC
+>ds2020-267_972
+CTGACTGAATACTTGTTGGGACGTGTGAGTGTCGGGGTCTTGCGGACGTGCTGGGGGGAT
+TGGGACGGCTGACTGAATACTTGTTGGGACGTGTGAGTGTCGGGGTCTTGCGGACGTGCT
+GGG
+>ds2020-267_973
+GGGCATTGCGACGTGCTGAGGTAATCTCTGTTGCGGACGTCTGAGTTATGAAAAATTGCG
+GACGTGCTGGGCATTGCGACGTGCTGAGGTAATCTCTGTTGCGGACGTCTGAGTTATGAA
+AAA
+>ds2020-267_974
+ATTGCGGACGTGCTGGGGGTTTATGTTGCGGACGGTCGTGTTGTTGCGGACGGCTGAGTG
+GATGTATATTGCGGACGTGCTGGGGGTTTATGTTGCGGACGGTCGTGTTGTTGCGGACGG
+CT
+>ds2020-267_975
+AAATGTTGCGGACGTGCTGCCTCGATTTGGATGTGAGGGATGGGAACTTGCGGACGTGTG
+AGCCAGTAAATGTTGCGGACGTGCTGCCTCGATTTGGATGTGAGGGATGGGAACTTGCGG
+AC
+>ds2020-267_976
+GTCTGAGTGTATAAAGGTTGCGGACGTGTGGGGTTCTGTACTTGCGGACGTGCTGGGGCA
+CTGGGACGTCTGAGTGTATAAAGGTTGCGGACGTGTGGGGTTCTGTACTTGCGGACGTGC
+TG
+>ds2020-267_977
+AATAGCGTCTCCCTCCACGTCGCAAAGCTCCAGCACGTCCGCAAGAACCATTCCTCACAC
+GTCCGCAATAGCGTCTCCCTCCACGTCGCAAAGCTCCAGCACGTCCGCAAGAACCATTCC
+T
+>ds2020-267_978
+GGCTTCCCTCAGCACGTCCGCAATTACACTCCAGTTAATTGAGGGCTCGCGGCTTGCGAC
+GTGCTGGGCTTCCCTCAGCACGTCCGCAATTACACTCCAGTTAATTGAGGGCTCGCGGCT
+T
+>ds2020-267_979
+TGGCGTGTGACCTCCACCCAAACCTTAACCAATACAGATAAATCCAGTATCGCGGACGTT
+CGGGCTTGGCGTGTGACCTCCACCCAAACCTTAACCAATACAGATAAATCCAGTATCGCG
+G
+>ds2020-267_980
+CAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCCAGCAC
+GTCCGCAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCC
+>ds2020-267_981
+CAGCACGTCCGCAATACCGTACACTTGCGGAGCCGAAGGTTATTGCGGACGTGTGCCTAG
+GCAGTCAGCACGTCCGCAATACCGTACACTTGCGGAGCCGAAGGTTATTGCGGACGTGTG
+>ds2020-267_982
+GGCAGTTGGGACGTGCTGAGGAAATTCTGATACGTGTGAGGAGGATTACATTGCGGACGT
+GCTGGGCAGTTGGGACGTGCTGAGGAAATTCTGATACGTGTGAGGAGGATTACATTGCG
+>ds2020-267_983
+TATCTAAGGAGCAGCACGTCCGCAAGTAGCTGGCTGTCAGCACGTCCGCAAGGTTGGATC
+CTCAGCACGTCCCAACCTGTATTGCCTCATGTTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_984
+TATATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTTGACCCT
+TAAGTGATTCCAATCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCA
+>ds2020-267_985
+TCCGCAATTCGATTACTCTCAGCACGTCGCAATCCTGAACCCATGTAACTTGCGGCAGCA
+CGTCCGCAATTCGATTACTCTCAGCACGTCGCAATCCTGAACCCATGTAACTTGCGG
+>ds2020-267_986
+CAAGTTTCTCCGGGTCTCGCAATAATCCTTTTAACCAGTTATAACAATTTCACCCCGCCA
+AAATTTTGCTAATCTCTCCTAGACAGGAGGCCAATTGCGGACGTGCTGCTCGTTAG
+>ds2020-267_987
+TCTCCTGGTTACCTCTTCCTCCCACTCCAGATTCTTTGCGGCAGCACGTCCGCAATCGGT
+TTCTCCTGGTTACCTCTTCCTCCCACTCCAGATTCTTTGCGGCAGCACGTCCGCAA
+>ds2020-267_988
+CTCCGCCAGCACGTCCGCAAGATCTAGCCTCTCAGCACGTCCCAAGCTAACCCCGCTCAC
+ACTCCGCCAGCACGTCCGCAAGATCTAGCCTCTCAGCACGTCCCAAGCTAACCCCG
+>ds2020-267_989
+GTCCGCAATTGCGAATGCCTCAGCACGTCCCAATATGAGGCAGGTAAAGTTGCGGCAGCA
+CGTCCGCAATTGCGAATGCCTCAGCACGTCCCAATATGAGGCAGGTAAAGTTGCGG
+>ds2020-267_990
+TTGCGGACGTGAGCAAGGAGGTTTTGCGGACGTGCTGAGCGCTTCGTAATTGCGGACGTG
+CGGCTGCTTAGATAGGGGGGATGAGCAGCTGTTTGAAGTCTAGTCACTCCGGAGA
+>ds2020-267_991
+CAGCACGTCCGCAAGTGCAAATCACTCAGCACGTCCGCAACTCAGCGACCCTCAGCGTCC
+GCAAACATATTACACTCAGCACGTCCGCAATTCCTTCTCGGCACACGTCCGCAA
+>ds2020-267_992
+GCAACCATACTATGCTCAGCACGTCCGCAAGACTTATCCCTCAGCACGTCCGCAAAGGGA
+AAGGCATTGGGACGTGTGAGAGTAGCCAGATTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_993
+CGTGCTGAGGGGTAGTTATTTGCGGACGTGCTGGGGCCTATTTGCGGACGTGCTGGGGAC
+GTGCTGAGGGGTAGTTATTTGCGGACGTGCTGGGGCCTATTTGCGGACGTGCTG
+>ds2020-267_994
+TTTGCGGACGTGCTGACGTGAGGGGAACCTGGTTGCGGACGTGCTGAGAGTGTCCTGTTT
+GCGGACGTGCTGACGTGAGGGGAACCTGGTTGCGGACGTGCTGAGAGTGTCC
+>ds2020-267_995
+CCGGAACCTGGTGACCTTTGGGACGTGCTGAGACCTTGAATATTGCGGACGTGCTGCCGG
+AACCTGGTGACCTTTGGGACGTGCTGAGACCTTGAATATTGCGGACGTGCT
+>ds2020-267_996
+GTATTTGGCAACGAAGTCGGTTTCAGTCATGTTGACCAGATCTTTCATCAAGTCCGAGAC
+GGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAGA
+>ds2020-267_997
+TCTTCCGATCTCTAAGGAGCAGCACGTCCGCAACGAGTACGTCGTCAGCACGTCCGCAAG
+TGTTATAGCCTCAGCACTTCCGCAATCCCACCCGTCTCCACGTCCGCAA
+>ds2020-267_998
+TTGCGGACGTGTGAGGTGAAGACGGTTGCGGACGTGCTGAGGCTAAAGGCGTTGCGGACG
+TGCTGAGGCAGGAAATATTGCGGACGTGCTGAGTACCTGCTATTTGCGG
+>ds2020-267_999
+TAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACAAGTACGAAAGATTGGGACA
+TTGCAGCCAACTGTACAAGATGGGCGTACCAGTTTTTCAATACAACT
+>ds2020-267_1000
+GATTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTTGTTATCCC
+TGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAA
+>ds2020-267_1001
+GTCAAAACGATTCTAACGGTCAGTGCGTCATCGCGGTTCTAACGGTCAGTGCGTCAAAAC
+GATTCTAACGGTCAGTGCGTCATCGCGGTTCTAACGGTCAGTGCGTC
+>ds2020-267_1002
+TGAATGTCCCTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAATGTCC
+CTGAAGGTCATGGGACAGAGGATACCGAGATTGTGGAGGAGCTGAA
+>ds2020-267_1003
+TAGGGGTGTCCCGTCCCACGATACAGCTATTCACTTGCGGCAGCACGTCCGCAAATGACC
+TCCCCTCAGCACGTCGCAACACTAAAACATTATTGCGGACGTGCTG
+>ds2020-267_1004
+TTGCGGACGTGCTGAGGGATAAGTCTTGCGGACGTGCTGAGCATAGTATGGTTGCGGACG
+TGCTGAGGGATAAGTCTTGCGGACGTGCTGAGCATAGTATGGTTGC
+>ds2020-267_1005
+TATCTAAGGAGCAGCACGTCCGCAAGCCGAAGCCCTCAGCACGTCCGCAAAGACAGCACC
+TCAGCACGTCCGCAAGATCGTTGGGGCACACGTCCGCAA
+>ds2020-267_1006
+TCTCAAAAAGCCTATCGTAGTCCGGATTGGGATGTGATGCTAATCTCAAAAAGCCTATCG
+TAGTCCGGATTGGGATGTGATGCTAATCTCAAAAAGCC
+>ds2020-267_1007
+CACAGTTATCTCAAATCCATCAACTGTTACAGAGTCAAAATAATTTTCATGTTCTTCAGG
+AGATAGGTCATAATCCTGGTGTTTTGCGGACGTGCTG
+>ds2020-267_1008
+AACCATCCCTGTGCCGTTCTGTCCCTATCTCAATCCTTGAGAACCATCCCTGTGCCGTTC
+TGTCCCTATCTCAATCCTTGAGAACCATCCCTGTGC
+>ds2020-267_1009
+GGACGTGCTGGGGAGAGGCTATGCGGACGTGCTGACCCTTAGGTAATTGCGGACGTGCTG
+AGGGGAGCCAGGTTGCGGACGTGCTGCTCCTTAGAT
+>ds2020-267_1010
+CAGACGCCTGTTCGCGACAGCGGACTAAGGAGCAGCACGTCCGCAACCTCTATTCCGTCA
+GCACGTCCGCAAATCTCGCCCTTCAGCACGTCCGCA
+>ds2020-267_1011
+AGCACTTTAAGCAGGGAGGAGAGGCTAATGGTTAAGTAAAGCACTTTAAGCAGGGAGGAG
+AGGCTAATGGTTAAGTAAAGCACTTTAAGCAGGG
+>ds2020-267_1012
+TCGAAGGAGTAGCACGTCCGCAAACACTTACCCCTTTTTGCGGACGTGCTGAGGGAGAAG
+TTGTTGCGGACGTGCTGAGGGAGAAGTTGTTG
+>ds2020-267_1013
+CTAAGGAGCAGCACGTCCGCAAAAACATACGGCTCAGCACGTCCCAACCTTCTCAGCACG
+TCCGAAGGCCCGCTTCCCAGCACGTCCGCAA
+>ds2020-267_1014
+CAGCACGTCCGCAACGGTGATACGCTCAGCACGTCCGCAATGTCCACAGCCTCAGCACGT
+CCCAATACTCTTCAGGCAGCACGTCC
+>ds2020-267_1015
+CAGCACGTCCGCAACTGTTGTTGACTCACACGTCCGCAAGAGCATACCCTCAGCACGTCC
+CAATGTACTAACGCTCAGCACGTCC
+>ds2020-267_1016
+AGGAGAGGGTAACGAAGTAGCTCGACTGAAAGGAGAGGGTAACGAAGTAGCTCGACTGAA
+AGGAGAGGGTAACGAAGTAGCTCGA
+>ds2020-267_1017
+GGACGTGTGAGTGGTTAAAACATGGGACGTGGAGTGAATTTTTGTTGCGGACGTGTGAGG
+TATCGACCTTTGCGGACGTGCTG
+>ds2020-267_1018
+TTGCGGACGTGCTGAGGGTTTATTATTTGCGGACGTGCTACCCAGTGAGTATTGCGGACG
+TGCTGCTCCTTAGATATATCGG
+>ds2020-267_1019
+TTGCGGACGTGCTGAGGGAGAAGTTGTTGCGGACGTGCTGAGGGAGAAGTTGTTGCGGAC
+GTGCTGAGGGAGAAGTTGTTG
+>ds2020-267_1020
+GTCCGCAATTTAAGTCACCTCAGCACGTCCGCAATTTAAGTCACCTCAGCACGTCCGCAA
+TTTAAGTCACCTCAGCACGTC
+>ds2020-267_1021
+CAGCACGTCCGCAATGAGGTCCGGGCAGCACGTCCGCAAACATGGGACATTGCGGATCTG
+GAAGTAAGGACGTTCGGGCTT
+>ds2020-267_1022
+GTGCTGGCGGGGATCACTTGCGGACGTGCTGAGGGAATTGGGCTTGCGGACGTGCGAGGG
+AAGGTCCTTGCGGACGTGCTG
+>ds2020-267_1023
+CCGCAACCTCCACTATCCACACGTCCGCAACCTCCACTATCCACACGTCCGCAACCTCCA
+CTATCCACACGTCCGCAAC
+>ds2020-267_1024
+CAGCCGTTTCTCAGGCTCCCTCTCCAGCCGTTTCTCAGGCTCCCTCTCCAGCCGTTTCTC
+AGGCTCCCTCTCCAGCCGT
+>ds2020-267_1025
+TGGACTTCGGGCTTGTCCCTCCAGTGGACTTCGGGCTTGTCCCTCCAGTGGACTTCGGGC
+TTGTCCCTCCAGTGGACTT
+>ds2020-267_1026
+TTGCGGACGGCTGAGCGCGGTTAATTGCGGACGTGCTGAGCGAACGAGATTTGCGGACGT
+GCTGACCGGTGGGAATTTG
+>ds2020-267_1027
+TTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCT
+TCGGCCTTCACCTTTCC
+>ds2020-267_1028
+CAGCACGTCCGCAACAACTTCCCCCTGCTTAAAGTGCTTTACTTAACCATTAGCCTCTCC
+TCCCTGCTTAAAGTGCT
+>ds2020-267_1029
+ATTGCGGACGTCTGAGGGAGAAGACTTTGCGGACGTGCTGACGAGTGTAACTTTGCGGAC
+GTGCTGCTCCTTAGATA
+>ds2020-267_1030
+CCCTTATTCTGCCAAGCCCGTTCCCTTATTCTGCCAAGCCCGTTCCCTTATTCTGCCAAG
+CCCGTTCCCTTATTCTG
+>ds2020-267_1031
+CTAATGCCACCATCCAATCCGCTAATGCCACCATCCAATCCGCTAATGCCACCATCCAAT
+CCGCTAATGCCACCAT
+>ds2020-267_1032
+TTATGAAAGGGCCTCGCAGCTCTTCAGTAGATCGATCTCAGCGGGTAAGAGACCGTGGAG
+TTTGCGGACGTGCTGC
+>ds2020-267_1033
+ATCTAAGGAGCAGCACGTCCGCAACTACACTTTCCTCAGCACGTCCGCAAATGAGCTTCC
+CTCAGCACGTCCGCAA
+>ds2020-267_1034
+TTGCGGACGTGCTGAGGGAATAATACTTGCGGACGTGCTGAGGGATAATGTTTTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1035
+ATCTAAGGAGCAGCACGTCCGCAAAGTCAATCATGTCAGCACGTCCGCAAAGTTCATTCA
+CTCAGCACGTCCGCAA
+>ds2020-267_1036
+TTGCGGACGTGCTGAGCGAGTAGCCCTTGCGGACGTGCTGAGTATGTGTCGTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1037
+TTGCGGACGTGTGAGAGGAAACAATTTGCGGACGTGCTGACGGGTAGGACCTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1038
+ATTGCGGACATGCTGGGCGGAGTAATTTGCGGACGTGCTGCCGAGCGCTTATTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1039
+TTGCGGACGTGCTGATCGAATGGAATTGCGGACGTGCTGGACTCGGCTTGGATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1040
+TTGCGGACGTGTGAGATAACTCGGGTTGCGGACGTGCTGAGAACCGTCACCTTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1041
+TTGCGGACGTCTGAGCCTCAAGAGATTGCGGACGTGCTGAGGTGCTTTTCATTGCGGACG
+TGCTGCTCCTTAGATA
+>ds2020-267_1042
+ATCTAAGGAGCAGCACGTCCGCAAGATGACGCCCGGTAGCACGTCCGCAAGTGGGAGCCA
+CTCAGCCGTCCGCAAT
+>ds2020-267_1043
+TTGCGGACGTGCTGAGTAACAGAGTCTTGCGGACGTGCTGAGCGGCACAACATTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1044
+TTGCGGACGTGCTGAGAGGATTACCGTTGCGGACGTGCTGAGGGATAGAATCTTGCGGAC
+GTGCTGCTCCTTAGAT
+>ds2020-267_1045
+TCCGCAACCGTATATACCTCAGCACGTCCGCAATCGTTACTCCTCAGCACGTCCGCAATG
+TTAAACGCCTCAGCAC
+>ds2020-267_1046
+TCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGCTGCC
+TTTGCGGACGTGCTG
+>ds2020-267_1047
+TTGCGGACGTGCGAGTGACAATGGATTGCGACGTGCTGAAGGAGTAGTCCTTGCGGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_1048
+TATCTATGGAGCAGCACGTCCGCAACATGAATATACTCAGCACGTCCCAAGATGTCTTCC
+GTCACACGTCCGCAA
+>ds2020-267_1049
+TTGCGGACGTGGAAGCGTAAATCCTTGCGGACGTGCTGAGAGACATGGTGTTGCGGACGT
+GCTGCTCCTTAGATA
+>ds2020-267_1050
+TTGCGGACGTGTGGGGCCAGACTGTTGCGGACGTGTGCAGCCGGGAAATATTGCGGACGT
+GCTGCGCCTTAGATA
+>ds2020-267_1051
+ATCTAAGAGCAGCACGTCCGCAAACCCATTACCCTCAGCACGTCCGCAACATGCCATCCC
+TCAGCACGTCCGCAA
+>ds2020-267_1052
+TAGCAAGGAGCAGCACGTCCGCAAGTTATTCGGCCTCAGCACGTCCGCAAGCCCTTTATG
+CCAGCACGTCCGCAA
+>ds2020-267_1053
+TTGCGGACGTGTGAGGTGGCTGGCGTTGCGGACGTGCTGAGGGCTAGAGTTTTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1054
+TTGCGGACGTGCTGAGGAGTGCAGTGTTGCGGACGTGTGAGGTGCTTTTTATTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1055
+TTGCGGACGTGCTGAGGGAGAAGAGTTTGGACGTGCTGAGGGGTGTCGCCTTGCGGACGT
+GCTGCTCCTTAGACA
+>ds2020-267_1056
+TTGCGGACGTGCTGAGGGGTAGTTCATTGCGGACGTGGAGGAGTGTGGGTTTGCGGACGT
+GCTGCTCCTTAGAGA
+>ds2020-267_1057
+TTGCGGACGTGCTGAGGCCTAACCATTTGCGGACGTGCTGGGGGAATCGCATTGCGGACG
+TGCTGCTCCTTAGAT
+>ds2020-267_1058
+TAGGCTCTTCAGTTTGTTCACTTCGCAGGTGGACAAGCACAAGTACGAAAGATTGAGGAC
+TTGCGGACGTGCTG
+>ds2020-267_1059
+TGCGGACGTGTGAGGGTAGACATATTGGGACGTGCTGACTAAGGCAAGCTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1060
+TTGCGGACGTGCTGAGCCGTTACAGATTGGGACGTGCTGGGAGAACATAATTGCGGACGT
+GCTGCTCCTTAGAT
+>ds2020-267_1061
+ATCTAAGGAGCAGCACGTCCGCAAAATGGTTATGCTCAGCACGTCCGCAAGATACTACCC
+TCACACGTCCGCAA
+>ds2020-267_1062
+TTTGCGGACGGAAGGATTCTCGGTTGCGGACGTGCTGACGGGGAATCTCTTGCGGACGTG
+CTGCTCCTGAGATA
+>ds2020-267_1063
+TTGCGGACGTGCGCCAGTCAGTTATTGCGGACGTGCGACTGATGTGGCTTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1064
+TTGCGGACGTGCGACAAATATTAAATTGGGACGTGCTGACCCAGTTGCTTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1065
+CGGACGTGCTGAGACGTGACCGTTTGCGGACGTGCTGAGTGGTATGGTCTTGCGGACGTG
+CTGCTCCTTAGATA
+>ds2020-267_1066
+TTGCGGACGTGGACTCAATCATTATTGGGGACGTGCTGAGCGGTTGCGGATTGCGGACGT
+GCTGCTCTTAGATA
+>ds2020-267_1067
+TTGCGGACGTGTGAGGGATAGTGTTTGCGGACGTGTGAGGGTTGCTAGATTGCGGACATG
+CTGCTCCTTAGATA
+>ds2020-267_1068
+TTGCGGACGTGCTGGGGGTGAAAGATTGCGGACGTGCTACCAGGTACCTCTTGCGGACGT
+GCTGCTCCTTAGAT
+>ds2020-267_1069
+ATTGCGGACGTGGAGAAGTACTAATTGCGGACGTGCGGGGGCCTCGCGTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1070
+CCAGACTCTTACCTTCCTCCAGACTCTTACCTTCCTCCAGACTCTTACCTTCCTCCAGAC
+TCTTACCTTCCTC
+>ds2020-267_1071
+TTGCGGACGTGTGGGTGGCAGAGATTGCGGACGTGCTGACCCCTATGCATTTGCGGACGT
+GCTGCTCCTTAGA
+>ds2020-267_1072
+TATCTAAGGGCAGCACGTCCGCAACGCGATTGCACTCACACGTCCGCAAGCCTCTTCCTT
+CACACGTCCGCAA
+>ds2020-267_1073
+CTAAGGAGCAGCACGTCCGCAAATCGTTATCCCTCAGCACGTCCGCAAAATGCATTACCT
+CAGCCGTCCGCAA
+>ds2020-267_1074
+TTTGCGGACGTAGGGAGCCGTAATTGCGGACGTGCTGACGAAACCTCCCTTGCGGACGTG
+CTGCTCTTAGATA
+>ds2020-267_1075
+GGACGTGCTGAGGGCCAACACCTTGCGGACGTGCTGAGAATATTAGATTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1076
+TATCTAAGGAGCAGCACGTCCGCAAAGATGGCCACCTCAGCACGTCCGCAAGTGTTATGT
+CCTCAGCACGTCC
+>ds2020-267_1077
+GGACGTGCTGAGTAGTAATAGCTTGCGGACGTGCTGAGGTAACTCACTTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1078
+TTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCCCTCTTCGGCCTTCACCTTTCCACTCT
+TGCGGACTTGCTG
+>ds2020-267_1079
+GGACGTGCTGAGTGGGACCGTATTGCGGACGTGCTGAGTGATCCTATTTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1080
+GGACGTGCTGAGGGTCTACGAATTGCGGACGTGCTGAGGGGTAAGTGCTTGCGGACGTGC
+TGCTCCTTAGATA
+>ds2020-267_1081
+TTGCGGACGTGCTGAGGCTATGGGGCTTGCGGACGTGCTAAGCGAGTAGTCTTGCGGACG
+GCTGCCCTTAGAT
+>ds2020-267_1082
+TTGCGGACGTGTGAGGGATTCAGAGTTGCGACGTGCTGAGAGCGGACACGTTGCGACGTG
+CTGCTCTTAGATA
+>ds2020-267_1083
+TTGCGGACGTGCTGAGGAAGAGGCTTTTGCGGACGTGCTGGGGTGAATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1084
+GGACGTGCTGAGGGAAAGACATTGCGGACGTGCTGACCGGTTGCCTATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1085
+TTGCGGACGTGGGGGCCAACCCTTGCGGACGTGCTGCCCATGACAACTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1086
+GGACGTGCTGAGGAGAGCGACCTTGCGGACGTGCTGAGTGTGTAACCTTTGCGGACGTGC
+TGCTCCTTAGAT
+>ds2020-267_1087
+TATCTAAGGAGCAGCACGTCCGCAACTCTGTGCACTCAGCACGTCCGCAACACACTTACC
+CTCGCACGTCCG
+>ds2020-267_1088
+GACGTGCTGAGCGGAAGATCTTTGCGGACGTGCTGAGGGGAACCGGATTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1089
+GGACGTGCTGAGGAACGAACGATTGCGGACGTGCTGCCCTGAACACCTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1090
+GGACGTGCTGAGGGCAAAGCTATTGCGGACGTGCTGGGGGAACTTGCTTGCGGACGTGCT
+GCTCCTTAGATA
+>ds2020-267_1091
+TATCTAAGGAGCAGCACGTCCGCAAGTGTGACGGGGCAGCACGTCCGCAAGTTACTCGCC
+CTCAGCACGTCC
+>ds2020-267_1092
+CGGACGTGCTGAGGGATCACTCGTTGCGGACGTGCTGAGGGGGAAAGTTTTGCGGACTGC
+TGCTCCTTAGAT
+>ds2020-267_1093
+GGACGTGCTGAGGAAGCTCGGATTGCGGACGTGCTGAGACCATAATAATTGCGGACGTGC
+TGCTCCTTAGAT
+>ds2020-267_1094
+AGTTGTATTGAAAAACTGGTACGCCCATCTTGTACAGTTGGCTGCAATGTCCCAACCTTG
+CGGACGTGCTG
+>ds2020-267_1095
+ATCTAAGGAGCAGCACGTCCGCAACATCCCGGCAGCACGTCCGCAAAATGGAGGCTCTCA
+CACGTCCGCAA
+>ds2020-267_1096
+TATCTAAGGAGCAGCACGTCCGCAACGATACTAACCTCAGCACGTCCGCAAGTTCTCCAC
+CCCAGCACGTC
+>ds2020-267_1097
+TTGCGGACGTGGAGGGTTTGGTAGTTGGGACGTGCTGAGGCGTATGACTTGCGGACGTGC
+TGCTCCTTAGA
+>ds2020-267_1098
+TATCTAAGAGCAGCACGTCCGCAAGGTAAGCCTCGTCAGCACGTCGCAAAGTTAAGTGCC
+TCAGCACGTCC
+>ds2020-267_1099
+GGACGTGCTGAGGTATCGCGGTTTGCGGACGTGCTGAGTAATCTACGTTTGCGGACGTGC
+TGCTCCTTAGA
+>ds2020-267_1100
+GGACGTGCTGACGGACTACTCCTTGCGGACGTGCAGGCGATCGTCATTGCGGACGTGCTG
+CTCCTTAGGTA
+>ds2020-267_1101
+TATCTAAGGAGCAGCACGTCCGCAAATGTGACCGGGTAGCACGTCCGCAACGCCTATTGA
+CTCAGCACGTC
+>ds2020-267_1102
+ATCTAAGGAGCAGCACGTCCGCAAATGACACTTCCTCAGCACGTCCGCAATACAGATCCG
+TCAGCACGTCC
+>ds2020-267_1103
+TATCTAAGGAGCAGCACGTCCGCAAGTCAATGGCCCTCACACGTCCGCAATAAGATATGC
+CTCGCACGTCC
+>ds2020-267_1104
+GACGTGCTGAGGGCTCACGACTTGCGGACGTGCTGAGTGGTAAGGCTTTGCGGACGTGCT
+CTCCTTAGATA
+>ds2020-267_1105
+ATCTAAGGAGCAGCACGTCCGCAAGGCCTCCCCACTCAGCCGTCCGCAATGGTCCTACCC
+TCAGCACGTCC
+>ds2020-267_1106
+GACGTGCTGATGGTCTGGTGATTGCGGACGTGCTGAGGAGTTAGGCTTGCGGACGTGCTG
+CTCGTTAGATA
+>ds2020-267_1107
+TCCGATCTACCTAAGGAGCAGCACGTCCGCAAATTCTAACTCTTAGCACGTCGCAAGTGG
+GCAGCACGTCC
+>ds2020-267_1108
+GCGGACGTGCTGCCCGGTAAAGCTTGCGGACGTGCTGAGCGGTGTAAGCTTGCGGACGTG
+CTGCTCCTTAG
+>ds2020-267_1109
+TTGCGGACGTGCTGGCGGACGTGCTGAGGTGAACAAATTTGCGGACGTGCTGCTCCTTAG
+ATAGATCGGA
+>ds2020-267_1110
+TCCGATCTATCTAAGGAGCAGCAGTCCGCAAGAATCATAGACTCACACGTCCGCAACGAT
+CAGCACGTCC
+>ds2020-267_1111
+TCTAAGGAGCAGCACGTCCGCAATGGTTGCATCCTCAGCACGTCCGCAATCCAGTGTCCC
+TCAGCACGTC
+>ds2020-267_1112
+TCTAAGGAGCAGCACGTCCGCAATACGACCTGGGCAGCACGTCCCAAGCATACTCACCTC
+ACGTCCGCA
+>ds2020-267_1113
+TATCTAAGGGCGCACGTCCGCAAGGAGTTAGGGGTAGCACGTCGCAAGCTGCAGTCTCTC
+AGCACGTCC
+>ds2020-267_1114
+GGACGTGCTGCCCGCTAAAGGTTGGGACGTGCTGGGAGATTGCTATTGCGGACGTGCTGC
+TCCTTAGAT
+>ds2020-267_1115
+TATCTAAGGAGCAGCACGTCCGCAAAAAGTGGCCCCTCAGCACGTCCGCAAGCTAAACCC
+CCTCAGCAC
+>ds2020-267_1116
+TAAGGAGCACCGTCCGCAATCTATTATGCTTAGCACGTCCGCAACCTCTACCAGTCACAC
+GTCCGCAA
+>ds2020-267_1117
+TAAGGAGCAGCACGTCCGCAATGGTCAATACTTAGCACGTCCGCAAGTAAGTTGGCCTAC
+GTCCGCAA
+>ds2020-267_1118
+GCGTTGGGACGTGCTGAGTGAATATACCTTGCGGACGTGCTGAGTGGATAGCAATTGCGG
+ACGTGCTG
+>ds2020-267_1119
+CTATCTAAGGAGCAGCACGTCCGCAAAAGACGCCCGGTAGCACGTCCGCAAAGATTACCT
+TGTCAGC
+>ds2020-267_1120
+TAAGGAGCAGCACGTCCGCAACCATCTCTCCCGCACGTCCCAGCTAGATGGCATCACACG
+TCCGCAA
+>ds2020-267_1121
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTGGGCAGCACGTCCGCAATGCAAT
+CCACGTC
+>ds2020-267_1122
+TTGCGGACGTGTGCCGAAGGGCATTGCGGACGTGCTGACGGTTTTAAGCTTGCGGACGTG
+CTGCTCC
+>ds2020-267_1123
+CAGCACGTCCGCAACGTGGTACGCCTCAGCACGTCCGCAACAATAGACCGCTCAGCACGT
+CCGCAAT
+>ds2020-267_1124
+TCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTCGAGGTATCTTC
+GAGGTA
+>ds2020-267_1125
+GAGCAGCACGTCCGCAACACTCGTCAACTCAGCACGTCCGCAATGACCCTGCTCTCCCGT
+CCGCAA
+>ds2020-267_1126
+GAGCAGCACGTCCGCAAACAGATAGCCCTCAGCACGTCCGCAAACGATAACGGGCCACGT
+CCGCAA
+>ds2020-267_1127
+GAGCAGCACGTCCGCAACGACAGACCCTTAGCACGTCCGCAAAGAAACCCGACTCCACGT
+CCGCAA
+>ds2020-267_1128
+CAGCACGTCCGCAACATCGGTCCCCTCAGCACGTCCGCAACGCACCTTCTCTCAGCACGT
+CCGCAA
+>ds2020-267_1129
+CAGCACGTCCGCAAGCTCATCTCCCTCAGCACGCCCGCAATCGTACCTGACTCAGCACGT
+CCGCAA
+>ds2020-267_1130
+CAGCACGTCCGCAACAGCTAGCTCCTCAGCACGTCCGCAAATGACTTTCCCTCAGCACGT
+CCGCAA
+>ds2020-267_1131
+TTGCGGACGTGCTGAGCGAAGGATAATTGCGGACGTGCTGAGGGGGGGCAAGTTGCGGAC
+GTGCTT
+>ds2020-267_1132
+CAGCACGTCCGCAATATGTCGTGGCTCAGCACGTCCGCAAAAAGTCCTCCCTCAGCACGT
+CCGCAA
+>ds2020-267_1133
+TCTAAGGAGCAGCACGTCCGCAACAAATACGCCGTCAGCACGTCGCAAATACAGGGCAGC
+ACGTCC
+>ds2020-267_1134
+GTTGCGGACGTGTGACAGAAGACTATTTGCGGACGTGCTGACAGAAGGGAAATTGCGGAC
+GTGCTG
+>ds2020-267_1135
+TTGCGGACGTGCTGAGACAGTAACTGTTGCGGACGTGCTGAGTGTGTAACCTTTGCGGAC
+GTGCTG
+>ds2020-267_1136
+TTGCGGACGTACTGAGGGAAATCAACTTGCGGACGTGCTAGCGGAACGGGGTTGCGACGT
+GCTGGT
+>ds2020-267_1137
+CAGCACGTCCGCAAGGAATACTCCTCAGCACGTCCGCAACCGATCGCCCCTCAGCACGTC
+CGCAAT
+>ds2020-267_1138
+TTGCGGACGTGCTGAGTGAGGGGGGCTTGCGGACGTGCTGAGGGAGTCGACTTTGCGGAC
+GTGCTG
+>ds2020-267_1139
+TTGCGGACGTGCTGAGGGATGACCTGTTGCGGACGTGCTGAGTGCATCGGTATTGCGGAC
+GTGCTG
+>ds2020-267_1140
+TTGCGGACGTGCTGAGTGGTCTATTATTGCGGACGTGCTGAGGGGTTTTCGATTGCGGAC
+GTGCTG
+>ds2020-267_1141
+TTTGCGGACGTGCTAAGGGTACGGAATTGCGGACGTGCTGAGCCCGCGACGTTTGCGGAC
+GTGCTG
+>ds2020-267_1142
+TTGCGGACGTGCTGAGGGAGAAGCAATTGCGGACGTGCTGATAGTAGAAGTGTTGCGGAC
+GTGCTG
+>ds2020-267_1143
+GCAGCACGTCCGCAATTGTACGCTACTCAGCACGTCCGCAATGCTCCTGGCCCACACGTC
+CGCAA
+>ds2020-267_1144
+GCAGCACGTCCGCAACATAAACTCTGTCAGCACGTCCCAATACGGTACACCTCACACGTC
+CGCAA
+>ds2020-267_1145
+AGCAGCACGTCCGCAAAGAAAGTTCCCTCAGCACGTCCGCAATTAACTACGGGCACACGT
+CCGCA
+>ds2020-267_1146
+CAGCACGTCCGCAAATACACACTCCTCAGCACGTCCGCAAGGGGGATACTCTCAGACGTC
+CGCAA
+>ds2020-267_1147
+GCAGCACGTCCGCAACATACAGTCCCTCAGCACGTCCCAATGTGTTGAACCTCGCACGTC
+CGCAA
+>ds2020-267_1148
+TTGCGGAGTGCTGGGGCACAACAATTGCGGACGTGCTGAGCCCACCTAGATTGCGGACGT
+GCTGC
+>ds2020-267_1149
+CAGCACGTCCGCAAGTCTATTCTCCTCAGCACGTCCGCAAAGCATATCCCCCAGCACGTC
+CGCAA
+>ds2020-267_1150
+CAGCACGTCCGCAACGTTACTTCCCTCAGCACGTCCCAAGGCACTCATCTCAGCACGTCC
+GCAAA
+>ds2020-267_1151
+CAGCACGTCCGCAAGAGCACTCTTCTCAGCACGTCCGCAATTGGTATGGCTTCACACGTC
+CGCAA
+>ds2020-267_1152
+CAGCACGTCCGCAATTGGACCACCTCAGCACGTCCGCAACTATTATACTCTCAGCACGTC
+CGCAA
+>ds2020-267_1153
+TTGCGGACGTGTGAGCCAAGTAGAGTTGCGGACGTGCTGACTGCGACAAGGTTGCGGACG
+TGCTG
+>ds2020-267_1154
+TTGCGGACGTGCTGAGGACTTACGATTGCGGACGTGCTGACCGGACAAACATTGCGGACG
+TGCTG
+>ds2020-267_1155
+TTGCGGACGTGCTGAGGGAAATGTCTTGCGGACGTGCTGAGTGAATACGCGTTGCGGACG
+TGCTG
+>ds2020-267_1156
+AGTATTTACCTTGACTTCGGGCTTTAAAAACGGATTGGAAAGCCCGAACGTCCAGGGGTT
+GCCAA
+>ds2020-267_1157
+CAGCACGTCCGCAACAGGAGTAACCTCAGCACGTCCGCAAACCTGTGTGGGCACACGTCC
+GCAA
+>ds2020-267_1158
+CAGCACGTCCGCAATGTGTAGTCCCTCAGCACGTCCGCATATGGAACCCCCAGCACGTCC
+GCAA
+>ds2020-267_1159
+AGCAGCACGTCCGCAATGTCTTCTCACTCAGCACGTCCGCAATATAAATCCTTGCCGTCC
+GCAA
+>ds2020-267_1160
+CAGCACGTCCGCAAGCTACTAATACTCACACGTCCGCAACACTCGTGCCCTCGCACGTCC
+GCAA
+>ds2020-267_1161
+CAGCCGTCCGCAACTTGGACTACCTCGCACGTCCGCAATTCGTAAGCCGTCAGCACGTCC
+GCAA
+>ds2020-267_1162
+TTGCGGACGTGCGAGGCGCTGTGGATTGCGGACGTGCTGACACAGTATCGATTGCGGACT
+GCTG
+>ds2020-267_1163
+CAGCACGTCCGCAATGTCATAGCCCTAGCCGTCCGCAACACTGGTGCCCTCAGCACGTCC
+GCAA
+>ds2020-267_1164
+CAGCACGTCCGCAATGGTAGTCCCCTCAGCACGTCCGCAAGATGTTTGGGCTGCACGTCC
+GCAA
+>ds2020-267_1165
+TTGCGGACGTGCAACCATTAGATATTGCGGACGTGCTGAGGGGCCGATATTTGCGGACGT
+GCTG
+>ds2020-267_1166
+TTGCGGACGTGGACCGAGAGAGTATTGCGGACGTGCTGAGGAGTAATGGATTGCGGACGT
+GCTG
+>ds2020-267_1167
+CAGCACGTCCGCAAACGATGATGCCTCAGCACGTCCGCATCTGGAAGTAAGGACGTTCGG
+GCTT
+>ds2020-267_1168
+ATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGGTTGTATGG
+TTG
+>ds2020-267_1169
+CAGCACGTCCGCAAACCGACACAGGTGGGCGAGATGAGTATTCTAAGGCGCTTGAGAGAA
+CTC
+>ds2020-267_1170
+CAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAATTGGTCAAT
+TGG
+>ds2020-267_1171
+CAGCCGTCCGCAACGTTCATTCCCTCAGCACGTCCGCAACCGCTAGCTCTCGCACGTCCG
+CAA
+>ds2020-267_1172
+CAGCACGTCCGCAATCTGAGGTACCCAGCCGTCCGCAATGGCTCGTGTCTCGCACGTCCG
+CAA
+>ds2020-267_1173
+TTGCGGACGTGCTGAGTGAAGCAGGGTTGCGGACGTGTGGGAGAGTCTGGTTGCGGACTG
+CTG
+>ds2020-267_1174
+TTGCGGACGTGAGTATAGAATGGTTGCGGACGTGCTGAGTACGTTTTGCTTGCGGACGTG
+CTG
+>ds2020-267_1175
+GGACGTGCTGAGGGTTGACATCTTGCGGACGTGCTGAGCTGTCTCCTCTTGCGGACGTGC
+TGC
+>ds2020-267_1176
+CTGTCTAAGGAGCAGCACGTCCGCAACTGCCGCAGAGTCTTGGTTAACGTCAATGGGTTT
+TAG
+>ds2020-267_1177
+TCTTCCAATCTATCTAAGGAGCAGCACGTCCGCAAGCTACGGTCTCTCAGCACGTCCGCA
+ATT
+>ds2020-267_1178
+GCAGCACGTCCGCAAAACTAGATCGGCAGCACGTCCGCAAGGGCTAATGACTCAGCACGT
+CC
+>ds2020-267_1179
+CAGCACGTCCGCAAGGATAGGTCACTCAGCACGTCCGCAAACCACCTGCCCTCAGCACGT
+CC
+>ds2020-267_1180
+CAGCAGTCCGCAACAGATACCGACTAGCACGTCCGCAAACCCCCTACGCCAGACGTCCGC
+AA
+>ds2020-267_1181
+GGACGTGCTGAAGGAGATAACATTGCGGACGCGCTGAGGTCAGCTGGTTTGCGGACGTGC
+TG
+>ds2020-267_1182
+GGACGTGCTGAGGGACCGAGTATTGCGGACGTGCTGAGTGTGGCTTCATTGCGGCGTGCT
+GC
+>ds2020-267_1183
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACCTATTCGCCCTCAGCACGTCCGCA
+AT
+>ds2020-267_1184
+CTATTGCGGACGTGCTAAGGTCTATATTTTGCGGACGTGCTGCTCCTTAGATAGATCGGT
+AG
+>ds2020-267_1185
+CATATTTGGCATGGCGTTCGTCTTACACAGAAGAGTAAGCCCGAACGTCCAGCCAGTGAC
+GT
+>ds2020-267_1186
+TTGCGGACGTGCTGAGTGCTAGTTTCTTGCGGACGTGCTGCTCCTTAGATAGATCCGAAG
+AG
+>ds2020-267_1187
+TTGCGGACGTGCTGACCCTATACTAATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAT
+AG
+>ds2020-267_1188
+TCTTCCAATCTATCTAAGGAGCAGCACGTCCGCAAACTGCCCGCGCCCAGCACGTCCGCA
+AT
+>ds2020-267_1189
+AGCAGCACGTCCGCAAACAGAAGGCCTCGCACGTCCGCACTTTCCTCGTCTCAGCACGTC
+C
+>ds2020-267_1190
+CAGCACGTCCGCAATCTGGAACTACTCAGCACGTCCGCAAACTTCTCCGGCTCAGCACGT
+C
+>ds2020-267_1191
+CAGCAGTCCGCAAGTGATGACATCTCAGCACGTCCGCAATTGACGTCCACTCAGCACGTC
+C
+>ds2020-267_1192
+AAGCACGTCCGCAAAACATCGGGGCTCAGCACGTCCCAAAACTGCCCCACTCAGCACGTC
+C
+>ds2020-267_1193
+GACGTGCTGAGCGATTTTATGTTGCGGACGTGCTGAGGCTTGACTTTTTGCGGACGTGCT
+G
+>ds2020-267_1194
+CAGCACGTCCGCAAAACTTTGTCCCTCAGCACGTCCGAACCCTTAACTACTCAGCACGTC
+C
+>ds2020-267_1195
+GACGTGCTGACGGAACAGAACTTGCGGACGTGCTGAGTGGTGCCAGTTGCGGAGTGCTGC
+T
+>ds2020-267_1196
+TTTGCGGACGTGCTGACCCAGTCAACTTTGCGGACTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1197
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAAAGTCAATAGCCTCACACGTCCGCAAT
+C
+>ds2020-267_1198
+GTTGCGGACGTGCTGAGGGTACTCGATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1199
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCACATATCCCTCAGCACGTCCGCAA
+A
+>ds2020-267_1200
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAACCGGTCTGCCCTCAGCACGTCCGCAAA
+G
+>ds2020-267_1201
+TTGCGGACGTGCTGAGGGGATTGACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1202
+CTTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATAGCGTACATCTCAGCACGTCCGCA
+A
+>ds2020-267_1203
+TTTGCGGACGTGCTGACCCGGGATCCATTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+G
+>ds2020-267_1204
+TCGTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCGTTCGACCCTCAGCACGTCCGCA
+A
+>ds2020-267_1205
+TCTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGACCTCGCGCCTCAGCACGTCCGCA
+A
+>ds2020-267_1206
+TTGCGGACGTGCTGAGGACGCTTACTTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAA
+G
+>ds2020-267_1207
+CTTCCCGATCTATCTAAGGAGCAGCACGTCCGCAAGATATACGACATCAGCACGTCCGCA
+A
+>ds2020-267_1208
+TTGCGGACGTGCTGAAGGGCTACTTTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1209
+CTTGCGGACGTGCTGAGTACAATATCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+G
+>ds2020-267_1210
+TTGCGGACGTGCTGACCGGATCTAAGTTGCGGACGTGCTGCTCCTTAGATAGATCGTAAG
+A
+>ds2020-267_1211
+TTGCGGACGTGCTGAGGGGATTCGCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+A
+>ds2020-267_1212
+CAGCACGTCCGCAAACGATAGGCGTTAGCACGTCCGCAAGTTTATACGCCTCAGCACGTC
+>ds2020-267_1213
+CAGCACGTCCGCAATGCAGACCCTTTAGCACGTCCGCAATTCGGCACTCTCAGCACGTCC
+>ds2020-267_1214
+TTGCGGACGCGCTGGACGTGCTGATCAAGGCGCATTTGCGGACGTGCTGCTCCTTAGATA
+>ds2020-267_1215
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTACACCCACCTCAGCACGTCCGCAA
+>ds2020-267_1216
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGTGATGATCTCTCAGCACGTCCGCAA
+>ds2020-267_1217
+GCAGCCGTCCGCAACCAACTGCTGCTCAGCACGTCGCAAGTCATATGGCCTCAGCACGTC
+>ds2020-267_1218
+GGACGTGCTGAGGACTGCTACATTGGGACGTGCTAAGCGAGCATGGTTGCGGACGTGCTG
+>ds2020-267_1219
+TTGCGGACGTGCTGAGGTATGGTAGATTGCGGACTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1220
+TTGCGGACGTGCTGAGGGATCCGCAGTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1221
+TTGCGGACGTGCTGAGGGGCGTGCTATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1222
+TTGCGGACGTGCTGAGCCATGCACACTTGCGGACTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1223
+TTGCGGACGTGCTGAGTCCCGACCACTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1224
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAAATCAAAGTACCTCAGCACGTCCGCAA
+>ds2020-267_1225
+TCTCCGATCTATCTAAGGAGCAGCACGTCCGCAACGTAGGATCTGTCAGCACGTCCGCAA
+>ds2020-267_1226
+TTGCGGACGTGCTGAGGATTCCACATTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1227
+TTGCGGACGTGCTGAGGTAAGGAGCATTGCGGACGTGCTGCTCCTTAGATAGATCGGGAG
+>ds2020-267_1228
+CTCTCCGATCTATCTAAGGAGCAGCACGTCCGCAAGCGTTATCCCTCAGCACGTCCGCAA
+>ds2020-267_1229
+TTGCGGACGTGCTGCCCGGATAACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1230
+TTGCGGACGTGCTGCCGAGATAACATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1231
+TTGCGGACGTGCTGAGAGAATCAAGTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAAG
+>ds2020-267_1232
+TTGCGGACGTGCTACCCCGTGATACTTGCGGACGTGCTGCTCCTTAGATAGATCGAAAGA
+>ds2020-267_1233
+TTGCGGACGTGCTGAGGGGATCCTTATTGCGGACGTGCTGCTCCTTAGATAGATCGGAAG
+>ds2020-267_1234
+TCCGATCTATCTAAGGAGCAGCACGTCCGCAACCTGCTATCCGTCAGCACGTCCGCAACT
+>ds2020-267_1235
+TGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGAGTGA
+>ds2020-267_1236
+CCACTGCCACTGCCACTGTTGAGACTATCCCCCAAGCCAAAGGTATTGCGGACGTGCTG
+>ds2020-267_1237
+TTGCGGACGTGCTGACTGAGAGGGCATTGCGGAAGTGATCACGTATTGCGGACGTGCTG
+>ds2020-267_1238
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAAATTCATTCTGGTCAGCACGTCCGCAA
+>ds2020-267_1239
+ATTGCGGACGTGCTGAGGCACTGTTCGTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_1240
+TTGCGGACGTGCTGATGGGTTTCGTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_1241
+CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAACGTGCTATGCCTCACACGTCCGCAA
+>ds2020-267_1242
+TTGCGGACGTGCTGAGGGAACCGGCTTTGCGGACGTGCTGCTCCTTAGATAGATCGGAA
+>ds2020-267_1243
+TTCCGATCTATCTAAGGAGCAGCACGTCCGCAATCCGATTGCCCTCAGCACGTCCGCAA
+>ds2020-267_1244
+CTTCGATCTATCTAAGGAGCAGCACGTCCGCAAGAGATTACTCCTCAGCACGTCCGCAA
+>ds2020-267_1245
+TTGCGGACGTGCTGGGGAGTATTGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGGAG
+>ds2020-267_1246
+TTAGAGGGACTATCGGCTCAAGCCGATGGAAGTTTGAGGCAATAACAGGTCTGTGCTG
+>ds2020-267_1247
+TTGCGGACGTGCTGAGGCGATACCTCTTGCGGACGTGCTGCTCCTTAGATAGATCGGA
+>ds2020-267_1248
+GTAAAAGCTCACTGGTAACCGGTCCAAAACGAAACTCTTAAAACAGTGGATACCCTCC
+>ds2020-267_1249
+CGGACGTGCTGAGACAATGGCGCTTGCGGACGTGCTGCTCCTTAGATAGATCGGAAGA
+>ds2020-267_1250
+CCCGATCTATCTAAGGAGCAGCACGCCCGCAAATGTACACCGGTCAGCACGTCCGCAA
+>ds2020-267_1251
+TCCGATCTATCTAAGGAGCAGCACGTCCGCAAGGTAGACGCCCTCAGCACGTCCGCAA
+>ds2020-267_1252
+GTGCTGAGCCAGACTACTTGCGGACGTGCTGAGGGAGCCTAAATTGCGGACGTGCTG
+>ds2020-267_1253
+TTGCGGACGTGCTGAGTGTTTACAATTTGCGGACGTGCTGCTCCTTAGATAGATCGG
+>ds2020-267_1254
+TGCTGAGCGACTATAAATTGCGGACGTGCTGAGGGATTCACCGTTGCGGACGTGCTG
+>ds2020-267_1255
+TTGCGGACGTGCTGACGGACGACTATTTGCGGACGTGCTGCTCCTTAGATAGATCGG
+>ds2020-267_1256
+GGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG
+>ds2020-267_1257
+GCTGAGGGCAGTGGGCTTGCGGACGTGCTGACGGATACGTCATTGCGGGCGTGCTG
+>ds2020-267_1258
+CTCACTCCTCAGCACGTCCGCAAACTGCTTCGGGTTGGGACGTGCTGAGGAGTGAC
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s1_rps.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s1_rps.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,109 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom no rank family genus
+"ds2020-267_100" "376" "pfam02823" "gnl|CDD|376940" "3.06167e-09" "228" "347" "-3" "pfam02823, ATP-synt_DE_N, ATP synthase, Delta/Epsilon chain, beta-sandwich domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. The subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213)." "Bacteria(0.97);Eukaryota(0.03);" "(1.00);" "Lactobacillaceae(0.05);Rhodobacteraceae(0.04);Streptococcaceae(0.03);Bacillaceae(0.03);Burkholderiaceae(0.02);" "Lactobacillus(0.04);Streptococcus(0.03);Bacillus(0.02);Mycoplasma(0.02);Synechococcus(0.01);"
+"ds2020-267_100" "376" "pfam00401" "gnl|CDD|366077" "8.90041e-05" "87" "218" "-3" "pfam00401, ATP-synt_DE, ATP synthase, Delta/Epsilon chain, long alpha-helix domain. Part of the ATP synthase CF(1). These subunits are part of the head unit of the ATP synthase. This subunit is called epsilon in bacteria and delta in mitochondria. In bacteria the delta (D) subunit is equivalent to the mitochondrial Oligomycin sensitive subunit, OSCP (pfam00213)." "Bacteria(0.97);Eukaryota(0.03);" "(1.00);" "(0.06);Clostridiaceae(0.05);Lachnospiraceae(0.05);Bacillaceae(0.04);Peptococcaceae(0.04);" "(0.06);Clostridium(0.05);Lactobacillus(0.03);Bacillus(0.03);Eubacterium(0.02);"
+"ds2020-267_114" "347" "pfam00471" "gnl|CDD|376336" "8.05888e-12" "132" "302" "3" "pfam00471, Ribosomal_L33, Ribosomal protein L33. " "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "(0.07);Mycoplasmataceae(0.07);Clostridiaceae(0.06);Bacillaceae(0.03);Lactobacillaceae(0.03);" "Mycoplasma(0.06);Clostridium(0.05);(0.04);Lactobacillus(0.02);Bacillus(0.02);"
+"ds2020-267_117" "344" "pfam00252" "gnl|CDD|376306" "7.27175e-23" "107" "295" "2" "pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. " "Bacteria(0.58);Eukaryota(0.29);Archaea(0.13);" "(1.00);" "(0.08);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);" "(0.04);Clostridium(0.03);Mycoplasma(0.02);"
+"ds2020-267_118" "343" "pfam00421" "gnl|CDD|366090" "7.68219e-41" "92" "337" "-1" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_120" "339" "pfam16639" "gnl|CDD|374695" "2.20279e-25" "197" "325" "-3" "pfam16639, Apocytochr_F_N, Apocytochrome F, N-terminal. This is the N-terminal domain of cytochrome f. It is a soluble lumen-side domain." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "Synechococcaceae(0.25);Gloeobacteraceae(0.07);Prochloraceae(0.07);Aphanothecaceae(0.07);(0.07);" "Synechococcus(0.21);Prochlorococcus(0.07);Gloeobacter(0.07);Oscillatoria(0.04);Aureococcus(0.04);"
+"ds2020-267_130" "330" "pfam00680" "gnl|CDD|366242" "7.64962e-05" "124" "282" "1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_139" "320" "pfam05860" "gnl|CDD|368641" "1.34887e-13" "167" "298" "2" "pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins." "Bacteria(1.00);" "(1.00);" "Nostocaceae(0.36);Burkholderiaceae(0.14);Pasteurellaceae(0.14);Pseudomonadaceae(0.12);Neisseriaceae(0.07);" "Nostoc(0.36);Ralstonia(0.14);Pseudomonas(0.12);Haemophilus(0.10);Neisseria(0.07);"
+"ds2020-267_145" "315" "pfam02626" "gnl|CDD|376868" "3.97676e-05" "140" "256" "-3" "pfam02626, CT_A_B, Carboxyltransferase domain, subdomain A and B. Urea carboxylase (UC) catalyzes a two-step, ATP- and biotin-dependent carboxylation reaction of urea. It is composed of biotin carboxylase (BC), carboxyltransferase (CT), and biotin carboxyl carrier protein (BCCP) domains. The CT domain of UC consists of four subdomains, named A, B, C and D. This domain covers the A and B subdomains of the CT domain. This domain covers the whole length of KipA (kinase A) from Bacillus subtilis. It can also be found in S. cerevisiae urea amidolyase Dur1,2, which is a multifunctional biotin-dependent enzyme with domains for urea carboxylase and allophanate (urea carboxylate) hydrolase activity." "Bacteria(0.86);Eukaryota(0.13);Archaea(0.01);" "(1.00);" "Bacillaceae(0.03);Pseudonocardiaceae(0.03);Clostridiaceae(0.03);Corynebacteriaceae(0.03);Streptomycetaceae(0.03);" "Clostridium(0.03);Corynebacterium(0.03);Pseudomonas(0.02);Streptomyces(0.02);Bacillus(0.02);"
+"ds2020-267_16" "1165" "pfam02123" "gnl|CDD|280316" "1.58664e-38" "536" "1078" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_168" no_hit
+"ds2020-267_176" "291" "pfam01235" "gnl|CDD|376500" "1.13408e-29" "115" "243" "1" "pfam01235, Na_Ala_symp, Sodium:alanine symporter family. " "Bacteria(1.00);" "(1.00);" "Bacillaceae(0.10);Lachnospiraceae(0.07);Clostridiaceae(0.06);(0.06);Corynebacteriaceae(0.03);" "Bacillus(0.06);Clostridium(0.06);(0.06);Corynebacterium(0.03);Blautia(0.03);"
+"ds2020-267_187" "287" "pfam02673" "gnl|CDD|376891" "3.59766e-13" "7" "156" "1" "pfam02673, BacA, Bacitracin resistance protein BacA. Bacitracin resistance protein (BacA) is a putative undecaprenol kinase. BacA confers resistance to bacitracin, probably by phosphorylation of undecaprenol. More recent studies show that BacA has undecaprenyl pyrophosphate phosphatase activity. Undecaprenyl phosphate is a key lipid intermediate involved in the synthesis of various bacterial cell wall polymers. Bacitracin, a mixture of related cyclic polypeptide antibiotics, is used to treat surface tissue infections. Its primary mode of action is the inhibition of bacterial cell wall synthesis through sequestration of the essential carrier lipid undecaprenyl pyrophosphate, C55-PP, resulting in the loss of cell integrity and lysis. The characteristic phosphatase sequence-motif in this family is likely to be the PGxSRSGG, compared with the PSGH of the PAP family of phosphatases." "Bacteria(0.97);Archaea(0.03);" "(1.00);" "Clostridiaceae(0.08);(0.06);Lachnospiraceae(0.03);Ruminococcaceae(0.02);Bacillaceae(0.02);" "Clostridium(0.08);(0.04);Bacillus(0.02);Eubacterium(0.02);Prevotella(0.01);"
+"ds2020-267_2" "2436" "pfam02123" "gnl|CDD|280316" "2.17343e-21" "184" "1476" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_20" "893" "pfam00006" "gnl|CDD|376291" "4.59259e-49" "498" "866" "3" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-267_20" "893" "pfam02874" "gnl|CDD|367225" "7.30466e-19" "126" "329" "3" "pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella." "Bacteria(0.60);Eukaryota(0.28);Archaea(0.13);" "(1.00);" "Spirochaetaceae(0.04);Bacillaceae(0.04);Schizosaccharomycetaceae(0.03);Chlamydomonadaceae(0.03);Sulfolobaceae(0.03);" "Treponema(0.04);Schizosaccharomyces(0.03);Chlamydomonas(0.03);Bacillus(0.03);Thermotoga(0.02);"
+"ds2020-267_203" "281" "pfam03040" "gnl|CDD|367312" "1.76794e-22" "121" "231" "-3" "pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally." "Bacteria(0.77);Eukaryota(0.23);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.08);Microcoleaceae(0.06);Chlorellaceae(0.04);Merismopediaceae(0.04);" "Synechococcus(0.13);Oscillatoria(0.04);Physcomitrella(0.04);Microcystis(0.04);Synechocystis(0.04);"
+"ds2020-267_206" "279" "pfam03947" "gnl|CDD|377170" "2.63457e-16" "155" "265" "2" "pfam03947, Ribosomal_L2_C, Ribosomal Proteins L2, C-terminal domain. " "Bacteria(0.62);Eukaryota(0.27);Archaea(0.11);" "(1.00);" "(0.09);Mycoplasmataceae(0.03);Clostridiaceae(0.02);Spirochaetaceae(0.01);Ruminococcaceae(0.01);" "(0.05);Mycoplasma(0.02);Clostridium(0.02);"
+"ds2020-267_21" "858" "pfam00680" "gnl|CDD|366242" "8.36679e-11" "295" "729" "-1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_210" "276" "pfam17917" "gnl|CDD|375428" "1.59337e-13" "52" "240" "1" "pfam17917, RT_RNaseH, RNase H-like domain found in reverse transcriptase. DNA polymerase and ribonuclease H (RNase H) activities allow reverse transcriptases to convert the single-stranded retroviral RNA genome into double-stranded DNA, which is integrated into the host chromosome during infection. This entry represents the RNase H like domain." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_214" "276" "pfam07992" "gnl|CDD|369639" "2.55939e-07" "129" "254" "3" "pfam07992, Pyr_redox_2, Pyridine nucleotide-disulphide oxidoreductase. This family includes both class I and class II oxidoreductases and also NADH oxidases and peroxidases. This domain is actually a small NADH binding domain within a larger FAD binding domain." "Bacteria(0.82);Eukaryota(0.09);Archaea(0.09);" "(1.00);" "Pseudomonadaceae(0.12);Nocardiaceae(0.07);Thermococcaceae(0.05);Enterobacteriaceae(0.05);Merismopediaceae(0.05);" "Pseudomonas(0.12);Rhodococcus(0.07);Synechocystis(0.05);Pyrococcus(0.05);Streptococcus(0.04);"
+"ds2020-267_218" "274" "pfam01348" "gnl|CDD|279664" "1.66328e-05" "51" "257" "3" "pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.40);Brassicaceae(0.20);Schizosaccharomycetaceae(0.20);Poaceae(0.20);" "Saccharomyces(0.40);Hordeum(0.20);Schizosaccharomyces(0.20);Baimashania(0.20);"
+"ds2020-267_227" "272" "pfam00873" "gnl|CDD|334294" "2.32215e-15" "36" "245" "-1" "pfam00873, ACR_tran, AcrB/AcrD/AcrF family. Members of this family are integral membrane proteins. Some are involved in drug resistance. AcrB cooperates with a membrane fusion protein, AcrA, and an outer membrane channel TolC. The structure shows the AcrB forms a homotrimer." "Bacteria(1.00);" "(1.00);" "Enterobacteriaceae(0.40);Merismopediaceae(0.20);Pseudomonadaceae(0.13);Helicobacteraceae(0.13);Burkholderiaceae(0.07);" "Escherichia(0.40);Synechocystis(0.20);Pseudomonas(0.13);Helicobacter(0.13);Cupriavidus(0.07);"
+"ds2020-267_230" "268" "pfam00115" "gnl|CDD|376293" "1.95663e-15" "81" "236" "-3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-267_261" "260" "pfam01051" "gnl|CDD|376444" "1.77523e-19" "26" "217" "-2" "pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene." "Bacteria(0.97);(0.02);" "(0.99);" "Streptococcaceae(0.08);Enterobacteriaceae(0.07);Campylobacteraceae(0.07);Lactobacillaceae(0.07);Pasteurellaceae(0.06);" "Lactococcus(0.07);Campylobacter(0.07);Lactobacillus(0.06);Acinetobacter(0.04);Escherichia(0.04);"
+"ds2020-267_268" "259" "pfam02123" "gnl|CDD|280316" "3.22949e-21" "18" "251" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_274" "258" "pfam03713" "gnl|CDD|367619" "2.00811e-09" "24" "185" "-2" "pfam03713, DUF305, Domain of unknown function (DUF305). Domain found in small family of bacterial secreted proteins with no known function. Also found in Paramecium bursaria chlorella virus 1. This domain is short and found in one or two copies. The domain has a conserved HH motif that may be functionally important. This domain belongs to the ferritin superfamily. It contains two sequence similar repeats each of which is composed of two alpha helices." "Bacteria(1.00);" "(1.00);" "Nocardiaceae(0.13);Mycobacteriaceae(0.13);Pseudonocardiaceae(0.10);Kineosporiaceae(0.08);Micromonosporaceae(0.08);" "Nocardia(0.13);Mycolicibacterium(0.13);Saccharopolyspora(0.10);Kineococcus(0.08);Streptomyces(0.08);"
+"ds2020-267_278" "258" "pfam00012" "gnl|CDD|365808" "4.1355e-19" "50" "232" "2" "pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region." "Eukaryota(0.54);Bacteria(0.38);Archaea(0.08);" "(1.00);" "Saccharomycetaceae(0.12);Schizosaccharomycetaceae(0.08);Enterobacteriaceae(0.08);Hominidae(0.08);Plasmodiidae(0.04);" "Homo(0.08);Schizosaccharomyces(0.08);Escherichia(0.08);Saccharomyces(0.08);Synechocystis(0.04);"
+"ds2020-267_280" "257" "pfam01788" "gnl|CDD|366811" "2.47901e-09" "132" "224" "-1" "pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Microcoleaceae(0.12);Prochloraceae(0.08);Oscillatoriaceae(0.08);Synechococcaceae(0.08);Chroococcaceae(0.08);" "Oscillatoria(0.08);Prochlorococcus(0.08);Synechococcus(0.08);Ectocarpus(0.04);Arenga(0.04);"
+"ds2020-267_283" "257" "pfam13041" "gnl|CDD|372443" "3.148e-06" "13" "114" "1" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-267_287" "256" "pfam00115" "gnl|CDD|376293" "2.8946e-26" "13" "237" "1" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-267_312" "252" "pfam00585" "gnl|CDD|278982" "1.52007e-05" "29" "166" "2" "pfam00585, Thr_dehydrat_C, C-terminal regulatory domain of Threonine dehydratase. Threonine dehydratases pfam00291 all contain a carboxy terminal region. This region may have a regulatory role. Some members contain two copies of this region. This family is homologous to the pfam01842 domain." "Bacteria(0.69);Eukaryota(0.31);" "(1.00);" "Solanaceae(0.23);Enterobacteriaceae(0.15);Pasteurellaceae(0.15);Bacillaceae(0.08);Burkholderiaceae(0.08);" "Solanum(0.23);Haemophilus(0.15);Salmonella(0.15);Mycobacterium(0.08);Saccharomyces(0.08);"
+"ds2020-267_315" "251" "pfam00989" "gnl|CDD|366402" "1.61999e-05" "32" "241" "2" "pfam00989, PAS, PAS fold. The PAS fold corresponds to the structural domain that has previously been defined as PAS and PAC motifs. The PAS fold appears in archaea, eubacteria and eukarya." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Bacillaceae(0.14);Enterobacteriaceae(0.14);Bradyrhizobiaceae(0.12);Brassicaceae(0.08);Drosophilidae(0.06);" "Bacillus(0.14);Bradyrhizobium(0.12);Escherichia(0.10);Arabidopsis(0.08);Drosophila(0.06);"
+"ds2020-267_316" "251" "pfam02123" "gnl|CDD|280316" "3.50628e-08" "28" "228" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_318" "251" "pfam00252" "gnl|CDD|376306" "5.63854e-12" "78" "206" "-1" "pfam00252, Ribosomal_L16, Ribosomal protein L16p/L10e. " "Bacteria(0.58);Eukaryota(0.29);Archaea(0.13);" "(1.00);" "(0.08);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);" "(0.04);Clostridium(0.03);Mycoplasma(0.02);"
+"ds2020-267_323" "250" "pfam00227" "gnl|CDD|365960" "5.8155e-09" "10" "150" "-2" "pfam00227, Proteasome, Proteasome subunit. The proteasome is a multisubunit structure that degrades proteins. Protein degradation is an essential component of regulation because proteins can become misfolded, damaged, or unnecessary. Proteasomes and their homologs vary greatly in complexity: from HslV (heat shock locus v), which is encoded by 1 gene in bacteria, to the eukaryotic 20S proteasome, which is encoded by more than 14 genes. Recently evidence of two novel groups of bacterial proteasomes was proposed. The first is Anbu, which is sparsely distributed among cyanobacteria and proteobacteria. The second is call beta-proteobacteria proteasome homolog (BPH)." "Eukaryota(0.68);Archaea(0.21);Bacteria(0.11);" "(1.00);" "Drosophilidae(0.11);Rhabditidae(0.07);Schizosaccharomycetaceae(0.07);Unikaryonidae(0.07);Saccharomycetaceae(0.07);" "Drosophila(0.11);Schizosaccharomyces(0.07);Caenorhabditis(0.07);Saccharomyces(0.07);Encephalitozoon(0.07);"
+"ds2020-267_329" "249" "pfam13173" "gnl|CDD|379049" "4.80752e-08" "106" "249" "1" "pfam13173, AAA_14, AAA domain. This family of domains contain a P-loop motif that is characteristic of the AAA superfamily." "Bacteria(0.78);Archaea(0.22);" "(1.00);" "Bacteroidaceae(0.12);Coxiellaceae(0.09);Mycoplasmataceae(0.09);Sulfolobaceae(0.08);Prevotellaceae(0.05);" "Bacteroides(0.12);Coxiella(0.09);Mycoplasma(0.09);Prevotella(0.05);Sulfurisphaera(0.04);"
+"ds2020-267_33" "680" "pfam04157" "gnl|CDD|367847" "4.86455e-13" "342" "494" "-1" "pfam04157, EAP30, EAP30/Vps36 family. This family includes EAP30 as well as the Vps36 protein. Vps36 is involved in Golgi to endosome trafficking. EAP30 is a subunit of the ELL complex. The ELL is an 80-kDa RNA polymerase II transcription factor. ELL interacts with three other proteins to form the complex known as ELL complex. The ELL complex is capable of increasing that catalytic rate of transcription elongation, but is unable to repress initiation of transcription by RNA polymerase II as is the case of ELL. EAP30 is thought to lead to the derepression of ELL's transcriptional inhibitory activity." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.06);Debaryomycetaceae(0.05);(0.03);Schizosaccharomycetaceae(0.02);Mamiellaceae(0.02);" "Candida(0.02);Schizosaccharomyces(0.02);Micromonas(0.02);Leishmania(0.01);Naumovozyma(0.01);"
+"ds2020-267_336" "248" "pfam00113" "gnl|CDD|365883" "4.23282e-13" "15" "116" "-1" "pfam00113, Enolase_C, Enolase, C-terminal TIM barrel domain. " "Eukaryota(0.67);Bacteria(0.33);" "(1.00);" "Pleosporaceae(0.11);Bacillaceae(0.11);Anatidae(0.11);Schizosaccharomycetaceae(0.11);Debaryomycetaceae(0.11);" "Shigella(0.11);Anas(0.11);Bipolaris(0.11);Zea(0.11);Bacillus(0.11);"
+"ds2020-267_352" "245" "pfam00946" "gnl|CDD|366381" "3.23548e-05" "1" "141" "1" "pfam00946, Mononeg_RNA_pol, Mononegavirales RNA dependent RNA polymerase. Members of the Mononegavirales including the Paramyxoviridae, like other non-segmented negative strand RNA viruses, have an RNA-dependent RNA polymerase composed of two subunits, a large protein L and a phosphoprotein P. This is a protein family of the L protein. The L protein confers the RNA polymerase activity on the complex. The P protein acts as a transcription factor." "Viruses(1.00);" "Riboviria(1.00);" "Paramyxoviridae(0.44);Rhabdoviridae(0.31);Pneumoviridae(0.12);Filoviridae(0.12);" "Lyssavirus(0.12);Aquaparamyxovirus(0.06);Rubulavirus(0.06);Respirovirus(0.06);Avulavirus(0.06);"
+"ds2020-267_363" "243" "pfam00416" "gnl|CDD|366086" "2.02528e-05" "15" "134" "-2" "pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes." "Eukaryota(0.55);Bacteria(0.27);Archaea(0.18);" "(1.00);" "Brassicaceae(0.18);Muridae(0.09);Poaceae(0.09);Drosophilidae(0.09);Mycobacteriaceae(0.09);" "Arabidopsis(0.18);Geobacillus(0.09);Rattus(0.09);Haloarcula(0.09);Shigella(0.09);"
+"ds2020-267_364" "243" "pfam00216" "gnl|CDD|365952" "1.5507e-10" "134" "241" "-3" "pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein. " "Bacteria(0.95);Eukaryota(0.02);Viruses(0.01);Archaea(0.01);" "(0.99);Caudovirales(0.01);" "Tannerellaceae(0.09);Mycoplasmataceae(0.06);Pseudomonadaceae(0.05);Aquificaceae(0.05);Bacteroidaceae(0.05);" "Parabacteroides(0.09);Mycoplasma(0.05);Pseudomonas(0.05);Bacteroides(0.05);Desulfovibrio(0.04);"
+"ds2020-267_365" no_hit
+"ds2020-267_369" "243" "pfam12137" "gnl|CDD|378818" "6.51052e-05" "137" "217" "-3" "pfam12137, RapA_C, RNA polymerase recycling family C-terminal. This domain is found in bacteria. This domain is about 360 amino acids in length. This domain is found associated with pfam00271, pfam00176. The function of this domain is not known, but structurally it forms an alpha-beta fold in nature with a central beta-sheet flanked by helices and loops, the beta-sheet being mainly antiparallel and flanked by four alpha helices, among which the two longer helices exhibit a coiled-coil arrangement." "Bacteria(1.00);" "(1.00);" "Pasteurellaceae(0.14);Alteromonadaceae(0.07);Morganellaceae(0.05);Methylococcaceae(0.05);Shewanellaceae(0.04);" "(0.04);Marinobacter(0.04);Shewanella(0.04);Pseudomonas(0.03);Psychromonas(0.03);"
+"ds2020-267_370" "242" "pfam00146" "gnl|CDD|376297" "2.41391e-10" "22" "111" "1" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-267_374" "242" "pfam00124" "gnl|CDD|365890" "5.09126e-07" "21" "125" "3" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-267_388" "241" "pfam02123" "gnl|CDD|280316" "6.16383e-08" "35" "214" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_4" "2297" "pfam02123" "gnl|CDD|280316" "1.96254e-52" "824" "1858" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_402" no_hit
+"ds2020-267_404" "239" "pfam00361" "gnl|CDD|366050" "3.50341e-05" "70" "219" "1" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-267_407" "239" "pfam00177" "gnl|CDD|365924" "1.14399e-06" "28" "126" "1" "pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes." "Bacteria(0.79);Archaea(0.11);Eukaryota(0.10);" "(1.00);" "(0.09);Clostridiaceae(0.04);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Ruminococcaceae(0.01);" "(0.04);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);Desulfovibrio(0.01);"
+"ds2020-267_42" "575" "pfam00284" "gnl|CDD|366000" "1.02897e-21" "187" "300" "1" "pfam00284, Cytochrom_B559a, Lumenal portion of Cytochrome b559, alpha (gene psbE) subunit. This family is the lumenal portion of cytochrome b559 alpha chain, matches to this family should be accompanied by a match to the pfam00283 family also. The Prosite pattern pattern matches the transmembrane region of the cytochrome b559 alpha and beta subunits." "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "Synechococcaceae(0.17);Microcoleaceae(0.09);Aphanothecaceae(0.09);Prochloraceae(0.06);Phaeodactylaceae(0.03);" "Synechococcus(0.17);Prochlorococcus(0.06);Stanieria(0.03);Acaryochloris(0.03);Selaginella(0.03);"
+"ds2020-267_42" "575" "pfam00283" "gnl|CDD|365999" "1.54942e-08" "79" "165" "1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-267_42" "575" "pfam00283" "gnl|CDD|365999" "2.95472e-07" "325" "411" "1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-267_427" no_hit
+"ds2020-267_428" "235" "pfam00164" "gnl|CDD|333891" "1.04166e-24" "3" "182" "3" "pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes." "Bacteria(0.45);Eukaryota(0.27);Archaea(0.27);" "(1.00);" "Thermococcaceae(0.09);Micrococcaceae(0.09);Enterobacteriaceae(0.09);Thermaceae(0.09);Muridae(0.09);" "Thermococcus(0.09);Saccharomyces(0.09);Rickettsia(0.09);Synechococcus(0.09);Thermus(0.09);"
+"ds2020-267_436" no_hit
+"ds2020-267_438" no_hit
+"ds2020-267_444" no_hit
+"ds2020-267_457" no_hit
+"ds2020-267_466" "230" "pfam00072" "gnl|CDD|333815" "5.42419e-08" "50" "208" "2" "pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain." "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "Enterobacteriaceae(0.38);Bacillaceae(0.13);Pseudomonadaceae(0.10);Rhodobacteraceae(0.08);Saccharomycetaceae(0.04);" "Escherichia(0.21);Bacillus(0.13);Salmonella(0.12);Pseudomonas(0.10);Rhodobacter(0.06);"
+"ds2020-267_471" "230" "pfam00201" "gnl|CDD|278624" "3.12575e-07" "46" "210" "1" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-267_486" "228" "pfam17035" "gnl|CDD|374956" "5.12677e-09" "108" "203" "3" "pfam17035, BET, Bromodomain extra-terminal - transcription regulation. The BET, or bromodomain extra-terminal domain, is found on bromodomain proteins that play key roles in development, cancer progression and virus-host pathogenesis. It interacts with NSD3, JMJD6, CHD4, GLTSCR1, and ATAD5 all of which are shown to impart a pTEFb-independent transcriptional activation function on the bromodomain proteins." "Eukaryota(1.00);" "(1.00);" "(0.06);Poaceae(0.05);Brassicaceae(0.05);Saccharomycetaceae(0.05);Musaceae(0.05);" "Musa(0.05);Glycine(0.03);Populus(0.03);Ichthyophthirius(0.03);Arabidopsis(0.03);"
+"ds2020-267_5" no_hit
+"ds2020-267_504" no_hit
+"ds2020-267_506" "226" "pfam05173" "gnl|CDD|377479" "2.45773e-17" "93" "215" "-3" "pfam05173, DapB_C, Dihydrodipicolinate reductase, C-terminus. Dihydrodipicolinate reductase (DapB) reduces the alpha,beta-unsaturated cyclic imine, dihydro-dipicolinate. This reaction is the second committed step in the biosynthesis of L-lysine and its precursor meso-diaminopimelate, which are critical for both protein and cell wall biosynthesis. The C-terminal domain of DapB has been proposed to be the substrate- binding domain." "Bacteria(0.89);Archaea(0.07);Eukaryota(0.04);" "(1.00);" "Clostridiaceae(0.07);(0.06);Flavobacteriaceae(0.04);Lachnospiraceae(0.03);Ruminococcaceae(0.03);" "Clostridium(0.06);(0.04);Prevotella(0.02);Eubacterium(0.02);Ruminococcus(0.01);"
+"ds2020-267_516" no_hit
+"ds2020-267_529" "224" "pfam00510" "gnl|CDD|366140" "6.14777e-23" "35" "211" "2" "pfam00510, COX3, Cytochrome c oxidase subunit III. " "Eukaryota(1.00);" "(1.00);" "Culicidae(0.14);Phasianidae(0.14);Rhabditidae(0.14);Schizosaccharomycetaceae(0.14);Saccharomycetaceae(0.14);" "Anopheles(0.14);Schizosaccharomyces(0.14);Caenorhabditis(0.14);Gallus(0.14);Neurospora(0.14);"
+"ds2020-267_550" no_hit
+"ds2020-267_555" "222" "pfam00124" "gnl|CDD|365890" "7.71427e-08" "48" "203" "3" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-267_557" "222" "pfam00421" "gnl|CDD|366090" "3.32623e-20" "12" "200" "-2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_558" "222" "pfam03737" "gnl|CDD|377116" "4.93695e-13" "57" "179" "-2" "pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions." "Bacteria(0.81);Archaea(0.09);Eukaryota(0.09);" "(1.00);" "(0.05);Alcaligenaceae(0.03);Burkholderiaceae(0.03);Saccharomycetaceae(0.03);Streptomycetaceae(0.03);" "Bacillus(0.03);Corynebacterium(0.03);Streptomyces(0.03);(0.03);Advenella(0.02);"
+"ds2020-267_565" "222" "pfam03950" "gnl|CDD|377172" "9.52435e-10" "53" "184" "-3" "pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln)." "Bacteria(0.37);Archaea(0.36);Eukaryota(0.27);" "(1.00);" "(0.07);Thermoproteaceae(0.04);Sulfolobaceae(0.04);Methanobacteriaceae(0.04);Desulfurococcaceae(0.04);" "(0.07);Geobacter(0.02);Caenorhabditis(0.02);Encephalitozoon(0.02);Dictyostelium(0.02);"
+"ds2020-267_571" "221" "pfam00501" "gnl|CDD|366135" "2.61467e-07" "34" "201" "1" "pfam00501, AMP-binding, AMP-binding enzyme. " "Bacteria(0.56);Eukaryota(0.35);Archaea(0.09);" "(1.00);" "Bacillaceae(0.12);Streptomycetaceae(0.10);Mycobacteriaceae(0.09);Rhabditidae(0.09);Brassicaceae(0.07);" "Bacillus(0.12);Streptomyces(0.10);Caenorhabditis(0.09);Mycobacterium(0.07);Archaeoglobus(0.07);"
+"ds2020-267_58" "476" "pfam03641" "gnl|CDD|367590" "7.19579e-14" "142" "315" "-3" "pfam03641, Lysine_decarbox, Possible lysine decarboxylase. The members of this family share a highly conserved motif PGGXGTXXE that is probably functionally important. This family includes proteins annotated as lysine decarboxylases, although the evidence for this is not clear." "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Brassicaceae(0.17);Pseudomonadaceae(0.12);Mycobacteriaceae(0.08);Caulobacteraceae(0.08);Streptomycetaceae(0.08);" "Arabidopsis(0.17);Pseudomonas(0.12);Mesorhizobium(0.08);Caulobacter(0.08);Mycobacterium(0.08);"
+"ds2020-267_589" no_hit
+"ds2020-267_595" "219" "pfam02123" "gnl|CDD|280316" "5.90575e-11" "13" "210" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_597" "219" "pfam00421" "gnl|CDD|366090" "8.10522e-27" "22" "207" "1" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-267_599" "219" "pfam05717" "gnl|CDD|377551" "3.2952e-06" "28" "147" "1" "pfam05717, TnpB_IS66, IS66 Orf2 like protein. This protein is found in insertion sequences related to IS66. The function of these proteins is uncertain, but they are probably essential for transposition." "Bacteria(0.99);" "(1.00);" "(0.07);Burkholderiaceae(0.06);Lachnospiraceae(0.05);Rhizobiaceae(0.05);Bacteroidaceae(0.04);" "(0.06);Bacteroides(0.04);Burkholderia(0.02);Bradyrhizobium(0.02);Sinorhizobium(0.02);"
+"ds2020-267_6" "1860" "pfam02123" "gnl|CDD|280316" "1.35634e-17" "1147" "1764" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-267_610" "218" "pfam17759" "gnl|CDD|380005" "1.47034e-13" "25" "195" "1" "pfam17759, tRNA_synthFbeta, Phenylalanyl tRNA synthetase beta chain CLM domain. This domain corresponds to the catalytic like domain (CLM) in the beta chain of phe tRNA synthetase." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_622" "217" "pfam16363" "gnl|CDD|379835" "2.10592e-11" "29" "157" "2" "pfam16363, GDP_Man_Dehyd, GDP-mannose 4,6 dehydratase. " "Bacteria(0.76);Eukaryota(0.19);Archaea(0.05);" "(1.00);" "(0.05);Flavobacteriaceae(0.05);Paenibacillaceae(0.02);Spirochaetaceae(0.02);Nocardioidaceae(0.02);" "Flavobacterium(0.02);Leptospira(0.01);Paenibacillus(0.01);Plasmodium(0.01);Methylobacterium(0.01);"
+"ds2020-267_636" "217" "pfam13041" "gnl|CDD|372443" "7.94482e-18" "64" "195" "-2" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-267_637" "217" "pfam07026" "gnl|CDD|284449" "1.36077e-13" "47" "172" "2" "pfam07026, DUF1317, Protein of unknown function (DUF1317). This family consists of several hypothetical bacterial and phage proteins of around 60 residues in length. The function of this family is unknown." "Viruses(0.50);Bacteria(0.50);" "Caudovirales(0.50);(0.50);" "Siphoviridae(0.50);Morganellaceae(0.50);" "Photorhabdus(0.50);Lambdavirus(0.50);"
+"ds2020-267_639" "216" "pfam13631" "gnl|CDD|379304" "4.98182e-07" "2" "214" "2" "pfam13631, Cytochrom_B_N_2, Cytochrome b(N-terminal)/b6/petB. " "Bacteria(0.65);Archaea(0.25);Eukaryota(0.10);" "(1.00);" "Mycobacteriaceae(0.15);Thermomonosporaceae(0.10);Sulfolobaceae(0.10);Thermoplasmataceae(0.10);Drosophilidae(0.05);" "Thermomonospora(0.10);Mycobacterium(0.10);Saccharolobus(0.10);Thermoplasma(0.10);Streptomyces(0.05);"
+"ds2020-267_641" "216" "pfam00804" "gnl|CDD|366315" "9.72957e-23" "23" "187" "-3" "pfam00804, Syntaxin, Syntaxin. Syntaxins are the prototype family of SNARE proteins. They usually consist of three main regions - a C-terminal transmembrane region, a central SNARE domain which is characteristic of and conserved in all syntaxins (pfam05739), and an N-terminal domain that is featured in this entry. This domain varies between syntaxin isoforms; in syntaxin 1A it is found as three alpha-helices with a left-handed twist. It may fold back on the SNARE domain to allow the molecule to adopt a 'closed' configuration that prevents formation of the core fusion complex - it thus has an auto-inhibitory role. The function of syntaxins is determined by their localization. They are involved in neuronal exocytosis, ER-Golgi transport and Golgi-endosome transport, for example. They also interact with other proteins as well as those involved in SNARE complexes. These include vesicle coat proteins, Rab GTPases, and tethering factors." "Eukaryota(1.00);" "(1.00);" "Adrianichthyidae(0.08);Tetraodontidae(0.08);Brassicaceae(0.08);Poaceae(0.06);Funariaceae(0.06);" "Oryzias(0.08);Physcomitrella(0.06);Oreochromis(0.06);Selaginella(0.06);Arabidopsis(0.05);"
+"ds2020-267_642" no_hit
+"ds2020-267_643" no_hit
+"ds2020-267_65" "462" "pfam13406" "gnl|CDD|372592" "4.82338e-27" "145" "360" "-1" "pfam13406, SLT_2, Transglycosylase SLT domain. This family is related to the SLT domain pfam01464." "Bacteria(1.00);" "(1.00);" "Rhizobiaceae(0.23);Phyllobacteriaceae(0.08);Chromobacteriaceae(0.08);Methylococcaceae(0.08);Legionellaceae(0.08);" "Sinorhizobium(0.23);Piscirickettsia(0.08);Acinetobacter(0.08);Desulfotalea(0.08);Ruegeria(0.08);"
+"ds2020-267_669" "215" "pfam17862" "gnl|CDD|380037" "4.46873e-06" "33" "122" "-1" "pfam17862, AAA_lid_3, AAA+ lid domain. This entry represents the alpha helical AAA+ lid domain that is found to the C-terminus of AAA domains." "unknown" "unknown" "unknown" "unknown"
+"ds2020-267_685" "214" "pfam09334" "gnl|CDD|370442" "1.80219e-14" "16" "117" "-2" "pfam09334, tRNA-synt_1g, tRNA synthetases class I (M). This family includes methionyl tRNA synthetases." "Bacteria(0.57);Archaea(0.26);Eukaryota(0.17);" "(1.00);" "Erwiniaceae(0.09);Methanocaldococcaceae(0.04);Thermoproteaceae(0.04);Streptomycetaceae(0.04);Methanosarcinaceae(0.04);" "Saccharolobus(0.04);Leptospira(0.04);Wigglesworthia(0.04);Borreliella(0.04);Saccharomyces(0.04);"
+"ds2020-267_692" "214" "pfam00680" "gnl|CDD|366242" "4.79875e-05" "70" "180" "1" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_697" "214" "pfam00378" "gnl|CDD|334046" "5.08319e-08" "45" "170" "-3" "pfam00378, ECH_1, Enoyl-CoA hydratase/isomerase. This family contains a diverse set of enzymes including: enoyl-CoA hydratase, napthoate synthase, carnitate racemase, 3-hydroxybutyryl-CoA dehydratase and dodecanoyl-CoA delta-isomerase." "Bacteria(0.56);Eukaryota(0.44);" "(1.00);" "Bacillaceae(0.33);Hominidae(0.22);Enterobacteriaceae(0.11);Rhabditidae(0.11);Rhodobacteraceae(0.11);" "Bacillus(0.33);Homo(0.22);Rhodobacter(0.11);Escherichia(0.11);Mus(0.11);"
+"ds2020-267_710" no_hit
+"ds2020-267_719" "213" "pfam00072" "gnl|CDD|333815" "9.1657e-13" "45" "185" "-2" "pfam00072, Response_reg, Response regulator receiver domain. This domain receives the signal from the sensor partner in bacterial two-component systems. It is usually found N-terminal to a DNA binding effector domain." "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "Enterobacteriaceae(0.38);Bacillaceae(0.13);Pseudomonadaceae(0.10);Rhodobacteraceae(0.08);Saccharomycetaceae(0.04);" "Escherichia(0.21);Bacillus(0.13);Salmonella(0.12);Pseudomonas(0.10);Rhodobacter(0.06);"
+"ds2020-267_729" "212" "pfam01405" "gnl|CDD|279713" "5.43744e-05" "19" "99" "-3" "pfam01405, PsbT, Photosystem II reaction centre T protein. The exact function of this protein is unknown. It probably consists of a single transmembrane spanning helix. The Chlamydomonas reinhardtii psbT protein appears to be (i) a novel photosystem II subunit and (ii) required for maintaining optimal photosystem II activity under adverse growth conditions." "Bacteria(0.73);Eukaryota(0.27);" "(1.00);" "Synechococcaceae(0.33);Prochloraceae(0.13);Aphanothecaceae(0.07);Chlamydomonadaceae(0.07);Chamaesiphonaceae(0.07);" "Synechococcus(0.33);Prochlorococcus(0.13);Aureococcus(0.07);Geitlerinema(0.07);Rippkaea(0.07);"
+"ds2020-267_746" no_hit
+"ds2020-267_75" "425" "pfam00005" "gnl|CDD|365804" "4.26261e-07" "129" "275" "-1" "pfam00005, ABC_tran, ABC transporter. ABC transporters for a large family of proteins responsible for translocation of a variety of compounds across biological membranes. ABC transporters are the largest family of proteins in many completely sequenced bacteria. ABC transporters are composed of two copies of this domain and two copies of a transmembrane domain pfam00664. These four domains may belong to a single polypeptide as in CFTR, or belong in different polypeptide chains." "Bacteria(0.74);Eukaryota(0.26);" "(1.00);" "Enterobacteriaceae(0.41);Saccharomycetaceae(0.13);Pseudomonadaceae(0.07);Streptococcaceae(0.06);Bacillaceae(0.04);" "Escherichia(0.37);Saccharomyces(0.13);Pseudomonas(0.07);Bacillus(0.04);Lactococcus(0.04);"
+"ds2020-267_750" "211" "pfam02391" "gnl|CDD|376774" "1.24642e-05" "28" "114" "-2" "pfam02391, MoaE, MoaE protein. This family contains the MoaE protein that is involved in biosynthesis of molybdopterin. Molybdopterin, the universal component of the pterin molybdenum cofactors, contains a dithiolene group serving to bind Mo. Addition of the dithiolene sulfurs to a molybdopterin precursor requires the activity of the converting factor. Converting factor contains the MoaE and MoaD proteins." "Bacteria(0.72);Eukaryota(0.21);Archaea(0.07);" "(1.00);" "(0.04);Bacillaceae(0.03);Mycobacteriaceae(0.02);Burkholderiaceae(0.02);Paenibacillaceae(0.02);" "Bacillus(0.02);(0.01);Drosophila(0.01);Paenibacillus(0.01);Mycobacterium(0.01);"
+"ds2020-267_763" no_hit
+"ds2020-267_773" "210" "pfam01641" "gnl|CDD|376583" "5.23903e-34" "16" "174" "1" "pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity." "Bacteria(0.79);Eukaryota(0.16);Archaea(0.05);" "(1.00);" "Flavobacteriaceae(0.05);(0.04);Saccharomycetaceae(0.02);Vibrionaceae(0.01);Spirochaetaceae(0.01);" "(0.02);Mycoplasma(0.01);Vibrio(0.01);Corynebacterium(0.01);"
+"ds2020-267_8" "1703" "pfam00680" "gnl|CDD|366242" "2.85682e-13" "685" "1458" "-3" "pfam00680, RdRP_1, RNA dependent RNA polymerase. " "Viruses(1.00);" "Riboviria(1.00);" "Caliciviridae(0.30);Picornaviridae(0.30);Secoviridae(0.20);Potyviridae(0.20);" "Vesivirus(0.20);Aphthovirus(0.10);Sequivirus(0.10);Bymovirus(0.10);Potyvirus(0.10);"
+"ds2020-267_811" "208" "pfam07991" "gnl|CDD|285265" "1.80927e-08" "20" "190" "-1" "pfam07991, IlvN, Acetohydroxy acid isomeroreductase, NADPH-binding domain. Acetohydroxy acid isomeroreductase catalyzes the conversion of acetohydroxy acids into dihydroxy valerates. This reaction is the second in the synthetic pathway of the essential branched side chain amino acids valine and isoleucine. This N-terminal region of the enzyme carries the binding-site for NADPH. The active-site for enzymatic activity lies in the C-terminal part, IlvC, pfam01450." "Bacteria(0.76);Archaea(0.24);" "(1.00);" "Bacillaceae(0.07);Helicobacteraceae(0.05);Sulfolobaceae(0.05);Bartonellaceae(0.02);Leptospiraceae(0.02);" "Bacillus(0.07);Thermus(0.02);Tropheryma(0.02);Corynebacterium(0.02);Pyrococcus(0.02);"
+"ds2020-267_817" "208" "pfam05656" "gnl|CDD|377540" "3.45664e-06" "86" "190" "-1" "pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function." "Bacteria(1.00);" "(1.00);" "Veillonellaceae(0.07);Sutterellaceae(0.06);Sphingomonadaceae(0.05);Rhodobacteraceae(0.04);Caulobacteraceae(0.04);" "Veillonella(0.04);Sphingomonas(0.04);Asticcacaulis(0.03);Dakarella(0.03);Prevotella(0.03);"
+"ds2020-267_837" "207" "pfam04061" "gnl|CDD|367791" "2.43363e-18" "1" "159" "1" "pfam04061, ORMDL, ORMDL family. Evidence form suggests that ORMDLs are involved in protein folding in the ER. Orm proteins have been identified as negative regulators of sphingolipid synthesis that form a conserved complex with serine palmitoyltransferase, the first and rate-limiting enzyme in sphingolipid production. This novel and conserved protein complex, has been termed the SPOTS complex (serine palmitoyltransferase, Orm1/2, Tsc3, and Sac1)." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.15);Nosematidae(0.04);(0.04);Phaffomycetaceae(0.03);Salpingoecidae(0.03);" "Kazachstania(0.04);Thalassiosira(0.03);Trichomonas(0.03);Nosema(0.03);Nakaseomyces(0.03);"
+"ds2020-267_94" no_hit
+"ds2020-267_97" "380" "pfam04879" "gnl|CDD|368171" "1.9903e-08" "125" "274" "-2" "pfam04879, Molybdop_Fe4S4, Molybdopterin oxidoreductase Fe4S4 domain. This domain is found in formate dehydrogenase H for which the structure is known. This first domain (residues 1 to 60) of Structure 1aa6 is an Fe4S4 cluster just below the protein surface." "Bacteria(0.75);Archaea(0.25);" "(1.00);" "Enterobacteriaceae(0.11);Bacillaceae(0.09);Pseudomonadaceae(0.08);Methanobacteriaceae(0.06);Phyllobacteriaceae(0.06);" "Bacillus(0.09);Escherichia(0.09);Pseudomonas(0.08);Mesorhizobium(0.06);Synechococcus(0.06);"
+"ds2020-267_98" "379" "pfam16203" "gnl|CDD|374428" "1.33948e-30" "131" "280" "-1" "pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases." "Eukaryota(1.00);" "(1.00);" "Cryptosporidiidae(0.06);Vahlkampfiidae(0.06);(0.03);Opisthorchiidae(0.03);Chaetomiaceae(0.03);" "Naegleria(0.06);Cryptosporidium(0.06);Micromonas(0.03);Batrachochytrium(0.03);Caenorhabditis(0.03);"
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s1_tblastx.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s1_tblastx.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,57 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-267_392 26 240 NC_005979 Helminthosporium victoriae 145S virus Helminthosporium victoriae 145S virus 40.0 1 100 6.0 1.12512e-11 66.1329 164750 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Chrysovirus;Helminthosporium victoriae 145S virus CAGCACGTCCGCAAGTTGTCCGGCTTAAATCTTTAGCCCCTAACTTAAGTGCCGCTACAGCTCCATTTTCTATTACTTTTTTTGTTCTATCACATAACCACATTCCTTCGAAGACTGATAGTTGTGAAATTTCATATATGTTGTCTTCATCTAAGTAATATAGAAATTTGAAACTTGGTGTTGCGTCCGTTAAACGTAGATCAGTGAAGTACGCACCCATTCGTAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_268 14 259 NC_001963 Sphaeropsis sapinea RNA virus 1, complete genome Sphaeropsis sapinea RNA virus 1 62.0 1 100 5.0 1.78772e-31 132.115 73497 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Sphaeropsis sapinea RNA virus 1 CAGCACGTCCGCAATGCATGGCCTCTGAGTTTGTGGAAACGAACCCTCTGCCAACCTGGGACGGCACGACCCACGTCTCTAAGTCTGCCAAGTTAGAACACGGGAAGACCCGCGCAATATTCGCCTGCGACACCCGGTCGTATTTTGGGTTTTCGTGGATCCTAGATGCGACCCAACAGGCCTGGAAGAACGAACGGGTTGTCATGGATCCGGGCAAAGGTGGGAAGTGTGGGATGACGCAACGATTGCGGACGTGCTG
+TBLASTX ds2020-267_4 1434 2297 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 44.3 8 100 64.0 1.9240409540575e-07 928.6219 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B CTTCCGATCTATCTAAGGAGCAGCACGTCCGCAATTCAGCTACTCTCAGCACGTCCGCAATACTAACAGCTCAGCGCGTCCGCAACACGACTGGGGCACACGTCCGCAACGTCCACGACTTATCACTTGCGGACGTGCTGCTCCTTAGATTCTGGAAGTAAGGACGTTCGGGCTTCCTATTCCGCTTTATTAAGGTACACTAAGTAACTATTCCTATTAACTCCATCGGGTCCTTAGATCCTTTGAGTAGGTGTAGTAGTGGGCCGCTTTTATTGGTCCCATTCAACACGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCTTCTTTGTGTACCTTGAATAACGCTCGCAAAATCTCGTACCGCTTGATGTTACCATTCCTTGAAACGTTTATGTTCCTTTCTTTTGGTATCACCGCGTCGTATGTTGCGCGCATTATTCGTGAAATGAAATCCTGCAAAGGTCTTTCAAGTTGTAGTGATGCTTTCACCATCCTGGAGTAGTCCACCACTCCCGGTAACACGCCTATCTGCGTGGCACCCTTCCTGAAGCCCGACGACCGTATCATCCACTTTACGTCCGATCTCTTGTCTTCACTTATGCCCCCCACACACCTGTGGGAGGTCTTTATTTTATAACAGTCTGAAACTGTCATGTGCAATCGCTCACATTGTCTCGAGTAGTATTTGTTCCTCAATGACGCCGCTAACCACATTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGATCTACGCGTAGAAACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTTGTGGAGGCTGTTTTGCGATTGTACCACGTCAGGTACTATCAGTTGAGTGTAAATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTGCTCCATTCATACTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTCGCGCCACGAGTCCATATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAGGTATAT
GTCTTTGAATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATGCTGCCGGCCGCACTCCACTGCCACCTACTCTGCCAGTACTCCCGCCAATCAAACTTCCTCGGTCTCTTACCCGCTGAGATCGATCTACTGAAGAGCTGCGAGGCCCTTTCATAAACCAATCCCTCCGGCATCTCGGCCAAGTTAGGGGACACCCTGTTCTTGTGCTCCTCCTCCCAGTTGACCAGTCTTGATTTGCGGACGTGCTGCTCCTTAGATANNNNNNNNNNGGACGTTCGGGCTTTGCGCTGGCAATGGAGAACAGTCCTGACCCTCTAGCGAGCTGCATCTCCTCGGGGGTGAGACCAGCTGCCCACAGTGCCACGCCCGTAAGGAATGAGTTAGTAGCTTCTCTGGTTATTGATAAGGCCAGAGCTACGCTGTCAGAGTTGACTCCCAAAATGTCTACCACCTCCTTGAACGAAAAGTGAACATGATGCGACGCCGTTATCTTGGTGTGTTTTGCCGACATTGCTTCATGTAACTGCCACCCTCTGCCTTGCTGTCCATTTACTTTCCTCAATAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATCGTAAAGACCTGAGGTGTGCCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCAAGATCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_18 840 1037 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 27.1 2 100 15.0 2.0868e-13 98.9223 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAAAGTGAAGCCGGTAAGAGGTCAGGCGACGTTGGCCAGAGCAAGGCTATGGCTGCAGGTGACATAGGGAGAGTTGACGCAATGGTGATTGCGTCACAGACAAGCTGGTGGCACCCTGGCGTGACTATGTGGATTGCAGCCTACAAGCTAGCCGTAGCAATACTGGCTAGCGCCAAAACTCTGATGATGACCGAGAAGGAGATAGAGGCTCTTATCAACTACACGTTCACAAGGACCACGTACAGGAAACTAGTAGCCAGCAACGCGCTAATGGATTCTACGAGAGACATAGCAGCCAGTGAGGTGACCCAAGCAGCATCAACCCCAGTCAGGTGGGAGAGGCAGGTGCACCCAATAGTCCTAGTACTAGACGATGCAGAGTACTCGATTACAAGAAAGACAGCTAGTGCAGAAATCACTAGCGTGTACGACAAAGTGCACTCGCACATGGCGCTAAGCCTTGGGTCTCTCTACGGTGACATGGCGCACACTAGGATGAAGCAGCCAAATAGGATTGGCACTGGTTTGTTGGCAAAATCAGGCAGGGCACAAAGGGCAAGTCCAGTTTTTGCCAAACTGAGATTGACTGATAACACAGTGACAGTTACGGCGTGCCCTACATCAGACTCAGACGCAGTACTGATGTCGATAAGCAAAGGCATTGAAAAGGCTGGCCTACACAACGTTACGCTGGGAAATGAAGTGGTGAAAGTTGTGAGGAAGCCTGAGTACGGCATGACACTGACGTACCTGATACCTTCGACAATCAGTGGGAAAGGTGCTGACAAGTCATATGTCTATTTGGCTGGCATGCACTTCAGGGAGGACGATCTAACGTACTCTTTGCCTACGCTAGAGTTCTTGTCGCAGTTCACGACAGAATATGAACCGGTCAAGCCTGACAAGCGGCAAAAGATGTTTCGCCTGCTAGTAGACCCAGTGACGACAAGGGTCCACCACAGGCACATGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGGCACTTGCGGACGTGCTG
+TBLASTX ds2020-267_699 10 214 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 61.5 1 100 7.0 1.87612e-16 81.712 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACTTGTCTCCTAAATTAGCAAGATCGCGCGTTCACCCTTTTGTTTCAAGCAGGTTGCTTAGTTATGGTGATAACCAAATTGTTAGCGAAGAGTTGTTTGTATCCGTCGGGTTACGCTATGACCCGGAAAAACATGCACAGCATCTGGCCAGATTTGGTATGACCCTAAAAATTGACGAAACTGAAGTGACTATATATTGCGGACGTGCTG
+TBLASTX ds2020-267_595 10 219 NC_038928 Aspergillus foetidus slow virus 1 CP gene and RdRp gene, genomic RNA Aspergillus foetidus slow virus 1 51.2 2 100 7.0 1.97993e-05 142.3464 1087070 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Aspergillus foetidus slow virus 1 CAGCACGTCCGCAACAATGCGTATCTGAGGGCGGCCGTAGGGAAGACCTGGTACGAGGGTGCGCTATCGCTGCACACAGGCGACGATGTCTTTATCAGGGCGAACACCCTCGCCGACTGTTCCGTCATTCTCAGTGATGCGGTTGCCTTCGGATGCCGTATGAACCCAACCAAACAGTCAATCGGATTCTACAATCGACTAGCCTTGCGGACGTGCTGA
+TBLASTX ds2020-267_512 12 225
+TBLASTX ds2020-267_10 16208 1619 NC_038825 Flammulina velutipes browning virus CP1 gene for coat protein, complete cds Flammulina velutipes browning virus 35.1 2 100 30.0 3.63103e-21 125.3928 568090 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Flammulina velutipes browning virus CAGCACGTCCGCAATTTGGGTGGTCTGTTGAGACCATTAGATTGTTTCATTGCGTGTTGAACGCATTGCGACAGAAACAGTTGAGTGGGGCTTAAAGTAGAAAAAAAGCAAACAACAATGGAAGGTCGTTCAGTAAAAAGAAATTAGAAAACAGAAAAAGAGAAAAACTCGGGGGTGTCGCGAGAATTTGCGCTTCTCTATTCAAATCTGAGTGCGGAGGGGGTGTGGTAGTAGCCGGAAATCAACGGTGCAATGGTGTTGCTGACGTTGTATTGCGAAGTTCGACGACTATCGGGAATACTGAAGATTGGTCCGACGTGGGTTGACTTAAAGTCAGGGCCAGAAGTGTCGGTGACATCTTTGTTGATGTCAGTCCAATCGGAGTTGAGCTGAGTGAGGATGCCGGCCTGTTCAGTGACTAGGTCGAGAAACTCTTCAGAGTGGAGGTGGATCGTAGTGATTCCAGTAAATTCTGGAATATCATACCGGAGCGTGGAACCGGTCTGATAACGGACTTTGCGCGTGGTAACGGCATGAACAAGAATGTTCTTGTTTTGCCTAGTAGCCACGTACTTTGTACGTACATAGGAGATCCCAGTGCCAGTAGTGGTCACGGAGCCAAGGGAAACAGTGTCCTTGAAGAAATCACTGTAAGGCTGCATGACGCGGATGACTTGAGCAAACCAACCGTAAGGTCGGTCAGCATGATTGCCGATGCCGCGAAAACCGAAGACCTGGTCGAGGTCGAGGGTATCGTCGTCGTCGGAGATGACATATTGACTGTCACCGTCATTGGCGAAGGGGAGGGTGTTGCGCCACACGTTGGATGAGGTGGCGAGGCCGTTGAGGAGACCAACAGTGGTCTGGAAGTCGGACCGAGCACTAGGCGTAAGCATAGCAAAACGGGTCGCTTCGTCCTTGGAGGCGGGGGCGCCGAAGATCGTCGTATAGACGGTATCCGTGTGGGAAGCATTGGCTTGGACTGGGCCAGAGTTGACAGGCGAGATCAGGGAGATCAATCGCATGAACTGATCAAGAATGAAGATCACATTCGGGAGAATGGTGTGAACTTTGTCTTGCCAGAGGAAACTGGTGCAGTTGATGTCATGGGCATTGGGTATGCCAAAGACAAGATTGCCAAAATTTTCGTTGGGGCCAGCGTTGGCGGCGAGAGACTGGAAGAAGATGGCGACAGGGCCAGGGATCTTCAAGTGTTCGGCCTTGAATTGGCTGTCGAGAAACTCGACAAACAAACGTTGATCGTTGGTGATCATACCACCGTGAGATTGGTTCTTGAGAACCTGGTAGTAGAACAACACAGCGATGTAAAGCTGGGAGACGAAAGGGTGCCAGTCAGGGTTGGCGTCGGTGAAACGCTTGGTTCTGACCATCTGCGTGTCCATGATAGACAGGACGTAGAAGAGCTGAGTGGTGTCAGGCACGACATAGGATATGTCATTGTGCTTGATGCCGAAGAAGGGGAGGTCGGAGACGCCTGATAGCATCATTGAGAGACCCGGGTTCTTGGGGCCAGCGGAGCTTGCAGTGGGTTCGCGAGGGGCGAAACTCTTCTGCTTCTTGGCAGGAACCGAGTATTGCGGACGTGCTGCTCCTTAGAT
+TBLASTX ds2020-267_29 426 726
+TBLASTX ds2020-267_235 16 267
+TBLASTX ds2020-267_177 50 290 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 90.4 3 100 13.0 5.317733333334419e-40 575.046 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F AAGCCCACTATTTCAAACTTTGCTTTTGCTACACTTCTTTGCTCTCTTGACCATCTGTGTTTATTCCCAATGGCTTTTCCCCTGTTTGTTGATACCTATGAGCATGTTGCAAAACATGACAAGAAATATTATGGATCTTTCCCAGCCACCTTCACTTTGGTTGCTGGAGGTGGGGTGATTGATCTTGAGAAAATGTTTTCTGGAGTCCGCAAACTAAAGCGCCATTTGACGCTACACCGAATGTTTGCGGGCTGTGTTCTGGGCACAGAAGCTGCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_444 10 233 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 68.5 1 100 7.0 1.4637e-19 92.2508 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACGTCCGCAATGTGGCAACCGTGTACGACGTTTCCGATGACACCCTGTCTATCAAGTGCCCCAGTATCAGCATATTATTGGCGTTTGTGTTGATAAGGGACGTGTAATAGGAACCACTCGGCATCGTCCCAAAAAGGTTGACAAGGTACCCCGAAGGATGCTCAAGAAGCTTCTTGAGAAGCTGGCGCTTTGACACAGATGACATAGCCTAACGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_441 2 234 NC_006961 Pleurotus ostreatus virus 1 RNA-1, complete genome Pleurotus ostreatus virus 1 36.2 1 100 9.0 6.11518e-09 56.9688 674983 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Betapartitivirus;Pleurotus ostreatus virus 1 CAGCACGTCCGCAAGTTGAGTTCAGTGGTGTAAACGAGTTGTCCAGTGTGGTAACGGTAAGGGAGTACAGTAATGCCAGGTTGTGGAAATCTGTTGTTTGGAAGTTCGTTGTCGTCTAAGTGACGATAAAATTCGAAGGGTTCGTTACGGTCAATGTTCGCTTGAGTGTAGCGTTCATATGTTTGAGAGAAGGTGTGTTCGTATTCTGATGTGCGATGACTTGCGGACGTTCTG
+TBLASTX ds2020-267_7 1414 1772 NC_033486 Wuhan fly virus 5 strain fly34516 segment Seg 2 hypothetical protein gene, complete cds Wuhan fly virus 5 28.4 1 100 15.0 9.16869e-08 56.9688 1923699 Viruses;Wuhan fly virus 5 CAGCACGTCCGCAAAGTTCGCTCTCTTCATTGAGCTAATTGGTTAAAAGTCTACTTGTTAAGTAGCATTCACATCAAGGAAAGAATTTCGTCAAAATGGCATACCAAAAGCCCGACAAATCGACCGTCTCCGGCACGACTCTTACGCCAGATGACTCAGCCTCACAAGCTGGTCCACAAAATGATACCCCCAATCCTGCGAAGTCCGGACGCCCAAAGCGTTCATCAAAGATTTCAAAGGGCAAAGATCTACCTCCGGGTGCGATCAAGGTACCAAAAGGTGGCGCCAACATGACGGGGAAAGCATCTCCCGTACAGTCTGCAACCATTCCATTTCGGGATGGGGAGAAATAGACCTCAACTCTCATAGAAATGAGATTGAGCCGGTCTTCACAGTCGACGCTCAGCCGTATGACGACCTTGTCAACGTGGTGTACTCATCACTTCAGTCGCGATACTCAAATGCGGCGAAGCACATCCCGTTTGGCCTCTTCCGCTACTACTGCATGCAATTGTGGTGGTATCGGGTTCTTTTTCTGCATCGCACGAACGGCAATGCTCTCACATCTGACGAACGTCAGTTCATGAGCATCATGGAGACTGGACAAGAGTTCCAAATCCCCTCCCAAATAGCACAGTATCTTGCCAACCTTGGCAATTTCATGCAAGGAGGAGAGAACTTCTTTTTCCGCCTGCCCCCACACGCCTTCGCCGAAGCAACAGGCACTATCCACTCAGGATGGTTTGCCTCTGGTCTTCCCACCGCCAAGGTGGACACAACTTCCTTCTGGAAGTACGCTCAACTTCCGAGTCCGGGCGTTTTCGTGTCCTATATGTGCAACGAAGCACATTACAACACCCCTGGCCACCAGCCCAATCGTCTCTTCGATCTCTCAGAGATCGCCCCCACCATTTCCGACGACAGTTATTCAGTTCCGACTGATAACATCGTTGGTTGGAGTAACGGCATTTACACTGCCACGCACGCCTCCTGGCGTTCGACATACTCCAATCTTGGCTGGTCAATCGACGGTTGTGCCCTTGACTCTCAGACAACATTCATGCTCTCGACATCGACCATGCGTGCCGTGTCTGACCGTATTGCGTCCGTCACCGGACTCAAAGTGAACACGTCAACACAGTTGACACTCTCTGTGCAAGGCAATCCCCTGGATTGCTACTACCTTGCAACTGTGGACTACGCCTCCAACCGCTCTCAGTGGCCAAAGGCACCTGGTCCTCATCAACAACAGAAAGTGAACGGCTGTTTGCACACAGAACTCGCCCTCCACTCCCGCTACGCCATGGACTCAAAAGTCCTATCACCCGCGTTCTCGTTCGGATATCGCCTAGAGCGATCGCTCATCTGGAACGGTACATACGATACCGACAGACGTCCGGTCCACGCTCAGGCCAGCAACTATCAGCCCTGGCTGATACAGTCTGAAGCCGACGACAAATACCGCGATCCTGGCCCCGCATGGATGGCCCATATGAACGATTCGTTCAATTTTGGTTCTTCATTGAACTTGAATTTACGACGATTTTCGACTCATGGCCTCATTCGTTCTGTCGCGCTTGACGCGTCCGTTGTCCTCAGTGACACCAAGTAGAAACTTCTTCTTCTACTACAGCAACTCTCTCTCTTGGTAAAGCTCACTGGTAACCGGTCCAAAACGAAACTCTTAAAACAGTGGATACCCTCCGGGGCGCACGTCCGCAAGGGTCCGGCAGTTGCGGACGTGCTACCCAAAGACCTTTGCGGACGTGCTG
+TBLASTX ds2020-267_692 5 214 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 67.4 3 100 9.0 7.700429233333334e-12 283.7636 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F GACGCACTGACCGTCTATGGGGCTGGGTGTAATGAAATTGTTGGGGAGTGGAAAGATGCCTCTCCACATTTCACATTTGAAGATGCCACTTTGGATGAGGCTATTAATGGTGTTGAAGACTTGGATTACTTTGACTCCCTTGTGATCGGAACTTCGGAAGGCTATCCCTATGTTCTTGAGAGGGAGACAAATCAGAAAGGTAAGTCGCGATATT
+TBLASTX ds2020-267_496 273 227 NC_038824 Carrot cryptic virus segment RNA 1 RNA-dependent RNA polymerase gene, complete cds Carrot cryptic virus 47.8 1 100 10.0 1.27723e-14 75.7553 589918 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Carrot cryptic virus CAGCAGGTCCGCAACGTCGGTTTTGTGTCCGTATCGGCGGTGCCAATCGGTTGCGAGGGGTGTGTAGAGCGATTCGAGTCGGTCAAACACTGCGCGGAAGGTTGTTCGATTCGCTAAGAAATAGGAATCGGTGGCGAAGGGGGCTTCAGCGTTCACGTGCCATTTATATGGGTAGTGGGGCTGCACATCATAGATGTGGGCAGGTCGTCAATTTTGCGGACGTGCTG
+TBLASTX ds2020-267_40 385 586 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 38.7 1 100 7.0 9.86751e-21 98.2075 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B TCTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCTCGCTACCTGTACTTGCAAGCCCCTACTGCTGGTTGGCTGAATGAGAATGATATAGTTTCCCCTTCCATCGTAAGCACGTGCGGTAAGGGGAAAGATCGTCCAGTTCGTTCCTCAGAATCACATACCCTGACGGCAGCCCCCGGAATAACAGTGTCAAATACTGACTCGGGTGCGATTATACATTCTCTCACGTTACAGTAGGGCGTAAAAAGACCCCTTGAACTTAGGTCTTCGAACACCACTTCGTGCCCGAAGACTCTGTAAGCGTTTGCTAGTCGCAAGGCATCTCTAGGCTCCATGACGAAATCATCACCAATAGGTATAGACTGCATCCCTGTCAAATGTGAAATCCCGTCGTACCCATCAACCACACAACCCGCTAACAATGCTCCCGAGACGTAAACAGGTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAATCCGGTATCCCTCAGCACGTCCGCAACTGATAGCTACTCAGCACGTCCCAACAGTCAACCCCTTGCGGACGTGCTG
+TBLASTX ds2020-267_526 4 225
+TBLASTX ds2020-267_305 14 253
+TBLASTX ds2020-267_204 13 279 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 35.8 1 100 8.0 1.7348e-05 45.9718 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 CAGCACGTCCGCAATTGGATACCGGTCATTCACTGAATTCGTTGATAGAGTAGGCGGTGTGTCAAGGTACGGAGCACATTTTTACGTCGATCACCACGTGTTTGCATCTTCATTTGAGGAGGGCCACGTCCTTGGCGATGTTGTAGAAGAAGAGGACTATAACGCAGCAACCATTTGCGGACGTTACGCGTCGGACATAACCTTTTCCTGCGAGTCAGAAACGCCAGATTTTGAATTGGTAGCAAGATTTCTGTCGTCGGAAGCTGCGGACGTGCTGAG
+TBLASTX ds2020-267_419 16 236
+TBLASTX ds2020-267_130 45 330 NC_006937 Fusarium graminearum dsRNA mycovirus-1, complete genome Little cherry virus 2 52.4 2 100 8.0 1.496345e-12 249.1092 154339 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Closteroviridae;Ampelovirus;Little cherry virus 2 CAGCACGTCCGCAACTGCAAATGGATAGACTCCAAGGTCCGAACTGTAATTGGTTCTCCTATAACCCAGTATATAATGAGCACCATATGGAATTATGGTCCCAATCACAACTTTGCTTGGGAGACCACACCCATCAAAGTGGGCATGCCACTAAATGGGTTTTGGCTGTCCAAGTTGTTCTCTAAACATGCCAGGTGCCAAATGCACATTGAGGGTGACTTTGAAGCTTTTGACTCAACCATCTCCGGGTCCGTTGTTGACCTTATTAAGGATGTGAGGAAGAAAGGGTATGAAATGCATAGAGACAGGGCTTCAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_27 60 729 NC_006937 Fusarium graminearum dsRNA mycovirus-1, complete genome Little cherry virus 2 47.7 3 100 5.0 1.29455e-22 141.58100000000002 154339 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Closteroviridae;Ampelovirus;Little cherry virus 2 ACAGCACGTCCGCAATTGATGCAGTTTCAACCTCGGCCCAGGCCTTTGTAGGGTTTGGTGGAGGCTTTGCCTCTTGAGTTTCATTGTGTTTTACATGCCGACGCAGTTTTTGATGCCTGTGGTGGAGTTTTTGATACAGGTCTTTGCCACCCTTACTACTCGAGGGTTCTGGCCTGACCATAATGACTCTGGTGGGTCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTGTTGCCTTCATTGATGAGTTGGGATTGCCTCACTATCTACGATCCTACACCCCTGTGGAAATGACTAAACAGGCCCTGGACAAGTCTCTGTCTCTAATGGCTGAAGTCGGGTGGCCAGTGAATGTGGCCACGGATGAGAGGGTTGATCCCATTGCGGAACGCATGGGATTCAAAGAGTGGGTCCTTTGTGGACGTGCTGNNNNNNNNNNCATTTGTAGAGTGGCTTGTCTGGAGATTCACTTGGGTCGTTGTCAACGCGACCGCTGTTGCTGAGTCTGTCAATGCCGAAGTCCGCAAGAGGCACAGTGACAAAATATCACCAGACTCTGTCCGTCTTGCAGCAATTTTCAGGAGTTTCTTCATTCAGGGTG
+TBLASTX ds2020-267_51 94 500 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 54.8 1 100 5.0 4.95153e-19 92.2508 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A CAGCACGTCCGCAAGGAATTCCCCCTCAGCACGTCCGCAACGTATGCCCATCAGCACGTCCCAAACCCAACCCAATTTGCGGACGTGCTGCTCCTTAGATACGCTTAAGGCGACGCACTGACCGTCGAGAAGCAACTAACTCGTTCCTAACGGGTGTGGCGCTGTGGGCGGCTGGCCTCACTGATGACGAGATGATGCTTGCTAGGGGGTCAGGGCTGTTCTCCCTCGCAAGCGTCAAGGATTACAAGCGCGAAGCTAAGCGCATAAGCGTGGAAGCAAAATCTCTACAAAACTTGGTAGATGTGGACTTGAGAAAGTTCTTCGAACTAGAGGTGCTAGTCAATAGGGGACACGACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAAAGACCTGAGTTTATTGCGACGTGCTGAGGGACTCGAGTTTGCGGACGTGCTGAGACGTAAACATTGCGGACGTGCTGCGCCTTAGATAGAGCGGA
+TBLASTX ds2020-267_9 1360 1660 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 33.7 6 100 35.0 5.95825e-14 361.9737 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 TATCTAAGGAGCAGCACGTCCGCAAGCCACGTACGGTGAAAAGAGAGCAGTCGCGCCTGGCGACTTGGGCTTGGTGGACTCGCTTGTGGTGAAGTCACAGATTGATTGGTGGCATTGCAATGTCACTATGTGGGTGGCCGCTTACAAGTTGTCTGTGACGCTAGCTGCATCGTGTGGTGACATGAACTTCAGTGGTGAGGAAGTTAATGAGATCATACAGTACACGTTCAGCCGCTCAACATACAGGAAGCTCGTAGCGAGCGACGCGGTGATGGACTCGACTAGAGACATTGCAGCAAGTGAGGTGACGCAGGCAGCGTCAACGCCAGTCAGGTGGGCTAGGCAAGTGAACCCAATCGTGCTGGTGCTCGACGATGTCGAGTACGCCATCACACGCAACGAAGTTAATGATGTCTTGACAAAGGTATACGATAAGGTACACGCTGCAATCATGAAACAAGCTGGAAAAGGTTACGGTGACTACAACAGTACTGGGCTTGAGCTGGTCTACAGCGAGGAGACAGGGCTATCAGCAGGTGAAACTCCGAGAGGGGTTTTGAACCCGGTTTTTGGTTACGCAAAGCTGGCAAATGGCGCAATAACTGTGGAGCCATGCAAGTGCGCAGACTCAAACGCCGTACTCATGACGATGAGTGAAGGTGAGCAAAAACCAGGGCTGAGTGAGGTGTCAATCGGCAGCGAATCAGTCAAGGTAGTTAAACGAAACAGAGGCGGAAGGACTTTGACCTATCTGATGCCAGAGACGATAAGCGGCATGGGGGCAGACAGGTCATATGTCTATCTTGCGGGGATGCACTTCAGAGAGGATGAGCTCAAGTACTCACTGCCAACCCTGGAGTTCCTGTCACAGTTCACAACAAAGTACAAACCACTACAGCCGTCAGAAAGGTTGAGCAAGCTACGAGTGCTAACCGATCCAACTTCAACGCGAGTGCACCACAGGCACATGTCTATGTTGACCGTGATGGCGACTTGCTGTCATGCGTGGGCTCCGTGCATGGACACAGTGTTAGATTGGCCTGACATCACGAACACGTTTATGTCAGCGCTAATGCTAACGATGGCTGCAGTGCCACCTGAACTGTATGTGCTCATGTGTGAATGGAACGGGTGGGCCAGCTGCAAAAGCATGGCAGAGTACGTAGTGACTGCGAAAGAACTTACAACAAAGATGAAAGCTCTAGACAACCAGGTGGCAATCGGCGATTTTGAGCTGGACCTGTCGCCACTGTTTGAGTGGGAGGTGTTGAATCACAGAGCTGTGACAAAAGGCATCTACGACAAGGAGCTAATCGAAAGACGTGATGCAATGCAAAGCATTAAGCTCACGCCAGAGCAGCTCAGGCCGCACATCGATAGTGTATTCAGGGACATCAGTGCGATACTAGACAAGCGCACAAAGCATGGTGAGAAGTCGCCGATTTTTGCAAATTGGGACGATTGGTATGCTGATAGGGTGCAGGCAACACCTGCGGGATCAGCATTCACAGTCGAGGAGTCTCTTTTGCAGGCAAGACAAGTCTTAAAAGATAACGGCGTGCAGAACCTGACAAAGACACAAGTCATGGCGCAAATGCAGGATGGATTAAAACTGGATACTCTACTCAGTCATGAGCCAGACATCATTGCGGACGTGCTG
+TBLASTX ds2020-267_615 4 218 NC_039078 Prunus virus F isolate 8816-s1 segment RNA2 polyprotein 2 gene, complete cds Prunus virus F 66.3 3 100 15.0 1.3506373333333334e-12 273.5446 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F CAGCACGTCCGCAAGTTCATCGGGATGTGTATAGTGATAGGATCACTCGATTCATGCGTCTTGGTTGGCAGGGGCTGGTTGGAAACACAGCAACAACCACACGCATCGAGAATGCAGAATTGACCACACTTGGTGGTAATCATGTCGTTGACGTTCCCGTTCCTTTTTTATGAACGGAAGCTACGACTACAAACCCAGTTGGAATTGCGGACGTGCTG
+TBLASTX ds2020-267_482 16 228
+TBLASTX ds2020-267_184 26 288
+TBLASTX ds2020-267_8 3373 1703 NC_028469 Penicillium aurantiogriseum partiti-like virus 66 kDa protein gene, complete cds Penicillium aurantiogriseum partiti-like virus 47.7 7 100 100 1.2504600000000032e-13 1057.2269000000001 1755781 Viruses;Penicillium aurantiogriseum partiti-like virus CAGCACGTCCGCAAACTGGGGTGTCTGGTATGGTAACTTCTGTTTTTTGTTACTGATATGTCAATCAGTAAAGAACGCTTCCTCGAGGTGGAGTTCCGAATAGAGGGGCCGTGTTTCTTGATATTTTTCGAAATCAGAAAAAGAACGTTGGCGTAGTGCTCTGTTGGAATAAGCCTCGGGTATGAACGCGTACTCGGGTAGGTTTCTATCTCTTCTTGAGATGAATTTCCGTGGCGAGGGTTGAGGTAGTAGCGCAGGGAAGAAAAATCCGCCGAAAGGATCGGTTTGTCGGATGGGAAGTGTGATTTCCTTCATCTCGAGACCGAGAGTGGAGAGATATTTGAATGCCTTTGAAGGCTTCTCTGCCACGTAGGCGTTGAGGGTTTTCTCTTGTATGCCGTTGGTGCTCATGATGTGTTTGATCGCATCATAGAATACATTGCATAGTTTTGGATCCATGCAGGAGTAGAGCTGTCCAAGTAGGCGTGCGCATGACTCGAGTGGTGAGTCAACTGGGCGTTCCGGGTAGATGGTGGAAGCGAAGATGAAGTCGTATGACCTTCGCGGTCCGGTAACTCGGTGGAAGTATCCGAGCCAGTGTATATTCTCAGGGTTATTACTGAGAATCGTCTTGTCCAGGTTAAGAATGCCATTGAAAACATCCTTTAAAACAACACCAAGTTCGACGAGATCAATCGGTCTATCTAGAAAGATGGACGAATCATCTCCGTAGTAGTAGTCCTTAACGGGTAAGGCTCCAGTGACTCGGTAGATGGCAGTACGCATTTGCACTGCGTTGACGATTGTGTCGAGAAGGTTGGTCCACATTGAACCAGATGGGATGCCAGTGCTCTTTTGTACTCGGAGACCGCGGGGTGTGCGTATCTTCGTGTTGATGAAGTAAGAGACCATGGCTTTCCATCGTCGTGCTGTTTGGTCTGAACGGACGTTCCATACTATCCCTTCAGAATCTCTGACTTTTGAAAAGTCAAACCAATCAGAAATGAACGAGAATGTGTCTCGTATTATCCAATGGGTAACATTGGCGTCGAAGCGTGAAAAGTCGGTGGTGAGGGAAACGATATTGTCGATCATGCTCCTCGCAAGATGCGAGTGGCCTGACTTCATTGTTTCCATTCCGATGCCGTAGCACGCGTCCTCTCTGTTGCAGAGTTCCTTCAATTCTGAGAAAAGAGGAATGAAGAAGCGGGCCTCTTCAAGGATGACATCAGTTGGGTAACCCCAAACTGGACGTACTTTGACATTCGGTTGCTCACTTGCGACAACCCTGTTGAAAGCAAGGCAGTCGGGCAGCGACCATGGGATTCCTCTTCCGATACTATCCCAAGCCCGATGTATCTTTCCGGTGGCAACTGGGTCTGCGAAGACCTCAGCTTTTGTCTTGTATCCTTGGTTGACCCAAGGGAAGCCGGGAGATGTCGTGGTGGGCATTGCGGAGTGCTTGGCAGCAGCTCCGAGGGTTAGCGGTATGATACGGTTAGCGGGGCGAAGTTCATCGAGTGTTTTCTTGATAATCGCAAGATAGTCACCATCAACACACCGGGTGGTGGGTCGTTGGTCGTAATCCATGAGATTATCTTCGAGAACCGACTGGTCCGCGGACGGACGGTGCCATGTCGATGAGATGTTGCTAATGAAGTCACAGAGATCCGGAGAACCTGTCAATAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_316 18 251 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 63.2 1 100 5.0 2.97582e-26 114.703 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GACGCACTGACCTTTGTCACCACGTTTGTGATCAACGCGTAGAAACTCAGCTATTGCACCGAATGCGCACTTAGAGGGCTGCGTTCGTATGCAAAGCCTTTGTCCTCTCTGGAGTGTGAAACGAGTTATTTCCAGTGACGTCGTCCCTAGAAGCACATCGTCACCGTTGTGCAGTGAAGAGCCGACTTCTTTCATCGGACCCAACATGAAGTCGGTGTAAACGGCATTTCGGACGAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_14 1984 1335 NC_033486 Wuhan fly virus 5 strain fly34516 segment Seg 2 hypothetical protein gene, complete cds Wuhan fly virus 5 28.4 1 100 15.0 2.39383e-07 55.1359 1923699 Viruses;Wuhan fly virus 5 CAGCACGTCCGCAACCGGGTATCCACTGTTTTAAGAGTTTCGTTTTGGACCGGTTACCAGTGAGCTTTTACCAAGAGAGAGCGTTGTAGTAGAAAAGAAGTATTGATCTACTTGGTGTCACTGAGGACGACAGATGCGTCAAGCGCGACAGAACGAATTAGGCCATGAGTCGAGAAACGTCGAAGATTCAGGTTCAAAGAAGAACCGAAATTGAACGAGTCGTTCATGTGTGCCATCCATTCGATGCCAGGATCACGATATGTATTGTCGGCGTCAGACTGTATCAGCCAGGGCTGATAATTGCTGGCCTGAGCAAAGACCGGTGATCTATCTGGATTGTATGTTCCAGACCAGATGAGCGATCGCTCAAGGCGGTAGCCGAACGAATACGCTGGTGACAGGACTTTGGAGTCCATGGCGTATCGAGAATGAAGGGCGAGTTCTGTGTGCAAACACGCGTTGACCTTCTGATTTTGATGAGGACCTGGTGCCTTTGGCCACTGGGAGCGGTTGGAGGCGTAGTCCTCTGTTGCAAGGAAGTAACAATCCAGGGGATTGCCTCGCACAGAAAGAGTCAACTGTGTTGACGAATTCACCTTGAGTCCTGTGACGGACGCAATTCGGTCAGACACGGCGCGCATGGTCGATGTGGAGAGCATGAACGTTGTCTGAGAGTCAAGGGCGCAACCATCTATGGACCAACCAAGATTAGAGTATGTCGCACGCCAGGAGGCGTGAGTGGCAGTGTAAGTGCCATTACTCCATCCAACGATGTTCTCGGTCGGAACCGAGTAACTGTCATCAGAAACGGAAGGTGAGATCTCAGAGAGATCAAAAAGACGATTGGGCTGGGAGCCAGGGGTGCAAGAATGTGCTTCATTGCACAGGTAAGACACGAAAACACCCGGACTCGGAAGTTGGGCGTACTTCCAGAAGGAAGTAGTGTCTACCCTAGCGTCGGGAAGACCAGAGGCGAACCATCCGGAGTGGATAGTGCCTGTTGCTTCGGCAAAGGTGTGGGGAGGTAGGCGAAAGAAGAAGTTTTCTCCTCCTTGCATGAAATTGCCTAAATTGGCAAGATACTGAGCAATTTGGGAGGGTATTTGAAACTCCTGCCCCATCTCCATCACGTTCATGAACTGACGTTCGTCAGAATTCAAGACGTTACCGTTTGCGCGATGCAGGTAAAGAACCCGGTACCACCACAATTGCATGCAGTAGTAGCGGAAGAGGCCGAATGGGATGTGCTTCGCCGCATTTGAGTAGCGCGACTGAAGTGATGTGTACACCACATTGACCAGGTCGTCATATGGCTGTGCAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_588 38 219 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 35.4 1 100 7.0 1.82953e-09 58.494 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus CAGCACGTCCGCAAGAGCCTTTCCCTGATAACTTCTCGTTCGCCAGGCGACAATATATCCTTTTCCATCTCTACACCATTTACCCTTGTTTTAAGTGATACATTGCGCCTTGATTCTACATTAAATACAAATTTTTTGTTATGGTTGTGAGAATCTGCCATGCCATTCATGTAATCCACGACTCTTGCTGCTGATGCCATTTTGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_272 4 259 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 90.4 3 100 9.0 3.231256727625802e-20 349.6072 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F GGACGTTCGGGCTTTTCGTGGTGTTTGGGTTGCAATCCGCAATACTCAATGACGCTGCAGTCTTGCTTGGTCAGGATTTGCCCTCTTGGCTCAAGGAATGTGATGCTATGGTTGACTATATGCACTTGTTTGCTGTAGCTCCGCGAGATGTCATTGATCGTATGCAAAAGCCTCTCAGCCTTGGGAGGCAACTCAGAATTATCTACAGAAAATTGTGCAATAGATATCGAGCTTAGTTCCCGGGTTTGCGGACGTGCTG
+TBLASTX ds2020-267_355 78 244 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 69.8 1 100 8.0 5.21666e-22 100.499 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAAACCCCCCTCTTAATAATCCCCGTAACCCCCGAGAGGAGCACGGGCCACTTTGGCGTTAGGCCACGCCTTGCGATAATCCTCTCGCCCCAAGAGGACTAAATCGCGCCACTGCTCAAATGTCAGCCGCTTGGGAATTGGCACCTCAACACCCACATTGCTATAGTCCCGCGATACCATGCGTTTGAAGTTCGGGGGCCAATCGAGGGGCGGGGTCATTTGCGGACGTGCTG
+TBLASTX ds2020-267_856 16 206 NC_010985 Curvularia thermal tolerance virus RNA1, complete sequence Curvularia thermal tolerance virus 37.2 1 100 6.0 0.000320058 40.9315 421976 Viruses;Curvularia thermal tolerance virus CAGCACGTCCGCAAGGACCATGGCATATTTAATTTAATTCTAAAGGAAAAGTGGCAAGATGTGTGGCACTCTGCTGAGATGGAGAGTCTTGGTGATGATAATATCACAGGCTTACCGGAGTGGATGAAGCATATCACAGCCGAGGAGTTGGGGCAATCCGTGTTGGATATGACGGGGATAAATAGGCAGAGGTTGCGGACGTGCTG
+TBLASTX ds2020-267_61 32 465 NC_039077 Prunus virus F isolate 8816-v1 segment RNA1 polyprotein 1 gene, complete cds Prunus virus F 72.3 6 100 11.0 5.1484708137e-16 421.9992 1855510 Viruses;Orthornavirae;Pisuviricota;Pisoniviricetes;Picornavirales;Secoviridae;Fabavirus;Prunus virus F CAGCACGTCCGCAAGGATGCACTCTCAGCACGTCCGCAATAAAGGGGCATGTGTTGCGGACGTCGCTTAAGGCGACGCACTGACCGTCTTTTCGCCCTTGGGACACTCGATTCCCACCAGTTCTGGTACCTGATTGGCACATTCTTCATAGAGTGAGGAAACATCCTTAGCAACTTTTGAATTGGGTTGTATTCTCAGGCTTCCAACCTCACCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNTGAAGTCAACATGTTCTGTGCCAAGCAAACGAGGATCATTCTTCGTGATAACGCTGGGTATCTTTTCACAGGGAGTTTCCAGGTGCCACTCGAGTGGTGTTTCCACCAAACTGGAGGGCCACGAACACGGTCAGTGCGTCGCCTTAAGCGACGTCCGCAAGTAAGATTCCTTCGCACGTCCGCAATAGAGCTGTCTTTATTTGCGGACGTGCTG
+TBLASTX ds2020-267_21 912 858 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 58.3 4 100 63.0 1.336125e-15 550.4540000000001 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAAATCCCGCTTGTTTCGTGAGTTGGCCATATTCCGGATAGAGCAGGCGCAGGTAGGTCTCCTCCGCTGGGCGGTAGGGAAGGGGGAGCTGAATGACCCCATCCACCACTGGGTAGTCGGCTAGGAACCAATACTTTCCCAAGAACTGAATCCCTTGAAACTCCCCCTCAATGGCATCCAGTAGACGGGTGGTGGAGAAGGACTTCTTTCCCCACCAATCGATGGCCACCATCCTCTGGACACACTCCGCAATCGTCTCCGTCGTGAGGTGGGCCAACCTGAGGGAGACCGCCATGATATTGTCGTCCCCCAATGACTCCATCCATGCGTGCTCGTCAATGTTGTCGATGGTGAGCCCCCCGTCCAGTTCGAAAAGCGCCGCATATCCGATGAGTAGGGTGATGATGGACTGCAGGAGCGTGTTGTGGGAATGGCCACTTGTCGTGCCCACATACTTCTGCATGCGGACCCCATCATCGCGATAGATTGGAGCCCGCAGCAGGCTTTCTGCCACAAAGGCCCAATAGGTGTCGTAATCGGGATTGTCCCCATCGTAATACTGCTTGCGACAGATGTTAATGGCGATGGTGACCATCCATTCATTGATGCTGGAGTCGAACTTCTTGGCGTCGAAGCAGAAGAACTTGTCGAAAGGCGCCATCCTGTCGATGAACTCCTGTGACCCCCCGTGGTACCATGATTGACCCACCGCGATTGGATAGTTAGGGGCGGACCAGGCCTTCGTTAACTGGTTCTCTGTGACCCCACACAACTTCAAGTCACGGTGGCTCATCATGAGGATCAGACGCCCCACGGGGGGGATCTTGGATTCCTTGCGGACGTGCTG
+TBLASTX ds2020-267_2 7516 2436 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 41.5 7 100 53.0 5.655557142857142e-05 679.2049 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAACAGTTGGTCCTTGCTAACAGTAATGGCGACTTGTGGACACGCATGGGCGCCTTGCATGGACAAAGTTCTGCAGTGGCCTGACATAACGAACACGTTTATGTCATCACTACTACTTGCCATGGCTGCACTACCACCAGAGTTATATGTACTAATGGTGGAGTGGAACGGCTGGGCAAAGTGTGGCTCTATGGCAGAGTACATCGTAGAGGCAAAAAACCTGACGACTAAGATGAAGGCACTGGACAACCAGGTAACATTGGGTGACTTCGAACTCGACTTATCGCCTTTATTCGAGTGGGAAGTGCTAAATCACAGAGCGGTCTTGAAAGGCATCTATGACAAGGAAGTCACAGAGCGTAGAGATCAGAAACAGAGCATCAAGCTATCTGCTGCCGATCTGGAGGAAGAAATAGACAGCGTGTTTCAGGACGTGGGTTCCGTTCTAGACGCCAGGACAAAAGAGGGTGAAAAATCACCTCTGTATGCAACGTGGGATGATTGGTACGTTGACAGGGTGCAAACCACACCAGCTGGGTCTGCATTCACAGTCAACAAGGACATGATGGAGGCAAGAAACATGCTGAAAGCCAATGGGGTCCAAAATCTGACCAAGACGCAAGTGATGGCGCAGATGAGGGACAAGCTCCCGCTGGCGTCTATCTTGGGTAGCGAGCCAATGATATTGGCCCAGATGTCATGGAAGTTGGAATGGTCAAAACTGAGGGCACTATTTGCTGCTAGCATGGAGCACTGGATGCCATCGGCATTCGCCCTGGGGCAGATAGAAGAGTATCTACCCAGTGACTGCCCCATAGGTAAAGCTGCCGATGCGCACAACGTGTGCAGGCGCGTGATGGAAATGTCAACGCAAGGAGTGGTAGCATGCATAGATGCAAAGAACTTCAACATCTTGCACACCCACGAGATAATGTCAGCAATACTGAAATCCGCATCAAAGATGCTAGGAGATAGGCTGTCTAGTGAGCAACATGACTGCCTAAAGTGGCTGGCGAAAGCGGAGCTGAACCAGAAAGTGCTGGTCAAGACAGGTGAAGTAACTGAACAGTTGCTCCAGGTCGGCAGGAGAGACGGGTGGATTAACAAGCTAACTAAAGGTGACGGCACAGTGGTAGAAGCGGCTGACGTGACGGTTGGAATGTTTTCAGGTACTAGGTTCACGATGCTGTACAACACAGTGCTAAACAGGGCGTACTACAAAGTGGCGGAGAAACGTGCGAAGATAAAGACTTTATCACTTCATTCGGGTGATGACGTGTATGCTGTTTTCGCTAACTATATAGACGTGTACAAGATGAAGCGTGAGATGGCGTTAATCGGCTACACACTGCAGTTAGGCAAGTGCTTCTTGCAGGGAGTCCGAGAATTCTTGAGAATATCTCATAAGAATGCAAACACTTCTCAATACCTAGCGAGGTCCGCAGCAACGGCAATACATGGAAGAATAGAGGCAGATGAGCCTTCTGATTTCGTGGCTTTTGTGGGGTCAATAATGAGAAGAGGTGCAGAGATGGTGGTCAGGCACGCGGCAAGAGCAGTGTTGCTAGATGTCATGAAGATACAGATAGCAGGAGCTTGCGCAAGGTGGGCGATTACAGCTATGGCGTGGGACTCATTCTTAATGTTGCCAAAAACAATGGGCGGT
TGTGCTGCAAAAGCACGCCTGATGGAACAATGGAGTGGTTTTTCTATAGAAAGAACTGCAAGCGCCAGAGGTGGCATCGTAGACTATTTGGCTGAACAACCAGGTACCAAAACAGCGGCGAGGAGGCTGGTTGAGAAGTTGCAAATAATGAAGTACCACAAGAGAGTTGCACAAGCCGTTGCTGCGGCGATAGCACCTAAAGGAGTTTTGAAAAACTACGGTATGATAGTAAGGTGGATGAACAAAGATGACATGGCACATATGTCGAGAGTGGCAGGGACACTAGGGCGAATAAGACAATCGAGAGAGTACATATTATCAAAAGCAGCAGGATTATTCAATACGCTAGCAATAAATGACAACTTCTGGGGTGATGTGAGCGGTGTGTTCAGAGGCATACCGTCAGCGTGGCACGGCAGAGCACTGACGTTCGCACTGTCTGAGAGGAGTGAGTCAGAAGCGCTGTTTGCAAATAAAATGTACAAGCTACACTATAAAATGACAGAGTGGGCAAGAGCTGCAACAGAGAATAGACTGATAAGAATGCAGCTAGATATGCCACCGGGGTAATGCTGGTGGTAATAAGTACGATAGAACTTGCCATCCACTAGGGAAGTGGACACAAGCGGAGTAGGCGACCGGTGGCAAGTATAACAAGCCAGGCTGAACGGCCGTACGTGGCTCCCAGACGTACAAACATTGGCGCTATCAACTAGCGCCTACACAATATAAAATATGCGTTTAGTTGCGGACGTGCTG
+TBLASTX ds2020-267_56 95 478 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 32.4 1 100 7.0 2.87431e-13 73.0061 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B ACTCTGTATGCGTTCGCCAAACGCAACGCATCCCTAGGCTCCATGACGAAATCGTCGCCAATGGGTATCGATTGCATCCCAGATAGGTGTGACACACCGTCATACTCATCGACTACGCAGCCAGCCAATAGTGCTCCTGAGACGTAAGCGGGTATGCAAGTCAGGCGCTTTGATAAGGGATAGCCCTCCTCTATCAGCCTGGTCGCCTTGACTTCTTGGACTTCGGCAAGGTGTCCAAATTCGAAGGCCAGCCAACACGAGTCGTTCGCGACAGTAGGAACCTCTTTCCCGAAAGGGACAGAGCACATTGCGGCTCTGCCTATTGGGGACATCATCATCCGGATTGCTACGGTCAGTGCGTCGCCTTAAGCGTATCTAAGGAGCAGCACGTCCGCAAAGTCTTAACCCTCAGCACGTCCCAATACATTTTCCGTCAGCACGTCCGAAAATCTACCACTTGCGGACGTGCTGCTCCTTA
+TBLASTX ds2020-267_393 23 240
+TBLASTX ds2020-267_50 128 510 NC_038928 Aspergillus foetidus slow virus 1 CP gene and RdRp gene, genomic RNA Aspergillus foetidus slow virus 1 45.9 2 100 8.0 2.41899e-28 142.8046 1087070 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Aspergillus foetidus slow virus 1 CAGCACGTCCGCAACGCCACCGAAGCCTACCTCGCCGACCATGTCTCGAATGTCGAAGCTACCGCCCTGGAGATGGTGCGGGTGGATATAGTGGGTTTAATGGTTACTTCTTCTTACCGGAAGGGGTTGAACCAGACCCACTCAATACCGCCACAGCCCCTGATCCTAAGGAAGCTACCCCCAAGACGTTTGAGATCTTTCGTCGACGCCACTACCCTCATGAAGAGTCCAGTTAGACATGGGTGCCTCACACAGTATCCCATCCTACAGCTCTTCGCCTCACGGCTCTCTGAAGCAGAACTCCGCACCCTCGTAACCGAAGTGGGCGGAGATTCGACTGCAAGAGATATCCGGAGGGAGGCATTTGGCGCCGAATCCGTCACGAGGAACATCGTAGGTTTCATCCCGCTCGCCGACGCATCCTCGCTAGCGTCCAGAACGGACTATGACAACATCATGGTCCAATACCAAGTTTATCTATAATAGCCTGCTACATTTGCGGACGTGCTG
+TBLASTX ds2020-267_266 2 260
+TBLASTX ds2020-267_119 45 342
+TBLASTX ds2020-267_388 10 241
+TBLASTX ds2020-267_6 1161 1860 NC_016760 Rosellinia necatrix quadrivirus 1 segment 3, complete genome Rosellinia necatrix quadrivirus 1 41.9 5 100 39.0 1.1597159999999999e-05 494.24539999999996 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 TGAGGCTATTGTGCTGTTCTTCTGACAGCCTGGAACCTATCATCACTGACGCTGATTCCAATAGTGCTATTGCTAGTGTGTTGTTTTACTTGCCTGGGAGCCGCAAGCGGCTTGCAAAGCCTGGCGTTAATTGTACGTGCACCGGTTGCCTACACCGACGTTGACGGCGCTAGCTCTCCCTCAGCTAACGGGTCGTTAGTGACCAATTCTTTTGCGCCCATTTCGTGCTTGCTTGTCTGGGAGCCACAAGCGGCATTTGCAGCCTGGCGAGTTATTTGATACGTGTACCGAGTGCCTACCCCGACATTGACGGCGCCAACCTTCCCTAGGTTGACGGGAGCCACAAGTGTTTCACACTCATGGCTCTAATTACAGTGGCCTTTGGCCCAAGTTGAGCCTATGTCTCGTTTGCGAGTAGTTCGTCGCCACTCCTATCCACCCCATCACTGTGGTATGTAGCTTGAACCTCCTGTTATCGAACAGTGCTTTCTCCTCGCCTCTTTTCGCCAGCGCGAACGTTAGTGCTCTGGCGTGCCACGCTGACGGTATGCCTCTAAAGACTCCCGTCACGTCGCCCCAAAAGTGGTCGTTGATGGCCAGCGTGTTGAACAAGCCAGCTGCTTTGGATAAGATGTACTCACGTGACTGTCTTATCCTTTCCAGTTGACCCGTCACGGTCGCTAAATGCTCAAGATCGTCCTTGTTCATCCACCTGACTATCATTCCATAGTTCTTGAGGACACCTTTTGGTGCTATGGCTGCTGCCACGGCTTGCGCAACTCTTTTGTGGTACCGCCGTATGCCTAGTGCCTCTACTAACTGTCTCGCAGCAGTCTTGACTCCTGGTTGCTGCGCCAGGTAGTCGACTATACCACCACGTGCGCTGGCAGTTCGCTCGATAGAGTACCCACTCCACTCGTCTGCCTTTCGTGGTCGCGCAGCACACCCACCCATGACGTTTGGCAACACCAGAAATGCGTCCCAAGTCATGGCCGAAATTGCCCAGCGTGCACAAGCCCCTGCAATTTGCAGCTTCATCACGTCGAGCAACACGGTTCTCGTTGCATGTCTGACAACCATTTCTGCACCACGTCTCATGATGGAACCCACGAATGCCACAAAGTCTGATGGTTCATCAGCCTCAATTCTACCATGTATTGCAGTAGCTGCAGACCTCGCCAGATACTGTGACGTGTTTGCGTTCTTGTGTGAGATCCTTAAAAACTCTCTCACACCCTGCAAGAAGCACTTCGCTAGTTGCAGTGTGTACCCAATGAACGCCATCGCTTTCTTCATTTTGTACACGTCAATGTAGCTGGCAAACGCAGAGTATACATCATCGCCAGAGTGTAGTGACAGTGTTTTGATCCCGGCGAGTTCTTCGGCCACCTTGTAGTATGCCCTGTTGAGTATCGTGTTATACAACATCGTGAACCTCGTTCCTGAAAACATGCCAACCGTGACCGTCGCTGCTTCCACCATGGTGCCGTCACCCTTCATCATTTGGTTTATCCACCCTTCTTGTCTCCCTGCCGACAGCAGTTCCTCTGTGACCTCACCTTTCTTCACTAGTACCTTCTGGTTCAACTCAGCTTTGGACAGCCATTTGAGGCACTTGTGCTGTTCTTCTGACAGCCTGGAACCTAGCATCACTGACGCTGATTCC
AATATAGATGCCATCACCTCCTGGGTGTGCAAGATGTTAAAGTTCCTCGCATCTATGCATGCAACTACTCCCTGAGTAGACATCTCCATGACTCGTCGGCACACCCTGTGTGCATCGGCTGCCTTGCCGATGGGGCAGTCAGCTGGCAAGTACTCTTCAATCTGCCCAAGCGCTAAGCCGTTGCGGACGTGCTG
+TBLASTX ds2020-267_16 824 1165 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 50.8 1 100 25.0 1.27294e-121 434.533 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B CGTCCATCAGGAAGCCGGTCATTTTGGCTTTTCCGTAATTGACTATGTCTGTTTCCTCTTTGTGTACCTTGAATAGCGCGCGCAAAATCTCGTACCGCTTGATATTACCATTTTTTGAAACGTTTATGTTCCTTTCTTTTGGTATTACCGCGTCGTATGTTGCGCGCATTATCCTTGAAATGAAATCCTGCAAAGGTTTTTCAAGTTGTAATGATGCTTTCACCATTCTGGAGTAGTCCACCACTCCCGGTAACACGCCTATTTGCGTGGCACCCTTCCTGAAGCCTGATGACCGTATCATCCACTTTACGTCCGATCTCCTGTCTTCACTTATGCCCCCCACACACCTATGAGAAGTTTTTATTTTGTAACAGTCTGAAACTGTCATGTGCAATCGCTCACACTGTCTCGAGTAGTATTTGTTCCTCAGTGATGCTGCTAGCCACGTGGGCATGCCTCTCGACACCGAGTCGTCGAGGCGTGATTCCAACGCCTCTAGAAGGTCCCTCATGTCACTCGAAGGTTTTGATTCTATCCTCGAGTGTACTAAGGTCGCCATGGCCCTTGATAAATATTGTCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGTGCCCGAAGGTGTCTCTGTACGCATCTATCACTGCTTTCATTGACTGTACACTATGTTGACTGTTGAAGTCTTCAAAGTCTACGCAGTATTGAGTTCTACCCTCGAGAACCGCCCTCACTCTGCTACGAACGTTCTCATCATTCGCAGCCTTGCCTACCGGGAATGGTGAAGGTAACACGTCTTCACAGTTGTACAATTGCGGACGTGCTGG
+TBLASTX ds2020-267_101 84 375 NC_016758 Rosellinia necatrix quadrivirus 1 segment 4, complete genome Rosellinia necatrix quadrivirus 1 22.3 1 100 8.0 0.000188849 43.2225 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAATCAGTGTGTCCTCTGCTCATTGTCACGTGCACCTGACTGCTTCATGTGCTGTAGCCAACCAAACAGGCTAGTCAGCGCGACTGTACCTGCCATTTTAGCTGCACTGACACTGTTGAGCTCGATTCTTGTCATAGCAGCTATCTCTTGTTCATCCAACTGCATGCCGGGAGCAGCTACACCAGCGACTGCCTTGCCGTTAAGTAAGTGCGCCATGACTGCATTTTCACTGACGCTGATTCCTTCTGCCTCAGCCATGATCGGCAGCTCACCGATCACTCTGATCTGGTGCGGCTGAAACACAGTGATGATCTCACTTGTCAGCGTCTTGTCAGAAGACTTGGCCATGGTTGCGGACGTGCTG
+TBLASTX ds2020-267_236 66 266
+TBLASTX ds2020-267_443 18 233
+TBLASTX ds2020-267_450 2 233 NC_006642 Cotesia congregata virus complete genome, segment Circle10 Cotesia congregata bracovirus 41.1 4 100 5.0 0.00020802475 172.0095 39640 Viruses;Polydnaviridae;Bracovirus;Cotesia congregata bracovirus CAGAACGTCAGCAATCGGCGTACCCTAGCGCGTCCGCAAGGAACAATCCTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGAGTCGTACCCCAGCACGTCCGCAAGTAACAATCCTTCAGCACGTCCCAACTATCGTGCAGCACGTCCGCAAGCGCCGTACCCCAGCACGTCCGCAAGTAACAATCCTTCAGCACGTCCCAACTATCGGGGCATTGCGGACGTGCTG
+TBLASTX ds2020-267_644 8 216
+TBLASTX ds2020-267_36 424 651 NC_016758 Rosellinia necatrix quadrivirus 1 segment 4, complete genome Rosellinia necatrix quadrivirus 1 28.0 2 100 13.0 3.23046e-12 88.7361 1000373 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Quadriviridae;Quadrivirus;Rosellinia necatrix quadrivirus 1 CAGCACGTCCGCAACTACGACACGTTTTTGTAGCGCTCCCTGGCCGTGTCTGCGTTCTGCATTGCTCGCGGCAAACACAGCAGGTTGTGTGCATGATCAAGTTGCAGACGCGTAACGTCCTCATCTTTTAGACACATTTGTGACCGCTGTGCCACGTGCACCTCTGCCATCGCTCTACCGCTGCCCAACATCTGGATGCTCGAGCAGATCATGCTGACCATCTCATCACCGTTGATTGACGAATTCTCACTGATCTTGTTAAACTGAGGGCTGTTAGATGATGAAAACAGCCTGTCAACCGTTGGCTCGCAAAAGGGTTGTACCACTTTGTACACCCCTGCGTAAAACACGTCAGCATAGTCGTGGTGGGACAAGGCTGCAGGCTGGTAGGTAGACGCCACAGCTAGCGACGCCATTAACATCACGTTTTTAGAAGCCATGAAGTGCCTGGTCGTGACGTGTCCAATGAGGTCCAACATGTCGTTGATCGAGAAACCAACACTGTTGAACCAGTCTCTGTCGAGGTGGGGCGCTGACGACCCTACACCTGCAATGAAGGACACATTGCACTCACTTGCCACCGCCATCAACTTCTGATGCCCCACAGCAGCCTCAATGGAAGGCGAGAACCCCGTATTTGCGGACGTGCTG
+TBLASTX ds2020-267_5 37987 2029 NC_023684 Rhizoctonia solani dsRNA virus 2 segment 1, complete sequence Rhizoctonia solani dsRNA virus 2 47.6 8 100 100 3.1306275000000004e-37 1379.9565000000002 1411681 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Rhizoctonia solani dsRNA virus 2 ATCGCACATGATAAAGCCCGATATCTAAGGAGCAGCACGTCCGCAACCCTCTGCCTCCAACAATAAAGCAGATTTCTTTGCTCTTCTAACAGCTATTACTTACCACAATGGACCACCTCACTTCCCTTTTCGAGCTTTTTGCTATCACACCGAAAACACAAAACAATCTACAGTTTGTTGGGATCTACCACAGACCTCCACACTCCGTTCGAGCAAACCTCCGCAACGTTGAAAAACACAAAATCACAGTCGCTCACGCCATGCACAAGTACCTTTACCCGCATGAAATCGACTTTGTTATCAACCAAATGCGACGCTCAGACGTCACTGAAGATGCCATACTTGCTGACTTTTTCGACAACAACGTCGAACCACTTGAACCTGTTCTTGACGAACACTTCGAACGTGGACTCTCCGCAATGCTGGACGCTTTTCGCCCTCCGCAGAAATGCCTACCTGCCCACATCTATGATGTGCAGCACCACTACCCATATAAATGGCAAGTGAACGCTGAAGCCCCCTTCTCCACCGATTCCTATTTCTTAGCGAATCGACCAACCTTCCGCGCAGTGTTTGAACGACTCGAATCGCTCTACACACACCTCGCAACCGATTGGCACCGCCGATACGGAAACAAAACCGACAATGATGATTTTATGAATGATCATGTCCCTGCGAAATTTGGCCCTATGAAAGAAACAGTCTTCTCATGGACTCACCGATGGCACCACGTCATCAAATCCAACTTCACCGACACAGCTGGATTGTCTAAAGACTATTACTTCAAAAACCGATACATCTTCCCAATGCTACTTCACACGAAGACAGCGATTGTCAAGAAAGACGACCCGAATAAGATGCGAACCATCTGGGGCTGTTCAAAGCCTTGGATCATCGCAGACACCATGCTATGGTGGGAATACGTCGCGTACGCTAAGTTACAACCTGGAGCCACACCAATGCTCTGGAGTTACGAAACCTTCACAGGTGGCTGGCTTAGACTCAACCACGCACTTTTCTCTTCATACATACGGCACTCGTACATCACACTCGACTGGAAACGCTTCGACAAGAAAGCGTATTTCTGCATCATCGACAAAATTTTCGATGGCGTTGAAACATTCCTCGACTTTGACAACGGCTATTTGCCTACGAAAGATTATCCCGATACCAAATCGACTTGGACACAAGAACGTTCCACCCGCCTCAAACGCCTGTTTGACTGGACAAAAGAGAACTTCTACCATGCACCAATTGTCCTACCCAATGGGCACATGTACGTCCGAAAATTCGCTGGAATACCCTCTGGCCTATTTATCACTCAACTGATCGATTCCTGGTACAACTACACCATGCTCGCAACCATCCTATCCGCGATGGGCTTCGACCCTCGGTCCTGTATTATTAAAGTCCAAGGTGATGACTCAATCATCCGCCTCAGTGCACTCATCCCTCCGGATGCTCACGATTCTTTTTTAACTAAGGTCCAAGAACTCGCCGACTACTACTTTCAATCAGTAGTCTCCGTGAACAAGTCTGAAGTACGCAACGAGCTCAACGGATGCGAAGTTTTATCGTACCGACACAGACACGGTTTACCATACCGCGATGAACTAGCTATGCTAGCTCAACTGTATCACACGAAAGCACGCAACCCAAGTCCCGAAATCACAATGGCACAATC
CATCGGCTTCGCCTACGCTTCCTTCGGAAATCATGAAAGAGTACGTCTCGTACTACATGATATCTACGAATATTACAAGCATCAAGGCTACACACCCAACCGAGCCGGACTCAGCCTCGTCTTCGGAAACTCTCCTGACCTCATGATCCCGCACTACACACTTGATCACTTTCCCTCAATCAGGGAAATAAAAATGTTCCTGACTAATGCAAAATATGCCAATGAAGAAACCAACTCACGAACGTGGCCTTTAACCCACTTTCTCCATCTTCCTTGTCATCGCACTTAGTATTTGAGCAATTGCAATTACAACATAATTACAAAAAAAGGATTGCGGACGTGCTG
+TBLASTX ds2020-267_43 465 563 NC_021222 Cryphonectria parasitica bipartite mycovirus 1 strain 09269 segment RNA1, complete sequence Cryphonectria parasitica bipartite mycovirus 1 57.9 2 100 21.0 5.04473e-43 192.2912 1329781 Viruses;Cryphonectria parasitica bipartite mycovirus 1 CAGCACGTCCGCAACTACTCTCCCTTGCATCAGGCGGTGAAATGCGCTCTCTGCGTCGGCTTGTGCCAGGGGATTCGCCTCTTCCCTGGTCTTAAGTCCCATTGTAGCGTACTCAATGCCGGCGAACTTCTTGGGGTAGAACTTAACGGTGGCGAGATCTTCCACTGCCGGGAAGAAGAGGAAGTCGGGAAGGTCGAGTAACTTTGCCACTACATAGGCGGCCTTCTCTATGGAGTCGGTGTAGCGGGGGTCAGGGGTGTGATTTGGCCGATCGAAGTGGCGAAGGTGTGCCATCTCAACTGGGGTGCAGGCCTTGACGAATGTGAATTCCTCCGGCTTGAAATTGTTGATGGGGGGGGGATGGAGGAGGGTGTAGGCGACAACTTCGGGGTCGGGTGGCGCAATGTCGAGTTCCTTGTTTAGCTTCCCATAGGCTTCAACCCTACCGAGGATTCGTATATGTTGGAACATGTTGGTGAGTTCCATCACTTCGCGGGTCGCGGCCTCTTTGGACCTCATGGATCGCATACGCGTCCTACGCTTGATAGATTGCGGACGTGCTG
+TBLASTX ds2020-267_453 17 232
+TBLASTX ds2020-267_352 4 245
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s2.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s2.fa Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,6446 @@
+>ds2020-328_1
+GGTCGGGATAGACGTTGGAGCGCGGTCAGCCGAGACCCCTGACAGAGGAAAGAGTCTTGA
+GGAGTCCAACGTTCGGCCAGGCATAATAATTCGTGCCCACTAATCGAATCGGTTTACTCG
+CCCACCATGTCAGCGCCTTCGGGTTAGTTCTTTATGGAGTTATTTCTTGTTCTTTCTGTC
+ATAACAATTCTCCTTATGGAAGTCCCCCACAAGATTAAGAATGCTTGTTGCCGCGGCTGT
+CTTGGTTCTTCGTTTAGCTTTCTGGCATATTCTACGGAGCTTTCCACTCTGGAGCTGGCT
+TTCAGAAAAACCTTCATTCACTAGATGTGAAGCACCCCTATGGGGGAACCCTCTTACCCG
+CTTTCCTCCCCCCCCGATATGGGGGGCCTCGCTGTCGCCTTTGGCTCGAGCTACTTTTTC
+TCCTGGAACGGATAGCTTTCTGTCCAAGTCTATCTCCCAAAAGTCAGCCATGTAATTGAC
+TTCTAACGTCTAATTTTCTTTTTCACCGGGGGTCCCTGATCCCCGTTGAATATTCCTTCC
+TTCTGAAAAAGCTGTGACTCCTAAATTCTTTGATTGAATGAAATGTGGACTTGGTCACGG
+GGCAATCTTCTTTTTTAGACCCCGCTTCTCTCGGTGTTACCTTTTTCGCCTTCTCGTCTC
+GCTTCGCGTCGTCNNNNNNNNNNGGTCGGGATAGACGCGCCGCTTCCGTCTGTTTTACCT
+TGTTAGAATTCTCGGCGCGCTTGGCGTCGTCTTTAGAGTCAATTCTATTGGAATCTCCTT
+TCCCCTTCTTTTCTTCCCCCACGATGAAAAAAATAAATATTGCAAAAAGAACAATATTTC
+CCCCCGTGGTCATCATAGTGGTTCCTTCTGATCCTAGAAAACGATTAAAAAGAAGGCAAA
+AAAAACAAAGGAGGATCTGCTTTTTCATATTAAAGCGCTTTCTTTCTTTTAAAAATACAT
+CATAGTAAAGCGCTTCCTTTTAAAAAAGCATCTGGTTCCATCTTTCTTTCGTTAGTTAAC
+CCACCTTTTTCTAAAAGGGATTGTAGTAATTCTGGTTTTACACTATTTAGAATGGCTCTC
+TCATATTGAGAGATTCTGTCTAGTGGCATTCGATCACAGAATCCATTGACAGCTGCATAA
+ATGACTAGAATTTGTTTTTCAATTGGAAGTGGTGCATATTGTGGTTGTTTCAGTACTTCT
+GTAAGCCTTGCACCTCTATTGAGTAATGCCTGAGTCGCAGCATCAAGGTCTGACCCAAAT
+TGAGCAAAGGCCGCCACTTCGCGATACTGTGCCAATTCCAGTTTTAAACTACCGCAGACC
+TGTTTCATAATTTTCAACTGAGCGGCAGACCCGACGCGACTGACAGATAAGCCGACGTTA
+ATAGCAGGTCTAATTCCGCGATAAAAGAGCTCTGTTTCCAAACAGATTTGTCCATCAGTA
+ATGGAGATTACATTGGTTGGAATATAGGCCGATACGTCTCCAGCTTGTGTTTCAATGACG
+GGTAAGGCGGTCAAGCTACCTGCACCTGTCTGGTCCGATCGTTTAGCGGCTCTTTCTAAG
+AGACGGGAATGTAAATAGAAAACATCGCCTGGGAAAGCCTCACGGCCTGGTGGTCGGCGT
+AACAATAATGACATTTGTCGATATGCCACCGCCTGTTTACTAAGATCATCATAGATTATT
+AATGCGTGCATTCCATTATCGCGGAAATATTCCCCCATGGCACACCCAGAATATGGGGCC
+AGAAATTGCAGAGGAGCTGGATCCGAAGCGGTGGCTGCTACAAGAATGGAATATTCCAAA
+GCATTCGCTTCTGAAAGAATTTGAACTAATTGTGCCACAGTCGAGCGTTTCTGTCCAATT
+GCTACATAGACACAATACAATGTCTCACTCTCAGAGGTGGCCCTTGAGTTCAGTTGCTTT
+TGGTTTAATATGGTATCGATAGCAATAGCTGTTTTTCCAGTTTGTCGGTCCCCGATTATA
+AGTTCTCGTTGACCACGGCCTATAGGAACCAGGCTATCTACCGCTTTTAACCCTGTTTGC
+ATAGGCTCGTGCACAGATTTACGTTCAATAATCCCAGGGGCTTTCACTTCGACACGTCTT
+CGCTCGTGATCGCTTAGAGCCCCTCTTCCATCAATAGGAACTCCCAACCCGTCGACCACG
+CGCCCTAGCATAGCCTTTCCCGCAGGAACATCCACAATGGATCCAGTGCGCTTGACAAGA
+TCTCCTTCTTTAATAGCGGTATCACTACCAAAGACAACAATCCCTACATTCTCATTCTCA
+AGATTCAACGCTATTCCTTTCACACCGCTGGCAAATTCAACCATTTCCCCAGCTTGAATC
+TCGTTCAATCCATAAACACGTGCAATCCCATCTCCAACTGAGACCACTCGACCGATCTCA
+TCCACTTGAAAATTCGTGTAAAAGTTGGTAATTCTACTTTCTAATAGAGTTGTTAGTTCC
+GCAGCTCTGGTAGAGAATTCCATAATTTTTTCTTTTAAAGAAAGTCAAGGGAGAATTCCG
+CTTATTGTTTTTGGCTCGAAATAAAGCTAGGGTCCTGATCGAGCAACTAGTAGTCCTATC
+TATCCACCTCTCCAGAAGGGCTATTTGGGGTCTAATTTTCTTTCTATCTGACAGGACAAA
+CAAAGAGGAAGGGGTGGTTCTTTCATTGCATTGATAGAAGTCTAACTAGAAAAAGATCTC
+TCTATTACTTTGAGAAGAGAATCGTTGGTTTGACCGACGAACTACGTGGGAAATATGAGT
+TGAGAGGACAAGAGGATTCGATCTCCACGAAAGGCTAAAGGAACATAAAAAAAGCTAGAA
+TTTGTTGCAAACAGTGACCGAGATGCCAGGGAAAAACTGTTGTTTCACATTTCCGGAAAG
+ACCACCTATTTGTTCGTTTACCAGGTTCGGTACGAAATCATAAATAAGCTCTACCCCGGG
+CCATCGCCTTATGGCCTAGGGGCGTCTATCCCGCC
+>ds2020-328_2
+CCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCTTCCC
+TACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTT
+TCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACT
+CCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTT
+CCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTT
+CCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTT
+GTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAA
+CTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCT
+TTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCT
+GGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTT
+TCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTT
+CCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACA
+TCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTC
+CTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCA
+ACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGT
+TTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATG
+TTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTC
+TCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTG
+ATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAG
+GTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCAT
+ATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATG
+CCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCAT
+CGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGG
+CAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTG
+GTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACG
+CTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTT
+CCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTA
+GTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTT
+GTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGTA
+TTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGCTAACC
+CTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAA
+TATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCC
+ACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCC
+ATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTG
+ATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCC
+GTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTT
+TCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGG
+TTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGT
+AACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCC
+GGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAG
+TGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGC
+TCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCG
+GCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCC
+CCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTG
+>ds2020-328_3
+TTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTT
+CGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTC
+CCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCC
+TTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAA
+TTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCC
+TATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCT
+TTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAAT
+TTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCC
+CTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCT
+TTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGC
+CATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTC
+AAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATAT
+TTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGG
+GTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTG
+ACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTT
+GTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGC
+TCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTAT
+GTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTAT
+TTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCT
+TGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGC
+AAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAA
+CTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGC
+ACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGT
+GCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTG
+ACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCT
+TGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATC
+TTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTT
+CTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTT
+GAGTATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGC
+TAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTT
+TAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCC
+ATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTC
+ATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTAT
+GACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTT
+TTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTT
+TAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCG
+CTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTG
+GATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCC
+CCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAG
+GGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGT
+AGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGT
+TGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTG
+AAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCAT
+AAAAAAGGG
+>ds2020-328_4
+CTGAAGTGCGGGGGCGGGATAGACGGGAAAGAGGAATAGAAAGGGGGGGGGACAGGTTGG
+TTCGAGGACTCGTTGGTCAAAGGAAAGATGGAAACAGGGGAGTTGGCTGATAAAGATGGA
+CAGTAACGATCGCGTAATATCAATTTATCGGCCTCGTCATTGAAAGCGGCTTCCAATTGC
+TCGGAAATTCTAAGCTATATGGGGGGCTTGGATGGTGAGCAAAAACAATTGATCAAGAAG
+TTGGTCAACTTTCGCATGAAAGAAGGTAAAAGAACGAGAGTTCGTGCTATTGTTTATCAA
+ACTTTTCATCGCCTAGCTCAAACCGAACGCGATGTAATCAAACTTATGGTTGACGCCGTA
+GAGAATATAAAGCCCATATGCGAAGTGGAAAAGGTAGGAGTAGCAGGTACTATTTATGAT
+GTCCCTGGGATTGTAGCCAGGGATCGTCAACAAACCTTAGCTATTCGTTGGATCCTTGAA
+GCAGCTTTCAAACGACGTATAAGCTACAGGATAAGCTTAGAGAAATGTTCATTTGCTGAG
+ATACTGGATGCTTACCGAAAGAGGGGAATTGCACGTAAGAAAAGAGAGAATCTTCATAGA
+CTGGCTTCCACCAATCGAAGTTTCGCGCATTTCAGATGGTGGTAAAGTGAGACCACATAA
+AGAGCTCTTCCTCATTCAGTCTGATTATTCAGTAAGATATGGTTTGACCCTTTTTCTTTT
+TGTTTGAATCTTCATATAGAAAGCCGGCCTTCCTCATACTCCTCCCTTCATTCATTGAGT
+TGGAGGAATCCATAGGGGCCCGCCCGTTATGCATTCCATGAAATAACCCTTCTTTGTATG
+ACTTCTCTTTTGCCTCAGGTCGAATGAATCCGAAAGGGAGATCAATCAAAAAAGAGGCCA
+TGAATGAAGAAGTAGTGGGCCTTTCACCCTCTTTCTAGTGACTCGGGGAGCTGATCTGAT
+AAATGCACTTCAAAGGGAGGGAAGCTAGGTTTCCCATGTTGGTATGGCCGGGCATAAAAG
+ATTTTGAAGTTAGGTCAAAAAGAAGAGGTAGAGAGAGAGAACAGAACGGAACCGATAGCC
+CCGAATTATGTCAGGGCAAGAGAAAGAAAAGAAAAGTAAGGACTCTCGTTTTCCGCATAC
+GCATATAGGCTGTGAAAAAGAAGTCCACTTTTCCAATAGAGAAAGAGAGTGATTCGTCTA
+CTTTGTTAATAAGGTAACGGAACGAACTTCAAGTACTTCGTAGGACGCCGCCGTTTGCTA
+AGATGTGCTTCCACATCGTGAGCTTTAGTGCACAAGTCGTCGAATCCCTTAAAGGTTTGG
+GGCAGGGGACGACAAGTCGTGCCTGAAGTTGTTCATGCACATCTTGAGGAGCTCTTGCGG
+AGTAAACTTCTGGGGACAGGCAAAAGTAGGGGCTCGCCACCTTGCAATGAACTCCGTGAC
+AGGTTCATGCTTGGTCTTGAGTTGTTCGGGCACTCCAACCCTTCTTTGTGTGTTGCTGAA
+CTGCTTCCTGAACTCCGAGACCCTTGCTTCCCAAGTCGGGATCGACTCTTCAGAGAGGTG
+GGCGTACCGTGTAAAGGCGGGCCCCTCCAATGATTGTACGAAAAGCCTAAGGCACAGTGC
+CCCATTCTGCGCTACCGGCCCACATCTTACCAGGAAATGCGCTAGATGCTGGTGCGGGTC
+TCCCCGTTCCGTCGAACTTTAGTCTGGCTGAGAGAACCCTGGCGTATACGGCACGGAATC
+TATCCAAGCCGGATAAGGTTTGGTGATCATGTGGTTATCCTCCTCCTTTTCCTTGGCCTC
+TTTTACTCTTTTCTTGACCAACTGATTCATTGTTGCGAGGAGGGTTGTCAAGCTTGTATA
+AAAAAAGACGTATAATAAATCGTTGATTGCTATTCTTGAACCTCTTCACCATGCTAATAA
+GATTCAGGAATTCTCCAACAGAATGGGTTTCCACTTTTCATTGGCAAATCAAGAGGCAGA
+TGATAAAATATGGCTCTGTTGGAATCATGAAGTGAATGTAGTGCTTGTCGACGCGTTTGA
+ACAGTGTATCACAGTCGACCTTAATTCTGATCTGGTAAGGCTTACCATTGTTTATGCAAA
+GTGCTCCATTCAGGAGAGACGGCTTCTTTGGGAAAAACTTCAATTACTGTCCTAAGACAT
+ACAAGGTCCATGGATGGTTGCGGGTGATTTTAACGCAATTTCATATGTGTCTGAAAAACT
+TGGTGGCAGACCTCCAAATCTTTATCTTTAGAGGAATTCAAATGAAAAATTCACGGACTC
+GCCATTTCTGTGAGAGATCCGATCCCAGTTGGTTTCAACTTTTTCTTCCCTCTCAATTCC
+ATCCATATCCCGCCTTCAATCTGAATGATCTGGAATTCATTTCCAATTCCTTATATCAAC
+TAATGGGGATACCGGGAGGGAGGAGAGAAAGCACCCCGCTAACTTTTTCTTTCTTCTACC
+AATGATCAGTAGATTGAGCACTAACGGAATATCGAGAAAGAAAGAGCGGAGCAACTAAAT
+CAAAAAAGTGCGTCTATCCCGACCA
+>ds2020-328_5
+GGTCGGGATAGACGAAAATCGCCTGTCAAAAAAGGAAACGAACGAACAGCTTTTGCGCGC
+GGAATAGGGAGAGACCTCTTTTTATAACGACAGCCGACCCCTTCTAGAAAGATTTTTGGG
+TAACCCCCCTGAAAATAAGGAAATGGATGTCGATTAACCCCACTTGGAGAAAAAGGGAGG
+CCAACGCAAGAGTCACCCACTCCGTGTGTGAATGGGCGAGGATAAGGCAGCCAATCAGGC
+TAAAATAAATGACGTGCACCTTATCCTTTGCCTCAAGAATGAGGTGGTTCAAATTTGCCG
+CAGCTTGTGAGCCCCCTGCTTCGTCTATCCCGACCNNNNNNNNNNGTGGAGGGAAAAAGA
+ATACAAGTGATCCTTACCTTTTTTCGCAATATAGAGAAAGAAAATGGCGCAAGCGCCCGA
+GAGGGGGAACAGCTGGTACTTTATTATTATGATAAAGTCTTGTGGGGCCAAAAAGATGCC
+TAGGGAGGCCAAGAGACTGACGACGCAAAGATAGAGAATGGCTAAATAAAGGGAGAAGGC
+CGGATGGATGCGAAGTCCCTCTTTCCAGAGAAAAAGGAAAAAGATTTGAATTAATAGGGC
+GATTCCCCCTTCGAAGGCGAAACACCGCCCTATTAATAATAATAGGAAGACCCAATCCCT
+CGGTAAGAGGAGAAGGGTTATCAACGCCGCAATGGGGTAAAGAGGGTCTGTAAGTAGAAA
+GCCGAAAAGGCTACTACTCAAAAAAGATGTAAAACTCAATTTACGTTGGAAGGGAGTCGT
+CGCCATAGTGGCGTAGAAAATACCCGAGCTTCCGCCCAGGACTTGTATTACTTGGATTAT
+TTTTTCCCATGGCAAAGGGGCCAAAAGGACCTTTATTGTATAAATAATAATTACAAAACA
+GATAATAATAATATCATCTGTATCATGGAAAAAATCCGTCAATAAATGACGAACCCCATT
+ACACAGATGATAGGACAGGGCTAAGGCTGCGATCTCGACAGAGATGGGGATTAACTTTGA
+TGAATAAAAGAGGAATTGGTAGAAATTCTCATGGTGCCCGCTATTCAGTGATGGTGAGCT
+GGTCAAGTAAGGAGAATCGGAATAATCGAGCTAATCGGTATCAGTCTTGGAGCAGGGTAG
+CGGATCAAAAAGTACCCCAAAAGAGTAGCAATAAGGTACCTATTACTCCATTCGTCAAAG
+CACGCTGAACACCGGCTCTTGATCCAGGGGTTTTTCATGTAAGTGGCTTAGAGTGAGATT
+CTTGTGACCGACCACCTCACTCCGGAATAGAGATTCTCAATAAAGTAAGAAAGAGAAAGA
+AGGAATACTAAGAGATTGAAGGCTTTTAGATTCAAGAAAGAATGCGAAGAGGACGCTAAG
+CAGGATGCAGAGAGCAAGCTTGGCTTATCCGTATCCGTCTTTTCCTCGGTTTTACTTTTT
+ATCTTTCTTAATGGAAGGCAAGGTACAGGTACTCTCAAGTGCGCGAGAGGAAAGCGAGCT
+TGATAGAAAAAGTCGCGTTTAAGCCGCTTGATATGAGTCAAAGAGCAATAAGCATTTCTT
+CTTGGTGAAGGGGCAAATTGATAAAGAAAGTTGTTTAAGCCCTTTGCTTTGAGAAAGGTA
+GGTAAGCCCCTTGATCGATCGTTTAAGGCGAGGGATCAGATCGGTGTGCCACAGAATATT
+ATTGTATTCTACCTTGGGATATTTTTTCCTGACCAATTGCCAAGCTGATTTGAACGAGAA
+ATCCCCTTCCGTAGATAACGTCCATACCACCCTGTCAGGCAAAGGTACTGGGGAAAGATC
+CAATGCCCTAATCTCCTGCCATATGTCCTCCAGAAAAAAATTTATGGCTGTAGGAAGAAC
+CCACCTCTGATTACCAATAAGGTCCGAAACGCGGTTCTGGCCTACGAGAGAAATTAACTT
+TACATACTGATATCGCATACCGAAGGGAAGGCCTAATTGCACCACTCCTCCTTATCTTCC
+GCCTGCCGTCTCCCTCCTCTTTGCTTTGCTAGCATCCTTTGATAAGCAAGTTGAATGAGC
+CTTCAAAAAGAACCCACCCATATATGTACCCCTTTAGGCTCTCCGAGCAAGCAAGTGAGT
+GAGCTAGTAAGCAAGCCAAAGATACCAATCCGCTGTTTTGGATTCCCGTAGGAGTTAGCG
+ATAGAAGTTGTGTCGTAAGTCCTGCCCCTTGGGGCAGAACCGCCAGCGATTTGCTTCCAT
+CAATGACAGCCGTCTTGTACTGATCCGCTTATCTTTTGATTGACGATCAAGTAGCTTTCG
+CCTAGTCTCATACACCCTCAGAATGGTTACTGGACAAGTTTGGTCCTTTGCTGATACAGA
+AATAGGGCAGCTCACCTGTTATAACACTTCGGCCCTAGCGTGGTCTTTCCACGGATAAAA
+CCTGTTCTGTATCAAGGACCCGGAACGAACGTCTATCCCGACC
+>ds2020-328_6
+AACACCAAGAAGTATCCATTCTTAACACAATGAAACCGCCGGCTTTTTAAAAATATTTCC
+TCTTCAATTATGCACGATTTACTGTACTGGGGTTGTCTTCCTTTCTTGGGAGTAAAGTGA
+GGAGTCAATGAAGGTTTGCTTGTGGTTTTAATTGATAGGTGTTTGCAATGGGCTTTCGTC
+TCAGGCTCAGGTAGTTCAGTCTCCGGTGAAGTAGGGTTAGATCAGTCTCAGGGTCCGAAG
+GAGATAGAGTTATGGCATTTCTAGGGTTCGAAGACGGTACTATTGATTTCATCAATACCA
+AGCGGGACTTGCTTAATGGGACATTCGAGAAGGAGCTGGACAGAGGAATTCGATCTTCAG
+CTAAAGGTACTTGAGGGTAAGGAAAGCCGTATAGTGAGTCAAGCTCAATTGTAGTTCCCT
+TTCCCCTATATGTGCGATTAGATTACCTTTCTCATTTGCTTAGTCCCGCTCCGTCTGTCC
+TTTCTTCCGTCTCTATGTCTATTTCTCAATAGGCAGTGAATGAACAACTTCTTATATAAG
+GATTTCTCGTAAGCGAAGAAACTTCTTTTCTAACTGGGTGTGTTCGTCTATCCCGACCNN
+NNNNNNNNGGTCGGGATAGACGCGTATTATGGGTGAGGGTACGACACTACAAGGCAACGA
+AGTTAAGAATAAGTTCTTCTGGTAATCAAGGAGCAGCCAAAGGAAGGTACTCTCGGGAAA
+ATCCATGTGAATAAGGAATGAGATCCGCGGAAGGGAGGAATTTAATCTTCTTCTTGAAAG
+CTGAAGGAAGTGTAAACTGTTCGAACGGCCGGTACTTAGCAACGGAAGTAGGAGGAGATC
+GAGCTAATCAGTCTATGTTGCTCCCGCTCAGGAAAGAAGACAGGGGCAAGTCGATGAAAG
+TCAGGTTTTTAACCGATTCAGGATCAACTTCGAATCCAATAGAAGGACTTCTAGGTTCAG
+ACAAGGTTGCTCTGCTTCGCAACCAGTGTTTCAAGTGCCAATCCCAAGCTCTCCAACGGC
+AGCATTCCAAGCAACCCTAACCAGCAGCAAAGCGCTTCCTCGAAGGCAAAGTAAGCACCG
+TAGATAGACATAATGTAACCAATCAAAGGTGCACCGCGTCTACCCCGACCNNNNNNNNNN
+ATGGGTTCAACTATTTCTTCTACGTACAGGATTCTATCCCTTCAAACCTGCCAGTGCTCA
+AGTCAAGTAGAAATAGGGTGGTTAGGGAGGGTCGATCCATCAACGGATCCAACAACAGAT
+CAATCCTCAAGTAATCCACGGAGAAATAAAATAGTATATGACTAAGATCTGTCTTTTGAT
+GCGGGAAAATGAGGCAAAGAAGTCAGTGCAGGCTCTTATGATTAGTAAGAGGAAGGTAAG
+TTTACGCTCTTACGACCGGAAGCGAAAGATGACTTGACCTTTAGACTTTATCAGAGGAAT
+TATTATCGCTTAGCGCTTGCGCGGAGGAAGGAAAACGAAAGCTCCGAGGAAGACAGAGTA
+ATTCGATCTTTTGGGAATGGGGGATTCAGGTAAGAGTTCATTCCGGCATAACTTGGCGCA
+AGGAATTTGCTCGTTCCGAGCGAGGTTCGACGTTAGTTGAAGTTGACATTGAGTCGCGCA
+CTTCCTGGAGTGGGGAGTGAATTCATGCGTACCTCAACGCAAGGATTGAATTAGCTCATC
+TCGAGTTACGTGAGTGAACTTTCGCTTCTTCTTACTTTGGTCGATCAGTCAACCTCCCCT
+TTATCAGTCTTAAGCGAACTCTTTCCCGACTGGCATCTTAGAATAAAGGAATATAAACTC
+TTCCAGATCCGGAATTTGCAACATCAAGAATAGAAGTAGAAGCATGCTATGCTAGCATAG
+AATAGAAGTCCCGAGTGAAAACGACTTTCCTTAGGATGAGCTTTTAGGGCACAGTAGAAA
+GAGCTTATTCGTCGATAACAAGCCTTTCTTCATATCATAAAGGAATAGAACCGGAAAGCT
+TTGATGCGAGAAAAGTAAGTCCATCCGCACTAGGTCCACGGATGAGTTCGACTACTAGGT
+CCACGGCNNNNNNNNNNACCCAATGCAAGACAGAGGGATCCTATAATAAGACTGACTCCT
+TCTATTCTCTTCACTTACACCTTACACTTCCGCTGAGTCTAACGAGGCTCAGGTGCGGAG
+CCTTCCACTGTGGACCGAGACTACACAAAGGTAGAACACTATAGAAACTTCGCTGACTTT
+ATCATAAACCTCGATTTCGCTACGCTCAATAAGAACCCGGAATAGCGGAAATAGGTTCGT
+GTTCCGCTTCCAAAGTAAGTCGTCTTTGCCCAAGTGTGAACCGCAGGCGAC
+>ds2020-328_7
+GGTCGGGATAGACGTCACCACATCCTCCTTAAAGGGGCATCCTCACCTTACGGTGAGGGC
+ATCTACAAATTTGTAGGCAATAAAAAGTGTCATCCATTCAGGATACAATGGGCATTTTTA
+TCTTAACTTTTAACGCACGCAGTGCAAGTTAACCAAAAGGATTTAACATTCAGTGACAAA
+ATCTGAATGGTGGATTCTATTGCAAAAGCAGCATCTCCAGCTACGAATATTCCTAGGAAT
+ACTCATAGTGGAGGTACAATCAAACAACGGATCATATAGTCATCCACTGACTATTTTATC
+CATTGCATCCATGAGAGCGGTATCCCGTTCAGCGTATAACACTGAATCAGGGATCTCGAC
+TCTCTTGGGCATCGAGTGTTGTAGGTACTGAGTACAGAACCATACCGGAACGCCGGGCTG
+AAAAGCATTGTCATATTTTATGACAAACCAGAGATCATCTGGTATATCCCCGACGGTCAT
+ACCAGTAGGAGCAAGAATTTGCACCCCACTGGCTTGTTTCGCTGTGAACTTCCTACGTTG
+TAGGGGATTAGGCGCCACTGGCGCATTCACATCGAAACCTTTAATGAGTCCGTAGACACC
+ATTAGAAACATCAAGGCAGTAACGAAAAACAATTCCGTATACCTTGGTATCAGCAGAAAA
+GTCCTTGAAAAGTTCTCGGACTTTCATGGTGTAGTAAACACCGGAAGCGGTCGAATTGAC
+CGTCAAATTCTCGGTACGAGATATCATACCGGAAAAATTTTTTACGGGCACATTTGGCCC
+GTGAAGCATCCACTCGGAAACAGACTTCGAGCTTCCACCCGGGAATTGTTTCTTAACAAA
+ACCAGCAGGGGGGGTAGTATTATTATTCTTCCGAGCTAAAGCAAAGCTTTGTGATCGGGT
+AGTAGGCTTTCCAGATTTAGTGGCTTTCCCAGACATTATGAGAGTATAAACAAACGAGAA
+TTGGAAGAAATTGGTAAACAAAACGAGCTATTAACTCACAAAGTGAGTTAACCAATCGTT
+ACACCAAAAGCTTCCTTGTCGGACTTCTCTTTTTTTAGAGGAACAGACTCGGCTTCCTTG
+AAACTGTCAAGGGAAGATTTACCCTTTACGGGTACAGCAATATTCTTAAAATCCACTGTT
+AAAGCCTTCTTTGACTCGTCAGACTTAATTTCAATAAGTCTGGGATTGATATCAACCTTT
+CCACTACTCCCAATTACCAAACGTGATTTGGCGAATGTTTGGAGTATCTTTACATTGTCC
+ACAGCAGCAAGGGCTTCCGATTTCTCAATCGGGAATCTCAAAGTTGGGTACATTTTCTCA
+TATGGTTTCTTCTTGTGCAATGAGTCATCCCAGAAGGGGTAAACAGTTCCAACAATCGAC
+GCGTGTTTAGCGTCTACACTTACAGCTGATGCTAGTAAACATATACCATCTCCGTCATCA
+GCATGAACTGCTCTTGGCCATCTCGCTACGAAAATAGCCGCTTCATTCAATGGTGAATCT
+GTATCTATATCAATAGATTCACCTGTATTCACATTGAAAAGTTTCAATGTCAATACCCCA
+CTAGTTGTTTCCAGAATGGTCGGAATGTACAACAAGTAAATTATACTATGATGCACGTAC
+ACATGACCTTTTGCTTTAGCGGATAATCTTGCCAAAGCGCTTCGGGATTCTTTGGATTGC
+AACTTCATGGGTTGAATTGGAACACCATTCTTCAACTGTAAAGAAAAACATTTCTTAGTT
+GGAAGATTCTTCATCATAGTTTGGGAATAAAAGTCATCCACTTCGCTGAGTATTGTATTC
+CAATCTTCAGCGGAAACTTCAAATGCCGAACTGGTACTGGCTTCGGACGTCTGTCCGGTA
+ATGGTCCTGGATACACCAGAGAAAGCCATATTCAATTCAGGAGATAAATCTACAACCGAA
+TTGTTTCACTCAATAAAATAAAGAGGTTAATGAATAGGAACAAGTCCGATTAGTGAGATA
+AATCTCAAACGTCACAAACTTGTCTTCTTCACACTTTGCAAGAAACCTTGCAGTAACTCA
+ATTTCTTGAGGGTTTATAGAGAACCGCACGTCTGTCAACTTCCACAGCTTAGCACAACCA
+CGCGTCTATCCCGCCC
+>ds2020-328_8
+GGGCGGGATAGACGCTAAGACGTCATGGAGATCTTGGTCTAGATCCGGTGGTTCGCAGAA
+TTCGGGACCTAACGATGTTCGGTTCGTCACATGAACGGGAGCGGACGATTCCCTCGTCTC
+TCCCTTTTCGGGGAATGGCTGCAATCACAAGCAAGTTATTGAATGGGTGGGGGGCTCCGA
+AAGCACATGCGGGATAAGCAGGTGTTTCAGGAGACGGTCTAAAAATGGGCCCGGTCTAGA
+ATAGAAAGAAAAGAGAACTCTCAACAAGCTGAAACTAATCAAGATCAATAGGAAGGCTAG
+TAATTTATTGACAAAGTTCATGCGACGACGATCTATATGGAAGGGCTGTTTTGTTGATGC
+ATTCCTGTTGAGAAAGTGTTTTTTTTATTCTCCAACTCCGGATGAGTTTGAGGCCTCCGG
+CGCCTTTTTTGAAGACTTTTTGTTGCGCCCCTATCTCTAAAGGGCGAGGGTGGCGGCCTT
+GATTTGGTGCCCCTCCAAGATCCCCCCGGTAAACTCGGGCTCGGGGGGCCTTTGCCTTCA
+TTTCTTGAAGAGCACGAGGTCACCTCTTCATCAATAGAAAGGAACGTCAGAAAAAAATGT
+TGTGAACTCCCCCCGGAATCCAAGAAAAAATAGCGGTAAGTCATGAGAGGGCGGCTTTCT
+TGTGGTAGTAATTTCGAACTAATTATATTTTTGGAGGATTCGTCCCCTATTCCTGCGGCT
+GAGAAGCCTCAAGCTCCGCCACCCTTACTCTCTCTCTATAAAAAAGCCCTTTCCCCTTAG
+TGCAAGTACTAAGTAAGCAAGCTACCTCTCCCTACCTTTGGTCGAGCAAGTAAACTACCT
+TTTCATAATAATAAGGCAAGCTCCAGAACCGGCGGAATTGCCCAATCCTATCTTTCCTTG
+AAGTAAGTCCGGAGCGGGAGCAACTTCTACAGCTAATTCAGACTAAACTCGATCACTTGG
+CAGGGGGGTCTTTTTGAGCGCATGTTTCTCATATCGATAAAGCAGGTTTCGTCTCATTTT
+CCGGAAAGCCTGTCATACTATTCCACTTTAGCTAAGCTAATGATGAAACAGGATCTGGAT
+TTGTCTGCAGATGATGATGTCCACTCCTGGCTCGAAGCGCTTAACGAAAGGGAACTCTCT
+AGATTAAGAAAGAATTTCCTTCATAATTAAGCAGCATCCTTTAAGTGAGTAGGGGTGCGC
+CGGACCGCCGACGAATAATAGGTACCCCACCTATCGTTGTGAAATAAGAGCACTCGATCG
+AAGACAATGTCAATTGGCCAAGCCATAAGCAAAGCAAGGAAGAGGCATCCAGTCCAATCT
+GCTCTTAATGTTCGAGTAGCCGGTGCCGCTTTTTATGGTCTTTTCCACGTAACCGCAGTT
+GGTTTTATATCCATTGTTCAAATAGCCGTAAGCGGTGGTTCAGGAAATGTTTTAGAATCG
+GTTGTTACAGAATACGCTGTGGGACGTCGAGGAAGAGCAGTGGGCCCCAGGTGCGGAGGT
+CTCGTTTGCAAGTGGAATCCGAAGGGGTTGTGCACAGTTAAGAAGAAGAAGTTGTTTTCA
+ATTTCATAAGACCTATGAAGGTACGAATGGGATTGAAGGACAGATGATCTTCCTTTTCTA
+AAGATAAAGAATCCCTGATCTGACTCAATAGGAACTACACTGAAACCTTTTCTGGTATGG
+TGGAGCTGAGACCACAGGTAATCGTCTTTTGATGCTTAAATTTAAATATAGGGAGTTTCA
+GAGAGAAGAGAGAGAGGGAGGGGAAGGTCAAAAGAGTCTACCTCGATTTACGGTTAATGC
+AAAACTGAGTTAGAATTCGGTCTCTTAAGACAGAAATCCCCTTAAACTGTCTCAGATAGC
+CCGATTTTTTCTTGGAGGACCTCTTTTTGTTATTTATTATGATTACTTT
+>ds2020-328_9
+GGTCGGGATAGACGCTGGGTGGGTTTGTTTATCCTTCCAGTTTCGAGTGTCTTCTCGGAT
+AGTTATAGCGGCCCATAGGCGCAAGATGTACCTTGTGGGGGGGCGGCGGTCCCCTGGACA
+TAGTCCTTTCAGGCAGTGGCCGTTTAGTCCATGGTCCATTGGATGGTCGGTGCAAGGCCA
+GAAATTGGAACACATTGATTCCGCTCGTTCCCGTCCTTCGCTTCAGGGCCTGCCCCTCGG
+TTTGGTCAGTACTCCATACTGTCGGGCAGCGAAGCTTACACTTGTTCACTAATTATGACG
+GTTCGCCAGGGCCTCTTTCCTCCTCCCTTTTCTGCTCACTCGTAGGGGTCCGGACCCCCA
+CAAAGGGGAAGGGAGTCGACTGAACATCTCAGCCATTGGCGGGAATTTCGCCCGCATCCG
+ATCCCCAATTCTTGTTCACCCCGGATGATCGTGTTGGGTGAATTGTGACCTCGTACGATC
+GTGTCGGGTGAGCAACAGCCGCTTCGTCACAGTACTTACTTATGGGCTAACGGGTCACAC
+TTTGGCCAAGTATCCTACAAAGAGACTCCCGAGAGCCAGAAGTATTGAAGGAATGGCCAT
+AGGAATGGGCGCATCATGACATCGTAAGATGTCTCGCCCGAATGAATTAGTTGGTACTAG
+AAATGTTAAAAAAAGTAAACGAAAAGAGTAATAAGAAGTGAAAAGGACAGAGACACTTCC
+CAACCAGAAAGCAAAGTTCCCACTGATGGTATACTTAGTGTAAGCGAGCTCTAAGATCAC
+ATCTTTGGAATAAAATCCAGTTAGAAAAGGAAATCCTATTAGAGATAAGCTGCCCATGAG
+CATCATGGCATAGGTAAAAGGGAACGAGGAGGCAAGCCCCCCCATCTTCCGCATATCTTG
+CTCATCCGACATGGCATGAATCACCGAACCTGCACTCAGGAATAGTAATGCTTTGAAAAA
+CGCGTGATTCATTAAGTGAAAGACGCTAACCGAATAGTTAGAGATGCCGCAAGCAAAGAT
+CATATAGCCTAATTGACTGCAAGTTGAATAAGCTATGACCCTCTTTAGATCGTTCTGTAA
+TATTCCAGTGGTTGCCGCTAGGAATGACGTCGTAGCTCCTGCAGAAGTAATAACAATCAA
+AGCCGTAGGTGGGTATTCAAATAAAGGGGAGCACCTTGCTATCATGAAAACGCCAGCTGT
+TACCATAGTAGCTGCATGAATCGAAGCGGATACTGGAGTGGGACCCTCCATAGCATCGGG
+TGACCAAGTATGCAATCCTATCTGTGCCGATTTCCCAACAGCACCAATAAAAAGTAAAAT
+ACAAATAAGAGTTATGGCATTAAATCTCATATTGCAAGAAATCCAAGAATTTCTGGGGGC
+ACTAGCACGAGCAAAAATGGTTGAAAAGTCTACTGTTTGAAAGAGAGTAAAACGGCCCGA
+AATCCCAGGAGCTAATCCAAAATCACCTACGCCCGTCTATCCCGACC
+>ds2020-328_10
+GGTCGGGATAGACGTCTTCTCTTCGTCTACCGCAAATAGAATAGCCTCGCCCGGGAAATT
+AGTCCCCTTACTAAAAAAATCAAGCTTATAGTCAGGCACGGGATGGGATGATCCGCAGGT
+GGTCTGCTATTGCCTGCCTCTTGCCTTTCTCATTTAGGGCTTCCGGGTGACGTACACAAT
+ATAGAACTCTGAGAGTAACATCTGCCACCTTGCTGTACGGCCCGTGAGGGCTGGCTTTTC
+AAAGAGATACTTCAGCGGGTCCACCCTTGCAATCAGCATGGTCGTATAGTTCAACATGTA
+GTGGCGTAGGCGTTGCGAGGCCCGTGTAAGAGCACAACAGGTCTTTTCTAGAACCGTATA
+CCTTGTCTCATAATCAGTGAACTTCTTGCTGAGATAGTATACGGCTCTTTCCTTCCTACC
+CGTTTCATCGTGCTGACCAAGGACACAACTCATGGATGCTTCCATTACTGACAGATACAT
+CAGGAGAGGTCGACAGGCGTTGGCGGTGCCTGGATGGGAGGATTGAGTAGATATTTCTTA
+ACTTTGTCAAACGCCTTTTGGCAATCCTCGTTCCTTGTGTCTATCTTTTCTGAAAGGCGG
+GGTATTCTTTCTGAGCAGTTTAAAGATCGGCTCACAGATGGGTGTGAGCTGGGCAATGAA
+CCTGCTGATGTATTGTAGCCTGCCCCAAAAAGCCCTGATTTCTTTCTCTGTCTTTGGTAC
+CGGCATGTCGATAATTGCTTTGCCTTTTGCAGGTCGACTTCGATTTCTCTTTTGCTGACA
+ATGAACCCGAGTAGCTTACCTGACAAAGCACCAAACCCCCCTCCCGGCTTTCTTTTTCGG
+ATGAAGACGAAGACTGTATTTCCGAAATCTGTCAAACACTTTCTTCAAATTCACCGTCTT
+CTTAAGCCCAAGACTTGGCGATCATGTCATCGACATAGACCTCCATTTCCTTGTGAATCA
+TATCATGAAACAGCGCAGTCATGGCTCGCTGGTACGTCGCCCCGGTATTCTTTAGACCAA
+ACGGCATCACCTTGTAACAGAACGTGCCCTCCTATCCGATATTGTGATAAACGCTCTGTC
+TTCCTCGGCCATCTTGATCTGGTTATATCAAGAGAAAGCATCCATAAAGGACAGCATCCC
+ATGTCCAGCGGTGTTGTCCACCAGAACATCGATGTGAGGAAGAGGAAAAAAAGATTTTCG
+GCTTGCCTTGTTTAGGGTCTTTTGACTCACGGAACCAGCTTTCTGAGGGAAAAACCGTTC
+TCGAAAAGCGTGACCATCCAGTTGAATCTCGTTACCCTCCCGTGTGGTTATGGGGGCGCG
+CCCACTTTCCACTATTATGGAGCCGGGCCGCAAGCAAGTGAATGTGACCCCGCCCTCCAT
+CAGCCGTTGTGTGTGAGCTTCGCTCCTTATAACTCTCCACCGTCTATCCCGACC
+>ds2020-328_11
+GGTCGGGATAGACGTTGTGGTCTGATTGTTTTTGTCTGGGTTGGGAAGCTCCCCCTTGTT
+AAAAGAGTCCTCTATCTGCACACTAACCTGGGAGACTTTCACCCTGTTTTTCTGCTTCTA
+AGCCGCTTTGAATTGGCCTGTGCCCGTTGATGAATCATCAATCCATTCAGCCGTCACGTC
+AGCCGAGAAGACGGACTTGCTGGTATCGTCAAATAGAGTATAGAAGGCTTCTTCCGCTCT
+AGTGGCGGGTTTATCTTTTCATTAAGTAGCCCCTCACCTCGTACACTGAGTCAAGCGACT
+TCTCCTTTTCTGTCATGAAGAGGAAGTGAGATGATGACAATGCGGCTGGGAAAAATCCAT
+ATCAATCCATTTCTTCTATATATAAGAGAATTGGATCCCGACCCAGACCTAATAAATTTA
+ATTATATGCTGATTTCATTCCACTAGTACCCGTAGCTTCTTTTGTTGGGTTGGTTGGAGT
+GCTTTAATCAAACACTTGACCGAGTAGATCATGTTGGGATCTTCACCATGAATGATCCTC
+CGGGCGAACATCTCATGGCACACCATTGATCAATAAGACAGGATAAATAGAATATACGGG
+GATAACCCCCATTCCTATCAGCGTGAAATGAAATTCATTCAATCAGTCCTCTCCTCCGCT
+CTCTCTGTCCCTGGCTTCTACTTTAACATACATACCTTCTGGCCTCAGTCGTTGACTTTG
+ACCCTTCCGCTCCTCCATTTAACAAGCAATTTCATTTAGTGGTTGTTCGCTCCTGAACGA
+AGCTATTGGGACAGCGGCTTTGATAGCGCTTTCTCAATGAGATAAATCATATCGTGGTAG
+AGCTCCTATCTGTGCTTTGACAAATCCCTCTCTGGCGTCATCTACTGGCTGACTGCACAC
+TGCCTTCTGCCTGACTATGGCTTTTATTAGAAAGCAAGATCCCTCCGTTTATCACTCTAT
+AGAAAGAACATCCCATACAGAGTCTTTCAACTAAGCTATTCGAGCCTTCACCTAAGCTCT
+CATCGATAGACCCCCTTTCTTTTTGGTTGTAGTCAGACACCTAACCGTTCAACCTCGTAG
+GCATCTTTCTATTAACCAAATCTGATACCGTCAGGTACGGAATGAAATAAAAGGACTTCT
+TCGGCCCCTGCGCCTAGTGGTGCTTTCGGCTTGAAAAACCACGTGAGTGCTCTTATTGGA
+CCAGAGCTTTGGCTACTCCCTGTTGTCTTTGAAAGAAATTTACTGAAACCTGATGCGCAG
+AACCCTTCGTACAAAAATGAAAGATCAATCTCAGGCCCAATTGACTCATCTTAGAAAGGA
+TTTGATGAGCCAGTAAGCTGAGCTATCAATGCCCAACTATCGTCTATCCCGACC
+>ds2020-328_12
+ACCGGCGTCATTTCCATCACTTGATCCGGTTTCTTAGGAAAAGCCATAGTTATGCTGCCG
+AAGTCAGCCATCGTTTGCGGAGATCCTCCTGGGTGTACCAACGCTGAGCTTACGCTTTCT
+CTCCCCACTTCGGTAGCTCGCTGCATCGCCATCTCCCTGTTGGCCATAACAGTCCTTATG
+CTGCTTCCTGACTTCTCCTGAGACATTTCTTCGCCTTCGTCTTCTTCATCGCTTGCATCT
+TCTACCAACACTCGTTCCATTTCTCTTGGCTCCGTATGCTTCTTATCTCCATCTTCAACT
+TTCGTCTTCTGGGCTTCGTTCTCCTGCTTTTCTTCCACTTGCTTCCCTTCTCTAGACTTG
+TCGCGCTTCTCGCCCTCTTCTTCAAGGCTCGGGTTTTCTTCTGCTGCGTCTCGATTCCTT
+TCCCCTGCTGTTTTCCTGTCTACATCGCTTTCGCGGCTTTCATCTCTTACGTCATCTTTA
+TCCTTCACCACTTCAGCATATGTGGGTTTGCTTGATTCGACACTTCTATTCGTTCCAGAA
+TCCCTCGACTGCTCTTTGGGCTCTCCGTCGTTTCCTTCGCATGTCGGCTCATTCTCTTCC
+GCGCCCATCTCACTCACCGCTTCATTTTCCACTAATCTAAGCGATGCTTTCTCACGCCTT
+CCTTTAGCCTCTGGCATGCGAGGGTGCTCCTCGGCGTTTTTGAATTTTCTAAACTTATTC
+AACACTCTTTTCCCAGCCAGCTTGGCTCTATCTGCGACCTTCTGGCATTTAATTTCAAAA
+TCAGCAGTCATTTTCTCATCGGCCTTTACTTTATCTCCTACAGAAGATAGCTCCTCGACC
+ATCGCTTCTGCGGTTTTGAAAGAAATATCTCCGACGTTAGCGCTCTCCAGAAGCTTCGTC
+ATGCAATTCATTGACATCTTCGTTACAAATGCGCTATCTTCATCTTCTGTACTCCATAAA
+TTAGATGAATTACGGCGGTCGGGATAGACGAAAGCGGGCCATCGCATTAGTGTCCGTTAT
+ATTCGCTAAACCTGCTTCAGTTATGAACTTACCTATGTGCGCTTCACACACATCATCTAC
+TAGAGCCATCCTCTCCGTCAAATCTCTGAGTGACGTCATCCCGAGGAGCATGATTAAAGC
+TTCCTCTTCCGGCACTCCAAAAGCCGCCGCCATCACCATCGTCTTGACGTCTTCTTCTTC
+CCATACTATATCTCTGGTTAGATTATACATCAGCCAACCCGAAGGGAAGATCCGCCTCGA
+TCTGAACCTACCTCCTCTCATCCCGTTCAAAGCCGACATCAGAGGCATGAACGCGTAAGT
+AACGTCCATCGGCTCCCCTTCCGTTTTCAGCATCTCGTGACGTCTATCCCGACC
+>ds2020-328_13
+GGTCGGGATAGACGACACTTTGCCATGGTTGTTGTGAAAGAAGAAACTCTTGGAGGAAAT
+GCCTTCTTAGCAATTGAATCAACTCCTGGTGATGAAGAAGAAGAAGGAGCTGTGAGGAAG
+GGAATGATTGCACTAGTCCCACACCCACGGACAGAAGGAATAGAATACGCTCTTTGAAGG
+ACGTTAATCAATAGGAGAAGATAGCCACGCACAGAAGTAGCNNNNNNNNNNATCGTAAAC
+GCTCTTCTTCCAATAGGAGTGATTCTTTGCCTTGACGCTGTGAGAGCTTCCGGTCCTTGA
+GTATGAGTACTCCTATCCGCTCTTGGGTTCATAACCGGTCCTATTGAATACGGTCTTCTC
+GGCTTTCCCTTTCCTCCTTGGCTTTGACTCTTTCGATCTCTGGTCTGCCTGTCTGTAACC
+AATGCCTGGATGACTGTCTTGGCTTTCTGTCTCGACTCTCTTCCTTCCTGGTGAAGACTG
+TGGTAGTGGTATCGGTTCTTTGCTTGGTTGATTGAATATCTCTTTCCTTGCCTACCTTAG
+TCTTAATCCGCCTTTAGGGAGTGAAGTGAACCGGGGGTGATCTAATAAGTTGTGAAAGAA
+TCGGTTTAGAACGTATCCGCTGTTTTAGCCATATCCGCTGCGCTCGTCCTTTCTTCCTAG
+ATGCTTTGAATATCCCCGCCATATTCAACAATTTTGCTTTCCAACCGGAGAGTCTTCCTT
+GCACTTTCTCTAAAAAATCTGCATAAGTTCTCCGAGAAACCCTTTCATGAATTAGTGGCA
+CGCCAAGATACTTCCCCGAGTTCTTTGTGACAGGCATCCCTACAATTCACTTTATTTAAC
+ACATCTCGAGAGGTATTCGGAGACACAAATACCTGGGAGTCTTTGGGCATCTCACAGTAA
+TGCAACGATCAAATCTTAATAAGATGTTGACCCGTTTTTCTTTTCTTTGCTGATTCCTCT
+CAATGAAATTTGCCATGTTGCACTAAGTTACTTACGGATGTATGCATGCAATCCGGGAAC
+ACTTTGGGGTGAACACCCATCCGAACAAGTAGGGTCAATAGTTCAGCATTTAGGCCGTAA
+CATTTAGCAAAAAAAATCTTTAACCCAACAAGTGCTCTCCGAACCAAGCTAGATAGTCTC
+CTATCACTAGGCTCACCAACCAACCTGGACTTTGATTTTTATTATTCCTACCGGATACCA
+AAACCATAAGGATTGTTTCCAGCCATGAGTTCCCATATGACATGACATAAGCGCTCTTGG
+GTGGGCTGGGCCATTCCATCAAATCTTTGAGAAGGGGCCCTTGCGTCTATCCCGACC
+>ds2020-328_14
+AACCGAATTACGGCGGTCGGGATAGACGGCGCCCCACCATCTGTTCTCAACGTTTGTAAG
+AGCAACCACTTAAGTGACTCCCTCTTTAAAGCCTAGTCCGTCAGCGACTTACTCCCTCAA
+TAGAGCCTAGTCCGTCAGCGACTTACTCCCTTCGAAGACTGCACCATTTCGGTCTTGAGC
+TCCCACCAGTTTTCTCCCCGAACAAGGTCCCGCACCTTTTGTCCAACATCGTCACCAACT
+CCCTTGCGCATATGCGCTTTTGCCACACCTCATGGCATTTGTGGGTCTCCCCCACTTATC
+TCGTCGACGCACCCTCACGTCAACGTGCCTCTGAAGCTGAGCTCTCTAACACTTTCGGCC
+TTCACAATTCACCAAGGTTCAATGCCATCCCTACTACGAGTAGAACATACTTCCGTAGCA
+TCCCCAAGGGAACAAGCACGACATCCTCCCCCAAGTTACTTCCTCTTTGGCCTTCCACCA
+AGTGCGGACTTAACACGTCCTCAGCCCCCATCTCACACAAAAGACTCCGGGATCAACCTT
+TGGAACACTCCCGCATTCCGCATTTTAGCTAGCAACCTTGTGTCAAACATTGTACTCCAC
+CCACACATTCTCCACAATTGCAAGAGCAACCACTTGAGTGACTCCTTCATTGAAGCCTAG
+TCCGTCAGCAACTTACTCCCTCAATGGAGCCAAGTTCGTCGGCGACTTACTCCCTGTCGA
+AGACTGCACTAATTCGGTCTTCAGCCCCCACAACTCTTCCCTGAACAAGGGTCTTGCACC
+ATCTGCTCAACTTGTTGCCAACAGAGTTTTTCTCAACCTTCACGGCATGCCACGGTTCGA
+GTGCTAGTTCATCTTCAACACTCTCACCAAACTCGCGCTCCCATTCTCCCCACATCCTGA
+ACTAAACAAGCAACATCACTTCGTCGCAAGTCAGAACCCCTGCCTACCCGACTTCCGGGC
+GCTTGGTGCACGGACTAGAAAACTAGGCAACCGAGCAGCACAACCAGCCATCATCCCACA
+TCTTAGAGTCATCCTGCTTGATGTCTTCACAAAACTTCAAGGCAAACTTTTGGCTACCTT
+CACCCTTCCATAGGATCCAGCACCAAGACGGGTTTCCATCAACCGTCACAACCTGATTCC
+AACTATCATCCACAGTGACGTTGGGTTCTTCAACCAACTTTGCAAATCCATTACCCAACA
+CCGTCAACCTGACCGTCTATCCCGACC
+>ds2020-328_15
+GGTCGGGATAGACGAAACTTCGGGCTGGTAAGGTCGGGACCGTGGTCGTCCGTCTCCGGT
+TTGCCGGCCGATAAGATCTCTGAGATTGACCAGCCAGCTGGGTTGGTTTGGCTATTCCTT
+TCTATTGAAAAGGAGTCAGCTGTCTGCGCGAGTCACCTTCTTCTAGGCTCCGCTGGACGA
+CACGGCATTCTCGTTTAAATATAGGCCGGCCGTACTTGTGATGGTTCCCAAGGATCCAAT
+ATGACCACTTAGGTCTACGTTGCCACGATATTGTTCTATGGAAGCGGGCGGGCTGTTAGT
+TAGAAGTTCGGCCCGGTTTTTTTGGTGTCGTAGGGAAGGGATTGACCTTTCTAACGCATA
+TTCAGTCGTACCGGCATGGCCCCACTGATTTGTTTTCGATCGGAGCATCAAGCAACGCAA
+CCCGGTTCTACTTGACTAAGCCCCGTGCTCGTCCAAGGAGGGAGTTTGCTTTACCCAACT
+CCCTTTTTGATAACAAGGCAGAAACCCCCGACCCGACATTCATTAGTTTCAAATGAAGAA
+TGAAGAGTACCCTGCCCCAGAAAGCACCAAATTACGTCTATCCCGACCNNNNNNNNNNGG
+TCGGGATAGACGAATGCGCCTACTCCTATAAAAAAAAAGCGTGACTTTACTAAACAAGCA
+AGAAAAGCCCTTTCTATGTTATTAGTAAAGCGCTAACGAGCAAGAAAACGGATGCGCGTT
+AGCGCAACGGCTTTCGCGCAGCTCAATCCCTTGCTTTGTTCTATAGTTAGGGGCCTTTTC
+AATAAGGCTCGCGTAGGGGCGCTCACGTTTTTTGGCTTCCCTAAAATCTAATTTTAAGTT
+GGTAAAGACCCACCCCTTGTTTCAGTCAGAATGAGTCCCCGGGACCCCGGGACATTGGCT
+TCCGCCAACAGTGGACTATTAAGGATCGCATCCCGCGCATATTCTACATTATAGCCTGCA
+ACTGATTCAGCTTCCGCTTCTGGGAGATCAAACGGAGCTCGATTAGTTTCTGCTAGACGA
+GAAATGAAGAACATAACCAATACAGGGAACAGGGGAATACCGGACCATATCTGCTTTTGC
+GCCATGACAATCTCACTCCAAATGCCCGTCTATCCCGACC
+>ds2020-328_16
+CTACCCGGTTATTTTACCAGACATAGCGGGTTAGTATCCGTAAGCTATAACTCCCGCCCG
+TTGCCAGAGGCCGTTTAGTCCGGTAGACCTTTTAAAGTTGTTTTCTCTGTGTTTTTGTTT
+TTTTTAAAAAATAAACCTCACATACAGCAACTGGTTGCCAGCCGATGTCACTCGGCCGAC
+TACATCCCGTCCCTGTCCAAGGTTTTTAATACTGTGTTTTTGAAATTTGTAGTTTTAAAG
+ACGTTGTTAGGAAGTTGAGGGCTAAGCGCTACTACCTTCCACACTACGTCACGTCCCCCG
+ACTTGCTCTTAACAAGTCAAGCCGACGGACAGTAATCCGTCAACCGTTTAGTGATTCCAA
+TCTACCTTGTCGGGAGGTCTCTTTCCACACAAGTGCTACTGCCATCATTTTCACACGTAA
+TAGTTGTATCACTAGGGGATATCCATATGGTAAGCGTACCGTCAGTCGAGGTATAGATTG
+TTTCTCCTTCGCAGTCAGGCGTGTATGTGAAGGCCTTGTTACAGAACGTTGAAAACGTGT
+CTGCGCCTGCATAACCGCCTGCCGCGACTATAGCATATGTAACTATGTGACAGTCTACGT
+TGTTCTGATTACACGCCAAGTTGTCTACGATATAAGTTGCGGCGCCAGATGACCCTGCGA
+TGATCGAAGCTACACTCGGGCAAACGAAGGCGGCTAGTCTGCTCTGTGATCCTAATCCGA
+TAGTAAGACCGTTTCCCAGAGACCGGCAGCTATTGGTATCACGCTTACTGTGAGGCGCGG
+TATCAGTCGGGTCAGTACCCATGAGCATGTTGTGGACGTATTTGTGCTCCTCCTCATTAC
+TCGTGTCCACAATTATCACCTGTCTGCTCGTGTTGTTGAGGTCGGGCACCATCCACCTCA
+TCTCCCACATTGAATCGCTGCCCTTCGTCAGTGCGCCAGCGCTGTCTACGTATAAAAAAG
+CCCTGGCGCCCATTAGTCCGAGTGACCAGGCCAGCAGGAACAGCCCCATGTTGAACATTG
+TTATCTCAGACGTGTATCACTCAATGGTAGTGGCGGCCGTTGCTGTGGATTATCCCGACC
+AAGGCGCACTCCGTCTATCCCGACC
+>ds2020-328_17
+GGTCGGGATAGACGGCTTCGAACCTTCTACCGGCGATACGCTCCTGGCCTTAATTGGCCG
+GGTCGTGCCTCCGGTGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCT
+CTGGATACATTAGCATGGGATAACATCATAGGATTTCGGTCCTATTCTGTTGGCCTTCGG
+GATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGA
+AATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATT
+AATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCTAGTCTCAACCATA
+AACGATGCCGACCAGGGATCGGCGGATGTTACTTTTAGGACTCCGCCGGCACCTTATGAG
+AAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATT
+GACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAAC
+TTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGG
+TGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAACGA
+ACGAGACCTCAGCCTGCTAACTAGCTATGCGGAGGATCCCTCCGCGGCCAGCTTCTTAGA
+GGGACTATGGCCGCTTAGGCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTA
+GATGTTCTGGGCCGCACGCGCGCTACACTGAGGTATTCAACGCGTCTATCCCGACCCCCA
+ACGAAATCGTCTATCCCACCNNNNNNNNNNGGTCGGGATAGACGCTAGCGCCTGCTATAT
+TCAACGAGTCTATAGCCTTGGCCGACAGGCCCGGTTAATCTTTGAAATTTCATCGTGATG
+GGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATC
+AGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCAGCTCGCGTCTATCCCGAC
+CGCCGTAATTCAGATCGGAAG
+>ds2020-328_18
+GGTCGGGATAGACGATGACCCTCACTGCAGGACCGTAGAGTGTCCATCGGCTAGACCTAC
+TGAGCGGTAATTTTGCATAAACAATTGCAAACAGCCCGTCAGTGACTACACTTAGGGATA
+AGTGAAGTGATTTTGAATTAGAGCTACGTTAATTCCATCATTTGTAATATAAATACTAGG
+AAGGCACAATCCTAAATAAAGAAATGAAACTAATAAAACATCAAATTAGTTTCATAATTT
+TAGCGGTCTCTTCAGTGTGCAGTGTGTTGTGCGAACAAACATGTGATGCAGGCTGCAACC
+AAGCATACCAAAACTGCTTAATAACACGCGAAAGGTGTCAACAAGCGTGCAACCCTAACA
+GAATATACTGTGGGAATAACGCACCCGGCACATCGCAGACCTGTGATAATTTAATAGCCT
+GCGAAAACGGCTGTAGCCCTTGTGAAGAGATTTATAGGTCATGTGCTAATGGATGTGACA
+TTTGTGAAGGCAGCGCGGAAATGAAAAAACGTAGTCTTAACTATGACGTGTGCTACACAT
+ACACAAACTGTAAAGTAGTTAAAGTTGCGTGCAATCAAAAATGTAACGGCAACCAACAAG
+CACTTCAAGTGTGCAAGCAGTGCGTTAGCAGATGCCTAATAGCAGAAAAGTGTCGGGACT
+GTGTTTCAAAACAAATCCTTGGGTCCGACCCCGACCCAAAACAGACATGCATAACAGCAA
+AGCAGTGCAGTAAGGCAGTAATAGCAGCCGCAGGTATATAGGCACCAGGGGCAGCTATAC
+ACGAAAGAAGAAACTATGCGGCGACGGCTATAAACTCAGATCTTAGGAGATGAAATAAAG
+AACAGGCGTTCTAACCGTGAAACGAGTAGGACAATCCAGAAATGCAATAGGGGCAACGTT
+AGACTTAAATCTTCGGAAATAGGGTAATGGCGATACAAGCGCTCCACCGTGAAAATCGGG
+AATCCACTAAAAAACATGCAAGGGGACTATACGTCTATCCCGACC
+>ds2020-328_19
+GGTCGGGATAGACGAAGGTTCCGGGTGTCTTCCAGTGGTCTTCTAGCGTTAGAAGAAGTC
+GTGTCCGTCCCGGACATCTGCAATGTCCTCCCACGCTTTTTTTTAATATAGGACAAACTG
+AAGGAAAAGACTGACCCATTCGGTTACTTTCGCGGTCGCCCTCACTGAACCGACTTGAAT
+CTGAACTACGATTCAGATCAAGTCTTACCGACATCGGATTTCCTTTTCGTGCCATATGCG
+CTTTTACTTTACTTTACTTTACCCCTTTTGATTCCCGGTCCAATATTTGTTCTCGAAAGT
+CTTCGTTTTCGTTGCTCTAAGGTACACCCGAGCACCTTTTGGTGATGCGATGGTTTGATC
+CTATCCTCTCTCTCGCTTAAAGCCTTCAAACAAAGAAAGCTACTCCGCTATATATACTAA
+AAATTTTTCATATACGAGATTTCTGTTCCATTCCCCTCCTGCAGCCAAAGTGTTAGCGGC
+TGTAGCATCCACCGATAATGTGTGGAAGAGGGTAAGCTTTCTATGTGGATAGGACGTATC
+AACACCTTTTGCATCTTTTAAAGGAAATATATAAGAATGAATAATATTGTGTTGGGTCCT
+GAGGATCAGGATGGCCGAAGATCAAAACCTAAATGTGCCAGGGGTTGATCATCGAAGCCA
+GGGACGATGAAGGAATTTGAGCGCTGATGTAGCTAACAGCCACCTTCATAGTCGATTCAT
+TAGGGTCGCCACTCGTCTATCCCGACCNNNNNNNNNNGGGCTGTTAAGCCTCACAGCTAT
+GGGACTTCCTAAAGAAAACCGCAATCGTAGTTTATCAACCACTCACAAGACCACCGAGAT
+CTTCGGCTTAGCTCCCAAAGGTAATCCACCCGGCCCTTGCCCAACCTATACAAGGGGAGC
+GGAAGATAACGAAAGGGAGACAAAGTCCTAACTAAATCATAACACAAGAACCTCCGTCTA
+TATCATAACACAAGCTACCCATTAGCCTCGTCTATCCCGACC
+>ds2020-328_20
+GGTCGGGATAGACGTTAACATTGGCTACTTAAGCAATATTGGACACCAAGCACTTCGTGA
+AGGAATTTCCAATTAGGGATGAGGAAGAGGAAAGTAGCTCGACCAAAGGGAGAGGAAGAG
+CAGTGGTTGACAATCATTTGCCGACTCTTGCCCAGTTCAACTGATAAGGAAATTGAAGTC
+AAGAGGGGCTTGCCACCTGGTGAGATAGTAGTAGTGCCTATGCATGCAACTATTGGAGAC
+CNNNNNNNNNNAACGGCCGCCACTAATGTGTTTTTGTTCAGCGTGTGAGGTTTTGGAATT
+GGAATTGGAATTCGAGGAGTGCGCTGAGGGATACTTCTTTTATCACAGAGTGGTTTGTGG
+TTATCGGAATCGAAGGCTTGGATGAAATGGAGGATATGGAAGTACTTTTTGGAGTAGTTT
+TTTCGGGAGCAGGAGTTGGTGTGAGTGGAAGTGGGATAGATTTAGACACGCCTTTGAGGT
+ACGAAGGTGGATCTGATACTTGGATGGTGAGATGTGAGTGTGGTGCTAGAGATGACGATG
+GGGAGTTAAAGAGGTTAGCTCAAGACTTTTCCAGGAAAACCGAGACCAAGTTTGATTTCC
+ATAAAGAAAACGTTTAAAATTCACCAAATGAAAAAGTCTCTTGTTCTTTACTATAAACTC
+AAAGCATTAAAATAATTGATCTTGTTTGGAAGTTTTTACTTTAAAAAGCAATGATAAGAC
+CCCGTATTTGCGTCTATCCCGACCNNNNNNNNNNTTGCAAAACTTGCTTTAAGATAACTA
+GAAAGCTAGACCTACAGGTGCTCTGAATTCCCACAAAATTTGCTGTACATCTGCCAAATC
+ACATCTCGGTCTCTCCTCTTTCTTGTTAGTCCTTGGCTCGGGCTGGCCCTTTCGGATTAG
+CTTGTCTTCCTAGCTGCCTTTCTTTCCCCTGCCTTATGACTCTCGTACATAGAAGAATGA
+GTGGCAAAGCACTCGACCCGTCTATCGCGACC
+>ds2020-328_21
+GGTCGGGATAGACGAATATCAGCCCTGTAGATTCGTTCCCATGGTTCGATCCTTCCCAGT
+AAAACGCGGCGTGTTCGAATTCTGATCGCTTTTACGCGAGAAAGGGGGACCACCCTCTAA
+GCCTAAGTATTCCTCAATGACCGATAGCGTACAAGTACCGTGAGGGAAAGGTGAAAAGAA
+CCCTATTTAGGGAGTGCAATAGAGAACCTGAGATCCGATGCGAACAATCAGTCGAAGGAG
+CGGAGCTTAGAGCCTTTACTTTATATTAGTAAAGCGCGCTCACTCTAACGGCGTACCTTT
+TGCATGATGGGTCAGCGAGAAAATGGGAACAGCGGCTTAAGCCATTAGGTGTAGGCGCTT
+TCCAGAGGTGGAATCTTCTAGTTCTTCCTATTTGACCCGAAACCGATCGATCTAGCCATG
+AGCAGGTTGAAGAGAGCTCTAACAGGCCTTGGAGGACCGAACCCACGTATGTGGCAAAAT
+ACGGGGATGACTTGTGGCTAGGGGTGAAAGGCCAACCAAGATCGGATATAGCTGGTTTTC
+CGCGAAATCTATTTCAGTAGAGCGTATGATGTCGATGGCCCGAGGTAGAGCACTCAATGG
+GCTAGGGTGGCCCCATTTCGCCTTACCAACCCCAGGGAAACTCCGAATACAGGCCTAGAT
+CGTTTGTACAGACAGACTTTTGGGGTGCTAAGATCCAAAGTCGAGAGGGAAACAGCCCAG
+ATCGTACGCTAAGGTCCCTAAGCAATCACTTAGTGGAAAAGGAAGTGATCGAGCGATGAC
+AACCAGGAGGTGGGCTTGGAAGCAGCCATCCTTTGAAGAAAGCGTAATAGCTCACTGGTC
+TAGCTCCATGGCACCGAAAATGTATCAGGGCTCAAGTGATTCACCGAAGCGACGAGACCT
+TGAAAGCTTCTTTTTCAAGTGTCAGTAGCGGAACGTTCTGTCAATGGGGAAATGTTTTTG
+GTGACAACACGTGGAGATATCAGAAGT
+>ds2020-328_22
+GGTCGGGATAGACGTGCGTTCTCCTTATTGAAAGCGCTAACGCGCATCCGTTTTCTTGCT
+CGTTAGCGCTTTCAATAAGGACTTTTTTTAGGCTTATAACATAGAAAGGGCTTTTCCCAA
+CCAACCTAGGTTATGGGCTAGCGCGGCTCGCTTCGCTTTTGTTGCGGAGCTCGCTGCTTT
+TCATTTTGTTAGGAGTAGGTGCTTGCCCTTTGTTGGGTTTGGGTTGGGGGAAGAGGTCAT
+TTCCATCGCGAAGGATTCAATCCAGCCACAGGTTCCCCTACGGCTACCTTGTTACGACTT
+CACCCCAGTCGAAGACCCCACCGTGGTATGCGCCAATAAGACCACCAAAAGCCTTTGTGG
+CACTAGTGGTACACAGAAGTCATGGGTGATCATTGGTCCGATGCTTCGGGCGAAACCAAT
+TCCCAGGGTGTGACGGGCGGTGTGTACAGGGCCCGGGTACATATTCACCGCGGCATGCTG
+ATCCGCGATTACTAGCGATTCCAACTTCATGTTCCCGAGTTGCAGAGAACAATCCGAACT
+GAGGCAATCTTTCCGGATTCGCTCCGCCTTACAGCCTTGCTTCCCATTGTAATTGCCATT
+GTAGCACGTGTGTGGCCCAGCCCATAAGGGCCATGCGGACTTGACATCATCCCCCTACGT
+CTATCCCGACCNNNNNNNNNNGGTCGGGATAGACGACTCTAGCCCCTATCTCCGTCTATC
+CCGACCAGTGAGGTGATACGTCATCCCCACCTTCCTCCAGTATATCACTGGCAGTCCCTC
+GTGAGTGCGGCACGCACCTTTTTGTTTGTTTCGGAGCCGTTTTGGCGGGGTGTACTAAAC
+TCACTACGTACCACACCACCGGGCGGCTCGCCTGAATGCCTCGTACTTCGACTCAGCCAA
+CCCCGGCGTCTATCCCGACC
+>ds2020-328_23
+TGAATTACGGCGGTCGGGATAGACGGGAGCTACTACTCATGCAGCGGCAAGGACCCGCAA
+CTCTCGAGGGGGCCACCAACCGCCCGAATAACTCCTTTACTCAATGGATAGCGCTTATCC
+TCTTTCAATCAACAAAATGAGAAATGGGGGAGAAAGAAAGAGAGAAAGAGGTCTTTATTG
+AAGAGGCTTTGCACCTGAAATAGGACTAATGAAGATCCAGAAGAATGGGTCTGGGCTTTC
+GAAAAGATGAAGATGCAAAGGGTAAAGAGAAAAAGTCTTTTGAACAACCAACCTGACATA
+AGGATTATAGCTCGCCCACTTAGAGCAGATGGTGATTCTCGGACGGGGAAAAGCGGCACT
+CGAAATCTATTAAACAACACCAAGAACAAAGCCATACCATGCCCTCGGGATAAACTAGTG
+ATGATTGCCATGAATGCTGCCCTCGAGGATGTGTACAAGAGGGTCTTTGCCGATTCCTAT
+CAACATGGTGCACCTCTCAAGGGTGAGACTTTAACCGAATGAATGGGGATCAATTGATAG
+ACATTTTGATTGAGGAAGAGAATCCAATCCAGGATGAATGCTTTTTTCGTTCGCTATGTG
+CTGACTAGATGCGTACTCGCGCGATCGATCGATGCACGGGGGAATTGCGTGAATGACGAG
+ACCGGCCTAACCTAAAGTAAAGGCTCTTCCCTCTCTTCATGGCGAATCTTGATTGACTGA
+CACTAGGAGCCGACTCGGAGAAACAAGAAGCATGGCATGAGATTCGCGGCGGAATTAATT
+CCGATAGCGAATTACTTGATTCGATGGATGGAGGGAGAGCCCTCCAACTCAAGCACAAAA
+TCAATGTTGAATCAACAATCATCGAGAGCGAGAAGGGCCCCATGACGTCTCTCCCGACC
+>ds2020-328_24
+GGTCGGGATAGACGCCCCGGTTGAGTTTGAGAGCCGTGTGATGGGTGACTATCCTGCACG
+GTTCGGGGAGCACTTTTTGTCTGCGTTGGTGAATGGAAGCCCCCACTATCAAGCAAGAAA
+GAAGCGGCTCTTCCCACGGCGGAGTCCCCATTGACTCTATTTATTATTATGGTAAATCAG
+TGTATCAAGATGTCAATCTGAGATCTTATTTCGGTTCAATACGTCCACCTACGAGACTGA
+CCTTTGGCTTTCGTCTCGGTACGTGTATTATAATAAATTTTCCCAAAAGAACATTCATTC
+ATTTCTTTCTTCCCCGTCGACCACGACGACTGAAACGACACGAAAAATCCAGACCCGGAA
+AGGGAACGGCCGGTGGGGGGCAGTCGGGAAATGCGGGNNNNNNNNNNGGTCGGGATAGAC
+GGTGGTGGGCATTTGGTAAAGTCGGGCCGATCGGGTGTCTTCATTCAAGCGACGATACAG
+AAGAAGAACGAAACGAAGTGAGAGGCCGGGGGGCAGGGAAAAGAGTCGAGTCGATCAGGC
+TCGACGACCGGGAGAAGCAAAACGAAATTAGGATTTGGCCGAAAAAGAAGCAACGCTATG
+GATACCATGACCGATCACCATCGATAAAGAAGAATCTTTCTAAATCACTTCGGGTCAGCA
+GGGCCTTCAAGCACCCGAAATACGCCGGGGTTGTAAATGACATAGCGTTCCTGATAGAAA
+ATGACGACTCCTTCAGAAAAACTAAGTTATTCAAGTTCTTTTTGCCAAAGAAGTCCCGCT
+CCGACGGCCCGACGAGTCATCTACTTAAAAGGACCCTCCCTGCAGTGCGCCCCTCCTTCA
+ATTATTTGGTCATGCAATACTTATTGAATACAAAGAACGGGCATCGTCTATCCCCACC
+>ds2020-328_25
+ACTCCACCTAGACTCTTAATCTTAGACAATCTGTCACCGACCTTAACATAAAAGGATGAG
+CCCGGCCTGTCTATTTATATGCATTGGCTTAACTCATTCCTATACACTGCAAAGAACACA
+AAATTAAAACAGCCTGGTAAGGGCTGTACAAGGGAACGAAAAGGGAGTTTGTTTGATAAG
+AAAGAGTTTGTGCTTAGTTAACAAACATCGAGTTTGGAGTCGGGGCAGCGTGGATACGAG
+ACTATTGAAGTTAAGTTTGGAATCATTTTGGTTTTCTATCTTCAGATTACCAAATTGGAG
+AATCACCAAGGCCTTTCAGCGATTCGACGCGCCCCCCTAAGCTAGACGCTTCACCTACCC
+AGAGAATAGAATGAGTCGCCCGCCTAGTCTTACTAAGAGTTTGAATTGCTCCGGGCGAAT
+GAATCGCATTAGTGTGATTTGGCTAGCAGAATCGCCCTTATATTATATATATTTTTCAAC
+CAGGTCAACGCATCGCCACTACGGAAACGAAATTTCCTTAGTCCTTTTTCTGTGAAACAA
+AGCCAAGTCTTTTCCGCCTTCCATCCCGCGTTTCCCTGCTTGAGACTGCTTTTTATTAGC
+CCAGTCATGAACCACCCCGGTTGGAGCCATGGTCTACCCGGCAGTGCTTCATAGCCCCCT
+TGCTCTTTGTCTAATCTTAGACTAAAGGTACGGCATCCTTTTTTGTTGTTTTTCTTTTGG
+CCGTAGGTTGTACGCCAGCCATATGTAGCTTGAACTGTGATGGCCACAATGCTTAGCTAC
+CCAAGATGCCTTTGGTTGAATGTTCACACCCGTCTGCACTTCCTACATTCATTCCCGGAA
+ATTGAAACAAAACAGGAAAACTGGAATTGTAACCCCCCGGCGCGTCTATCCCGACC
+>ds2020-328_26
+GGTCGGGATAGACGATAAACTGGGCTTCTCAGCTTGAGTATGCGTAACATACACAGCGGA
+GGCATCCACCTCAACTTGAGACAGAGCATTTATAGGTTTCACTTTAATAGACCTAAGAAT
+ATGTCTTTTTGTCTTAACAGGAGTCTTCTTTCTATAGAAGAACTTAGACAAAGCATATAC
+CGTATCAGCAGGATTTCGGTATGTAATCGTTTGTTTCACATGATCACCTTTCAAAACATG
+GTGCTTCAGGAGAAACATATCATTCCTGGAAATAAACGGTATTTGTTCAGTGTCACCAAA
+GGCTATAACCTCTGATAAACCGGCAATTGCGTCTATCCCGACCNNNNNNNNNNGCGGTCG
+GATAGACGCAGCCCCCTCACCTCTTCTTCAACCTCATCTCCCTCTTTTGTTTCCAGCACC
+GGCAATTGTGGCAGCAGCATATATGCACCCAGCATGTTGCATGAAACACTCATCAAACAA
+CATCTTCTTTGCCTTGGGAGCATTGTTTGTCATCAGATAGGAATCGCAAGTTCGAATGAA
+CCTGCTTTTAACTAACTGGGATCCCTCAACAGCTTCTTTCAACTCAATTGCAGAAGATCT
+GTTGGAAGTCAAGAGTAGGTCTATATCATCTCCAACCATGGAGGCAATAGACTTGATCTT
+GGTAGTTTTTCCACAACCAGCAACACCGTCCATGATTGTGATTGAAAAATCACAATTCAT
+CTTCAAAGCCTTTTCCAGTGAAGGTATAACCTTCTCCACTGATGAGAATACACAAGAGTC
+ATCAACAATGACAATTTCGTATTCTCCGACAGATCGTACGCAGGCAGCGGACACATTTCC
+GGCATCATCCCACCATTCCGTCTATCCCGACC
+>ds2020-328_27
+AACGGCCGCCACTATACGAATACCATAGGGGGTAGAGCACTGTTTCGGCTAGGGGGTCAT
+CCCGACTTACCAAACCGATGCAAACTCCGAATACCTATGAGTACTATCCGGGAGACAGAC
+TGCGGGTGCTAACGTCCGTAGTCAAGAGGAAAACAATCCAGACCGCCAGCTAAGGCCCCA
+AAATCATAGTTAAGTGGGAAACGATGTGGGAAGGCATAGACAGCTAGGAGGTTGGCTTAG
+AAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTCACTAGTCGAGTCGGCCTGCGCGGAAG
+ATGTAACGGGGCTAAAACTATGTGCCGAAGCTGCGGATTTGACATTAGTCAAGTGGTAGG
+GGAGCGTTCTGTAAGCCGATGAAGGTGTATTGAGAAGTATGCTGGAGGTATCAGAAGTGC
+GAATGCTGACGTGAGTAACGACAAAACGGGTGAAAAACCCGTTCGCCGAAAGACCAAGGG
+TTCCAGTCCAACGTTAATCGGGGCTGGGTGAGTCGACCCCTAAGGCGAGGCCGAAAGGCG
+TAGTCGATGGGAAATCGGTTAATATTCCGATACTTGTTTATAATGCGATGGAGGGACGGA
+GAAGGTTATGCCAACCGCGCGTCTATCCCGACCNNNNNNNNNNGGTCGGGATAGACGGAT
+GAGAAGGTTAAGTCAGCCTGGCGTTGGTTGTCCAGGTGGAAGGATGTAGGTATGTATCTT
+AGGCAAATCCGGGGTACTCTATACTGAGATCCGATAGCAAGCTGTACTTGTACAGTGAAG
+TGGCTGATACCATGCTTCCAGGAAAAGTCTCTAAGCTTCAGTTACACAGGAATCGTACCC
+GACTATACCGTCTATCCCGACC
+>ds2020-328_28
+GGGAGGGATAGACGAACAGTATGAGCCAATGGACCTATCAGATGCTAGTAGCGACGAGAC
+GGTTGGATGAAGGTTATAGATCAGAATACATAAGCGCAATGATCGTAGAAGCAGTTAAGC
+AAAACAGAATAAGAACCGTGAAGACTTTAGAGATAATCTCGGGGGCTCGAATGACAGAAG
+AAGAAAATGAAGTTTTCGGAAATTTGGCGGAAGCTGAGAGAAAATTAGAAGAAGATAAAA
+GAAGCTTTAGGAAGGTAGCTGGAATGATGGTGAAGAAGGTGGGAATGGTGATAGGATTGC
+CTTTCGTGATATCAGATTTCTGCATGGCTGCTTAGCGTCTATCCCGACCNNNNNNNNNNA
+GGTCGGGATAGACGACGCTTGGGTTTCTGGTTCGTAAGGACAGTGTCTTCAGCTCGAGAA
+AAGATATCAAGGACGGCGTCAGCTGCAGCTGCGTGGACATTAGACAAAATTGGAAAAATC
+AAGTCTTCGCAGGTTAAAATATTAGGAAATGTGTCGTCGCTACTCAGAAGGGCGTTGGAA
+TTGATGTCCGTGATCTCAAAAATATATGACATAGAAGTGAGAGAAGAATTTAAATTAGGC
+AGCAAGATCGGCGAAGCCGGAAAGGTTCAGACGTCCATGCTGAGTAACATGGTAAACAAG
+ATAACCAGCTCCGTAGTGAGGGAATTGGCTGACAAAATAATAAGCCAGAAATCATTGCAA
+GATTCGGGGAAGAAGATGGAGGAAGAGAAGAAAAAAGAAACTGAAATTAGAGAGAAAAGA
+AGCGCATATGCCATGCTGTCTAACAAATCGTGCCAAATAGAAACGGATGCAGAAGCTGAA
+GTTTGGAGAAA
+>ds2020-328_29
+GGTCGGGATAGACGGTGCAGTCGATTAGAACGGAAATGGAGTTGGAAGCAGCCCCTTTCT
+ACATGCTTGATATCTTAAAGCTCGCCAAAAGGAGCCCAGCCCATATTCCCATAGCTGTCA
+AGTTGAGATTCTTTTGCACAAACAAACAATATCGCAGAATATTCTGCGTGTATCACAGGC
+GCTTCGCGCCCTCGAGTTGAGAATCAAGGAGATTGATGTATATGGAGATTCGTCACTTAT
+CATCTTTCAGACAACTGGTGATTGGAAAACCAAAGATCAGAAGCTCATTCCCTACCATCA
+GTATCTGGAAGATATCAGCCTAAAGTTCAGACGGATTACCTTCAATTATATGTCGAGGAC
+GAAGAATAAGTTTGCTGACGCATTGGCCACACTAGCTTCCATGATCAGTAGACGGTATTG
+ATATCCGGCCAATAGAATAGAGTCGACGAATCGGATTGAAATCAGTGTGAAGAAGAGTCA
+TGCGAGGACTAATCAAGCACAGCTAAATAGTAGTCATATCCACAAAGAAAGGAAAAAAGA
+TCGTCAACGCTTCTAACGTCCGTAGGAACTAAGTAGGAGGGCCGGAACTTGAGGCACTCG
+TCTATCCCGACCNNNNNNNNNNTGAGACCCCATTTCCTGTCTACCTCTCTGAATCCTGAG
+TTTTCGGAGCAGTAGAGACTCGCGCTTTAGCCGCTTCATCTGAAGTGAAGGAGGGCTTAC
+AGAAGTCACAGCACCAGAAAGTGACAATAGGCAAATCAACATAAATGCAAGAAAAAGAGG
+AAACTGTACATCAAGCCCTGTATAGCGAGACAGAGAAAAGAAATGGTACCTGGCGTCTAT
+CCCGACC
+>ds2020-328_30
+TTCTTCGATGATGCGCAAATTGAAGCTTCGGTACCCTTGTTTTTTCCAATCGCCCTTTTC
+TCTTCTTTCTTCTTTTCTTCACTTCCTTCCTGCTTTAATTCTTCATCAGACCCTCCTTTC
+TTCCTCGCTGCTGCTTTAGCCGACTTCCCGCTGTTTTCATCGGTTTTTTCTTCTGTCTCA
+TTCTTCTTTGCTACCGGGTATTTAGCCGCGTTTCTTCCTATCAGCAAGTCCCACGTCCTT
+CTCATTGTCCGCGACGCCTTCCTCACTATTCTCACTGCTTTGTCTTTCAATTCCACAGCC
+CTTCTGACGATAGTCCTGTTTAGAAGTCTTCGCACGCCTACGATTTTCCTGCTTATCCAC
+CTTATCACCGTCGCCAGCTTACTGCCAACCGCTCCGTTCGCGTCGTTTATTTTCAGCTTC
+AGTGCCCAGAACCACCCTTGGTCCATTTCTGTGACTTTCAAAGCTTCTCCGGTGAGCACT
+TCCTCCTTAGACAGCATCGTCGATGCTATGGATGGGTTCTTCATCCTGTCCGTCAACTTA
+CTTATTATGGTGCTTGGGTCCATCATGTAGCTGCATCCTCTTGTCCGACAATCTGCTAGC
+CTTTTGAATAACTCATCTCGGCCCACGTCTTCTCCTGCTATTCTATTCTTCCTTTTCATC
+TTTATTCTTTCGGGATTTTCTATTCCCATTGGTGCCCTAGGGCTGAACTCGCTTGAATAC
+AAATATGCTATCTTGAATCTGTCATTCAAATCATTTAGAACCGCAGCCATTCTCAACGCG
+TCCGTTAACAACTCAGTTTCGCAACCAAGACACCACGTCTATCCCGACC
+>ds2020-328_31
+GGGCGATTGGAAAAAACAAGGGTACCGAAGCTTCAATTTGCGCATCATCGAAGAAGATCA
+GCTGGGCGGATCAATGCGAAGGAGAGGAAGCCGTCTATCCCGACCNNNNNNNNNNGGTCG
+GGATAGACGAACACACGGGATAGTGGCTAGATCGGTGATGACAGCTATAAGGACAGGAGT
+GAAACTGGCGCTAATTGGTCCTAAAATAGCATTATTTGCTGTAGGAAAGGTGTTGAGTGA
+TTGCAGGTCTAAAGTCACAGAAAGTCTGTCCAGAGCGACCCAAGTTATGAGGTTGGGACT
+TAAAATGCTGCAGAAATTAAGGTCCCAAGTAAGGAGTCGAGTCGGCGAGAAGATCCTATC
+GAAAGCGAAGAGTGTGGCTTGCGCCAAGGCTGGAAAGAAAAACACGGCGAAGGAAGAAGG
+CGAGGCAATCAAAAAGAACAGAAACGGACCGATGGAACAAGTGGCAAGGGCGGCTTTAGA
+TGAAATGAAAAAAGGAGCAAGAAAGTTCGTGTCGAGGATGTTCAGTGAGTTAAGGAGGCT
+AGCATCAAGTGCGGAAGAGAGAATTGAGAAGTTTTTTAGCTCGATTAGCAGAGCATGGAG
+TAGGCTAAGCAAAGAAGTGAAAGATTTATATTTCCAAACAAACCTTTTAGTGCGCGCGAT
+GATGGGCAAAAAAATGGACGTTGGCAAGCACTTTTGCTTATTCAGGAAAGGGGAAACAAG
+CTCAGCTGATTTGATAATTTCCGTAAGCAGAGCGATCATGGGGTTGTTGGGGAGAATAGT
+GATATTCTGTGTGTCGACTGATTCCCCACGTCTATCCCGACC
+>ds2020-328_32
+GGTCGGGATAGACGTTCCCCCCCCCCTTTCTATTCCTCGCGAGCATATTCCCACATAAGG
+GAGTACAATCGATTTTTCCCCCTGGAACTTGTGAATGAAAAGGGAATATGCTCGCCATTA
+TTGTAGTGCTCCCGCTGAAGCGACTCCACTCTCCCTAGCAGAGCTTTACAAAATCCAACC
+TCAGCCTTATCCAGCGCTAACGATTCGATGTACTTGTAAAAGGTTCTGTCGGGAAGGGTG
+CGCTTCCTTCCAGAAAAAAAAGTGGTTCTTACCTTCCTGTACGAGTAGTGAAGAACTATA
+GTGAGTTGTGGTTGGTTGTTGACCAACGGAAAGCGTGGGAGAAAGAAGGAGTCATCGACG
+GGGCGGGGATCACGCAATAGATCTCCGGGGGTGGGGGGGTACCTTACTTAAGTATGGATG
+TGATTTTGACCCCGTTCCACCCCAGCTCAAAATCCATTGGGATGCCCCAATTGTTGAATA
+TGATTAAAGCCATAAGGAATGTGTGGGAGGCTGTATAAAGAAGTAGAAACAAAAATAGAG
+ATTTCGATAGTCCATGAAGAAAAGGAAGGATTTGTTGATATGTAGCAGCTCCGGCACCTA
+TTGATTTTGCACCCTCTAACATCTCCGAGTTAAGAATTCTCGTCACGCTTTTTCATTCAC
+GATTTTATGTTATTGATTCCTCGTCGATTCTGCCCCCCCCAAAAAAAATGAAGAAAGACT
+TGTCGGAAATCGCCGGTTGGGTTTACCAACCAAGAAAGACATGGGAATTTTAGGCGTCAG
+ATTCTTTTTCTTCAGGGCTTGGCGACGTCTATCCGACCGC
+>ds2020-328_33
+TGGTCGGGATAGACGAGTTGGGGCCGAGTCCCGTAGATACTACATAAGAAATTTTTTCAT
+TGATGGATGGGAAGGTGTATAAAAAAAGGTAAAAGCGCTTATGGGGCATCCCACCTCCCG
+AGAAGGTTGAAGGGATAGAGGAGCTTTTTAGCCCTTTTGAGGAATTGGTTGGAAAAGCGC
+TACCACCCTGGCCGGAAATCCTATGTCCAAGCGCTTCAGAGGTCAAGGGAGTTCGATCCG
+GCTACAACTCTCCTCCTTCCACGCACGGACAAGGATCGGTTGTTGAAACAAATTCATCTA
+GAAACAAATAAGTTCTTGTTTGATCCGCCGCTGTTGTAACACCACAATATTCGTCCTTTT
+CCTTTTGAGGTTAATCCTCTCAATGGTGAATCGAGCACTCGAAAAATTTCTTCGACGGAA
+TGGAAGAAAGGTAAGGAAACCCGCGATGGCTACTGAATACCCGCCCTTTACTTTCTTAAT
+AAAAAAGCCCCTTACCTTTGTATTCGTTCGCCAAATCTTGTTCAGTTCCATCCAAGCTCG
+GTTTTGTCTGAATCTTCGCGGAAGAAGAAGAAGCGGTTCACCAGCCACTACATCTGTGGA
+TCCCACCAAATTTTTAAACCTGGCGGCTGCTCGCTCTTTGATCAGTGATTCACCGGCCAC
+TACATCGATGAAGAATCTCTCCAAAATCTGCTCTTTGATCAGTGATTCACCGGCCACTAC
+ATCCAGGGATCCCACCTTATTCTCAAACCTGGAGTGCAAGTCTATCACGACC
+>ds2020-328_34
+GGTCGGGATAGACGCTTACCGGGATTGGGGAAGACGGGTGGATTATAGAGCTAGGGGCGG
+ATCGAAGGTTTGCCCGTTGGGATTGGGCATGGACGAGCCTCGACTGGGCCAGCGTTGATG
+AAAAAATGAAAAAAAAACTTCTCCCATCGCATCATTAACCGGTGTAGGATTAAAGATCAG
+GTCCAGGATTCGAGGCAAATCAACCTCCCCTCTCATCTCAGGGTGAGGCAAGGAATTCAA
+TGTTCGTTGTTCAATATCTCGGCTGCTCAAGAAGTTGGACTAGCAGCTCCTCCGACCCGG
+AGTGGATTCTAGGGGAAGGGCAGAGCCTCACCTTGCAGTAGGAAGGTGGTCGTTGCTGGG
+ACGGGTTCAAACAGGACTGAAGGGAGGATAAATTCAATACTCCGATCTTACTGGGGATTC
+ATCACTGGCTAGGGCTTTCGAATCAAAGCATGGGCATCCGCAACTAAGAGGGAGCAGTAG
+ATCGTCGATTGAAGAGCCAGGTCAGTAAACTTCTATTGATTATTGATTCGACTAGAGGGA
+CTCCTAGCAACAAACTTGTATGAAGGGCCCCCCGTGGAGATGCAGGAGCCGCCAGCCGGA
+TCGACCAATAAATGATAGGCCAGAGGGATGGGCTCATTCGACTAATTAGTGATCCCTGGC
+CCTACCTAACAAGGGGTATGTGTCGTCTATCCCGACC
+>ds2020-328_35
+GGTCGGGATAGACGTTGACTTTCGCTTTCTCCCTTGTAGCCGTTACCCGAATTCGCGCAA
+GTGTGTCCACACCCCCCAAACTGACTTGACGAGGAATCCATTCTCGCGAACAAACACAAC
+CCCTACACACACCTAGGAGCACCCCTTCCTGCATATCCATACAAGACCCGAGTAGGCGGG
+TCGAGGTCCTACGAGGTACCCACTACTCGGAGTACCCTCCCAAAAGGAAAAAGATGTGTC
+TGTCAGGTTCGGTTCTTCTTAGTTGGGTTGGGCGGGTTCGACCAGAAATGCTATGCTTAC
+ACACAAGACTACCCCTCTTCCCGAAAGCTTCGCGGGGACTACTTTACGACGACGGACGAC
+CGCCCGTAGGGGGTTTACTGCACAAGGCCCCTGCAGAGGAAAGGCTTTATCCCAGCGAAT
+AGAAGATGCTCAGCTCCGCACAACATAGGGATTAGCACGCTTTCGGAAAGAACATAGAAT
+AGTAAAGGATCCAGCATGCGGAACACGGCGATCATTAGAAATTCACGAATTAGAGATGCT
+GTAATATACTCTTTCCCATAACTTCTCATACCAGACCAACCCACTGAAATGCAAATAGGG
+ATCAGAAATGTGGTCAATATCACGAAGAATAAAGAGATACCGTCTATACCCAAATAAAAA
+TTTATGTTTTATCGTCTATCCCGACC
+>ds2020-328_36
+GTACAGCTTTGGCTAGCAACTTCGGAGCCGCTACTTCGGGATGCGTACCCGGTGACGGAT
+ATGCTCACTACGGAGGTTCAGCGTGGTTGAACTGCCGCGCGCTGCAAGAGTGCCAGAACG
+AGGGTAACGATGTAGTTAAGAGATCTGAACTCAATGTCACTAGCTCCGACGTCCGTGGAG
+CTATGTCTGGTGGTGTTGTGATGCCGGACTTTCTGTACGCGTACGGCACCACCTACTTTA
+TCCACGGACAAAACAAGTCCGGGGGTCACGTTGACGCTAAGATTTTTGACAACACTGAAT
+CTGAGGACTTGATGAAAGATCTGGTCAACATGACTGAAACCGACTTCGTTGCCAAATACG
+CGCACCTTGGTGTAGACGGCGACTTGTTCGGTGCTGCATAAGTCGTTGAATGATGACCAA
+AGGTGGATGAGTTGACTTGTTAAGCCCTATGGCAGGTCGACAGGGGCAATTGGTGGAAAA
+TGCAACCGGGCGCAAAATGTAAATCAGCGGAAAAACACGGGTAAAACAATAAATTAATTA
+CAAAATAATGTGAGAAGGGCATATCGTCTGATATGGGGCGACTGGAAGGCGATCTCAATA
+AACTGGTCTCAACAACCAGGGAGCGCAGAACAAAAAAAACACACATAAGAAAATAACTCA
+TATAGTGGCGGCCGTTGCTGTGTATT
+>ds2020-328_37
+GGTCGGGATAGACGCACGCTCACACTGGTCGGGATAGACGGTACCAAGGGCTTTCGGTAG
+ACTTCTTTCATTTCCGAATTAGCTTGCGAAAAGTCCTAGCATTAGTATGAGTTCGTTGAC
+CGCGTAAGGGCGATCCATCTTGATGACGAATTCCACGATAACGAGAAATAGAAATTAATC
+GTTCGATGTCTGCTCGCTCTCCCCTCTTCAATTCCCAATGAACAACATGATCTTGACCTA
+TCATTTGTTCAATTTGGTCGATCTGATACTTAGTTAACTCTTTTATCTTTATGTTCCCAC
+TGATACCTAATCGATAACGAACCTGAATGGCTTTTTTAGGTCCAATTCCATCAATTTTTG
+TTGAGGCAATTCTTACTTGTTCATCGGCAACTGATCTAGCTCCTGAAATATATGACATTC
+TTGATCCTTTCCTTTACTAGTCTTCTCGGCTGGAATCAAAAATGGGCTGTCTCCTCTCTG
+ATGATCTTTTCTATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATTTCTTT
+CTTAAAAAAAAAGAAAAAAAGGACATTCGACCCAATACCTTAACCATGTAATTTCTCCGA
+CATTATTTTCTATCGCCACATCAAGGTGACAGGATTCGAACCTATGGCCCTCTGTACCCA
+AAACAGACGTCTATCCCGACC
+>ds2020-328_38
+GGTCGGGATAGACGAATCATGATTTTACTACGAAGGAAGGAACTCGAAGTGAGACGGCAC
+TGTCTTGTCCAACGCAACGATATGGCCCTCTATCATCTTCTATCCGGTAGACTTGGTAAA
+AGGGCCCCGACTTTTTTCCAGAATTAGAGTTCGACCGCGGCTGCCCCCTTTTTTGGGGGG
+TTGGTCAGAAGTCAGTCTTGTTTGGTAAGACGGAATTGGACAAAGAAAAGAGAGTGCTCG
+ACCGGAGCAACGGCCAACAAAGACCGTAATTACATAGATAACCGCTCCTCCCCTTCTCCG
+TCTTTAAGGCTTTAAGGCGAACCGTATGGCGGCTGGAAAGAAAGACGACCTCACCTTCTC
+GTAGATGGTGTTAGTGAGAGCAACTTTAGTATCCCCCGTTGACCTTCTTTTGCAGATAGA
+ATCTTCAATGAGTGGAAACAAGCAACCTTACTAATAAAGGTGCTTGTTGAGTAAGGCCGG
+CGCCCAAGCCCCTTGTATAGGTTGGGTGCTTGAGCGCATGTTTCTCATATCGATCAAGGC
+TTTCCTTGAGTTTTCAATAAGGGGCGCGTTAGCACTCCTGCAAGAAAACGGCCTAGCTAA
+CGCGCGCCCTTACGTTTTCTTCGCTTGCTCTGCCTGCAGTACGAGCCTCATACAGAGCGC
+GCCCCATCGTCTATCCCGACC
+>ds2020-328_39
+GGTCGGGATAGACGACGGATCCCAGTCAGCCTTCTTCCTCTTCAGGACATACCTGACTCT
+CACAACTCCGCGAGAGGTTCACCTTCGGCGTCGTCCTCCACTGGACAACGAGTCACATTA
+CCTTGTGACAACACAATCACTCCGCATCCGGCAACGAACCCTCGACGCCCATACATCAAG
+CGTTGCATAAGACACGTCAACTGCATCGACCACGTCGCATGCTTCACTCATGGCTCGCTC
+ATGTCCAAGTCAAGACATAGCGATCCAACACACCATCGGTTTACCCACACTTCTGTCGGT
+CATTCCTTTAGCATCCACGATAGCCCACTTCCTCAAGCTATACACGCAAGCAGTCCTACT
+TGCATGTCGCCCAAGCCTTGGCGACATATATATTCCGAATGTCCCACATAACCGTCTATG
+CATTGCATGGGGTCGCAACCCATGCGTACCGGCATCCGAATATCTTCCTTCCAACATTAG
+ACAAGGCCGAACCCCAACCAAGTCTATCGAGTCTTGCCACATGCCTCGCTAGCCGATGGC
+ATAGCGAATGCCATTCCGTGACCTCACTCTTTCCGACAATGCCCAATACGAACGGCCCGA
+CGTGTTCGTACTGTCCTCGGGAAATCCTTTCCCTCGGAGACACAGATCATCCTCATTCAG
+CGTCTATCCCGACC
+>ds2020-328_40
+AACGGCCGCCACTACTTTTTGCCTTTATTGATATGATATAAAACAAGCTTACTTACTAAT
+AAAGCGGCAACAAGCACCTTCTTTCTCAAAAAGTAAAGTTTCGCGCTTGTTGCTTTAGAA
+AAATGGCAGCGTTAGCGCTTTACTAATACTTATATATAATATATCAAGTAAAGGCTCTTC
+TCCTTTTCTACTAATCTACAACTCTCTTTACTGAGCGAGACTCCATCCATATCCCTACTA
+GTGGTTCTTTTTTTTTCTATTCTATCATTTGTTTGACAGCTTAAACCAGGCTCCATTTTA
+GAGAGTTTTCGGTCTTAATCAAGATAGGTCAGGGGCGCGTCAGAACGGTCGGTGGCTGCT
+TAGTCTCATCCGAGAATCTCTTTGTACTGCTTTTTTTCAAAGAAAAAAAAAGAAAGAAGG
+GGTTCGATTTAGGCTCCTTCCCTTACAGAGCATAGCTGCGCTAGCAGGTACTACGAGCCC
+TCTGTCCCGCGCATCTAACCAGCTCGCGTGGTTCACCGGTTCCACCGAAAACTCTCATTT
+GTTGAAGCGGAGCATAGTGCGCTTTAGGCGCCGAGCGAGAAACGTCTCTTCTTTCGTTTC
+GATTTATTCACTGATCTGAAACTTTGCACTTGTTTTCTTATTGATTCCAGGGGCGGCGGC
+GTCTATCCCGACC
+>ds2020-328_41
+GCCGTGGACCTAGTTGCCTACCCCCTAAACCACTAGATCCACGGCTGGTACTTATTTACT
+AGGTCCACGGCGGTCGGGATAGACGACGAGAGCCCGTTCTAGTGCCTGAACTACTCCGAT
+TATTATAGGCCTCAAACTCGTGTCCTGCAGCTCTAATTCTTTTGCTATTTCTTCCAACTC
+TCTTTCTCTATCAACTTCCGCTTCTTCTTCGACTATCTCTTCTTCCGTCTCAGCCAGCAG
+CCTTTTCCTCAATTTCATTTCTTCGTGAGCCGCTTTGCATAACTTAGCGTCCTCAGAATT
+AGATGCTGCTATAGCCCCTCCGCACAGCAATGTCTCAGCTGCCACATCTCAGCTACGTCT
+ATCCCGACCNNNNNNNNNNGGTCGGGATAGACGTGTACTGCTTCTTTATCGGATAAAATC
+TGGCCATCTCTCTCGCAGCCGCGCACAGTCTTATTGCCTCTTTCGTAGTAAACTCTTTCT
+TTCCGAATGACTCTGTTTTCTCTACTATAGCTTTCATCCATTCTTTTTGCCCTTCGACTT
+CTTCTCTATTCAGGAGGTCTATTGAGCTATATCGGTCCCAATTATCGAACCTCCAGTACC
+TTTGCTCACCCTCTTTCTCTTCCGAAGCTCCCTCAACCATCGATTTGTTCGCGTCGTCTA
+ACCCGACC
+>ds2020-328_42
+GGTCGGGATATACGAGGCACTGGACTGGAGTGCTTTCATCAAATGATGCATGTGGGCTGG
+GCCATTCCCATCCCAAAGGGCGGCCCGATTCGGCCTGGCCTGGTCGGGAAGAGATTCACA
+TAGAGACTATCGCTATCCGGGAATCTATTTCTTTCTATGTTAGCTAGCGGGGGCGGGCTT
+TCCTATGGTAGTCCCGCTGCGGCCTCTGACCGTCCGTCCCGTCTCATCTTGATTTGGCTA
+TACTTGTATGTAGCCACCCTCCACATGATAGCCTTTTTCTAAAGGCTAAAAAGGCACTCA
+TCAGTCAGCTCGGCCCCTTTCCTATTAAGCTTTGCCACCTTACCTTAAGAGAATAGGTCC
+CGTTCAAGCGCCCCGCCTTTATTCATCTATACCAACTGCCACGCACGACCCAATATGAAC
+GATTTCAGCGCCTCTCTCTAGATAAGAAGCGGAACGCGCCATCACCTACAGCCCTTTCCT
+CTGCCGGGGACTTCCACGAAATGAAAACGGGCGGCATCGTCGTATGCTCGACATTTGTTG
+CCCGGGGTTATCTCCCGGAGTACTCCTATGGCCGATCTGTCACCCAACCAACTTAAACAA
+CCTCAATCGCTTGGCCCCGACCCGTTTGGAGAATGACCCTTATCGCACGGCTACGTCTAT
+CCCGACC
+>ds2020-328_43
+GGTCGGGATAGACGCGCGGGGGGTGTGCCACGACGAAACAAGGGAATTTAAGGCCACTTT
+GCGTTGGATGCTCTTTACCCTCCCCACAATGACGGCTCTGTTGTCTTGGGGAGCGTTGAA
+GCTTGCTTCTTCTCCAGAGTTTTCTTGGTCATCAATATGACCTGTCCTTAATAGAACCAA
+TCTGATTCTCTGAACAATCGGAATTTCGTACTTCTGTCGGATCCTCCCTATCTCCTGATC
+GAGCTTGTGTAGGTAGATGTTGCCTAGTAGGGCCGATAGTAGTACACTGTGTGGGACGGA
+ATAAGGGCCCTTCTCACCTCCTACGAGTCGTCCGGCGGAAAAGACTTTCTGAATGGGGTA
+AAAGAACTTGGGATCGTCGATCTCTTCCTTAAAGATTGGGATGAGTCGATGTCGGTCGAT
+GGTGTGAAAACACTTCCTGATGTCGAATTCCAAAAACCAGCGAGAGGTTCCCCACTCTTC
+TTTGATCCGTCTTAGGGCCGAGTGGCGGCCTCGACCCGAGCGGAAGTGCGATGTGTCTGG
+AAACTCGGGATCGTAAATGAATTCGAGTACCATTCTGATCGCCTCTTTCATGATCTTTTC
+TATAGGTAGAACTACTGTGAGCGGTCTAAACTTCGACCCTTATT
+>ds2020-328_44
+GGTCGGGATAGACGTGGGTGCTGGGTCGATTTATTCTATGGCGAAGCATCCGAAGCATAA
+CTGCACACTCACACGATCTTTGCCGAGAGATAGGAGCATTCGGTGGAACCGGTGAACTAC
+ACTTGCTTCTGGATAGATGTGTGGGACAGAGGGCTCGTGGTACCTGCTGCCCACCCTTCC
+TCCTCTGCTTTGAGAACCGTGTGAACGGAGAGTGGGCAGAAGGGAAGGAGGTCCTCATAC
+GGAGTCGCACACTTACTTGAGCAGTGCGGGAGACTGGGGAATGGGTCGAGCAAACTCCCC
+CTGGGCCGAAAAATTACAGACGAAGCTTTACTTAGATAGGGCTTTGATTTGATTGGTATT
+GATTTTTTCTTAGTGATTGGAAAGGAGGGCGCCGGGGTATGTTATAGAAAGGGAAGGCGG
+AGGTAGTACTTCGAATGGCGAAGAGCGGCGGCTCGGCAGGGAAGGAATGGGAAATCGTCA
+AGGATGACTTCTTTGTTGGCGAAACGAAGGGCTAAATAGCGCCAGTGATTCTCTGAGCCG
+GTCTGGATTTCCAACGCCTCGGGAAACTGGTCGAGATAGATGACAGCACCCTTTTCCTCT
+CTTCCTTACTCTAACAAGTAAGCAAGTAAACTACCT
+>ds2020-328_45
+GGTCGGGATAGACGTATATAAGCCCTGTATAGCGAGACAGAGAAAAGAAATGGTACCCCT
+CCGCCCCTTGCTATTAAGAAAATGACCAGACGTACCTGGTTGCGATCAGATGTAGGAGAG
+AAGTGCGTTTAGGAGCCACCGCATACGTTTACTCTTGAATTAATTCGTGAGATTTGCGAT
+CCCCTCGCAGGTCCTCCAAACCCCCTTGAGTATTCAAAGAAAAATTGTTTGATCATTCAA
+TGGATCAAGCAAGGTGTTGATTTCTCTTTTCAAATCAAGGTCTTCTTCGAAAGAACCAGA
+GTTAGCCGAGGAGCTCGAGCAGGAGTTTCTTAAAAGCTGAAAAACGGAAGACTGGGGCCT
+TTTTACAAAAAGTATGGGAAACCGGAAACGGAATACCTAGGTCGCAGGGCAAGGGAGGAC
+GGAACCCCACTTCGACTCACCAAGGAGAAGGTAAGTACTTTTATATCGTTTCTTCTGAAG
+TGATATAGAGCAATGCCTGGACTGGGGGGGGGGCGTCGGCCCACGGGAAACCATTTGCAG
+ATGCGACCATGAATCGAACCAGATCGAAACATTCAGCTTCGACGGACAAACCGAACCGTC
+GATCGCAAACGAAGAATGGCCGTCTATCCCGACC
+>ds2020-328_46
+GGTCGGGATAGACGCCCCTTAGCCCTGAATGGTAGCATAGTAGGGGAAACGGGTTTGGTC
+GGTTTCTCAGTCATATGAGCAGCAACACTCTACCTCAAAAAGGGCTCTGCTTAGGGAGAT
+CGGGTCGACGTCATTTCTCCGCTATACAACCAGACCAAATGAGAATGATGGCTCTAGAGT
+GCCCTACCAACAATAAGGCGGTTGACGTGACTCGCCAGTTATGTCGAACAGCGAAAAGTG
+GACTTGAATGAGATGCTTCTTAATGGAGGGTGAGTCGGAACCCTGGAACCGGGGAATACT
+GCGATTCGCAGATTCTATTCATCACTTTCCATGAGTCCCCAACCCTCCTGCGCGTATAGT
+CGCGAGAGTAAGCAACCCACTAAGCTCCTCCGTCTATCCCGACCCCGTATCAACCAGCAT
+TTCGACATTTCGGGTAAGATGGAACCCTTTTCTATACCCTTAACCTGCCACGGGTGTGAG
+TGGACCTTTCTCCTCAAGCGCTTCCCAACTCCCCCTATTCCAATCGCTCGTCGCCCATTC
+TCTAAGGGGGCTCTCTCCTGCTCCGTCAGCGTGGCACTCTTCTGCTCGGTCAACCGGGAC
+TGATTCCCCGTTGACGTCTATCCCGACC
+>ds2020-328_47
+GGTCGGGATAGACGCTTGTCCCCCCTCAGCTCACCCTAGCCCCGGGCCTTTTGCTCTTCT
+AACGTAAGCTCCAAGGCTTCACACCAAGTCTTCACTGACATAATATGCATGCTTAAGTAG
+GGTCAGGCAGAACCGCTGTTGCCCGATGGGAACTTCCCCCATATTGCTATCAATGTCTTC
+ATGTCGCACGACCTCTTAACATTACACCACTGAATCCCCAATCCTTTGCTTGCTGTGCAG
+TGACAGTACCAATATCCACTAATCGTTGTTTCCAGATACGGTTGCCGGTTGACATCTCTT
+CTAATTCGTCGATACGAGAAGCAAATTGTTGTGTGGAGGAATCAATATCTCGACATAAGC
+CAAGAGGCAAATCTTGGGCCACTCCACCTGGTCGTATGAAACTGGCATGCATCCTGGCTC
+CGGAGACTCTTTCATAGAATTCCAACAATTTCTCCCGCTCCTCAAAAGCCCACAGGAACG
+GAGTTGATGCTCCCACATCCATAGCATGAGTAGTTAAAGCAAGTGAATGATTTGAAATTC
+GAGTTATTTCACGGAATAACACTCGTATATATTGAGCTCGTAATGGTACCTCGCAATTCA
+AAAGTCTCTCTACGGCTGAAGAA
+>ds2020-328_48
+GGTCGGGATAGACGATGCATATGGGTAGCAAGAGGGCGCTTATGCCCCGACGGTGGGGCC
+TTATGGGGAAGGGCCCAGCCAAATAGGGACAGCACACCCCCCACTTCAAGCGCATCTCTG
+TATCGACTGAATCACTCTAAGAGTCTAGTCGGTGGAACCGGTGAACCACGCGAGCTGGTT
+AGATGCGTGGGGCAGAGGGCTCGTAGTACCCCCTTTTCTTGATCCAGCCTTTTCTTCACT
+TCGGTAGTGAATCACCTACTAAAAAAAGAGGCAGGCCTGCGCGCCCTATTTGAGACTACT
+AAGGCAGGCGGTGGACTCTTTCATTAGGGAAGGGAAGAAGGGGCCTAAGCACGGCAGATG
+CCGTACACTTGAGTGGCAAAGGAAAGCGAGATCGTACCAGTTTTTCCAGGCCTGTTCGGA
+CATATGGTTCCCGCGGAAGATCAAGTTGGTGAGCCGTGTGATGGGAAACCTTCCCGCACG
+GTTCGGAGAGCACTGAATTAGAATGAGAGGTTCACCACCACATCATTGCATGCAAGGGGA
+GCTCGCTCGATTCGCAAATTGGTCCGACTCGTAATTCACTTCTGACCCCGTGTCCCGTCT
+ATCCGACCGCCGTAATTCTCTCA
+>ds2020-328_49
+GGTCGGGATAGACGTTGGTACCCCCTTCATTCAGCTGACGTTAAGAAAACAACAACAGTT
+TGCACCCTCGAACATGCCTAGTGCTCCAAGAAACACCGCTGCCTTTGTGGCCTCATTCGA
+ATCGAACCAAGTTCGCCCTGAACCTGGCCGTTTCGTCCCGACCTTCCGTCCGATGTTTGG
+AATTGATGGACCCGTCCTCGATACCGTCTCCTTGACAAAGAACATCTTGTCTATCGTCTC
+TGACGTAGCCTCTGGAAGCCCCGGAAAAGCCGCTTTCTATGCCGCCGGTACCCTCTTGAA
+TCTCTCGGTCGTTTTCACCTCTACGAGCCAATCCCTGTCTGACGACGATATCTCAAACAT
+GGTCAACCTTCCAACTGCCCTCCAGCAATTGGTAATTGGATACTCTAGAGCGAAGTGTTC
+TCAGGAAAAAGTGGTTCTATTTGACTCTCGAACCGAGGTTTCCCGTCTGTTATGGACTTT
+CGATCAGATCGCAACAACTGGCCAAGTTATGGCTTTGTCTGCCCTGTCCGTCCCCATGAC
+TCCGTCTACCTCTCTTCCCGCTGCAGTCCTTCTCCACAACTTCCTTCGTCTATCCCGACC
+GCCGTAATTCAGATCGGAACA
+>ds2020-328_50
+GGGCGGGATAGACGCGACGGTCCGTTCTAGTGACAGCATTCCTACTTTTATTATAGCTTC
+CGGTACTGGCGGGGGCAATTACCATGTTATTAACCGATAGAAACTTTAATACAACCTTTT
+CTGATCCCGCTGGAGGGGGAGACCCCATATTATACCAGCATCTCTTTCGGTTCTTCGGTC
+ATCCAGAGGTGTATATTCTCATTCTGCCTGGATCCGGTATCATAAGTCATATCGTTTCGA
+CTTTTTCGGGAAAACCGGTCTTCGGGTATCTAGGCATGGTTTATGCCATGATCAGTACAG
+GTGTTCTTGGATTTCTTGTTTGGGCTCATCATATGTTTACTGTGGGCTTAGACGTTGATA
+CCCGTGCCTACTTTACCGCAGCTACCATGATCATAGCTGTCCCCACTGGAATCAAAATCT
+TTAGTTGGATCGCTACCATGTGGGGGGGTTCGATACAATACAAAACACCCATGTTATTTG
+CTGTAGGGTTCATCTTTTTGTTCTCCATAGGAGCACTCACTGGAATAATCCTGGCAAATT
+CTGGGCTGGCCACGGCCCACTTCTCCCTCCGGTGCGCACTCCAATCCATAATACAACCAG
+ATTGAGCGTCTATCCCGACC
+>ds2020-328_51
+ATTGCAAAAGAAAGGGCTTGCTGATAGAGCGGGGCGGGGAGGCGATACTAGTTATCAGGT
+CAGAGAGACGCCTGGCCCGTAAGCCGGCCCCCTTAAAACCCCATTACTTAATAAGGATTT
+GTTACGCGCGATATGCCGACGACTTACTACTGGGAATCGTGGGTGCCGTAGAGCTTCTCA
+TAGAAATACAAAAACGTATCGCCCACTTCCTACAATCCGGCCTGAACCTTTGGGTAGGCT
+CTGCAGGATCAACAACAATAGCTGCACGGAGTACGGTAGAATTCCCCGGTACGGTCATTC
+GGGAAGTCCCTCCGAGGACGACTCCCATACAATTCTTGCGAGAGCTGGAGAAGCGTCTAC
+GGGTAAAGCACCGTATCCATATAACTGCTTGCCATCTACGCTCCGCCATCAATTCCAAGT
+TTAGGAACCTAGGTAATAGTATCCCGATCAAACAGCTGACGAAGGGGATGAGCGAAACAG
+GGAGTCTACTAGACGGGGTTCAACTAGCGGACACTCTTGGAACGGCCGGAGTAAGAAGTC
+CCCAAGTGAGCGTATTATGGGGGACCGTCAAGCACATCCGGCAAGAATCAAAGGGGTATC
+TTACGTCTATCCCGACC
+>ds2020-328_52
+GGTCGGGATAGACGTTTGATCTACATGATACTTATTATGTGGTTGCACATTTCCATTATG
+TACTTTCTATGGGAGCCGTTTTTGCTTTATTTGCAGGATTTTACTATTGGGTGGGTAAAA
+TCTTTGGTCGGATATACCCTGAAACTTTAGGGCAAATACATTTTTGGATCACTTTTTTCG
+GGGTTAATCTGACCTTCTTTCCAATGCATTTCTTAGGGTTATCGTGTCTGCCACGGCGCA
+TTCCAGATTATCCAGATTCTTACGCTGGGTGGAATGCCATTAGCAGTTTTGGCTCTTATA
+TATCCGTAGTTGGGATTCGTCGTTTCTTCGTGGTCGTAACAATCACTTCAAGCAGTGGAA
+ATAACAAAAGATGTGCTCCAAGTCCTTGGGCTCTTGAACAGAATTCAACCACACTGGAAT
+GGATGGTACAAAGTCCTCCAGCTTTTCATACTTTTGGAGAACTTCCAGCTATCAAGGAAA
+CCGTGAAGTAAAAGAAGAAAAGGTAGACCACTAATACTAAGAACCTAACAGAACAAGCAA
+TGCCCCATGCCTTTCTTGGTTGGACCAGCCCAACCGGCGAATTACGTCTATCCCGACC
+>ds2020-328_53
+GGTCGGGATAGACGGGGCAGGTGCATGCGTCGCTTCTAGCCGGATTCTGACTTAGAGGCG
+TTCAGTCATAATCCAGCGCACGGTAGCTTCGCGCCACTGGCTTTTCAACCAAGCGCGATG
+ACCAATTGTGCGAATCAACGGTTCCTCTCGTACTAGGTTGAATTACTATTGCGACACTGT
+CATCAGTAGGGTAAAACTAACCTGTCTCACGACGGTCTAAACCCAGCTCACGTTCCCTAT
+TGGTGGGTGAACAATCCAACACTTGGTGAATTCTGCTTCACAATGATAGGAAGAGCCGAC
+ATCGAAGGATCAAAAAGCAACGTCGCTATGAACGCTTGGCTGCCACAAGCCAGTTATCCC
+TGTGGTAACTTTTCTGACACCTCTAGCTTCAAATTCCGAAGGTCTAAAGGATCGATAGGC
+CACGCTTTCACGGTTCGTATTCGTACTGGAAATCAGAATCAAACGAGCTTTTACCCTTTT
+GTTCCACACGAGATTTCTGTTCTCGTTGAGCTCATCTTAGGACACCTGCGTTATCTTTTA
+ACAGATGTGCCGCCCCAGCCAAACTCCCCACCAAACAACGTCGTCTATCCCGACC
+>ds2020-328_54
+GGTCGCGAAAGCCGCTCCGTGCTCTTTCATTAACTGATATAAATATCGGCTAGTCTACCA
+TATTTTTTATTGACAGAAAGATAAAAGGATGGCTCCATGTGCTCTGATTCATTATGTGGA
+TTCATCCAGGAGCACTACCAAAGTGTTTCAAAGAAGGGTTATCCTGACGTAGGTCTGCTT
+CTGGCCTAGATCAACTTAAGTTAAATGGAGTTTCTATCGCCCTGCTTGAATCAAATATGA
+AACTTCATACACCTTAAAGTTCATAAGATAGGACGAAAAGAGAGTTTTTTTGAGGTCCTT
+ATACTCATTATGCCTGGCATTGAATAGACAGGTAATTCGCCTTATCAATATCTCAAATCA
+ATGATGGGTTCTATATTGGCACCTAAATGGGAAACCGAATCGGACCAAACCCTTTGTCAG
+GCTATTGTTCTCTTGTTTTGTTCCCTAAAAGTCATAGAGTAAGACATCGATTTATCAATA
+AGATCAAATATTTTTTTGATTACATGATGGACTCCTCTGAAAAACATTGGCGCGCGTGTA
+AACGAGGTGCTCTACCTAACTGACCTATGGCGTCTATCCCGACC
+>ds2020-328_55
+ATCTAATACACAGCAACGGCCGCCACTATGCCTTTCGCCTACCTTTTCACCGTCCGGTTT
+CTCCTAAAGCTAGAATTACGGCTGCCAGGTTTGAACCACAGCGTCTGCCGACTAGCCTAT
+CACGAGATCTGCCTTATAGTGTCCAGTTCGGGTGGGATTTTTGTTGTTTTAAAATGTTTT
+TGTGTTTTTCTGGTTTTTTAAATGTTTTTGATTAAAAATTAATATCCACATGGTGGTTGA
+GGGTCAACCGTATAGCCACTGCCTGTTAACGTCAAGCTCATATCTACATCATCACCATCA
+TCAAATGCTATTGTTGAACAGAAATAGGTAGTGGCGGCCGTTGCTGTGTATTANNNNNNN
+NNNTCCGCTATTACTCCAGCTACCTGATCAGCCAAACTGTCGGTATATCCACTTTCCCAG
+GTGAAAGCCGATGCTTCAGAGAACTCTGCTTCTAGCTCAGTAGCAGTATAATCTTCCTAC
+CTCTAACTGTTAGTGGCGGCCGTTGCTGTGTATTAGGGATAGACGGAAAATACTCCTGGT
+CCGTCTATCCCGACCAGGGCCTGATGACGTCTATCCCGGCC
+>ds2020-328_56
+GGTCGGGATAGACGACCAGGTCTGGTGATGTTCAGGTTTGTCATAAATTACAGAATTTGC
+AATAGTTTCTGGTTAAATTTGGATATCGGGTGTGTGTTTATGTTGCTGTCATTTATAATA
+CTTATTGATCATGATCATGATGGTGCGTGGAGATATATACTATAATATGTATGCAATTAT
+AAAACCACTGGCTAGGAGACGTGTATTTAAGATGATCAAAGAATCTTTNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNGGTCGGGATAGACGTATTTGAGGTATTTATGTTCATGT
+CTTTTATAGTTCTATTATGATTGCCTCAATTTTGTTTGTATTTGCAGTGGGATGACTGTA
+GTTACATCAAAAGAAAGAAAATTGAAAGATGAAGACCTGTCTAGCCCAAAAAAGAATGTT
+ATTTCCACACCAAAGAAGGATAAGGATAGACTTGCTAGGCGAAGAAAAGTAAACAAGTGG
+AGCTCTTTGGAAGAGGACACCTTGAGGGCTGGTATAGAGCAGTATGGAGTAGGACGTTAG
+AAGTTAATCTTGACTAGCAACCAGGACCGTCTATCCCGACC
+>ds2020-328_57
+GGTCGGGATAGACGACGATGGACCATGAGGAAGAACGGAACCCTTTTTATTTTACTTTTT
+ATTTTGTTTACCTCTTTACTGTTCAAAGATCAAAGAGAAAACCATTCTGTTATTCTGTTA
+TTCTGTTATTACATTACGTGGATACACATTTTCTATGGGAAACAACATAGACATTGTAGT
+TGTCCAACGAGATACTGCACATACTAAAATATTGTCTTGGCTAGTCATGCGCACTTACCC
+GTTGTTTTATTATTTTAGAAATTTTATTTATGTTCTGCTTGTTTTATTGAACCCATTTCA
+TATCATGGTTCAAACGTTAAAAATCGACTCCGAAGAAGTTCCCGTGGATCATTTGTCAAC
+TGCTCAATCAATGACTTCTATAATGGGTATAATAAAATAATCTTTTTGTTAGCATTCCGA
+CGAAGAAGTCATCGATTCTTTTGATCGGGATTCATATTGAAAATAATCAGAAATCTAGGA
+ATTATAATCGCTTTTAATCGCTTTCGATTATTTAAAATTAATTGAAATCAACACAAATAG
+ATAAAGCAAAGCTCTCCATCTATCCCGACC
+>ds2020-328_58
+TGGTCTGGATAGACGCCCGCTGCAAGTTATATGAGAACTGAGCAACATCCATCAACTTTG
+CCCAATTCCGCTGGTTGGCACTCACATAGTGCCTCAAGTAAAGCTCCAACAAGGCATTCA
+CCCGTTCCGTCTGACCATCTGTCTGAGGGTGAAAGCTAGTTGAGAAGTTCAACTGTGAGC
+CAAGTAGCTTGAAGAGCTCCGTCCACAGCTTCCCTGTGAAGCGTCTATCCCGCCCNNNNN
+NNNNNGGTCGGGATGACGGTAGCATACTTGGTGAACCTGTCAACCACCACCAAAATTGAG
+CCACACCCTTCCGACTTGGGTAGACTCACAATGAAGTCCATGGATAAACTCTCCCATGGT
+CTGGTTGGAACTGGAAGTGGCTCTAGCAACCCGCCTGGCTGCTTCTGCAATGTCTTGTCT
+TGTTGGCATACAAGACAAGTCCGCACGAACGAGTCTACATCTTCCCGCATCTGTGGCCAA
+TAATAAGCTTCACTCATCAAGGCTAATGTGCGATGAGTGAAGCTTATTATTGGCCACAGA
+TGGCCACCGTCTATCCCGACC
+>ds2020-328_59
+GGTCGGGATAGACGCTAGGGGGGAGTGCTACTACTTCACTTTCTTGATTTGAGACCCAGA
+TCATAGAGGAAAATGGGCTGTTTGACGGAAGGCATAGCGCTAGTCCTCTTACGGATAGAT
+GGGACTAGGACCGATATCATGCTATTCTAGAGATAGATAGGCGAACAACGACAAGGAAAT
+CCCAAGCTATGAATGTTCTAATGTTTGCGTCTTTGAAGCTTGTTCCTTTCCCACCCACCC
+TCCATCTTTACTTCTTTGAGTGTGAAGCACATGTTGGCATTCCAAGCTCCTTAAAACTCT
+ATGACCTACTAAATTTTTCTTCTTTCACTCTTTATCTTATAGTTCACCTTAAATTAAAGC
+ACTTCCAGTAAAATAAGGAAGACTCACTTGGGCTCTTATAATCATTGCAGGGTTCGCTCG
+AGTAGAATCATATCCAATCTTCCTGCTAAGCCAATCCCCAGTACAAGCAACTAAATCCAG
+TTCATTCCCAAGGAAAAGGGCTAACTGAATTCCCCTTCTCGAGCGAGAGTTCGGGACTTG
+AGTAGTGGCGGCCGTT
+>ds2020-328_60
+GGTCGGGATAGACGAGAGGGCTGGCTCATCAATATAGTACGGTCCGTGTGCCCTTTTTTC
+TCTTAGTCGCTAATAGAAGAGAGCTGCACAATCATTGGAGTGCCCGGGCATATCAACATC
+CAATTCCTATTCATAAAGCTGGACAGATTCTCTGAAAGTGATCGGACGGGTAGCTAAAGT
+AGAACGAGAGAGATCGGTAAACATAGGGGTTCCAGATCGGTAGACGAGAGGACTTTGACA
+CAAGCTTTTGAAAGCGATTGTGAAAGAAGATTTTTGCCTTCCTTCCAGCTGCAAAGATGG
+CTTTGAAAGCTTCGGCAGGGTCTTTTGATCTGTGCGGAGAATCAACCATTCTTAAACCAT
+TGGTTCTTATTAGGTAAAGAATAAACTGCCTCACCTTGACTTGAATGGAAGGTTCCGCCA
+TCCTCTTACTGAATATGGTCTGTCGAGCAAGAAAGATTCTATAACCCCGAGCTCGTATCA
+AAGCCCGACCACATTGCGTACCCCGAACTAAAGAGGGGACTCCCTGTCAAAGAATGGACC
+TCGTCTTCCCGACC
+>ds2020-328_61
+GGTCGGGATAGACGGTCAGCACCAGTGATTTCATATCCAGTCAAAATTTTGGCTAATTGA
+TCGAAGTGGGTAGCTCCAGTAGACCCATAGATCATGGAACAAATAGGGTGGGTAGGCCCA
+ACCACCACACTACACGTATAGACGCGAACCCCCCTCGTTACCGTACGTGCGACTCTCACC
+GCATACGGCTCGCACAAAGACTCCTAAATCCATCCCGAGCCTTTTCTTCCACCTCTCCTC
+TCCAATCCTCGATCAAACTTGCGTTCCCCAGGCGCTATGAAATGGGGGGGTCTTTCCTTC
+GCCTATCATATGTATCGGCTTGGCTTCGTCCAGAACCAAGGAGGCATTCCGGCGGGCGCG
+TGCGTGTAGGAAGGCCGACCACTACATAAGCTAAAAGACTACGACTACAAGCCAAGCCGG
+AAGCGACTCGCTTCTATTCTCGTTGGGATTGAATATAGATGGGGAATCTATAGATCGTAG
+TAGTTCGCCAACCTCTCTAACTAACATACGATACAATTTCACTTCAGTGCACGGTGTCGT
+CTATCCCGACC
+>ds2020-328_62
+GGTCGGGATAGACGTGAAGATCAGGTATACGCAGCTTTATGGACAGCAGAATCTGTGGGT
+AGACAGGTAATACACGATAATGTAGGTACAAAACAAACTTACCTAGCTAAAGATACACTA
+CTATCAGGATGGCGCCTAACCACGTTCATGAACAGCGTTCTTAACTATATATACTCTAAA
+GCCATAAGTCAAAATATGCTTAAAAGAGGAAACAGTCTTCATAATGGAGATGATGTTCTA
+ATAGGGACGAAGAACTTTGAAGCGGTGCGGAGGGGTCTAGAAATGGCTAACAGGCCTATG
+ACCTCTATCCCGACCNNNNNNNNNNTGAATTAGGCGGTCGGGATAGACGACTGTTTGCGC
+TGGTCGGGATAGACGCAGCTCACCCCTGGTCGGGATAGACGCGACACAGGGGTCTAGAAA
+TGGCTAAGAGGCTAAACGTAAGGGTGCAAAGCACTAAATGTGCCTTTGCTGGAATAGCTG
+AATTTTTAAGAGTAGACCATAAACGGGGCAGCAAGGGCCAGTATCAACAAGAAACTGCGT
+CTATCCCGACC
+>ds2020-328_63
+TTGGGGCGGATTAATCGAAGAGTCAAACTTCTCGTCTCGGCCCTATTAGGGTAAGGCCAA
+TGCACCAGCCAGCCGGGGTGGTGGCGAACACGATCTGCTGTAAGCTAAGCTGTTCACCTT
+GTAGACGGAGGAGATATAGAAAGTGTGCCGTGCGTGATTCATAAGATTATATAGTAACAC
+CAGTATATTATTATATTTCACTTAGCCTGCCTCTCCCATGACTTTCCGGACCAACCAACC
+CGGATCTGCCCTCGCAAGTCTCTCCGCGTTTTGGGAGCAGAGCCTGCAAAATCGAGCAAT
+GGGTCTGAGAAGAATTAAATTTTGAACGGCATGACTCTTTCTATTTTTGCGCCGGCATTT
+GAGTTGTCTCCCCTCCTCTTTCAATCGACACACTCCACACAGATAGCTCCCGTGGCCCCG
+GCTTCTGCCTCTATCAGGCGGCGACAGCCCCTACCTTCCCCAAGAACCCTTTTTTAAGGA
+TTCGGCAGGCCCGTAAAAAAAAATTGGGATACTTCCCCCGAAAAACCGCGGTTCGGCGTC
+TATCCCGACC
+>ds2020-328_64
+GGTCGGGATAGACGTTCAGTGCCCATCTTAACGGTACAAGTAAATTTTATTGATAATAAA
+AAAATAGACGGGGGGACATGCAGTTTCATCTTGATAGTAACTTCTTGATGAGACTCGACT
+CTTACAGTTTCATCTTCAATTCCTTGAGGTTGAGAAGGAGGTTGCTCCTCACAAATTGGA
+GGAGACAGAGAAGGACCCGAAGGCATGCTAGTTGATGATTCATCATTGTTTCTCTTAAAA
+AAATCTTGAATGGTCCTTGATCTCTTAACATTACGATGTTGACCCGACATTATAAAGTAT
+AACCTATTGAATAATATATAGAAGATGTAAACATATACACCCACAAAAATTTCAAAAGAA
+AAGAAGATGAAGAATGGAAGATTACCTTAGGTTGCTTTAATTAAGTCCAAGGACATGCAC
+AATTTTCCTTCTTGTCGAAGAGCAAGAGTTAGGCGCTAGAGGATGCAATAGAGAAAATTC
+TTTTTCTGTCTTTCCTTTTTTTTTCGGTAAAGGAGAGTGACGTCTATCCCGACC
+>ds2020-328_65
+GGTCGGGATAGACGCAGCCGCCTCATCCCTAAACCAAGGAAAGGACCGCGGTCATACTTT
+CTTTTAAACTATATAGGCCTTACACCTGGGGCGATTGATCGATTCTGCCGTTGACTCGAA
+TTCTTCGGGAACGAAGGATACCAGTACCAGACTAATAGAATAGAATCGTCGAGCACTATA
+ATCCGACGGACCGACCTAGTGATAGGAAGAGAAGGAGTAGCTCGCAACTGGCGAGCGATC
+GATTGGGGATTGATTTAGTGCCCTATTACAGAAGGCCGATGGGTAGACCCAATATCTATC
+AGTACTCGTGATCTGGGGAGTACCTAGGGAACTTATAAGGCCTCTACATTGAGGGAAACC
+CTGCTCTACGTGAAAAAGGAGAAGTTAACTTTTGCATAACCTCTGTTTTCATTGGGCATT
+GGAACAATCACAAGTGCAGGAAAGAACTTGTTGATATAAGAAGATCTCTTACCATATGGT
+CTTAAGTTGAGTATAGTACTCAGCAACAGGCATATCCCCCGTCTATCCCGACC
+>ds2020-328_66
+GGTCGGGATAGACGCACGCTTGCCATTTTTATTCATACAGTGAATGTTATTTTCTTTACT
+ATGCTACATGATTGACGGTCAGTTGCCCCCTTGAACTATCATTGTCATAGAAGGGCGCGC
+TACCACATTTTTTACATCCGTGGTTTGTGATCTGTCCTATCAGATTACATGCTCTAGCCC
+CATTTATAGTTTCTCCGGTGTTTGCTGTAAATGCAGTTAGATGCCCTACCGTTGCAATGT
+GCTGTCCTGGCGCGTAGTTCCCGTTGTACCCGTCACGGCATATTTTATCAACTAGACTAC
+CCAAATCATTGGGTCCAACACCACCACTACACAATGCGCTTCCTCTGCAATTTATGCCTA
+ATGCCCGAGTACTAACGTCTGCCACTGGCGTACCCCGCGACTCAATGGGGTTTGCCATAG
+CACACACTACTACAGCAACTAGGGAAGCCCCTAACAATCTCATATTAACAGTTAACATTT
+CTATGGGAATTTCCAGAGGATCTCTCAAAGTAATGTCCCGTCTATCCCGACC
+>ds2020-328_67
+TGAATTACGGCGGTCGGGATAGACGTCATTCAATGGTGGGGTGCTCATAGAAAAGAAGGC
+GTCGCCCAACAAGTGGCGGATTTTGATGGAGTCTCGCTTTGACGCTGGGGAGATCCATAG
+ATCTGGATAGAGTCTCGCCCATAGATAGAGGAAGAGTACGCGCGCTACGGCTTACGCAGT
+TGATCGGATCAGATAGCCCTTCGGGCAACCAACCAAACCCGGCACATCAAATGCCGATCA
+ACAACTGGGAGGTATGGCTGAGTGGCTTAAGGCATTGGTTTGCTAAATCGACATACAAGA
+AGATTGTATCATGGGTTCGAATCCCATTTCCTCCGGCACGGAAGTGGAACGGGCGGGCGA
+AATTACGTGAGAGAAAGAACCTCTTGGTGGAGTCCCCCGGAGGACAGAATAGCACTATTT
+AGTGACTAGGAGCGGAGAGCCCGTTGCGCGTTGTTTTTGTTTGACCGACCTATCTTCTTT
+CTATAAGCAAGCTCCCGCTGGCAATCCCTGTGTCCGTCTATCCCGACCA
+>ds2020-328_68
+GGTCGGGATAGACGAACGCCAACGGTTATCCCGACCAGGAGTACGTCGCGTCTATCCCGA
+CCAGGGCTGTTGACCGTCTATCCCGACCGCCGTAATTCATACACAGCAACGGCCGCCACT
+AACACGGAAACAGACAATGATTTGACTTTATCAACATGGAATAGTGAATTTTCTAAGGAT
+TATCCAGCGACCGGATCGACCAGTTTCGATGTCCTAAACCCTCTCTCAGACGGCTCGGAA
+TTAGAATTGGAAGTGTTAGTGTCATCTGGAAATATCTTTGGAAACTATCCGGTTGAAGAT
+TGGGCAACTATCACCAATTGGATCGTAGATACCATCTATGTCACCGAATTCAGTCCAGGA
+TACTTGACCGTACTTGTACATGATGAACAGGCAAACCGTGACATATGTGTCGTATCGTTC
+TATTGGATTGATGGTTAAAATATATGGCGGAACTTTAAAAACATGCAATAATAGTGGCGG
+CCGTTGCTGCGTATTACGATCTAAGGTGTTTTTCCGTCTAGCCCGACC
+>ds2020-328_69
+GGTCGGGATAGACGCCCATTGACATTAGGTTTGTACTGTCGGAATGAAGCCTCACACACT
+CTGGATAGAACCTTCGTGTCAACCAGTATGTGTCTTCTGGACACCGCTTCTAAAGAAGGG
+TGTACTACTGACGTAATATCAGTAGCCATGACCAAAGTTTTTGACTTCAGTTTGGTCAAC
+CAGGCACAGGATCTTCCTGCATTCAACTCAATTCCAGGTTTATACCCGGAGCAATAGGTG
+ATATCGATAATCATGACTCCATGAAAATCGGTTTTCCGCTCGACACGAAAGGCGGCATCA
+CCTAGATCAACAGCATTGTAATGCAAATACTCCATAAGTGTAGAATACTTATGGTCATAC
+CCCAAACAGGGTGCATCGACAAAGTCAAAATAAATTCTGTCTTTGTCCTTGTCCACATGC
+CAATCCACATTGAAATGATCTATGTGACCCCTGTCCTTAATGTACATCTCGGGATCGATC
+ATAACAGAACAAATGAATTTCATCACGCTTATTTCGTCTATCCCGACC
+>ds2020-328_70
+GGTCGGATAGACGGTTATGATTGGTTGAGGAGGACAACAAAGATCCGGCGGGGAGACCAT
+GATCCCCATCTGAGCGGAGGTGCCATATGTGCTTGAGCAAAGCTGCATGATTCAAAGATT
+CCATTTTGGAGATTCCTAGGCAATCTAGAAAGACAGACCGTAGCCCAAGCAACCTTGGCC
+CTTCTATGGTCAAGATCACTTCTAGAGAAAGGCATGGAGAATATGCTAAACCCGCTGGAT
+TACTCCTTGAGGAAGGAATAAAAGAGAAGACCAGGATGGCGAAAAGGATAGAGTTAACTA
+ACTGTAACCTGCCCGCGAAAGAAAGAGCCTTACTAGCCCAACAACTGATGCCTTTCCGAC
+CGGACTATAGATAGGCCTTACGCCCAGACTGAACTACACGATTGAAAGCCGTTACGTTAG
+CCCGCAACCAGAACTTCTTGCTTACTTCCCTCCGTAGCCAAGACTTTTCTTACCTTTTCC
+ACTCGGGTAGCTCACTCTATATGGCTTGTTTTTTGGGAGGTAAGCT
+>ds2020-328_71
+GGTCGGGATAGACGGAGACTAAGAGTGGGCAGAAAGTCGAATGACGGGGGGCAATACCTA
+CCGAGAGCTATAGCGACGTTAGTGCACTCGCGGATAGAGAGCGGACCAGCAACTTCATTA
+GCTGATGCACTGAGATCAAACGAAATACGTCTGTATGAAGCAATAGAGCGGGGTATGGAC
+GCCGAAATAGCATTGAAACTACGGTCGTTGTATATATCACGAGTGGCGCCTTTGTACGGT
+AATAACAGGCAAGAAGCTATGGAGCTATTAGAGGCGTCGTCTGTAGTAGGAGGACTGAGT
+ATGGACAGGGAGGCCAGAGTAGACAAAACATTTACGGAAACTGAGCCAACGTCGAAGGAG
+TCTGACGAAATAATGAACTTGGCGGGACACAGAAAATGGAGGGGAGTGTCAGACATGGCC
+AACGTGGTACTAGAAAAAATATCTGAACAAGGAGGAAGTGCCATAACGATAAAAAACATA
+ACGAAGCGAATTTATAATTATAAGCTGAGTGCGTTGTCTATAAAAA
+>ds2020-328_72
+GGTCGGGATAGACGTTGCCCTCCCCTTTCTCTCCAGCCCGAACCTACCTCTCTCCCTATT
+CAATGGTGCCGCCTTAACTTCCGTCTTCTTGATGCGAGGAGCGTAGTAGTTGATGCGGGT
+CTGTATAACACGGTCCGCCTCTGCTATACGCTCAGTTAGGGCGTTCATCTCCTTCTTGTA
+TTCCTGAACGATGTAGGCTTGCTCCCCTTGAATACGGCGGGCGGTTTGATACTCCGCCAA
+CTCTGCCGCGCTCAACGTTGAATCGTCCACCGTCATATTGCGTCTGGCCGATACAATCTT
+GTAAAAAGCCATTATACATGGTACGGCCACGCTGGCGTGCTTAGCATACCAGACGGCATT
+CTCCGGAAGAATGTCCTGAGTTTGGTACATCTCCCTCAACCCCACTGTCCAGCGCTCCAA
+GGACTTTTCGTTGCCATTGAAGCTAGCACGTGGTTCCCTAGACTTTGCTGGGTCGAAGTC
+TTGGATGCGGGCCCACTCCATCCACACGTCTATCCCGACC
+>ds2020-328_73
+GGTCGGGATAGACGCGCGGCACTGCTATTGGCATAACAACCGGTACACCATAGGTTGGCC
+CAACCCAGTCCTCTCGTACTAGGGTTGGCTCCTCGCAGTTCTCCCTTTAACACCAACGGT
+AGATAGGAACCGAACTGTCTCACGACGTTCTAAACCCAACTCACGTACCACTTGAATCGG
+CGAACAACCGAACCCTTGGGACCTTCTTCAACCCCAGGATGTGATGAGTCGACATCGAGG
+TGCCAAACGACTCCGTCGATAAGAGCTCTTGGGAGTCATCAGCCTGTTATCCCCGGCGTA
+CCTTTGATCCGTCGAGCGAGAGCCCTTCCACACGGGACTCCCGGATCACTATGGCCGACT
+TTCGTCTCTGTTCGACCAGTAGGTCTCACAGTCAGGCAGGCTTATACCATTACGCTCAAC
+AGCAGAATCTTAGCTTGAGCCTACCTTCGCACACCTCCGTTACTCTTTAGGAGGCATCCG
+CCCCAGATAAACTACCCACTACACGCGTCCATCCCGCCC
+>ds2020-328_74
+GGTCGGGATAGACGAACAACTACCATCTCGCTCTTTCCTTTTTTCGGTGCTACCTTTTTC
+TTTCTAAGGGATGGGATTGGGATGTATAATAACCTTTTTTTTGAGGATGCCCGGGAACAA
+CTCCTAGGTCAATTAAGGATCAAATGTTGGAACCTCATGGGTAAGGATAAGGTAATGGAA
+TTGATAGAGAAATTCATAGACCTAGGTAGGATAGGAGAATTGATAAGGGGAATAGAGATG
+ATGATAGAGATCATACTGAGAAACAGAATAATCCCGTACGGGTACAACTCTTATTTGAAC
+GAAGTGAAAAAAATGCGATCTTTGTTGTCTAATAGAACAAACACTAATACCTTAATTGAG
+TCGGTCAAGATCAAATCTGTTTATCAAAGTGCTTCTCCGATTGCTCAAGACATCTCTTTT
+CAACTGAGAAACAAAACAAGATCATTTCGTTCCATTTTTAGTAAAATAGTGAAGGATATT
+CCATTAGTAATGAAAAAAGTGTTTCGTCTATCCCGACC
+>ds2020-328_75
+GATCTGAATTACGGCGGTCGGGATAGACGAAATGCCCTTGTTTCTATCCGACCTAAAGGT
+TGGGCATCCCCAAGACAAGAGAAATATCAGTCGGTGAGGTTCGGATCGATCGGATCAACG
+GGAGCGAAAGCTGCTCGGAGAGAAAAAGAAAGTATGGCGTCTTTGGTCTTCTATGGAAGT
+CTTGGCTGAATCACTTGATCCAGTTAATCAAGAATCTTCTGACGAATAAGGATTGGAATT
+CACATCTGAGCAGTAAGGGAGGTGGAAGGACAGCAAGGTGGAGTAGTGGCGGCCGTTNNN
+NNNNNNNAAAAGTAGTAGGATTCAGAGAAAACCCAACGGCGGAAAACCGCTCCCCTTTCA
+GTCGAGCAAGTAGATTCAGCGATTATTGCTATTCTTTAACGCCCCCCGAAGATTCATTAA
+CATTAAGTAGCGTACGCCTGGTTCACCGCTAAATACACGAAAGAAGAACGGCTCTCCCGT
+TTGATGACTAAGGGGAAAAAATCGTCTATCCCGACC
+>ds2020-328_76
+GGTCGGGATAGACGAACTCACCGCTTCTATAGCCCACAATCTTTGCTGTGCATCGTAAGA
+TGAGTGGTCCAATGACACCCTCCAAGCTTTAACTTTGTTATGTCTCTCTCTCTCCTCTGC
+TATCGCGGCCATTTGCACTACATCATCTTCCGCAAATTCGCCGAAGTGGTTTATTCCTAA
+GCTCATGTTATTTCTGAATCTCGTCATTTTCAACATCTTATCCATCACCGAGAATAGGCT
+CAGCTCCACGTCTATCCCGACCNNNNNNNNNNGGTCGGGATAGACAGTTGTTTGCCCTGT
+TAATCTGCTTGTCTTCTTCTTTTCTACTCTTCTTTTAGCGAAAACGTTGGCAGCGACCTC
+TCCTCCTTTGGCTTTGCCGTCTATGAGCATGTCTCTTACTGCCTTCACTCTTCTGATCTT
+TCTTGGCAGATAACTAGCTATCAGTGGCAGTCCTGATCTGTGTCTGTCTATTATTCCTGA
+TGTCGCTTTGTTATTCGCGTACGTCTATCCCGACC
+>ds2020-328_77
+GGTCGGGATAGACGCTCGTTCTCTCTCTCTCTCTCTCTCTAGTTTTGCTCGGCTGAGAAC
+CAGCCAGCTCTCTCCTCCTCTCCTAAAGCCCTCTTCTCTTTATTTACAAAGGCTCTCAAG
+CCTACCTCAATGTAATACAACTCTCTATACATATATACAAACACAACAACCAGTGGATGT
+AGCCCGAATTCATGGGTGAACCACTCTATCTCTTCGTTTTACTTGTATGATTGTGATATT
+ACGGCTATCCCGATTTTATGGGTTCAACATTTGGCGCCGTCTGTGGGAACCCGCACGAAA
+GGCATGTGTTCTCATTTCTCTTAAAACACCTCATCTCTACCAAAAACAACTATCCTCATG
+GTCCCAGCACTCTTAGCCAACCAAGACAAGCAGAAAAGGTCACGTTCTCCACACTCCAAA
+ATCTGCTCAAGACACCCATGTGTCTCCTTGGCTCATTCTCTCCCTCGCGCAGCTCTCATC
+CACTTCAACATCCCCTGCGCACGTCTATCCCGACC
+>ds2020-328_78
+GGTCGGGATAGACGGTGACCTCTCGGGAAAAAAAAACAACGCAAAATCGAAAGTCCAATA
+TAGATATACAACGCCCCTTACGAACAAGAAAATCAAGTGGCCTTTGTTGAAGGCTTCTAG
+AGTGAGGAAAGGTTCTTAGCCACCGGTGACCGGCTTTCAAAAAAGCACCTTTGGGCGGAG
+GTTTCTCGATAAACTATCAGGGGCTTGCAACGTCTATCCCGACCNNNNNNNNNNTTTATA
+TAAAAAATTTTCAGGCCAGTCCTTTGCTTTGTACCAGAAGAGTGCGGCAAGGAGGAGATA
+CTAAGCAATCAAAGGGATGCAAGCAAGGAATTCGGCCTATTGGATTAAAGCAAGGAAGCA
+AGAAAAGAGATAAGCGTTAGAAGGAGGTAGGAAGCTCTTGCTATGCCGCACTCTCATACT
+TTTGAGTAAGGAATTCCCTGCAGGGCGGTTAACGGCTGTCGGATAGGGCATCGGGAAGAA
+CATATGGAAAAGTAGCGTCTATCCCGACC
+>ds2020-328_79
+GGTCGGGATAGACGATTTGCTGGCCTATGAATGTGGTTTCGATCCTTTCGGTGATGCCAG
+AAGTCGTTTCGATATACGATTTTATCTTGTTTCAATTTTATTTATTATCCTTGATCCGGA
+AGTAACCTTTTCCTTTCCTTGGGCAGTACCTCTCAACAAGATTGATCCGTTTGGATCTTG
+GTCCATGATGGCCTTTTTATTGATTTTGACGATTGGATCTCTCTATGAATGGAAAAGGGG
+TGCTTCGGATCGGGAGTAATCACTAGTGATAGGGCAAAAATAGGGGGGAAGGACAAAGGA
+AAGAGCGATGCCCACATTAAATCAATTGATTCGTCATGGTAGAGAAGAAAAACGGCGCAC
+GGACCGTACTCGAGCTTCGGATCAATGTCCCCAGAAGCAAGGAGTATGCCCGCGTGTTTC
+AACGAGAACACCGAAAAAACCAAATTCAGCTCCACGTAAGATAGCCAAAGTACGTTTGAG
+CAGGGACCGGTTTCGTCTATCCCGACC
+>ds2020-328_80
+GGTCGGGATAGACGCGCATCCCCCTGGTCGGGATAGACGTACATTGGGGCTGGTCGGGAT
+AGACGTCTAGGGGCCATCATAGAAACATAGATAGGGTCAACGACGGAACGAACAACGAAA
+CTTTACGACAGCTTTTTCGTACACGTTCACTTGCATCACATACACAAGTGCTCTCTGAAC
+CGTGCAATAAGGTTACCCATAACACGGCTCTCCCACTTGAGTTACCTTAGCCCCAGGCCA
+TGCTATTCAATGATATTGGAAAAATGGCAGCGTAACGTAACAACTAGTATTGAAAGCAGG
+TCGCCTTTTGAGGGATGGAAAGCGTTTCAATAGGAGCCCAGCTTCCCTCTTTGCTTTGCG
+ACCTCATCACTTCAATTCAAGCGCAAACCAATTTCTTTCTTAGTCACCGGGCGGGAGGTG
+AAGGCCATAAGAGAAGATTGCCCTCCCGGTAAGGTAGTTTACTTGCTTACTTGTTAGAGT
+AAGGAAGAGAGGAAAAGGGTGCTGTC
+>ds2020-328_81
+GGTCGGGATAGACGAAACTTCCAATTTGTAAACGTTGTTTGTATTCTGTTAGATGCTCTG
+ATATTGCCCTGTTAGGATTCGGTATTTTGAGGCCGGAGGCCATGGGTTGTTAACACTATG
+CTTGTGTATTGTATGCTGGCTGTTGGGTTGTAAATATCTGTGTTTTTGACAGGTTTAAAT
+TTTGGGATTTGTCCTGTTTACAGGGGAGACTGCCAAATTTTTGGTAGGAAGTCTCGGTTA
+TTAGTAAGTGGGCCCGGCATCTAAATAGTGGCGGCCGTTNNNNNNNNNNATTCCGGGGCG
+GGTCCTGTCAGCTTGGTATCAGAGCATTAGGTTCTTTTCCTGTGACTTCCATGCTTTCTT
+TGCATGTTATTACTGAAGATTTTGTGGTTCCTTTTGTTTAGAATCATGCATCGCCGAGGT
+GCTCGGTTAAGAGGTCGTGTTCCAAGATACGGACCGAATCCTCCACCTCCATCTCCGCCA
+ACCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_82
+GGTCGGGCTTGACGTACGGAAGCCATATCCGAAGCTAAAAAGATATTAGCGAGACTTAAC
+CAAAAAATAAGTAAGAAGAGGTTGGTGGAGGCGCTGGCCGGCGGCGAAATCGCTGTGGTG
+GCGCTAAGCGAACTGATGTCAACTCTAGGAATGATACCCATAGACGAGGCGCTGACTGCC
+GAAGCTTGCGGGTCAACAAGCCCAATCGAGTGGGGAAAAGAAGGAAGAGAAAGAATAATG
+AGCGAAAGAATAGAAACGTTACGTGAAGCTGCGTCTGAGCCTTCGGCGAGAACGACGACG
+CTATTTGTAGAAGAAAGGTGACAAGAAGAAAACATAGGAAGTACGCGGCTGGGTGCCAGC
+GAAAGAACGGAAGGATAAGCAAACAGAGGAGAAGAAGTGGATGGTGAAAAGAAAGAAAAG
+AGAAGACAGACAGCGGTCAGTTGAATTGGACCAGAGGATCGGAAAAGAAAGGGAGGTGTG
+TCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_83
+AACTGCTACATGCACTACCATGTAACAGCTCAGGCACTGTGGACACATTGAAGCAAACCG
+GCTCGGACGGGTGGCTAGGACCTACGTGTTTCACCGAAAATAGGCAAGGTCTGGAAAGGA
+TGGCTGGCATGATCAGAGTAACGAGAGAGCTACACTTAACCGATAGGAAGTTGGCAATGT
+TGAGAAGAAAAGTAGATGTTCTAAAAGATACTGCATGCCAGGAGTGGTTGCAGATGCATC
+TCAGCGGGTTGTTTCGTCTATCCCGACCNNNNNNNNNNGATGCAAGGATGGTATGGTGTG
+GTGCTATCACTACTATGTTGTGTAATGATACAGGGAAAAATCTACACATGTGGAGAAGGT
+CATATATAAGCTGTATTGAAGAGATAATAACTAATGCTGCAGTGTGCTTCGAGGCTGCCA
+ATAATGGTGTGTCAGCATCCATTTTAATAACTCGGGGAGCTAGTGCATCATGCCATACCA
+CAATTAAACGTCTATCCCGACC
+>ds2020-328_84
+TCGGCGGTCGGGATAGACGGGTAGTTCGGGTTTGATTGTGTCATAGCTCTATGATTCGGA
+TTAGGTTTATCGTTGGATGAACTGCATTGCTGATATTGACCCTAAAAAAGAAACGGTAGG
+TACAGCTAGTCCGTGAACAGCCAACCATCGCACTGTAAAAATTGGATAGGTTCTATCTAT
+AGTCATTGGGGCCTCCTAAAAAGATCTACTAAATTCATCGAGTTGTTCCAAAGAATCAAA
+ACGGCCAGTTATTAATGGAATTCCTTGTCGGCTTTCTGTAAAATACTCGTTTGGACGAGG
+GCTTCCAAATACATCGTAAGCTAAACCCGTGCTGACGAATAACCAACCCGCAATAAATAA
+GGAAGGTATAGTAATGCTATGAATGACCCAGTATCGAATACTGGTAATAATATCAGCAAA
+AGAACGTTCTCCTGTGCTTCCAGACATGTTGAGCTCCGCATATTCTTGTACAGTCAGGGG
+AGGGGGTCGTCTATCCCGACC
+>ds2020-328_85
+GGTCGGGATAGACGAATTCACCTCCTGATTTCTGGTTACTATCCACCTCCTTTCTCCCAC
+GGCTAACACTAAGCAGTCTACTATCAGCCTGATCTCCAGCCCTCCAGCCTTAAACAAAAT
+AGCTCCGCATTCTTTGATCTCCTCAGTCCTGAATTCTTCCAGCCCTCTTACTATTTCCAC
+CACCGCTTTTCCTTTCGCGCTCACTAATACGTCTGTCGATTCATCGACGATCACTATTTT
+TTCCGGCTCAGTTTCCGGATAAAACAGCATGTTAGCCCATTTAAACATGGACCATGGTTC
+GTATGTTATGCTGCTTTCAGCTATCTCGATTTCCACTTGTCCTTGAGCCTTTATTAGTTC
+GTCTATCACTTCTATCTCGAGGAACACCGACTTCTTCAATATAGCATTCCCTATCCATTT
+GTTCATTCGCATCAGCGGAACTCTCTCATTCCTCGCCATTCTGGGGAACATTTCTAGTAT
+GTTGTGGACCATCA
+>ds2020-328_86
+AACGGCCGCCACTACTATTCTTCATTTAGTACTTAAACCGGGAAAGTCCTTCCTTTCCTT
+CTCTTTACGAAGCCTAATCCGCTGAATAAGGGGAATTTGCTTTCTCCTGCTAGTTTACCA
+AAGCGGATCATATGGCTTTATTTTTCCCCAGCTGCTACTCTGAAAGTGCCCTTTCAACCT
+TCAATTGCTTCCTGTGCTAGCGGTTGATGTGCTTTCCTTCCAGACGGCTACGAACTTGCT
+TAGCCCTCTTCTTATTCCCAGAATCCTTAGCCTCTTCCTAAATAAGGCCCCTCCCTAGTC
+CTTATTCTCTATTCCTTATAAAATGAAAGATTCATTCTTTAGCCAGATCAACATCCTTCT
+TCCTATTACCTATCTCCAGATCAAGATCCTAACATGATTTAAGCCATAACTCTACTATGG
+AAGTACTTAGTAATCCTACTTCCTATTCACTATCTACTTCCTTCGTCAGCCTTCCTGCTC
+GTCTATCCCGACC
+>ds2020-328_87
+GGTCGGGATAGACGTTCCTTGTTGCTTTTCTTACCATTATCTACAGTCCCTACAGCACCA
+CTTTCATTTTTATCACTATTTCCAGTCATATTCATTCTGTTACTGTTAATCCCCATTGTT
+ATTTTCCACTGCTCTGCCGTTGTCTCACTGTCCCATCGAAATCTTTGTGCTGCTCTTTCG
+AAACTCTTCTTCCATAACGCCTGTACTTTGCTCGTCTTCACTCCTCTCCTTTCTAAGACT
+GCCAGATTGGAGTATATTTCATGTAGTTTACTGTCAAATCCAACCACTCTGTCTGTTTCC
+CAGTTACCACAGACAAAAGTAGCACATGATCTAGCCAAGCACCCTCTGAGTTTGCCGTCT
+TTACACCCTAGAACACGTAGGTATTCATGGTAAGACTGATCCGTAAGCAACTTGACTTCT
+TGCCCCTTAAGATTACATTTAGTGGCAACTTCATTCCAAGCTAAAGCGCAATGCCGTCTA
+TCCCGACC
+>ds2020-328_88
+GGTCGGGATAGACGGGGTGCTCCTCTGTTTCTCTCACCATGAATTTCATCGACTCTTTTA
+TCATTCTCTCTGTTATTTTATCGAATTCTTTCTCGCTTGCCACTTTCCCAGTTGAAACCA
+TCATGCTTATTGAGCTCGGCGCACAGTCTTCGTTGTCTAGAGCTATTAGATTGACTGCCT
+CCACCATTGCCAACGGCCATAGATACGCCGCGATTCTAATCAGCGCATGTGCTATTGATA
+TAANNNNNNNNNNGGTCGGGATAGACGAGCCGCTAATATCCAATCTATTAGTACCAGCGA
+GCTTACACCGACGCTCGCCAATATGGACATAGTTGTGGCGCAATAAGCTGCATAAGACGC
+AACCCCTATTGCGCTGGCTCTCAGTGCTATATTGTATGCCTCTCTATTCTCCATGTACAC
+ATTTATGTTATCTGCTGTGTGTTTTCTCTCTGACAACACTCCTATTCCACGTCTATCCCG
+ACC
+>ds2020-328_89
+GGTCGGGATAGACGCATGGGTTGCATAGCGCAGCCTGGAGGGAGGTGCTGCTTCAGCACC
+TTAGACATGGGCCAGATGTCTGTAAGCTACAGTGGCTACACAGGCACTGACATCAAGACG
+GTATCTGTGTATGATTCTGACCCGCAGTATGGGTGTGGTACTGAAACATCATCAAAGTAT
+GGCACTGCAACGTCAGGTTGCGTGCCCGGCGATGGGTACGCTCACTACGGAGGTTCTGCA
+TGGATAGATTGCAAGACCATAATGGCGTGTCAAGAGTATTACGACGACATAGCAAAGCGT
+GACGCAGGAGATGTATCATCAAATCGAGGTACCAACGTCACTGTTGTCAACGAGAGTCCA
+GCAGGATTCATGTTTGTGTACGACCTGTTGATGTTCATCAACGGGCAGCCCAGACCTCAA
+GGTCACGAGAAAGCCTACTTGTTCTCAGTACCAGAGACCACGGACCCGTCTATCCCGACC
+>ds2020-328_90
+GGTCGGGATAGACGGGTCCGATGCCTGCTGCTTCATCTGGGAGAAAAGAATCATAGATAT
+GCCGGTCATTAGAAGGAAGAACCGCCATAAAAAGATTCCTCGTGTATCATCTGTAGCAAA
+ACTATGAACGGAAGCTAGCAATCCGGACCGTATTGAAAAGGTTCCTGAGACACAGCATGG
+AAGAGTCACAATATTAAGAAACGAGGTCCAAGAATGAAGAAGGGGTAGAATTACTGAATG
+AATACGAGCTGTGGCTAATACCCGAGGCATAAAAGAAGCATTTTCTACGGGATCCCGAAA
+CCACCAGCCACCCCGACCTAATTCATGATGAGCCCACCAACTTCCTGGCAAGATGCCTAC
+GGTTAAAAACCACCGACATGTCAAGATCCAAATTCGAATTGGTTCCTGGTTTTGGTCAGA
+GACCACTGTGTTCGCGCCGGCAGTCCAACAATGAGGCAGCTTCGTCTATCCCGACC
+>ds2020-328_91
+TCCGATCTAATTACGGCGGTCGGGATAGACGGCTCGGAGCCCTCAGAATGTCAAATACCA
+AACCTGGTTCATAGATAAACCAGGCCTCAGTCCAGTTTTCGTGGGTCAGCTTGCAGGCAT
+CAGTTCAGCTATTTACACAAGTCAGATGAGTCGACACCCTTGATAGAAGTTGTTCCAATG
+GGTGTCTACTATAACATATCCAAATTTCAGCCCAATTGGATAAGTCTGGAGCCCTCAGCA
+TGTCAAATACCGAACCTGGTTCACAGACAAACCATGTGAGCTCACAGCAAAGCATGAGCT
+GCCACACATGGAGGCAAAGCATGAGCAGCTGTTGAGCCATGTGCTTAAAGCAGCCACACA
+TGGAGGCAAAGCATGTATCAGCTGCAAAGAGAGGTGTTGTGACCTAAGATGAGCTGCCAT
+GCATAGGAGACAAAGCATGAGCTGCCAAGGGGGAAAAATCGTCTATCCCGACC
+>ds2020-328_92
+CGTCATTGAGGAACAAATACTACTCGAGACAATGCGAGCGATTGCACATGACAGTTTCGG
+ACTGTTATAAAATAAAGACCTCCCACAGGTGTGTGGGGGGCATAAGTGAAGACAAGAGAT
+CGGACGTAAAGTGGATGATACGGTCGTCGGGCTTCAGGAAGGGTGCCACGCAGATAGGCG
+TGTTACCGGGAGTGGTGGACTACTCCAGGATGGTGAAAGCATCACTACAACTTGAAAGAC
+CTTTGCAGGATTTCATTTCACGAATAATGCGCGCAACATACGACGCGGTGATACCAAAAG
+AAAGGAACATAAACGTTTCAAGGAATGGTAACATCAAGCGGTACGAGATTTTGCGAGCGT
+TATTCAAGGTACACAAAGAAGAAACAGACATAGTCAATTACGGAAAAGCCAAAATGACCG
+GCTTCCTGATGGACGTGTTGAATGGGACCAATTATTCATAGTGGCGGCCGTT
+>ds2020-328_93
+GGTCGGGATAGACGAATTTTCTGGTGAGTTTATAACGCTTCCTTTCGTTATCGATCGGTT
+AAGAATGACATTCGATTTGGAGGATGATTATTCATTCTCTATGGGTGATTGTTCATACGA
+TCTGGAACTCACTGATGCTCAACTTGATTATGTTGAAGTTCTTCAACAACAGAAAGATTT
+CTTTTCAGAAAGTCTTGGTAAGGTTGTTGTCGATTATGATTTTTCCCTTGATAGTGAAGA
+TCCTTCCATCAAGGATGCTGTGAAAATACCCGATGAAATTCCGGAAGATTTCCCTCAGGA
+AAGTATACCAGCTGAAGTTGTAGCTGATGTTCCACAATCTGTTAGTGATGTCGTCGAAGA
+GCAAGTCGTGGCTGGAGAGTTGATACCTAGCTGCGAAACTGTCAATGAGAATGTTTGTGT
+GGAAGTTAAATACCCCACAAGCCTTATCCCTAGATTCCGTCTATCCCGACC
+>ds2020-328_94
+AGAAGTGGGGAAAAAGTAAAAAAAAATCTCTTCAAACCTGAGCTTTTCGGTTCGCCCCCC
+CTATGTGGTCGGTCTTCTTACCAGTCTGCCTCCTTTCTCTTGATGGAATATAAAAAAGCC
+CGAGCTCCTGCTTTGCTTGCGCTCTTCACTGGCGCTCGCCAGATGTATCACTCATCCCGC
+TCCAAAGGCAAGGAGTCTTCTGTATGTTAGAATCTTTACGGGAATGAATCGCATATGTTG
+GTTGAGAATTGCTCGGGAATTCATTTATAGTTATTTTGCCAGGTTCTAGGGTTGGGCTAC
+TCTTCTTTTTTGTCGATCGAGCCGCTTTCCCTCATTCCACTCGTCCAGCCTTCTTCACGA
+ACTTGTACAATCGATGCCACAAAGATAGACAACTCTATTATCGACGAAATAAGGAAACGG
+GGGACGGTTTGGCACCAGATATCCAGGGTAACCGTCTATCCCGACC
+>ds2020-328_95
+GGTCGGGATAGACGGGACTTGTTCCCACTTCAACACAGCGCTCTATAGGTAGGCAATTTT
+TTTGAGAATTTTGGTCCTAAAAGTAGCCGAGCTCTCACAAATAGAATTGGAGTACCACGG
+AGAAAAGCTAGCTGGATAAACAAGACAGGGATCGCCCGCTCGGCAATGCTGCCTTGGGGA
+GGAAACAACAAAACACTTTAATATAACAATTAAAAACTCATATTCAAAAGCTTTTCGATA
+TATGAACAAGATTACTATAAAAGAGTTGGTGAACATTGTTCTGACTCATAGCTCTAAGAT
+GACTAGCATGAATAAGCCAGCTTCAACACCACCTATACTCTTAATCATAGACAGACTTGC
+ACCGACCTCAACATAAAAGGATGAGAACGGCCTGTCTATTTATATGCCTTGGCTTAACTC
+ATTCCTATACACTGCAAAGAACACAAAATTAAAACAGCCTGG
+>ds2020-328_96
+GGTCGGGATAGACGTTTAAGGGGCCTGCACAAGCGGTGGAGCATGTGGTTTAATTCGATA
+CAACGCGCAAAACCTTACCAGCCCTTGACATATGAACAACAAAACCTGTCCTTAACGGGA
+TGGTACTTACTTTCATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTT
+GGTCAAGTCCTATAACGAGCGAAACCCTCGTTTTGTGTTGCTGAGACATGCGCCTAAGGA
+GAAAGTCTTTGCAACCGAAGTGAGCCGAGGAGCCGAGTGACGTGCCAGCGCTACTAATTG
+AGTGCCAGCACGTAGCAGTGCTGTCAGTAAGAAGGGAGCCGGCGCTTTTCTCGCTTGTTT
+AGTAAAGTCAAGTTTTTGGCCTTATCTTGCAGGTGACGACGACGTCGAGTTGGCGGCGGG
+GAAAGACTCGGCATACAGGCGAGTATCGTCTATCCCGACCG
+>ds2020-328_97
+AACGGCCGCCACTAAATTGTCCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCC
+GCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTT
+CGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTA
+TGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTC
+AGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTA
+TACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTC
+CATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGGGCCTGAAGGTGTCTCTGTACGCA
+TCTATCACTGTTTTCATTGACTGTACACTATGTTGACTGTT
+>ds2020-328_98
+AACGGCCGCCACTCTTGGGTGTCTATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGT
+CGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCG
+TGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGA
+GTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACA
+CTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACT
+GACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAG
+GGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCT
+GTCCCGTAGATAGCGCGGAGTTTACGTCTATCCCGACC
+>ds2020-328_99
+GGGCGGGATAGACGCTTGGTGATACTTACTTCACTTCGTGAGGAGGTGAAGGACGTAAAG
+GGAGACTGGGCCTTATGCAAGGAAGCTGTCTTGAACAAGACCCGGACTCCGAAGGAACCC
+AAAGTGCTGGATTCTTTCAAACCCAAATCCTATAATGGGAAGAGGGAGGCGAAGGAGCTA
+GACACGTTTTTGTGGAATATCGAAAGATATTTCAAGTATCTGAAGCTCGAGGAGGACGAG
+CCGAAGATCAACACGGCAACATTGTTTCTCACCGACAATGCTCTCATGTGGTGGCGACGT
+CGATCCATGGAAATCGACCAAGGTACGTTTGTACTAGACACTTGGGATGCATTTAAAAAG
+GATATTATGCTGCATTTCTATCCAGAGAATGCCAAGTATGAGGCAAAAGAGAAGCTGAGA
+TGGCTAAAGCAGACGGGGATGTTCCGTCTATCCCGACC
+>ds2020-328_100
+GGTCGGGGTAGACGGCGAAGAGAGCTACGCCACAATGAATGGTAACAGATGAATTGAAAC
+TAAAGCGACGGGTGTCAATTACCAAAAACGACTCGACCACTAACTCAGTCCCGCGGGTAA
+CACAAGGCCGAAGATGGATGCGAAGAATATTTGAAACCGCTCTCGAACCATCACACGGAT
+TCCGATCCAACTGCCCATGATATGGTAAGAACGAAATGGAAAGGCAAAAAAACGATTCTA
+TGCGCAGACGTGAAAGCTCTATCGATAGAAGCATTCTAGCCTATTTTGATTTAGAGAGGA
+GCGATTCCCTCGTCTGAGAACCGCCATTCCCGCACTATTCCTCCCCACTAAAAAGATTGA
+TAATCTCGATAACCAAAACAAAAATGCAGAAGTGAGCGTACCCCACTCCTCTCTCCCCCC
+TTTTTAGCCAACCCCAAATAACGTCTATCCCGACC
+>ds2020-328_101
+GGTCGGGATAGACGGTCGGCTGGCTTGAGAAGGAGGTCGGGATTTTCCATTATCAGAATA
+ACAGAGCTTTTTTTGTTTGTGACAATCTGGAGGAAGCTAAATGGTGTGCTAGGGTGGGAA
+AGGTAACGATGGAAGGTTCTTGTGACTTGCTCCTGTTCGCTTGGAAACAAAGTCTGGAAA
+ATAATATGAGGAAGGTGGTGAGTTATGGGGGATGGATTGCAATTACTGGGCTGCCGCTTC
+ATTGGTGGTCCCTAAAATTTTTCAGCCGAATTGGTGAGGCATGTGGAGGGTTAATCGAAG
+TTGATTTGAGGACTTCAAATTTGGAGTATTTGATCGACGCAAAATTAAGAGTCAGACCTA
+ATGAAATCGGTCTTTTACCTGGTGACTTGAGAATTGCTGATAATGGGGAGGTTCACGTCG
+TCCAAATAAGGCCTTGTCGACGTCTATCCCGACC
+>ds2020-328_102
+GGTCGGGATAGACGAGAAGGTGGTTTATCATTGGGTCAATAATGCTAATCCCTCTTTTTG
+TGCTACTCCTAGGGCGAGAAGAAGATAAGAAAACGCAAAGCGTTCTCTCCCAACCTGTTT
+ATTTCTAAAGGCTACCCTCTCTCGGCTGGATGTTGGTCCAGCCTACTACGAAGATCCCGT
+ATCCAACAACCCAACCTAAAAAAAGGGCATAAAAGCGCCTTGTCTAGGTTNNNNNNNNNN
+GTTTCACGCCCCAACGTAGCTAGGGTTTGTGTAGAAATCGGTCTTCCCTTATTATTATGA
+AAAGGTTGTTTACTTGCTTACTTATTTTGTTAGAGTAAGGTAGCTTGCTTACTTAGTGCT
+TGCACTAAGGGGAAGGGGCTTTATCGGCTAGTGCGCAGGAGCGCACTTCCGTTTTCCCTT
+TACTAGTAGGGGTTCCGCGCGTCTATCCCGACC
+>ds2020-328_103
+GGTCGGGATAGACGTGCGTTGGATATATTATTTATTCAATGTTTGAAATTGGTATTTTTA
+TGATGCATTGGCATTATTTGGGGATTTTGATATATTTGAGTATCTTGAGTATGCATACAT
+GGATTTTGGAGATTGCCTATATGTTATTGGTTATGTGTGGGGTACTTGGGTTGTTGAGTT
+GAGATTGTAGAAAGGTTTGAGTATAGAATGTCAGTTTGGAGTGCTTTAAGCGCTACCCTA
+TGTACCTCCCCGGATTTGGAACTTGAGATACTTGGAATTGTTAAGACTTGGGGCAACCTT
+AACGGGTTGTAGCCGAGGACCCTGCGGGGTGGTAGTCTGCGCGCGTAGGACTGTTCGCAG
+ACGTACAAGCTTTGATTTGGTATCGGCTGTACGTGCTGGCTGAGAGTTGGTCCCTCGTCG
+TCTATCCCGACCGCCGTAATTCTGATCGGAAG
+>ds2020-328_104
+GGTCGGGATAGACGTGGTAAGTTGCTAAAACAAACGGGAGGGGAGGATCGACCCGTTCAG
+TATAATTCCGAAGAAAGACTGTTGGCAGCAGGTGTTGACATTTATTTTGCTCCCTTCAAA
+AGGAAATGCGGGCGGGGTTAAGCTCGGCAGAGGGTTAATGGGGTAGGGTCCTGCCCTTAA
+GATTCAGATAAGAAAAGAGTTCCAAACCTTTATGCATGCACCTCCGTATAAGTGCTGCGT
+ACAAGTTCCGGCTAGGATAATTGGGAAAGATCAAACCAATTTGAAGCGCTCACATCACAC
+ACAGTAGTAGTAGCGTAAAGGCCGTAAGTCGGGGGCGGCCATAACATAAAGTTATTACTT
+TCACATCTCTCTCTAGATATCTTTAGATAAAAAGAGAGAGAGAGAGAGATCCGCTGCGTG
+AGCAACCCGAACTAGCGTCTATCCCGACC
+>ds2020-328_105
+TCTGAATTACGGCGGTCGGGATAGACGCGCACCCCAACTCTATCTTCCTTATCAGTGAAC
+CGGAAATAGTGCGTAGGTACTCTTCAATGCAAGCGGGGACGAGACGACGTGACATACTAC
+GATGACGTACAGAAGTGCTGCCCTTCGGCTCGGCAATATGGAACCTCTCAACAGCTCCCG
+TTCCTTTATGAGGTCCTATCGGGATAGGTAGGCCCAATCCTTTCCCCTCCCCCTCCCTCT
+CCCTTTGGTCGAGCTAGTTTACTCCCTCTATAAGACCCTATTTATCTTTCCCCCTCGAGA
+AAGAGAAAGAAGAGAATCACTCCTTTCTTTCTTCTCTTCTTTCATGTTGTGAACGGCCCC
+TTCTTGTATCGAAAGGTTTTTCGTGCTATACACCACGTTGAGAAAGACACTTGATCGTCT
+ATCCCGACCGCCGTAATTCAGATCGGA
+>ds2020-328_106
+GGTCGGGATAGACGCGGTGGAGTACTTTGGGATTATATTCCGCGCCGAGGATTTGTGCTT
+GTGGGCTAGGGTGAATATTGCAGACCAGCGGATCTGGTGGTCGACAATCGTTCGGACTTG
+GTAAAGGTTATCGCGGCACCTGTAGTAGGACAGAGGATTTATTGCGATGCCCGCGAACCA
+ATTTACGATGTCTCCGTCGCTGACGTTCGTCAAGCAGGCCACGTGGATTGGCCAGGGTCT
+TCTTCGGCTAATGATACCTCGATCCCGAAGCCTTCGGAGTATCTTTTTGATAGGCGCCTC
+TATCTGTATGGGGAATTCGCTGCTGATAGATCCCGCCCAGTGTCCTCCTCCTTCCCCCGC
+CGCCTTCCGACCCGCGGGAGTATACAATGACAACTTCCGGACACTCATGCCCGATCGTGA
+GACTGCCGGTTCACGTCTATCCGACC
+>ds2020-328_107
+ATGAATCCTTTGTTACATCTGGCACGAGATGATAAAGAGAGAGCTTCGTCTATCAATGAA
+CATCTGATTGACGGAGCTCTTGGCATTGCTTTGTTTTTCTCTCCTTTCCTATCAGCGAGT
+TCCGATCCTTTTGTTCGAAATTTCTTCGTTCGTACCGAACCGCTTGCAGAATCAAATCCT
+GTTCCACAAGATCCTATATCAGCTATACATCCTCCTTGCANNNNNNNNNNGGTCGGGATC
+GACGTCCGCCAGTGCTATGGGCTTTGGCTTATGTAGATCAAAAATGATGAATGGGATTGC
+GGCACTCCACTCGACGCCAATGCGGAAGGATGCCGTCGAAAAGAATGGAACGCTGCTTCG
+CTCTGCTGGATGCGTCGGATCCCGTACAACAAGCGAGCTTTTTACCGTCAAATTCAAACA
+TGTGGGGGCAGCGTCTATCCCGACC
+>ds2020-328_108
+TGAATTACGGCGGTCGGGATAGACGTAGAGGGGCTTTCTCGAGCATGCATACCCTTGAAG
+CTAGCGGTTTGACATAGGTTATACTAGCATTGACGTTTGAATCCCCCTCTTTGATTACCG
+CCTTACCACACTGAGATTCAGTTTGAGAGTTCTCTAGCTCTATTTCTTCCAATAAGCATC
+TGTATTTATTTGGTATGAGTATATGCCAGTGTTGGTCTTCCAACNNNNNNNNNNAGCGTA
+TGAGTGTCCAACCTAATCCCACCATCACCAACAGTCCTACGTATGGCGTCTAAAGTCATC
+TTTTCTAACCTTTGAAGTCTCAGAGATAGTTGTACCGCTTTCCAAGCACAATCACCATTA
+CTAGTAACATGACCCTGGTTCCTGAGAACAAGGGATGGACTACTCTCCAACCCACACTGG
+CGTCTATCCCGACCGCCGAATTCA
+>ds2020-328_109
+TGAATTACGGCGGTCGGGATAGACGCACATACCCCCTCTTGATATTATCTCATCAAACCT
+GTTATTCATAGATCGTATCAACTCTCTGTAGTCGTTTGCTGGTGCCATCTCTACCCTGCC
+ATGTACCGCTGTTGACACAGCTCTTGCCAGGTACTGCGAACTCGTTTTGTAACTCGCCCT
+CGTGTCCACCCGTAAGAACTCACCTATGGTCCCAATATTTGTCTTTGCTAATTGTGCTCT
+TATCCCTGCGTCCTTTGCTCTTTTAGCCAGCTTCACTGCCTGTGCTACGTTTTGCGTTGT
+AGCGTACATGTCATCTCCGTTGTGCAGTGCATAGTTCACGCTACTATCTAAGCCAACGCT
+AACGAGATAAACTCTGTTGAGTATGGTGTTTATGAAAGATGTCAATCTCCACCCACTCAG
+CAATGTTCCGTCTATCCCGACC
+>ds2020-328_110
+GGTCGGGATAGACGCCTGTTCCCCATTGTTTGTTGTGGGTCGCGCCTCACCGCAAGCACT
+GAATGAAATGAGTGGAGATCTTCCTTCCCCCTTGTTAATTACCAAGAACTTCGTTGCCAC
+TAGTGGCGAAGAATAATCCTACCATCCTACCCCAAAACAACTCTGAGCCTAAAGAGAAGA
+GAGTTCAGTCTACAAGAAGCTGGCAGAGCTTTAGCCATTGGACTACATCCATCCATCCTA
+CCTAAACAGTAACCTTTTTTTGTTCGTTCTTCGCATGGCGCGAGTGTAGAGAAATTCCTT
+CCGGCTAATGAAGAGGCTACTCCAATCTTCCCATTCATTCCCAGTGGATCCTTCTTCTCC
+CTAAGAATTGAACGAACCAAGTTCACCTATACGAGAGTGAGGAATAAAAACCAACAATCA
+ACCCGCTACGTCTATCCCGACC
+>ds2020-328_111
+GGTCGGGATAGACGCTCGGAACTGGTATATGGATCTCTCCATGTAGTGGTCGGCCTTCTA
+GAAGCTTCGCCAGAAGCGACTAGTCGCTTCCCGAATGCCTCTTTACTTTAGTATGGTCTA
+GTCTTTCCAATGCCTCCTTCCTTGCCGCCAACGTACGCTACTAGGAGAGTAAGCAAGCTA
+CCTTGCTTGCATTCTAGAAACGGTAGCTTCCGCGCCCTTCCTGCCTGCTGAAATTGATGT
+GAATGATCGTGACAGCTCTTCAAATCCTATTCAGTCTGATTAGATATGTCACTGAAACAA
+TCCGTTCTGTCTCTGTTTTATTTTCGGATTCCGAGGATGAGCCGGCCGATCCTAACATCA
+TTTATGAGGAGCCGGACGACGAAGCCTCCTCCTCAGATAAAGATGTCTCCGTAACGTCTA
+TCCCGACCGCCGTAATTCA
+>ds2020-328_112
+GGTCGGATAGACGCCTACCCCCTCTGCTCGTCTATCCCGACCACTGAGCATGCACGTCTA
+TCCCGACCGCCGACTTCGGATGATCGGAAACACAGGACCGCGAGTTGCTTCGTCGCGCTC
+GGCTTCTAGCAAAAGCATAAAAATGCCGCATTTCGATGCACGCTCTGAAATGAGTACCTC
+TATTCGTATGAGCAGGCTGTGGATGAGGTTAAATCAGCCGGATTTTTTTTGAACGCGTCG
+ATAGGCCATTGCGTCGACGAGGTGGTATACGTTGGGGTTACTCTCTCGCAAGGAGAGTCC
+CATCGGGAAGAAAGCGCAGTAACGCCGTATTAACGCCATGGCATATCTTGGGAGTTTACA
+CCAAGTTATTGTTTTCCGCCTTCCGCTTATAATTTCCCTTTGCATAAGTCACTGGGTTTA
+GTTAGTGGCGTCCGTT
+>ds2020-328_113
+GGTCGGGATAGACGCCGATAGCGGGTTTCTTGATTGCCTCTACATCGGGTAAATTTGGTT
+AATTCTTTATTTTATGTGGTGTATCCGCAATAATATCATACCGTTTCTTTCGATGGAGAA
+GGGATCTACCTTCTTATATTTTTACATCTAGGATCGGACTTGTATCATTGGTACTAATAG
+GAATTGAACCCTTATGGCAAGAAAAAGTTTGATTCAGCGGGAGAAGAAGAGACAAAAATT
+GGAAAAAAAATATCATTTGATTCGTCGATCCTCAAAAAAAGAAATAAGCAAAGTTCCCTC
+GTTGAGCGAGAAATGGGAAATTCATGGAAAGTTACAATCCCCACCACGTAATAGTGCACC
+TACACGCCTTCATCGACGTTGTTTTTCGACCGGAAGACCGAGAAACTATCGAGATCTTTC
+GTCTATCCCGACC
+>ds2020-328_114
+GGGCGGGATAGACCCGCGGGCGGCCGTAAAATTGTGCTAACATCTGGTGTGGAGTAGTAC
+GTAGATTTCTGAGGGTATAGTTTATTTAATTGAGTGAAATTCCGCCAGTAGTCGTGATAG
+TTGAGAACTGTGATTATTCGCTCGATCAACTCTTTGCCATCACGCTCTTTTTCTTTAGCA
+TCTGCCGAGCACATCTAAGCGCAAAATAGAAAAAAGAACCCGGTTTTAAATTGGATATCC
+TTATTCCCTGTTCCGGGTACAAGTCAAGTTGAATTTTCAAATTTGAATTCAGTGTTATAA
+TTATTCAAATCCATAAATTCACTACGAAACAAGGCCAGAACCAAGCCCTAAATTTGAGAC
+TTTGAAAAACTGCAAGTAAACTTAAACTATTAATCATATTAATATTACACCCTGAAAACG
+TCTATCCCGACC
+>ds2020-328_115
+GGTCGGGATAGACGTAAGCACTGGTTCCTCCATAAGTGCCTTCTTCAACTCATTGAAGGC
+ATGCTGGCATCGGGGCGTCCACTCCCACGCCTTGTTCTTCTTTAGCAAATCCGTCAAGGG
+GGCCGCAATGGCTGAATATCCCTTGATGAACCTGCGGTAGTAGTTAACCAATCCAAGGAA
+TGACCGCAACTCAGGTACCTTGGTTGGTGGCTCCCATTCTTGAATGGCTCGCACCTTGCC
+CTCCTCCATGAGCAACTGTCCACCCCGTATCTTGTGACCAAGGAACTCCACCTCATTTTG
+GGCAAACGAGCATTTCTCCTTCTTCACATATAGGTTGTTCTCCCTCAGAACTTTGAACAC
+CTGATGCAAGTGCTCGAGGTGCTCCTCTAGAGAATTGCTAAACACGCACCAACGTCTATC
+CCGACC
+>ds2020-328_116
+GGGTCGGGATAGACGTTCCACACCCTTTCCCCCATATGACCGCTATCAAAGAGAAGCTTT
+TTCCTATACTATAGTTGCAAGTCTATTGTTGTGTTTTGGAATTAGGGGAAGCAAAGCTTC
+AACAAGTAGAAGCTTCCTGGCAAAGCTTCAAACAAAGAGGTTGGGCTGTTCACTTCATTG
+ATTTTACTTAACTTTGCTTAAGATTAAAGATAGGGGCCGGGCGGGCAGTGAAGGCTCGTT
+TAGTAGACAGCACGGCTTTGACGAGCAGCAAGCACCTACTCCTAACAAAATGAAAAGCAG
+CAAGCGGAGCGGAGCTTGAAGAAGCGAGCCCCTTTCAGAGAAAGCCATTGCGCGCTAGCC
+CCCTGTATGGGGTTCCAAACCTGCGCACCCCTAAACTACAACCAGCGAAGATCGTCTATC
+CCGACC
+>ds2020-328_117
+CGGTCGGGATAGACGCCTTCCCCCACTTCCGCAAAAGGGTGACCCATAGAACGATGGATT
+AGCGGGCTAGGGTAGGGATGGTACTTCATTTAAACAGTGACATTGCTCATGGATTTGAAC
+AGCAATCCTAGATCACACCTATATGAAGCCTTGCTGCATCTCTAACTTCCTGCCTCGTCA
+TCCCAGGCCACCCACCCTAACCTAATGGAGAAGATTACTGGGCCACTCTCTGCAGGTTAA
+CTCTGGTTGGCCAGTCAAAAGACACACGCTACCATAACAGAACACTTAATTAACATCAAC
+TTGGGCAGCTTCACCCCGGAAAAGCATTGGAGTCTTTCTTTTTTGATGATCCCCGACCCG
+ACTCCGAAGTCTTCTGCGTGCATTATTCTGCCCTCAACAACTCTTTTCCTCGTCTATCCC
+GACC
+>ds2020-328_118
+GGGTCGGGATAGACGTGTGCGAAGATTGCATATTTGGAAAACAGAAGAGGGTCAGCTTTC
+AGACAAGTGGCAGAACCCCAAAGAAGGAAAGGCTAGAGCTTGTTCACTCTGATGTTTGGG
+GACCAACGACCATTTCATCCATTGGTGGGAAACACTACTTCGTGACTTTCATCGATGATC
+ACTCTCGGAAGGTATGGGTTTACTTTCTAAAGCATAAGTCTGAAGTGTTTGAGGTTTTCA
+AGAGATGGAAAGCTATGGTTGAAAATGAGACAGGTCTGAAGATTAAAAGGCTCAGAACCG
+ACAATGGTGGTGAATATGAAGACACCAGATTCAAGAAGTTCTGCTATGAGCAAGGAATCA
+GAATGGAGAGAACCGTACCAGGTACGCCTCAACATAATGGTGTAGCTGAGCGTCTATCCC
+GACC
+>ds2020-328_119
+GGTCGGGATAGACGGAAGCTGCCCCTGAGTGGACGAGAAAGAAAGGATTTCTCGGAGCAA
+CCCCCCAGGTTCCAGACCCAGGAGTCAACTTTCCCGTATGAGCATTCGGTACATGTATCA
+GTCCGTGGAAGAGTGAAAGGGTCACCACTACTGAGGATCTCCCCCCTAATCTTAGATAGG
+TCGTCTGAGGGTTCGCCGCGGTTCATTGCTGTGCTTACACACTAGGCTACCCTTCTCCGA
+AAGCTCCGCGGGACCACCTACCACTAGTCTTCGGCCGGAGGGGTTTATTGCACAAAAACG
+CCGGGACGCAGGCTCCCGAAGAGGGAAGCCCAACGAATGTCAGATGCAAAGCTCCGCACC
+TCATTAAGATCATATTGGCATACTCTCCCAAAAAAAAAGAGCAGGCCCCCGTCTATCCCG
+ACC
+>ds2020-328_120
+GGTCGGGATAGACGCGTTGGCTGCCTTCGAGACTATAAAATATAACCCAAGTGGTCTAAC
+CCCCCGGGGCGGACCCCAACCGAAAGGCGCTAGACGGACTAACGGCAAGCGAGATAAAGA
+AAGCAGCTGGCCCTATGGAACGGAACTGGTTGCTTATTTACTTTTAGTAAGACCACTTTG
+GTAAGCAAAATTAGATTATATAGGCATGGTTGCTTACAAGACAAAAGATCTGTTCTTTGC
+CTGAACATATAGAGGAAACAACCTTCTATCTGGCCTCTGTACCAGTAGTGGAGTGGCTTG
+CTACTTTCAATCAGAAAAGGAAAATTGAGCAAGGCAAGGGAGAAAGAAGTTGTCCCATCT
+TCTCTGGTAACCCGCCACCGCATATGTCGAAAAAGAGGGAGCCGTGTCGTCTATCCCGAC
+C
+>ds2020-328_121
+GGTTGGGATAGACGACCGGTTGGGCTGCAATCTCCGACAGAATTGCCATTCTCTAACTGC
+TGACCATTATCCCTGTTTGTCAGGCCGTACATAGCTAAGTCTGTCGACATGTATCTGTGC
+TTTCCATTGAAGTCTACAAATACGTGGTCTATAAACGGTATGATATGCGTATCGTTGTTG
+AATACCGCATGGTAGCCGTCTGAAGCGTGCCTGTCCAAACTGATGTGACCTGTTAAAAAC
+GGAACGTTCATGCCATGTAAGACATCCCAGTTTGCCTGTTCTATCCAGTTCGGCATTGGT
+GCCTCATTGAGCCTAGCGACTCCAGAGGTATTTTGCCAATTGTCAACCGATGGCTTAATA
+ATCCCACCGCCGTCAATATCAGGGTCTTCTCTGGCGAAATCGGTCCCAAGCGCGACCGGT
+>ds2020-328_122
+GGTCGGGATAGACGCCCGCGACTTCTCTCTTTATGAACGGTGGGGCAATTCCTGGAACCT
+TTTTAAGGGTTTTTTATCAGGAGATATGGAAGTCGAAGGGTTTCTTGTTTCTGATCCACA
+ATTCTTCGTTCCACTTACTGGAGTTCTTCATATGAAGAAATTGATAAGTGATGCTGGGAA
+GGTCCTTAGTGTTAAGGATTTACTCGAAGAACAGCGCGCTCTTGTTGCTTTAAAAATGCG
+CGAACAGATTGCTGAAAGGGAGAAAGCTGAAAAGAGTCGCCGAGAATATGAGAAGGCGAT
+TATTCAACTTGCTGCTTGGACTAAAGCACATCCAGATGCTAAGGTTCCAAAAGGGCTTTC
+CGTGGAAGAACCACTGATGCCGGACGTTGTCAAGAAAGTGACGACGTCTATCCCGACC
+>ds2020-328_123
+GGTCGGGATAGACGTCCACTCGCCCTAGCACACTCTCAACTTGTAGATGCGAAAATCCCC
+CCTTCCCACAACAGAACAGAAAAACCAACAGAACACGAACACCAGCACGTATGAAAGCAG
+ACCTAAGGAGCGGGCAACTATCCAATCTTCACTCAAATGGACTTATTTCCCTTCGTTAAC
+TACTTCAAACGGTGTAGCTACCTCGGCTCCATGTTGGGACAAAGAGCAATAACCGTGCTT
+ATCCTTCTAATAAAGAAACAAAAACTTGCCTAAGAAACCGATTCACTCATTACTCCTACT
+ACTAGTATAGAAGAAGATCTATTAACGCGCATGGCTACCTATATAACAGGGGGCCTCTGA
+CCTCTGTCTCACAACCGAAAATAGAACCTGTAGCTCGCACCAGCGTCTATCCCGACC
+>ds2020-328_124
+GGTCGGGATAGACGAGAAGTAAGGATTCGAGAGTCCAGGCTGAAAATACATGCATAGATA
+GTGGTCTAATGACAAAGGCCGACGACGGAAGCTCGGGACGGAGCCGTATGATGCGGAAGT
+CTCACGTACGGTTCCCTGAGAAGGGAGTGGCTACCTACTGGAGCTTCGACCAACCACCAC
+CGGTCAATTCCGCTTTGGGGCCACCCCTTACTCTACCATTATTATAGGGGTATGGGGTTC
+GAGACAAAGAAAGATCAAGGCAGCATATCAGTTTTTCCTTTATACTTTACTTGGATCTGT
+TTTTATGCTATTAGCTATTCTGTTGATTCTTCTCCAAACAGGAACCACCGATTTACAAAT
+ATCATTAACCACAGAATTTAGCGAGCGGGCGCGTCTATCCCGACCA
+>ds2020-328_125
+TGATCGCCCCCTCGGATTCGTTCTAGAACTTTCTATGCCCCCTTGTATAGGTTGGGCGAA
+TCCACCGACTCACGTCGAATACGAACGCCTCTCTCGACAAACTAGCCCACGTCTTTCTAT
+CGGACTAGACCGATAGAAGTAGCTTGGGTCGGGATAGACGCCCCACTACGCTGCCACCAT
+GTGAGAGTCGGTGCGTAATGGATCTACGCCTGCCTTCGAAAGCTCCACTCCTGTTTACCA
+GGATCCTGGAACCATTCCTTGATTGATTGAAAATCACGAGTCGAATTTTTCTCTACCTAT
+TCGACTATCAAGCTCTTGACACCCTGTTTAGCCTAGCGCCCTCCTCCTCTTTTGTTCGCT
+TCGCTCTCCTCCCTCAACCAGGCAAGTAACCCGTCTATCCCGACC
+>ds2020-328_126
+GGTCGGGATAGACGTATTGGCATGTTGCTTTTTATAGACGCCCAGCCTATGATCGTAAAA
+GTGCGGTCACCATCAATCATGAGTTTGAGACAGTTGGATGTCTTGGTGGTGCCGTATGAG
+CTCCCTGTGGTGAACTCAGGTTGCTTCTGAGCAAGCTTTCCCCCAGGTTATGTCATACCC
+ATATAAACAAGGTAAGAAGGGAAAGGAAGACTTTGACTACTAGGGTAGCTGGGCCAACCG
+CTAATAGATCAAATTAAGAGGGAGTGAACGACATATAATATAATCCGAATGGGAAGTTTT
+GAGCAATCGATTCTTTCTCATGTACGGCTAAACCTTGCAGTTGCAGGTAATTTGAGTCTG
+GACCCCCGAGTGATGGTAAATCGCCGTCTATCCCGACC
+>ds2020-328_127
+GGTCGGGATAGACGGGGGGTTTGTCTACGCCGGAACGAGTCTGTCTTCGGACGGGCTCGT
+TTTTGTAAAGGAAAAGGAGTGTTGAAACCGGACGCGGCATGTCTTCTAGACGATCGCGTT
+GAAGATGTGGAGAATAAGAGCTACAATTGCGTTCCTCCCCCTGCATGTTTGATGTAGGGG
+AGCTGAGTAACTATGTGACCAGCTTCGCGTATGTAAGGTTCATCCAAGTACAAAGCAATG
+GGAGACTTCGGTCGACCGCCTTCGGGTTACCATTGTGGATTATCAGTTCGGCTGGGTCCG
+TGCGTCATAGGGACGAAAGTATTGCGGTGTGTTGTCTTCGGACATTAATGGCGGATACAC
+TTCAACGGTGCTATCAAGGACAAGTAGTGGCGGCCGTT
+>ds2020-328_128
+TACAAACGGCGTAGTCGATGGACAACGGGTAAATAGTCCCGTACTGAAATTGATTGGTGC
+AGAGGGACGGAGAAGGCGGACATCAGCCGGATGTTGGTTACCGGTTCAACTGTGTGAGGT
+GATGAGAGGCGGAGAAAACGCTTTGAGCCGAGCCAGGNNNNNNNNNNCGAGTCCCTACGG
+GGGCGAAGTGGTGAAGTCATGCTTCCAAGAAAAGCTCTAAACACCATAAATCAATTTTAC
+CTGTACCCAAAACCGACACAGGTAGGGAGGTTGAGAATACCAAGGGGCGCGAGATAACTC
+TCTCTAAGGAACTCGGCAAAATGGCCCCGTAACTTCGGAAGAAGGGGTGCCCACAGCAAT
+GTGGGTCGCAGTGAAGAGATCCAAAA
+>ds2020-328_129
+GGTCGGGATAGACGCCCTTCTTGCCTGACTCCTGTTTTGTTTGCTTGTTTTTAGTGTTCA
+TCTGAACACCGCTTGTCGACAGGCCTATAACTTACTAGAATGCACCACTGCACACTCGCG
+TAATTAGCTTGCCCTCCTTTACACCCAAGTCAGTGCGTAGGATCACTCTTACACTGAAAC
+GCATTTCGCTCAACCTGAGGTCATAATTCAGGTGTCATGACTAGTGCGATAGTTACACGG
+AGTACGAAATGTTACAGTACATTTCGTAGGGCCAGATTTTTGTCACGCCAGGCTGGCCAA
+ACCCCGACGTCTTAGCTTCTACTATAGGTTTTTATCGCCGCCACTGCTGATAGCACATCG
+CCGCACAAACCGCGTCTATCCCGACT
+>ds2020-328_130
+GGTCGGGATAGACGAGCGCTACCGGTATAGCACCGAGAGGATCATTTGTAGGCATATACG
+GGTCATGCGGAGTCACGGTCATAAATAATGACGAAGAAAGAGAGGCAACTGTACCATACA
+ACAGTTTTGCAGCCGACAGTCTAATAACATCAAATTTCGTAGGAAGTTATTCGCTTGGAG
+GTGGGGGTGAAGAGCAGGCTCCTGAGCTCAGGTGTACACAGTATTTGATGGGTGAACCGG
+ACAGAATAGCGCCAAACTCAGCAGCTATAGAAGGCTGTATAGCACATGCCAATCACAATG
+TGGGAGGGTGCTTATAATGCATCTAACCCGCTCATTGATTAATTAATTGATGAAGCCAGT
+GCTCCGTTTCGTCTATCCCGACC
+>ds2020-328_131
+GGTCGGGATAGACGCGACGGTTCAATCACCCTAGAGCTAGAGGGGAGGCGATCTCAATAC
+CCGCTTTTTCCATGCCACAGTTATTAGGCATTAGGCGTCGGGCTCGAAATAGAATCGTGT
+TGGATTTCACACTCTATTTATCTGGGAGAAGAGGCGGTCTAATCTTAATTAGCCTTCGCA
+TTCGCTTCTGAACTCAACTATAAGTAATCAGTACAGTTAGGCTTTCCTACCGCCGGATCC
+TACCACCGCTTTCTTCTAAGATTTCATCTTGCCTATAACAACCAGGGTGTACTTGATTGG
+CTCTTTCTCGGCTTGACTAAACCAATCTATCAACCTTAATGCCCTGCCTTTCCGTAGTCC
+ACCGTACCGTCTATCCCGACC
+>ds2020-328_132
+GGTCGGGATAGACGACGCACCACCATCAAAGAAACCTTACCACTACTCATCTCCTCCTCC
+TCCTCCTCCACACAAGAAGCCGTACCACCCAGTGCATTCACCACCACCACCAAATAAACC
+TTACCACTACAAGTCTCCCCCACCACCCACACCCTCACCACCTAAGCATCCTTACCACTA
+CAAATCTCCACCACCACCCTCACCATCACCCCCTAAGCACCCTTACCACTACAAGTCTCC
+CCCACCACCATCACCTTCACCACCCAAGCACCCCTACCACTACAAGTCTCCTCCACCACC
+CTCACCATCACCACCCAAGCATCCTTACCACTACAAGTCTCCTCCACCACCCTCACCATC
+ACCACCCAAGCATCCTTACC
+>ds2020-328_133
+GGTCGGGATAGACGAAGCTCTCTCTTTATCATCTCGTGCCAGATGTAACAAAGGATTCAT
+CCTTTTTCCTTCTCGCGAACCACGGGAGCGCCTAGTGCCCAGAGGAGCAAAGCAAATTTT
+CCTTTCGGGGTAAAGCGGCGCATAAAAAAGGGCTGGCCCGTCAAAAGCCCGGTTCCTTCG
+CGAACGAAGTTCAGAATCAACAAGGGTTCGTAGAACGAAGGGGGTGTACAACTGGCGGTG
+TACAACACCACCACTTTTTTGTTCGTAACGAGGGAGAGATAGAATGGAGTTCTTCACGAA
+GTTCGAGACAAAGGAATAAAAAAGAGTTTCTCTATGGCCTCCTCGTTTTGAGACAGTCTG
+TTGGCGTCTATCCCGACC
+>ds2020-328_134
+GGTCGGGATAGACGTCCGTCAGGGATAAGCGTTTAGGGGAAGCCGGCTATTCCGGTAAGC
+GAGTAGTCCGTTATGGACCCCCCCTTACCCCACTTTTTTGTTCTTGACCCTTTCCGGCTG
+TGTGCCCTTAATCTATCTTAGCTGGGCCTTCCCGACTTTCCTTACCAAATCCCCTTTTCA
+AATCTTTTCCCCAAGTGATGGCTAGCCCGAGAATATCCCCATTTGCTTTATTTTATTGCC
+CCGGATCCTTATTCTTCCCGAAGGAACCCTATCAAACCTACTGGTAAAGGGAAATGGCCC
+TAAGCGTCTATAAGGAAATTGTCTTTACATACCTAATACCTAATATGACTTAGGGATCGA
+TCGTCTATCCCGACC
+>ds2020-328_135
+CGGTCGGGATAGACGGGACCGCCCCCTACTACCCAATTCCTGTCTTCGGAACTACGAAGA
+TAGGTTACTTTCTGCGATGGCCCTCCACCTCGTTGGGAAAAGTAAAAAGAAATAACAAGC
+CCTAAACTAAATATCAACTAGCAGCTTATCAACCACCGAACACAGACTCATGTTGGCGAT
+GCCATGGTCAAGTAAGAGGACGACCCATTCACCTCAAAAGAAAAATCTCGCCTCTCAAGT
+AAGCCAAACGATTGACGTCAAAGAGAAGGACCACCCACCCAGCAAAGAGCGAGGTCTTTC
+AGCAATGAACTTCACAAAAAGAGTGGAAGGCGAGAAAGACACTTAGACAACATTAGAGGA
+TCTTTTGTTTTTA
+>ds2020-328_136
+GGTCGGGATAGACGTCAGACGGTTCTTCAGCGTCTATCCAGACCGCCGTTATTCTAGCAA
+CGGCCGGCACGTTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTC
+CAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGC
+CATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGGTCTACGCGTAGAAACTC
+TGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATT
+TTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTA
+GTGGCGGCCGTT
+>ds2020-328_137
+GGTCGGGATAGACGAAAAATGAACCTCTCGGTGCTATACCGGTAGCTTTTTCAATCCTCC
+TTTTAGCATTATAAGTAGCATCTTCCACCAACACGGAACAGTCTGCATAATCCATTGTAT
+TTCCACAGTTTAGACCGCATCCTGCATAAACATGTATGTATCCTGGTGTAATATTACTAC
+CGCTAGAATCGCTAGTATTATTTGGTACGTTTATTGCATTCGTGTCCATGCCTTTCTTAG
+TAATTGGCCTATTATGTATCCTCATGTTCCCTGACCTGCCGTGATCAATACAACTCTTAA
+ACTTTCCCATGGCATCTCCTCTAATGTCAGATAACACCTCAATACTGGATGGATACGTCT
+ATCCCGACC
+>ds2020-328_138
+AACGGCCGCCACTACTAATTCTGCCTACTCGCCGGGGCGTAAATTTTGCCCCGGCGGGGG
+GGTATAAGTAACACGCTTGAGCGCCATCCATTTTCAGGGCTAGTTCATTCGGCAGGTGAG
+TTGTTACACATTCCTTAGCGGATTCCGACTTCCATGGCCACCGTCCTGCTGTCTAGATGA
+ACCAACACCTTTTGTGGTGTCTGATGAGCGTGTATTCCGGCACTTTAACCCCCCGTTCGG
+TTCATCCCGCATCGCCAGTTCTGCTTACCAAAAATGGCCCACTATAAACGTTTCATTCAC
+CTGTCCACGTTCAATTAAGTAACAAGGACTTCTTACATATTTAAAGTTTGAAAATAGTGG
+CGGCCGTT
+>ds2020-328_139
+GCCGTGGACCTAGTTTGTAAGGGGGTCTAGACTAGGTCCAGCAGAAATGTCACTAGGTCC
+ACGGCTCTCTGTCCGTGAATACGGCGGTCGGGATAGACGTGCCATGGCCATATCAGCAGT
+AATGTAATTCATGGATATGACTTTGTCTTTTAAATTGTACTTACTGTATCCTAAACCGAT
+GGCGTAAGTCACCAATTCCTCATATGTGCATTTTCCGGTGCTTGCTCGAATCAACAATAA
+TTTCAAAAATTCTTTTTCTATTGGTACCTCCTTCCACTCAATGACATTGCTTGCCACTTG
+GCTCAGCAGGGTTTTCCACACTGGCACAGGCATTAAAACTCTTTGCTGTGAGCCCTTTGC
+GATCGGTT
+>ds2020-328_140
+GGTCGGGATAGACGCCGCGCCTCCGTTTGACTGCCGCTCGGGGATGTAGTTGTAGATACT
+TTAGTCTTAGTGGGTCGTTGGCTCCACCTGTTATCTCCTTCTACGACATGCTGTTGTCGT
+CGCCATATTCCATATGTCACTTAGTCATCTCTGCCTCGCTGCGGGTCAGCACCTCCGAAA
+GAAACGGAGGACTTCATTCAGTGACTCCGCGATCGCCCTCTGAACGATCAGAATAAGGTA
+AAGCTTGAAGATAAGTTTTGTACTCTATTAATTTCTCAGTCCCTCTAGTCGGGTGGGCGC
+CGGCCGGTCTTTCGACCAGATATCCCCCTAAAAACCGTACGTGCGGGTCCGACCGTCTAT
+CCCGACC
+>ds2020-328_141
+CGCCGGGATAGACGGAGCCTCACGGTACTTGTTCACTATCGGTCGATTACGAGTATTTAG
+CCTTGGAGGATGGTCCCCCCATCTTCAGACAGGATTTCTCGTGTCCCGCCCTACTTATCG
+TCCACTCAGTTCCACACCAAACTTTTCTCATACGGGGCTATCACCCGCTATGGCCGGACT
+TTCCATTCCGTTCTGCTAGCAATACTGCTAAAGAGTACAAGGCTGATCCCATTTCGCTCG
+CCACTACTTTGGGAATCTCGGTTGATTTCTGTTCCTACAGCTACTTAGATGTTTCAGTTC
+GCTGCGTTCGCTTCCCTTGCCTATGTACTCAGCAAGGGATGACCCATCCATGCCGTCTAT
+CCCGACC
+>ds2020-328_142
+GATCTGAATTACGGCGGTCGGGATAGACGTTGATTTGAGGTGGTGGCGGGGGTTGGAATT
+TCGATAGATTTGGAGGGCATAATTGGGATGAGTCGTCGTCTTCTTCGCCGTCGGATCCTG
+CGTTTGATTTCGTGTACGAGGTGATGTGTTGGATTGCGCTTTCGAATTGCGTGCACTTCG
+CCTTCAAGAGGGTTATTCGTATCGTGGCGGATGGGTTGGGCGATGCGGAGAGAGCGAAGG
+TGCCGATGAGATTGACTTCGGTCTGCTGATGCGGTACCGTTTCGTTCTCAATGCTTAACG
+TATCAAAAAGGGGATACAAATCTGGTTTTAATTTATGTGTTGGTTGGGTTTGCGTCTATC
+CCGACC
+>ds2020-328_143
+GGTCGGGATAGACGGATCGAATTCGTTACGCTCCTTAGCTCGGTAGGGGGTACAAGAGTT
+AGCTCGTTTGGATCGGAGTGAACCGAAAAGGGAATGTATTCAATATGCGAGTAAGAAGAT
+TCATTTATAGGCTTGAAACCTAACTTGTCTGGAGAGCGAAATTAAACAATCAATTAAAAG
+CACATTAATTAGTTAATGCTTAACACTACAGCTAAGGGAAAAAGAAGTTCATCCATACAC
+TTAAAAAAGGAGGTTAATATTCTCATCTTTTATCCTCTTTGGCTAAAAACAGACTGCTAG
+CTTTCAAGATTCCAGTTTTCAAACTTGCCTAAGCTCTCCATAGCTTTACGTCTATCCCGA
+CC
+>ds2020-328_144
+GGTCGGGATAGACGAATTCGAGGTTTGTTCGGCGGCACGATTCGTTAAAATAATTTTTTT
+TTGCGTCGATCTATACGATCGACCCCGGACGTACCCATTCGCCGCGTGGGGAACCGGGTA
+ACCAAAGTCACGATCAGAATAAAAAAGGAAGTTCGCTGGGGAAGTCCGGGGTGCTGGTTC
+AAATCAAGTTCGTGACATGGTAATCTCGATGAGAATAAGAGCGGCCGGTATTGGACGAAG
+GGGAAGCTGCCCCAACCACTACAACATAGGGGGCTCGGAAGGCAAATTTGTTCACTGTCC
+TAGATTCAGAGGGGGCCGTGGAAGAGGGGCGCGGGCCGTCTATCCCGACCGCCGTAATTC
+AG
+>ds2020-328_145
+AACGGCCGCCACTAGTTCGTATTTCTCGGTTGTGAAGAATCACACGAGGGAGCAGTTTGG
+GGGTGGGTCTAAGGTATCGAATCCGAATGAGCGCTTTGGTTCTATTAGGACGAGGTGCTT
+ACTTCCCCAGCTGCGCTATTTACCTCCGTTTGGTGACGATATTACCTGCTGTAGTTCGTG
+AGTTCTCGGGTTAGTATGCGACCCCGTAACCGTTTGGCGTTTAGCTGCTTCACAAAAGCT
+ATTGTCTCGCTTCTACAGTGCCTAGCTGGCGTGCCCTCGCTTAGCACTTGAACGTGTAGT
+TAGGCCGACTTCGGATGATCGGAAACACAGGACCGCGAGTTGCTTCGTCTATCCCGAC
+>ds2020-328_146
+GGTCGGGATAGACGACCAGTTGCTTTGCCGGCGGGCCCACTTAGGTTAGGGGGGGCATTG
+TCCCTCAGTTCTTACCAACCTCCGGTGTGTAATCGACATGTTGCTAGCTTCAACTCGGTT
+GAATAAGAATCATTGATTCCCTATGCTGTCCATTTCTTATTCATTCAGGGCGCTCGGCCG
+GTGCTCCTTTAAAAAACCAAAACCACTCTGAACGTAAGGGAAGATAAGGGAAGACCGCCT
+GAGCGAACCGACCGAAAGGACTTTTGACTTATTTGAACCGAACGATAGCGGCTTAAAGCT
+AAGCCTATCACGAGCAGCGTCGCTGCTTGATCAGCGGTGAGGAGCGTCTATCCCGACC
+>ds2020-328_147
+AACGGCCGCCACTAAATGGAACAGGTACCTGCAGAGACTGTAGAATAGAAAATTACAAGC
+CCTCTACACAGGTATCGCCGACTAGACACTTCTATACGCCAGTAGGAGGTTCCGGTTATG
+ATTGGCATGGCGTAGAACTGGCCACGGCGAACGCATCAGCGTTAAGGTCAAGTAATTACG
+TCAGGCTGCGATTGAGGCCAAACCAGGCGCCGGCGTCAATCGTAGTACTAAGAGCGTCAG
+GCAGAACTGAGAACGCATTAAAGTTAGTAGCAGTCGAGGACAGTACTCACTTGTTTATGG
+GAATGGTTGATGGCGTTTTTGAGGGTGATATTAATGTTTGCGCTTAGTGGCGGCCGTT
+>ds2020-328_148
+GGTCGGGATAGACGTATAAAGCAGCAATGTCACTCCCCCTCAAATCCGACGACGTATGAG
+AGTCGAGATTTGGAGAAAGCAACACCGGTAATGACAATAAAGTTGCAGCACCCAAATAAA
+GTTGCATCTATCTCCCCCTCAAATCTGACACTGGTAGAGGGTCGAGATTTGGAAGAAGAG
+AAAATGAAATAATAGTAAAGAGACTCAAACATGCCAGTCTCGTGGTAGAAACAAATGCAA
+GGAAATGTGGAATGGAGATGGGCATCCGACAACTGGAGAAAAGGAATAAAAGATGGAAAA
+GAGTCTGCAACCCAAACAAAAAGGAGGAAAGTGTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_149
+GGTCGGGATAGGCGGTGTTGTAGCATGTAGCACTGGGACCTGAGGAACAACATTTGTGTG
+CTGAGGTTGGCGAAAGAAGATTAAATGACGTATCATTTTGGGTTAATGATAGCTTGGGTG
+GAAGGGAGGATGAAAATGAAGTAATTGGTTCCAGCCTAATAAATACAGATTACCCAGGAA
+CAAAATGCGCCATGGTATACAGCTATGTAGAGGACAAATGGGTAGAAATGAGTAATAAAA
+ATTACGGTGAGTATACAAGGAAAAGCTTCCATGGCGATGTGAGACCTAGTGTACCTTTAA
+GGCGAACAATGGAAAAAGAACCTGCACCTGTAACTTGGTGCGTCGTCTATCCCGACC
+>ds2020-328_150
+GGTCGGGATAGACGAAGCCTACTCCTAACAAGTTGCTGGCTTTTCAGCCGTTGCGCGCTA
+GCGTTTTACCTTACTAGTAAAGGGGCTGCTGGTTGTAGCGCGCAGTGTGCTAGTGAATAG
+GAAAAGCGGATTGAGATTACTAATGACGGATGGAGACACCGAAGGTGATAGAACATGTTC
+GGTGCCTCGCTCTTGTCTCCTTCGCCGGAGACTGCAAATGATGGGAATCCTATCGATAAA
+GAAGAGGCATAGGCATCGCCTCTCGATCCAATCCGCCTTCCCCGGCCTCCCCAACACACT
+CTTGATACGAAAAAAACCATCACCATCGTCTATCCCGACCGCCGTAATTCAGATC
+>ds2020-328_151
+TGAATTACGGCGGTCGGATAGACGGACGCGCGAGGTTAAGGTGCCGGAATACACGCTCAT
+CAGACACCACAAAAGGTGTTAGTTCATCTAGACAGCAGGACGGTGGCCATGGAAGTCGGA
+ATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATGAACTAGCCCTGAAAATGGATGG
+CGCTTAAGCGTGTTACCTATACCTCACCGTCAGTGTTAGAGCGATGCGCTGACGAGTAGG
+CAGGCGTGGAGGTTGTATCGAAGCCTAGGCAGTGATGCTGGGTGGAACAGCCTCTAGTGC
+AGATCTTGGTGGTAGTAGCAAATATTCAAGTGGAGAACGTTAGTGGCGGCCGTT
+>ds2020-328_152
+GGTCGGGATAGACGAAAGCTCTGCCTGTGTTCTACCTGAGTTGATTTTAATACACAATGG
+TATCATCCCCTGCCTTAACCTGTATTCTTTCCGATTTTTAGTCGGTTTTTCACTCTCAGC
+CACACTTATGAAGCCAAGAGAGAAAGTGTAATCTTGTCCGTAACCCGTTGTTTCGTAATC
+AATAAATTTGCTGTCCGTGTTAGGTGCCGGTATGGGCATCTTATAATTCTCTATTCTGCA
+ATTTCTACAGGAGGAACTTCCGCACCTTCTACTCCCCGCGCATCCACTAGTTGATCTTGC
+GTTTGGCTGGCGTCTAACTGTCTGCTCATTGGGACCGGTCGTCTATCCCGACC
+>ds2020-328_153
+GGTCGGGATAGACGGCGGTTTGCCTTTTTTACTATTAAATTGATTACTCTGAATATCACC
+GACCACGATTAGGGCATTGTCTTTGACTAATTGGGTGGTAAATTTGTGTATCAGGTCTTG
+CCGTGTGTTTTTGATTTTGGCATGGATAGCCTTGATACGTTTTTTGTTGTTTGAGCGTTG
+GGCTATAGCTAATTGTTTTGCATATTTTAGCGTTTGCTTAATGGTTAGCTTGTCACCGTT
+TGAGGCGGTAGCACTGTCTTTAAGTCCTAAGTCAATACCTACACTACCTGTTCCGCATGA
+TTGTTTGGGATAGTCTTTGACTGTGATACAGGCATACCAACGATTACGGCTGT
+>ds2020-328_154
+GGTCGGGATAGACGATCCTCAGCCCTGTAAGCCCACACCTGTGTAGAGTGGATCGTTCAA
+CACCTGCGGCACAAACCCATTTTTGACCTATTGGTCCTAGTATCATAGGCGACCGAACGG
+CCGCCCCCTAATTACTAGACCAACCTGCTATAATAATTCCATAAACACCTAGCGAAGATA
+TGGCAAACAAATAAAGTAGCCCTATGTTCGAATCTGACAATACCATACCATAATCAAAAG
+GTACAACGGCCCGAGCAACCAGACTTAACATAAATGTAGTCACTGGAGCCATTCTAAAAA
+GGGAGAAATTAGCACTACTTGGTGAAATAGGTTTGAACGTCTATCCCGACC
+>ds2020-328_155
+GGTCGGGATAGACGATCCAGTTTCCTTTGATGGGGCCCTTCCTGCAGCAGATTCGTTCAC
+AGACGATTCAATAGCAACCCCTTCTTTTCTTGCAGCAAGAGGGTATTCGAGAACAAGCTC
+CTCTAGAGATGAATGTGCAGCTGATTCAATAGGAGCTTCTACGATCACAGTAAGAGCCTC
+TATGCCAACAGCGGCAACTCTCACAGCAGATAGGCAACGGTTACTGAAACAGTTAGCCAA
+AGAAGAAGACCGGTAACGAAAGCAACGGATATTCCAACAACAATAGGTATTGTAACAATA
+GGATTCTAAACCTTCTCGTCTTCTGAAGACCACTCGACGTCTATCCCGACC
+>ds2020-328_156
+GGTCGGGATAGACGGTATTGATCGCTTCTTCAAAAGCCAACCCACCCCCAACGTGTTCGA
+GTGGCCCACGATTCGCTAGCTTCTTCATGAACTCCGCCGAAAGCCATCCTCGACGTACTC
+GTGCATTGAGAAGGTTTGGTGGCCGTACTCCCAACACAAAAGCATAACCGAAGACAACCC
+CAAGCTAAAGTTCACCCAAAGCCCACTCATCATCACCACGTGTGTTCGTGTGGCCAACAA
+TTGACTAGCTTCTTCATCAACCCCGCCGAAAGCCATCCCCGACGTACCCGTGCATTGAGA
+AGGTTTGGTGGCCGTACTCCCAACACAAAAGCAATACGTCTATCCCGACC
+>ds2020-328_157
+GGTCGGGATAGACGGGGGGGCGGAGTGTTCTTCGGAATGACTAGGCGTAAAGGGCACGTA
+GGCGGTGAATCGGGTTGAAAGCGAAAGTCGCCAAAAACTGGTGGAATGCTCTCGAAACCA
+ATTCACTTGAGTGAGACAGAGGAGAGTGGAATTTCGTGTGTAGGGGTGAAATCCTAAGAT
+CTACGAAGGAACGCCAAAAGCGAAGGCAGCTCTCTGGGTCCCTACCGACGCTGGAGTGCG
+AAAGCATGGGGAGCGAACGGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTG
+TTCGCCCTTGGTCTACGCAGATCAGGGGCCCATTTCGTCTATCCCGACC
+>ds2020-328_158
+GGTCGGGATAGACGCCCCTGCCCCATCATTTTAAAATAATTCAATTATTTGAGTTCCACT
+CCTTATCCCCAATGATTTTGCTTATTAGCCTATCATTGGGTCGTACCCATTATTTTTTAC
+CTTCGAATAATCCGTAGTATTTTCGCATATTTTCCATCATCCATTTCTCCAACCTGAACT
+TACCAGTTATTGTTTTTAAGTAATCCTGATCAATGATGCTCCTAGGAACACTCGCTGCCA
+ATACAATTAATTTACTGTCCTCCTCATTTGCTTTCCTAGGTCCAAAGCTTGCTGGCGCTT
+TTAGAAATTCCAGCGTTCTTGGTACCCCCTCACACCGTCTATCCCGACC
+>ds2020-328_159
+GGGTCGGGATAGACGGCAGATACCACTCGAACGTGGTTGTTCGTATTTTAAATCAATCAT
+GACTTCTTCCGAGATCACTGCTGCCAATGTCCATGAACTTTTGGTTAAAGTTCTGGAAAA
+GCAATGCGCTGACGAGACCACTACCGTCGGTAAGGCTTTCTCTGAGAAAGCAAAACAGTC
+TTTGAATAAGACATTCGGACTAAATGACGAGTCCAAGCAACTGAAGATTTCTTTTGATTT
+GACGGCTGAACAGCAGGCGTTACTCAAGAGACATTTTCCGGGTCGATCGGTGATTTTTTC
+AAATTCATCGAGTTCCTCACACAGTTATGCAGCGCGTCTATCCCGACC
+>ds2020-328_160
+GGTCGGGATAGACGTCGACCACAATTTCCCAAGTAAGAAAGAGATAGAATTTCACTAATT
+GGATTGGAAGGAAAAGGAGGGCTTCGATCCATTGTGATTAGGATCCTTGGTGTGGAGAGA
+TCCCTGCCAAAAATCAAAGAGCGACGTAATTCCCCATTCATCCGAAGTAGTATTTTAGTA
+TAGAACAGAGGCTTTCTGAGCCGACTACTACGACTACATGCGCATCTAGTGCAGTGGCTT
+GGAAGCAAGCTACCTTGACCATCTTCCGAAGTTCTAAATAATCTACTGATCAAACGCTGT
+AGGGGCAGACTGCTCTACATTCAACCACACATTGCGTCTATCCCGACC
+>ds2020-328_161
+GGTCGGGATAGACGAAGCGAACTCATCCACATGATCCCGATCTTTTGGGACCATAGAAAG
+GCACTTAGTCGGTTACTAAGTCGCGCTACATGTAGGTAATCATCCTACAGGTAGAACGTG
+TGGAAACACACACCATATCAATAGTGACTACTAATCACTATCAACCGATATGTGTGCCAC
+GGGCACATGCTAACCGGGGCGATCAGCACGAGGGTGGAACCACCACCATCCAAGGAAAAT
+CCTCGGCGCCAAGTAAGAAGTTTTGTTTCGCTAGTTTTACTGTTTCTCTTCCCGCGAAAT
+CTCTAGCGTTTCTCTCCCCAATAACCCCTAGTTAAGTCTATCCCGACC
+>ds2020-328_162
+GGTCGGGATAGACGCTTCCTCAATCTCCAATTCAGTGAGGATCCTTCTGAACCCAAAAAC
+CCAGCTGAGAGGGAGCCCATCCGATCCCATAAAGGAGGCAATGTTGTGGTTATGCTTGCT
+GGATAGGTTGAAGAGTCTAGGGAATACCTCTTTCAGGACCCCACCCTTGTTCCAATCATC
+CTCCCAAAATCTGACCCTAACTCCACAACCTACCACGAAAACGCAGCCTTGAAGGAACAA
+ATTGTAGCCACTAGAAATGTCTCTCCAAGGGCTACGACACGATCCTCGACTCACAGGATT
+AGCAAAATCATACGAAAAGAAAAAGGGGGGGGCGCCGTCTATCCCGAC
+>ds2020-328_163
+GGTCGGGATAGACGCATAGGGGGGCTGTTCACTACAAGCTATCAGTGCTGTCTTAGATTG
+AACGGCAATAAGATAAGTCGACGTTCAATCTCTAGGGCGGGTTTCCGCTGAGAACGGAAT
+AGTGTTCGTGTCCAAAGGCGAACAACGCCCTAGCTTCTAGAGTTCGCTGCTTTTCCCAGG
+CCGGAGAAGGTCTTATACCGCTCGCCTTTGTTTGATATGTTCATTCAGTACCAATACAAA
+CTACAACTACACAAAAAAAAGGAAGGGCCGCTATAGAAGCTAAAAGTAGCCTATAGTAGA
+GTAGTCGGCCTAACAAAAGCGTCACGGCAACATAAAATTCCCCTCTCT
+>ds2020-328_164
+GGTCGGGATAGACGGTGTGACTGGCTGGAGCGGCAGCTGAGATTATGACAGGGACCGGAA
+ACAAGGTGGTAAAAAAGAGGCCGTGGAAGATACAGGCCGAGCACAACCTGGGACGAGGGC
+TGGTTGCTCATGAAAAGCAAGCCTTGGGGCATGTGCTGGAGAAGGTTACACGGGAAAGTG
+ACATGGAAGCTGCGTTAAAGAGGTTCATAGTGAGGCCAGAGTCTACTGCTTGTAGACGGC
+TACTGTGGCACATCCACTGTAAAGGAAACGTGGAAAAGAGTAAACTTGAGGCATGGGCTA
+ACAATTTCAAGTTAGAGTGGCATGTGGCTCTCACGTCTATCCCGACC
+>ds2020-328_165
+GGTCGGGATAGACGCTAGTTCAAGGTTAGAAGAAGAAGGAATAAACTGGTGGGGTTGAGC
+AATGAGGTGGGTGAATGGATCACTGATAAGGAGGAGTTGAAAGCTGTGGCTGTGAAGTAT
+TTGAAAGATTTGTTTGATAGGAGTGATGCGGGATTCTGATTTGCCTAATCTTTTCCCAGC
+TTTAGATCCCAGGTTGTATGCTGACCTGGGTAGAAGTGTGAGTGACCAGGAAATTAAGGA
+TAGTCTCTTTGCTATTGGCCCTTACAAAGCTCCTGGTCCGGATGGTTTCTCTGCTTGCTT
+TTATCAGGGATGTCTGTGCCTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_166
+GGGTCGGGATAGACGTTAACTGCCCATACCAACCATGTTTGCTAGCCTTGCAACGTCAGC
+TATTTCCTGCCAAGTGTCGACAGCTGCCTCATCTCGCAGCCTATTGTATATCACTGCCTC
+ATCTGCGGTTGTGCAATAACCACGTATACGTAAGTTCTGCACTAATGCATGTATTCCACA
+AGTACCATCTCCTTTTGTGTTAACTTCTGTCACTATTATTTTGTCCTCCTCTACTGGCAT
+TGGCTCATCTTTGACCAACTTTGACTCTGTGCCTTTGTCTTTCAGTTCATATGAACTACC
+TAGCATTTCCTCACCATTTACGCCTTTGACATAAACTGGCGATGGT
+>ds2020-328_167
+TTTTTGCAAGTATGATACTCCATTAGAGAAACACCCCAGTGCATTTTTGGGTATATTTCT
+TGCTGCTATACGACTCCATATTTCTGATTCTTCCAAACCTAGTATGCATGGTCTAACACC
+ACCTCGACTCTCCTGCATTACTATAACACCGTCCTTATCACATATTAGCGCACAAACCAT
+AAAACCTTTGAAGCATTCTATAACTCTTATGCTCCAGTCTACACCTGATAGACCCGACTC
+CACATCACAGCTAAGCATTGATGCTATTGCATGACTTAAATCTTGGCCAGTAGACCTGGC
+TTCTAATAATTTTACTGCCATAACGACCACCCGTCTATCCCGACC
+>ds2020-328_168
+GGTCGGGATAGACGCAATCCCCCGCTGCTGCCTCCCGTAGGAGTCTGGACAGTGTCTCAG
+TTCCAGTGTGACTGATCATCCTCTCAGACCAGCTAGGGATCGTCGCCTAGGTGAGCCGTT
+ACCCCACCTACTAGCTAATCCCATCTGGGCACATCTGATGGCAAGAGGCCCGAAGGTCCC
+CCTCTTTGGTCTTGCGACGTTATGCGGTATTAGCTACCGTTTCCAGTAGTTATCCCCCTC
+CATCAGGCAGTTTCCCAGACATTACTCACCCGTCCGCCACTCGTCAGCGAAACAGCAAGC
+TGTTTCCTGTTACCGTTCGACTTGCATGTGGTAGTGGCGGCCGTT
+>ds2020-328_169
+CGACCATAGGAGAGGGAGTGAAACTTGCTTAGAGTGAAACGCTAAGAGAGGAGCCCTCTT
+ACCTATCAATGGAAAGATCTACGTGCGTGGCGTGATAAGGAATCCTAGAAAAGATCTCAT
+GAGACCCGCCCACTATTACTACGAAAAAAGTACTGCCCTTTTCCGTCGCTGCTAGGAGAG
+TCAGCTACTTCTATTAGCGCCGGACCTTGAGTCGAATTGATCGTGTCATGTGCAACGTCC
+ATCAATGATGGTTCATTAATGTCCATTGATTTAGACTCCTTCCCCCCTCCCAACTACGAA
+TAAGATCGAGAGGAGCCCGAAAGTACCCATACGTCTATCCCGACC
+>ds2020-328_170
+GGTCGGGAAAGACGGTGCGTGTGGGTATTATCTAGGTTGTTCCCAATTGGTGAAGCAGCG
+ACGGACGAGAATGTCAGACCTACGGTACGCTAAGTTCTACGTAACGGGCAGCCATTTTGT
+TTCGATTATGAAGATTTCAATTCACAGCATAGCAACAGTTCGATGCAAGCGGTACTTGAC
+GCCTATCTCTTGGTTTTTAAAGACTATTTAAGCGAGGAGCAGGTGGAAGCTATGTCATGG
+TCAGTGAATAGTCTTAATGATGTTAAGATAAAGCAGCCTAATGGCGACTGGTATGAGGCA
+CGAGGGACACTATTATCAGGCTGGAGAGCCGTCTATCCCGACC
+>ds2020-328_171
+GGTCGGGATCGCGTTTATACAGTACGCGTGTTGCGATACTGATAGTAGTGAGCGGGGGGA
+CTTGGGATAAATTTCCTGAGCCAGGGAAGAATCGATTGGCGATTTCGGCGGCGGCGAGGA
+GGTGTTTCATCCAGTCAAAACTTGCATCATCGGAAAATCCGAGGAAAGCCGGGAGAGTAC
+GGAGGTCAGCGTTGCCCGGGATGTCTGGGATGTTCCAGCGGCGGATACGCGAATGCTTCG
+CTGTTTCTTCAAAACTACCAATTTTGTCACCTGTTTCAGCAGGGGCAAGCCAGGCCAGGT
+TGTAGGCGAGGGATTGGAATGAGGCAGTAGTGGCGGCCGTT
+>ds2020-328_172
+ATTACGGCGGTCGGGATAGACGGAGGGCGTCCTTCTAGCACCCCCGACACGCGAGCGCTG
+ACATTTGCGTCATTGGCGTCTCTCCCGACTGGGAATCTGTTTGGGAGCACGTTTTCACAA
+TTGTAAAACGCAAAGTTGGCAAGGACGTAACTCGTTGTATCTGTTCCATAGATTGCACGG
+AGCTTGCCCCATTCATACTTTGTTGATGCCCAAGCGTGTATTTCGGGGTTGCGTGATGTG
+AAGTATTCGATGTCAAAAGATGGCATGTTCGATATCATTATGAACTTGTTTTTGAGAGCG
+CGGTCAGTTCTGATGAGAACATCTCGTCTATCCCGACC
+>ds2020-328_173
+GGTCGGGATAGACGGAGGGAGTCCATCAATAAATGGACCATTTGTTACGGAGACACAAGA
+AAAACCTAGAAAGCATTTTTTCTGCAAGTCATCTCGAGGCTTTCAAACGCATCCAAGCAA
+TTGGTATGGTATCCGATTGATAGAAACCATAGATTCGCGTCGCCTACTTGCTGAAAGCAC
+AAATAGAATTGCCGATCATTCATTGTATGAAGTTTTTAAGACCTCACTAATCGGCCTTAC
+ATTTTTTAGTTCATAATGAATGAAATGACCCCCGGATGAAGAAAAAATCTCCCTTCCTTT
+TTACTAAACCATGGGGAGCCCTCGTCTATCCCGACC
+>ds2020-328_174
+GGTAAACGGACTTCTGGAGCAATCGACTCCCAGGGTGTGACGGGCGGTGTGTACAAGGCC
+CGGGAACGTATTCACCGTGGCATTCTGATCCACGATTACTAGCGATTCCGACTTCATGGA
+GTCGAGTTGCAGACTCCAATCCGGACTACGACGCACTTTATGAGGTCCGCTTGCTCTCGC
+GAGGTCGCTTCTCTTTGTATGCGCCATTGTAGCACGTGTGTAGCCCTGGTCGTAAGGGCC
+ATGATGACTTGACGTCATCCCCACCTTCCTCCAGTTTATCACTGGCAGTCTCCTTTGAGT
+TCCCGGCCGGACCGCTGGCAACACAGGCTAAGGGTT
+>ds2020-328_175
+GGTCGGGATAGACGGCAGACTTGAGTACCGAACTGGGACCAAGACCAACGGCTCCACCAA
+AGGTGCCTCCTATTCCCGTCATCAAGAGTCGCTCCAGCCCCGAAGGCGAGGACAAAGAGC
+ATGCTAAGAAACCTGAGAATGGTAATGGTCGTGAGAATGGAGGTGTTGTGAAACCCAGCC
+ATGAAGGAGCTAACGGTGGTGGCAGCAGTCATAATCGGAAGCATTCTGAAGGTGGCAGTG
+GTCCTAATAATGGGAAGCCGAATGGTGGAGTTTGCTGGTGATGAAGGAGGAAACGATGCT
+GATGCGATGAAGGGGTGCTATACGTCTATCCCGACC
+>ds2020-328_176
+GTAATACCCGATCCGATAGTTTACGATATAGATAGATATATATTTAACAACAACATTCTA
+AGAAAGGATATTTTTAGATATCGGTAGTTGTCCGGTCGTACCCAAACAGTAATATTCCAG
+AGGGAAATGCACCTAAGATCAAATATTTCGAGCCGGCTTCCGTGGAAAATTCATACGTTC
+TTTTTGATGCTGCGATCACATAAAAACATAAACTTTGAGGTTCAATAGCTAAATACATGG
+CAATTGAATCATGAGCCGAGATCATAAAGAGCATACTGCGAGTAGGAAGTGGAATTAATA
+CAATGAATTCAAAAGCAATGGTCGTCTATCCCGACC
+>ds2020-328_177
+TCTAGATAGAAAGCCCTATGATTGGAAACTACCACGTTAGGTTTGGAGAGAGACGGGACC
+GGTTATATAATAGGGGGAGCAGATGCAAGCTTTTTCTTTCAATAGCCGGCCAAATGACTA
+CAGGATCATCGGTCTACTCTACCTCAATTCACCATTTCGAACCTTATACAGAAGGTTTTT
+CCGTACCAGCTTCTTCTACCTATACCGCAGTTGAAGCACCTAAAGGAGAATTTGGTGTCT
+TTCTGGTCAGTAATGGAAGCAATCGTCCCTACCGTCGTAAAATAAGAGCACCTGGCTTTG
+CCCATTTACAAGGACCCTGTTCGTCTATCCCGACC
+>ds2020-328_178
+GAAACAAGGGATCAAAGCGTCGAGGCGCGAAGTCTTTAAGATCGGATGCAATTCCGAAGC
+TGGTACATGCTGCACTGGTCCATGTTTCTGGCAGGCCTGGAATCTCTTAGCATATTAAAA
+GAAATCGGACAAGATGGTTGGCCTGTAATGGCCATGCCTTCTGATCAGCCAACGCATTTT
+ATGCCCTGCTTGATGTGATCCACATACTATACTCCATCATGGACTTGAAACAGAATTTTT
+TCGGCTTCTTGCTCACTCACACACCTGAGGAGCAGTCCGTCCTTTCCACGCCGAACCAAT
+ATCCCGACCACGGACCAAAACCGTCTATCCCGCCC
+>ds2020-328_179
+GGTCGGGATAGACGTGATTCTTGCCTATGTATGCTCTTTCCTGCCCACATTGCTTGCCCT
+ACTGTTCTGGTTGAACTACGGCTTTGGCTGAACTACCACCTGACACCAGTATTCTTAGTT
+TACTGTCTGCTTCCTGCCTGATCGGTGCTGACTGCCTGTTCTTGCTTGTCTTGGGCCTGC
+ACTTCTGGCTTACCGGCTTGCTTGTTTGCCCGACTACCTGACTATCTGACTACTACGACT
+ATTCCGCTTGGCTATCGGACTACTTAACATCGGGATTCTTGTCTGTGCTGCTTACTCCCC
+TTCTTCTTACCTGAACAAAACGTCTATCCCGACC
+>ds2020-328_180
+GGTCGGGATAGACGGTGGGTGGTGGTTGATCTCAATGCTAATGGTTATCCCCAAGGTTCA
+ACGAATGAATGGGGCTATGATTGTACCCGGATAGAGATGACGGTCTTCCTCTGATGTCTC
+CAAGCCGGCCATAATAGAATAGATAGGCGAAGCAGCCAATAGCAGTCTGTTCTCGCCTAT
+CGATAGATAGTAGGTTGCTTCCAAGCTCAAACCATTTGAAACTGAATTGCTACTTTATTC
+TTGTTATTGATAGAGTGGTATTCTCCGCCCCTGTCAAATAAAGTAGAGGGAGAGAACTGG
+AAGAGAGAAGGGAAGAGTGGCGTCTATCCCGACC
+>ds2020-328_181
+GGTCGGGATAGACGCTGTTCCCCAATAACCAAAGGCCATGCACCACCTGTTCCTCCAAGA
+TTTCTGCGTGGAAGGCTTATGACCAATAAAATAACCTCTCTCTTTTGCCTTTCGGCAATT
+AGCTTGTACCCAGCCAAAAGTTCCCTGTTGCTTTGAAATTGAGTACAAGTACATGAACTG
+CTCGAATGTTGGCTCTCCCAACCCAACCAACCACCAAGCAATGTATACTCCATGAAGCAG
+AAGCCAGAAGTTGGGATTATACTGCCCCGGCGCATACCCCAGCTTGGCCAACATCATCTG
+CACCCAAAGATGAAGCGGCGTCTATCCCGACC
+>ds2020-328_182
+GCATTAGGCTATTGAATCTCGCGACTAGAATTACGGCGTCGGGATAGACGCTTTCTCCCG
+GTCGAGGTTCAGTACATCCGGGTTCTCAGCTCGATTTTCTCTCTGTATCCACCTTTAGTC
+GGTATTCAGGGTTCCATTCTTGATGTATCTACTATTTAAGTTCCTTCTGATCTATCTACT
+GTAGGTTCAATCCCCGGTCATTCTATCTTTAGTGAGGGGACGAGTCATCTTGCTCGACAT
+CATGGGATCGCGCTTTCATTAACGGGCTGCTTACTCCGAATTGGGATATATAATTAGCCC
+AAGCATGACAAGGCTCCGTCTATCCCGACC
+>ds2020-328_183
+GGTCGGGATAGACGCCGGGTTCCGCTTTCCGGCTAAGCAAGTGATAAAGGAGTAGCGGAT
+CCCTTTGTCTGTCGCATGATACCGGGGAGGCCTTCTTTTAGCACCGGTAGCTATGAGTCA
+GTCGGGGTAGTCACTCCCAAGAGAAGGTAAAGATGGGATCGTTTGTATGCGCCATACCTA
+TAAGAGGGGAGAGAAGGTCGAACGCTAATTCCTGACTGAAGGGCTGAGAATGAACACAAG
+ACTTTGAAGACCAGACTCAGGAAAGCGGACGGGAACAACAACGACGTAGTGACGTTGACT
+AAATCCGAGGGGCCAACGTCTATCCCGACC
+>ds2020-328_184
+AGGATATTCGAAAAAAACGCAAGTAGGACAAAATGACTGAGGTCAAATGGCACGCGGTAG
+TCATTCAAACAAAAGACGCTGAGGAACCTCCATCGAGCCACGTGATCCGCTACAACTCAC
+ACAAAGACTAGGTTCGGCTTCTAAAAAGAAAAGGGGGGGGGGAGAAAAGAGGACAGGGGC
+GCTCCCCGCTAACCGAAGTCTTGGATTTTTCTTTCAAAGGAAAGACAAGCAGTGGTTTCC
+CAGTTATCTTCAATTACTTAGTGAGAGCTTATCGAATTGATGTAAGGCGGGGATACCATG
+TAGGAGGCCTGCCCTGCGTCTATCCCGACC
+>ds2020-328_185
+GCGTGGACAAGGGCGGTCTTGCTTGGCGCGAAGGCTGCTGGTTCGGGGGTAGGGTACGGT
+ACTAAAGGTCCTCGGACTTCCAGGCGGTTTTTCTTTTGGGCAGCTGTTCACCGTTGGATC
+TCGCCAATACAGCCCCCTATAGTTTTCGTTACCGAGATATCTTTTTTTTTCATTGTTCCC
+AGGGATCTTTTGGGTAATCCGCTCCCATGCTGCAAACAGTCAAATCTGAACTAAACCTTG
+TTGCTCTTCTTTCTTTCCTCGCGGGCAGGAAGCACACCAGCAGCGTGCGTTGCGTGGAAA
+GAAGGAAGAGGCAACGTCTATCCCGACC
+>ds2020-328_186
+GGTCGGGATAGACGGCTACTCCCCCTTTTCTTCCTTCTTTTCCGTGTCTTTTTCTTCTTT
+CTTCTTTCCTTTGTGTCTTTTTCTCCTTTCTCCCTTTCCGTGTGTCTTCTCCTTTCTTTC
+CCTTTCCTTATTGGTTTGTCTTTTTCTTCTTTTTCCTTTTTCATTTCTTCTTCCTCTCGT
+TCTTCTTTTCTGCTCTTCTTCTCCCCACTCAATAGACTCCATCAGCCTAGCCACCAGGGA
+TCAAGGAGGAGGTATCTGGGTCAATCCACAGAGGGTGATTGTGATTCTAGAGGTCCACGG
+ACCCCCGTTCTAACTAGGTCCACGGC
+>ds2020-328_187
+GGTCGGGATAGACGCTGTGTCCCCCTGGAGGGGGAGATTGTTGGATCCAGCCCATAATGA
+AGAGACACCATGATGATGTCTATTGGTGAAATGTTTTTCCCTTGCCATCATGACTCTTAC
+TTTTGGAATTTGGTTTTGGCCGGTTTCTTCGGCATGAGGTGACTTTGTTTCTTTTGGAAT
+TTGGCTTTAGCATGCAGCGGGTTCTTCGGCAAGAAACATGGTGGTAGAAAGTGGAGGTAA
+TGATGGGTGAGAGACCAACATCATTATGTTTTCTTCTTTTCGCATGTGGTTGTTTTTTGG
+CGCGTTCTTGCACGTCTATCCCGACC
+>ds2020-328_188
+GGTCGGGATAGACGAGGGGTAAAGGTAGATTGGGAAAAAGAACTCGGTAATAAAGCAACG
+CCACCAGATGAAGTAGTAGGCTATGCAAATGGAGTTTTTAGTAGACATGCTGCTGATGAA
+ATTATCGGTCAGGCTATAAAAGATGTTGTTACCACAGCTTTTCCACACGCAGTACCAGCT
+AAGTTCAGTGATTTTATGGACGATGCATATGAGTGGTTGGTTTCTGGATCATCAGCTGGT
+ATACCGAGAGCACTTAAGAATTCGTCAATGAGGACTTATATCCTAAAAGACTTGGGTCTA
+CATACCAAGGGCGTCTATCCCGACC
+>ds2020-328_189
+GGTCGGGATAGACGAAATTGGCGGATGGTGCTAAAGGAGTTGGGAGAAGAGTCCACCTAT
+AGTTATAGTAGTTAGAAGCCCAGCTTCAATCGTCAGCAGGTGAGTCAGCAAAGTTCTCTA
+GGAAGTCAGCCCATTGCTTTGACTTTTAGCTGCCACTGCTTCATCGCATCGGATGTTGCC
+CTTGAATTTCTTTCTGTAGCCGCATCGGAGGATGTAATAGCAAAGTATGCCACCGCTCCT
+TCGGAGGTCTCCTCCCCCCTTTTGGACCTATAGATTGGTACCACACGAAACCGGACCCAA
+CGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_190
+AGTAAACTGGTGGCTTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTAAGGCT
+TCTTTGGTGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAAGGATGCTTGGGTGGTGAGT
+AGACCGGAGGAGTAGGAGAAGGTGGTGGTGGTGGAGACTTGTAATGGTAAGGCTTCTTGG
+GTGGTGATGGTGGTGGGGGAGACTTGTAGTGGTATGGGTGCTTAGGTGGTGAAGGTGATG
+GTGGTGGTGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGTG
+GAGACTTGTAGTGGTAGGGGT
+>ds2020-328_191
+GTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGATGGTG
+AGGGTGGTGGAGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTG
+GGGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGTGGAGACT
+TGTAGTGGTAGGGGTGCTTGGGTGGTGATGGTGAGGGTGGTGGAGGAGACTTGTAGTGGT
+ATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGGGGAGACTTGTAGTGGTAGGGGTGCT
+TGGGTGGTGAAGGTGATGGTG
+>ds2020-328_192
+CGGCGGTCGGGATAGACGCGTGTGATTGGTGCGCCTGTTTGGAGTTGGACTTCTAATCAA
+ACGATTGTGGCCGAGAGAGGAACTTATCTCGGCCGTTAGGTTAACGGCCTGAGCTACAAG
+GCCATTTAGTGGTGGTGTTGGTGGTGGATTTTGGGCGGTGCTCCGGCGCGTTGCTCAGAG
+AGCGACGGTCGTATGATATATGGGGTGAATGAGGCGATAACAGGGATGATGCTCCGGCGC
+CTTAAAAAATCAAGGGTCGTATGATATATTGATGAATGAATTTTCCTTACAATCTACCAC
+TACTCTTAGGAAAGCATGTAA
+>ds2020-328_193
+GGTCGGATAGACGGAGGAACGAGGTGCGCTCAGTAAAAATTAAAAAATTAACAGACGAAA
+AAATTGCAAAAAAGAAAGTATTAATTTCACTTCTAAATCTTTAATCAATATTCTTTTTGC
+CTTGGTGGATCTCTCTCTCATTTAATAAAAGTCTGGAATCTTGGGTTACTAATTGGTGGA
+ATACTAGGCAATCCGAAATCTTTTTGAATGATATTCAAGAAAAGAGTATTTTAAAAAAAT
+TCATAGACTTAGAGGAACTCCTACATTTGGACGAAATGTTAAAGGAATACCCGGAAGCAC
+AATAGAGCGTCTATCCCGACC
+>ds2020-328_194
+GGTCGGGATAGACGTTGGGGTTCGGTGCTTGGCTGTGGTTGGCTATTGATCAAGTAGTAA
+TCCGTTGACTACATTTGTGCGAGTGATGTAACTGGTGGGTTTGTGCTTGTACCATCGTCC
+GCGTGCGGAGTTGCGATGGGAGGTTCGCCGTGTAATTGCACTTGCCTATTGTAAGTGGGC
+TATCTTTCCGTTCGTTTGTAGAAAAGGCGGTAGTGGCAGTGACCTTGCTGTGGCATGGAC
+AGGTGGGTAGCTACACTTAGGATGCTGCTGTATCTGTGGTTTGGTTTCTGGGTTGCTTTC
+GGGTGTAGCTGGCGGCCGTT
+>ds2020-328_195
+GCCGTGGACCTAGTCTCAGTCCCCTGGTGGCGGATCAGCCTCTCAGACCCGCTACAGATA
+GTCGCCATGGTAGGCCTTTACCCCACCAATTAGCTAATCCGACTTAGGCTCATCTATTAG
+CGCAAGGTCCGAAGATCCCCTGCTTTCTCCCGTAGGACGTATGCGGTATTAGCATTCCTT
+TCGAAATGTTGTCCCCCACTAATAGGCAGATTCCTAAGCATTACTCACCCGTCCGCCGCT
+AAGATCAGTAGCAAGCTACCTCTCTCCGCTCGACTTGCATGTGTTAAGCCTGGCGGAGCG
+TCTATCCCGACCGCCGTA
+>ds2020-328_196
+GGTCGGGATAGACGTTTAGCAGCCTTAAACTCTTCATCTTCAGGGTATTGTGAGTGATAT
+GCTCCCGTAGGTGCCCACTGCCACCTCTTATTCCAATAACTTTTCCACTTTATGTTATCT
+GGTTTACTCCCGAGGTTTTTCAATCTAGTGAACATTTCTCCACTAGCCCTGTATATCTGC
+TCTCTAGTGAAAGAAGCGACGTTGGGTTTGGTTCTGTGCTCTTTCTCGGCTTTCCAATCC
+ACTTCTCCTATACCTCTGTTGACTAAAACTTCCATTTCAAAGAATGGTTTTAAGTTGAGC
+GGTGCGTCTATCCCGACC
+>ds2020-328_197
+GGTCGGGATAGACGCCTCGAACAACTCCCTCTCTCTGTCCCCTCCTCTCTCTGTCTCTTT
+CTCTCTCCCTTTCTGTCACTCTCCCTCTCTTTCTCTGTCTCTCTCTTGCCCTCTCTCTCC
+TTGTGTATCTTCCCCACCATCTCTCTTTCTCTCTCTTTGTTAGGCTCTGTTTCTCCATCT
+CTCTCTGCCTCTCTCTCTCTCTCCATCTCTTCCCTCTCCCCCCTCCTCTCTCTGTCTCTG
+TCTGTGTCTCTTTCTCCTTTTCTCTCTCTCCCTCTATCTCTGTCTGTCTCTCACCCCATG
+TCCTCGTCTATCCCGACC
+>ds2020-328_198
+TAATACCCATTAGATTAGACGTTACCTGCAGAATAAGCACCGGCTAACTCTGTGCCAGCA
+GCCGCGGTAATACAGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGAGTGTA
+GGTGGCTCATTAAGTCACATGTGAAATCCCCGGGCTTAACCTGGGAACTGCATGTGATAC
+TGGTGGTGCTAGAATATGTGAGAGGGAAGTAGAATTCCAGGTGTAGCGGTGAGATGCGTA
+GAGATCTGGAGGAATACCGATGGCGAAGGCGCATCTCTAGCCAAAGACCGACATACCAGC
+ATTTCGTCTATCCCGACC
+>ds2020-328_199
+GGTCGGGATAGACGGAGAAGGCTACTCCCTTCCAAGTGGCAATGTGTAGCTCCACACCAC
+GAGCTACTCCATCAATCGGTTTGGCAGTTGAATTCACCGTCTTCATACTGCCTGCTTCCT
+TTGAGACCCGACACCCAAGTCTCTTTGCTTCCTGCACGGACATGAAGTTGTGTAAAGCAC
+CCGTATCCACCAGACAACGGGTTGTCTTGCCATTCACCATGACATCGACGAACATCACGC
+CTTTTGCTTGAACCTGTGGTTGAGCTCCCTTGGCCTGTAAGGCATTGAAGCGGTTAATGG
+CCCCTATTCCTGCTTC
+>ds2020-328_200
+TACTTCCTTCGTCAGCCTTCCTCCATAGCTACCTTTGAAGGGAAAGCTGGCTAGACCAAG
+CCTAGTAATTAATTGAATAAGAAGGAAAAAGGCCACTCAGGTCTATATCTAGAAAGGAGG
+CTGGATTGGAAGATTGAGAGACCCGGGACAGTGCAGGTTTGCAGAGAGGCTAGAGCATTC
+CCTTCACTAAAATAGAATAGTAGGTAAGATTCACTAGCTAGAAGTTTACTGAGAAGGGTA
+GAGTTTGCAGTAATCGATGAGAGAATGGTAATGCTAAAGGTAGGAAGAAAGAAGGGCAAA
+GACTAGGTCCACGGC
+>ds2020-328_201
+AGACTTCGGTGCCCCTCGGTTTTCTCTTATTTCTCTATCATCTTCCTGCTCTCTTTTCTC
+TAGGAACGTCATTCTTCCTACGTATCTCATCTGATTTTTGAACAGAAATTCCAACGCTCC
+CAGACTTCGGTGCCCCTCGGTTTTCTCTTCTTCCGTTTTCGATATCCCTATATCCTGACC
+TCTGTATGATAGTATCATATTCCTGTCCTCATGATTTAACTTCCATTTCCTATCCACTAT
+GAAGTCTTCTATTTCATGTTCTATCATTAATTTCTTTCTACTAGCCTTCACAACTTCGGC
+GCGTCTATCCCGACC
+>ds2020-328_202
+GGTCGGGATAGACGAAGAAGCGAACGTCATCGTCAGTAGCCTCGGACCAGTCAAGGCGTG
+GCATACGGAGCGCAGGGAGGTACCTAATTTCCCTCCAGTGGAATCGTTGCTGAGCAACGA
+TGCACACGGCGAGAAACGGGGGGAAGAAAGCCGTTTCAGACACGACGGTGTCATCAACAA
+AGAAATCATCCCCACTGACATCAGCAGCGTTGACTACGAGGAGGGCCCCAGACAACGCGA
+ACTGCGAAAGTGGTCGGTACTCCATAACGTCCCGTGAAAACAAAGCCACAAGGAAGCTTA
+TCGTCTATCCCGCCC
+>ds2020-328_203
+GGTCGGGATAGACGGCGGCGAAGATTTAACACCTCCTAAGGGCTGGGTGAGAGAAAGCGT
+CCTTTGTTGATACCTAGTGTACACCGCAACCTACTGAAATGGATTAATAAACGTTGCTTT
+CTATTGCTTGTAGCGGCGTTGCTTCCTTTTGTTCACCGCGAATAATTCAATCTTGAGAAA
+GAAGGCCTTGTGGGGCATCTCCAACAGCGCCAAAGAAGGAAGATGTTAAGTATTCTTTGT
+AGACTCGCACCGCTCACTTACGGTTTTATACAGAGGGGGGTTGTATTGAAGGGCCTTGTG
+ACGTCTATCCCGACC
+>ds2020-328_204
+GGTCGGGATAGACGAAGAGAGAGAATATGGCTGCTTAGCAGCGGAAGCTGGGGATCGAGA
+AGCGGAGGGAGAGCTTAGGCTTGAAATGGAGCTAGGATACCGGTATTTTTCCCTACCTGG
+ATCCGAGTCTTTCTCTTCTCCTGGACCGAGCACCGAGACCGAGGAACGAGAGGCTGGATA
+CGAGTCTGATGAGATCAGAGCCAGTGAAGAGAAGAGGGAAGGCTGACTCTGCTAGGCTGG
+CTTGCTTGTTCGACTAGAGCACATAAATAAGGTAGCTTGCTTACTTAGAGCGAAACGAGA
+CGTCTATCCCGACC
+>ds2020-328_205
+GGTCGGGATAGACGTTAACTTGAAATCATAATCAGTCATTAAGTGGGTCTTGTATGTCTT
+GTTTTCATATGTAGATGTTTTGTAGTATTTAACCATAATCATCTCTATGTCTTCTGTTCC
+TGACCCCTCGGCATCCCATGTTGGTGCTATCTGAGCAACCACGTCCATACGAGTCCATGT
+GTAAACAGTATTATATGTTATCAGCCTGTCATAAGGGGTACCAAACTGGTGTTCTCTGGG
+CAAAACTCGTTCAAGAGTGTATGAGGTAGCTTCGTCTAAGGTGGCCAGGTCGTCTATCCC
+GACCGCCGAATTCA
+>ds2020-328_206
+AACGGCCGCCACTAGATTATCCGTGTCCACTTGCCTAGTTATATCATCCAGGACAGTGTA
+CCAATCGTTCTCGGAGAGGTAGGTGATAGGTGTTCCACTCAGCAATGTAATCTCTATGAT
+TATATTACCGGATCCAGTATCATATGTTATGCTAGGACCAGGGCCATTGGCATCACGTGC
+ATCAGCTACAGCTTCTTGAATCTCTCCGTTGGCAGTTTCAAGGTCATCTTCGTCATAAGG
+AGGATCGTCTTGGTTCTCTTGAACTTGAACGCTAGACAACACAGTTACTCCAAGATCTGG
+TAGTGGCGGCCGTT
+>ds2020-328_207
+AACGGCCGCCACTAATCCGTCTTGGTTGATGTAGACTTAAGAAAGTTCTTTGAGCTGGAA
+GTTCTTGTCAACAGAGTGGATGGACTGGTCAACTGGGAGGAGGAGCACAAGAACAGGGTG
+TCCCCTAACTTGGCCGAGATGCCGGAGGGATTGGTTTATGAAAGGGCCTCGCAGCTCTTC
+AGTAGATCGATCTCAGCGGGTAAGAGACCGAGGAAGTTTGATTGGCGGGAGTACTGGCAG
+AGTAGGTGGCAGTGGAGTGCGGCCGGCAGCATACACTCGCAATATTCAGAAAACGAAAGT
+AGTGGCGGCCGTT
+>ds2020-328_208
+GGTCGGGATAGACGTCAAGAATCCCGCACGGGTTCGATTCCCGTAAGGGATAGGTACTCA
+TTCCCGGCCGCTTTCAGTTAGTGTTCATTGCTGAGTGATCGCTCGCTATTTGGCTGGAAA
+GGGTGGTCTGGAAGCTTCCTCTCTCCCAGCAAGCAAGACGAGATCACCGCTTCTCTCAGT
+AATGGACTTCCTTGAATTCTTCCTTATCCTGATTCCAAAGTTTTTATTTATTCTTTACTT
+TTAAGTGAAAAGGGGGAGTTGGATCATAAAGAAGAGTTTGTTCCTTAACTAGTAATCAAC
+GTCTATCCCTACC
+>ds2020-328_209
+GGTCGGGATAGACGTTCTTTAGGTGGGGAGGATAAGTTTCAAGTGCGGATACTTCATTTC
+AAATGGGTGAGAAATTTTTGATTGAGACAACATCATCCATTGTGATGCTAACCATCCCCA
+AGTGGGATTGGGTTTTTTTACCAAGTGCCCCAAGAAGTGAGTCGATAATGGTTACCTGAT
+AGGGGACCTAGGCTTGTTGATTGGTAAACTTCACTGAGTTCCTCGGCCAACCCTTTCATT
+CCCGAATGGAAATAGGGTACAATTGCTACAGACGATCCTTTAAGGATGTAAATGATGCGT
+CTATCCCGACC
+>ds2020-328_210
+GGTCGGGATAGACGGGGTGCGCCCTTGGATTGCTGTTGCATATTCAGCTCCTGTTGCAGC
+TGCTACTGCTGTTTTCTTGATATATCCAATTGGTCAAGGAAGCTTTTCTGACGGTATGCC
+CCTAGGAATCTCCGGTACTTTCAACTTCATGATTGTATTCCAAGCTGAGCACAACATCCT
+TATGCACCCATTTCACATGTTAGGCGTAGCTGGTGTATTCGGCGGCTCCCTATTCAGTGC
+TATGCATGGGTCCTTGGTAACCTCTAGTTTGATCAGGGAACAGATATAGTGGCGGGCGTT
+GCTGTGTATTA
+>ds2020-328_211
+GGTCGGGATAGACGAGTCTGTGTTCTGCGGTTCGGCGGGTAGAGGAGATCACTATGAAGA
+ATAAAAGGCATCGGAAGAGGGCTTTAGCCCAAGAGGTAGCATTTGGGAACGATCCATATC
+AATTGGTATGAAAGCCTACAGCAAGAAAGAAGGAAAGAACGAATGATAGGAATGTAGCGG
+AAGAAAAAAGTTCTTTGAAGGGGGCCCACCGCCCTCCATTTGGGAACTCTTTTCTATCCT
+TGTCCCTTGCCGGCTAGAGCCACGGAGCTAAAGGCGGATTCTTTAGTCGCTTATGCCGTC
+TATCCCGACC
+>ds2020-328_212
+GGTCGGGATAGACGTTGGAGCGGGCTGGGGATCCTATCAACTTGTTCCGACCTAGGATAA
+TAAGCTCATGAGCTTAGTCTTACTTCACCGTCGAGAAACGAAAGAAGACTTCCATCTCCA
+AGTTTAACTCAGACGTAGCTCGCTTCTTTTTGGGTGTGAAGCAGTGTCAAACCAAAATAC
+CCAACAAGCATTAGCTCTCCCTGAAAAGGAGGTGATCCAGCCGCACCTTCCAGTACGGCT
+ACCTTGTTACGACTTCACTCCAGTCACTAGCCCTGCCTTCGGCATCCCCGTGTATCGTCT
+ATCCCGACC
+>ds2020-328_213
+GGTCGGATAGACGGTCATCTGGCCTCGAATACGGTTCCCTTCTTTTATTCTATAGCTTTT
+ATTCAATTAGGGCGAATACCTTGTAACCGAATTTCTTTCTTGAAAGATATGCTACTTCCC
+GGTCGAGCTGTCTTGTAACGGTCTCTAGGGTCTTCAGTCGAATTTTTCTTCTTTCCTGTA
+GTAGTTCATCTGATGAGTTCATCGCGCAATTTGAGTTTAAGCATCGGGCTTCTCAAAGCT
+ATCTTCTGTAGGGATCGGAGATCGCCTTGTATAACTATCGATCAATGGTATAGAATAGTG
+GCGGCCGTT
+>ds2020-328_214
+GGTCGGGATAGACGGCATTAATATGTTAGGGTTATAAACCTTCACGTTAGAATATGTCAA
+TTTTCCATTGTTAAATAACGCATACGTCTTTGGATTAACTTTAACTTTGATATCCAACTG
+CCTACCGGACTGTATTATTTCTATCCAATTCTTAGCCCTCTTTATTAAAGTGTGCATTGG
+CATTACAAACAGGTTTGCTGCTCCAGTCCCTGGTATATCTGGCATTACATGACCATTTGC
+ATTTGCAGCCCAATTTTTGTATTTCTTACCAGTCATCGCATCATACACCGTAGACGTCTA
+TCCCGACC
+>ds2020-328_215
+GGTCGGGATAGACGAACGAGATGGCTAAAGCAGACGGGGAGCGTGAAAGACTATGTCACC
+ACGTTCACCAACCTATTGTTCGAGGTGCCTAGCATGACGGACGAGGACAAGCTCATGTAC
+TTCATGAGTGGCCTACAGAATTGGGCCAAGCTGGAGTTACAACGGAGGCACGTCCAAACC
+TTGTCAGAGGCATTGCTGCAGCCGAGTCTCTTGTGGAGTTCAAGAGAAGTGATCAAAGCG
+ACTCTAAGTTCAAAGGAAGGAAAGATGGCAGCGGATCCAGTGAGGGAAACTGGGCGTCTA
+TCCCGACC
+>ds2020-328_216
+GGTCGGGATAGACGCGGGGTTTCTGTGTGAAGGGGTCGTGATCCAAGTGGTCCAGGTGCT
+TGATTAGCTTGTGGAGGTTGGGAAGGACGATAAGACAGTGGTTTGTCTCGCTTATTGGTT
+GAGAGGATCTCAGGAGTGTGAGCGTCCGGGAGTCGACCATTTAAGTCTTCTTCTTTGAAG
+GTGGTATTAGACATTCTGTGTTAACAGAGGGGTAAGGGGTAGATGAGGTTTGGGTGTGTT
+AGTTTTCGTAGGAAAAGTTCAAAAGTTTGAGTGGGAAGGAGGGATATTTACCCCGTCTAT
+CCCGACC
+>ds2020-328_217
+GAATTACGGCGCTCATGTCTCGCCCCCCCCGTCTAGTGACCGGTTCCATGTTTCCCCCGA
+ATTTCATCAGTTCCAGGCTCAAGTGCCTGCTCATCCATCTTCATTCCAAAGGCGAACATT
+TCCTTGAGTGACTGTAACTGCTATGGTTTACAGTCAATAGTTCTTAACCAACCCTTTCTC
+TTAGAGCTTTATAAAGCTTTAAGAGAGAATAGGGAGTAAGGGGGAGCTTCGCTTCATTAT
+AAAATTTACCCGGACCTTCTTTCTACTCCTGCGGAGCCCTGCGAAAGTAACCTCGTCTAG
+CCCGACC
+>ds2020-328_218
+TGAATTACGGCGGTCGGGATAGACGAAAATGGGTGGTTGTGGTAGTTGAGGGCTTTTCGG
+GGTGTCAGGTTCCGATTCGGAGCTGGTGGTGGAGGCTGGTGGGTTGGTAGTAACGGAAAC
+TGCATCTGATATCGATGGTTGCTTGGTAGGTGTTGGTCTTGGTCTAAGAGACATGTTGGA
+CTGTGGCGGCTGAGGTGGCGGTGGTGGTGGTGTTGGCGGTGGCAATTGTGGTGGCTTTGA
+GAATTGTTAGTATTTAGAGGAGACACTTGGCTCTTGGCGTACGGGGGGAGACCGTCTATC
+CCGACC
+>ds2020-328_219
+GGGGCGGGATAGACGGCACCTGGACCTATAGCTTTTAAAGTAGCAACAGTGGTCGGCGTT
+ACACTTCTGGAAACCTTCCTTGTGCATGAAACCGTCAAACTTTTTGTACCACTGTCTTGG
+AGCTTGTTTCAGGCCATACAAACTCTTCTTAAGTTTGCACACCATGTTCTTATTCCCTCT
+TTCTGAGAAACCTTCTGGCTGGTGCATGTATATCTCCTCATCCAAGTCTCCGTGAAGAAA
+TGCGGTCTTCACGTCTAACTGTTCAAGATAAAGATCTTCAATGGCAGTGTCGCGTCTATC
+CCGACC
+>ds2020-328_220
+GGTCGGGATAGACGTGCCCTTGGAGTGCGCTCTTTGCCCGCGATTGTTCTTCTCAACCTG
+TCATAGAGCTCGACATCCTCCAATACGACCTGCTTGTCCGCGCTATGGTACACGTACCAC
+TCAAACCCAAGGCACCTGTACACTGTTACGTCTCCGCGGACATAGACTTCCCTATCTTTT
+TTGATCATTTCCCAGGGGTCGACAATTTTATTACACTTGTCGACTCCACACAACACGAAC
+TTGATATGGTATGTATCCCCAGCAAGTTTGTTTATATCCCAAAGCACTAATCCGTCTATC
+CCGACC
+>ds2020-328_221
+GGTCGGGATAGACGGGCAATACTCTTCATTCTTCGTAACCTTTATTTTTTGTATTTTTAA
+AATTCTTCCATGACTTAACCTCCAAATATCTCATGAAGCTTTTCCAAAAGCTTCTCAAGA
+ATTCCACATTCTCCACCACCTCCTCCTCCTCCAGTACACTCACCTCCTCCACCAAAGGCG
+CCTTACCACTACAAATCCCCACCACCACCACCCAAGAAGCCTTACCACTACAAATCTCCC
+CCACCACCACCAAAGAAACCTTACCACTACTCATCTCCTCCTCCTCCTCCTCCACACAAG
+AAGCC
+>ds2020-328_222
+GGTCGGGATAGACGGGCTTTCGTTCTATTTCTTTATCTCCCCATGAATCGTATGTTTGTA
+ACAACAGGGACAGAATTTTCTCAATTCCAATCGACCAGGCGTATTGTGTCGATTCTTTTG
+AGTAATATATCTGGAAATGCCCCTTGATTCCTTATTAACACGATTTCGAAGACAACTGGT
+ACATTCCAAAATAACTGTTACTCGGACATCTTTACCCTTGGCCATGAACCTCCTTTGGTT
+TATGATTCACTCAATTCTTTAATTTTCCGATCCGAAGCAGGGCATGTGTTCGTCTATCCC
+GACC
+>ds2020-328_223
+GGTCGGGATAGACGTTTCTTTACTATAGATAGATTGTCTCACCGCGCTTTCGATCTCGTT
+ATGGCTGAATGATGCGTCAGCAGTGAAAGGAACAGGTAGATCTCATACCTTTATTTATAT
+AGAATAAGCTTTTCTTTTCAAGTAGTTTTAGCTTCTCGCCCTATAGTATAGGTAGGGAAT
+GGACTGAAAGCCAACTCCTGCTGATGAACATATACGCTACTTCCCGCCCCGGAAGAACCT
+ACTTCCATTCAACTACCTGAACAAAATAGAATAAGAAAGGGGGGAGGTTCGTCTATCCCG
+ACC
+>ds2020-328_224
+GGTCGGGATAGACGCCTATTTGCATTTGTTATTGGAAAATGAGGAGGAAGCCATCTGTCA
+TGGAGAGGCAATCCTCAAATACGTACTTTGACCTGACGGCTTACCGTTCTTAGCTTCTGA
+TGGGAATTCCAAGTCGTATTGTCCATCGGAACCATCAATCATAAGATTAGCCAGTCAGAA
+AGTCTTCGCTCTTCCAAAGCCTCATTAGCACGCCAGTCAGTCAGCTTGACCAAGAAGACC
+CGAAAAGGCACACAATAAGGAAAGGAAGAAAAAAAGTACCGTTCCATGCGTCTAGCCCGA
+CC
+>ds2020-328_225
+GGTCGGGATAGACGAGGAGATGCGATTCATCAACAAAGGGATAAGGAACTTTTAAGCCAC
+TCTTCTAATTGGCTATTTCCGATCGGATCTTGCCGGGAGTTAGTGTATTGATGCCGAGAA
+TACGCTCTTTGATAGAATAAGCTCTTGTCTCAATATACGCTGTTTTAGCATTCTCCGAGC
+AGGAGAACATGAAGCTTGTTTGCTCTTTTGATTGAGTTCACGAAGGCTTTATTGAAAAGA
+CTTTCTGATTTTAAATAGAAAGAAAGTCCAGACCAACGGCTGCCGGCGTCTATCCCGACC
+>ds2020-328_226
+GGTCGGGATAGACGCTATCGAGATAAATTTATTCTTCAACCTTATATCTGATTTATGTAT
+AAATTGTTCGTCAGTTTTATATTGTGAATGGATACTCCCAGAAGCACTCCACTGCCATCT
+GTTGGTCCAAAATTTTTCCCAAGACATCACCATAGGAGTTCTCCCGCTAACTGCTGCACT
+CGCGAAGATTTTAAGTGCTTCATTCTGGATATAATCAGCACTTAGCTTGACTGTTGACGC
+TTTTGTTCTATGTGTGAACTCAGCTTCCCAATCGAGCGCGCCGTAACGTCTATCCCGACC
+>ds2020-328_227
+GGTCGGGATAGACGAAAAGAGCCTCTGGGGAAGGGATTTCGAGCGGCGAACCAGGAAGCC
+GCTGCCCGACTCCCTGAGAAGGCTGCGAATTTATTTCTTCCCCCGGTTCAGCGGTCCCTC
+TAATCCAACCTGAAAGCCCCTCAAAAAAGGAAGAGGAAGAATGGTCATCCCCCCGGGGCC
+CAGATGCATCCATCATCATACCTGATGAGGTAATTGCCCCTACGGCAATCAAGCGCACTC
+CCCAATCTCCGTCTGTCACGACAACTAAAATATTTAAAAAACATAAAAACCGTTGAACG
+>ds2020-328_228
+GGTCGGGATAGACGCCCTTGCTCCATAGCGTTTCTTTGATGTTGCAGCTCCCTTCGTTGC
+TGCGTTCGTTATCGTTTGGTATTGATATATTCAGTACCTACGTGATGCGACGACACACAA
+AACGTTTCGTCCATCAGGACTCTTCAGGGCACATGTTTACTGTATATCTAATCGCCTCCC
+AAGCACTGCCGTCTTCGCTGAACACCCAACTGTGTCAAGCTTATTTTCCTGCTCTGCTGC
+TCGTGTCTGTACAATTCGTGCACACAGAAGTGTATCGCATCTAGACGTCTACCCCGACC
+>ds2020-328_229
+GTTACATGCATTGGACTCGCGACTTGAATTACGGCGGTCGGGATAGACGTTGTTCGCGGA
+TGGAGAGGTACAACATGGATAAATTCTACTTTAAATTTTTGCTATGTGGCTATTGCACTC
+CAAAATATGGAACGTATACATGGTGTAAGTTGTGTATTATATGTAGATCATGGCGGAGAT
+GATATAGATTTAGGATTAAGTGAACCTGCCATGCTGCCATTGTTCCTAGAAATAATGGAT
+AGCATGCTGTTCAAGGCGAATAAATGGAAACAAATGTCCGATCCACGTCTATCCCGACC
+>ds2020-328_230
+GGTCGGGATAGACGATTTGGACGCCTGGTCGGGATAGACTTCACGTACGCGTCTATCCGA
+CCGCCGTAATTCACAGCAACGGCCGCCACTATGACCTTGCTGTCCATTTACTTTCCTCAA
+TAATCGCTTCGGAGACACAGGGTCCTCAAAGTCGATAGAATCGTAAAGACCTGAGGTGTG
+CCTGGTCATTTGAGAAAGTATTTCTTTGCGTATACCCCATGAATTACGGCGGTCGGGATA
+GACGCCTATGTTGAGTGTTACGTTATCCCGACCCCCCGCAAATCCGTCTATCCCGACC
+>ds2020-328_231
+GGTCGGGATAGACGTACCTGGTGGCTTGTTTGCTTTCCTCTTTCGGGGAGCAGGACAGAT
+AGCCTAAGGGACGCGGAAAGACTACGGGAAGGCTTGTTTGCCGGCGATTAATGCTTTCCT
+ATCTTGAGTTATTCCCTGTGATCCATCTATGAGATCGCTTGCACCGGAAGAAGTCTTTCA
+GATCCTCCAAACTAAAGCCGTCGAAACAGAACTCAACCGAAGCCCTTTCCCGTAACAACC
+TAACCTACAAGAAGGACCAAAGGGGGGGTTCGTCTATCCCGACCGCCGTAATTCAGAT
+>ds2020-328_232
+GGTCGGGATAGACGTTTTTGGGCCGGCCTTAACAGATGACTTACATTGTAGAGAAAGGTT
+TATCTAACTAGTGTGGGAGTTTGGCTGACCACCCTGCTTTCTGACGCTTTCTCGACGGTA
+GGCACCCAACGTCGCCAAACAAATTAGCCTCTCCTTCTTCCTCAATAGCTGCCTTAGTTT
+AGTCTTTGGTTGGTGTGCGACTATGAGCTTCTGGGCCTGTACGATTTCCTGTCCGAAAAG
+GCAATCCTCTACAGGAAGGGCCAATGGCTACGTCCCGCCGGTTCGTCTATCCCGACC
+>ds2020-328_233
+GGTCGGGATAGACGCTGTTTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGC
+CGGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAA
+GACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCT
+GCCGAATCAACTAGCCCCGAAAATGGATGGCGCTGAAGCGCGCAACCTATACTCGGCCGT
+CGGAGCAATTGCCTGGCTCCGATGAGTAGGAAGACAAAACAGTAGTGGCGGCCGTT
+>ds2020-328_234
+CGGTCGGGATAGACGGGTCGGCATACTTGTAGACTAGTTTTCTATGGGGGTACCCGGAAT
+CTATAGTGGCATGTGATATATGTGAAATATGGCATCACAGTCGCTGAAGTGGCATTGAGG
+ATGCGGAAGCTCTGCCACCTGTTTGTTCACACAGGGCGATTTCGGGGGCCTTTGCTTCGA
+AAGGGGCGTAGCGGAAAGAAGTAGCGGAATCAGGCGACTTGCCACACACCAGGAAGAATT
+CCTTCTTAGGCGTATCTAACTCTTTTGACAAATGCCCAGAGGACGTCTATCCGGCC
+>ds2020-328_235
+GGTCGGGATAGACGTAAGAGGGGGGTGTATCCGTATTTGGCGGAGTAGGTGAGCGTACTC
+GTGAAGGAAATGATCTTTACTTGGAAATGAAAGAATCTGGAGTAATTAATGAACAAAATA
+TTGCAGAATCAAAAGTGGCTCTAGTCTACGGTCAGATGAATGAACCGCGAGGAGCTCGTA
+TGAGAGTTGGTTTAACCGCCCTAACTATGGCGGAATATTTCCGAGATGTTAATGAACAAG
+ACGTACTTCTATTTATCGACCATATTATCCTTTTTATGCAAGCAGCGTTTGTTCT
+>ds2020-328_236
+GGTCGGGATAGACGTATCTTATTCCTTATGTTTAAGTACCAGCATGTCCAGCCAGAAGGA
+TAATGCATCACTCCTCTCATCTGCATACCTTTTCTTGTGTTTCATCCTTCCGTCTTTGAC
+ATTCCATCTGGTTATCATCTCTTTGGCTAGTCTCTTACTAACATTGTTCTTTGTGGCTAG
+CGCTAAAGTCTCTATGTCTTGCACCATCCTGCAATACACCACCTCATTTTAGTCCTGTCC
+TGCTCTGACTTAGCAATTTCCCCTCGCTCAGCATCATTAGCCGTCTATCCCGACC
+>ds2020-328_237
+GGTCGGGATAGACGTAATGCGCCACTTGCGTCTACCCGACCATGAGACGTCGGCGTCTAT
+CCCGACCAGGGGGATGGACCGTCTATCCCGACCGCCGTAATTCCCGGACAGAGGCCGTGG
+ACCTAGTCGTTCTGCCCCTGCCGTGGACCTCGTGAGTAGCGGGGTGATTACTAGGTCCTC
+GGCTCTCTGTCCGGCGGACAGAGAGCCGTGGACCTAGTAGTATTGTGAGTATAACTAGGT
+GAATTACGGCGGTCGGGATAGACGTAATTAGGGGGTTCGGTCGTCTATCCCGACC
+>ds2020-328_238
+GCCGTGGACCTAGTTATTTAGAGGGTTTCTGACTAGGTCCACGGCAGACCCAGGAGGACT
+AGGTCCACGGCTCTCTGTGAATTCGGCGGTCGGGATAGACGGCTTGGATTGCTGCAAGCT
+CTGACGAACATGTATTTTTAATCTCCAACTGCGTGATGTCTATTTCCATTGATTCCCCTG
+TGTTATTGAACATTTGCCCCTGCAACATGCGCTTATGCATTTCTCCATCTGGCTGACTTG
+CCATGTACTCCACCACGGATTTGAATTGTAGTCCTGACATTTTGTTTATTTTCG
+>ds2020-328_239
+GCCGTTGACCTAGTCTTTCGATGGCGCTTAGGGGTCGTTTTGGTATAAGAGGACATAATG
+AGATCACGGTTTTAGTAAATGATGCAGAGAAGGGTAGTGATATTGACCCACAAGAAGCGC
+AACAAACTCTTGAAATAGCGGAAGCTAACTTGAGGAAAGCTGAAGGCAAGAGACAAACAA
+TTGAGGCAAATTTAGCTCTCAGACGAGCTAGGACACGAGTAGAGGCTATCAATGTGATGT
+CGTAACTAGTCTAGTTGGTCCGTCCGAACCGGGGCGTGACGTCTATCCCGACC
+>ds2020-328_240
+GGTCGGGATAGACGTTCAATGGCGATGTGGTGGTGGAGGACAAGGAGGTGGTGGTTTAGG
+ATAGTCATGGTGATGTGGGGGTGTAGGAGAAGGAGGTGGAGGTTTAGGATAGTCATGATG
+GTGCGGTGGTGGTGGTGACGCAGTTGGTGGCTTTGGATAGTCATGGTGGTGTGGGGGTGG
+AGGTGGTGGAGAAGGTGAGGGAAGTGGTGGCTTTGGATAGTCATGGTGGTGGTGTGGTGG
+TGACGGAGTTGGTGGCTTCGGATAATCATGGTGGTGGTGCGTCTATCCCGACC
+>ds2020-328_241
+GGTCGGGTAGACGGCGGAGTGTACTTGATACCTTTCGAATTCACGGGGTAGATTTTGTCG
+GCATATTCGTCTGGCTCGGGCAAAGGAATGGTAGGAAATTCTTTCGGCTGCGAAATTAAA
+GTGGCGTCAGAAGTATATGACAAAGGGAGTTTCTCACGACGTCTGTACCTGTAGAGGTAC
+TGGTCCCAGACCTGATAGCCGGTTGATGACATGTCTGTCGTCCAGCACATCACCGAATCG
+AATTCTGGATGCTCAACTCGGGCAGTGTAACAAACATCATCAGCGAACCGGCC
+>ds2020-328_242
+GGTCGGGATAGACGGGGCACAATTCTAAGAGTACATAGAACAACATACTTCAATTTGGAA
+ACGATCCTACGGTCGGAACCTATCAAACCCGGATAACGCATAATATGCGATAATCCGTTC
+GATAGTCAAACGACCTCCGAATCGAGATCCGCGAAATCCTACACGCTCGTGACAACCTAA
+GGATCTCATTGGGACAAAATGCAGCTTCACCACTTCTGCCCTTGCGCGTGGGTTGCTTGA
+GTAAATTCCGGCGACCGTAAAAACTTCAAATCGCCACCTCGTCTATCCCGACC
+>ds2020-328_243
+AACGGCCGCCACTATTTGTCATTTTTATTTCATGCTACCGTAACCTCACAAAACTTAGAG
+CCTCCGTGTGGAGCATAAGCGATATATGACATACGGTAGCATGAAATAAAAATACAAAAA
+CAGTATAAAAATATAAAATCCTACCCGAACCGGACACTATAAGGTAGATCTTATGATAGA
+TTAGTTGGCAGGAGCTGTGGTTAAAACCTGGAAGCCGTAATTCTGATCTTAGGAGAAACC
+GGACGGTGATAAGGCTAACTAACTAAACAATGCGGAATTAGTGGCGGCCGTT
+>ds2020-328_244
+GGTCGCAATAGACGCCGGCGGTAGATTGGAGGATTAGAAACATGACTATTACTCTCCGAT
+TGGCTGTTTTTGCATTAATTGCTACTTCATTAATCTTATTGATTAGTGTACCTGTTGTAT
+TTGCTTCTCCTGAGGGTTGGTCGGGTAACAAAAATGTTGTATTTTCCGGTACATCATTAT
+GGATTGGATTAGTCTTTCTGGTGGGTATCCTTAATTCTCTCATCTCTTGAACCTATTCGT
+TCTAGATCCAAAAATGACATTACCCCTCCCTCCGAATTCCTTCAGGTGGTGA
+>ds2020-328_245
+GGCGGGATAGACGCGCGCCTTTTCTACTTGATTATCTTTTGGGTTAATATCGCAATAATG
+GGACTTGTTGTTACTGCCTTCAAGAGACAGACTTAAACCCCCCTTTACCATTTCAAAGAG
+GGTGGATGCCGATGCCAAGAGAGAGATTCCGTAGGGGAGAGATTCGATTACAATTTCTTT
+TTTTTTACTAGCATTTTTTTCCGTTCGCCCTACTACGAAAGTTACTAACCGCAATTTATT
+ACTTGGCAGCTTCTATGAGTTGAAGAAAAAGACAGCCCCGTCTATCCCGACC
+>ds2020-328_246
+AACGGCCGCCACTATTTGCTGTCCTTCCACCTTCCTTAACAATCTTTTCGGAGACACAGG
+GTCCTCGAAGTCTATCGAATCGTAGAGGCCCGAGGTGTGCCTGGTCATTTGAGAAAGAAT
+TTCCTTCCGCATTCCCCAAGTCCTCTGACTGACGTCGTAGTAGACTGCCGATCTGTTGCC
+CGGCATAGGCGATACGTACGCCTTAATTAAATTACCGTAAGCACAAACATTGATATCGCC
+TTCAAAAACGCCATTAACCATTCCCATAAACAAATGAGTACTATCCCGACC
+>ds2020-328_247
+GGTCGGGATAGACGGACGAAAGTGGTTAGTTAAGTAAGGTTTTCGGAGTATGAAGGTTAG
+TTAAGGCCTTCACCATATGTATTTCCCAAAGGGAAAGGGGAAGACCCTAATTCTGCAGTC
+AATTATATGGCAAAGGTAGCTCTTTGCTTTATTTCAGCAACCTCGATTGAAGCTGTAGGT
+TTAGGGCGAGCTATCAGAGCAGCAAGTGGTAGGCTGTAAGCCGAATGAGAGAGCTATCCA
+GTTTTCAGGTAAGAAGAAGGGGAGTAAGCAGCCCATACGTCTATCCCGACC
+>ds2020-328_248
+AACGGCCGCCACTAGTTTCGGTCCCTAAATATTGCTAAGTGGGAAACGAAGTGGGAAGGC
+TAAAACAGTCAGGAGGTTGGCTTAGAAGCAGCCACCCTTTAAAGAAAGCGTAATAGCTCA
+CTGATCGAGTCGTCCTGCGCGGAAGATGTAACGAGGCTGGTTAGTGGCGGCCGTTGCTGT
+GAATTACGGCGGTCGGGATAGACGATTACGAGGGCTGGTCGGGATAGACGATAATGACCG
+CTGGGAAGACGCATGATCAGCAAGTTGCGTCTATCCCGACCGCCGAATTCA
+>ds2020-328_249
+GGTCGGGATAGACGATCGCTCACGCTTTTTTAATGATCTTTTTTATGGTTATGCCGGCGA
+TGATAGGTGGATCTGGTAATTGGTCTGTTCCGATTCTAATAGGTGCACCTGACATGGCAT
+TTCCACGATTAAATAATATTTCATTCTGGTTGTTGCCACCAAGTCTCTTGCTCCTATTAA
+GCTCAGCCTTAGTAGAAGTGGGTAGCGGCACTGGGTGGACGGTCTATCCGCCCTTAAGTG
+GTATTACTAGCCAGTCTGGGGGAGCGGTGGCTTTAGCAATTTATAGGCTT
+>ds2020-328_250
+GGTCGGGATAGACGCATTCGCCATCTAGAGATATCTTTCCAAATGGTATAAATTTCCTTC
+TTTGCTCAGTGAGGCCACCCTGAATGTAAGTGACCTGTTCGAGGTACTGGCTTGTGGGTA
+TCGCCCTCCCTATCATTGCTCCATACATAGCATCGGCTCTATCAGATGCCTTGAGAACCA
+TGTCTGTATCCAGATATTGACGTTCTAAAATAGTTTGTAAATTGGGCGCGTTATGTATTA
+ATAAATATTATCCCCAGTACCAACAAGTATTCGCCCCCGTCTATCCGCCC
+>ds2020-328_251
+GGTCGGGATAGACGCAGACCCCCCGTTATGAGTGCTAACCACCGGGTCATCTCTTGTAGA
+AATTTCAGTATACACAAAGTTGAGTACCGTGTTCATAAATGTAGTCAGTCTCCAGCCTGA
+TAATAGAGTTACCGCACAGCGGTAAGTAGATCCGTCTCCTCTTCTAACTTCTGTCTTATC
+CAAGGCATCAATGGTCCAAGCTATACTAGCTAGCTGTTCCGGTTCAAGATATGTCTTAAA
+TACCGCACCGTACGCCTGCAAAACTGCCTGTTACCGTCTATCCCGACC
+>ds2020-328_252
+GGTCGGGATAGACGCCCGTTTGCCCTTAGTTGTCTCGAAGTTAGCTGCTTGGCATGAGTA
+GCTTGGGCAGTCTTAGTGAGTAGCTTGGCTTGCTCATGCGGGGCTTTGGAAAGAAAGTAA
+CCAGGGAATTCATATACTAATCTTCTAATCAGAAGTTTTTTTGTTTAAAAGTAGATCGGG
+AGTTCAAGCAGATGTTAAATTAAGGTGAGGTTTACTATTCTAGTCTACAGGCCATTTAGC
+TAAAAAAAATCCTGAGTATCGACTGTCATGATCCGTCTATCCCGACC
+>ds2020-328_253
+GGTCGGGATAGACGCCCTTGTCGTTGTTGGTTTAGGCTATTTCTAGTCTGAAATCATTAT
+TTGCTAATAAGAAGAAATGCAAGGACTTCTTATTTCCTGGGTTAAGAGATAAAAACTCAG
+ATTTGCCCATGAGTATGGGTGCCCCTTTAAATATACGGGATGTTACCTCTAAAAGAATTA
+GAGGTAAAAAGAAGATGAAAGAGAATTCTCATGTTCATATAGATGGTAAGGTCGGTGGAT
+GACCATACTATCTATTATTGTATACCTCCATATCGTCTACCCCGACC
+>ds2020-328_254
+GGTCGGGATAGACGGCAGCGACACTTGATCGATTTCAGACGCATGAGTCGCCACGTCACG
+GGACTAGGTTGAGCGGGGTCGTGGTCCGACAACGACATCTGTTTGTCGTATTATCGACAA
+TAATGGAAGGACAAAATCGAGGTGTTTGATGTCCAAGATGAATGTATCCTTGGTTCCTCT
+CAAGAGAAACCTTTTCCAAGGGTACATGGGGAAGAAGTTAGGAGTTGAAATCGGCGGTAT
+CGCTAAGGCAAGGAATGGTCATGGGGAGTCCTCGTCTATCCCGACC
+>ds2020-328_255
+GGTCGGGATAGACAAATATGTTCCCTGGTCGGGATAGACGTATCATGAACCTGGTCGGGA
+TAGACGCACGCTAGGTCTGTCGGTGTCTGAGCCGTTACTACCATGGGAAGTGTAGCCAAT
+GCCATCATAGTGGCAGATAGTTTTTTGATGTTCATAGAAATGGTTATTAATAGATTTGGG
+TAGATATACTATTTTTGTTCGGGAAGAAGGTAGGGCTGTGTTTTCTCTGTCACATTTCCT
+TGCAAGGATACCACAGCGGTACCCACGCAGCCCGTCTATCCCGACC
+>ds2020-328_256
+GAGAGGGAAGAGTTTTCAAGGAACCAGCTCCTGGGGACTTCTATTAAGAACGGCTTTTGG
+TCTTAGTATGTGGTACAGCATATAGAGTCGTGAGACGCTCTACTTCCTCTTGTTCAGTTA
+TCGATTCGCTGGCTGTTTCCGGGGGGCCCAGATGCTTTGCGAGACTGAAAGCTTCATTTT
+GTGTTCGGTTGCGTTATCTACCGCAAAGAGGGACTCCCCCTTTCTATTAGAACAGTGTTA
+GTTCGCTATTACTGCCGGTCAGGCCCTGGGTACGTCTATCCCGACC
+>ds2020-328_257
+TCCTGTTTGTCAATGCTCTCCCACCTCCTTTATCACTTAGTGCCAATTTTGGGGCCTTAG
+CTGGTGGTCTGGGCTGTTTCCCTCTTGACAATGGAGCTTATCCCCCACTGTCTCACTGGT
+TGTGTGTGCATCTGGTATTCTGAGTTTGTCTCGATTTGGTACCGCGTTAGCAGCCCGCAC
+CGAAACAGTGCTTTACCCCCAGACTATATTCACAACCGCTGGTCGGGATAGACGATGTTA
+GGTCCTGGTCGGATAGACGAATATGAGGACCCCGTCTATCCCGACC
+>ds2020-328_258
+GGTCGGGATAGACGAAACTAGAATTCTAACCTGGTGCCGTTAACCGGCATCGGAACAGTT
+TCAGGTGGGCAGTTTGACTGGGGCGGTCGCCTCCTAAAAGGTAACGGAGGCGCGCAAAGG
+TTCCCTCAGCACGGTTGGAAATCGTGCAAAGAGTGTAAAAGCATTAAGGGAGCTTGACTG
+CAAGAGCAACAACTCGAGCAGGGACGAAAGTCGGCTTTAGTGATCCGACGGCACTGCGTG
+GAAGGGCCGTCGCTCAACGGATAAAAGTTACTCTAGGGATCGTCTT
+>ds2020-328_259
+CTTTTTTTTTCGGTATAGGAGAGATGGAATGTCTATACCTAGTGGGAGTCTAATTTTTTT
+CACGTGGGGTGTGGGGTTTAGTTCTTTTTATTTATTTGTTGGTCAGCCTAGTTCTAGTGG
+GATTAGTTAATAATATTTTAAAAAAGATAGCCTAGTCCTAATGGGAATAGTTAATAATAC
+TTATTTGGATGAAGGTTTGTTTGAAATTGAAAGTAATTATGATAAAATTGGTTGCCATTT
+GCAGCCATTGATTGACGGCAAAGAACCCATACGTCTACCCCGACC
+>ds2020-328_260
+GGTCGGGATAGACGGGGCTTAGTGGTCGAGATATGCTTCCCCGTATCCAAGAGGGGTGGG
+CTGCCCGATCTCCCTATTCAAGAGAGGTGGGCGAACTGCCTATATAGCTGTCATTGGTTC
+CCCACTCCAAGGAAGGAGCCTTGAAAGGTTGAGAGTCAACCCGAAGGCAAATACAGACAC
+AGATCTCTCAATAGATCAAGGGATTGGTTTTTTCAAAAACTTAATAACCGATGCTTTCCG
+TACAATGTTTCTTCCAGTTAGGGCTTAGAATCGTCTATCCCGACC
+>ds2020-328_261
+GGTCGGGATAGGCGCCAGCCCAGGCGGTGTAAGCTCATCGGCAATCTCACGAAGAACACC
+GTCCGCTAACTGCAATCCAATCGCAGTGAGTGCCCGATTCAAGACCTCATCCTTTTCCAT
+CGTTGGAACACATTGTTGGCCATGCTTAGATACCCTTTAGTGCCTTTTGAGCAGCCCCTG
+TTGCACTAACAAGGCTCTCATCTTCAACACCAAAGTCTGGAATTTTTCTCCCGTCAAAAT
+AATTTCATATTTTCTCAACACGTCCCTGCTTCGTCTATCCCGACC
+>ds2020-328_262
+GGTCGGGATAGACGCAAACACCAACTACCCCATCAACACCGCCCGCAGGAAACTCTCAGC
+AACAGTCAGCTTACACCCCTCTACCCATTACTCCTAGCGAAGCTGTACAAGATGCAGGAG
+GGGTATTACCATCTTGTACACCCACTGGCGCACGTGGAGCACTCACAAATCTAGACGCCA
+TCTCTCTAGAAATGGAGGAGTGGATACCTGAAGAGATGGACGCTAAGACCCGAAGGGGTA
+TACTATTGAGTGCCGAGCATAGGGAGGTGACGTCTATCCCGACC
+>ds2020-328_263
+GGTCGGGATAGACGGAGCATGCTGTTGCTCTTGCATGGGCGGATAGCGTTGGGAAGGAAG
+AAACCGTAATCCGCACCTTGAACAAAAGGGGAACGATGAAGTTAGCCTAGCTTCGGTCTC
+TCTTCCCTTTCGTCTGCTATTCCTACGCCTTCCTGCCTTTACTTTTATGCTTGCCTGGAA
+GGAATGGGCAGACAGCAAGAAAGAAGGATTGATAATCAAAGAATAGAAGAAAGGCGCATC
+TCTAGCCAAAGACCGACATACCAGCATTTCGTCTATCCCGACC
+>ds2020-328_264
+GGTCGGGATAGACGTGTTTCAATCTTACAATGATTTTGTGCTCCGCCTCATTTCGGCCCC
+TTACTAACAATATGATCGGATGTCCATAATTAGATCTGCCAAATAAGATATGAGACTTTG
+ACAATTCTTTACCCCAATCTGGAGGTGTAACGTTAAGATACTCTTCATCCCAGTGTTCAC
+ATAATTTAAGATAACTAGGTTCAAGCTCCCTTTCTCCCCCCTTGAACTCGAGAGCCAATC
+TTGATAGCAAGAGCCACAGCCCCCGTCGTCGTCTATCCCGACC
+>ds2020-328_265
+GGTCGGGATAGACGAGCCTCTGCCCTGCTGTCCCATCTATTTGCAAGACCTGCCTTATAG
+TCGCCGGAGGGAATCCCGTAATCTCACTCAATAAATCGAATGTTGAGTACCCTGCTGGCA
+GCTTAATTGTTGACAGTAGTATATGGTAGGCTTTTATATGGTTCCTGATCCTCCAATCTG
+ATTTCGTATCATCTATATCAAGTGCCACCCTGTCGTACCCCCCTACCTGCCCTGAACTCA
+TCGCGTCCTCTTGTTCCAACACCCATGGTCGTCTATCCCGACC
+>ds2020-328_266
+GGTCGGGATAGACGATCAGACACGATACTCGCCTGGGCCCTCGTCGAGACCAACTCACTT
+CTCTCTCCTTAACGTCTGGTACCATTGCCCCGCCACTCTGCCTGTCTTCTTGTGGCCGGG
+TCGGGTCATTCTTCACTCCTGTTACAAGGGAGACCCCTCTTCGCATACCGACCCTCCAGT
+TAGTTCCACTTCTGGGGAGAAGCTGAGAACTCAGGGCATAAGGGCCTGCGGTGATTATTA
+ACATGCTTTTCCAGCCCATATTACTAGGTCCACGGCCCCACAT
+>ds2020-328_267
+TCTTCCGATCTGAATTACGGCGGTCGGGATAGACGTGATTTGTTCTTCCTCTTCCTGAGT
+TCACTCCTCTCTCCTCTCTCCTCTTTCTTTTTTTATTCTTCTTTTTTCTTTCCTTTCCTT
+CTCTCCTCTCTCCCCTCTCCCTTTCCTTCTCTCTCTTTTTTCCTTCTTTCTCTCCTCCAG
+TTTTCTTCTCTCTTGTCATCTGGCGATTTTTTTTTCCTTCTTCTCTCTTCTGGCTAGTTG
+GCTCTTTTTTTTCCTTTATCTCCTGCAACACTAGGTCCACGGC
+>ds2020-328_268
+GAATTACGGCGGTCGGGATAGACGCGGGTGAGAACATAGACTCAAGGAAATCGACGAAGG
+CAACCCTACGGAAACAAAGGGCAAAGGGTGAACCAAAAGTTAAGCCCGTGTCTGAACTGA
+CTACCCCAGCTACTGAAGTACCAGATGAGAAACCAGCAGTTGAACAGACACAACAAGTCA
+GTGACGTAACCGAGCCGAAGGAATTGATAAGGGAGAAAACAGAGCAGAAGGTTGACGTCA
+AGATTGAAGAACCGACAAGTAGCCACACACGTCTAGCCCGACC
+>ds2020-328_269
+GGTCGGGTTAGAAGCAAAAAGGACGTGGCCTACTCATCACCTTGCTCTTATGAAAGAGGA
+CATTCGTGAACAACCCCTAGATTCGGATTAGTGAAAATCGAAAACGCTAGATTAACGAAC
+AGCGGTTATTAGCCTAAGAGCGCTTACTGTAAGACCGTTTCACAGCAGCGGATGTGGTTA
+TTCCTCGAACAGCGCTTATTGCAAAGAGCCAAAGAGCCTTTTCTTCCTAAGGAGATATTC
+ATTAAACCATTAACAGTCGAACCGGCCGGAGAGAGATTGCTTC
+>ds2020-328_270
+AACCGATGAAGCAGGATTTTCGCAGTGGCGATTTGACCCATGCCCCCGGGCAAACAAGGC
+CAGAAGCTCGTGCCCAGAATGTAGAGGATCAGGACAATCAACCGACTGCGGAAGATGTAG
+GGTAGAGAACGTGAAGCCGAACCTGCCGGGAAGCAGAGACTGGATTAACTACATGACGCC
+TAAAGGAAAATCACTCAAATGGAACGGTATACAACTTATGACTGTGTCTGACACCAAGGA
+CAGAAGAGCTAATAACAGAAGACGGCTACGTCTATCCCGACC
+>ds2020-328_271
+AACGGCCGCCACTATATGATTTAGCTTTTTCCTACCCGGTTATTTTACCAGACATAGCGG
+GTTAGTATCCGTAAGCTATAACTCCCACCCTTAGCTTGTTTGGTTTGGACCCTTACGTTC
+GGTACACTCGTTAGGAAGCGAAGGGCTATAAAAAGGACTGCTTTCCAACTCACTAGCTTT
+AAAGTAAGGCTCTCCTAATGGCTCTGATCCACCTCCTCCCTCGCCCGGAACTACCACTCA
+AACTAGATCGCTGACAGAAGGAAGGTGCGTCTATCCCGACC
+>ds2020-328_272
+GGTCGGGATAGACGGGGCCCAACCGGAGATTGCTCGCGGCTCAATATGAATTGAGACGAA
+AGCTTTATAAAGCCTTTTGTAAAGATCCCGATTTCCTAGTGATATGCGGGACAAACATCG
+TTATAAGTTGTCCAAGTTGCCAAGAAAGAGTTCCTTTGCACGAGTAAGAAACCGATGTAT
+TTCCACGGGCCGCCCTCGTTCCGTATATGAGTTCTTTCGAATTTCTCGTATCGTTTTTCG
+TGGATTAGCATTTCGATGGGCTGTTAACGTCTATCCCGACC
+>ds2020-328_273
+GGTCGGGAGAGACGGCACCCACCCACTCTTTCCCCTTCCCCCTCTCACTCATATGCCCGA
+TACACATATGCCATAACTGGGTAGAAGCAGCATCTGAATCTACTGTAGATGACACATTAG
+CACTACCAAGAATAGTGCTTCCCTGAAGATGGTAGAGACCGTTAATCAACTTCCCTTTTA
+TCACAACCAGGGCACCCCGAAAAACCTTCAAAACTCCACCTCCACCCGACCCCATAGTAT
+CCGTCTATCCCGACCAAGGACTCTCTCCGTCTATCCCACC
+>ds2020-328_274
+GGTCGGGATAGACGAAAGCTTGGTGTTGCATTGCAATTTCAAATTTGATTTTATGATTTT
+ATTGATTTTGGTTGTTTCTTACAAGCTGTTGGCATGAAAGTTTTGGTTTTTAAGTTGTTG
+ATTTGGTTGGTTTAGGTCTCTCCTTACTAGTTGTTGTTATGTAGTTGGTTTTTAGTTGTT
+TTAGGATGTTGCTTACTAGGTGGTGTAGTTGGTGCAGTTGTGCCTCCTCCAATTAGGAAG
+AGACCAGCTTTAAGACTGCCAATGAACGTCTATCCCGACC
+>ds2020-328_275
+GGTCGGGATAGACGTGTAGAAATGGTTATTTACAGATATACCAGCTCTAATATTTCCAGA
+TATATTCGCCCCCACCGTAGCCATTATCTTAGGTGTTCTTATCGTAACAAAATCCAGTCT
+CACATATCTTAGTAACATTCCCTTCACACATACTTCTATCCCGCACGAGGACTCATTTAA
+ATAACCTATATACATTGGTGTCATTATCTTCCCATCCCTACTCGTCGGTTCCCAAGATCT
+GCAAACCTCTATTAATAGCCTATCCCGTCTATCCCGACC
+>ds2020-328_276
+GGTCGGCATAGACGATGGTTGGGGCTAACCAGGTGTTTCATTAGAGGTCTTAACCTGCCA
+ACCAAGATTTTAGTGAGAACCTTATAAAAAGTATTACACAGGCTAATCGGTCTCAGCTGC
+ATCATAGTCAAAGGGTTCTCAACTTTAGGAACCAAAGTTATTAGAGTTCTATTGAGGACA
+GCAGGCACTTCACAGGATCGGAAAATTCCCCTAACAAGGGAATACATATCAGCAGCACCG
+ACATCCCTGCTAAAAGCGATCAGAGCGTCTATCCCGACC
+>ds2020-328_277
+GGTCGGGATAGACGCCAACCCTTCCTGTTTTCCACATCGTTATTTCCTCCATCGATATCA
+AATTTCTCTTGCCATTTATTTTTTTGGGTCTTTATTGATTTATATACTCATCATCCCGCC
+GCTCCTACCAACGCTTACTTACTTATTCAAAGGGGTTCTAAATAAAATAATCAGCCCTTT
+GAATAAGCGAGGCTTTCCCGATAGAAATAGTTGCATGCGAAAGAGATCCCAATTCCGTGT
+ATCCGGTTAAGCAAGCCCTTCCTACGTCTATCCCGACC
+>ds2020-328_278
+GGTCGGGATAGACGTAGACTGTTTCCTTTACCAGTTGTACTTACGAGGAGACGTTTGTTC
+GCTATGTTGCAGGCGACTTTTATGACCTCGCTACCATATGTGGGCGTTATAGCGATGACA
+AGTGCTATTCTTGGTCAGGAATGTCTTCCGATGTCCTCCGCCGTGTCGCCTCTTACACTC
+TTCATTCGTCGCCGTCAATGGTCCAGTGCTGGGAAATGTTCCACTATCGCCTTGACCTCC
+CACCAGCGACCACCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_279
+GGTCGGGCTATACGGCGTCTGCCCTTGAAATCTTCGAGATAAGATGAAACTTCATCTACA
+TCCCCATTCGCACACTTGATAACCAATCGTAAGTCGTCACGCTGCACGAGCTGCTTCAGT
+AAACCGAAGGTAATGACTCTTAGCATTGTGCACTGATGCTGACTTGCATCTAGCACTATG
+ACTGAGTAGAGCTGTAAAACCCTCATGTCAGACAAATCCTATTATCAGTCATATATTCGA
+CATCATCCTCACAGCCCCATGTTTCGTCTATCCCGACC
+>ds2020-328_280
+GGTCGGGATAGACGCTAGTCCGCCATGTATTCAGCCTCCGTAGTCGACAGAGAAACTGTA
+GATTGTAGAATCGACCTCCAACTCACTGGACCTCCAGCAATACTGAATACAAAACCTGTA
+GTGGACCTACGCTTGTCCAAATCACCTGCGTAATCAGAATCCACATATCCAACAACACAT
+TGACCAGTAACTTTATCCTGCTGAAACAATAAACCAACATCCACAGTACCCCAAATAAGC
+GTCTATCCCGACCAGTGGGCATTGTCGTCTATCCGACC
+>ds2020-328_281
+GGTCGGGATAGACGTCAACGGGTACTCAAAATGATTTGAAGTGTAATGCGAAAGGGATAG
+ATAAGATAGATGAATTGAATGAAAGCTCGAAGACAAAGAGAACCGGGCTTTCCCAAAGAA
+TTACTGAAGCTTTCCCACTTCCTAATAGGATCATGAAGAGGAGACATGCTCTGGTAAAAA
+AAGTTCCCTTTCTTTTCATAGGTTCTATCGTTTTGCTTTTCTATCTTATTAGTCTTCTTT
+TTTCCTGCCAAACCCGATCTCGCCGTCTATCCCGACC
+>ds2020-328_282
+AACGGCCGCCACTATTGTTTTTTCCTCATCTCATTAAGTTCTCTGATACAACACGTAAAC
+GCTCTAATTTTAATGATTATTTTATGATCCTATCTTTTCTTTTAACTTTGACTTTTTATT
+ACGACCAATTTTATTGTTTTATTGTTCGACAAAAGGTTCATTTATATACAATAATCGGAT
+TGTAGCGGGTATAGTTTAGTGGTAAAAGTGTCGTTCGTTCTATCATCCCTTAGTAGTTAA
+GGGATTATAGAGCATCACACCCACGTCTATCCCGACC
+>ds2020-328_283
+GGTCGGGATAGACGCCGTGACTCCCCCCCCTATTTTTAAAGTACCCCTCTTCCTATTTAG
+GGGGTTGAGGCGAGAAATGGCTTGATGAACCGTTCCGTTCGCCACGCACCGGCCCCATTC
+ACTTGCTTATCGTAGAGGCTGTAAGTACACAGTGCTCCACAACTATTCATAGTATAGTGG
+GGTTGAAACACGAGAGTGCCCGCCCTTTCTTTCAAGCAGGCCACTCTTTCCGGACCGCCG
+TCCGCGGTAACCCCGACCTAACGTCTATCCCGCCC
+>ds2020-328_284
+GGTCGGGATAGACGTCACATCCTCATAATCCGTCTATCCCGACCAGGCAACTCTCACGTC
+ATCCCGACCGCCGTAATTCACCCCTAACCACACCTCATCCGCTGATTTTTCAACATCAGT
+CGGTTCGGACCTCCACTTGGTGTTACCCAAGCTTCATCCTGGACATGGTTAGATCACCCG
+GGTTCGGGTCTATAAACAGTGACGAACGCCCTCTTCAGACTCGCTTTCGCTTTGGCTTCA
+GCACAACTATGCTTTAACCTGCCACTGCCAACTAA
+>ds2020-328_285
+GGTCGGGATAGACGAAGAGACGGTGTTGGCGGGATTCGTGAGCTCAATTTTCCTTTCGCA
+TCCACTATCTTTGATTCCACCGACGGATTCTTTAAACCCAGGTGGGCATACACAGTATGA
+AGAACTCGAACCATCGCTGACACATATGGCATTAGGCCCGCACATGCCGTGAACTCTGCA
+CAATTCGTACCCTGCTTGCCAACCGACGGTCAATTCTCTAGGGCTCTGATCGAAACTGTA
+AATTCTGAGATCCCCGCGCGTCGTCTATCCCGACC
+>ds2020-328_286
+TAATACACAGCAACGGCCGCCACTATAACACTTGTCTTCCTATCTTTCTGCCTATCTGTC
+TTTCCTCTTTCTGCTTTGTCTTTCTCGCTGTCGGTAGAGATTAGTATTTCCTAAGTTGTC
+TGAGGCTGAGCTTCCCTACTTCTGTACTTGGTTGCCTGTCTCTAAGCTGTACTTCCTTGC
+CTGTATCTAAGTAGGTACGTCTCGCTTCGCTCCTCATTTCCTTGCCGTCTTTCAATTCTG
+ACTATTGAGAAATATCCATGAGTCTGTCCCGACC
+>ds2020-328_287
+GGTCGGGATAGACGGTTCGGTTTCCTCTCCCGTCGATTGGGGGCATTGAGTAAAAGGGGA
+ATGGGTGATCGATGAAAGAAATCTACTCCTCAGTCTGATAGCGGTCAGGTCTTATGGCTG
+TCGGGCAATCGCTCCTAGGCCGTTGAGCATGCCGGTAGTCAATTAAGAGTTCGGAACGAC
+ACTAACACATCGGAAAGTTAGCCGTACCGGCTCTTCCCGGCTTCCTAGCTTAGTTGGTAG
+CTGACCTAACCTACGCGCAACGTCTATCCCGACC
+>ds2020-328_288
+CGTAAAGCCGGTAGGAGTAGTGAAGAACTATAGATAACTTTTGTTGGTTGTTAACCAACG
+GAAAGCATGGGAGTGGAGCTCGCCTTAGCGAGCGAAACACGCGACATAACATAAAGGAGA
+GTATGAAAGTGAAAGCGGAGATCCTGGATAGCTGCCCTGTTTATAAAGGATCTACAAGGA
+GAGATCTATATAGAATTAGGGTTCCACTTTCCCTATCTCGGAGCCAACCCTAGGGCTAGG
+GTGAGGCTGGGAGGTTTGCGAAACACTCCGCCGA
+>ds2020-328_289
+GGGCGGGATAGACGATAGATAGGTGTTGAAGGAAATAGTCTCTGCTTCTCAGGGTGCTTT
+CGTGAAAAATAGGCAGATTTTGGATGCCGTCTTAGTTGCTAACGAGGTTGTTCAGGAAGC
+CGTGAAGCGGAATAAGGCGGGTCTGGTCTTTAAGATTGATTTTGACCATGCTTATGATCA
+TGTAGAATGGGATATGGTCGATGAGGTTTTGGTTAGGAAGGGTTTCGGAGGAAGATGGAG
+GAGATGGATCAGGGACCACCGTCTATCCCGACC
+>ds2020-328_290
+GGTCGGGATAGACGATACTCTGGGGTCAGCTTCCAAAGCCAACAACGATGGCTCATACCA
+CTCCAGAGTGGGATCATACCGCGTGGTCATGTAAACATCGAAGCAAACACCGGGAATGTA
+ATCGGAACCGTATAACATAGACTTAGCAGCCTCCACACCGCGAACGAAAACCTTACGAGT
+AGCATTAACAACGTAATCGGTCATGAACCAAGCCAACCTCTCAATGCTGCATGACTAGGT
+CCACGGCACAGCGAAAGAAACTAGGTCCACGGC
+>ds2020-328_291
+GGTCGGATAGACGCTGCTAACCTCTGGTCGGGATAGACGATACGAAGGGGTGCGGTCCGT
+CTATCCTCGGACAGAGAGCCGTGGACCTAGTGTTGCCGTTGTTTGTGTTGTGGGAGTGTT
+TGGAGCTTCTGGACTTTGGAGAACGAAGAAGGCCAATTTCCCCAAACGAAAAACTGAAAC
+AGAGAGAGAGCCATGGAATCCAACGAATATGAACGTCTGAAACGTAATTGATTTTAGAGG
+TAAAGAGAGGGCACCTAGGACTAGGTCCACGGC
+>ds2020-328_292
+GAGAAACTTATGAGGAATTTCTTATGGGAAGGTTTGGATGGAAAAAAGAACCACGCTGTG
+TGGTGGGAGGTTGTAGGCAAAGGAAAACTTTTCGGAGGGTTGGGAGTAGGTTCGCTGAGG
+ACAAGGTGTGCGGCTCTACGAGCCAAATGGCTATGGCGCTTTCCGATCGAGCCCCACGCT
+CTATGGCATAAAGTGATTAGAAGCATCTATGGATTGGATACAAATGGGTGGGATGCTAAT
+CCTGTAAGTCGAGAACCGCGTCGATCCCGACC
+>ds2020-328_293
+GGTCGGGATAGACGCCTCGCAGGAATTCAGCTATAGCTCCGAATGCACATTTAGAGGGTT
+GTGTCCGTATACAAAGCCTCTGTCCTCTCTGTAGTGTGAAGCGGGTTATCTCAAGTGATG
+TCGTTCCCAGAAGTACATCGTCACCGTTGTGTAGTGAAGAGCCAACCTCTTTCATCGGAC
+CTAACATGAAGTCAGTGTAGACGGCATTCAGGACGGAGTTAAGGAACGTAGTAAGTCGGT
+AACCTGACAGCAGAATCCCGTCTATCCCGACC
+>ds2020-328_294
+GGTCGGGATAGACGGGTAATCTCCCTCTTGTTGCTTAGGCAACTTAAACCCTCAACATAG
+TGAGGTGTGGGGCGAAAGGGGCCACCATTCTCTTTCTTTCTTCAATCGTTCCGATCAGCA
+CAAGTGGGTTGGTTCGTTTCGTCCTTCTATCTACGCAATTCTCTGTCTTCGTTCGTGATC
+ATGTTGGGCGAAAGGTAGTTGTAGAGGAGCGGCTGTGAAACGGTGATTCCCCCTTTCCAT
+TGAAGTAGGGGGGTCCCGCGTCTATCCCGACC
+>ds2020-328_295
+CGGTCGGGATAGACGGCGGAGGAAACGAGGAAGTTGCTGAGGGTGGCCCAGTTGGAGGCT
+GTGAAATCGAAGCTTCGAGAAGTCCAGAAAAGCTGGGTATCGTATCCGGAGTTTGTTCGG
+ATATGCAAGGAGGGTTGTTCGGATCCGGATCTGGGTCTCGGGTTCGCCAAATCGTTAGAC
+GAAAACGGGTCCGTTATCGTGTTGGGAAACGCCGTTTGCTTGAGGCCTGAGCAGGTAGCT
+AAAGCCATCCAGGTTCATCGTCTATCCCGACC
+>ds2020-328_296
+GGTCGGGATAGACGGTTGGTACCTATCTGCCGTGGGCGTTGGAAGTTTGAAGGGGGCTGC
+TCCTAGTACGAGAGGACCGGAGTGGACGAACCTCTGGCGTACCGGTTGTCACGCCAGTGG
+CATTGCCGGGTAGCTATGTTCGGAAGGGATAACCGCTGAAAGCATCTAAGCGGGAAACTC
+GCCTTAAGATGAGACTTCCCAGAGACTAGATCTCTTTAAAGGGTCGTTCGAGACCAGGAC
+GTTGATAGGCTGGGTGAACGTCTATCCCGACC
+>ds2020-328_297
+GAGAGCCGTGGACCTAGTTTCGGTCGTCCTGCCGTGGACCTAGTTAAGTTGCGCCTGCCG
+TGGACCTACTCGGTTCATGACTAGGTCCACGGCTCTCTGTCCGTATTACGGCGGTCGGGA
+TAGACGAGATGGGTGTGTATCCCGACCAGAGCAATTATACGTCTATCCCGACCAGGGGTA
+TGCTCCGTCTATCCCGACCAGGATTAAGATGCGTCTATCCCGACCAGGGAATTCGTACGT
+CTATCCCGACCGCCGTAATTCAACGTCACAGC
+>ds2020-328_298
+GGTCGGGATAGACGCGATACCTCCCTTACCTTACTTTTAGTGCTTTTAGTCTCGCCAATG
+CCTTCAGTCGAGTTAAACTTTCCAGCTACTCCGTACTCTTCTCTTACAGATGAAGTTAGA
+GATTTCGCTTTACCAAACCTTCTTCCAGAAGTCAAAGATTTTACAACCCTAGTTAGATTG
+TTATATTGGAATACAATATACTTAGCTAGCTGTGTTTTAGTCCCTCCTAAACCCTTCACT
+CCTCTAAACTTACTCCTCGTCTATCCCGACC
+>ds2020-328_299
+GGTCGGGATAGACGGGGTACAAGAGTTGAGGGACTGCGGTCTTTGGCATCGCGAGCTTTT
+CTACCTTGAACAGGTTGATGAGCCCGATTTGCCCTTTTGGTCTTTTGCCGAGATCAAGAG
+CAATAATCTTCCAACTGGTTGGACTCGGGTGTCACCTCGGTGGTATCCCGATGAGGTAGT
+CCGCGGATGGCAGTTTAGACTGTCACACGAGACGATCAAGCTTGCTTGGTCTCAACCAGT
+TATTAAGGATTCTGCTACGTCTATCCCGACC
+>ds2020-328_300
+GGTCGGGATAGACGACGAATTTCTATTCTTATGGACTGAATGTCTTTCATAAGGAATCGG
+AGGAATATTCGACGATTTTTTCCAGGAAATCCCCAACGAAAAATACACACTACGCCCTCT
+TTTATATCGAATCGATCATAACCACTACCTACATTCCACGAAATTGTGCACCACAAATAA
+GAGCTAATAAAAAGACCTGCGATCCCATGAAAACACATCACGATCCCTTGTGGGAAAAAA
+AATTATTTGCCGAGAAGGAAATAAAGATATA
+>ds2020-328_301
+GGTCGGGATAGACGGGAAATGGTGATGATGGAACAGAGAAGAAAAATGATGAGGAAAAGG
+TTGATGAGATTAAAAAAGAAGGGAAGAAGAAGAAAGATGTGGAGGAGAAAAAGAAGAAAC
+ACAAGGGTGATGATGATGAGAAGGAGAAGAAAAAGGATGAGGAAAAAGACAATGAAAGCA
+AAAAAGAAGGGAAGAAGAAGAAAGACAAAGATGATAAAAAGAAGAAACACAAGGGTGAAG
+ATGATAGGAACTTAGGACGTCTATCCCGACC
+>ds2020-328_302
+GGTCGGGATAGACGGGGGGCATGCGTCTATGGCTCATAGGGAAACTTCGGTTAATAATTT
+ACTTACTGCAAGCCATACATTAGAAATCCAACAAGCAGTACAAGGTTTAGAAGATGCTGT
+TGCGACAGGTATGGAAAAAGCTCAGAGTAAAAGTTCAACAGCTGTAGTAGATTTAATGGA
+TATAACTAAAGTATACCAAGGTGTGTTAGCAGAACATGGTATTTTAAATTATGGGCTAGT
+TGGGGAGAGCAGCGAGGCGTCTATCCCGACC
+>ds2020-328_303
+CAGTTACCTTTCACAAATGTAGCTATCGATCGGGCTAAACATCCTCTGAGAGTACCATCT
+TTTGTACCCATAACCCTAAGGTATTCATGGTAGGTTTCGTCCACTAGTAATTTTGACTCC
+TGTCCTTTAAGCCTTGCTTTTGCAGCCACCTCGTTCCACGATATTGCACCTGAATAAGTA
+CTATGTATGCTGATAACGTCATCGCCGTGGCACAAACGCATTTCAAGCCCTGATTCGACG
+CCCATATTAGCCTGAGACGTCTATCCCGACC
+>ds2020-328_304
+GGTCGGGATAGACGCCTCATCGGTATGCTCCCAGGTACCTGTAATTGTGATCCGTTTGCC
+AGAACTAAGGGGTCTTTCTGTGGAAACCTTCACGAACAATCGTCGTTTTTTGATGGTTTT
+TCCGCTTCTCACAGCTGCTCTTTCTACACCCCCGGATATCTGGTGCCAAACCGTCGCCCG
+TTTCCTTATTTCTTCGATAATAGAGTTGTCTAGCTTTGTGGCATACATTTTACAAGTTCG
+TGAAGAAGGCAGGACGAGTGGATTGAGGGAA
+>ds2020-328_305
+GGTCGGGATAGACGACGAGTCTTCTGCCGCTGTTGCTGTAGTTTAGTCCGGGAAGAGGAA
+ATTCATTAAGTGTCACAGCTTGATAGTGAGAAACTATCTAATTCATCTATATCTTACAAT
+CGATGGACACTGCTCTATCCCTACCTGAGCTAGCTGCAAGACAAGCGAACTGCCCTTCCA
+CTTCAAGAGACAGCCTGCCTCCATTTCACTTAAATAGTAATTAATCAGCAAACGGGGCTT
+AGTCAAGAGAAAGGCTGCGTCTATCCCGACC
+>ds2020-328_306
+GGTCGGGATAGACGTTGGACTCCACTAGCGTTAATAACACGTTAAGTGGCAGGACTAAGA
+TTAAACAACGGTCGAAGTCTGAACATCATATGTAAACTGCATTATGGAAATATAATTGTG
+GAGAAATTAGGGTGTATATGAGACTATAAATACACGAAGCAATGACTAAAGTTAAATAGC
+AATGCGACATGTGTTATAACCTCAACAAACATTAGAAGAATGGTTTAGTGGCGGCCGTTG
+CTGTGGTATTACTCTTTCGTCTATCCCGACC
+>ds2020-328_307
+TGAATTACGGCGGTCGGGATAGACGAATTTGCTCCCTATAACGTCTCTCTCTCTTCATCT
+CCACATACCACTCAAACCTCCCCTTCCCATTCACCTCATTCCTCCTCTTTCCTCCCTCGA
+TCGCACTCTCCAAAATTACCAAACTCTCCTTCCCGTTCAAATGATTCCCCTCCATGCCCT
+CCACCTGCATGCTTACCTCCCTCACGTGCAGCTCCCCGCCTTCGCTCCAATTGCATGTGA
+CCACCATACCGCACTTCCGTCTATCCCGACC
+>ds2020-328_308
+GGTCGGGATAGACGATTATTGTTCCTCTGTGCATCTCTGTGATGGGTAAATCCCCATGAA
+AAAGGGGCAACTTTCGTGTAGTTTGTGATTGGATGTAACTGTTAAGATTTTTTCTCGGAT
+AAATCTTTCTCTTAATAGATCTCTTCTTGTTCCTCAATCTTCGGAGAATGCGGCGTTGTA
+TTATTGTAAGTTCTCTGTTCCGAACATTTCCTGAAAGTAGACGACAAGTTTTAAATCTTA
+ATGCAGACAAGGGCAGTAGTGGCGGCCGTT
+>ds2020-328_309
+GGTCGGTGTAGTCAACTCCTTCCTTCTGCTGGAATCCTTTGACAACTAGTCGGGCTTTGT
+ATCTCTTAGAACCATCATGTTCTTCTTTCACTCGGTACACCCATTTGTTGTGAAGTGCCT
+TCTTCCCCACGGGTAACTCAGCTAGTTCCCATGTCTGGTTGGAGATCAGAGACCTCATCT
+CGTCTTTCATGGCAAGCTCCCACTTGCTAGCATCTCCAGTCTGACAAGCTTCATCATAGC
+ATTCAGGCTCACCCTTCGTCTATCCCGACC
+>ds2020-328_310
+GGTCGGGATAGACGTCCGAAGGGTCTACATCTATTACGTCTGGCCTCATTCTGTGTTCAC
+GTTCTTTAACCCAGTCTACTTGACCGTAGCCTCGATTAACAAGTGTATTTAACTCAAACA
+TATCCGTCAGATCAAGTAAGTCCCTAGAGTGTAATGCCTTCAGTGTCACTGATACGTCCA
+TCAGTTGTTCAAGCATTGCGTAGGTGTTTTCACACCACACTTTGTCTGAGTGGGTCAACA
+ATAGAGCACCACAGACCGTCTATCCCGACC
+>ds2020-328_311
+GGTCGGGATAAACGAGCCTCACGCTTCAATGAGAGCCACTCTGTGGCCGCTGCAGACTTA
+GATGACAAGAGGTAGACCCCGAGTGATCTGTCCAGCTGGCGTAGTCGCTTCAAAGTCACA
+CGCGAGTCAAGGCAGGAAACTTCCCGTGCTATAACCACTGTCGGATGTAATGCTCTGTGG
+TCACTCACAAAGACATCCTATCGAAGGACGCCTTTATGTTTCCATTCACCCTTGGATCTG
+TAAGAGCTACCTGTCACGTCTATCCCGACC
+>ds2020-328_312
+GGTCGGGATAGACGATGTACACACCACCCACTTTCCTCTCATCACAATAATCCAACAACA
+CAACTCCAATGTAATCTGTTCTCCAAGCCTCTTAAGTGATGTCCTAACAACATGCACCTG
+CCAGCAGAAAACGAAACCTTTAGAATGCAATCTCTAATGGAAATTGGATCGATTAGTAAG
+ATACTAAGATATGTGAAGATTGACAGTTCCCAGAAGTGAGTTATTGCAATGAAAATTTGG
+ACAAACAAGAAAAACACGTCTATCCCGACC
+>ds2020-328_313
+GGTCGGGATAGACGGACATATTAGGTGGGTTGAGGCCTTTGAGTTGCCCATAGTGTTTGC
+CCTTTGCACTCTGATGGAAATCAACTGTATTGTGTTAATTGGTGCGGTTGAAACAGCATC
+AATTGCTATGAGGTCTGCGGATGGCGGAAAGTCCTTTGTTCTGTCATCCCGTCCAAAATT
+GCAGTCCAGCACGTCTGCCTTTAGCATGGCCAAGGTTGCAACATCGGCCGCGTCATTTGG
+AGGAACGGGGCAAGAACGTCTATCCCGACC
+>ds2020-328_314
+TGAATTCGGCGGTCGGGATAGACGTGGATGAGTCATATGGAGAAGGATTGGGAGCAGAGG
+AGTATGATGAAGGATTGGGATTTGACTAAGACTGTGTATTTGTGTTTTGGCACCTATGGC
+CGGAGTGCTGCTGTTTTTTGCAATATTGAATCCTTGGAATTTTCGTCTTCTGGTGTTTGG
+TCGATGAAGGTATATTCAGTTGGCACAGCGCTCAACGGTATGGGTATAGGTGCCAAAACA
+CAAATACCGCACTTTCGTCTATCCCGACC
+>ds2020-328_315
+GGTCGGGATAGACGCAACCATCCCCTTATCGATGAATACGGAAGGGCGAATCCGGAGATT
+ATCCGTACGTCGTCCAACCAACCCTATAGCTGGAAACCTTTTCTTCGGGGTCGATTGACT
+GAAGGATCTCCCTCCTCCAACTATTTCAACTCTCTGTTATTAGTATGGCGAGCCGAACTA
+AAGGCGGTTCTCTTCTCAAATGAATTGCAGTTTGACCCAATAGTGAGTAGCCTTTCTTCT
+TTCTACTAGGTCCACGGCTCTCTGTCCGA
+>ds2020-328_316
+GGTCGGGAAGACGGGGTGGACGTATGTCCGGAGGTGATAACAGGAGACTCATGTTATGTG
+GGTTGGTGAGGGTCGAGGACAGTGGTACCCGCGGACCGGTGTCGCGGTACGCGCTGACAC
+CGACAGGTACGGAAACGGACAGACTTCAGGAACAATATGCCTTATACGGCTTAAAATTTA
+TTCAAAAACAGTATTAAAAGAAGTATAAAATCGGATAAAACAATATAATCTTAATAATTG
+ACAGTGACACAGTGTCTTAAACGTGCTAA
+>ds2020-328_317
+GGGCGGGATAGACGAATCGTCTCTCGTCCCCAAAGTAGTCTGCCTTTTGTGTCATCATTT
+AAGTATGTTGCTTGTAGTGTCCAAATGAACATGTTTTCTGCTTGTAATAGAAGCTTGGTA
+GCTCCGAATACTGCTCGAATTTTGTCAGGTTCATCAGATGCGACAACATGTGAGCGTGCG
+TGTAACGTGCTCCAATAGTATGGCACTGGCTGACCATCTTTCCAGAATGGAGTTAATCCA
+TCCTTAATAAAGTGGATGAGTGATCGGTT
+>ds2020-328_318
+GGTCGGGATAGACGATTTTCCTTTCTTGGCTGGGCCAACCGATATCACCTCTGTTTTAGA
+AACTATCTTCCTCAATTTAATCGCTATTAGCGCTGAATCCAACTGTTAGCTTTTGGTTCC
+TGCTGCAATTTCAGAATATCTGACATTTTCCTGTCCAATTCAACTTGTGTGTCACGGATT
+TCCTTATTCAAAAGCAAGATGGCCTTCACATCCTCTTTTAGCTGCAGCTTCAATCTCTTT
+AACAGTATTACCCCCCGTCTATCCCGACC
+>ds2020-328_319
+GGTCGGGATAGACGATATTGCCCTCTTTTCTTCCTAGACTATACTAATTCAAAATCTCTC
+TTATTAGCATACTGTTGGGCTTTTGCGGTAACCGCGTGCATTGAGACCCTTCATACCTTA
+CGCACTGGGAGGAACACTACGCTTTCACCCAAGAGTGTAAGCCAGCGTCTCAGCCATGTT
+CAAAAGCGTACCACAGGTTATCGCTCAGCCAAGACTCAAGCACTCATATGGATGAAGGGG
+ATACATCTAGCTGACGTCTATCCCGACC
+>ds2020-328_320
+GGTCGGGATAGACGGGTAGGTCGGCTACTGAGATCAACACCACGGTTGGGAAATCGAACT
+GGAGTTGGGTGGTGGCCTGTGAGAGTCAAGTACTTCATCAATCTTGGGATGTTATCAGGT
+CGGCCCTATCATGCTGGTTAGATAAAGAAGTTGAGCTATTTCCATATCAGGTTAACAGGG
+CTTTCTTTGTTTGTGAAAGTAAAGAGGAGGCTCTGAGAGTAAGCAGCGCTGGTAAGCTCG
+TGATGGAGGTTGTTCGTCTATCCCGACC
+>ds2020-328_321
+GGGCGGGATGGACGGCCGGGGGCTCTGGCGAAGTCGGAAGAGGATTGCAGTCATCTTGGG
+GTGGGCTTACTACTTAGATGCTTTCAGCAGTTATCCGCTCCGCACTTGGCTACCCAGCGT
+TTACCGTGGGCACGATAACTGGTACACCAGAGGTGCGTCCTTCCCGGTCCTCTCGTACTA
+GGGAAAGGTCCTCTCAATGCTCTAACGCCCTACCGGAGGCTCTGGGGAAGTCGGAATAGG
+AGAGCACTGTCGTACGTCTATCCCGACC
+>ds2020-328_322
+GGTCGGGATAGACGACGGTCGGGTTATTTCAAGAATATGCAGGTTATCCAACATCTTATG
+GATGCCAAGCATTTAAACGTACGTGCCATATTGCAGATCATAATGCAGAAATTGTAAACC
+GTTGGGAAAACACAGGCATTTTAACTTTTTGGCGTACCAATACTCCTGAGTTTGGTATCA
+AAGGCATTACAGAATCATATGCTTGTGGAGCTTGTCATAATCCTTGGAATTTAAAACATA
+ACAGTGGTTGTTAACGTCTATCCCGACC
+>ds2020-328_323
+GGTCGGGATAGACGGGGGTGAATAATCTGAAGAAGGCTATTCCGAATCCGAGGGAAACTG
+TGAAGAAGAAGACTACGAAGAAGGAAACCGATGCCTAGGCCAAGGCTGGTACCTAATTTT
+AAGTTGAATCTAAAGCTGAAGTTAGGGCTGGAGCCTGAGTTGGTGTTGATGTCCTAGAGT
+AGCGAAACTACAAGTGAAGGGGCGCTATCCGGAACCCTTAAGGTCGGGGACAATCTGCTT
+CGATTGGGACTTGCCGTCTATCCCGCCC
+>ds2020-328_324
+GCCGTGGACCTAGTTACTTACTATCTCCTCTCAATATTCTCTATGTTTTGACATGGTATC
+AGAGCAGCGATCTTGCTGACTCTAGTCTTGAATTGTTGTTACCATCATGGGAGAAGATGA
+TTTTTCCCCTGTTGGGAGTAGCACCACCGATCCTACTACTTTCACCGAATTTGCTGCTCA
+AATGGCTGAGTTGATGAAGATACAAGCATCAACATCAAATACAACCCCGACCCCGACTAT
+TACCGACGAAATGGCATCAAATACGACC
+>ds2020-328_325
+GGTCGGGATAGACGGACGGCTGTATAGGGGGATGAAGGGAGTGAAGCAATGGTTAGGTGA
+AGAATGGAAGCCAAAACTGAAGTCGGCGAAGTATGGCTGTGTAAAATAGTCGAAGCCTCC
+AGATGTAGACATCGAAGAACCAACAGCTCTCCCATTTTACCCCTGAAGCTCTCCAAACAG
+CTAGTTGAAATCCAACCAGACGCCTCTCAACCCTAAACATCCGCTAGTTACATCCCAAGG
+AAAGAAAGGGCCAACGTCTATCCCGACC
+>ds2020-328_326
+GGTCGGGGTAGACGACGGCCGGGCGTCAGGGGGGTCGAGGGCATGATGGCCAAGCGAGAA
+GTGCGACGCAAGGGTGTACCGAGGTACTTTGAGTATTTTGTCAAATGGAAGGGCCTGCCA
+GAGTCCGAAGGCAATTGGGAGAAAGAGGAGTCCTTATGGCAGTACAAGGACTACATCGAA
+GCATTCGAACGAGACGGATCAACCTCGACGACGAGGACGTCGCCGAAGTAGGTGGGGGAG
+GATGTCCCCGGCATGTCTATCCCGACC
+>ds2020-328_327
+GGTCGGGATAGACGTGCGGGGTGTTTGATGCACCAGTCCAGCGTCAACAGTTTCCTATCT
+ACAAGGTAGTAAGCCATGGGGTGTGCATTGAGTTTACAGACAAACGCATGAATGCTTCCA
+AGGTTTACAAGGAAGCACCTAAGCCAAAATCTATGTGGAAAATTGCCAATCGGCACGGTA
+CTTCAGTAGAAAAGATCTACGAAGAAATTATCTGATCTTCTATAACGGTTGCGAACTCTG
+CACCGGGCAATCGCGTCTATCCCGACC
+>ds2020-328_328
+GTCTAGTACTACATCCATATTTGAGAGCCACGTCCGCCAACATTGCGAGTTTGCCACATA
+TGACAGACTGTTATTAGGTAAACTTTCTACATTCCCAAACCATGAACTTTTCAATTTTCT
+GGCTCTACCAAATTCACTTATCTCTTCACTTTCGTTCCAACGTTCTATATTAAGATTTAC
+CCGTTTTGTAAATTTGTTATTACCGTTTAACATGCTCACTTTTTCCAGACCGCATGTCTC
+TAAATTTGATGTTATAGCTTCTACATT
+>ds2020-328_329
+GGTCGGGATAGACGGGGGGATAGCTTAAACATCATCTCCTCCTATCCCGGTGGGAGTACT
+GAAAGAGGGTGTTACGGGCTTCTTCTTATAAGAAGGAGGGCTTTAGGGCTTAACTAAGTA
+AGAGGGAGGGCTTTAGGGCTTAACGAAGTAAGAAGGAGGGCTTTAGGGCTTAACTAAGTA
+TTAGTTAAGGGCTCGGAACTTCTAGTAAGTGAAGGTCAGCGGGAGCTGCTATCGGTAGCG
+GAAAGGGCCTTGTCGTCTATCCCGACC
+>ds2020-328_330
+AGTCGATAGCCATTGTAGTCTCGCGACAGAATTACGGCGGTCGGGATAGACGTGCGCCGT
+GGATAAAGACATAAAAAAAAATTACTGTAATAGTGGATTCGGAATTGTGGTGTAACCTCC
+CATTGCTCTATCTCCGATAGCATGCAGCCGATAATGAGGACAGATATATAGAAAGTGTGC
+AGTGAGGGATCTTTATAGGTAACCAGTCTTTACTTATCTCGACTCAAGCTTTACTTAGCC
+CAAGCAATGGGTGCGTCATCCCGACC
+>ds2020-328_331
+GGTCGGGATAGACGACGTCTGGGAATCTAAAGTGACCGGAGCGGCTTTTCTGTATGGATC
+GACGTCTGGCCCCCCATTTCTCGTGTTTTTTGGCTTAACATTTATTCGCTATGAAACTGA
+CAGAGATGTAAAGGCAGAAGCCTTGTGGTGCTCTTTGATGGCAAGGATGCTTTAACTTGC
+ACGCGGTAACCCGTATTCCGTATTCCTGTTGAAACAAATCCATTCTTCCAGAACCTGTTG
+GAAAAGCTCACTACTTCGTAGCCTTT
+>ds2020-328_332
+GCCGTGGACCTAGTCGGTGTTGGGCTGAATGGAGGCAGCAGAATATGCGACGACGATCAT
+AGTAGAACAGGTCAGGGCGGCAGTGAGGTCAGCATTTCCGGCCGCCAAACCGAGCACATT
+CGACGACTTCATGGACGATGCTTACGAGTGGCTGGTCTCGGGATCTTCTGCAGGGATGCC
+AAGTGTATTAAAAAACACAACTGACCCTGTAAGGGATTTTATACTCAAAGATTTGGGATT
+AGCACCGAACAACGTCTATCCCGCCC
+>ds2020-328_333
+GGTCGGTATAGACGGTCGCTGGTGGTGCGAGCTGGGAAATGGGGTGTGCTGGTGAGTGAT
+GTGGAATCGGCGGAAAAAGAAGTGCTGAATGTTTCATCCAAGGAAGTAAGGCAGATAGAG
+AAATCTATGGCATCAACAAGAGAGATGAAGAAATATGTGATAGGTAGGAAGTAAATAGCT
+TAATAGCTGTCACTTGACTAGAGGTTTGAGTCTAGGTCAGGGACGAGAGTTCATAAGGGG
+GCTTAAAACGCGCGTCTATCCCGACA
+>ds2020-328_334
+GGTCGGGATAGACGAGACAGTTGCATCTATACTATTGAGTTGAGAGAAAGAGAAGATGGG
+ACTAGTTTGCTACTCCCGCGGGCCCTACTTACGTAAAGCTTATCTCCTCCAGGAGGCAAG
+GGATTGCTGCTTCCACAGCTGTCTCCACTCGGTCAAATGCGTCCTGCCTTGAACGAAGAT
+GAACAGAGACTCCTTGGGACGTAAAGTTCGGATCTTGGCCTTTCCTATCTGCCAACAAAC
+ACCTTGCGCGTGCGTCTATCCCGACC
+>ds2020-328_335
+GGTCGGGATAGACGGATCGGAGGCATTAAGTAAAGAACAGTCTATGTCACTAGATTGGAC
+AATTGAGTCAATCTCAGACCAAGTGGTAAGGTTTAATGAGTTAGGAAAAACAGAAAGAAT
+AAATGGAACCTTATTAAGCGGATGGCGTCTGACCTCGTTTATCAATACTGTATTAAATAG
+AGTGTACTTGTTAAACTCAGGACTAAGTACGTGTGTGAACTATGCGTTACACAACGGTGA
+TGAGATGTATGCGTCTATCCCGACCC
+>ds2020-328_336
+GGTCGGATAGACGTGTTGGCTGCTTCAGCAAGAAGCTTGCTGTCTGCCCAAGGAATTCGC
+TTCGACTTCCTACTATTTCAAGGGATCACCTTTCTAGTTGTTGGCCTTGGTTTGATAGGA
+GAGCAGGTGAGCTGACCTCCTCAGAGTAATGCTTTCAAGCGGTGTTGAGTGCTTTCCCGG
+AATGTACCATGGGGCGGGTACTTTGATCAGAGCTTTGAAATCCATATCGGCGCGCCGATG
+ACAGAGCTGTCCCGTCTATCCCGACC
+>ds2020-328_337
+GGTCGGGATAGACGAATGTGCGGCATGATAGGTGGCGTAAGCACGGTGTAGCTAACAATG
+TTAGTGACGAAGAATGGTCGCAACTGTTATATATGCAGTCACTATATGGCAGAGGTGGTG
+TGGTAGTCGACTGGCAGAAGGAGTTCGAGGGTAAAGCGAGGGAGCCTGAGAATATTTTGG
+CGTTCAATGGTTCAGTGTGGTCAGCAGAATATGCGACGACGATCATAGTAGAACAGGTCA
+GGACTGGCAGGCGTCTATCCCGACC
+>ds2020-328_338
+GGTCGGGATAGACGTATCAATACACTGGTCGGGATAGACGTACAAGGGGGTTGTTGGCCC
+ACGCTACCGTGGAAGGAATGAAGAAGGGGATGTTGGTCCAGGGTAAGGATCTGAGTGCGG
+AGGAGCTGGCGGAGTATCAAACTTGCCGCAAGATCATTGCCACCGCGGCGTTCCGAGTGG
+CGGAGATCAAGAAAATGATCAATGAGTACACGGGTACTGTTGATAAAGCTATCAAGAACA
+TACAGGGGGTACGTCTATCCCGACC
+>ds2020-328_339
+GGTCGGGATAGACGCCTGTATCCATTATGCTCTCTTCTTCATTGCTAAGAAAGAAAAGAA
+GAACCTATCTATATAGTATAAATAAACTCTTGTTTTGCATCCGGGTCGATAGCTCTCCAA
+AGTTCCGACTCTCTCTTTCTATATGCAATAATTTGAATCACCTACTTGGTACGCCCCTTC
+TGGCACAACACACATCCCCACTCACAAGAGCACACCTGAAATTCGGATAGAGCACCTCAC
+CTCGTCTATCCCGACCGCCGAATTC
+>ds2020-328_340
+GGTCGGGATAGACGAACGACCGTGCTGAATGAAAAAGTTTCCCCCATTCAATTTGTAGGG
+ACAACCCCTACCTCCTCTCTTCTAGAATGCTTTTAGGCGTTCTGGTTTTGCTTCTCATTA
+AGAAGCACACCGGGCTGCTTAGTCGGGGTAGGCAAGCGGTGTGCTTTAAGAGTAAAATAA
+TTCATATCAGAATGAAACGTAAGCTTTCTATTTTTCAGTACGGATCACAGTTTGATCCAA
+CCGGTCCCCCACGTCTATCCCGACC
+>ds2020-328_341
+GGTCGGGATAGACGAGAGTAGTTGGTGTCCGGAAGTAAGATAGAGAAAGTGATCGATCAA
+ATTGAAGGGAGTGGTATGGTACAATTACAAAATGATCCAACTGAAATTGAAGATCCATGT
+GAAGTATTTGAACCCGCACAGCCTGAAGTTGGATTGAGTGTGCAGGGAACAAGGGATGTA
+AAGGAGACATTGGATCCGCCCGTCTATCCCGACCACCCGAAGATTTCGTCTATCCCGACC
+AGAGAGCATGTACGTCATCCCGACC
+>ds2020-328_342
+GGTCGGATAGACGCTTGATTCGCCTACTTCAATCAGATCTGCACCAATGGCAAAAGCAGC
+TACAAGATAGGAGGAGTTAGAAGGTTCCGTTGTGGGATTGATCAGAAGATTAGGGAGTAA
+CTCACTTAGTGCTCTTATGCCAAGGAGTCGCTTCTAGTACATATCTCTTCCAAACCTTGA
+TACGAAATAGCCCCCTCTTCTCTAACAAGTCTTTTTCGGGAGAACTGCATGCTCCACGAA
+GGGCGTATGGACGTCTATCCCGACC
+>ds2020-328_343
+GGTCGGGATAGACGAAAAAGCCCCCTGGTATGTGCCGCTTTCCTAATCAAAAGATAGGAG
+AGCACCCCTTCTCCCGAAGTTACGGGGTCATTTTGCCGAGTTCCTTCGACATGGTTCTCT
+CAAGCGCCCTAGTATACTCTACTTGTTCACCTGTGTCGGTTTGGGGTACGGTCAGTTCAC
+CGGGAGGATCGCCCTCCCAATTCGAAGTTTTTTCCTGGAAGTTTCAACCTTGTTGACTAT
+GACAACGACGCGTCTATCCCGACC
+>ds2020-328_344
+GGTCGGGATAGACGTCTACTACCCCTCTTCTTATGGTGTATCATCCGCTTAAATATGAAT
+GGTAAAAGGAAGAGCTACCTCTCCCATATGCGTCTCAATTTCTTTCATCTTTCCCTCACC
+CACCGGTCGAATCTAAGGTGCTTATAGCGCCTGGTCAACTACCTACTTCTCTCTCGATTT
+GGTTGATCGCAAGCAAGCTACCTTAGCGCAGCGCTCACACCTGAACCCCCCGTCTATCCC
+GACCGCCGTAATTCAGATCGGAAG
+>ds2020-328_345
+GGTCGGGATAGACGATATAGAGCGTTAATGGCTTGCGTTGTCAAAGGACTGTCCGATTGA
+GACAATGTTAACCATGCTGGGTAAAAAGGCAAGGATTGATAAAATTGTAGCGTTGAGTCA
+GTATCTTGAATGAGTAAAGGCTTAACTTGACTCTCTTTGGCACGTATTTGACCGGCAACC
+TGTTCAACTTTGTCTTTGGGTACCCCAAAGTAAGCTTGACCGACCAAATTAAGCGGACAC
+CACACTGACCGTCTATCCCGACC
+>ds2020-328_346
+TGAATTACGGCGGTCGGGATAGACGGTCACTTTGGGTTGTGCAAGGGGGCCATGGAGACT
+AGGTTGCTGTTTAGTGTGGCTTTTGGTAGTATTTGGTTTGGGAGGTTGGGATACACGTTT
+CTACGTGGAAGTTATGGGGTGTCGAGAGGTACCTACACAACCGTTATTGAGTACCTTGGG
+TCTTTTTCGTTGACTGAAGTTGAAGAAATTGTAGGAAAATACAAGAAAATGTGCATTACT
+CCCCCTACGCGTCTATCCCGACC
+>ds2020-328_347
+GGTCGGGATAGACGGTGCCCTAGGATGAACGAAGGAGAATGGTAGTCCCTACTAAGACTG
+TGCCTCTTGTGCACCTATTATGCTATTCATACAGGTGATCATGAACGACAGGCTCAGGTC
+AACGAAACCGCTTCTGCGCCTCTAGTCCACCATCAAATAAGGTCTTCATTGGTTCTATCC
+TGCCGCTCCATCATCGGTCAATTTCGCCAACCACAGCCCGCCATACGCAACCAAAGCACG
+ACGACGCGTCTATCCGACCGCCG
+>ds2020-328_348
+CTGAATTGCGGCGGTCGGGATAGACGGCTCAAGGGTTTCTATACAAAGCCCTTCTCTTCT
+TCACTCAAAGGGGCAATGCACTCTTTGAATGGTACTTGATTCATAAAGAATGAATCTTTT
+GGTTAGAAGTTATACGGACTTTATAAAAGTAAATGCCACGTTCCGCGTGTCACGAGATAT
+GGGGCGTTCTAATCGAAGGGTCGTACTCCTCGTCTCGGCCCTATTAGGGTAAGGCCAATG
+CACCAGCCAGCCGGGGTGGTGG
+>ds2020-328_349
+GGTCGGGATAGACGCTCACCTACCCTCAAAGGCACGGTTTTACGTGATGTAGTTTCTACA
+CAACATGGGGGTATCCTACTCAGACTGTGAGGGAAGCCAAATTGGGACTTACTCCCCCTC
+CAGGGTACCAGCGTTGGGGTGGCCTCTTGCCCCAAAGCAAAAAGGTACGACACCGGGTTC
+GTGATCAAGACATCACAAACTCATCCACATGATCCCGATCTTTTGGGACCATAGAAAGGC
+ACACGGTCCGTCTATCCCGGCC
+>ds2020-328_350
+GGTCGGGATAGACGCGAGGTGGAGGTCCTAGTTCTAACTAGGACTGTCATAGGAGCTAAA
+AGAAACTCAAGATAGAGGAGCGGGTTTCCACTGTTAACCGTTGCACACGAAAGAGGATCG
+GAGGCTCCCCCAACCTCTTAATCAAGGGGTTTTGAGCCCCATCTACATCCATGTCAGCAG
+CATCACCCGGGATTATATCCATTGACTATTCATACCAGGTCAAAGGAAAATCGAAAAGAC
+CAACGCCTCGTCTATCCCGACC
+>ds2020-328_351
+GGTCGGGATAGACGACGAGGGGCAGTATTGGGACGAACAGTTGCCGAGGTAGTGAACTAC
+TTTGACAACAAATGTTCGAATGCACTTGAGGTTATGGCAGACGATAAATTTAGTGTATCC
+TATCATACTTACTATGACGTAGATAGGCCAGCTGTGTTGGGTTTGAATACAATGACTGTG
+AACGTACCGGTATATTGGACGAAGTTACCAGTAAAAATACAGCCTTACACATCAGAGCTT
+ACCAGGGCGTCTATCCCGACC
+>ds2020-328_352
+GGTCGGGATAGACGAGCGGAAGGTGTTCAGTGTACCTTAGTACAAGATCGAAAAGAATGC
+ATTGGATGGATGCCCGGGCATTGAGAAGGAAGGACGCTTTCAGAGGCGAAAGGCCATGGG
+GAGATACCGTCTGTGATCCATGGATCTCCGATCGGGAAACCGTATCCAAGCTCCGCGGCT
+AGTCTGCGCTCTTTGGACTTTTAAAACTTAGCGAACTGAAACATCTGAGTAGCTAAAGGA
+AGGCGTTCGTCTATCCCGACC
+>ds2020-328_353
+GGTCGGGATCGACGAACAATCCCCGTAAAATCCTTTGTTCCTCTCATTTATACTTTGGTT
+TATATTCTCCGCTTATTTATCTTTTGTTTTGATTCTATTCAAATATAAAACTATTGATTC
+GTTCTATATCATACCGTTTGAATTTGGATTGAAAAAACAAATAAATAAAGAAGAGTTAAG
+TAAAATCAAATAGTCTTCTTCACAATATACTATGACCAGTAATGCGGTATAAGTAATTCC
+CGAAATCCGTCTATCCCGCCC
+>ds2020-328_354
+CTAACTCTAAATCTCTTACTTGAGTCGTATTTTTGCCCTTTATGAAGTCTCGTTCGACTC
+CTGTAGAGGGAGTCTCACTCTCTTTCAGCATTCCTTCATGGATGTTTAAGTTTACCTGTT
+GCTTAAGGAATCCCGTACAAACAAGATAATGAAACCAAACCCCTTTATACCGTTCGACTC
+CTTTCCTAGTCCTAGCGCTGGATAAATCAACTTACAATCGTGCTTGTTCCTTTACAGTAG
+ACCGATGCGTCTACCCGAACC
+>ds2020-328_355
+GGTCGGTATCGACGTATGGGGCTAGCTTGCTTCTACTGGTGGCGGGCGGGCGAAGGGTCC
+AAAGGACACGTAGCCGGGGGCGAGTCACAAAATCCAATAGTTCCTCCTTAGCGCAAGCAC
+TAAGTAAGCAAGCTACCTCCCCCTATGGTCGAGCAAGTAAACTACCTTCTTGTTCATCAA
+TCGGAAATCAAGACAAACCGGGCACTACGGTGAGACGTGAAAACACCCGATCCCCTTCCG
+ACCTCGATATGTGGAATCACC
+>ds2020-328_356
+GGTCGGGATAGACGTAATTGGCCTTTCTTCTATTCTAGTCCGGATATCTGCATACCATGC
+CGGCTGATCGGAAGCTACATTCTTCCATCGTACAGCAACAGTAGTTCCTTAGCTGCCATC
+CATAGCTACATTATTCGACTAGACTAGTAAATTCAACTAGCTACCCCATGTTCTAACATG
+AAGTCTGCAATGGCTGTATCCATGCCTTTAACGGGAACATGCGGATACATTAGCAACTGG
+AGGAGTGCGTCTATCCCGACC
+>ds2020-328_357
+GGTCGGGATAGACGTGTGCCCTCTCTCCTCTGTTTATGGGATTGCGGCAGCGTATTGGTA
+TGTGGGAAGATTTGGGCAATGGTGTACAATCTCAAAGTTGGAACATGCCACTCGATCAAA
+GTCACTTCGATTGGCATGTGTCATTGCGCATGCTGTCTGTAGCTTTGGACGCTATCGCCA
+AGCTCATCCGAAGACGCGCAAGTGACAAAGTGAGACGGGACTTGCTATCTGTGTTACGCG
+GTGTCCCCGTCTATCCCGACC
+>ds2020-328_358
+GGTCGGGATAGACGTCGTAGATACCTTATCAGATAGAGGGGGGCTCAAACCTCTTCCTGA
+CGGAAATACCACCATTGAGGGAAATTCAGACTCACTCTTGGTATCGATTCTGAGAAGACT
+TTTGCCCCACCGGCAAAGGTTACTTTTGTACGGGCTTGCAGTTGTTGCCACGGTCAGAAA
+GTAGTCTTTGTTCCGGGAATGCTTTTCAGAAAGGAAAACTACGGTTAAAAACTAATGCAG
+AGCCGCCGTCTATCCCGACC
+>ds2020-328_359
+AGGGTATTGAGGTTGTGCGACACTAGGCCTGGCGTCCGCCTAATTAGTGGGGAGACATTG
+ATGTACGCGGTCAGCGGGGTAAAAGATCACCAGAGATACCTTCAAAAGTAAGTGACCAAC
+CGGGAAGTCGCTGCCGTTTCTAGCTTTGCGGCTAACGAATGTGGGAATGAGTTCGCCCCT
+ATGGGCGAGACTCCCATCCATCGGGTCTCCAAGCAATGATCACTCAACTTTATCAACTCT
+GCTCGACGTCTATCCCGACC
+>ds2020-328_360
+GGTCGGGATAGACGATGATGGCCGCTGGTCGGGATAGACGGTGAGACCCCTGGTCGGATA
+GACGTCCCCGCGCCCTGGTCGGGATAGACGATGCACTGGGGGTCGGGATAGACACAAGGC
+GCAATCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCGGATAATTAGTAGGTCCACG
+GCAAGGCTACACTGACTAGGTCCACGGCAGGCGGCTACAAACTAGGTCCACGGCAGGTAG
+TTCGCAACTAGGTCCACGGC
+>ds2020-328_361
+GGTCGGGATAGACGTTTTTGGCACCTGAGATCATTAAGGGCGAAGGTCATGGAAGTGCTG
+TTGATTGGTGGACTTTTGGAATCTTTTTATATGAGCTGTTGTTTGGTAAAACTCCTTTTA
+AGGGTTCTGGGAATCGTGCAACATTGTTCAACGTTGTTGGTCAGCCTCTCCGGTTTCCAG
+AATCACCAGTCGTCGGTTTTGCAGCAAGAGATCTCATAAGGGGATTGCTTGTAAAGGACC
+CCGCCGCGTCTATCGCGACC
+>ds2020-328_362
+TGGTGGGATAGACGTCCTCCCTTAGTGTTACCCAACCTTCAACCTGCCCATGGCTAGATC
+ACCGGGTTTCGGGTCTATACCCTGCAACTTAACGCCCAGTTAAGACTCGGTTTCCCTTCG
+GCTCCCCTATTCGGTTAACCTTGCTACAGAATATAAGTCGCTGACCCATTATACAAAAGG
+TACGCAGTCACACAGATTGCTCTGTGCTCCCACTGCTTGTACGTACACGGTTTCAGGTTC
+TTTTTCGTCTATCCCGACC
+>ds2020-328_363
+AATTACGGCGGTCGGGTAGACGGGGCAGAGAAGTAAGGGAAGCATTAAGTAAGTAGAGCG
+TGAAGGTAGGGCATGAAGGAAGCATGAAGCTTGCGGACCGAACTCTCACTCGAGAAGGGG
+AAGAAGCACGGCAGTCTTTTGGAGAAGCTTCACCGATCCGACAGCAGCTCTAGCTCTTCG
+AGCGATGAAGAGGGAGGTGAAGGAGAAGAGAAAAAGAAGAAGAAGAAAGAATCAGTAGTG
+GCGGCCGTTGCTGTGTATT
+>ds2020-328_364
+GGTCGGGATAGACGCTGGCGCGCCATCGATCAGGCTGAATTAATGGCGGATTGCCAGATT
+TCTTCTGTCTATCTGGCCCTTTCTGGCAAGCACATCAGCTGCCAGAACGAAATCGGTATG
+GTGCCGATTTCCGAAGAAGAAGTGACGCAGGAAGACGTTGAAAACGTGGTGCATACGGCG
+AAGTCCGTGCGCGTGCGCGATGAACATCGTGTACTGCACGTGATCCCGCAGGAACCCGGA
+TACATCGTCTATCCCGACC
+>ds2020-328_365
+GGTCGGGATAGACGTTGGTCGGCAATCTGCAGGCGTAGGCTTGCTTGCTTGCTTGACTCG
+GCGGTCACTTTGTCGGTCATCTGCGGTATCTTGATGAAGGCGCTTTTCACGAAATTAATG
+CCGGATCGGTCCAAATCGAGGAGATAGTGTCCACGTGGGACTCTCTGGAAGACAGTTTCT
+TTGCCAGATATCATTTCGAAGGTGGGTCTGTCGACTTTTGGTGCATGCTTACAAAGGGGC
+AAGTAGCGTCTATCCGACC
+>ds2020-328_366
+GGTCGGGATAGACGGAAGAAGCCTTTTTCTTCCTTTCCGTCTTTAAACCAACTGCGAAAT
+GCCTTTCTAATTAAGTTGCAAAAGCACTAGAAACCATCTGGAGCTATGTATATTAATGTA
+GGTACGCTTAGCGCTTGGTAGGTCAGGAGCAGAGCTTGTAGTATAGTAGTTCCAAATCCA
+ACTTCTAGGGCATAGGTTTTCCTAACCAAACTAACAACTCTAGTTTATACTGAGGCCATC
+TACCCGTCTATCCGGACC
+>ds2020-328_367
+GGTCGGGATAGACGCCAAGATCTACTTCGGAACAGATACCTTTCCACCTACCTCTCTCTA
+ACAATTACTTGTAGAGACGTATGCTAGGATATTCCATGTTTCCATGGAAAAGATCAATGG
+TCTTCCGACCACTTGAATTGACTCTCTATAGTTGTCTAAGCTATAGAGAACCCTTTCTTG
+ATGTCACCATCAAGAAAAGATTCCGTTTCGAAGGCATTTCAGCCTTCTCATCAGTGAGTT
+CCATCGTCTATCCCGACC
+>ds2020-328_368
+GGTCGGGATAGACGATGCGCACCTGTCTTTGAAGAATGCTGCGAACCCGGCCTAAACGCT
+TCCTGAGACTCAACCCTACTTCGTCTTCGCCCTCCAGCCTTTCCAGTAGTGGATTCAGCT
+CATATTATAAATTCTTACTTCACGAGAGAGATACTCACTATTGAAGGGTATACCCACGGG
+AGAGATACCGAAACTAGAAGCTTTGTTGCACCGCGCTCATTGACTTTCTATCAGAGGGGT
+TGACCGTCTATCCCGACC
+>ds2020-328_369
+GGTCGGGATAGACGTTGTCCGGTAGTGGTTCTGGTTCCAACATCTCTAATTGTGATGTCT
+GTGTAGGTTTTGTCAACGACGTGCCAGCGGTCAGTCTTTCCACGTGAAAACCCGGCGCTA
+GTAAGTCAAACTTGACGGACAGCCTAGCCAACACATCTTTCACCATGTCACTAGCCTGGG
+TGTATGATCTAGGAGTAGGCATAGTGAAGTCATCATATGATGCAACTGCAGCACACCAGC
+TCATCGTCTATCCCGACC
+>ds2020-328_370
+GGTCGGGATAGACGGTGTGGTGGCTTTCATAGTTGCTATTGGGAGGCAGCTTTCGAGTAT
+ATTCAATTGATTTTTGGTATTATTTAGTTTAGGTCAAATGTTCTTTAATTGTACTTCTTT
+TTTCTATGCCCGCGGGCCACCACATATCGTATCAAACTATTGCCCTGTTTGCATTAATGA
+TGGCCTTTTTTATCTCATTCGTATTCCGATCGAGTTTTTTTATGAAACTTGAAAACGTCT
+CTCTCGTCTATCCCGACC
+>ds2020-328_371
+GGTCGGGATAGACGTGGGAACCGGTTGTATGATATCATATTTGAATTGTAACAGGATATT
+AAGTAGACTACTGAGTCATAGCCCGTTGTTCATGTCGGGGAGAGTTAAATTGGAATATAG
+ATTATATATTGTGAGGTGCCTTTTTTATAGCAGCAACCAAGCTTGAAGGCATTTTGTTGC
+TATGCAATTTAGGCGATGGTGGAGCATATGTTATTCTGGACGCTCTGGCTATACTTGCGA
+TTGGCGTCTATCCCGGCC
+>ds2020-328_372
+GGTCGGGATAGACGCAGCCTACTTCTCCAGTGTCTTCAACATCAAACCTGTCCCGGTTCT
+GTATCGCGGCGAGTTCGACCTGAAGACACTGGAGAAGTTGGCTGAGACTATTGACCCCGT
+CTCGAAGGAAGGCTTCGTTGTTCGTGTCACCGACCGAGTTGCCTACGATGAGTTTGACCT
+GAAGTTCTCCAAGTGGGTGCGGAAGGGTCACGTCCACACCGACAAGCACTGGATGTCTCA
+CATACGTCTATCCCGACC
+>ds2020-328_373
+GGTCGGGATAGACGCCGCAAATCCCAATAGAACGAAGAACTTACCCTATTATTATATTAC
+CCAAACGAGGAGATAGACTATCAGCTTACCACTTACTTAGATACGGCTGAAGCAGAGCCG
+GGGAACGAGACGGGTTGAGGTTGAACCAGGAAAACAAGCCACAAAGACGGTGTTTGAGCC
+CGCTGCCCCTTTCTATTACAATTTCTTTCCCTACTCCTTAACCTTGGAGCTCTAGATAAG
+ATCTACCCTTCAGTGAG
+>ds2020-328_374
+GGACGGGATAGACGACGGGCTCGGTTGCTCCAGGTAATTTCCTCCTTCGTAACAAAGTCA
+GTATATGCCAGACGATGTAAACTTTGTATTCGACAACGACCTCCCGGACGATGATGTGTT
+GGTTCATCCAGACATCACGGCGTTGGGCTCTCCGTCTTTAAAGACGAGACAACGTCAGTT
+CCGATCCGGAGCGTTATTTTCTGGTCCCGGTCTCAAAGAGATCGCTCGATATGGTGGTTA
+CTCCGTCTATCCCGACC
+>ds2020-328_375
+AAAACCCCCCTCAGCAGCCGCGGTAATACGGAGGATGCAAGCGTTATCCGGAATGATTGG
+GCGTAAAGGGTCCGCAGGTGGCACATCAAGTCTGCTGTTAAAGGACAGGGCTTAACCCTG
+TAAATGCAGTGGAAACTGAAGAGCTAGAGTGTGGTAGGGGCAGAGGGAATTCCTGGTGAA
+TTACGGCGGTCGGGATAGACGACACAGCTCCCTGGTCGGGATAGACTATATACCTGCCTT
+TTACGTCTATCCCGACC
+>ds2020-328_376
+GCCGTGGACCTAGTTTACATTTATCTGCCTGGACCTAGTTAATTTAGCGGTAATAGGTCC
+ACGGCACTGTACCGACTACTAGGTCCACGGCAGGCAAAAGGCGACTAGGTCCACGGCGGG
+ATGCGATAACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGACT
+TTTGCTGCTGGTCGGGATAGACGCGCTTATACCCTGGTGGGATAGACGGCCAGTGCGCTA
+TTCCGTCTATCCCGACC
+>ds2020-328_377
+GAATTTCACCTCTAGCATGTAAGTACTCATGCCCCCGACTGCCCCTATTAATCATTACGG
+CGATTCCAAAAACCAACAAAATAGAACCGCACGTCCTATTCTATTATTCCATGCTAATGT
+ATTCGAGCAAAGGCCTGCTTTGAACACTCTAATTTTTTCAAAGTAAAAGTCCTGTTTCCC
+CAGCACGCCCAGTGGAGGGCATGAGGTTCTTCAGAAGGCAGGCCCGGCCGGACGAGTGCT
+TCGTAGTGGCGGCCGTT
+>ds2020-328_378
+GGTCGGGATAGACGCGGCATGCACCTCCAGTTAAACCATAACTCACCAACAAATTCTCTG
+TCTGCCAGTATCATCTCAATATTGTCTTTACCAAACTGCTTGATAAAGCGTTCAATGAGT
+TCGGCTTGCTCAAGATGGTTTGTGTTACCCCGTTTGTCTAGCATGTCCCAGTACAGTGGT
+ATGGCAATGCCCTTATAGACCACCCCTAGCCCAGTTAAACCATAACTCACCAACACGTTC
+CCACGTCTATCCCGACC
+>ds2020-328_379
+GGTCGGGATAGACTCCCCTACCCCCTACTCTAGTCAGCTTTCTATCTCTTTCTCCAACCT
+TCGATGATCCTCCTGCGGGCAAATCATCGAAGTCAAGAAGAAGTGATGGGCCTGATCTTC
+CGATATCGATATCAGATCCATAAGCTAGCTCTTGGTTAAGAAAATCCTGAATATGCTGAC
+CCGGGTGCAGTAAACGAACTTATATTCTCTTCCCTCCCCTCTATCCCGACCAGGGTGTTG
+ATCGTCTATCCCGACC
+>ds2020-328_380
+GGTCGGGATAGACGAGAAACCCTCCTGATGTATTTTAGTATAAATGTCCGCCATCTTCAC
+ATCAATTCTAATTTTTACAGTAAAATTGCTTTGCAGTAATGGAGGTAAATTTGCCAATCT
+CGGACTGACGGAATCAGTGATCTGATCATAAGTAGAATGAATTATACCTCACCGTTGCAT
+TATTGCAAAATCGTGATATGACATTTCAACTACATCGTAATATCTTTTGAAAACCGAATG
+TAGCGTCTATCCGACC
+>ds2020-328_381
+GGTCGGGATAGACGCGCCAGCTGATGTATCAGTTCGAAGATACTGACCTACTTCGTGCCA
+ATCACACGGTTCTTCACGGTGACTAAGGGTGAACCTCTCACGTGTAGCAGAGACCGCCTT
+GCGCAGCAAGGTTGATTCGCGTTCAGTTAGATCAGACCAACGTTTGTGTTGGCCTTCAAA
+CTTCATCAAAGAGTTATACAGTCCGGGTAAACCGGCACCTCTTCGGGTAAAACCACAATT
+TTCGTCTATCCCGACC
+>ds2020-328_382
+GGTCGGGATAGACGTTAGAGCCGAATGGAGCTCAAGAGGTCTCTTGAATTGCTCATAAAG
+AAGACGGAGGATGAAGGAGCAATAGTCATTTCCAATCCAGAAAATCATTGTAATAGAGTG
+TATCTCAAAAAAAGGGAGTAAGGGAAGCAGTTTTAGTATTTCCTCACAACTCCGAATTCT
+CAAAGAAATCTCTAAGAAGCCTCATCGTCATCGGAGTTGACCTCCACCCAACGCACACCA
+CCGTCTATCCCGACC
+>ds2020-328_383
+GGTCGGGATAGACGCGTAGCCCCCCTGAAGAAAGATGGTATCGTAAAGTAGAGTGGATTC
+GACGGTATGCCAGTTGCGTATAGAAAGAAGTTCTACGATTTCATGATGCAGCACGGAGTA
+TAAAATCTCCGTTAGTTCAGTTTCTGCTTTTTCCCTTATTTCCCACTCCTTATGTCAGGC
+AAAACCTGACCACGCGGACTTGAAAGAAAAAGCTTCGATGCATGAGAAGAGGACCGGGCA
+GCGTCTATCCCGACC
+>ds2020-328_384
+GGTCGGGATAGACGACGTGTCCACTGGTCGGGATAGACGACACATTTCCCTGGTCGGGAT
+AGACGTAACAGGGGATCAGATCGTCTATCCCGACCGCCGTAATTCATAGGCAAGTGGACA
+CGGAAATTCAACCATTCGAATTCGTAACGGAGATTGATCAACAAGGTACAGGTACTCCAT
+TATTCCAATATCACTTGACGTTTGCAGCTTACTAAGGAGGGGACTACCAATATATGCGTA
+ATAGTGGCGGCCGTT
+>ds2020-328_385
+AAAGAAGAGCAGCAGCTAGCCATTGGGGTGAAGGATAGACGGAAGAAATGACAATAATGG
+AAAAACAAATACTTAAATGGACTGTAGAAAAAGCAACAGGCCAAAAAACACAGAAGGATA
+AAACAGTAGAATTTATGTCGGAACTAAGAAAAATAAGACAGGCTGACGGTGGGTTAGGCA
+CAGCAAAAACTATATACAAGGGAAAAATACCTATGAGAAATGGGTTGCCAGACTTAGCGG
+ACGTCTATCCCGACC
+>ds2020-328_386
+GGTCGGGATAGACGTTTAGTTGGGATGTTCTTGTTGCTGGTCTTTTTAAACTTCATTTTT
+GATGAAAAAGAAGTGATGTGGTTTGAATGGCTAGAGCATAAATTGGCACGATTTGGCAAG
+GTCGATGCCATGAGCGTGTTTGTCGCCTTGGTACTACTAATGACCAGCAACAAGAACATC
+CCAACTAAACGTCTATCCCGACCAGGGGAAGCTACCGTCTATCCCGACCAGGAGTCTTCT
+TCGTCTATCCCGACC
+>ds2020-328_387
+GGTCGGGATAGACGTATCGTGTGCCTAGACGACTACAACTATCAAGTCAAGTGCTTAATT
+GAAGCTATTAAAACTGGACCTAGTGCTTGTGGTACTAGTATAAATGATAAAGGTGTATAT
+GATATCTTAGAAAATCTAATCAGGTGGACAAGGTCTCAGAGTGCTGATACATCAGATGAC
+AAGAATAAATTCTTTGAATTTGCTACCAACGTATGGCACTGCTATAGTTATGATGATGAC
+CCGTCTATCCCGACC
+>ds2020-328_388
+ATAGTACGATAAAACATCTTTCTGAAAACGGATCGGTAAACGATCTGTAGCAGAGGATAA
+ATCAAAGCTGTGGAATTGGTGGTCACCCAACATGCCTAATAACTTTTTATTTAGAAGAGA
+AATCAAAGGGGCACCTTGATTAAAGGTACCATCCTGTTGAATTCTTCTTAAAATAGAGAA
+GATATAATCATGAAGGGGCTTTAATATGGATTGTGTTACACAATCAGTAATAGCAAAGGA
+GTAGTGGCGGCCGTT
+>ds2020-328_389
+GGTCGGGATAGACGAGGGGTGGATATGGGGGAGAAGGTGGAGAGTCTGTGACGGGAGATT
+TAGAAGGAGCAGTCGAGGGTGGAGTGCCCGCAGGAGAAGGTGAAGCAGCTGGGGTAGGCT
+CTGGTGGTAGTGGAGGTGGTGGAGGAGGAGCCGATTTTGGTGGTGGAGGAGGAGCCGATT
+GCGGTGATGGAGGAGGGGCTGATTTCGGTGGTGGAGGAGGAGGAGGAGGAGGTGATTGAG
+GTAGTGGCGGCCGTT
+>ds2020-328_390
+GGTCGGATAGACGTACGTTTGACATAATCGATGATCCAATCCCATAATATTTCAGGCTTG
+TGAAACGGTATGTTCTCTGTGTCAATGCGGATTGCTGAATCGTGTGCGTTAACTCTATCT
+ACCGCTGCGTCTGCGATTTGAAAGGTTGGGATCGGAATGTCAAAATTTAAAGCGCTAGTT
+TGGTCTCGTCCGCATGCATGATATAGGTAGAAGGTTTCTTTTGCAGGAGTGGAGGCGTCA
+TAGTGCATAACGTA
+>ds2020-328_391
+AACGGCCGCCACTAAACCATTCTTCGTGGATGACCATGCGTGAAGTTCAGGATCTCTTTC
+GCGCCACGAGTCCATATTCATATCCGGCATGGCCAGTATTGATATGAACTTGTTCTTGAG
+GTATATGTCTTTGAATATGTATTTATCGTCTTCTGAATATTGCGAGTGTATAGTGGCGGC
+CGTTGCTGTGTACTTCGGGATAGACGCGGTGTGGCCTTCTATCCCGACCAGGGTGTTGTA
+CGTCTATCCCGACC
+>ds2020-328_392
+GGTCGGGATAGACGAAGACTCACTTTCTATTTGTTTGGCAATGCTGCTCTCCGCTATGAT
+GTTGCGACAGATGTTTGCTGATGAACCCATCCATTATGTTGGTCTGAATGCACAATTATT
+TTGTCTAAATTACATAGTTGGTGATACCATAAGTAACATCCCAGGTGATGGTGAAATATT
+CATACGGCAGATGATGACTGCAAAGTGCGCATCAATTGCCAAACAAATAGAAGGTGAGGC
+GGAAAACCGTTATC
+>ds2020-328_393
+GCCGTGGACCTAGTTTGCAATGGGGTAAGACTAGGTCCACGGCAGGGGGGTCAGGACTAG
+GTCCACGGCAGGAAGGCAGTACTAGGTCCACGGCTCTCTGTCCGTGAATTCGGCGGTCGG
+GATAGACGTTTGTGCGCCCTGGTCGGGATAGACACGGACAGAGAGCCGTGGACCTAGTGA
+CATTGCAACTCCTAGTAATCTAGGCGGTGAGGGACTAGGTCCACGGCAGTGGATAGGGAC
+TAGGTCCACGGCTC
+>ds2020-328_394
+GGTCGGGATAGACGTTAGAATGCCATCATCCCATTTAATTTTACTTCAACCGCACATATC
+TCTATTTCTTTTACTATAAGAATAACATTATGAATATCAGTAGTACTATTTGGATGAGTA
+AATAACTTTAAAAAAATAATAACACACCTAACGCCAACAGGAACCCCTAATAGACTAATA
+AATTTCATAGGATTAAGCGAACTAGTGAGCATAATGATTCGACCTATCACCCAATCTACT
+CGTCTATCCCGACC
+>ds2020-328_395
+GGTCGGATAGACGGTCTGCCCCCTTCTGTGGTCAACTCTCAAGAACTCTGCTATGGCCCC
+AAATGCACATTTCGAGCTCTGCAACCTCACACCAAACTTGTGCGCGTTTGCCTGACATGC
+TTGAGCACATGCTAGGTTATTTGTTCCTATGAGTACGTCGTCCCCGTTGTGCAAGCTTGA
+GCCTGGTGTTCTCCACTCTTTTGCTATCTTCGATGTGTAGACGAAGTTCAGCACGCTGTT
+ACGTCTATCCCACC
+>ds2020-328_396
+GGTCGGGATAGACGCTGCGTGCCAGTCGATCCGCCCATTGACGAATAAAACCTTGTTTGA
+ATGATTTGATAGAAAAAGATACGCAATTGTCGGGGTCAAAGTGAGATTAGCTGAGTCGAT
+GATGTCCTTCCACTCTTTGGAGCCCAAAGTAAAGATGGCAAGTTTGAAATCGAGAACACT
+AAGCCATGTCATTTTCCTATTGAACGGACGACTCCATTGCGTCTATCCCGACCGCCGTAA
+TTCAGATCGGAAG
+>ds2020-328_397
+GGTCGGGATAGACGTGGGATAGGCGTATGGATCAAGACGGACGATAAGAGCAGGAGGAAG
+AACCAAGGGACTAACAATGTACACAGCTTAGTCAGGCTGCTCCCATCTGGAAAAAAACAG
+ATGAAAGATTTGACTGATGTGGACGCCAAAGTGTTCGTGCTGACTACTGAAGTTCACTCG
+ACGTACATGCATAAGCTTAGAGAGGAATTCGCAAGCGAACACTCGATATCGGTGATGAGC
+GTCTATCCCGACC
+>ds2020-328_398
+GGTCGGGATAGACGAGGGGTCCATTTGGGTACCTAAAAATAGGAAAATCCATCATCTGTG
+ACATAAGTTTTGTAGCTGACATTTTTACGTAGTTTAAAATAACCTAACCAAGTTTTCTGA
+ATTTTTGGACAGAGATCTCATGATGTGAATCTTGGCCAGCGTGTGGCTCCACTTGAGGCG
+GCTCCATTGCCCCTCACCTTCCACTGCAGTCACAGGTGCATTTTGCGTCTATCCCGACCG
+CCGTAATTCAGAT
+>ds2020-328_399
+TGGTCGGGATAGACGGCCCGTTTCTTCTCCTACGGGTACTGAGATGTTTCACTTCCCCGC
+GTCAACCCCCACACAGACTATGAATTCACCTGCGGGTAACACCACACAACTGGTGCTGGG
+TTTCCCCATTCGGACATCCTCGGATCAACGCTTTGTTGGCAACTCCCCGAGGCATAACGC
+AGCCTCACACGTCCTTCATCGGCTCAGCATGCCAAGGCATCCACCATACGCCCGCAACCC
+GTCTATCCCGACC
+>ds2020-328_400
+GGTCGGGATAGACGGCACGGCTTACTCACAAGTGAATATTATGATGTAATCTTACATGGA
+CCAAATGCTTGGTTATGTAACGATATTCTTGCATTTTTAGATCTGGTAAACTATGTCTTT
+TAGTTCCGGAAATGTGAAACAACAGTTTTTCCCTGGCATCTCGGTCACTTAGTCAGTGCA
+CAGTGTCAGATTTGATATTCAGTAAGTAACGCAGTGAGTGTTTTCTAGGGAGGGCTTGAC
+GTCTATCCCGACC
+>ds2020-328_401
+TGGTCGGGATAGACATTGCGCGTCCCTGATTGTCATGCACTAGCACTCTGTCCAGCGATA
+GTCTGGTCCACTCCACAGCTGCCAGCTGCTCTTGAGTTAAGAAGTGACCAAACGTGTCCC
+TGTAGGCATCTATTACGGCCTTCATAGATTCCACACTGTGTTGACTGTTGAAATCTTCAA
+AGTCTACACAGTACTGAGTTCTGCCTTCTAAAACTGACCTCACTCTGATACGAACGTCTC
+GTCTATCCCGACC
+>ds2020-328_402
+GGTCGGGATAGACGGTTAGATCCCCTCAGGAAGGTGGCCTCACGTCGTCGGCAAGCTCTA
+GAACGGGGAAGGAGACCTGGACGTTAGTAGAGCTCTGCCGACGACGATGGAATGGCTGAC
+TAGACTGCAAGAGGAAGGCATCGACGGCCTCGGGGGAATGGAGACTGACATTCTGTCGGA
+AGTGATTAAAGGGTGCTTATGGGACTCCAATAATCCAAGAAGCGTTGAGTGCGCTTACTC
+GTCTATCCCGACC
+>ds2020-328_403
+GGTCGGGATAGACGCTTTCGGCCCATGCTACGCGGTTACTCATCTAACACGACGTCCGCC
+ACTGGTTAACAAGTCAACTCAGCGACGGTGTTCGTCGTAAGACGCTAGCACTGCGTTTAG
+AACCCATAGGGGTTTCCAAGTACCGCCTTGTCAGAATATTTATTTACAAAGTCTGTTTCT
+GCCATACTTAGGTAGTCATTCTCCATGGTCCTGGTCTCTGGTACTTAGAACAAGTAGGCT
+TTCTCGTGACCT
+>ds2020-328_404
+GGTCGGGATAGACGCAAACTACCACTAATAAAGAGGTGACCGGCTACGAAATACCTTTAC
+TTCACCCTTAGGGCGGAGCTTGAGAACAATTGGCTTCTTGTAAAAGGTAGTTAAACGGGA
+TTAGATTAATCACAAACAAACAAAAAAAAATCCTAGCATCGCGCTATGCGCTAGCACTTG
+TTGGGGAGGAGTGTGTGCCATAGCTTTGTGAGAGGCAGAGAGGCAGAGGGTTGAAGAATA
+GTGGCGGCCGTT
+>ds2020-328_405
+CACCCCCGCCACTACTACAACAGCTGCCAGCGCGTGCTCCACTCTATTGAGCCTGACGTA
+GTCAATGATCCATTCCCAAAGTGTCTCTGCCTTGTCCCAGGGAATTGATTCATAATCCTG
+TGACATAAACTGGGTGCCCCCAACACAGTCGACTAGAACCTGAGCGCAGTCCACGCCAGG
+TATGTTTATGTCGACGTTAAGTTCACTTTGCTTATTTCGGCCAGACAGATGTTCGTATTA
+GTGGCGGCCGTT
+>ds2020-328_406
+GGTCGGGATAGACGTTCCCCTCGGGTGCTTCTACTTTTTTCCATCCTCTTAGAGAGCTAA
+TAGGTAAAGTATGTATCTGTAGTCCAGGAAGTCAGACATGAAGGAGTACTACACCCATTC
+GCAAAGAAGACGGATAATACCTAGTGAGTTCTCATAAATTGCCGTTGGAAGCTACTTGTT
+GGCTTTGACCGAAGAAGACCTTTCTCTACTTAGTTGGGTAGTACCTATAACCGGCTTCCG
+TCTATCCCGACC
+>ds2020-328_407
+GGTCGGGATAGACAACGCTGAGGGGTATTTTGGGTATTTCGGAAGGATACGGGAGGAACC
+TGAAGAAACTCAGAACACGAAAGTTGTTCGTAATGACAAGATACACGCTATGCAACTGAC
+GGTTTGCCATTCGGAGTTCGTATGAAGAAGTTATGCCCAATTATGACTCCTCGTGCATAG
+GTGATGTTCCCTCCTGGCACAAGGCTAAATGCATAAAATGCTATATAGGGGGTGACAGCG
+TCTATCCCGACC
+>ds2020-328_408
+GGTCGGGATAGACGACAACTTACAATGGATGTATTAGCTATTCTTGCAGTGAATGTATCT
+ATGAGGCAGCACAGCTGCGCAAGGTCTTATTAAGGGTTGTTGGTGACTGGTGTACCATTT
+TTCTTCCTTTTTTTGGCTTCAAAACAGATGAACATACATCCTCTCAAAGACAACCAATAG
+ACCAAGATCGAGGATGGAGAAAACGGCAGTACGATGAAATGGCTGAAGGGCGACTCCACG
+TCTATCCCGACC
+>ds2020-328_409
+ACAGAGGTCTTTCTCGAACGTAAAGCTGCCTAAGGTTGTATCAGGCTACGATCTAATGGT
+GCCAGCATTTATGCACACAAACTCACAACTAGACAAACCAATACTGTCAATGCAAATGGC
+CAAATAGATTGGTAGGTTGCATCAAATGCTACTATTCATGAATGTTAAAGACATTCTAAC
+AGCTGCTGAACTAAGCACACATTGAACTTTTGATCGTATTGATAGTAGTAGGTTGATTCG
+TCTATTCCGACC
+>ds2020-328_410
+GGGCGGGATAGACGGCTATTGTGGTTGTTCGTATTTTAAAATGGATTCCCTACTTGAGTT
+TTTGCTACCTTCACATGAAGATGCGATCGAATTGGTTGATGCCAATTCGGTTAAGACTAG
+CTTCAGCTTGCCTGATTCTAGTGGGGATGTTTCCCCACTTTGTAGGTCGTTGTGTCAGTT
+CTTCGGATTTCTTATGATCCGAGATACTGTTGTCAGACCTGACAAATTTTCTGGTTTCGT
+CTATCCCGACC
+>ds2020-328_411
+GGTCGGGATAGACGTCCGCCAGCCATATGTACTGAGATTGTTCGGGAGACATGGTCCAAG
+CCCGGTATGGCATAGGAATAGAAGAGTCATTCTTTAATAACTGTATTTTAATTAAAAAGA
+ACACTACCATGTTAGGTTTGGAGTGCGGTGCATCTTTCTTTCTCCTGTCGTTATTATGTT
+TAAAAAGTCTTGTTCCTCGCCCTCAGATAGATGTTCTTACCAGCAACTGGTGCTATGCGT
+CTATCCCGACC
+>ds2020-328_412
+TGAATTCGGCGGTCGGGATAGACGTATTTGGCTCCTAGTTGCGTAGTCAAATGTACTACA
+CTGAACCGCTTCTGACAAGGCTAGACTGTGTAATATTATCCTATTCGGGGTACTTCTCCA
+GTTATAATAAGTATCCCAAGCAGCACTATTCACTACGAAAGGAACACCAGCCATAGTGGT
+GGACTGACACCCTCTCAAGCTGCACACTTCTGGCATGAGCATTATGTCGTCTTTCGTGTT
+CCAGATCATTG
+>ds2020-328_413
+AACGGCCGCCACTACTCGTCTGATATGGGGCGACTGGAAGGCGAGCTCAACGTGGACATC
+AACATACCTGGAGTAGACTGCGCGCAAGTTCTCGTCGACTGTGTTGGCGGAACACAGTTC
+ATGTCTCAGGACTATGAGTCCATTCCTTGGGACAAGGCTGAGACACTCTGGGAATGGATC
+ATCGACTACGTAAGGCTCAACAGAGTGGCACGTCTATCCCACCCCCGCAGTGTCCGTCTA
+TCCCGACCGCC
+>ds2020-328_414
+GGTCGGGATAGACGAGGCTACGTGGTAAACAGAGTAGCGGGGGTTTTGAAAGACAGATTA
+CCATATTGTCTAGACTTTGAGGATTTCAACAGCCAGCACAGTCTATCAAGTATGCAAGCG
+GTCATAGATGCGTACTATGAAGTATTCGGGCCGAATATGTCGGAAGGGCAGAGACAGGCA
+GTACTTTGGACAAGAGAATCACTGTCTAATAACGTGGTACATGATAATATGGGTACACGT
+CTATCCCGACC
+>ds2020-328_415
+GGTCGGGATAGACGGAACACCCCCCTGTAATTGTACATGCTCCCATAGAAATAACGTATT
+TTGGTTCAGGCATTTGTTCATATAATCTCACTAAAGAAGGAGCCATTTTCATTGTTACTG
+TGCCTGCTGTTAAAATTAGGTCTGCCTGTCTAGGACTAGATCGTGGCACCAGTCCATAAC
+GATCAAAGACGAATCGTGAGCCTATTAATGAACCAAATTCAATGAAGCAACATTTCTCGT
+CTATCCCGACC
+>ds2020-328_416
+GGTCGGGATAGACGAGCGAGGTTGGTGCAGAGGACGAGATTGAGGTGAAGATGGGCTCTG
+AGGATAGAGGCATGGACAGTTTAAGGGGACAAAAGGGTGTGGCTTTGCTTTATCAGTGAT
+ATGCATGTCATGTGCTTGGATTTTGTAATTCTAAGGGGTTTGTGAAATACGATCAATTAG
+GAAGATTGGGGTTGTTGGGGTTTTTGCTTCTGCATCAGACAGACTAGTGCAACGTTTCGT
+CTATCCCGACC
+>ds2020-328_417
+GGTCGGGATAGACGATTCCGCACCCTCTGTTGTCTCTGAAAAATCTCGTCGTACCGTTAG
+TCCCGTCCTGCGCTTGCCCGACGTTGACTATTCCTGTTCTTGGCTTGCTGTTATCTCTTG
+GGGAGCGTCGTGGATTTCCACTTCTGCGTGTTGAAAACCCTGCATGGGTTCGTGGGCTGC
+AATAGCAGGCCTTGTGACTTGCACCTTCTCTACGTGCATGCCCGTAGCAACACGCCCCGT
+CTATCCCGCCC
+>ds2020-328_418
+AGGTCGGGAAAAGCGATTGGCTTTAGGCGGCGCGAGGGACGGAACATCTTCTCGATAACA
+CGAAGAGCTCTTTTGTAGTGGAAATCCCTTGGAACGTCGTGGTAAGGGAGGTCAGTCTTA
+AGGAAGTCTTCTTCTCCGGCGGCGGGGTTAGTTGCAGAACGGCGGTAGCCATTGATTGCT
+TCGTTTGCCAAATCGGGGGGACAGCACTTATAGATTGCCTTCTGACGTCTATCCCGACCG
+CCGTAATTCA
+>ds2020-328_419
+GGTCGGGATAGACGACAGATACCGATCCTCTAAAATGCGTTCACGTCCCATCAATTCGAT
+AAAGCCGTCCAATTTTCGGTGTCACCGACAATTTGAATGGTATAAACATTGGGCGTGATA
+TCAACAATACTTGCAGGGAAGATATCCGCACAGCGCTTGACTTCTTCGCGGTTGCTACAC
+GTGGCGCGTACTTTGATCAGCATGAGTTCGCGCTCAATATGTACACCTCCGATCAGCGTC
+TATCCCGACC
+>ds2020-328_420
+TGAATTACGGCGGTCGGATAGACGCGAACTCCACGTTAGAAGAAAAGGCGTTAGCAAACG
+CTAAGCGAAAGGCCAAACAAAAGGAAGAGGAAAAACTAAAATTGCAGCGTCAGTTAGAAG
+ACGAGCGTTTGCAGGCGTATATGCAGCAGCAACAAGAACGTCAGCGACGACAAGCGGTGG
+AAGCAAGGAGCTTGATGCCGATTTATGGTGAGACCCCAATGACTCGTCTATCCCGACCGC
+CGTAATTCA
+>ds2020-328_421
+GGTCGGGATAGACGGTTCAGCAGCGTGGACTAAAGTAAAGTGGGATATTGAGAGGTTGTC
+TCGCTAGAGCTTGTGCTACCTTTGTTAACGTCAATTGGGAAACAGATAGAATCATAGGGT
+TTGACAACAAACTGCATGAAATATTTTCCTCGGTGGCTGTGTTAGAAAGAAGAGGTGCTT
+CGACTAAATCATGCCAGAAAATCTGGAAAGCTGCTTTCTTGCGATCAGCAAAGAATTATG
+GTTGGGATC
+>ds2020-328_422
+GGTCGGGATTGTTGAGGGGAATGAGGGAAGTGGGTTGGCTGGCAATGGAGGGAGCACCGT
+AGGCAATGTGGATTTTGGCAAAGATGGGATTTGGGGTTGGAAGGTTGGCAATGGGGGCAG
+AGTAGTTGGGAGAGTAGGCAATTGGGTAGACGGCAACGGTGGCAACGTGGCCGGCTTTGG
+CAAAGTTGGAGCAGTTGGAAGCGTAGGCAATGGGGTGGTGTAGTGGCGGCCGTTGCTGTG
+TATTAGATC
+>ds2020-328_423
+GGTCGGGATAGACGATCTTCGCCCCTTGAGTCACGGTACTTTGGTTTAGTCAGGATCACC
+CTGTAAAACTAGCTTAATAGAGGTCGAAATAAAAGAGTTTTGGGGTTCAATCTTCAAGTA
+AGGAGGAGTAAAGAAGAGGAATCGCGAACATACTCAATAGATATCTTTCTTCGACGAGGC
+GGTGCCTATTAAAGAGTTATTATTTCAGGGACGCCACCCTACCACCGATGTCATGCGTCT
+ATCCCGACC
+>ds2020-328_424
+GGTCGGGATAGACGATACAGTCCCCTCACTCACTATGTAGCGCAAGGAAGTGTGCGAGCT
+TGCTAGGAGTGTAATGATTAGCAGCTTTCCCTTTAGGCTGTTAGATGCTAGAGACAGGAA
+GAAAGGAAGAACTTTCCTTCCGCTCATGCTCTTTTCGAGAGAGCGTTCACTTACTATAAG
+AGCAAGGAAGTTATGGAGCTAGGAGTTAAGTAATGTTAAAACAACTGGAACACTCGTCTA
+TCCCGACC
+>ds2020-328_425
+GGTCGGGATAGACGAGGGATCACACTGTTCTACTACGTACCTTTCATATGCATACGATAT
+TTCTTGTACAATAGCTCTCTCATCGTTAATATTAGAAATTATTTCAAACGTTTAGGAGGA
+CCAAATATGATGAGAAGTATTTACATAAATTGTTGAAGGAAAAACTAGGAGACAAACATT
+TGCACGACACATTTACTAACGTTGTAATCCCAACTTTTGATATTAAGCAGCAACGTCTAT
+CCCGACCG
+>ds2020-328_426
+GGTCGGGATAGACGTATGGACACAGTGTCTCGACAGGGCCGCAACGGAACAACGGAAGTT
+CACTGGGTAACTCTAATCTAAGGGGTACGGGGACGTAGGTTCGAATCCTATTTGCGGCTA
+ATACCACCAATGGTGTGCTCAAAAGGTTCTTGTTCGTAGTCCAATGGCAGGTAAATTCTC
+CTTTTTCACTCCCGAGTTGTTTAGATTCAAGCAAAGCCCAAAAAGGAACGTTCCCGTCTA
+TCCCGACC
+>ds2020-328_427
+TGGTCGGGATAGACGCTGAAACCACCTTATATAAGCTCGTCACCAAACTTATAGGCCTAA
+AATCCCTAAGTCTGGCAGATTCTATCTTTTGGGAATCAGGCAGATTAGGGTTTCATTAGT
+TACTGCGTTGATAATTCCGGAGTTATAGAAATCATCCATTACCTTCATGAGATCACCTTT
+AATAGTATCCCAGCAAGATTGGAAGAAGAATAAAGTGAACCCAGGGAGGATGTACGTCTA
+TCCCGACC
+>ds2020-328_428
+GAAGAGCTGTCGGGAGTGGAACAAGTTGTGGGATAGTAGGGGGCAGTGGGGTGCTGCGGG
+AAGCACGCATTCGCAGTACCAGGAGGACATGGCTTACGTCCTCAAGGACGACATAAGGCT
+CAAGAATAAGTTCATTACCATATCGAACATGCCGCGCTTTCCCATGACAAGATTTACAAA
+CAGACCGCAGGAGATACAGGCTTGGGCGTCCACTAAGTACGAATGGGGCGGGGTCGTCTA
+TCCCGACC
+>ds2020-328_429
+GGTCGGGATAGACGGCGAACAAAATGTAAAACATATCAGAGATGTAGTATTTTAAGAAAG
+AGGGGGGAAGGGGAAAGTCAAGGCCAAAGAACAAAGGCCAAATAAGGGCTACACAAGACG
+AAAAACCAGAGGCAGCGCTAAGGCGCGAGGGGGATGTGAAAACAACAACAGTTCCACATG
+AAGGTCCTTGGAATGGAAGAAGGATCGGTAAAGTCGAGAAGCAGTGAGAGGCCACGTCTA
+TCCCGACC
+>ds2020-328_430
+GGTCGGGATAGACGTTGACATTCCGTGAATGCTTTTCTGCATAACAACTTCCAACTGTCC
+TCTTGGCTTCGAAATCGCAGTTCATGGGGAAGGCTTTGGGCATCTGCATGCAGAGCAACA
+TTGTTGTTGCGAGTTGTAAGCAATAATTTATTGCCACTGCCATCACTTGGGAAGGCCTTT
+GCAAGACTGTCAAAAGCGGTGGTACTCCATGTATCATCTAAAACAGCCAAAATGCGTCTA
+TCCCGACC
+>ds2020-328_431
+GGTCGGGATAGACGACTGTGGCCGATACTACTGGAAGGATTCCTCTTTGGATAATAGGTA
+CTGTAGCGGGTATTCTTGTGATCGGTTTAATCGGTATTTTCTTTTATGGTTCCTATTCTG
+GATTAGGTTCATCCCTGTAATAATCGGATGAACTGAGTTGTAGACATGAAAGCATAAGAA
+CTCAACGGGATCCCCCTCGAATCAGACAAGGAAAAAGGGGGGGGGGGTTCATGCGTCTAT
+CCCGACC
+>ds2020-328_432
+GGTCGGGATAGACGTTCCTCAGGTGTCAAATGTGATGCTGTACCTGGTCGTTTAAATCAG
+ATCTCTACTTCGGTACAACGAGAAGGAGTTTACTATGGTCAGTGCAGTGAGATTTGTGGA
+ACTAATCATGCCTTTATGCCTATCGTCGTAGAAGCAGTTCCTAGGAAAGATTATGGTTCT
+CGGGTATCCAATCAATTAATCCCCCAAACGGGGGAAGCTTAAGCGGTGGCATTCGTCTAT
+CCCGACC
+>ds2020-328_433
+GGTCGGGATAGACGACAAAGGCCTGTTCGCATCGCAACTAATAGAAAAAAACAACTACTA
+GACTAGACTAGTAGTTGAGTGCTCCTTGTTGTTCGGATCTTGACCGGGTCCGAGCTTCCC
+CAGCTCTATGCTGTTGGGGAACTCTGCAAGGGTCTTACCACCTTCTTGATTTACTATAAT
+TGAGTCTTTGGAGTACTTTAGGATTATATTCCGCGCCGAGGATTTGTGCTTGACGTCTAT
+CCCGACC
+>ds2020-328_434
+GGTCGGGATAGACGGGATGCTTTTGTTGAAGGGAGGAAGATTAAAGATAATGTCCTTGGA
+ACGGGTCTAAACGAAACTTCCGAGCCCCTATGTTGTAATGGTTGGGGCTGCTAATATAAA
+GACTTTTTTGGGTCATACGACACCTGCAAAACGAAAAAGCCCTAATTTCAGCCCCGAGCG
+GATAGCCCATGAAATACCTGTCACTTTGAGCCCGTGGAGGCATATGCTGCAAAGACAACC
+TCGTACC
+>ds2020-328_435
+ATAGGGCCCTATCTGGCTTTAATAGGGGGGCAGCGCCAGTTGTTTGTTTTCAAGTCAAGC
+CCCGTATCCCTATCTCTTTTTAGGTTGGCATAACAAAGAAAGAGAGTGCCAAGAAACAAC
+ACATACCCCCCCGCTTTTGGAAGGTTCGGGATCGTCAGGGAGCCCCTATAGACGTAAAGA
+CTTGACTTCACTGAACCGGCACTACTATTTGTCGGCTCCTACCACTCGCCTCCGTCTATC
+CCGACCG
+>ds2020-328_436
+GGTCGGGATAGACGTTTGGCAGCGTTATGGCTTTCCCCTCGGAGATTGCATCGGACTGTT
+TCAGCAATCTCTGGAACATCCTGTGACCAATTGAGATCATTTCCTTGTCATTCCGCTTGC
+GAATGCCATAGAAAATCTTATAGTCATTGGAGTTGCCAGGGTTGCACCTCTCCTCGATTT
+CATTGGGGCCATATTCTGAAATTGGGACGGCGTCGACAAACACCCCGTTCTTGCGTCTAT
+CCCGACC
+>ds2020-328_437
+GGTCGGGATAGACGCCGTGTACCGCTGGTCGGGATAGACGATACGAACTAGGGATGGGAT
+CCCGCCAAAGAGAGTCGAGAGCCTCTATTCCATGCTTTCGCCAAGCTAGTCTGCGAGTTG
+TCCGCCTAACTCACGACAGTTGGTACATTAGTGAAAGATGCAGTTCGCTTACCTATTCGT
+TTTAGATATTTTAGCTTTAGCTAGAATCAACCCCCAATATTAGCACCCAATGCCGTCTAT
+CCCGACC
+>ds2020-328_438
+GGTCGGGATAGACGGACAACGGCATTAAAAGAAGAGAAGGCCAGTCCTTGAGCCAGAGGT
+CATAGTGATCCTGTCCTTTCAATAGTTAAAGGCACACAAGAGAATCGCTTGGGAAAGAAG
+GGCTAAATAGCGCCAGAGGGAGCTGCTAGAGAATCAGCCCCCACTCTCTTTCATTTCCTC
+CCTCTCTAGTTAGCGCGTAGTGGGAATAGCCCTTCATCGACCCGGGTCAAGAGCGTCTAT
+CCCGACC
+>ds2020-328_439
+GGTCGGGATAGACGGGGGTGCAGTATGTCTATCCCGACCAGCGCGAGTACACGTCTATCC
+CGACCAGTATAAGCAAACGTCTTCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGAC
+CTAGTAATTGGAACCGTGCCGTGACCTAGTTTTACTGCTCGTGCCGGGACCTAGTGACTA
+ATGGGGCCTAGTCGTCAGGGGGTTAATGACTAGGTCCACGGAGGGGAAAGCGGACTAGGT
+CCACGGC
+>ds2020-328_440
+GGTCGGGATAGACGATATACGCCGCTAACCCTAGCACTGCTCAAACATACTGATATAAAG
+CATATCCGCCATGTGATTGGCTCACACCAAGACCCTGATATCATTGCGTCATTGCCGCGT
+TGGTTATTGCATACCCAAGCCAATATCGTCATCTCAAGGTTGTGGGAGCGTATTTTACCG
+CATCTTAACTCCGCGTTTACTACTGACCGTCTGCAAGAAGGGGGGGAATCGTCCGTCTAT
+CCCGACC
+>ds2020-328_441
+GGTCGGGATAGACGTGCCCAGCTACTTCAAGAGTTAGATCCTTTGGCAGACATACGTCAC
+TTCTACCACTAGCAGTTTACAAACATAACACCGAAACTAGCTATGTAATTGCGAAACCAG
+AAATATCAATAGTCAAACTGGGTCAGAGAAACGTAAGAGTGAATCATGCACAACTAGTGC
+ATGGTAAGAAAAAAGATGTTATGTTTCATGTAGTTGGCAGTGCCGTCTATCCCGACCGCC
+GTAATTC
+>ds2020-328_442
+GGTCGGGATAGACGAGTCAGGGCTCTCAAAACCAAGTCAGTTAAAGACAAGATGGATTTG
+CAACCGCCAAAGGCCAAAGGAGGGCAGAGCCCCCCTCATACTCGACCTTGGCAACAAGCC
+TTAGCCGACAGGGGCTGATTCCTGCTCTGCAAAGTCTTTTGAGTGTTCATCCGGTTCTGC
+TGATTCCTGCTCTCCCAAGTCTTCTGAGCCTCGAATTCATAACCTGCATGTCACGTCTAT
+CCCGACC
+>ds2020-328_443
+GGTCGGGATAGACGTTGCAGCATGGTAAAATAACTGATCCTTCCGGGCAAGTACACACAT
+TGTATTATGGTGGTACTGCAGGGGGTGGAATTGAACATTTTGGGGGTACATTCACATTAA
+ATTGTGGAACTCATTATTATTACGGAGATGCCAACCATAACACGAAGGCGCCTTATGACT
+GTTAATACTGATGTCACCCAGCACTCACTGTATGAGTATAAATGGCAGCCGGCGTCTATC
+CCTACA
+>ds2020-328_444
+GGGTCAATCCAGAGAGGGTGATTGTGCTTCTTGAGTTGTTTGTTTTGGTTCTCTCATTTA
+ATTTTCAATTTTCTTTCTTCCTCAATTTATGTAGTTGTTGGGTTTTTAAGATATGTATGA
+GAGATATATATATATATATTGTTTGTGGTGAGAAGAATGAAATGAAGAAGGAAAGAGGGA
+AAGAGGGAAGAACAGTTAGGGTTGGGGTTTGGGGGAAAAAAGACAGGGATGACGTCTATC
+CCGACC
+>ds2020-328_445
+GGTCGGGATAGACGTAAGTGGCTTTTCCCAAGTCGACCTGACCGTGAAGTTCGTGGTAGT
+CGATGTATCGTTGTACTACATTTGATATTCTTGCAAACTTCGGGTAGTAGTTTGTTCTCC
+CCCCAGCCAGTGTTGGCCAGTGCGATCGCTTTCGGTTGGCAGGAACTATCTTGTACATTG
+CTGTTGATGCAAGCCTATATTTCATGGGTCTAGGCTTGTGATTCGCCTGTATCGTCTATC
+CCGACC
+>ds2020-328_446
+GGTCGGGATAGAGATAAGGGTTCTGGCTTGAATACCACGACTTGATCATGACCATAGTCG
+GCTTGGTGGTCGAAATCTCTGAGGGTTTGGAGGTTTTGAGGTGGGTAGAGAAAAGGGTTG
+GCGTTGATGTCGTGAATGGAGGTGGGATTTATGGGGAAATTAATGGAGGAGGGCTGTGGA
+TCCAAGTAATTGAGATGGTTGCGGAAGGTGGAGGCTGAGGAAGAGGAAGAATACTAGGTC
+CACGGC
+>ds2020-328_447
+GGTCGGGATAGACGCCGAGCCTGCTTTCGTGCCTTCTCTCTCTCTCTTCTTCTGCGTAGA
+AGCATCAGTTTGATCATTCAGTTCTGCACTTTTTGCCTTTCTTGCAGGGACTCTTCCTTT
+GGTCGTCTCCTTGAGATAGTTTGCCCTCTCCTTTCAGTCGAGCTACTTCGTTACCCTCTC
+CTCTCCTCTCTTGTGTCGATTGTTCTGCTAGCTCCTCTTTGTACCGCCATCAGCAAGGAA
+TCGGGT
+>ds2020-328_448
+GGTCGGATAGACGGATATGTTCCTTGGTCGGGATAGACGACCAGGCGTTGTTTTCGTCTA
+TCCCGACCGCCGGACAGAGAGCCGTGGACCTAGTCTGACTTCCCTTGCCATGGACCTAGT
+CTTCATTCTCCTGCCGTGGACCTAGTCTGTTTATACCTGCCGTGGACCTAGTCATCACCT
+CCCTGCCGTGGACCTAGTGCTAAGTCGGGTGCCGTGGACCAAATCTATTCCCACTAGGTC
+CACGGC
+>ds2020-328_449
+GGTCGGGATAGACGTGTGGAACTCAACGTGCCCACCGCAAGCTTCAACTGCTCCTGTTAG
+TGTATAAATCAGAAGGATAGGTAAACCGAGAACTTTGATGCAGAGGCAACCTGGCACTGT
+TGACGAGCCGTAGTTTACTACGATAGCGGTGGGAATTGAAGCCCACTGTAATCTCCCAAC
+ATCTAGGCCCATCAGGGTAAAGTGTGAGAATGAAATTCAAAATGCCCCACTTCGTCTATC
+CCGACC
+>ds2020-328_450
+GGTCGGGATAGACGTAGATGAACGGTATCTGGGGAATAAGCATCGGCTAACTCTGTGCCA
+GCAGCCGCGGTAATACAGAGGATGCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCT
+GTAGGTGGCTTTTTAAGTCCGCCGTCAAATCCCAGGGCTCAACCCTGGACAGGCGGTGGA
+AACTACCAAGCTGGAGTACGGTAGGGGGCGTCTATCCCGACCGCCGTAATTCAGATCGGA
+GGGCA
+>ds2020-328_451
+GGTCGGGATAGACGCGCCCACAATATCAAGCCTACAAAGAAGGCCTCGTGCATGTCACCC
+TTTTTGTGTAAATCCTTAATAACGTTAAACATGAACCCTGCCTTACTAATAATTGTTTGG
+AAATCAATAGCCGCTAATTCCCTCACAGTAATGTGTCTCAGGTGACTGGCAGACACCTTC
+AGCACGGGTAGGTCAACCACCCCTGAAAAAATATTCTCAATAAATTTCACGCTGGCCAAG
+CTTGG
+>ds2020-328_452
+GGTCGGGATAGACGGCCATTCCGTTTTTTTTTAATCCAATTGTTGACGAGGAAGAAGCAG
+ATAGAGCAAAGGTCTCCTCTTTCCGTCCGCTCTTCCCGAAGTGAGCGAATTGCATGTAGA
+GATCCGTAGGGGCTTATAGTTTAATTGGTTGAAACGTACCGCTCATAACGGTTATATTGT
+AGGTTCGAGCCCTACTAAGCCTACCACCCCCTTCTCTGCACCCGACCCCGTCGTCTATCC
+CGACC
+>ds2020-328_453
+GGTCGGGATAGACGAATTCGTGCGGTCTTTCTATTTTGAGGCAATGTTGTAAGCATCTTG
+TTCAGATGGACTGCTCATTGTTATGTACGTTGGATTTCGGAGTCCAACATGGATTGGTTC
+GAGCGTGGACCGTGGTTCCTTTCCATCTATGATAATCTCTGTAGGCATTCCTGGTTACTC
+CCGTTTAGCGTGGATACTGGGTTCATTGGTAGGTGAGTACCCAGGATGACCCGTCTATCC
+CGACC
+>ds2020-328_454
+GGTCGGGATAGACGGATAGGCCCAATTATCGTCTATCCCGACCGCCGTAATTCATACCAT
+GACGTATCTGTAATAGTAATCATGAGTAAAACAAAAATACTTGTACAAACTGGCAAAGTA
+ACCCCATCCCCAACGGTCCAAAGATTCAAATCTTTGTAATATTCTGAACCATTCATAAAC
+ATCACAGCAAATACGATTAAAACATTTATAGCTCCCACGAGAGGGGTCGCATAGTGGCGG
+CCGTT
+>ds2020-328_455
+GGTCGGGATAGACGAGCTCTCCGCATATCCAATAAAAACAAAGCGTGCTGCTTCAACGAG
+CTCTCCTTCTGATGGTGGTGGATCAATAACTGAGTTTAATGTAGTTCTTCCCTCCGGAAA
+CTTGGTTTTAAGCTATTTTTCGCTCCCAGAGCTAGTTGAAGAAGACTCACTACCCTACTT
+CACTGATAAGAGTGGAGTCCCAAGCCACGCAAGAGACGGATTCATAGTCAACGTCTATCC
+CGACC
+>ds2020-328_456
+GGTCGGGATAGACGTTGTGGGTGGATAAAAGTTGTGCATTTTAAAGGGTAGTTTTGAGGA
+ATGTGCGATTTTATATTATATAGGAAAACTGTTTGAATTATTACTTTAAGCTAGAAAAGG
+AGATTTCCTACATCCCAAGCTGCTAATTCTTAAAACAATTCAATTATTACGGTAGTAAAG
+TAAGAAATTTGTTATCCTTCTGTCCTTAAAACCACATTTTAAATTAAATTATTGGTAGCA
+GTTTA
+>ds2020-328_457
+GGTCGGGATAGACGGTCTAATGAGGTGGTGGAGGAAAGTCGAAGGCTTAACAAGTCTGGG
+ATGTTGTTCAAAATTGATTTTGAGAAAGCCTATGATCATGTGGAATGGAGATTTGTTGAT
+GAGGTTATGATTAGGAAGGGTTTTGGGGAAAGGTGGAGAAGATGGATTTGTGGATGCCTC
+AAGACGGCTAATTTTTCTGTGATGATTAATGGAAGACCAAGGGAGGTGGGCGTCTATCCC
+GACC
+>ds2020-328_458
+GGTCGGGATAGACGGAAGGTAGCATTGATAGGCAGAAGGATTTGGTGACGGTGAAGGGCT
+CAATGGACATGAAGGAATTGGCTGAGACTTTGAAGGAGAAGCTCAAGAGGCCTGTTGACA
+TTGTGCCGCCAAAGAAGGAGAAGGAGAAGGAGAAAGCCGAAAACAACGGCGGCGGCGGTG
+GCGGTGGAGATAAGAAGAAAAAGGAGGAAGAGGGGCATATAGTGGCGGCCGTTGCTGTGT
+ATTA
+>ds2020-328_459
+GGTCGGGATAGACGAGGCCGTCACCTATGGTTTTTGTCTCACTGTACGGGACCAGTCTAC
+AAATATGGAGATGTACAAGCATTGGGAAAATAAGAATCCTTGGTCGATAGAGAGCCGTTA
+GCTAGCAGCCGAAGACGAAGGAACAGACCAGTAAGTGTGGAGATGAGCCTGCTAGACGCA
+GAGCTGGATCTGCTATATGCGGTAGTTCTTCCTTCCGAAACGCCTTACCTCGTCTATCCC
+GACC
+>ds2020-328_460
+GGTCGGGATAGACGTGGTAATGGTATGGTTGTGTGGAAAGACTTGAGGAAAGAACTACGT
+GTGGCTTGATCCCTCAAAAAGGGTACGCAGGCAGCCTGAAGTTACTAGGCGCGGCCGCGG
+ATTAGGCACCACTTAAGTGGTTTTGTTGATGGGTTCGGACCTCGTGGTTGGTTCCGAAAT
+TTGGTTGAATTTGAGGTTCGCTAGGTGAGTTGAGTGTAAGTGTGGTTCACCGTCTATCCC
+GACC
+>ds2020-328_461
+GGTCGGGATAGACGGAAGGAGGTCGTGTAATAGGAAGGTAAGGTGTAAGCCTCGAAAGCC
+TTTGGTACTTCGGTAGGGCGAGCAGCCCTTAAACCAAAAAGGTTTGGAACCCTTCCCCTA
+TTTCTGCATTTCATTCTCTAGCCTCAAACAAAATTAGAAAAAAGGAGAGGCCTTCGCATT
+CCTAATCCGGTGGGGGGCCGGACGGCTTTGTTTGCCCCAGCTTGGCGAATCGTCTATCCC
+GACC
+>ds2020-328_462
+GGTCGGGATAGACGGGAGCAATATATGGGGTGGATTTAACTTCGGCAACAGTAGCACACT
+TTGCCATGTTTAATTGTGAAGAAGCCTTGAAGCATAGGTTCCCGGTAGGTGAAGATGCGG
+AAGCCGGGCGTGTGCATAAGCGGCTAAAAGCTATGTTAGAAGGATGTGACTCGTACTGCT
+ATGATTTCGATGATTTCAACGCTCAGCACTCGACGTCGAGTATGGTCGCTGTGATAAAGG
+CGTA
+>ds2020-328_463
+GGTCGGGATAGACGATTGCCGTTGCTGAAAATGACGGGCATCAATTGGTTGGGGGATAAG
+AGCTTTGGTACCACAATTCTGGAAGATGACGAAGGATGTGGGCACCACCTCAGGTCACAG
+TTTCAACACGTTGATCCAATCTATTTGTACCTTGATGGTGGGCTATGCCGCACTCTTCGA
+CCTGGTTCCTGATGAAGACTGGGATCGGCTCTGGCAGGAGGCGTAGCTCGCGTCTATCCC
+GACC
+>ds2020-328_464
+GCCGTGGACCTAGTGGTGTCCCTGTTGCCGTGGACCTAGTGTAATGGAGCCTGCCGTGGA
+CCTAGCAACTCACTAGGATAGGCGGTATTATTGAACCAAACAAAGCAACAAGCAATAAAA
+CCAAAAACAGATAAAGCAGCTAAACTATAAGACAGGTAAGCCTCTCCATACCATACAAGT
+GCACGGCGAGCCCATGCAAAAGGTTTGGTTAAGATATGCCAGATTCCACCAAGTATACAA
+ATGG
+>ds2020-328_465
+GGTCGGGATAGACGTCGACCCCGCTTCTTCCACTTCTCTTTCTTGTGGTAGTCGTTCTCT
+TCCTTGTGGTAGTCGAATGAGGAAGTATGTTGCGGCAACTAAAGAGTTATCGAGACTGAC
+CGCAATTGCAGTAAGAGTTTGACTTTCTTTCAGTTATGTAAAGTTGTTTAGTACGAGATC
+GCTTCACACCTCGCGGTGCTTACACCTCTCCCCACTCAATAGACTCCATAACTAGGTCCA
+CGGC
+>ds2020-328_466
+ACTGCTGCAGAAGCGGAATCGAAGGGGTTGGTTGAAAGGTAAGGATAGCGTGATTGGCCG
+ATTGGTTGGAAGGTAAGGATAGCATGATTGACTGGTTGCGGGTCCTTTGGATCATGGGCC
+ACAGCTACTTGGGTAGAGACCGCTGAACATCATTTGGACAGGCCGAGGCTATATGTGCTT
+AGGCCTTTTGATGGCTGTCATTTTCTGGGCTATTTGGAAGGGTTAATGTCGTCTATCCCG
+ACC
+>ds2020-328_467
+GGTCGGGATAGACGGTCAGTCCCCCTTTGAAATCAAGCACCTCTAACCTCAGCTTGTTCC
+CCGTTATTATACCTACCATTTCGGCTCTAGTTACGGAGTTGCCATTACGTGTGACATAAG
+CCGCATATTCCGTATACTTGTCGCATATGCCTTTCAATTTCTCGGCTTCTTCATCCACTT
+CTTTATTGAACATCACATCTTCTAAACCACTACACTCACGTGGCTCCGTCGTCTATCCCG
+ACC
+>ds2020-328_468
+GGGCGGGATAGACGAAGGAGATGCATTTCTGGTACTGGTGATACTGGACAAGCTCTCAGG
+GAATAATCTCTTTCTTATTTCTGCCTTTCTTTCCCATGACGACTAGGAACGGGCAAATCA
+AAAATTTCACTTTGAATTCCGGACCTCAACATCCTGCTGCTCATGGTGTTTCACGATCGG
+TATTGGAAATGAACGGAGAAGTGGTGGAACGTGCGGAACCACGCCGGACGTCTATCCCGA
+CCA
+>ds2020-328_469
+GGTCGGGATAGACGAAGAATGGCTCTTACCTAGCTATTGCCCTGATCCTATTCGATCGTA
+TAGAACGCTACTATAGACCCTAGCTATTCCGCCCTATCAAAGCCCAGAGCAAAGAAGGAT
+GGAGGGACAACAACCCCTGAGGGAAAGGCAGAAGCATAAGCACTGACACGAGATGTCCTT
+ATCATCACTCTTTCTCGATCGAAGGCTTTAGCATTCCAATCTCCGCGGCCGTCTATCCCG
+ACC
+>ds2020-328_470
+GGCGGAAGACGAAGCGGGAGGAGATTCTTCATCACCAGATGAATGGAGTGCTTCGGGGGC
+ACTTCTTCCCAAGTCGGAAGACGATTGAGTCAGACCGGGCTCACTTTTCTAGTTAGTTCT
+AGACAAAGACTTCAGTGAAGGAACGGAGCTTTGTTGAAGCTATTACTCAGACTCTTTTTC
+GTACTATTGGCAGTGGAAGAAAGATCTTAGAATAAGTATCCGATTCAGACGTCTATCCCG
+ACC
+>ds2020-328_471
+GCCGTGGACCTAGTATTCGACCCCCTAGCCATAACAGTGCTCTACCCCCGACGGTGATAC
+GAGAGGCACTACCTAAATAGTTTTCGGAGAGAACCAGCTATTTCCAAGTTTGTTTAGCCT
+TTCACCCCTACCCACAGCTCATCCCCTAATTTTTCAACATTAGTGGGTTCGGTCCTCCAG
+TGCGTGTTACCGCACCTTCAACCTGGCCATGGGTAGATCACTTGGTTTCGGGTCTACACC
+CAG
+>ds2020-328_472
+TTCGTATCGATAGTTTTTATTTGTGACAACTTTCGTCACTAATAAAACCTACTTCAACTG
+AAGGGTGATAAATCAGCCGTACTCTTTCCCAATCCATGCTATCTATGGCGTGTAGAAATA
+CACCAGCTGTAACCGACCAATACCTACAAATGCATCTCAAGTAATTTGAGTTATTTTATT
+AGGCGGGGACAGGATTCGAACCTGCAGTCTTCAGGTCATGAGCCATATTCGTCTATCCCG
+ACC
+>ds2020-328_473
+GGTCGGGATAGACGTATGATATGGGTCCGTGCAGCATTTCCACGATATCGTTATGATCAA
+TTAATGGGACTTGGCCGGAAAGTGTTCTTGCCTCTATCATTAGCTCGGGTAGTCCCCGTT
+TCTGGTGTTTCAGTCACCTTTCAATGGCTCCCTTAATTATGCGCGAGGAATTTTCCTCTG
+GAAGCGGGCTAGTCCCCGAAAATGCGCGTTAAAGTTGGGGCTAAAAGATGGACAGAAAAA
+CGT
+>ds2020-328_474
+GGTCGGGATAGACGCGTGAGGACTCTTTCTCCGCCGGGTCAATCCTAATATGGGTGAGGG
+GGAAATCGAACTCTGTTATTCATTGCCGCAGAGACGCAAATTGGAGATTTCATCCCCTCC
+GCTCTAATCGGAACCCTTTTTGCGATACGTAATGCGTGAATTGGAACCTTTCTTTCGGAA
+CGGGATACGCTAGAACCAGTTGCTGGTAAGAACATCTATCTGAGGGCGACGTCTATCCCG
+ACC
+>ds2020-328_475
+GGTCGGGATAGACGATTTCTGAGAGTAGACCACAAACGAGGCTCAAAAGGACAGTATCTG
+GCGAGGGCAACGTCAACATTGGTACACTCACGAATAGAGTCTAAGCCGTCAAGTGACATA
+AGAGACCTAGTTGAATCACTAGAGTTCAGGTTTGATGACTGCTTATCTAGAGGGATGGAT
+AGCAGCGTGATAGTAGCGCTACGTCAGACATATTATAAGAGACCTGACACGTCTATCCCG
+ACC
+>ds2020-328_476
+GGTCGGGATAGACGATGAGTGGCCATCTATGGTACTGACGTGTCAAGTTACATCATGTCG
+CAGTTCGCATTCTACAACTGTGAGGAAGTACTGCCGGCTCAATTCCCAGTGGGGCCTGAT
+GCGAACGACAGAAACGTTACGGCAAAAGTGCAAGGAGTGTTGGAAGGGAAGGAAGCTTTC
+TGCCTCGACTACGAAGACTTCAACAGTCAGCACTCAGATGAGGCAAAGGCGTCTATCCCG
+ACC
+>ds2020-328_477
+GGTCGGGATAGACGTTGTTGGGTAGTGTGGAAAGGATTTTTGATAAAACGATATACTATA
+TTTCACACAATACAACAACTACCAACACATTACTAACATATTTTACACGCACATTTCACA
+GCATGCCGCTCACCAGTGAACAGAAGCTGGCATCTCGCCAAGCCAGAAAGCACCACCAAC
+ACGGTCTGGTAGAGCTGGCAGCGTATAAGCCCTCCCTCTCGTCTATCCCGACCGCCGTAA
+TTC
+>ds2020-328_478
+GGTCGGGATAGACGGCAGGTCGTGGTTATTTTCTAGCTAACTATAGCTTACATCCCTGCT
+CGGGAACCGCGGTAGTTGCCTATCCGGGAAAAGCACGTTATGACGTCTTGCTAACTCATC
+ACCATTAATCACCCCTCGCTGGTAGTCTCGTTGGGCACAGTCAAGCATAGTTTTCGCTGA
+CGCCAAATTGGGCACTAATTCGTGGTCACGCTCTAATATGCCATCGAATCGTCTATCCCG
+ACC
+>ds2020-328_479
+TGAATTACGGCGGTCGGGATAGACGGCGTCGGACGGTGGTTCGTGGATGATAGTGTGAAT
+GTCAAGGTTGTCAGGGATAACGATGCGTTTTTGTCGTTTAGGATGAGTCGGCTTTTTGGA
+TTGAATGTCTGTGCTATCGTTGTGTGTGTTAATCGGTTTGCTAGCAGGCAGTTTGGCTCG
+CTCGTCATCGCTAAGCTTGGCTAAGAAGTTATCATGAGGGGAATCTATCGTCTATCCCGA
+CC
+>ds2020-328_480
+GGTCGGGATAGACGTCGCAGCTCCTTGGTCGGGATAGACGTGAAGGTAAGGTAACGCTGT
+GATTCCTGCTCAAAAAGCAGACCGAACGCGTTCGAGTTATTGGCTCGTCCAACACGGCTG
+CATTCATGAATCGCTCGTTCAACTGTCCCTCGGAGACACGGTCGAGAAGTACCATGTACG
+GTTGCCCCCCGTCCTTTCTTTATCTCGGTCCCACCCAGCAGCTGCGTCTATCCGACCGCC
+GT
+>ds2020-328_481
+GGTCGGGATAGACGAGTAGAAGGGGTAAGACTGGCTCTCGTGGTATAAATCGTTCTACGA
+TTAGAAGAGCGGGGTATGCTTGGGAGTTATCTCTTGCTTTTAGGCTAACCAAGCGAAAGG
+TGGTTATTGGAGCGTAGGTGTTAAATGTAGCCGTCTCCCTACATTGATCACAGCTATCTG
+CCGGCGCAGGCAGGGGTATTCTACTTGACACTCTTCATTAGGATCTTACGTCTATCCCGA
+CC
+>ds2020-328_482
+TTATGATACGAACACTAAGCCAAACATTTATATGGATTCCTAAAAAATGAAATAATAGAC
+TATCATGTCATAATATATGACAGAAGCATCACTCTGTCTGTTGGATGCCCTTCTTCACTG
+CAAACATTTATGTGTTGCCCTTTCTTTAGATTGAAGATCGAACTGACAACCATCATCCTA
+TCTTATTCCTATTTTTACTTTACAGGCACAAGAAGGAGTACTATTATACGTCTATCCCGA
+CC
+>ds2020-328_483
+GGTCGGGATAGACGGAATTAACCCATGTAATGGCACAATCGAAGGCTCTAGCCGTGGCCG
+TTGCACGGATAACGAGAGGGAAGGGGCGGCACGACGCATCTGTAGAAGATTTCATCTTCT
+ACATAGCCTCAAACGGGCGTGCCGTCTCCGCTTCGGATATACCATCCGGAGTCCATAGCT
+TGGCTTGCGGTCCTCGTGACCATGTGGAACCCTCTGAGCGTTTACCAGCGTCTATCCCGA
+CC
+>ds2020-328_484
+GGTCGGGATAGACGATATATCTGCCTGGTCGGGATAGACGTGGACATCCCTTGGTCGGGA
+TAGACGCAAACGGTCTATGTCGTCTATCCCGGAATCCACAGCAACGGCCGCCACTATCTC
+CCTTGCATAGTATTTGTTGCGCAGCGAAGCTGCTAGCCACATAGGCATTCCTCTTGACAC
+TGAGTCATCTAACCGCGACTCAAGCGCTTCCAGGAGGTCCCGCATGTCGCTAGAAGGCTT
+CG
+>ds2020-328_485
+GGTCGGGATAGACGTGAGGGCGGCTATTTTAGGTAGTGTTATAAATGCACTGGCTAAACC
+TATTGATGGTCGGGGCGAAATTTCATCTTCTGAATCTCGATTAATTGAATCTCCTGCTCC
+TGGTATTATTTCGAGACGTTCCGTATACGAGCCTCTTCAAACCGGACTTATTGCTATTGA
+TTCTATGAGCCCTATAGGGCGTGGTCAGCAAGAATTAATTATTGGGTCCCGTCTTCCCGA
+CC
+>ds2020-328_486
+GGTCGGGATAGACGTTTTTGTGCCATGCGTTGCCTCGTGCCGCGTTTTAGGAACGTCAAG
+TTTTATTCTTTACGTGTTTTTTTGGGTTTATTTATTTTATAGTGTTTTTAATACCACTTT
+CACAAGTGAGTTTTTAGTTTTATCGCATCGTGCGATGCCGCTGTCAGCTCACAGCTGATC
+GATGTCCCGTAGTCTCTAGACCTACAGACCCATGCTACGCGGTGTACTCGTCTATCCCGA
+CC
+>ds2020-328_487
+GGTCGGGATAGACGATGCCAAGTAATATATCATCAGATGCAATATCGGGTCTAGCAGAAG
+ACCTAAAATGGAGAGTGGAGCCTGGGAGTGTGAGTGAAAGAGAGGTCAACATTGAAGATA
+GCAGATGGCTAATATTAGCAGCAATGGCACCAAAAGCAAACTTTGACGTAGAACAATTAA
+AGTTGCTTTGTAAGCACTTTAATGTACCTATAGACATGCGAACGGTGCGTCTATCCCGAC
+C
+>ds2020-328_488
+ACGGCGGTCGGGATAGACGTCATGTGGTCCTCCTATTCAACTACTTCAACCATTTTCGAA
+CACCTCATAGCATTTTCCGAACGTTCGAGGCTTCTATCATTTATGTATTATTTGATTTCT
+CGTACACTGTCCCTTCTTTTGAATGGGTTTCGAATAGAAAAATAATTTATTGGTCTGTAA
+CCCGACCTAGTTTAATCCATGGACTCAATTCGGTTATACCGGAACCACGTCTATCCCGAC
+C
+>ds2020-328_489
+TGAATTACGGCGGTCGGGATAGACGTAGTCAAGTAATTAAGTGCATGTGGTGGATGCCTT
+GGCAGTCAGAGGCGATGAAAGACGTGATAGCCTGCGAAAAGCTCCGGGGAGGCGGCAAAT
+ATCCTTTGATCCGGAGATTTCTGAATGGGGGAACCCACCTACTTTAAGGTAGGTATTGCA
+ACATGAATACATAGTGTTGCAAGGCGAACGAGGGGAAGTGAAACATCTCAGTACCCTTAG
+G
+>ds2020-328_490
+TGCCGAAGCGATTTATAAAGCACAGGCTGAAACAGGTGAAATCAAAGGGCATTACTTGAA
+CGCTACTGCAGGTACAGTAGACGAGATGATGAAAAGAGCTGCATTTGCCAGAGAATTGGG
+GGTTTCTAGTGGCGGCCGTTGCTGACGGCGGTCGGGATAGACGAGAATACCGGGTGTCGG
+GATAGACGAAGAAGCGCCCTGGTGGGATAGACGATACCCATCACGAGCGTCTATCCCGAC
+C
+>ds2020-328_491
+TGTATATACCTGCCATGTGCTCGTGGCTGTGCCTACTATTGAAGTCGGGATAGACGTAGG
+AGCTGAATACCGACGACACTCTGCATTTATCACTTCGCATCATCATCATCTCAAAGAACT
+TTTTATTATTCAAGTTGATGTCTATACTTGGGTGGTTCAGATGTTTCTCCACTGGTGCCA
+TGATCCAATTTGAGTAAATATAATGCCAGATTGATACGCCACCTACCCGTCTATCCCGAC
+C
+>ds2020-328_492
+GGTCGGGATAGACGTCATGTGAGACTCGCTGCCCACAGTGCCACGCCCGTGAGGAATGAA
+TTAGTTGCCTCCTTGGTTATTGACAGCGCCAGAGATACACTGTCTGAATTAACGCCTAAG
+ATGTCAACTACTTCCTTAAACGAAAAGTGGACGTGGTGCGACGCCGTTATCTTAGTGTGT
+TTGGCTGAAATTGCTTCGTGTAACAGCCAACCTTTACTTAGCTTTCCCGTCTATCCCGAC
+C
+>ds2020-328_493
+GCCGTGGACCTAGTGAATTTGGCTCTGCCGTGGACCTAGTGTTGGCACATCTGCCGTGGA
+CCTAGTGTGTCTACGCCTGCCGTGGACCTAGTTTTAACAGGCTTGCCGTGGACCTAGTAA
+CACTTAACCTGCCGTGGACCAAGTGGTACAAAACTAGGTCCACGGAGAATTACGGCGGTC
+GGGATAGACGGATCGGGGGGGGTCGGGATAGACGTTATCTATTTTGCGCGTCTATCCGAC
+C
+>ds2020-328_494
+GGTCGGGATAGACGGATGGTGCCCCTATACCCAAATTTGACGATCGATTTGCACGTCAGA
+ACCGCTGCGAGCCTCCACCAGAGTTTCCTCTGGCTTCACCCTATTCAGGCATAGTTCACC
+ATCTTTCGGGTCCCAACAGCTATGCTCTTACTCAAATCCATCCGAAGACATCAGGATCGG
+TCGATGATGCACCTTGCGGTTCTCACCTCCGTTCACTTTCATTACGCGTCTATCCCGACC
+>ds2020-328_495
+CCCCAGGTCCTCTGACTGACGTCGTAATAGACTGCAGACTTGTTGCCTGGCATCGGGGCT
+ACATACGCTTTCACTAAATTGCCGTACGCACAGACATTTATATCACCTTCAAAAACGCCG
+TTCACCATTCCCATAAACAAATGAGTACTATCCTCGACTGCTACTAACTTTAACTCGTTC
+ACAGTTCTGCCTGACGCTCTTAATACTACGATTGATGCCGGCATATCGTCTATCCCGACC
+>ds2020-328_496
+GGTCGGGATAGACGATGGAGAAAGCCCTCGTCGCGAAAAAAAAGATGTTCGGATAACTCT
+TGGAGATTTACTTCTGCGGGTAGGTTCACGTTCCCATCCGGAGTAGTATCTCTATAGACT
+CTAAAAATTATTGAGAGTTGTTCCACTATTTTTTCTTTAATAACATTCATGGTTACATCA
+GTAACCTTTGTTTCTATATTCATACTATCCATTAGATGGAGCATGGCCGTCTATCCGACC
+>ds2020-328_497
+TGAATTACGGCGGTCGGGATAGACGACACCACCCCCTTGGAAAGGTGTGGTTGGCCTGGC
+TAAGGGCCTTAGGAAGACCAAATCTGCATACCCGCTTGTGGTGGCCGTCCTGCCTGATGT
+TCCTGAGGAGCACCTCCAGATTCTTGAATCTCAAGGATGCATTGTGCGCCAGATTGAGCC
+TGTCTACCCTACTGAAAACCAAACCCAATTTGCCATGGCCTCTTCGTGTCTATCCCGACC
+>ds2020-328_498
+AACTGCCTCCACTATTTTTCGTAGCTATTCTTTTATTATTTTCATTTTAGTGAGTTTAAA
+GTTATTTTCTAAGTTAGATGTAAGGCTTAAGGAGGTTAATTTTTTAATTTATTTAGTGGC
+TCCTATTTTTATGCTTTTGCTTTCTATTTTTTTATGGTTTATTTTCCCTTTTGGTGGTTT
+TCTCTATTATTCTAGCTATTCTTTTATTATTTTCATTTTAGTGAGATAGTGGCGGCCGTT
+>ds2020-328_499
+GGTCGGGATAGACGGGCAGGTCATATGGAAGCGGCATATCTAGTTGGACTACTTGGCATG
+TGCGGAATTGGTCAGTCAAAAGAGGATGCATTAGAATTCTTGTGTTCTTTGAATCAACGT
+AACAACATTGATATGAAAGGAACCAGGGATGCTTTGAGACGAAGATTACGCGGAATTTTC
+TCTGTTGGAAGACATATCGTAGATATGTTCGACCATGGGAGGGTGCCGTCTATCCCGACC
+>ds2020-328_500
+AACGGCCGCCACTATTGTAATCTTCTATTTGAAGTGTTGGTTTGCAGAGAATGCTTTATG
+TATTGTGAGTTGTGATCACTAGTAATCGATGAATTTCATTCCACAAAGAGCCTCCTTCTT
+GTTTCTTGTTCCCTTCATCTAGTTTGGTTTTCTTTAACACAATCCCTCAAGACACTGAAT
+GAGAAGCCCTTTGACTGGTTTGGGCGCCAAGGGAATGGAAGCGACGTAGTGGCGGCCGTT
+>ds2020-328_501
+GGTCGGGATAGACGACGTCCGTAGCTTTGAGGTCGTAGTAGTTGGAAGATGAATTACAGT
+CGTCGAACACTACCTGATGGTGAGGATGATGATTTTGAGTTTGTGGAGGAGGCGGGCTCA
+GTGATTTGCTCATCTGTTGATCTCGGAAATCGATGGAGGTGATGGTGGAGGACTCGGCCG
+GAGCTAAGAACGAGTCGTCGCCGAGTTGGACTTGTTGCTGCTGATTAGGAAGCGGTACA
+>ds2020-328_502
+TGAATTACGGCGGTCGGGATAGACGTAAGGTGTCGGTTGTGGTTGGGGTCATGTCAGGTA
+TGGGGAATGCTGGTGGTGGTAGCAGTGGCAGCTGTAGAGGCAGCGCTATTGGTTCCGGTA
+GTGGTTGGTTTTAGTGTTGAAGGTGGCAGTTATGGTGGTGGTGGGGCCCTTTGGGGGTGG
+TCACAACAGCATGTAGGTGGAAGGGTTGTGACCAACTCCCCAGGGCGTCTATCCCGACC
+>ds2020-328_503
+GGTCGGGATAGACGACGAGTGCTATTTAGTGGGAGTTGTTGGTGAAGTGCACTAGCCAAA
+AGATGAGTTTTTAATTACAAGTGCTATTGGCATAAACCATATTCAATTCAAATATTCCCC
+TTCCATTCTCCCTATAAATAGCACTCCAATTCTAAACACAAGGGCATTCACAATTCATCT
+CATTCACTTCATCCTTCCACAAACACTCCATTCATCCACCTGTACCGTCTATCCCGACC
+>ds2020-328_504
+AGTGGGTAGAGACGAGTGTGGGCTGTGCGTGTTGTGCGCTTGTTTGACACTTTAAGATAA
+TATGTTAGTCTTGTGTGCGATAGGATGTCCTGTGCCCGAGACGCACAAGGTATACTGGTT
+TCTGAAAGGCCTAGGCCCAAACTAACAGACTTTCGTCATCACCATCATGGCAAAACATCT
+GATACCCTCTCTCAAGGAGATTATTCCCCAATTTCCGAGTAACACTTCTTCAGTCCTAC
+>ds2020-328_505
+AGTGGACGATGTGGGTGTGTTAGAACAAGATTGCTCTGCCGTTGCGCAATAGAATTCTTT
+CTCCGATATGTACCTTCCATCCGGGAGTACCTGTTTATCAGTGATCTCTTGGAAACCAAC
+ATAGTCCAGTGTACCAAATAGTGGTCGGATCCTAGATTTAAAAGAGTCATTCTCCCTGAT
+CGAGCGGGAGTAAGAAGAAGAAGGAGCACTTTCATCTTCCGGGCTTACACGACGAGACC
+>ds2020-328_506
+GGTCTAGATAGACGCTTATGACTGATTTATTTAATGATGCTGTTCTGGGAAACAGGGGGA
+AGGCTGTTAGCCTATCTCAATCTGGTTCCACAGTCTACCATCTTTGCTTTGCTGATGACT
+TGCTTCTATTTGCTAATGCTAGTACCAGGATCATGAAGGATTGTTTGGATAAATTTTGTC
+TTGCCTCTGGCCGCTTTGAGAAGTCAATGATCTACTGCTCCCCTAATGTGGACTCGGTT
+>ds2020-328_507
+CGGTCGGGATAGACGGTTACACACCCAGAGCGGCTTCATGCTAAGACTGATCGGTAGTCT
+GAGCTGCTGGAAAGAGAGTAGTCTGACCAGTATGGCTAACGCGTTAAAGAAATCAGTGCG
+AGCAGCGAAGCTTCTGCAGAACAATACAGCGTTAGATCTTCTGCCGATATTCGAGGCGGA
+GGTGTTAATTAACAGGGGAATAGGTGCAGTGGACTGGGGCAAAACGTCTATCCCGACC
+>ds2020-328_508
+TGAATTACGGCGGTCGGGATAGACGCAAATTTCCTCTTCATTAAAACATCATCATACACC
+GTCCACAAATCTTTATTTAGATCCGTTCTCTTTCGACCTCTCGCGCCACACCTCATCTGC
+AACATGAAAGATAATAAATCTCTCATGCACTCTAGGGGAGTAAGGCACATCTTCTTATAT
+TTTCCTACAATTTCTTCAACTTCAGTCAACAAAAGAGACCCCGGCGTCTATCCCGACC
+>ds2020-328_509
+GAATTACGGCGGTCGGGATAGACGATTCGTGGGTCTAGACGATGGACACTCTACGGTCCT
+GCGGTGAGGGGCTTCGTATTGTGGAAGGTCCAATGATTTCGAAATTATTTCTATATAATT
+CTCAATTTGAATATTATTGAAGCTAGTAAAACGTGAAAACCTAGCAGGATAGATACTAAG
+ACTGGTTAGTGAACAAGTTTAGTTTCTTTTTCAGGGCTGCGTCTCGTCTATCCCGACC
+>ds2020-328_510
+GGTCGGGATAGACGTCCATTCCCCCTCGTTACACCAGGTCGGTATCTACCAGACATCTTC
+ATCATTTCATTCAACATATTTTCATCGATAGACCCGTATTCGTTGATTGTCTTTGCATTG
+AAACCATCGAAGCTGGCAGTATCATTTACAACTTTTACATCGAGTCTCCCGAAAGGTGAC
+ATTACGTTAGAAAACAACGCTCCACGTCTTTCATGTTCTCTATGCGTCTATCCCGGCC
+>ds2020-328_511
+GAACAACTGATCTGTTATTGTTTGTGATAATATGGAGGAAGCTCAATGGTGTGCTAGAGC
+GGGAAAGATAACGATGGATGGATCTGGTGATTTGCTTCTGTATTCCTGGAAACAAAAGTC
+TGGGAAATAATTCGAGGAAGGTGGTGAGTTACGCGGGATGGATTGCAATATTTGGGTTGC
+CGGTCCCTAAATGTCCCGACCCGACTCCCCTAGCACCCACTGTCCGTCTATCCCGACC
+>ds2020-328_512
+GGTCGGGATAGACGAGTAGGGGCCATCAAGGAGAAGAACGCCAGGGAAACCATCAAACTT
+TGGCAACGCAGTTGAGATTGAATGGACGTTAATGTCATCGGTTGCCGGGATACGTTTGAC
+TCCACGTGCGTTGATGGGAATGAGCTGATCGGCTGTGGCGTCAAACTGCATTGGTGGGCC
+GATATCAATTGTCGCTGGCTGGGGGAGTTTCGTGGTACTTATGACGCCGCGGCTGGTT
+>ds2020-328_513
+GGTCGGGATAGACGCCAGACACATCCATTTGCATCAGGGACACCCAATCCACCTTGACTT
+TCCAGCCCACGAATAACCTCACGCGGCAGATCTAGCCATTCTTCGTCTATTTTGACCCGG
+CACCAGTGGCTCAGAGCACCTATAACACATCCGCGCGCTATATCTTGATCGAAGCCTCTG
+CGCTCTAGTTTGTGCATTTGATCTCGGATACCAGCAACTCAGATCGTCTATCCCGACC
+>ds2020-328_514
+GGTCGGGATAGACGACCTTCCCCCTTGCTCTCACGTTCGAGTGTTTGCTCGTCGTTTAGG
+CCGGTGAGTGAGATTTCTGCTCATTGCAGTCACCTCCGGGGTTCTTCGCACCTGGATAGT
+ACCAGGACCCTTGTGCCCCGGCCCTTGATCAGATAAAGCTGCCCGCCCTATGACCCACAA
+CTAAAAATGAGCCTTGCGACGAGACGCGGGCAATCCACATGCTGCGTCTATCCCGACC
+>ds2020-328_515
+GGTCGGGATAGACGGATTTCTCCAATGTCTTTATTGGTTGGTAAACCCAACTCGAAATTT
+CCGTCTTCCTGAATTGGGAGAAAGCAGAAGTCTCTCTCTTTTTTGGGGGGAGCAGAGCTA
+GCTATTGAACAAAAAGCCCTTTGCAATGAACAACAGGAATTCCTTGATACTTTATGGGGA
+TCCCACATCCGCTGATCTACGATTTATGCATAGTGACCCGTTTCGTCTATCCCGACC
+>ds2020-328_516
+GGTCGGGATAGACGATCGCCCTTGGTTGGTGACACATGGAGGAGAGCTAACTAAAATAAA
+ATGCGACATGGAGGACGTGGTAAGGCTGCACGAGATGACTGCGAAGACAGCGGCGTCGAA
+ATTCAAAGGATGGAGAATCAGCATGGGAGTTGATGAACTAGAGATGATGAGAAAAACAGC
+TTTGATGGTCCACAACATACTAGAAATGTTCCCCAGAATGGCGAGGAATGAGAGAGA
+>ds2020-328_517
+GGTCGGGATAGACGGGAGATAACTCTCTTCAATTATTCCTGGGATGGGAGGGAGTAGGTC
+TTGCTTCATATTTGTTAATTCATTTCTGGTTTACACGACTTCAGGCAGATAAAGCAGCTA
+CAAAAGCTATGCTTGTCAATCGAGTAGGTGATTTTGGATTAGCTCCTGGGATTTCGGGCC
+GTTTTACCCTCTTTCAAACAGTAGACTTTTCAGCCATTTCTCTCGTCTATCCCGACC
+>ds2020-328_518
+GGTCGGGATAGACGGCTTCTCTACTTGCTTTGTAGTCTGGTACTACGACTTTGTACCACT
+CTTCGTTCACTTCTGGAACCTTGTCTTTCAATTTCCAAACCATGTTATCTACATCGGGCA
+CTCCTAGCCCGTTGTCTTCAACGCGCCCATGTATTATTGTCTGAGGCAAGTTAAGCCATT
+TTTCGCCATCTTTTACTCTGCACCAGTGACTTATGCACTGTAGCGTCTATCCCCACC
+>ds2020-328_519
+TGAATTACGGCGGTCGGGATAGACGAAGAGATACTGTCTGGCATAGGACACTTCCGTGTC
+GGTAACTATTCGGTACCTGTGACTGAAATATGTGGCGGTGGGGTCCGTGCTCTGTATTTA
+GATGTCATGTATCCTGTGCCCTTGCTGCCCCCCCTCGTGAAACAACGTATTGCGGCCATG
+TACTCCATGGTGGCCTCTTACGACTACGGGGGCGTCGACGGCACGTCTATCCCGATC
+>ds2020-328_520
+GGTCGGGATAGACGTGGACACGTATTTCACCTCTGACTATGAAATACGAATGCCCCCGAC
+AGTCCCTATTAATCATTACTCCGGTCCCGAAGGCCAACACAATAGGACCAGACTCCTATC
+ACGTTATTCCATGCTAATGTATTCAGAGCATAAGCTTGCTTTGAGCACTCTAATTTTTTC
+AAAGTAACAGCGCCGGAACCGCGACCCAGCCAATTAAGACCAGTAGTGGCGGCCGTT
+>ds2020-328_521
+GGTCGGGATAGACGTACACCGCTGCTATCATCACTATTATCATCAGCCGTTACCACTACT
+TTGAGTCCCGAGTCTTCGCCTTTGTTCTTGCGGGTATTGGCAAACCGTGTTTCGAGAATG
+CGCATGCTTCGACGCTTCGGGATCACGGGAACTTCCTTACCCTTGCCTTTATTTTGGGAA
+GTACCTGTAAAATAAAATAAAATGTATACTTACTGTAACACCCCGTCTATCCCGACC
+>ds2020-328_522
+GGTCGGGATTGACGGCAGAAGTTGCTCTCCTTCATGAACACGAGCGAGCTTAGAGAATCC
+CCTCAAAATGTGATCCTCCGAGACATCGTGCACGATCCCGGCGTCTACGAGTTGTGGGAA
+CCTTCTAAAAATACCAGAAGGCGACATAACTTGGCAGGAGAGTTTGTTCTCTCGGAAGGT
+TTGAGCGAAATCGCCCGTTATGGTGGATACCAGAGTAAGACCTCGTCTATCCCGACC
+>ds2020-328_523
+GGCGGTCGGATAGACGTCTCCTCCATGTGGCACCAACCAAGGGAGATTGTCCTTTATTTT
+CTTTATTGATTTGGGTCCCAGCTTGCTCACTCTCTTTATTGTGGCCATTGCTGCGAAGAA
+TGCTACAACGCAGTACACCACCACATCTCCGAAGGCCCCGTACATGTACGTGAAACTCAA
+AGCTTTCGACGCCAGTAAGCTAGCCTGGCTTACTTGTTCGACACGTCTATCCCGACC
+>ds2020-328_524
+GTCGGGATAGACGCAAGAGATCGCTCTTCTCTAGACATGAATCAGGCGAGTCCGAATGCC
+TTTCTCTTTTGTCAGCGGCTCCTACCACATTTCATAGAAAGCCTATATCTTATATTATAG
+CGCGTACAAGAACTAGTGGTGGGCAATCTTCTCTGCGCTCTTTGATCTACCATAGATCCT
+TAGTGGTGGACCGATCTCAAGCCCTATCGTAAAAGACACACCTCGTCTATCCCGACC
+>ds2020-328_525
+GGTCGGGATAGACGAAGAGAGAGAGAGAGAGAGAGAGAGAGAGAGCAGAACAACAACGAT
+AGACTCAGCGAAACAAGACGCTGAATCATATTGAATTGGATTTATAGAGATAAGGTGATT
+CCGATTCCAATTCCGATTCCGAGTCTGGTTCAGTTTTTCTCTCTTCTAAGAGAAAGAGAG
+AGAGAGAAAAGAGGGGAAGCTCAAAAGAGAGAAAGTAAGTATTTAGTGGCGGCCGTT
+>ds2020-328_526
+GGTCGGGATAGACGCCTCCTCTTTGCGATGATAAATGACCTACTTAACTCAGTGGTTAGA
+GTATTGCTTTCATCCGGCGAGAGTCATTGGTTCAAATCCAATAGTAGGTAAAACTTATTA
+GATACCAGTAGATACCAGAGTCAATTGTATCTAATAAGTTTTTCTACTTATCTTTTTTAT
+ATTAGTTTTTTATCTTTTTCGTCCTACCTTCAGGGGGTATTGTCGTCTATCCCGACC
+>ds2020-328_527
+GGTCGGGATAGACGGCTGTTAGTTCTTTCCGCGAAATCTCTAGCGTTTCTCTCCCCAATA
+ACCCCTTTGGGAATTTCCCCTACGTATGGAGCCATCGTCGCTTTCGCTTCGCTGCCATTT
+CATTATGAACTTGTCCGGGTACACCTCCACAGTCATAGATGAAATGACGGTTAACCGCAG
+CCGCTCGGTCCATATCCGCCTTACGAGTTAACCAATGCCCGACGTCTATCCCGACC
+>ds2020-328_528
+GGTCGGGATAGACGCACCGCCGGCTTGTTGAAGAGGGAAAGATCACTCCTAAATGCAGCC
+GTGATCTTATATACGATACCATCAGACGCGCCTCTCGCAGTCAAAACTCTCCTCGCCAGT
+AGTGGGACCAGCCGGGCCGGAAGCCTCGTTTCCTTCAACTAACTCAAGCGATTCGGTCAG
+TAGGAAAGTCATCTCACTGAACATTGGATTATATACAGGAACCGTCTATCCCGACC
+>ds2020-328_529
+GGTCGGGAGAGACGAATCGCCCCATTCGTATTTAGTCATTGCCTTGGCCCTTAATTGTGG
+GATTCTAGAGTTAAAGTGTTCAAATTCTTTCTTTCCCATTGCACACAAACTAAATATCTT
+ATTGCGTAATGTTGATTCTCTAGCTCTAAATTGGTCATCTTCTTCAAACTGGCTATAGTA
+ACTACCAGCAGGAGCCCACTTCCACCGAGTACTCCAAAAATTCGTCTATCCCGACC
+>ds2020-328_530
+GGTCGGGATAGACGATACTTGTGGTTCGGATGGAAATGATACTGAAACCGCTTCCAAAGA
+CTCAGCGATAGGGTAGGGCGTAGTGACTACTCAGATGAAAGCTTCGGAGGAAGCATGGTG
+TTAAACGAGGTTAGAAGCGGGTTCTTTGCTTCATATTCATTCTCGCCCACTTCGTATTCT
+TTATGGTTGAGTTTGTTCCACCTTCTTATACTGTGGAGCCACCGTCTCTCCCGACC
+>ds2020-328_531
+GGTCGGGATAGACGACTCGCCCCATTCGTATTTGGTTGATGCCCATGCCTGTATTTCTTC
+TGGTCTTGAAAGGAAGTACTCTAATGGTAGCTCTGGCATGTTGGATATCATTATAAATTT
+GTTTTTAAGGTTTCGATCAGTCCTCACTACATGCCGCTCGTCATCGTGATACTGCGAATG
+GACGCTGCCGGCAGCACTCCATTGCCATCTAGACCGCAAGCACGTCTATCCCTCCC
+>ds2020-328_532
+GTTGGGTGTAGCGGGTATCTCGATGTCAAGGCAGGGAATGGAATGTTTTGAGGCTAATAG
+GGCCTTTGGTGCCTTGCGAAGAGAAAGACCTTGAGTCTAAAACCATAGTATGGAAGGGGT
+CCAACGATCTTCTTTGGTTTGGCGCCTAGAGATGGGTTTGGGTGGGTTGTCGTCTATCCC
+GACCAGGACAAGACCCCGTCTATCCCGACCATGTCATTATGCCGTCTATCCCGACC
+>ds2020-328_533
+GGTCGGGATAGACGAACCCGTCCCCTGGTCGGGATAGACGCCGAGTGTGGATGAACGTCT
+ATCGAGAGTCGATCTCAAACCATTTGCACTTCGTGTACATTCTTTATGACGTTTGTCCGG
+GAAGAAATTCCTGGTCTTATATCTAAAAGATTGTCACCTCGTGTTAATGAAGTTTGTAGC
+CGGGGATCCTATTCAGGTTATACCTAATAGACCTCTGAAACATAGTGGCGGCCGTT
+>ds2020-328_534
+GGTCGGGATAGACGACACACTCCGGTGGTCGGGATAGACGCTTCCATCTGGTGGTCGGGA
+TAGACCATGGGTGTGCTCCGTCTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGG
+ACCTAGTCACCGCTGCCCTGCCGTGGACCTAGTGCTTGATCCCTTGCCGTGGACCTAGTC
+TTATCTCTGCTGCCGTGGACCTAGTTGCGCAAGGGGTATCATACTAGGTCCACGGC
+>ds2020-328_535
+GGTCGGGATAGACGCAGGTTCACCCTGACCAAAACATCCAGTAATAAGTCTTATCACCAT
+TAGCGTATACGTCAATTCGCTTCCTGTCGTTGACTTGTACTTCGTATTTGGATTGCCACT
+CGTCTGATATGGGTATTACGTTCATACCCTGCTGATAACAGGTCGCATCGCATTGAGGGT
+CTCCTTGATACATTCTTTGTGCCCTGAAGCAATATCTTTGCCCGTCTATCCCGACC
+>ds2020-328_536
+TGAATTACGGCGGTCGGGATAGACGTAGACAAAAGAGAGATTTTCGTCGTTTGTGGATCA
+CTCGTATAAATGCAGTAATTCGCGAGAATAAAGTATACTTCAGTTATAGCAAATTAATAC
+ACAATCTGTACAAGAGACAGTTGCTTCTTAATCGTAAAATACTTGCACAAATAGCTATAT
+TAAATAAGAGTTGTCTTTATATGATTTCCAATGAGATCACGGCGTCCATCCCGACC
+>ds2020-328_537
+GGTCGGGATAGACGTTAGCACGGGTTGGAGTAGAGATTCAGTTAGGCAGATAGGTGACGA
+TATGATGCAAACGCTCAGGGTATTGCTTGAGACGGCAGTTGTGGGACAAGAGAAGTTGTG
+TAGATTAGTTAAAGGGTACCTTTGGCTTCTAGAATGTATGGAAAGAGGTACTATAGATGT
+TACCGTGGATAGCCAGAATTGTGTAATTTATGGGCCAAATGCGTCTATCCCGACC
+>ds2020-328_538
+GGTCGGGATAGACGGTGTTCTTCCTTTCGTGTTATCTGGCTAGCTGTCCCTCACTCTGGC
+GCTTGGTCTATTAGTTGACCTTTTCAGCCGCTGACTTGCCCTCCTATAGCTTACGCTCAT
+ACGTTGTTCCGTGTTATACTGCGCTTAGTTACCGTTAGTCCTCGGAAATTCTCGCTTTCT
+CGGGGCTCTTGCTACTTGCCTTCTAGTGTACCTCCGGCCTGCGTCTAGCCCGACC
+>ds2020-328_539
+CCGATCTGAATTACGGCGGTCGGGATAGACGAACACTGGGGCTTGGGGCTGCGAAGTTGG
+GGCTTGGCCTATGTCGTATTTGGGTCTCCCCTTAGGAGGGAACCCCAGAGCGATCAAATT
+CTGGGATCCCGTCGTGGAAAAGGTGGAGAATAGATTACAAAAATGGAAGAAAGCATGCTT
+ATCCAAAGGGGGAAGACTAACAATGATTCAGGCAGAAACAACGTCTATCCCGACC
+>ds2020-328_540
+GGTCGGGATAGACGGTCGCTGCACATATCCTTTTTTATTCTCGGTTTTTGATACCCTTGT
+TTGTTTTAATAAAACAGGATTTGGCTCAGGATCGCCCATTTTTAATTCCAGGGTTTCTCT
+GAATTTGAAAGTTCTCACTTGGTAGGTTTCCATACCAAGGCTCAATCCAATATGTAGACG
+CCCCATCGCTGTCGAACGTCTAGCCCGACCAGACTGGTGGCTCGTCATCCCGACC
+>ds2020-328_541
+TGGATTCGGCGGTCGGGATAGACGCAAGGTGGCAATGTGTCTAGTATCAGTTTGTGTTTC
+ACTTGGGGTTGCCCTTGTTGGTTATGTGTCCTTACATTGTAGACTCTTACTGCATTTGGG
+TCTAACAGAGTTATGTCTATTTCGGTCTTGTCTGTCTGAGTGACAGGTTCAAGCCAATTA
+TATCTTAACAGACCAACGCTCGTCTGCCAAGGTGCTTTTCCCGTCTATCCCGACC
+>ds2020-328_542
+GGTCGGGATAGACGAAGTACGGACCTGGTCGGGATAGACGTATATAAGCCCTGGTCGGGA
+TAGACGCATGCATACGGTGGTCGGGATAGACGTCGCATGTATATGGTCGGGATAGAAGGC
+TGCCGGTTACGTCTATCCCGGACAGAGAGCCGTGGACCTAGTACGACATACTTGGTCCAC
+GGCAGAGAGACGATGACTAGGTCCACGGCAGGGAGAACTATACTAGGTCCACGGC
+>ds2020-328_543
+GGTCGGGATAGACGTGTCATACGGCTCCGTCCCGGAATCGGGACCTTTCTTTCAGAACCT
+TTGACCAACGGGTCCTCGAACCAACCTGTCCTCCCCCTCGGTAAGCGGTTTCTTTTCATT
+CATTCATTGATTGATTCAAGGTAGCTGTAGCTTGCTTCCAAGTCCAAGTGCTAGCGGTAG
+AAGCTAGTCGCCAGAAGCGAACTTCCGGGCCGGGAAGGAGCCAAAAAACGTGAGC
+>ds2020-328_544
+GCCGTGGACCTAGTCGTTCACTTACGAGGCCACGGCAGGAGCATCCTCACTAGGTCCACG
+GCAGGGGATGTGGCGCAATTACTAGGTCCACGGCTCTCTGTCCGTGTCGGGATAGACGCA
+CTAGCAGACTGGTCGGGATAGACGTGGGAAAGTACTGGTCGGGATAGACGGTACCCCCCC
+CTTATCGTCTATCCCGACCAGGGAGGTTTATCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_545
+GCCGTGGACCTAGTTTAGATGGCCTGCCGTGGACCTAGTGCTCGCTTCGCTGCCGTGGAC
+CTAGTTAGCAGGCAGGTGACTAGGTTGAATTCGGCGGTCGGGATAGACGGGTTCCGGGGA
+TGCGCATAGCGGGAACAGAACTTGAAGCTTTAGCCAAGTCTGGGGCAACTAACGACTCGC
+ATGAGTCATACATACTAAATAGGTTAATATCGTGGTTTATCGCTAAGATGTATCA
+>ds2020-328_546
+GGTCGGGATAGACGGAGGCTTCTGCTTGTTTATTGTCAAACCAATCCCCCGCCCCCTGAA
+CACACTGTTAATTGTTATGAGAATTATAGTACAACAACCCTTATATGAATGGGTTTTGGT
+CAATTGGCTATGAATGGTTCGATGCAACAGTCCATCAGTGGGTACTATCACTCTATCAAC
+CAAATCCATATCCTTCACTGCCTGCTTTACTTGTTCTGACCGTCTATCCCGACC
+>ds2020-328_547
+CTATTCTGACCACTTACTATGGCTCTTCTCTCATTTGATTTTGGAATCTTATTTAAGCCA
+AGATTAGGCTATCGATTGGAGGAAGAAAGCATGCCTTTGTTGGTCACCATCACCACCATC
+GTTAACATCGGTACACTCCTAAATAAGGCCTACCTCCCTTCCATTCAACCAGAGCAGCGA
+TGAAAACAGAGACTCAATTAGCTAAGCAATGCATCAAACTCGTCTATCCCGACC
+>ds2020-328_548
+GGGTCGGATAGACGGGGTGTAAGTTTAGGAGACGTTCTGTTAATGCGGTAGAGCCGGCAG
+TTCCAGAATATCTAAAATGGTCAGAGGTGCCGATTACTTGGAGCAGGGAGGATCACCCGC
+CCAGAGTTGATAATCCGGGTCATCTGGCACTTGTGGTAGCACCCCAAGTTGGAGGATATG
+CTCTCACTAAGGTTCTGATGGATGGTGGAGGACATCGACTCGTCTATCCCGACC
+>ds2020-328_549
+ATTACGGCGGTCGGGATAGACGTGCATCCTCACTTAAAGTGCTTTACAACCATAAGGCCT
+TCTTCACACACGCGGCATGGCTGGATCAGGCTTTCGCCCATTGTCCAATATTCCCCACTG
+CTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAGTGTGACTGATCATCCTCTCAG
+ACCAGTTACTGATCGTCGCCTTGGTAAGCCCTTACCCCACCAACTAGCTAATCT
+>ds2020-328_550
+GGGCGGGATAGACGAATTCAGAGTGTCTTTCTTTGGAGGCCCCCAATGCCTAACCTAATA
+GGGGATTCCCCATAGATGGATCAAGAAAGTAGGGCTCTTATCTTTCAACGCCTTTCGTGG
+TTTGGGAGGAAATCTCAAGAGTCCGCCCGAAGAGATGAAGGAATGAATGCGTAAAGTCGA
+GAGTACGCCGTCTGGAAGCGGGGCTATTAGGGGCCACGCACGTCTATCCCGACC
+>ds2020-328_551
+GGTCGGGATAGACGCACTCAAGCCCTCAAGTCCGCTGGTGCCATATCCGCGAAGACATGG
+TTACCCCAGTTGGCAGCTGGAGCATTACGCTTGGGCAATTTTATATTGTTTTACAGTGTT
+TTTGTTATTGAATTTTGTCGTATTTGTTTGCCACCCGATCTGCCCGATAACCCAGTAGCG
+GTGGTTCGTCGCCGCGCCTACTTCCAAAACGTCCGCACACCGTCTATCCCGACC
+>ds2020-328_552
+TGATTTAGGCGGTCGGGATAGACGACAAGTATCCCTAGGTCGGGATAGACGCCCATTTAC
+CCTGGTCGGGATAGACGCCTTGAGCCTGTGAATTCGTCTATCCCGACCGCCCGGACAAGA
+GCCGTGGACCTAGTGTCCTCACGCCTGCCGTGGACCTAGTATCTAGTCACCTGCCGTGGA
+CCTAGTGTCTCGCGTCCTGCCGTGGACCAAATCTTGATCAACTAGGTCCACGGC
+>ds2020-328_553
+GGTCGGGATAGACGTATCAGCCACTTAATTCGGCCAGACAGATGTGAGTAGTAGAACTCG
+GCTTGCCCTTTTGACGAAGCAGAATGGTAAAAGACGTATGGCTTTGCGAAGTAGTTTTCT
+TTGTTGCGAAGTTCCAGTCTGTTAGCCTCAATCGTGAGTTCCTCTTCGTCTCTGGGGAAT
+CCGATCTCGATCTTGACGTTTCCCTCAGACTTGTTTCTCGTAGTGGCGGCCGTT
+>ds2020-328_554
+GGTCGGGATAGACGCTTGCAACCCCTAACAATTTCCCTTTCTGATTTCAAGACACTCAAA
+AACTGACAAGATCCGAAAGGTGGATGCTGCCTGCCAAAACTGAAAGAGGGTGAAATATCA
+CTCAATCTGGCCCGCACAACCAAAACACCACCCAGCATCCTCAGACAACTCAAATTCCCC
+AACCCCGCTCCCTCCTCCCCCCCGCCCAACACAACGCGAACCAAAACGGCTGTA
+>ds2020-328_555
+GCCGTGGACCTAGTAGCAATCTGGATAGGTCCACGGCAGAGGTACTTCGACTAGGTCCAC
+CGCACGGGAGTCCGTACTAGGTCCACGGCGGGGGAGTCAAACTAGGTCCACGGCTCTCTG
+TCCGTGAATTACGGCGGTCGGGATAGACGATTGTTATGTATCTAGACGCTTAACCCCAGT
+AAACGTCTATCCCGACCAGGCAGCGCAACCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_556
+TGAATTCGGCGGTCGGATAGACGGGCGAAAATCGTCTATCCCAACCAGGCCGCTGTTCCG
+TCTATCCCGACCAGGGAGCTCGATCGTCTATCCCGACCGCCGTAATCCACGGACAGATAG
+CCGTGGACCTAGTGCGTCGGGTTCTAGGTCCACGGCAGTGAATGCTATACTAGGTCCACG
+GCAAGAGGTACGAAACTAGGTCCACGGCAGCGAATGTGACACTAGGTCCACGGC
+>ds2020-328_557
+GCCGTGGACCTAGTATAATTGGGGGGAGAAGAAAAGAAAGGGATGGGAGGGAGGGAGCCT
+ATCACCGCTTATGGCCCGCTTCCTATTTTTTAATCAATTCCTGGTTCACAGGCGAATAAA
+GCAGCTATCAAGGCTATGCTTGTCAATCTAGTAGGCTCCTTAGTGCTTGCGCTAAGGTAG
+TTTACTTGCTTACTTGTTAAGGAACAAACTCTTCTTTTTACGGCTATCCCGACC
+>ds2020-328_558
+GGTCGGGATAGACGCACTACGCCCCTACATGCGCTGAAAAGCGCATATCCATGATTTGTA
+TATGTTCTGAGCTATAGCTCATGTAAGTTCCTCAGTCCTATTGAGTGGGTTATGGTTTTG
+CATAAATGCATTTGAATCAGTTAAATACCCTCCAAATTTTTCATAGAATTTTTGTTTAAA
+GCAGTAATACAACATGGCCGTTTTTTCAGGCAACAGATTCGTCTATCCCGACC
+>ds2020-328_559
+GGTCGGGATAAACGACACCCATTACTATCATCCCATAATTCCCCTTTTGTTAGTCATCTT
+GTCTAACTCCCTTTCGCCAGTCCCGAATCACCCAATAAAAACCATGTGCACTGGGATCCC
+TGAGACCTGGTACCTGCCAAGAGTTTAGACTCAACTACACAAAAGACTATATCCATTACC
+CTCTTTTCCACTATCATCTCCTCCACCCAACTACTCCAGCGTCTAGCCCGACC
+>ds2020-328_560
+GGTGGGGATACACGAGGGGGGGTTATTCAGAGCGGGCTCAATGGACAACGGGGATGGAAT
+AGCTGTTGGGTGGTTAGGACATCCTATCTTTAGAGATAAAGAGGGGCGCGAACTTTTTGT
+ACGTCGTATGCCTACTTTTTTTGAAACATTTCCGGTTGTTTTGGTAGACGGAGACGGAAT
+TGTTAGAGCCGATGTTCCTTTTAGAAGGGCAGAATCAAAATATAGTGTCGAAC
+>ds2020-328_561
+GGTCGGGATAGACGTGGATTCGCCCTACTAGCTCACTCAATCTGCTGTAATATTCAGGTT
+CCGATGTACATTGAGCAGCCAACTGCCTCCCGATCTTCCGCTCAACCAATGTCCACACCT
+TGCTTTGCTTGAAGTTGTCTCTTTGGCTGTTCGGTCCTTGTTTTTTAACCATTTAGATGT
+ATCGTTTTTTGTTCTCTTTTTTCGCTCGCCCTACAATGGCGTCGATCACGCCC
+>ds2020-328_562
+GGTCGGGATAGACGCCGGGCTGTGGTGTCTTGGTGTGACCAATTGAGGGTGTTGTGCCAT
+GATTCTATTGGTGGGTTTTGGTCACATTGTGGTTGGAATTCAACCCTAGAAGCTGTTTAT
+GCTGGTGTTCCAATTCTCACTTACCCTATATTAGGGGATCAAATGCTCAACGCTGAGAAA
+ATTGTGGAAGATTGGAAGATTGGATACAGGGTGCTGACTCGTCTATCCCGACC
+>ds2020-328_563
+GGTCGGGATAGACGTGTAAAGGGGCTGCTTTCGAGATGCTTTCAACCATTGCGCTGCAAC
+CTAAGCCATCATTTCAAGAGGGGGTGGTATGGCAAGAGACATCGCTTCAAGTCAATTTAG
+CACGTTTTACACCAACGAGAGCCAGAGTTCCCGCTAACTTGGAAGGAGATGCTTACCGCT
+TAGAAAGCGAGTCAACAAATTCAATCAAACAACATAAGACCGTCTTCCCGACC
+>ds2020-328_564
+AGAAACATGAGCTTGTGATATAGCTACACCTAATTCCGGACCGGTTAATGCAAGAACTAT
+AAATAAAGGACCAGGATCTCCTATAAAAAATAAAAGATCATTCATACATAGCATAGTCCA
+AGCGAACCCACTTAAAATCTTTACTGAACTATGACCGGCCATCATATTAGCAAATAAACG
+TATTCCTGAGCTTAATGCGCGAAAACAATGAAGCGCATCGTCTATCCCGACC
+>ds2020-328_565
+GGTCGGGATAGACGGGCGGTTCCTAGTCCGCTTTGGCTCCTGATCTTGAGCTCGCTTTTG
+TTCAATTATAAATAAAAAACCGCTTTGATGGAGATTTGTAGCATCATTCAAGTAAATACA
+GATTAAGATCGTAAAAACATAAGCTTGTAATATAGCCACACCTAATTCCGGACCGGTTAA
+TGCAAGCGCTACGTGCCCTTTTTTAAAAGTGCTACCAGCGTCTATCCCGACC
+>ds2020-328_566
+GGTCGGGATAGACGTCGAGGCTGTATCATGTAACAAAACGATACAAATAGAAGGAATGGA
+AAAAGAGGAAATCGGAGAGATATTCAGGAGCTCACTGGGACCTGAGAACATAGTTAAACC
+GACAGATGGTGATGGCACAGCAGAAGTTAAAGCAGTGCAAAAAGGAAGAAAGAAAGATCA
+GGGACATAAAGAACGGAGTGGTGAAGAGCCTATGGTCAAATTTCAAGATAGT
+>ds2020-328_567
+TGAATTACGGCGGTCGGGATAGACGCATGGTGTGCTTGGTCACCGGTGGAAGTGGCTTGG
+TCACCGGTGGAAGTGGCTTGGTCACCGGTGTAGGTGGCGGTGCATGTATAATAGGAGGCT
+GAGTGCTTGGTGGTTTGCCATAAGGTGAAGATGGTGGTGGCCTCACCACTCTAGGAGGCA
+GAGTTGGTGGTTTGGGTTTGGGCACTATTGGTTAGGGCCGTCTATCCCGACC
+>ds2020-328_568
+AATACACAGCAACGGCCGCCACTACTGTACCTTGTATAGTCCAAGCTCTTCCAAAGTTGA
+TCCATAAAAAGGTAATTTCTCTCCCTCCACCGTGATTTCTAATGGTATTGTCCTGGTTTT
+CTCTGTACTTGGATCTATGAAACCCTCTGCTGGTCCTTCAGGATCACCAGTTTGTACAAC
+AAAACCATCCGCTCTTTGGATTTCCATGCCATCATAAAAGTGTCTATCCACC
+>ds2020-328_569
+GGTCGGGATAGACGGTGATGGCCTTTTCACAAGAGAGATTGGAGAGGAAGAGGAACTTGT
+TCCACGTTCCTAAGAACAGTGGGACAGCAATCAACCGCGCGAAAAGGGATAGGAGCAACA
+TAAAATTGTGGGATGCATCTGAGGGTGGTTCCGTGGTGGAAGGAAAGGACATACGAGTAG
+GTGAATTGTCCGACATATCTAATCTGTTCACCAGCCGATACACTGGTGGTAT
+>ds2020-328_570
+GGTCGGGATAGACGTCTCCATGTGCTGCACGCAGTTAGCCGCTTAAGGCTCATGGATCAT
+AACAACAGTGTTAATCAGGGTGATCCGCAGGAGGGAATGACCAGTGATGTGGTCATGGAA
+ATATTTGAACGGCTCTTCCGCGCAACGGGGGGAGCCGCTTCGCATTGGGACGTTTTGAAG
+GGAGCGTCAAGTCTTAAATTCCTTCGAGAGGCTGGAATCGTCTATCCCGACC
+>ds2020-328_571
+GGTCGGGATAGACGAATCTGGCTATTTATGGGCCAAACCAAGTCTTAAACTCTTATCGTA
+GAGATGGACGAGCATATGTTTTCAATTCCAAACCCGAGTCGGTAGGGCATACGGCACTGT
+TATTCAAAATGTGCGAATCTTATCCTCCAAGAGAATTTAGGTCGCATGTAAGCATACCAT
+CGGACGGGGATGAGATATTTATGGTAGCACAACGTCTATCCCGACCGCCGT
+>ds2020-328_572
+GGTCGGTATAGACGAACACCCCGCCTATTGAGAGCGAACTTAAAGAAGTTGATACTAATC
+AACAAATTAGGCCAAATCCCAAAACGAAATATTTAAATAACGTAGAAATTTAAGGACCAG
+ATATGCATAACTCCTCAAGACATCCGCCAGTCTTATAAAAACCACATGGCTCATAGAATT
+ACAAAACATTAATGCGTCTATCCCGACCGCCGGAATTCGTCTATCCCGACC
+>ds2020-328_573
+GGTCGGGATAGACGCAGGTTTGCTCTGGACTCCACATAAGCAGTTGTCGATATGCCTTTA
+TAGTATGACACATAACCCTGGAATATCTTGCCTAGGTTTTTAAGCACACCGGTATCATTG
+ACTAACTGGAACTGCCTCCTATCCAATTTGGCCATAGCTAGCGCGCACTTACCTAATTCT
+AGATCGTTTACATCATAATGAACCACATCGCCAGTCCCGTCTATCCCGACC
+>ds2020-328_574
+TGCCCTTGTTTCCAGCTTGGGAATGAGAGTGAGTAAGTAATTCCATGCTAGTACCTGTAA
+GCAAGCGTTTTAGGCAAACCTGTATACCCTCTTACCAGGGCTATACATAGGTAGAGAACG
+GCTCCATCTACATCCAGAGAGCTGCCTTTCGCGGTTAGAAAAGGAGGTGAAACTGCTTTT
+CTAACACAGGACAGGATACGGCCCATCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_575
+GGTCGGGATAGACGTACGTCTGGCATGAGTATGGGTGTATTAATGAAATACCACACCATG
+GCGTCCCAAACATTCTTCCACTTTTGCTTCTCAACCTGATCTGTCACAGGTTTTCCATTG
+AAGGAAGAGAAGTTCACGTTCTGTTTCAACACGTCAAACGCGACGCGTATCAACCACGCT
+GGTACTTTCGTATCAAAAGCGGAAAAATCTATGACCACGTCTATCCCGACC
+>ds2020-328_576
+GGTCGGGATAGACGACCCATCCACCTCTGCATCTTTCATATCCTCCAGCACCTCCTCTTT
+CATATCCACCAGCACCTCTTTCATATCCTCCAGCACCTCCTCTTTCATACCCACCAGAAC
+CTCCTCCTCTTTCATACCCACCAGCACCATTTCCCCTTTCATACCCACCAGCACCATTTC
+CCCTTTCATACCCACCACCACCATTCCCTTTTACCGTCTATCCCGACCGCC
+>ds2020-328_577
+GGTCGGGATAGACGGAGTTGCGGCATGGACTTAGAGTGATTTGGTCATTGGACTACGCAG
+TCCAGTTCCAACTCCATTTCAAGCCAATCATGGTTTAGTGGTGTATCTATCTATTAAAAT
+GTTATGAGTTCCGGTGTGCACGATTGGGCTAAGCAATATGAATGCCCCTTACTAAATGCA
+TATTGGAAAATTGCTAAACCTATCCAGCATGACTGAACGTCTATCCCGACC
+>ds2020-328_578
+GGGCGGGATAGACGTTGACTTCTCATCGAGATTGGGTTGGTGCTTAGATCGATTCAAGCG
+GATCGAACTTTATCTTCTATAAGGGGATTGGTTCATATCAATCAGAAGTGCATTCAGTTA
+TCTCTTTTTTCTTTTTCTTCTCGTCAGTTAGCTCTGCCGAATGCCTAAAAGGATTCCATT
+CTTTCTGGCGGATCTAGTTCTTATAAGGCAGAGATGCGTCTATCCCGACC
+>ds2020-328_579
+GGTCGGGATAGACGTTTAACTGGCCTTGTGGTCATATGGATGAAGACATCCCTAACTTCT
+ATCACGGAAATGATTACATTCCACAATCACACGGTGACTACATAGATATATCGCCACTTA
+GCGACAAGGAATCAAGGTTCGTGTTGCTGATGCTTGGTAGGTGGAAAAGGACGACAAGAT
+ACATGTTGGACTTTGATTTACCGAAGTTAGCGACGGCGTCTATCCCGACC
+>ds2020-328_580
+AAGCAAGGCCTCTTTTAGATTGACTGTTGGCAGATCGAGATTGAACAACGAAGTGCTTTC
+ACCTCTTGTAGTAGATCCGTTCATCAAACGAGACTCGGAAAGAGTGGCGTTAAAGAGGAC
+TGGGGCGCCTCTCGAAGTCTCCGATCTCACAGATGGTTAGGCTGCAATTCCTTCGCTTGT
+GAAGAAGCTTGGCTAGTTCTCCTTACTTGGAAATTACGTCTATCCCGACC
+>ds2020-328_581
+GGTCGGGATAGACGAAATGGCTGGTTCTTCTTGATCTTGAGGTCATGGGCTAACTCGACC
+GTAGGGAGAGGGGTTCAAGATGCCCTCGTCTAAGTCTGTCTATTTCGTTCTTTGCTTTAG
+GAGCTCGTAGGTCTCAAGGGTTGTTTTCCAACTCGACCGGAGGACTTGAGATGTCGCTAA
+GGGAACGTCTTCCGGATCGATCGAAGGGGAGGTGATACTAGGTCCACGGC
+>ds2020-328_582
+GGTCGGGATAGACGCACAATCGGAGTTTCCTTAGGCAGCCACCGACCTACAGTTATCCTT
+AAACTTCCGTGCTTGGTGGAGAAGAAGCGAACAAAGGTACGCTCGCTTGCTGTCTTGTTC
+TCTGCCGCGAACTGGGATCGCTCGCCAGCTAGGTCAGATTGGAGCAACTTATTTTTTGAG
+AACATATTACCCATATTCGGGGACAAGGGGCGGACCCGTCTATCCCGACC
+>ds2020-328_583
+GGTCGGGATAGACGAGAGGTCCCCATCGGACGGCAGCCCTTTCGGGGGTTCCTTAGGGAC
+CGATTCACTCTGCGTAGATTGACTGAACGCAGAAAGCCTTCCACTGGCAGGCGATCGTGT
+TTTTCACAGGATTTATCGTTACTCATGTCAGCATTCTCACTTCTGATATCTCCAGGTGTT
+GTCACCAAAAACCTTCCCCGATTGACAGAACTTCCACGTCTATCCCTCCC
+>ds2020-328_584
+GGTCGGGATAGACGACCACTGTGCCTGCCAGACTCGTCATATTATGATAGGGATTATCGA
+TCGATTTATTTGGCTTTAAGTGACAAGGCCCCCTTTCTCCAAAAAAAACAACAAGCAGCC
+TCTTAGGCAATCCCCTCCCCCGAGGTAGCTGCTTGCCGATGGCATTGCGATAGATCGGTG
+GTTGACTTACTGGTTTGTGACTCCCACTGCACTCCCACGTCTATCCGACC
+>ds2020-328_585
+TGAATTCGGCGGTCGGGATAGACGCAGCTGGCCTCTGGTCGGGATAGACGAACCTGCCCC
+CTGGTCGGGATAGACGACCAAGTGCCATCATTCGTCTATTCGGACAGAGAGCCGTGGACC
+TAGTTTTAAACCCCTTTGCAACTAGGCCACGGCCCCCGAACATTACTAGGTCCACGGCAG
+ATGGTTGAGGACTAGGTCCGCGGCAGAGAAGGGCCCACTAGGTCCACGGC
+>ds2020-328_586
+GGTCGGGATAGACGACCCACAGGACTCGAAGTAAGGAGAGAGGGTAAAAAACAATAAGCG
+GTAAGTGAGCCAGCAAACAAAGCCGTAGAAAGTGTTAAACATTCAGAGAGGTTCTATGTG
+TCAATGCATGAAGCCGGCGAGTATGATATGGACATGAGAGATAATAAATACCAGACATCT
+ATACCAACATTCCTTGATGAAAACATGGCTACCTTTCGTCTATCCCGACC
+>ds2020-328_587
+GGTCGGGATAGACGTGGATGTGGGGCAGGAGAGGATAATCGAGTTAGTTACGCCGACGGA
+GAAATCCATGTTGGAAGTAGCTCCACAGATTGTAGTGTACTTAGCAGCATAGTCGCGAAG
+GAGGGTCTGATACCAGTCATTGGCACGGGTAGGGGTGCCAGTCATGTCAGGCATCTTTCC
+AACCATTAGGGTTGAAAGACCAGTAACTGACATTAGCGTCTATCCCGACC
+>ds2020-328_588
+GGTCGGGATAGACGCTACAATCCCCTGGTCGGGATAGACGAACATCATCTCTGGTCGGGA
+TAGACGTTTGAAGGGGTTGTTGACGTCTATCCCGACTCGGACAAGAGCCGTGGACCTAGT
+GATCATCGCCTGCCGTGGACCTAGTAAATCCTTGCCTGCGTGGACCTAGTTCAGTATCGG
+GTATCTACTAGGCCACGGAACGCTAATGAGACTAGGTCCACGGCCTCTGT
+>ds2020-328_589
+GGTCGGGATAGACGTGCTTGTTGGGTGAAGGGATTCAGAAGACCGAGTGAAGCGACTAAA
+GCGACGACCATACATAGAGCTGGAAGCTGCACTAGTGGACGAAGAAGTAACTAAAGCCTG
+AACTGGATGTGGAGACGAAACTGTACAGGAAGAAGAATCGCCCTACTTTATTACATTACG
+GCCTTTCCCTCTTGGAATGAGCATAGCACTATACACCGTCTATCCCGACC
+>ds2020-328_590
+GATCTAATACACAGCAACGGCCGCCACTACTGATCTTCATCGAGGAGGAATGTGGTGGTA
+GTGGAATAGAGAGCAGACCAGGACTTGAAGGGTCGATTGGGGTGTTGGTGAGCTGAGATG
+AAGTAGAGGGTGTCGTTTTTGAGGATGGGGCGGTCGTGGAAGAGGCTTCCGGGTTCGGAG
+TGTAAGAGTTTGGGGGTGGGGAGTTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_591
+GGTCGGGATAGACGCGAGGATGCAATTGGCTAAGGGGTCAGGGTTGTTCTCTCTAGCAAG
+CGTTAAGGATTACAAGAGGGAGGCTAAGCGTATAAGCGTCGAGGCAAAGTCTCTGCAAAA
+CCTGGTTGATGTGGATTTGAGGAAGTTCTTTGAATTGGAAGTGCTGGTAAATAGGGTGGA
+CGGTCTTGTCAATTGGGAAGAGGAGCACAAAACGGCGTCTATCCCGACC
+>ds2020-328_592
+GTGCACAGAATCCGAGCAGTACCTTAGGGGCAGGGTTTACCAGTATGAAATAATGCCGGT
+GGTCACACCAGAGGATATGCAGATACTTCTTGATCTGAAGCGCGTGCAAAATTGGGCGGG
+CTCTGTTTATATCGACCAGAGCATCGAGGAAAATAATGGTGTTATTTTGCGAATGGCAGC
+TGGAGCCGGAATCAATGTCTATGAGGGGCCAACGACGTCTATCCCGACC
+>ds2020-328_593
+GGGCGGGATAGACGATCACCTCCTTTCAGTGGGTGTAGTAACATTATTAATTCGGCCATC
+CCATCCTCTTGGTCAAACACTTTGTCAACGTAAGATATTACTTGTCTTCTTACACACTGT
+GACACTTCTACTGAGCCTCCTCTAGCTATTATTTCGTCAAATCTATTGTTCATTGATCTG
+ATCAATTCCCTATAATCGTTTGCAGGTGCCAGATACGTCTATCCCGACC
+>ds2020-328_594
+GGTCGGGGTAGACGCCAAGAAACACTTTGTCGGCTGAAATCTTATGTTAAACAATTCTGC
+ATTCTTCATTAGTAAATTGACTTGGCTCATAGACTGTACAGCTGCCAGGACGTCATCTCC
+GTTATGTAAACTAACAATAGTCTGGTTGGGTAAGCATTCTGAGATATAAATCTTATTTAA
+TAGAGTATTCATAAATGTAGTTAACCGCCTTCCTCCGTCTATCCCGACC
+>ds2020-328_595
+GGTCGGGATAGACGTTTCGCCAAGGTAATCATCTTTAACCATAAGTGGCCACGTCGAAGA
+TGATTCGTTAGGTGCGTAAGGTCGGGTCGCGTTTTCTAGCGCCATCGGGGTTTTAATTGT
+TAGGTCGTACCCACACAGCCTGCTAGCCCAGGCCCAGTGCCATAACTGATATGGCGTCGC
+TTTCCATCCTAATCTATTGCGTTGTAGCTTAGCTGCGTCTATCCCGACC
+>ds2020-328_596
+GGTCGGGATAGACGCTAGTACCTCTTTGCCCAAGGATTGCGAATATGCTTGACTGAGATT
+CCAAGCAAGCTACCTGGGCCTAAAAGACTGCTTCTTGAGCACATGAATATTCAATTGCTC
+CCGAGCCTTCGAGAAAGCCCATCCTCTTTCAATGCCATCTGACCCATCTGTTCAACCCCC
+ACTTCCGGATATTCTAATTCTGTATTTCCGCCCGACGTCTATCCCGACC
+>ds2020-328_597
+GTTCTGGATAGACGGTAGCTGCTTTATCTGTTTTTGGTTTTATTGTTTGTGGCTTTGTTT
+GTTTCTATAATATTGCCTTTCCTAGTGAGTTTTACGGGCCCACTGGACCAGAAGCTTCTC
+AAGCTCAAGCATTTACTTTTTTGGTTAGAGACCAACGTCTTGGGGCTAACGTAGGATCTG
+CTCAAGGACCTACCGGTTTAGGTAAATATCGAATGCGCCTATCCCGACC
+>ds2020-328_598
+GGTCGGATAGACGGGAGGGGGCGGTGAGGAAGGGTCTTTCGAATCTCGATCAAATAGCAT
+AGCACGGGACCGTGCCAAGCTGTAAGCATAGCGAGTTAGGTATGGGCTTTCTTTTAACTA
+CCAGAATCAGCAGTTGGCCTGTTGTTGATCAAAGTCTGGGTCGGCGGTCCCTAGTTATAG
+ATTGGCTTTCGCCTTCCTTTTTCCGTCCAACGCAACGTCTATCCCGACC
+>ds2020-328_599
+TGAATTACGGCGGTCGGGATAGACGTCTCACGGACCTGATAGACGAGCAGCACCAATACG
+CGTCTATCCCGACCAGCCCAAATACGTCTTGAAATAACTCCGGCTTAATCCCCAAAACAC
+CAAACCCAACACCAAATGGAACTCAAATTCACAAAACTATCCTTACATACGATCTGAAAT
+ACCAATGTGCTTGAATTCTCTGAACCAAAATCACACAAACCACATTTCT
+>ds2020-328_600
+GGTGGGGATAGACGTTTTGGTTCCTTCTAAAGGCCGCGCCCTCTCCCGCCCAATTGATGG
+TTCCCTGCTTGTTGAAGCGGGATACCCTACTGCTCATGCCTTGGCTGAGGATTTTGTTGG
+ACTTTCTAAGAAGTACACTAATTTCTATGCCACGTCCGAGTACGCGTCCCTGGCTGACCT
+GGTTGAACACCTCATCCATGGTTTAGCTCCAACCTCCGTATATCCCGAC
+>ds2020-328_601
+GGTCGGGATAGACGTTGGCGCTTAATTAGCTACCAAAACGCAGAAATTTCTCAAACCTAA
+CACAACCAGCAGCTAGAGCTCAAAGAGTAGATGAATTTACATACCTTATGCGTCCAAATC
+GGTTGAGAAACGAATGAGAACGAATGCTCCAAAGTTCTGTCAAAATCCGGCGAATTTTCT
+GCATTTTCCTGCGAATATCGAGGAGTCCAGTGGGCCGTCTATCCCGACC
+>ds2020-328_602
+TGTCGGGATAGACGCGTAGTTGCATTGACAATATATCTACTTTTCAATCCTTTCTCGTCC
+GGCTTTATAAATGCTTTCAAAACATCAGATTTGATTGTATCTAAACTAACCATCCTCAAA
+ACCTCCGCATCACTCAGCGTAATTGCAGCACCCAACTTTGTTCTCATCTTATCTCCGTCA
+ACCAACAACTTAGAGTGAGAGCTAGCACCCAGAGTCGTCTATCCCGACC
+>ds2020-328_603
+GGTCGGGATAGACGGGGACTCACTCTCTCCAATTTAGTGTCCTTTTTATGTGCCCTGCGT
+AAATGGCTGATAAGTATCCTACTACTTAACCTTAATATAATATTGTTAACTTAATAAAAT
+AAAAAACTGAAAAGCTAAAAATTGAAAAACACAAAAACACTAAATCATAGCAGCCACCAT
+TACCAAGTCCCTCCGCCCAGCCAACGCAAAACCCCCGTCTATCCCGACC
+>ds2020-328_604
+GGTCGGGATAGACGAGGGGAAGGGGTCAGATTTATCCCGACGGGAGCAAGAGTAACAATA
+ATGTTTATAATGCTACAGCAGCAGGTATAGTAAGCAAAATCATACGAAAAGAAAAAGGGG
+GGTACGAAATAACCATAGCGGGTGCATCGGATGGACGTCGAGTGGTTGATATTATCCCTA
+CAGCACCGGAACTTCTTGTTTCAGAGGGCGATTACGTCTATCCCGACC
+>ds2020-328_605
+GGTCGGGATAGACGCTCCTGGGTGCTTTTGGGAGTCCAATAATCCCAGAAGAGCGAAAGG
+CGTGATGTACTTCAGGAACGTCTGGGACTCAGCGAAGGCAAGAGCCCCCGGCGATAATAA
+CAGTCTGAAAAGGTGTTTAAATCATTGCACGCTGGCAGACTTTATAAATGTAGTGATAGA
+CATTTCGGTGGAGAACCTCAGGATCAGGTTACGGCGTCTATCCCGACC
+>ds2020-328_606
+GGTCGGGATAGACGGCCCAACGACCTCATTCTCCTTTTCCTTCATGACAACTTTCTCCTT
+CATGGCAGGAACAGCAGCAGCAACATTCTCCTTCTTAATAAACAGTACAATTATAAAACC
+CCAAGCTATCATAATCTCAATAATCATTTGAATTTATAAACCGAAAGTTTGAGATGAGAT
+AAAATGATGCATACATAAATTCAATAGATATAAGCGTCTATCCCGACC
+>ds2020-328_607
+GGTCGGGATAGACGGTAGCAGCGGGTTGAGCTGTCTCAGGATGCCCTTCAGGAGAGCGAC
+CCACATGGGGGTAGTTCACGGGCCGGCCGCTGAAAGTGATGAGAATTTCACGTTCTCATG
+TGTGATCATAAGCGCTGAAACGATAGTGACCGACTTTGTGAGAGGAGGGCGGCTGGTGAC
+ATATCGAAGAGACAGGACGTGCAAGGCAGTGGCGCGTCTATCCCGACC
+>ds2020-328_608
+GTTTGGACATCTAGCTTGATGCTATCCAGTGCGGAGTTGAGGGCTCCCTGGAATTGGCCT
+TGAAGTTCTTCCACCATAACTTCGAAGCCCCCCTTTGTAAGGACATCCTCCTCGAGTCTT
+TGATCGAACTCGATCACGGCTCTCTCCATCTTAGAAAGCCGATTCTCCATGGTTGCTGCA
+TCTCTAGATCGTTCCCTCTTTGATTTGCCGCCCACGTCTATCCCGACC
+>ds2020-328_609
+GGTCGGATAGACGTCAAAAGTGGCTCAGGTGGTGACTGCATTACTGGTGGTTGGTGTTAC
+GGATTACACTATTGTGAAGGCTGAAACGGCGGACTCCCCTGCTACATTACAATACCTTGC
+TCCTTATACAGGAGCAGCTCTGGCTGAATATTTTATGTATCGTGAACAACACACTTTAAT
+CATTTATGACGATCCCTCCAAACAAGCGCAGTTCCGTCTATCCCGACC
+>ds2020-328_610
+CAACTAGTGCTCCGACTGAAAGGTCGGGGGGTACAACACCGAAAGGCGTGCTAAACCTTA
+AGGTGGCGTTCATCATGGTAGAGCCTAGTCATGGTTAAGAAACCGAGGATTGGAACGGGT
+GGAAATTAGTGGCGGCCGTTGCTGTGTATTAGAATTACGGCGGTCGGGATAGACGTAATA
+GCACCTGGTCGGGATCGACGAGAGGGGGGCTTTCCGTCTATCCCGACC
+>ds2020-328_611
+GGTCGGGATAGACGCCCGGAGCCCAGGTATCATATACACCCCCAAAATAAAGCGCCTTGA
+ATACTAGAAGAAAAGCACCTATACCTAACAAGATTAAGTGAATACCCAAAATTGTAGTCA
+TTTTGTTTCTATCTTTCCAGACATAACCGAAGAATGGAAAAGATTCTTCAAGAGTCTCGG
+GTCCCAGAAGTGCATGATAAATCCCGCCTAGATACGTCTATCCCGACC
+>ds2020-328_612
+GGTCGGGATAGACGGTGCGGTGGGATGGGAGAACTCACTGGCATGAATGCCCCTGCTTCA
+TCGAGTGGGATACGACCCCCGTTTGATCTTAACATGGCTCCGGACCCGGAGCCGGAACCT
+TCCTCTTCACCCGGCCTAAAAAATAGAATTCTCGAGGCGGAGTTAGAAGAGGCCCAGAAA
+GAACTTCGCTTCTGGCAAGAGAAGGGAAGGCGTTCGTCTATCCCGACC
+>ds2020-328_613
+AACCGCCGCCACTACGTTTATCAATTGTTAAAGGCGATAACCCAGCCCACGCAGGACGCC
+CCCCAAGCTGGAAATTCATCATGGTTTCAGATAGGAGCGCACGGCTAATGTCTCCCATCA
+GTGGGGCAGTATGGGAGCCTGGCGCTCTAGTGGCGGCCGTTGCTGTTGATAGACGAACCA
+GCACCATGCGTCTATCCCGACCAGTGAATCTTTTCGTCTATCCCGACC
+>ds2020-328_614
+GGTCGGGATAGACGTCACCTCCCCATCCCGGTTCAGGAATTTTAACCCGATTCCCTTTCG
+AAGTTCGCGCGAGACGCGCTATCAGACGGGCTTCCCCCGTCTCTTAGGATCGACTAACCC
+ATGTGCAAGTGCCGTTCACATGGAACCTTTCCCCTCTTCGGCCTTCAAAGTTCTCATTTG
+AATATTTGCTACTACCACCATAGATCGTCTATCCGACCGCCGTATTC
+>ds2020-328_615
+GGTCGGGATGGACGAAGAAGGGCATTTTAAAAAAGAAAGAGATAGGTTCGTGCGTGCAGC
+CGTATACGAAAGTACGCTTCCTCTTCTTTCGAATGCTAATGTGTGGTTTTGTCCTACTTC
+CAAAGTCACAGAGGGAGCTGGAGCCGATTTTTTGTTTGACTACCCTCAATCGACGGATGG
+TGCTAAAGGAGTTGGGAGAAGAGTCCACAGGCGCGTCTATCCCGACC
+>ds2020-328_616
+GGTCGGGATAGAGGATGGCCGGCTTTGTTTCTCAGAATTAACTCACCCTCTACGCGCCTT
+AGCCATATGAGCTAAATGGGTTGCTCGGAAATCTTGCCTTTCCTTACTCTTAGGGCTTTC
+CTCCCTATCTTCAGGCAGCACACCGCCATCGGTTTCTGAATCAACGCTTACTATAGATCC
+TGACCTTTTCTCCGACGACACACCCACCTTAACCGTCTATCCCGACC
+>ds2020-328_617
+ATCTGCCTGGTTTCGGGTCTATACCCAGCAACTAAACGCCCTATTAAGACTCGATTTCTC
+TACGGCTCCCCTATACGGTTAACCTCGCTACTGAATATAAGTCGCTGACCCATTATACAA
+AAGGTACGCAGTCACACCACGAAGGTGCTACCACTGCTTGTATGCATGCGGTTTCAGGAT
+CTATTTCACTCCCCTCACAGGGGTTCTTTTCGCCTTTCCCTCACGGT
+>ds2020-328_618
+GCCGTGGACCTAGTTTTAACACTCTGCCGTGGACCTAGTATTCTATCTCGTGCCGTGGAC
+CTAGTCATTGAAAACTAGGTTCGGGATAGACGTAAAGGTCGCCTGGTCGGGATAGACGAG
+TTATAGGGGTGGTCGGGATAGACGTTATAACGCCCTGGTCGGGATAGACGCTGTACGCCT
+GGTCGGGATAAACAGGAATCCCCGTCTATCCCGACCGACGTAATTCA
+>ds2020-328_619
+GGTCGGGATAGACGCGTAACTGTCATCGATCTTTTCTTCTTTCTTCAATCGGTCATATCT
+GATCCGTAGCTGGTAGCGACATGAGGAAAAGGTCCAGAATAGTCTATTTTATTTGCTAAA
+TCGCGAGTTTAAGGGGTCGGATGGGTCAAGTATGGCCTCTAAAAACATGCGATAATCGGC
+TTTTTTAGTAGCATCTGTCCTACCCGCCCTGATCGTCTATCCCGACC
+>ds2020-328_620
+GGTCGGGATAGACGCTTGCCACTCCTGGTCGGGATAGACGTTGTTTTTCGCTGGTCGGGA
+TAGACTAGGTGATTGTTACGTCTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGG
+ACCTAGTTATATCGTACCTGCCGTGGACCTAGTTAGCCTGGTTGTGCCGTGGACCTAGTG
+AAGTCAATGCTGCCGTGGACCAACTTAGCCCCCACGAGCGCCACGGC
+>ds2020-328_621
+GAGAGCCGTGGACCTAGTGAGGTTGTTGCTGCGGTGGACCTAGTATCCGAGGGGGTTGAA
+AACTAGGTCCACGGCAGCGGGTTTGAGACTAGGTCCACGGCAGGCAGCAGATCACTAGGT
+CCACGGCTCTCTGTCCGTGGATAGACGACACCCCAATCTGTTCGTCTATCCCGACCAAGG
+GTAATCTCCGTCTATCCCGACCAGGCACATGTTACGTCTATCCGACC
+>ds2020-328_622
+GGTCGGGATAGACGGGACCCTCGAATCTCTGGGATTGGCATGTAATAGAAGGATTGGGAT
+ACTCGAAACAACGCGGCACTGTCATCGGTAAAATAACGTCTAATAGATAGACCTGGAAAT
+CGATGCTTTCTGGCTCCTCACTTCCGGTCGGTGTGCCTCCCCTTTTTGTTTTATTTGATT
+CACAAGCAGGAATTGAACCAGAATCTCCGGTTACGTCTATCCCGACC
+>ds2020-328_623
+GGTCGGGATAGACGGCGCCACCTGCTATCTCGCCTTTCTGATTATTATTATCAAGAACAT
+TGGCTTCTTCCTCATTTATAGCAGCATTAACTCGTTGCACTTCATGGTCATCCAGACTAG
+GCGCAACCGAAAACCTCCCAATCACACGCTGTTCTTGATTTTTTGTTTTGATCTGTTTGT
+GTGACTGGCTTTACACTCTCAGCAGCTTTCAACGTCTATCCCGACC
+>ds2020-328_624
+GGTCGGGATAGACGGTGAAATGTGCATTGGTTTTGTTGCATTTCATGTAACAGGATTGTA
+TGGTCCTGGAATATGGGTGTCCGATCCTTATGGACTAACGGGAAGGGTACAATCCGTAAA
+TCCAGCGTGGGGTGTGGAGGGTTTTGATCCTTTTGTTCCGGGAGGAATAGCCTCTCATCA
+TATTGCAGCAGGGACATAGCATAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_625
+GGTCGGGATAGACGGCCGCCCGCCATACTGAGCGTCTCATGCAGTACACTACCTACAAGA
+CTAGTAGACCTGATGAAGTTCATGAACCGAACTTTTGTGAAAACACATTCCAGGACTGCT
+CCTTGCAAGGTAAGTATGCCATGGCAATCCATTCCACTTCGGATTTACCCTTAGGTGAGC
+TCTGTGAGAGCTTAAGGAAGAAGGGAGTGATTCGTCTATCCCGACC
+>ds2020-328_626
+AGGAATACCTAGTGGTGGACGAAGAACCATTGGCTATAGTTCCTTTGGGGATAGACGTGG
+TTGATGATTATCCACACACAGACCCAATGGTCTGTATACCCTTGAACCTCGACTCCTGCA
+TTGTCCAGCCACACCCCCACCTACAAAGACCCTCTAGCCTCGTTGGAGATGTTGACTACA
+TGGTTCATTGGCAATACCCTAATTCCGCCGTTCGTCTATCCCGACC
+>ds2020-328_627
+GGTCGGGATAGACGCGTGCCCAGCCTCCGTTTCACGGAATAAGTAAAATAACGTTAAAAG
+TAGTGGTATTTCAATTTCGCCGAAGCTCCCACTTATACTACACCTCTCAAGTCATTTCAC
+AAAGTCGGACTAGAGTCAAGCTCAACAGGGTCTTCTTTCCCCGCTGATTCTGCCAAGCCC
+GTTCCCTTGGCTGTGGATTCGCTAGGTAGGTGCTAGGGACAGTGGG
+>ds2020-328_628
+GGTCGGGATAGACGTGTTGGGTCAGCATCTCCGAACCTTGGCGAGGAATCTTTCCTATCT
+GGCTCAAGATCCTCTTAGTCAATCCATTTGAAATGGAACTTCTAGCCACTGGGTCAACGT
+TAACTCCACAAAGATTTTCGAGTTAGCTTCTGCTTACCTGCATTAGAAGTAAAGTCTTGG
+TACCAGTTACATACTTTTCTACCGTACTGATTCGTCTATCCCGACC
+>ds2020-328_629
+GGCGCCCTTTTTGTAAGAATTTGGGCATGAGCGACTTAGTGGTTAGCCGAGCTAGTTACT
+CACTCCATGGCATGATGGGAAAAGCCCCCTTCTGATGGTTGAGCGGGTAAAGCCCTTATG
+AAAAGAGTGAACCGGGCGTAGCGTAGAGGCTGCTAAGAGAGCTTTAAACCTCTATCTTAC
+ACCTGGCAGGAGATGTAAATACTTACTTTCGGGTTATTGGCCTCTG
+>ds2020-328_630
+CTGCCGTGGACCTAGTACTAGCCCAGGTCCGTGGACCTAGTAACCCACATCTTACTAGAG
+CGGGCATACTACTAGGTCCACGGCAAGCGACGAAATACTAGGTCCACGGCAGGGGAAATG
+TAACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGATAGACGTTTTAGATGG
+TTGGCTCGTCTATCCCGACCAGTGTCAGTGGTCGTCTATCCCGACC
+>ds2020-328_631
+GGTCGGGATAGACGCTGCATGTGCCTCTTCAACGCTTAGCTGTCTGTTAACCTCCCGCTC
+AGGGTACCTATCACGGAATAAAGCTGAAGGCGAAGTCGGAATCTCAATGTCAACGCTTTC
+GTAAAGCCTATTGAAATGACGTGTCATGATCAGAATAGGTTCAGGTGCTAGCGAAACTAG
+ATATTGATCGATCTTTGCAAAAATGTAATCTCCGTCTATCCCGACC
+>ds2020-328_632
+GGTCGGGATAGACGGAAATCTGCCCTGATCGTTTTCGGAAAGCGCCTTCTCCTTTTTGGT
+TGGTTTAAGGGGCGAGAGGGGGCGTGGAACTACTACTACGATTCTCATTATTCTCATTTC
+GCTTTCTACTAAAAAGAGGAACACGGAAAAAAAGGTTAAAAAAAAAGTGCAAAGAGGCGA
+TTCATGACTCCAGCATAAAAAACAGCACGATCGTCTATCCCGACC
+>ds2020-328_633
+GGTCGGGATAGACGGTGTTCCGTTTTAAGCATGTAGGCGGAGGTTCCAGGTAAATCCGGT
+ACCTTTTAACGCTGAGGTGTGATGACGAGGCACTACGGTGCTGAAGCAACAAATGCCCTG
+CTTCCAGGAAAAGCCTCTAAGCATCAGGTAACATCAAATCGTACCCCAAACCGACACAGG
+TGGTCAGGTAGAGCATACCAAGGCACCCGGGCGTCTATCCCGACC
+>ds2020-328_634
+GGGCGGGATAGACGTCCCATTACTCTTTCTACTCCTTCAAAATCGTTTAAAGACGCAAAG
+CTCTGCATCCAGATGTTATACGTAAATGTGTCCAGAGGGATGTTCCTCTGCTTCATTTCT
+TGCACTAAAGGAGCCACTTTCTCTGGTTGCTGCTTTCTCATATGCATAGACATGAGATTG
+TTAAAGACCAAAGAAGAGGAGTCTAAGTCGCCGTCTATCCCGACC
+>ds2020-328_635
+GGTAGGGATAGACGCAAAACCTCTATCATTATCGGCGAACCGAGAAAAGAGTCGGCGAAT
+CGTTAACTGCTATGTCAGCGAATCACAAAAAGAAACAAACTAGCTAACAATCATTCTTGG
+CCTAGCCAGGCCCATCTTGTCCTCTTCTAAACTAATCAAAACATCTTCAGGAGGGGTCTC
+TAACTCATGCAAGCCCAGAATCCAGCATACCCGTCTATCCCGACC
+>ds2020-328_636
+CGATCTGAATTACGGCGGTCGGGATAGACGAACTGTGGCGGTCATTAGAGTCAATCGAAG
+AAAGGCTTGACAGGCTGAGAGTAATAAGGAAAGAGGATGGTGGACTAGGATGCGGAAAGG
+CATTGTTTCGTGGTACAATGGAAAAGAGAAACGGGCTATGGACAGGAAAAGGTGACATAA
+AAGTCGACAGGGGGAGCACACATGTACAAAAGCCAAAAGAAATTA
+>ds2020-328_637
+AGGTCGGGATTGAAGACCACTTTCCCTATTTTTTACTCTGAGTTAAGCCCTGTCTTTGTT
+TTGTCTACTTCAATTATTTTGTCTCAACAGAATGGACGTTCAGCAAGCATTTCTTAATAG
+CATAAGAAATGACTTCAATCAGAACTAGTCTCGTTGCACTGTTATGGGGGCATTTCTCAA
+TCGTTATAGTTTTTCTGGATCTCCTTTTGATCGTCGATCCCGACC
+>ds2020-328_638
+GTCGGGATAGACGTACCAGTCAACTTTTTGCAATTTTCTTCATACATCACATGGTATGAC
+TTGGTTTGCCCAAGTCCGCGATGTAGCCGCAGCCGAAGCCTCGTCTTTCGAAGGCTCAGG
+CACCCTGGCTGATTGTCCCCCATTCGGGATAACGTCAAACCAGGTAGTTGTTAACTACTT
+GGCCCCAGCCACACTGCCAACGTCCCCTATTCGTCTATCCCGACC
+>ds2020-328_639
+GGTCGGGATAGACGGCGTGGCCGGGTCTTGCGGCTGATGGGCCATTTGATAAGAGAGGAT
+TGCCTTTTTTTGATGTTCTTTGTAACAAAGCCCGGTAGGGGCGCGTCTGATAATATTGTT
+AAAAGGGCACATCAGCCGCAAGACCCGGCCACTTCGTCTATCAGGAAGAGGAACCGTCTA
+TCCCGACCAGGGGCTCTTCTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_640
+GGTCGGGATAGACGTTATTTGGTCTCGGGGAGACCGCCCATTTATCACATGGGAGGAGAA
+GACTAGTCAAACATTCGAGCTGTAAACTCGCAATATAGACTTGAAAAAAAGAAAGATATT
+GAGACGGAATATGAATGAAGGATTGAAGCATCTGACTGGGCTCCGGAGATGAATACCGAA
+AGAGCTTACCGGATGCACCATCGCACCACAACGTCTATCCCGACC
+>ds2020-328_641
+GGTCGGGATAGACGAAGGACCACCCTCCGCTTGGTAAAGCGACTCATAGGCGGATACCAC
+GTTGTTGTCAAGTGAGGTATAGATGAGCTGAACTTTACCTTGTAGACCACGAGCCGCTTG
+GGGAATATCGGTAGTGCGCTGTGCAGGTGCTGCAACGATGCTAATGCCCATAGGTTTAAA
+TTTTGTTTCAAGCGCTTTGAGTACCCCAGGTCGTCTATCCCGACC
+>ds2020-328_642
+GGTCGGGATGGACTTTGCGCCTTGTTAAAGCTTCACCTATTTCTAAAATTTCTGGAGAAC
+ATCACATACATTTCACAGCCGCGGAGGTGCTGCGCGCCATTCCTCGCGAAAAGAAGCTAC
+AGGCTCTACAAGCACTCCGTCTTCCTACGGATACCACTACCACCATGCTGGGGGGAGTCA
+TGTTATGGCTGGCCAGTCTAGACCCGTTTTCCGTCTATCCCGACC
+>ds2020-328_643
+GCCGTGGACCTAGTGCCGGATCGGGTGATGAACTAGGTCCACGGAGGTTACAGACAACAA
+AGTCCACCGCAGGGAGGAGTGAACTAGGTCCACGGCACCGTACTGTAAACTAGGTCCACG
+GCACGGGTCTAACAACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGCTCACAGGGCCT
+GTAGACGTCTATCCCGACCAGGGCTCCCGTTCGTCTATCCCGACC
+>ds2020-328_644
+GGTCGGGATAGACGTTTAAACCTCTTGTGCGTCTATCCGAGGGGCTCAAACCGTCTATCC
+CGACCAGGGAGAGCCACGTCTATCCCGACCAGGGCGATTGTGCGTCTATCCCGACCGCCG
+TGGACCTAGTATCAGGCTTCGTGCCGTGGACCTAGTTCAAGCTCACCTGCCGGGACCTAG
+TATTAATTGGTCTGCCGTGAACCAAGATTCGACTAGGTCCACGGC
+>ds2020-328_645
+GGTCGGATAGACGAAATGGACCAGTGAGCGTCTATCCCGACCAGCCATGGTGCCGTCTAT
+CCCGACCGCCGTATCGGACAGAGAGCCGTGGACCTAGTTTCCGCCCCCCTGCCGCGGACC
+TAGTACGTTCCTCCTTGCCGTGGACCTAGTTGTGGTGACCCTGCTGTGGACCTAGTAGAG
+TCTCGACTAGGTCCACGGCAGAATATGATTCACTAGGTCCACGGC
+>ds2020-328_646
+GGTCGGGATAGACGATAGCTGCCCATAGTGCCACGCCCGTAAGGAATGAGTTAGTAGCTT
+CTCTGGTTATCGATAAGGCCAGAGCTACGCTGTCAGAGTTGACTCCCAAGATGTCTACCA
+CCTCCTTGAACGAAAAGTGAACATGATGCGACGCCGTTATCTTGGTGTATTTTGCCGACA
+TTGCTTCATGTAACTGCCACCCTAGGACTGTAGTGGCGGCCGTT
+>ds2020-328_647
+GGTCGAGCTACTTCGTTACCCTCTCCTCTGAGATACGAGCTTGACAACCACATAGTAATA
+TCCTTTCAAGTACGCCTACAGGGATAGGATTTTCCTTCTTTTTTCGACAACCAGTATAGA
+AAGTATCTCGCCCCTCTGTAATTCTTATCCGTCCCCAGATGCTGAATGAGCTAATCCTGA
+TCTTTCTCTCATAGGGTGAGAACAACTCTGCGTCTATCCCGACC
+>ds2020-328_648
+GGTCGGGATAGACGGTGAAAACCCCTTTTAACCTGATATAAAGATTGTTTTAACCGTTTA
+GCCTGTCTGGCTAACTGCAGCCAAACCAGCATACAACAACAAATATGATTCCGCTGAATA
+CGAGCCTTACGACACTGATTAGCTTCAATACCAGTGAGTTGTTTAAGTTATCGGTGAAAC
+TGCTCAATCTTCCGGGGGAGGCCCAACGAACGTCTATCCCGACC
+>ds2020-328_649
+GGTCGGGATAGACGGAGTGGCTGTATTTCTGGGTGCAGTTGTTCTCAGCTTAGCTCTTTC
+CGAGTCTGTGTGTGTAGTAGGTTTCAGTGCTGTGTAGTCAGCAAGTTTATGTTGTTGTTG
+TGACTCTTCTTTCTTAATATTTTGACTATGGAAGCGGGCTATTCCCCTAAAATGTTCGTT
+AACGTTGGGATGTAGTTTAGGTAAGTGTAGCGTCTATCCCGACC
+>ds2020-328_650
+GGTCGGGATAGACGTTGGGATGGATTTCATTAACACCCATAGACCAGAAAAGGTGTTCGT
+AGGCATACCGCTTGCTGTTCAAGAATCGGTAGCGGTTTTAAGGGAGACTACCGAGCTCCA
+CGAGAAGCGCCTATCATCTCTATGCGAATTCTGACCTTAGCTTTTCGTCTTTTATTAGTA
+TTAGTGAAAGCTCGCTCGACTTAGATATCGCGTCTATCCCGACC
+>ds2020-328_651
+GGGCGGGATAGACGATAGTAGGCCATTAAAACTTCCCACGACGCCCCTGTTAAGTCTAAA
+CAATGCAGCCATAGCGCTACTGCAGCTACGAACTCCGCAGCTTGGTTTACATGGTCCTTA
+CACCAGGATAATACTAACACACTTTGTTGCCTAGAGCGACTGAGTCCACGAAGTTTATCC
+ACACCTGCCAAATTTTTAACTGACTTGCCACGTCTATCCCGACC
+>ds2020-328_652
+GGTCGGGTTAGACGACCAACGGGCGTAATAGAACTCAAGGCAAGTAAGAAGGGCAGTCCG
+CCTCGTAGATCGATTTCGGAGTCGTAAGTTAATGTTTCCTTCTCGGCCGTTGATGAAGGG
+GACCCTTCGGCAAGCCTGGCGGTTGCTGCCTTGAGCCGATATCTTCCCAGTCCAAGCATT
+AGAGAACGTGTGGGGATAAGGCCGACGCTGCGTCTATCCCGACC
+>ds2020-328_653
+GGCGGGATAGACGGTTTACCTCCTGGTCGGGATAGACGGTGTTTATGCCTGGTCGGGATA
+GACGGTCATAGGAGTTGGGGTCGTCTATCCCGTCGGACAGAGAGCCGTGGACCTAGTCTA
+TACCCCTTTGTGCACTAGGTCCACGGCACCGTAAGTCAACTAGGTCCACGGCAGGGCGTA
+GGCCACTAGGTCCACGGCAGGGAGCGACCAACTAGGTCCACGGC
+>ds2020-328_654
+GGTCGGGATAGACGGTTCGGATGGTTAAGAGATTATCTATGGATAAACTATTCATACCAA
+AAGGATTATATCCATTAATAAGTTGCGAAGAGTTTAACCATAGATAATCTCTTAACCATC
+CCATCAAATATGTGGAAGACTCATTAAACTGTGACACGTTACCCTGCCATAATGTGATGT
+GATTCCAATGACAATAAAAAGAGACCCCCTCGTCTATCCCGACC
+>ds2020-328_655
+GGTCGGGATAGACGAGAAAAGCAGCTCAAGTATGAGACTGTGATTAGCCCATCGGTCCGT
+TACTCTGCGCTGATGCAGACGCCATCAGTCATGTCCCCTGGCATGGCATCGGTTGAAAGA
+ATACCGATACAGGAGCGGATAGTGACTAATAAGCCTTACCACTCTTCATGTGTTTATCAC
+TAAGAAGTAAAACGAATAAAAGTCAAAATCGTCTATCCCGACC
+>ds2020-328_656
+GGTCGGGATAGACGTCTGCTGTTCGTCAGGACTTTGATGGATGCTACGTTAAGTATCTCA
+TACAGTGAGGCCACTATAGGTGCGGCTGAAATAGGGCGTGCTAAATCGGTGGTTAGGTCC
+GCTCTGCGGCTCAGGAAACCAAGGCACGATATGACATTTAAGGTTAAAGCTGCAAGCTCA
+GTATCGTATAGGCCTATAATGGGAGTGACCGTCTATCCCGACC
+>ds2020-328_657
+GGTCGGGATAGACGCAGATCTCTTTTCTGCTCCATACCTCCTCTGGTATTCTATGCTCCA
+ATGGAACCGATGGGCCTCGGTTGATCAAGTAAGCTACTGTGTTGACTGCTTCTGCCCAGA
+ACTGCTTCGGTAGACCTGACTGTATACGAATGCTTCTGGCTCTTTCTGTCAACGTTCGGT
+TCATACGCTCAGCTATACCATTATTTTGAGGCGTACCCGGTAC
+>ds2020-328_658
+GGTCGGGATAGACGGTCATAGCTTTTACTGATGCTTATGGATCACTTTCTGAATCGAACC
+CAAAAACGGATAGGTTTGATCGGCCTGGCCTCGGGTGGTGGATCGAATGAACACTCAACC
+GCGTCATCACGGAAGCGATGGATGCCCAACCTTTATATCACTTCCTTCTCAATAAAGGCG
+GGGATGGACTCTGAAATACTCCTCTCTGTCGTCTATCCCGACC
+>ds2020-328_659
+GGTCGGGATAGACGGACGCCACTCCTGCCACATCAATTAATGATAGTGGTAAGCATATAC
+CAAAAAGTAAGACGGGCGTGTGTCAATATAATGATAGCGGTAGCGATATAATGGCTTAGG
+GACAAAATCAATCCCATGCCCACCCCAAGGATGACAGCGCGCGATACGCTTGGCTGTTAA
+TAATCCACCCCCTGCACTCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_660
+AACGGCCGCCACTACATTATGCACATCTGCGCCTCAACTACCGCCACAAAAGCCACCGCC
+ACCCACCACCACCACTTGAGGATGAAACTTTGAGCTCTTACTGCACATAGTCACCCAAAT
+GCAGGCACCCACCTCAATCTCTCCGCTGTAAAAACTCCCAATGCCCACATTGTGAAAAAA
+ACACCAAACCCATCCAAACCAATCCCAATTAGTGGCGGCCGTT
+>ds2020-328_661
+GGTCGGGATAGACGTTGGGATGAGTTTGGGTGATTGGTGATGGTAGAGAAAGATGAAATT
+CGTAGAGAATAGGAAGGGGGTTTTCTGGAGGTGTTTTGGTGATTTTGGACAGAATGGAGT
+GTTTGGGGAAGGATGGAAGTGTGAGAGGTTGGCTAGAGTGAATTGTAGTGGCTGAATGGA
+ATGAGATGTTGGGGATGTGAAGGATGGAGCGTCTATCCCGACC
+>ds2020-328_662
+GGTCGGGATAGACGCGGGAGTCAGTTCAAGTCTTACCTGAGACAATAGTATATAAAGTAG
+CTCAACCAATGGCAATTCCTCACGTATTCGAAGATCGGTAAATGCCTTAATCAACTAATT
+TAGGTTTTCTAGTGCGTGTAATTTCCATCCATTCATTACCAACGTAGTCTGGCTATAGCC
+CAGTTGTCCTGATCAGAAGAGGGGGTCCCCGTCTATCCCGACC
+>ds2020-328_663
+GGTCGGGATAGACGGAATAAGATACTTGTGGACGGATGACGTGGGAAGAAGTGGGGATCG
+GAGGTTGATGTGACGGTGGTTACAATGGTGTGGGCTGGTCATGTGGAGGACGAAGAACTG
+AACGCTTTGAGGAAACAATGGAGACAATGCGGCAAAATAGCCTCTCCTTTTCTTGGGTTG
+ATTGATGTTGTGTTCTTAGGAGAGTAGTGCGTCTATCCCGACC
+>ds2020-328_664
+AGAGCTTATCCCAATAGATCTAGCGGATCTAAGGGGTTTTTCCTCCTTTTCTTGGGAGAG
+TCTCTCCAGCTGGATCATAAGGGCACAAAACACCTTTGACTAGGTTCAAGCCTAGCCTAG
+GATACCCCGCTTCCGCATACACACCAGGGAATGAATTTGGAGAAGGATCAAAAGGAATTG
+GACTTGCTAACCCAATTGACGGGAATTAGTCGTCTATCCCGCC
+>ds2020-328_665
+GGTCGGGATAGACGAAGCTGCATCATGTCGGTGTTGACCATACCATAAAGCAAGAAAAAA
+GTAACTTGATCCAAACATATCCCAATAAATGCACAGATAAGGTAAGAGGACATGGACGCG
+CAGAAAGTAGTGACGAAGAGACTGACGAACAGGCAAAAAGCACAGATAAATAAGACGGCA
+AGTGCGCTAGAAAGAGAAGAAGCCGAATCCGTCTATCCCGACC
+>ds2020-328_666
+GGTCGGGATAGACGGGCGGTTTTGGTGAGTGAGAATGCGCTGCGATGGCTATCTTGCGCC
+CGGAGGTGTTGTGAAGCATTTGATTGCTGGAATGGCCACTCAATGAGCTGGCTGGATGGC
+GGAAGGTTGACCGAGATGCATGACGTGGCGCCGTCAGTTTTCCTTTATTTATTTATTTAT
+TTTTGTTTGGTTTTCGATAGTCAATCGAAGCGTCTATCCGACC
+>ds2020-328_667
+GGTCGGGATAGGCGGGAGTGTCGACTGGTCGGGATAGACGTAGAATGTATCTGTATCGTC
+TATCCCGAGACAGAGAGCCGTGGACCTAGTTCGCCGACTCTTGCCGTGGACCTAGTTCCT
+TAGCGGGTGAGTCACTAGGTCCACGGCAGGAAACTGGCACTAGGTCCACGGCAGAAAAAC
+GAGTACTAGGTCCACGGCAGAGATTATTAACTAGGTCCACGGC
+>ds2020-328_668
+GGTCGGGATAGACGTGGGATGTGGCTATGCCGAGTTCCGTGGACTGGTCCTATCCCACTA
+AAACGAGGCGTTCAACCCTCTCTCAGCAGTGGGCGCGTGTTTCAACGTCCTACGCAATGT
+TCTTCGAGATGTCGGCGGGTCTGTCGACCGGTCAATCTGCGCAAGGCAGTCATGCACAAA
+TGGTAGAAGTGACTATTATAGAGGGAGTACGTCTATCCCGACC
+>ds2020-328_669
+GGTCGGGATAGACGACGGCCGGCCATATACTTGCACATCAAAGAAGATTCCGACTGTCAG
+TCCCTGTTTGATACTTTCATCAGCTCAGACAACTACAAGTCAGAACTCAAAGCCTTCAAA
+GATGGCACTTATGATCAGAAGTACTCCGGCTCGACTACAATCGCCAGAAAAACGGTCCTC
+GCAAGTATCTTTTCAGACCAGTTCCCACATAAGGTCCACGGC
+>ds2020-328_670
+AATGACTCTAAGCCGAGGAATGATAAATTTGTCGGAATCCACCAGGGGTTTATTATCATG
+ACACCACTGTTCTAAGGAACAATCAACTTTGCGAGTGAACACCAATATATCTCCACTGCC
+AACTTCATGTACAAGCTTTGGTTCAAGAAAATATTTTGAACCGCACATTGCTGATAATCG
+ACGCCACCCATTTGCCACCTACCTCAAACGTCTATCCCGACC
+>ds2020-328_671
+CGTCGGGATAGACGGCTTTGGCTCTTGCCTCTTGCCCTACCGATCTATGCTACCTCGTAT
+GGTACTGTCTTTCTCGCTGCGTGCTTTTCTACAGGAAGCATCCCAACCAGCAGCTTAAGA
+AGGAGTTCCGGTGCCAATTTCATACCCTTTACCATAAAAGGGTAGTGCTCCTACCTTCCG
+GTCTACTGGTTATAGATCAATGGCTTACACCCCGTCCACGGC
+>ds2020-328_672
+AACGGCCGCCACTAATCAACTTTCTTTGGTGGGTCACAGTCGAAGGCTGATGAATCGGAC
+AGTTGGGTATCCAATAAGAGCTCTGTGTCGTCTGAGGGACGGAGATTCGGTGCTTCCGGT
+GGTGGGTTCGATCGGGAGAGGAAAGTGGGGTTCACATCTGATGGAGGTGCTGATTCTGAT
+AATTGGGGGAGGAAGAAAGAGGAGCGTACGTCTATCCCGACC
+>ds2020-328_673
+GGTCGGGATAGACGGCTTGCTGCCCTGCTTAATGGGTGGCTAGGCTTTGGCTACAAGCCC
+CAAAGGCCCAGACCCAGTTTCAATTTCAACTTAATTAATTGAAACAACAACAACAACAAT
+AACAATAATAACAAAATAATAGTCACAACAAATTGTAATAATCTTAATTCTTATATCAAC
+AATCAAGCAGCCGTCGAACTGTCCTCTGGGGCGGTCCACGGC
+>ds2020-328_674
+GGTCGGGATAGACGTACGGTTGCCCTGGGGGACTTGTTCTGTGATAAACAAATGACTCCA
+AACAAGAACCCCAGGGCAGCCAATCGTAAGAAAAGAGGTGAACCTGAGAAGAGCAGTAAG
+AGTAAGCGTTCAGGTGCTGGTGCTATGACCTTAAAGGCGGAAGATCCTCCCCTGGTTCTA
+ACCACCCTGAATGAAGAGAGGGCGCAGACGTCTATCCCGACC
+>ds2020-328_675
+GGTCGGGATAGACGTTCAGGTGCCATCTTTTTATCCGGTTTACTTGTAAGTTTTACTGGG
+TACGCCTTATATACTGCTTTTGGGCAACCCTCTCAACAACTAAGAGATCCATTCGAGGAA
+CACGGGGCTGATTACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGGCAAAAGGAAGTG
+TTCGTCTATCCCGACCAGGGCAGTTATACGTCTATCCCGACC
+>ds2020-328_676
+AACGGCCGCCACTAAAGAAGCATAATCAACACATCACACATCATCAACACCCACCATGGC
+CGCAAACGACTACTACACCTCCCATCCCATGGAGAATTCCACCCTCGCACCCCCAGACCT
+AACCTACTCCGCCTCCGCCACACAACACAACTACAACAACACATCACACATCATCAACAC
+CCACCATAGCACATCGACGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_677
+GGTCGGGATAGACGACTATCAGTGTTGAGGATAGGAGCGTTCATGTTCCTTTTTGTCACC
+GACCGTGCCACTTCTCTAAAGGTACTTTGCCTATTGGAAGTTTGACCTGTCATTAAGGTG
+GAATCCACTCCAGACTTTCCTTTATCCCATGAAACAAAATGGGATAAATCAAAAGAGCAG
+TCATCAAGTTCAACTGCAATATCATCCGGCGTCTATCCCACC
+>ds2020-328_678
+GGTCGGGATAGACGAGCAGGCCCCATTCCTTAACAATAGGTAGCCAAAACAGGAACCCGT
+TAACCCGCACAAGCCAATCTTGAAGCATCAATGACGAGGGGTATGAGACGACAGTTCGAT
+GCCAGAGCACAGAGCCTGCCGGTGCATACAACCCATTCACCACTCACACGCCGTTGCTTT
+GGCGAAGCCCAGCACCACCAAACCTGACCGTCTATCCCGACC
+>ds2020-328_679
+GGTCGGGATAGACGGACTTCAACGCTCTGATGCCCGCCCTTGTCGCTTTGGGCTATGACT
+AGGGCAACCATACCCGCCATTACCACAAGCCCGCCTTGTGCCATTGGTGAGCATTGCGGG
+CATGATGCCAAGCTTGTTCCTGTCATTGGTCAGTCAGTACCAGCTACCAGCCAAGCCGAT
+GCCAACCATTCACGATAACCACAACCAGCGTCTATCCCGACC
+>ds2020-328_680
+GGTCGGGATAGACGACGGACTCCGCTGAGAAGGATTCTCGTGCCAACTATTATGTTCAAA
+GACAGGCCTCAACGTGACTTTAAAGCGATTATTCTCGATTGAAATTTCCATAGATAGAAT
+AGAAATTAGGCCATCTCCTCAGAGGCGGCTTCGGCTGCGTCTTTGCCTATTCTCACCTGA
+GATAGCGTCTCATGACACCCATATTAACCGTCTATCCCGACC
+>ds2020-328_681
+GGTCGGGATAGACGTTTGCACTCGGTCCGGTACGACCATCAAACAATACTTGCTGACCTG
+AGGTTGGCATACCTGCTAATTCTAGCAAGCCTTTGATTTGCTGTTCTTTAGCGCCATCAA
+ATACTGCCGTACCCATTGGTACGCCTGCACGTAGATTTTTTGACATCGCAATGATTTCCT
+CATCACTGAGGCTGCCTAAGTCCTTTTCGCGTCTATCCGACC
+>ds2020-328_682
+GCCGTGGACCTAGTCGTCTATCCCATACAATATTAGGTCCACGGCAGGGGGAGCTCCACT
+AGGTCCACGGCCCCCCCGTGGACCTAGTTATGGAGGGAATACTAGGTCCACGGCAGGGTA
+GCAGGTACTAGGTCCACGGCTCTCTGTCCGTGAATTACGGCGGTCGGATAGACGCTGTCA
+ACGCCTGGTCGGGATAGACGTGACCAATCGTCTATCCCGACC
+>ds2020-328_683
+GGTCGGGATAGACGTGATACTAGCCTGGTCGGGATAGACGGACTACCCCCCTGGTCGGGA
+TAGACGCAGGTATGTTCGTCGTCTATCCCGTGTCATCAGATTCAAGCCTCAATAGAAGAG
+AAACCATAAAGAAAAGAATTTCTGAAGGAGAAAGTAGCTCTGCTGCTAGGGGGAAGAAGA
+TGAATGGGTCATCATCAACGGGAGCACAACTAGGTCCACGGC
+>ds2020-328_684
+GGTCGGGATAGACGATACCGCGGGGTACGCCGTCTATCCGACCAGGGTTTCAAAGCGTCT
+ATCCCGACCAGTGAATCGGGTCGTCTATCCCGACCAGGGTCCCTGATCGTCTATCCCGAC
+GGACAGAGAGCCGTGGACCTAGTTAGGCAGCAGGTACCGGACTAGGTCCAGAGGAGTTCA
+GTCACTAGGTCCCGGCAGAGGCCCGTCCACTAGGTCCACGGC
+>ds2020-328_685
+GGTCGGGATAGACGAGTGAATCGGTTTGCGCATTTTTGCACGTAACTTTGAGGTTGTAAT
+ACTGTGTCTGATAACCGTCGGTATACGCACTAAATGGCGCAACGTTATACGATGATGAGT
+CCTCGTTATAGTAGCTGCGTGCCCGCTTAGTTACTCCTTGCGTTGTTGATCCCTGGCCGT
+TGTCTTCCCCCACGTAGACAGCCCGACCGCGTCTATCCGACC
+>ds2020-328_686
+TAGTTAGAATTACGGGGTCGGGATAGACGTTTAATGTGCCTGGTCGGGATAGACGCATAT
+AACCGCTCGTTCCGTCACCACAACCACCACCACCGCCGACGACAATAACATCAACAAGAA
+CGATAACCACCGGAAAGACAACAACATCAACCAGAACGACAACAACATCAACCAGAACGA
+CAACAACAAGAGCGACAAGCAGGATAAGTAGTGGCGGCCGTT
+>ds2020-328_687
+GGTCGGGATAGACGGCGAGCCACCATGTGTGAAAAAGCACCCCACCGCCTCATTTGATAA
+AACTTCCAACTGAGGGCTCCATGCTACTATCAACCCTTTGCATTCACCACCATCTTCACT
+AGTACTAGTACTTCTCTCCAGCTCCAGCTCCTCTATGAAGTTGGGTGGCAGCTTCGCCTT
+TTCGGATTCCTTGACCACCCACGAACAGCGTCTATCCCGACC
+>ds2020-328_688
+GGTCGGGATAGACGGCGCGTTCGTATGAAGCAAGAGCAGGATTGCAGTCCGTAAGAGCAA
+TTCTTGAGCCAGCCATAGCGATTCTGCATGCGTGCAGGTACGATCCCGTGTTGCTCGCTT
+TCGTAGACAAATATGGTAGGAAAATGTACGACATTGCAGCTAGAACAAAACACGTGCTTG
+TTGCGTTTTCGTACGTCCATTGCAGAGGTTCCCAGCCCCCCT
+>ds2020-328_689
+GGTCGGGATAGACGGTACGTGGTCCTGGTCGGTGCCGCTATCGTCGGTACTGCAGGCTTG
+CCATCAACGCTGGCAGCGGCTAACGCGGGTAAAAAGATTTTGCTTGCTAATAAAGAAGCA
+TTATTGATGGCAGGTGAGCTGATGATTAAAGCCGTCAAGAAGTCAAATGACAAATTGCTG
+CCAATTAATAGCGAGCAGTGGTACTTGGCGTCTATCCCGACC
+>ds2020-328_690
+GGTTACCACGCGCTCAGGCGGAGAAGGGGCAGTTCGTGAGTTATGTGATTTGATATTAAA
+AGCCACCGGTCATTACAATGATATTTTGGCAAGCTATGTGGTTTAGTGACTGTAAGTTAG
+CTTGAGTAATTTTTTCTAAGTGGTTTAGTTTAAGTAATTTGTTTTAAGTGATTTGGCGTA
+TGCGGCTTGGTGTGGAGTGGGTATGCTCGTCTATCCCGACC
+>ds2020-328_691
+GGGCGGGATAGACGGGATTCTTGGGTCATCTCAATGGGTTCAGAAACCACACGTTTCTCT
+GGATCATCATAGCGTACTTCTACATATCCACTCAGAGGAAGGTCTTTTCGTAATGGATGA
+CCCTCGAAACCATAATCTGTTGATATACGGCGTAGATCCGGATGATTGATGGAAGAAACA
+CCAAACATATCCCAAACTAGTTCGCACCGTCTATCCCGACC
+>ds2020-328_692
+CCCCGCTTCCACACCCGCTCACTACTACTCCAAAGTGTATCAAATCTTTACGTCTGTCTT
+TAACCCAGCTTTGTTCCGCTCCTATCAACGCCGATCCGTTCTCGCCTCAATCGCTCTCGA
+CCCCGTCACCTACCCCGACCGTCACATGAACTTCTTCGATCTCGTTTTCTCCGCTTCCCG
+CTCCAATCTCGCCGAACTCCGCGCAAACGTCTATCCCGACC
+>ds2020-328_693
+GGTCGGGAGAGACGGAGGCCATGTGTCTTATATATCACACCTGAGGCGGTCTGGGATGGT
+ATACGCAAGGTTTTGGGATTAGCACCACGACCAACAAAGAGATCAGTTTCCGAGGCAATA
+ACCAGGGAACAAGTTGCTGCAATACTCAAAACGGAGCCGAAAGTAGTAGCCAAGGCCCAC
+ATGAAGTTAAATGAAACGGGGAGGTAGCGTCTATCCCGACC
+>ds2020-328_694
+GGTCGGGATTGGATGGAGATGATGGTGAAGATGAGATGGGTATTCTGGAAGCAATGTTGG
+CTGGCCGAAAGAGTAGGAAAAATGCAGCTTTGAGGGTTGAGCAAGAGGATTCCTTCGTGA
+CTGATATTCATGTGGAGAATGATGGCGATGAGGTGGAGTTCATGGAAAATGATAACCGGA
+AGAGCACAAGAAGGAAAGGATTAAAGATAGTGGCGGCCGTT
+>ds2020-328_695
+GCGGGATAGACGTTGAATCACCTTGGTCGGGATAGACGAGCATGGGGCCTTATCGTCTAT
+CACGGACAGAGAGCCGTGGACCTAGTGCGGCTCGGGCTGAAGAACTAGATCCACGGCAGG
+GATAAGTATACTAGGTCCACGGCAGGGACTGACGGACTAGGTCCACGGCAGGGGACTTAG
+AACTAGGTCCACGGCAGCCCTCGGTTTACTAGGTCCACGGC
+>ds2020-328_696
+GGTCGGGATAGACGGGGGAAGCTCCTGAGAAATGGAAGAGGGTGTTCCAAAGAGGTGGAT
+CCGGAAGTCTCACTGTATGAGTTCCGAGGACATGGGGTATGTCCGCACTCGATGGCAGAG
+GGCCTAAGTGTTGCGGGGCTTTGCTGTGGTTTACACCTTGAGGTGGGGGTGTGCCAACGA
+GACAAGTAGGGGGAGAACCTCGAAACTCGTCTATCCCGACC
+>ds2020-328_697
+TCATCCACCTGGTCGGGATAGCCGTGCCATCCCTAGTGTGCCGCTGGCTCTTAGGTTTCT
+GAATGTACCTCTGTGCTCCCGCCAGTTTCGTGCGCGATCTATGTTAAGATTATCAGTAAC
+TTGTACTGTTGCTCTCTTTATAGATAACGCCTTTAGCGTAGAGTTGTACACTCTTTTTGT
+TATGTTGTTTATTGTTATATCTCCCTTCCGTCTATCCGACC
+>ds2020-328_698
+GTCGGGATAGACGCCGGAATTGACTCAAAAAAGACCAGCTAACATATCCACTGTGCAAAG
+CATTGCAAACGACACTTCAGTCCAAATACCTACCGCTGAATATGTAGCAACAATAGTTAA
+AAGAAGCGGTATGAATTGGACAGGAAAAGAAGTCGGTTCTTTTTCAAAAATCATGGAAGA
+TGTTGGATTCGCCGAAGGCCGACAACCCGTCTATCCCGACC
+>ds2020-328_699
+GGTCGGGATAGACGAGAGGCACCACTGGTCGGGATAGACGACTGAAGCTCGTGGTCGGGA
+TAGACGACGAAGTGGGGTCAGCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTGCCAG
+TAACCGTGCCGTGGACCTAGTCCGCTTGTACGTGCCGTGGACCTAGTTTCTTCTGCCTTG
+CCTGGACCTAGTAGAAGCGACTGTCCAACTAGGTCCACGGC
+>ds2020-328_700
+GGTCGGGATAGACGATTACGCGCGCTGGTCGGGATAGACGATTATTTCCCCTGGTCGGGA
+TAGACGGCATACAACTCTGGTCGGGATAGACGAGAGCAGTGGATGTAGTCGTCTATCCCG
+GACAGAGAGCCGTGGACCTAGTCTACCAGACCCTGCCGTGGACCTAGTCCAGTTACTCCT
+GCCGTGGACCTAGTAATCGGGGTAAGTACTAGGTCCACGGC
+>ds2020-328_701
+GGTCGGGATAGACGTCACACCCTCTTCGAGGGTTTCCTTAGCATTTCTATGCCAGAGAAC
+TTTGCCGCACAATGGGATTAGTTTACTTTGAAGGGGACTCCTGACCTTGTTATCATAAAG
+CTCATGACGAGCCACTTCGCATTAAAGAACCAATACCATAATGGCAAGCCGTGACCCTAC
+CCTATAACCCCTGTACGAGAGAGCGGCGTCTATCCCGACC
+>ds2020-328_702
+GGTCGGGATAGACGCCTGTCGCAAGTGTAATACTTTTCGTTCTATGACTAATTTTTTTTA
+TTTGACAATATAATGTTGGGAACAATTTCTAGGATTCATTTTGCAAAGTCATATCAGGGT
+GAATTGGGTGAGAGAAGTTCTTATGTATTTCTTGATGGATAACTGTTGTTAATCGAGGTT
+GAGAAGACGTTGGAAGCTGTCAACTGCGTCTATCCCGACC
+>ds2020-328_703
+GGTCGGATAGACGCTATTATCCTCTGGTCGGGATAGACGCGCATGAACCTTGGTGGGTAG
+ACGTAAATCACTGGTTGACGTCTATCCCACGGACAAGAGCCGTGGACCTAGTCATCATTG
+CCGTGCCGTGGACCTAGTGGTAGTACCCGTGCCGTGGACCTAGTCTATACCCGAGGCCGT
+ACTAGGTCCACGGCAGGGTAGTGTTAACTAGGTCCACGGC
+>ds2020-328_704
+AACGGCCGCCACTATCCTCGTCTCTCACTCGGTCAACGACGCCGAATTTTGGCAAAAACG
+CTATGATGATGGCTATACTGGGTGGGATATCGGTCAAGTTTCGTCACCCCTGCAAGCCTA
+TATCGAGCATTTACTTGACAACGGCGTGAGTAAATCGGTACAGATTTTAATCCCTGGGGC
+GGGCAACGCTTATGAGTAGTGGCGGCCGTTGCTGTGTATT
+>ds2020-328_705
+GGTCGGGATAGACGTCCACGTGTGATGAGATACAGTATTTTCATATAAATTAAAATAGCA
+GTTTATAAGGCAAAAAGGGACTGAGGGAGAACCATACTCTAGCTAGTTAAATCAGGCCCG
+CCTGAACAAGTAGATAGAAGTCACGAACGTCGCATTGACGTGGCTGGCCTTGAGCTAAGT
+GATGACAGAGATCCAGGAGAGCGGATCGTCTATCCCGACC
+>ds2020-328_706
+GGTCGGGATAGACGAAATCATGTGCATTACTCAATGGGTTCTTGAAAACCAATCTTTTCT
+TGACTGCGCTCCAGAAAGTTAAATCATCATTAGCAAAATGTCTCGGGAAAACAGCTTCAG
+GGAGCATTGCGCAATTATCCTCCACCTGATCTTTCTGATTTGGCTCATCTTTGAACTGCT
+TGCTCCATCCGACACCAATCTCGACTAGGTCCACGGCTCT
+>ds2020-328_707
+GCCGTGGACCTAGTGATGACCGCCATGGAGAGGCAACGTGAGACTAGGTCCACGGCACCG
+ACCCCCCGACGAGGTCCACGGCAGGGCATGCTTAACTAGGTCCACGGCTCTCTGTCCGTG
+AATTACGGCGGTCGGGATAGACGTTTCACACCCCTGGTCGGGATAGACGGACTGAACCCC
+TGGTCGGGATAGACATAGGCGCCCACCGTCTATCCCGACC
+>ds2020-328_708
+GGTCGGGATAGACGCGCAACAACCTGGTCGGGATAGACGGAAATACCACCTGGTCGGGAT
+AGACGCATGGCCAATCAACGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTAACAACTG
+CTCTTGGCCGCTATGGAGCCCAATAAAGGACTAGGTCCACGGCAGGTGTTGATGAACTAG
+GTCCACGGCAGGGGATACAAAACTAGGTCCACGGCTCTCT
+>ds2020-328_709
+GGTCGGGATAGACGTTAATGTCGCCTGGTCGGGATAGACGTTATGACTACCTGGTCGGGA
+TAGACAGGCACCACCCTCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCGTTAATTC
+GCTGCCGTGGACCTAGTACCGATGTCCCTGCCGTGGACCTAGTTCTAAATTTCGTGCCGT
+GGACCTAGTTCTAAAGGGCTTGTGCCACTAGGTCCACGGC
+>ds2020-328_710
+GGTCGGGATAGACGTGCGAGTTCCCTGGTCGGGATAGACGCATCAGAATCCTGGTCGGGA
+TAGACGTAACCAGCACTTTAGAACGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTTAT
+ATTACGCTTGCCGTGGACCAGTGCCCCATGTCGTGCCGTGGACCTAGTTCGTCGACCCCT
+GCCGTTGACCTAGTACTTGCAGGGATACTAGGTCCACGGC
+>ds2020-328_711
+GGTCGGGATAGACGTAGATCGGTGGTGAGTCAGTACGAGGAAGAAATATACATAAAAAAG
+ATGTTACCCACAGATGCGAGAGATAAAGCAGGCTGGTTTTGTGCTTCTAAAATAAGTGAT
+CACAGTAAGTGGATGGAGCGACACCCAGAACTATATGCTTCAACACGCTTGAAGTACGAG
+TGGGGTAAAGTAAGAGCGCTACTAAACGTCTATCCCGCCC
+>ds2020-328_712
+GGTCGGGATAGACGAATCACTGTTATTCACTTCACCTGCTGGGCTTCTCGGGCTGCTGTT
+TAAACTGCAAAGAATTCGCGATGTGTATGGCAAGGATGTCAGTGAGTTCAAAGACTCGGA
+CACTGAGTTGTTCCTGCCCACTTTTGTCAACTCGGTTCCCGGCAGAGTCTTGCCTAGTGT
+GATTCTGGACAAAGAGGGCGCGGAGACGTCTAACCCGACC
+>ds2020-328_713
+TAATACACAGTAACGGCCGCCACTAAGTGATGCTTTTGCCATTGCACTTTAGGTACGATG
+TCCGACCGTACCAAGCGTACCTTCGAACTCCTCCGTTACACTTTGGGAGGAGACCGCCCC
+AGTCAAACTGCCTACCATGCACTGTCCCCGACCCGGATAGACGGGCCAAGTGCATGCATC
+GTCTATCCCGACCAGGCACCTGACTCGTCTATCCCGACC
+>ds2020-328_714
+TGAATTACGGCGGTCGGGATAGACGGTGGTGAGGAGTGTGTGTTGCATGTTGGGGGATAA
+GAGGGCTAGAGAGAGTGTGATGAGGAGCAATGGGGCGGCAAAGGTGTTGTTGGTGATGCA
+AAGTGGATATGGGGAGGGGAATTTTGTGAGGAGGATGTGTGGGGATTTGATTAAAGTTTT
+GAGTGTTGGGTTGAGGTGTGGGGTTCGTCTATCCCGACC
+>ds2020-328_715
+AAGGGACATTGTTTACAACTCAAAAGCACGGGATGTTAATATGTTAGGCTAAGGCACCTC
+TCATCACAGCACGTCGAAAGCATGCCATCAAATTCATTATTTAAAGCCTTAGAGCAGTAG
+CACGCACAGGGATAGAAAACCCTTCTGATCCCAAGGAATGCGCGTCTGGTGGTATCGAGA
+GAAAGGTTGCATTTAGGAGTGATTTCGTCTATCCCGACC
+>ds2020-328_716
+GGTCGGGATAGACGGCCGTAGCTTCTCTTTTTGGGAATAATTTTTATTGTAAAAATGATT
+ATTTCAGATAATCCCCGTCAGGGTTAGAAGACACGCGGACGGATTGACGAACGTACGTGC
+AAGAAAGTCACATCTATTGGATTACTCTAAATGGAACCTCGGACACTCACAAACCGCCTT
+GTCAGGATATCAGCGGCTGCGAATAGACGTGTGGAACTC
+>ds2020-328_717
+GGTCGGGATAGACGAAGGCCTAGAGTTGAATACATACGAACGATCACCGTGCCTAAAGGT
+ACCTACCACATCACGGGGATTGTACACAACATAGTCTTGAACGTCTAGATCTACATCTAT
+TGCTCCCCTGTCCATGCATTCTAGTAACATCCAGAAGCCTTTCACCAACCGAGTCAACTT
+AGATTGCCCAACAAAAACGCGCCAATGTCTATCCCGACC
+>ds2020-328_718
+GCCGTGGACCTAGTCTTATGTGTGGTCAGACTAGGTCACGGCAGGGAGGTGGGCACTAGG
+TCCACGGCACTGGAGTTTCGACTAGGTCCACGGCAGGGGATACGAACTAGGTCCACGGCT
+CTCTGTCCGGGTCGGGATAGACGGCTTGACCCCCTGGTCGGGATAGACGAGGAGCACCCC
+TGGGATAGAGCCGACACTAATTGGACGTCTATCCCGACC
+>ds2020-328_719
+TGAATTACGGCGGTCGGGATAGACGTAGTTTGCTAATGGCGGTGTTGGTGGGGTAGTTGG
+TGTTGGCGCCTGCCTGGATGTAACCGTGAGCTCCCTGGGTTTAGGAGGGGCAGATGATCC
+GTTGCTACGTAGTGGTTGTGGAGCTGTTGGTTTGCGACGGTCGTATGATATATGGGGTGA
+ATGAGGCGATAACAGGGATGCTGGCCGTCTATCCCGACC
+>ds2020-328_720
+GGTCGGGATAGACGATGGTAATGCATGGTCGGGATAGACGTAACCCTTCCTTGGTGGGTT
+GCGGGTGATTGTTGTGAAGGCCACTTTTGGAGGTCCAGTGCTGCAAAAACTGGCCTTTGT
+GTGCAAAAATGGGTCTTGGGACGAGGGCTGAAGGAGGGTTTGGTTGAGAAAATGGGGCGG
+TTAGTGCAGGCTGTTAGTGGCGGCCGTTGCTGTGTATTA
+>ds2020-328_721
+GGTCGGGATAGACGCTTGGTCGCTTTTAGTTGTTTTCTTTGTTGCTGCCATTGACCCCTA
+TGCTGCATTCGATCCATCTGTCCCATCACCAGAGGCGGATATGTGCCCAGGCATCAGATG
+CCTTTCGGACCTGTAAGGGAAATCAGTCATAGGTAGGCCCCATAGCCATCTCCATTCATC
+AGAAACTATCAATTACGAGTCTGTGCCGTCTTCCCGACC
+>ds2020-328_722
+GGTCGGGATAGACGTAACTCATGGCTAACAACGTGTTTTGGGGCGGTAACCAGACTGTGG
+AATCAATCGATTCCGCGGTGAGTGCGGGCGACCTTACGGGTGATGTGGATACCCTAGTAA
+ACTCTAATGCCAAAAGGAGTGAACGGTACCAGAGCATGCTCAGCCGGTACCGTAGCGCGC
+CATCTGAACAAAAGGCAGGGTCCGTCTATCCCGACCGCC
+>ds2020-328_723
+GGTCGGGATGACGTACGCAAGCACTGGTCGGGATAGACGCACCATACCCCTGGTCGGGAT
+AGACGTTAGTGCGCTGTTTCGTCTATCCTGACAGAGAGCCGTGGACCTAGTCCTAGGGGC
+GTTATTTACTAGGTCCACGGCAGGTCAAGGTCCACTAGGTCCACGGCAGGAAAAATATAA
+CTAGGTCCACGGCACGGGGACTACGACTAGGTCCACAGC
+>ds2020-328_724
+TGCCTCTGGCCTTATATTCTCCCGTCCCACCTATGTTATCATGGACTATCATGTCGTCTA
+CTGACGATATTGTCCACGCCATAGCTTGCTTCTGCTCACCCGTCATCTCACCGCTGTACG
+TGTCGGCGAACGCTCGTAACACCGATTTCATGGATCCTGTGCTATGTTGGGAATTGAAAT
+CCTCGAAGTCAAAACATAACGCACCCGTCTATCCCGACC
+>ds2020-328_725
+GGTCGGGATAGACGAATATAACCCTTGGTCGGGATAGACGTTTTAGTACTGGTCGGGATA
+GACGCCCGTCCCCCCTGGTCGGGATAGATGGCACCTTTTCGTCTATCCCGACACGGACAG
+AGAGCCGTGGACCTAGTACTAGCGTGGGTGTATCACTAGGTCCACGGCAAGGGAGCTTGG
+ACTAGGTCCACGGCAGGGATGAGACACTAGGTCCACGGC
+>ds2020-328_726
+GGTCGGGATAGACGTAATGATCGGCTGGTCGGGATAGACGTTATAGTACCCTGTCGGGTA
+GACGACCCCTACAATGCGTCTATCCCACGGACAGAGAGCCGTGGACCTAGTGGGATGTTG
+GGTGCCGTGGACCTAGTAACTGGGCTCCTCAATAACTAGGTCCAGGCATGCTGGTAAGAA
+CTAGGTCTACGGCAGGCCGAGTATTACTAGGTCCACGGC
+>ds2020-328_727
+GGTGGGGCTGACGTGGCGAGGGCTTGCAGAGATAGGATGCATGAGGTGGTGGCGGAGGCA
+GTGGAACTGGAACGGATTTATAATAATAAGAAAGATCCGGTGGATTGGGATTGGGAGAGG
+GTGATGGAGGTGTGTTTTGGTAAAATGGATGAGGAGGTGAGTGGGATTGCGGCGGCCAGG
+AAGGTTGGGGGATACTAGGTCCACGGCTCTCTGTCCGA
+>ds2020-328_728
+GGTCGGGATAGACGTAGAGCTGCTGTTAGCCAAATAGGCATCCCCCTGGACACAGAGTCG
+TCCAAGCGTGACTCGAGTGCTTCGAGCAGGTCCCTCATGTCACTCGAGGGTTTCGACTCT
+ATTCTTGAGTGCACCAGAGTTGCCATTGCCCTCGCCAGATATTGCCCCTTAGATCGGCGC
+TAGTGATCTACACAAAGGGTTCAGCGTCTATCCCGACC
+>ds2020-328_729
+GGTCGGGATAGACGCGCTTTCGCCATTGGCTACTGTAACTTTTGTTTTGTACATCTTCGC
+CCACCTACTAATCGCCTCTTCACTATTCACTCCTTTTGGTCATATTATTTACATTCTGTT
+TTACTTCTGTGATCGTGTTAAGACGACGGTTTTGATGTTATGTGTAGTTGCTGTTGTATT
+GATACGGTTATCATTATATATGTAACCGATGGGGATTG
+>ds2020-328_730
+GGTCGGGATAGACGATCAGGCCCTCGAGAAAGACACTTAGACAACATTAGAGGATCTTTT
+TTTTTACTGTATGAGTGGCTCGGAAGAATAATCGCGCCTCCAGTCGATTCTACTTCATGT
+CTGACTAGATAAGTCACAAGGCCTGTCCTTCTTCAGGCCCCGGTCATCTAGTCGGGGTCG
+ACCAAACTTTCCCAAGTAAGAAACAAACAGAATTTCAC
+>ds2020-328_731
+GGTCGGATAGACGCCGGATGTCCTTGACGAAACCTTTGTACCTAGTGCTCGAAATCTGAG
+AATCAGCTTCCTTGAAGAAATCTCCACTCTCTGTTCTATACGCACAAGCGGTGGCATAGG
+CCGCAACGACAACGTTCACGAGCTCATCGGGGCGGTGTGAAAACCCCGACGAAAGCACGA
+TTCCGCTAAGCGAAATGGCGTTGACGTCTATCCCGACC
+>ds2020-328_732
+GGTCGGGATAGACGTTTCAAGCTCCTCTAGTCGTTCCTCAACTAGGTCGGACGCGGAAAG
+CGCTCCACCTGAGTTCGAGCGGTTATTTGATCGAATCTGTGATGAATACGCAGAGTGGGT
+GGGGAGAAGCGGGAGGCAATTACCTCCCGAATGGACGGTGCCCGACCTTGTTCGGGCAGT
+TATTACCGACAATCGTCTATCCCGACCGCCGTAATTCA
+>ds2020-328_733
+GGTCGGGATAGACGACCCAATGCCCTGGTCGGGATAGACGGTCTACTCACCTGGTCGGGA
+TAGACGTCAGGGCTAAAATTCGTCTATCCCACGGACAGAGAGCCGTGGACCTAGTCCCAA
+ACACCCTGCCGTGGACCTAGTTCTCCTGTCTCTGCCGTGGACCTAGTCAGACCACAGCCG
+ACTAGGTCCCGGCCCCGAATCACAACTAGGTCCACGGC
+>ds2020-328_734
+GGTCGGGATAGACGGAGTGACCGGGGGTCGGGATAGACGCGCAACCCACTTGGTCGGGAT
+AGACGAATAACAATGCTCCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCAAATGTC
+CGCTGATACTAGGTCCACGGCAGGGATAAGTTGACTAGGTCCACGGCAGGTGCCCTTGAA
+CTAGGTCCACGGCAGGGATGTAGTACTAGGTCCACGGC
+>ds2020-328_735
+GGTCGGGATAGACGGCCTCGTACGCTGGTCGGGATAGACGCATACAGCCCCAATAGTCGT
+CTATCCCACGGACAGAGAGCCGTGGACCTAGTTATCAGCTACTTTGTCCACGGCAGCGCT
+CACGACACTAGGTCCACGGCAGTGAGCGAAAGACTAGGTCCACGGCAGGTGTAAAGTGAC
+TAGGTCCACGGCAGGGGTGTATCTACTAGGTCCACGGC
+>ds2020-328_736
+GGTCGGGATAGACGTATTAAGGCCTGGTCGGGATAGACGGTTCATATCCCTGGTCGGGAT
+AGACGGCCTATTTCCCTGGTCGGGATAGACGTATATGTAGCTTGGACGTCTATCCCGTGA
+CAGAGAGCCGTGGACCTAGTGCGGCAACCCCTGCCGTGGACCTAGTTACATTTTGCCTGC
+CGTGGACTAGTTATCCCCCCAATGACTAGGTCCACGGC
+>ds2020-328_737
+GGTCGGGATAGACGTTTGGGCAGTGTATCCCGACCAGCCACGCGTGTCGTCTATCCCGAC
+CAAGGCGTTCCACCGTCTATCCCGACCGGACAGAGAGCCGTGGACCTAGTACCCTGTTCC
+GTGCCGTGGACCTAGTAATTAGATCACTGCCGTGGACCTAGTCCCTTACTCCATACATGA
+ATAGGTCACGGCAACGGCATCTCAACTAGGTCCACGGC
+>ds2020-328_738
+GGTCGGGATAGACGGGTGCATACGCTGCGGGTCAGTTTCGGGGCGGGGGGGCAAATAGAG
+ACCAGAAGAATGATTCATTTGGATCGACGAGCTTTTTCAGCCCCAAAACTAAGAATCAAT
+GGAATGTCTGTCTATCCATGAATATCTATTCTATCTGTATATCTAGGGAATCACTTTATA
+CATATAAAATTATATTATGGCATGATATGATCGCCTA
+>ds2020-328_739
+GGTCGGGATAGACGAGGTTTGTACTTGACTAGCGATGGTTGAGTGCGACAAGAGACGGAG
+GTCTCGGCCCAAGATGAGGGAAAGGATACAACTTTGAAAGAGAAGTTGAAAAGGGTTAAG
+GCAGTGGTGCTTTGTGGTCCATGGAGCGAGGAGAAGAGAAATTCCTATATGGATTGTTAT
+GCAGCAGTGCAGTGGGGCCAATCCGTCTATCCCGACC
+>ds2020-328_740
+GGTCGGGATAGACGGGTGGTTGTTATTCTCTTACTAAATTGCCTGTAGACATGTGGGAAT
+TAATTAATTTGCATCATCTTGACGTGAGTGGAACCCAAATTGTAGAGATGCCAATGCAAA
+TGAGTACATTGAAAAGCTTGAGAACATTGTCCGCTTTTATTGTGGGCAAATCTACTGGGT
+CGACTATTGGAAGCGGGGGGAATCGTCTATCCCGACC
+>ds2020-328_741
+GCCGTGGACCTAGTATCTCTTACCCTGCCGTGGACCTAGTAATTGGGAGGGTGACTAGGT
+CCACGGCTCTCTGTCCGTGTCATAACCCCCTGTGACGTCTATCCCACCATCTATTGTACA
+CGTCTATCCCGACCAGGGGTCGCCGTCGTCTATCCCGACCAGCTATTTGGAACGTCTATC
+CCGACCCCCTTCACGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_742
+GGTCGGGATAGACGACGCCTCCCCGTCCTATGCCGTGAGCACAAATCTGAGCAACAACTA
+GCCCTGGGTTTGAGCCTAGCATTGCATACTTGGTCTGGATTCTTGTTTTAATGAAGTCGT
+TCCACACTTTGCTTTTCCTGATGTTTATATAATCTTGGGGTCTAAGTGTATCTAAATCAC
+CGTTGAACTTTACTCCCAAAGAACGTCTATCCCGACC
+>ds2020-328_743
+GGTCGGGATAGACGATTGCCACCACTCACTTTACTTTAGTCCACCCGGCATAACCGCATG
+TGAACCAACCGACTAACTTGCCTCTCCGGGATGAGAACCCATGATTTGATCTGCTAGCTT
+GAACGCCTGGATCATGCCGAGAAGAGAAAGTGAAGAAAAGACTGTCGGAACCGATCGGAG
+GAGTATTTCAGAGTCCATCCCCGCGTCTATCCCGACC
+>ds2020-328_744
+GGTCGGGATAGACGAAGAGAGGTCGTATTTCTTTGGGTTGGTAGTAATGGAATGGTTTCA
+TTATCTAAAATCAAGAACATTTCCCACCAAAGGATCAGTCCAATAATACCACTCACTGGT
+AAATAGCGCAATACTTCTTCGTGAATCTCCGCTATTTGAATATGGAACATCATAACAACG
+AATAGGAATGAAACGGCATAGGTCGTCTATCCCGACC
+>ds2020-328_745
+GGTCGGGATAGACGGATCGTATATATACTAGCAACACTCGAGGCAAGCTCTGGCTTTTTG
+GCGAGCGGTTGTCCTGTTTTTGGGTCAGTGACGACAACTTGCGGTGCTGCATGGGTCAGG
+CTTGTCACCTGTAGTACCGTCAATAACACTGCGCCGTTTGCCAAAGAGCCCACCAATTTT
+TTCATGCTTGTCACTTGTCCCCCCCGTCTATCCGACC
+>ds2020-328_746
+GGTCGGGATAGACGCGTCACCCCCATTATGTAAACTGTTTCCTCGCTTCAACGTGTCTTC
+AGATATCGCTTTTGTGTATATATAATTCAATATACTGTTCATGAATGTTGTCAGTCTCCA
+GCCTGACAGCAGTGTGTCTTTCGCCCTGTATGTACGCTTCGTACCAACATTGTCATGTAT
+TACCTGGTTGCCTACAGATTCAGCCGTCCATAAGGCC
+>ds2020-328_747
+GGTCGGGATAGACGGCGTGTTTTGGTATGTTGGGAGATATCATTATTGCCGAACCCAATG
+CTTACATTGCATTTGCGGGTAAAAGAGTAATTGAACAAACATTGAATAAGACAGTACCCG
+AGGATTCACAAGTGGCTGAATATTTATTCCATAAGGGCTTATTCGATCCAATCGTACCAC
+GTAATCCTTTACAGGGCGTATATCGTCTATCCCGACC
+>ds2020-328_748
+GGTCGGGATAGACGATTTGTGGGATTCATTACTGCAACCAAAGATGCTGCGTGATTTAAG
+TGAGGAAGTTGGCGATCGGATAATGGAAGGCCAAAGCGTTGACGAAGCATCGCTAATATG
+TGCCAGGCCATTAGGACAAGCAATCAGGTTGTTAAACCCACACGAAGACGTCATTCTAAT
+GGCGCAATCATATGGACTGTTAGAAAGTATAGGTGT
+>ds2020-328_749
+GGTCGGGATAGACGAACCCCACTGATCTAACTTTTGATGCGACGGATGTTGAGTTGAACG
+ATATTAAAATGCTAGTAACTGACTTCAAGTTTCAAGTTCAGTATGCTGTATCACAAAATG
+AGTAAGTTTTTTTTACAATTTTGTAACTCTTTTGATATTATCTGTTTCTTTTTGAAGTGC
+TTCCAGTTTCAGATTTGTACGGCGTCTATCCCGACC
+>ds2020-328_750
+GGTCGGGATAGACGTCGTCACCATTATGCACAGAGTCCACCACACCCGAGTGTGTGAATA
+CGCCTGCAATGTCCATGTATACATAGTTTAACACCGTATTGAGGAACGTAGTTAGCCTAG
+ACCCAGACAGCAAAGTGCCCGCAGGTCTGTAATTTTTCCCGTCTCCTGCATGAATCAGTA
+TGTCAGTGTAGCTATTTAGTATCCAGTCCATCGCGC
+>ds2020-328_751
+GCCGTGGACCTAGTATATTGTCACTTGGTCCACGGCAGGTAGAGGCACACTAGGTCCACG
+GCAGGAGCAAAGCAACTAGGTCCACGGCAAGCGGAACATTACTAGGTCCACGGCTCTCTG
+TCCGAGGGATAGACGAACGATGGGGCTTCACGTCTATCCCGACCACGGAGTGGTTACGTC
+TATCCCGACCACCACATTCTTTCGTCTATCCCGACC
+>ds2020-328_752
+GGTCGGGATAGACGATGGGGACAATTGTCAAACGATGTGCTCCGTTTGGAAGGCGGGGAC
+CGAGTCTCCATCCTTGTAAGGCCTGATGATGTTGATATTGTGAGAGTGAAGAAGACAGGG
+GTCCATCTAGAATGGGACAAAGTCATGAAGGAGAATAAATCGGATCGTCATTTGTATGAT
+TGGGAAATAAATGGGGATTTCGCGTCTATCCCGACC
+>ds2020-328_753
+GCCGTGGACCTAGTATTCATTACCCTGCCGTGGACCGTTATAGTTACGGCCGCCGTTTAC
+TGGGACTTCAATCAAGAGCTTGCACCCCATCATTTAATCTTCCAGCACCGGGCAGGCGTC
+ACACCCTATACGTCCACTTTCGTGTTTGCAGAGTGCTGTGTTTTTATTAAACAGTCGGGG
+GGGCCAGTTTATTGAACCCCTTCGTCTATCCCGACC
+>ds2020-328_754
+GGTCGGGATAGACGCGGGGTTGTTTTGTATTTAAGTCGGCAAAGCAACTCGTTATTGTGA
+CAGCTGCTCTTGTTTAAGATATACAGTTTGTCTGTTGAACGTTAGCTTTATTAATTGGTT
+ACTTGTTAGTTGGTTTACTTGATATTCACTTTCTCTACACTTTGTTACACGTGTTGGGAG
+ACGTACCATGACCCAGTGCCCTCGTCTATCCCGACC
+>ds2020-328_755
+GCCGTGGACCTAGTCAGACCTTCACTGCCGTGGACCTAGTCCATGCATGCGTGCCGTGGA
+CCCATGTATTTAGCCACTAGGTCCACGGCTCTCTGTCCGAGAATTAGGCGGTCGGGATAG
+ACGTGGGCCCCCACTGGTCGGGATAGACGGTACGCGGGACTGGTCTGGATAGACGGTTAT
+ATGCCCTTTGGTCGTCTATCCCGACCGCCGTAATTA
+>ds2020-328_756
+GGTCGGGATAGACGAAACCACGGCTGGTCGGGATAGACGTACTAAATCCCTGGTCGGGAT
+AGTCGGCGTTATCTCGTCTATCCAGACCAGGGGGAGGACACGTCTATCCCGACACGGACA
+GAGAGCCGTGGACCTAGTGATCGCATTCGTGACTAGGTCCCGGCAGGCAACTTATTACTA
+GGTCCACGGCAAGGGCAGAACAACTAGGTCCACGGC
+>ds2020-328_757
+GTCGGGATAGACGGCGATGTAGAATCGATTGAAGCCAAAGTGAATGAAGACTTTGTGCCG
+GCATGGCCTTGGCTGCCGATTGGGATTGGGATGAAAATATTGCCGCTTAAAGTTATGACC
+AAATTTTTATAAGCGCATATCTAAAAATTTTAAACTCTCAGCATCATCAACAGCGCCTTG
+GCAGCTGATGACGTTTATTATCCGTCTATCCCGACC
+>ds2020-328_758
+GGTCGGGATAGACGAGCAGCGGGGGTGTGAGAGCAGGCAGATAATGTGAGAGCTTGATTG
+CTTGATCGAGAAGAATGCCTTTTCTTGATTGCTTGATCGACTCACTCGTCTGATTGGCCC
+TACTATTCATTATGGCCTTCCCTCCCGACACGAGCATGAAGTCTTTCAATTCGAGTCTGT
+CATTAAGAAATAGTGGGTTAGCGTCTATCCCGACC
+>ds2020-328_759
+CGGTCGGATAGACGATGGTCCTGGTTTGACATGGTTTACGCGTTACTGGTTCCCGGAAGA
+GTTAATATCTCCATTAGCTAAACCCTTTCTTACCCTGCCCTTGGACTCGTATTTTGTTTG
+TACACAATCAACGGAGGCCTCCCCGACATATGTTGCAACGTCTTCAATAGCATGCGCTGT
+TTTCGTCTATCCCGACCGCCATAATTCAGATCGGA
+>ds2020-328_760
+GGTCGGGATAGACGGCAGATCGGGGTGTCCGGTGAGACGACGAGGAGGAGCTCCCAGGCG
+GGAAAGAGAATGGAAACGGTGGAGATGGCGGAGTGGTTGATGATGATGGAGGAGACGTGG
+AGAGCGCGATGAGTGGCGGGAAGCTGAGGGTGGTGATTGTCGTTGTAGAAGATTGCGTAG
+TTGGTGTGGATGTTGTCGATGGCGGTTGGTAAGTG
+>ds2020-328_761
+GGTCGGGATAGACGACTTTCCGCGCGCTTCTTCTTTAATATAGCAGTTATCTAATGAATA
+TAGTAACCACGGGAACACTCGTTGTTGTTCGAGGGACATCCTTTTACCAAACACTGCAAA
+ATATGCTTCCAACACAGCTTTCATCGAGCCCACGCTATGTTGCGAGTTAAAATCTTCAAA
+GTCAAAGCAGTAATGTACCCTGTCTATCCCGACCA
+>ds2020-328_762
+GGTCGGGATAGACGGAACTTCTTGCTCAGCAGGCGTAGCTTGGAGGGGGAGTGTAGCGGG
+GGTAAGGTAAGGAAGAGCCGCCAGAGAGGAAGCCAAACCGGCCTATTAAGCGCAGCTAAG
+CTAATATGCGCCGGAGAAAGCCAGGTGCCGGAGGTAAGCTCTATTCGGCCCGGAGCAAAA
+ATTCCCCATAACGAATGGACTCGACTGTCCCGACC
+>ds2020-328_763
+CGGTCGGGATAGACGGTGCTCTTCTCTCCAATTCATCCCCAAATACAAACCCATCTTCCT
+CTCTCTGCACCACAGCAATCGCCATCTCCATTTCCTTCACCAAAATACTCCTATTCATGT
+GCTGCTCTGCATAGAGCGGCCACGCCACCATCGACACCCCGGCGATCACCGCTTCAAGCA
+CCGAGTTCCAGCCACGTTTATCGTCTATCCCGACC
+>ds2020-328_764
+GGTCGGGTAGACGCATATGAGGTGTGCTATGTGCAACGCCAACGATATACAGCAGGGATA
+TCATTGGGCTGTAAGATTGGATAGATGTATGAGACAAATAATCGTGTCCCTATTATGTGC
+AGAAAAGAAAAGCACTAATGTAATAATAGAGTCCGGATTCCTCCATCAAGCGTCTGTGGT
+AAATGTAAACGAGCACGAAGACGTCTATCCCGTCC
+>ds2020-328_765
+GGTCGGGATAGACGTTAGCTGTCCATTTCTTGTATTTCTTACCAGTCATTGCATCATACA
+TGGTCGCATCATAGCCTCCTACTCTCAACGCTAACAGCATCTTGTTTGCAACTTTATTAT
+CATTAGTCGTGTACGATTTGGATCTGGCATCATAATCCATTCTAGCTTCGTATTGAAGAG
+AATTCATGTAGTACCTGTCGTCGTCTATCCCGACC
+>ds2020-328_766
+GGTCGGGATAGACGTGGCGTGGGTCTGAGAGTGTACGGACACACAGAGAAGAAAGGGGGA
+AGATAGAGAAATATGAAAAAAGCTTTGTGTTTGGATCAAACCCGCAACTTTTGGTATCTT
+TTTTTCCAACACAGAGAAGAGGTTCTCAGATATGAGAGAGAGAGAGAGAGAGAGAGAGAG
+AGAGAGGGGGGCGGCTGTTCGCGTCTATCCAGACC
+>ds2020-328_767
+GGTCGGGATAGACGACCAGCAGCATTACACAACACCCGATTTGCGGATGTTCAAGACACA
+GAGGACATGAGTACACACTACGAGCCAACGTTCGATGTGACCAGTGCGGCGGCTGAGGTA
+CAGAACACTGTACCTATCAGGTACGCGCCCACGGATGGTGCGAAGCATGACAAAGAGCCG
+CGTGCCCCTCAGCCCAGTAGTCCGTCTATCCGACC
+>ds2020-328_768
+GTCGGGATAGACGCTGGTAGATGGTAGCTGGGGTGTACAGTGGTAATAGGGATACTACAT
+TGATAAACACATTGTTGAACATAGCATACGCTAAGGTAGTTGACATTTCAGCTAACAACT
+TGAAAGTGAATATAGGGCTAGAAAGTAGATTGTGACATGGTGATGACATCATCAGTGTGC
+ATAGTACCTATACTGGCTCTGCGTCTATCCCGACC
+>ds2020-328_769
+GGTCGGGATAGACGCCGGGTTCACTTCTATCCCGACCAGCCCACGTAAACGTCTATCCCG
+ACCAGGAGGGTGAATCGTCTATCCCGACCCGGACAGAGAGCCGTGGACCTAGTGGGGTTG
+ACAATTAGGTCCACGGCAGGAGGTAATCTACTAGGTCCACGGCACTGGATAAATTACTAG
+GTCCACGGCAGGAATTATAATACTAGGTCCACGGC
+>ds2020-328_770
+GGTCGGGATAGACGCTCAAGGGCCATGTTCGTCTATCCCAGGATACTCGACCGTCTATCC
+CGACCAGGTGCATGTACCGTCTATCCCGACCGCCGTAATTCTAATACCAGCAACGGCCGC
+CACTAGTCGTGTGGGTTGATTATGATGAGAAGGAAATGGAACAACTCGATGAATTTAGTA
+GATCTTTTTAGGAGACCCAGGTAGTGGCGGCCGTT
+>ds2020-328_771
+GGTCGGGATAGACGCGCAGCCCCCTGGTCGGGATAGACGTTCCCTTGGTCTGGTCGGGAT
+AGACGAATAGGGTGGTTGTCCGTCTATCCCCCGGACAGAGAGCCGTGGACCTAGTCTACA
+ACTTGCTGCCGTGGACGTTTAGAATGCGCTGCCGTGGACCTAGTGGATGAAGGGGCCGTG
+GCCTAGTTCAACCCGCTAGAGACTAGGTCCACGGC
+>ds2020-328_772
+GGTCGGGATAGACGATCGTAAATCTCTGTAAGAGTTATCTTATCTTGTTATTTGCAATGG
+TGTACCCAGTTAACGCTGATACATTTGGGATACTGTGGAAATACATCAAGTAGTGATACA
+GTATTCTCGCACGAAGAGTAGCGAAAGTTCTTCGCTGTAGATGCATTTGCGATTGTCCTT
+GAAACACCTAAGGAGTATTTATAGTGGCGGCCGTT
+>ds2020-328_773
+GGTCGGGATAGACGAGGCAGCTTAATGGGAATGGTAAATGGAGTTTTTGAGGGTGACATC
+AATGTTTGTGTCTACGGTAATTTGATAAAGGCGTACGTGGCTCCGATGCCAGGGAACAGG
+TCAGCAGTCTACTATGACGTTAGTCAGCGAACTTGGGGAATACGTAAAGAAATACTCTCG
+CAGATGACGAGGCACAGCAACCGTCTATCCCGACC
+>ds2020-328_774
+TTTCTTATTATTTGACAGTGCAGAATGTTATTGATGACCATCAGCCATCATGCGCAAAAG
+CTTCACAAAGCCCCACTAAGAACATCATGATGACATCCTGAAAATGGTCCCAGCTACTAT
+TGCCGAAGGTCTGAACACCCGGCTCCTATTTTCAAACCAAGTCCTAGGTTCCAGCTACAA
+AAAAAGAGAGTAGGCAGCGTCGTCTATCCCGACC
+>ds2020-328_775
+CATGTTTTGGCCTTGTGTGTCCATAACTCAAAATAGGTGACCTAACGGCCGCCGCCCGAC
+TAAACATACCAATAGTCACCAGATTCATATGGGCTACTGAGGAGTAAGCAATGATCTTCT
+TAAGATCGATCTGTCTTGAAGTGGTCAAGGAAGTATATATTATAGCAATCGCGCTTGGAG
+TATAAATGAAAGAAGTCCCGCGTCTATCCCGACC
+>ds2020-328_776
+TATATTAGCGCTCTCCAAGTGTGCTTGTTCCTCCCTTCTTCCTTACCATGGCAAGTCTTT
+GTGAAATAACTCCGATGAGAAGAAAAAAGAAGGCGTTAAGAGACCCTCCTGGCCCAACCC
+TAGACACTCTAAGATCCTTTTTCAAACCTGCTCCCATTTCGAGTCAAGAGATAGATAAAT
+AGACACATCCCATTGCACTGACCGGGTTCGTTCG
+>ds2020-328_777
+TAACGGCCTATTTGCCAGATGAGACCACGCCAACAACAGCTTGTTTCTCAACGGTTCCTG
+ATGTTTCAGCCCATGATCCCTAAGTATACCATTGTACCTTGGGTCTGTGCGTACATCTGA
+CCCCTTAGTGCATGTACTGTCACCTAATCCGCCCGTTGCTTCAACAAGATTAGCAGCTTC
+CATCTTGTACAGCGAGCCGACGTCTATCCCGACC
+>ds2020-328_778
+GGTCGGGATAGACGATTTCGTACTCTGTATCTGAGCCGAACCGACTAGCGCCACAACTGA
+TAACCGATTATTATGGCGTCAACCACCGCATATCTACGGTAGACACGCACATAGCGGTAG
+CTGCAGAGGTTCGCAGGGTAAGGGGTTATATCCAACGAGCCCCGGCGGCTTTTCAATTTG
+TCGACACCATTCAGCCTGAGCGTCTAGCCCGCCC
+>ds2020-328_779
+GGTCGGGATAGACGAGGCTAAGGACTGGTCGGGATAGACGACATAACCACCTGGTCGGGA
+TAGACGAAAAACGCCGCTGCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTGCTCGG
+AGGGCTGCCGTGGACCTAGTCTTTCCCGCCCTGCCGTGGACCTAGTGTTAGGTGCTCTGC
+CTGGACCTAGTTAGTCTGCTACTAGGTCCACGGC
+>ds2020-328_780
+GGTCGGGATAGACGCTAACATCAGGTTTTCACGTCTATCCCGACCAGGGCCCGTATACGT
+CTATCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCCACCACCCACTATA
+ACACTAGGTCCACGGCAGGGCAGTTTTCACTAGGTCCACGGCAGGGCGAACTAAACTAGG
+TCCACGGCAGAGGGCGCATGACTAGGTCCACGGC
+>ds2020-328_781
+GGTCGGGATAGACGGTTCATTCGCCTGGTCGGGATAGACGATGACTCCTCTTGGTCGGGA
+TAGACAGGGATGATCCGTCTATCGGACAGAGAGCCGTGGACCTAGTTGTGTAGAGGGTGG
+ATGACTAGGTCACGGCAGACTGATAAGGACTAGGTCCACGGCAGGTGCTTTCTGACTAGG
+TCCACGGCAAGGCGATCGTCACTAGGTCCACGGC
+>ds2020-328_782
+GGTCGGGATAGACGACTGGTCGCCCTGGTCGGGATAGACGGATCTCCCCGCTGGTCGGGA
+TAGACGGTTATTGCGCCTGGTCGGGATAGACGAAGAGGTCCAGTACGTCTATCCCACGGA
+CAGAGAGCCGTGGACCTAGTCCATGCCCCGTTGCCGTGGACCTAGTTGGGTTGCTGCTGC
+CGTGGACCAAGTGCGTAAGTACTAGGTCCACGGC
+>ds2020-328_783
+GCCGTGGACCTAGTCAATGGCTCCCTGCCGTGGACCTAGTGCATACTTCCCTGCCGTGGA
+CCTAGTGCTGCAACGACTGCCGTGGCCTAGTGTATGGTCTGGAAAACTAGGTCCACGGCT
+CTCTGTCCGAATTACGGCGGTCGGGATAGACGTACAGAACTGGTGGTCGGGATAGACGGT
+TACACTCACTGGTGGGATAGACGCACTACCGACC
+>ds2020-328_784
+GGTCGGGATAGACGCCGCTTTGTGTTTCAGGGTATATACCCACCTGCAGCCAACCGTACG
+TTTGCCTCTTGGTAACGTGATCAGTTCCCAAGTGTCGTTCTTCTTTAGAGCCTCTATTTC
+TTCTATCATAGCTTTCTTCCCCTGAGGATGATTGAGGGCTTCTTCAAAATTGGGAGACCG
+TCTATCCCGACCGCCGTAATTCAGATCGGAAGA
+>ds2020-328_785
+GGTCGGGATAGACGGGCCGTAACAGCAGAAGCAAGGCTTAGATTACCAGATCGTGGACAC
+AATCTTCCTAGAGATGGAGAGCCCCCTGCCTCGCCTTTTCTAGCCTCTCCTTCTTGCTTG
+CTTACCTAGCTCTTGTCTTAGTGACTCTTCCTCTTTCTCATTATTCAGAACAGTGGAGCT
+TTCGATCATTTGGTTCGCGCGTCTATCCCGACC
+>ds2020-328_786
+GGTCGGGATAGACGTTTAGGGGCAATACAGTCAGGCAGCTATCTACCGATCCTCTCCTGC
+TTCTGCTTGATCTACGTCGTCTATTACCAGTCGCAGAGGCATACCCTGAGTCATCAGTAG
+TCCTCTGCTTATTGTGTCGCGTTAACGGCGGACGCTGGTCGCCTCTGCTCACTTCACTTG
+TGGAAGCACCTCCCATTCTCGTCTATCCCGACC
+>ds2020-328_787
+AATGGCACAGTCATTTCTCTTCTCGCTTTCTTTCCAGCACGGGGATTCGCCCGACGATCT
+TACCGCTAGCCAACATTTGATTTTTTATTAATAGGAATTTCTCTCTTCGTCTTGATGCCT
+GCTATCTTCCTAAACAGGATAGAAAGAAAGCCCCAACCTCTTCCTTCTTATACTAAGAGT
+ACACTTCAAAATAGCCCCCCCGCTATCCCGACC
+>ds2020-328_788
+GGTCGGGATAGACGGGGTTGGTACATTGCAGGCTGTGTATGAGGAGTCAAATTGTTTTCA
+TCTTGTGATGGAGTTGTGCTCTGGAGGGCGCCTGATTGATCAGATGGTTCAGGAGGTTCA
+GTATTCAGAGCACCGGGCTGCCAAGATATTCAAGGAAGTGATGCTAGTTATCAAGTATTG
+TCATGATATGGGACGGATGCGTCTATCCCGACC
+>ds2020-328_789
+GGTCGGGATAGACGCAGGATGGTATTTTCCCTAATTAGGAAAGATTGAATGTGTTATATC
+ATGTTCTTGGCTGCTGAAAGACGAGTTTTTTCAAAACCTGCTTCTCGCCCTGAGCTGAGC
+CCTACCACAAGAATACGTTTTAGGACTAGCAGATCGACTTGTTTAGCCCTTTTCTATTGG
+TTTAGTGAATCCCACCAATACGTCTTCCCGACC
+>ds2020-328_790
+GGTCGGGATAGACGAGTTATTTCCATGGTCGGGATAGACGCTATAGGGTGGTGCTTCGTC
+TATCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGACCTAGTCTGGGATGGGGGCCG
+TGGACCTAGTAAGCACCTACCTGCCGTGGACCTAGTGGTCCACCTCCTGCCGTGGACCTA
+GTTCGTTAGGGGGTCGGTCACTAGGTCCACGGC
+>ds2020-328_791
+GGTCGGGATAGACGTCGAACGGACTATCGCATATTGTGTGTTATCCGGGTTTGATAGGTT
+CCGACCGTTGGATCGTTTCCAAATTGAAGTAGGTTGTACTAGGTACTCTTAGAACCGTGT
+AGGTTTTTGCGGATCGTGAATCGGAGCCCCGGTTGTTCCGATTCATTAACTTAAAGTTTG
+GAGTTTTACGGTAACTGTACGTCTATCCCGACC
+>ds2020-328_792
+GGTCGGGATGACGGTTATATACGGTGGTCGGGATAGACGTGGATACCCCGTGGTCGGGAT
+AGACACTTGCGACCCTCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTGCTGCCGCC
+CCCGTGGACCTAGTGATGATTATCCTGCCGTGGACCTAGTGGCCACTCTCTGCCGTGGAC
+CAGTCACACCCCTGCACTCACTAGGTCCACGGC
+>ds2020-328_793
+GGTCGGGATAGACGCACGGTTACCTGGTCGGGATAGACGTCAGAGTGCCCTGGTCGGGAT
+AGACGAGTGTAAGTTTACGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTACCGGTCA
+CCTGCCGTGGACCTAGTCCTATCTCCGCTGCCTGGACCTAGTTCATCATCGGATTAGACA
+CTAGGTCAGGGGACGGAACACTAGGTCCACGGC
+>ds2020-328_794
+GCCGTGGACCTAGTAAATTCAACAATAGGTCAACGGCAGGGGGGGAATGACTAGGTCCAC
+GGCAGGTGAGGTTGGACTAGGTCCACGGCAGGAGCCAAGGAACTAGGTCCACGGCTCTCT
+GTCCGAGGATAGACGGGATTCACACTTATCGTCTATCCCGACCAGGGCGAATCAGCGTCT
+ATCCCACCAGGGGTACGTACGTCTATCCCGACC
+>ds2020-328_795
+GGTCGGGATAGACGCCACAAAGGGGTAAGGGGCAGGAAGGAGCCGCTTAACAAGGCACTT
+CCATTTCTCGCTCATCCGCTCGCAGCTAAAAAGCTATCCTTTGCTTTGATCCATTACTGG
+TTCCGCAGGCTCAAGCTTACTTCATTTTCCATCTCTCTATTTTTCTTTCTATTTTCTCGC
+CCAGCTAACAACAGCAACCGTCTATCCCGACC
+>ds2020-328_796
+TAAAGACAAAAAAAAGAACAAGTCAAAAATACAAATTTATTGAAGCAGAAGAGGCTCACC
+TGATACAAAAATTGAGCATAATTTCCAAGAAACAAAGGGTTGCCTGGATTTTCCTCAACC
+AGCTTCTTGTAATGCCCCTCAGCCCCATGGTTGTCTCCTCCATCATCACCAGATCCTTCC
+CAATTAACCTCTCCTACGCGTCTATCCCGACC
+>ds2020-328_797
+GGTCGGGATAGACGGTCGTCCTGCCTATTTAAAGTTTGAGAATAGGTCGAGGGCGATGCG
+CCCCCGAAGCCTCTAATCATTGGCTTTACCCGATAGAACTCGTACACGGGCTCCAGCTAT
+CCTGAGGGAAACTTCGGAGGGAACCAGCTACTAGACGGTTCGATTAGTCTTTCGCCCCTA
+TACCCAAGTCAGACGCGTCGTCTATCCCGACC
+>ds2020-328_798
+GGTCGGGATAGACGCTCAGATCACCTTCATCGGCTATGGCGAGGATGAATTTGGCTACCG
+CATTTGGGATAACGAAAACAAGAAGGTGATCCGCAGCAGAGATGTGATTTTTAATGAAAG
+AGTGATGTACAAGGACAGACATAAACACGACGCCAGCAACACAAAGCAGAGTGTGCCAAT
+ATTTGTAGATGCAATCTTCGTCTATCCCGCCC
+>ds2020-328_799
+GGTCGGGATAGACGTATGGGATGACTCCAGGTTCATATTAGGGAAAGGAGAGTGAGGGGA
+AGAGGGGGCAGCCCTCGGCCCGATCATCCAATTCGCTCCAACAGATAGGCATGGTTCTGT
+AGTCAAAGCAACTTCGTCACTTTCGTGTACCCATCGGACGGCAGCCCTTTCGGGGGTTCC
+TTAGGGACCGATTCACTGCGTCTATCCCGACC
+>ds2020-328_800
+ATCCACCACCTTCCTCCGGTTTGTCACCGGCAGTCTCTCTAAAGTGCCCATCTTACTGCT
+GGCAACTAGAAACGAGGGTTGCGCTCGTTGCGGGACTTAACCCAACATCTCACGACACGA
+GCTGACGACAGCCATGCACCACCTGTGTTCCGGCTCCCGAAGGCACTCATAGTGTCAAAA
+CCTCCCACTGGTGGTCCGCGTCTATCCCGACC
+>ds2020-328_801
+GGTCGGGATAGACGCTGACAGATCCTTTGTCTTTATTTGACCCCAAGAATGGATTGGATC
+GAAACGACTTTCCTGTCGAACCCCTTTTTGTCTGTATGAATTTCTGACCGCGCGGAATCT
+CCATAGCCAATTTTCCATTTTTGATTATGAAATCATAGGGTGCCTTTGGTAAAACTCTTA
+TTTCACACAATCCAGGAACTTCCATAACGTTG
+>ds2020-328_802
+GGTCGGGATAGACGGCTGGCGTCGCTTCCCGGCAAGTACCTTGCTTTTCCGGCGCTGGAA
+TCGATACCACTCGGTCTTCTACGGCGTCGTTTCATGGAGAGTTTCGGGTTCAGGGTCGTA
+GAGATTTTGGAGTGTCTTTGAGAACTAAAAGGTTTCGTGGGCAATCGAATTATGGATTTT
+GTGATGACGGGCATGATTCGTCTATCCCGACC
+>ds2020-328_803
+GGTCGGGATAGACGATACTAGCGCGTGGTCGGGATAGACGAACAGATTACCTGGTCGGGA
+TAGACGCAGGCCTAGTATTCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTGTACAA
+TCCCTGCCGTGGACCTAGTGTATAGTCCTTGCCGTGGACCTAGTTCTAATCCTCCTGCCG
+TGGACCAAGTCGACTTTTACTAGGTCCACGGC
+>ds2020-328_804
+GGTCGGGATAGACAGCAAGCCGAGTTGGCGTGTGGCAATTGATAACAGTGTATCAGTGGG
+TAGGGGGCAATAGGGTTATCCCTTTCTGTTGCTCCCCCCCACTGGGACACTGCCGATTGT
+TTGCGCGAATTCGCAAAAAGAAAAAGGCCAATGCGTTTGGTCGCTGGGTGTTAACATAAT
+TGCAAGATTGGGAGATTTCGTCTATCCCGACC
+>ds2020-328_805
+GGTCGGGATAGACGCATGGAGGAGCTGGAGAGGGAGAGGGGTAGAGCGAGAAAGATGAGA
+AAGGTCCATGGAAAGACTGTGATGAAGAAGAAGTAGTGGCTGGTGTTAAACAAGGACATG
+ATGGCTGGTTGGAAATGTTTAGAGAGAGCGAGCGAGAGAGAGCACGTAGCGGGTTTGTTT
+TTCGGGGGGGGAGGGCTTCGTCTATCCCGACC
+>ds2020-328_806
+GGTCGGGATAGACGACCTGAATCGGTGGTCGGGATAGGCGCCACACCTCAGCACATCGTC
+TATCCTCGGACAGAGAGCCGTGGACCTAGTTTGGTGCCGAGTGCCGTGGACCTAGTCGTA
+CTGCCTGTGCCGTGGACCTAGTGTGATCTCCCTGCCGTGGACCTAGTCGTAGATCCCCTG
+CCGTGGACTTAGCTTGATACTAGGTCCACGGC
+>ds2020-328_807
+TTAAAGGCACCTAAGGGTGTACTAAGTGGAAAAGGATGTGGGATCGCGAAGACAGCCAGG
+AGGTTGGCTTAATGTCAGCCAAACTCCGAATGCCATCAATTGTGTTGTGCGGCAGTGAGA
+CTGTGGGGGATAAGCTTCATAGTCGAGAGGGAAACAGCCCAGATCGCCGGTTAAGGCCCC
+TAAGGGTGTACTAAGTGGAAAAGGTGTGGTCT
+>ds2020-328_808
+GGTCGGGATAGACGTTATTGGGCCCTTCACGCCTTCCCTAGACCCCTCCAAGCTCACTCT
+GCAATCCTTCTTCCTCACTGAAAAGCTCACAACTTTAGCAATCTCCTCCAACTTCGATAT
+GATCGTCGAAACCGGGGCACCCGACACAAATCTCGCCTCCTCACCGCGCTCCTCAAACAA
+CCCACTAAGTCGTCTAACCCGACCGCCGAATT
+>ds2020-328_809
+GGTTGGATAGACGTTGGGAGGCAGTAGGAATGAAGGAGGCGGGAAGCTACCGCTTCTGGA
+ATGCAAGCTTATCCTTGACTTTTTTTTAGAGCGTACCGCTATAATAAATAAAGGTTTATG
+GATGAAGTAATCGGAGTGACAAATGGTTATGGTTGCGGAAACCAGAGAAAGTCGGTTACC
+CTTTGAATCAGATACCGACGTCTATCCCGACC
+>ds2020-328_810
+GGTCGGGATAGACGGGCGTGCGCCGTGGTCGGGATAGACGGTACCCGGACCTGGTCGGGA
+TAGACGAATCAATGGAGTGCTGGCGTCTATCCGGACAGAGAGCCGTGGACCTAGTTTGTC
+AGTTGGTCCACGGCAGTGTTGCCAGTACTAGGTCCACGGCAGGCACTTGGTTACTAGGTC
+CACGGCAGGCGATACGAGACTAGGTCCACGGC
+>ds2020-328_811
+GGTCGGGATAGACGGCCATATACCCTGGTCGGGATAGACGTTATTTGTGGGCATCGTCTA
+TCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTACGGCACGGGTGAATT
+AACTAGGTCCAGGCACGGGGAGAACAACTAGGTCCACGGCAGCAGGCTAGTAACTAGGTC
+CACGGCAGGCTGTATAGGACTAGGTCCACGGC
+>ds2020-328_812
+GGTCGGGATAGACGAGCAGCTCACCTGGTCGGGATAGACGGCCGTAGTGTGTTTCCTCGT
+CTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTGGGTAGAGATCTGC
+CGTGGACCTAGTTGCTTATGGGGGCCGTGGACCTAGTTTCTTTACTCCTGCCGGGACCTA
+GTATTAACGCTCCTGGACACTAGGTCCACGGC
+>ds2020-328_813
+GGTCGGGATAGACGTACTAGGTGCCTGGTCGGGATAGACGAATTCATTGGGTGGGCGCGT
+CTATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCGTTACCCCCGTGC
+CGTGGACCTAGTCGCTTACTTGCTGCCGTGGACCTAGTAGTTTGGGGGATATAACTAGGT
+CCACGGAGCATAAATGGAACTAGGTCCACGGC
+>ds2020-328_814
+GGTCGGGATAGACGAACATTTTGGATCGCCGTCTATCCCGACCATACATCAATTACGTCT
+ATCCCCACCGCCGTAAATCAGGACCTAGTGAGGATTTAACTAGGTCCACGGCAGGATCGA
+TTATACTAGGTCCACGGCAGAGCAACTAAAACTAGGCACGGCACGGGCATATTACTAGGT
+CCACGGCCCCGGGTTACGACTAGGTCCACGGC
+>ds2020-328_815
+GGTCGGGATAGACGGTATTGATGGCTTTTTTGTAGTTGATGGCTTTTTGTAGTTGATGGC
+TTAGGGTCTCTAGGCCATTTAGCCTTTTGAAAACGCTTAGGCAACATGACGTGACTTCTT
+GTCTCTTTCAGCTGTTGTCTTCTCAGCCATACTCCTCCAGCCAACTTCTCTACAGCCAAC
+TCTTCATAGCCAACTTATGCGTCTATCCCGAC
+>ds2020-328_816
+GGTCGGGATAGACGGGCCATTACGATGAGGGGTTGTTGGTCGTTTCAAGGAGCGAGCTGA
+TCAGAAGCTATCGTTCGAGGTGGGGTCGTCACCGAACAGAGAAGAGCCGAGGATATGGTG
+AACCGACTGACAGTAATGTCGGAGACGGGAAGCTGGGGAAGCCGATCAATGAACTGGCGC
+GGGTGAGAGGAATTAGGCGTCTATCCCGACC
+>ds2020-328_817
+GAATTACGGCGGTCGGGATAGACGAAAAAAGGACATTATGCTGCATTTCTATCCAGAGAA
+TGCCAAGTATGAGGCGAAGGAGAAGCTAAGATGGCTAAAGTAAGTGGGGAGCGTGAAGGA
+CTATGTCACCACGTTCACCAACCTATTGTTCGAGGTGCCTAGCATGACGGATGAAGACAA
+ACTCATGTACTTCATGAGTGGCCTACAGAAT
+>ds2020-328_818
+GGTCGGGATAGACGCTGATTAGCACTCTAGGTCTCTTATCTTTGATCGCGATGTATCGAT
+GGCTTTCTTTCCGAAAGGTAAAGATGCCTAAAAGTTTCTTTCATCGCTTTTTATGTTTTT
+TAACTATTTTAGTGGTCGTGATAGTCAGAGATTGGGTAGTGCGCTTCATTGCCGTAGAGG
+CAATCTTCCCTATATCTCGTCTATCCCGACC
+>ds2020-328_819
+GAATAGTCAGACTAGCCAACCGGGGCTTCCTTCACAGGCCAACAAGCAATACCGCGCCAA
+CGAGAGAAAGCCGAAAGAATCTTTCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGGGC
+GGCGAAGGAATACACTAAGGCAGGTTTCAGAGCTCGATAAAGCAGACTAATACTTCTAGG
+TAACTAAGCGCTCATCGCGTCTATCCCGACC
+>ds2020-328_820
+GGTGGGGATAGACGGTCCGGCTCAGTAGCATAAAAGAAAACGGTAGCATAAAAGGAAATG
+GGGCGGCTAAGTGGGATAGCCGAGCCAGAAAAAAAAATAGATTTAGAAGATATAAATGAG
+TAGAAAAGAAAGGAATACTTTTAAAATATGACCTGATCCACCATACATATTAGGTTTGGT
+GGAATCAATTTTATTCCTACTTCAAGCATTG
+>ds2020-328_821
+GGTCGGGATAGACGATCGCCAGCTCTATCTGCTGCTTGGGCCAAGGCTCTCATGGTAGGA
+TATATGTTGGCAGTGACCACCGCCTGAATGTCTAACCACAGACCCTCTTCAAAACGTGTA
+CACTTGTCTTCCTCTGTGGTGACCAACTCAGGTGCAAACCTGGACAGCTCATTAAACTTG
+TGCTCATACTCCAACACCGTCTATCCCGACC
+>ds2020-328_822
+GGTCGGGATAGACGAGCTGCCTTCGAGCTTTCTACTACCATCCATTGTCCTTCTTCTGAG
+GAGAAGAGCCATTCATGAGCCCGAGTCTTAGGCACAATAAAAACCCCACAATGATATGCA
+AATGGACCAGATGATTCCTGGGCATCAAGAACTACAGCTCTGTAACTGAAACGGGAATCA
+CCACCCAAAGTAAGCTGAAAACGATGACCTG
+>ds2020-328_823
+GGTCGGGTAGACGGTCCCTCTGCTTGTTTGCCTCTGCATTAACGTTGTTAACTGCTATGC
+CGTGCGATAGCGCGAATGAGTTATATGCCGATGCTGGTCCTAGCGTAGCGCCATCAAAAG
+CCCCCGAGCAATGCATGCCATCGTACGTGGCATAGCCAACCACCAGGACATGCGGTGGTC
+CCAACACTGACCAACTCCGTCTATCCCGACC
+>ds2020-328_824
+CGGCGGTCGGGATAGACATCATAAGTGAGTGTGGTTGATGCAGTTGGGAGGAGGGGCTGT
+GCGAAGCGTGAGTTATTGAACTTGGAATCATCAAGTTCTGGTATTTCCAACTCGTCAAAC
+TTAACAAAACCTGCACCCTGTTTAGCTACTCTGAACGTCCAAGCATTCTTCCCAGTGATT
+AAGTCATCCGCATCAAACGTCTATCCCGACC
+>ds2020-328_825
+CTTACATCAATTGCCCAGCTGTTGTCTTTGACTTCAATAAGGGACTACCCTTGACAATAA
+TTAAGATTGGAAAGAACGCTAACGCAATCTCCGCTTGCAATCAAAGGCTTTTCAATAGGG
+AGGGGATAGACGGCATGCGTTCTTAACGTCTTCCCGACCAGGCGCCCGAGACGTCTATCC
+CGACCAGAGCTTACATGCGTCTATCCCGACC
+>ds2020-328_826
+GGTCGGGATAGACGTTTGGTTTGGTTATGACGAAGATAGACGGGTTTCCAGAGAAGCAAT
+GCTGATCATTCCGTGTTCATAAAAAGGAGAAAAGAGGAAACTACTGTTCTCCTAGTGTAC
+TCAGTTTAGAACTCTAAATTAACAAGTAAAATTTAGATATTAGTAAGATATGCAGCGAGT
+ACGCTCGGCGAGTACGGCGTCTCTCCCGACC
+>ds2020-328_827
+GGTCGGGATAGACGGGCCCCTCCCCTAATCTACTATCAAAACGTTTAACTATATATACGT
+AAAGAAACACATGCACAGACGATATAGCCAGTCACCGAACCTCTTCCCCGAATGAGTCGA
+AATTGCTACAGCCCTAAACCCGACAGAACTGAACCGGATGTGTGTCGACGACGAGTCTCA
+GGACGATGAGTGACATGCGTCTATCCCGACC
+>ds2020-328_828
+GGTCGGGATAGACGTTACCTAGCCCTGGAGTAATGTATTCTATGAATAATAAATAAAGGA
+GTAATGTATTCTATGAATAATAAATATGAAGAATACTCTTTCAATCAAAGAAATATTTCA
+ACTATTTCCGTGTTCGTATTTCGAAAGTAAAAAAACGTAATAGGAATACAAAAGATAGGA
+AATTTATTACAGATGAATTCTTCATAAATTT
+>ds2020-328_829
+GGTCGGGATGACGGCTTAGGGGACTAGGGACTGCCCTACGGCTCCCACTGAACCTGGAAT
+GCTCGGTCCTGATTCCACAAAAATTCACAAGTTCCCAACCCAGAAGTCACTTCTTGACAG
+CGAACTTGGGGGACTACTGTTTACACCATAATCAACCAAACATATCCAGCATCAAAACAA
+CTCGCACTGGCAAAATACGTCTATCCCGACC
+>ds2020-328_830
+GGTCGGGATAGACGCTTACCTTCCCATGGTGAGGTTAATTACTTTTCTGAGTACTTGAAA
+GGTAAAGCGATCGATGATGATGATCTATACGTTGATCCTATTTGTTTAGTTTCTATGGAT
+AAGTATAGACATATGATAAAATCCCAACTTACACCAGTTGAAGATAACAGTATGATGTTT
+GAGAGGCCTCTGGCAGCCGTCTATCCCGGCC
+>ds2020-328_831
+GCCGTGGACCTAGTCTGATATCCCCTGCCGTGACTAGTTTCCCACCGTCTTAGGCACTAG
+GTCCACGGCAGGACACGACGAACTAGGTCCACGGCAGAGTTCGCAGCACTAGGTCCACGG
+CTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGACATTCCTGCCTGGTCGGGATAGA
+CGTACAACCACCATGCTCGTCTATCCCGACC
+>ds2020-328_832
+GGTCGGGATAGACGAACTGTTCCACTGGTCGGGATAGACGTAAAGGTGGTTTGTCCGTCT
+ATCCCGACCGCCGTAATTCACGGACAAGAGCCGTGGACCTAGTCCGAACCCCCCTGCCGT
+GGACCTAGTTCTAAACTTCCTGCCGTGGACCTAGTTTTAGTGCACCTGCCGTGACCTAGT
+TCAGCACCGTCTTTGATACTAGGTCCACGGC
+>ds2020-328_833
+GGTCGGGATAGACGATACATACCCCTGGTCGGGATAGACGACACGATGGGGTGTTTGCGT
+CTATCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTCATAGAGCCGTGCC
+GTGGACCTAGTGTCTTTCCTGCTGCCGTGGACCTAGTGTCCACCACGGGCCGTGGCCTAG
+TTCCTATCGCACTTATAACTAGGTCCACGGC
+>ds2020-328_834
+GGTCGGATAGACGTACGGGCCTTGTCGGGATAGACGTGACGAATGCCTGGTCGGGATAGA
+CGGACTAGCCCCCGAACACGTCTATCCCGGACAGAGAGCCGTGGACCTAGTCATACATTA
+CTTGGTCCACGGCAGCCAGCTTGACACTAGGTCCACGGCAGGGGAAATGTCACTAGGTCC
+ACGGCAGGTCGAATGGCACTAGGTCCACGGC
+>ds2020-328_835
+GGTCGGGATAGACGGAGACCACGTATATCCCGACCAGGAACCACCAACGTCTATCCCGAC
+CAGGTGAGGCCGGCGTCTATCCCGACCCGGACAGAGAGCCGTGGACCTAGTGTGAGGGGT
+ATTAGGTCCACGGCAGAGAGTAGCAAACTAGGTCCACGGCAGGCTACATAGTACTAGGTC
+CACGGCCCCGCATGTTTACTAGGTCCACGGC
+>ds2020-328_836
+GGTCGGAAGACGGTCCATTTCGGTGGTCGGGATAGACGAGTTCGCTGCACCGTCTATCCT
+CGGACAGAGAGCCGTGGACCTAGTATTCTCTAACATGCCGTGGACCTAGTGCGCTCTCAC
+CTGCCGTGGACCTAGTTCCGTATCCTCTGCCGTGGACCTAGTGTTCTACCCCTGCCGTGG
+ACTAGAGGTCTTGAATTACTAGGTCCACGGC
+>ds2020-328_837
+GGTCGGGATAGACGCCCTCATCACCTCCACACGTCTATCCCGACCAGCGGTGTGTATCGT
+CTATCCCGACCGCCGAATTCCCGGACAGAGAGCCGTGGACCTAGTTAGTCCATACCTGCC
+GTGGACCTAGTACCCCCCCCCCTGCCGTGGACCTAGTCTTGAACCCCTGCCGTGGCCTAG
+TCTATACCAGTCTAGCCACTAGGTCCACGGC
+>ds2020-328_838
+GGTCGGGATAGACGCGCCGTGGTTGGTCAAGTGACATTACAAAGAGACACGGCCTCCTTC
+CGCCATCCTCCTTCTTTACGCAGCCCGCCGAGCGGACAGAGGTAGGGGCTTTGAAGGAAC
+TATCTTAGTAGCAGAACTATTAATAAGAATAACTGCTCACGCGGCAGATCGAAGTAGAAG
+CGTCAAAGGTCATAACTCGTCTATCCCGACC
+>ds2020-328_839
+GGTCGGGATAGACGGGGTCAAGTCCTTTTGAGTTGGCAACAGGACAACAACCTTTGACAC
+CGAACACAGTGGTGTCAGGCTACACGGGGAGTAGCCCAGCTGCATACAAGACAGCCAAGG
+AGTGGCAGGTGACTAATGAGCTGGCTCGGGCTCAATTGGAAAAGGCGACTAGGAAGATGA
+AGAAATGGGCTATAGACGTCTATCCCGACC
+>ds2020-328_840
+GGTCGGGATAGACGTCTGTTCCCACTCCACTTGTTTAGTGTATAATCCTCAGTAGCTCTT
+ACCAACGTTTCTCTTGTTAGCTTCGTCTTTGCCCTGTAATTATGATCGCTCTTAATGTTT
+ATTTTTCCTTTTCCATTCCATGGTTCCTTAGTCCTCTTATCACCTATTAGGCCAAGTCCG
+CCACAGCTTACCTTTATACAGTCTAGTTTT
+>ds2020-328_841
+GGTCGGGATAGACGATATCACTGGCTGCGTGCTACCCCGTGATCGCCAGCTGTTCCTGCC
+TGGGAGAGGAGACCTCATTGTCAGCCTTAAGGTAAATTCGATCGATCATGAAATGTTTTG
+TTATGTTCTTTTTGAACGGTTCCTTCTTTATACCAAAAATTATGCAAGCCCAGTTACCGT
+CTATCCCGACCGCCGTAATTCACACGGCAG
+>ds2020-328_842
+GATCTTAATTACGGCGGTCGGATAGACGACCCCCTCCCCTAGCTTTCGTCTCTCAGTGTC
+AGTGTCGGCCCAGCAGAGTGCTTTCGCCGTTGGTGTTCTTTCCGATCTCTACGCATTTCA
+CCGCTCCACCGGAAATTCCCTCTGCCCCCACCGTATTCGTGTCAGTACCCCTCCTGTCAG
+GCCCAAAGACAACAACCGTCTATCCCGACC
+>ds2020-328_843
+AATTACGGCGGTCGGATAGACGCCAGTTGCTTGTGAAGGGAGGGATCGGGTGGAAAGATG
+TGAAGTGTTTGGGAAGTGGCGGGCCCGCATGGGGATGGCGGGGTTCGAGTTGAGGCCCAT
+GAGCCAAAACATGACCGAGGTTTTGAAGCAGCGACTGAGTTCGGGTAATAACCGAGTCAA
+CTCGAGGGCTGTTAATCGTCTATCCCGACC
+>ds2020-328_844
+AACGGCCGCCACTAGATATGTTGGGTTTTTGGAAGTGAAGGAAACTGAGGAGAAGAGCAA
+GAGAATTAGGGTTGAGGAGGAGATGAGGGAGAGACTTGATGAGAAAGAGAATGAGCTTAG
+TTTGTTCAAGAAGAAAATTGAGGAATTGGAGTCGGTGACCACCAAGAACGGTGTTGAATA
+GTGGCGGCCGTTGCTGTGTATTAGATCGGA
+>ds2020-328_845
+GCCGTGGACCTAGTTAGGAGAGTAATTTCGGATGGTGTTCTTTACTGCTCTCTGATTTTC
+TGATAAGATTATCGCCGGCGTGGCTGCTACTCCCTCTGAAGCCTCTACTGCTGGCTTCGC
+AGTCAGGTGCAATAGATCCCTTGGATCTATCATATTCTCCCAGATATAATTTACAAGGCC
+CCTTCTTATCACGTTGTAATTCTTATACAC
+>ds2020-328_846
+GCCGTGGACCGAGTAGTTAGCCATTTGGTCCACGGCAGAGGCCAAAGAACTATGTCCAGG
+CAGGGGGAGATAACTAGGTCCACGGCAGTGTCTACCCGACTAGGTCCACGGCTCTCTGTC
+CGATCGGGATAGACGGTGTGCGTTGGTCTATCCCGACCAGGGCATTCTGACGTCTATCCC
+GACCAAGGGCCAATAACGTCTATCCCGACC
+>ds2020-328_847
+GGTCGGGATAGACGTGGGAGCCTAGTGTATCCTAGCTCCCTGTACGTTAAGAGAAAATGT
+ATTAATTACGTCCGCTCCGACTCTGCATGCGTTTACACCCTGCCACTCATCACTGTCTTC
+TTCGACGTGTATCAGGACGTGGGATGCTTGATGGCGGTCGACTGCATTAAGCCTAGCACC
+CCTACACGACTCATTTCGTCTATCCCGACC
+>ds2020-328_848
+GGTCGGGATAGACGGACCCTGTTGATTGGACTTTGAAAACTGAGTCTCAACCCGTATCTA
+TTCAACGTAGTTTAAATGATTTAGATTACATTCAGCAGTATTCTGATGGCACCGTTAAAA
+TTAATTTTGGTAATCAACCTAAGCCTCTCGTACAGCCTAAGTCTACTGTCCATTTGCCGC
+AGTTACCCACCCGCGGCGTCTATCCCGACC
+>ds2020-328_849
+GGTCGGGATAGACGATTATTATGTGTGGTTAGTGGCACTTGAATTGGTTGAGGGTAAGTT
+TGGATGATCAAGAATGGAAGAAGAGGATGGTGGTTGGTGAGAGACTTTGTGAGCAAAAGG
+CCTCAAAAGGTAAGAAGGAGGTGAAGGCCCCAAACCCAAACCCCCTCCTCCTCCTCCAGC
+TGATCTCATGAGGGCTCGTCTATCCCGACC
+>ds2020-328_850
+GGTCGGGATAGACGTCCCCCCGCTCTGTCTTTTCTCGCTTTGCTAATCTTCCCCTCTAAC
+GCGGGCCGGGCGCGGGAGTAAGAAACCTAAGAGAGGACGCTCTTCTCTTAGGTCCTTTTT
+TTCAGTGCAACACAGGAAAGCGCCCTCTTTTTGTTTTGTCAAACCTGCAGCTTTCCAGAT
+TTTGTATTGAACGCAGGCGTCTTCCCGACC
+>ds2020-328_851
+GGTCGGGATAGACGTTGCAAGCTCGTGGTCGGGATAGACGTTAACATTCACTGGTCGGGA
+TAAACGTTCGGCCCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTTCTTATCGTCCTG
+CCGTGGACCTAGTCCTCCTGCAGCTGCCGTGGACCTAGTACGCATCTACCTGCCGTGGAC
+CTAGACTCCCGACCCTACTAGGTCCACGGC
+>ds2020-328_852
+GGTCGGGATAGACGAAATAACTCCCTGGTCGGGATAGACGTATAGTGGCCCTTTCCGTCT
+ATCACGGACAGAGAGCCGTGGACCTAGTGCTTCCTCGCCTCTAGGGTAGTCAGAATGAGA
+CTAGGTCCACGGCAGGGAAAGACTACTAGGTCCACGGCAGTGATGGAGGTACTAGGTCCA
+CGGCAGGGGGCATGGGACTAGGTCCACGGC
+>ds2020-328_853
+GGTCGGGATAGACAGCACTTGCAGGTTATCGTCTATCCCGACCAGGAGTCCTTGTCGTCT
+ATCCCGACCGCCGTAATTCTCGGACAGAGAGCCGTGGACCTAGTGTCCTGCTGCTGCCGT
+GGACCTAGTCAATTCTAAACTGCCGTGGACCTAGTGAGTCGCCCCCTGCCGTGACCTAGT
+ACACAAACCCATCCTGACTAGGTCCACGGC
+>ds2020-328_854
+GCCGTGGACCTAGTTCATATATTCCTGCCGTGGACCTAGTCAGCTAAGTACTGCCGTGGA
+CCTAGTCTTTCACCGCCTGCCGTGGCCTAGTGTTTACTGGTGTGCATACTAGGTCCACGG
+CTCTCTGTCCGTGAATTACGGCGGTCGGGATAGACGGCTGTGCCCAATCCGCGTCTATCC
+CACCAGGCCTGTCTTACGTCTATCCCGACC
+>ds2020-328_855
+GGTCGGGATAGACGAGTTGGTGCATTAGAGGCGACGCTAAACCATCGTCGTTTAATGAAT
+TCTCTAGAAACGGAGAATTATTTGTTAGTGGTGATTATGAATCCGCCACTGATAATCTAA
+ACTCTGAGGTCCAACTCGCCATTCTTGACGAGCTGCTGCAGCGCTCTACTTCGGTACCCA
+GGGGTATCCAGGGCACGCGTCATCCCGACC
+>ds2020-328_856
+GGTCGGGATAGACGAAAGTCCCATATTGCGTCTATCCGACCAGAGATGATCATCGTCTAT
+CCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTCTATGGTGGCCTGCCGTG
+GACCTAGTACTTATTCCCCTGCCGTGGACCTAGTTCCTAAAACCCTGCCGTGACCTAGTC
+ACATAACTGCTACCGTACTAGGTCCACGGC
+>ds2020-328_857
+GGTCGGGATAGACGCATCCAGCTCATCGCACAACTCCTTTGCCATGCCTTCACCAACCAC
+TAGACGTCGACGCACCTTGCGACGCATGCGCTCGAATTCGAATGTGACGACAGAGATGGA
+CTCCCTTGTGTCAATGTTTAACAACATACAAATCCTTGGACGCATTGATTCATATCACAA
+GTTGGATCCTGATCTGCGCACTGCGGACCC
+>ds2020-328_858
+GGTCGGGATAGACGTCGAGAGTCCATCCTAGTAGTATAAACAAAATAACCTCACTATATG
+ATCCCATAGTAGTAAGAGCATTCCAAAATGCTTTCCAGCTTAAAAACGAGACTGATGCTG
+TTTGGATCATACAAAACAGAGCTAAATCTGCCGAATATGGTGATAATCATCTTGCTGTTC
+TAGTCAGGGCGGTCGTACGTCTATCCGACC
+>ds2020-328_859
+CAGCAAGCGGACTGGAATCAGAGTGATAGGGCGTACCCCAACCAAAGAAAGATGGAGGAA
+GTGAAAACAGAATTCCACGATTCATATGAAAGGCCGCTACAAGACAGGCAATTCAAGTTG
+CGGCTAGGGGAAACCTTGGATAAGGGGGAAACGTGGCAAACTGATGATTGACCGAAGCGG
+ACGAAGAGGCAGTTTCTAGTGGCGGCCGTT
+>ds2020-328_860
+GGTCGGGATAGACGACCTCCTCCAGGCGCTCAATCTTTCCCACAGCTTCAGGAAAGTGCT
+TTAAGCCTATTATAGTCTGCACGGAGCTCTTTAAGCGAGGAACAATGACCAATAGTATGA
+GGAATTTCTTCAATATCATTGGTTTCCACATTCAATATCTTGAGGCTAGCAAGGGACCCA
+ATTGAGTCAGGAAGCGCGTCTATCCCGACC
+>ds2020-328_861
+GGTCGGGATAGACACTCGTACCAATTGGGATAGATTCTGGGCATCTAGGTGGGGTTGGGC
+GCCTACAGGTGCTTATCACTCCCAGTACGTTGATGATGCTCAGTACAGAGCAAAGGAAGC
+CACTTTACGCAACAAGCCTTTTGCTGTATCAACCGTGACGGAACGCAATCGTGATTTTTT
+CACGACACCATCGCCCCGTCTATCCCGACC
+>ds2020-328_862
+TGATTGAATTACGGCGGTCGGGATAGACGATATTGACGGCTGTGTAGGTCCTGCCCTTGC
+TACACGTCGTTATGTACACACACAAATCTCACCTACTCTGTAGGTTCGAGACGGCATAAG
+GAACCCCAAATGCGGGGGTTCGACGTGTTGAGCCTTAGCTGCTCTCGCGTTGCCACGGCA
+GGCAGGGGACTGATTCGTCTATCCCGACC
+>ds2020-328_863
+GGGTAAACGCTTACTGAAGGACGTCTTGCTGGCAGGGAAGAACGCCAAGAAGCACAACAT
+ACGTCTGCAGATGAGCAAGTGTGCGTACGGAGCTATAGCTGAATTCCTTCGTGTAGATCA
+CAAGCGCGGATCTAAGGGGCAATATCTGTCGAGGGCAATGGCAACTCTGGTGCACTCAAG
+AATAGAGTCGAACAACGTCTATCCCGACC
+>ds2020-328_864
+GGTCGGGATAGACGGGTCATGGCCTTCTATTTAGTCGATGCTTGTTTTTCCGGATAAGTA
+GTATTTTATCTTCAAGTTCAAGGGAGTTGTTGGAGTGCTTTTGTAAGTCCTGTTGGCGTG
+CTATAAAATTTCATTTGAATGATAGGCCAATCTAAGTCTTCCATGTCGGTTCGAGGGGAA
+GGAAGGTGCAAACGTCTATCCCGCCGCCG
+>ds2020-328_865
+AATTACGGCGGTCGGGATAGACGCTTCAGTGTGGTATTCATTCTCGTTCGGCTCTTGGAA
+TCACATCCAGCAGTGGTTGGAACAGCTCGCAAAATCCAACCACTTTACCTACTTCATTGC
+CCCCAACCGTTTCTCGTACCTCTATTGAAACAGAATGGTTTCATGTTCCTTCATCGATTG
+GTTATTGCTCTACTTCGTCTATCCCGACC
+>ds2020-328_866
+GGTCGGGATAGACGGCATTATAGGGTTAATGCAATTTCATACCAGTACATTGCTTGCTAG
+CATTGTGCATAATTTAAAAACTGCCCTAGGCTTGAAACAAAAATATGGACTATCTTAGGA
+TTATTGTGTCTGTTGGTTGGCAAAACTAGCCAATAGACGTGAATTTACTGCAATTTAGGA
+GACAGGGACGTCATTCGTCTATCCCGACC
+>ds2020-328_867
+GGTCGGATAGACGTCTAGTAGCGCTTGCATCTGTTCTTTTGAAAACTTGTTTTTGAAGAC
+AGCACCGTATGCATCAATAACTGCCTGCATAGAAGATATTGAGTGCTGGCTGTTAAAGTC
+TTCAAAGTCAAGACAGTAAGGTAGTCGTCCTGCTAGCACCCCCGACACGCGAGCGCTGAC
+ATTTGCGTCATTGGCGTCTATCCCGACCC
+>ds2020-328_868
+GGTCGGGATAGACGCGTAATAACTGTACATGACGATGAAGAGAAGTCAGGTTACGTGCTG
+TTGAAGAATGGTCTTAATGACTACGCCAATTACGTGGTCGAGAGATTAGGGATAGAGTTT
+GATATCCCAAATAGAGAAGAAATGTTCAAACGATTAGTGAATTCACTAACAAAACCAAAG
+AGAACATAGAAGATAGTTATTGATATCGA
+>ds2020-328_869
+GGTCGGGATAGACGGACGATTTGGGTGCAGGTATTGGTAGGCGCCGCAGGGACTCATCAG
+GCTTTGGTGGGCCAAGTCAGGGCCCATCAAAGAGGGGTGGATCCAGTTCGAGTGCTGCTG
+GTTGGGATCTTTTTAAACTGTGAATTTTGAGCAGGTTGAAAGTTGGGAAATATTCAATTT
+ACAAGGGAGAAAATTCGTCTATCCCGACC
+>ds2020-328_870
+TACGGCGGTCGGGATAGACGTAGTAGGTGGATGGTCTGGTTAATTGGGAAGAGGAGCATA
+AAAACAGGGTGTCTCCCAATTTGGCGGAGATGCCGGAGGGTCTGGTTTACGAGCGAGCTT
+CACAACTTTTCAGCAGGTCAATATCAGCTGGTAAAAGGCCTAGAAAGTTCGACTGGCGTG
+AAAACTGGCATATACCGTCTATCCCGACC
+>ds2020-328_871
+GGTCGGGATAGACGAGGCGGGCAGATTAGCGTAGATTTCTGAAGCCGTGTAGTGTATGTG
+ATGTTCACCAGATATTGCCTCTTTCGGTAACTCATCCAATCTGTTAATGGGTGAGACGTC
+AGAGAATGACCAGTCTGGGTGGCGGTCTATTAAACTTTCAACAGAATAAGAAATGTTATC
+TAAAGAAGCAAGGTGCGTCTATCCTGACC
+>ds2020-328_872
+TGAATTACGGCGGTCGGGATAGACGTCAAGGGCTCCTGTCTTCAAAACGGTAACCCTTGG
+CAAGTGCATGTACAACATCGACAATCGCGCGTTCGGCATTGCCATATAGCAAAATATCAG
+CGCGGCTATCCATCAAAATGCTACGGCGCACTTTGTCTGACCAATAATCAGAATGGGCGA
+TACACCATGACATACCGTCTATCCCGACC
+>ds2020-328_873
+GGTCGGGATAGACGGGTTATCGGGGGGTCGGGGTAGACGGTCGCACGTGCTATATTCCCT
+AAAAGTGACTTGGTGCACACAACCTTCGCACCTTTGAGCCTAGCTCCCATCTCTACGGCG
+GTTTGCGCATCCGGCACAAGAAGCATTGATCTCCCTTTATGATTCTCGGCCACGTACCTA
+GCCAAGCCCACCAAGCGTCTATCCCGACC
+>ds2020-328_874
+GGTCGGGATAGACGGATCCCCCAACTAACAACTGATCCATCAACATTTCCTCGTCTCCTG
+TCATCATTTCTATTGTATTGTACTCAATGTCATTTCCCTTGTTAGTGTCAATTATATAAT
+AAGGCGATAGCAACCTGTTCACCATCTCCACTTCAATTAAATCTTCAGGAGCATCTGCTA
+TTAATGAGCCTCGGACGTCTATCCCGACC
+>ds2020-328_875
+GCCGTGGACCGAGTAGCCGCTCTCGTGCCGTGGACCTAGTCCCTTTCCCCTGCCGTGGAC
+CTAGTTTGACTCCCCTTGCCGTGGACCTAGTATATAGCTACATACTAGGAGGAGCCCGAT
+GACTAGGTCCACGGCTCTCTGTCCGAGGATAGACGGTAATTTGGCCTATCGTCTATCCCG
+ACCACCGCATCTTCTCGTCTATCCCGACC
+>ds2020-328_876
+GGTCGGGATAGACGATTTTTGAACATGGCTGGGCTGACTGTAAGAGAGTGCAGCATAGCT
+GAATACATTATAACGGGGAACCAACGTACAACGCCGTTTTTAATAGACCAGACCTTCACC
+AATTACTCAAGTGGTAAAAAAATTGTTGCTTACAATTCTGCGGGCGCAACTAACAATCAA
+GCACAAGTAACCCAAACGTCTATCCGACC
+>ds2020-328_877
+GGTCGGGATAGACGTTGCTGGTCGGGATAGACGTCCCAGGACACTGGTCGGGATAGACGA
+TTGGGGGGTTCCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTCAGCCGAGGGGTACT
+AGGTCAACGGCAGGTCGAGGGACACTAGGTCCACGGCACGACAGAGTAGACTAGGTCCAC
+GGCAGGCGAGGATGTACTAGGTCCACGGC
+>ds2020-328_878
+GGTCGGGATAGACGCTCTACACCCTTGGTCGGGATAGACGACAAGGAAGCCTGTCGGGAT
+AGACGCGAATCATCCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTGAGGAGTAGTGT
+GCATACTAGGTCAGGTGCACTATCACTAGGTCCACGGCAGACAAAGGACGACTAGGTCCA
+CGGCAGGAGCAAGGAACTAGGTCCACGGC
+>ds2020-328_879
+GGTCGGGATGACGGCGCTCATGCCTGGTCGGGATAGACGTTTCAAGGGTCTAATCTCGTC
+TATCCCGACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTGCGACGTGTCCTGCC
+GTGGACCTAGTATTCCACTCCTGCCGTGGTCCTTGTGTCATTTTGCCTGCCGTGGCCTAG
+TGCATCAGGGTTTGAACTAGGTCCACGGC
+>ds2020-328_880
+GCCGTGGACCTAGTCTAAAGAACACTGCCGTGGACCTAGTGACTAATTTGCTTCCGTGGA
+CCTAGTCTGTACCCTCTACACAACTAGGTCCACGGCTCTCTGTCCGTAATTACGGCGGTC
+GGGATAGACGACAAGGCCAAATCTCCGTCTATCCCGACCAGGAGCTAGAGACGTCTATCC
+CGACCAGGAGGTTATTCGTCATCCCGACC
+>ds2020-328_881
+GGTCGGGATAGACGCATGTATCTTCTGGTTGCTTCTGGGTCTGGTCTAAGGTTGGTTCTA
+AGGCTGGTTTGGAACCCTTCCCTTGAACAGGAGCTTCAGCTTAAGTAGCCGCTGGTGTCG
+AAGCTGAAACTGCAGGATCTGTTGTAGACGCAGGAGCTTGTCTCGTCCGCTACTATCCCT
+CTGATGATCGATGTCCGTCTATCCGACC
+>ds2020-328_882
+GGTCGGGATAGACGATACTCGGTGGTATAATCTGGGTATACAAGGCGCTAACGATATGCA
+CCCATATAGAATTATTCTAGAATGCTGTTCTTTAAGGTTCGGTAAGCAATTCGATATAAA
+ATGGGACACTATAGCTGGACCAGACATAATGACAGAGCTAGCTACATCGGAAGTAGTCAA
+ACAACGAGATATTGAGATTGAAATTGTA
+>ds2020-328_883
+GGTCGGGATAGACGCTTTCGGGCCTTTTGATAACTAATTAGAGTTGACATGAAATGGATC
+GCGGAAGAAGACGTATCTGATGAATGAATGATTCAATCCCCTCCCACCCGCACGGTTCCT
+CTATTGAAGGGGTTCCACTTCATTCTATGTGAGGTGGGGCGTACGTAAGAGCGGAACCTA
+GATAGAACGCGGAGCGCCGGCCCCGGCC
+>ds2020-328_884
+GGTCGGGATAGACGGAGTTGCATCATAAGAAAGAAAATTGAAAGATGAAGACCTGTCCAG
+CCTAAAAAAGAATGCTATTTCCCCATTGAAGAGGACAAGGAGAGACTTGCTAGGAGAAGA
+AAAGTAAACAAGTGGAGCTCTTTGGAAGAGGACACCTTGAGGGCTGGTGTAGGGCAGTAT
+GGAGTGGGACTAATCGTCTATCCCGACC
+>ds2020-328_885
+GGTCGGGATAGACGGGGGGTCCTGCGGTCGGGATAGACGGAAAGGCCTAGTCTATCCGAC
+CAGGCAGATTTGGCGTCTATCCACGGACAGAGAGCCGTGGACCTAGTTTCCAATTGGCTG
+CCGTGGACCTAGTATTTTTGGCCTTGCCGTGGACCTAGTGCGGCCTCTCCTGCCGTGGAC
+CTACTCAATTATTCACTAGGTCCACGGC
+>ds2020-328_886
+GGTCGGGATAGACGAGAAGCCGGGGTGCGCTCTAAACAGGTCTCTTAGCCTGAAGGAAGC
+TGAATTGTTGGGGTACACAAAAATCACAGCGGCTCATCATGTACACTACACAGTGTCTGA
+GGCCGCGGCTTCTGTCCAAAAGGAAAAAAGATCTCTAATACCTAAGGCTCTCCGTCTACC
+ACACGATGCCACAGCGTCTATCCCGACC
+>ds2020-328_887
+GGTCGGGATAGACGTTCGTGCTCCTTCTATGCTCCGGCGGGCTCCGCTTCTGCTTTAGTT
+ATGGAAGCCCTATCTTGATTCTCACCCTTGGTTTGTTTAGTCCTTCTTTCCCGCTGTCGT
+TCTCGGATGAAAGATACGAAAGGTACGGAGTAACTCGACTGGCAAGAGATTTATGGGGTC
+TCCTTCTCTTCTTGGCCGATATTCCACT
+>ds2020-328_888
+GGTCGGGATAGACGTCGAGCAGCCCTCTTCAACGGAGAGTTTGATCCTGGCTCAGGATGA
+ACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGATGATCCCAGCTTGCTGGGGGATT
+AGTGGCGAACGGGTGAGTAACACGTGAGTAACCTGCCCTTAACTCTGGGATAAGCCTGGG
+AAACTGGGTCTAATACCGGATATGACTC
+>ds2020-328_889
+GGTCGGGATAGACGATTCTTGGTTCTGAAAGAAAGGTCCCGATTCCGGGACGGAGCCGTA
+TGACGCGAGAGTGTCACGTACGGTTTCTTTGAGAAGGGTGTGATACCACCACCTATCAGG
+CCCGACCAGCTGTCCACGGAGCTGCATCCCTACTCACCTGGTCCATGCACATCGCTCTCT
+CCAGCAGGGTTGACCGTCTATCCCGACC
+>ds2020-328_890
+GGTCGGGATAGACGCAGCCCAGTACTTGCTCCACTTCATGCACACAGGCTTCCTGCCTAT
+AAGGCTAGCCTGCCTGAATATCGATGATGATGCTTCAAACACTTCATCATAACTCAGATT
+CGCCAGCCTCGGTTCGGTCCTATTATCCTTCTCGAGTTGCCAGTCTACGTCTCCATCCAC
+ACGGTTGATTATCACGTCTATCCCGACC
+>ds2020-328_891
+GGTCGGGATAGACGATTTCGGGGGCTAGAAGATAGGGAAGGGCAAATGCATAAATTGTGG
+CGTGGCTTATATTCCGGGTGGCGAGGCACTACCTGGATAAACACTGTTCTAAATTTCTGC
+TATGTTCACATAGCGCTGGTGAACCTGGAAAGGATAACAGGGATAAGTGTTGTTTTAATG
+GTAGGCCACGGCGGCGTCTATCCCGACC
+>ds2020-328_892
+GGTCGGGATAGACGATCTCTTCGTCTCGGGTCTACACCCAGCGACTCGACGCCCTGTTCG
+GACTCGGTTTCCCTTCGCCTTCCCTATTCGGTTAAGCTTGCCACTGAATGTAAGTCGCTG
+ACCCATTATACAAAAGGTACGCCGTCACCCGTTTCCAGGCTCCGACTTTTTGTATGCATG
+CGGACCGGCGATTCCGTCTATCCCGACC
+>ds2020-328_893
+TGGTCGGGATAGACGCCAGCAAGCAGTAGGTATGCTTAAAAATGCCGATGCGATGAACGT
+GAGGGCGCAGCCGGCCAAATGTGCATTCGGCGCTGTAGCAGAGTTCCTAAGGGTAGACAG
+ACAGAATGGCGCTAACGCGCAATACCTGCCCAGGGCAATAGCGACTTTGGTCCATTCGAG
+AATAGAAAGCGGTACGTCTATCCCGACC
+>ds2020-328_894
+GCCGTGGACCTAGTCCTGGTTGGGCTAATATACTAGGTCCACGGCAGACAGAGACTCACT
+AGGTCCACGGCAAGAGCAACGCCACTAGGTCCACGGCTCTCTGTCCGGTCGGGATAGACG
+TCAGAAACCTCTGGTCGGGATAGACGCGAGCTTCCCCTGGTCGGGATAGAGTACTCCCCT
+GTTCCGTCTATCCCGACCGCCGTAATTC
+>ds2020-328_895
+GGTCGGGATAGACGTCGTCTGCACTGTCCAATCTGTAGGCTACTTTGACATATCCATCTA
+GGGTAGTGTAGTTGACGGGCCCCTCGTCCTCATAAACCATCGCTGCATTGTATACCGCCC
+CGTCTCCACCGACTACTTGTGTGTCGCCGTCGAAACAGATACTCTGATCAGCCGCTACGT
+CCATACAACCTGAGCGTCTATCCCGACC
+>ds2020-328_896
+GGTCGGGATAGACGGGGGGCCTTCTTTCACTCCACACCCCCCATGCACAGGCAACAAAGA
+AAAAGATGAGACTGGGAACATCGACGACCATCGGTGGAACTCTTTTCGGAGGTCCACTTA
+CCCCGGCGGCGGCTTGGGCCCACGACCAGACAAGGTCTACCTGGGCAAAGTACCTCAAAG
+AAACGGACGCCAGTCGTCTATCCCGACC
+>ds2020-328_897
+GGTCGGGATAGACGAATACTGCACCTGGTCGGGATAGACGAACCCAAGCGCTGGTCGGGA
+TAGACCACAGTACCGTCTATCCCTCGGACAGAGAGCCGTGGACCTAGTAGCGTTGATTGT
+AGGTCCACGGCAGTGAATATCAAACTAGGTCCACGGCAGGTGAGTGGTACTAGGTCCACG
+GCAGGTGTCTAGGTACTAGGTCCACGGC
+>ds2020-328_898
+GGTCGGGATAGACGACCGAGGGCCATCAACGTCTATCCCGACCAGTAGAGTTAGACGTCT
+ATCCCGACCATGTGCTGGCAGCGTCTATCCCGACCGCGTAATTCACGGACAGAGAGCCGT
+GGACCTAGTCGCATCCCAGCTCAGACTAGGTCAGGCAGAGGATCACAGACTAGGTCCACG
+GCAGCGCATAAAGAACTAGGTCCACGGC
+>ds2020-328_899
+GGTCGGGATAGACGGAAAGACTGGGTCCCCGTCTTCCCGACCAGGTTAAAGATACGTCTA
+TCCCGACCATGGGGAAGGCGCGTCTATCCGACCGCCGAATTCACGGACAGAGAGCCGTGG
+ACCTAGTTCTAATCGGGGTATTACTAGGTCCACGGCAGCAAAATAGATACTAGGTCCACG
+GCAGGAGAGCATGTACTAGGTCCACGGC
+>ds2020-328_900
+GCCGTGGACCTAGTACTGTTTCCTGTTCAACGTTCATCGTAGCATGGTGAGTCGGCCCCT
+AAGGCGAGGCAGAGATGCGTAGCTGATGGGAAGCAGGTTAATATTCCTGCACCGTCGTAT
+GATGCGATGGGGGGACGGATCGCGGATGGTTGTCCAGCTGTTGGAATAGCTGGTTCTTGA
+CTCATAGAAGGCGCTTAGGCAAATCCGG
+>ds2020-328_901
+GGTCGGGATAGACGTAATTGAGCAGTAACTTTATCATGCTGAAACAATAAACCAACCTGC
+ACAGTACCCAGAATATACCGTAGAATCCATTTCACAGATTGCCAATGCCCTTTTCCTGGA
+TTATGCACATATCTACTGACAATACTAACAGCTTGTGAAATATCAGGCCTTGTACACACC
+ACAGAGTACAAACTCGTCTATCCCGACC
+>ds2020-328_902
+GGTCGGGATAGACGCTTAACCATGCTATCAATCTTTTTGACCTCCATTGTACCGTTCCCT
+TCCCCCAATATCACTGGTGAAAAGTGATTTTGGTCTCGCAATATTGTTACATTATTCTCT
+TGACTTCCATCATTATAATTAGTAACCCGTCCACTCTCTTTATCTAGCAATCTTAGGCCG
+AACCCCCCATGAGCGTCTATCCCGACC
+>ds2020-328_903
+GGTCGGGATAGACGGTAAAGGAGCGTAGACGAGCGAGTAGAGCCCAGGAAACAGGGAAGC
+CCGTCATAGAGCAGTCGACTAGAAGTAGAAGACTGCTGGCCTGAGAGAAGGCGGCCTCTC
+CCGGGAAACATGGCCCAATTTCTCTTCTTTCTTTTTTATTTCGGGTTTCTTTATTTTTTC
+AGGGGGGGCAGCCCGTCTATCCCGACC
+>ds2020-328_904
+GGTCGGGATAGACGGTTAATCGGTATGTATTTTTCAAATATTTGAGGGATATGATAGGTT
+AGATGCATTTTATGCAGCAATTGTCACCATAATCACTGTTGGTTATGGTGACAAAACTCC
+AAGTTCTAAAGTAGAGGATATACAGATAATTGAGATGGCTTCAAACATGCTTTCTAATTG
+TAGTTAGGTATTTCGTCTATCCCGACC
+>ds2020-328_905
+GGTCGGGATAGACGAACCCCCCCCCCATCTCGTACCGGAACCGAGTTCCAACTGCGAGAC
+GGACTTGCACACTACCCCATCGTATCGTATTTACTGTATTGATTTTCCTACAGACTCGAG
+ATCGTCGTAGTCTGCCGGTGGTCGTATCGTCCCACCGGATAAAATACCGTAAGCTCCTCT
+CACCACGTTTTTGCGTCTATCCCGACC
+>ds2020-328_906
+GGGCGGGATAGACGCCCGGCGGTGATTGCACACTAGCTGGCCCGTGGGGGTAAGAGAGTG
+TTCCGTTGGTGTTCTCAGTCTCAGTGCGACCTTGCTTGGTCAACAAGGGGATCAAAATGT
+CCCCCATCAATAAAGTGAGGGCTTTCCGGACCTTCTCCACCTCCCTTTTTCTTTTTTTTC
+CATGCTTTCCGTCCGTTTATCCCGACC
+>ds2020-328_907
+GGTCGGGATAGACGCCGGGTGAAGCTAACTTTGCAGCACAATTATCCTCATGCATACAGA
+ACTGTAGAAGCTTACAGAGGTACCAACTACCGGTAAAATGGTATACAGATTTATTTAGGA
+CGGTAGGATCCGCGGCTTGTGAGGCGATGTGCTATCAGCAGTGGCGGCGATAAAGACCTA
+TAGTGGAGGCAGCCGTCTATCCCGACC
+>ds2020-328_908
+GGTCGGGATAGACGATGTTAAGTGCTGGCTGTTGAAGTCCTCAAAGTCTAGACAATATGG
+CAACCTATTCTTCAAGACACCCGCCACTCTGTTTACTACATTTCTGTCGTTTGCGTCTTT
+ACCTACCGGGAATCTGTTCGGCAAGACGTTCTCGCAATTGTAGAACGCGAAGTTTGCAAG
+TACGTAACTCGTTCGTCTATCCCGACC
+>ds2020-328_909
+GGTCGGATAGACGGGCGGCTGGTATCGTCCATTCTTACACCCTCGACACCAACTAAGAGT
+TTTTCTTATACTTGCGAAAAACTCAAAGAATTTGAAAATTTCGGTGTTCCTTCCCATGTC
+AATCATCGTGGTACCAGTGTCAGATATGTTCCGTTCATTGAACAAATCACCTGGACCTAC
+TACTGCCCCCATGCGTCTATCCCGACC
+>ds2020-328_910
+GCCCGGGATAGACGAGGAGGTGATATTGACGCCGATGGATATAGGTTTCTTGGGAGAGTC
+AACGGTAGGTATAGAAGTAAAGCACGAAGAAATGAATTATAGGTATGTTAGATTGGATTT
+TGTGACAATAAGAACGCCAAAAATAATGGCAACTGTTGGTGCAAATATATCGGGTAATAT
+AAGGGCCAGGCGTCGTCTATCCAGACC
+>ds2020-328_911
+GGTCGGGATAGACGTTACACGTCACTCCGCTAATAGCAGCAACACCTGATAGTGCTTCAA
+TGCAAAACGGCAGCCCGAAGGCTGCCGTTTTTGTATCCATTTCTGATATTCGCTGAAGCG
+CTTTATCTCAACTCATCCCGTCAACTATGACCGCAATTTTTGCCTTCCACAAGGTAAATC
+TCATCTCTTCCTACCGTCTATCCCGCC
+>ds2020-328_912
+GGTCGGGATAGACGGTTACCACCCCTGGTCGGGATAGACGCCCACCGTGGCTGGTCGGGA
+TAGACGTCTATCCTCCCTGGTCGGGATAGCCAAATCTTACGTCTATCCCTCGGACAGAGA
+GCCGTGGACCTAGTTGGAGCTCACTTGGTCCACGGCAGTGTGTCACAGACTAGGTCCACG
+GCCCCAATTGCAGACTAGGTCCACGGC
+>ds2020-328_913
+GGTCGGGATAGACGCTTGCTCCCCTGGTCGGGATAGACGTACTTGCGGCCTGGTCGGGAT
+ATACGTTAAAGCCGTCTATCCCGTCGGACAGAGAGCCGTGGACCTAGTTCTAAGCGCCTG
+CCGTGGACCTGGTCGTGCGCTTCATGCCGTGGACCTAGTCAACAATCAGCTGCCGTGGAC
+CAAGTCATCAAGTACTAGGTCCACGGC
+>ds2020-328_914
+GGTCGGATAGACGATACATGTGGCTGCGTCTATCCCGACCAAGGGTTGGAGCCGTCTATC
+CCGACCGCCGTATTCACGGACAGAGAGCCGTGGACCTAGTATATAAACCCCTGAGATACT
+AGGTCCCGGCAGCATGTTACGTACTAGGTCCACGGCCCCCTACCTACACTAGGTCCACGG
+CAGGGGGCGTAGAACTAGGTCCACGGC
+>ds2020-328_915
+GGTCGGGATAGACGGATAGACGATGTCCAGGGGTGATTGTCGTCTATCCCGACCCCCGAA
+GTGATCGTCTATCCCGACCGCCACGGACAGAGAGCCGTGGACCTAGTAAGGATAGTACTA
+GGCCACGGCAGACTTAATTGCACTAGGTCCACGGCACGATAGCGGGAACTAGGTCCACGG
+CAGGCATTCAACGACTAGGTCCACGGC
+>ds2020-328_916
+GGTCGGGATAGACGAAACGCAATCATGTCTATCCCGACCAGGTGTTCTAACCGTCTATCC
+CGACCGCCGTAATTCCGGACAGAGAGCCGTGGACCTAGTCGCATTGTCTCTGCCGTGGAC
+CTAGTCACTCAAAGGGTTAATAACTAGGTCCACGGCAGGTCGGTGATACTAGGTCCACGG
+CACCCCCGACACAACTAGGTCCACGGC
+>ds2020-328_917
+GGTCGGGATAGACGATTTGGAGTTGTCTATCCCGACCAGGGAGATTCCTCGTCTATCCCG
+ACCGCCGTAATTCACGGACAGAGAGCCGTGGACCTAGTTGGGTAGTGGCTGCCGTGGACC
+TAGTAACGCTCACCGTGCCGTGGACCTAGTGATCTGTGCGGTGCCGTGGACCTAGTCCTC
+CAGCAGCAGGCGAACTAGGTCCACGGC
+>ds2020-328_918
+GCCGTGGACCTAGTCTCCAACTGTCTGCCGTGGACCTAGTTCTCATACCCCTGCCGTGGA
+CCTAGTTTAGATTCCCTGCCGTGGACCTATTGAAATGGTGGTATTACTAGGTCCACGGCT
+CTCTGTCCGAGAATTACGGCGGTCGGATAGACGGTAACCCAACCTAACGTCTATCCCGAC
+CAGAGGGTGTTTTCGTCTATCCCGACC
+>ds2020-328_919
+GGTCGGGATAGACGCGCTTGGGTACTGGTCGGGATAGACGGTGTAGCCCCCTGTCGGGAT
+AGACATAGCTGCGTGTTTCGTCTATCCCGACCGCCGTAATTCCCGGACAGAGAGCCGTGG
+ACCTAGTTAAGACTACTCTGCCGTGGACTTAGTTTCTTCACGGGGCCGTGGACCTAGTAT
+CTCCCCTGCTACAACTAGGTCCACGGC
+>ds2020-328_920
+GGTCGGGATAGACGGGGGATTTAAATTTTAATTAGCATCAAGACGAACATTCCGAGGTCG
+CACCCCCCCGTCTTACTGTAGCAGGCATGGCAAACCTGACCCGTTTACGCACGCTTGTTA
+CGTCCGGTGAGCTCGAGGTGGTGTCAGCCGCAGCTGTTCTCTTCCACCTTTCTCGGAATC
+CAACCCTACATGACGTCTATCCCGACC
+>ds2020-328_921
+GGTCGGGATAGACGCCCACTCCGCATCTATCGTTCCAGAAATTTTCCCATGTATATATCT
+CCGGCCGCCCGCCCATACCCCTAAGTGTTTTGAAAAGCTGTTTTATGATTTCATACATCT
+GAGATTGGTCGACTTTTGCTAATTCTGGTTTTGTTCTGTTTATTTTTTCTTGATTCCAAT
+CTATGCCCCCGACTCCCCTATTAACT
+>ds2020-328_922
+GAGTGGCTGCCGTGGACCTAGTCAGTAAACCGGGCCGTGGACCTAGTCGCCGCTTACCTT
+ACATTGACCGAACCTTTACTGCACCTCGCACTCACTCTCACAATGCCCCCCTCGCCCCTC
+TTTCTTACCACACGGAAAGAACTCGCCCTAATCCACCCCCACCCTCCACGAGTACTTCTT
+AAACTACTCCCATCGACTTCCCGACC
+>ds2020-328_923
+GGTCGGGATAGACGACCGTTACCCCTGTTGAAGATCTCTATCGATAGAGCATCAGCACTG
+ATAGGATGCTCGGGCATCCTCATTAACCGTTTTCTTCGGAAAATGGAACGGAATTTTCAA
+TTCTTCTCTTTTAAGGGTATACACCCGCTCTTTGGAGTTCGAATTCCAAAGTTAAGATGT
+ATTCCTTCTGTGGAGTCTTCCAACAT
+>ds2020-328_924
+GGTCGGGATAGACGGGCCCCCCTACGCTGGCGAATGCCCCCTTTCTCTTCTCTGAAGTCT
+ACAACAAGTGGGCGAGGCAGGATTCGAACCTACGTAGAAAAACTTCAACAGATTTACAGT
+CTGTCGCTTTTGACCGCTCGGCCACTCTCCCCTTCCCGGGCTGAGGCCCCCTCACTGGGT
+TCTAAGAAGGGGGCGCCGCCCTGAAT
+>ds2020-328_925
+AACCTGATGCCGCATGGAAGTTTCACAGTAGGCTGGGTAAATGTAACCAAAACTGAAGAT
+GAGAGGATTAAAGTTGAGCAAAAAAGAATCTCAAAACACATAAGGTTAACGCATGATTGT
+AACAAAAAACCAGGGACTAATTTGAGATCAGGTAGACAGGAAAGATTTGGACCAGAGGAA
+AAGTCAAGTAACCGTCTATCCCGACA
+>ds2020-328_926
+GGTCGGGATCGACGTTAAGCACCCCTGCTCTTGCATATGCCCTGGTGGAGTCCATGTCCT
+TAGGCGGCACCGGTGGCATACTCACACTTACACTATTAGCTGCGTATATTTTATGTACCC
+CAGTTCGCAGCGGGTGTAAATATTTTAGATTATGCCCATTCCACCTCATAACTGTCCCCA
+AAGCCCACAAGTCGTCTATCCCGACC
+>ds2020-328_927
+GGTCGGGATAGACGTGTCATGATTTTATGAAAGTAGGTTTGAATGAATTCCGCTCTTTGA
+TTTTGGTCTTTCAACGGGCCCTACAAGCTCATGTGTCAATTCTTCGCATTTTAAACCAAT
+TTATAGTGACCAAGAAAGACCAAAATCAAAGAGCGGAATTCATTCAAGCCTACTTACTTT
+TTACCTAACCAACGTCTATCCCGACC
+>ds2020-328_928
+TGGCCGGGATAGACGTGGAGCCGCCCTTTACTTGGATCTGGATCCCATCCCTAGCTCGTA
+AAGCTTGATTCCAGTTCCGTGTAGTCAGGGTGGTGCTTTTGGCCTTTACGCTCTGGTTGG
+TAATCGCGGTTGCTGCCCCTAGCCACTGACTATTCTTATTTAAGTAAGCCTACCCAGTTT
+AATCCCCCCAGGCGTCTATCCCGACC
+>ds2020-328_929
+TGAATTACGGCGGTCGGGATAGACGCCCCTTTCGCCTGGTCGGGATAGACGATAAATTTG
+GGGGTCGGGATAGACGGGACTACCATTATTCGTCTATCCCTGTCCACTCCAACCTGCCGT
+GGACCTAGTTCGCTGTAGCCTGCCGTGGACCTAGTCAATGAGTCCCTGCCGTGACCTAGT
+AGATTGATCATTACTAGGTCCACGGC
+>ds2020-328_930
+GCCGTGGACCTAGTCTATACCCCCTGCCGTGGACCTAGTTCGATGGCCGCTGCCGTGGAC
+CTAGTGGAAGGGGGATGGGCACTAGGTCCACGGCTCTCTGTCCGAATACGGCGGTCGGGA
+TAGACGTATTGATTCCCTGGTCGGGATAGACGTGGTCTTTCACTGGTCGGGTAGACGATT
+ATCAGGGTTCGCCGTCTATCCCGACC
+>ds2020-328_931
+GGTCGGGATAGACGGAATCCCCTCGGTCGGGATAGACGTTAATTCGCATGGTCGGGATAG
+ACTGGTGAGCTGCGTCTATCCTCGGACAGAGAGCCGTGGACCTAGTGGTCAAACCCGTGC
+CGTGGACCTAGTTACTGAATTGCTGCCGTGGACCTAGTAGGTGAGATACTAGATCCACGG
+CAGGGATCACAGACTAGGTCCACGGC
+>ds2020-328_932
+GGTCGGGATAGACGTATCCGATCGGTCCTTGTAACACTTCAGTTTCAAATATATCTTTAA
+CGAAATAACCTTCTTTAGTTAAATTATCGTTTTCCCACCCTTTATTCTTGCGATATGAAT
+TGGGAATGAACTTCCAAATTCTCATTTTATGATGAAACCTGTTTTCCGTATTTGCATTTA
+AGCCTGTTGTGGCGTCTATCCCGACC
+>ds2020-328_933
+GGTCGGGATTAGTATTGAACCTAGATAAATGTTATCAGGTGCCTACATTGAGCATGAATA
+TGATTATATCATGTTCATTGCAACACGGTCATTCATTTAAGTTAGAGAATAATGGTTATT
+CTGTTTACATGAATGATACCTTTCATGGTCATGCACCCTATGTGAATGGTTCATTGAATC
+TCGGTCGTGGTAAGAGGTTTCGCATC
+>ds2020-328_934
+GGTCGGGCTAGACGATCGAGAGTAGTCTGATTATGGGAACCGAGGCCGGCTACTGTGACG
+CAGCTAATGGTACGCTTATCCAAAAGGCAGGGGTAGCCCGAGAATGCCGCTCCCCCTTGA
+CCGTAAGCTGGTTGTCCCGTGTTATCCATATTTTGGGAAAGGGTTCGATCCCCATCGTCG
+ATGGTAAGCACTCGTCTATCCCGACC
+>ds2020-328_935
+TTCCCCTCCCGTTTGCGGCACTTAACATGAATGTAGTGCTGATAGAGGTTTCGATGAAGT
+CTAAGAAGTCCACCATCGACGAACCAGTATAATCAGAATCCACATGATGATAAATCTCCT
+TCATGTAATCTTTCCACGAAGCAATTGCACCTTTAGTATTCCAAGGCCTGAACCATTCAA
+ACATAACAGAATCGTCTATCCCGACC
+>ds2020-328_936
+TTTTAACTGCAACAACTTAAATATACGCTATTGGAGCTGGAATTACCGCGGCTGCTGGCA
+CCAGACTTGCCCTCCAATGGATCCTCGTTAAGGGATTTAGATTGTACTCATTCCAATTAC
+CAGACTCGATGAGCCCAGTATTGTTATTTATTGTCACTACCTCCCCATGTCAGGATTGGG
+TAATTAGTGGCGGCCGTT
+>ds2020-328_937
+TTCCTCACCACACTCCAAGCTTCTCTCCTGCCTGTTCCTCACCACACTCCAAGCTCCTCT
+CCAAGCCTGTTCCTCACCACATAAGACCGTCTATCCCGACCAGGGAATATGCTCGTCTAT
+CCCGACCCCCGTCTATCGTCTATCCCGACCGCCGTAATTCAGATC
+>ds2020-328_938
+GGTCGGGATAGACGAACACATTCCCTGGTCGGGATAGACGTTGCAATACGCTGGTCGGGA
+TAGACACGACTTGTTCTCGTCTATCCCCACCAGCGTATTGCAACGTCTATCCCGACCAGG
+GAATGTGTTCGTCTATCCCGACC
+>ds2020-328_939
+TACTCTCAGTACAATCTGCTCTGATGCCGCATAGTTAAGCCAGCCCCGACACCCGGGTCG
+GGATAGACGAATCTTCGCCCTACTCTCAGTACAATCTGCTCTGATGCCGCATAGTTAAGC
+CAGCCCCGACACCCG
+>ds2020-328_940
+ACCACTCAATTTATCGTCTATCCCGAAGTGTGAAAACCCGTCTATCCCGACCAGTGTGCC
+ACGACGTCTATCCCGACCACCACTCAATTTATCGTCTATCCCGAAGTGTGAAAACCCGTC
+TATCCCGACCAGT
+>ds2020-328_941
+TTATTCCCGACCTGCCGTGGACCTAGTCACTCACCCGGTGCCTGACCTAATCCTCTCTGC
+ACTGCCGTGGACCTAGTTATTCCCGACCTGCCGTGGACCTAGTCACTCACCCGGTGCCTG
+ACCTAATCCTC
+>ds2020-328_942
+GAATGGAGGTACTGAATGACTAGGTCCCGGCAAGCATGATATCAACGGGGATGTTCCTAT
+ATTCATTAACATTGGTGAATGGAGGTACTGAATGACTAGGTCCCGGCAAGCATGATATCA
+ACGGGGATGTT
+>ds2020-328_943
+AGTAAACTGGTGGCTTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTAGGGGT
+GCTTGGGTGGTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTG
+GTGAAGGTGA
+>ds2020-328_944
+CGTTCCACTGGTCGGGATAGACGATGATGTTTGCTGGTCGGATAGACATTCACCGGGTCG
+GGATAGACGCTACGTTCCACTGGTCGGGATAGACGATGATGTTTGCTGGTCGGATAGACA
+TTCACCG
+>ds2020-328_945
+CTGACCCCTGCCGTGGACCTATTTGTCAATCGCTGCCTGGACCTAGATCTTGTCGGCCGT
+GGACCTAGTAACCTGACCCCTGCCGTGGACCTATTTGTCAATCGCTGCCTGGACCTAGAT
+CTTGTCG
+>ds2020-328_946
+TCCACGGCCGTCGAATTAGGCCACGGCAGGCGTTTAATGACTAGGTCCACGGCAGGGGAA
+TGTATACTAGGTCCACGGCCGTCGAATTAGGCCACGGCAGGCGTTTAATGACTAGGTCCA
+CGGCAG
+>ds2020-328_947
+CTCCTCCACCACCCTCACCATCACCACCCAAGCATCCTTACCACTACAAGTCTCCACCAC
+CACCCTCACCTTCACCACCCAAGCACCCCTACCACTACAAGTCTCCACCACCACCATCAC
+>ds2020-328_948
+GCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGATTCC
+CTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCC
+>ds2020-328_949
+CCCTGCCGTGGACCTAGTTCCTTTCCACCTGCCGTGGACCTAGTAGAGTTGCCCCTGCCG
+TGGACCTAGTTCCTTTCCACCTGCCGTGGACCTAGTAGAGTTGCCCC
+>ds2020-328_950
+TTCTTCGATGATGCGCAAATTGAAGCTTCGGTACCCTTGTTTTTTCCAATCGCCCAATTT
+CTCTTCTTTCTTTTTTATTTCGGGTTTCTTTATTTTTTCAGGGGGG
+>ds2020-328_951
+AACCAAGAGCGCTTTTTCTTTCCATTCGCCTGGGACAAGGCCTCCCATCACGCTTCCATT
+GAAGAGTTAATCCTTCAAGTAGCGGTGGTGCACCCTGCCTGTACT
+>ds2020-328_952
+TGGAGTGATGGTGGCTTGTATGGTTTCTTAGGTGGTAGGGGTGGTGAGTAAACTGGTGGC
+TTGTAGACTGGTGTGGGTGGTGGGGGAGACTTGTAGTGGTA
+>ds2020-328_953
+AGCTTGGAGTGTGGTGAGGAACAGGCAGGAGAGAAGCTTGGAGTGTGGTGAGGAACAGGC
+AGGAGAGAAGCTTGGAGTGTGGTGAGGAA
+>ds2020-328_954
+GCTTAGGTGGTGAAGGTGATGGTGGTGGTGGAGACTTGTAGTGGTATGGGTGCTTAGGTG
+GTGAAGGTGATGGTGGTGGTGGAG
+>ds2020-328_955
+GATTGATTTCTTGTTTATTGGCGTCAGTGGTGAGGTTTGACACCATGTGTTTGAAGGAGG
+GATCGTGTGCGTCTATCCCGACC
+>ds2020-328_956
+CGTCTATCCCGACCAGCGATTGTGACCGTCTATCCCGACCAGGGCACTGCCACGTCTATC
+CCGACCGCCGTAATTCAGATC
+>ds2020-328_957
+TCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGGGCTTGCTAAAGAGGCTCGAAGAGGG
+GCTTGCTAAAGAGGCTCGAA
+>ds2020-328_958
+TGAATTACGGCGGTCGGGATAGACGAGCTAAACGCCTGGTCGGGATAGACGAACGTATTC
+TCTGGTCGGGATAGACG
+>ds2020-328_959
+GGAACACCAGTGGCGAAGGAAGGAACACCAGTGGCGAAGGAAGGAACACCAGTGGCGAAG
+GAAGGAACACCAGTGG
+>ds2020-328_960
+GAATTACGGCGGTCGGGATAGACGCGAAGCACCGGTGGTCGGGATAGACGGCCGACCCCC
+TTGGTCGGGATAGACG
+>ds2020-328_961
+TGGATTACGGCGGTCGGGATAGACGTTGACCGTGCCTGGTCGGGATAGACGAGTGAACCG
+CTGGTCGGGATAGACG
+>ds2020-328_962
+TGAATTACGGCGGTCGGGATAGACGCCAATCGCCCCTGGTCGGGATAGACGCAATACCAC
+CCTTCGGGATAGACG
+>ds2020-328_963
+CGTCTATCCCGACCAGGTCCCATTTTCGTCTATCCCGACCAAGGCTAAATGACGTCTATC
+CGCCGCCGTAATTCA
+>ds2020-328_964
+GAATTCGGCGGTCGGGATAGACGAAAGGAGCGGGGGTCGGGATAGACGATTGCTTGCCTT
+GGTCGGGATAGACG
+>ds2020-328_965
+TTAGACGTCTAGTGTCCCTGGTCGGGATAAACGGGGCAAATCGTCTATCCCGACCAGGGA
+CACTAGACGTCTAT
+>ds2020-328_966
+TCTATCCCGACCAGGGAAATACACCGTCTATCCCGACCAGGAGCGGGGTTCGTCTATCCG
+ACCGCCGAATTCA
+>ds2020-328_967
+AGGTAGTTTACTTGCTTACTTGTTAGAGTAAGGAAGAGAGGAAAAGGGTGCTGTCGTCTA
+TCCCGACCC
+>ds2020-328_968
+GTGATGGTGGTGGTGGAGACTTGTAGTGGTAGGGGTGCTTGGGTGGTGAAGGTGATGGTG
+GTGGTGGAG
+>ds2020-328_969
+CGTCTATCCCGACCAACGTCTATCCCGACCAGTGGTATTAATCGTCTATCCCGACCGCCG
+TAATTCA
+>ds2020-328_970
+GGTCGGGATAGACGCCGCGGTATCCTGGTCGGGATAGACGGTAATATTGCCTGGTCGGGA
+TAGACG
+>ds2020-328_971
+GGTCGGGATAGACGAGATAATTACCTGGTCGGGATAGACGTCATGAGTCCCTGGTCGGGA
+TAGACG
+>ds2020-328_972
+CGTCTATCCCGACCAGGCGGTGTATACGCCAATCCCGACCAGGGGGTTAGGGCGTCTATC
+CCGACC
+>ds2020-328_973
+GGTCGGGATAGACGGAACATGACGCTGGTCGGGATAGACGACATAGACCCCTGGTCGGGA
+TAGAC
+>ds2020-328_974
+TTCGAGCCTCTTTAGCAAGCCCCTCTTCGAGCCTCTTTAGCAAGCCCCTCTTCGAAAGAT
+TCTTT
+>ds2020-328_975
+GGTCGGGATAGACGATCACACCCTGGTCGGGATAGACGCACGAACAGGCTGGTCGGGATA
+GACG
+>ds2020-328_976
+AGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGATGTCAGTGAT
+GTCA
+>ds2020-328_977
+CGTCTATCCCGACCAGGGGCAAATTGCGTCTATCCCGACCAAATCCTTCGTCTATCCCGA
+CCG
+>ds2020-328_978
+GTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAGGTCCGTAG
+GTC
+>ds2020-328_979
+GGTCGGGATAGACGGATGGACTCGTGGTCGTGATAGACGTTTCCCAGTCTGTCGGGATAG
+ACG
+>ds2020-328_980
+TCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCACTTTTCAC
+TT
+>ds2020-328_981
+CATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATACGTCATA
+CG
+>ds2020-328_982
+GGTCGGGATAGACGAACAAAGACACTGGTCGGGATAGACGCTCGATACTACTGGTCGGGA
+TA
+>ds2020-328_983
+TTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGG
+T
+>ds2020-328_984
+GTGGTGGAGACTTGTAGTGGTATGGGTGCTTGGGTGGTGAAGGTGATGGTGGTGGGGGAG
+>ds2020-328_985
+CATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCATCCAT
+>ds2020-328_986
+TTCCGATCTGAATTACGGCGGTCGGGATAGACGATAGCCACCACTGGTCGGGATAGACG
+>ds2020-328_987
+GTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTG
+>ds2020-328_988
+GGTCGGGATAGACGCATGCATTGTCTGGTCGGGATAGACGGCGCGCTGCACTGTCGG
+>ds2020-328_989
+GGTCGGGATAGACGTTAGCACCCACTGGTCGGGATAGACGAGACAGTTAGCTGGTCG
+>ds2020-328_990
+GGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG
+>ds2020-328_991
+GGTCGGGATAGACGTAGACAGCCCCCGGTCGGGATAGACGTTAATTTCTGCTGGTC
+>ds2020-328_992
+GGTCGGGATAGACGATTATGCTCTCTGGTCGGGATAGACGTGTGACTCCCCTGGTC
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s2_rps.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s2_rps.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,149 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom no rank family genus
+"ds2020-328_1" "2975" "pfam00006" "gnl|CDD|376291" "6.25354e-106" "1359" "2033" "-1" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_1" "2975" "pfam00306" "gnl|CDD|366015" "1.33353e-53" "1008" "1340" "-1" "pfam00306, ATP-synt_ab_C, ATP synthase alpha/beta chain, C terminal domain. " "Bacteria(0.94);Eukaryota(0.06);" "(1.00);" "(0.08);Mycoplasmataceae(0.08);Clostridiaceae(0.06);Ruminococcaceae(0.03);Eubacteriaceae(0.02);" "Mycoplasma(0.07);(0.07);Clostridium(0.05);Eubacterium(0.02);Faecalibacterium(0.01);"
+"ds2020-328_1" "2975" "pfam02874" "gnl|CDD|367225" "8.80807e-19" "2202" "2405" "-1" "pfam02874, ATP-synt_ab_N, ATP synthase alpha/beta family, beta-barrel domain. This family includes the ATP synthase alpha and beta subunits the ATP synthase associated with flagella." "Bacteria(0.60);Eukaryota(0.28);Archaea(0.13);" "(1.00);" "Spirochaetaceae(0.04);Bacillaceae(0.04);Schizosaccharomycetaceae(0.03);Chlamydomonadaceae(0.03);Sulfolobaceae(0.03);" "Treponema(0.04);Schizosaccharomyces(0.03);Chlamydomonas(0.03);Bacillus(0.03);Thermotoga(0.02);"
+"ds2020-328_10" "1434" "pfam17917" "gnl|CDD|375428" "1.68574e-20" "187" "453" "-1" "pfam17917, RT_RNaseH, RNase H-like domain found in reverse transcriptase. DNA polymerase and ribonuclease H (RNase H) activities allow reverse transcriptases to convert the single-stranded retroviral RNA genome into double-stranded DNA, which is integrated into the host chromosome during infection. This entry represents the RNase H like domain." "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_10" "1434" "pfam00078" "gnl|CDD|365856" "1.48081e-05" "920" "1051" "-3" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_101" "454" "pfam14111" "gnl|CDD|372914" "8.33283e-09" "213" "353" "3" "pfam14111, DUF4283, Domain of unknown function (DUF4283). This domain family is found in plants, and is approximately 100 amino acids in length. Considering the very diverse range of other domains it is associated with it is possible that this domain is a binding/guiding region. There are two highly conserved tryptophan residues." "Eukaryota(1.00);" "(1.00);" "Salicaceae(0.35);Brassicaceae(0.27);Poaceae(0.13);Vitaceae(0.08);Solanaceae(0.06);" "Populus(0.35);Brassica(0.13);Arabidopsis(0.11);Brachypodium(0.10);Vitis(0.08);"
+"ds2020-328_106" "446" "pfam01348" "gnl|CDD|279664" "1.08017e-09" "40" "303" "-3" "pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X." "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.40);Brassicaceae(0.20);Schizosaccharomycetaceae(0.20);Poaceae(0.20);" "Saccharomyces(0.40);Hordeum(0.20);Schizosaccharomyces(0.20);Baimashania(0.20);"
+"ds2020-328_109" "442" "pfam02123" "gnl|CDD|280316" "1.59804e-23" "115" "429" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_113" "433" "pfam00253" "gnl|CDD|376307" "1.11487e-07" "329" "415" "2" "pfam00253, Ribosomal_S14, Ribosomal protein S14p/S29e. This family includes both ribosomal S14 from prokaryotes and S29 from eukaryotes." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "(0.08);Clostridiaceae(0.02);Mycoplasmataceae(0.02);Lactobacillaceae(0.02);Saccharomycetaceae(0.02);" "(0.03);Clostridium(0.02);Lactobacillus(0.02);Mycoplasma(0.02);"
+"ds2020-328_115" "426" "pfam00078" "gnl|CDD|365856" "4.24722e-08" "268" "405" "-1" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_115" "426" "pfam17919" "gnl|CDD|375430" "4.69948e-06" "13" "81" "-1" "pfam17919, RT_RNaseH_2, RNase H-like domain found in reverse transcriptase. " "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_118" "424" "pfam00665" "gnl|CDD|366234" "6.81632e-21" "93" "413" "3" "pfam00665, rve, Integrase core domain. Integrase mediates integration of a DNA copy of the viral genome into the host chromosome. Integrase is composed of three domains. The amino-terminal domain is a zinc binding domain pfam02022. This domain is the central catalytic domain. The carboxyl terminal domain that is a non-specific DNA binding domain pfam00552. The catalytic domain acts as an endonuclease when two nucleotides are removed from the 3' ends of the blunt-ended viral DNA made by reverse transcription. This domain also catalyzes the DNA strand transfer reaction of the 3' ends of the viral DNA to the 5' ends of the integration site." "Bacteria(0.76);Viruses(0.14);Eukaryota(0.09);Archaea(0.01);" "(0.86);Ortervirales(0.12);Inoviridae(0.03);" "Retroviridae(0.12);Mycobacteriaceae(0.09);Streptococcaceae(0.08);Enterobacteriaceae(0.06);Burkholderiaceae(0.05);" "Mycobacterium(0.09);Streptomyces(0.05);Escherichia(0.05);Burkholderia(0.04);Sinorhizobium(0.04);"
+"ds2020-328_124" no_hit
+"ds2020-328_136" "372" "pfam02123" "gnl|CDD|280316" "8.1339e-10" "160" "363" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_15" "1120" "pfam00146" "gnl|CDD|376297" "8.26121e-18" "936" "1097" "-3" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_153" "353" "pfam01385" "gnl|CDD|366606" "1.33121e-13" "52" "330" "-3" "pfam01385, OrfB_IS605, Probable transposase. This family includes IS891, IS1136 and IS1341. DUF1225, pfam06774, has now been merged into this family." "Bacteria(0.57);Archaea(0.38);Viruses(0.05);" "(0.95);Bicaudaviridae(0.05);" "Sulfolobaceae(0.19);Mycobacteriaceae(0.10);Thermoproteaceae(0.10);Synergistaceae(0.05);Halorubraceae(0.05);" "Caldivirga(0.10);Mycobacterium(0.10);Saccharolobus(0.10);Sulfurisphaera(0.05);Synechocystis(0.05);"
+"ds2020-328_154" "351" "pfam00146" "gnl|CDD|376297" "1.33812e-16" "131" "331" "-3" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_170" "343" "pfam02123" "gnl|CDD|280316" "1.56034e-16" "85" "330" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_172" "338" "pfam02123" "gnl|CDD|280316" "9.08289e-09" "87" "305" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_176" "336" "pfam00361" "gnl|CDD|366050" "7.24395e-08" "101" "256" "-3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_177" "335" "pfam00346" "gnl|CDD|366043" "6.6413e-32" "147" "314" "3" "pfam00346, Complex1_49kDa, Respiratory-chain NADH dehydrogenase, 49 Kd subunit. " "Bacteria(0.80);Eukaryota(0.11);Archaea(0.09);" "(1.00);" "(0.06);Rhodobacteraceae(0.02);Acetobacteraceae(0.02);Campylobacteraceae(0.02);Rhodospirillaceae(0.02);" "(0.01);Geobacter(0.01);Campylobacter(0.01);Archaeoglobus(0.01);"
+"ds2020-328_188" no_hit
+"ds2020-328_193" "321" "pfam03040" "gnl|CDD|367312" "3.21306e-19" "69" "296" "3" "pfam03040, CemA, CemA family. Members of this family are probable integral membrane proteins. Their molecular function is unknown. CemA proteins are found in the inner envelope membrane of chloroplasts but not in the thylakoid membrane. A cyanobacterial member of this family has been implicated in CO2 transport, but is probably not a CO2 transporter itself. They are predicted to be haem-binding however this has not been proven experimentally." "Bacteria(0.77);Eukaryota(0.23);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.08);Microcoleaceae(0.06);Chlorellaceae(0.04);Merismopediaceae(0.04);" "Synechococcus(0.13);Oscillatoria(0.04);Physcomitrella(0.04);Microcystis(0.04);Synechocystis(0.04);"
+"ds2020-328_196" "318" "pfam02123" "gnl|CDD|280316" "1.94206e-07" "6" "284" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_197" "318" "pfam03154" "gnl|CDD|367360" "8.39525e-05" "24" "158" "-2" "pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity." "Eukaryota(1.00);" "(1.00);" "Muridae(0.20);Coelacanthidae(0.20);Characidae(0.20);Cyprinidae(0.20);Cichlidae(0.20);" "Rattus(0.20);Danio(0.20);Astyanax(0.20);Oreochromis(0.20);Latimeria(0.20);"
+"ds2020-328_199" "316" "pfam13650" "gnl|CDD|379313" "2.17852e-11" "2" "229" "-1" "pfam13650, Asp_protease_2, Aspartyl protease. This family consists of predicted aspartic proteases, typically from 180 to 230 amino acids in length, in MEROPS clan AA. This model describes the well-conserved 121-residue C-terminal region. The poorly conserved, variable length N-terminal region usually contains a predicted transmembrane helix." "Bacteria(0.81);Eukaryota(0.17);Archaea(0.02);" "(1.00);" "Flavobacteriaceae(0.06);Bacteroidaceae(0.06);Rhizobiaceae(0.05);Caulobacteraceae(0.05);Cytophagaceae(0.04);" "Bacteroides(0.06);Geobacter(0.02);Phenylobacterium(0.02);Agrobacterium(0.02);Spirosoma(0.02);"
+"ds2020-328_207" "313" "pfam02123" "gnl|CDD|280316" "1.55736e-08" "34" "306" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_210" "311" "pfam00124" "gnl|CDD|365890" "2.92409e-39" "14" "283" "2" "pfam00124, Photo_RC, Photosynthetic reaction centre protein. " "Bacteria(0.95);Eukaryota(0.05);" "(1.00);" "Rhodobacteraceae(0.13);Chromatiaceae(0.13);Ectothiorhodospiraceae(0.08);Synechococcaceae(0.05);(0.05);" "Rhodobacter(0.08);Sphingomonas(0.05);Halorhodospira(0.05);Roseiflexus(0.05);Thioflavicoccus(0.05);"
+"ds2020-328_219" "306" "pfam07727" "gnl|CDD|369488" "2.43458e-28" "22" "285" "-1" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_222" "304" "pfam00471" "gnl|CDD|376336" "2.61553e-13" "31" "201" "-2" "pfam00471, Ribosomal_L33, Ribosomal protein L33. " "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "(0.07);Mycoplasmataceae(0.07);Clostridiaceae(0.06);Bacillaceae(0.03);Lactobacillaceae(0.03);" "Mycoplasma(0.06);Clostridium(0.05);(0.04);Lactobacillus(0.02);Bacillus(0.02);"
+"ds2020-328_226" "300" "pfam02123" "gnl|CDD|280316" "5.93549e-06" "76" "276" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_229" "299" "pfam02123" "gnl|CDD|280316" "2.23217e-17" "58" "276" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_235" "295" "pfam00006" "gnl|CDD|376291" "7.80612e-20" "51" "284" "3" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_241" no_hit
+"ds2020-328_244" "292" "pfam01737" "gnl|CDD|366779" "1.98587e-12" "60" "224" "3" "pfam01737, Ycf9, YCF9. This family consists of the hypothetical protein product of the YCF9 gene from chloroplasts and cyanobacteria. These proteins have no known function." "Bacteria(0.76);Eukaryota(0.24);" "(1.00);" "Synechococcaceae(0.15);Prochloraceae(0.09);Phaeodactylaceae(0.06);Bathycoccaceae(0.03);Poaceae(0.03);" "Synechococcus(0.12);Prochlorococcus(0.09);Phaeodactylum(0.06);Stanieria(0.03);Acaryochloris(0.03);"
+"ds2020-328_249" "290" "pfam00115" "gnl|CDD|376293" "5.40542e-13" "18" "248" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_251" "288" "pfam02123" "gnl|CDD|280316" "1.42582e-09" "22" "270" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_26" "872" "pfam01443" "gnl|CDD|366646" "1.90681e-33" "10" "699" "-3" "pfam01443, Viral_helicase1, Viral (Superfamily 1) RNA helicase. Helicase activity for this family has been demonstrated and NTPase activity. This helicase has multiple roles at different stages of viral RNA replication, as dissected by mutational analysis." "Viruses(1.00);" "Riboviria(0.99);unclassified viruses(0.01);" "Alphaflexiviridae(0.36);Virgaviridae(0.24);Betaflexiviridae(0.15);Tymoviridae(0.10);Bromoviridae(0.07);" "Potexvirus(0.26);Allexivirus(0.10);Tymovirus(0.08);Carlavirus(0.08);Tobamovirus(0.08);"
+"ds2020-328_272" "281" "pfam00253" "gnl|CDD|376307" "1.57301e-14" "125" "256" "2" "pfam00253, Ribosomal_S14, Ribosomal protein S14p/S29e. This family includes both ribosomal S14 from prokaryotes and S29 from eukaryotes." "Bacteria(0.75);Eukaryota(0.25);" "(1.00);" "(0.08);Clostridiaceae(0.02);Mycoplasmataceae(0.02);Lactobacillaceae(0.02);Saccharomycetaceae(0.02);" "(0.03);Clostridium(0.02);Lactobacillus(0.02);Mycoplasma(0.02);"
+"ds2020-328_273" "280" "pfam13976" "gnl|CDD|372857" "1.39388e-05" "38" "160" "-1" "pfam13976, gag_pre-integrs, GAG-pre-integrase domain. This domain is found associated with retroviral insertion elements and lies just upstream of the integrase region on the polyproteins." "Eukaryota(1.00);" "(1.00);" "Vitaceae(0.49);Poaceae(0.30);Brassicaceae(0.11);Trichocomaceae(0.02);Fabaceae(0.01);" "Vitis(0.49);Oryza(0.28);Arabidopsis(0.10);Talaromyces(0.02);Zea(0.02);"
+"ds2020-328_285" "275" "pfam00954" "gnl|CDD|366384" "3.5917e-06" "91" "264" "-3" "pfam00954, S_locus_glycop, S-locus glycoprotein domain. In Brassicaceae, self-incompatible plants have a self/non-self recognition system. This is sporophytically controlled by multiple alleles at a single locus (S). S-locus glycoproteins, as well as S-receptor kinases, are in linkage with the S-alleles. This region is inferred to be a domain due to it having other domains adjacent to it." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.96);Poaceae(0.04);" "Arabidopsis(0.89);Brassica(0.07);Sorghum(0.04);"
+"ds2020-328_29" "847" "pfam13456" "gnl|CDD|372609" "2.18686e-07" "176" "397" "2" "pfam13456, RVT_3, Reverse transcriptase-like. This domain is found in plants and appears to be part of a retrotransposon." "Eukaryota(0.85);Bacteria(0.15);" "(1.00);" "Euphorbiaceae(0.30);Brassicaceae(0.22);Poaceae(0.22);Aphanothecaceae(0.11);Peronosporaceae(0.04);" "Ricinus(0.30);Arabidopsis(0.22);Oryza(0.19);Gloeothece(0.07);Synechocystis(0.04);"
+"ds2020-328_293" "272" "pfam02123" "gnl|CDD|280316" "4.40145e-17" "17" "259" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_295" no_hit
+"ds2020-328_300" "271" "pfam02392" "gnl|CDD|308156" "2.01502e-45" "15" "239" "-3" "pfam02392, Ycf4, Ycf4. This family consists of hypothetical Ycf4 proteins from various chloroplast genomes. It has been suggested that Ycf4 is involved in the assembly and/or stability of the photosystem I complex in chloroplasts." "Bacteria(0.78);Eukaryota(0.22);" "(1.00);" "Synechococcaceae(0.17);Aphanothecaceae(0.09);Prochloraceae(0.07);Microcoleaceae(0.06);Oscillatoriaceae(0.04);" "Synechococcus(0.13);Prochlorococcus(0.07);Oscillatoria(0.04);Gloeobacter(0.04);Cyanobium(0.02);"
+"ds2020-328_303" "271" "pfam02123" "gnl|CDD|280316" "5.58457e-14" "3" "206" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_309" "270" "pfam07727" "gnl|CDD|369488" "1.02409e-13" "2" "157" "-3" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_312" no_hit
+"ds2020-328_319" "268" "pfam00112" "gnl|CDD|365882" "8.20186e-05" "73" "150" "1" "pfam00112, Peptidase_C1, Papain family cysteine protease. " "Eukaryota(0.96);Viruses(0.03);" "(0.97);Baculoviridae(0.03);" "Rhabditidae(0.10);Poaceae(0.07);Fabaceae(0.07);Haemonchidae(0.06);Brassicaceae(0.06);" "Caenorhabditis(0.10);Arabidopsis(0.05);Haemonchus(0.05);Homo(0.04);Entamoeba(0.03);"
+"ds2020-328_322" "268" "pfam01425" "gnl|CDD|366635" "5.34115e-12" "33" "248" "3" "pfam01425, Amidase, Amidase. " "Bacteria(0.58);Eukaryota(0.32);Archaea(0.10);" "(1.00);" "Mycobacteriaceae(0.19);Rhabditidae(0.10);Archaeoglobaceae(0.06);Aspergillaceae(0.06);Merismopediaceae(0.06);" "Mycobacterium(0.19);Caenorhabditis(0.10);Synechocystis(0.06);Aspergillus(0.06);Saccharomyces(0.06);"
+"ds2020-328_326" "267" "pfam00385" "gnl|CDD|366065" "3.90569e-05" "64" "192" "1" "pfam00385, Chromo, Chromo (CHRromatin Organisation MOdifier) domain. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.18);Drosophilidae(0.13);Schizosaccharomycetaceae(0.09);Rhabditidae(0.08);Brassicaceae(0.07);" "Homo(0.16);Drosophila(0.13);Schizosaccharomyces(0.09);Caenorhabditis(0.08);Arabidopsis(0.07);"
+"ds2020-328_335" "266" "pfam02123" "gnl|CDD|280316" "2.32783e-14" "26" "265" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_361" "260" "pfam00069" "gnl|CDD|365850" "2.38711e-21" "15" "242" "3" "pfam00069, Pkinase, Protein kinase domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.31);Hominidae(0.17);Muridae(0.14);Schizosaccharomycetaceae(0.11);Drosophilidae(0.06);" "Saccharomyces(0.31);Homo(0.17);Schizosaccharomyces(0.11);Rattus(0.08);Drosophila(0.06);"
+"ds2020-328_364" "259" "pfam02491" "gnl|CDD|376796" "1.8796e-18" "85" "249" "1" "pfam02491, SHS2_FTSA, SHS2 domain inserted in FTSA. FtsA is essential for bacterial cell division, and co-localizes to the septal ring with FtsZ. The SHS2 domain is inserted in to the RNAseH fold of FtsA, and is involved in protein-protein interaction." "Bacteria(1.00);" "(1.00);" "(0.07);Prevotellaceae(0.04);Spirochaetaceae(0.04);Flavobacteriaceae(0.03);Helicobacteraceae(0.02);" "(0.04);Prevotella(0.04);Clostridium(0.02);Helicobacter(0.02);Bacteroides(0.02);"
+"ds2020-328_37" "681" "pfam00416" "gnl|CDD|366086" "4.04787e-35" "92" "409" "-3" "pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes." "Eukaryota(0.55);Bacteria(0.27);Archaea(0.18);" "(1.00);" "Brassicaceae(0.18);Muridae(0.09);Poaceae(0.09);Drosophilidae(0.09);Mycobacteriaceae(0.09);" "Arabidopsis(0.18);Geobacillus(0.09);Rattus(0.09);Haloarcula(0.09);Shigella(0.09);"
+"ds2020-328_386" "255" "pfam04332" "gnl|CDD|367905" "1.67088e-13" "22" "162" "1" "pfam04332, DUF475, Protein of unknown function (DUF475). Predicted to be an integral membrane protein with multiple membrane spans." "Bacteria(1.00);" "(1.00);" "Mycobacteriaceae(0.29);Sphingomonadaceae(0.14);Streptococcaceae(0.14);Xanthomonadaceae(0.14);Deinococcaceae(0.14);" "Mycobacterium(0.29);Deinococcus(0.14);Streptomyces(0.14);Lactococcus(0.14);Xylella(0.14);"
+"ds2020-328_388" "255" "pfam05919" "gnl|CDD|253459" "2.68273e-30" "4" "237" "-1" "pfam05919, Mitovir_RNA_pol, Mitovirus RNA-dependent RNA polymerase. This family consists of several Mitovirus RNA-dependent RNA polymerase proteins. The family also contains fragment matches in the mitochondria of Arabidopsis thaliana." "Viruses(0.90);Eukaryota(0.10);" "Riboviria(0.90);(0.10);" "Narnaviridae(0.90);Ceratobasidiaceae(0.10);" "Mitovirus(0.90);Thanatephorus(0.10);"
+"ds2020-328_395" "254" "pfam02123" "gnl|CDD|280316" "3.0801e-11" "25" "240" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_4" "2545" "pfam00177" "gnl|CDD|365924" "1.11505e-28" "229" "618" "1" "pfam00177, Ribosomal_S7, Ribosomal protein S7p/S5e. This family contains ribosomal protein S7 from prokaryotes and S5 from eukaryotes." "Bacteria(0.79);Archaea(0.11);Eukaryota(0.10);" "(1.00);" "(0.09);Clostridiaceae(0.04);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Ruminococcaceae(0.01);" "(0.04);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);Desulfovibrio(0.01);"
+"ds2020-328_401" "253" "pfam02123" "gnl|CDD|280316" "1.12879e-10" "29" "193" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_414" "251" "pfam02123" "gnl|CDD|280316" "1.26275e-09" "31" "234" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_415" "251" "pfam01058" "gnl|CDD|376447" "2.16687e-17" "20" "229" "-2" "pfam01058, Oxidored_q6, NADH ubiquinone oxidoreductase, 20 Kd subunit. " "Bacteria(0.70);Archaea(0.30);" "(1.00);" "(0.05);Syntrophobacteraceae(0.04);Aquificaceae(0.04);Methanosarcinaceae(0.04);Thermococcaceae(0.04);" "Methanosarcina(0.04);Syntrophobacter(0.04);Pyrococcus(0.03);Geobacter(0.03);Methanococcus(0.03);"
+"ds2020-328_419" "250" "pfam10369" "gnl|CDD|378420" "1.59899e-17" "75" "212" "-3" "pfam10369, ALS_ss_C, Small subunit of acetolactate synthase. ALS_ss_C is the C-terminal half of a family of proteins which are the small subunits of acetolactate synthase. Acetolactate synthase is a tetrameric enzyme, containing probably two large and two small subunits, which catalyzes the first step in branched-chain amino acid biosynthesis. This reaction is sensitive to certain herbicides." "Bacteria(0.90);Archaea(0.06);Eukaryota(0.04);" "(1.00);" "(0.07);Clostridiaceae(0.06);Lachnospiraceae(0.05);Ruminococcaceae(0.03);Peptococcaceae(0.03);" "Clostridium(0.06);(0.05);Eubacterium(0.03);Ruminococcus(0.02);Roseburia(0.02);"
+"ds2020-328_43" "644" "pfam00078" "gnl|CDD|365856" "2.15977e-08" "190" "636" "-3" "pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses." "Eukaryota(0.62);Viruses(0.23);Bacteria(0.15);" "(0.77);Ortervirales(0.21);Poxviridae(0.02);" "Retroviridae(0.15);Drosophilidae(0.15);Brassicaceae(0.12);Enterobacteriaceae(0.09);Caulimoviridae(0.06);" "Drosophila(0.15);Arabidopsis(0.12);Lentivirus(0.08);Escherichia(0.08);Bombyx(0.05);"
+"ds2020-328_430" "248" "pfam00931" "gnl|CDD|366375" "1.82192e-16" "27" "245" "-1" "pfam00931, NB-ARC, NB-ARC domain. " "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.75);Solanaceae(0.12);Hominidae(0.12);" "Arabidopsis(0.75);Solanum(0.12);Homo(0.12);"
+"ds2020-328_431" "247" "pfam01788" "gnl|CDD|366811" "4.75718e-09" "24" "116" "3" "pfam01788, PsbJ, PsbJ. This family consists of the photosystem II reaction centre protein PsbJ from plants and Cyanobacteria. In Synechocystis sp. PCC 6803 PsbJ regulates the number of photosystem II centers in thylakoid membranes, it is a predicted 4kDa protein with one membrane spanning domain." "Bacteria(0.65);Eukaryota(0.35);" "(1.00);" "Microcoleaceae(0.12);Prochloraceae(0.08);Oscillatoriaceae(0.08);Synechococcaceae(0.08);Chroococcaceae(0.08);" "Oscillatoria(0.08);Prochlorococcus(0.08);Synechococcus(0.08);Ectocarpus(0.04);Arenga(0.04);"
+"ds2020-328_432" "247" "pfam00116" "gnl|CDD|365885" "2.6628e-32" "16" "159" "1" "pfam00116, COX2, Cytochrome C oxidase subunit II, periplasmic domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.09);Sordariaceae(0.09);Phasianidae(0.09);Cercopithecidae(0.09);Schizosaccharomycetaceae(0.09);" "Gallus(0.09);Triticum(0.09);Sus(0.09);Neurospora(0.09);Oryzias(0.09);"
+"ds2020-328_452" no_hit
+"ds2020-328_457" no_hit
+"ds2020-328_462" "244" "pfam02123" "gnl|CDD|280316" "7.52004e-11" "18" "236" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_464" "244" "pfam00421" "gnl|CDD|366090" "1.67641e-26" "57" "242" "-3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_47" "623" "pfam00346" "gnl|CDD|366043" "7.39818e-56" "191" "496" "-2" "pfam00346, Complex1_49kDa, Respiratory-chain NADH dehydrogenase, 49 Kd subunit. " "Bacteria(0.80);Eukaryota(0.11);Archaea(0.09);" "(1.00);" "(0.06);Rhodobacteraceae(0.02);Acetobacteraceae(0.02);Campylobacteraceae(0.02);Rhodospirillaceae(0.02);" "(0.01);Geobacter(0.01);Campylobacter(0.01);Archaeoglobus(0.01);"
+"ds2020-328_473" "243" "pfam00146" "gnl|CDD|376297" "3.36196e-12" "16" "114" "1" "pfam00146, NADHdh, NADH dehydrogenase. " "Bacteria(0.78);Archaea(0.12);Eukaryota(0.10);" "(1.00);" "(0.04);Peptococcaceae(0.02);Flavobacteriaceae(0.02);Desulfurococcaceae(0.02);Prevotellaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.01);"
+"ds2020-328_476" "243" "pfam02123" "gnl|CDD|280316" "1.20816e-09" "22" "237" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_485" no_hit
+"ds2020-328_490" "241" "pfam00016" "gnl|CDD|365810" "1.89423e-13" "2" "121" "2" "pfam00016, RuBisCO_large, Ribulose bisphosphate carboxylase large chain, catalytic domain. The C-terminal domain of RuBisCO large chain is the catalytic domain adopting a TIM barrel fold." "Bacteria(0.89);Eukaryota(0.05);Archaea(0.05);" "(1.00);" "Rhodospirillaceae(0.11);Oceanospirillaceae(0.11);Rhodobacteraceae(0.11);Prochloraceae(0.05);Thalassiosiraceae(0.05);" "Marinomonas(0.11);Magnetospirillum(0.05);Saccharomonospora(0.05);Rhodospirillum(0.05);Paenibacillus(0.05);"
+"ds2020-328_491" "241" "pfam02123" "gnl|CDD|280316" "7.45437e-11" "2" "241" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_497" "240" "pfam01501" "gnl|CDD|279798" "4.58533e-06" "38" "202" "2" "pfam01501, Glyco_transf_8, Glycosyl transferase family 8. This family includes enzymes that transfer sugar residues to donor molecules. Members of this family are involved in lipopolysaccharide biosynthesis and glycogen synthesis. This family includes Lipopolysaccharide galactosyltransferase, lipopolysaccharide glucosyltransferase 1, and glycogenin glucosyltransferase." "Eukaryota(0.62);Bacteria(0.38);" "(1.00);" "Brassicaceae(0.54);Enterobacteriaceae(0.12);Pasteurellaceae(0.12);Helicobacteraceae(0.08);Bacillaceae(0.04);" "Arabidopsis(0.54);Haemophilus(0.08);Salmonella(0.08);Helicobacter(0.08);Bacillus(0.04);"
+"ds2020-328_50" "620" "pfam00115" "gnl|CDD|376293" "1.44178e-51" "78" "548" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_517" "237" "pfam00361" "gnl|CDD|366050" "5.54755e-11" "18" "224" "3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_52" "598" "pfam00115" "gnl|CDD|376293" "2.60011e-33" "21" "302" "3" "pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. " "Bacteria(0.87);Archaea(0.09);Eukaryota(0.04);" "(1.00);" "(0.07);Sulfolobaceae(0.03);Flavobacteriaceae(0.03);Bacillaceae(0.02);Burkholderiaceae(0.02);" "(0.03);Methylobacterium(0.01);Hyphomicrobium(0.01);Rhodanobacter(0.01);"
+"ds2020-328_536" "236" "pfam00453" "gnl|CDD|376335" "3.91827e-17" "51" "188" "3" "pfam00453, Ribosomal_L20, Ribosomal protein L20. " "Bacteria(0.90);Eukaryota(0.10);" "(1.00);" "(0.10);Clostridiaceae(0.05);Mycoplasmataceae(0.03);Spirochaetaceae(0.02);Synergistaceae(0.02);" "(0.06);Clostridium(0.04);Mycoplasma(0.03);Treponema(0.01);"
+"ds2020-328_560" "233" "pfam00421" "gnl|CDD|366090" "1.00705e-37" "17" "232" "2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_562" "233" "pfam00201" "gnl|CDD|278624" "3.71727e-13" "22" "195" "1" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-328_564" "232" "pfam00119" "gnl|CDD|376294" "2.43866e-07" "4" "201" "-2" "pfam00119, ATP-synt_A, ATP synthase A chain. " "Bacteria(0.92);Eukaryota(0.08);" "(1.00);" "(0.05);Flavobacteriaceae(0.03);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Bacillaceae(0.02);" "(0.03);Clostridium(0.03);Mycoplasma(0.02);Bacteroides(0.02);Prevotella(0.02);"
+"ds2020-328_565" "232" "pfam00119" "gnl|CDD|376294" "4.75161e-06" "106" "189" "-2" "pfam00119, ATP-synt_A, ATP synthase A chain. " "Bacteria(0.92);Eukaryota(0.08);" "(1.00);" "(0.05);Flavobacteriaceae(0.03);Clostridiaceae(0.03);Mycoplasmataceae(0.03);Bacillaceae(0.02);" "(0.03);Clostridium(0.03);Mycoplasma(0.02);Bacteroides(0.02);Prevotella(0.02);"
+"ds2020-328_568" "232" "pfam00160" "gnl|CDD|365914" "7.47948e-06" "91" "231" "-2" "pfam00160, Pro_isomerase, Cyclophilin type peptidyl-prolyl cis-trans isomerase/CLD. The peptidyl-prolyl cis-trans isomerases, also known as cyclophilins, share this domain of about 109 amino acids. Cyclophilins have been found in all organisms studied so far and catalyze peptidyl-prolyl isomerisation during which the peptide bond preceding proline (the peptidyl-prolyl bond) is stabilized in the cis conformation. Mammalian cyclophilin A (CypA) is a major cellular target for the immunosuppressive drug cyclosporin A (CsA). Other roles for cyclophilins may include chaperone and cell signalling function." "Bacteria(0.57);Eukaryota(0.41);Archaea(0.02);" "(1.00);" "Flavobacteriaceae(0.09);Theileriidae(0.04);Babesiidae(0.04);Cryptococcaceae(0.04);Vibrionaceae(0.04);" "Cryptococcus(0.04);Vibrio(0.04);Gloeobacter(0.04);Babesia(0.04);Theileria(0.04);"
+"ds2020-328_579" "230" "pfam09220" "gnl|CDD|370369" "3.32926e-12" "15" "212" "3" "pfam09220, LA-virus_coat, L-A virus, major coat protein. Members of this family form the major coat protein of the Saccharomyces cerevisiae L-A virus." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(1.00);" "Debaryomyces(1.00);"
+"ds2020-328_58" "561" "pfam17921" "gnl|CDD|375431" "1.48639e-11" "411" "551" "-2" "pfam17921, Integrase_H2C2, Integrase zinc binding domain. This zinc binding domain is found in a wide variety of integrase proteins." "unknown" "unknown" "unknown" "unknown"
+"ds2020-328_594" "229" "pfam02123" "gnl|CDD|280316" "5.55224e-12" "25" "213" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_597" "229" "pfam00421" "gnl|CDD|366090" "5.55907e-21" "15" "218" "3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_600" "229" "pfam05518" "gnl|CDD|253234" "1.13476e-09" "26" "229" "2" "pfam05518, Totivirus_coat, Totivirus coat protein. " "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(1.00);" "Victorivirus(0.57);Leishmaniavirus(0.29);(0.14);"
+"ds2020-328_604" "228" "pfam01333" "gnl|CDD|366578" "1.59517e-20" "54" "218" "3" "pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034." "Bacteria(0.82);Eukaryota(0.18);" "(1.00);" "Synechococcaceae(0.18);Prochloraceae(0.07);Aphanothecaceae(0.07);Nostocaceae(0.05);Microcoleaceae(0.05);" "Synechococcus(0.14);Prochlorococcus(0.07);Gloeobacter(0.04);Oscillatoria(0.04);Nostoc(0.04);"
+"ds2020-328_609" "228" "pfam00006" "gnl|CDD|376291" "1.76934e-18" "20" "211" "2" "pfam00006, ATP-synt_ab, ATP synthase alpha/beta family, nucleotide-binding domain. This entry includes the ATP synthase alpha and beta subunits, the ATP synthase associated with flagella and the termination factor Rho." "Bacteria(0.88);Archaea(0.07);Eukaryota(0.05);" "(1.00);" "(0.07);Mycoplasmataceae(0.06);Clostridiaceae(0.04);Spirochaetaceae(0.03);Rhodobacteraceae(0.02);" "Mycoplasma(0.06);(0.03);Clostridium(0.03);Treponema(0.01);Persephonella(0.01);"
+"ds2020-328_611" "228" "pfam00421" "gnl|CDD|366090" "2.00297e-10" "23" "226" "-3" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_62" "551" "pfam02123" "gnl|CDD|280316" "7.88589e-16" "4" "294" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_624" "226" "pfam00421" "gnl|CDD|366090" "2.78889e-19" "14" "193" "2" "pfam00421, PSII, Photosystem II protein. " "Bacteria(0.79);Eukaryota(0.21);" "(1.00);" "Gloeobacteraceae(0.14);Synechococcaceae(0.14);Prochloraceae(0.14);Acaryochloridaceae(0.14);Nostocaceae(0.07);" "Acaryochloris(0.14);Gloeobacter(0.14);Prochlorococcus(0.14);Synechococcus(0.14);Nostoc(0.07);"
+"ds2020-328_625" "226" "pfam01660" "gnl|CDD|366745" "1.80876e-05" "15" "209" "3" "pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily." "Viruses(1.00);" "Riboviria(1.00);" "Betaflexiviridae(0.23);Alphaflexiviridae(0.21);Virgaviridae(0.15);Tymoviridae(0.14);Bromoviridae(0.10);" "Potexvirus(0.16);Carlavirus(0.11);Tymovirus(0.08);Tobamovirus(0.07);Alphavirus(0.05);"
+"ds2020-328_634" "225" "pfam13041" "gnl|CDD|372443" "6.23279e-08" "54" "185" "-2" "pfam13041, PPR_2, PPR repeat family. This repeat has no known function. It is about 35 amino acids long and is found in up to 18 copies in some proteins. The family appears to be greatly expanded in plants and fungi. The repeat has been called PPR." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.30);Euphorbiaceae(0.25);Salicaceae(0.16);Funariaceae(0.05);Poaceae(0.04);" "Arabidopsis(0.30);Ricinus(0.25);Populus(0.16);Physcomitrella(0.05);Naegleria(0.03);"
+"ds2020-328_641" "225" "pfam04392" "gnl|CDD|367921" "7.39814e-09" "28" "177" "-1" "pfam04392, ABC_sub_bind, ABC transporter substrate binding protein. This family contains many hypothetical proteins and some ABC transporter substrate binding proteins." "Bacteria(1.00);" "(1.00);" "Streptococcaceae(0.33);Phyllobacteriaceae(0.17);Pseudomonadaceae(0.17);Rickettsiaceae(0.17);Aquificaceae(0.17);" "Streptococcus(0.33);Rickettsia(0.17);Pseudomonas(0.17);Mesorhizobium(0.17);Aquifex(0.17);"
+"ds2020-328_654" "224" "pfam00223" "gnl|CDD|365957" "8.28468e-21" "41" "205" "-2" "pfam00223, PsaA_PsaB, Photosystem I psaA/psaB protein. " "Bacteria(0.83);Eukaryota(0.17);" "(1.00);" "Prochloraceae(0.28);Synechococcaceae(0.11);Gloeobacteraceae(0.11);Acaryochloridaceae(0.11);Funariaceae(0.06);" "Prochlorococcus(0.28);Acaryochloris(0.11);Gloeobacter(0.11);(0.06);Selaginella(0.06);"
+"ds2020-328_657" no_hit
+"ds2020-328_659" "223" "pfam01809" "gnl|CDD|376620" "7.3686e-08" "121" "189" "-2" "pfam01809, Haemolytic, Haemolytic domain. This domain has haemolytic activity. It is found in short (73-103 amino acid) proteins and contains three conserved cysteine residues." "Bacteria(0.99);Eukaryota(0.01);" "(1.00);" "Clostridiaceae(0.07);(0.06);Ruminococcaceae(0.03);Flavobacteriaceae(0.02);Eubacteriaceae(0.02);" "Clostridium(0.07);(0.05);Eubacterium(0.02);Ruminococcus(0.02);Lactobacillus(0.01);"
+"ds2020-328_66" "532" "pfam09044" "gnl|CDD|370259" "2.02105e-23" "65" "373" "-1" "pfam09044, Kp4, Kp4. Members of this fungal family of toxins specifically inhibit voltage-gated calcium channels in mammalian cells. They adopt an alpha/beta-sandwich structure, comprising a five-stranded antiparallel beta-sheet with two antiparallel alpha-helices lying at approximately 45 degrees to these strands." "Eukaryota(1.00);" "(1.00);" "Hypocreaceae(0.29);Aspergillaceae(0.21);Nectriaceae(0.21);Glomerellaceae(0.14);Clavicipitaceae(0.07);" "Trichoderma(0.29);Aspergillus(0.21);Fusarium(0.21);Colletotrichum(0.14);Metarhizium(0.07);"
+"ds2020-328_675" "222" "pfam02468" "gnl|CDD|367094" "3.35789e-17" "22" "123" "1" "pfam02468, PsbN, Photosystem II reaction centre N protein (psbN). This is a family of small proteins encoded on the chloroplast genome. psbN is involved in photosystem II during photosynthesis, but its exact role is unknown." "Bacteria(0.88);Eukaryota(0.12);" "(1.00);" "Synechococcaceae(0.15);Nostocaceae(0.07);Prochloraceae(0.07);Aphanothecaceae(0.07);Microcoleaceae(0.05);" "Synechococcus(0.12);Prochlorococcus(0.07);Cyanobacterium(0.05);(0.03);Trichodesmium(0.03);"
+"ds2020-328_677" "222" "pfam00978" "gnl|CDD|250270" "1.73152e-12" "24" "206" "-2" "pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(0.35);Virgaviridae(0.32);Closteroviridae(0.16);Togaviridae(0.10);Betaflexiviridae(0.03);" "Tobamovirus(0.13);Ilarvirus(0.10);Alphavirus(0.10);Cucumovirus(0.10);Bromovirus(0.10);"
+"ds2020-328_681" "222" "pfam00562" "gnl|CDD|366167" "2.61251e-09" "26" "145" "-3" "pfam00562, RNA_pol_Rpb2_6, RNA polymerase Rpb2, domain 6. RNA polymerases catalyze the DNA dependent polymerization of RNA. Prokaryotes contain a single RNA polymerase compared to three in eukaryotes (not including mitochondrial. and chloroplast polymerases). This domain represents the hybrid binding domain and the wall domain. The hybrid binding domain binds the nascent RNA strand / template DNA strand in the Pol II transcription elongation complex. This domain contains the important structural motifs, switch 3 and the flap loop and binds an active site metal ion. This domain is also involved in binding to Rpb1 and Rpb3. Many of the bacterial members contain large insertions within this domain, as region known as dispensable region 2 (DRII)." "Bacteria(0.49);Eukaryota(0.34);Archaea(0.09);Viruses(0.08);" "(0.92);Iridoviridae(0.05);Mimiviridae(0.02);Asfarviridae(0.02);" "Iridoviridae(0.05);Hexamitidae(0.05);Trichomonadidae(0.03);Poaceae(0.03);Cryptosporidiidae(0.03);" "Giardia(0.05);Cryptosporidium(0.03);Trichomonas(0.03);Plasmodium(0.03);Rhodopirellula(0.02);"
+"ds2020-328_687" no_hit
+"ds2020-328_689" "222" "pfam02670" "gnl|CDD|335036" "5.85343e-14" "34" "135" "1" "pfam02670, DXP_reductoisom, 1-deoxy-D-xylulose 5-phosphate reductoisomerase. This is a family of 1-deoxy-D-xylulose 5-phosphate reductoisomerases. This enzyme catalyzes the formation of 2-C-methyl-D-erythritol 4-phosphate from 1-deoxy-D-xylulose-5-phosphate in the presence of NADPH. This reaction is part of the terpenoid biosynthesis pathway." "Bacteria(0.96);Eukaryota(0.04);" "(1.00);" "Bacillaceae(0.05);Vibrionaceae(0.05);Corynebacteriaceae(0.04);Pasteurellaceae(0.04);Pseudomonadaceae(0.04);" "Bacillus(0.05);Clostridium(0.04);Corynebacterium(0.04);Pseudomonas(0.04);Vibrio(0.04);"
+"ds2020-328_69" "528" "pfam01660" "gnl|CDD|366745" "2.23499e-10" "222" "500" "-2" "pfam01660, Vmethyltransf, Viral methyltransferase. This RNA methyltransferase domain is found in a wide range of ssRNA viruses, including Hordei-, Tobra-, Tobamo-, Bromo-, Clostero- and Caliciviruses. This methyltransferase is involved in mRNA capping. Capping of mRNA enhances its stability. This usually occurs in the nucleus. Therefore, many viruses that replicate in the cytoplasm encode their own. This is a specific guanine-7-methyltransferase domain involved in viral mRNA cap0 synthesis. Specificity for guanine 7 position is shown by NMR in and in vivo role in cap synthesis. Based on secondary structure prediction, the basic fold is believed to be similar to the common AdoMet-dependent methyltransferase fold. A curious feature of this methyltransferase domain is that it together with flanking sequences seems to have guanylyltransferase activity coupled to the methyltransferase activity. The domain is found throughout the so-called Alphavirus superfamily, (including alphaviruses and several other groups). It forms the defining, unique feature of this superfamily." "Viruses(1.00);" "Riboviria(1.00);" "Betaflexiviridae(0.23);Alphaflexiviridae(0.21);Virgaviridae(0.15);Tymoviridae(0.14);Bromoviridae(0.10);" "Potexvirus(0.16);Carlavirus(0.11);Tymovirus(0.08);Tobamovirus(0.07);Alphavirus(0.05);"
+"ds2020-328_691" "221" "pfam00329" "gnl|CDD|376317" "1.3793e-18" "81" "197" "-1" "pfam00329, Complex1_30kDa, Respiratory-chain NADH dehydrogenase, 30 Kd subunit. " "Bacteria(0.79);Archaea(0.12);Eukaryota(0.09);" "(1.00);" "(0.05);Peptococcaceae(0.02);Bacteroidaceae(0.02);Desulfurococcaceae(0.02);Rhodobacteraceae(0.01);" "Bacteroides(0.02);(0.02);Prevotella(0.01);Geobacter(0.01);"
+"ds2020-328_7" "2116" "pfam01787" "gnl|CDD|366810" "1.27327e-63" "325" "936" "-2" "pfam01787, Ilar_coat, Ilarvirus coat protein. This family consists of various coat proteins from the ilarviruses part of the Bromoviridae, members include apple mosaic virus and prune dwarf virus. The ilarvirus coat protein is required to initiate replication of the viral genome in host plants. Members of the Bromoviridae have a positive stand ssRNA genome with no DNA stage in there replication." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(1.00);" "Ilarvirus(1.00);"
+"ds2020-328_7" "2116" "pfam01573" "gnl|CDD|279858" "6.78673e-46" "1134" "1835" "-3" "pfam01573, Bromo_MP, Bromovirus movement protein. " "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(1.00);" "Ilarvirus(0.50);Alfamovirus(0.50);"
+"ds2020-328_704" "220" "pfam05724" "gnl|CDD|368581" "5.77087e-08" "38" "196" "2" "pfam05724, TPMT, Thiopurine S-methyltransferase (TPMT). This family consists of thiopurine S-methyltransferase proteins from both eukaryotes and prokaryotes. Thiopurine S-methyltransferase (TPMT) is a cytosolic enzyme that catalyzes S-methylation of aromatic and heterocyclic sulfhydryl compounds, including anticancer and immunosuppressive thiopurines." "Bacteria(0.55);Eukaryota(0.45);" "(1.00);" "Pseudomonadaceae(0.27);Brassicaceae(0.18);Muridae(0.09);Vibrionaceae(0.09);Hominidae(0.09);" "Pseudomonas(0.27);Batis(0.09);Ralstonia(0.09);Arabidopsis(0.09);Brassica(0.09);"
+"ds2020-328_724" "219" "pfam02123" "gnl|CDD|280316" "1.52156e-13" "35" "199" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_746" "217" "pfam02123" "gnl|CDD|280316" "4.96199e-13" "13" "210" "-2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_750" "216" "pfam02123" "gnl|CDD|280316" "7.51118e-17" "8" "214" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_761" "215" "pfam02123" "gnl|CDD|280316" "4.08427e-09" "37" "198" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_763" "215" "pfam00201" "gnl|CDD|278624" "6.35685e-07" "113" "193" "-2" "pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. " "Eukaryota(1.00);" "(1.00);" "Hominidae(0.46);Muridae(0.31);Leporidae(0.15);Poaceae(0.08);" "Homo(0.46);Rattus(0.31);Oryctolagus(0.15);Zea(0.08);"
+"ds2020-328_768" "215" "pfam02123" "gnl|CDD|280316" "5.01402e-08" "33" "209" "3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_775" "214" "pfam00361" "gnl|CDD|366050" "1.62796e-10" "59" "196" "-1" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_784" "213" "pfam07727" "gnl|CDD|369488" "2.2825e-05" "25" "93" "-1" "pfam07727, RVT_2, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. This Pfam entry includes reverse transcriptases not recognized by the pfam00078 model." "Eukaryota(1.00);" "(1.00);" "Debaryomycetaceae(0.83);Saccharomycetaceae(0.17);" "Candida(0.50);Debaryomyces(0.33);Saccharomyces(0.17);"
+"ds2020-328_788" "213" "pfam00069" "gnl|CDD|365850" "1.68423e-10" "23" "193" "2" "pfam00069, Pkinase, Protein kinase domain. " "Eukaryota(1.00);" "(1.00);" "Saccharomycetaceae(0.31);Hominidae(0.17);Muridae(0.14);Schizosaccharomycetaceae(0.11);Drosophilidae(0.06);" "Saccharomyces(0.31);Homo(0.17);Schizosaccharomyces(0.11);Rattus(0.08);Drosophila(0.06);"
+"ds2020-328_79" "507" "pfam00507" "gnl|CDD|376344" "3.59591e-31" "17" "244" "2" "pfam00507, Oxidored_q4, NADH-ubiquinone/plastoquinone oxidoreductase, chain 3. " "Bacteria(0.80);Eukaryota(0.13);Archaea(0.07);" "(1.00);" "(0.04);Prevotellaceae(0.02);Cytophagaceae(0.02);Sphingobacteriaceae(0.02);Desulfobulbaceae(0.02);" "(0.02);Prevotella(0.02);Bacteroides(0.02);Geobacter(0.01);"
+"ds2020-328_79" "507" "pfam00164" "gnl|CDD|333891" "1.13503e-12" "341" "493" "2" "pfam00164, Ribosom_S12_S23, Ribosomal protein S12/S23. This protein is known as S12 in bacteria and archaea and S23 in eukaryotes." "Bacteria(0.45);Eukaryota(0.27);Archaea(0.27);" "(1.00);" "Thermococcaceae(0.09);Micrococcaceae(0.09);Enterobacteriaceae(0.09);Thermaceae(0.09);Muridae(0.09);" "Thermococcus(0.09);Saccharomyces(0.09);Rickettsia(0.09);Synechococcus(0.09);Thermus(0.09);"
+"ds2020-328_808" "212" "pfam03822" "gnl|CDD|367678" "6.58628e-13" "73" "189" "-3" "pfam03822, NAF, NAF domain. " "Eukaryota(1.00);" "(1.00);" "Poaceae(0.30);Brassicaceae(0.18);Solanaceae(0.12);Musaceae(0.09);Fabaceae(0.08);" "Solanum(0.11);Musa(0.09);Brassica(0.09);Glycine(0.08);Arabidopsis(0.07);"
+"ds2020-328_817" "211" "pfam03732" "gnl|CDD|367628" "2.37772e-05" "26" "208" "2" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
+"ds2020-328_821" "211" "pfam03732" "gnl|CDD|367628" "4.10271e-05" "96" "200" "-3" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
+"ds2020-328_825" no_hit
+"ds2020-328_830" "211" "pfam00978" "gnl|CDD|250270" "2.36362e-14" "16" "201" "1" "pfam00978, RdRP_2, RNA dependent RNA polymerase. This family may represent an RNA dependent RNA polymerase. The family also contains the following proteins: 2A protein from bromoviruses putative RNA dependent RNA polymerase from tobamoviruses Non structural polyprotein from togaviruses." "Viruses(1.00);" "Riboviria(1.00);" "Bromoviridae(0.35);Virgaviridae(0.32);Closteroviridae(0.16);Togaviridae(0.10);Betaflexiviridae(0.03);" "Tobamovirus(0.13);Ilarvirus(0.10);Alphavirus(0.10);Cucumovirus(0.10);Bromovirus(0.10);"
+"ds2020-328_84" "501" "pfam00284" "gnl|CDD|366000" "1.57316e-21" "211" "324" "-1" "pfam00284, Cytochrom_B559a, Lumenal portion of Cytochrome b559, alpha (gene psbE) subunit. This family is the lumenal portion of cytochrome b559 alpha chain, matches to this family should be accompanied by a match to the pfam00283 family also. The Prosite pattern pattern matches the transmembrane region of the cytochrome b559 alpha and beta subunits." "Bacteria(0.86);Eukaryota(0.14);" "(1.00);" "Synechococcaceae(0.17);Microcoleaceae(0.09);Aphanothecaceae(0.09);Prochloraceae(0.06);Phaeodactylaceae(0.03);" "Synechococcus(0.17);Prochlorococcus(0.06);Stanieria(0.03);Acaryochloris(0.03);Selaginella(0.03);"
+"ds2020-328_84" "501" "pfam00283" "gnl|CDD|365999" "1.14937e-08" "346" "432" "-1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-328_84" "501" "pfam00283" "gnl|CDD|365999" "2.11473e-07" "100" "186" "-1" "pfam00283, Cytochrom_B559, Cytochrome b559, alpha (gene psbE) and beta (gene psbF)subunits. " "Bacteria(0.59);Eukaryota(0.41);" "(1.00);" "Synechococcaceae(0.29);Prochloraceae(0.12);Pseudanabaenaceae(0.06);Acaryochloridaceae(0.06);Thalassiosiraceae(0.06);" "Synechococcus(0.29);Prochlorococcus(0.12);Selaginella(0.06);Gloeobacter(0.06);Thalassiosira(0.06);"
+"ds2020-328_843" "210" "pfam03514" "gnl|CDD|335361" "1.72129e-13" "26" "130" "2" "pfam03514, GRAS, GRAS domain family. Proteins in the GRAS (GAI, RGA, SCR) family are known as major players in gibberellin (GA) signaling, which regulates various aspects of plant growth and development. Mutation of the SCARECROW (SCR) gene results in a radial pattern defect, loss of a ground tissue layer, in the root. The PAT1 protein is involved in phytochrome A signal transduction. A sequence, structure and evolutionary analysis showed that the GRAS family emerged in bacteria and belongs to the Rossmann-fold, AdoMET (SAM)-dependent methyltransferase superfamily. All bacterial, and a subset of plant GRAS proteins, are predicted to be active and function as small-molecule methylases. Several plant GRAS proteins lack one or more AdoMet (SAM)-binding residues while preserving their substrate-binding residues. Although GRAS proteins are implicated to function as transcriptional factors, the above analysis suggests that they instead might either modify or bind small molecules." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.80);Poaceae(0.13);Solanaceae(0.07);" "Arabidopsis(0.80);Oryza(0.07);Solanum(0.07);Zea(0.03);Triticum(0.03);"
+"ds2020-328_863" "209" "pfam02123" "gnl|CDD|280316" "7.16978e-05" "38" "181" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_867" "209" "pfam02123" "gnl|CDD|280316" "3.29677e-10" "13" "186" "-3" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_87" "488" "pfam02123" "gnl|CDD|280316" "1.40535e-08" "300" "467" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_872" "209" "pfam08497" "gnl|CDD|378013" "5.53746e-25" "38" "181" "-2" "pfam08497, Radical_SAM_N, Radical SAM N-terminal. This domain tends to occur to the N-terminus of the pfam04055 domain in hypothetical bacterial proteins." "Bacteria(0.94);Archaea(0.06);" "(1.00);" "Clostridiaceae(0.11);(0.10);Prevotellaceae(0.06);Lachnospiraceae(0.05);Ruminococcaceae(0.04);" "Clostridium(0.11);(0.08);Prevotella(0.05);Eubacterium(0.04);Ruminococcus(0.03);"
+"ds2020-328_891" "208" "pfam02123" "gnl|CDD|280316" "2.76435e-10" "31" "150" "1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_893" "208" "pfam02123" "gnl|CDD|280316" "1.90193e-07" "35" "181" "2" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_9" "1487" "pfam00361" "gnl|CDD|366050" "2.3647e-49" "715" "1476" "-3" "pfam00361, Proton_antipo_M, Proton-conducting membrane transporter. This is a family of membrane transporters that inlcudes some 7 of potentially 14-16 TM regions. In many instances the family forms part of complex I that catalyzes the transfer of two electrons from NADH to ubiquinone in a reaction that is associated with proton translocation across the membrane, and in this context is a combination predominantly of subunits 2, 4, 5, 14, L, M and N. In many bacterial species these proteins are probable stand-alone transporters not coupled with oxidoreduction. The family in total represents homologs across the phyla." "Eukaryota(0.54);Bacteria(0.46);" "(1.00);" "Culicidae(0.23);Rhodobacteraceae(0.23);Poaceae(0.15);Enterobacteriaceae(0.15);Phasianidae(0.08);" "Paracoccus(0.23);Anopheles(0.23);Escherichia(0.15);Zea(0.15);Aspergillus(0.08);"
+"ds2020-328_90" "476" "pfam01578" "gnl|CDD|307628" "6.70073e-11" "145" "399" "-3" "pfam01578, Cytochrom_C_asm, Cytochrome C assembly protein. This family consists of various proteins involved in cytochrome c assembly from mitochondria and bacteria; CycK from Rhizobium, CcmC from E. coli and Paracoccus denitrificans and orf240 from wheat mitochondria. The members of this family are probably integral membrane proteins with six predicted transmembrane helices. It has been proposed that members of this family comprise a membrane component of an ABC (ATP binding cassette) transporter complex. It is also proposed that this transporter is necessary for transport of some component needed for cytochrome c assembly. One member CycK contains a putative heme-binding motif, orf240 also contains a putative heme-binding motif and is a proposed ABC transporter with c-type heme as its proposed substrate. However it seems unlikely that all members of this family transport heme nor c-type apocytochromes because CcmC in the putative CcmABC transporter transports neither. CcmF forms a working module with CcmH and CcmI, CcmFHI, and itself is unlikely to bind haem directly." "Bacteria(0.56);Eukaryota(0.38);Archaea(0.05);" "(1.00);" "Enterobacteriaceae(0.10);Pasteurellaceae(0.08);Histionidae(0.05);Marchantiaceae(0.05);Archaeoglobaceae(0.05);" "Escherichia(0.08);Reclinomonas(0.05);Archaeoglobus(0.05);Marchantia(0.05);Bradyrhizobium(0.05);"
+"ds2020-328_904" no_hit
+"ds2020-328_908" "207" "pfam02123" "gnl|CDD|280316" "5.3529e-06" "4" "207" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_921" no_hit
+"ds2020-328_97" "461" "pfam02123" "gnl|CDD|280316" "5.16988e-30" "39" "461" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_98" "458" "pfam02123" "gnl|CDD|280316" "1.94825e-26" "27" "443" "-1" "pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus." "Viruses(1.00);" "Riboviria(1.00);" "Totiviridae(0.44);Solemoviridae(0.19);Luteoviridae(0.15);Reoviridae(0.15);Chrysoviridae(0.07);" "Sobemovirus(0.19);Rotavirus(0.15);Victorivirus(0.15);Polerovirus(0.11);Totivirus(0.11);"
+"ds2020-328_99" "458" "pfam03732" "gnl|CDD|367628" "7.72961e-07" "256" "441" "1" "pfam03732, Retrotrans_gag, Retrotransposon gag protein. Gag or Capsid-like proteins from LTR retrotransposons. There is a central motif QGXXEXXXXXFXXLXXH that is common to Retroviridae gag-proteins, but is poorly conserved." "Eukaryota(1.00);" "(1.00);" "Brassicaceae(0.58);Poaceae(0.29);Tetraodontidae(0.04);Solanaceae(0.02);Plantaginaceae(0.02);" "Arabidopsis(0.58);Oryza(0.18);Sorghum(0.05);Takifugu(0.04);Zea(0.04);"
diff -r 000000000000 -r b82ce29791e7 test-data/otu_s2_tblastx.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/otu_s2_tblastx.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,139 @@
+#algo query_id nb_reads query_length accession description organism percentIdentity nb_hsps queryOverlap hitOverlap evalue score tax_id taxonomy sequence
+TBLASTX ds2020-328_275 16 279
+TBLASTX ds2020-328_625 13 226 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 90.7 3 100 17.0 1.9242059400026399e-29 420.172 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGGCCGCCCGCCATACTGAGCGTCTCATGCAGTACACTACCTACAAGACTAGTAGACCTGATGAAGTTCATGAACCGAACTTTTGTGAAAACACATTCCAGGACTGCTCCTTGCAAGGTAAGTATGCCATGGCAATCCATTCCACTTCGGATTTACCCTTAGGTGAGCTCTGTGAGAGCTTAAGGAAGAAGGGAGTGATTCGTCTATCCCGACC
+TBLASTX ds2020-328_196 14 318 NC_033468 Wuhan insect virus 27 strain WHZM10130 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 27 45.3 1 100 6.0 2.90542e-27 118.644 1923731 Viruses;Wuhan insect virus 27 GGTCGGGATAGACGTTTAGCAGCCTTAAACTCTTCATCTTCAGGGTATTGTGAGTGATATGCTCCCGTAGGTGCCCACTGCCACCTCTTATTCCAATAACTTTTCCACTTTATGTTATCTGGTTTACTCCCGAGGTTTTTCAATCTAGTGAACATTTCTCCACTAGCCCTGTATATCTGCTCTCTAGTGAAAGAAGCGACGTTGGGTTTGGTTCTGTGCTCTTTCTCGGCTTTCCAATCCACTTCTCCTATACCTCTGTTGACTAAAACTTCCATTTCAAAGAATGGTTTTAAGTTGAGCGGTGCGTCTATCCCGACC
+TBLASTX ds2020-328_638 4 225 NC_030890 Arabidopsis halleri partitivirus 1 gene for capsid protein, complete cds Arabidopsis halleri partitivirus 1 48.2 1 100 10.0 1.45353e-08 55.5941 1849335 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Arabidopsis halleri partitivirus 1 GTCGGGATAGACGTACCAGTCAACTTTTTGCAATTTTCTTCATACATCACATGGTATGACTTGGTTTGCCCAAGTCCGCGATGTAGCCGCAGCCGAAGCCTCGTCTTTCGAAGGCTCAGGCACCCTGGCTGATTGTCCCCCATTCGGGATAACGTCAAACCAGGTAGTTGTTAACTACTTGGCCCCAGCCACACTGCCAACGTCCCCTATTCGTCTATCCCGACC
+TBLASTX ds2020-328_858 2 210
+TBLASTX ds2020-328_761 8 215
+TBLASTX ds2020-328_553 2 234
+TBLASTX ds2020-328_845 11 210 NC_003689 Cherry virus A, complete genome Cherry virus A 75.0 2 100 5.0 5.449000000000025e-19 225.74040000000002 42882 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Tymovirales;Betaflexiviridae;Capillovirus;Cherry virus A GCCGTGGACCTAGTTAGGAGAGTAATTTCGGATGGTGTTCTTTACTGCTCTCTGATTTTCTGATAAGATTATCGCCGGCGTGGCTGCTACTCCCTCTGAAGCCTCTACTGCTGGCTTCGCAGTCAGGTGCAATAGATCCCTTGGATCTATCATATTCTCCCAGATATAATTTACAAGGCCCCTTCTTATCACGTTGTAATTCTTATACAC
+TBLASTX ds2020-328_483 8 242 NC_033495 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA4 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 50.0 1 100 13.0 1.155e-07 52.8449 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGAATTAACCCATGTAATGGCACAATCGAAGGCTCTAGCCGTGGCCGTTGCACGGATAACGAGAGGGAAGGGGCGGCACGACGCATCTGTAGAAGATTTCATCTTCTACATAGCCTCAAACGGGCGTGCCGTCTCCGCTTCGGATATACCATCCGGAGTCCATAGCTTGGCTTGCGGTCCTCGTGACCATGTGGAACCCTCTGAGCGTTTACCAGCGTCTATCCCGACC
+TBLASTX ds2020-328_910 2 207
+TBLASTX ds2020-328_531 10 236
+TBLASTX ds2020-328_893 4 208
+TBLASTX ds2020-328_507 26 238
+TBLASTX ds2020-328_594 8 229
+TBLASTX ds2020-328_600 4 229 NC_014823 Tolypocladium cylindrosporum virus 1, complete genome Tolypocladium cylindrosporum virus 1 55.8 2 100 7.0 8.34655e-06 145.07119999999998 939923 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Victorivirus;Tolypocladium cylindrosporum virus 1 GGTGGGGATAGACGTTTTGGTTCCTTCTAAAGGCCGCGCCCTCTCCCGCCCAATTGATGGTTCCCTGCTTGTTGAAGCGGGATACCCTACTGCTCATGCCTTGGCTGAGGATTTTGTTGGACTTTCTAAGAAGTACACTAATTTCTATGCCACGTCCGAGTACGCGTCCCTGGCTGACCTGGTTGAACACCTCATCCATGGTTTAGCTCCAACCTCCGTATATCCCGAC
+TBLASTX ds2020-328_765 8 215
+TBLASTX ds2020-328_575 4 231 NC_003710 Discula destructiva virus 2 segment 1, complete genome Discula destructiva virus 2 69.0 4 100 20.0 0.00012443 208.6303 160484 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Discula destructiva virus 2 GGTCGGGATAGACGTACGTCTGGCATGAGTATGGGTGTATTAATGAAATACCACACCATGGCGTCCCAAACATTCTTCCACTTTTGCTTCTCAACCTGATCTGTCACAGGTTTTCCATTGAAGGAAGAGAAGTTCACGTTCTGTTTCAACACGTCAAACGCGACGCGTATCAACCACGCTGGTACTTTCGTATCAAAAGCGGAAAAATCTATGACCACGTCTATCCCGACC
+TBLASTX ds2020-328_229 20 299 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 61.8 2 100 13.0 9.88605e-10 217.03480000000002 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GTTACATGCATTGGACTCGCGACTTGAATTACGGCGGTCGGGATAGACGTTGTTCGCGGATGGAGAGGTACAACATGGATAAATTCTACTTTAAATTTTTGCTATGTGGCTATTGCACTCCAAAATATGGAACGTATACATGGTGTAAGTTGTGTATTATATGTAGATCATGGCGGAGATGATATAGATTTAGGATTAAGTGAACCTGCCATGCTGCCATTGTTCCTAGAAATAATGGATAGCATGCTGTTCAAGGCGAATAAATGGAAACAAATGTCCGATCCACGTCTATCCCGACC
+TBLASTX ds2020-328_172 14 338 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 57.5 3 100 14.0 2.4114403333333332e-05 280.4185 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B ATTACGGCGGTCGGGATAGACGGAGGGCGTCCTTCTAGCACCCCCGACACGCGAGCGCTGACATTTGCGTCATTGGCGTCTCTCCCGACTGGGAATCTGTTTGGGAGCACGTTTTCACAATTGTAAAACGCAAAGTTGGCAAGGACGTAACTCGTTGTATCTGTTCCATAGATTGCACGGAGCTTGCCCCATTCATACTTTGTTGATGCCCAAGCGTGTATTTCGGGGTTGCGTGATGTGAAGTATTCGATGTCAAAAGATGGCATGTTCGATATCATTATGAACTTGTTTTTGAGAGCGCGGTCAGTTCTGATGAGAACATCTCGTCTATCCCGACC
+TBLASTX ds2020-328_293 15 272 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 67.1 1 100 5.0 8.1393e-29 123.409 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGCCTCGCAGGAATTCAGCTATAGCTCCGAATGCACATTTAGAGGGTTGTGTCCGTATACAAAGCCTCTGTCCTCTCTGTAGTGTGAAGCGGGTTATCTCAAGTGATGTCGTTCCCAGAAGTACATCGTCACCGTTGTGTAGTGAAGAGCCAACCTCTTTCATCGGACCTAACATGAAGTCAGTGTAGACGGCATTCAGGACGGAGTTAAGGAACGTAGTAAGTCGGTAACCTGACAGCAGAATCCCGTCTATCCCGACC
+TBLASTX ds2020-328_746 2 217 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 52.5 2 100 8.0 0.000128888 153.5807 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GGTCGGGATAGACGCGTCACCCCCATTATGTAAACTGTTTCCTCGCTTCAACGTGTCTTCAGATATCGCTTTTGTGTATATATAATTCAATATACTGTTCATGAATGTTGTCAGTCTCCAGCCTGACAGCAGTGTGTCTTTCGCCCTGTATGTACGCTTCGTACCAACATTGTCATGTATTACCTGGTTGCCTACAGATTCAGCCGTCCATAAGGCC
+TBLASTX ds2020-328_768 6 215
+TBLASTX ds2020-328_337 18 265
+TBLASTX ds2020-328_328 8 267 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 37.5 1 100 7.0 1.12376e-11 66.4405 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GTCTAGTACTACATCCATATTTGAGAGCCACGTCCGCCAACATTGCGAGTTTGCCACATATGACAGACTGTTATTAGGTAAACTTTCTACATTCCCAAACCATGAACTTTTCAATTTTCTGGCTCTACCAAATTCACTTATCTCTTCACTTTCGTTCCAACGTTCTATATTAAGATTTACCCGTTTTGTAAATTTGTTATTACCGTTTAACATGCTCACTTTTTCCAGACCGCATGTCTCTAAATTTGATGTTATAGCTTCTACATT
+TBLASTX ds2020-328_476 6 243
+TBLASTX ds2020-328_71 18 526 NC_033465 Wuhan insect virus 26 strain WHZM10161 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 26 47.4 1 100 6.0 1.70533e-19 93.8794 1923730 Viruses;Wuhan insect virus 26 GGTCGGGATAGACGGAGACTAAGAGTGGGCAGAAAGTCGAATGACGGGGGGCAATACCTACCGAGAGCTATAGCGACGTTAGTGCACTCGCGGATAGAGAGCGGACCAGCAACTTCATTAGCTGATGCACTGAGATCAAACGAAATACGTCTGTATGAAGCAATAGAGCGGGGTATGGACGCCGAAATAGCATTGAAACTACGGTCGTTGTATATATCACGAGTGGCGCCTTTGTACGGTAATAACAGGCAAGAAGCTATGGAGCTATTAGAGGCGTCGTCTGTAGTAGGAGGACTGAGTATGGACAGGGAGGCCAGAGTAGACAAAACATTTACGGAAACTGAGCCAACGTCGAAGGAGTCTGACGAAATAATGAACTTGGCGGGACACAGAAAATGGAGGGGAGTGTCAGACATGGCCAACGTGGTACTAGAAAAAATATCTGAACAAGGAGGAAGTGCCATAACGATAAAAAACATAACGAAGCGAATTTATAATTATAAGCTGAGTGCGTTGTCTATAAAAA
+TBLASTX ds2020-328_241 10 293 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 43.6 2 100 14.0 1.22557e-10 81.7433 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGTAGACGGCGGAGTGTACTTGATACCTTTCGAATTCACGGGGTAGATTTTGTCGGCATATTCGTCTGGCTCGGGCAAAGGAATGGTAGGAAATTCTTTCGGCTGCGAAATTAAAGTGGCGTCAGAAGTATATGACAAAGGGAGTTTCTCACGACGTCTGTACCTGTAGAGGTACTGGTCCCAGACCTGATAGCCGGTTGATGACATGTCTGTCGTCCAGCACATCACCGAATCGAATTCTGGATGCTCAACTCGGGCAGTGTAACAAACATCATCAGCGAACCGGCC
+TBLASTX ds2020-328_391 21 254
+TBLASTX ds2020-328_668 2 223 NC_005977 Penicillium stoloniferum virus S segment 2, complete genome Wuhan insect virus 27 48.5 1 100 13.0 1.11015e-17 85.8359 1923731 Viruses;Wuhan insect virus 27 GGTCGGGATAGACGTGGGATGTGGCTATGCCGAGTTCCGTGGACTGGTCCTATCCCACTAAAACGAGGCGTTCAACCCTCTCTCAGCAGTGGGCGCGTGTTTCAACGTCCTACGCAATGTTCTTCGAGATGTCGGCGGGTCTGTCGACCGGTCAATCTGCGCAAGGCAGTCATGCACAAATGGTAGAAGTGACTATTATAGAGGGAGTACGTCTATCCCGACC
+TBLASTX ds2020-328_920 2 207 NC_033477 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA2 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 50.0 1 100 5.0 2.52205e-05 44.5971 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGGGGATTTAAATTTTAATTAGCATCAAGACGAACATTCCGAGGTCGCACCCCCCCGTCTTACTGTAGCAGGCATGGCAAACCTGACCCGTTTACGCACGCTTGTTACGTCCGGTGAGCTCGAGGTGGTGTCAGCCGCAGCTGTTCTCTTCCACCTTTCTCGGAATCCAACCCTACATGACGTCTATCCCGACC
+TBLASTX ds2020-328_428 15 248 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 44.8 3 100 10.0 2.988626666666667e-05 175.03 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GAAGAGCTGTCGGGAGTGGAACAAGTTGTGGGATAGTAGGGGGCAGTGGGGTGCTGCGGGAAGCACGCATTCGCAGTACCAGGAGGACATGGCTTACGTCCTCAAGGACGACATAAGGCTCAAGAATAAGTTCATTACCATATCGAACATGCCGCGCTTTCCCATGACAAGATTTACAAACAGACCGCAGGAGATACAGGCTTGGGCGTCCACTAAGTACGAATGGGGCGGGGTCGTCTATCCCGACC
+TBLASTX ds2020-328_395 2 254 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 60.8 1 100 5.0 4.53232e-23 104.164 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGATAGACGGTCTGCCCCCTTCTGTGGTCAACTCTCAAGAACTCTGCTATGGCCCCAAATGCACATTTCGAGCTCTGCAACCTCACACCAAACTTGTGCGCGTTTGCCTGACATGCTTGAGCACATGCTAGGTTATTTGTTCCTATGAGTACGTCGTCCCCGTTGTGCAAGCTTGAGCCTGGTGTTCTCCACTCTTTTGCTATCTTCGATGTGTAGACGAAGTTCAGCACGCTGTTACGTCTATCCCACC
+TBLASTX ds2020-328_361 6 260
+TBLASTX ds2020-328_414 6 251 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 53.0 2 100 9.0 0.0001746225 154.7177 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGAGGCTACGTGGTAAACAGAGTAGCGGGGGTTTTGAAAGACAGATTACCATATTGTCTAGACTTTGAGGATTTCAACAGCCAGCACAGTCTATCAAGTATGCAAGCGGTCATAGATGCGTACTATGAAGTATTCGGGCCGAATATGTCGGAAGGGCAGAGACAGGCAGTACTTTGGACAAGAGAATCACTGTCTAATAACGTGGTACATGATAATATGGGTACACGTCTATCCCGACC
+TBLASTX ds2020-328_983 0 61 NC_036592 Pleurochrysis carterae circular virus isolate PcCV-1, complete genome Pleurochrysis carterae circular virus 100.0 8 100 21.0 0.0002522995 315.9968999999999 2057942 Viruses;Shotokuvirae;Cressdnaviricota;Arfiviricetes;Cirlivirales;Circoviridae;Pleurochrysis carterae circular virus TTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGTTAGGGT
+TBLASTX ds2020-328_492 7 241
+TBLASTX ds2020-328_381 4 256 NC_003710 Discula destructiva virus 2 segment 1, complete genome Discula destructiva virus 2 44.0 1 100 13.0 7.29476e-19 90.2231 160484 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Discula destructiva virus 2 GGTCGGGATAGACGCGCCAGCTGATGTATCAGTTCGAAGATACTGACCTACTTCGTGCCAATCACACGGTTCTTCACGGTGACTAAGGGTGAACCTCTCACGTGTAGCAGAGACCGCCTTGCGCAGCAAGGTTGATTCGCGTTCAGTTAGATCAGACCAACGTTTGTGTTGGCCTTCAAACTTCATCAAAGAGTTATACAGTCCGGGTAAACCGGCACCTCTTCGGGTAAAACCACAATTTTCGTCTATCCCGACC
+TBLASTX ds2020-328_886 8 208
+TBLASTX ds2020-328_902 13 207 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 38.6 1 100 6.0 9.22662e-09 55.9603 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGCTTAACCATGCTATCAATCTTTTTGACCTCCATTGTACCGTTCCCTTCCCCCAATATCACTGGTGAAAAGTGATTTTGGTCTCGCAATATTGTTACATTATTCTCTTGACTTCCATCATTATAATTAGTAACCCGTCCACTCTCTTTATCTAGCAATCTTAGGCCGAACCCCCCATGAGCGTCTATCCCGACC
+TBLASTX ds2020-328_512 10 238 NC_033494 Botryosphaeria dothidea virus 1 strain YZN115 segment RNA3 hypothetical protein gene, complete cds Botryosphaeria dothidea virus 1 43.5 1 100 11.0 2.01783e-13 71.9341 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGAGTAGGGGCCATCAAGGAGAAGAACGCCAGGGAAACCATCAAACTTTGGCAACGCAGTTGAGATTGAATGGACGTTAATGTCATCGGTTGCCGGGATACGTTTGACTCCACGTGCGTTGATGGGAATGAGCTGATCGGCTGTGGCGTCAAACTGCATTGGTGGGCCGATATCAATTGTCGCTGGCTGGGGGAGTTTCGTGGTACTTATGACGCCGCGGCTGGTT
+TBLASTX ds2020-328_677 9 222 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 84.3 3 100 21.0 3.5279036738626664e-25 366.104 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGACTATCAGTGTTGAGGATAGGAGCGTTCATGTTCCTTTTTGTCACCGACCGTGCCACTTCTCTAAAGGTACTTTGCCTATTGGAAGTTTGACCTGTCATTAAGGTGGAATCCACTCCAGACTTTCCTTTATCCCATGAAACAAAATGGGATAAATCAAAAGAGCAGTCATCAAGTTCAACTGCAATATCATCCGGCGTCTATCCCACC
+TBLASTX ds2020-328_571 10 231 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 50.0 1 100 6.0 2.90834e-16 81.2538 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGAATCTGGCTATTTATGGGCCAAACCAAGTCTTAAACTCTTATCGTAGAGATGGACGAGCATATGTTTTCAATTCCAAACCCGAGTCGGTAGGGCATACGGCACTGTTATTCAAAATGTGCGAATCTTATCCTCCAAGAGAATTTAGGTCGCATGTAAGCATACCATCGGACGGGGATGAGATATTTATGGTAGCACAACGTCTATCCCGACCGCCGT
+TBLASTX ds2020-328_777 4 214
+TBLASTX ds2020-328_870 9 209
+TBLASTX ds2020-328_10 760 1434 NC_038512 Trichoplusia ni TED virus strain mutant FP-D ORF A, ORF B, and ORF C genes, complete cds Trichoplusia ni TED virus 31.5 3 100 7.0 4.12604e-15 129.2094 2083181 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Errantivirus;Trichoplusia ni TED virus GGTCGGGATAGACGTCTTCTCTTCGTCTACCGCAAATAGAATAGCCTCGCCCGGGAAATTAGTCCCCTTACTAAAAAAATCAAGCTTATAGTCAGGCACGGGATGGGATGATCCGCAGGTGGTCTGCTATTGCCTGCCTCTTGCCTTTCTCATTTAGGGCTTCCGGGTGACGTACACAATATAGAACTCTGAGAGTAACATCTGCCACCTTGCTGTACGGCCCGTGAGGGCTGGCTTTTCAAAGAGATACTTCAGCGGGTCCACCCTTGCAATCAGCATGGTCGTATAGTTCAACATGTAGTGGCGTAGGCGTTGCGAGGCCCGTGTAAGAGCACAACAGGTCTTTTCTAGAACCGTATACCTTGTCTCATAATCAGTGAACTTCTTGCTGAGATAGTATACGGCTCTTTCCTTCCTACCCGTTTCATCGTGCTGACCAAGGACACAACTCATGGATGCTTCCATTACTGACAGATACATCAGGAGAGGTCGACAGGCGTTGGCGGTGCCTGGATGGGAGGATTGAGTAGATATTTCTTAACTTTGTCAAACGCCTTTTGGCAATCCTCGTTCCTTGTGTCTATCTTTTCTGAAAGGCGGGGTATTCTTTCTGAGCAGTTTAAAGATCGGCTCACAGATGGGTGTGAGCTGGGCAATGAACCTGCTGATGTATTGTAGCCTGCCCCAAAAAGCCCTGATTTCTTTCTCTGTCTTTGGTACCGGCATGTCGATAATTGCTTTGCCTTTTGCAGGTCGACTTCGATTTCTCTTTTGCTGACAATGAACCCGAGTAGCTTACCTGACAAAGCACCAAACCCCCCTCCCGGCTTTCTTTTTCGGATGAAGACGAAGACTGTATTTCCGAAATCTGTCAAACACTTTCTTCAAATTCACCGTCTTCTTAAGCCCAAGACTTGGCGATCATGTCATCGACATAGACCTCCATTTCCTTGTGAATCATATCATGAAACAGCGCAGTCATGGCTCGCTGGTACGTCGCCCCGGTATTCTTTAGACCAAACGGCATCACCTTGTAACAGAACGTGCCCTCCTATCCGATATTGTGATAAACGCTCTGTCTTCCTCGGCCATCTTGATCTGGTTATATCAAGAGAAAGCATCCATAAAGGACAGCATCCCATGTCCAGCGGTGTTGTCCACCAGAACATCGATGTGAGGAAGAGGAAAAAAAGATTTTCGGCTTGCCTTGTTTAGGGTCTTTTGACTCACGGAACCAGCTTTCTGAGGGAAAAACCGTTCTCGAAAAGCGTGACCATCCAGTTGAATCTCGTTACCCTCCCGTGTGGTTATGGGGGCGCGCCCACTTTCCACTATTATGGAGCCGGGCCGCAAGCAAGTGAATGTGACCCCGCCCTCCATCAGCCGTTGTGTGTGAGCTTCGCTCCTTATAACTCTCCACCGTCTATCCCGACC
+TBLASTX ds2020-328_3 8577 2589 NC_026260 Sewage-associated circular DNA virus-18 isolate SaCV-18_NZ-BS3994-2012, complete genome Sewage-associated circular DNA virus-18 35.3 1 100 9.0 0.000149016 46.8882 1592085 Viruses;Sewage-associated circular DNA virus-18 TTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGTATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTG
CTAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCATAAAAAAGGG
+TBLASTX ds2020-328_882 20 208
+TBLASTX ds2020-328_115 32 426 NC_043491 Cladosporium fulvum T-1 virus LTR-retrotransposon encoding homologues to retroviral gag, pol, and env genes Cladosporium fulvum T-1 virus 39.7 1 100 5.0 7.5847e-27 117.911 2052899 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Metavirus;Cladosporium fulvum T-1 virus GGTCGGGATAGACGTAAGCACTGGTTCCTCCATAAGTGCCTTCTTCAACTCATTGAAGGCATGCTGGCATCGGGGCGTCCACTCCCACGCCTTGTTCTTCTTTAGCAAATCCGTCAAGGGGGCCGCAATGGCTGAATATCCCTTGATGAACCTGCGGTAGTAGTTAACCAATCCAAGGAATGACCGCAACTCAGGTACCTTGGTTGGTGGCTCCCATTCTTGAATGGCTCGCACCTTGCCCTCCTCCATGAGCAACTGTCCACCCCGTATCTTGTGACCAAGGAACTCCACCTCATTTTGGGCAAACGAGCATTTCTCCTTCTTCACATATAGGTTGTTCTCCCTCAGAACTTTGAACACCTGATGCAAGTGCTCGAGGTGCTCCTCTAGAGAATTGCTAAACACGCACCAACGTCTATCCCGACC
+TBLASTX ds2020-328_513 8 238 NC_038784 Verticillium dahliae chrysovirus 1 segment 1, complete sequence Verticillium dahliae chrysovirus 1 57.1 1 100 6.0 1.6282e-24 108.746 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGCCAGACACATCCATTTGCATCAGGGACACCCAATCCACCTTGACTTTCCAGCCCACGAATAACCTCACGCGGCAGATCTAGCCATTCTTCGTCTATTTTGACCCGGCACCAGTGGCTCAGAGCACCTATAACACATCCGCGCGCTATATCTTGATCGAAGCCTCTGCGCTCTAGTTTGTGCATTTGATCTCGGATACCAGCAACTCAGATCGTCTATCCCGACC
+TBLASTX ds2020-328_72 40 520 NC_030891 Sclerotium hydrophilum virus 1 isolate ShR#77 hypothetical protein genes, complete cds Sclerotium hydrophilum virus 1 30.4 1 100 25.0 5.98328e-21 98.7021 1895000 Viruses;Sclerotium hydrophilum virus 1 GGTCGGGATAGACGTTGCCCTCCCCTTTCTCTCCAGCCCGAACCTACCTCTCTCCCTATTCAATGGTGCCGCCTTAACTTCCGTCTTCTTGATGCGAGGAGCGTAGTAGTTGATGCGGGTCTGTATAACACGGTCCGCCTCTGCTATACGCTCAGTTAGGGCGTTCATCTCCTTCTTGTATTCCTGAACGATGTAGGCTTGCTCCCCTTGAATACGGCGGGCGGTTTGATACTCCGCCAACTCTGCCGCGCTCAACGTTGAATCGTCCACCGTCATATTGCGTCTGGCCGATACAATCTTGTAAAAAGCCATTATACATGGTACGGCCACGCTGGCGTGCTTAGCATACCAGACGGCATTCTCCGGAAGAATGTCCTGAGTTTGGTACATCTCCCTCAACCCCACTGTCCAGCGCTCCAAGGACTTTTCGTTGCCATTGAAGCTAGCACGTGGTTCCCTAGACTTTGCTGGGTCGAAGTCTTGGATGCGGGCCCACTCCATCCACACGTCTATCCCGACC
+TBLASTX ds2020-328_449 2 246 NC_017990 Botrytis porri RNA virus 1 RNA 1, complete genome Botrytis porri botybirnavirus 1 75.7 5 100 10.0 1.7255383031988e-20 352.20029999999997 1918014 Viruses;Orthornavirae;Botybirnavirus;Botrytis porri botybirnavirus 1 GGTCGGGATAGACGTGTGGAACTCAACGTGCCCACCGCAAGCTTCAACTGCTCCTGTTAGTGTATAAATCAGAAGGATAGGTAAACCGAGAACTTTGATGCAGAGGCAACCTGGCACTGTTGACGAGCCGTAGTTTACTACGATAGCGGTGGGAATTGAAGCCCACTGTAATCTCCCAACATCTAGGCCCATCAGGGTAAAGTGTGAGAATGAAATTCAAAATGCCCCACTTCGTCTATCCCGACC
+TBLASTX ds2020-328_122 22 418 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 86.9 3 100 33.0 8.71734076908784e-59 720.298 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCGCGACTTCTCTCTTTATGAACGGTGGGGCAATTCCTGGAACCTTTTTAAGGGTTTTTTATCAGGAGATATGGAAGTCGAAGGGTTTCTTGTTTCTGATCCACAATTCTTCGTTCCACTTACTGGAGTTCTTCATATGAAGAAATTGATAAGTGATGCTGGGAAGGTCCTTAGTGTTAAGGATTTACTCGAAGAACAGCGCGCTCTTGTTGCTTTAAAAATGCGCGAACAGATTGCTGAAAGGGAGAAAGCTGAAAAGAGTCGCCGAGAATATGAGAAGGCGATTATTCAACTTGCTGCTTGGACTAAAGCACATCCAGATGCTAAGGTTCCAAAAGGGCTTTCCGTGGAAGAACCACTGATGCCGGACGTTGTCAAGAAAGTGACGACGTCTATCCCGACC
+TBLASTX ds2020-328_529 6 236
+TBLASTX ds2020-328_421 8 249
+TBLASTX ds2020-328_642 4 225
+TBLASTX ds2020-328_87 54 488 NC_003823 Ustilago maydis virus H1, complete genome Ustilago maydis virus H1 60.9 1 100 5.0 9.72556e-33 137.736 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGTTCCTTGTTGCTTTTCTTACCATTATCTACAGTCCCTACAGCACCACTTTCATTTTTATCACTATTTCCAGTCATATTCATTCTGTTACTGTTAATCCCCATTGTTATTTTCCACTGCTCTGCCGTTGTCTCACTGTCCCATCGAAATCTTTGTGCTGCTCTTTCGAAACTCTTCTTCCATAACGCCTGTACTTTGCTCGTCTTCACTCCTCTCCTTTCTAAGACTGCCAGATTGGAGTATATTTCATGTAGTTTACTGTCAAATCCAACCACTCTGTCTGTTTCCCAGTTACCACAGACAAAAGTAGCACATGATCTAGCCAAGCACCCTCTGAGTTTGCCGTCTTTACACCCTAGAACACGTAGGTATTCATGGTAAGACTGATCCGTAAGCAACTTGACTTCTTGCCCCTTAAGATTACATTTAGTGGCAACTTCATTCCAAGCTAAAGCGCAATGCCGTCTATCCCGACC
+TBLASTX ds2020-328_214 30 308 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 34.1 2 100 6.0 2.15313e-12 87.81970000000001 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L GGTCGGGATAGACGGCATTAATATGTTAGGGTTATAAACCTTCACGTTAGAATATGTCAATTTTCCATTGTTAAATAACGCATACGTCTTTGGATTAACTTTAACTTTGATATCCAACTGCCTACCGGACTGTATTATTTCTATCCAATTCTTAGCCCTCTTTATTAAAGTGTGCATTGGCATTACAAACAGGTTTGCTGCTCCAGTCCCTGGTATATCTGGCATTACATGACCATTTGCATTTGCAGCCCAATTTTTGTATTTCTTACCAGTCATCGCATCATACACCGTAGACGTCTATCCCGACC
+TBLASTX ds2020-328_717 8 219 NC_038782 Verticillium dahliae chrysovirus 1 segment 2, complete sequence Verticillium dahliae chrysovirus 1 37.1 1 100 6.0 8.08632e-06 46.43 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGAAGGCCTAGAGTTGAATACATACGAACGATCACCGTGCCTAAAGGTACCTACCACATCACGGGGATTGTACACAACATAGTCTTGAACGTCTAGATCTACATCTATTGCTCCCCTGTCCATGCATTCTAGTAACATCCAGAAGCCTTTCACCAACCGAGTCAACTTAGATTGCCCAACAAAAACGCGCCAATGTCTATCCCGACC
+TBLASTX ds2020-328_351 20 261 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 40.5 1 100 7.0 1.87072e-15 78.9628 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGACGAGGGGCAGTATTGGGACGAACAGTTGCCGAGGTAGTGAACTACTTTGACAACAAATGTTCGAATGCACTTGAGGTTATGGCAGACGATAAATTTAGTGTATCCTATCATACTTACTATGACGTAGATAGGCCAGCTGTGTTGGGTTTGAATACAATGACTGTGAACGTACCGGTATATTGGACGAAGTTACCAGTAAAAATACAGCCTTACACATCAGAGCTTACCAGGGCGTCTATCCCGACC
+TBLASTX ds2020-328_418 18 250 NC_038826 Flammulina velutipes browning virus RdRp gene for RNA-dependent RNA polymerase, complete cds Flammulina velutipes browning virus 40.3 1 100 11.0 1.21395e-11 66.1329 568090 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Alphapartitivirus;Flammulina velutipes browning virus AGGTCGGGAAAAGCGATTGGCTTTAGGCGGCGCGAGGGACGGAACATCTTCTCGATAACACGAAGAGCTCTTTTGTAGTGGAAATCCCTTGGAACGTCGTGGTAAGGGAGGTCAGTCTTAAGGAAGTCTTCTTCTCCGGCGGCGGGGTTAGTTGCAGAACGGCGGTAGCCATTGATTGCTTCGTTTGCCAAATCGGGGGGACAGCACTTATAGATTGCCTTCTGACGTCTATCCCGACCGCCGTAATTCA
+TBLASTX ds2020-328_149 24 357 NC_007542 Penicillium chrysogenum virus segment 4, complete genome Penicillium chrysogenum virus 44.1 1 100 7.0 3.29805e-16 82.1702 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGGCGGTGTTGTAGCATGTAGCACTGGGACCTGAGGAACAACATTTGTGTGCTGAGGTTGGCGAAAGAAGATTAAATGACGTATCATTTTGGGTTAATGATAGCTTGGGTGGAAGGGAGGATGAAAATGAAGTAATTGGTTCCAGCCTAATAAATACAGATTACCCAGGAACAAAATGCGCCATGGTATACAGCTATGTAGAGGACAAATGGGTAGAAATGAGTAATAAAAATTACGGTGAGTATACAAGGAAAAGCTTCCATGGCGATGTGAGACCTAGTGTACCTTTAAGGCGAACAATGGAAAAAGAACCTGCACCTGTAACTTGGTGCGTCGTCTATCCCGACC
+TBLASTX ds2020-328_591 22 229
+TBLASTX ds2020-328_579 14 230
+TBLASTX ds2020-328_462 6 244 NC_040551 Panax notoginseng virus B isolate YNSL1212, complete genome Panax notoginseng virus B 73.3 1 100 5.0 2.01042e-34 141.737 2248770 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Panax notoginseng virus A GGTCGGGATAGACGGGAGCAATATATGGGGTGGATTTAACTTCGGCAACAGTAGCACACTTTGCCATGTTTAATTGTGAAGAAGCCTTGAAGCATAGGTTCCCGGTAGGTGAAGATGCGGAAGCCGGGCGTGTGCATAAGCGGCTAAAAGCTATGTTAGAAGGATGTGACTCGTACTGCTATGATTTCGATGATTTCAACGCTCAGCACTCGACGTCGAGTATGGTCGCTGTGATAAAGGCGTA
+TBLASTX ds2020-328_867 11 209
+TBLASTX ds2020-328_908 8 207 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 68.4 2 100 8.0 3.53985e-06 185.418 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGATGTTAAGTGCTGGCTGTTGAAGTCCTCAAAGTCTAGACAATATGGCAACCTATTCTTCAAGACACCCGCCACTCTGTTTACTACATTTCTGTCGTTTGCGTCTTTACCTACCGGGAATCTGTTCGGCAAGACGTTCTCGCAATTGTAGAACGCGAAGTTTGCAAGTACGTAACTCGTTCGTCTATCCCGACC
+TBLASTX ds2020-328_7 1825 2116 NC_008038 Prune dwarf virus, complete genome Prune dwarf virus 88.5 19 100 100 0.0 3998.4456999999993 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGTCACCACATCCTCCTTAAAGGGGCATCCTCACCTTACGGTGAGGGCATCTACAAATTTGTAGGCAATAAAAAGTGTCATCCATTCAGGATACAATGGGCATTTTTATCTTAACTTTTAACGCACGCAGTGCAAGTTAACCAAAAGGATTTAACATTCAGTGACAAAATCTGAATGGTGGATTCTATTGCAAAAGCAGCATCTCCAGCTACGAATATTCCTAGGAATACTCATAGTGGAGGTACAATCAAACAACGGATCATATAGTCATCCACTGACTATTTTATCCATTGCATCCATGAGAGCGGTATCCCGTTCAGCGTATAACACTGAATCAGGGATCTCGACTCTCTTGGGCATCGAGTGTTGTAGGTACTGAGTACAGAACCATACCGGAACGCCGGGCTGAAAAGCATTGTCATATTTTATGACAAACCAGAGATCATCTGGTATATCCCCGACGGTCATACCAGTAGGAGCAAGAATTTGCACCCCACTGGCTTGTTTCGCTGTGAACTTCCTACGTTGTAGGGGATTAGGCGCCACTGGCGCATTCACATCGAAACCTTTAATGAGTCCGTAGACACCATTAGAAACATCAAGGCAGTAACGAAAAACAATTCCGTATACCTTGGTATCAGCAGAAAAGTCCTTGAAAAGTTCTCGGACTTTCATGGTGTAGTAAACACCGGAAGCGGTCGAATTGACCGTCAAATTCTCGGTACGAGATATCATACCGGAAAAATTTTTTACGGGCACATTTGGCCCGTGAAGCATCCACTCGGAAACAGACTTCGAGCTTCCACCCGGGAATTGTTTCTTAACAAAACCAGCAGGGGGGGTAGTATTATTATTCTTCCGAGCTAAAGCAAAGCTTTGTGATCGGGTAGTAGGCTTTCCAGATTTAGTGGCTTTCCCAGACATTATGAGAGTATAAACAAACGAGAATTGGAAGAAATTGGTAAACAAAACGAGCTATTAACTCACAAAGTGAGTTAACCAATCGTTACACCAAAAGCTTCCTTGTCGGACTTCTCTTTTTTTAGAGGAACAGACTCGGCTTCCTTGAAACTGTCAAGGGAAGATTTACCCTTTACGGGTACAGCAATATTCTTAAAATCCACTGTTAAAGCCTTCTTTGACTCGTCAGACTTAATTTCAATAAGTCTGGGATTGATATCAACCTTTCCACTACTCCCAATTACCAAACGTGATTTGGCGAATGTTTGGAGTATCTTTACATTGTCCACAGCAGCAAGGGCTTCCGATTTCTCAATCGGGAATCTCAAAGTTGGGTACATTTTCTCATATGGTTTCTTCTTGTGCAATGAGTCATCCCAGAAGGGGTAAACAGTTCCAACAATCGACGCGTGTTTAGCGTCTACACTTACAGCTGATGCTAGTAAACATATACCATCTCCGTCATCAGCATGAACTGCTCTTGGCCATCTCGCTACGAAAATAGCCGCTTCATTCAATGGTGAATCTGTATCTATATCAATAGATTCACCTGTATTCACATTGAAAAGTTTCAATGTCAATACCCCACTAGTTGTTTCCAGAATGGTCGGAATGTACAACAAGTAAATTATACTATGATGCACGTACACATGACCTTTTGCTTTAGCGGATAATCTTGCCAAAGCGCTTCGGGATTCTTTGGATTGCAACTTCATGGGTTGAATTGGAACACCATTCTTCAACTGTAAAGAAAAACATTTCTTAGTTGGAAGATTCTT
CATCATAGTTTGGGAATAAAAGTCATCCACTTCGCTGAGTATTGTATTCCAATCTTCAGCGGAAACTTCAAATGCCGAACTGGTACTGGCTTCGGACGTCTGTCCGGTAATGGTCCTGGATACACCAGAGAAAGCCATATTCAATTCAGGAGATAAATCTACAACCGAATTGTTTCACTCAATAAAATAAAGAGGTTAATGAATAGGAACAAGTCCGATTAGTGAGATAAATCTCAAACGTCACAAACTTGTCTTCTTCACACTTTGCAAGAAACCTTGCAGTAACTCAATTTCTTGAGGGTTTATAGAGAACCGCACGTCTGTCAACTTCCACAGCTTAGCACAACCACGCGTCTATCCCGCCC
+TBLASTX ds2020-328_563 2 233
+TBLASTX ds2020-328_410 21 251 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 78.6 6 100 24.0 7.989507454006384e-19 381.2186 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGGCGGGATAGACGGCTATTGTGGTTGTTCGTATTTTAAAATGGATTCCCTACTTGAGTTTTTGCTACCTTCACATGAAGATGCGATCGAATTGGTTGATGCCAATTCGGTTAAGACTAGCTTCAGCTTGCCTGATTCTAGTGGGGATGTTTCCCCACTTTGTAGGTCGTTGTGTCAGTTCTTCGGATTTCTTATGATCCGAGATACTGTTGTCAGACCTGACAAATTTTCTGGTTTCGTCTATCCCGACC
+TBLASTX ds2020-328_646 23 224
+TBLASTX ds2020-328_537 38 235 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 47.7 1 100 6.0 1.50506e-11 65.6747 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGTTAGCACGGGTTGGAGTAGAGATTCAGTTAGGCAGATAGGTGACGATATGATGCAAACGCTCAGGGTATTGCTTGAGACGGCAGTTGTGGGACAAGAGAAGTTGTGTAGATTAGTTAAAGGGTACCTTTGGCTTCTAGAATGTATGGAAAGAGGTACTATAGATGTTACCGTGGATAGCCAGAATTGTGTAATTTATGGGCCAAATGCGTCTATCCCGACC
+TBLASTX ds2020-328_26 164 872 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 89.0 8 100 65.0 4.21136e-103 1500.4649 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGATAAACTGGGCTTCTCAGCTTGAGTATGCGTAACATACACAGCGGAGGCATCCACCTCAACTTGAGACAGAGCATTTATAGGTTTCACTTTAATAGACCTAAGAATATGTCTTTTTGTCTTAACAGGAGTCTTCTTTCTATAGAAGAACTTAGACAAAGCATATACCGTATCAGCAGGATTTCGGTATGTAATCGTTTGTTTCACATGATCACCTTTCAAAACATGGTGCTTCAGGAGAAACATATCATTCCTGGAAATAAACGGTATTTGTTCAGTGTCACCAAAGGCTATAACCTCTGATAAACCGGCAATTGCGTCTATCCCGACCNNNNNNNNNNGCGGTCGGATAGACGCAGCCCCCTCACCTCTTCTTCAACCTCATCTCCCTCTTTTGTTTCCAGCACCGGCAATTGTGGCAGCAGCATATATGCACCCAGCATGTTGCATGAAACACTCATCAAACAACATCTTCTTTGCCTTGGGAGCATTGTTTGTCATCAGATAGGAATCGCAAGTTCGAATGAACCTGCTTTTAACTAACTGGGATCCCTCAACAGCTTCTTTCAACTCAATTGCAGAAGATCTGTTGGAAGTCAAGAGTAGGTCTATATCATCTCCAACCATGGAGGCAATAGACTTGATCTTGGTAGTTTTTCCACAACCAGCAACACCGTCCATGATTGTGATTGAAAAATCACAATTCATCTTCAAAGCCTTTTCCAGTGAAGGTATAACCTTCTCCACTGATGAGAATACACAAGAGTCATCAACAATGACAATTTCGTATTCTCCGACAGATCGTACGCAGGCAGCGGACACATTTCCGGCATCATCCCACCATTCCGTCTATCCCGACC
+TBLASTX ds2020-328_246 39 291
+TBLASTX ds2020-328_409 6 252 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 48.6 1 100 7.0 7.72171e-14 73.4643 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus ACAGAGGTCTTTCTCGAACGTAAAGCTGCCTAAGGTTGTATCAGGCTACGATCTAATGGTGCCAGCATTTATGCACACAAACTCACAACTAGACAAACCAATACTGTCAATGCAAATGGCCAAATAGATTGGTAGGTTGCATCAAATGCTACTATTCATGAATGTTAAAGACATTCTAACAGCTGCTGAACTAAGCACACATTGAACTTTTGATCGTATTGATAGTAGTAGGTTGATTCGTCTATTCCGACC
+TBLASTX ds2020-328_401 2 253 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 52.1 2 100 8.0 2.658960000000012e-05 135.9315 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B TGGTCGGGATAGACATTGCGCGTCCCTGATTGTCATGCACTAGCACTCTGTCCAGCGATAGTCTGGTCCACTCCACAGCTGCCAGCTGCTCTTGAGTTAAGAAGTGACCAAACGTGTCCCTGTAGGCATCTATTACGGCCTTCATAGATTCCACACTGTGTTGACTGTTGAAATCTTCAAAGTCTACACAGTACTGAGTTCTGCCTTCTAAAACTGACCTCACTCTGATACGAACGTCTCGTCTATCCCGACC
+TBLASTX ds2020-328_374 14 257 NC_003885 Mycovirus FusoV RNA 1, complete sequence Fusarium solani virus 1 45.0 1 100 7.0 3.96088e-05 44.5971 1511847 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Gammapartitivirus;Fusarium solani virus 1 GGACGGGATAGACGACGGGCTCGGTTGCTCCAGGTAATTTCCTCCTTCGTAACAAAGTCAGTATATGCCAGACGATGTAAACTTTGTATTCGACAACGACCTCCCGGACGATGATGTGTTGGTTCATCCAGACATCACGGCGTTGGGCTCTCCGTCTTTAAAGACGAGACAACGTCAGTTCCGATCCGGAGCGTTATTTTCTGGTCCCGGTCTCAAAGAGATCGCTCGATATGGTGGTTACTCCGTCTATCCCGACC
+TBLASTX ds2020-328_390 16 254
+TBLASTX ds2020-328_413 6 251
+TBLASTX ds2020-328_58 39 561 NC_043491 Cladosporium fulvum T-1 virus LTR-retrotransposon encoding homologues to retroviral gag, pol, and env genes Cladosporium fulvum T-1 virus 45.8 3 100 6.0 1.5431e-35 185.1108 2052899 Viruses;Pararnavirae;Artverviricota;Revtraviricetes;Ortervirales;Metaviridae;Metavirus;Cladosporium fulvum T-1 virus TGGTCTGGATAGACGCCCGCTGCAAGTTATATGAGAACTGAGCAACATCCATCAACTTTGCCCAATTCCGCTGGTTGGCACTCACATAGTGCCTCAAGTAAAGCTCCAACAAGGCATTCACCCGTTCCGTCTGACCATCTGTCTGAGGGTGAAAGCTAGTTGAGAAGTTCAACTGTGAGCCAAGTAGCTTGAAGAGCTCCGTCCACAGCTTCCCTGTGAAGCGTCTATCCCGCCCNNNNNNNNNNGGTCGGGATGACGGTAGCATACTTGGTGAACCTGTCAACCACCACCAAAATTGAGCCACACCCTTCCGACTTGGGTAGACTCACAATGAAGTCCATGGATAAACTCTCCCATGGTCTGGTTGGAACTGGAAGTGGCTCTAGCAACCCGCCTGGCTGCTTCTGCAATGTCTTGTCTTGTTGGCATACAAGACAAGTCCGCACGAACGAGTCTACATCTTCCCGCATCTGTGGCCAATAATAAGCTTCACTCATCAAGGCTAATGTGCGATGAGTGAAGCTTATTATTGGCCACAGATGGCCACCGTCTATCCCGACC
+TBLASTX ds2020-328_595 8 229
+TBLASTX ds2020-328_692 10 221 NC_038838 Crimson clover cryptic virus 2 isolate IPP_IncarnatSK segment RNA 2, complete sequence Crimson clover cryptic virus 2 53.4 1 100 7.0 1.40883e-16 82.1702 1323528 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Betapartitivirus;Crimson clover cryptic virus 2 CCCCGCTTCCACACCCGCTCACTACTACTCCAAAGTGTATCAAATCTTTACGTCTGTCTTTAACCCAGCTTTGTTCCGCTCCTATCAACGCCGATCCGTTCTCGCCTCAATCGCTCTCGACCCCGTCACCTACCCCGACCGTCACATGAACTTCTTCGATCTCGTTTTCTCCGCTTCCCGCTCCAATCTCGCCGAACTCCGCGCAAACGTCTATCCCGACC
+TBLASTX ds2020-328_51 130 617
+TBLASTX ds2020-328_484 7 242
+TBLASTX ds2020-328_467 20 243 NC_038784 Verticillium dahliae chrysovirus 1 segment 1, complete sequence Verticillium dahliae chrysovirus 1 32.4 1 100 6.0 6.62632e-05 43.6807 759389 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Verticillium dahliae chrysovirus 1 GGTCGGGATAGACGGTCAGTCCCCCTTTGAAATCAAGCACCTCTAACCTCAGCTTGTTCCCCGTTATTATACCTACCATTTCGGCTCTAGTTACGGAGTTGCCATTACGTGTGACATAAGCCGCATATTCCGTATACTTGTCGCATATGCCTTTCAATTTCTCGGCTTCTTCATCCACTTCTTTATTGAACATCACATCTTCTAAACCACTACACTCACGTGGCTCCGTCGTCTATCCCGACC
+TBLASTX ds2020-328_593 14 229
+TBLASTX ds2020-328_332 10 266
+TBLASTX ds2020-328_724 2 219
+TBLASTX ds2020-328_921 20 206
+TBLASTX ds2020-328_136 40 372 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 59.4 1 100 6.0 7.87159e-34 140.821 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGTCAGACGGTTCTTCAGCGTCTATCCAGACCGCCGTTATTCTAGCAACGGCCGGCACGTTGGCATTCCCCTAGACACTGAATCGTCCAGACGCGACTCCAGCGCTTCCAAAAGGTCCCTCATATCGCTTGAAGGTTTTGACTCTATCCTCGAGTGTACCAAGGTTGCCATAGCTCTAGATAGATACTGTCCCTTAGACCCACGTTTGTGGTCTACGCGTAGAAACTCTGCTATGGCCCCATACGCACATTTGCTCATCTGCAGGCGTATGTTGTGCTTCTTGGCATTTTTGCCAGCTAGCAACACGTCCTCGAGCGAATTACTTCCCAGTAGCACGTCGTCACCGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_303 4 271
+TBLASTX ds2020-328_706 4 220 NC_003689 Cherry virus A, complete genome Cherry virus A 79.4 3 100 8.0 4.376753333333334e-21 351.4408 42882 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Tymovirales;Betaflexiviridae;Capillovirus;Cherry virus A GGTCGGGATAGACGAAATCATGTGCATTACTCAATGGGTTCTTGAAAACCAATCTTTTCTTGACTGCGCTCCAGAAAGTTAAATCATCATTAGCAAAATGTCTCGGGAAAACAGCTTCAGGGAGCATTGCGCAATTATCCTCCACCTGATCTTTCTGATTTGGCTCATCTTTGAACTGCTTGCTCCATCCGACACCAATCTCGACTAGGTCCACGGCTCT
+TBLASTX ds2020-328_463 6 244 NC_010985 Curvularia thermal tolerance virus RNA1, complete sequence Curvularia thermal tolerance virus 50.0 1 100 7.0 2.06484e-10 62.0091 421976 Viruses;Curvularia thermal tolerance virus GGTCGGGATAGACGATTGCCGTTGCTGAAAATGACGGGCATCAATTGGTTGGGGGATAAGAGCTTTGGTACCACAATTCTGGAAGATGACGAAGGATGTGGGCACCACCTCAGGTCACAGTTTCAACACGTTGATCCAATCTATTTGTACCTTGATGGTGGGCTATGCCGCACTCTTCGACCTGGTTCCTGATGAAGACTGGGATCGGCTCTGGCAGGAGGCGTAGCTCGCGTCTATCCCGACC
+TBLASTX ds2020-328_69 43 528 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 93.7 5 100 42.0 9.0761104e-87 1082.5864000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCATTGACATTAGGTTTGTACTGTCGGAATGAAGCCTCACACACTCTGGATAGAACCTTCGTGTCAACCAGTATGTGTCTTCTGGACACCGCTTCTAAAGAAGGGTGTACTACTGACGTAATATCAGTAGCCATGACCAAAGTTTTTGACTTCAGTTTGGTCAACCAGGCACAGGATCTTCCTGCATTCAACTCAATTCCAGGTTTATACCCGGAGCAATAGGTGATATCGATAATCATGACTCCATGAAAATCGGTTTTCCGCTCGACACGAAAGGCGGCATCACCTAGATCAACAGCATTGTAATGCAAATACTCCATAAGTGTAGAATACTTATGGTCATACCCCAAACAGGGTGCATCGACAAAGTCAAAATAAATTCTGTCTTTGTCCTTGTCCACATGCCAATCCACATTGAAATGATCTATGTGACCCCTGTCCTTAATGTACATCTCGGGATCGATCATAACAGAACAAATGAATTTCATCACGCTTATTTCGTCTATCCCGACC
+TBLASTX ds2020-328_861 4 210
+TBLASTX ds2020-328_2 8845 2632 NC_026260 Sewage-associated circular DNA virus-18 isolate SaCV-18_NZ-BS3994-2012, complete genome Sewage-associated circular DNA virus-18 35.3 1 100 9.0 0.000151579 46.8882 1592085 Viruses;Sewage-associated circular DNA virus-18 CCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTGCTTCCCTACGTATTAATCTTCTTCTTTTCTCCTTTTTCGCGTTTTCCTCTTATTCCTCTTTCGTTTTCCTCTTATTCTTTTTATACGCAATTTCTTTTTTAATTTCTTACTGGTCTAAGTCCCACTCCTCTTTCTCCCCGTTTTGCGTTAAGAATATTTCACATGGCATCGGTTTATAGCCTTTTTCCCTTGTCATCTCCTCTACAATCTTTTCTATTTTTTCATATTTCTTCTTATAAAATTCTTCCTCTTCTCTTCTCTTGCTTACTTGTATGGTTGCCGGAAATACTCTTGTTTCGCCTATTTGTATTTGTAGAGGCCATGTAGCATAGTCGTTTCCTTGTTGAGCCCCCTTACTTCTTTTAACTTCCATGTAGCTTCTTGCTGTCCAATCCCTTTTATCGTAGAATATCCTTTTAATTTTCTTTGTTTCTGAGTTTTCGTCTTGCTCTCTCTCTCCTTCATTTTCCTCGTCGCTTCCCTCCTGGTTTTCCTCCTCATATTCTTCCTTACTCTTAAATAGCTGCAAGAATCTCCTTCTTTTTTTCTCCTCTTTTTCTTCTTTCTTTTTTACGGGTATACACGCAAAATCTAACAGTGCCATTTCCTTCTCTTGTTCGCCCCATGTGTAGCATTCCTCACCATCGATTGTTTGTAATTCAAACATCAAATAACTTCCTCCCGCTGTGGTTTTAATCTTTTTTATTTTTACTTCATATATTTTTCCTTTTTTTGTTATAAAGATAACTTCTTTCTTTAGAATGTATTCTGCGGCCTCTGGGTTCAACTCCCTTTGATACGGTATGTTTATATTTTTTATGTACTGCTTCCATTTTTTTTGACTGTTTTTCATCTCCTTAGGATCGTCCTCAATAGGAATAAAGGTTCCCACGGTTTTGTTGTATGTTAAGATGACTTCCGTTGGTGTGCTTCTTTCCTTAAAATAGGGGCTCTTACACGCTCTTCTCATTATACACCCATATAAGGTTGCTACTATTCTTTCTTCCTCCAAATGCTCTATGTTTGATGAGAACCTAACCCTATAGAACCTTGCTCTAAAGGGTCCATGTTGTCTCATTATTTGAGGTAGTTTGTTGGCAATCATAACAATTGGTACATTTCTTTTCTTTTTGAATACTCTTGCATATTTGGAGTCTAATCTACATTCTTGTCCATCAAGTACCTTGAGAATAGTGTTTGCAAATGCCGTTCCTTCTGCTGTGGCGCCTATAAGGGAGCTCTCGTCGTTTGGTTCATGAAACTCATCGAATGCCCATAGATCATAGTAATCATTTGCTCCCGTAAAGTCATTTCTTCTTGCACTGGCAAAATAAATTCTTAATACTTTTGCTAGTAAGTGGAATAGTAATGTTTTTTGTGTGCTTGGTTCGCCATATATGAATAGTTGCTTTGTTTTTATGGGTCTCTTGAAGCATATTTGACACGCTATCCAATCTATAACGAGGTACTTTTCTCTTAGCTCTTCCACGTCATACTCCCTTGGTTCCCCTCTTTTTATTAGATAGGATACAATTCTTTCTAGGGTGTTTGTCTCTATATCTTTTAGTATCTTTAAATCTTCATAAGCTTCCTTCATTCTTGGTAGATGCATTAAAACTTTCTTTTGTAATATATCATCTCTATATACTTGGTACCAATCCTCCGTCTTCTCTAGTCTTTTGAGT
ATTTCTGATGGGTCTGGATTCCCCTGTGCTTCCTTATGTTGTTCATGTGCCTTTGCTAACCCTCTTGTTTGCTCTAAAGAGTATTCTCCCCATATTAATGGTTCTTTATCTTCCTTTAAAATATATTTGCAAATAGTTCCCCATCCCTTATGTGCCTTTACATCTATACATCTTCCATCCCACTCTTTGAATCCATTTCTAATTCCTTTTGCTAAATTGTTCTTTGATGCACTCTCATTCCATACTCCAATGTGGTAATGAAATCCTTTCTCTCCGTGATTTTCCTTTGCTATTATGACTGATCTGCATTGAAACATCTTGATGATTCTCTCCTTTATTACTCCCCTATCTATTTTTTTCCGTTCTGTCGTTTCCGCATGAATAAGTGTTATTAGTAAGTAGGGTCTTATAGTGTTTAGTTTCATGTTCATTGTGTTGTTTCTTTTCCGTGATTTCCTTTTCTTCTTTTGTTTGCGCTAGGTTATGGAGTTGCTGCTGTGAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGTGGATGTAACTTCTAGGTGGGAGTGGATGTAACTAATAGGGGGGTCCGGGGGAAGTGGGTCCCCCCCGGGCAAGAGACAAGATAGGTAACTCCAACATCCTCGTATGAAGAGTAAACAGAAGGGAAGTGAGGCTCCCTTATACAGGAGCCGAACGTTACTTCAATACCTATAAAGTTAAGGTAGTGCTCTTTTTGTTAAATACAAGCAGCCGACAACCCCGCCTAGCTCTAGTAATAGGGGTTGTCGGCGTATCGTCTGATTCTTCGGCGAATCGTCTGCTTTTTTTCTTTTTCCACTCGTGAAGCCCCCCCTTTCGCCCTTTTTTATGCAGACGATTCCCCGATCGGGGAATCGTCTG
+TBLASTX ds2020-328_728 14 218
+TBLASTX ds2020-328_139 20 368
+TBLASTX ds2020-328_711 4 220
+TBLASTX ds2020-328_310 8 270 NC_009890 Black raspberry virus F, complete genome Black raspberry virus F 45.6 1 100 5.0 1.39013e-19 92.709 463392 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Black raspberry virus F GGTCGGGATAGACGTCCGAAGGGTCTACATCTATTACGTCTGGCCTCATTCTGTGTTCACGTTCTTTAACCCAGTCTACTTGACCGTAGCCTCGATTAACAAGTGTATTTAACTCAAACATATCCGTCAGATCAAGTAAGTCCCTAGAGTGTAATGCCTTCAGTGTCACTGATACGTCCATCAGTTGTTCAAGCATTGCGTAGGTGTTTTCACACCACACTTTGTCTGAGTGGGTCAACAATAGAGCACCACAGACCGTCTATCCCGACC
+TBLASTX ds2020-328_891 4 208 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 77.6 1 100 5.0 4.9233e-29 123.409 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGATTTCGGGGGCTAGAAGATAGGGAAGGGCAAATGCATAAATTGTGGCGTGGCTTATATTCCGGGTGGCGAGGCACTACCTGGATAAACACTGTTCTAAATTTCTGCTATGTTCACATAGCGCTGGTGAACCTGGAAAGGATAACAGGGATAAGTGTTGTTTTAATGGTAGGCCACGGCGGCGTCTATCCCGACC
+TBLASTX ds2020-328_317 8 269 NC_030889 Arabidopsis halleri partitivirus 1 gene for RNA dependent RNA polymerase, complete cds Arabidopsis halleri partitivirus 1 50.0 1 100 9.0 6.80502e-15 77.13 1849335 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Arabidopsis halleri partitivirus 1 GGGCGGGATAGACGAATCGTCTCTCGTCCCCAAAGTAGTCTGCCTTTTGTGTCATCATTTAAGTATGTTGCTTGTAGTGTCCAAATGAACATGTTTTCTGCTTGTAATAGAAGCTTGGTAGCTCCGAATACTGCTCGAATTTTGTCAGGTTCATCAGATGCGACAACATGTGAGCGTGCGTGTAACGTGCTCCAATAGTATGGCACTGGCTGACCATCTTTCCAGAATGGAGTTAATCCATCCTTAATAAAGTGGATGAGTGATCGGTT
+TBLASTX ds2020-328_871 4 209
+TBLASTX ds2020-328_518 12 237 NC_007539 Penicillium chrysogenum virus segment 1, complete genome Penicillium chrysogenum virus 70.3 1 100 6.0 3.59992e-34 140.821 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGGCTTCTCTACTTGCTTTGTAGTCTGGTACTACGACTTTGTACCACTCTTCGTTCACTTCTGGAACCTTGTCTTTCAATTTCCAAACCATGTTATCTACATCGGGCACTCCTAGCCCGTTGTCTTCAACGCGCCCATGTATTATTGTCTGAGGCAAGTTAAGCCATTTTTCGCCATCTTTTACTCTGCACCAGTGACTTATGCACTGTAGCGTCTATCCCCACC
+TBLASTX ds2020-328_475 6 243
+TBLASTX ds2020-328_693 12 221
+TBLASTX ds2020-328_855 4 210 NC_055143 Rhizoctonia solani ourmia-like virus 1 RNA 1 isolate RsAG2 RNA-dependent RNA polymerase gene, partial cds Ustilago maydis virus H1 64.2 2 100 6.0 1.27988e-11 84.154 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGAGTTGGTGCATTAGAGGCGACGCTAAACCATCGTCGTTTAATGAATTCTCTAGAAACGGAGAATTATTTGTTAGTGGTGATTATGAATCCGCCACTGATAATCTAAACTCTGAGGTCCAACTCGCCATTCTTGACGAGCTGCTGCAGCGCTCTACTTCGGTACCCAGGGGTATCCAGGGCACGCGTCATCCCGACC
+TBLASTX ds2020-328_335 8 266 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 54.7 1 100 5.0 1.69281e-22 102.36 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L GGTCGGGATAGACGGATCGGAGGCATTAAGTAAAGAACAGTCTATGTCACTAGATTGGACAATTGAGTCAATCTCAGACCAAGTGGTAAGGTTTAATGAGTTAGGAAAAACAGAAAGAATAAATGGAACCTTATTAAGCGGATGGCGTCTGACCTCGTTTATCAATACTGTATTAAATAGAGTGTACTTGTTAAACTCAGGACTAAGTACGTGTGTGAACTATGCGTTACACAACGGTGATGAGATGTATGCGTCTATCCCGACCC
+TBLASTX ds2020-328_890 8 208
+TBLASTX ds2020-328_863 22 209
+TBLASTX ds2020-328_109 77 442 NC_038697 Scheffersomyces segobiensis virus L isolate NRRL Y-11571, complete genome Scheffersomyces segobiensis virus L 59.1 1 100 9.0 5.79157e-51 198.097 1300323 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Scheffersomyces segobiensis virus L TGAATTACGGCGGTCGGGATAGACGCACATACCCCCTCTTGATATTATCTCATCAAACCTGTTATTCATAGATCGTATCAACTCTCTGTAGTCGTTTGCTGGTGCCATCTCTACCCTGCCATGTACCGCTGTTGACACAGCTCTTGCCAGGTACTGCGAACTCGTTTTGTAACTCGCCCTCGTGTCCACCCGTAAGAACTCACCTATGGTCCCAATATTTGTCTTTGCTAATTGTGCTCTTATCCCTGCGTCCTTTGCTCTTTTAGCCAGCTTCACTGCCTGTGCTACGTTTTGCGTTGTAGCGTACATGTCATCTCCGTTGTGCAGTGCATAGTTCACGCTACTATCTAAGCCAACGCTAACGAGATAAACTCTGTTGAGTATGGTGTTTATGAAAGATGTCAATCTCCACCCACTCAGCAATGTTCCGTCTATCCCGACC
+TBLASTX ds2020-328_93 51 471 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 81.8 6 100 42.0 1.201325e-28 685.9264000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGAATTTTCTGGTGAGTTTATAACGCTTCCTTTCGTTATCGATCGGTTAAGAATGACATTCGATTTGGAGGATGATTATTCATTCTCTATGGGTGATTGTTCATACGATCTGGAACTCACTGATGCTCAACTTGATTATGTTGAAGTTCTTCAACAACAGAAAGATTTCTTTTCAGAAAGTCTTGGTAAGGTTGTTGTCGATTATGATTTTTCCCTTGATAGTGAAGATCCTTCCATCAAGGATGCTGTGAAAATACCCGATGAAATTCCGGAAGATTTCCCTCAGGAAAGTATACCAGCTGAAGTTGTAGCTGATGTTCCACAATCTGTTAGTGATGTCGTCGAAGAGCAAGTCGTGGCTGGAGAGTTGATACCTAGCTGCGAAACTGTCAATGAGAATGTTTGTGTGGAAGTTAAATACCCCACAAGCCTTATCCCTAGATTCCGTCTATCCCGACC
+TBLASTX ds2020-328_388 4 255 NC_004049 Ophiostoma mitovirus 3a, complete genome Ophiostoma mitovirus 3a 50.0 1 100 9.0 1.0261e-20 96.3747 198597 Viruses;Orthornavirae;Lenarviricota;Howeltoviricetes;Cryppavirales;Mitoviridae;Mitovirus;Ophiostoma mitovirus 3a ATAGTACGATAAAACATCTTTCTGAAAACGGATCGGTAAACGATCTGTAGCAGAGGATAAATCAAAGCTGTGGAATTGGTGGTCACCCAACATGCCTAATAACTTTTTATTTAGAAGAGAAATCAAAGGGGCACCTTGATTAAAGGTACCATCCTGTTGAATTCTTCTTAAAATAGAGAAGATATAATCATGAAGGGGCTTTAATATGGATTGTGTTACACAATCAGTAATAGCAAAGGAGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_533 4 236 NC_004049 Ophiostoma mitovirus 3a, complete genome Ophiostoma mitovirus 3a 37.3 1 100 7.0 2.62461e-06 48.2628 198597 Viruses;Orthornavirae;Lenarviricota;Howeltoviricetes;Cryppavirales;Mitoviridae;Mitovirus;Ophiostoma mitovirus 3a GGTCGGGATAGACGAACCCGTCCCCTGGTCGGGATAGACGCCGAGTGTGGATGAACGTCTATCGAGAGTCGATCTCAAACCATTTGCACTTCGTGTACATTCTTTATGACGTTTGTCCGGGAAGAAATTCCTGGTCTTATATCTAAAAGATTGTCACCTCGTGTTAATGAAGTTTGTAGCCGGGGATCCTATTCAGGTTATACCTAATAGACCTCTGAAACATAGTGGCGGCCGTT
+TBLASTX ds2020-328_830 7 211 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 74.4 3 100 21.0 1.2368933870666668e-13 289.1245 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCTTACCTTCCCATGGTGAGGTTAATTACTTTTCTGAGTACTTGAAAGGTAAAGCGATCGATGATGATGATCTATACGTTGATCCTATTTGTTTAGTTTCTATGGATAAGTATAGACATATGATAAAATCCCAACTTACACCAGTTGAAGATAACAGTATGATGTTTGAGAGGCCTCTGGCAGCCGTCTATCCCGGCC
+TBLASTX ds2020-328_62 44 551 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 58.1 2 100 8.0 1.13315e-41 187.709 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A GGTCGGGATAGACGTGAAGATCAGGTATACGCAGCTTTATGGACAGCAGAATCTGTGGGTAGACAGGTAATACACGATAATGTAGGTACAAAACAAACTTACCTAGCTAAAGATACACTACTATCAGGATGGCGCCTAACCACGTTCATGAACAGCGTTCTTAACTATATATACTCTAAAGCCATAAGTCAAAATATGCTTAAAAGAGGAAACAGTCTTCATAATGGAGATGATGTTCTAATAGGGACGAAGAACTTTGAAGCGGTGCGGAGGGGTCTAGAAATGGCTAACAGGCCTATGACCTCTATCCCGACCNNNNNNNNNNTGAATTAGGCGGTCGGGATAGACGACTGTTTGCGCTGGTCGGGATAGACGCAGCTCACCCCTGGTCGGGATAGACGCGACACAGGGGTCTAGAAATGGCTAAGAGGCTAAACGTAAGGGTGCAAAGCACTAAATGTGCCTTTGCTGGAATAGCTGAATTTTTAAGAGTAGACCATAAACGGGGCAGCAAGGGCCAGTATCAACAAGAAACTGCGTCTATCCCGACC
+TBLASTX ds2020-328_631 4 226
+TBLASTX ds2020-328_253 7 287 NC_008037 Prune dwarf virus RNA 2, complete sequence Prune dwarf virus 79.7 3 100 27.0 2.2710920824666668e-33 432.08500000000004 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGTCGGGATAGACGCCCTTGTCGTTGTTGGTTTAGGCTATTTCTAGTCTGAAATCATTATTTGCTAATAAGAAGAAATGCAAGGACTTCTTATTTCCTGGGTTAAGAGATAAAAACTCAGATTTGCCCATGAGTATGGGTGCCCCTTTAAATATACGGGATGTTACCTCTAAAAGAATTAGAGGTAAAAAGAAGATGAAAGAGAATTCTCATGTTCATATAGATGGTAAGGTCGGTGGATGACCATACTATCTATTATTGTATACCTCCATATCGTCTACCCCGACC
+TBLASTX ds2020-328_487 16 241 NC_007540 Penicillium chrysogenum virus segment 2, complete genome Penicillium chrysogenum virus 45.3 1 100 5.0 1.31892e-09 59.2598 158372 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Alphachrysovirus;Penicillium chrysogenum virus GGTCGGGATAGACGATGCCAAGTAATATATCATCAGATGCAATATCGGGTCTAGCAGAAGACCTAAAATGGAGAGTGGAGCCTGGGAGTGTGAGTGAAAGAGAGGTCAACATTGAAGATAGCAGATGGCTAATATTAGCAGCAATGGCACCAAAAGCAAACTTTGACGTAGAACAATTAAAGTTGCTTTGTAAGCACTTTAATGTACCTATAGACATGCGAACGGTGCGTCTATCCCGACC
+TBLASTX ds2020-328_545 10 235
+TBLASTX ds2020-328_491 11 241
+TBLASTX ds2020-328_405 6 252
+TBLASTX ds2020-328_688 2 222 NC_024705 Cladosporium cladosporioides virus 1 segment RNA2 hypothetical protein gene, complete cds Cladosporium cladosporioides virus 1 46.4 1 100 9.0 1.78828e-11 65.2165 1529605 Viruses;Cladosporium cladosporioides virus 1 GGTCGGGATAGACGGCGCGTTCGTATGAAGCAAGAGCAGGATTGCAGTCCGTAAGAGCAATTCTTGAGCCAGCCATAGCGATTCTGCATGCGTGCAGGTACGATCCCGTGTTGCTCGCTTTCGTAGACAAATATGGTAGGAAAATGTACGACATTGCAGCTAGAACAAAACACGTGCTTGTTGCGTTTTCGTACGTCCATTGCAGAGGTTCCCAGCCCCCCT
+TBLASTX ds2020-328_207 36 313 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 48.9 1 100 6.0 6.03013e-30 127.533 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B AACGGCCGCCACTAATCCGTCTTGGTTGATGTAGACTTAAGAAAGTTCTTTGAGCTGGAAGTTCTTGTCAACAGAGTGGATGGACTGGTCAACTGGGAGGAGGAGCACAAGAACAGGGTGTCCCCTAACTTGGCCGAGATGCCGGAGGGATTGGTTTATGAAAGGGCCTCGCAGCTCTTCAGTAGATCGATCTCAGCGGGTAAGAGACCGAGGAAGTTTGATTGGCGGGAGTACTGGCAGAGTAGGTGGCAGTGGAGTGCGGCCGGCAGCATACACTCGCAATATTCAGAAAACGAAAGTAGTGGCGGCCGTT
+TBLASTX ds2020-328_118 104 424
+TBLASTX ds2020-328_170 40 343 NC_038698 Tuber aestivum virus 1 capsid protein and RNA polymerase genes, complete cds Tuber aestivum virus 1 51.4 2 100 7.0 9.9289e-26 133.1825 927810 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Tuber aestivum virus 1 GGTCGGGAAAGACGGTGCGTGTGGGTATTATCTAGGTTGTTCCCAATTGGTGAAGCAGCGACGGACGAGAATGTCAGACCTACGGTACGCTAAGTTCTACGTAACGGGCAGCCATTTTGTTTCGATTATGAAGATTTCAATTCACAGCATAGCAACAGTTCGATGCAAGCGGTACTTGACGCCTATCTCTTGGTTTTTAAAGACTATTTAAGCGAGGAGCAGGTGGAAGCTATGTCATGGTCAGTGAATAGTCTTAATGATGTTAAGATAAAGCAGCCTAATGGCGACTGGTATGAGGCACGAGGGACACTATTATCAGGCTGGAGAGCCGTCTATCCCGACC
+TBLASTX ds2020-328_188 22 325 NC_003823 Ustilago maydis virus H1, complete genome Ustilago maydis virus H1 52.6 1 100 5.0 2.11696e-28 122.467 28882 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Ustilago maydis virus H1 GGTCGGGATAGACGAGGGGTAAAGGTAGATTGGGAAAAAGAACTCGGTAATAAAGCAACGCCACCAGATGAAGTAGTAGGCTATGCAAATGGAGTTTTTAGTAGACATGCTGCTGATGAAATTATCGGTCAGGCTATAAAAGATGTTGTTACCACAGCTTTTCCACACGCAGTACCAGCTAAGTTCAGTGATTTTATGGACGATGCATATGAGTGGTTGGTTTCTGGATCATCAGCTGGTATACCGAGAGCACTTAAGAATTCGTCAATGAGGACTTATATCCTAAAAGACTTGGGTCTACATACCAAGGGCGTCTATCCCGACC
+TBLASTX ds2020-328_716 13 219 NC_017991 Botrytis porri RNA virus 1 RNA 2, complete genome Botrytis porri botybirnavirus 1 67.2 3 100 7.0 5.963458525815334e-08 193.8168 1918014 Viruses;Orthornavirae;Botybirnavirus;Botrytis porri botybirnavirus 1 GGTCGGGATAGACGGCCGTAGCTTCTCTTTTTGGGAATAATTTTTATTGTAAAAATGATTATTTCAGATAATCCCCGTCAGGGTTAGAAGACACGCGGACGGATTGACGAACGTACGTGCAAGAAAGTCACATCTATTGGATTACTCTAAATGGAACCTCGGACACTCACAAACCGCCTTGTCAGGATATCAGCGGCTGCGAATAGACGTGTGGAACTC
+TBLASTX ds2020-328_251 22 288
+TBLASTX ds2020-328_510 16 238
+TBLASTX ds2020-328_98 46 458 NC_033468 Wuhan insect virus 27 strain WHZM10130 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 27 63.2 1 100 9.0 1.2276e-59 226.964 1923731 Viruses;Wuhan insect virus 27 AACGGCCGCCACTCTTGGGTGTCTATGTAGTTAAGCACGCTGTTCATGAACGTAGTGAGTCGCCACCCCGATAACAGGGTCCCCTTAGCGTTGTACTCCATTTTCAAGCCTTGATTGTCGTGTACTATTACCCTATCCAGTGAAAGCCGAGTCCACTCCACAGCTGCTAGTTGCTCCTGAGTCAGGAAGTGTCCGAAAGTATCTCTGTACGCATCTATTACTGCTTTCATAGATTGTACACTGTGTTGACTGTTGAAATCCTCGAAATCTACACAATACTGAGTCCTGCCTTCTAAGACTGACCTTACTCTACTGCGGACGTTCTCATCGTTGGCTGCTTTTCCCACCGGGAACGGCGAGGGCAATACGTCCTCGCAGTTATAGAAGGCGAAATGTGCCAATACGTAACTAGTGACATCTGTCCCGTAGATAGCGCGGAGTTTACGTCTATCCCGACC
+TBLASTX ds2020-328_226 10 300 NC_038699 Xanthophyllomyces dendrorhous virus L1b capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1B 47.3 1 100 6.0 3.23633e-27 118.369 1167691 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1B GGTCGGGATAGACGCTATCGAGATAAATTTATTCTTCAACCTTATATCTGATTTATGTATAAATTGTTCGTCAGTTTTATATTGTGAATGGATACTCCCAGAAGCACTCCACTGCCATCTGTTGGTCCAAAATTTTTCCCAAGACATCACCATAGGAGTTCTCCCGCTAACTGCTGCACTCGCGAAGATTTTAAGTGCTTCATTCTGGATATAATCAGCACTTAGCTTGACTGTTGACGCTTTTGTTCTATGTGTGAACTCAGCTTCCCAATCGAGCGCGCCGTAACGTCTATCCCGACC
+TBLASTX ds2020-328_159 47 348 NC_008039 Prune dwarf virus RNA 1, complete sequence Prune dwarf virus 97.0 3 100 27.0 2.5280226430549335e-55 668.0630000000001 33760 Viruses;Orthornavirae;Kitrinoviricota;Alsuviricetes;Martellivirales;Bromoviridae;Ilarvirus;Prune dwarf virus GGGTCGGGATAGACGGCAGATACCACTCGAACGTGGTTGTTCGTATTTTAAATCAATCATGACTTCTTCCGAGATCACTGCTGCCAATGTCCATGAACTTTTGGTTAAAGTTCTGGAAAAGCAATGCGCTGACGAGACCACTACCGTCGGTAAGGCTTTCTCTGAGAAAGCAAAACAGTCTTTGAATAAGACATTCGGACTAAATGACGAGTCCAAGCAACTGAAGATTTCTTTTGATTTGACGGCTGAACAGCAGGCGTTACTCAAGAGACATTTTCCGGGTCGATCGGTGATTTTTTCAAATTCATCGAGTTCCTCACACAGTTATGCAGCGCGTCTATCCCGACC
+TBLASTX ds2020-328_166 24 346 NC_005980 Helminthosporium victoriae 145S virus Helminthosporium victoriae 145S virus 26.8 1 100 8.0 1.12841e-07 53.7613 164750 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Chrysoviridae;Chrysovirus;Helminthosporium victoriae 145S virus GGGTCGGGATAGACGTTAACTGCCCATACCAACCATGTTTGCTAGCCTTGCAACGTCAGCTATTTCCTGCCAAGTGTCGACAGCTGCCTCATCTCGCAGCCTATTGTATATCACTGCCTCATCTGCGGTTGTGCAATAACCACGTATACGTAAGTTCTGCACTAATGCATGTATTCCACAAGTACCATCTCCTTTTGTGTTAACTTCTGTCACTATTATTTTGTCCTCCTCTACTGGCATTGGCTCATCTTTGACCAACTTTGACTCTGTGCCTTTGTCTTTCAGTTCATATGAACTACCTAGCATTTCCTCACCATTTACGCCTTTGACATAAACTGGCGATGGT
+TBLASTX ds2020-328_97 31 461 NC_020903 Xanthophyllomyces dendrorhous virus L1A capsid protein (CP) and RNA-dependent RNA polymerase (RdRp) genes, complete cds Xanthophyllomyces dendrorhous virus L1A 52.1 2 100 14.0 1.888695e-05 241.7778 1167690 Viruses;Orthornavirae;Duplornaviricota;Chrymotiviricetes;Ghabrivirales;Totiviridae;Totivirus;Xanthophyllomyces dendrorhous virus L1A AACGGCCGCCACTAAATTGTCCCCTTAGATCCGCGCTTGTGATCCACTCGTAGGAACTCCGCTATAGCTCCGTACGCGCACTTGCTCATTTGTAGTCGTATATTGTGCTTCTTCGCGTTTCGGCCGGCTAGTAACACGTCCCCGAGCGAGTTACTGCCCAGCAGCACGTCGTCGCCGTTATGAAGACTGTTTTGTGACTTCACGACATCTGGCACTATTAATTGAGTGTAAATGTAGTTCAGGACGCTATTCATGAATGTGGTGAGCCTCCACCCCGACAGTAAAGTTCCTTTAGCACTATACTCCATCTTCAAGCCTTGGTTGTCATGTACTATCACTCTGTTCAGCGACAGTCGAGTCCATTCCACCGCCGCCAGCTGCTCTTGCGTTAGGAAGGGCCTGAAGGTGTCTCTGTACGCATCTATCACTGTTTTCATTGACTGTACACTATGTTGACTGTT
+TBLASTX ds2020-328_750 10 216
+TBLASTX ds2020-328_92 33 472 NC_033465 Wuhan insect virus 26 strain WHZM10161 hypothetical protein 1 and hypothetical protein 2 genes, complete cds Wuhan insect virus 26 38.6 1 100 10.0 6.24209e-27 118.369 1923730 Viruses;Wuhan insect virus 26 CGTCATTGAGGAACAAATACTACTCGAGACAATGCGAGCGATTGCACATGACAGTTTCGGACTGTTATAAAATAAAGACCTCCCACAGGTGTGTGGGGGGCATAAGTGAAGACAAGAGATCGGACGTAAAGTGGATGATACGGTCGTCGGGCTTCAGGAAGGGTGCCACGCAGATAGGCGTGTTACCGGGAGTGGTGGACTACTCCAGGATGGTGAAAGCATCACTACAACTTGAAAGACCTTTGCAGGATTTCATTTCACGAATAATGCGCGCAACATACGACGCGGTGATACCAAAAGAAAGGAACATAAACGTTTCAAGGAATGGTAACATCAAGCGGTACGAGATTTTGCGAGCGTTATTCAAGGTACACAAAGAAGAAACAGACATAGTCAATTACGGAAAAGCCAAAATGACCGGCTTCCTGATGGACGTGTTGAATGGGACCAATTATTCATAGTGGCGGCCGTT
+TBLASTX ds2020-328_825 7 211
+TBLASTX ds2020-328_896 2 208 NC_033476 Botryosphaeria dothidea virus 1 strain YZN115 RNA-dependent RNA polymerase (RdRp) gene, complete cds Botryosphaeria dothidea virus 1 41.8 1 100 7.0 8.29721e-08 52.8449 1516075 Viruses;Orthornavirae;Pisuviricota;Duplopiviricetes;Durnavirales;Partitiviridae;Botryosphaeria dothidea virus 1 GGTCGGGATAGACGGGGGGCCTTCTTTCACTCCACACCCCCCATGCACAGGCAACAAAGAAAAAGATGAGACTGGGAACATCGACGACCATCGGTGGAACTCTTTTCGGAGGTCCACTTACCCCGGCGGCGGCTTGGGCCCACGACCAGACAAGGTCTACCTGGGCAAAGTACCTCAAAGAAACGGACGCCAGTCGTCTATCCCGACC
diff -r 000000000000 -r b82ce29791e7 test-data/rps_test.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/rps_test.tab Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,26 @@
+#query_id query_length cdd_id hit_id evalue startQ endQ frame description superkingdom
+ds2020-267_120 339 pfam01333 gnl|CDD|366578 0.000848733 197 325 -3 pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034. cellular organisms(1);Eukaryota(1);Viridiplantae(1);Streptophyta(1)
+ds2020-267_374 242 pfam00124 gnl|CDD|365890 5.09126e-07 21 125 3 pfam00124, Photo_RC, Photosynthetic reaction centre protein. cellular organisms(1);Eukaryota(1);Viridiplantae(1);Streptophyta(1)
+ds2020-267_471 230 pfam00201 gnl|CDD|278624 3.12575e-07 46 210 1 pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase. cellular organisms(1);Eukaryota(1);Viridiplantae(1);Streptophytina(1)
+ds2020-267_710 213 pfam01127 gnl|CDD|366480 0.000723904 46 210 1 pfam01127, Sdh_cyt, Succinate dehydrogenase/Fumarate reductase transmembrane subunit. This family includes a transmembrane protein from both the Succinate dehydrogenase and Fumarate reductase complexes. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_692 214 pfam00680 gnl|CDD|366242 4.79875e-05 70 180 1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(1);Riboviria(1);Orthornavirae(1);Pisuviricota(1)
+ds2020-267_817 208 pfam05656 gnl|CDD|377540 3.45664e-06 86 190 -1 pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_98 379 pfam16203 gnl|CDD|374428 1.33948e-30 131 280 -1 pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases. cellular organisms(2);Bacteria(1);Terrabacteria group(1)
+ds2020-267_261 260 pfam01051 gnl|CDD|376444 1.77523e-19 26 217 -2 pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene. cellular organisms(1);Bacteria(1);Pseudomonadota(1);Gammaproteobacteria(1)
+ds2020-267_773 210 pfam01641 gnl|CDD|376583 5.23903e-34 16 174 1 pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_287 256 pfam00115 gnl|CDD|376293 2.8946e-26 13 237 1 pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I. cellular organisms(1);Eukaryota(1);Opisthokonta(1);Metazoa(1)
+ds2020-267_139 320 pfam05860 gnl|CDD|368641 1.34887e-13 167 298 2 pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_763 211 pfam00557 gnl|CDD|376349 0.000231782 167 298 2 pfam00557, Peptidase_M24, Metallopeptidase family M24. This family contains metallopeptidases. It also contains non-peptidase homologs such as the N terminal domain of Spt16 which is a histone H3-H4 binding module. cellular organisms(2);Bacteria(2)
+ds2020-267_571 221 pfam00501 gnl|CDD|366135 2.61467e-07 34 201 1 pfam00501, AMP-binding, AMP-binding enzyme. Bacteria(2);cellular organisms(1);Terrabacteria group(1)
+ds2020-267_565 222 pfam03950 gnl|CDD|377172 9.52435e-10 53 184 -3 pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln). cellular organisms(2);Bacteria(1);Eukaryota(1)
+ds2020-267_427 235 pfam03154 gnl|CDD|367360 0.000552392 53 184 -3 pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity. Eukaryota(1);cellular organisms(1);Opisthokonta(1);Metazoa(1)
+ds2020-267_4 2297 pfam00680 gnl|CDD|366242 4.43825e-05 995 1510 -2 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(1);Riboviria(1);Orthornavirae(1);Pisuviricota(1)
+ds2020-267_16 1165 pfam00680 gnl|CDD|366242 8.1737e-06 707 1042 -1 pfam00680, RdRP_1, RNA dependent RNA polymerase. Viruses(1);Riboviria(1);Orthornavirae(1);Pisuviricota(1)
+ds2020-267_438 234 pfam00078 gnl|CDD|365856 0.000870142 707 1042 -1 pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses. Viruses(1);Riboviria(1);Pararnavirae(1);Artverviricota(1)
+ds2020-267_370 242 pfam00146 gnl|CDD|376297 2.41391e-10 22 111 1 pfam00146, NADHdh, NADH dehydrogenase. cellular organisms(1);Eukaryota(1);Opisthokonta(1);Metazoa(1)
+ds2020-267_278 258 pfam00012 gnl|CDD|365808 4.1355e-19 50 232 2 pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region. cellular organisms(2);Eukaryota(1);Bacteria(1)
+ds2020-267_364 243 pfam00216 gnl|CDD|365952 1.5507e-10 134 241 -3 pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_558 222 pfam03737 gnl|CDD|377116 4.93695e-13 57 179 -2 pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions. Bacteria(2);cellular organisms(1);Pseudomonadota(1)
+ds2020-267_218 274 pfam01348 gnl|CDD|279664 1.66328e-05 51 257 3 pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X. cellular organisms(1);Eukaryota(1);Viridiplantae(1);Streptophyta(1)
+ds2020-267_363 243 pfam00416 gnl|CDD|366086 2.02528e-05 15 134 -2 pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes. cellular organisms(2);Bacteria(2)
+ds2020-267_746 211 pfam01490 gnl|CDD|279788 0.000177299 15 134 -2 pfam01490, Aa_trans, Transmembrane amino acid transporter protein. This transmembrane region is found in many amino acid transporters including UNC-47 and MTR. UNC-47 encodes a vesicular amino butyric acid (GABA) transporter, (VGAT). UNC-47 is predicted to have 10 transmembrane domains. MTR is a N system amino acid transporter system protein involved in methyltryptophan resistance. Other members of this family include proline transporters and amino acid permeases. cellular organisms(1);Eukaryota(1);Opisthokonta(1);Metazoa(1)
diff -r 000000000000 -r b82ce29791e7 test-data/rps_test.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/rps_test.xml Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,5021 @@
+
+
+
+ rpstblastn
+ RPSTBLASTN 2.10.1+
+ Stephen F. Altschul, Thomas L. Madden, Alejandro A. Schäffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), "Gapped BLAST and PSI-BLAST: a new generation of protein database search programs", Nucleic Acids Res. 25:3389-3402.
+ /home/tcandresse/work/pfam/Pfam
+ ds2020-267_269
+ No definition line
+ 259
+
+
+ BLOSUM62
+ 0.001
+ 11
+ 1
+ F
+
+
+
+
+ 1
+ ds2020-267_269
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.050055168
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 2
+ ds2020-267_1242
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 3
+ ds2020-267_333
+ No definition line
+ 248
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 4
+ ds2020-267_1111
+ No definition line
+ 70
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 5
+ ds2020-267_560
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 6
+ ds2020-267_120
+ No definition line
+ 339
+
+
+ 1
+ gnl|CDD|374695
+ pfam16639, Apocytochr_F_N, Apocytochrome F, N-terminal. This is the N-terminal domain of cytochrome f. It is a soluble lumen-side domain.
+ 374695
+ 154
+
+
+ 1
+ 91.1926
+ 227
+ 2.20279e-25
+ 197
+ 325
+ 112
+ 154
+ -3
+ 0
+ 30
+ 37
+ 0
+ 43
+ MVIGPVPGQKYSEITFPILSPDPATKKDVHFLKYPIYVGGNRG
+ LIVGPLPGDQYQEIVFPVLSPDPATDKSVHFGKYPVYVGGNRG
+ +++GP+PG +Y EI FP+LSPDPAT K VHF KYP+YVGGNRG
+
+
+
+
+ 2
+ gnl|CDD|366578
+ pfam01333, Apocytochr_F_C, Apocytochrome F, C-terminal. This is a sub-family of cytochrome C. See pfam00034.
+ 366578
+ 115
+
+
+ 1
+ 34.0526
+ 79
+ 0.000848733
+ 116
+ 163
+ 1
+ 16
+ -3
+ 0
+ 10
+ 13
+ 0
+ 16
+ NNNVYNATAAGIVSKI
+ NNNVFTASAAGTISAI
+ NNNV+ A+AAG +S I
+
+
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 75261094
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 7
+ ds2020-267_374
+ No definition line
+ 242
+
+
+ 1
+ gnl|CDD|365890
+ pfam00124, Photo_RC, Photosynthetic reaction centre protein.
+ 365890
+ 260
+
+
+ 1
+ 42.9994
+ 102
+ 5.09126e-07
+ 21
+ 125
+ 91
+ 125
+ 3
+ 0
+ 12
+ 19
+ 0
+ 35
+ SVQLRPYNAIAFSGPIAVFVSVFLIYPLGQSGWFF
+ KLGMGPHVAWAFSAAIAAYLSLGLIRPILMGSWSE
+ + + P+ A AFS IA ++S+ LI P+ W
+
+
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 8
+ ds2020-267_470
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 9
+ ds2020-267_609
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 10
+ ds2020-267_128
+ No definition line
+ 332
+
+
+
+
+ 17919
+ 3004588
+ 68
+ 75016032
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 11
+ ds2020-267_870
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 12
+ ds2020-267_1236
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 13
+ ds2020-267_651
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 14
+ ds2020-267_648
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 15
+ ds2020-267_847
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 16
+ ds2020-267_978
+ No definition line
+ 121
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 17
+ ds2020-267_973
+ No definition line
+ 123
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 18
+ ds2020-267_456
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 19
+ ds2020-267_272
+ No definition line
+ 259
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 20
+ ds2020-267_1065
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 21
+ ds2020-267_888
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 22
+ ds2020-267_866
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 23
+ ds2020-267_1034
+ No definition line
+ 76
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 24
+ ds2020-267_393
+ No definition line
+ 240
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 25
+ ds2020-267_1084
+ No definition line
+ 72
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 26
+ ds2020-267_489
+ No definition line
+ 228
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 27
+ ds2020-267_471
+ No definition line
+ 230
+
+
+ 1
+ gnl|CDD|278624
+ pfam00201, UDPGT, UDP-glucoronosyl and UDP-glucosyl transferase.
+ 278624
+ 499
+
+
+ 1
+ 43.5512
+ 103
+ 3.12575e-07
+ 46
+ 210
+ 353
+ 401
+ 1
+ 0
+ 14
+ 23
+ 10
+ 57
+ IL*ALTAGVPMICSPFFADQRTNCYYTCNEWGSGMEIDNTFGRAD--SMQSAEVLTA
+ VYEAICHGVPMVGMPLFGDQMDNAKHMEAKGA--------AVTLNVLTMTSEDLLNA
+ + A+ GVPM+ P F DQ N + + + +M S ++L A
+
+
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 28
+ ds2020-267_367
+ No definition line
+ 243
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 29
+ ds2020-267_535
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 30
+ ds2020-267_1201
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 31
+ ds2020-267_710
+ No definition line
+ 213
+
+
+ 1
+ gnl|CDD|366480
+ pfam01127, Sdh_cyt, Succinate dehydrogenase/Fumarate reductase transmembrane subunit. This family includes a transmembrane protein from both the Succinate dehydrogenase and Fumarate reductase complexes.
+ 366480
+ 122
+
+
+ 1
+ 33.1145
+ 76
+ 0.000723904
+ 13
+ 126
+ 8
+ 45
+ 1
+ 0
+ 13
+ 19
+ 0
+ 38
+ NSDLLIYKPQLTSTFPISHRISGAFLVTIVLFFYLLCL
+ SPHLGLYRAHLGTWLSILHRITGVALFVLGLIHLLLWL
+ + L +Y+ L + I HRI+G L + L LL L
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 32
+ ds2020-267_904
+ No definition line
+ 142
+
+
+
+
+ 17919
+ 3004588
+ 19
+ 74595556
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 33
+ ds2020-267_692
+ No definition line
+ 214
+
+
+ 1
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 37.3361
+ 87
+ 4.79875e-05
+ 70
+ 180
+ 82
+ 115
+ 1
+ 0
+ 16
+ 21
+ 3
+ 37
+ FTFEDATLDEAINGVEDLDYFDSLVIGTSEGYPYVLE
+ ADLGDLSVSEAINGA---EGFDALNKDTSPGLPYILE
+ D ++ EAING + FD+L TS G PY+LE
+
+
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 34
+ ds2020-267_1114
+ No definition line
+ 69
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 35
+ ds2020-267_813
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 36
+ ds2020-267_390
+ No definition line
+ 241
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 37
+ ds2020-267_217
+ No definition line
+ 275
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 38
+ ds2020-267_654
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 39
+ ds2020-267_956
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 40
+ ds2020-267_1228
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 41
+ ds2020-267_608
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 42
+ ds2020-267_412
+ No definition line
+ 238
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 43
+ ds2020-267_211
+ No definition line
+ 276
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 44
+ ds2020-267_419
+ No definition line
+ 236
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 45
+ ds2020-267_606
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 46
+ ds2020-267_817
+ No definition line
+ 208
+
+
+ 1
+ gnl|CDD|377540
+ pfam05656, DUF805, Protein of unknown function (DUF805). This family consists of several bacterial proteins of unknown function.
+ 377540
+ 108
+
+
+ 1
+ 39.1746
+ 92
+ 3.45664e-06
+ 86
+ 190
+ 72
+ 106
+ -1
+ 0
+ 15
+ 19
+ 0
+ 35
+ TGWLSLRMQIPALDLIFMIYLFAAKGTEGNNDYGP
+ SGWWLLLGLIPIIGLIVLLVLLCLPGTPGPNRYGP
+ +GW L IP + LI ++ L GT G N YGP
+
+
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 47
+ ds2020-267_1207
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 48
+ ds2020-267_98
+ No definition line
+ 379
+
+
+ 1
+ gnl|CDD|374428
+ pfam16203, ERCC3_RAD25_C, ERCC3/RAD25/XPB C-terminal helicase. This is the C-terminal helicase domain of ERCC3, RAD25 and XPB helicases.
+ 374428
+ 247
+
+
+ 1
+ 107.677
+ 270
+ 1.33948e-30
+ 131
+ 280
+ 108
+ 157
+ -1
+ 0
+ 39
+ 42
+ 0
+ 50
+ NMAFLSKVGDNSIDILEANVIIQISSHAGSRRQEAQRLGRILRAKGKLQD
+ NTIFLSKVGDTSIDLPEANVLIQISSHFGSRRQEAQRLGRILRAKRRSND
+ N FLSKVGD SID+ EANV+IQISSH GSRRQEAQRLGRILRAK + D
+
+
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 82137200
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 78
+ ds2020-267_1141
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 79
+ ds2020-267_212
+ No definition line
+ 276
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 80
+ ds2020-267_261
+ No definition line
+ 260
+
+
+ 1
+ gnl|CDD|376444
+ pfam01051, Rep_3, Initiator Replication protein. This protein is an initiator of plasmid replication. RepB possesses nicking-closing (topoisomerase I) like activity. It is also able to perform a strand transfer reaction on ssDNA that contains its target. This family also includes RepA which is an E.coli protein involved in plasmid replication. The RepA protein binds to DNA repeats that flank the repA gene.
+ 376444
+ 221
+
+
+ 1
+ 76.5582
+ 189
+ 1.77523e-19
+ 26
+ 217
+ 94
+ 157
+ -2
+ 0
+ 28
+ 42
+ 0
+ 64
+ RWVDKIGYIDDLGCVELVFASDVIPLITRLEQRFTEYDIDQVSNLQSKYAVRLYELLVQWRSTG
+ LWVGYIISAKGEGKVEIEFSPDLKPYLLELKKNFTKYELKEFLKLKSKYSIRLYELLKQYRSTG
+ WV I G VE+ F+ D+ P + L++ FT+Y++ + L+SKY++RLYELL Q+RSTG
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 81
+ ds2020-267_689
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 82
+ ds2020-267_892
+ No definition line
+ 181
+
+
+
+
+ 17919
+ 3004588
+ 30
+ 74010540
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 83
+ ds2020-267_1243
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 84
+ ds2020-267_521
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 85
+ ds2020-267_773
+ No definition line
+ 210
+
+
+ 1
+ gnl|CDD|376583
+ pfam01641, SelR, SelR domain. Methionine sulfoxide reduction is an important process, by which cells regulate biological processes and cope with oxidative stress. MsrA, a protein involved in the reduction of methionine sulfoxides in proteins, has been known for four decades and has been extensively characterized with respect to structure and function. However, recent studies revealed that MsrA is only specific for methionine-S-sulfoxides. Because oxidized methionines occur in a mixture of R and S isomers in vivo, it was unclear how stereo-specific MsrA could be responsible for the reduction of all protein methionine sulfoxides. It appears that a second methionine sulfoxide reductase, SelR, evolved that is specific for methionine-R-sulfoxides, the activity that is different but complementary to that of MsrA. Thus, these proteins, working together, could reduce both stereoisomers of methionine sulfoxide. This domain is found both in SelR proteins and fused with the peptide methionine sulfoxide reductase enzymatic domain pfam01625. The domain has two conserved cysteine and histidines. The domain binds both selenium and zinc. The final cysteine is found to be replaced by the rare amino acid selenocysteine in some members of the family. This family has methionine-R-sulfoxide reductase activity.
+ 376583
+ 120
+
+
+ 1
+ 110.138
+ 277
+ 5.23903e-34
+ 16
+ 174
+ 6
+ 58
+ 1
+ 0
+ 32
+ 36
+ 0
+ 53
+ LTDVQYYVTQQNGTERPFSHEYDHQFEPGIYVDIVSGEPLFSSSDKYDSGCGW
+ LTPEQYRVLREKGTERPFTGEYWDNKEPGIYVCAGCGTPLFSSDTKFDSGCGW
+ LT QY V ++ GTERPF+ EY EPGIYV G PLFSS K+DSGCGW
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 86
+ ds2020-267_619
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 87
+ ds2020-267_675
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 88
+ ds2020-267_974
+ No definition line
+ 122
+
+
+
+
+ 17919
+ 3004588
+ 13
+ 74834307
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 89
+ ds2020-267_912
+ No definition line
+ 135
+
+
+
+
+ 17919
+ 3004588
+ 17
+ 75599020
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 90
+ ds2020-267_1054
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 91
+ ds2020-267_287
+ No definition line
+ 256
+
+
+ 1
+ gnl|CDD|376293
+ pfam00115, COX1, Cytochrome C and Quinol oxidase polypeptide I.
+ 376293
+ 433
+
+
+ 1
+ 97.2464
+ 243
+ 2.8946e-26
+ 13
+ 237
+ 326
+ 400
+ 1
+ 0
+ 47
+ 57
+ 0
+ 75
+ NTPGLDIALHDTYYVVAHFHYVLSMGAVFALFAGFHYWVGKIFGRIYPETLGQIHFWITFFGVNLTFFPMHFLGL
+ ALPPVNYYVHDTYFVVAHFHYVLFGGVVFALFAGIYYWFPKLTGRMYSERLGKLHFWLLFIGFNLTFFPMHILGL
+ P ++ +HDTY+VVAHFHYVL G VFALFAG +YW K+ GR+Y E LG++HFW+ F G NLTFFPMH LGL
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 92
+ ds2020-267_139
+ No definition line
+ 320
+
+
+ 1
+ gnl|CDD|368641
+ pfam05860, Haemagg_act, haemagglutination activity domain. This domain is suggested to be a carbohydrate- dependent haemagglutination activity site. It is found in a range of haemagglutinins and haemolysins.
+ 368641
+ 118
+
+
+ 1
+ 59.967
+ 146
+ 1.34887e-13
+ 167
+ 298
+ 56
+ 99
+ 2
+ 0
+ 20
+ 26
+ 0
+ 44
+ GEAKIILGQVNSTSPSQLAGYTEIAGGKAELVIANPAGITCSGG
+ GAASNILNRVTGGNPSQIQGYIEVAGANANVFLANPNGIIFGGN
+ G A IL +V +PSQ+ GY E+AG A + +ANP GI G
+
+
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 75433973
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 93
+ ds2020-267_763
+ No definition line
+ 211
+
+
+ 1
+ gnl|CDD|376349
+ pfam00557, Peptidase_M24, Metallopeptidase family M24. This family contains metallopeptidases. It also contains non-peptidase homologs such as the N terminal domain of Spt16 which is a histone H3-H4 binding module.
+ 376349
+ 206
+
+
+ 1
+ 34.896
+ 81
+ 0.000231782
+ 15
+ 74
+ 76
+ 95
+ -3
+ 0
+ 12
+ 14
+ 0
+ 20
+ FLIDAGASFHGYASDITRIY
+ VLIDVGAEYDGYCSDITRTF
+ LID GA + GY SDITR +
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 94
+ ds2020-267_624
+ No definition line
+ 217
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 95
+ ds2020-267_70
+ No definition line
+ 445
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 109640103
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 96
+ ds2020-267_1209
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 97
+ ds2020-267_196
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 98
+ ds2020-267_1102
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 99
+ ds2020-267_346
+ No definition line
+ 246
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 100
+ ds2020-267_612
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 101
+ ds2020-267_607
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.04777374
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 102
+ ds2020-267_571
+ No definition line
+ 221
+
+
+ 1
+ gnl|CDD|366135
+ pfam00501, AMP-binding, AMP-binding enzyme.
+ 366135
+ 361
+
+
+ 1
+ 43.7436
+ 104
+ 2.61467e-07
+ 34
+ 201
+ 1
+ 56
+ 1
+ 0
+ 17
+ 29
+ 0
+ 56
+ LERSATVYGDCPSLIYNDTTYTWTQTHRRCIRVASSISSLVIKSRHVVSVLSPNTP
+ LERQAARTPDKTALVGEGRRLTYRELDERANRLAAGLRALGVKKGDRVAILLPNSP
+ LER A D +L+ T+ + R R+A+ + +L +K V++L PN+P
+
+
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 103
+ ds2020-267_592
+ No definition line
+ 219
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 104
+ ds2020-267_764
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 105
+ ds2020-267_1015
+ No definition line
+ 85
+
+
+
+
+ 17919
+ 3004588
+ 3
+ 73770775
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 106
+ ds2020-267_1151
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 107
+ ds2020-267_69
+ No definition line
+ 451
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 112818077
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 108
+ ds2020-267_167
+ No definition line
+ 298
+
+
+
+
+ 17919
+ 3004588
+ 60
+ 75248472
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 109
+ ds2020-267_23
+ No definition line
+ 835
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 285924289
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 110
+ ds2020-267_872
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 111
+ ds2020-267_578
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 112
+ ds2020-267_611
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 113
+ ds2020-267_565
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|377172
+ pfam03950, tRNA-synt_1c_C, tRNA synthetases class I (E and Q), anti-codon binding domain. Other tRNA synthetase sub-families are too dissimilar to be included. This family includes only glutamyl and glutaminyl tRNA synthetases. In some organisms, a single glutamyl-tRNA synthetase aminoacylates both tRNA(Glu) and tRNA(Gln).
+ 377172
+ 174
+
+
+ 1
+ 49.5699
+ 119
+ 9.52435e-10
+ 53
+ 184
+ 63
+ 108
+ -3
+ 0
+ 16
+ 27
+ 2
+ 46
+ EIRLRNSYVLKIEEHITDDNGEVVGLTATIDPKTLGNN--PEGLVH
+ EVRLMDAYNIKVTEVVKDEDGNVTELHCTYDGDDLGGARKVKGIIH
+ E+RL ++Y +K+ E + D++G V L T D LG +G++H
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 114
+ ds2020-267_468
+ No definition line
+ 230
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 115
+ ds2020-267_202
+ No definition line
+ 281
+
+
+
+
+ 17919
+ 3004588
+ 56
+ 74041588
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 116
+ ds2020-267_826
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 117
+ ds2020-267_503
+ No definition line
+ 226
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 118
+ ds2020-267_197
+ No definition line
+ 283
+
+
+
+
+ 17919
+ 3004588
+ 57
+ 73378585
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 119
+ ds2020-267_307
+ No definition line
+ 253
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 120
+ ds2020-267_427
+ No definition line
+ 235
+
+
+ 1
+ gnl|CDD|367360
+ pfam03154, Atrophin-1, Atrophin-1 family. Atrophin-1 is the protein product of the dentatorubral-pallidoluysian atrophy (DRPLA) gene. DRPLA OMIM:125370 is a progressive neurodegenerative disorder. It is caused by the expansion of a CAG repeat in the DRPLA gene on chromosome 12p. This results in an extended polyglutamine region in atrophin-1, that is thought to confer toxicity to the protein, possibly through altering its interactions with other proteins. The expansion of a CAG repeat is also the underlying defect in six other neurodegenerative disorders, including Huntington's disease. One interaction of expanded polyglutamine repeats that is thought to be pathogenic is that with the short glutamine repeat in the transcriptional coactivator CREB binding protein, CBP. This interaction draws CBP away from its usual nuclear location to the expanded polyglutamine repeat protein aggregates that are characteristic of the polyglutamine neurodegenerative disorders. This interferes with CBP-mediated transcription and causes cytotoxicity.
+ 367360
+ 980
+
+
+ 1
+ 34.611
+ 79
+ 0.000552392
+ 40
+ 213
+ 578
+ 636
+ -2
+ 0
+ 19
+ 37
+ 1
+ 59
+ KEMEEGKHKSRKEGESK-RSHRDRQREKERNGERHRDKDKDKDKRDRDSRRSEREKSSD
+ KKREEALEKAKREAEQKAREEREREKEREKEREREREREREAERAAKASSSSHEGRMSD
+ K+ EE K+++E E K R R+R++E+E+ ER R+++++ ++ + S S + SD
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 121
+ ds2020-267_738
+ No definition line
+ 212
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 122
+ ds2020-267_1160
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 123
+ ds2020-267_1066
+ No definition line
+ 74
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 124
+ ds2020-267_7
+ No definition line
+ 1772
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 685605541
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 125
+ ds2020-267_786
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 126
+ ds2020-267_44
+ No definition line
+ 545
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 155314900
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 127
+ ds2020-267_475
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 128
+ ds2020-267_928
+ No definition line
+ 130
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 129
+ ds2020-267_752
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 130
+ ds2020-267_988
+ No definition line
+ 116
+
+
+
+
+ 17919
+ 3004588
+ 11
+ 75801933
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 131
+ ds2020-267_265
+ No definition line
+ 260
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 132
+ ds2020-267_1219
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 133
+ ds2020-267_115
+ No definition line
+ 345
+
+
+
+
+ 17919
+ 3004588
+ 72
+ 73720060
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 134
+ ds2020-267_559
+ No definition line
+ 222
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 135
+ ds2020-267_51
+ No definition line
+ 500
+
+
+
+
+ 17919
+ 3004588
+ 80
+ 135111848
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 136
+ ds2020-267_1185
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.061499328
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 137
+ ds2020-267_520
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 138
+ ds2020-267_1137
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 139
+ ds2020-267_1191
+ No definition line
+ 61
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 140
+ ds2020-267_548
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 141
+ ds2020-267_4
+ No definition line
+ 2297
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 187.283
+ 476
+ 1.96254e-52
+ 824
+ 1858
+ 121
+ 464
+ -2
+ 0
+ 94
+ 136
+ 19
+ 354
+ VRKSRLVNWEEEHKNRVSPNLAEMPEGLVYERASQLFSRSISAGKRPR-KFD-WREYWQSRWQWSAAGSIHSQYSEDDKYIFKDIYLKNKFISILAMPDMNMDSWRER----DPELHAWSSTKYEWSKLRAIYGTDVTSYVLAHFAFYNCEDVLPSPFPVGKAANDEN--VRSRVRSVLEGRTQYCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLDRVIVHDNQGLKMEYNAKGTLLSGWRLTTFMNSVLNYIYTQLIVPDVVQSQNSLHNGDDVLLGSNSLEDVLLAGKNAKKHNIRLQMSK-CAYGAIAEFLRVDHKRGSKGQYLSRAMATLVHSR
+ GRGVTNVDWEEEAKNRVDLAVVCRLVLLPMEELRAHIDAVLDELVVRRGLCDPIRLFVKNEPLWCVNGHPDHKLRE---GRLRLLSSVSLVDQLVRR--MLFEPQNNNEIAWWGSVPSKPSMKLEHGKSRAIYACDTRSYLAFEYLLAPVEKAWANKSVILNPGEGDISGFDWSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFERLR----RRLPDEPAEAADWLVCSMDSMYQLSD-GTLLAQRVPGTLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ R V+WEEE KNRV + L E + R D R + ++ W G + E + + + ++ M + + + S K E K RAIY D SY+ + E + + + V+ G +D++DFNSQHS +SM+AV + R L E A +W S+D + + G + GTL SG R TTF+NSVLN Y +L S+H GDDVL G + D + ++ SK IAEFLRV YL+RA+A+LV
+
+
+
+
+ 2
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 44.6549
+ 106
+ 4.43825e-05
+ 995
+ 1510
+ 166
+ 342
+ -2
+ 0
+ 44
+ 65
+ 31
+ 190
+ KYEWSKLRAIYGTDVTSYVLAHFAFYNCEDVLPSPFPVGKAANDENVRSRVRSVLEGRTQ-----YCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLDRVIVHDNQGLKMEYNAK-----GTLLSGWRLTTFMNSVLNYIYTQLIVPD-VVQSQNSLH-------NGDDVLLGSN
+ KVQAGKTRLFWGCPVEVNLVARAVFGPFCNKIYSNALKLGIAVGINPFSRDWERLGALIRKGSDVLDVDYSAFDSTLSPFVFDLVEDIRSEFCGGL---------EPTRLALLELLSNP----IHILGGTIIKVEGGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVN
+ K + K R +G V ++A F + + S A N SR L + VD+ F+S S V D + G E TRL+L ++ + G L SG T+ +NS+LN IY + +S+ H GDD L+ N
+
+
+
+
+
+
+ 17919
+ 3004588
+ 93
+ 899217312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 142
+ ds2020-267_573
+ No definition line
+ 221
+
+
+
+
+ 17919
+ 3004588
+ 40
+ 75498324
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 143
+ ds2020-267_16
+ No definition line
+ 1165
+
+
+ 1
+ gnl|CDD|280316
+ pfam02123, RdRP_4, Viral RNA-directed RNA-polymerase. This family includes RNA-dependent RNA polymerase proteins (RdRPs) from Luteovirus, Totivirus and Rotavirus.
+ 280316
+ 465
+
+
+ 1
+ 141.829
+ 358
+ 1.58664e-38
+ 536
+ 1078
+ 288
+ 464
+ -1
+ 0
+ 62
+ 85
+ 6
+ 182
+ SRVRAVLEGRTQYCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLNRVIVHDNQGLKMEYSAKGTLLSGWRLTTFMNSVLNYIYTQLIVPDVVKSQNSLHNGDDVLLGSNSLGDVLLAGRNAKKHNIRLQMSK-CAYGAIAEFLRVDHKRGSKGQYLSRAMATLVHSR
+ WSVQDWKRGGVSLMLDYDDFNSQHSTESMRAVFERLR----RRLPDEPAEAADWLVCSMDSMYQLSD-GTLLAQRVPGTLKSGHRATTFINSVLNCAYAELAGAPWADVPTSIHMGDDVLEGLRTPADATSLLDKYARLGFKVNPSKQSVGHTIAEFLRVAFCSHEVRGYLARAIASLVSGN
+ V+ G +D++DFNSQHS +SM+AV + R L E A +W S++ + + G + GTL SG R TTF+NSVLN Y +L S+H GDDVL G + D + ++ SK IAEFLRV YL+RA+A+LV
+
+
+
+
+ 2
+ gnl|CDD|366242
+ pfam00680, RdRP_1, RNA dependent RNA polymerase.
+ 366242
+ 470
+
+
+ 1
+ 45.4253
+ 108
+ 8.1737e-06
+ 707
+ 1042
+ 231
+ 342
+ -1
+ 0
+ 30
+ 45
+ 16
+ 120
+ YCVDFEDFNSQHSVQSMKAVIDAYRDTFGHFLTQEQLAAVEWTRLSLNRVIVHDNQGLKMEYSAKGTLLSGWRLTTFMNSVLNYIYTQLIVPD-VVKSQNSLH-------NGDDVLLGSN
+ LDVDYSAFDSTLSPFVFDLVEDIRS----EFCGGLEPTRLALLELLSNPIHILGGTIIKVE----GGLPSGQPATSVINSILNNIYVLYALIKHTGESELDDHETIRFISYGDDNLVAVN
+ VD+ F+S S V D F + + L N + + +K+E G L SG T+ +NS+LN IY + +S+ H GDD L+ N
+
+
+
+
+
+
+ 17919
+ 3004588
+ 88
+ 428314800
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 144
+ ds2020-267_753
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 145
+ ds2020-267_438
+ No definition line
+ 234
+
+
+ 1
+ gnl|CDD|365856
+ pfam00078, RVT_1, Reverse transcriptase (RNA-dependent DNA polymerase). A reverse transcriptase gene is usually indicative of a mobile element such as a retrotransposon or retrovirus. Reverse transcriptases occur in a variety of mobile elements, including retrotransposons, retroviruses, group II introns, bacterial msDNAs, hepadnaviruses, and caulimoviruses.
+ 365856
+ 184
+
+
+ 1
+ 33.8002
+ 78
+ 0.000870142
+ 110
+ 220
+ 97
+ 136
+ -3
+ 0
+ 11
+ 17
+ 3
+ 40
+ VLPFGLKNDGAPYQRAMTALFHDMIHKE---MEVYVDDMI
+ GLPQGLVLSPALFQLFMNELLRPLRKRAGLTLVRYADDIL
+ LP GL A +Q M L + + + Y DD++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 146
+ ds2020-267_370
+ No definition line
+ 242
+
+
+ 1
+ gnl|CDD|376297
+ pfam00146, NADHdh, NADH dehydrogenase.
+ 376297
+ 301
+
+
+ 1
+ 52.4668
+ 127
+ 2.41391e-10
+ 22
+ 111
+ 269
+ 298
+ 1
+ 0
+ 20
+ 24
+ 0
+ 30
+ VRAAFPRYRYDQLMGLGRKVFLPLSLARVV
+ IRATLPRFRYDQLMRLGWKVLLPLSLANLL
+ +RA PR+RYDQLM LG KV LPLSLA ++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 46
+ 74130676
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 147
+ ds2020-267_798
+ No definition line
+ 209
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 148
+ ds2020-267_278
+ No definition line
+ 258
+
+
+ 1
+ gnl|CDD|365808
+ pfam00012, HSP70, Hsp70 protein. Hsp70 chaperones help to fold many proteins. Hsp70 assisted folding involves repeated cycles of substrate binding and release. Hsp70 activity is ATP dependent. Hsp70 proteins are made up of two regions: the amino terminus is the ATPase domain and the carboxyl terminus is the substrate binding region.
+ 365808
+ 598
+
+
+ 1
+ 77.6867
+ 192
+ 4.1355e-19
+ 50
+ 232
+ 417
+ 477
+ 2
+ 0
+ 27
+ 37
+ 0
+ 61
+ SQTFSTAEDGQSQILLHLYRGDSAMAKSAHSLGTFQITGIAPMPRGEPSVRVEFLADTGGI
+ SQIFSTAADNQTAVEIQVYQGEREMAPDNKLLGSFELDGIPPAPRGVPQIEVTFDIDANGI
+ SQ FSTA D Q+ + + +Y+G+ MA LG+F++ GI P PRG P + V F D GI
+
+
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 75910968
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 149
+ ds2020-267_314
+ No definition line
+ 252
+
+
+
+
+ 17919
+ 3004588
+ 49
+ 74429495
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 150
+ ds2020-267_1251
+ No definition line
+ 58
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 151
+ ds2020-267_435
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 152
+ ds2020-267_1017
+ No definition line
+ 83
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 153
+ ds2020-267_1214
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 154
+ ds2020-267_960
+ No definition line
+ 125
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 155
+ ds2020-267_772
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 156
+ ds2020-267_937
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 157
+ ds2020-267_812
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 158
+ ds2020-267_66
+ No definition line
+ 460
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 117585038
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 159
+ ds2020-267_425
+ No definition line
+ 235
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 160
+ ds2020-267_1010
+ No definition line
+ 96
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 161
+ ds2020-267_727
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 162
+ ds2020-267_745
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 163
+ ds2020-267_512
+ No definition line
+ 225
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 164
+ ds2020-267_899
+ No definition line
+ 146
+
+
+
+
+ 17919
+ 3004588
+ 20
+ 74093824
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 165
+ ds2020-267_1020
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 166
+ ds2020-267_724
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 167
+ ds2020-267_1163
+ No definition line
+ 64
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 168
+ ds2020-267_62
+ No definition line
+ 464
+
+
+
+
+ 17919
+ 3004588
+ 79
+ 119174025
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 169
+ ds2020-267_824
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 170
+ ds2020-267_495
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 171
+ ds2020-267_479
+ No definition line
+ 229
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 73724343
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 172
+ ds2020-267_437
+ No definition line
+ 234
+
+
+
+
+ 17919
+ 3004588
+ 44
+ 75349168
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 173
+ ds2020-267_947
+ No definition line
+ 127
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.065298648
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 174
+ ds2020-267_531
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 175
+ ds2020-267_454
+ No definition line
+ 232
+
+
+
+
+ 17919
+ 3004588
+ 43
+ 75958414
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 176
+ ds2020-267_931
+ No definition line
+ 129
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 177
+ ds2020-267_364
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|365952
+ pfam00216, Bac_DNA_binding, Bacterial DNA-binding protein.
+ 365952
+ 88
+
+
+ 1
+ 50.2082
+ 121
+ 1.5507e-10
+ 134
+ 241
+ 53
+ 88
+ -3
+ 0
+ 23
+ 24
+ 0
+ 36
+ ARPQRKRRNPATGEAIQIPAKKAPIFKAGKALKDAV
+ KRAARTGRNPKTGEAITIPAKKVVKFKPGKELKEAV
+ R R RNP TGEAI IPAKK FK GK LK+AV
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 178
+ ds2020-267_790
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 179
+ ds2020-267_953
+ No definition line
+ 126
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 180
+ ds2020-267_340
+ No definition line
+ 247
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 75683825
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 181
+ ds2020-267_822
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 182
+ ds2020-267_1241
+ No definition line
+ 59
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 57087172
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 183
+ ds2020-267_558
+ No definition line
+ 222
+
+
+ 1
+ gnl|CDD|377116
+ pfam03737, RraA-like, Aldolase/RraA. Members of this family include regulator of ribonuclease E activity A (RraA) and 4-hydroxy-4-methyl-2-oxoglutarate (HMG)/4-carboxy- 4-hydroxy-2-oxoadipate (CHA) aldolase, also known as RraA-like protein. RraA acts as a trans-acting modulator of RNA turnover, binding essential endonuclease RNase E and inhibiting RNA processing. RraA-like proteins seem to contain aldolase and/or decarboxylase activity either in place of or in addition to the RNase E inhibitor functions.
+ 377116
+ 147
+
+
+ 1
+ 57.5038
+ 140
+ 4.93695e-13
+ 57
+ 179
+ 104
+ 147
+ -2
+ 0
+ 18
+ 28
+ 3
+ 44
+ VFA---IPRKSNRKGVGETDIEISFGGLTINSGMYVYADNNGII
+ VFALGTTPRGSPKKGGGEVNVPVTIGGVTVRPGDIVVADEDGVV
+ VFA PR S +KG GE ++ ++ GG+T+ G V AD +G++
+
+
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 184
+ ds2020-267_43
+ No definition line
+ 563
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 164633794
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 185
+ ds2020-267_702
+ No definition line
+ 214
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 186
+ ds2020-267_1230
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 187
+ ds2020-267_1186
+ No definition line
+ 62
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 188
+ ds2020-267_925
+ No definition line
+ 131
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 73382868
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 189
+ ds2020-267_122
+ No definition line
+ 338
+
+
+
+
+ 17919
+ 3004588
+ 70
+ 73510836
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 190
+ ds2020-267_770
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 191
+ ds2020-267_1078
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 192
+ ds2020-267_102
+ No definition line
+ 375
+
+
+
+
+ 17919
+ 3004588
+ 76
+ 80494456
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 193
+ ds2020-267_713
+ No definition line
+ 213
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 194
+ ds2020-267_660
+ No definition line
+ 216
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 195
+ ds2020-267_1147
+ No definition line
+ 65
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 63096348
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 196
+ ds2020-267_760
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 197
+ ds2020-267_542
+ No definition line
+ 224
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 198
+ ds2020-267_11
+ No definition line
+ 1579
+
+
+
+
+ 17919
+ 3004588
+ 91
+ 597672165
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 199
+ ds2020-267_209
+ No definition line
+ 277
+
+
+
+
+ 17919
+ 3004588
+ 55
+ 74704591
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 200
+ ds2020-267_618
+ No definition line
+ 218
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 76089651
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 201
+ ds2020-267_1133
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 202
+ ds2020-267_939
+ No definition line
+ 128
+
+
+
+
+ 17919
+ 3004588
+ 15
+ 73866681
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 203
+ ds2020-267_749
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 204
+ ds2020-267_1008
+ No definition line
+ 96
+
+
+
+
+ 17919
+ 3004588
+ 6
+ 75323924
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 205
+ ds2020-267_135
+ No definition line
+ 323
+
+
+
+
+ 17919
+ 3004588
+ 66
+ 74699294
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 206
+ ds2020-267_218
+ No definition line
+ 274
+
+
+ 1
+ gnl|CDD|279664
+ pfam01348, Intron_maturas2, Type II intron maturase. Group II introns use intron-encoded reverse transcriptase, maturase and DNA endonuclease activities for site-specific insertion into DNA. Although this type of intron is self splicing in vitro they require a maturase protein for splicing in vivo. It has been shown that a specific region of the aI2 intron is needed for the maturase function. This region was found to be conserved in group II introns and called domain X.
+ 279664
+ 140
+
+
+ 1
+ 38.6047
+ 90
+ 1.66328e-05
+ 51
+ 257
+ 32
+ 100
+ 3
+ 0
+ 21
+ 32
+ 0
+ 69
+ PIHVACLTNVSDGDIVNWSAGIAINPLSYYRCRDNLYQVRTIVDHQIRWSAIFTLAHKHKSSARNIILK
+ PRSVGRWTDLDDRDILLRYNAIIRGILNYYSFADNKKRLYTRIYYILRLSCAKTLARKLKLGTVRKVIK
+ P V T++ D DI+ I L+YY DN ++ T + + +R S TLA K K ++K
+
+
+
+
+
+
+ 17919
+ 3004588
+ 54
+ 75367594
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 207
+ ds2020-267_777
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 208
+ ds2020-267_1105
+ No definition line
+ 71
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 209
+ ds2020-267_972
+ No definition line
+ 123
+
+
+
+
+ 17919
+ 3004588
+ 14
+ 74350494
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 210
+ ds2020-267_1070
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 211
+ ds2020-267_835
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 212
+ ds2020-267_286
+ No definition line
+ 257
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 213
+ ds2020-267_820
+ No definition line
+ 208
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 214
+ ds2020-267_324
+ No definition line
+ 250
+
+
+
+
+ 17919
+ 3004588
+ 48
+ 75056660
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 215
+ ds2020-267_363
+ No definition line
+ 243
+
+
+ 1
+ gnl|CDD|366086
+ pfam00416, Ribosomal_S13, Ribosomal protein S13/S18. This family includes ribosomal protein S13 from prokaryotes and S18 from eukaryotes.
+ 366086
+ 109
+
+
+ 1
+ 37.3005
+ 87
+ 2.02528e-05
+ 15
+ 134
+ 2
+ 41
+ -2
+ 0
+ 14
+ 21
+ 0
+ 40
+ ISGARSVADEQVRIASTKIDGIGPKKAIQVRYRLGISGDI
+ ILGTDIDGDKKVEIALTYIKGIGRRRANIILKKAGVDLDK
+ I G D++V IA T I GIG ++A + + G+ D
+
+
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 216
+ ds2020-267_674
+ No definition line
+ 215
+
+
+
+
+ 17919
+ 3004588
+ 39
+ 73783904
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 217
+ ds2020-267_863
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.070739016
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 218
+ ds2020-267_1109
+ No definition line
+ 70
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 69105524
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 219
+ ds2020-267_45
+ No definition line
+ 540
+
+
+
+
+ 17919
+ 3004588
+ 81
+ 153761751
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 220
+ ds2020-267_746
+ No definition line
+ 211
+
+
+ 1
+ gnl|CDD|279788
+ pfam01490, Aa_trans, Transmembrane amino acid transporter protein. This transmembrane region is found in many amino acid transporters including UNC-47 and MTR. UNC-47 encodes a vesicular amino butyric acid (GABA) transporter, (VGAT). UNC-47 is predicted to have 10 transmembrane domains. MTR is a N system amino acid transporter system protein involved in methyltryptophan resistance. Other members of this family include proline transporters and amino acid permeases.
+ 279788
+ 410
+
+
+ 1
+ 35.3596
+ 82
+ 0.000177299
+ 21
+ 176
+ 358
+ 410
+ 3
+ 0
+ 11
+ 21
+ 1
+ 53
+ WPLAIYFPVEMYFVQKKI-GSWTRKWIVLEAFSLVCFLVTVVGVIGSVQGLIS
+ APLSFILPPLFHLKLKKTKKKSQEKLWKPDILDVICIVIGLLLMAYGVAGLIL
+ PL+ P + KK K + ++C ++ ++ + V GLI
+
+
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+
+
+ 221
+ ds2020-267_403
+ No definition line
+ 239
+
+
+
+
+ 17919
+ 3004588
+ 45
+ 74739922
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 222
+ ds2020-267_350
+ No definition line
+ 245
+
+
+
+
+ 17919
+ 3004588
+ 47
+ 73521430
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 223
+ ds2020-267_144
+ No definition line
+ 315
+
+
+
+
+ 17919
+ 3004588
+ 65
+ 73594120
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 224
+ ds2020-267_1049
+ No definition line
+ 75
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 75114700
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 225
+ ds2020-267_499
+ No definition line
+ 227
+
+
+
+
+ 17919
+ 3004588
+ 42
+ 74315670
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 226
+ ds2020-267_22
+ No definition line
+ 841
+
+
+
+
+ 17919
+ 3004588
+ 85
+ 288887235
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 227
+ ds2020-267_862
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 228
+ ds2020-267_294
+ No definition line
+ 255
+
+
+
+
+ 17919
+ 3004588
+ 50
+ 73802330
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 229
+ ds2020-267_31
+ No definition line
+ 712
+
+
+
+
+ 17919
+ 3004588
+ 84
+ 229406976
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 230
+ ds2020-267_1019
+ No definition line
+ 81
+
+
+
+
+ 17919
+ 3004588
+ 2
+ 74218750
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 231
+ ds2020-267_747
+ No definition line
+ 211
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 232
+ ds2020-267_543
+ No definition line
+ 223
+
+
+
+
+ 17919
+ 3004588
+ 41
+ 74906997
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 233
+ ds2020-267_1072
+ No definition line
+ 73
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 72110112
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 234
+ ds2020-267_784
+ No definition line
+ 210
+
+
+
+
+ 17919
+ 3004588
+ 38
+ 74357312
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 235
+ ds2020-267_879
+ No definition line
+ 206
+
+
+
+
+ 17919
+ 3004588
+ 36
+ 75504128
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 236
+ ds2020-267_1120
+ No definition line
+ 67
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 237
+ ds2020-267_1126
+ No definition line
+ 66
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 66100936
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 238
+ ds2020-267_1218
+ No definition line
+ 60
+
+
+
+
+ 17919
+ 3004588
+ 0
+ 60091760
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 239
+ ds2020-267_915
+ No definition line
+ 134
+
+
+
+
+ 17919
+ 3004588
+ 16
+ 76100752
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 240
+ ds2020-267_1026
+ No definition line
+ 79
+
+
+
+
+ 17919
+ 3004588
+ 1
+ 74666725
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+ 241
+ ds2020-267_845
+ No definition line
+ 207
+
+
+
+
+ 17919
+ 3004588
+ 37
+ 74930720
+ 0.041
+ 0.267
+ 0.14
+
+
+ No hits found
+
+
+
diff -r 000000000000 -r b82ce29791e7 virAnnot_blast2tsv.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/virAnnot_blast2tsv.xml Wed Aug 21 13:12:59 2024 +0000
@@ -0,0 +1,87 @@
+
+ convert XML blast results to tabular file with taxonomic informations
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+ BLASTX
+ BLASTP
+ TBLASTX
+ BLASTN
+ DIAMOND
+
+
+ 0
+ 0.1
+ 0.01
+ 0.001
+ 0.0001
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+