diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 63affe7eeab126046c62147c43d1fc4a9795e0b4..59b498464e973523f9ea95f9d55ca5ba9cd50847 100755 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -78,14 +78,13 @@ unit-test-ubuntu: - prokka --version - prodigal -v - py.test test/test_unit/test_utils.py -vx + - py.test test/test_unit/test_utils-logging.py -xv - py.test test/test_unit/test_utils-pan.py -vx + - py.test test/test_unit/test_utils-argparse.py -vx - py.test test/test_unit/test_prepare -v -x - py.test test/test_unit/test_annotate/test_genome_func.py -vx - # - py.test test/test_unit/test_annotate/test_format_prodigal.py -vx - # - py.test test/test_unit/test_annotate/test_format_prokka.py -vx - # - py.test test/test_unit/test_annotate/test_annotation_functions-prokka.py -vx - - py.test test/test_unit/test_annotate/test_annotation_general.py -vx - # - py.test test/test_unit/test_apnnotate/test_format_func.py -v -x + - py.test test/test_unit/test_annotate/test_annotation* -vx + - py.test test/test_unit/test_annotate/test_format* -v -x - py.test test/test_unit/test_pangenome -vx - py.test test/test_unit/test_corepers -vx - py.test test/test_unit/test_align -vx @@ -108,13 +107,15 @@ func-test-ubuntu: - pip3 install -r requirements-dev.txt - ./make script: + - py.test test/test_functional/test_prepare* -vx - py.test test/test_functional/test_pangenome* -vx - py.test test/test_functional/test_corepers* -vx - - py.test test/test_functional/test_align* -vx + # - py.test test/test_functional/test_align* -vx + - py.test test/test_functional/test_align-parser.py -vx - py.test test/test_functional/test_tree* -vx - - py.test test/test_functional/test_tree-parser.py -vx - py.test test/test_functional/test_annote-parser.py -vx - py.test test/test_functional/test_annote.py -xv + - py.test test/test_functional/test_prepare* -vx - mv .coverage .coverage-functional artifacts: paths: diff --git a/MANIFEST.in b/MANIFEST.in index 
ab6b4aab9bc4cbeafde31abff774589cec1e6666..8ae6600107dae8dd68a377ff6d9ab7bfb7602b02 100755 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1 +1,2 @@ -include PanACoTA/align_module/prt2codon.awk \ No newline at end of file +include PanACoTA/align_module/prt2codon.awk +include requirements.txt diff --git a/PanACoTA/__init__.py b/PanACoTA/__init__.py index 1c86a194bb6c6232f9651d1000eaf60c6968dc71..121fd20451e97502656c178ca58963ab2c028651 100755 --- a/PanACoTA/__init__.py +++ b/PanACoTA/__init__.py @@ -1,3 +1,3 @@ """PanACoTA""" -__version__ = 1.0 +__version__ = "1.0.1.0" diff --git a/PanACoTA/align_module/alignment.py b/PanACoTA/align_module/alignment.py index a34c0c9b2bda3302b77c80d4b18bc35ef0c38e85..b0522efc7a2ae236db14a34cec22eba8bd1b8fb8 100755 --- a/PanACoTA/align_module/alignment.py +++ b/PanACoTA/align_module/alignment.py @@ -96,7 +96,7 @@ def align_all_families(prefix, all_fams, ngenomes, dname, quiet, threads): progressbar.Percentage(), ') - ', progressbar.Timer(), ' - ' ] bar = progressbar.ProgressBar(widgets=widgets, max_value=nbfam, - term_width=100).start() + term_width=79).start() final = [] if threads == 1: update_bar = 1 diff --git a/PanACoTA/align_module/get_seqs.py b/PanACoTA/align_module/get_seqs.py index dd7d849f15df5a11eae2c81835b05f0d05476d07..19c8ce77d019b1ca397eca999137410055cd1b33 100755 --- a/PanACoTA/align_module/get_seqs.py +++ b/PanACoTA/align_module/get_seqs.py @@ -85,7 +85,7 @@ def get_all_seqs(all_genomes, dname, dbpath, listdir, aldir, all_fams, quiet): ' ', progressbar.Counter(), "/{}".format(nbgen), ' (', progressbar.Percentage(), ") - ", progressbar.Timer(), ' ', progressbar.ETA()] - bar = progressbar.ProgressBar(widgets=widgets, max_value=nbgen, term_width=150).start() + bar = progressbar.ProgressBar(widgets=widgets, max_value=nbgen, term_width=79).start() curnum = 1 for genome in all_genomes: ge_gen = os.path.join(listdir, dname + "-getEntry_gen_" + genome + ".txt") diff --git a/PanACoTA/annotate_module/annotation_functions.py 
b/PanACoTA/annotate_module/annotation_functions.py index 93bc1470d18c7033e01401066375ddd643eaeecc..734fe1591dfefea6934638fba0dad5fd19766fa3 100755 --- a/PanACoTA/annotate_module/annotation_functions.py +++ b/PanACoTA/annotate_module/annotation_functions.py @@ -106,7 +106,7 @@ def run_annotation_all(genomes, threads, force, annot_folder, prodigal_only=Fals progressbar.Percentage(), ') - ', progressbar.Timer(), ' - ' ] bar = progressbar.ProgressBar(widgets=widgets, max_value=nbgen, - term_width=100).start() + term_width=79).start() # Get resource availability: # - number of threads used by prokka/prodigal (cores_annot) # - how many genomes can be annotated at the same time (pool_size) @@ -147,8 +147,12 @@ def run_annotation_all(genomes, threads, force, annot_folder, prodigal_only=Fals break # If not done, get number of genomes left remaining = final._number_left - # Update progress bar - bar.update(nbgen - remaining) + # Add this to start progressbar with 0% instead of N/A% + if remaining == nbgen: + bar.update(0.0000001) + else: + # Update progress bar + bar.update(nbgen - remaining) # End progress bar bar.finish() pool.join() @@ -258,11 +262,11 @@ def run_prokka(arguments): # - if outdir exists exists but force, remove this outdir. # So, outdir does not exist -> run prokka cmd = (f"prokka --outdir {prok_dir} --cpus {threads} " - f"--prefix {name} {gpath}") + f"--prefix {name} --centre prokka {gpath}") error = (f"Error while trying to run prokka on {name} from {gpath}") logger.details("Prokka command: " + cmd) prokf = open(prok_logfile, "w") - ret = utils.run_cmd(cmd, error, eof=False, stderr=prokf) + ret = utils.run_cmd(cmd, error, eof=False, stderr=prokf, logger=logger) prokf.close() if ret.returncode != 0: return False @@ -324,7 +328,7 @@ def run_prodigal(arguments): # otherwise it would have been deleted just before), # can we use it for next step ? -> check content. 
if os.path.isdir(prodigal_dir): - logger.warning(("Prodigal results folder already exists.").format(prodigal_dir)) + logger.warning(f"Prodigal results folder {prodigal_dir} already exists.") ok = check_prodigal(gpath, name, prodigal_dir, logger) # If everything ok in the result dir, do not rerun prodigal, # use those results for next step (formatting) @@ -419,10 +423,17 @@ def check_prokka(outdir, logf, name, gpath, nbcont, logger): missing_file = True else: oriname = os.path.basename(gpath) + fnafile = glob.glob(os.path.join(outdir, "*.fna")) tblfile = glob.glob(os.path.join(outdir, "*.tbl")) faafile = glob.glob(os.path.join(outdir, "*.faa")) ffnfile = glob.glob(os.path.join(outdir, "*.ffn")) gfffile = glob.glob(os.path.join(outdir, "*.gff")) + if len(fnafile) == 0: + logger.error("{} {}: no .fna file".format(name, oriname)) + missing_file = True + elif len(fnafile) > 1: + logger.error("{} {}: several .fna files".format(name, oriname)) + missing_file = True if len(tblfile) == 0: logger.error("{} {}: no .tbl file".format(name, oriname)) missing_file = True @@ -451,7 +462,7 @@ def check_prokka(outdir, logf, name, gpath, nbcont, logger): tblfile = tblfile[0] faafile = faafile[0] ffnfile = ffnfile[0] - fnbcont, tnb_cds, nb_gene, tnb_crispr = count_tbl(tblfile) + fnbcont, tnb_cds, nb_gene = count_tbl(tblfile) faaprot = count_headers(faafile) ffngene = count_headers(ffnfile) if nbcont != fnbcont: @@ -462,12 +473,6 @@ def check_prokka(outdir, logf, name, gpath, nbcont, logger): logger.error(("{} {}: no matching number of proteins between tbl and faa; " "faa={}; in tbl ={}").format(name, oriname, faaprot, tnb_cds)) problem = True - if nb_gene + tnb_crispr != ffngene and nb_gene != ffngene: - logger.error(("{} {}: no matching number of genes between tbl and ffn; " - "ffn={}; in tbl ={}genes {}CRISPR").format(name, oriname, - ffngene, nb_gene, - tnb_crispr)) - problem = True return not problem and not missing_file @@ -500,24 +505,20 @@ def check_prodigal(gpath, name, 
prodigal_dir, logger): if len(faafile) != 1: logger.error("{} {}: no or several .faa file(s)".format(name, oriname)) - logger.info("no faa") missing_file = True if len(ffnfile) != 1: logger.error("{} {}: no or several .ffn file(s)".format(name, oriname)) missing_file = True - logger.info("no ffn") if len(gfffile) != 1: logger.error("{} {}: no or several .gff file(s)".format(name, oriname)) missing_file = True - logger.info("no gff") # If we have all result files, check they are not empty if not missing_file: if (os.path.getsize(faafile[0]) == 0 or os.path.getsize(ffnfile[0]) == 0 or os.path.getsize(gfffile[0]) == 0): - origname = os.path.basename(gpath) - logger.error("Genome {} (from {}): At least one of your prodigal result file " - "is empty.".format(name, origname)) + logger.error("Genome {} (from {}): At least one of your Prodigal result file " + "is empty.".format(name, oriname)) return False return not missing_file @@ -529,7 +530,7 @@ def count_tbl(tblfile): - number of contigs - number of proteins (CDS) - number of genes (locus_tag) - - number of CRISPR arrays (repeat_region) + - number of CRISPR arrays (repeat_region) -> ignore crisprs Parameters ---------- @@ -544,7 +545,7 @@ def count_tbl(tblfile): nbcont = 0 nb_cds = 0 nb_gene = 0 - nb_crispr = 0 + # nb_crispr = 0 with open(tblfile) as tblf: for line in tblf: if line.startswith(">"): @@ -553,9 +554,9 @@ def count_tbl(tblfile): nb_cds += 1 if "locus_tag" in line: nb_gene += 1 - if "repeat_region" in line: - nb_crispr += 1 - return nbcont, nb_cds, nb_gene, nb_crispr + # if "repeat_region" in line or (len(line.split()) == 3 and "CRISPR" in line): + # nb_crispr += 1 + return nbcont, nb_cds, nb_gene #, nb_crispr def count_headers(seqfile): diff --git a/PanACoTA/annotate_module/format_prodigal.py b/PanACoTA/annotate_module/format_prodigal.py index 7a2f7affa2ebfc4c6c4cb71b6afd756fb94cdf8e..30679831ce87064a8216cb72a7f5d8c5a9f96514 100644 --- a/PanACoTA/annotate_module/format_prodigal.py +++ 
b/PanACoTA/annotate_module/format_prodigal.py @@ -52,6 +52,7 @@ July 2019 import os import shutil +import glob import logging import PanACoTA.utils as utils @@ -100,9 +101,9 @@ def format_one_genome(gpath, name, prod_path, lst_dir, prot_dir, gene_dir, prodigal_dir = os.path.join(prod_path, os.path.basename(gpath) + "-prodigalRes") # Get prodigal result files - prot_file = os.path.join(prodigal_dir, name + ".faa") - gen_file = os.path.join(prodigal_dir, name + ".ffn") - gff_file = os.path.join(prodigal_dir, name + ".gff") + prot_file = glob.glob(os.path.join(prodigal_dir, "*.faa"))[0] + gen_file = glob.glob(os.path.join(prodigal_dir, "*.ffn"))[0] + gff_file = glob.glob(os.path.join(prodigal_dir, "*.gff"))[0] # Define names for generated gembase files res_prot_file = os.path.join(prot_dir, name + ".prt") @@ -169,7 +170,7 @@ def format_one_genome(gpath, name, prod_path, lst_dir, prot_dir, gene_dir, os.remove(res_rep_file) os.remove(res_gff_file) os.remove(res_prot_file) - except OSError: + except OSError: # pragma: no cover pass logger.error("Problems while generating .prt file (Proteins folder) " "for {}".format(name)) @@ -275,9 +276,9 @@ def create_gene_lst(contigs, gen_file, res_gen_file, res_lst_file, gpath, name): # If it is not the first gene of the genome, write previous gene information if prev_start != "": # Write line in LSTINFO file, + header and sequence to the gene file - _, lstline = gfunc.write_gene("CDS", locus_num, "NA", "NA", 0, - prev_loc, name, prev_cont_num, "NA", prev_info, - "NA", prev_strand, prev_start, prev_end, r_lst) + lstline = gfunc.write_gene("CDS", locus_num, "NA", "NA", + prev_loc, name, prev_cont_num, "NA", prev_info, + "NA", prev_strand, prev_start, prev_end, r_lst) gfunc.write_header(lstline, r_gen) r_gen.write(seq) # -> get new information, save it for the next gene, and go to next line @@ -302,9 +303,9 @@ def create_gene_lst(contigs, gen_file, res_gen_file, res_lst_file, gpath, name): # Otherwise, nothing to write if prev_start != 
"": prev_loc = "b" - _, lstline = gfunc.write_gene("CDS", locus_num, "NA", "NA", 0, - prev_loc, name, prev_cont_num, "NA", prev_info, "NA", - prev_strand, prev_start, prev_end, r_lst) + lstline = gfunc.write_gene("CDS", locus_num, "NA", "NA", + prev_loc, name, prev_cont_num, "NA", prev_info, "NA", + prev_strand, prev_start, prev_end, r_lst) gfunc.write_header(lstline, r_gen) r_gen.write(seq) return True diff --git a/PanACoTA/annotate_module/format_prokka.py b/PanACoTA/annotate_module/format_prokka.py index 51fcb6916cc0489c90a46314bfb59d96e0495c96..ec9e4fd4363f44436f61e8e45b3aa2ff2b11f260 100644 --- a/PanACoTA/annotate_module/format_prokka.py +++ b/PanACoTA/annotate_module/format_prokka.py @@ -101,6 +101,7 @@ def format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, """ prokka_dir = os.path.join(prok_path, os.path.basename(gpath) + "-prokkaRes") # Get needed Prokka result files + fna_file = glob.glob(os.path.join(prokka_dir, "*.fna"))[0] prokka_tbl_file = glob.glob(os.path.join(prokka_dir, "*.tbl"))[0] prokka_gff_file = glob.glob(os.path.join(prokka_dir, "*.gff"))[0] prokka_ffn_file = glob.glob(os.path.join(prokka_dir, "*.ffn"))[0] @@ -116,7 +117,7 @@ def format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, # Generate replicon file (same as input sequence but with gembase formatted headers). 
From # this file, get contig names, to be used to generate gff file - contigs, sizes = utils.get_genome_contigs_and_rename(name, gpath, res_rep_file, logger) + contigs, sizes = utils.get_genome_contigs_and_rename(name, fna_file, res_rep_file, logger) if not contigs: try: os.remove(res_rep_file) @@ -130,7 +131,7 @@ def format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, return False # Convert prokka tbl file to gembase .lst file format - ok_tbl = tbl2lst(prokka_tbl_file, res_lst_file, contigs, name, gpath) + ok_tbl = tbl2lst(prokka_tbl_file, res_lst_file, contigs, name, fna_file) if not ok_tbl: try: os.remove(res_rep_file) @@ -143,7 +144,7 @@ def format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, logger.error("Problems while generating LSTINFO file for {}".format(name)) return False # Create gff3 file for annotations - ok_gff = generate_gff(gpath, prokka_gff_file, res_gff_file, res_lst_file, sizes, contigs) + ok_gff = generate_gff(fna_file, prokka_gff_file, res_gff_file, res_lst_file, sizes, contigs) if not ok_gff: try: os.remove(res_rep_file) @@ -182,6 +183,9 @@ def format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, os.remove(res_gene_file) os.remove(res_prt_file) os.remove(res_rep_file) + # Remove twice to be able to check that when there is a problem while removing files, + # it generates the expected error + os.remove(res_rep_file) except OSError: pass logger.error("Problems while generating .prt file for {}".format(name)) @@ -235,8 +239,6 @@ def tbl2lst(tblfile, lstfile, contigs, genome, gpath): bool : True if genome name used in lstfile and prokka tblfile are the same, False otherwise """ - # Number CRISPRs. 
By default, 0 CRISPR -> next one will be CRISPR1 - crispr_num = 1 # Protein localisation in contig (b = border ; i = inside) cont_loc = "b" prev_cont_loc = "b" @@ -320,15 +322,19 @@ def tbl2lst(tblfile, lstfile, contigs, genome, gpath): # If not first gene of the contig, write the previous gene to .lst file # The first gene will be written while reading the 2nd gene - if start != "-1" and end != "-1": - crispr_num, lstline = general.write_gene(feature_type, locus_num, - gene_name, product, crispr_num, - prev_cont_loc, genome, - prev_cont_num, ecnum, inf2, - db_xref, strand, start, end, lstf) + if start != "-1" and end != "-1" and not crispr: + lstline = general.write_gene(feature_type, locus_num, + gene_name, product, + prev_cont_loc, genome, + prev_cont_num, ecnum, inf2, + db_xref, strand, start, end, lstf) # Get new values for the next gene: start, end, strand and feature type start, end, feature_type = elems + crispr = "CRISPR" in feature_type or "repeat_region" in feature_type + if crispr: + continue + # Get strain of gene if int(end) < int(start): start, end = end, start @@ -351,9 +357,9 @@ def tbl2lst(tblfile, lstfile, contigs, genome, gpath): # Write last feature if start != -1 and end != -1: prev_cont_loc = "b" - crispr_num, _ = general.write_gene(feature_type, locus_num, gene_name, product, - crispr_num, prev_cont_loc, genome, prev_cont_num, - ecnum, inf2, db_xref, strand, start, end, lstf) + general.write_gene(feature_type, locus_num, gene_name, product, + prev_cont_loc, genome, prev_cont_num, + ecnum, inf2, db_xref, strand, start, end, lstf) return True @@ -433,6 +439,9 @@ def generate_gff(gpath, prokka_gff_file, res_gff_file, res_lst_file, sizes, cont # continue (contig_name, source, type_g, start_g, end_g, score, strand_g, phase, attributes) = fields_g + # Ignore CRISPR + if "CRISPR" in type_g or "repeat_region" in type_g: + continue # Get information given to this same sequence from the lst file # (next lst line corresponds to next gff line without 
#), as, for each format, # there is 1 line per gene) @@ -452,7 +461,6 @@ def generate_gff(gpath, prokka_gff_file, res_gff_file, res_lst_file, sizes, cont if loc_name != gname: logger.error(f"Problem in {gff}: ID={gname} whereas locus_tag={loc_name}.") return False - # Compare information from lst and information from prodigal gff (start, # end and type of feature). They should correspond for (elemg, eleml, label) in zip([start_g, end_g, type_g], @@ -461,9 +469,6 @@ def generate_gff(gpath, prokka_gff_file, res_gff_file, res_lst_file, sizes, cont # If 1 element is different (start or end position, or type), print error # message and return False: this genome could not be converted to gff if elemg != eleml: - # For CRISPR, prokka puts repeat_region in gff - if elemg == "repeat_region" and eleml == "CRISPR": - continue logger.error(f"Files {tbl} and {gff} (in prokka tmp_files: {tmp}) " f"do not have the same {label} value for gene {gname} ({elemg} " f"in gff, {eleml} in tbl)") @@ -508,48 +513,37 @@ def create_gen(ffnseq, lstfile, genseq): True if conversion went well, False otherwise """ problem = False - crispr_id = 1 + write = True # Write next sequence with open(ffnseq) as ffn, open(lstfile) as lst, open(genseq, "w") as gen: for line_ffn in ffn: + # Ignore gene that we do not want to write (should be a crispr) # If line of sequence, write it as is, and go to next line if not line_ffn.startswith(">"): - gen.write(line_ffn) + # We just read a seq line. If we can write (write is True), do it and go + # to next line + # Otherwise, just go to next line + if write: + gen.write(line_ffn) continue - lstline = lst.readline().strip() - # Try to get gene ID. If does not work, look if it is a CRISPR in lstinfo + # Try to get gene ID. 
If does not work, ignore this gene (it may be a + # CRISPR, and we ignore them test_gen_id = line_ffn.split()[0].split("_")[-1] if not test_gen_id.isdigit(): - # If it is a CRISPR in lstline, and header of ffn does not have a gene format, - # then ffn contains the CRISPR sequence - if lstline.strip().split()[3] == "CRISPR": - crispr_id_lst = int(lstline.split("\t")[4].split("_CRISPR")[-1]) - if crispr_id == crispr_id_lst: - general.write_header(lstline, gen) - crispr_id += 1 - else: - logger.error(f"Problem with CRISPR numbers in {lstfile}. " - f"CRISPR {line_ffn.strip()} in ffn is CRISPR num " - f"{crispr_id}, whereas it is annotated as CRISPR num " - f"{crispr_id_lst} in lst file.") - return False - # It is not a CRISPR in lstline, and header of ffn does not have a gene format: - # problem - else: - logger.error((f"Unknown header format {line_ffn.strip()} in {ffnseq}.\n" - "Gen file will not be created.")) - return False + # Maybe a CRISPR? Or wrong gene name? -> ignore + logger.log(utils.detail_lvl(), + f"Unknown header format for {line_ffn.strip()}. " + "This gene will be ignored in .gen output file.") + write = False + continue # If ffn contains a gene header, find its information in lst file else: + write = True + lstline = lst.readline().strip() gen_id = int(test_gen_id) # genID exists, ffn header is for a gene. Check that it corresponds to # information in lst file. id_lst = lstline.split("\t")[4].split("_")[-1] - # if line in lst corresponds to a gene -> get gene ID. - # Otherwise, genID = 0 (CRISPR line in lst) - if id_lst.isdigit(): - gen_id_lst = int(id_lst) - else: - gen_id_lst = 0 + gen_id_lst = int(id_lst) # in lst, find the same gene ID as in ffn (some gene IDs in lst can be absent # from ffn, if prokka do not give their sequence). 
# As they are ordered by increasing number, go to next lstline until @@ -561,9 +555,7 @@ def create_gen(ffnseq, lstfile, genseq): gen_id_lst = "-1" break id_lst = lstline.split("\t")[4].split("_")[-1] - # don't cast to int if info for a crispr - if id_lst.isdigit(): - gen_id_lst = int(id_lst) + gen_id_lst = int(id_lst) # If it found the same gene ID, write info in gene file if gen_id == gen_id_lst: general.write_header(lstline.strip(), gen) diff --git a/PanACoTA/annotate_module/general_format_functions.py b/PanACoTA/annotate_module/general_format_functions.py index 67cb1d7625927535715859639614822adaa794a5..1a1e30ce50e9c203fb3f6bcf9ef80e74f8f38966 100644 --- a/PanACoTA/annotate_module/general_format_functions.py +++ b/PanACoTA/annotate_module/general_format_functions.py @@ -58,15 +58,14 @@ import progressbar import multiprocessing import threading import PanACoTA.utils as utils -import PanACoTA.annotate_module.format_prokka as fprokka -import PanACoTA.annotate_module.format_prodigal as fprodigal +from PanACoTA.annotate_module import format_prokka as fprokka +from PanACoTA.annotate_module import format_prodigal as fprodigal main_logger = logging.getLogger("annotate.geneffunc") -def format_genomes(genomes_ok, res_path, annot_path, prodigal_only, threads=1, quiet=False, - changed_name=False): +def format_genomes(genomes_ok, res_path, annot_path, prodigal_only, threads=1, quiet=False): """ For all genomes which were annotated (by prokka or prodigal), reformat them in order to have, in 'res_path', the following folders: @@ -80,27 +79,24 @@ def format_genomes(genomes_ok, res_path, annot_path, prodigal_only, threads=1, q Parameters ---------- genomes_ok : dict - genomes to format (annotation was OK) -> {genome: [name, gpath, size, nbcont, l90]} + genomes to format (annotation was OK) -> + {genome: [name, gpath, to_annot, size, nbcont, l90]} res_path : str path to folder where the 4 directories must be created annot_path : str - path to folder named "<genome_name>-[prokka, 
prodigal]Res" where all prokka/prodigal + path to folder containing "<genome_name>-[prokka, prodigal]Res" where all prokka/prodigal results are saved. prodigal_only: True if it was annotated by prodigal, False if annotated by prokka threads : int number of threads to use to while formatting genomes quiet : bool True if nothing must be sent to stderr/stdout, False otherwise - changed_name : bool - True if contig names have been changed (cutn != 0) -> contig names end by '_num', - False otherwise. Returns ------- - (skipped, skipped_format) : tuple + skipped_format : list - * skipped : list of genomes skipped because they had a problem in annotation step - * skipped_format : list of genomes skipped because they had a problem in format step + list of genomes skipped because they had a problem in format step """ main_logger.info("Formatting all genomes") lst_dir = os.path.join(res_path, "LSTINFO") @@ -133,7 +129,7 @@ def format_genomes(genomes_ok, res_path, annot_path, prodigal_only, threads=1, q # (genome, name, gpath, annot_path, lst_dir, prot_dir, gene_dir, rep_dir, # gff_dir, results, prodigal_only, q) params = [(genome, name, gpath, annot_path, lst_dir, prot_dir, gene_dir, - rep_dir, gff_dir, prodigal_only, q, changed_name) + rep_dir, gff_dir, prodigal_only, q) for genome, (name, _, gpath, _, _, _) in genomes_ok.items()] # Create pool and launch parallel formating steps @@ -195,7 +191,7 @@ def handle_genome(args): * genome name (used to get info from the pool.map_async) """ (genome, name, gpath, annot_path, lst_dir, prot_dir, - gene_dir, rep_dir, gff_dir, prodigal_only, q, changed) = args + gene_dir, rep_dir, gff_dir, prodigal_only, q) = args # Define which formatting must be used, given the annotation software if prodigal_only: @@ -216,7 +212,7 @@ def handle_genome(args): return ok_format, genome -def write_gene(gtype, locus_num, gene_name, product, crispr_num, cont_loc, +def write_gene(gtype, locus_num, gene_name, product, cont_loc, genome, cont_num, ecnum, 
inf2, db_xref, strand, start, end, lstopenfile): """ Write given gene to output file @@ -231,11 +227,6 @@ def write_gene(gtype, locus_num, gene_name, product, crispr_num, cont_loc, gene name found by prokka/prodigal ("NA" if no gene name -> Always the case with Prodigal) product : str found by prokka/Prodigal, "NA" if no product (always the case for prodigal) - crispr_num : int - current crispr number. In prokka tbl, CRISPRs are not numbered, they all - have the same name. We name them by adding a unique number to each CRISPR. If the current - gene to add is a CRISPR, this number will be incremented and returned. If not, this same - number will be returned. cont_loc : str 'i' if the gene is inside a contig, 'b' if its on the border (first or last gene of the contig) @@ -260,16 +251,9 @@ def write_gene(gtype, locus_num, gene_name, product, crispr_num, cont_loc, Returns ------- - tuple : - Current crispr number, lstline + str : + lstline """ - # if last gene was a crispr - if gtype == "repeat_region": - gtype = "CRISPR" - locus_num = "CRISPR" + str(crispr_num) - gene_name = "crispr" - product = "crispr-array" - crispr_num += 1 locus_name = "{}.{}{}_{}".format(genome, str(cont_num).zfill(4), cont_loc, str(locus_num).zfill(5)) # If '|' character found in those fields, replace by '_' to avoid problems while parsing @@ -279,7 +263,7 @@ def write_gene(gtype, locus_num, gene_name, product, crispr_num, cont_loc, db_xref.replace("|", "_")) lst_line = "\t".join([start, end, strand, gtype, locus_name, gene_name, more_info]) lstopenfile.write(lst_line + "\n") - return crispr_num, lst_line + return lst_line def write_header(lstline, outfile): diff --git a/PanACoTA/annotate_module/genome_seq_functions.py b/PanACoTA/annotate_module/genome_seq_functions.py index 639a4f9f0c31e6ed5c956d0bebaa70212491631b..dbb8a2b3a006bd9f78e29e65fd1b0accd95757a1 100755 --- a/PanACoTA/annotate_module/genome_seq_functions.py +++ b/PanACoTA/annotate_module/genome_seq_functions.py @@ -310,16 +310,7 @@ 
def format_contig(cut, pat, cur_seq, cur_contig_name, contig_sizes, gresf, num, if cut: # Cut sequence and write header + sequence to res file num = split_contig(pat, cur_seq, cur_contig_name, contig_sizes, gresf, num) - # PROKKA User does not want to cut, but will annotate with prokka, so we still - # have to create a new sequence file - elif gresf: - new_contig_name = "{}_{}\n".format(cur_contig_name, num) - gresf.write(new_contig_name) - gresf.write(cur_seq + "\n") - contig_sizes[new_contig_name] = len(cur_seq) - num += 1 - # PRODIGAL No cut, and prodigal used -> no new file created, but check - # contig unique names + # No cut -> no new file created, but check contig unique names else: if cur_contig_name in contig_sizes.keys(): logger.error("{} contig name is used for several contigs. Please put " @@ -334,7 +325,8 @@ def format_contig(cut, pat, cur_seq, cur_contig_name, contig_sizes, gresf, num, def split_contig(pat, whole_seq, cur_contig_name, contig_sizes, gresf, num): """ Save the contig read just before into dicts and write it to sequence file. - Contig name must be at most 20 characters (required by prokka) + Unique ID of contig must be in the first field of header, before the first space + (required by prokka) Parameters ---------- @@ -368,7 +360,7 @@ def split_contig(pat, whole_seq, cur_contig_name, contig_sizes, gresf, num): # we get empty contigs, if 2 occurrences of the pattern are side by side). 
if len(seq) == 0: continue - new_contig_name = "{}_{}\n".format(cur_contig_name, num) + new_contig_name = ">{}_{}\n".format(num, cur_contig_name.split(">")[1]) contig_sizes[new_contig_name] = len(seq) gresf.write(new_contig_name) gresf.write(seq + "\n") diff --git a/PanACoTA/prepare_module/download_genomes_func.py b/PanACoTA/prepare_module/download_genomes_func.py index bbab0ad92bfa532b4c554f42c36658aa9da04e86..e820316cc89e4c6f6f2003667a5ac284a583d6a0 100644 --- a/PanACoTA/prepare_module/download_genomes_func.py +++ b/PanACoTA/prepare_module/download_genomes_func.py @@ -53,7 +53,7 @@ from PanACoTA import utils logger = logging.getLogger("prepare.dds") -def download_from_refseq(species_linked, NCBI_species, NCBI_taxid, outdir, threads): +def download_from_refseq(species_linked, NCBI_species, NCBI_taxid, levels, outdir, threads): """ Download refseq genomes of given species @@ -79,7 +79,7 @@ def download_from_refseq(species_linked, NCBI_species, NCBI_taxid, outdir, threa """ # Name of summary file, with metadata for each strain: - sumfile = os.path.join(outdir, "assembly_summary-{}.txt".format(species_linked)) + sumfile = os.path.join(outdir, f"assembly_summary-{species_linked}.txt") abs_sumfile = os.path.abspath(sumfile) # arguments needed to download all genomes of the given species @@ -99,6 +99,10 @@ def download_from_refseq(species_linked, NCBI_species, NCBI_taxid, outdir, threa message += f" (NCBI_taxid = {NCBI_taxid})." else: message += f" NCBI_taxid = {NCBI_taxid}" + # If assembly level(s) given, add it to arguments, and write to info message + if levels: + keyargs["assembly_levels"] = levels + message += f" (Only those assembly levels: {levels}). 
" logger.info(f"Metadata for all genomes will be saved in {sumfile}") logger.info(message) diff --git a/PanACoTA/subcommands/align.py b/PanACoTA/subcommands/align.py index 315882b69c6172d6e5067da9b17a9472c556c710..0000d3f6bc36a041e1bb9cd0c7da7d744d748867 100755 --- a/PanACoTA/subcommands/align.py +++ b/PanACoTA/subcommands/align.py @@ -157,25 +157,7 @@ def build_parser(parser): """ import argparse import multiprocessing - - def thread_num(param): - try: - param = int(param) - except Exception: - msg = "argument --threads threads: invalid int value: {}".format(param) - raise argparse.ArgumentTypeError(msg) - nb_cpu = multiprocessing.cpu_count() - if param > nb_cpu: - msg = ("You have {} threads on your computer, you cannot ask for more: " - "invalid value: {}").format(nb_cpu, param) - raise argparse.ArgumentTypeError(msg) - elif param < 0: - msg = ("Please provide a positive number of threads (or 0 for all threads): " - "Invalid value: {}").format(param) - raise argparse.ArgumentTypeError(msg) - elif param == 0: - return nb_cpu - return param + from PanACoTA import utils_argparse # Create command-line parser for all options and arguments to give required = parser.add_argument_group('Required arguments') @@ -200,7 +182,7 @@ def build_parser(parser): help="Output directory, where all results must be saved ") optional = parser.add_argument_group('Optional arguments') - optional.add_argument("--threads", dest="threads", default=1, type=thread_num, + optional.add_argument("--threads", dest="threads", default=1, type=utils_argparse.thread_num, help=("add this option if you want to parallelize on several threads. " "Indicate on how many threads you want to parallelize. " "By default, it uses 1 thread. 
Put 0 if you want to use " diff --git a/PanACoTA/subcommands/annotate.py b/PanACoTA/subcommands/annotate.py index c8b7fde2a9a37e4d949c81645139a9a3087fef6b..616c2a1c19edd4e6ef20ae70321003019a27c25c 100755 --- a/PanACoTA/subcommands/annotate.py +++ b/PanACoTA/subcommands/annotate.py @@ -408,8 +408,7 @@ def main(cmd, list_file, db_path, res_dir, name, date, l90=100, nbcont=999, cutn skipped_format = [] # Generate database (folders Proteins, Genes, Replicons, LSTINFO) skipped_format = ffunc.format_genomes(results_ok, res_dir, res_annot_dir, - prodigal_only, threads, quiet=quiet, - changed_name=changed) + prodigal_only, threads, quiet=quiet) print(skipped_format) # At least one genome could not be formatted -> warn user if skipped_format: @@ -480,7 +479,7 @@ def build_parser(parser): optional.add_argument("--nbcont", dest="nbcont", type=utils_argparse.cont_num, default=999, help=("Maximum number of contigs allowed to keep a genome. " "Default is 999.")) - optional.add_argument("--cutn", dest="cutn", type=int, default=5, + optional.add_argument("--cutn", dest="cutn", type=utils_argparse.positive_int, default=5, help=("By default, each genome will be cut into new contigs when " "at least 5 'N' in a row are found in its sequence. 
" "If you don't want to " diff --git a/PanACoTA/subcommands/prepare.py b/PanACoTA/subcommands/prepare.py index 6a9c76591ebd2fa028b85199682e083035531498..ebe85ea69753ca1d6e2bac136df10d14f4a635e9 100644 --- a/PanACoTA/subcommands/prepare.py +++ b/PanACoTA/subcommands/prepare.py @@ -66,14 +66,14 @@ def main_from_parse(arguments): """ cmd = "PanACoTA " + ' '.join(arguments.argv) - main(cmd, arguments.NCBI_species, arguments.NCBI_species_taxid, arguments.outdir, - arguments.tmp_dir, arguments.parallel, arguments.no_refseq, arguments.db_dir, - arguments.only_mash, + main(cmd, arguments.NCBI_species, arguments.NCBI_species_taxid, arguments.levels, + arguments.outdir, arguments.tmp_dir, arguments.parallel, arguments.no_refseq, + arguments.db_dir, arguments.only_mash, arguments.from_info, arguments.l90, arguments.nbcont, arguments.cutn, arguments.min_dist, arguments.max_dist, arguments.verbose, arguments.quiet) -def main(cmd, NCBI_species, NCBI_taxid, outdir, tmp_dir, threads, no_refseq, db_dir, +def main(cmd, NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, verbose, quiet): """ Main method, constructing the draft dataset for the given species @@ -226,20 +226,15 @@ def main(cmd, NCBI_species, NCBI_taxid, outdir, tmp_dir, threads, no_refseq, db_ "output folder called 'new_outdir', make sure you have " "'-o new_outdir' option, " "and you specified where the uncompressed sequences to " - "use are ('-d sequence_database_path' -> " - "my_outdir/Database_init). ") + "use are ('-d sequence_database_path'). 
") sys.exit(1) # add genomes from refseq/bacteria folder to Database_init nb_gen, _ = dgf.to_database(outdir) - # If no genome found, error -> nothing to analyse - if nb_gen == 0: - logger.error(f"There is no genome in {refseqdir}.") - sys.exit(1) # No sequence: Do all steps -> download, QC, mash filter else: # Download all genomes of the given taxID db_dir, nb_gen = dgf.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, - outdir, threads) + levels, outdir, threads) logger.info("{} refseq genome(s) downloaded".format(nb_gen)) # Now that genomes are downloaded and uncompressed, check their quality to remove bad ones @@ -250,7 +245,7 @@ def main(cmd, NCBI_species, NCBI_taxid, outdir, tmp_dir, threads, no_refseq, db_ else: logger.warning('You asked to run only mash steps.') if not os.path.exists(info_file): # info-file missing -> error and exit - logger.error(f"Your info file {info_file} does not exist. Please Provide the " + logger.error(f"Your info file {info_file} does not exist. Please provide the " "right name/path, or remove the '--mash-only option to rerun " "quality control.") sys.exit(1) @@ -290,13 +285,21 @@ def build_parser(parser): general = parser.add_argument_group('General arguments') general.add_argument("-t", dest="NCBI_species_taxid", default="", help=("Species taxid to download, corresponding to the " - "'species taxid' provided by the NCBI") + "'species taxid' provided by the NCBI. A comma-separated " + "list of taxid can also be provided.") ) general.add_argument("-s", dest="NCBI_species", default="", help=("Species to download, corresponding to the " "'organism name' provided by the NCBI. Give name between " "quotes (for example \"escherichia coli\")") ) + general.add_argument("-l", "--assembly_level", dest="levels", default="", + help=("Assembly levels of genomes to download (default: all). " + "Possible levels are: 'all', 'complete', 'chromosome', " + "'scaffold', 'contig'." 
+ "You can also provide a comma-separated list of assembly " + "levels. For ex: 'complete,chromosome'") + ) general.add_argument("-o", dest="outdir", help=("Give the path to the directory where you want to save the " "downloaded database. In the given directory, it will create " @@ -312,7 +315,7 @@ def build_parser(parser): "By default, it will be saved in your " "out_dir/tmp_files.") ) - general.add_argument("--cutn", dest="cutn", type=int, default=5, + general.add_argument("--cutn", dest="cutn", type=utils_argparse.positive_int, default=5, help=("By default, each genome will be cut into new contigs when " "at least 5 'N' in a row are found in its sequence. " "If you don't want to " @@ -325,16 +328,18 @@ def build_parser(parser): general.add_argument("--nbcont", dest="nbcont", type=utils_argparse.cont_num, default=999, help=("Maximum number of contigs allowed to keep a genome. " "Default is 999.")) - general.add_argument("--min", dest="min_dist", default=1e-4, type=float, + general.add_argument("--min_dist", dest="min_dist", default=1e-4, + type=utils_argparse.mash_dist, help="By default, genomes whose distance to the reference is not " "between 1e-4 and 0.06 are discarded. You can specify your own " "lower limit (instead of 1e-4) with this option.") - general.add_argument("--max_dist", dest="max_dist", default=0.06, type=float, - help="By default, genomes whose distance to the reference is not " - "between 1e-4 and 0.06 are discarded. You can specify your own " - "lower limit (instead of 0.06) with this option.") - general.add_argument("-p", dest="parallel", type=utils_argparse.thread_num, default=1, - help=("Run 'N' downloads in parallel (default=1). Put 0 if " + general.add_argument("--max_dist", dest="max_dist", default=0.06, + type=utils_argparse.mash_dist, + help="By default, genomes whose distance to the reference is not " + "between 1e-4 and 0.06 are discarded. 
You can specify your own " + "lower limit (instead of 0.06) with this option.") + general.add_argument("-p", "--threads", dest="parallel", type=utils_argparse.thread_num, + default=1, help=("Run 'N' downloads in parallel (default=1). Put 0 if " "you want to use all cores of your computer.")) optional = parser.add_argument_group('Alternatives') @@ -453,6 +458,20 @@ def check_args(parser, args): parser.error("Choose between a verbose output (-v) or a quiet output (-q)." " You cannot have both.") + # min_dist must be strictly lower than max_dist + if args.min_dist >= args.max_dist: + parser.error(f"min_dist ({args.min_dist}) cannot be higher " + f"than max_dist ({args.max_dist})") + + # Check that levels, if given, are among possible ones + possible = ["all", "complete", "chromosome", "scaffold", "contig"] + if args.levels: + for level in args.levels.split(","): + if level not in possible: + parser.error("Please choose between available assembly levels: 'all', 'complete', " + "'chromosome', 'scaffold', 'contig'. If several levels, provide a " + f"comma-separated list. 
Invalid value: '{args.levels}'") + # WARNINGS # User did not specify a species name if not args.NCBI_species: diff --git a/PanACoTA/utils.py b/PanACoTA/utils.py index 4d51eecffea54da35762d47778cf6eced939526e..9828d464b413ea503e7cf1a27daf808c623028ed 100755 --- a/PanACoTA/utils.py +++ b/PanACoTA/utils.py @@ -824,7 +824,7 @@ def read_genomes_info(list_file, name, date=None, logger=None): if len(genomes) > 0: logger.info(("Found {} genomes in total").format(len(genomes))) else: - logger.error(f"no genome listed in {list_file} were found.") + logger.error(f"No genome listed in {list_file} was found.") sys.exit(1) return genomes @@ -1168,21 +1168,26 @@ def get_genome_contigs_and_rename(gembase_name, gpath, outfile, logger): else: seq += line cont_size += len(line.strip()) - # Write last contig - cont = "\t".join([prev_cont, str(cont_size)]) + "\n" - prevcont_nohead = "".join(prev_cont.split(">")[1:]) - prev_orig_name_nohead = prev_orig_name.split(">")[1] - if prev_orig_name_nohead: - if prev_orig_name_nohead in contigs: - logger.error(f"several contigs have the same name {prev_orig_name_nohead} " - f"in {gpath}.") - return False, False + # Write last contig, if there is one (if gpath not empty) + if prev_cont: + cont = "\t".join([prev_cont, str(cont_size)]) + "\n" + prevcont_nohead = "".join(prev_cont.split(">")[1:]) + prev_orig_name_nohead = prev_orig_name.split(">")[1] + if prev_orig_name_nohead: + if prev_orig_name_nohead in contigs: + logger.error(f"several contigs have the same name {prev_orig_name_nohead} " + f"in {gpath}.") + return False, False contigs[prev_orig_name_nohead] = prevcont_nohead sizes[prevcont_nohead] = cont_size grf.write(cont) grf.write(seq) + if not contigs: + logger.error(f"Your genome {gpath} does not contain any sequence, " + "or is not in fasta format.") return contigs, sizes - +# Add test with empty gpath +# Add test with non fasta gpath def logger_thread(q): diff --git a/PanACoTA/utils_argparse.py b/PanACoTA/utils_argparse.py index 
f5bb49bb4b75dd0228f0b80ae4da7166dafd6cf8..f553a571f80c99d7e5ed42793dd165306558f03b 100644 --- a/PanACoTA/utils_argparse.py +++ b/PanACoTA/utils_argparse.py @@ -99,3 +99,27 @@ def thread_num(param): elif param == 0: return nb_cpu return param + + +def positive_int(param): + try: + param = int(param) + except ValueError: + msg = f"error: argument --cutn: invalid int value: '{param}'" + raise argparse.ArgumentTypeError(msg) + if param < 0: + msg = f"error: argument --cutn must be a positive integer: invalid int value: '{param}'" + raise argparse.ArgumentTypeError(msg) + return param + + +def mash_dist(param): + try: + param = float(param) + except ValueError: + msg = f"error: mash distance: invalid float value: '{param}'" + raise argparse.ArgumentTypeError(msg) + if param < 0 or param > 1: + msg = f"error: mash distance must be between 0 and 1: invalid value: '{param}'" + raise argparse.ArgumentTypeError(msg) + return param diff --git a/README.md b/README.md index 1d8e88fe26652df1a53eb5de120b05e894547fdb..0db8a0c5a097287a3fccd101f293f771d90f38d0 100755 --- a/README.md +++ b/README.md @@ -1,9 +1,11 @@ # **PanACoTA** - [](COPYING) +[](https://badge.fury.io/py/PanACoTA) +[](https://github.com/gem-pasteur/PanACoTA/releases) [](https://singularity-hub.org/collections/4724) + [](https://doi.org/10.1101/2020.09.11.293472) -[](https://github.com/gem-pasteur/PanACoTA/releases) + [](COPYING) [](https://gitlab.pasteur.fr/aperrin/pipeline_annotation/-/commits) [](http://aperrin.pages.pasteur.fr/pipeline_annotation/htmlcov) @@ -39,14 +41,28 @@ If you use PanACoTA, please cite: Amandine PERRIN, Eduardo P.C. ROCHA (2020). PanACoTA: A modular tool for massive microbial comparative genomics. BioRxiv. 
[](https://doi.org/10.1101/2020.09.11.293472) +**Content of this README:** + +Installation +- [Dependencies](#dep) +- [pip](#pypi) +- [cloning github repository](#clone) +- [singularity](#singularity) + +Running +- [Quick run](#run) +- [Examples](#example) +- [Documentation](#doc) + +[Development](#develop) # Installation -## Dependencies +## <a name="dep"></a> Dependencies PanACoTA is written in **python3**. So, you need python3 (and pip3 for installation) to run it. -PanACoTA has several dependencies. Install only the one(s) you need, according to the module you want to use: +Then, PanACoTA has several external dependencies. If you use [`singularity`](#singularity) installation (for ex. to run on a cluster), you do not need to install any dependency. Otherwise, install only the one(s) you need, according to the module(s) you want to use: - For prepare module: [**mash**](https://mash.readthedocs.io/en/latest/) (to filter genomes) - For annotate module: [**prokka**](https://github.com/tseemann/prokka) and/or [**prodigal**](https://github.com/hyattpd/Prodigal) (to uniformly annotate your genomes) - For pangenome module: [**mmseqs**](https://github.com/soedinglab/MMseqs2) (to generate pangenomes) @@ -70,55 +86,78 @@ For FastTree, we advise to download C code from [here](http://www.microbesonline You can then add the output `FastTreeMP` to your `$PATH` to be able to run it from everywhere. +## <a name="install"></a> Installing `PanACoTA` and update + +You have different possibilities to install `PanACoTA`. + +**Warning:** If you plan to work on the scripts, choose the development installation (see [Development section](#develop)). + +### <a name="pypi"></a> From pip -## Downloading and updating `PanACoTA` +A very simple way to install the last stable version. This will install files in your python site-packages folder. 
-You can download `PanACoTA` source code by downloading a [zip file](https://github.com/gem-pasteur/PanACoTA/archive/master.zip), or by cloning its github repository (which is more recommended). By cloning the github repository, you will then be able to update the code to new versions very easily and quickly. Here is how to clone the repository: + pip install panacota + +And to get new version: + + pip install panacota --upgrade + +If you have permission issues, you can either use 'sudo' before the previous command lines to install it as root, or add the `--user` option to install it locally. + +### <a name="clone"></a> From github repository + +This allows you to get the very last version, and be able to test the last enhancements before they are uploaded to the other platforms. For that, go to where you want to install it `(<your_dir>)`, and type: git clone https://github.com/gem-pasteur/PanACoTA.git -This will create a repository called `PanACoTA`. Go inside this repository to install `PanACoTA`, as described hereafter. +This will create a repository called `PanACoTA`, containing the content of this github repository. To install PanACoTA: -If a new version of `PanACoTA` is released, and you want to use it, type the following command to update the source code: + cd PanACoTA + ./make + +If you have permission issues, you can either use 'sudo' before the previous command lines to install it as root, or add the `--user` option to install it locally. +To update to a new version, go back to your repository: + + cd <your_dir>/PanACoTA git pull + ./make update -Then, you will be able to upgrade to the new version (see bellow). -## <a name="install"></a> Installing `PanACoTA` (final mode) +### <a name="singularity"></a> From singularity image +[](https://singularity-hub.org/collections/4724) -To install `PanACoTA`, and all its dependencies, from the root directory, type: +Very useful if you do not have permission rights on the computer, such as, for example, on a cluster. 
The other advantage is that you do not need to install any dependency (except singularity itself of course). The singularity image includes all of them. You just have to download 1 file, and nothing will be installed anywhere on your computer. - ./make +First, download the singularity image: -or + singularity pull --name panacota.img shub://gem-pasteur/PanACoTA[:<version>] - ./make install +If you want a specific version, like version 1.0, specify `shub://gem-pasteur/PanACoTA:1.0`. -You will then be able to use the package from any directory in your computer, -just as any other software. +To get latest version: -If you have permission issues, you can either use 'sudo' before the previous command lines to install it as root, or add the `--user` option to install it locally. + singularity pull --name panacota.img shub://gem-pasteur/PanACoTA -**Warning:** If you plan to work on the scripts, choose the development installation (see [Development section](#develop)). +(This is the same as `singularity pull --name panacota.img shub://gem-pasteur/PanACoTA:latest`) -## <a name="uninstall"></a> Uninstalling `PanACoTA` +It will replace your file panacota.img by a new one corresponding to the latest version. -If you don't want `PanACoTA` anymore, or if you want to install a newer version, uninstall it by typing: +### From zip version - ./make uninstall +For people wanting to download source code of a specific version, we provide releases. 
You can download last one here: [](https://github.com/gem-pasteur/PanACoTA/releases) -## Upgrade to new version +## <a name="uninstall"></a> Uninstalling `PanACoTA` -If you want to install a new version of `PanACoTA` (and you got it by cloning the gitlab repository): -- update source code to the new version (`git pull`) -- upgrade installation to the new version (`./make upgrade`) +If you don't want `PanACoTA` anymore, uninstall it by typing: -If you installed it by downloading a zip file, [Uninstall it](#uninstall), and [install](#install) the new version (by cloning gitlab repository, or downloading the new zip file). + pip uninstall panacota # If you installed from pip + ./make uninstall # If you installed from github repository +Or, if you used singularity, just remove the downloaded image: `rm -r panacota.img` -# Running `PanACoTA` +# <a name="run"></a> Running `PanACoTA` ## Quick run @@ -139,34 +178,23 @@ Each subcommand has its own options and inputs. To get the list of required argu PanACoTA <subcommand> -h -## Examples + +When using singularity, just replace `PanACoTA` by `./panacota.img`: + + ./panacota.img <subcommand_name> <arguments_for_subcommand> + ./panacota.img -h + +## <a name="example"></a> Examples We provide a folder, `Examples`, containing genomic sequences (in `Examples/genomes`) and examples of input files (in `Examples/input_files`) for the software. In the [example part of documentation](http://aperrin.pages.pasteur.fr/pipeline_annotation/html-doc/examples.html), you will find information explaining you how to run the different modules of `PanACoTA` with this dataset, so that you can try the software. We also describe the results that should be created by each command line. **Note:** the provided genomic sequences are taken from real genomes, but then modified and drastically shortened in order to have an example showing different situations, but running very fast. Hence, the examples results should not be interpreted biologically! 
-## Documentation +## <a name="doc"></a> Documentation You can find more information in [PanACoTA documentation](http://aperrin.pages.pasteur.fr/pipeline_annotation/html-doc)! - -## On cluster - -[](https://singularity-hub.org/collections/4724) - -We provide a singularity image, to help running PanACoTA on a cluster. - -First, download the singularity image: - - singularity pull --name panacota.img shub://gem-pasteur/PanACoTA - -Then, you can run PanACoTA as previously: - - ./panacota.img -h # to get help on the whole PanACoTA program - ./panacota.img <subcommand_name> <arguments_for_subcommand> # to run a module of PanACoTA on your data. - - # <a name="develop"></a> Development This part is for people who want to work on developing `PanACoTA` package. In the documentation, there is a part dedicated to [developers](http://aperrin.pages.pasteur.fr/pipeline_annotation/html-doc/develop.html). @@ -175,9 +203,7 @@ PanACoTA is also hosted in gitlab, where all CI is done. Here is the link: https ## Installing `PanACoTA` (development mode) -If you want to install `PanACoTA` while still working on modifying the scripts, type: - - ./make develop +If you want to install `PanACoTA` while still working on modifying the scripts, use `./make develop` instead of `./make install` once you have cloned the repository. Your changes will then be taken into account. As you installed the package, you will be able to run it from any directory in your computer. 
diff --git a/containers/Singularity b/containers/Singularity index bbe21147078959f9d084029f6d2a6db028df9c0a..026136f88357dc1d137864dec4838f9ef101e2e5 100644 --- a/containers/Singularity +++ b/containers/Singularity @@ -28,7 +28,7 @@ From:python:3.7-stretch rm mash-Linux64-v2.2.tar &&\ mv /opt/src/mash-Linux64-v2.2/mash /usr/local/bin &&\ rm -r mash-Linux64-v2.2 - + # Update makeblastdb and blastp for prokka cd /opt/src wget ftp://ftp.ncbi.nlm.nih.gov/blast/executables/LATEST/ncbi-blast-2.10.1+-x64-linux.tar.gz && \ diff --git a/containers/Singularity.1.0 b/containers/Singularity.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2ef639f502c02cb20db9c4abf78ad047333a37a4 --- /dev/null +++ b/containers/Singularity.1.0 @@ -0,0 +1,157 @@ +Bootstrap: docker +From:python:3.7-stretch + +%post + # Update apt-get packages + apt-get update &&\ + apt-get -y upgrade + + # To use the "local" python, not the system one. + export PATH="/usr/local/bin":$PATH + # To avoid using python things installed in the HOME of root + # (that will be mounted during singularity build) + export PYTHONNOUSERSITE=1 + + # Install packages needed + apt-get install -y wget + + # Upgrade pip + pip3 install --upgrade pip + + # For manually-installed programs + mkdir -p /opt/src + + # Install mash + cd /opt/src + wget https://github.com/marbl/Mash/releases/download/v2.2/mash-Linux64-v2.2.tar &&\ + tar -xf mash-Linux64-v2.2.tar &&\ + rm mash-Linux64-v2.2.tar &&\ + mv /opt/src/mash-Linux64-v2.2/mash /usr/local/bin &&\ + rm -r mash-Linux64-v2.2 + + # Update makeblastdb and blastp for prokka + cd /opt/src + wget ftp://ftp.ncbi.nlm.nih.gov/blast/executables/LATEST/ncbi-blast-2.10.1+-x64-linux.tar.gz && \ + tar zxvpf ncbi-blast-2.10.1+-x64-linux.tar.gz &&\ + cp /opt/src/ncbi-blast-2.10.1+/bin/makeblastdb /usr/local/bin/ &&\ + cp /opt/src/ncbi-blast-2.10.1+/bin/blastp /usr/local/bin/ &&\ + rm ncbi-blast-2.10.1+-x64-linux.tar.gz + + # Install barrnap + cd /opt/src + wget 
https://github.com/tseemann/barrnap/archive/0.8.tar.gz &&\ + tar -xf 0.8.tar.gz &&\ + rm 0.8.tar.gz &&\ + mv /opt/src/barrnap-0.8/bin/barrnap /usr/local/bin &&\ + # Remove heavy useless files + rm -r /opt/src/barrnap-0.8/examples /opt/src/barrnap-0.8/build/*.aln + + # Install prodigal + cd /opt/src + wget https://github.com/hyattpd/Prodigal/archive/v2.6.3.tar.gz &&\ + tar -xzf v2.6.3.tar.gz &&\ + rm v2.6.3.tar.gz + cd /opt/src/Prodigal-2.6.3 + make &&\ + make install + + # Install prokka: + cd /opt/src + apt-get install -y\ + libdatetime-perl \ + libxml-simple-perl \ + libdigest-md5-perl \ + git \ + default-jre \ + bioperl + git clone https://github.com/tseemann/prokka.git + /opt/src/prokka/bin/prokka --setupdb &&\ + ln -s /opt/src/prokka/bin/prokka /usr/local/bin + + # Install MMseqs2 Version: f05f8c51d6e9c7c0b15fbd533e4b678303f50b3e + cd /opt/src + wget https://mmseqs.com/latest/mmseqs-linux-sse41.tar.gz &&\ + tar xvfz mmseqs-linux-sse41.tar.gz &&\ + rm mmseqs-linux-sse41.tar.gz &&\ + mv /opt/src/mmseqs/bin/mmseqs /usr/local/bin &&\ + # remove useless files + rm -r /opt/src/mmseqs + + + # Install mafft 7.313 + rm /usr/bin/mafft # remove mafft installed with bioperl + cd /opt/src + wget https://mafft.cbrc.jp/alignment/software/mafft-7.313-with-extensions-src.tgz &&\ + tar xf mafft-7.313-with-extensions-src.tgz &&\ + rm mafft-7.313-with-extensions-src.tgz + cd /opt/src/mafft-7.313-with-extensions/core + make clean &&\ + make &&\ + make install + + + # Install FastTree version 2.1.11 Double precision (No SSE3) + cd /opt/src + wget http://www.microbesonline.org/fasttree/FastTree.c &&\ + gcc -DOPENMP -fopenmp -DUSE_DOUBLE -Wall -O3 -finline-functions -funroll-loops -o FastTreeMP FastTree.c -lm &&\ + ln -s /opt/src/FastTreeMP /usr/local/bin + + + ## Install FastME FastME 2.1.6.1 + cd /opt/src + apt-get install -y automake &&\ + git clone https://gite.lirmm.fr/atgc/FastME.git + cd /opt/src/FastME + ./configure &&\ + make &&\ + make install + + + # Install quicktree + cd 
/opt/src + git clone https://github.com/tseemann/quicktree + cd quicktree + make &&\ + ln -s /opt/src/quicktree/quicktree /usr/local/bin + + + # Install iqtree + cd /opt/src + wget https://github.com/Cibiv/IQ-TREE/releases/download/v1.6.12/iqtree-1.6.12-Linux.tar.gz + tar -xzf iqtree-1.6.12-Linux.tar.gz &&\ + rm iqtree-1.6.12-Linux.tar.gz &&\ + ln -s /opt/src/iqtree-1.6.12-Linux/bin/iqtree /usr/local/bin + + + # Install iqtree2 + cd /opt/src + wget https://github.com/Cibiv/IQ-TREE/releases/download/v2.0.6/iqtree-2.0.6-Linux.tar.gz + tar -xzf iqtree-2.0.6-Linux.tar.gz &&\ + rm iqtree-2.0.6-Linux.tar.gz &&\ + ln -s /opt/src/iqtree-2.0.6-Linux/bin/iqtree2 /usr/local/bin + + + # Install PanACoTA + cd /opt/src + wget https://github.com/gem-pasteur/PanACoTA/archive/v1.0.tar.gz + tar -xzf v1.0.tar.gz + cd /opt/src/PanACoTA-1.0 + ./make + + +%environment + export LC_ALL=C + # To use the "local" python, not the system one. + export PATH="/usr/local/bin":$PATH + # To avoid using python things installed in the HOME of the user + # (that will be mounted during container execution) + export PYTHONNOUSERSITE=1 + + +%runscript + if [ "$*" ] + then + exec /usr/local/bin/PanACoTA "$@" + else + exec /usr/local/bin/PanACoTA -h + fi diff --git a/containers/Singularity.1.0.1 b/containers/Singularity.1.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..50668430c564cb9e4d09dc112093a8b7ce1abd31 --- /dev/null +++ b/containers/Singularity.1.0.1 @@ -0,0 +1,157 @@ +Bootstrap: docker +From:python:3.7-stretch + +%post + # Update apt-get packages + apt-get update &&\ + apt-get -y upgrade + + # To use the "local" python, not the system one. 
+ export PATH="/usr/local/bin":$PATH + # To avoid using python things installed in the HOME of root + # (that will be mounted during singularity build) + export PYTHONNOUSERSITE=1 + + # Install packages needed + apt-get install -y wget + + # Upgrade pip + pip3 install --upgrade pip + + # For manually-installed programs + mkdir -p /opt/src + + # Install mash + cd /opt/src + wget https://github.com/marbl/Mash/releases/download/v2.2/mash-Linux64-v2.2.tar &&\ + tar -xf mash-Linux64-v2.2.tar &&\ + rm mash-Linux64-v2.2.tar &&\ + mv /opt/src/mash-Linux64-v2.2/mash /usr/local/bin &&\ + rm -r mash-Linux64-v2.2 + + # Update makeblastdb and blastp for prokka + cd /opt/src + wget ftp://ftp.ncbi.nlm.nih.gov/blast/executables/LATEST/ncbi-blast-2.10.1+-x64-linux.tar.gz && \ + tar zxvpf ncbi-blast-2.10.1+-x64-linux.tar.gz &&\ + cp /opt/src/ncbi-blast-2.10.1+/bin/makeblastdb /usr/local/bin/ &&\ + cp /opt/src/ncbi-blast-2.10.1+/bin/blastp /usr/local/bin/ &&\ + rm ncbi-blast-2.10.1+-x64-linux.tar.gz + + # Install barrnap + cd /opt/src + wget https://github.com/tseemann/barrnap/archive/0.8.tar.gz &&\ + tar -xf 0.8.tar.gz &&\ + rm 0.8.tar.gz &&\ + mv /opt/src/barrnap-0.8/bin/barrnap /usr/local/bin &&\ + # Remove heavy useless files + rm -r /opt/src/barrnap-0.8/examples /opt/src/barrnap-0.8/build/*.aln + + # Install prodigal + cd /opt/src + wget https://github.com/hyattpd/Prodigal/archive/v2.6.3.tar.gz &&\ + tar -xzf v2.6.3.tar.gz &&\ + rm v2.6.3.tar.gz + cd /opt/src/Prodigal-2.6.3 + make &&\ + make install + + # Install prokka: + cd /opt/src + apt-get install -y\ + libdatetime-perl \ + libxml-simple-perl \ + libdigest-md5-perl \ + git \ + default-jre \ + bioperl + git clone https://github.com/tseemann/prokka.git + /opt/src/prokka/bin/prokka --setupdb &&\ + ln -s /opt/src/prokka/bin/prokka /usr/local/bin + + # Install MMseqs2 Version: f05f8c51d6e9c7c0b15fbd533e4b678303f50b3e + cd /opt/src + wget https://mmseqs.com/latest/mmseqs-linux-sse41.tar.gz &&\ + tar xvfz mmseqs-linux-sse41.tar.gz 
&&\ + rm mmseqs-linux-sse41.tar.gz &&\ + mv /opt/src/mmseqs/bin/mmseqs /usr/local/bin &&\ + # remove useless files + rm -r /opt/src/mmseqs + + + # Install mafft 7.313 + rm /usr/bin/mafft # remove mafft installed with bioperl + cd /opt/src + wget https://mafft.cbrc.jp/alignment/software/mafft-7.313-with-extensions-src.tgz &&\ + tar xf mafft-7.313-with-extensions-src.tgz &&\ + rm mafft-7.313-with-extensions-src.tgz + cd /opt/src/mafft-7.313-with-extensions/core + make clean &&\ + make &&\ + make install + + + # Install FastTree version 2.1.11 Double precision (No SSE3) + cd /opt/src + wget http://www.microbesonline.org/fasttree/FastTree.c &&\ + gcc -DOPENMP -fopenmp -DUSE_DOUBLE -Wall -O3 -finline-functions -funroll-loops -o FastTreeMP FastTree.c -lm &&\ + ln -s /opt/src/FastTreeMP /usr/local/bin + + + ## Install FastME FastME 2.1.6.1 + cd /opt/src + apt-get install -y automake &&\ + git clone https://gite.lirmm.fr/atgc/FastME.git + cd /opt/src/FastME + ./configure &&\ + make &&\ + make install + + + # Install quicktree + cd /opt/src + git clone https://github.com/tseemann/quicktree + cd quicktree + make &&\ + ln -s /opt/src/quicktree/quicktree /usr/local/bin + + + # Install iqtree + cd /opt/src + wget https://github.com/Cibiv/IQ-TREE/releases/download/v1.6.12/iqtree-1.6.12-Linux.tar.gz + tar -xzf iqtree-1.6.12-Linux.tar.gz &&\ + rm iqtree-1.6.12-Linux.tar.gz &&\ + ln -s /opt/src/iqtree-1.6.12-Linux/bin/iqtree /usr/local/bin + + + # Install iqtree2 + cd /opt/src + wget https://github.com/Cibiv/IQ-TREE/releases/download/v2.0.6/iqtree-2.0.6-Linux.tar.gz + tar -xzf iqtree-2.0.6-Linux.tar.gz &&\ + rm iqtree-2.0.6-Linux.tar.gz &&\ + ln -s /opt/src/iqtree-2.0.6-Linux/bin/iqtree2 /usr/local/bin + + + # Install PanACoTA + cd /opt/src + wget https://github.com/gem-pasteur/PanACoTA/archive/v1.0.1.tar.gz + tar -xzf v1.0.1.tar.gz + cd /opt/src/PanACoTA-1.0.1 + ./make + + +%environment + export LC_ALL=C + # To use the "local" python, not the system one. 
+ export PATH="/usr/local/bin":$PATH + # To avoid using python things installed in the HOME of the user + # (that will be mounted during container execution) + export PYTHONNOUSERSITE=1 + + +%runscript + if [ "$*" ] + then + exec /usr/local/bin/PanACoTA "$@" + else + exec /usr/local/bin/PanACoTA -h + fi diff --git a/doc/source/starting.rst b/doc/source/starting.rst index e47a546a2ddcc6dfeff055f17df88b6558dc1ff0..1c24a46e2f5098f67d3d282a30c283be9d8c070c 100755 --- a/doc/source/starting.rst +++ b/doc/source/starting.rst @@ -151,7 +151,9 @@ We provide a singularity image, to help running PanACoTA on a cluster. First, download the singularity image:: - singularity pull --name panacota.img shub://gem-pasteur/PanACoTA + singularity pull --name panacota.img shub://gem-pasteur/PanACoTA[:version] + +If you want a specific version, like version 1.0, specify ``shub://gem-pasteur/PanACoTA:1.0``. If you want the latest version, use ``shub://gem-pasteur/PanACoTA`` or ``shub://gem-pasteur/PanACoTA:latest``. 
Then, you can run PanACoTA in the same way as previously, using: diff --git a/setup.py b/setup.py index 7ce41fa008e6c63ce3098162ecf47c50f501c839..1d763e24925d3e8a60b61761dfc79bb218fed5cb 100755 --- a/setup.py +++ b/setup.py @@ -47,7 +47,7 @@ scripts = ['bin/PanACoTA'] classifiers = [ "Environment :: Console", "Intended Audience :: Science/Research", - "License :: AGPL v3", + "License :: OSI Approved :: GNU Affero General Public License v3", "Programming Language :: Python :: 3", "Operating System :: OS Independent", "Topic :: Scientific/Engineering :: Bio-Informatics", @@ -63,13 +63,13 @@ setup( description="Large scale comparative genomics tools: annotate genomes, do pangenome, " "core/persistent genome, align core/persistent families, infer phylogenetic tree.", long_description=long_description, + long_description_content_type="text/markdown", author='Amandine Perrin', author_email='amandine.perrin@pasteur.fr', license='AGPL v3', platforms='OS Independent', package_data={'': ['LICENSE']}, - download_url='??', - url='??', + url='https://github.com/gem-pasteur/PanACoTA', scripts=scripts, include_package_data=True, install_requires=requires, diff --git a/test/data/annotate/exp_files/exp_ALL-GENOMES-QC.lst b/test/data/annotate/exp_files/exp_ALL-GENOMES-QC.lst index ec6c0fb477026bc66abe8fdfc7460f57191a5b31..ebe711bc93e6b5658d59e8a7b291ca392b0d9b8b 100644 --- a/test/data/annotate/exp_files/exp_ALL-GENOMES-QC.lst +++ b/test/data/annotate/exp_files/exp_ALL-GENOMES-QC.lst @@ -1,4 +1,5 @@ orig_name to_annotate gsize nb_conts L90 B2_A3_5.fasta-changeName.fna B2_A3_5.fasta-changeName.fna 120529 5 4 H299_H561.fasta-all.fna H299_H561.fasta-all.fna 13259 7 3 -A_H738.fasta-all.fna A_H738.fasta-all.fna 20031 5 1 +A_H738.fasta-all.fna A_H738.fasta-all.fna 20066 5 1 +complete_genome.fna complete_genome.fna 88 1 1 diff --git a/test/data/annotate/exp_files/exp_A_H738.fasta-all.fna_prokka-split3N.fna b/test/data/annotate/exp_files/exp_A_H738.fasta-all.fna_prokka-split3N.fna new file 
mode 100644 index 0000000000000000000000000000000000000000..f284e70de0bce8992f89f5d8611b735ef13b0680 --- /dev/null +++ b/test/data/annotate/exp_files/exp_A_H738.fasta-all.fna_prokka-split3N.fna @@ -0,0 +1,14 @@ +>1_H738_S10 L001_R1_001_(paired)_contig_1 +GAAATATAGGGGCAAATCCATTGTGTATTCCTGACGGCAAAAATAAGGAATATAAAGAAATGATTGCTTTGGTTTCTTACAACACATCATTCCCTTTTCATTTAATAAAGCGGCATGATACAAAGTGAACATGATTTCGATTTACATTGCCACCATACCGCTTCAGACAACCGGTACATTACTTTGTTATAAGACGTGATATATAATTCAAAACAACGTGGTTTTGATTATTCATATCTCATAATAAAAGTCGCGTCAGCATTTGCTTGCCCTGCTGATGCACTTGTACCGGTGCCTTTATAACGTGCAGAAAAATGAAGAACGTTGGTCCCGGGGATCAAGTTCTGGTTGGTTGAGAAGCTATTCCCATCAGGTTTGAGAATTGCGGATGTATTATCAAGTATTTCAATACCGACACCCGTTGCTGTTGTTGTATTGGTACTGGATGCAATGGCCAATAAATTATCATTGATTGCATCAGCCTGACCAGAAAATGCAACGGCAGCATTAGCGGCAACAACAGGATCGCAGTCGTTCAACTGAATGGTGAATGGAATTAATGCAGAGGTATTACCAACAGCATTGAAAATATCGGTACGATATTGACCGAGTGTGACAACCTGGTCTGCCGAGTCAGTATTCACTGAACAGGCAGCATTCACCAGTTCGCCTTCAAAGTGAATTGTACCGCCATCTACAACGGCAGCATAACTACCCGTAGCGGCGAATAGTGCGGCAGCCAGCGCAGACGAAATAAATCTTAATTTCATATATATTCCTTCAATCTCATTTATCGACTCCACATCCGTATATAACCGATTACTTTATTTAAGACACTGATAGTAGTAAATTCCTTTTTATCCTCTAAGAATGTCTTAATTGAAAATATGCACTCTATTCTAAAAAATAGAGAGCCCCGTTAGATGAATACTTCCGCGCAAAATATATTCAACACAAATATAGACCTGAAGCGGTAAATTACCAGGCTGAAAATTCTTTTTATATTGTCAGGTATTTCTTAAATTATCTTAATCCTTAGACAAGGAAATAAATCAGTTCCAGATTTACAACGCCATCATGGACGAAAAATGAAGCTTTCAGTCTCAGCGACGGTGCGCCTCACCTTCGCAAGAGGTCGCTTCACGCGATAAATCTGAAACGAAACCTGACAGCGCGCCCCGCTTCTGACAAAATAGGCGCATCCCCTTCGATCTACGTAACAGATGGAATCCTCTCTCTGATGGCAGCAAAGATTATTGACGGTAAAACGATTGCGCAGCAGGTGCGCTCTGAAGTTGCTCAAAAAGTTCAGGCGCGTATTGCAGCCGGACTGCGGGCACCAGGACTGGCCGTTGTGCTGGTGGGTAGTAACCCTGCATCGCAAATTTATGTCGCAAGCAAACGCAAGGCTTGTGAAGAAGTCGGGTTCGTCTCCCGCTCTTATGACCTCCCGGAAACCACCAGCGAAGCGGAGCTGCTGGAGCTTATCGATACGCTGAATGCCGACAACACCATCGATGGCATTCTGGTTCAACTGCCGTTACCGGCGGGTATTGATAACGTCAAAGTGCTGGAACGTATTCATCCGGACAAAGACGTGGACGGTTTCCATCCTTACAACGTCGGTCGTCTGTGCCAGCGCGCGCCGCGTCTGCGTCCCTGCACCCCGCGCGGTATCGTCACGCTGCTTGAGCGTTACAACATTGATACCTTCGGCCTCAACGCCGTGGTGATTGGCGCATCGA
ATATCGTTGGCCGCCCGATGAGCATGGAACTGCTGCTGGCAGGTTGCACCACTACAGTGACTCACCGCTTCACTAAAAATCTGCGTCATCACGTAGAAAATGCCGATCTATTGATCGTTGCCGTTGGCAAGCCAGGCTTTATTCCCGGTGACTGGATCAAAGAAGGCGCAATTGTGATTGATGTCGGCATCAACCGTCTGGAAAATGGCAAAGTTGTGGGCGACGTCGTGTTTGAAGACGCGGCTAAACGCGCCTCATACATTACGCCTGTTCCCGGCGGCGTTGGCCCGATGACGGTTGCCACGCTGATTGAAAACACGCTACAGGCGTGCGTTGAATATCATGATCCACAGGATGAGTAACATGGCGACATTTTCTTTAGGTAAACATCCGCACGTTGAGCTGTGCGACTTGCTGAAACTGGAAGGCTGGAGCGAAAGCGGCGCGCAGGCGAAAATCGCGATTGCCGAAGGCCAGGTGAAAGTCGACGGTGCGGTTGAAACGCGCAAACGCTGCAAAATCGTCGCCGGTCAGACAGTGAGTTTTGCAGGTCACAGCGTACAGGTTGTTGCCTGATCCCTTTCCCGGCCTGTATCAACAGGCCGGTTCTCTTTTCAGACTTTTGCCCTCTACGCCCCGTTCATCCATGCTGATAGCATCGACATTTTGCCGAAGCGACCATCATGCCAACCGTTATTACGCACGCCGCCGTTCCCCTATGCATTGGTTTAGGGTTGGGTTCGAAAGTCATCCCTCCGCGTCTGTTATTTGCCGGAATCATCCTGGCGATGCTGCCCGACGCCGACGTATTGTCGTTTAAATTTGGCGTTGCTTACGGCAATGTTTTTGGTCATCGCGGGTTTACCCATTCGCTGGTGTTTGCGTTTGTTGTCCCGCTGTTATGTGTGTTTATTGGACGCCGATGGTTCAGGGCTGGGCTGATTCGCTGCTGGCTGTTTTTAACCGTCTCGTTGCTATCGCACAGCTTGCTGGATTCGGTAACCACTGGCGGTAAAGGCGTTGGCTGGCTGTGGCCGTGGTCAGATGAACGCTTTTTCGCTCCCTGGCAGGTGATAAAAGTCGCGCCGTTTGCATTGTCTCGTTACACCACGCCGTACGGGCATCAGGTGATTATTTCTGAATTGATGTGGGTGTGGTTGCCGGGGATGCTACTGATGGGAATGTTGTGGTGGCGCAGACGATAACCGGATGCGAAAACTCGCATCCGGCAATAGCGCAATTACTTACGACGCCAGGTGGTCCCTTGCGGGCCATCTTCCAGCACGATCCCCATCTCGTTAAGACGATCACGCGCCGCATCCGCCGCCGCCCAGTCTTTCGCTTTACGGGCATCCAGACGCTGTTGAATTAACGCTTCAATCTCAGCCACTTCGCT +>2_H738_S10 L001_R1_001_(paired)_contig_1 
+GTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGGTTCTTGCTCCAGCAGGCCCAATACAGCGGAAAGTTTACGCAGGTGAGATGCCATTGCATTCGCCGCTGCCATATCTTCTGCTTTCAGACGGTTTACTTCACGCGCCATATCAAACAGTACGGAATAGGCTTCCGGGGTGTTGAAATCGTCGTCCATCGCTTCAATAAAGCGCGCTTCAAACGCTTCGCCACCGGCAGGCGCAACGGTTTTATCTGTGCCGCGCAGCGCAGTGTAGAGACGCTCCAGCGCCGCACGCGCCTGCTTCAGGTTCTCTTCGCTGTAGTTCAACTGGCTGCGATAGTGGCCCGACATCAGGAAGTAACGCACGGTTTCCGCGTCGTAGTATTTCAGCACATCGCGCACGGTAAAGAAGTTACCCAGCGATTTGGACATCTTCTCGCGGTCAACCATCACCATCCCCGAGTGCATCCAGTAGTTCACATACTGACCATCATGGGCACAGGTGGACTGCGCGATTTCGTTTTCGTGGTGCGGGAACATCAGGTCTGAACCGCCGCCGTGGATATCAAAGTGGTTACCCAGCTGCTTGCAGTTCATTGCCGAACATTCAATGTGCCAGCCAGGACGACCCGCGCCCCACGGAGACGGCCAGCTCGGTTCGCCCTCTTTCGACATCTTCCACAGAACGAAGTCCATTGGGTTGCGTTTGTCGTCGACCACGTCAACGCGCGCGCCTGCCTGCAGCTGGTCGAGATCCTGACGCGACAGCACGCCATAAGTTGGATCGGTCGGGACGTCGAACATCACGTCGCCGTTGTCCGCCACATAAGCGTGACCTTTGGCGATCAGTTGTTCAGTGAGTTCAATAATTTCTGCGATATGGTGCGTCGCGCGCGGCTCCATATCCGGGCGCAGAATGTTCAAAGCATCAAAATCTTTGTGCATTTCGGCGATCATGCGATCCACCATCGCCACAAAGCTTTCGCCATTTTCATTGGCGCGTTTGATGATTTTGTCGTCGATATCGGTAATGTTGCGCACATACTTCAGTTTATAGCCGAGGAAACGCAGATAGCGCGCAACCACGTCAAAAGCAACAAAGGTACGCCCGTGACCGATATGACAGAGATCGTAAACGGTGATTCCACACACGTACATGCCGACTTCCCCGGCGTGAATAGGCTTAAATTCCTCTTTTTGGCGTGTCAGAGTATTGAAGATTTTTAGCATCGAAGATTCCGTTTAGACATGTGTGGGTAATTGAGTTGCGTATAATACCCATATTTCCCGCGCGAATCAGCATACATTGCGTGATGATCCGATCGTGCGGTTATGCTATAACACCACCCTATATATGACCCGAACTGGGTTGAAGCACCAATCAAACGGAACAGGATGCAAAAATGGTTACTTTCCACACCAATCACGGCGATATTGTCATCAAAACTTTTGACGATAAAGCACCTGAAACAGTTAAAAACTTCCTGGACTACTGCCGCGAAGGTTTTTACAACAACACCATTTTCCACCGTGTTATCAACGGCTTTATGATTCAGGGCGGCGGTTTTGAACCGGGCATGAAACAAAAAGCCACCAAAGAACCGATCAAAAACGAAGCCAACAACGGCCTGAAAAATACCCGTGGTACGCTGGCAATGGCACGTACTCAGGCTCCGCACTCTGCAACTGCACAGTTCTTCATCAACGTGGTTGATAACGACTTCCTGAACTTCTCTGGCGAAAGCCTGCAAGGTTGGGGCTACTGCGTGTTTGCTGAAGTGGTTGACGGCATGGACGTGGTAGACAAAATCAAAGGTGTTGCAACCGGTCGTAGCGGTATGCACCAGGACGTGCCAAAAGAAGACGTTATCATTGAAAGCGTGACCGTTAGCGAGTAATCGTGGCGACACTCTTTATTGCAGATCTTCATCTCTGCGTGGAAGAACCGGCGATCACCGCCGGTTTTCTGCGTTTTTTAGCGGGGGAAGCCCGCAAGGCC
GACGCGCTGTATATTCTTGGCGATCTGTTTGAAGCATGGATTGGCGACGACGATCCCAACCCACTCCATCGCAAGATGGCGGCGGCGATCAAAGCGGTGTCCGATTCCGGCGTTCCCTGTTATTTCATTCATGGCAACCGTGATTTTCTGCTCGGCAAACGCTTTGCCCGTGAAAGTGGCATGACGTTATTGCCGGAAGAAAAGGTGCTCGAACTTTATGGTCGCCGGGTGTTGATTATGCATGGCGACACGCTGTGCACCGATGACGCGGGTTATCAGGCTTTTCGCGCCAAGGTCCACAAACCCTGGCTGCAGACGCTATTCCTCGCCCTGCCGTTGTTTGTGCGCAAACGCATTGCCGCGCGAATGCGCGCGAACAGCAAAGAAGCCAACAGCAGTAAATCGCTGGCGATCATGGACGTTAACCAAAACGCGGTGGTCAGTGCGATGGAAAAACATCAGGTGCAATGGCTGATCCACGGGCATACCCATCGCCCGGCGGTGCATGAACTTATCGCTAATCAGCAACCTGCTTTTCGCGTGGTACTGGGTGCCTGGCATACGGAAGGTTCAATGGTGAAAGTCACGGCGGATGACGTTGAGCTGATTCATTTTCCGTTTTAAAAAACCCGCAACTTTGCTGATTTCACAGCCACGCAACCGTTTTCCTTGCTCTCTTTCCGTGCTATTCTCTGTGCCCTCTAAAGCCGAGAGTTGTGCACCACAGGAGTTTTAAGACGCATGTCTTCCCGCAATAATCCGGCGCGTGTCGCCATCGTGATGGGGTCCAAAAGCGACTGGGCTACCATGCAGTTCGCCGCCGAAATCTTCGAAATCCTGAATGTCCCGCACCACGTTGAAGTGGTTTCTGCTCACCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAAGCGCCGAAGAGAACGGTTATCAGGTGATTATTGCGGGCGCAGGCGGCGCAGCGCATCTGCCAGGCATGATTGCCGCCAAAACGCTGGTGCCGGTGCTGGGCGTGCCAGTACAGAGCGCCGCACTGAGCGGTGTCGATAGCCTCTACTCCATCGTACAAATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATTGGTAAAGCTGGCGCGGCAAACGCGGCGTTACTGGCAGCACAAATTCTTGCGACTCATGATAAAGAACTGCACCAGCGTCTGAATGACTGGCGCAAAGCCCAGACCGACGAAGTGCTGGAAAACCCGGACCCGCGAGGTGCGGCATGAAACAGGTTTGCGTCCTCGGTAACGGGCAGTTAGGCCGTATGCTGCGTCAGGCAGGCGAACCGTTAGGCATTGCTGTCTGGCCAGTCGGGCTGGACGCTGAACCGGCGGCGGTGCCTTTTCAACAAAGCGTGATTACCGCTGAGATAGAACGCTGGCCGGAAACCGCATTAACCCGCGAGCTGGCGCGCCATCCGGCCTTTGTGAACCGCGATGTGTTCCCGATTATTGCTGACCGTCTGACTCAGAAGCAGCTTTTCGATAAGCTCCACCTGCCGACTGCACCGTGGCAGTTACTTGCCGAACGCAGCGAGTGGCCTGCGGTGTTTGATCGTTTAGGTGAGCTGGCGATTGTTAAGCGTCGCACTGGTGGTTATGACGGTCGCGGTCAATGGCGTTTACGCGCAAATGAAACCGAACAGTTACCGGCAGAGTGTTACGGCGAATGTATTGTCGAGCAGGGCATTAACTTCTCTGGTGAAGTGTCGCTGGTTGGCGCGCGCGGCTTTGATGGCAGCACCGTGTTTTATCCGCTGACGCATAACCTGCATCAGGACGGTATTTTGCGCACCAGCGTCGCTTTTCCGCAGGCCAACGCACAGCAGCAGGCGCAAGCCGAAGAGATGCTGTCGGCGATTATGCAGGAGCTGGGCTATGTGGGCGTGATGGCGATGGAGTGTTTTGTTACCCCGCAAGGTCTGTTGATCAACGAACTGGCACCGCGTGTGCATAACAGCGGTCACTGGACACAA
AACGGTGCCAGCATCAGCCAGTTTGAGCTGCATCTGCGGGCGATTACCGATCTGCCGTTACCGCAACCAGTGGTGAATAATCCGTCGGTGATGATCAATCTGATTGGTAGCGATGTGAATTATGACTGGCTGAAACTGCCGCTGGTGCATCTGCACTGGTACGACAAAGAAGTCCGTCCGGGGCGTAAAGTGGGGCATCTGAATTTGACCGACAGCGACACATCGCGTCTGACTGCGACGCTGGAAGCCTTAATCC +>3_H738_S10 L001_R1_001_(paired)_contig_1 +CGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAGAGTAAGTTCGGTTAACTGGTGCTCTATTCTTGCCGGATGCGGCGTAAACGCCTTATCCGGCCTACCGATCCGGTACCCATTGTAGGCCTGATAAGATGCGTCAAGCATCGCATCAGGCATTGTGCACCAATTGCCGGATGCGGCACCGGTTGTAGGCCTGATAAGACGCGTCAAGCGTCGCATCAGGCACAAATGTCTAATGCCTACGACTACAGCGAAATACAGGTCCCCGCTTCGCCCGCCAGCGTCTCTTCAATTCGCGATAACGCCCCAATCCACGCGGGTTTACCACGGCTTCTGACATAACCACTCACCGCCGTTACCTTCGGCCCCATCGAACCATCGGCTTTGGCAAATGGCGCTAACTCATCCGGTGTGGCATGGCGAATGGCACGTTGCTGCGGCGTTCCCCAGTTTTCATATACCGCATCAGCATCGGTGAGGATCACCAGTCCATCTGCATTAATCTGCTCGGCGAGCAACGCAGCGGCGAGATCTTTATCAATCACTGCTTCACTCCCTGCTCCGTCATCCGTCACAGGCACACCGCCGCCGCCACTGCAAATCACCACATGCCCCTCTTTTAGCAACAACTCGATGGCTTCGCTGTCGAGAATTTTACGCGGTTGCGGAGACGCCACCACCCGGCGCAAATATTTACCATCACGTTTCATCTGCCAGCCGTAAGCCGCTTCCAGTGCCTCTTGTTCTTCTGGCTGATAAACCGGACCAATAAATTTCTCTGGCTGCAAAAACGCCGGATCATCAGGCGAAACCTCAATGCGCGTCAGCACCGTCGTCACGGGCGGCATCTGCGGCTGTGCGCTCAAACTCTGCGCCAGCATATAGCCAATCATCCCCTGGCTTTCCGCAACCAGCACATCCAGCGGATACGGTTCTACCTCTTTCCACGCCAGATTCTGCAATGCCAGCAGCCCCACCTGCGGCCCGTTGCCGTGAACAATCGCCAACCGATAAGAACGGGCCAGGCGTGCCAGCGCGGGTACAGCACTGGCGATATTGCGATATTGATTTTCTGCCGTCAGCGCCTCACCGCGCTGGAGTAAGGCGTTGCCCCCAAGAGCCACAACCAGTGTTTTCATGGTTTTCCTTGTAATAATTGTTGGCCAAGCCAGAACCCCAGCAGCGTATCTGCCCCTGACGTATGCCCCAGCGCCAGCAGCGAATCAATCGCAACAGCGGTACGTTTCGGGCAACTCAGAGCATGAACAAAGTGCAGGAGTGGCGAGGCGAAATATCCTTGCGCGGCATAACGTAAATAACTGACGCTCACCGCTGTGGTAACGAGTTGCAGATTGTCGGAACAGGCAAAAAACGGACGACCGGAGCGCGCATCTAAAGCGCCATAATACCAGGCCGCCAGCAGCATTCCGCTCAGCGTGTCATCATGACTCGGCGTTAATCCGGGGCCTTTACCCAGCCAGTGCCGCCAGTCGGTCTTAACGCCATTGAGCGCGGCCTGAAAACAGTGACGAAACTGGCGTAACTCAGCAGGCAGCGGATCGCTTGCCGCCAACGCCAGTGGCCCGAAAAGCCCGGTTTCCTCCGCGCGTTGCATCCATGCAGCTGCAAGTGGTTGAGGATGCGCAGGCGGCGTAATACGCAGCAAACAATAACGCTGTGGCTGTTTAACC
GTGAAACGCCCGAGGCGAATCCCTTGAGCCACAACCTGTGGTCGTTCATTGCCGCATAATCCACCGCATAACGCATCGAATTGCGCACGGCGAAGCACCCATCCTCCGGGGCCGAAACCACTACCCTGACGATGCAACGTTAACAGTTCGCCGCTTTCCGTCATCAGGTTAATCGCCCGCCGCCACACTCCCGCTAACCGCCAGGACTGGCGATAATTCGGTGCGCTACTACTGGCAAGCAGAGGATGGATGATCGTCATTGCGCGTTCCTCAACCAATACCCATGCTTTCAGCCAGTGCTTCCAGCGCCTGTTCAAAGCACGCCAGCGGTGCCCGCACGGTGCCTGCGCCAATCTGCCCGATCCCCGCCTCTTTATGGGCGATACCGGTATTGATGAGTGGCGTAATGCCGGTTTCTACCACGCGACGAATGTCCAGCCCCAGGCACGCGCCCTGAAAATCCCAGCTTGGGATCTGCAACTGCATATTGCGTTCAAGGTAAATTTCCGCCATCTCTTCAGATACCGCTCTTGCCGCTTCCATGCCACCCGCACCGACAAAGCGCGTTACGCCAGGCGCTGCGATCATTGCCGCACCTCCGATACCAAAGGTTTCGGTAATCGCGCTATCGCCCATATCCGGGTTCGCCTGCTCCTGCGAGAAGCCGGTGAAAAACAGACCTTGCGGAGTGTTTACAGGCGCAGTAAACCAGCGTTCGCCCAGCCCGCTTACCCGAATCCCGAACATATTGCCGTTGCGGGTCATTGCCGTGACGATGCTGCCTGCGCGGATCATCGCGCCAGCATCCATCGCCGCCTTGCAGTAAGCCATCGCGAGGTTGAGGAAGAACTGATCGGTCACGCTGAGGAAATCCATCACTTCGGCGATGTGCTGTTTATCATGATCGAGGCGAGCAATTTGTGGGGCCAGCGCACGCATTAACAGTGCAGAGGAAGCAATATTGCGTTGATGGAACTCATCGCCCATCGTAATGCCCTGCGCCATCATCGCCGTGAGATCGATACCGCGCTCCATGCGCCCCAGCGCCGCGCTTAATACTGGCATTAACACATCGCGCATCCAGCGATGGCGAGTCAGGACATCTTCGCCGTAAGCGCCAAAACGCATCACTTTGCCGATACCTTCGTTGAGGTTGCAGTACGCCCGGTTGCCGTCGGTCACGTTCTCAACCACCAGCATCGGCATACTGGCAGAAGTAATACCGCCCATTGGCCCGACGGCATTCACATGGTGACAAGGAATGAAGTTCACTTCCCCCTGCTCCAGTATTGCCAGCGCCTGCGCTTCATCTTTCGCCCAACCTTCGAACAGACATGCGCCCACGCACGCCCCTTTCATGGGTCCGGTCATCTCCTGCCAGCGCATTGGCGGCCCGGCGTGAAGCAGTGTTTTGCCCTCGTTTAGTTCGCTGATAAGTGAAGAAGCCGGTTGCACATCCAGCCAGTGTGGACGAGCGCGACGAATTTGTTCGATAACCGCAGCATTGGCTTGCGCCACTGATGTAAACATGGGAACCCCTTATTGCAAACGTTCTAATAAACGAGCCAGTTTTTTATTGCCACCGGCGACTGGCGACCATTGGTAATGCACAACCGGTTTGCTGGCGCTTTGTAGCTCCAGCGCAAAGCTGCGTAATCCGATGTTAATCACGGCGACGTTTTCCAGTAATGACGGTGTGTGTTGCTGTGCGGCAGGCGAGAGCGGATGAATTAACGCTGCCGCCAGCAAGGTGGCTTCCGGTAGCGAACTCACGACCGCAATCCCCGCATCTTCCAGCGTGGCGATTTGCTGCGAGCGGCATTGCGGGTCACGTTCAGTGCCTGTCACCGTGGCAATGGCATACAGTGGTTGATTATCTAAACGCGCGGCACAGGCTTTTTGCCAGGCGCTCACCAGCGAGGCGGCAGGATCGGCGGTCGCACCGAAGCCAATCACGACATCAAGCAGCAACACGCGCACTTGCGGTTTAGCGCCGAGAT
CGGCAATTAACTGGTTGCGTAAGGTTGGGTCGATCATCGGATGGGGACGCCCGACGGTGTAGAAATCATCGCCGAGGTCAATAATCTGGTGGCTATCGGCGTCCAGCATCATGCCATGTTGATGGGTATCGTCGGCTTCCACGCCAAGGTGTCCGGCAAGTAATCCCGCCGCTTCGGCAGCCAGCGTACCGCCGGTATACAAACCGCAAATAAATCCGCTGCTGACAGGCGCTATTGCGTTACGTCGCGCCGTGACGCGTGAAAGCAGGCAAGCCAGGCGTGCGGCCTCATCCAGCGAGGAGGCAAACCAGACATTCTCGTCGCGGGCCACCGCCGGGGTATAACCTAAAAACAGCGCCACCGTCGGTTTGCCGGTTGCTTTCATGGCATTAACAATTTTCAGACGCACAGCTTCGGCAGGTGGTTTTGAAACAAATGCCAGCACTTCGCTTTTCTCGTCTGCACTGAGCATTTCCAGCGCTGTTAGCGCACTGATGCCGCCCACTTCACGGCTGAGGTCGCGCCCGCCAAGGCCAATCGCGTGAGTAATTCCCTCCCCTGCCAGCGCAATCTGCGAACACAGCTCCTGAATCCCGGTACCGGAAGCGCCAATGACGCCAATATTGCCTTCCGGCATCACGTTAGCAAAAGCCAGCGGTGTGCCGGCAATCATCGACGTACCGCAGTCCGGCCCCATCACCAGCAAGCCTTTTTCCCGCGCGCGGGTTTTAAGTTGGATTTCATCTTCCAGCGTGACGTTATCGGAGAACATCATCACGTTGAGGTTGCGATCCAGCGCCTGGTTTGCCAGCTCCGCCGCATACTCGCCAGCCACTGAAATCAGCGCCAGATTGGCATCGGGTAATTTCTGACAGGCACTGTCCCAGCGACGCACCTGCATCAACGCCTGGCTGCTGCCTGACCCCTGCGCCAGTTGTTTTAGCGCCTCTTCAAGCTGCTGCATAATCGCCTGCGCGATCCCCGCATCCGCCGCTTCGCTACGAATTGCCACGCAAATATCGTTCGGCGTGGCGTTATTAAAATCGTCATGCCAGAAACCTGTGGTATCTAATAACGCTTTATTGGCGGGCGTACCCATCATTACGGAAACATCATCAACATTTTCTGATTCGCTGAGTTTTCGTGAAATAATCATTAAACTGACCGAATCCTGAAAACACCCTTTTTTAATAAAGGCGTGGATCATAACAACTCCTTAAAAATTGCACCCATGGCAATTGCACGAGCAGTGTTAATGTGGCGATTACGGTATCGATGACAACGAGTAAATAAGGTGATGAATATCACACAGGAATTATTAACAAAAGAATTCAAATAACCACCAGGCTATTACTCATTATTTTTTAATAAGCGTTGTTGTTTTAAAAATCAGGTTAAAAGTGAGCGGATTATCAAATAAATTCTAACTATATTTTTTTGCCTGTCTGGATCACATAATCCAGATATTTTCCCTGTATGTTAATTGCAGTCATGCTTCACACCGTCGTTAAAAAGGAAGACAGATGAAAATCAGTCGGGAAACACTCCACCAGCTAATTGAGAATAAACTCTGCCAGGCTGGGTTAAAACGTGAGCACGCTGCAACCGTGGCTGAAGTATTGGTTTACGCCGATGCCAGAGGGATCCACTCTCATGGCGCGGTGCGCGTGGAATACTACGCGGAACGCATTTCAAAAGGCGGCACCAACCGCGAACCGGAGTTTCGTCTTGAGGAAACCGGGCCGTGCTCGGCAATTTTACATGCCGACAATGCCGCCGGACAGGTCGCGGCGAAAATGGGTATGGAACATGCCATCAAAACCGCCCAGCAAAATGGCGTTGCGGTGGTCGGTATCAGCCGGATGGGTCACAGCGGCGCAATCTCTTATTTTGTGCAGCAGGCAGCCCGCGCCGGATTCATTGGCATTTCGATGTGCCAGTCCGATCCAATGGTGGTGCCGTTTGGCGGCGCGGAAATTTACTACGGTACTAACCCCCTG
GCCTTTGCCGCGCCGGGAGAAGGCGACGAGATCCTTACCTTTGATATGGCGACTACCGTACAGGCATGGGGAAAAGTGCTCGACGCCCGCTCGCGTAATATGTCTATCCCGGATACCTGGGCGGTCGATAAAAACGGTGTACCAACAACCGATCCGTTCGCGGTACATGCTCTGCTCCCCGCCGCCGGGCCAAAAGGGTATGGCCTGATGATGATGATTGACGTCCTCTCAGGCGTCTTACTCGGCTTACCGTTCGGGCGACAGGTTAGTTCGATGTATGACGATTTACACGCAGGGCGTAATTTGGGGCAATTACATATAGTTATTAATCCGAACTTTTTCTCCTCCAGCGAATTATTCCGTCAACATCTTAGCCAGACCATGCGCGAATTAAATGCCATTACCCCCGCGCCCGGTTTTAATCAGGTTTATTATCCCGGACAGGATCAGGATATTAAACAACGCAAAGCCGCCGTCGAAGGCATCGAAATTGTTGATGATATTTACCAGTATTTAATTTCCGACGCGCTTTATAACACGTCATACGAAACGAAAAATCCCTTTGCGCAATAATTATTGAGACAGGACTTTCTTATGATTACACATTTCCGTCAAGCTATAGAAGAAACGCTGCCCTGGCTTTCCTCTTTTGGCGCTGACCCAGCGGGTGGGATGACCCGTTTACTTTATTCGCCGGAATGGCTGGAAACCCAGCAGCAATTTAAAAAAAGAATGGCAGCAAGCGGGCTGGAAACACGTTTCGATGAAGTGGGGAATTTATACGGTCGCCTGAATGGCACCGAATATCCACAGGAAGTGGTTCTGAGCGGTTCGCATATCGATACCGTGGTTAACGGCGGTAACCTTGACGGGCAATTCGGCGCGCTGGCGGCGTGGCTGGCAATTGACTGGCTGAAAACGCAATACGGCGCGCCGCTACGTACGGTCGAAGTGGTGGCGATGGCAGAAGAAGAAGGCAGCCGCTTCCCGTATGTCTTCTGGGGCAGTAAAAATATTTTTGGGCTGGCGAATCCTGACGACGTGCGGAATATCTGTGATGCCAAAGGAAATAGTTTTGTCGATGCGATGAAGGCTTGCGGATTTACTCTTCCGAACGCCCCACTAACTCCGCGTCAGGATATTAAAGCCTTTGTTGAACTGCATATTGAACAGGGCTGTGTGCTGGAAAGTAATGGGCAATCAATTGGCGTGGTGAATGCAATTGTCGGGCAGCGTCGTTATACGGTAACGCTGAACGGCGAATCAAACCATGCAGGCACCACGCCGATGGGTTATCGTCGTGATACAGTTTACGCTTTCAGTCGCATTTGCCATCAGTCGGTCGAAAAAGCGAAAAGGATGGGCGATCCGCTGGTTCTGACCTTTGGCAAAGTAGAGCCGCGCCCGAATACGGTAAATGTGGTGCCGGGTAAAACCACGTTCACCATTGATTGTCGTCATACCGACGCTGCCGTGCTGCGCGATTTCACCCAACAGTTAGAAAACGACATGCGGGCGATTTGCGATGAAATGGACATTGGTATTGATATCGATTTATGGATGGACGAAGAACCCGTGCCGATGAATAAGGAGCTGGTCGCCACCCTGACAGAATTGTGTGAAAGAGAAAAACTGAATTACCGGGTGATGCACAGTGGTGCCGGGCACGACGCGCAAATTTTCGCGCCTCGCGTACCAACCTGCATGATTTTTATCCCCAGCATCAACGGGATCAGCCATAACCCGGCGGAACGCACCAATATTACCGACCTTGCCGAAGGGGTCAAAACGTTGGCACTCATGCTTTATCAACTTGCCTGGCAGAAATAAGGAGTCATAAATGGGATATTTAAATAACGTCACCGGTTACCGCGAAGATTTACTGGCTAACCGTGCGATTGTTAAACACGGTAATTTCGCACTGTTAACCCCGGATGGTCTGGTAAAAAATATTATTCCGGGCTTTGAAAATTGTGACGCGACAATCCTCTCCACGCCAA
AGCTGGGTGCCTCTTTTGTTGATTATCTGGTCACACTGCATCAAAACGGTGGCAACCAACAGGGCTTCGGTGGCGAAGGCATTGAAACGTTCCTGTATGTGATCTCTGGAAATATCACTGCCAAAGCCGAAGGCAAAACATTTGCCTTAAGCGAAGGTGGCTATCTTTATTGCCCGCCAGGCTCCTTAATGACGTTTGTTAACGCCCAGGCCGAAGACAGCCAAATCTTTTTATATAAGCGCCGCTATGTTCCGGTAGAAGGCTATGCACCGTGGCTGGTTTCTGGCAATGCCAGCGAACTGGAACGCATTCATTATGAAGGCATGGACGATGTTATTCTGCTGGATTTTCTGCCCAAAGAGTTAGGTTTTGATATGAACATGCATATCCTCTCTTTTGCACCAGGTGCCAGCCACGGTTATATCGAAACACACGTTCAGGAACACGGTGCCTATATTCTTTCCGGTCAGGGGGTTTATAACCTCGACAATAACTGGATCCCGGTGAAAAAAGGCGATTACATCTTTATGGGCGCTTATTCTTTACAGGCTGGTTATGGTGTAGGGCGTGGTGAAGCGTTCAGCTATATTTACTCGAAAGATTGTAACCGCGACGTAGAGATTTAAGTCATACCACTCGCCTGATTATTTTTAGCTATGTTGGATTTTGCCACGGTTTATACCGTGGCTTTTTTTGTAACATTGCCTGATGCGCTTCGCTTATCAGGCCTACATGATCTCTGCAATATATAGAATTTGCGCGATTTTCAGGAAGGATATGGTACTCATGCCGCATCCGGCATGAGTACTGCACTCTTATGCGATATAAATCGCATCCGCTTTAAAGGTAAGGGTTAGTTTTTAATTCCCTGACCTATTTTAATGGCGCAGGCAATATTTCGCGCGCTGTTGAAGAGATTGGTTTCACCGCTGGCGAGCACTTCGGCTAAAGGTGCCAGACGAGGCAAAATGCTGAATACCGCGTCAATGCCGTACTGGTGCACCACTTCCACGCCATCACCCAATACGCCAGCAATCCCAATCACCGGTACATTAAACTGCTTCGCCACCGACGCCACACCCAGCGGCGCTTTACCGCCTGCCGTTTGCGAGTCGATGCGCCCTTCCCCGGTAATCACCAGTGCTGCGCCCTGCACTGCCTGCGCAAGATTGACCGCATTCAACACAATTTCAATGCCCGGTTTAATATCCGCATTGAGAAATACCGCCGCCGCAATACCCATACCGCCCGCAGCGCCGCCGCCCGCCATCTGGCAGACATTAATTTCAGTTTGCTGTTGTAAAACACGGGCGTAATTTTGCAGCCCCTGTTCAAGTTCTTCGACCATCTCCGGCGTTGCCCCTTTTTGCGGGCCAAACACCGCCGCCGCGCCGCGTGCCCCTACCAGCGGGTTATCAACGTCACATGCTACTTCAATATGGCAATTCGCCAGACGCGGATCGCATTCATCCATCTCAATGCTTGCCACGCGCGCTAAATTACCACCGTTTGCCGCCAGCGCCTGACCGTCGGCATCAAGGAAACGCACACCGAGCGCCTGCGCCATGCCCATACCGCCGTCGACCGTCGCACTGCCGCCAATGCCGAGAATAATATGGCGAATGTCGTTATCCAGCGCATGACGAATTAACTCCCCCGTACCAAAACTGGAGGCCAGCAACGGATTACGCTTTTCAGGCGCGACCAGCATCAGGCCACTTGCTGCCGCCATCTCAATCACCGCCGTTTTCCCGTCGCCGGTAAGGCCATAAAAAGCATTCACTTTTTCGCCCATCGGCCCGCAGACTTCAAGCGTCACGATGTTGCCGCCCGTCGCGGCGACCATCGCATCCACCGTCCCTTCGCCGCCATCCGCTATCGGCAAACAGATATAGTTCGCATCGGGAAAGAGGGTCGAAAACCCGGCTTTAATTGCCTGACAACATTTTTCTGCACTTAAGCTCTCTTTAAAAGAGTCTGGCGCAATGACAATCTTCATT
ATCAATCCTTTTTCAACAAATTATTCGATGCGTTCCCACGGAATAAGGTTATCCATAAGAACAGCCAGTAAAATCCCGACCAATAAGCCGTTACTGAGCAGAGGACGAAGCGTTAATGGAAGGTCTTGCAGATACACAGGCGGTAATGCCATTAAAAATATGCCGACAAATAACGGCAATGCGAGTCGATAAATATTGCGAGCGGTAAACGTTATTTGCTGGCTAAACACCAGCGCGGAAAAGAGTAAAGGCAGATAAGAAACCAGCATGACCGCACTACTCACGGGTAAAGGGATACTGCAAAACAGTCGCGTGAGTGCAGGAACCAGCGCCACCAGCAGGCAAATAACGCTGCCATAAATAAACGAACGCCGCGTGTAATCGCCAGTCTGGGTTAATAAACCAATGGATGAAACAAACGGTGAAAATGGAATTACCGCCAGCGGTACGGTTATCAGCGTCATAAATCCGGTCGCCACAAAGCTACGACGATAACGCGTATTCCCTGCGCCCTGCTGCGGATAAAAAACATCCGTGCCCCGAATCGCACCGTAGGTATTGCTGATATTTACCAGACCTGTAATCACCGCCGTCAGAATAATTCCCGGCGACAAAGCACCGCCACTGCCGAGCGGGAACCACTGCCAGTGCAACTCACCGGAGAGCGAGTGCGAAGAAGGAAAGCAAAAGTACCACAACAACCAGCCGGTTATGGTGCCGACCAGCAGGCCATAACGGGCAAAACGTTGCGGCAGGAAGATAATCATCGCCAGTACCAGGCACATCACCGCCACCGAGAGCGCGAACGGCGGTAACTGAATTTTAAAATTCGGGTCGGCTATGCCAAACGGCAGCCCGAGCATACCTTTGAAAAAGATAGTGGTCAGCTGCGCGCCCAGCATCAACATAAACAAGACCATCACCGACGGCGTAAATAACCGTGCCAGGCGATGGCCTAATCCGCTAAAACCAATCAACATCGTCAGCACGCCGGAGAGTGCAATCCCCACTGCCAGGCTGGTGGCGATATCGTTGATCGGTGTCCCGCGCGATGCTTCACCAAGGGTGATAGTAAGGATGGTTCCCCACCACAGGCCACCTGGCCCTTCCATAATAGCGCGACGATGACCGCAAAACGCCTGAGCGAAGCAGGCCAGTGCGGTAGCAAGAAAAGCATATTGCGTGAGCGTAAGCAGGCTACTTTGCGGCAACTGAAAAGCAGAAAGTAGCGTAGGAGGAACCACAACCGTGTTGCAAAAAATAAAGAAAAACCACTGAAATCCTGATAACAGGCTTTCGCGGCTGACTGCAAAATTGAACATAAACACACCTTAACCGGAGAATGCCCGCCGCAAGGACGGGCATTGCAGGGGCCAGATTACTGCTGATGTTTAAGGATAAATTGACCTTTCGGCGCAACAGGGAAGCCCTGTTCAATGTCGTAAATCACATCACCACGTAAGATGGTTTTCGTGATACGCGCGCCAATGGTACGGCCAACATACGGGCTGACTTTGTGGCGATATTCCAGATCGTCATTGGTAAGAACATAGCTGCTATTCGGCTGAATGAAGACGAAGTCGGCATCTTTTCCTGGGGCGATACGGCCTTTTTGCTGCAGACCGAAAATATCTGCTGCGTTAGTCGCCATTAATTTGCCGAACATTGGCAGAGACATACCGCGTTTCTGTACCGCTTCATCGAACATCACGTCCATGCAGCTTTGCAGACCGGCGATACCGCCCCATGCTTTCATGATGTTACCGGCTTTCATTTCCGGCGGGCATGGAGAGTGGTCGGAAACCAGGCAGTCGATTTCACCGTTAAACAGTTTTTCCCACATGCCTTTCTGGTTTTCCAGATCGCGGATCGGCGGTGAACACTTCGCCAGAGTACCGATTTCTTCGAACTGATCGGTATCCAGTACAAAGTAATGCGGGCAGGATTCACAAGTAACGTCCTGACCTTCCTGACGTGCACGAGTCACTTCCTCAACACCT
TCCGGGCTGCTGACGTGGCAAACGTGCAGACGGCAACCAGCAACTTTCGCCAGATACAGTACGCGGCGAATTGCTTCCACTTCGGTAAATACCGGACGCGAAGCCACATAGTCATGAGCGGTTACGCGACCTTCACGCTTCGCTTCTTCGCCCAGTTCGTCACAAATCAGCGCGTTTTCGCAGTGCACCAGCACCGGCTGACCCAGTTCGCCCAGCTTCTGCGCACCTTTGAAGAACTGCCAGTCGTTTACATCACGGAAGTCGTTGTCGATACCGCGATCGCCACAGGTCGCAACGAAGCATTTGAAGCCGACAACGCCCACTTCATCCAGCTCATGCAGACGGTCGATGTTGTAAGACACCAGGCCACCGAGTTGTGCCGCATCAATAGTCAGCTTGCCTTTAGCGGCATCGAACTTCAGTTCAATTGAAGCGCGGTCAACCGTTGCAGGCAGCTGGTTGAGCGGCATTTCGATCATGGTGGTGATACCACCTTTTGCCGCTGCGCGAGTACCGGTTTCATAACCTTCCCAGTGGCTACGACCCGGTTCAGAAATATGGGTGTGCGCATCAACCATGCCCGGCGAAACCACCAGACCAGACGCATCCATAACTTCTTTTGCATCGCCCAGATCCTGACCGATAGCAGCAATTTTTCCGCCTTTAACGGCGATATCTACAACGCGAGCTTCGTTTTCTAAAATAACGGTGCCGTTTTTAATGATTAAATCAAAAGACATAACAAACTCCTTGTAAAATACAGATTGGTTTTTAACTCAATGTTCAATATCGGGATTAATTAACCTATGGTTTTTTGCTCTCCTGTTTTTTCTGCTGTTGTACGTTTCTTTAATAAGGCGTAGGCCGCAAAGGCGACGATGACGC +>4_contig1 dgfdgd +ACGTTGCTGCGAATCGAGCTGTCTAGCGATCGAG +>5_contig2 +CGA +>6_contig3 +ATTCGGGCTTGA +>7_contig4 +AT diff --git a/test/data/annotate/exp_files/exp_complete_genome.fna_prokka-split3N.fna b/test/data/annotate/exp_files/exp_complete_genome.fna_prokka-split3N.fna new file mode 100644 index 0000000000000000000000000000000000000000..59df2730ff1596ed1c1fe1f3b4e332d9d85d0f67 --- /dev/null +++ b/test/data/annotate/exp_files/exp_complete_genome.fna_prokka-split3N.fna @@ -0,0 +1,2 @@ +>1_complete +CCGCTTAGGCTAGCGCCAGCTAGGAGCGCTCGAGAGACACAGCATTACNCCGATATTATAGAGGCCGCGCTTAGCACGCTAGGACGCG diff --git a/test/data/annotate/exp_files/exp_split_contig_cut3N.fna b/test/data/annotate/exp_files/exp_split_contig_cut3N.fna index d221ee3dd69d9f0361438df8b7413de308b1ace6..79c95494f384fabe70f6a98cea45473f7ac4d55e 100644 --- a/test/data/annotate/exp_files/exp_split_contig_cut3N.fna +++ b/test/data/annotate/exp_files/exp_split_contig_cut3N.fna @@ -1,4 +1,4 @@ ->my_contig_name_for_my_sequence_2 +>2_my_contig_name for_my_sequence AACTGCTTTTTAAGCGCGCTCCTGCG ->my_contig_name_for_my_sequence_3 +>3_my_contig_name 
for_my_sequence GGTTGTGTGGGCCCAGAGCGAGNCG diff --git a/test/data/annotate/exp_files/exp_split_contig_nocut.fna b/test/data/annotate/exp_files/exp_split_contig_nocut.fna index 8cdf33404f0ce78a2d56272b1dab695bbcd662a6..f6d01ad9e592c90a7522d79c69346f6ccae6fa6a 100644 --- a/test/data/annotate/exp_files/exp_split_contig_nocut.fna +++ b/test/data/annotate/exp_files/exp_split_contig_nocut.fna @@ -1,2 +1,2 @@ ->my_contig_name_for_my_sequence_2 +>2_my_contig name for my_sequence AACTGCTTTTTAAGCGCGCTCCTGCGNNNNNGGTTGTGTGGGCCCAGAGCGAGNCG diff --git a/test/data/annotate/exp_files/exp_split_empty_contig.fna b/test/data/annotate/exp_files/exp_split_empty_contig.fna index 0c5be8ca78c215b25d7d56dc1081445b0fb37d72..d123f54018d2913e99fc8b30aeff2cb0561f2bca 100644 --- a/test/data/annotate/exp_files/exp_split_empty_contig.fna +++ b/test/data/annotate/exp_files/exp_split_empty_contig.fna @@ -1,2 +1,2 @@ ->my_contig_name_for_my_sequence_2 +>2_my_contig_name_for_my_sequence AACTGCTTTTTAAGCGCGCTCCTGCGNGGTTGTGTGGGCCCAGAGCGAGNCG diff --git a/test/data/annotate/exp_files/genome2-split5N.fna b/test/data/annotate/exp_files/genome2-split5N.fna index e58ea8921d9107096f6e753605306c43b67174bc..f2053a5ebcd7fcf3cb453ae93c59a1aef67571c8 100644 --- a/test/data/annotate/exp_files/genome2-split5N.fna +++ b/test/data/annotate/exp_files/genome2-split5N.fna @@ -1,10 +1,10 @@ ->contig1 dgfdgd_1 +>1_contig1 dgfdgd ACGTTGCTGC ->contig1 dgfdgd_2 +>2_contig1 dgfdgd AGCTGTCTAG ->contig2_3 +>3_contig2 CGACGNNCGAG ->contig2_4 +>4_contig2 AGGTG ->contig3_5 +>5_contig3 ANNNNGGCTTGAGGTTGAA diff --git a/test/data/annotate/exp_files/res_create_gene_prokka-miss-lastGene.gen b/test/data/annotate/exp_files/res_create_gene_prokka-miss-lastGene.gen new file mode 100755 index 0000000000000000000000000000000000000000..7651710aad1253c7a8dafa1a07cafec1de668861 --- /dev/null +++ b/test/data/annotate/exp_files/res_create_gene_prokka-miss-lastGene.gen @@ -0,0 +1,37 @@ +>test.0417.00002.0001b_00001 501 NA | hypothetical protein | NA 
| NA | NA +aacgcgcatccagcgctagagacgctctcgacgagc +cagatctgca +cacaacaggtcgcgctcg +>test.0417.00002.0001i_00005 1653 yiaD | putative lipoprotein YiaD | NA | similar to AA sequence:UniProtKB:P37665 | NA +cagagatgcccc +ccgcgttt +>test.0417.00002.0001b_00008 3001 vgrG1 | Actin cross-linking toxin VgrG1 | 6.3.2.- | similar to AA sequence:UniProtKB:Q9KS45 | NA +aaccggcctcgcgcatcgcatcagcag +>test.0417.00002.0002b_00009 1161 NA | hypothetical protein | NA | NA | NA +acgctagagagctcgcgctaagagatc +>test.0417.00002.0002i_00010 1068 NA | hypothetical protein | NA | NA | NA +CCGAATAGCGCGCTCAGAGAGAGAGGA +CGATAGCTCTCGCA +CCGCATAGC +>test.0417.00002.0002i_00011 582 NA | hypothetical protein | NA | NA | NA +AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC +>test.0417.00002.0002i_00011 501 NA | hypothetical protein | NA | NA | NA +CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +>test.0417.00002.0002b_00011 369 NA | hypothetical protein | NA | NA | NA +CCGAGATCGCGCGCGCTCTTCTCGAGA +>test.0417.00002.0003b_00013 1140 NA | hypothetical protein | NA | NA | NA +AGCTCTCGAGAGGAGCGCTCGA +CGCTCGCGCA +CCTATAGGAACCACCGGGG +>test.0417.00002.0004b_00014 3354 NA | hypothetical protein | NA | NA | 12345 +CAGGATAGCGCGCTCAGAG +>test.0417.00002.0004b_00016 44128 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P32 | 56 +AAGGGATATGGCCACACAGTT +>test.0417.00002.0007b_02927 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA +CCAGAGATCGCGCGC +>test.0417.00002.0007i_02928 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA +AGATATGGCGCGCTCTCTC +>test.0417.00002.0007i_03015 1638 NA | hypothetical protein | NA | NA | NA +AGATCCGCGCGCTATAGAGC +>test.0417.00002.0007i_03016 1761 NA | hypothetical protein | NA | NA | NA +AAGGATCTCTCGCGAGAGGA diff --git a/test/data/annotate/exp_files/res_create_gene_prokka-missGene.gen b/test/data/annotate/exp_files/res_create_gene_prokka-missGene.gen new file mode 100755 index 0000000000000000000000000000000000000000..fa72d9cf0323c3ebe9abfd91827472060c547afd --- 
/dev/null +++ b/test/data/annotate/exp_files/res_create_gene_prokka-missGene.gen @@ -0,0 +1,37 @@ +>test.0417.00002.0001b_00001 501 NA | hypothetical protein | NA | NA | NA +aacgcgcatccagcgctagagacgctctcgacgagc +cagatctgca +cacaacaggtcgcgctcg +>test.0417.00002.0001i_00005 1653 yiaD | putative lipoprotein YiaD | NA | similar to AA sequence:UniProtKB:P37665 | NA +cagagatgcccc +ccgcgttt +>test.0417.00002.0001b_00008 3001 vgrG1 | Actin cross-linking toxin VgrG1 | 6.3.2.- | similar to AA sequence:UniProtKB:Q9KS45 | NA +aaccggcctcgcgcatcgcatcagcag +>test.0417.00002.0002i_00010 1068 NA | hypothetical protein | NA | NA | NA +CCGAATAGCGCGCTCAGAGAGAGAGGA +CGATAGCTCTCGCA +CCGCATAGC +>test.0417.00002.0002i_00011 582 NA | hypothetical protein | NA | NA | NA +AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC +>test.0417.00002.0002i_00011 501 NA | hypothetical protein | NA | NA | NA +CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +>test.0417.00002.0002b_00011 369 NA | hypothetical protein | NA | NA | NA +CCGAGATCGCGCGCGCTCTTCTCGAGA +>test.0417.00002.0003b_00013 1140 NA | hypothetical protein | NA | NA | NA +AGCTCTCGAGAGGAGCGCTCGA +CGCTCGCGCA +CCTATAGGAACCACCGGGG +>test.0417.00002.0004b_00014 3354 NA | hypothetical protein | NA | NA | 12345 +CAGGATAGCGCGCTCAGAG +>test.0417.00002.0004b_00016 44128 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P32 | 56 +CAGGATAGCGCGCTCAGAG +>test.0417.00002.0007b_02927 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA +CCAGAGATCGCGCGC +>test.0417.00002.0007i_02928 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA +AGATATGGCGCGCTCTCTC +>test.0417.00002.0007i_03015 1638 NA | hypothetical protein | NA | NA | NA +AGATCCGCGCGCTATAGAGC +>test.0417.00002.0007i_03016 1761 NA | hypothetical protein | NA | NA | NA +AAGGATCTCTCGCGAGAGGA +>test.0417.00002.0007b_03017 1080 NA | hypothetical protein | NA | NA | NA +CCAGGATAGCGCGCGC diff --git a/test/data/annotate/exp_files/res_create_gene_prokka.gen 
b/test/data/annotate/exp_files/res_create_gene_prokka.gen index 3a30831773727c399f51e934748498457b608c51..0e9b0c846400299fb19c1429abd2e3fd25699b49 100755 --- a/test/data/annotate/exp_files/res_create_gene_prokka.gen +++ b/test/data/annotate/exp_files/res_create_gene_prokka.gen @@ -19,15 +19,14 @@ AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA >test.0417.00002.0002b_00011 369 NA | hypothetical protein | NA | NA | NA CCGAGATCGCGCGCGCTCTTCTCGAGA ->test.0417.00002.0003b_CRISPR1 2671364 crispr | crispr-array | NA | NA | NA -aagcgctctgcg -cgctcg >test.0417.00002.0003b_00013 1140 NA | hypothetical protein | NA | NA | NA AGCTCTCGAGAGGAGCGCTCGA CGCTCGCGCA CCTATAGGAACCACCGGGG >test.0417.00002.0004b_00014 3354 NA | hypothetical protein | NA | NA | 12345 CAGGATAGCGCGCTCAGAG +>test.0417.00002.0004b_00016 44128 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P32 | 56 +AAGGGATATGGCCACACAGTT >test.0417.00002.0007b_02927 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA CCAGAGATCGCGCGC >test.0417.00002.0007i_02928 77 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA @@ -36,7 +35,5 @@ AGATATGGCGCGCTCTCTC AGATCCGCGCGCTATAGAGC >test.0417.00002.0007i_03016 1761 NA | hypothetical protein | NA | NA | NA AAGGATCTCTCGCGAGAGGA ->test.0417.00002.0007i_CRISPR2 394 crispr | crispr-array | NA | NA | NA -AAACCGGCTCGGGCA >test.0417.00002.0007b_03017 1080 NA | hypothetical protein | NA | NA | NA CCAGGATAGCGCGCGC diff --git a/test/data/annotate/exp_files/res_create_gff-prokka.gff b/test/data/annotate/exp_files/res_create_gff-prokka.gff index 13f1386702c6222f5694ff88a8c2ad2373838399..1cf7b0d9e23a9572587ef3dad11f1566c98b5c89 100755 --- a/test/data/annotate/exp_files/res_create_gff-prokka.gff +++ b/test/data/annotate/exp_files/res_create_gff-prokka.gff @@ -14,12 +14,11 @@ test.0417.00002.0002 Prodigal:2.6 CDS 1279 2346 . + 0 ID=test. test.0417.00002.0002 Prodigal:2.6 CDS 2419 3000 . 
+ 0 ID=test.0417.00002.0002i_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0002i_00011;product=hypothetical protein test.0417.00002.0002 Prodigal:2.6 CDS 3500 4000 . + 0 ID=test.0417.00002.0002i_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0002i_00011;product=hypothetical protein test.0417.00002.0002 Prodigal:2.6 CDS 4632 5000 . - 0 ID=test.0417.00002.0002b_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0002b_00011;product=hypothetical protein -test.0417.00002.0003 Prodigal:2.6 repeat_region 296902 2968265 . - 0 ID=test.0417.00002.0003b_CRISPR1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P0A6C5;locus_tag=test.0417.00002.0003b_CRISPR1 test.0417.00002.0003 Prodigal:2.6 CDS 3399 4538 . + 0 ID=test.0417.00002.0003b_00013;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=test.0417.00002.0003b_00013;product=RecBCD enzyme subunit RecD test.0417.00002.0004 Prodigal:2.6 CDS 4535 7888 . + 0 ID=test.0417.00002.0004b_00014;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=test.0417.00002.0004b_00014;product=RecBCD enzyme subunit RecB +test.0417.00002.0004 Prodigal:2.6 CDS 888 45015 . - 0 ID=test.0417.00002.0004b_00016;eC_number=56;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=test.0417.00002.0004b_00016 test.0417.00002.0007 Prodigal:2.6 tRNA 3039279 3039355 . + 0 ID=test.0417.00002.0007b_02927;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=test.0417.00002.0007b_02927 test.0417.00002.0007 Prodigal:2.6 tRNA 3039389 3039465 . 
+ 0 ID=test.0417.00002.0007i_02928;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=test.0417.00002.0007i_02928;product=RecBCD enzyme subunit RecC test.0417.00002.0007 Prodigal:2.6 CDS 7854 9491 . + 0 ID=test.0417.00002.0007i_03015;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0007i_03015;product=hypothetical protein test.0417.00002.0007 Prodigal:2.6 CDS 9525 11285 . + 0 ID=test.0417.00002.0007i_03016;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0007i_03016;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 repeat_region 2994578 2994971 . + 0 ID=test.0417.00002.0007i_CRISPR2;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0007i_CRISPR2;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 CDS 11249 12328 . + 0 ID=test.0417.00002.0007b_03017;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0007b_03017;product=hypothetical protein \ No newline at end of file +test.0417.00002.0007 Prodigal:2.6 CDS 11249 12328 . 
+ 0 ID=test.0417.00002.0007b_03017;inference=ab initio prediction:Prodigal:2.6;locus_tag=test.0417.00002.0007b_03017;product=hypothetical protein diff --git a/test/data/annotate/exp_files/res_create_gff_prodigal.gff b/test/data/annotate/exp_files/res_create_gff_prodigal.gff index ebf97f8c9e8f22f15fe2eac1b8320a30c51d8ba7..5ec00adf5f8ab81d91ef00803ba931a6c04dc26d 100644 --- a/test/data/annotate/exp_files/res_create_gff_prodigal.gff +++ b/test/data/annotate/exp_files/res_create_gff_prodigal.gff @@ -1,11 +1,11 @@ ##gff-version 3 -##sequence-region test.0417.00002.0001 1 14000 -##sequence-region test.0417.00002.0002 1 5000 -##sequence-region test.0417.00002.0003 1 4600 -##sequence-region test.0417.00002.0004 1 8000 -##sequence-region test.0417.00002.0005 1 1 -##sequence-region test.0417.00002.0006 1 10 -##sequence-region test.0417.00002.0007 1 15000 +##sequence-region test.0417.00002.0001 1 84 +##sequence-region test.0417.00002.0002 1 103 +##sequence-region test.0417.00002.0003 1 122 +##sequence-region test.0417.00002.0004 1 35 +##sequence-region test.0417.00002.0005 1 198 +##sequence-region test.0417.00002.0006 1 128 +##sequence-region test.0417.00002.0007 1 85 test.0417.00002.0001 Prodigal:2.6 CDS 287 787 . + 0 ID=test.0417.00002.0001b_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein test.0417.00002.0001 Prodigal:2.6 CDS 4416 6068 . + 0 ID=test.0417.00002.0001i_00002;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD test.0417.00002.0001 Prodigal:2.6 CDS 9000 12002 . 
- 0 ID=test.0417.00002.0001b_00003;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00006;product=Major exported protein diff --git a/test/data/annotate/exp_files/res_create_lst-prokka.lst b/test/data/annotate/exp_files/res_create_lst-prokka.lst index 57202f541ef79647534d098b6ad5ba16686d7f4e..8156f9b810a710cd0736463b53a7a995da55802c 100755 --- a/test/data/annotate/exp_files/res_create_lst-prokka.lst +++ b/test/data/annotate/exp_files/res_create_lst-prokka.lst @@ -6,13 +6,12 @@ 2419 3000 D CDS test.0417.00002.0002i_00011 NA | hypothetical protein | NA | NA | NA 3500 4000 D CDS test.0417.00002.0002i_00011 NA | hypothetical protein | NA | NA | NA 4632 5000 C CDS test.0417.00002.0002b_00011 NA | hypothetical protein | NA | NA | NA -296902 2968265 C CRISPR test.0417.00002.0003b_CRISPR1 crispr | crispr-array | NA | NA | NA 3399 4538 D CDS test.0417.00002.0003b_00013 NA | hypothetical protein | NA | NA | NA 4535 7888 D CDS test.0417.00002.0004b_00014 NA | hypothetical protein | NA | NA | 12345 +888 45015 C CDS test.0417.00002.0004b_00016 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P32 | 56 3039279 3039355 D tRNA test.0417.00002.0007b_02927 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA 3039389 3039465 D tRNA test.0417.00002.0007i_02928 NA | tRNA-Met(cat) | NA | COORDINATES:profile:Aragorn:1.2 | NA 7854 9491 D CDS test.0417.00002.0007i_03015 NA | hypothetical protein | NA | NA | NA 9525 11285 D CDS test.0417.00002.0007i_03016 NA | hypothetical protein | NA | NA | NA -2994578 2994971 D CRISPR test.0417.00002.0007i_CRISPR2 crispr | crispr-array | NA | NA | NA 11249 12328 D CDS test.0417.00002.0007b_03017 NA | hypothetical protein | NA | NA | NA diff --git a/test/data/annotate/exp_files/res_create_prt_prokka.faa b/test/data/annotate/exp_files/res_create_prt_prokka.faa index 25dd86a301a7d469c930bfb638fa24e3c9167c25..c421ab5756b2e6041cf0736df74a2d7a3f777446 100755 
--- a/test/data/annotate/exp_files/res_create_prt_prokka.faa +++ b/test/data/annotate/exp_files/res_create_prt_prokka.faa @@ -25,6 +25,8 @@ CGCTCGCGCA CCTATAGGAACCACCGGGG >test.0417.00002.0004b_00014 3354 NA | hypothetical protein | NA | NA | 12345 CAGGATAGCGCGCTCAGAG +>test.0417.00002.0004b_00016 44128 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P32 | 56 +CCGAGGTGCGAGGTGTGTTGTGTGCG >test.0417.00002.0007i_03015 1638 NA | hypothetical protein | NA | NA | NA AGATCCGCGCGCTATAGAGC >test.0417.00002.0007i_03016 1761 NA | hypothetical protein | NA | NA | NA diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test.0417.00002.gen b/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test.0417.00002.gen new file mode 100644 index 0000000000000000000000000000000000000000..7143d6be6a7e775cbf1e0a62bdeccd7a6f4bfe34 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test.0417.00002.gen @@ -0,0 +1,1727 @@ +>test.0417.00002.0001b_00001 501 NA | NA | NA | ID=1_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.447 | NA +ATGGCCGACAGTTTCCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCA +ATGCTAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAAAGAGCA +ACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAGCGTCATGGCTGAGTTT +TCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAACGGTAATGAACAAAATATCGCGCTTG +AATTTAAAAGCCTGAAGGATTTTGAACCCGAACAGGTAGCAAAAAATATTCCGCAACTTCGTGTATTACT +CGCTATGCGCAATTTACTACGTGACCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTG +GAAAATATCCTGAAAGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGG +AGAACGTTTAA +>test.0417.00002.0001i_00002 1539 NA | NA | NA | ID=1_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.511 | NA +ATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTGAGTCCGGCGGCGTTT +ATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCATTCAGGAAATCGATTTATGGCAAAA +CAGCGAAACGCTGGCCGATGCCTCACCCGATGAGCGCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGT 
+CTGGCGAAATCAGGCGAGGACGTGGTTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGG +ATCAGAAAATCAGTAAACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTG +GCGTGGTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGGATATC +AGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTGGTTTATATCGCCATA +CATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCTCATTAATTTCCAGCTATGAATTTGA +TAACAGCCCGCAGGATATTGCCCTGCTGCGTAATATTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTT +ATCGGTTCTGTCGGACCGAAATTCTTCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCG +GCAACTACTTTGACCGCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGT +GGGATTAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCAGCTTT +AACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACGCCTCGTTCGCCTTTG +CCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGCAGATCCGTGGCCCACAGGCGGGCGG +CGCAGTGGCCGATCTGCCGATCCATCTTTACGATCTCGGCACCGGCAATCAGGTCAAAATTCCGTCCGAA +GTGATGATCCCGGAAACCCGCGAATTTGAATTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGA +ATCGCGATTACGCCTGCTTCTTCTCGGCGAACTCTGCCCAGAAACCGGCGTTGTACGATACCGCTGACGC +CACCGCCAACAGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATTACCTG +AAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAACTGGAGCTGAATACCT +GGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAACTTCAGGCTTCGCATCCACTGCGCGA +CGGGAAAGTTATCGTCGAGGACATAGAGGACAATCCGGGCTTCTTCCGCGTCAGACTCTTTGCCGTGCCG +CATTTCCAGATTGAAGGGATGGATATCAACCTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGA +>test.0417.00002.0001i_00003 1338 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.594 | NA +ATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTTCAGCAGCAGGCCC +GCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGCCATCCGTGGGGGATCGCAAACGT +GCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTGAAAACGCAGGCAGTACGCCTGCGTTTTGCTGAT +GGCACGCTGATCGATTCAGACGTGAGTGACGTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACG +ACAGCGCGATTGTTTTGCTGGCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCA +GACTGAAAGACCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGTGAA 
+GATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAGGATTACATCACCT +GCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAGGATGAGAGCTATATTCCGCCGTT +ACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGTCTGGACACATTGCTGTTGCAGCTACGGGCGAAG +TGCCAGCGTCTGATGGCGATGCGCCGGGAAAGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCT +CCCTGTTCTGGCTGCTTAACGCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGC +TGTCCACCCCGAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTTGAG +CATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCGCCCCTGTTCTCCC +TGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCGCTGGATCTGGCGTCCCTGCCGGG +CAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTGCGGGAAGAGGCCGATTTTTATCTGTCCGTTCGT +TCCTCACTGCCTGCGCATCAGGTACTGCATCAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATG +TCACGCTGCTTATCAACGTGGCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCT +GCCGCTGCGGCTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTGGAG +TCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTGTTTGCGGTGCTGC +GCACATGA +>test.0417.00002.0001i_00004 666 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.590 | NA +ATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCGACACGTTTCTGACGGTGGTGGAACTGC +GTCAGGGAACCACCGTGCGTCACGGTATCGAGCTGTATCGCCACTGTCAGCGGCAGGTGGAACTGGTCCG +CGAACGTCTGAAAGATGCCGGATTCAGTCGGGAGAACGTGGAGCACATAACTTACGCGCAGTGCGCCCTG +CTGGACGAAACGGTGCTCAGCCGTAGTGGCATGGACGACGGTCAGGCCATCTGGATGAAAAACCCACTCC +AGTCGCATTTCTTCAACACCCTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGCTACAGGA +ACCCGCCCCCGCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGGGATTTCGCGGGCGTTAT +CAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGCTCAACGGGCAGGTCGCGCCATTTGGTG +TGCTGCCGGAAACGGCGGTACTGAACGTGCCGTTATCCACCCGTCAGCACCCTTTGCTGCATTCGCCATT +TTTCTGGCTGGTAACACTGGCGCTGCTACTGGCGGGCGTCTGGTGGGGGCTACACCACTGGCTGAACGTG +CTGGTGGATGAACTGCTGCCGCAAAGCCTGCGTTAA +>test.0417.00002.0001i_00005 1653 NA | NA | NA | ID=1_5;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.614 | NA +GTGAGGAACACGCTGAAACAGGCCATCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTGTGGTCAGTGT 
+TTATCAGTCCGTCTGGCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTTCTGGCGGTTGCTGCGTTGTT +GATTTATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGCGATGCCGGGTTGTCATCGCTGCCGCCGGAA +ACCTACCGGCAGCCGGTAGTGCTGGTCTGCGGCGGTCTGTCGGCGCACCTGTTCACTGACAGCCCGGTCC +GGCAGGTTTCAGAAGGGCTGTATCTGCATGTTCCTGATGAAGAACAGCTTGTGGCGCAGGTGGAGCGATT +GCTGACCCTTCGCCCGGCGTGGGCATCGCAGCTTGCCGTGGCGTATACCGTCATGCCCGGCATACACCGG +GATGTGGCGGTTCTGGCCGGACGGCTGCGACGGTTTGCCCACAGTATGGCGACGGTGCGTCGCCGGGCGG +GCGTAAACGTCCCCTGGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTGCCGGAAAGAGCGAGTTCACC +GTGGTTTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACATCCACAGAGACCACCATGCCCGCGCAGTGG +ATTGCACAATCCGGCGTACAGGAGCGCAGTCAGCGACTCTGTTACCTGCTGAAAGCTGAAAGCCTGATGC +AGTGGCTGAATCTTAATGTGCTGACGGCACTGAACGGCCCGGAGGCGAAATGCCCGCCACTGGCGATGGC +CGTGGGGCTGGTCACCTCGTTGCCAGCGGTGGATAACAACCTGTGGCAAGTGTGGATCACCGCCAGAACC +GGCCTGACGACGGATATCGCGGACACCGGCACAGACGCCACGCTGCCGTTTCCGGATGCTCTGTTACGGC +AGTTGCCGCGTCAGTCGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACCATGCTGGGCATTACCACCGC +GGCGGGTATCACCATGTTGTGCCTGTCAGCCACGGCAAATCGCCAGTTATTACGGCAGGTCGGTGACGAT +CTGCACCGGTTTTATGCCGTCCCGGTGGAGGAATTTATCACCAAAGCCCGTCACCTGTCGGTGCTGAAAG +ACAATGCGACCATGCTCGATGGGTATTACCGGGAAGGAGAACCACTGCGCCTCGGTCTGGGGTTATACCC +CGGCGAACGCATCCGCCAGCCGGTATTACGCGCCATTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAG +GTGACGGCTTCGCTTCAGGTTCAGACCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTCGGACAGGCCC +GCCTGAAAGACGGCTCGACAAAAGTGCTGGTGGATGCGCTGGTGAACATCCGGGCAAAACCGGGCTGGCT +GATCCTCGTGGCCGGATATACCGACGCCACCGGCGATGAAAAAAGCAATCAGCAGTTATCGCTGCGGCGT +GCCGAAGCGGTGCGCAACTGGATGCTGCAGACCAGCGACATCCCGGCCACCTGTTTTGCCGTACAGGGAC +TGGGCGAGAGCCAGCCTGCGGCGACCAACGACACGCCACAGGGCCGGGCAGTCAACCGGCGTGTCGAAAT +CAGTCTTGTTCCGCGTTCTGACGCCTGTCAGGACGTGAAATAA +>test.0417.00002.0001i_00006 492 NA | NA | NA | ID=1_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.514 | NA +ATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAGGTTCCGTGGACGTTC +AGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATGTGTACATCCCGACCGACAATAACAC +CGGCAAACTGACCGGTACCCGTACTCACAAGCCCTTTACGTTTACCAAAGAAATCGATGCCTCCAGCCCG 
+TATCTCTACAAAGCTGTGACCACCGGACAGACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACG +ATGCCGGTCAGGAAGTGGAGTACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCT +TATGCACGACATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCTACGAG +AAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATGAGCGTCCTTCCGCCT +GA +>test.0417.00002.0001i_00007 2637 NA | NA | NA | ID=1_7;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.603 | NA +ATGACAGGAAATCACTCCGCCGCGCTGCTGCGTCGCCTTAACCCATACTGTGCACGGGCGCTGGACGCTG +CCGCCTCACTGTGTCAGACCCGCGCCCATGCGGAAATAACCATTGAACACTGGCTGCTGAAACTGCTGGA +GCAGGGAGAAGGCGATATCACGGTGATTGCCCGCCGCTATGAATGGGATATCGACACGCTCTGGCAGTCT +CTGCTGGCACATCTGGACACCTTACCCCGCCCGGTCCGCGAACGTCCTCAACTTTCTGAACCGCTGGCAG +CGCTTATCCGACAGGCGTGGCTGATAGCGTCACTGGAAGGCGACGATCCACAAATCCGCAGCCAGCATCT +GCTGATGGCGCTGACAGAAAAACCGATGCTGCCCGCCTGTAATGACCTGTGGGTATTGCTGAGTCTGAGC +CGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTGGATGCGCAGTCGGATGAATGTCCGGCACGTCAGCCAC +AGGTCACCGAACCGCTGACCTCTGCACTGCCGGAGACGGCAACGGCGGACGCACCGGCAAAAACGCTGAC +GGAGAAACAGGATGACGCCCTGCTGGCGGTGCTTAACCGCTTTACCGAAGACGTGACGGAAAAAGCCCGC +AGCGGGCGAATCGACCCGGTATTCGGGCGCGACACGGAAATTCGCCAGATGGTCGATATCCTCTCCCGTC +GCCGCAAAAACAACCCGATTCTGGTGGGAGAACCGGGGGTGGGCAAAACCGCGCTGGTGGAAGGGCTGGC +GCTGCGTATCACCGAAGGCAACGTGCCGGACAGCCTGAAAACGGTGCATATCCGCACACTGGACCTCGGT +CTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAATTTGAACAGCGGCTGAAAAATGTCATCGATGCAGTGC +AGAAATCACCGGAGCCGGTACTGCTGTTTATTGATGAAGCCCATACCATTATCGGTGCGGGTAATCAGGC +AGGCGGCGCGGATGCGGCGAACCTGCTGAAACCGGCACTGGCAAGGGGCGAACTGCGCACCATCGCGGCG +ACCACGTGGAGCGAATACAAACAGTATTTTGAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAGATGGTTA +AGGTTGACGAGCCGGATGATGACACCGCCTGTCTGATGCTGCGGGGACTGAAGGCTCGCTATGCACAGCA +CCACGGCGTGCATATGCTGGACAGCGCCATTCAGACCGCCGTGCGCCTGTCGCGCCGCTATCTGACCGGA +CGCCAGCTGCCGGACAAGGCGGTTGATTTGCTGGATACCGCCGGGGCAAGAGTCCGCATGAGCCTTGACA +CCCTGCCGGAACCGTTGACGCAGCTTCATGCGCGACTGGCGGCACTGGATATTGAGCGGGAAGCGATTGA +GCAGGACAGCGTATTTTATCCCGAAGCCAGCCCGGAGCGGCTGGCGGAACTGACCGATTTGCGTGATGAG 
+CTACAGGCAGAAGCCGGGCATCTGGAAGCGCAGTATCAGCAAGAAAAGGCACTGGCGCAGCAGATTATGA +CGTTGCGTCAGGAAGGAACAGACAGCTCTGAACTGCAACAGCAACTGCGGACGCATCAGGGCTTTGCACC +GCTGCTGGCGCTGGATGTGGACGCCCGCGCCGTCGCCACGGTGGTGGCGGACTGGACCGGCATCCCGCTC +TCTTCCTTGCTCAAGGACGAGCAGAGCGACCTGCTCAGTATGGAACAGAGTCTTGAAAACCGCGTTGTCG +GGCAAAGCCCGGCGCTCTGCGCCATCGCACAGCGGCTGCGGGCGGCTAAGACCGGCCTCACGCCGGAGAA +CGGCCCGCAGGGGGTATTCCTGCTGACCGGCCCCAGCGGCACCGGTAAAACCGAAACTGCGCTCACACTG +GCCGACACTCTGTTTGGCGGTGAAAAATCCCTTATCACCATTAATCTTTCGGAATATCAGGAACCGCATA +CCGTTTCCCAGTTGAAAGGTTCGCCTCCGGGCTATGTCGGCTACGGTCAGGGCGGCGTGCTGACCGAAGC +GGTACGCAAACGCCCTTACAGCGTGGTGCTGCTCGACGAAGTGGAAAAGGCGCATCGCGACGTGATGAAC +CTGTTCTATCAGGTGTTCGACCGGGGCTTTATGCGCGACGGCGAAGGGCGGGAAATCGACTTCCGTAACA +CCGTGATTCTGATGACCGCCAATCTGGGCAGCGACCACATCATGCAGCTGCTGGAGGAAAAACCGGACGC +CACGGACGCAGACCTGCATGAACTGCTGTACCCCCTGCTGCGAGACCATTTTCAGCCTGCACTGATGGCG +CGCTTTCAGACGGTGATTTACCGCCCGCTGGGACAGGAGGCGATGCGCGCCATTGTGGAAATGAAACTGG +CGCAGGTGGCCCGCCGTCTTCACCAGCACTATGGGCTGGAAACGGAAATCAGTAACAGCCTGTACGACGC +CCTGACCGCCGCCTGCCTGCTGCCGGACACCGGTGCGCGTAATATCGACAGCCTGCTGAACCAGCAAATC +CTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAGCAGGCCGTGCATCATAAGCCTGCCCGACTGCGGCTTG +ACTGGGATGATGAAGACGGGATTGTGCTGGAATTTGATGAGAAATAA +>test.0417.00002.0001b_00008 147 NA | NA | NA | ID=1_8;partial=01;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +ATGAACGTACAGTTCTTCGACCACGCACACCACAAGCTCAAAATTCGCGGCCTGAAAAGCCCGGTGGACG +TGCTGACGTTTACGGGCCGGGAACAACTCAGCGCACCCTTCCGCTACGACATTGAATTTACCAGTACCGA +TAAAACC +>test.0417.00002.0002b_00009 1236 NA | NA | NA | ID=2_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.468 | NA +GATCTGATAGCTAATTGTAAGAAGATAAAGGAAGGCAACGATAAAAACGAGGACACCACCTGGGCATGGG +TAGCGATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTTAATTAAAGGGATCTTCAAAGT +GCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAGGGATATTGTACGAGCGATTGATGCTTCCGTT +TCCCTGTTTAATAAATTTATCGATTTGCCAGCCGTGCAGGCGACAATGAAGTGGATGAAGATTTATAACC +CGTATACGTATGCTGAGAAGCAGGTCAGGGAACTGATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAA 
+GCTGGATGAGTTAATGGACGTCACTGGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCATT +CGCCAGCCGATAGAGGTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACACCATGCTTGCAA +AAGCGCTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCTGCACCGGGAAGGGGACGATTA +TTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTCTCGCCTGAAAGATGCTGAAGAGGTGGAATTG +CTGGCTACCAAAAAGCCAGACTGGGCGGATATTGGGGGTAAAGAAAAATATCCACAACTGGAAAAAGCCA +GTGCGGAACAGAAAAGATTAATGGACCCGGAGAATAAGGAGGGCGGCTACCCGAATATTCCTGATGATAA +AGTGCAGACTTTTCATCAGATGGCTCCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGAC +CCTGGCAGTAGCGATAATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAAGAGTAAGTCTC +AGTGGCGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGAGTATGTAGTTTATACCGTGCC +ACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGCCTCTCAGGTGCGTGAAGTCACAGGTAAGAAT +GGAGAGAACATTAAAGTCGTGCTGGAAGGCGGATCACTTCAGATAGTGATAGATCCGACCGTTCTGAATT +TGGACTATTTGGGGAAACGTCAGTCTACAGGATGGGGGTATAGAGATTTTTCTGATGAAGTGGATATGTA +TATAGGTGTGCCTCAGTTGCAAACAAATATTTATGTACCTAAATAA +>test.0417.00002.0002i_00010 1068 NA | NA | NA | ID=2_2;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.547 | NA +ATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGAATAATGTCGCCGGAATATTATCGGCGCC +GTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTGTGCGAACGGCAAGTGGCGGAGTGGAGCAAGACCATTCC +GCTGGATGTGCGCCGTCGTCCGCTGTACGAGCAGATTGACGCCGTCTGGGGCGGGCGGGTGTTGCCCAAT +ATCCGCAGCACTTTAAAGTCGGTACAGTATGACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGC +AATCCGGGGGCAATATTAGCAGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATGTCACCCGC +CGCGCAAAAACAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAATCTAATCAGACGTACCTCG +GGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAGGAAAGTCTGCACGGCCCGCTGGCCCTGC +CGATGCAATTACCGTTGTATGAGCTGGATAGCAGCGTATACCTGCGTGAGGATGACCCGGTAACGGTGGC +TGGCCTGTATCTGCCGGATATCCCAGATGCCAGCGCCCAACTGTTGTACCGGAGTGAACATATTCCCGAG +GCTTGGCAGGGGCGGGTACGAACGAAGTATGTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCG +GGGCGTGGGCAAAATGCAACTGGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTGCCGCCGGA +GGGATTTTTCCCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGCGAAGCGCAGTATGTAACA +GACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCTCATAGCGGGGAGTGGTCGATTTTTGTAG 
+AAGGTAGACAAGCGACGGAGACGCTGGAGCAGGGAGAGCAGATGCCGGAATGGACGGACAGGAAAATGGA +GGGGGAGTATAAAAGAGGTGAGAAATTCCATGTGCTGTGGTCGCTGATGAACCGCCACGATGGCGGGTCG +GTGTGGGTGGAAGCGTAG +>test.0417.00002.0002i_00011 381 NA | NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.357 | NA +ATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACAGTATCAGACAGTGTTTATGCGGATACAG +ATCAAACATATGATATTTTTTGGGGAATGCTGGTAAAGGATAAAAAGGATACTATATTTGTTCGCTGTGA +CAGTCCGTTATTGAAAATGAAAATTGTGAGAATGGCGGATGCAAATACAGAAAACATTGATAAGGCATAC +CAGATATTTAATCAGAAAACGAAAAAATCAATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGA +GTGGAAAGTATATTTTCAATATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTGTCCGATGT +GCTTAATGCAATAGATGAACAGTTTCGATAG +>test.0417.00002.0002i_00012 264 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA +ATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTTATATCTGTGTCATCTTCGA +TGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAGATAAACTGCCCTGTTAAAGGGCATGGTAT +TAATACCATCATCGAGGGGAGTTTTGATTGGATTTCTGATGGCAAACAGGTCGTCGTGAATGGCTGCAGG +TGTGAATGTGGCTGTGTTGTTATATCCAGTATTGCTGATGCCTTGATTGGATGA +>test.0417.00002.0002i_00013 1140 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.359 | NA +ATGGGATGGAAACGGACGTATACAGAAGAAATAGACAGGCCACAGGATATTTACTTTCATAAGTGGTTAT +TTTCTTTATTTATTTTATGTATATTATTACTCGTTATTTATTATTTTTTCCATGAATTTGTTGTAGCTAA +TAACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTGTGGGTATTGATTCTTTCAGTACAGGTAATA +TTTTATTCCAGAGCTATTCAGGATTATTCAATTTGGCTGGAGAACAGACTTAGTATCAACAGAGAGTGGG +AGGCATGGGGATCAAGATATGTTTCTGTTATGAATAGTAGTCTTCATCTTCCTGGAAAAGTCGATGTTTT +ATTCTTGTCTGGTGATGAATTAGAAACTCAGTATGGACTTGTCAATAAGTCAGATGATATCACATGGAAG +CAACATGATTGGTATGCCTGCTTTCAGACCCTTACTAATCATCTTGAACTTTATAAACTCCCATATCAAC +TTACACAAGAATTTATTATTCTTACTGATTTTGATGAAAGTATGTACTCTCAGATTGAAGAGGACTTTTT +CAGAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTTTTGTTGCATATTTCCCCTTCAATGTCCTTT +GGAGAGCTTGATTTATGGTTAAAGGATTCCGAAGAGAAAATATATATTGTCATGGTGTTGCAGATGGAGG 
+AGCAAACATCCTGTTCGGACGCTATGGCTTGCCTTATGTTTGCAACTGATGATGTTACTGCTAAGTACAA +ACTCACTGAAAAGGCCAGAATTTATCGCCCAATGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAAT +ATTTTTATTGACACACAAAAAATATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAGCGTCTGTTTT +CTGTGAGTAGTAATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTGAAAATTGATAATATCCATCT +TTTAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTCTGGTTAACGGCAGCGCTGACTATTTCGGTG +GTTGTTCACAAAAATTCAGATTACTTGATGATGTCCGAAAATAATGATGACTGGATCATTACCACCATTC +ATCCTATGGAGCATTCATGA +>test.0417.00002.0002i_00014 3354 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.592 | NA +ATGAAGAGAATAAATAAAAAAAGTGTTTTTATATCTAATGTACTTTTATTCTTGGTTATTGTGGCCTTCG +TGGGGGGGATCATCTGGCGTTTTGGTGATCATTTTGGACTGAAAGGGGATGAAAATAATTTTTTTGCGTG +GTTGATATGCATTATGACCCTCATTTTTGTACGGGCATCCTGGTATTTCTCTCGATTGTATCGCCTACGA +AAGGAACAACATCACTCCGAAAAGGAAAGATTACGCCCGGAGAAAGAGGCTCGTATTGAATATGGCAAGG +TCATAACCCTGAACATTGAGCTAGCTGAGTATTTATGTGCCCTATACGGCCCATTCTGGCGGCGTAAAGT +CCGCCTGCTGCTGGTGACCGGCGAGCCTGAACAGGCAGAGGCCATCGCGCCGGGGCTGACCGGGCAACAC +TGGCTGGAGGGCGACCACAAGGTGCTGATATATGGCGGCAGGCCATCAGCGGAGCCTGATGTCGCGCTAC +TGACCGCCTTAAAAAAACTGCGCCGCAGCCGCCCGCTGGACGGCATCATCTGGCCGCTGACAGAAGAACA +GAGCCGCCAGACAGCGCAACTCGACAAAGGCTGGCGCGAACTGATAAACGGCGGTAAGCGACTCGGTTTT +CAGGCTCCACTCTATTTGTGGCAGGTCTGTGACAACGGTGATTATCAGACCGGACGCCCCCTGCAAAGCG +TCGGCTGCCTGCTGCCGGAACGCTGTACCCCGGAACAACTGGCTGCAATGCTGGAAGCACAAACCCTGCC +GCTGACGGAACAGGGCATGTCGCAACTGCTGGCAGATAACCGCCATGATTTCCTGCTGCGTCTGGCCCAT +ACCCTTGCAGAGCGGGGTATCGCTCACTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGCGGCGCATTTT +CTTCCCTGCGCCTGCGTGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTGCCGGAGGCCGCACCTCATGC +GTGGCTGCCGTCACCGGTCTGGGCGGGCGTGACGGGTGATAACGCGCGCGGGCGTGCAGTGGGCTTTCCG +TGGCTACGCGCCGCGCTGATAACCAGCATCTGCATGCTGGCGATATGGGGGGCCGGAATGACGACCTCGT +TCTTCGCCAACCGCGCGCTTGTTCAGGAAACCGGTATCCAGACGGCACGTGCGCTTGATACCCGCCTGCC +GCTGGCAGAACAACTGGTGGCGCTGCATACCCTGCAGGGCGAACTGGAACGCCTGCAATATCGTATCCGC +GAAGGTGCGCCGTGGTATCAGCGTTTTGGCCTTGAACGTAACCAACAACTGCTCGCCGCCGCTTTTCCCG 
+GCTATGCGCAGGCGGCAAACCGGCTGGTGCGCGACGTGGCCGTTGACCATCTGCAACAGCAACTGAACGC +CTTTGTCGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCCACCGGTGAACAACGCTATAAGCAGCTTAAG +GCATTGCTGATGACTTCCCGCCCGGAAAAGGCCGACGCTGCCTTTTTCAGTACCACGCTGATGGCGGACG +GTCTGCGCTACGAGAATATCCCGGAAGGTGTGCGGCAGAGCGTGTTGCCGTCACTGCTGACCTTCTGGAT +GGCGAACCTGCCGGAACACCCGCAGTGGAAAACCGCACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAA +ATCCTGCTGCGCCAGATTGGTGTGCGTAATGCTGAAAACACCCTCTACCAGAACGTGCTGCAACAGGTGT +CCCGCAACTACGCCGATATGACGCTGGCGGACATGACCGGGGATACGCTCACCGAATCTCTTTTCAGTAC +GGAACAGACAGTGCCGGGGATGTTCACCCGTCAGGCGTGGGAAGGACAGGTCAGGGAAGCCATCGAGCAG +GTAGTGACGGCGCGGCGCGAGGAAATCGACTGGGTACTCAGCGACCGCCAGCAGGATACCTCTGCGGATA +TCTCGCCGGATACGCTGCGTAACCGTCTCACCTCACGCTACTTTACCGACTTTGCCGGAAGCTGGCTGGC +GTTTCTCAACAGCATTCGCTGGAAAAAGGAAGACTCGCTCTCCGGCATTCTCGACCAGCTGACACTGATG +GCCGATGCCCGTCAGTCGCCGCTGATTGCGCTGACCGATACCCTCGCGTGGCAGGCGGCGGCTGGCAGGG +AAAACCGTGGCCTGTCAGACTCGCTGGCGAAATCGGCACAGGAACTGTTTAACGGCAAGGAGAAAACGCC +GCAGCAATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTGGATAAAACCTTCGCGCCGCTGCTGCGGTTG +CTGGGCGATAAAGCCGGAGGCGGAGACAGCCAGCTGAGTCTGCAGACCTACCTTACCCGCGTTACCCGCG +TGCGCCTCAAACTGCAACAGGTGACCAACGCTCCCGACCCACAGGAGATGACCCAACAACTGGCGCAGAC +AGTCTTGCAGGGCAAAACCGTTGACCTCACCGACACCCGCGACTACGGACGGTTAATCGCCGCCAGTCTG +GGCGAGGAATGGAGTGGCTTCGGTCAGGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGGCGGCAGGTGC +TGACGCCTGCAGCGGACAGCCTGAACCGCCAGTGGCACCGGGCGATTGTCAGCCACTGGAATCAGGACTT +CGCCGGGCGCTATCCGTTCAAAGCCTCACAGAATGACGCTTCCCTCCCCCTGCTGGCGCAGTACCTGCGC +GATGACGGGCGCATCAACCAGTTTATTGCCGCCAACCTTTCCGGCGTTCTGAAACGTGAAGGCCGCTACT +GGGTGGCTGACGCCATGAACACGCAGGGGCTGACGGTCAATCCGGACTTTATCCGCGCCCTGAACCGCCT +GCGCGACGTGGCCGATACCGCCTTTGCCAGCGGCGATGCCGGGATACATTTTGAACTGCGGGCAAAACCG +GCCCGAGACGTGATGAAAACACATCTGGTGATTGACGGGCAGGAACTGGAATATTTCAACCAGAAAGAAC +GCTGGCAGCGTTTTAACTGGCCGGATGAACAGTGGCAGCCCGGCGCATCGCTGAGCTGGACCAGTACGCA +GGCGATGGAGCGCATACTGGCGGATTATCGGGGAAGCTGGAGCCTAATTCGTCTGCTGGAACAGGCGCAG +GTGACACCGGTGGACAGCAGCACCTTTAAAGTGGTGTGGAAAGCGCAGGACGGCCTGCCACTGAATTACC 
+TGCTGCGGGTTGAACAGGGAAAAGGGCCGCTGGCGCTGCTGGAACTGAAAAACTTCCGCCTGCCGGGACA +GGTATTTCTGACCGGCAGGAGTATGAAGGATGCGGAAGAATACGGGGAAGACGCCGATGAGTGA +>test.0417.00002.0002i_00015 1638 NA | NA | NA | ID=2_7;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.620 | NA +ATGCGGAAGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGCTGTTTTGCCG +ACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACATGGCTGCTGCCGGTGACGGC +AGACACGCCGGTCGGGGAAGACCCCGGCTACCACGACGATTTCCTGCGTATCCGCGACGAGATGAACAAA +CTTTCCGGCGCGGATACGGACCTCATCTGCCAGCTTGCCGAATCCCTGCTGCTGACGCAGGCAAAAGACG +TGCGCATCGCCACTTACTACATCTGGGCGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACT +GGCGCTGCTGACCGGACTGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAA +ATGGCGCTGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAAGTGGCAAAAG +AGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTCGCCGCATGGCCCGAAGACCA +GCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAATCACGTCTGGCGCAGTCGGGTGGGATGAAT +GCGGTGGTGCCGCAAAACAGCAGCAGCGTTCCTGCACCGTCATCCCCGGTGGATGCGCCACAGGTACAGA +CCATCACCTCCGGGCGCGACCTGCTCGACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCA +GGGCTGGCTTTCAGCACACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGAT +GTGGACGGCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGGCTGTATGCCC +AGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACCGGTGTCAGCCATTTCTGGCT +GGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCGGGCGCACCGTGGGACAGGTGGACAGCCGTT +ATCCGTCAGGACCTGACGTTACTGCTGGAGCGCCTGCCGGGACTGGAAAATCTGGCATGGAACGACGGCA +CACCGTTCGCCGACGAGGTGACGCGCAACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATG +GCTTGCGGGGAAAGCCGCTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCA +CTGGCGATGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCGGGCATCACCA +CGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAACAGTACGGTAAAAACGAGAT +GGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAGGGAATAACGCTGACGCAGTGGGAGCCAGAA +CTGCTGTTTGAAGTAAAAGCCCGGCAACTGAAACTGCTGCGCCTGCGGGCACATCGCCACGCGGACAAGG +CGGCGCTTGCCCGGAAAATGGACGCTCTGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGT +ACTGTGTGATACGCAGCATAAGGACTGA +>test.0417.00002.0002i_00016 1761 NA | 
NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.580 | NA +ATGGACGACCTGACCCAACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGTAAAGAATTTG +CGCAGGCTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGCGCACGCGATCCCTATGTGGA +GCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTGCGCGAAAAGCTGGACGACGATCTGCCGGAA +CTGACTGAAGGGCTGGTCAGCCTGCTGTGGCCCCACTACCTGCGAACCATCCCGTCACTTTCCGTGGTTG +AACTGTCGACAGATCACCGGCAAATGAAGCAGAGCGAAACGCTGAGCGATTTTCAGGTATTGTCGCGCCC +TGTTGGCGAGCGCAGAACCCGCTGTTTCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTG +CCGGACGTGTCATTGCAATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCTTTGAATGCGGCCCGC +TGGTCGGCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTCAATGCCGACAGCCCGGTAGC +CTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAGTTCTGGCTGCGTCTGCCGGGGCAGGATCGC +CGGATGCTTGGCGCACACTTTTCCCCGATGGGCTTTGAGGATGATGACAGGCTCTGGCCAAAAGGTGAGT +CAGCCTTCAGCGGTTACCAGTTGCTGCTGGAGTATTTCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCT +GAACGGGCTGGAGCAGGTTGCATGGCCGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAG +AACTGGCCTCACGACCTGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTCATCAACCTGT +TCCCGCTCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTTCTGCTGCGCCCGATGCGCAT +TCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATTATTTCTTCGCGCCATACCGGCAGTCAGGCA +TATGTCCCCTTTTCCAGCTTTCGTCACCGGGGCGGGATGCTGCGCCACGATGCGCCGGAACGCTATTACC +ACACGCGGGTAAAGCGCGGCCCTTCCGGCTTGCACGACACATGGCTGATTCTGGGCGGCGATGCGTTTGA +TTCCGACCGGATGCTGGAGGATGAAACCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGT +AAAGCCTTACAGAGCACCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGGGTGCGCAACC +TGTGCGCCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCACTGGCGGGTGCTCAGCCACCT +CGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATTCTGCGCGGCACGCTGGCGCTGTACGACTGG +ACCGAAAGCGAGATGAACCGCCGTCGTCTGGAGGCGATTGTCGACGTTCAGCACAGCCTGATACAGCGTT +TTGAAAGAGGCTTTCTGCTGCGTGGCGTGGATATTCAGGTGACGCTGGACAGTAACGGCTTTGCCGGAGA +AGGTGATATCACGCTGTTTGGTGAACTGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTC +ACTCAACTGACCTTAATTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCACAGCCAGCGCG +TACCGGGCTGA +>test.0417.00002.0002i_00017 1080 NA | NA | NA | 
ID=2_9;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=11-12bp;gc_cont=0.591 | NA +ATGGACAGAGCATCACAGCCAGCGCGTACCGGGCTGACCGACCGGCTGGCCCCGGATATTGCGCGGATCA +ATTTTTACCGTTTTTGCCAGTTGCTGGAACAGAGCCAGCAGAAAGCGCCGCTGGGCAGTACCGACAACCC +CGCCGCCGATGCGGTGCGTTTTCGCCCCCATCCCGGAATGGGCTTTCCGGTCAGCGAGTTAAAGAACGTT +GAACGTGACGTGGACAATCCCGACGCGCCACCCACGGTGCGCACCACCTTTCTCGGCCTGTACGGCGTGG +ATTCACCGCTGCCCACCGCCTATCTGGACTACATTACCCAGCGTCATGACGGACATGACGCAGTGATGGC +GTTTCTCGATATTTTTAACCATCGCTTTATCACCCAGTATTACCGCATCTGGCGCAAATATAACTACCCG +GCGTCGTTTGAAGCAGGTGCCGTGGATGACATTTCCCGTTGTCTGCTGGGGTTAATCGGGCTGGGTATTC +CCGGCAGCGAGAACCATATCGCCACGCCTGTATCCCGTTTTCTGGCCCTGCTCAGCGTGATGCGCCTGCC +CACCCGCACGGCTGAAGGCGTCACGGCACTGGTGGGGCTGCTTGCCCCGCTGACGAAAGCCACGGTGGTG +CCTCACGATCCGCAGCCTGTAATTCTCCCGGCCCCTGCGGGTCTGTCAAAAAATTCACGCATCAGCCTGA +AAACGCGAACGCTGCTGGGGCGTACCGGTACCGACGTCAACAGCCAGTTGCTGCTGAAACTGTATACCGA +AGATGCCGCAGAAGCACGTGGCTGGCTGCCCGGCGGGCAACTGCACAGCGATTTGCTGGTGCTGCTGCGC +GTTTATCTGGGCTGGCGCTGTCAGGCCCGTCTGCAACTGACGCTGCCCGTCAGCCTGTTGCCTGCTGCCC +GGCTGGGAAAACAGCGTGTACAGATTAGCCGTACCGGCATCCTTCTCGCCTCCTTTGCCGCGCCCGCGAC +CGGAACAGTGACGGTCAGTCTGGGGCGTTATCAGGGATTAATACCCGCTTTTTCCATTCGTAACAGGGAG +AGTATGACTCATGTTTCCTATTCGTTTTAA +>test.0417.00002.0002i_00018 537 NA | NA | NA | ID=2_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.508 | NA +ATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGACGGTTGTTCTGAGTGGCT +GCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGGCCTCAGCCGTTTTCTACAAACAAATCAA +AATACTGCATCTCGATTTCTTCTCCCGCAGCGCCCTGAATACGGATGCGGAAGATACGCCGCTTTCCACG +ATGGTGCATGTCTGGCAACTGAAAACCCGCGAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGC +AGGAAGAGAAGACGCTGGAGAAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGC +ATCCCTGAATGTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATCACCCTGAT +GAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCGACAAGCCGCGCTCGATTG +AACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATAAATAA +>test.0417.00002.0002i_00019 429 NA | NA | NA | 
ID=2_11;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.534 | NA +ATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGTTACCGCTGGAACAGATCA +GCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGCAACGCATTATCAACTGCCGGGCAGGCAC +GCTGGCGCATTTGCCGGATTACGGTCTGCCGGATCTCAGTCTGATCCATCAGGGGATGGCTGCGGGTATT +CATGGCCTGATGCGTCAGATTGAAGAAACACTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGG +AATTACTCCCCCAGCCCCGTCCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTG +GATACGCTTTGATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAACAGGAGCGG +GCGTACTGA +>test.0417.00002.0002i_00020 1377 NA | NA | NA | ID=2_12;partial=00;start_type=ATG;rbs_motif=AGGAG/GGAGG;rbs_spacer=11-12bp;gc_cont=0.548 | NA +ATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGGCGATCCCTGTACTTATAAGGAATCCG +GTGAACTGCAGGCTGAAATGAGTAAACTGACTCACCCGGCCCGACCGGATGTGGACTGGCGTCAGGTGGA +AAAACTCTGCCTCGCGCTGTTCCGGCAAAATGGCGTGGAACTACAGACGCTGGTCTGTTACGTACTGGCG +ATAACCAGACGGCAGGGGCTGGCAGGGATGGCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCT +GGGCTGACTTCTGGCCGGTACAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAAAATGCA +GCAGGCACTGAGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCGTTGTGTACAGCATCTT +TCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATATGACGAAACTGGATCTACTGGCCGGGC +AGTTTCGCAATACCGCATTGCGTCTGGAACGGCTGGCGCCTCAGGGAGCGGAAACCACTATCACTCCCCC +TGAATTACCCCGCCGGGAAATGAATCAACCGAAAAAGTCAGAGGAAAGTCCACAGCCGGTTTTTGCAACC +AGATCCGTTCAGCAAAACGATAAGGATGCCAGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGA +CATGGCCGATATTTATGGCCGGAATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGGCTGGTC +GCAGCTTAATCAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCCATTACCGCAGTCGCTG +GAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCTGCTGGCTCAGGACAGAACAATTGCGG +CAAGTCAGATGCAACTGGAGCAGTTAAACAAATTGCCTGCCCGCTGGCCACTGGAGCAGGGATATCGCCA +GCTACGCCAGCTTGATGCCCTGTGGCCGGATAATCCTCAGGTCAGGGCGCTGAACGCGCAGTGGCGCAAA +CAGCGGGAGCTGAGCGCCCTGTCTGCTGAGGCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGC +GCCTGTCGGCGCAGCTGGATGCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACTAAAAAC +GGCGGTGTACGGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCTTCGGCAACTGGAAGAG 
+CAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAATTGATACCCGGTTAAATCAGTTGTTGA +ATCGCTATGTCATTTTACTGGATACGAAGGTGGAACAAAGTCAGTAA +>test.0417.00002.0002i_00021 948 NA | NA | NA | ID=2_13;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.444 | NA +ATGAAAAATGTTCTGGTCACCGTCCCCAGCTTTTCAGCACGCTGTGTTTCCGCCAGCAAGTTGCTAAGAG +AGAATAATTTTAATCTTATTATTAAGAATAATGTGGAGCATCTGCTTAAATCAGAATCCACTGCATTACG +AGAATCTATTTGCGCGGTCATCGCCGGAAAAGATGGTTATCAGGCGGACACGCTATCATTGCTGCCTGGT +GTGAGAATAATATCGAGATTCGGGACGGGGATAGACAATATTGATCTTCGTGCGGCACAGCAATCCGGTA +TTGTTGTCAATAATGCGGTTGGGATTAATTCAAATGCGGTTGCGGAATTTATCATTGGACTTATCTTCGC +GAGCATGAGAAATATCCCTGGCAGCTATCATGCGATGCAAAATGGCTACTGGGGTGAGTCGCATGGCTGT +GAATTACAAGGGAAACGGATTGGCCTGGTTGGCTACGGTAATATAGGTAAAACTCTGGCGAAAAGGTTAT +CCGGTTTTGATGTTGAGCTTTTAGCTTTTGACAAACAACCCGACTATCAGGTTGCTGACAAAGCTGGAGT +TCAGTTTGTATCAATTGAAGATATCTTTATGCAGTCGCATGTCATCATTGTTCTTTTGCCTTTTTCTTCT +GAGCTGGAGAACTTCATTAGTCATAAATATTTGTCGATGATGCGCAATGGTGCTCTAATCATCAATGCCG +CAAGGGGAAAGTTGCTGGATGAGGGCGCTTTACTTCAGGTGATTGAAGAACGAAATGTGTTTGCGGCGCT +GGATGTGTTTAGCTCTGAACCGTTGGCGCAATTTAGCCCACTGCTACATGCCAAAAATATCATTACAACG +CCGCATATCGCGGCCGCCACCGTTGAGTCATACCAGCAAACCGGGATACACGTTGCCCAGTCGATAATTG +ATTACTTCGCAGGAAGGGAGATAAAAAACGTGTTGTGA +>test.0417.00002.0002i_00022 597 NA | NA | NA | ID=2_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA +ATGAATAACACGGATCTTATCCATCTCATTAAACATTTTATGCGTAACGAACATAAAGCAGTTGAAGAAG +TTATTGATTCCCCTCTTTCGGAGGTCGCAAATTTAATTAAAGTATTACAATCTTGTCAGGGGAAAGTTGT +TTTTATTGGTGTTGGTAAGTCTGGTATTATTGCCAGGAAACTCGCCGCAACATTTGCCAGCACCGGAACT +CCCTCGTTTTTTGTTCACGGTACGGAAGCGGTACACGGCGACCTTGGAATGGTGGCGAAAGACGATGTTG +TTATTCTTATTTCAAACAGTGGTGAGACGGCGGAAATCCTGGCGACACTGCCTAGTCTGAAAAAAATGGG +TAATTATTTGATCTCTTTTACCCGCAGTCATCACTCATCGCTTGCGATAAGTTGTGATTTATCTGTTGAA +ATCCCCGTCAAAAGTGAGGCGGATAATTTAGGTTTAGCACCGTCATGCTCGTCGACTGTTGTTCTGGTTG +TTGGTGATGCGGTGGCGCTTGCACTCTCTGAATTGAAAAAATTTACTCGTGCTGATTTCGGCTTATATCA +TCCAGGAGGTGCACTCGGCATTAAAGCAAATTCATAA 
+>test.0417.00002.0002i_00023 1176 NA | NA | NA | ID=2_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.378 | NA +ATGGATGTTTTTAATACTCCTGTTTCCCGCAAAGGAACATATTGTACCCAATGGGACTTTTGCGAGGACA +GATTTGGTGTAAAAGATGTACTACCATTCTCTATTTCAGATATGGATCTTCCGATACCAGACGCTATCAC +CAGAGCATTAAAAAAACGCCTGGAACACCCGATTTTAGGGTACAGTCGTTGGCAACATGGTGAATATCTG +AATGCGATAGTAAACTGGTATTATCAACAATATCAAACAGATATTAAACCTGAATGGATAACCTATAGCC +CCAGTGTGATGTACTCTATTGCAAAAGCAATAGAGTTATTGACATCGCATGGTGATAATATTCTCGTTTT +TACACCTGTCTATAATGCATTTTTTGATGTAATTAAACATAGCGAGCGAAATATTCTGACAGCCTCTTTG +ATTATAAAAAATGAGGGGGGCTACGCTATCAACTGGCAAGATTTTGATCTTAAGATTAAAAGCGCAAAGA +TGATGTTATTATGTAATCCTCATAACCCGACAGGAACAGTCTGGTCGGAAGAAGAACTGCATAAAATCGC +TGCAAGCTGTACAAGGCATAATGTCTGGTTATGTTCAGATGAAATCCATAGTGATTTTGTTTTTAATCGT +AGCTTTACATCCGCGCTTAAAATAAAAAAAGAAAAAGTAGTAGTATTTAACTCGATATCGAAAACATTTA +ATGTTCCTGCACTAACAGGATCGTATATGATTTCAACTGACGATAATTTTAATCATAAGTTCAGAACGAT +ATCGAGGTATCGCGATTTTGTAAACTCCCCATCAGTACTGAATATAATTGCAACTATTATTGCCTACAAC +GAATGTGAGGGATGGTTAAAGTCATTAAAGGCACATATAGCCTCTAACATTCAATTCACCCAGCAGTATC +TGAATGAAAATATTCCAGAATTGATCGTAAGGCCAGCTGATGGTTGCTATTTTTCCTGGATAGATTGTTC +TGCTATTGGTTATCCTTTTGATGAATTCTACAGTCGATTAATTCATGAAGGCAAAGTGGGCATTATGGCG +GGGCATGTCTATGGAACGGAGGGGGAGGGCTACCTTCGTCTGAACCTGGCCTGCGGTCGAGAAAAATTAT +ATATGGGGCTTACGCGTCTTGTGAGTGTAATTAAAAATATTAATCAGGGAGAATAA +>test.0417.00002.0002i_00024 1581 NA | NA | NA | ID=2_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.441 | NA +ATGAAACAAAAGAAAGCCTGGAGTTTTTTTCAGAGCCTGGGGAAGGCATTTATGTATCCCATTGCTCTGC +TAAGTGTATGTGGCATGATGCTAGGGCTGGGAAGTGGTTTAGCCAGTGATGATATGGCAAAGTTAATTCC +ATTTCTGGCTATTCCAATAATTAAAACCATACTTGATTTCATTGTTAGTCTTGGTTTGTTTGCCTTTGTT +AATTTACCTGTATTGTTTGCGATAGCGATTCCCTTAGGATTATTAAAAGATAAAGAGGATAAAGCCTATG +GTGCTTTTTCTGGCTTAATTGGTTTTATGGCGATGCATTTGGGAACGAACTTTTATCTTAAACAGCACGA +CTTATTGGTCGTTGCTGACCAAATGTCGACACATGGGCAAACCATCATTCTGGGGATCCAGTCCTACAAT +ACCAGCGTGTTGGGGGGAATTGTTGCTGGGTTATTAGTCGCCAGCATGTATAAAAAGATCGTTAATTTAC 
+GCATTCCTGAATCGTTAGGTTTTTATAGCGGCCCACGTCTGGTGCCTATCATTACACTGATTGTGATGAG +TGGATTTGGTCTGATCATTCCTTTTATCTGGCCGCCGTTTTTCAATCTTTTCATGCTCATTGGCCACTGG +ATTTCAACTTCCGGTCCTGTTGGTTATTTCTTCTATGCAGTTGCCGAACGCGTGACGATTCCTTTTGGCT +TAAACCATCTGGTGACGTCAGTTTTCCGCTTTACGCCAATCGGCGGTTCGGCTGTGATTGGCGGCGAAGA +ATATTACGGCACCCTGAACATGTTTATGGCATACGTCAAAGAGAATGCGGTCATTCCGCTGGATTTGGCG +GGGAAAATGGAGCAGGGCAAACTGATGATTCAGTATGGTCTGGCTGGTGCCGCGCTGGCGATGTATCGCA +CTGCTCATGCTCAAAACAGAAAGGCTATCAAAGCATTGCTTATTTCCGGGGTGCTTACGGTGATTATTGG +CGGCGTCAGCGAACCGATTGAGTTTCTGTTCTTATTTGTCAGTCCACTGCTGTTTGTCTTCCATGCCTTT +ATGAATGGATTCGCTAACATGGTTCTGCCATATATGGGGGTGAAGATGGGATTTACTGGTGATCTGATTC +AATTTATTAGCTTTGGCGTATTGCGTGGCACAAGAACAGGTTGGCCGATCGCGGTGTGTGTCGAAGTGGC +CTATTTCTTCATTTATTACTTTGTGTTCCGTTGGACCATCCTTAAATTTAACCTGATGACCGTAGGCCGT +GAAGAGTCCAGTCCTGTTACGCTGAACGCTCACGAAGATACGGCTATAGCGGATATCCCAACTCCTGATA +AATCAGAGCTGCAAGCGGCGGAGCAGATGGTTAAGGCACTTGGTGGTAAAGAGAATATTAAGTCACTGGA +TAATTGCGTAACTCGTTTACGTTTAACAATCGCAGATATGAGATTGATTGACGAAGTTGCAATAAAAAGA +GCTGGCGGGATTGCGGTTGTAAAACTTGATCAAAATACCCTACAAGTCATTATCGGCACTAAAGTCATCG +CCCTGCGTCGGGATATGGATAACTATATGGGGATATACTGA +>test.0417.00002.0002i_00025 825 NA | NA | NA | ID=2_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.336 | NA +ATGATCATCGAAAAAGTCATGAACAATAATTGTGTACAGGCATCGATGAATGGACAGGAGGTTATCATTT +CTGGGCCTGGCGTCGGTTACAACAAAAAATATGGAATGTCGGTCCCTGAGCATCCGGCTAACCGGATTTT +TTATGTCAGAAATGAACAAAAAAACAAACTTTATAAATTGATTGAACATGTAGATATTGAGTATGTGTTT +GTTGCCGAAAAAATAGTGCAATATGCGGAGAAAAATCTCGAAAAAAATCTCAATCCATCGCTACTATTGA +TTCTTGCGGATCACATTTCGAATGCAATATCCCGAGTCGTTTCAGGTATACAAATTAATAATGTTTTCCT +TGATGAAATCAAAGCGTTGTACAAAGCAGAGTATGCGATAAGTCGCGATGCATTAACTATCATTAATGAG +CAATTCAGCGTTCAACTTCCTGATGATGAGATTGGTTTTATAGCATTGCATATTTTAAATAATTATGAAA +ATTCAGTTGATTATGAATCAGTACGGATTATTGAGTTGTCGCAAATAATCACGGAGCTTATTGAAGTTGT +TTATAACAGAAAGGTGGACAGAAGTTCATTTAACTATTCCAGATTTATGATGCACCTTAAATATTTTTCA +AGTCGCGTGTTATGCAATGAAAAAATAAAACAGAAAGATATTGGTGATATCTATGAACAGTTTCTTGAAA 
+AGGACATCCTGTTACAGCGCGCAATTCATGAAATTGAACGGTATCTGTATGCCACTTTTAAATATGAATT +AATTTTAGAAGAAAAATTATATCTCTCTATTCGTACCAAAGTATTAATGGACTAA +>test.0417.00002.0002i_00026 1254 NA | NA | NA | ID=2_18;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA +ATGTCAGGATCCAACACTGCAATCAGCCGTCGTCGTTTACTGCAAGGCGCGGGTGCCATGTGGCTATTGA +GCGTAAGTCAGGTCAGCCTGGCTGCGGTCAGCCAGGTCGTGGCGGTGCGCGTCTGGCCTGCGTCCAGCTA +CACCCGCGTGACGGTAGAATCAAATCGTCAGCTGAAATATAAGCAGTTCGCGTTGAGTAATCCTGAACGC +GTGGTGGTGGATATCGAAGATGTAAACCTGAACTCGGTGCTCAAGGGGATGGCTGCGCAAATCCGCGCTG +ACGACCCGTTCATCAAGTCGGCGCGCGTCGGGCAATTTGACCCGCAAACCGTACGTATGGTTTTTGAATT +AAAGCAAAACGTAAAACCGCAGCTGTTTGCCCTTGCGCCGGTCGCCGGGTTTAAAGAGCGTCTGGTGATG +GACCTCTATCCGGCCAATGCACAGGATATGCAGGACCCGCTGCTGGCGCTGCTGGAGGATTACAACAAAG +GCGACCTCGAAAAGCAGGTGCCGCCAGCACAAAGTGGTCCACAACCGGGTAAAGCTGGGCGGGATCGTCC +GATTGTCATTATGCTTGACCCTGGCCACGGTGGCGAAGACTCCGGTGCGGTGGGGAAATACAAAACGCGC +GAAAAAGACGTGGTATTGCAAATAGCTCGCCGTCTGCGCTCTCTGATCGAGAAAGAGGGCAATATGAAGG +TGTACATGACGCGCAATGAAGACATCTTCATTCCGTTGCAAGTGCGCGTAGCAAAAGCCCAGAAACAGCG +CGCTGACTTGTTTGTTTCTATCCATGCCGACGCCTTTACCAGTCGCCAGCCGAGCGGTTCCTCGGTGTTT +GCGCTCTCAACCAAAGGCGCAACCAGTACTGCGGCAAAATATCTGGCACAAACCCAGAACGCCTCGGACT +TGATTGGTGGCGTAAGCAAAAGCGGTGACCGCTATGTCGACCACACCATGTTCGATATGGTGCAGTCGCT +GACCATTGCCGACAGCCTTAAGTTTGGTAAAGCGGTGCTGAATAAGCTCGGTAAAATCAACAAGCTGCAT +AAAAATCAAGTTGAACAGGCCGGGTTTGCCGTACTAAAGGCACCAGATATTCCCTCCATTCTGGTCGAAA +CGGCGTTTATCAGTAACGTTGAGGAAGAGCGTAAACTGAAAACGGCGACTTTCCAGCAGGAAGTTGCGGA +GTCTATTCTTGCGGGAATTAAAGCGTATTTTGCCGATGGGGCGACGCTGGCGAGAAGGGGATAA +>test.0417.00002.0002b_00027 519 NA | NA | NA | ID=2_19;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.526 | NA +GTGGTAAAGGAACGTAAAACCGAGCTGGTCGAGGGATTCCGCCATTCGGTTCCCTATATCAATACCCACC +GGGGAAAAACGTTTGTCATCATGCTCGGCGGTGAAGCCATTGAGCATGAGAATTTCTCCAGTATCGTTAA +TGATATCGGGTTGTTGCACAGCCTCGGCATCCGTCTGGTGGTGGTCTATGGCGCACGTCCGCAGATCGAC +GCAAATCTGGCTGCACATCACCACGAACCGCTGTATCACAAGAATATACGTGTGACCGACGCCAAAACAC 
+TGGAACTGGTGAAGCAGGCAGCGGGAACATTGCAACTGGATATTACTGCTCGCCTGTCGATGAGTCTCAA +TAACACACCGCTGCAGGGCGCGCATATCAACGTCGTCAGTGGTAATTTTATTATTGCCCAGCCGCTGGGC +GTCGATGACGGCGTGGATTACTGTCATAGCGGGCGTATCCGGCGGATTGATGAAGACGCGATCCATCGTC +AACTGGACAGCGGTGCAATAGTGCTAATG +>test.0417.00002.0003b_00028 810 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.520 | NA +CCGGTCGCTGTTTCGGTCACTGGCGAGAGCTTTAATCTGACCTCGGAAGAGATTGCCACTCAACTGGCCA +TCAAACTGAAAGCTGAAAAAATGATTGGTTTTTGCTCTTCCCAGGGCGTCACTAATGACGACGGTGATAT +TGTCTCCGAACTTTTCCCTAACGAAGCGCAAGCACGGGTAGAAGCCCAGGAAGAGAAAGGCGATTACAAC +TCCGGTACGGTGCGCTTTTTGCGTGGCGCAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGCTGTCATTTAA +TCAGTTATCAGGAAGATGGCGCGCTGTTGCAAGAGTTGTTCTCACGCGACGGTATCGGTACGCAGATTGT +GATGGAAAGCGCCGAGCAGATTCGTCGCGCAACAATCAACGATATTGGCGGTATTCTGGAGTTGATTCGC +CCGCTGGAGCAACAAGGTATTCTGGTACGCCGTTCTCGCGAGCAGCTGGAGATGGAAATCGACAAATTCA +CCATTATTCAGCGCGATAACACGACTATTGCCTGCGCCGCGCTCTATCCGTTCCCGGAAGAGAAGATTGG +GGAAATGGCCTGTGTGGCAGTTCACCCGGATTACCGCAGTTCATCACGGGGCGAGGTTCTGCTGGAACGC +ATTGCCGCTCAGGCGAAGCAGAGCGGCTTAAGCAAATTGTTTGTGCTGACCACGCGCAGTATTCACTGGT +TCCAGGAACGTGGATTTACCCCAGTGGATATTGATTTACTGCCCGAGAGCAAAAAGCAGTTGTACAACTA +CCAGCGTAAATCCAAAGTTTTGATGGCGGATTTAGGGTAA +>test.0417.00002.0003i_00029 1827 NA | NA | NA | ID=3_2;partial=00;start_type=ATG;rbs_motif=AGGAGG;rbs_spacer=3-4bp;gc_cont=0.549 | NA +ATGAAATTGCAAAAGCAATTACTGGAAGCTGTGGAGCACAAACAGCTACGCCCGCTGGACGTGCAGTTTG +CCCTGACCGTGGCGGGAGATGAACATCCTGCCGTCACCCTCGCGGCGGCACTATTAAGTCATGATGCCGG +AGAGGGACACGTTTGTTTGCCGCTTTCACGACTGGAAAATAACGAGGCATCGCATCCGCTGTTGGCGACC +TGTGTCAGTGAAATCGGTGAGCTACAAAATTGGGAAGAATGCTTGCTGGCTTCACAAGCGGTCAGCCGGG +GAGATGAACCAACGCCGATGATCCTCTGTGGCGATCGTCTTTATTTGAATCGCATGTGGTGTAACGAGCG +CACAGTGGCACGCTTTTTCAACGAAGTGAATCATGCCATTGAGGTTGATGAAGCTCTACTGGCGCAAACC +CTGGACAAACTTTTTCCAGTAAGCGATGAAATTAACTGGCAAAAAGTTGCGGCGGCAGTGGCGCTGACAC +GGCGGATCTCGGTGATTTCCGGTGGTCCTGGCACCGGTAAAACGACCACCGTAGCGAAGTTACTGGCAGC +GTTAATTCAAATGGCCGACGGCGAACGCTGCCGTATCCGTCTGGCTGCACCAACGGGTAAAGCTGCCGCG 
+CGCTTAACCGAATCTCTCGGCAAGGCTTTGCGACAATTACCGCTGACCGATGAACAAAAGAAACGCATTC +CGGAAGATGCCAGCACTTTGCACCGATTGCTGGGTGCGCAGCCGGGTAGCCAGCGTTTACGTCATCATGC +CGGTAACCCGCTGCATCTTGATGTGCTGGTGGTAGATGAAGCGTCAATGATCGATCTTCCTATGATGTCG +AGACTGATCGACGCCTTGCCCGATCATGCGCGAGTGATCTTTCTCGGCGATCGTGATCAACTGGCCTCGG +TTGAGGCTGGGGCTGTGCTGGGCGATATCTGCGCTTATGCCAACGCGGGCTTTACCGCCGAGCGTGCCGG +GCAGTTGAGCCGCCTGACGGGAAGCCACGTTCCGGCAGGAACTGGCACAGAAGCGGCATCTTTGCGCGAC +AGCCTCTGCCTGCTGCAAAAAAGCTATCGTTTCGGCAGCGATTCTGGCATTGGTCAGTTAGCTGCGGCGA +TTAACCGTGGTGATAAAACGGCAGTGAAAACCGTTTTTCAGCAGGATTTTACTGATATCGAAAAACGGCT +TTTACAGAGTGGCGAAGATTATATTGCGATGCTTGAGGAAGCTCTTGCGGGTTACGGGCGTTATCTGGAT +CTGCTGCAAGCGCGTGCCGAGCCGGATTTAATCATTCAGGCGTTCAATGAGTACCAGCTTTTGTGCGCCC +TGCGGGAAGGGCCGTTTGGCGTGGCTGGACTGAATGAGCGAATTGAGCAGTTTATGCAACAGAAGCGCAA +AATTCATCGTCATCCGCACTCTCGTTGGTACGAAGGCCGACCAGTGATGATTGCCCGTAATGACAGCGCG +CTTGGGTTGTTTAATGGCGATATTGGTATTGCGCTGGATCGCGGGCAGGGGACGCGCGTCTGGTTTGCGA +TGCCGGACGGCAATATTAAGTCTGTGCAACCGAGTCGCCTGCCAGAGCACGAAACGACGTGGGCGATGAC +GGTACATAAATCGCAGGGATCGGAGTTCGACCATGCGGCGTTGATTTTACCGAGTCAACGCACGCCGGTA +GTAACGCGAGAGCTGGTTTACACCGCGGTGACCCGCGCGCGTCGCCGTCTGTCGCTGTATGCCGATGAGC +GCATATTAAGTGCGGCAATCGCCACTCGTACTGAGCGGCGCAGTGGTCTGGCGGCGTTGTTTAGTTCACG +GGGATAA +>test.0417.00002.0003i_00030 3543 NA | NA | NA | ID=3_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.544 | NA +ATGAGTGATGTCGCCGAGACACTAGATCCTTTGCGCTTGCCCTTACAGGGCGAGCGCCTGATTGAAGCCT +CTGCCGGCACAGGCAAAACCTTTACGATTGCGGCGCTCTATTTGCGCCTGTTACTTGGACTAGGCGGTTC +TGCCGCCTTTCCCCGCCCGCTGACCGTTGAAGAACTGCTGGTGGTGACCTTTACCGAGGCTGCTACGGCA +GAATTGCGTGGTCGTATCCGTAGCAATATCCACGAGTTGCGCATCGCCTGTCTGCGTGAAACCACCGACA +ATCCACTGTACAAACGCCTGCTGGAAGAGATCGACGATAAAGCGCAAGCCGCGCAGTGGTTGTTGTTAGC +CGAGCGGCAGATGGATGAAGCGGCAGTCTTTACTATTCACGGCTTTTGCCAGCGCATGCTCAACCTGAAT +GCCTTTGAATCCGGCATGCTGTTTGAGCAGCAGCTGATTGAAGATGAGTCTCTGCTACGCTACCAGGCCT +GCGCCGATTTCTGGCGTCGCCACTGCTACCCGCTGCCGCGTGAAATTGCCCAGGTCGTCTTTGAAACCTG 
+GAAAGGGCCGCAGGCGTTGCTGCGCGATATTAATCGTTATCTGCAAGGCGAAGCGCCGGTTATCAAAGCA +CCGCCCCCCGATGATGAAACGCTGGCTTCCCGCCACGCGCAAATTGTGGCGCGTATTGATGCCGTAAAAC +AGCAGTGGCGCGACGCAGTGGGTGAACTGGATGCGCTGATCGAATCTTCTGGTATTGATCGACGCAAGTT +TAACCGTAGCAATCAGGCTAAATGGATCGAGAAGATCAGCGCCTGGGCAGAAGAAGAGACCAACAGCTAT +CAGTTGCCGGAGTCGCTGGAAAAATTCTCTCAGCGTTTCTTAGAAGATCGCACGAAAGCCGGGGGGGAAA +CCCCGCGACATCCACTGTTTGAGGCGATCGAACAACTGCTTGCAGAACCATTGTCGATCCGCGATCTGGT +GATCACTCGCGCATTGGCTGAGATCCGCGAAACAGTAGCGCGTGAAAAACGCCGCCGTGGCGAATTGGGT +TTTGATGACATGTTAAGTCGGCTCGATTCCGCGCTGCGTAGTGAAAGCGGCGAGGTATTGGCAGCGGCGA +TCCGTACGCGATTCCCGGTGGCAATGATCGATGAATTTCAGGATACCGACCCCCAACAGTATCGAATTTT +TCGCCGTATCTGGCACCATCAGCCGGAAACCGCATTGTTGCTGATTGGCGACCCGAAACAGGCCATATAT +GCATTCCGGGGTGCGGATATCTTCACTTATATGAAGGCGCGTAGCGAAGTTCATGCTCACTACACCTTAG +ATACCAACTGGCGTTCCGCACCGGGAATGGTGAACAGCGTTAACAAACTTTTCAGCCAGACTGATGACGC +GTTCATGTTTCGTGAAATACCGTTTATTCCTGTGAAATCTGCCGGCAAAAATCAGGCGTTACGTTTTGTA +TTTAAAGGTGAAACGCAGCCTGCGATGAAAATGTGGCTGATGGAAGGCGAAAGCTGCGGCGTTGGCGACT +ATCAAAGTACCATGGCGCAGGTATGTGCTGCGCAAATCCGCGACTGGCTACAAGCCGGGCAACGCGGCGA +AGCGTTGCTGATGAACGGCGACGATGCGCGTCCGGTGCGTGCTTCGGACATCAGTGTGCTGGTGCGCAGC +CGCCAGGAGGCCGCTCAGGTGCGCGATGCCTTAACGCTGCTGGAAATCCCTTCCGTTTACCTTTCGAACC +GCGACAGTGTTTTTGAAACTCTGGAAGCACAGGAGATGCTTTGGCTGTTGCAGGCGGTGATGACGCCCGA +ACGTGAGAACACCCTGCGCAGTGCGCTGGCAACGTCAATGATGGGGCTGAATGCGCTGGATATTGAAACG +CTGAATAATGACGAACATGCGTGGGATGCGGTCGTCGAAGAGTTCGATGGTTATCGGCAAATCTGGCGCA +AACGTGGCGTTATGCCGATGCTGCGGGCGCTGATGTCGGCGCGTAACATTGCAGAAAACTTGCTGGCAAC +GGCAGGCGGTGAGCGGCGTCTTACCGATATCTTGCATATCAGCGAACTGCTACAAGAAGCCGGAACGCAG +CTGGAAAGTGAACATGCGCTGGTACGCTGGTTATCGCAACATATCCTCGAGCCAGACAGTAATGCCTCCA +GCCAACAAATGCGCCTCGAAAGTGATAAACATCTGGTGCAGATTGTCACGATACACAAATCAAAAGGGCT +GGAATATCCGCTGGTCTGGTTGCCATTTATTACCAATTTCCGCGTCCAGGATCAGGCGTTTTATCACGAT +CGCCACTCGTTTGAGGCCGTTCTGGATCTTAATGCTGCGCCAGAAAGCGTCGACCTCGCGGAGGCCGAAC +GTCTGGCGGAAGATCTGCGTTTACTTTACGTGGCGCTGACGCGTTCGGTTTGGCATTGCAGTCTCGGCGT 
+TGCACCGCTGGTGCGCCGTCGTGGCGATAAAAAAGGTGATACCGACGTCCACCAAAGTGCGCTCGGGCGT +TTGCTGCAAAAAGGAGAACCGCAAGATGCGGCAGGGCTTCGTACCTGCATTGAAGCGTTGTGCGATGATG +ATATTGCCTGGCAAACGGCACAAATTGGTGATAACCAGCCCTGGCAGGTTAATGATGCATTAACTGCAGA +ACTGAATGCGAGGACGCTACAACGATTGCCCGGCGATAACTGGCGTGTCACCAGCTACTCCGGTTTGCAG +CAGCGTGGTCACGGTATCGCTCAGGATCTGATGCCACGGCTGGATGTTGATGCCGCAGGCGTGGTCAGCG +TCGTTGAAGAACCGACGTTAACACCGCATCAGTTCCCGCGCGGTGCGTCACCGGGGACATTCTTGCACAG +TTTGTTTGAAGACCTCGATTTTACCCAGCCGGTTGACCCGAACTGGGTACAGGAAAAACTGGAGCTCGGT +GGCTTTGAACCGCAGTGGGAACCGGTGTTGACTGAGTGGATCACGGCTGTCCTCCAGGCACCTCTCAATG +AAACGGGTGTTAGCCTGAATCAGCTTTCCGATCGCGATAAACAGGTGGAGATGGAGTTTTACCTGCCAAT +TAGCGAACCGCTCATCGCCAGCCAGCTTGATGCACTAATTCGCCAGTTTGACCCGCTATCCGCTGGCTGC +CCGCCGCTGGAGTTCATGCAGGTACGTGGCATGTTAAAAGGCTTTATCGATCTGGTGTTCCGCCACGAAG +GGCGTTATTACCTGCTCGACTATAAATCCAACTGGTTGGGTGAAGACAGTTCGGCTTACACCCAACAGGC +TATGGCAGCGGCAATGCAGGCACACCGCTATGATCTGCAATATCAGCTTTATACCCTGGCGCTGCACCGT +TATCTGCGCCATCGTATTGCTGATTACGACTATGAGCGCCACTTTGGCGGCGTTATTTATCTGTTCCTGC +GTGGCGTTGATAAAGAACATCCGCAACAAGGGATCTACGCGACCCGACCCAACGCCGGGTTGATTGACCT +GATGGATGAGATGTTTGCCGGTATGACCCTGGAGGAGGCGTAA +>test.0417.00002.0003i_00031 2889 NA | NA | NA | ID=3_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.510 | NA +ATGCCCCGCAGCATCTGGTTCAAAGCATTATTGTTGTTTGTTGCCCTCTGGGCACCCTTAAGTCAGGCAG +AAACGGGATGGCAGCCGATTCAGGAAACCATCCGTAAAAGTGATAAAGATAACCGCCAGTATCAGGCTAT +ACGTCTGGATAACGGTATGGTGGTCTTACTGGTTTCTGATCCGCAGGCAGTTAAATCGCTCTCGGCGCTG +GTGGTGCCCGTTGGGTCGCTGGAAGATCCTGAGGCGTACCAGGGGCTGGCACATTACCTTGAACATATGA +GTCTGATGGGGTCGAAAAAGTATCCGCAGGCTGACAGTCTGGCCGAATATCTCAAAATGCACGGCGGCAG +TCACAATGCCAGCACGGCACCGTATCGCACGGCTTTCTATCTGGAAGTTGAGAACGACGCCTTGCCCGGT +GCGGTAGACCGCCTGGCCGATGCTATTGCAGAACCCTTGCTCGACAAGAAATACGCCGAACGTGAACGTA +ATGCAGTGAATGCCGAATTAACCATGGCGCGTACGCGTGACGGGATGCGCATGGCACAGGTCAGCGCAGA +AACCATTAACCCGGCACACCCCGGTTCAAAGTTTTCTGGTGGTAACCTCGAAACTTTAAGCGACAAACCA +GGTAATCCGGTACAGCAGGCGCTGAAAGATTTCCACGAGAAGTACTATTCCGCCAATCTGATGAAGGCGG 
+TTATTTACAGCAATAAACCGTTGCCGGAGTTGGCGAAAATGGCGGCGGACACCTTTGGTCGCGTGCCGAA +CAAAGAGAGCAAAAAACCGGAAATCACCGTGCCGGTAGTCACCGACGCGCAAAAGGGCATTATCATTCAT +TACGTCCCGGCGTTGCCGCGTAAAGTTCTGCGCGTTGAGTTTCGCATCGATAACAATTCAGCGAAGTTCC +GTAGTAAAACGGATGAATTGATTACCTATCTGATTGGTAATCGCAGCCCTGGTACACTTTCTGACTGGCT +GCAAAAGCAGGGATTAGTTGAGGGCATTAGCGCCAATTCCGATCCTATCGTCAACGGCAACAGCGGCGTA +TTAGCGATCTCTGCGTCTTTAACCGATAAAGGTCTGGCGAATCGCGATCAGGTTGTGGCGGCCATTTTTA +GCTACCTCAATCTGTTACGTGAAAAAGGGATCGATAAACAATACTTCGATGAACTGGCGAATGTGCTGGA +TATCGACTTCCGTTATCCGTCAATCACCCGTGATATGGATTACGTCGAATGGCTGGCTGATACCATGATT +CGCGTTCCTGTTGAGCATACACTGGATGCAGTCAATATTGCCGATCGGTACGATGCTAAAGCAGTAAAAG +AACGTCTGGCGATGATGACGCCGCAGAATGCGCGTATCTGGTATATCAGCCCGAAAGAGCCGCACAACAA +AACGGCTTACTTTGTCGATGCGCCGTATCAGGTCGATAAAATTAGCGCACAAACTTTCGCGGACTGGCAG +AAAAAAGCCGCCAATATTGCGCTCTCCTTACCGGAGCTTAACCCCTATATTCCTGACGATTTCTCGCTGA +TTAAGTCAGAGAAGAAATACGACCATCCAGAGTTGATTGTTGATGAGTCGAATCTGCGCGTGGTGTATGC +GCCAAGCCGTTATTTTGCCAGTGAGCCCAAAGCTGATGTCAGCCTGATTTTGCGTAATCCGAAAGCCATG +GACAGCGCCCGCAATCAGGTGATGTTTGCGCTCAATGATTATCTCGCAGGGCTGGCGCTTGATCAGTTAA +GCAACCAGGCGTCGGTTGGTGGCATAAGTTTTTCCACCAATGCTAACAACGGCCTTATGGTTAATGCCAA +TGGTTACACTCAGCGCCTGCCGCAGCTGTTCCAGGCTCTGCTGGAGGGCTACTTTAGCTATACCGCTACG +GAAGATCAGCTTGAGCAGGCGAAGTCCTGGTATAACCAGATGATGGATTCCGCAGAAAAGGGCAAAGCGT +TTGAGCAGGCGATTATGCCCGCGCAGATGCTCTCGCAAGTGCCGTACTTCTCGCGAGATGAACGGCGCAA +AATTTTGCCCTCCATTACGTTGAAAGAGGTGCTGGCCTATCGCGACGCCTTAAAATCAGGGGCTAGACCA +GAGTTTATGGTTATCGGCAACATGACTGAAGCCCAGGCAACAACGCTGGCACGCCATGTGCAAAAACAGT +TGGGCGCTGATGGTTCAGAGTGGTGTCGTAACAAAGATGTCGTGGTCGATAAAAAACAATCCGTCATCTT +TGAAAAAGCTGGTAACAGCACCGACTCCGCACTGGCAGCGATATTTGTACCGACTGGCTACGATGAATAC +ACCAGCTCAGCCTATAGCTCTCTGTTGGGGCAGATCGTACAGCCGTGGTTCTACAATCAGTTGCGTACCG +AAGAACAGTTGGGCTATGCCGTGTTTGCGTTTCCAATGAGCGTGGGGCGTCAGTGGGGCATGGGCTTCCT +TTTGCAAAGCAATGATAAACAGCCTTCATTCTTGTGGGAGCGTTACAAGGCGTTTTTCCCAACCGCAGAG +GCAAAATTGCGGGCGATGAAGCCAGAGGAGTTTGCGCAAATCCAGCAGGCGGTAATTACTCAGATGCTGC 
+AGGCACCGCAAACGCTCGGCGAAGAAGCATCGAAGTTAAGTAAAGATTTCGATCGCGGCAATATGCGCTT +CGATTCGCGTGATAAAATCGTGGCCCAGATAAAACTGCTGACGCCGCAAAAACTTGCTGATTTCTTCCAT +CAGGCGGTGGTCGAGCCGCAAGGTATGGCTATTCTGTCGCAGATTTCCGGCAGCCAGAACGGGAAAGCCG +AATATGTGCATCCTGAAGGCTGGAAAGTGTGGGAGAACGTCAGCGCGTTGCAGCAAACAATGCCCCTGAT +GAGTGAAAAGAATGAGTGA +>test.0417.00002.0003i_00032 3369 NA | NA | NA | ID=3_5;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.535 | NA +ATGTTAAGGGTCTACCATTCCAATCGTCTGGACGTGCTGGAAGCGTTGATGGAGTTTATTGTCGAACGCG +AACGGCTGGACGATCCTTTCGAACCAGAGATGATTCTGGTGCAAAGTACCGGTATGGCACAGTGGCTGCA +AATGACCCTGTCGCAAAAGTTTGGTATTGCGGCAAACATTGATTTTCCGCTGCCAGCGAGCTTTATCTGG +GATATGTTCGTCCGGGTGTTACCGGAGATCCCCAAAGAGAGCGCCTTTAACAAACAGAGCATGAGCTGGA +AACTGATGACTCTGCTGCCGCAACTGTTGGAGCGCGAAGACTTTACCCTGTTGCGGCATTATCTGACTGA +CGATAGTGACAAGCGAAAACTGTTCCAGCTTTCTTCAAAAGCGGCGGACCTGTTTGACCAGTATCTGGTC +TATCGTCCGGACTGGCTGGCACAGTGGGAAACAGGACATCTGGTAGAAGGGTTGGGAGAAGCACAGGCCT +GGCAAGCGCCGTTGTGGAAGGCGTTGGTGGAATATACCGACGAACTTGGGCAACCGCGCTGGCACCGCGC +CAATCTCTATCAGCGCTTTATCGAAACGCTGGAGTCCGCGACGACCTGCCCGCCGGGGTTACCTTCGCGC +GTCTTTATATGCGGTATTTCCGCGTTACCGCCTGTTTATCTCCAGGCGCTACAGGCGCTGGGTAAACATA +TTGAAATCCATCTCCTGTTTACCAACCCCTGCCGTTATTACTGGGGCGACATTAAAGATCCAGCTTATCT +GGCGAAACTACTGACTCGCCAGCGCCGACACAGTTTTGAAGATCGCGAATTACCGCTATTTCGCGACAGC +GAAAATGCCGGGCAGCTCTTTAACAGCGATGGTGAACAGGATGTCGGCAACCCGCTGCTGGCTTCATGGG +GCAAGCTTGGGCGCGACTACATTTATCTCCTTTCTGACCTGGAGAGCAGCCAGGAGCTGGACGCTTTTGT +CGATGTGACGCCAGATAACCTGCTGCATAATATTCAGTCTGACATTCTGGAACTGGAAAACCGCGCCGTT +GCTGGTGTGAACATCGAAGAGTTTTCCCGTAGCGATAACAAACGCCCGCTTGATCCACTGGATAGCAGTA +TCACCTTCCACGTTTGCCATAGCCCGCAGCGTGAAGTTGAAGTTTTACACGATCGCCTGCTGGCGATGCT +GGAGGAAGACCCGACACTTACTCCGCGCGACATCATCGTGATGGTGGCTGATATCGACAGCTACAGTCCG +TTTATTCAGGCTGTGTTTGGTAGTGCACCTGCGGATCGTTACCTGCCTTACGCCATTTCCGACCGTCGGG +CGCGGCAGTCGCATCCTGTACTTGAAGCGTTTATCAGCCTGTTATCGCTGCCAGACAGCCGCTTTGTGTC +GGAAGACGTGCTGGCATTACTGGATGTGCCGGTGCTGGCAGCGCGGTTTGACATCACCGAAGAAGGGCTG 
+CGTTATTTACGTCAGTGGGTCAACGAATCCGGCATTCGTTGGGGGATAGATGACGACAACGTTCGCGAGC +TGGAACTTCCCGCTACCGGTCAACACACCTGGCGGTTTGGCCTGACGCGCATGTTGCTGGGCTACGCGAT +GGAGAGCGCGCAGGGCGAGTGGCAATCGGTTCTACCTTATGATGAATCGAGCGGCTTAATTGCAGAACTG +GTGGGGCATCTGGCTTCACTGCTAATGCAGCTAAATATCTGGCGTCGCGGGCTGGCGCAGGAGCGTCCGC +TGGAAGAGTGGTTGCCGGTTTGTCGCGATATGCTCAACGCCTTTTTCCTGCCGGATGCGGAAACCGAAGC +GGCGATGACGCTGATCGAACAACAATGGCAGGCGATTATCTCCGAAGGTTTAGGCGCGCAGTATGGCGAC +GCGGTGCCGCTGTCACTATTGCGTGATGAACTGGCACTGCGCCTGGATCAAGAACGTATCAGCCAGCGTT +TTCTCGCCGGACCGGTTAACATTTGTACTCTGATGCCAATGCGTTCAATTCCGTTCAAAGTGGTTTGCCT +GCTGGGAATGAACGACGGCGTTTATCCACGTCAGCTTGCGCCATTGGGCTTTGATCTGATGAGCCAGAAA +CCGAAGCGTGGCGACCGTAGCCGTCGCGATGACGACCGCTATCTGTTCCTGGAAGCGTTAATTTCCGCGC +AGCAAAAACTCTATATCAGCTATATTGGGCGTTCCATTCAGGATAACAGTGAACGTTTCCCGTCGGTACT +GGTGCAGGAACTGATCGACTACATCGGGCAAAGCCATTATCTACCGGGCGATGAAGCGCTTAACTGTGAT +GAAAGCGAGGCAAGGGTAAAAGCGCATCTTACTTGCCACCATACCCGGATGCCGTTTGACCCGCAAAACT +ACCAGCCCGGTAACTTACAAAGCTATGCGCGCGAGTGGCTACCTGCGGCCAGCCAGGCTGGTAAAGCACA +TTCTGAATTTGTTCAGCCGCTGCCATTTACCTTACCGGAAACCGTGCCGCTGGAAACGCTACAACGATTC +TGGGCACATCCGGTGCGGGCGTTTTTCCAGATGCGTTTGCAGGTGAACTTCCGTACCGAAGACAGCGAAA +TTCCCGACACTGAACCTTTTATTCTTGAAGGGCTTAGTCGTTATCAAATCAACCAGCAGTTATTAAATGT +ACTGGTTGAGCAGGATGATGCCGAACGCTTGTTCCGCCGATTCCGGGCGGCAGGTGATTTGCCGTATGGT +GCCTTTGGTGAAATTTTCTGGGAAACGCAGTGTCAGGAGATGCAGCAGCTTGCCGACAGAGTCATTGCCT +GTCGCCAGCCAGGGCAGAGTATGGAGATTGATCTCGCCTGCAACGGTGTGCAGATAACTGGCTGGTTGCC +GCAGGTGCAGCCGGATGGCCTGTTGCGCTGGTGTCCCTCTTTATTAAGTGTGGCGCAGGGAATGCAACTT +TGGCTGGAACACCTTGTCTACTGTGCCAGCGGTGGTAATGGTGAAAGTCGCCTTTTTCTACGCAAAGACG +GCGAGTGGCGTTTTCCGCCGCTTGCAGCCGAACAGGCTTTGCATTACCTCTCACAACTGATTGAGGGGTA +TCGTGAAGGAATGTCCGCGCCATTGCTGGTGTTACCTGAAAGTGGCGGCGCGTGGCTAAAAACCTGTTAT +GACGCGCAAAACGATGCCATGCTGGATGACGATTCCACGTTGCAAAAAGCCCGTACGAAATTCCTTCAGG +CTTACGAAGGCAACATGATGGTGCGTGGCGAAGGTGATGATATCTGGTATCAACGGCTCTGGCGGCAATT +AACACCAGAGACAATGGAGGCTATCGTTGAACAGTCGCAACGTTTCCTGTTACCGCTGTTTCGCTTTAAT +CAGTCATGA +>test.0417.00002.0003i_00033 324 NA | NA | 
NA | ID=3_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.543 | NA +ATGTCAGCTTCCCTGAGGAATCAACAAGGCTTTAGTCTGCCGGAGGTAATGTTGGCGATGGTGTTGATGG +TGATGATTGTCACTGCGTTATCGGGTTTCCAGCGAACATTAATGAACAGTCTTGCCAGCAGAAACCAGTA +CCAACAGCTCTGGCGGCATGGCTGGCAGCAAACGCAACTGCGCGCGATTTCGCCACCTGCTAACTGGCAG +GTCAACCGAATGCAGACATCGCAGGCGGGATGTGTCAGCATCAGCGTTACGCTAGTTTCACCCGGGGGCA +GAGAAGGCGAGATGACCCGCCTGCATTGCCCGAATCGTCAGTAG +>test.0417.00002.0003i_00034 408 NA | NA | NA | ID=3_7;partial=00;start_type=GTG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.527 | NA +GTGAACCGCGAAAAGGGAGTTTCGTCACTGGCTCTGGTCCTGATGCTGCTGATTTTGGGTAGCTTGCTAT +TGCAAGGAATGAGTCAGCAGGATCGCAGTTTTGCTTCTCGCGTGAGCATGGAAAGTCAGTCATTGAGCCG +CCAGGCCATCGTTCAGTCGGCGCTGGAGTGGGGAAAAATGCACTCCTGGCAGACGCAGCCCGCAGTTCAG +TGCTTACTGTATGCTGCCACCGGTGCCCGGGTTTGTCTGCGTTTACTGGCAGATAATGAAGCCTTATTGA +TTGCTGGTTATGAAGGCGTTTCGTTGTGGCGAACAGGCGAAGTCATCGATGGAAACATTGTTTTTTCGCC +ACGCGGCTGGAGCGATTTTTGTCCGCTGAAAGAGAGGGCGTTATGTCAGCTTCCCTGA +>test.0417.00002.0003i_00035 564 NA | NA | NA | ID=3_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.532 | NA +ATGCCTGTAAAAGAGCAAGGTTTTTCTCTGCTGGAAGTGTTGATTGCTATGGCGATCAGTAGCGTATTGT +TGCTGGGGGCTGCACGCTTTCTGCCTGCGTTACAGCGTGAAAGTTTAACGAGCACCCGTAAACTGGCGCT +GGAAGATGAAATCTGGCTGCGGGTATTTACCGTCGCGAAGCATCTCCAGAGGGCGGGTTATTGCCATGGC +AGCTGTACGGGCGAAGGGCTGGAAATTGTCGGACAGGGTGACTGTGTCATTGTGCAGTGGGATGCGAACA +GTAACGGTATCTGGGATCGCGAACCGGTAAAAGAGTCCGACCAGATTGGATTTCGTCTGAAGGAGCATGT +GCTGGAAACGCTACGCGGTGCGACATCCTGTGAAGGTAAGGGCTGGGATAAAGTCACTAATCCGGATGCC +ATCATTATCGACACTTTTCAGGTCGTACGTCAGGATGTCAGCGGCTTCTCGCCGGTGTTGACGGTTAATA +TACACGCTGCCAGCAAGGCTGATCCGCAAACCGTGGTGGATGCCAGCTATAGCGTGACAGGAGCCAACCT +GTGA +>test.0417.00002.0003i_00036 504 NA | NA | NA | ID=3_9;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.544 | NA +ATGAAAACACAACGTGGTTATACGCTGATTGAAACGCTGGTCGCGATGCTTATTCTGGTCATGCTAAGCG +CAAGTGGGCTCTATGGCTGGCAATACTGGCAGCAGTCGCAACGGCTTTGGCAAACCGCCAGCCAGGCGCG 
+GGACTATTTGCTCTATTTACGTGAAGATGCCAACTGGCATAACCGCGACCACAGTATCAGTCTTATCAGG +GAGGGGACGTTATGGTGCCTTGTGAGTTCCGTTGCTGGGGCGAATACCTGTCATGGCAGTTCCGTTGCTG +GGGCGAATACCTGTCATGGCAGTTCACCATTGGTCTTTGTGCCGCGCTGGCCCGAAGTCGAAATGAGCGA +CCTGACACCTTCGCTTGCTTTCTTTGGCCTGCGCAATACCGCATGGGCCGGGCATATTCGCTTCAAAAAC +TCAACGGGCGAGTGGTGGCTAGTGGTTTCGCCGTGGGGAAGACTCCGGCTTTGTCAGCAAGGAGAAACAG +AAGGATGCCTGTAA +>test.0417.00002.0003i_00037 795 NA | NA | NA | ID=3_10;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.516 | NA +ATGAAACAGTATTTAGAACTGATGCAAAAAGTGCTCGACGAAGGCACACAGAAAAACGACCGTACCGGAA +CCGGAACGCTTTCCATTTTTGGTCATCAGATGCGTTTTAACCTGCAGGATGGATTCCCGCTGGTGACAAC +TAAACGTTGCCACCTGCGTTCCATCATCCACGAACTGCTGTGGTTCCTGCAGGGCGACACTAACATTGCT +TATCTACACGAAAACAATGTCACCATCTGGGACGAATGGGCCGATGAAAACGGCGACCTCGGGCCAGTGT +ATGGTAAACAGTGGCGCGCCTGGCCAACGCCGGATGGTCGTCATATTGACCAGATCACTACGGTACTGAA +CCAGCTGAAAAACGACCCGGATTCCCGCCGCATTATTGTTTCAGCGTGGAACGTAGGCGAACTGGATAAA +ATGGCGCTGGCACCGTGCCATGCATTCTTCCAGTTCTATGTGGCAGACGGCAAACTCTCTTGCCAGCTTT +ATCAGCGCTCCTGTGACGTCTTCCTCGGCCTGCCGTTCAACATTGCCAGCTACGCGTTACTGGTGCATAT +GATGGCGCAGCAGTGCGATCTGGAAGTGGGTGATTTTGTCTGGACCGGTGGCGACACGCATCTCTACAGC +AACCATATGGATCAAACTCATCTGCAATTAAGCCGCGAACCGCGTCCGCTGCCGAAGTTGATTATCAAAC +GTAAACCCGAATCCATCTTCGACTACCGTTTCGAAGACTTTGAGATTGAAGGATACGATCCACATCCGGG +CATTAAAGCGCCGGTGGCTATCTAA +>test.0417.00002.0003i_00038 876 NA | NA | NA | ID=3_11;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.525 | NA +ATGACCAGTAGCTATCTGCATTTTCCGGAGTTTGATCCGGTCATTTTCTCAATAGGACCCGTGGCGCTTC +ACTGGTACGGCCTGATGTATCTGGTGGGTTTCATTTTTGCAATGTGGCTGGCAACACGACGGGCGAATCG +TCCGGGCAGTGGCTGGACCAAAAATGAAGTTGAAAACTTACTCTATGCGGGCTTCCTCGGCGTCTTCCTC +GGTGGACGTATTGGTTATGTTCTGTTCTACAATTTCCCGCAGTTTATGGCCGATCCGCTGTATCTTTTCC +GTGTATGGGACGGCGGCATGTCCTTCCACGGCGGCCTGATTGGCGTTATCGTGGTGATGATTATCTTCGC +CCGCCGTACTAAACGTTCCTTCTTCCAGGTCTCTGATTTTATTGCCCCACTCATTCCGTTTGGTCTTGGT +GCCGGGCGTCTGGGCAACTTTATTAACGGTGAATTGTGGGGCCGCGTTGACCCGAACTTCCCGTTTGCCA 
+TGCTGTTCCCTGGCTCCCGTACAGAAGATATTTTGCTGCTGCAAACCAACCCGCAGTGGCAATCCATTTT +CGACACTTACGGTGTGCTGCCGCGCCACCCATCACAGCTTTACGAGCTGCTGCTGGAAGGTGTGGTGCTG +TTTATTATCCTCAACCTGTATATTCGTAAACCGCGCCCAATGGGAGCTGTCTCAGGCTTGTTCCTGATTG +GTTACGGCGCGTTTCGCATCATTGTTGAGTTTTTCCGCCAGCCCGACGCGCAGTTTACTGGTGCCTGGGT +GCAGTACATCAGCATGGGGCAAATTCTTTCCATCCCGATGATTGTCGCGGGTGTGATCATGATGGTCTGG +GCATATCGTCGCAGCCCACAGCAACACGTTTCCTGA +>test.0417.00002.0003i_00039 2247 NA | NA | NA | ID=3_12;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.536 | NA +ATGCTCACTCGCCTGCGCGAAATAGTCGAAAAGGTAGCCAGCGCACCACGCCTGAATGAGGCGTTAAATA +TTCTGGTTACCGACATCTGTCTTGCGATGGATACCGAGGTCTGTTCGGTCTACCTGGCCGATCATGATCG +ACGTTGTTACTACCTGATGGCGACCCGGGGACTGAAAAAACCACGCGGTCGCACTGTAACGCTCGCGTTT +GATGAAGGGATCGTCGGCCTGGTTGGCAGGCTGGCGGAACCGATAAACCTTGCAGATGCGCAAAAGCACC +CCAGCTTCAAATACATCCCCTCCGTAAAAGAAGAACGTTTCCGCGCGTTTTTAGGCGTACCAATTATTCA +ACGTCGCCAGTTGCTTGGTGTACTGGTGGTACAGCAACGAGAGTTGCGCCAGTATGACGAAAGTGAAGAA +TCCTTCCTGGTGACGCTTGCCACCCAGATGGCAGCTATTCTTTCTCAGTCGCAGTTGACTGCCTTGTTTG +GGCAATATCGCCAGACGCGAATCCGTGCATTACCGGCAGCACCTGGTGTGGCGATTGCCGAAGGCTGGCA +GGATGCCACGTTACCTTTAATGGAACAGGTGTATCAGGCATCAACGCTGGATCCGGCTCTGGAACGCGAA +CGACTGACCGGGGCGTTGGAAGAGGCGGCTAACGAGTTTCGCCGCTATAGCAAACGCTTTGCTGCCGGTG +CACAAAAAGAAACGGCGGCTATTTTCGATCTTTACTCACACCTGCTTTCGGATACCCGGCTGCGTCGCGA +ATTGTTTGCCGAGGTTGATAAAGGCTCGGTGGCAGAGTGGGCGGTAAAAACGGTCATTGAAAAATTTGCC +GAACAGTTTGCCGCGCTAAGCGATAACTATCTCAAAGAGCGGGCTGGCGATTTACGTGCGCTGGGTCAGC +GATTGCTGTTTCATCTTGATGACGCTAATCAAGGGCCGAACGCCTGGCCGGAACGTTTCATTCTGGTGGC +AGATGAACTGTCAGCGACAACGCTTGCTGAGCTGCCCCAGGATCGCTTAGTCGGTGTTGTCGTGCGCGAT +GGCGCTGCCAACTCCCATGCTGCGATCATGGTACGTGCGCTGGGGATACCTACCGTGATGGGCGCGGATA +TTCAGCCTTCGGTACTGCATCGTCGGACGCTGATCGTCGATGGTTATCGCGGTGAATTGCTGGTCGATCC +GGAACCGGTACTGCTGCAAGAATATCAGCGGCTAATTAGTGAAGAGATCGAGCTTAGCCGTCTGGCGGAA +GATGACGTCAATTTACCCGCCCAGTTAAAAAGCGGCGAACGCATTAAAGTCATGCTCAATGCCGGTTTAA +GCCCGGAACATGAAGAAAAACTGGGCAGCCGTATTGATGGCATAGGACTTTATCGCACTGAAATCCCATT 
+CATGCTGCAAAGTGGTTTTCCGTCGGAAGAAGAACAGGTGGCGCAGTATCAGGGGATGCTGCAAATGTTT +AATGATAAACCCGTCACCTTGCGTACGCTGGATGTCGGAGCAGATAAGCAGCTGCCTTACATGCCGATCA +GCGAAGAGAATCCATGCCTGGGTTGGCGTGGGATTCGCATTACGCTCGATCAGCCGGAGATCTTCTTGAT +CCAGGTGCGGGCGATGCTGCGTGCTAATGCCGCTACGGGCAACCTGAATATTCTGTTGCCGATGGTCACA +AGCCTCGATGAAGTTGACGAAGCACGCCGCCTGATTGAACGTGCCGGACGTGAAGTCGAGGAGATGATCG +GTTACGAAATTCCCAAACCACGTATCGGCATCATGCTGGAAGTGCCGTCAATGGTATTTATGCTGCCGCA +TCTGGCAAAGCGGGTCGATTTCATCTCTGTTGGCACCAACGATCTGACTCAATACATCCTGGCCGTTGAT +CGCAACAATACCCGGGTGGCGAACATTTATGACAGTCTTCATCCTGCAATGTTACGAGCTCTGGCGATGA +TCGCCCGGGAAGCGGAAATACATGGAATCGATCTCCGTTTGTGCGGTGAAATGGCGGGCGATCCGATGTG +CGTGGCAATCCTCATTGGGCTTGGGTATCGCCATCTGTCTATGAACGGACGTTCTGTAGCGCGCGTAAAA +TACCTGCTGCGGCGCATTGATTTTGCTGAAGCAGAAAATCTTGCGCAGCGTAGTCTGGAAGCGCAACTGG +CGACCGAAGTTCGCCATCAGGTTGCAGCCTTTATGGAGCGTCGCGGCATGGGCGGGTTGATTCGCGGGGG +GTTATAG +>test.0417.00002.0003i_00040 531 NA | NA | NA | ID=3_13;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.493 | NA +GTGATTGATGACGATGGCTACCGCCCAAACGTAGGTATCGTGATTTGTAATCGCCAGGGGCAGGTAATGT +GGGCCCGGCGATTTGGTCAGCACTCCTGGCAATTTCCGCAAGGCGGAATCAACCCCGGAGAATCCGCAGA +GCAGGCGATGTACCGTGAATTGTTTGAAGAAGTAGGATTAAGCCGCAAAGACGTTCGAATCCTTGCTTCA +ACGCGTAACTGGTTGCGCTACAAATTACCGAAACGTTTGGTGCGTTGGGACACGAAGCCGGTTTGTATCG +GCCAAAAACAAAAATGGTTTCTCTTGCAGCTGGTGAGCGGCGATGCAGAAATCAATATGCAAACCAGCAG +TACACCAGAGTTTGACGGCTGGCGATGGGTAAGTTACTGGTATCCAGTCAGACAGGTGGTGTCATTTAAA +CGTGATGTCTACCGTAGGGTAATGAAAGAGTTCGCGAGTGTGGTGATGTCACTGCAGGAAAATACGCCAA +AACCACAAAACGCATCTGCTTATCGACGTAAAAGAGGTTAA +>test.0417.00002.0003i_00041 162 NA | NA | NA | ID=3_14;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.395 | NA +ATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGTGGATAACATGGTGTAAGATCCTGT +TTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCAGTGTTGCGCAACTCGATTACCGGAAACCTAAAAA +GCAATATAAATCAGAGAATTGA +>test.0417.00002.0003i_00042 690 NA | NA | NA | 
ID=3_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA +ATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAACAATTGTTAGCGCAAGCACAACAAC +TTTCTGGTTATACATTGGGAGAACTGGCGGCACTTGCCGGGCTGGTTACGCCGGAGAATTTAAAACGCGA +TAAGGGCTGGATTGGCGTGTTACTGGAGATCTGGCTAGGTGCCAGCGCAGGGAGTAAACCTGAGCAAGAT +TTTGCTGCTCTGGGCGTGGAACTTAAAACTATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACAT +TCGTTTGTGTTGCCCCGTTAACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACAAGCT +CAAACGCGTGCTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGCGTCGCGTAGGATCA +CCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCGAAGACTGGGAAGAATTAATGGATA +TGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTCGGCACGGGGAATATTTACAGATACGACCGAAAGC +AGCGAATGCGAAAGCGCTGACCGAAGCTATTGGTGCCCGGGGCGAACGGATTCTGACGCTGCCGCGCGGA +TTTTATTTGAAGAAGAATTTCACCAGTGCGCTACTGGCCCGTCATTTTCTGATCCAGTAG +>test.0417.00002.0003i_00043 714 NA | NA | NA | ID=3_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.503 | NA +ATGTTATTTGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTGCTGGAGATCG +TTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTTCCCACAGCACAACGTGCTCA +TGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGTCTGGCGCTGCTGGCATCCATCGCCTGGGTT +ACGCGCCTGACGAATCCGCTTTTTACAATATTCAGTCAGGAAATTTCCGCCCGTGATTTGATTCTGCTTC +TGGGTGGCTTGTTCCTTATCTGGAAAGCCAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGG +GCTGAAAACACGCGTTTCATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGC +CTCGACTCGGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCCGTGGTAATTG +CCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAGCGCCATCCTTCGGTAAAAAT +GCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTGATTCTGGAAAGTTTCGACATCCACGTACCG +AAAGGTTACATCTACTTCGCGATGTTCTTCTCTATTGCGGTTGAAAGCCTCAACCTGATTCGCAACAAAA +AGAATCCGCTCTGA +>test.0417.00002.0003i_00044 219 NA | NA | NA | ID=3_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.434 | NA +ATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGGTGTTCCAGTGATT +ACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAACCTGAAATTGATGATGATACCGG 
+GCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATGCAAATTAACCGTGATGATGTTTCGCAAATTATT +GAACGTTAA +>test.0417.00002.0003i_00045 1041 NA | NA | NA | ID=3_18;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.544 | NA +ATGCAATATCACCGTATACCCCACAGTTCGCTGGAAGTCAGCACGCTGGGGCTTGGCACGATGACGTTTG +GTGAACAGAACAGCGAAGCCGACGCCCACGCACAACTCGACTATGCCGTCGCTCAGGGCATTAACCTTAT +CGACGTTGCCGAAATGTACCCAGTACCTCCGCGCCCCGAAACTCAAGGGCTAACCGAAACCTACGTCGGC +AACTGGCTGGCGAAACATGGCAGCCGCGAAAAGTTAATTATCGCCTCCAAAGTGAGCGGACCGTCGCGCA +ATAATGACAAAGGCATCCGCCCGGATCAGGCGCTGGATCGGAAGAATATCCGCGAAGCGCTGCATGACAG +CCTCAAGCGTCTGCAGACTGATTACCTCGATCTTTATCAGGTGCACTGGCCGCAGCGCCCAACCAACTGC +TTCGGCAAACTCGGTTATAGCTGGACAGATTCTGCGCCTGCGGTTTCGCTGCTGGATACACTGGACGCAC +TGGCAGAGTACCAACGCGCGGGAAAAATTCGTTATATCGGCGTGTCGAACGAAACTGCATTTGGCGTAAT +GCGCTACCTGCATCTGGCGGACAAACACGATCTGCCGCGTATTGTCACCATTCAGAACCCCTACAGTCTG +TTAAACCGCAGTTTTGAAGTAGGTCTGGCAGAAGTCAGCCAGTATGAAGGGGTCGAACTGCTGGCCTATT +CGTGCCTGGGTTTCGGCACGCTGACCGGGAAATATCTCAACGGTGCAAAACCCGCTGGCGCACGTAATAC +GCTCTTTAGTCGGTTCACCCGCTATAGCGGTGAGCAAACGCAAAAAGCCGTCGCGGCGTATGTTGATATA +GCCAGACGTCATGGCCTGGATCCTGCACAGATGGCGCTCGCTTTTGTACGCCGTCAACCGTTTGTTGCCA +GCACTCTGCTGGGCGCAACCACGATGGAGCAGCTGAAAACTAACGTCGAAAGTTTGCATCTGGAGTTAAG +CGAAGACGTGTTGGCAGAAATTGAAGCGGTGCATCAGGTTTACACTTATCCGGCACCATAA +>test.0417.00002.0003i_00046 1194 NA | NA | NA | ID=3_19;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.553 | NA +ATGAGTGAGTCAGTGCACACTAACACTTCGTTGTGGTCGAAGGGGATGAAAGCGGTTATCGTGGCGCAGT +TTCTCTCTGCGTTTGGCGATAATGCGCTACTGTTTGCCACTCTGGCGTTACTGAAAGCGCAGTTCTATCC +GGAGTGGAGCCAGCCCATCCTGCAAATGGTGTTTGTAGGTGCTTACATTCTTTTTGCGCCGTTTGTCGGG +CAGGTGGCGGATAGCTTCGCCAAAGGCCGGGTGATGATGTTTGCCAACGGCCTGAAGCTACTGGGCGCAG +CCAGTATCTGCTTTGGTATCAATCCGTTTCTCGGCTATACGTTGGTGGGTGTTGGTGCTGCAGCCTATTC +ACCGGCGAAATACGGTATTCTCGGCGAATTAACCACGGGTAGTAAGTTAGTAAAAGCTAACGGTTTAATG +GAAGCGTCTACCATAGCGGCGATTTTGCTCGGTTCCGTAGCTGGTGGTGTTCTGGCTGACTGGCATATTC 
+TGGTTGCCCTGGTCGCATGCGCACTGGCCTACGGTGGCGCGGTCGTTGCCAATATCTACATTCCCAAACT +GGCGGCGGCGCGTCCGGGGCAGTCCTGGAATCTCATCAGCATGACCCGCAGTTTCCTGAATGCCTGCACC +TCGCTATGGCGCAATGGTGAAACGCGTTTTTCGCTGGTGGGCACCAGTTTATTCTGGGGAGCGGGTGTCA +CGCTGCGTTTCCTGTTGGTGCTGTGGGTACCGGTGGCGCTGGGTATTACCGATAACGCTACGCCGACCTA +TCTCAACGCGATGGTAGCGATTGGTATCGTGGTTGGTGCAGGTGCGGCAGCGAAGTTAGTTACGCTGGAA +ACCGTGTCACGCTGTATGCCAGCCGGGATTTTGATTGGCGTGGTGGTACTGATTTTCTCCCTGCAACACG +AGCTGCTGCCAGCCTATGCTTTGTTGATGCTGATTGGCGTGCTGGGGGGCTTTTTTGTCGTTCCGCTCAA +TGCGTTGCTACAGGAGCGGGGCAAAAAAAGCGTCGGGGCGGGGAATGCGATTGCAGTACAAAACCTTGGC +GAAAACAGCGCCATGTTGTTGATGCTGGGCATTTACTCGCTGGCGGTAATGGTAGGCATCCCGGTCGTGC +CCATTGGCATTGGCTTCGGTGCGCTGTTTGCGCTGGCAATAACGGCGCTGTGGATCTGGCAGCGCCGTCA +TTAA +>test.0417.00002.0003i_00047 2160 NA | NA | NA | ID=3_20;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.522 | NA +ATGCTTTTTAGCTTTTTTCGAAATTTGTGCCGTGTTTTGTATCGCGTTCGCGTTACGGGTGACACCAAGG +CACTGAAGGGCGAGCGCGTTCTAATTACGCCTAATCACGTCTCTTTTATTGATGGCATACTGCTGGCATT +GTTTTTACCCGTACGTCCGGTATTTGCCGTTTACACCTCAATAAGCCAACAGTGGTATATGCGTTGGCTG +AAATCATTTATCGACTTTGTTCCTCTCGACCCGACGCAACCTATGGCGATTAAACATCTGGTACGTCTGG +TGGAACAGGGCCGACCAGTGGTGATTTTCCCTGAAGGACGCATCACCACCACTGGCTCGCTGATGAAAAT +CTACGATGGCGCGGGATTTGTCGCGGCGAAGTCTGGTGCAACGGTTATTCCTGTGCGTATTGAAGGGGCG +GAACTTACGCACTTCAGCCGCCTGAAAGGTCTGGTTAAACGTCGCTTGTTCCCGCAAATTACTCTGCATA +TTTTGCCACCAACGCAGGTGGAGATGCCGGATGCGCCGCGTGCCCGTGACCGTCGCAAAATCGCTGGCGA +AATGCTGCATCAAATAATGATGGAAGCGCGTATGGCGGTGCGCCCGCGTGAAACGCTGTACGAATCTTTA +CTGAGCGCAATGTACCGCTTCGGAGCCGGGAAGAAATGTGTCGAAGACGTTAACTTTACCCCGGACTCCT +ATCGCAAATTGCTTACGAAAACGCTGTTTGTTGGACGCATCCTTGAAAAATACAGTGTTGAAGGCGAACG +CATCGGCTTAATGCTGCCCAATGCAGGCATCAGTGCTGCAGTGATTTTTGGGGCCATCGCCCGTCGCCGC +ATTCCCGCAATGATGAACTACACCGCCGGGGTAAAAGGGTTGACCAGTGCTATTACGGCGGCTGAAATCA +AAACCATTTTCACTTCCCGTCAGTTTCTCGATAAAGGCAAACTCTGGCATCTGCCGGAGCAACTTACTCA +GGTGCGCTGGGTCTATCTGGAAGATTTAAAAGCAGATGTCACCACTGCCGACAAAGTATGGATCTTCGCT 
+CATTTGCTGATGCCGCGTCTGGCACAGGTTAAACAGCAGCCGGAAGAAGAGGCGCTGATCCTTTTTACCT +CCGGTTCTGAAGGCCATCCGAAAGGCGTCGTCCATAGCCATAAAAGCATTCTGGCGAATGTCGAGCAGAT +TAAAACGATTGCCGACTTCACCACCAACGATCGCTTTATGTCGGCGTTACCGCTGTTTCACTCCTTTGGG +CTGACGGTAGGCCTGTTTACGCCACTGCTCACAGGTGCAGAAGTGTTCCTTTATCCAAGCCCGCTGCACT +ACCGTATTGTGCCGGAGTTGGTGTATGACCGCAGTTGCACCGTGTTGTTCGGTACCTCCACTTTCCTCGG +TCACTACGCGCGTTTCGCCAACCCGTATGACTTCTATCGTCTACGCTATGTGGTGGCAGGCGCAGAAAAA +CTACAAGAAAGTACTAAACAGCTTTGGCAGGATAAATTTGGCCTGCGCATCCTTGAAGGCTACGGTGTGA +CCGAATGCGCGCCTGTCGTTTCTATCAACGTACCGATGGCGGCGAAACCCGGTACGGTAGGGCGTATTCT +ACCAGGAATGGATGCGCGCCTGTTGTCGGTTCCTGGTATCGAAGAGGGCGGACGCCTGCAACTGAAAGGG +CCGAACATAATGAACGGCTATCTGCGGGTGGAGAAGCCTGGTGTACTGGAAGTGCCCACCGCCGAGAATA +TTCGCGGCGAAATGGAGCGCGACTGGTATGACACTGGCGATATTGTGCGTTTTGACGAGCAGGGCTTTGT +GCAGATTCAGGGCCGCGCAAAACGCTTTGCCAAAATTGCAGGCGAAATGGTGTCGCTGGAAATGGTGGAA +CAACTGGCACTTGGTGTTTCGCCAGATAAAGTCCATGCCACTGCGATTAAGAGCGATGCCAGCAAAGGCG +AGGCACTGGTGCTTTTCACCACAGATAACGAACTGACGCGCGATAAGTTACAACAGTATGCCCGCGAGCA +CGGCGTGCCGGAGCTTGCTGTACCGCGCGATATTCGCTATCTGAAACAGATGCCATTACTTGGCAGCGGC +AAACCTGACTTTGTCACTTTGAAAAGCTGGGTAGACGAAGCGGAACAACACGATGAGTGA +>test.0417.00002.0003i_00048 1032 NA | NA | NA | ID=3_21;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +ATGGCGACCATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGCGTCATTAATA +ATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATGGAGTCTCTTAGCTATCACCC +GAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAAACGATCGGTCTGGTCGTTGGTGATGTTTCC +GATCCGTTTTTCGGCGCAATGGTGAAAGCGGTCGAACAGGTGGCTTATCACACTGGTAATTTTTTATTGA +TTGGCAACGGTTACCACAACGAACAAAAAGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGC +TGCGCTGGTTGTCCATGCCAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGT +ATGGTGCTGATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGATCGTTACGGTG +CCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGTTATCTGTGCTCTAACCACTC +TATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGATGCCCTTGCTGAAAGTGGTATTCCGGCCAAT 
+GACCGGCTGGTGACATTTGGCGAACCAGACGAAAGCGGCGGCGAACAGGCAATGACCGAGCTTTTGGGAC +GAGGCAGAAATTTCACTGCGGTAGCCTGTTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAA +TGATAATGGTATTGATGTACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTAT +GTGCGTCCGCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCCGAACTGGCTT +TGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGTCCGACGCTGGTACGTCGCCA +TTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCAACCAGCGACTAA +>test.0417.00002.0003i_00049 1263 NA | NA | NA | ID=3_22;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA +ATGCCACATTCACTGTTCAGCACTGATACCGATCTCACCGCCGAAAATCTGCTGCGTTTGCCCGCAGAAT +TTGGCTGCCCGGTGTGGGTCTACGATGCGCAAATTATTCGTCGGCAGATTGCAGCGCTGAAACAGTTTGA +TGTGGTGCGCTTTGCACAGAAAGCCTGTTCCAATATTCATATTTTGCGCTTAATGCGTGAGCAGGGCGTA +AAAGTGGATTCCGTCTCGTTAGGCGAAATAGAGCGTGCACTGGCGGCGGGTTACAATCCGCAAACGCACC +CCGATGATATTGTTTTTACGGCAGATGTTATCGATCAGGCGACGCTTGAACGCGTCAGTGAATTGCAAAT +TCCGGTGAATGCGGGTTCTGTTGATATGCTCGACCAACTGGGTCAGGTTTCGCCAGGGCATCGGGTATGG +CTGCGTGTTAATCCGGGGTTTGGTCACGGGCATAGCCAAAAAACCAATACCGGTGGCGAAAACAGCAAGC +ACGGTATCTGGTACACCGATCTGCCCGCCGCACTGGACGTGATACAACGTCATCATCTACAGCTGGTCGG +CATTCACATGCACATTGGTTCTGGCGTCGATTATGCCCATCTGGAACAGGTATGTGGTGCTATGGTGCGT +CAGGTCCTCGAATTCGGTCAGGATTTACAGGCTATTTCTGCGGGCGGTGGGCTTTCTATTCCTTATCAAC +AGGGTGAAGAGGCGGTTGATACCGAACATTATTATGGTCTGTGGAATGCCGCGCGTGAGCAAATCGCCCG +CCATTTGGGCCATCCTGTGAAACTGGAAATTGAACCGGGTCGCTTTCTGGTAGCGCAGGCTGGCGTATTA +ATTACTCAAGTGCGGAGCGTCAAACAAATGGGTAGCCGCCACTTTGTGCTGGTTGATGCCGGGTTCAACG +ATCTGATGCGCCCGGCAATGTACGGTAGTTACCACCATATCAGTGCCCTGGCAGCTGATGGTCGTTCTCT +GGAACACGCACCAACGGTGGAAACCGTCGTCGCCGGGCCGTTATGTGAATCGGGCGATGTCTTTACCCAG +CAGGAAGGGGGAAATGTTGAAACCCGCGCCTTGCCGGAAGTGAAGGCGTGTGATTATCTGGTACTGCATG +ATACAGGGGCATATGGCGCATCAATGTCATCCAACTACAACAGCCGTCCGCTGTTACCAGAAGTTCTGTT +TGATAATGGTCAGGCGCGGTTGATTCGCCGTCGCCAGACCATTGAAGAATTACTGGCGCTGGAATTGCTT +TAA +>test.0417.00002.0003i_00050 936 NA | NA | NA | ID=3_23;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.533 | NA 
+ATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAATGACCGCCGGAAGCCTGACTGAGG +CGGCACACCTGCTACACACCTCACAGCCAACCGTCAGCCGCGAACTGGCGCGCTTTGAGAAGGTGATCGG +GCTGAAATTGTTTGAGCGCATACGTGGACGATTACATCCTACCGTGCAAGGACTGCGTCTGTTTGAAGAA +GTGCAACGATCCTGGTACGGACTGGATCGCATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGG +GAGAACTGTCTATTGCCTGCCTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCTTTCT +GGCACGTTATCCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTGAAGAGTGGCTCTCG +GCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTGCGGGAACAGAACGTACCGAATTAC +TCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCCATCCGCTGGCGGTAAAAAAGGTATTAACGCCGGA +TGATTTTCACGGTGAGAACTACATCAGCCTTTCCCGTACTGACAGCTATCGCCAGTTGCTGGATCAATTG +TTTACTGAGAATCAGGTTAAACGACGCATGATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGG +TACGGGCGGGGGTAGGCGTTTCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTTTAGT +GGTGCGGCGGTTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGCACCGCCCGTCATCA +GCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGAAACTGGTCACTTCTCTTGACACTA +TTTTGTCGTCAGCTACGACAGCATAA +>test.0417.00002.0003i_00051 693 NA | NA | NA | ID=3_24;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.506 | NA +ATGAAAACAATTGGTTTGCTGGGAGGAATGAGCTGGGAATCCACTATTCCTTACTATCGTCTGATAAATG +AAGGCATTAAACAGCGGCTTGGTGGGCTTCACTCTGCGCAAGTGCTGCTACATAGCGTCGATTTTCATGA +AATAGAAGAGTGCCAGCGTCGCGGTGAGTGGGACAAAACCGGGGATATTCTGGCTGAGGCGGCGCTTGGC +TTACAGCGGGCGGGCGCAGAAGGTATTGTGTTATGCACCAATACGATGCACAAAGTGGCGGATGCCATTG +AGTCTCGTTGCTCTCTGCCTTTCTTACACATAGCGGATGCCACTGGACGTGCAATTACCGGGGCAGGAAT +GACTCGTGTGGCGCTGCTGGGTACACGTTACACCATGGAACAGGATTTTTATCGCGGGCGGCTGACGGAA +CAATTTTCCATCAACTGTCTTATTCCTGAAGCGGATGAACGGGCGAAAATTAATCAGATTATTTTTGAAG +AACTGTGTCTGGGGCAATTTACCGAAGCGTCACGCGCTTATTATGCGCAAGTGATTGCTCGCCTTGCAGA +ACAGGGCGCACAGGGCGTCATTTTTGGCTGCACAGAAATTGGTTTACTGGTGCCAGAAGAGCGCAGTGTT +CTGCCTGTGTTTGATACCGCGGCGATCCATGCCGAGGATGCTGTCGCTTTTATGCTGTCGTAG +>test.0417.00002.0003i_00052 1419 NA | NA | NA | ID=3_25;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.517 | NA 
+ATGGTTACTATCAATACGGAATCTGCTTTAACGCCACGTCCTCTGCGGGATACGCGGCGTATGAATATGT +TTGTTTCGGTAGCTGCTGCGGTCGCAGGATTGTTATTTGGTCTTGATATCGGCGTAATCGCCGGAGCGTT +GCCGTTCATTACCGATCACTTTGTGCTGACCAGCCGTTTGCAGGAATGGGTGGTCAGTAGCATGATGCTC +GGCGCAGCAATTGGTGCGCTGTTTAATGGGTGGCTGTCGTTCCGCCTGGGGCGTAAATACAGCCTGATGG +CGGGGGCCATCCTGTTTGTACTCGGTTCGATAGGGTCCGCTTTTGCGACCAGCGTAGAGATGTTAATCGC +CGCTCGTGTGGTGTTGGGCATTGCTGTTGGGATCGCGTCTTACACCGCTCCTCTATATCTTTCTGAAATG +GCAAGTGAAAACGTTCGCGGTAAGATGATCAGCATGTACCAGTTGATGGTCACACTCGGCATCGTGCTGG +CGTTTTTATCCGATACAGCGTTCAGTTATAGCGGTAACTGGCGCGCAATGTTGGGGGTTCTTGCTTTACC +AGCAGTCCTGCTGATTATTCTGGTGGTCTTCCTGCCAAATAGCCCGCGCTGGCTGGCGGAAAAGGGGCGT +CATATTGAGGCGGAAGAAGTGTTGCGTATGCTGCGCGATACGTCGGAAAAAGCGCGAGAAGAACTCAACG +AAATTCGTGAAAGCCTGAAGTTAAAACAGGGCGGTTGGGCACTGTTTAAGATCAACCGTAACGTCCGTCG +TGCTGTATTTCTCGGTATGTTGTTGCAGGCGATGCAGCAGTTTACCGGTATGAACATCATCATGTACTAC +GCGCCACGTATCTTCAAAATGGCGGGCTTTACGACCACAGAACAACAGATGATTGCGACTCTGGTCGTGG +GGCTGACCTTTATGTTCGCTACCTTCATTGCGGTCTTTACGGTAGATAAAGCAGGGCGTAAGCCGGCTCT +GAAAATTGGTTTCAGCGTGATGGCGTTAGGCACTCTGGTGCTGGGTTACTGCCTGATGCAGTTTGATAAC +GGTACGGCTTCCAGTGGCTTGTCCTGGCTCTCTGTTGGCATGACGATGATGTGTATTGCCGGTTATGCGA +TGAGCGCCGCGCCAGTGGTGTGGATCTTGTGCTCTGAAATTCAGCCGCTGAAATGCCGCGATTTTGGCAT +CACCTGCTCAACGACGACAAACTGGGTGTCGAATATGATTATCGGCGCGACCTTCCTGACACTGCTTGAT +AGCATTGGCGCTGCCGGTACGTTCTGGCTCTACACTGCGCTGAACATTGCGTTTGTGGGCATCACTTTCT +GGCTCATTCCGGAAACCAAAAATGTCACGCTGGAACATATCGAGCGCAAACTGATGGCAGGCGAAAAGTT +GAGAAATATCGGCGTCTGA +>test.0417.00002.0003i_00053 762 NA | NA | NA | ID=3_26;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.521 | NA +ATGATTTTAAATGCATTTTCTCTCGAAGGTAAAGTTGCGGTCGTCACTGGTTGTGATACTGGGCTGGGCC +AGGGGATGGCGTTGGGGCTGGCGCAAGCGGGCTGTGACATTGTTGGCATTAACATCGTTGAACCGACTGA +AACCATCAAGCAGGTCACGGCGCAGGGGCGTCGTTTTTTAAGCCTGACCGCCGATCTGCGAAAGATTGAT +GGCATTCCTGGACTGCTGGATCGCGCGGTAGCGGAGTTTGGTCATATTGATATCCTGGTGAATAACGCCG +GATTGATTCGCCGCGAAGACGCTCTCGAGTTCAGCGAAACAGACTGGGACGATGTCATGAACCTGAATAT 
+CAAGAGCGTATTCTTCATGTCTCAGGCAGCGGCGAAACACTTTATCGCGCAAGGCAATGGCGGCAAGATT +ATCAATATCGCGTCAATGCTCTCCTTCCAGGGCGGGATCCGTGTGCCTTCTTATACCGCATCAAAAAGCG +GCGTGATGGGTGTGACGCGATTGATGGCGAACGAATGGGCTAAACACAACATTAATGTTAATGCGATAGC +TCCGGGTTACATGGCGACCAACAATACTCAACAACTGCGGGCAGATGAACAACGTAGCGCGGAAATTCTC +GACCGCATTCCAGCTGGCCGTTGGGGACTGCCGAGTGACCTGATGGGGCCGGTAGTGTTTCTTGCCTCCA +GCGCTTCAGATTATGTAAATGGTTATACCATTGCTGTGGATGGCGGTTGGCTGGCGCGTTAA +>test.0417.00002.0003i_00054 837 NA | NA | NA | ID=3_27;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.495 | NA +GTGGACGTAAGACAGAGCATCCACAGTGCGCACGCAAAAACGCTGGATACCCAGGGGCTGCGCAATGAAT +TTTTGGTTGAAAAGGTATTTGTCGCCGATGAGTACACCATGGTTTACAGCCACATTGACCGTATTATTGT +TGGCGGCATTATGCCGGTAACTAAAACGGTTTCCGTTGGCGGGGAAGTTGGTAAACAACTCGGCGTAAGC +TATTTCCTTGAACGTCGCGAGTTAGGTGTTATCAATATTGGCGGTGCCGGTACGATTACTGTCGATGGTC +AATGCTATGAAATCGGTCACCGCGACGCCCTGTATGTTGGTAAAGGTGCAAAAGAAGTTGTCTTTGCCAG +TATTGATACCGCCACTCCGGCGAAGTTTTATTACAATTGCGCACCCGCGCATACGACGTATCCCACCAAA +AAAGTCACACCGGACGAAGTATCTCCAGTCACGTTAGGCGATAACCTCACCAGTAACCGTCGCACGATTA +ACAAATATTTTGTCCCGGATGTGCTGGAAACCTGCCAATTGAGTATGGGGCTGACGGAGCTGGCTCCAGG +TAACTTGTGGAACACCATGCCGTGTCACACCCACGAGCGCCGGATGGAAGTTTATTTCTATTTCAATATG +GATGATGACGCCTGCGTTTTCCACATGATGGGGCAACCGCAAGAAACGCGTCACATTGTGATGCATAACG +AGCAGGCGGTGATCTCCCCGAGCTGGTCGATCCATTCCGGCGTCGGAACCAAAGCTTATACCTTTATCTG +GGGCATGGTCGGTGAAAACCAGGTTTTTGATGATATGGACCATGTGGCCGTTAAAGATTTGCGCTAG +>test.0417.00002.0003i_00055 1182 NA | NA | NA | ID=3_28;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +ATGAAAGACGTTGTGATTGTCGGGGCGTTACGGACACCTATCGGCTGCTTTCGTGGTGCGTTAGCGGGTC +ATTCCGCCGTGGAACTTGGCAGCCTGGTCGTCAAAGCGTTAATAGAACGTACCGGCGTTCCTGCATATGC +GGTGGATGAAGTGATTCTTGGTCAGGTGTTGACTGCAGGGGCAGGGCAGAATCCGGCAAGGCAATCGGCT +ATTAAAGGTGGTCTTCCTAATAGCGTTTCTGCAATCACTATTAATGACGTTTGTGGTTCCGGGCTTAAAG +CACTGCATCTGGCTACTCAGGCGATACAGTGTGGCGAGGCTGATATTGTCATCGCCGGTGGCCAGGAAAA +CATGAGCCGCGCACCACATGTTCTGACTGATAGCCGCACCGGCGCACAGCTTGGCAATAGCCAGTTGGTT 
+GATAGTCTTGTGCATGATGGGTTGTGGGATGCCTTCAATGATTATCATATTGGTGTCACCGCCGAAAATC +TGGCTCGCGAATATGGCATCAGCCGTCAGTTGCAGGATGCTTACGCACTTAGCTCGCAACAAAAAGCGCG +AGCGGCGATTGACGCCGGACGATTTAAAGATGAGATCGTCCCGGTAATAACCCAAAGTAACGGTCAGACG +TTGGTTGTTGATACCGATGAACAGCCACGCACTGACACCAGCGCAGAAGCCTTAGCCCGTTTAAATCCTT +CATTTGATAGTCTCGGTTCTGTGACAGCGGGTAATGCATCATCCATAAACTATGGGGCAGCTGCAGTAAT +GATGATGAGCGAAGCCAAAGCACGAGCGTTGAATTTACCCGTGCTGGCCCGCATCCGCGCATTTGCCAGC +GTTGGTGTGGATCCGGCATTGATGGGAATTGCGCCGGTGTATGCGACCCGCCGTTGCCTGGAGCGTGTTG +GCTGGCAGTTGGCTGATGTCGATCTTATCGAGGCTAATGAAGCGTTTGCTGCACAGGCGCTTTCGGTTGG +CAAGATGCTTGAATGGGATGAGCGTCGGGTCAATGTCAATGGTGGTGCGATCGCACTCGGTCATCCGATA +GGCGCTTCCGGTTGCCGAATCCTGGTTTCTCTTGTTCATGAAATGGTGAAACGTAATGCCCGCAAAGGAC +TGGCAACGCTTTGTATCGGCGGGGGCCAGGGTGTGGCATTGACCATTGAACGTGACGAGTAG +>test.0417.00002.0003i_00056 1230 NA | NA | NA | ID=3_29;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.445 | NA +ATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCCGTTGGTGCAG +GCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTGTTTATTACTGCTCTGGTCGC +CTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAGTTCATCCTCTCATCGAAAACATCAGCAGGT +GAAGGGATAACGGGCGCGGTAACACACTACTATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACT +TCATCGCCTTTTTTGTCGTCGTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGC +AAAGCATATGGTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTC +ATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTGATTGCCTATT +TCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTAACAACCCAGGTAGAGTTCAA +TCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTGATGGTTTTCGCTTTTAGCCATACGCCCATT +ATTTCTACGTTTGCCATAGACAGACGTGAAAAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTA +TGAAAGTCGCTTATCTCATCATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCC +ACCTTCGTATATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAAC +GCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCATTCCTGGGTA +CGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTACAGCAGGTTGGTGTAAAGAA +AAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTATCGCTGATTACCTTCATTGTTTGTTGCATT 
+AACCCGAACGCGATTTCGATGATTTACGCGATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGC +CTACGCTGTCAACGTATCTCATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGAT +CGTGGGTATCCTGTGCGTATCGGTAATGTTCTTTAGCTAA +>test.0417.00002.0003i_00057 252 NA | NA | NA | ID=3_30;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.409 | NA +ATGCCTTACGCATCTCGAAGCGGGCGTAGTTCAATGGTAGAACGAGAGCTTCCCAAGCTCTATACGAGGG +TTCGATTCCCTTCGCCCGCTCCAATTTATCTTCACATCATCTACCTGCCATTTTTGTTGTATCTGATTTT +CTATATTATCTTAATTCAAGCGCTTCAGACTTTTCGCAATCGCCGTAATACTTCCCCATTTTTTGTAAAT +AAAAAGCGTTTACGCAATGCAATCGTCATGTATCTTAAATAG +>test.0417.00002.0003i_00058 351 NA | NA | NA | ID=3_31;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA +ATGCCGTATTCGACAGCAGATGGCGGCAATAAAGGAATTGATATCTCAGCTCCACGGGGTACACCTATTT +ACGCCGCGGGTGCAGGAAAGGTGGTGTATGTGGGCAACCAGCTGCGTGGCTACGGTAATCTCATCATGAT +TAAACACAGTGAAGATTACATTACGGCTTACGCTCATAATGACACGATGCTGGTAAATAATGGGCAAAGC +GTGAAAGCTGGGCAAAAAATCGCCACCATGGGGAGCACTGATGCGGCATCTGTTCGCCTGCATTTCCAGA +TTCGTTACCGTGCAACGGCAATTGATCCGCTACGTTACTTGCCGCCTCAGGGCAGCAAGCCAAAATGCTG +A +>test.0417.00002.0003i_00059 2298 NA | NA | NA | ID=3_32;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +ATGGAAGCGCGGGAAGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCTAAGGTCACCG +GGCGGGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCGAAATATGTACGTAGCCCTAT +CGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCCAGGAGTTTGCCGGGCGTCCTGGCGATTTTT +ACCTGGGAAGATGTGCCAGAAATCCCATTCGCCACGGCAGGGCATGCCTGGACACTTGACGAAAACAAGC +GCGATACCGCCGATCGCGCACTGCTAACTCGCCATGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGT +GGCCCGCGATGAACTCACGGCAGAAAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTT +ATCACCTCGCCAGAAGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAATTTACTGAAAC +AAAGCACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGCCGACTACCAGGTACAGGGGCACTA +TCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTGACATCGCTGGCATGGATGGAGGATGACTCG +CGAATTACCATCGTTTCCAGCACCCAGATCCCGCACATTGTTCGCCGCGTGGTTGGTCAGGCGCTGGATA 
+TTCCCTGGTCATGCGTACGAGTCATCAAACCGTTTATCGGTGGCGGTTTTGGTAATAAACAGGATGTACT +GGAAGAGCCAATGGCGGCATTCCTGACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGT +GAAGAGTGTTTCCTCGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGCGTGAACCGCG +ACGGAACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCTTATGCATCTCACGGGCACTC +CATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTATCCTCGTTGTGCCTACGCTTACAGTTCAAAG +ACCTGCTATACCAACCTCCCCTCGGCTGGTGCGATGCGTGGTTATGGCGCGCCACAAGTCGTATTTGCCG +TTGAGTCTATGCTTGATGATGCCGCGACAGCGTTAGGTATTGATCCTGTTGAAATTCGTTTACGCAACGC +CGCCCGCGAAGGAGATGCTAATCCGCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTT +GAAAAAGGCCGGAAAATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAAGGCAATTTAC +GTCGTGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCTGTCGGCGTAGAAATAGCAGG +CGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTGCAAAGCGGCGCGACGGAAATCGGTCAGGGT +GCCGACACCGTCTTCTCGCAAATGGTGGCAGAAACCGTGGGGGTTCCGGTCAGCGACGTTCGCGTTATTT +CAACACAAGATACCGATGTTACGCCGTTCGATCCCGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGC +GCCTGCGCTGCGCAGTGCGGCACTGTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACAT +CAGTCAGCGATGAATCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAAGAACCGTTAA +TGTCGTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGCGGGCAGCTCTCTGCTGAAAG +CTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGTACATTTGTTGATCTGACGGTCGATATTGCA +CTGTGCAAAGTCACCATCAACCGCATCCTCAACGTTCATGATTCGGGGCATATTCTAAATCCGCTGCTGG +CAGAAGGTCAGGTACACGGCGGAATGGGAATGGGCATTGGCTGGGCGCTATTTGAAGAGATGATCATCGA +TGCGAAAAGCGGCGTGGTCCGTAACCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCA +CAACTGGAAAGCGCGTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCACTGGGTGAGC +CACCAATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCTACCGGTGTTGCAATCAATAC +ACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCATCTGGCAGGATTGATTTGA +>test.0417.00002.0003i_00060 879 NA | NA | NA | ID=3_33;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA +ATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATGCCATCACCCTGCTGGCTGACAATC +CGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTACTGATACAGCTTCACCATCACAATGACCGCTATCG +CCATATTGTTGATATCCACAATCTGGCAGAGCTTCAGGGAATAACACAGGCGGAAGATGGCGCGCTGCGA 
+ATCGGCTCCGCGACAACATTTACTCAGCTCATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTAT +GTGCTGCGGCTGCATCAATCGCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTTGCAA +CGGTGCCACCAGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGGAGCTCCACTCCCCA +CGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGGGCAAAGTGTCTCTTGAGCATGACG +AAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGAAAGAACACGCGGGCAGCGCACATTTTAAATATGC +CATGCGCGACGCAATGGATATTTCAACAATTGGCTGCGCCGCACATTGCCGACTGGATAACGGCAATTTC +AGCGAATTACGCCTGGCATTTGGTGTTGCCGCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTG +CACAAAATGCGCCATTAAACCTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCGCCCC +GCGTTCTTCATGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGACCAAAAAAGTGATT +AGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGA +>test.0417.00002.0003i_00061 480 NA | NA | NA | ID=3_34;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.512 | NA +ATGAATCACAGCGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTTCACGCCGCGC +CAGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTCAAACAAGGTTGCTGCGTAGG +CGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCGATAGACAGTTGCTTATTCCTTGCGGCCTGG +GCTGAAGGAAAAGAGATCCGCACGCTGGAAGGTGAAGCGAAAGGCGGTAAACTTTCTCATGTCCAACTGG +CTTATGCGAAATCTGGTGCAGTGCAATGCGGGTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAAT +GCTGGCGAAACCACGCGAGAAGCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGT +CGCTGCACAGGGTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAA +>test.0417.00002.0003i_00062 1779 NA | NA | NA | ID=3_35;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.459 | NA +ATGGAGCTTGCGACTACGCAGTCAGTATTGATGCAAATTCAACCGACAATTCAGCGTTTTGCCAGAATGC +TTGCCAGCGTTTTGCAGCTTGAGGTTGAGATCGTTGATGAAAACTTGTGTCGCGTCGCCGGAACGGGCGC +GTATGGGAAGTTTCTTGGCCGCCAGTTGAGCGGCAACTCACGCCTGCTCCGCCACGTCCTGGAAACGAAA +ACTGAAAAAGTTGTGACACAGTCTCGCTTCGATCCCCTTTGTGAAGGTTGCGATAGTAAAGAAAATTGCC +GCGAAAAAGCATTTCTGGGTACGCCTGTCATTTTACAGGATCGTTGTGTTGGGGTGATAAGTTTGATTGC +CGTTACCCACGAGCAACAAGAACATATCAGTGATAATTTACGCGAATTTTCCGATTACGTTCGCCATATA +TCCACCATTTTTGTTTCTAAACTTCTGGAGGATCAGGGACCAGGAGATAACATCAGTAAAATATTCGCGA 
+CCATGATCGATAATATGGATCAGGGCGTGTTAGTGGTTGATGCTGATAATCGGGTTCAGTTTGTTAATCA +GACAGCTTTAAAAACACTCGGTGTTGTACAAAATAATATTATTGGAAAACCTGTTCGTTTCAGACCATTA +ACATTTGAGAGTAATTTTACCCATGGTCATATGCAACATATTGTTTCGTGGGATGATAAAAGTGAATTAA +TCATTGGTCAGTTGCATAACATCCAGGGCCGACAACTATTTTTAATGGCGTTTCACCAATCGCATACCAG +TTTTTCTGTAGCAAATGCACCTGATGAACCGCATATTGAACAATTGGTTGGCGAGTGCCGTGTTATGCGG +CAATTAAAACGACTCATTAGCCGTATTGCACCCAGCCCATCCAGCGTTATGGTGGTTGGTGAAAGCGGCA +CGGGTAAAGAAGTCGTCGCCCGTGCAATCCATAAGTTGAGCGGAAGACGGAATAAACCCTTTATTGCTAT +CAACTGTGCTGCGATTCCGGAACAGCTTCTGGAGAGCGAACTGTTCGGTTATGTTAAAGGCGCATTTACT +GGCGCTTCTGCCAACGGTAAAACAGGGTTGATTCAGGCGGCGAATACGGGCACGCTGTTTCTCGATGAAA +TTGGTGATATGCCATTAATGTTGCAGGCTAAATTACTGCGCGCTATTGAGGCGCGTGAAATTCTGCCGAT +TGGTGCCAGTAGCCCAATACAAGTCGACATCCGCATCATTTCTGCAACTAATCAGAATTTGGCCCAGTTC +ATTGCCGAAGGTAAATTCCGCGAAGATCTCTTCTACCGACTTAATGTTATCCCGATAACTCTTCCACCGC +TGCGTGAACGTCAGGAAGATATTGAATTACTGGTGCATTACTTTTTACATCTGCATACCCGTCGTCTGGG +ATCGGTTTATCCTGGCATTGCTCCTGATGTCGTCGAAATATTGCGTAAGCATCGTTGGCCCGGAAACCTG +CGCGAGTTAAGCAATTTGATGGAATATCTGGTTAACGTTGTTCCTTCAGGTGAAGTTATCGACAGCACGC +TATTGCCGCCAAATCTGCTGAATAATGGCACAACGGAGCAAAGTGATGTAACAGAGGTCAGTGAGGCGCA +CCTGTCACTCGATGATGCGGGCGGCACGGCGCTGGAGGAGATGGAAAAGCAAATGATCCGCGAGGCGCTT +TCACGTCATAACAGCAAGAAGGAAGTTGCTGATGAACTGGGCATCGGCATTGCTACGCTCTATCGCAAGA +TTAAGAAATATGAGTTGTTAAACACATAA +>test.0417.00002.0003i_00063 1188 NA | NA | NA | ID=3_36;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA +ATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGCATGAAAAAGATTTTT +TGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGGACGTTGCCGCCGCGTTAAAAGCACT +GCGTGCTGAAAACATCTCAACCAAAGTCTTTAATAGTGGATTAGGTATTTCCGTCTTCCGCGACAACTCC +ACCCGTACCCGCTTCTCTTATGCTTCCGCGCTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAG +GTAAATCACAAATCGCTCACGGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGC +TATCGGTATTCGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGGCACTT +GATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGCAATGCGATATTGACC 
+ACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACTTTGGTTCGCTGGAAAACCTGAAAGG +CAAAAAAATCGCCATGACCTGGGCCTACTCCCCAAGCTATGGCAAACCGCTCTCTGTACCACAAGGCATC +ATAGGTCTGATGACCCGCTTCGGTATGGATGTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGG +ATGTCGTTGAAGTTGCTAAAAACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGA +AGAAGCCTTCAAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAGAGCGT +ACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGTGTCTGGCACAGAACG +CGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGACCCGTGATGGCGAAGCCCTGTACAT +GCACTGCCTGCCAGCTGATATCAGCGGCGTATCCTGCAAAGAAGGTGAAGTGACTGAAGGCGTATTCGAA +AAATACCGTATCGCTACCTACAAAGAAGCCAGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCC +GTAAATACGCCAAACCAGGTGCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAA +>test.0417.00002.0003i_00064 1197 NA | NA | NA | ID=3_37;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.531 | NA +ATGTCCGTTTTCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACATCACCGCTTT +TTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCTGGTTATCACCCAACACCGCT +TTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAGAAAATTCTCGTCAAAGACGAATCAAAACGA +TTCGGTCTGAACGCCTTCAAAATGCTCGGCGGTGCGTACGCCATCGCTCAATTATTGTGTGAAAAATATC +ATCTTGATATCGAAACGCTGTCATTTGAGCACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGAC +TACCACCGACGGCAACCACGGGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATT +TACATGCCGAAAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAGTGCATCGTCA +CGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAGCAGCACGGCTGGGAAGTGGT +ACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACCTGGATCATGCAAGGCTACGCAACACTGGCG +GATGAAGCCGTCGAGCAAATGCGTGAAATGGGCGTAACCCCGACACACGTTCTGCTACAAGCCGGTGTCG +GTGCAATGGCCGGTGGTGTGCTGGGTTATCTGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTAT +TGTTGAACCTGACAAAGCTGACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGT +GATATGGCCACCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAAATCCTACGTA +ACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGTATGCGCGTGCTGGGTAATCC +GTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGCGCTGTCGGTTTGGGCGTTCTCGCAGCGGTT 
+CATTATCACCCGCAACGTCAAAGCCTGATGGAAAAACTGGCGCTGAACAAAGATGCCGTGGTGCTGGTTA +TCAGCACTGAAGGCGACACCGACGTGAAGCACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGC +ACCTTAA +>test.0417.00002.0003i_00065 1212 NA | NA | NA | ID=3_38;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.507 | NA +ATGGCTAAGAATATTCCATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGACATGACTCGCT +TCCTACGCGATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGCGTAGTACATCGTATTAAAGA +AGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGACCCAATGGGCAACGTTCTCGGTTATATCGGC +CACGGCCCGCGTCTGGTGGCAATGGACGCTCATATCGACACCGTCGGCATTGGCAACATCAAAAACTGGG +ACTTCGATCCGTATGAAGGCATGGAAACCGACGAGCTGATCGGTGGTCGCGGTACTTCCGACCAGGAAGG +CGGCATGGCATCTATGGTTTATGCCGGTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTG +CTGGTTACCGGTACTGTGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATTGAACAATCCG +GCATTCGCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTATACCGTGGTCAACGCGGTCG +TATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCACGGTTCGGCACCAGAACGTGGTGATAACGCC +ATTTTCAAAATGGGTCCAATTCTTGGCGAATTACAGGAACTGTCTCAACGTCTGGGCTATGACGAATTCC +TCGGCAAAGGTACGCTGACTGTTTCCGAAATTTTCTTCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAG +CTGCGCAGTTTCTATTGACCGCCGTCTCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGT +GCCCTGCCTGCAGTACAAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCGTCCTGGACTG +GCCTGGTTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAAGATCACTTCACCGTTAAAGC +ACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCTGTCGTTGATAAGTGGACCTTCTCAACTAAC +GGCGTATCCATCATGGGTCGCCACGGCATTCCGGTCATCGGTTTTGGCCCTGGTAAAGAACCGGAAGCGC +ACGCGCCAAACGAAAAAACCTGGAAATCTCACCTGGTAACCTGTGCCGCTATGTACGCTGCAATCCCATT +AAGCTGGCTGGCAACCGAATAA +>test.0417.00002.0003i_00066 1386 NA | NA | NA | ID=3_39;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.524 | NA +ATGCGCGTATTGATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGATTTGCTGATTG +AAAGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCTTGCGAAGAAATTGATGCCTC +TGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACGCATTTCAATATTGATGTCGGCATCGCGCGC +AGTTGTGATGATTTTTTTACCGGTACCCGCGCTGCTGCGTGTGGCGGTACAACAACCATTATTGACCATA 
+TGGGATTTGGCCCAAATGGCTGCCGGTTACGCCATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAA +AGCAGTCATCGACTACAGCTTTCACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCG +ATGATGGTTGAGGAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTCAACGATGATG +AAGTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACCGTACACCCGGAAAATGACGC +AGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGGTTAACCGCGCCGCGTTATCATGCCTTGAGT +CGACCTCTGGAATGCGAAGCGGAAGCCATCGCCCGCATGATTAACCTGGCACAAATTGCCGGTAACGCCC +CGCTCTATATCGTGCACCTGTCTAACGGCTTAGGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCA +GCCAGTCTGGGTTGAAACCTGCCCACAATATCTCCTGTTGGACGAACGCAGTTACGATACAGAAGATGGC +ATGAAGTTCATTCTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGTGGCATCAGCG +ATGGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCTCAACGCCTGCAAATTTCTAA +AGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTGGAGAACCGCATGCAACTGCTGTTCTCCAGT +GGCGTGATGACGGGACGTATCTCACCGGAGCGTTTTGTTGAGTTAACCAGTGCAATGCCCGCCAGGCTGT +TTGGCCTGTGGCCACAAAAAGGATTATTAGCGCCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACG +TCAGAGCCAACAAATTCAGCATCGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACC +TGTCAGGGCGCGATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACCTTTACAGGCA +AAGCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTGCTCTAA +>test.0417.00002.0003b_00067 870 NA | NA | NA | ID=3_40;partial=01;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA +ATGAGTAAGAAAATTGTTCTCGCCCTGGGCGGGAATGCGCTGGGCGATGACCTGGCTGGGCAAATGAAAG +CGGTAAAAATTACTTCTCAGGCAATTGTTGATTTAATTGCCCAGGGACATGAGGTCATCGTCACTCATGG +CAACGGGCCACAGGTGGGCATGATTAACCAGGCCTTTGAAGCTGCAGCAAAAACTGAAGCGCACTCGCCA +ATGCTGCCGATGTCTGTCTGTGTTGCCTTAAGCCAGGGTTATATTGGTTACGATCTACAAAACGCCTTAA +GAGAAGAACTGCTTTCTCGTGGCATTAATAAACCTGTAGCAACGCTGGTTACCCAGGTCGAAGTCGATGC +TAACGATCCGGCATTCCTCACCCCGACCAAGCCGATCGGTTCGTTCTTTACCGAGCAAGAAGCAGAGCTA +CTGACAAAACAGGGTTACACTCTGAAAGAAGATGCGGGTCGCGGCTATCGCCGTGTCGTTGCTTCGCCAA +AACCGGTTGATATCATTGAAAAAGAAACGGTTAAAGCTCTGGTAGATGCCGGACAGGTGGTGATCACCGT +TGGCGGTGGTGGTATCCCTGTTATTCGTGAAGGTAACCATCTGCGTGGTGCCAGCGCGGTTATCGATAAA +GACTGGGCCAGCGCCCGTTTAGCAGAAATGATTGATGCCGATATGCTGATCATTCTGACTGCGGTAGAAA 
+AAGTGGCCATTAACTTCGGAAAAGAGAATGAACAGTGGCTCGATCGCCTGTCGTTAAGTGATGCTGAACG +CTTTATCGAAGAAGGTCATTTTGCGAAAGGTTCTATGCTGCCTAAAGTGGAAGCTGCCGCCTCGTTTGCT +CGCTCTCGCGCAGGTCGTGAAGCACTGATT +>test.0417.00002.0004b_00068 1626 NA | NA | NA | ID=4_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.523 | NA +ATGAATATTTTCACAGAGGCTGCAAAACTCGAAGAGCAAAATTGTCCGTTTGCGATGGCGCAAATTGTTG +ATAGCCGAGGCTCAACCCCCCGCCATTCTGCACAAATGTTAGTGCGCGCCGATGGTTCTATCGTCGGTAC +AATTGGTGGCGGAATGGTTGAACGGAAGGTGATTGAAGAGTCGCTTCAGGCATTGCAGGAACGTAAGCCG +CGATTATTCCATGGACGTATGGCTCGTAACGGTGCGGATGCTGTCGGGTCAGATTGTGGAGGTGCAATGT +CAGTATTTATCAGCGTCCATGGTATGCGTCCACGTCTGGTGTTGATTGGTGCGGGGCATGTCAACCGGGC +GATAGCCCAGAGTGCGGCGCTATTAGGATTTGATATCGCCGTTGCTGATATTTATCGCGAAAGCCTCAAT +CCTGAACTATTCCCACCATCAACCACGCTTCTCCATGCTGAGTCGTTTGGTGCGGCAGTGGAAGCACTGG +ATATTCGCCCTGATAATTTTGTCCTGATTGCCACGAATAATCAGGATCGTGAAGCCCTCGACAAACTCAT +TGAACAACCCATTGCATGGCTGGGGTTGCTGGCAAGTCGCCGCAAGGTTCAGCTTTTCCTGCGCCAATTG +CGTGAGAAAGGCGTGGCTGAAGAACATATTGCCCGTTTACATGCGCCCGTTGGTTACAATATAGGTGCGG +AAACGCCGCAAGAGATCGCCATCAGCGTGCTGGCAGAAATATTACAGGTGAAAAATAACGCGCCGGGTGG +GCTGATGATGAAGCCTTCTCATCCTTCCGGACACCAGCTGGTGGTGATTCGCGGTGCGGGGGATATCGCC +AGTGGTGTAGCGCTACGTCTGTATCATGCGGGTTTTAAAGTGATCATGTTGGAAGTGGAAAAACCGACAG +TGATTCGTTGTACCGTGGCGTTTGCCCAGGCCGTGTTCGATGGCGAAATGACGGTCGAAGGCGTCACCGC +CCGCCTGGCAACCAGCTCTGCGGAAGCGATGAAACTTACCGAACGCGGATTTATCCCTGTGATGGTAGAT +CCCACCTGTTCATTGCTTGATGAACTGAAACCGCTTTGCGTGGTGGACGCTATTCTGGCGAAACAGAATT +TGGGAACGCGGGCAGATATGGCACCAGTAACAATCGCGCTTGGGCCGGGCTTTACTGCAGGGAAGGATTG +TCATGCGGTAATTGAAACAAATCGCGGGCACTGGCTCGGTCAGGTGATTTACTCAGGTTGTGCGCAGGAG +AATACCGGTGTTCCCGGCAATATTATGGGGCATACCACCCGACGAGTGATCCGCGCTCCTGCTGCAGGCA +TTATGCGATCCAACGTGAAATTAGGCGATCTGGTGAAAGAGGGCGATGTCATTGCCTGGATTGGTGAGCA +TGAAATTAAAGCACCGTTGACGGGGATGGTGCGTGGCTTGTTGAACGACGGACTGGCCGTGGTCGGTGGT +TTTAAAATTGGTGATATCGATCCTCGTGGTGAAACGGCTGATTTCACCAGCGTTTCTGATAAAGCCCGGG +CGATTGGCGGCGGCGTACTTGAGGCGTTAATGATGTTGATGCATCAGGGCGTTAAAGCGACAAAAGAAGT +GCTGGAAGTGGCTTAA 
+>test.0417.00002.0004i_00069 480 NA | NA | NA | ID=4_2;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.504 | NA +GTGCAGGGATTTACGCCAGAAGCGATTGATGCACTGGTACAACGACCAGAGTGTGACGTAATTCTCATTG +AGGCAGATGGCTCGCGTGGAATGCCGTTAAAAGCGCCTGATGAGCACGAACCTTGCATACCTAAAAGCAG +TTGCTGCGTGATTGCTGTGATGGGAGGACATATTTTGGGTGCGAAAGTGAGCACAGAAAATGTCCATCGC +TGGTCGCAGTTTGCTGATATTACTGGGTTAACACCTGCTGCACCCTTGCAACTGAGCGATCTCGTTGCGC +TGGTTCGCCACCCTCAGGGGGCGTTTAAAAACGTACCACAAGGTTGTCGGCGAGTCTGGTTCATTAACCG +TTTTTCTCAATGTGAGAATGCGATTGCGCAAAGCGAGCTCCTTCAACCGCTGCAACAACACAACGTAGAG +GCAATCTGGCTGGGCGATATACAAGAACATCCTGCAATCGCGCGCAGATTTGTGAATTAG +>test.0417.00002.0004i_00070 579 NA | NA | NA | ID=4_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.430 | NA +ATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATGGGGCAATGGAAAATGATGT +TACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAAAATGCGTTGCAGTTTTGTAGCCGAATTAT +TTTAGTCACCGGCTATCGTGGTAATGAACTGCACGAACGTTATGCGAACCAGAGCAATATCACTATTATC +CACAACCCAGATTATGCGCAGGGTTTACTGACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAAC +ATTGTTTTCTCACCCACGGAGATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACG +AAATGATGGCGCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCAAAACCATGC +CTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTCCTTATGGGAGAACATTATT +CCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGATACTCCGGACGACTTTATTACAGCGAAGAA +AAGGTATACTGAAATTTAG +>test.0417.00002.0004i_00071 3099 NA | NA | NA | ID=4_4;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.526 | NA +ATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATATTTGATGAATACCAACAAC +AACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCACCCGTAAAAGGTAAAACTGTTAGCGTCTT +CGGTGAAACCTGTGCCACTCCCGTCGGCCCTGCCGCTGGCCCGCACACGCAACTTGCGCAAAACATCGTC +ACCTCCTGGCTGACTGGCGGACGCTTCATCGAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGG +AAAAGCCCTGTATCGATGCCGAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAA +AGCCTGGGATGAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAGCCTTCTGAT 
+TCCGGTAAATCGTTCATCTTTAATATGAGCGTCGGTTACAACCTCGAAGGTATTAAGCAACCGCCGATGC +AGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCGAAATTCGCTCAATACCGCGATGCACTTAA +TAAGCTACTCCAGAATGAGGCATTTTTAGCCCGCCACGGATTGCAGGAAAAACGCGAAAGCTTGCAAGCC +TTACCCGCTCGCATCCCCACCAGCATGGTACAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGC +ATGAAATCGAAGCCATTTGCCGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCC +GACCTTACTGGGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATCGGCTTAAAA +GAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTGGAACGCCTGATGGCACTGG +CAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAACACTCTCGGCACCATTAATAACAAAGGCGC +ACTGCCTGGTGAAGAGATGTATATGTCAGGCCGTGCGCTGTTCCCGCTCTCCATCAACGTTGCAGCAGTT +CTCTCTCGCGCCTTTGACGGCAAACTGCCCATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCG +ATATTTTTGATACTGGTATTCGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCG +CTTAAGTGCCTGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGACGTCGAACGA +CTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACACTGGAAGCCAGAAGAGCGTA +TTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTTGCCCCCTGTGTTACTGCCTGCGCTATCAA +GCAAGATATTCCGGAATACATCCGTCTGCTTGGCGAACACCGCTATGCCGACGCGCTGGAACTCATCTAT +CAACGCAACGCCCTGCCCGCCATTACCGGTCATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCC +TGGATTACGACAGTGCGCTGAATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATA +TAAGCAACGCTGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGTGCAGGTCCG +GCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACGCTGTTTGAACGCGAAGCCA +ATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGTATTCCTGCAGAGTTAATTCAGCACGATAT +CGATTTTGTTGCCGATCACGGCGTGAAATTTGAGTACGGTTGCTCACCCGATTTGACCGTTGAACAGTTA +AAAAATCAGGGCTTCCACTATGTTCTGATTGCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGG +GCGACAACCAAAATGTCTGGAAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCT +GGGCAAACATGTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCGTTACGCGTT +CCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATGCCAGCATGGCGCGAAGAGT +ATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTGAATAATCCGGAACGTTTCGATGCTGATGG +CACCTTAACCTTGCGCGTTATGTCGCTTGGCGAACCTGATGAGAAAGGTCGTCGCCGTCCGGTTGAAACC 
+AACGAAACAGTAACGCTGCATGTAGACAGCCTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCC +TGAATGCAATGGGCGTGCCGCTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCT +GACTGACGTCTTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTCGGAACCGCG +CGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAGAACGATAAATACTGGAATA +ACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATCTCTGTCACTCTGGTGAACAGTGACGATCG +TGATGCGTTTGTCGCGCAGGAAGCCGCTCGCTGCCTTGAATGTAACTACGTTTGCAGCAAGTGTGTGGAT +GTCTGCCCGAACCGCGCCAACGTATCCATTGCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACC +TCGACGCTTACTGTAACGAATGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGA +CAAAATCACCGTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTTGTGGAAGAT +TGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGACAGCGAAGGTCAGTTCAACA +ACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGCCATGTCCACCAGCATCATCATTATCTGCT +GGGCCGCGTGGAGGTGTAA +>test.0417.00002.0004i_00072 1329 NA | NA | NA | ID=4_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA +ATGTTGATTCTGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGCGTTGATATCG +CCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGCTATCCCGATGCCAGCTACAA +AGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGCTCGCATAACCATTTTTACTCGGGGCTTTCC +CGCGGAATTATGGCAAACATCGCCCCCTGCCCGGATTTCATCTCAACGCTGAAAAATCTCTGGTGGCGGC +TCGATCGCGCCCTTGATGAAGAGTCGCTCTATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAG +CGGATGTACATCGGTTATCGATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGC +GACGCATTTTTAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAACAGCGGCATCA +AAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATTGATGAGGCGAAGAAAGCAGC +AACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCACGCGCCGTTTACCGTACCGGATGCCGGTCTG +GAGATGCTGTGTGAAGCCGTGAAAAGCACAGGTCGTGGTTTGCATATTCACGCTGCGGAAGACCTTTACG +ACGTTTCCTACAGTCACCATTGGTACGGCAAAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGA +CAGCAAAACGCTGGTCGCTCATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGAT +GCGTTCCTGGTGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCACCTTAGCGACA +TCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAAGAGATGAAATTTGCCTTCTT 
+TAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGTTTTGCCAAAGCACTGGCTAACGGCAACGAA +CTGATGAGCCGCAACTTTGGCGCGAAATTTGGGCTTCTGGAAGCCGGTTACAAAGCCGATTTAACCATTT +GCGATTACAACTCGCCGACGCCGCTGCTGGCAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTC +AGGCAGCGTTCACAGCGTGATGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGC +GATTCCATTTATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCGCTGGCATAA +>test.0417.00002.0004i_00073 780 NA | NA | NA | ID=4_6;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.538 | NA +ATGATTGAACAATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGCTACCAGGATG +AAGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGTACCGATAAAAAGATTGCCAT +TTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGATAACGGTGCACTACGAATTGGCGCAATGTCT +CGCTTGCAGCCACTGCGTGATGCGCGATTTATTCCTGCAGCACTGCGTGAAGCCCTCGGTTTTGTTTACT +CACGCCATGTTCGTAATCAGTCGACCATTGGTGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCT +TCCCGTCCTGCTGGCACTGGATGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTAC +CTGGCCTGCCCATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACCTGTGCGACTC +GCAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTTGCAATAACAGACCACGACGG +TATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTGCGTCTGCACGATGTCGAAACTCAAAATCTG +GAAGGCAATGCACTTGAACAGGCTGTCGCCAACGCCATTTTCCCGCAGGAAGATTTGCGGGGCAGCGTGG +CCTATAAACGCTATATCACGGGAGTTCTGGTAGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGA +AGCCGTATGA +>test.0417.00002.0004i_00074 2871 NA | NA | NA | ID=4_7;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.527 | NA +ATGATCATCCACTTTACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAAAACGTGCAAA +AGCTGTTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGTTTTGGGTTTGCCGGTTCTGA +CGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTGCTTATCGCCGCACAGTTAGAGAAGGCAGAT +ATTCGTACCGCAGAATCTCTGGGCAAATGGAATGAGTTAAGTCTGGTTCAACAGGCCATGGTTGATGTTG +GCGTGGTGCAGTCTGGTTATAACGATCCAGCTGCGGCTCTGATTATCACCGATCTTCTCGATCGCATCGA +CGCACCTACCCGCGAAGAGATCGACGACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAA +TACTATCAGGTCATTGAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGATATCGCTCCGA 
+CTTTCCGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGATGCCGCGAAAATGGTGCAGGC +GAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCCTGCGTCATTAAAATGTTACGTAGCCCACAC +GCTCACGCACTGATTACTCATCTGGATGTCAGCAAAGCTGAAGCCTTACCGGGCGTCGTTCACGTTATTA +CTCACCTGAATTGCCCGGATATTTACTATACCCCGGGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGA +CCGCCGAATGTTCGGCAAGAAAATGCGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAA +GACATTGCGCTCGAAGCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTAATGTCGATTG +ACGAGGCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTGTATGTTGCTGGTGCGCCAGA +TACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGCGAGCATATGATCATCAACTTCCCGATCGGT +TCTCGCCCACGCAAAAATATCGCTGCCAGTATTCATGGTCATATTGGCGATATGGACAAAGGCTTTGCCG +ATGCCGATGTGATCATTGAGCGAACCTATAACTCAACGCAGGCGCAGCAGTGCCCGACTGAAACACATAT +CTGCTTTACCCGTATGGACGGCGATCGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGC +CGCCAGGTCGCGCGCCTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGTGTAGGCGGCG +GTTTTGGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCAACCTGCGTGACCGGGCGTCC +GGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCTAACACCTCTCGTCACGTCGCGAAAGTCACC +GTCAAACTGGGCGCGAAAAAAGATGGTCGCCTGACGGCAGTGAAGATGGATTTCCGCGCCAACACGGGTC +CTTACGGTAACCACTCACTCACCGTACCGTGTAACGGACCGGCGCTGTCGCTGCCGTTATATCCATGCGA +TAACGTCGATTTTCAGGTCACCACCTACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGC +GCGCCGAAAGGTAACTTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAGATCGACCAAC +TGGAAATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATTCTCGGTGCGATTGGTGAAGG +TAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCACTGGAAGAGATCCTGCGTCAGGGTCGCGAG +ATGATCCAATGGTCTTCACCAAAACCACAAAACGGTGACTGGCACATCGGTCGTGGCGTCGCCATTATCA +TGCAGAAATCGGGTATCCCGGATATCGATCAGGCTAACTGCATGATCAAACTGGAATCAGACGGTACCTT +TATCGTTCATTCTGGCGGTGCGGATATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAA +GTGCTGCACTGCCCCCCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTGTTTGATAAAG +GCGCATATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTGGCAGCGGAAAATCTGCGGGA +GAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCAGTGGCAGATGTTCAACTAGCAACGCCGGGC +GTCGTTCGCGGCAAGAAAGGCGAAGTTAGTTTCGGAGAGATAGCCCATAAAGGCGAAACCGGCACCGGCT 
+TTGGTTCACTGGTGGGAACTGGCAGTTATATCACGCCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGC +TGAAGTTGCCGTCAACACGCGTACGGGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGT +ACACCGGTCAATCCAGAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATCGGCCACAGTA +TGAGCGAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGATTTACGCAGTTACGGCGCACC +GAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTGGTGCCGAGCGACGATAAAGTCGGCCCATTC +GGGGCGAAATCGATCTCGGAAATCGGTGTAAATGGCGCCGCTCCGGCGATTGCTACCGCAATTCACGATG +CCTGCGGCATCTGGTTACGCGAATGGCATTTCACACCGGAGAAAATACTCACCGCGCTGGAAAAAATATA +A +>test.0417.00002.0004i_00075 1401 NA | NA | NA | ID=4_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.490 | NA +ATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTGAACTGGAGGATCGCCCTCCCTTTCATCAGG +CTCTCGTAGGTGCCATTACCCATCTGTTGGCAATTTTCGTTCCGATGGTAACCCCCGCGTTAATCGTGGG +TGCGGCCTTACAGCTTTCCGCTGAAACAACTGCCTATCTTGTTTCTATGGCGATGATCGCCTCTGGTATT +GGTACCTGGTTACAAGTAAACCGCTACGGCATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATT +TTTCATTTGTTACGGTCATGATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACGAAGAGTTAAT +CATGTCGTCGCTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCGGCTCTTCTTTTATCCTGCCC +TATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTGTGGTGCTGATGATCGGCTTAAGCCTGATTA +AAGTTGGCATTATTGATTTTGGCGGTGGTTTTGCAGCTAAAAGCAGCGGTACGTTCGGCAATTACGAGCA +TCTCGGCGTTGGCTTATTGGTTTTGATTGTGGTGATCGGCTTTAACTGCTGCAGCAGTCCGTTGCTACGC +ATGGGTGGGATCGCCATTGGGCTATGTGTCGGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCA +GCAGTGTGCGCAATTTGCCGTTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTTTTAGCTTCCA +TCAGTTCCTGGTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTGTCGGCGATATCACCGCCACG +GCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATCAGTCCCGACTGAAAGGCGGCGTGCTGGCAG +ATGGTCTGGTTTCTGTTATCGCCTCCGCTGTCGGTTCATTACCATTAACCACGTTTGCGCAAAATAATGG +GGTTATTCAGATGACTGGCGTCGCTTCACGTTATGTCGGGCGAACCATCGCGGTAATGCTGGTTATCCTC +GGCTTATTTCCGATGATTGGCGGCTTCTTCACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGT +TGATGTTTTCCATGATTGCCATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGCGCCGAGAAAC +ACTTATTGTCGCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATCCCGAAATTTTTAAAATATTG 
+CCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTGCTGGCGGGTTAACTGCGATTTTATTAAATA +TTATCCTCCCTGGTGGCTACCGACAGGAAAACGTTCTGCCTGGTATTACCTCAGCGGAAGAGATGGATTA +A +>test.0417.00002.0004i_00076 1317 NA | NA | NA | ID=4_9;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.483 | NA +ATGTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACGGTCGATAACC +CGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTCATTAAACAGGGAAAAGTGGA +ATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCTGACACCATTCGCGTGCGCGACTATCGCGGC +AAACTGATAGTACCGGGCTTTGTCGATACACATATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATG +GTGAACAATTGCTGGAGTGGTTGAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTA +CGCCCGCGAGATGTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTT +GGCACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATGCGTATGATTG +CCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACTGCCGAAAGCAGCTATCACCA +AAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGTCTGTTGTATGCGATTACGCCACGCTTCGCC +CCTACCTCATCTCCTGAACAGATGGCGATGGCGCAACGCCTGAAAGAAGAATATCCGGATACATGGGTAC +ATACCCATCTCTGTGAAAACAAAGATGAAATTGCCTGGGTGAAATTGCTTTATCCTGACCATGATGGTTA +TCTTGATGTTTACCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAA +GAAAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCCAACCTTTACC +TCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAAGTGGGCATGGGAACAGATAT +CGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAACGAAGCCTACAAGGTATTGCAATTACAAGGC +TATCGCCTCTCGGCATATGAAGCGTTTTACCTGGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACG +ATTTGATTGGCAACTTTTTACCTGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCT +ACAGCAGCTGCGCTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGAT +GACCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAA +>test.0417.00002.0004i_00077 1368 NA | NA | NA | ID=4_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +ATGTCTGGAGACATCCTACAAACACCGGACGCACCAAAGCCACAGGGCGCGCTGGATAATTATTTTAAAA +TTACCGCTCGTGGCAGTACCGTTCGTCAGGAAGTACTGGCTGGCTTAACGACCTTTCTGGCCATGGTTTA +TTCCGTTATCGTCGTTCCGGGAATGCTGGGCAAAGCAGGTTTTCCTCCCGCAGCTGTGTTTGTTGCCACC 
+TGTCTGGTCGCGGGCTTCGGCTCGTTGCTGATGGGGTTATGGGCCAATTTGCCAATGGCGATTGGTTGCG +CTATTTCCTTGACGGCGTTTACCGCATTCAGTCTGGTACTCGGGCAACAAATTAGCGTTCCTGTCGCACT +GGGCGCAGTCTTTCTGATGGGCGTCATCTTCACCGCTATTTCCGTAACCGGTGTGCGTACCTGGATCTTA +CGTAATTTGCCGATGGGGATCGCTCACGGTACAGGTATCGGTATCGGCCTGTTTCTGCTGCTGATTGCTG +CTAACGGTGTGGGAATGGTTATCAAAAACCCGATTGAAGGCTTGCCAGTGGCGCTCGGTGCGTTTACCTC +CTTCCCGGTGATGATGAGCTTACTGGGGCTGGCGGTCATCTTCGGTCTGGAAAAGTGCCGCGTACCCGGC +GGGATCTTGTTGGTGATTATTGCAATTTCGATCATCGGCTTAATCTTTGACCCAGCGGTGAAGTACCACG +GTCTGGTGGCAATGCCAAGCCTGACTGGCGAAGATGGTAAGTCTCTGATTTTCAGCCTCGATATTATGGG +CGCACTCCAGCCAACTGTACTTCCGAGTGTACTGGCATTGGTGATGACCGCAGTGTTCGACGCCACTGGC +ACCATCCGTGCCGTCGCCGGTCAGGCGAATTTGTTGGATAAAGACAACCAGATCATCAACGGCGGCAAAG +CCCTGACCAGTGACTCAGTAAGTTCAATATTCTCCGGCCTGGTGGGCGCAGCGCCCGCGGCGGTTTATAT +CGAATCAGCGGCAGGAACCGCCGCCGGGGGGAAAACCGGTTTAACCGCAACCGTGGTTGGTGTGTTGTTC +CTGATGATTCTGTTTTTATCACCGTTATCGTTTCTGATCCCCGGTTATGCCACAGCTCCCGCACTGATGT +ACGTGGGTTTGCTGATGTTAAGCAACGTCTCGAAGCTGGATTTCAACGATTTTATTGACGCAATGGCTGG +CCTGGTGTGTGCCGTGTTCATCGTTCTGACTTGTAATATCGTTACCGGTATTATGCTGGGCTTTGTAACA +CTGGTGGTGGGTCGCGTCTTTGCGCGCGAATGGCAAAAGCTGAATATTGGTACGGTGATCATTACTGCCG +CACTGGTCGCGTTTTACGCGGGTGGTTGGGCAATCTAA +>test.0417.00002.0004i_00078 489 NA | NA | NA | ID=4_11;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.554 | NA +ATGAAATCGTTAATTATCGTTAATCCGGCTGACTGTATTGGCTGCCGTACTTGTGAAGTGGCCTGTGTGG +TCGCTCACCCTTCAGAACAGGAGTTGAATGCCGATATCTTTTTACCCCGGCTGAAGGTACAACGGCTGGA +TAGCATCAGTGCGCCGGTGATGTGCCATCAGTGTGAAAACGCCCCTTGTGTTGGCGCTTGCCCCGTGGGG +GCGCTGACGATGGGCGAGCAGGTGGTGCAGGCCAATTCTGCCCGTTGTATTGGCTGTCAGAGTTGCGTTA +GCGCGTGCCCGTTTGGGATGATCACCATTCAGTCATTGCCGGGTGATCCCCGGCAACAAATCGTGAAATG +CGATCTCTGTGAACTGCGGGAAGAGGGGCCAGCCTGCGTTGAATCTTGCCCGACACAGGCGCTGCAGTTG +CTGACTGAAAGAGAACTCAGGCGTATCCGCCAGCAGCGTATTGCTGCCAGCAGTGAGAATCCTCTCTGA +>test.0417.00002.0004i_00079 1920 NA | NA | NA | ID=4_12;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.528 | NA 
+ATGAATAAGTTTATCGCTGCTGAAGCTGCGGAATGTATAGGCTGCCATGCTTGTGAAATTGCCTGTGCGG +TGGCACATAATCAAGAAAACTGGCCGCTGAGTCACAGTGACTTTCGACCGCGTATCCACGTTGTAGGGAA +AGGCCAGGCTGCGAATCCGGTGGCCTGCCATCACTGCAACAATGCCCCTTGCGTTACGGCTTGTCCGGTT +AATGCTCTGACTTTCCAGTCCGATAGCGTACAACTGGACGAGCAAAAATGTATTGGTTGTAAAAGATGCG +CAATCGCTTGCCCCTTTGGCGTCGTTGAGATGGTCGATACGATTGCACAGAAATGCGACCTTTGTAACCA +GCGCAGTTCCGGCACGCAAGCCTGTATTGACGTCTGCCCAACACAGGCGTTACGGCTGATGGACGATAAA +GGGTTGCAGCAGATAAAGGTGGCCCGCCAGCGCAAAACGGCAGCAGGAAAAGCGTCATCAGACGCTCAGC +CATCTCGCAGTGCAGCGTTGCTCCCCGTTAACTCGCGTAAAGGCGCAGATAAAATTTCAGCGAGTGAACG +GAAAACCCACTTTGGCGAAATCTATTGCGGGCTGGATCCACAACAAGCGACTTATGAGAGTGACCGCTGT +GTTTATTGTGCCGAAAAAGCTAACTGCAACTGGCATTGTCCGCTGCATAACGCTATTCCGGATTACATCC +GTCTGGTACAGGAAGGAAAGATTATTGAAGCGGCAGAACTTTGCCACCAGACCAGTTCCTTACCCGAAAT +CTGCGGCAGGGTATGTCCACAGGACCGTCTTTGTGAAGGTGCATGTACTTTGAAAGATCACTCTGGCGCA +GTCTCTATCGGTAATCTGGAACGCTACATCACCGATACTGCGCTGGCGATGGGCTGGCGTCCCGATGTCA +GCAAAGTTGTTCCCCGTAGCGAAAAAGTGGCGGTGATTGGCGCTGGACCTGCAGGATTAGGGTGTGCTGA +TATTCTGGCGCGCGCGGGAGTTCAGGTTGATGTCTTTGATCGCCATCCAGAAATTGGCGGTATGCTGACT +TTTGGCATTCCTCCTTTCAAACTCGATAAAACGGTATTAAGCCAGCGGCGAGAGATATTCACCGCAATGG +GAATCGATTTCCATCTCAACTGTGAAATTGGCCGCGATATCTCTTTCAACGAATTAACGGCGGAATATGA +TGCTGTTTTCCTCGGCGTGGGGACTTACGGGATGATGCGAGCAGATCTGCCGCATGAAGATGCGCCTGGT +GTCATTCAGGCGTTACCGTTCCTGACCGCCCATACCCGCCAGCTCATGGGATTGCCGGAGTCTGCAGAGT +ATCCGCTGACGGATGTGGAAGGGAAGCGAGTCGTGGTATTGGGCGGTGGCGATACGACAATGGATTGTTT +GCGGACTTCCATCCGCCTTAATGCTGCCAGCGTGACCTGTGCGTATCGTCGTGATGAAGTCAGTATGCCG +GGTTCGCGCAAAGAGGTGGTCAATGCCCGCGAGGAAGGTGTTGAGTTTCAGTTCAATGTTCAGCCGCAAT +ATATCGCTTGTGATGAAGATGGACGCTTAACGGCGGTGGGCCTGATTCGTACCGCTATGGGTGAGCCGGG +GCCGGATGGTCGCCGTCGTCCTCGTCCGGTTGCGGGTTCAGAGTTTGAATTGCCCGCCGATGTTCTCATT +ATGGCCTTTGGTTTCCAGGCACATACCATGCCGTGGTTGCAGGGCAGCGGAATTAAACTCGATAAATGGG +GCCTGATTCAAACCGGCGACGTCGGGTATTTACCTACCCAGACGCATCTGAAAAAAGTCTTTGCTGGTGG +TGATGCAGTTCATGGCGCGGATCTGGTTGTCACTGCAATGGCCGCAGGAAGGCAGGCGGCGCGCGATATG +TTAACTCTGTTTGATACGAAGGCATCGTGA 
+>test.0417.00002.0004i_00080 1449 NA | NA | NA | ID=4_13;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.500 | NA +ATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGACCGCCCAACTGATGAGGTTGACCGCA +TATTATCACCAGGAAAGCTGATCATACTCGGTCTGCAACACGTCCTTGTCATGTACGCAGGTGCAGTCGC +TGTTCCTCTTATGATTGGTGACCGACTCGGCCTATCAAAAGAAGCTATTGCGATGCTCATCAGCTCGGAT +CTCTTTTGCTGCGGGATCGTCACATTATTGCAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGC +CGGTGATTATGTCGGTGACCTTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGATATCGG +CCTGCTGGGGATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATTAGCGCCACTTATCGGT +CGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGATTACTTCTATCGGGCTTAGCATCATTC +AGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGGGAATCCGCAATATGGTAATCCCGTTTATTTAGGTAT +CTCCTTTGCCGTCTTAATTTTTATCTTGCTCATTACTCGCTATGCGAAAGGATTTATGTCCAACGTCGCC +GTATTACTGGGGATTGTATTTGGCTTTTTACTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTAC +ATGATGCTTCATGGTTTGCGATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGTTTCCAT +TCTGACCATGACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTTCCTGGCACTGGGTGAA +ATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTTACGCGTAGATGGGGTTGGGACAATGA +TTGGAGGCACGTTTAACAGCTTCCCACATACGTCATTTTCGCAGAACGTCGGGCTGGTCAGCGTGACGCG +CGTCCACAGCCGCTGGGTGTGCATTGCTTCCGGTATCATTTTGATCCTGTTCGGCATGGTGCCCAAAATG +GCGGTGCTGGTGGCCTCGATTCCGCAATTTGTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTAC +TGGCGACAGGGATTCGAATTCTGTCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATATTGTGGC +GATCAGTCTCGGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAAGTTACCGGCCGTACTG +CAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGCCGTTGTGCTGAACGTCTTCTTTAATG +GCTACCAGCATCATGCTGACCTGGTGAAGGAATCCGTCTCTGATAAAGATTTAAAAGTCAGGACAGTACG +TATGTGGCTTCTGATGCGCAAGCTGAAGAAAAATGAGCATGGAGAATAA +>test.0417.00002.0004i_00081 126 NA | NA | NA | ID=4_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.357 | NA +ATGAATCTTTTAATGCGCGCTATATTCAGTCTGCTGTTGCTTTTTACTCTCTCTATTCCTGTCATTTCTG +ATTGTGTTGCAATGGCCATTGAAAGTCGCTTCAAATATATGATGCTGCTTTTTTAA +>test.0417.00002.0004i_00082 549 NA | NA | NA | 
ID=4_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA +ATGCAAACGGAACACGTCATTTTATTGAATGCACAGGGAGTTCCCACGGGTACGCTGGAAAAGTATGCCG +CACACACGGCAGACACCCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTTAATGCCAAAGGGCAATTATT +AGTTACCCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGCGTGTGGACTAACTCGGTTTGTGGGCACCCA +CAACCGGGAGAAAGCAACGAAGAGGCGGTGATCCGCCGTTGCCGTTATGAGCTTGGCGTAGAAATTACGC +CTCCTGAATCTATCTATCCTGACTTTCGCTACCGCGCCACCGATCCGAATGGCATTGTGGAAAATGAAGT +GTGTCCGGTATTTGCCGCACGCACGACCAGTGCGTTACAGATCAACGATGATGAAGTGATGGATTATCAA +TGGTGTGATTTAGCAGCGGTTTTACGCGGTATTGATGCTACGCCGTGGGCGTTCAGTCCGTGGATGGTGA +TGCAGGCGACAAATCGCGAAGCCAGAAAACGATTATCTGCATTTACCCAGCTTAAATAA +>test.0417.00002.0004i_00083 1518 NA | NA | NA | ID=4_16;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +ATGTCTGAACAACACGCACAGGGCGCTGACGCGGTAGTCGATCTTAACAATGAACTGAAAACGCGTCGTG +AGAAGCTGGCGAACCTGCGTGAGCAGGGGATTGCCTTCCCGAACGATTTCCGTCGCGATCATACCTCTGA +CCAATTGCACGCAGAATTCGACGGTAAAGAGAACGAAGAACTGGAAGCGCTGAACATCGAAGTCGCCGTT +GCTGGCCGCATGATGACCCGTCGTATTATGGGTAAAGCGTCTTTCGTTACCCTGCAGGACGTTGGCGGTC +GCATTCAGTTGTACGTTGCCCGTGACGATCTGCCGGAAGGCGTTTACAACGAGCAGTTCAAAAAATGGGA +CCTCGGCGATATCCTCGGCGCGAAAGGTAAACTGTTCAAAACCAAAACCGGCGAACTGTCTATCCACTGT +ACCGAGCTGCGTCTGCTGACCAAAGCACTGCGTCCGCTGCCGGATAAATTCCACGGCTTGCAGGATCAGG +AAGCGCGCTATCGTCAGCGTTATCTGGATCTCATCTCTAACGATGAATCCCGCAACACCTTTAAAGTGCG +CTCGCAGATCCTCTCTGGTATTCGCCAGTTCATGGTGAATCGCGGCTTTATGGAAGTTGAAACGCCGATG +ATGCAGGTGATCCCTGGCGGTGCCGCTGCGCGTCCGTTCATCACCCACCATAACGCGCTGGATCTCGACA +TGTACCTGCGTATCGCGCCGGAACTGTACCTCAAGCGTCTGGTGGTCGGTGGCTTCGAGCGTGTATTCGA +AATCAACCGTAACTTCCGTAACGAAGGTATTTCCGTACGTCATAACCCAGAGTTCACCATGATGGAACTC +TATATGGCTTACGCAGATTACAAAGATCTGATCGAGCTGACCGAATCGCTGTTCCGTACTCTGGCACAGG +ATATTCTCGGTAAGACGGAAGTGACCTACGGCGACGTAACGCTGGACTTCGGTAAGCCGTTCGAAAAACT +GACCATGCGTGAAGCGATCAAGAAATATCGCCCGGAAACCGACATGGCAGATCTGGACAACTTCGACTCT +GCGAAAGCGATTGCTGAATCTATCGGCATCCACGTTGAGAAGAGCTGGGGTCTGGGCCGTATCGTTACCG 
+AGATCTTCGAAGAAGTGGCAGAAGCACATCTGATCCAGCCGACCTTCATTACTGAATATCCGGCAGAAGT +TTCTCCTCTGGCGCGTCGTAACGACGTTAACCCGGAAATCACAGACCGCTTTGAGTTCTTCATTGGTGGG +CGTGAAATCGGTAACGGCTTTAGCGAGCTGAATGACGCGGAAGATCAGGCGCAGCGCTTCCTGGATCAGG +TTGCCGCGAAAGATGCAGGTGACGACGAAGCGATGTTCTACGACGAAGATTATGTCACCGCACTGGAACA +TGGCTTACCACCGACAGCCGGTCTGGGAATTGGTATCGACCGTATGGTAATGCTGTTCACCAACAGCCAT +ACCATCCGCGACGTTATTCTGTTCCCGGCGATGCGTCCGGTAAAATAA +>test.0417.00002.0004i_00084 882 NA | NA | NA | ID=4_17;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.533 | NA +ATGAAACAGGGGCTGGAAGATGTTTCTGGTCTGCTGGAACTGGCTGTAGAAGCTGACGACGAAGAAACCT +TTAACGAAGCCGTTGCTGAACTCGACGCCCTGGAAGAAAAACTGGCGCAGCTTGAGTTCCGCCGTATGTT +CTCTGGCGAATATGACAGCGCCGACTGCTACCTCGATATTCAGGCGGGGTCTGGCGGTACGGAAGCACAG +GACTGGGCGAGCATGCTTGAGCGTATGTATCTGCGCTGGGCTGAATCGCGTGGTTTCAAAACTGAAATCA +TCGAAGAGTCGGAAGGTGAAGTGGCGGGTATTAAATCCGTGACGATCAAAATCTCCGGCGATTACGCTTA +TGGCTGGCTGCGTACAGAAACCGGCGTTCACCGCCTGGTGCGTAAGAGCCCGTTTGACTCCGGTGGTCGT +CGCCACACGTCGTTCAGCTCCGCGTTTGTTTACCCGGAAGTTGATGATGATATCGATATCGAAATCAATC +CGGCGGATCTGCGCATCGACGTTTATCGCGCATCCGGCGCGGGCGGTCAGCACGTTAACCGTACCGAATC +TGCGGTGCGTATTACTCACATCCCAACCGGGATCGTGACCCAATGCCAGAACGACCGTTCCCAGCACAAG +AACAAAGACCAGGCCATGAAGCAGATGAAAGCGAAGCTTTATGAACTGGAGATGCAGAAGAAAAATGCCG +AGAAACAGGCGATGGAAGATAACAAATCCGACATCGGCTGGGGCAGCCAGATTCGTTCTTATGTCCTTGA +TGACTCCCGCATTAAAGATCTGCGTACCGGGGTAGAAACCCGCAACACGCAGGCCGTGCTGGACGGCAGC +CTGGATCAATTTATCGAAGCAAGTTTGAAAGCAGGGTTATGA +>test.0417.00002.0004i_00085 1734 NA | NA | NA | ID=4_18;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.565 | NA +GTGAAACAACAGATACAACTTCGTCGCCGAGAAGTCGATGAAACGGCCGACTTGCCCGCTGAATTGCCTC +CCTTGCTGCGCCGTTTATATGCCAGCCGGGGTGTGCGTAGCGCGCAGGAACTGGAACGCAGTGTTAAAGG +CATGCTGCCCTGGCAGCAACTGAGCGGCGTCGAAAAGGCCGTTGAGATCCTTTACAACGCTTTTCGCGAA +GGAACGCGGATTATTGTGGTCGGTGATTTCGACGCCGACGGTGCGACCAGCACGGCTCTAAGCGTGCTGG +CGATGCGCTCGCTTGGTTGCAGCAATATCGACTACCTGGTTCCAAACCGTTTCGAAGACGGTTACGGCTT 
+AAGCCCGGAAGTAGTCGATCAGGCTCATGCCCGTGGCGCGCAGTTAATTGTCACGGTGGATAACGGTATT +TCCTCCCATGCGGGGGTTGAACACGCTCGTTCGTTGGGCATTCCGGTTATTGTTACCGATCACCATTTGC +CAGGCGACACATTACCCGCAGCGGAAGCGATCATTAACCCTAACTTGCGCGACTGTAATTTCCCGTCGAA +ATCACTGGCAGGCGTGGGTGTGGCGTTTTATCTGATGCTGGCGCTGCGCACCTTTTTGCGCGATCAGGGC +TGGTTTGATGAGCGCGGCATCGCAATTCCTAATCTGGCAGAACTGCTGGATCTGGTAGCGTTGGGGACAG +TGGCGGACGTCGTGCCGCTGGACGCTAATAATCGCATTCTGACCTGGCAGGGGATGAGTCGCATCCGTGC +CGGAAAGTGCCGTCCGGGGATTAAAGCGCTGCTGGAAGTGGCCAATCGCGATCCACAAAAACTCGCCGCC +AGCGATTTAGGTTTTGCGCTGGGGCCACGTCTCAATGCTGCCGGGCGACTGGACGATATGTCCGTTGGCG +TGGCGCTGTTGTTGTGTGACAACATTGGCGAAGCGCGTGTGCTGGCGAATGAACTCGATGCACTAAACCA +AACACGTAAAGAGATCGAACAGGGAATGCAGGTTGAAGCGCTCACTCTGTGCGAGAAGCTGGAACGTAGC +CGCGACACGCTGCCAGGTGGGCTGGCAATGTATCACCCTGAATGGCATCAGGGCGTTGTTGGCATTCTGG +CATCGCGTATCAAAGAGCGTTTTCACCGTCCGGTTATCGCCTTTGCGCCTGCGGGCGACGGTACGCTGAA +AGGTTCCGGTCGCTCCATTCAGGGGCTGCATATGCGCGATGCGCTGGAGCGGCTAGACACGCTTTACCCC +GGCATGATGCTCAAGTTTGGCGGCCATGCGATGGCGGCGGGTTTGTCGCTGGAAGAGGAGAAATTCGAAC +TCTTTCAGCAACGCTTTGGCGAACTGGTTACCGAGTGGTTAGATCCTTCTTTATTGCAAGGGGAAGTGGT +ATCAGACGGCCCATTAAGTGCGGCAGAGATGACCATGGAAGTGGCGCAACTGCTGCGTGATGCTGGCCCG +TGGGGACAAATGTTCCCGGAACCGTTGTTTGACGGTCATTTCCGTCTGCTGCAACAGCGGCTGGTGGGCG +AGCGTCATTTGAAAGTCATGGTCGAGCCGGTCGGCGGCGGTCCGCTGCTGGATGGTATTGCTTTTAATGT +CGATACCGCCCTCTGGCCGGATAACGGCGTGCGCGAAGTGCAACTGGCTTACAAGCTCGATATCAACGAG +TTTCGCGGCAACCGCAGCCTGCAAATTATCATCGACAATATCTGGCCAATTTAG +>test.0417.00002.0004i_00086 711 NA | NA | NA | ID=4_19;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.482 | NA +ATGAAGAAAGGTTTTATGTTATTTACCTTGTTGGCAGCGTTTTCAGGCTTTGTTCAGGCTGATGACGCGG +CAATTCAACAAACGTTAGCCAAAATGGGCATCAAAAGCAGCGATATTCAGCCCGCGCCCGTAGCTGGCAT +GAAGACAGTTCTGACTAACAGCGGTGTGTTGTACATCACCGATGATGGTAAACATATCATTCAGGGGCCA +ATGTATGACGTTAGTGGCACGGCTCCGGTCAATGTCACCAATAAGATGCTGTTAAAGCAGTTGAATGCGC +TTGAAAAAGAGATGATCGTTTATAAAGCGCCGCAGGAAAAACACGTCATCACCGTGTTTACTGATATTAC +CTGTGGTTACTGCCACAAACTGCATGAGCAAATGGCAGACTATAACGCGCTGGGGATCACCGTGCGTTAT 
+CTTGCTTTCCCGCGCCAGGGGCTGGACAGCGATGCAGAGAAAGAAATGAAAGCTATCTGGTGTGCGAAAG +ATAAAAACAAAGCGTTTGATGATGTGATGGCAGGTAAAAGCGTCGCACCAGCCAGCTGCGACGTGGATAT +TGCCGACCATTACGCACTTGGCGTCCAGCTTGGCGTTAGCGGTACTCCGGCAGTTGTGCTGAGCAATGGC +ACACTTGTTCCGGGTTACCAGCCGCCGAAAGACATGAAAGAATTCCTCGACGAACACCAAAAAATGACCA +GCGGTAAATAA +>test.0417.00002.0004i_00087 897 NA | NA | NA | ID=4_20;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.530 | NA +GTGAAACAGGATCTGGCACGCATCGAGCAGTTTCTTGATGCTCTGTGGCTGGAAAAAAATCTGGCTGAAA +ATACGTTGAACGCTTACCGTCGCGATCTGTCAATGATGGTGGAGTGGTTGCATCACCGCGGGTTGACGCT +GGCGACGGCGCAAAGTGACGATTTGCAGGCATTACTGGCAGAACGGCTGGAGGGCGGGTATAAAGCCACC +AGCTCAGCGCGTTTGCTGAGTGCAGTGCGCCGATTGTTCCAGTATCTTTATCGCGAAAAGTTTCGTGAAG +ATGATCCCAGTGCGCATCTCGCTTCACCGAAATTGCCCCAGCGTTTGCCAAAAGATTTAAGCGAAGCGCA +GGTCGAACGTTTATTACAGGCACCATTAATTGATCAGCCACTGGAGCTACGCGATAAAGCCATGCTTGAA +GTGTTGTATGCTACCGGACTGCGTGTCTCTGAACTGGTCGGGCTGACAATGAGTGATATCAGCCTGCGTC +AGGGCGTGGTGCGGGTCATTGGTAAAGGCAACAAAGAGCGCCTGGTGCCGTTAGGTGAAGAGGCGGTTTA +CTGGCTGGAAACCTATCTGGAACATGGGCGTCCGTGGCTGTTGAATGGTGTGTCAATTGACGTGTTGTTT +CCCAGCCAGCGTGCGCAGCAGATGACGCGACAGACCTTCTGGCACCGCATTAAACATTATGCCGTGCTGG +CGGGTATCGACAGCGAAAAGCTGTCACCGCATGTGTTGCGTCACGCTTTTGCCACTCACTTATTAAATCA +TGGTGCGGATTTACGCGTGGTGCAGATGCTACTGGGCCACAGCGATCTCTCCACCACGCAAATTTATACG +CATGTCGCTACCGAGCGTCTGCGACAACTTCATCAACAGCATCACCCGCGGGCGTGA +>test.0417.00002.0004i_00088 522 NA | NA | NA | ID=4_21;partial=00;start_type=ATG;rbs_motif=AGxAG;rbs_spacer=5-10bp;gc_cont=0.517 | NA +ATGAATATGGGTCTTTTTTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAAATCCGCGATA +TTATCGGCCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCGAAATTAATGGAGCAGTACGA +TGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAAATCCAGGAAGACTGGGAAGCCGTCTGGGAT +CAGCTCGACGACCTGAACCTCGAAGGTAAAATTGTTGCGCTGTATGGGCTTGGCGATCAACTGGGATACG +GCGAGTGGTTCCTCGATGCGCTCGGTATGCTGCATGACAAACTCTCGACCAAAGGCGTGAAGTTCGTCGG +CTACTGGCCAACGGAAGGATATGAATTTACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTG 
+GGTCTGGCGCTGGATGAAACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGGTGCGAGCAAA +TCCTCAACGAAATGGCAGAGCATTACGCCTGA +>test.0417.00002.0004i_00089 408 NA | NA | NA | ID=4_22;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA +GTGGTCCTGTGGCAATCTGATTTGCGCGTCTCCTGGCGCGCACAGTGGCTTTCCTTGCTGATTCATGGGC +TGGTTGCCGCTGTTATTTTACTCATGCCCTGGCCGCTCAGTTACACCCCGTTATGGATGGTGTTACTTTC +GCTGGTGGTGTTTGATTGCGTTCGCAGCCAGCGGCGCATTAATGCTCGCCAGGGGGAAATTCGCTTGTTG +ATGGACGGGCGTTTGCGTTGGCAAGGGCAGGAGTGGAGCATCGTCAAAGCGCCGTGGATGATTAAGAGCG +GCATGATGCTGCGTTTACGTTCTGACAGCGGAAAACGGCAACATTTATGGCTGGCAGCTGACAGCATGGA +CGAAGCCGAATGGCGGGATTTACGGCGGATATTGTTACAACAAGAGACGCAAAGATAA +>test.0417.00002.0004i_00090 267 NA | NA | NA | ID=4_23;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.491 | NA +ATGGACATTAACAACAAAGCCCGCATTCATTGGGCATGCCGCCGTGGTATGCGCGAACTCGATATTTCAA +TCATGCCGTTTTTCGAACATGAGTACGACAGCTTAAGCGATGACGAAAAACGCATCTTTATTCGTCTGCT +GGAATGTGACGATCCGGACCTGTTTAACTGGCTGATGAATCACGGTAAACCAGCCGATGCAGAACTGGAA +ATGATGGTCCGACTCATCCAGACACGGAACCGGGAACGTGGTCCTGTGGCAATCTGA +>test.0417.00002.0004i_00091 981 NA | NA | NA | ID=4_24;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.539 | NA +ATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGACGCTGATGACGC +TTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATATATGCAAGGCCAGGTGACAGC +AGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGCCGCCCATTGCGACGCCAAAGGTAAAATGTGG +AGCAATTTACGTCTGTTCCGCGACGGCGATGGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCAC +AGCTGACTGAACTGAAAAAATATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCT +GCTTGGTGTTGCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGAA +AAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACGTTTCCTGATCG +TAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGAAGCGGAACTGAACAATAGCCA +ACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGTGATTGATGCCGCCAACAGCGGGCAGTTTATC +CCCCAGGCGACCAACCTCCAGGCGCTGGGCGGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGA 
+TGGTGGCGCGAGCAAAATTCCGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCG +ACTGCCGGAAGCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCTG +GCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATATGGAACCGGACA +GCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACTGCCATATTCGCTGGAAGAGTA +A +>test.0417.00002.0004i_00092 660 NA | NA | NA | ID=4_25;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.518 | NA +ATGGTTCAGAAGCCCCTCATTAAGCAGGGATATTCGCTGGCAGAGGAAATTGCCAACAGCGTCAGTCACG +GCATTGGGCTGGTGTTTGGTATCGTTGGGCTGGTGTTGCTACTGGTTCAGGCGGTGGATCTCAATGCCAG +CGCCACGGCGATAACCAGTTACAGCCTCTATGGCGGCAGTATGATCCTGCTGTTCCTCGCTTCGACGCTC +TATCACGCCATTCCCCATCAACGGGCAAAAATGTGGCTGAAGAAATTTGACCACTGTGCCATTTATCTGT +TGATTGCCGGAACCTATACGCCGTTTTTGCTGGTGGGGCTGGATTCTCCGTTAGCGCGCGGGTTGATGAT +TGTTATCTGGAGCCTGGCATTGCTGGGTATTCTGTTTAAACTGACCATCGCGCACCGATTCAAAATTTTA +TCTCTGGTGACCTATCTGGCGATGGGCTGGCTGTCGCTGGTGGTAATTTATGAAATGGCAGTTAAGCTCG +CGGCGGGCAGCGTTACCTTACTGGCGGTAGGCGGTGTGGTTTATTCGCTCGGGGTGATTTTCTACGTCTG +CAAGCGCATTCCATACAATCATGCCATCTGGCACGGCTTTGTGCTCGGCGGTAGTGTGTGCCACTTTCTG +GCGATCTATTTGTATATTGGGCAGGCGTAA +>test.0417.00002.0004i_00093 312 NA | NA | NA | ID=4_26;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.455 | NA +ATGCAGCCAAACGACATCACTTTTTTTCAACGTTTCCAGGATGACATTCTGGCTGGGCGTAAAACCATCA +CCATCCGCGACGAGTCTGAATCGCACTTCAAAACGGGTGATGTGCTTCGTGTCGGACGTTTTGAAGATGA +CGGTTATTTTTGCACGATTGAAGTCACCGCAACCTCAACCGTAACGCTGGATACGCTGACGGAAAAACAT +GCAGAGCAGGAAAATATGACCCTGACTGAACTGAAAAAGGTCATTGCCGACATCTATCCCGACCAGACAC +AGTTTTATGTGATTGAATTTAAATGTCTTTAA +>test.0417.00002.0004b_00094 420 NA | NA | NA | ID=4_27;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.500 | NA +GTGAAAAAACTCACCTTACCGAAAGATTTCTTATGGGGCGGCGCAGTTGCCGCTCATCAGGTCGAAGGCG +GCTGGAACAAAGGCGGCAAAGGGCCGAGCATTTGTGACGTTTTGACCGGTGGCGCACACGGCGTGCCGCG +CGAAATCACCAAAGAAGTTGTGCCTGGCAAATACTATCCAAACCATGAAGCCGTTGATTTTTATGGTCAC +TACAAGGAGGACATCAAGCTATTTGCCGAAATGGGCTTCAAATGTTTTCGTACTTCCATCGCCTGGACGC 
+GCATTTTTCCAAAAGGCGATGAAGCTCAGCCAAACGAAGAAGGGCTGAAGTTCTACGATGATATGATCGA +TGAACTGCTGAAATACAACATCGAACCGGTGATCACCCTCTCCCACTTTGAAATGCCGCTGCATCTGGTG +>test.0417.00002.0005b_00095 1011 NA | NA | NA | ID=5_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.515 | NA +CAATATGGTAGCTGGACCAACCGTAAAGTGGTTGATTTCTTTGTCCGTTTCGCGGAAGTGGTATTTGAAC +GCTATAAGCATAAAGTCAAATACTGGATGACTTTCAACGAAATTAACAACCAGCGTAACTGGCGTGCACC +GCTGTTCGGTTACTGCTGCTCCGGCGTGGTGTATACCGAGCATGAAAACCCGGAAGAGACGATGTATCAG +GTGCTGCATCACCAGTTTGTCGCCAGCGCCCTGGCGGTGAAAGCCGCGCATCGCATCAACCCGGAGATGA +AAGTCGGTTGTATGCTGGCGATGGTGCCGCTCTATCCTTACTCCTGTAACCCGGACGATGTGATGTTTGC +CCAGGAGTCGATGCGCGAACGTTACGTCTTTACCGATGTGCAGTTGCGTGGCTATTACCCGTCCTATGTG +TTGAACGAGTGGGAACGCCGCGGATTTAACATCAAAATGGAAGACGGCGATCTGGATGTACTGCGCGAAG +GCACCTGCGATTATCTCGGCTTCAGCTATTACATGACCAACGCGGTGAAGGCCGAAGGTGGCACCGGCGA +TGCGATTTCTGGTTTCGAAGGCAGCGTACCGAATCCGTATGTTAAAGCGTCTGACTGGGGCTGGCAGATT +GATCCGGTTGGTCTGCGCTACGCACTTTGCGAGCTGTATGAGCGTTACCAGAAGCCGCTGTTTATTGTCG +AAAACGGTTTTGGCGCTTACGACAAAGTGGAAGATGATGGCAGCATCAATGACGATTACCGCATTGATTA +CCTGCGTGCCCATATTGAAGAGATGAAAAAAGCGGTGACTTACGATGGCGTGGACCTGATGGGCTACACG +CCGTGGGGCTGCATCGACTGTGTGTCGTTCACCACCGGGCAGTACAGCAAACGCTACGGCTTTATCTATG +TGAATAAACATGACGACGGTACTGGCGATATGTCGCGTTCACGTAAGAAGAGCTTTAACTGGTACAAAGA +GGTGATTGCCAGCAACGGCGAGAATCTGTAA +>test.0417.00002.0005i_00096 2874 NA | NA | NA | ID=5_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.554 | NA +ATGACACAGACGTTAAGCCAGCTTGAAAACAGCGGCGCTTTTATTGAACGCCATATCGGACCGGACGCCG +CGCAACAGCAAGAAATGCTGAATGCCGTTGGCGCACAATCGTTAAACGCGCTGACCGGCCAGATTGTGCC +GAAAGATATTCAGCTTGCGACTCCGCCGCAGGTTGGCGCACCGGCGACCGAATACGCCGCACTGGCAGAA +CTCAAGGCTATTGCCAGTCGCAATAAACGCTTCACGTCTTACATCGGCATGGGTTACACCGCCGTGCAGC +TACCGCCGGTTATCCTGCGTAACATGCTGGAAAATCCGGGCTGGTATACCGCGTATACTCCGTATCAACC +TGAAGTCTCCCAGGGCCGCCTTGAAGCACTGCTCAACTTCCAGCAGGTAACGCTGGATTTAACCGGGCTG +GATATGGCCTCTGCTTCTCTTCTTGACGAAGCCACCGCTGCCGCCGAAGCAATGGCGATGGCGAAACGCG 
+TCAGCAAACTGAAAAATGCCAACCGCTTCTTTGTTGCTTCTGACGTTCATCCGCAAACGCTGGATGTGGT +CCGTACTCGTGCCGAAACCTTTGGTTTTGAAGTGATTGTCGATGACGCGCAAAAAGTGCTCGACCATCAG +GACGTTTTCGGCGTGCTGTTACAGCAGGTCGGCACTACTGGTGAAATTCACGACTACACCGCGCTTATTA +GCGAACTGAAATCACGCAAAATTGTGGTCAGCGTTGCCGCCGATATTATGGCGCTGGTGCTGTTAACTGC +GCCAGGTAAACAGGGCGCGGATATTGTTTTTGGTTCGGCGCAACGCTTTGGCGTACCGATGGGCTATGGT +GGCCCACACGCGGCATTCTTTGCGGCGAAAGACGAATACAAACGCTCAATGCCGGGCCGTATTATCGGTG +TATCGAAAGATGCAGCTGGCAACACCGCTCTGCGCATGGCGATGCAGACTCGCGAGCAACATATTCGTCG +TGAGAAAGCGAACTCCAACATTTGTACTTCCCAGGTACTGCTGGCAAACATTGCCAGCCTGTATGCCGTT +TATCACGGTCCGGTTGGCCTGAAACGTATCGCTAATCGCATCCACCGTCTGACCGATATCCTGGCGGCGG +GCCTGCAACAAAAAGGTCTGAAGCTGCGCCATGCGCACTATTTCGATACTTTGTGTGTGGAAGTGGCCGA +CAAAGCGGGCGTGCTGGCGCGTGCCGAAGCGGCTGAAATCAACCTGCGTAGCGATATTCTGAACGCGGTT +GGGATCACCCTTGATGAAACAACCACGCGCGAAAACGTGATGCAGCTTTTCAGCGTGCTGTTGGGCGATA +ACCACGGGCTGGACATCGACACACTGGACAAAGACGTGGCTCACGACAGTCGCTCTATTCAGGCTGCGAT +GCTGCGCGACGACGAAATCCTCACCCATCCGGTGTTTAATCGCTACCACAGCGAAACCGAAATGATGCGC +TATATGCACTCGCTGGAGCGTAAAGATCTGGCGCTGAATCAGGCGATGATCCCGCTGGGTTCCTGCACCA +TGAAACTGAACGCCGCCGCCGAGATGATCCCGATCACCTGGCCGGAATTTGCCGAACTGCACCCGTTTTG +CCCGCCAGAACAGGCTGAAGGTTATCAGCAGATGATCGCGCAGCTGGCTGACTGGCTGGTGAAACTGACC +GGTTACGACGCCGTTTGTATGCAGCCGAACTCTGGCGCACAGGGCGAATACGCGGGCCTGCTGGCGATTC +GTCATTATCATGAAAGCCGCAACGAAGGGCATCGCGATATCTGCCTGATCCCGGCTTCTGCGCACGGCAC +TAACCCGGCTTCCGCGCATATGGCAGGAATGCAGGTGGTGGTTGTGGCGTGTGATAAAAACGGCAACATC +GATCTGACTGATCTGCGCGCGAAAGCGGAACAGGCGGGCGATAACCTCTCCTGTATCATGGTGACCTATC +CTTCTACCCACGGCGTGTATGAAGAAACGATCCGTGAAGTGTGTGAAGTCGTGCATCAGTTCGGCGGTCA +GGTTTACCTTGATGGCGCGAACATGAACGCTCAGGTTGGCATCACCTCGCCGGGCTTTATTGGTGCGGAC +GTTTCCCACCTTAACCTGCATAAAACTTTCTGCATTCCGCATGGCGGTGGTGGTCCGGGTATGGGACCGA +TCGGTGTGAAAGCGCATCTGGCTCCGTTTGTACCGGGTCATAGCGTGGTGCAAATCGAAGGCATGTTAAC +CCGTCAGGGCGCGGTTTCTGCGGCACCGTTCGGTAGTGCCTCTATCCTGCCAATCAGCTGGATGTACATC +CGCATGATGGGCGCAGAAGGGCTGAAAAAAGCAAGCCAGGTGGCAATTCTTAACGCCAACTATATTGCCA 
+GCCGTCTGCAGGATGCCTTCCCGGTGCTGTATACCGGTCGCGACGGTCGCGTGGCGCACGAATGTATTCT +CGATATTCGCCCGCTGAAAGAAGAAACCGGCATCAGCGAGCTGGATATTGCCAAGCGCCTGATCGACTAC +GGTTTCCACGCGCCGACCATGTCGTTCCCGGTGGCGGGTACGCTGATGGTTGAACCGACTGAATCTGAAA +GCAAAGTGGAACTGGATCGCTTTATCGATGCGATGCTGGCTATCCGCGCAGAAATTGATCAGGTGAAAGC +CGGTGTCTGGCCGCTGGAAGATAACCCGCTGGTGAATGCGCCGCACATTCAAAGCGAACTGGTCGCCGAG +TGGGCGCATCCGTACAGCCGTGAAGTTGCAGTATTCCCGGCAGGTGTGGCAGACAAATACTGGCCGACCG +TGAAACGTCTGGATGATGTTTACGGCGACCGTAACCTGTTCTGCTCCTGCGTACCGATTAGCGAATACCA +GTAA +>test.0417.00002.0005i_00097 390 NA | NA | NA | ID=5_3;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA +ATGAGCAACATACCAGCAGAACTGAAATACAGCAAAGAACACGAATGGTTGCGTAAAGAAGCCGACGGCA +CTTACACCGTTGGCATCACCGAACACGCTCAGGAGCTGTTAGGCGATATGGTGTTTATTGACCTACCGGA +AGTGGGCGCAACGGTTAGCGCGGGCGATGACTGCGCGGTTGCCGAATCGGTAAAAGCGGCGTCAGACATT +TATGCGCCAGTAAGCGGTGAAATCGTGGCGGTAAACGATGCACTGAGCGATTTCCCGGAACTGGTGAACA +GCGAACCGTATGCAGGCGGCTGGATTTTCAAAATCAAAGCCAGCGATGAAAGCGAACTGGAATCACTGCT +GGATGCAACCGCATACGAAGCATTGTTAGAAGACGAGTAA +>test.0417.00002.0005i_00098 1164 NA | NA | NA | ID=5_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.536 | NA +ATGCTGGGTTTCGTGGTGATAATTTCGCCATGGAAAAGTTGTCAGCCCCGCTTATTCAATGAGGACAAGA +TGGCACAACAGACTCCTTTGTACGAACAACACACGCTTTGCGGCGCTCGCATGGTGGATTTCCACGGCTG +GATGATGCCGCTGCATTACGGTTCGCAAATCGACGAACATCATGCGGTACGTACCGATGCCGGAATGTTT +GATGTGTCACATATGACCATCGTCGATCTTCGCGGCAGCCGCACCCGGGAGTTTCTACGTTATCTGCTGG +CGAACGATGTGGCGAAGCTCACCAAAAGCGGCAAAGCCCTTTACTCGGGGATGTTGAATGCCTCTGGCGG +TGTGATAGATGATCTCATCGTCTACTACTTTACTGAAGATTTCTTCCGCCTCGTTGTTAACTCCGCCACC +CGCGAAAAAGACCTCTCCTGGATTACCCAACACGCTGAACCTTTCGGCATCGAAATTACTGTTCGTGATG +ACCTTTCCATGATCGCCGTACAAGGGCCGAATGCGCAGGCAAAAGCTGCCACACTGTTTAATGACGCCCA +GCGTCAGGCGGTGGAAGGGATGAAACCGTTCTTTGGCGTGCAGGCGGGCGATCTGTTTATTGCCACCACC +GGTTACACCGGTGAAGCGGGCTACGAAATTGCGCTGCCCAATGAAAAAGCGGCCGATTTCTGGCGCGCGC +TGGTGGAAGCTGGCGTTAAGCCATGTGGCCTGGGCGCGCGTGACACGCTGCGTCTGGAAGCGGGCATGAA 
+TTTGTATAGCCAGGAGATGGACGAAACTATTTCTCCTTTAGCCGCCAATATGGGCTGGACTATCGCCTGG +GAACCGGCAGATCGTGACTTTATCGGTCGTGAAGCTCTGGAAGCGCAGCGTGAACATGGCACAGAAAAAC +TGGTTGGTCTGGTGATGACCGAAAAAGGCGTGCTGCGTAATGAACTGCCGGTACGTTTTACTGATGCGCA +GGGCAACCAGCATGAAGGCATTATCACCAGCGGTACTTTCTCCCCAACGCTGGGTTATAGCATTGCGCTG +GCGCGCGTGCCGGAAGGTATTGGTGAAACGGCGATTGTGCAAATTCGCAACCGTGAAATGCCGGTTAAAG +TGACGAAACCTGTTTTTGTGCGTAACGGCAAAGCCGTCGCGTGA +>test.0417.00002.0005b_00099 156 NA | NA | NA | ID=5_5;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.231 | NA +TTTCTAATGCCACGAATTTTTGATTTAGTGTTTTTTGACATTTTTTTAGTTCTTAATGTTGTCTTATTCA +AATTAACTTTCTCATCTATTTATCTTTATATAGAGATTTGTTCATTTTTTGGTTTTTTATTCTGTTACGA +TTTTGGCGTTTTTTAA diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test_runprokka_H299.gen b/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test_runprokka_H299.gen new file mode 100644 index 0000000000000000000000000000000000000000..b82e3435e7dd7a94f57b7f5446127f1f59a50eb5 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Genes/test_runprokka_H299.gen @@ -0,0 +1,208 @@ +>test_runprokka_H299.0001b_00001 138 NA | NA | NA | ID=1_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.580 | NA +ATGGGTAAAGGCAGCAGTAAGGGGCATACCCCGCGCGAAGCGAAGGACAACCTGAAGTCCACGCAGCTGC +TGAGTGTGATCGATGCCATCAGCGAAGGGCCGGTTGAAGGTCCGGTGGACGGATTAAAAAGCGTGCTG +>test_runprokka_H299.0001i_00002 543 NA | NA | NA | ID=1_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.562 | NA +GTGAAAACGGGGTCCGAAGCCATCCGGGCGCTGGCCATGCAGATCCCGGCATTTCGTCAGAAACTGAGCG +ACGGCTGGTACCAGGTACGCATTGCCGGGCGTGATGCAGGTGAAACCGAATTGTCTGCCCGTCTTAATGA +GCCGCTGGAAAATGGTGCCGTGATCCATATCGTGCCGCGTCTGGCAGGAGCCAAAAGTGGCGGTGTGTTT +CAGGCTGTGCTGGGGGCGGCTGTTATGGCGGTTGCTATATGGATGCCGGGGGTAGGAATTATGGCGAGTA +ATCTGCTGTTTTCTCTCGGTGCCAGTATGACGCTTGGCGGTGTTGCACAGATGCTGGCCCCTAAACCCAA +AACCCCCCGCACACAGACAACGGATAACGGCAAACAGAATACCTATTTTTCTTCACTGGATAACATGGTT 
+GCCCAGGGCAATGTTCTGCCGGTTCTGTACGGTGAAATGCGCGTGGGGTCACGCGTGGTTTCTCAGGAGA +TCAGCACGGCAGACGAAGGGGATGGTGGTCAGGTTGTGGTGATTGGTCGCTGA +>test_runprokka_H299.0001i_00003 600 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.593 | NA +ATGTCGCCGGAGGACTGGCTGAGTGCAGAAATGCAGAGAGAGATTGTGGCGCTGGTCCACAGCCACCCCG +GTGGTCTGCCCTGGCTGAGTGAGGCCGACCGGCGGCTGCAGGTACAGAGTGATTTGCCGTGGTGGCTGGT +CTGCCGGGGGGCGATTCATAAATTCCGCTGTGTGCCGCATCTCACCGGGCGGCGCTTTGAGCACGGGGTA +ACGGACTGTTACACGCTGTTCCGGGACGCTTACCATCTGGCGGGAATTGAGATGCCGGATTTTCATCGCG +GGGATGACTGGTGGCGTAACGGTCAGAATCTCTATCTGGATAATCTGGAGGCCACAGGGCTGTATCAGGT +GCCGTTGTCAGCGGCGCAGCCGGGCGATGTGCTGCTGTGCTGTTTTGGTTCATCGGTGCCGAATCATGCC +GCCATTTACTGTGGTGACAGCGAGCTGCTGCACCATATTCCTGAACAACTGAGCAAACGAGAGAGGTACA +CCGACAAATGGCAGCGACGCACACACTCCCTCTGGCGTCACCGGGCATGGCACGCATCTGCCTTTACGGG +GATTTACAACGATTTGGCCGCCGCATCGACCTTCGAGTGA +>test_runprokka_H299.0001i_00004 699 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.558 | NA +ATGCAGGACATACAACAGGAAACGCTGAATGAATGCATTCGTGCGGAGCAGTCGGCCAGCGTGGTGCTCT +GGGAAATCGACCTGACCGAGGTAGGCGGGGATCGCTACTTTTTCTGTAATGAGCAGAACGAAAAAGGTGA +GTCTGTCACCTGGCAGAGTCGGCAGTATCAGGCCTATCCCATTCAGGGGAGTGGATTTGAGATGAACGGC +AAGGGCAGTGCTGCCCGTCCGACACTGACGGTCTCTAACCTGCACGGCATGATCACCGGGATGGCGGAAG +ATCTGCAGAGTCTGGTCGGCGGAACGGTGGTCCGGCGTAAGGTTTACGCCCGCTTTCTGGATGCGGTGAA +CTTCGTCAACGGAAACAGCGAAGCCGATCCGGAGCAGGAGGTGATCAGCCGCTGGCGCATCGAGCAGTGC +AGCGAACTGAGCGCGGTCAGTGCCTCTTTTGTACTGTCCACGCCGACTGAAACGGATGGCGCTGTTTTTC +CGGGACGTATCATGCTGGCCAACACCTGCACCTGGACCTATCGCGGCGATGAGTGCGGTTATAGCGGTCC +GGCGGTCGCGGATGAATATGACCAGCCGACGTCCGATATCACGAAGGATAAATGCAGCAAATGCCTGAGT +GGCTGTAAGTTTCGCAATAATGTCGGCAACTTTGGCAGCTTCCTTTCCATTAACAAACTTTCGCAGTAA +>test_runprokka_H299.0001i_00005 297 NA | NA | NA | ID=1_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.404 | NA +ATGAAAACAGAAAATAAACCATCGATAAAAACTGTAAGATTTGGCGATGGTTATGAGCAACGAAGTCCAA 
+ATGGACTTAATCATTCTCTGCGCGTTTTCACCTGTGATTTCAAAGTTGAGGCGAATGAACGTGATTCATT +TGAAAAATTTTTAGCCCGGCATGAAGGCTATAAATCTTTTTTTTGGCGCCCGCCGGGTATTAACAGAAAA +ATCAGAGTGGTGTGTCGAACGTGGTCAGCGACAGAACATATCACCTATACCGATTTTTCGTGTCAGTTTG +ACGAAGTGGTGATCTGA +>test_runprokka_H299.0001b_00006 963 NA | NA | NA | ID=1_6;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.442 | NA +GCCGAAATAACAGCATGGCGTGATTCATTGCAGGCTTCGATTGATAATCGTCAGCAGGGGTATGATATTC +AGATTGCTGGTTATGGGGTTGGCGATAAAAATCAGCAACGCCAGCAGGAATTACTGCGGATTGAACATGG +ATATAACAATCAGCGTCTGCAACTTGAACGTGACTATGCAGATAAATCCCGTGGAATGTCAGATCATGTT +TTTCAAGAGAAAATGCAGGCTCTGAATGATGCTCTGGAACGGGAAAAAGAAATTGTCAGACAGAAAAACG +AGCAGCTCGATATTCAGGCAGGAGACTGGGTTAGTGGTGCCTCCCAGGGATTCAATAACTGGCTGGATGA +CACTAAGGATATCAGTGAGCAGATAAAATCAACCACGACTCAGATGTTTGATGGGATGACCGATGCGCTG +GGTGATTTTGTCACGACAGGCAAGGCAAATTTTCGTTCTTTCGCTACTTCCGTGATTTCGGATCTTAGTC +GAATAGCATTAAAGGCTTCAATTACTGGGATTTTCGACAGCATTAGTAACAGTTCTTCTGGGGGGATTTT +AGGAACTATCGGGAGTGCTATTAGTAAATTTATTCCGAATGCAAAGGGCGGTGTTTATGAGTCTCCGTCA +TTGAGCACGTATTCGAACGGTATTTATGATTCCCCGCAATTTTTTGCTTTTGCAAAAGGGGCTGGTGTTT +TTGGTGAGGCTGGACCGGAAGCCATTATGCCATTAACACGAACTTCCGATGGTTCTCTTGGTGTCAGAGC +TATTAATAGTAAAAGTGGTAATGGAGGCGGAGATATTACCTATGCCCCTGTATACCAAATCACTATTCAA +AATGACGGCCAGAATGGAGAGATTGGCCCTCAGGCAATAAAAGCACTTATGGGGATGGTTGATCAGCGGG +TGCAGGGCAATCTGTTAAATATGCGACGTGATGGGGGAATGTTAAGTGGCTAA +>test_runprokka_H299.0002b_00007 138 NA | NA | NA | ID=2_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.572 | NA +ATGGGTAAAGGCAGCAGTAAGGGGCATACCCCGCGCGAAGCGAAGGACAACCTGAAGTCCACGCAGCTGC +TGAGTGTGATCGATGCCATCAGCGAAGGGCCGGTTGAAGGTCCGGTGGATGGATTAAAAAGCGTGCTG +>test_runprokka_H299.0002i_00008 543 NA | NA | NA | ID=2_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.547 | NA +GTGAAAACGGGGGCTGAAGCCATCCGGGCGCTGGCCACACAGCTCCCGGCGTTTCGTCAGAAACTGAGCG +ACGGCTGGTATCAGGTACGGATTGCCGGGCGTGATACAGGTGAAACGGAATTATCAGCCCGTCTTAATGA +ACCGCTGGCAAATGGTGCTGTGATCCATATCGTGCCGCGTCTGGCAGGAGCCAAAAGTGGCGGTGTGTTT 
+CAGGCTGTGCTGGGGGCGGCTGTTATGGCGGTTGCTATATGGATGCCGGGGGTAGGAATTATGGCGAGTA +ATCTGCTGTTTTCTCTCGGTGCCAGTATGACGCTTGGCGGTGTTGCACAGATGCTGGCCCCTAAACCCAA +AACCCCCAGCACACAGACAACGGATAACGGCAAACAGAACACCTATTTTTCTTCACTGGATAATATGGTT +GCCCAGGGCAATGTTCTGCCCGTTCTGTACGGTGAAATGCGCGTGGGATCACGTGTGGTATCTCAGGAGA +TCAGCACAGCAGATGAAGGTGATGGTGGTCAGGTTGTGGTGATTGGTCGCTGA +>test_runprokka_H299.0002i_00009 744 NA | NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.594 | NA +ATGACAGAGACAGAATCAGCGATTCTGGCGCACGCCCGGCGATGTGCGCCAGCGGAGTCGTGCGGCTTCG +TGGTGAGAACGCCGGAAGGGGAAAGATATTTCCCCTGCGTGAATATCTCCGGTGAGCCGGAGGCGTATTT +CCGGATGTCGCCGGAGGACTGGCTGCGGGCAGAGATGCAGGGTGAGATTGTGGCGCTGGTCCACAGCCAC +CCCGGTGGTCTGCCCTGGCTGAGTGAGGCCGACCGGCGGCTGCAGGTGCAGAGTGATTTGCCGTGGTGGC +TGGTCTGCCGGGGGACGATTCATAAGTTCCGCTGTGTGCCGCATCTCACCGGGCGGCGCTTTGAGCACGG +GGTGACGGACTGTTACACGCTGTTCCGGGATGCTTATCATCTGGCGGGGATTGAGATGCCGGATTTTCAT +CGCGAGGATGACTGGTGGCGTCACGGTCAGAATCTCTATCTGGATAATCTGGAGGCCACAGGGTTGTATC +AGGTGCCGTTGTCATCAGCACAACCGGGCGATGTGCTGCTGTGCTGTTTTGGTTCATCGGTGCCGAATCA +TGCCGCCATTTACTGTGGTGATGGCGAGCTGCTGCACCATATTCCTGAACAACTGAGCAAACGAGAGAGG +TATACCGACAAATGGCAGCGACGCACACACTCCCTCTGGCGTCACCGGGCATGGCGCGCATCTGCCTTTA +CGGGGATTTACAACGATTTGGTCGCCGCATCGACCTTCGTGTGA +>test_runprokka_H299.0002i_00010 699 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.557 | NA +ATGCAGGATATCCGGCAGGAAACACTGAATGAATGCACCCGTGCGGAGCAGTCGGCCAGCGTGGTGCTCT +GGGAAATCGACCTGACAGAGGTCGGTGGAGAACGTTATTTTTTCTGTAATGAGCAGAACGAAAAAGGTGA +GCCGGTCACCTGGCAGGGGCGACAGTATCAGCCGTATCCCATTCAGGGGAGCGGTTTTGAACTGAATGGC +AAAGGCACCAGTACACGCCCCACGCTGACGGTTTCTAACCTGTACGGTATGGTCACCGGGATGGCGGAAG +ATATGCAGAGTCTGGTCGGCGGAACGGTGGTCCGGCGTAAGGTTTACGCCCGTTTTCTGGATGCGGTGAA +CTTCGTCAACGGAAACAGCGACGCCGATCCGGAGCAGGAGGTGATCAGCCGCTGGCGCATCGAGCAGTGC +AGCGAACTGAGCGCGGTCAGTGCCTCCTTTGTACTGTCCACGCCGACGGAAACGGATGGTGCCGTTTTTC +CGGGGCGCATCATGCTGGCTAATACCTGCACCTGGACCTATCGCGGTGATGAGTGCGGTTATCACGGTCC 
+GGCTGTCGCGGATGAATATGATCAGCCGACGTCCGATATCACGAAGGATAAATGCAGCAAATGCCTGAAT +GGCTGTAAGTTTCGCAATAACGTCGGCAACTTTGGCGGCTTCCTTTCCATTAACAAACTTTCGCAGTGA +>test_runprokka_H299.0002i_00011 330 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGAGG;rbs_spacer=5-10bp;gc_cont=0.567 | NA +ATGAAAACCTTCCGCTGGAAAGTGAAACCCGGTATGGATGTGGCTTCGGCCCCTTCTGTAAGAAAGGTGC +GCTTTGGTGATGGCTATTCCCAGCGAGCGCCTGCCGGGCTGAATGCCAACCTGAAAACGTACAGCGTGAC +GCTTTCTGTCCCCCGTTGGGAGGCCACGGTACTGGAGTCGTTTCTGGAAGAGCACGGGGGCTGGAAAGCC +TTTCTGTGGACGCCGCCTTATGAGTGGCGGCAGATAAAGGTGACCTGCGCAAAATGGTCGTCGCGGGTCA +GTATGCTGCGTGTTGAGTTCAGCGCAGAGTTTGAACAGGTGGTGAACTGA +>test_runprokka_H299.0002i_00012 2580 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.592 | NA +ATGGCTGAACCGGTAGGCGATCTGGTCGTTGATTTGAGTCTGGATGCGGCCAGATTTGACGAGCAGATGG +CCAGAGTCAGGCGTCATTTTTCCGGTACGGAAAGTGATGCGAAAAAAACAGCGGCAGTCGTTGAACAGTC +GATGAGCCGGCAGGCGCTGGCTGCACAGAAAGCGGGGATTTCCGTCGGGCAGTATAAAGCCGCCATGCGT +ATGCTGCCTGCGCAGTTCACCGACGTGGCCACGCAGCTTGCAGGCGGGCAGAGTCCGTGGCTGATCCTGC +TGCAACAGGGTGGTCAGGTGAAGGACTCCTTCGGCGGGATGATCCCCATGTTCAGGGGGCTTGCCGGTGC +GATCACCCTGCCGATGGTGGGGGCCACCTCGCTGGCGGTGGCGACCGGTGCGCTGGCGTATGCCTGGTAT +CAGGGTAACTCAACCCTGTCCGATTTCAACAAAACGCTGGTCCTTTCCGGCAATCAGGCGGGACTGACGG +CAGATCGTATGCTGGTCCTGTCCAGAGCCGGGCAGGCGGCAGGGCTGACGTTTAACCAGACCAGCGAGTC +ACTGACGGCGCTGGTGAATGCCGGTGTGCGTGGTGGTGAGCAGTTTGAGGCGATCAGCCAGAGTGTGGCG +CGTTTCTCCTCTGCATCCGGTGTGGAGGTGGACAAGGTCGCTGAAGCCTTCGGGAAGCTGACCACAGACC +CGACGTCGGGGTTGACGGCGATGGCACGCCAGTTCCATAACGTGACGGCGGAACAGATTGCGTATGTTGC +TCAGTTGCAGCGTTCCGGCGATGAAGCCGGGGCATTGCAGGCGGCGAACGAGGCCGCAACGAAAGGGTTT +GATGACCAGACCCGACGCCTGAAAGAGAACATGGGCACGCTGGAGACCTGGGCAGACAGGACAGCACGGG +CATTCAAATCCATGTGGGATTCGGTGCTGGATATTGGTCGCCCGGACACTGCCCAGGGAATGCTGGAGAA +AGCAGAAAAGGCTTTTGATGAGGCGGACAAAAAATGGCAGTGGTATCAGAGCCGGAGCCACCGGCGCGGT +AAAACCTCAGCATTTCTTGCCAATCTCCGGGGAGCATGGGAGGACAGAGCGAATGCGCAACTTGGGCTTT +CCGCCGCCACGTTGCAGGCCGATCTTGAAAAGGCCAGAGAGATGGCAGCAAAGGACTGGGCCGAGTCTGA 
+GGCATCACGGCTGAAATATACCGAAGAGGCGCAGAAGGCTTACGAACGCCTGCAGACGCCGCTGGAGAAA +TATACCGCCCGTCAGGAAGAACTGAACAAGGCACTGAAAGACGGGAAAATCCTGCAGGCAGATTACAACA +CGCTGATGGCGGCGGCGAAAAAGGATTATGAAGCGACGCTGAAAAAGCCGAAACAGTCCGGCGTGAAGGT +GTCTGCGGGCGATCGTCAGGAAGACAGTGCTCATGCTGCCCTGCTGACGCTTCAGGCAGAACTCCGGACG +CTGGAGAAGCATGCCGGAGCGAATGAGAAAATCAGCCAGCAGCGCCGGGATTTGTGGAAGGCAGAAAGTC +AGTTCGCGGTACTGGAGGAGGCGGCACAACGTCGCCAGCTGTCCGCACAGGAGAAATCCCTGCTGGCGCA +TAAAGATGAGACGCTGGAGTACAAACGCCAGCTGGCTGCACTTGGCGACAAGGTTACGTATCAGGAGCGC +CTGAACGCGCTGGCGCAGCAGGCGGATAAATTCGCACAGCAGCAACGGGCAAAACGGGCCGCCATTGATG +CGAAAAGCCGGGGGCTGACTGACCGGCAGGCAGAACGGGAAGCCACGGAACAGCGCCTGAAGGAACGGTA +TGGCGATAATCCGCTGGCGCTGAATAACGTCATGTCAGAGCAGAAAAAGACCTGGGCGGCTGAAGACCAG +CTTCGCGGGAGCTGGATGGCAGGCCTGAAGTCCGGCTGGAGTGAGTGGGAAGAGAGCGCCACGGACAGTA +TGTCGCAGGTAAAAAGTGCAGCCACGCAGACCTTTGATGGTATTGCACAGAATATGGCGGCGATGCTGAC +CGGCAGTGAGCAGAACTGGCGCAGCTTCACCCGTTCCGTGCTGTCCATGATGACAGAAATTCTGCTTAAG +CAGGCAATGGTGGGGATTGTCGGGAGTATCGGCAGCGCCATTGGCGGGGCTGTTGGTGGCGGCGCATCCG +CGTCAGGCGGTACAGCCATTCAGGCCGCTGCGGCGAAATTCCATTTTGCGACTGGGGGATTTACGGGAAC +CGGCGGCAAATATGAGCCAGCGGGGATTGTTCACCGTGGTGAGTTTGTCTTCACGAAGGAGGCAACCAGC +CGGATTGGCGTGGGGAATCTTTACCGGCTGATGCGCGGCTATGCCACCGGCGGTTATGTCGGTACACCGG +GCAGCATGGCAGACAGCCGGTCGCAGGCGTCCGGGACGTTTGAGCAGAATAACCATGTGGTGATTAACAA +CGACGGCACGAACGGGCAGATAGGGCCACAGGCGCTGAAGGCTGTTTATGACGTAGCCCGTAAGGCGGCA +ATGGATGTTGTGACCGGGCAGATGCGCGATGGTGGCCTGTTCTCCGGAGGTGGACGATGA +>test_runprokka_H299.0002i_00013 435 NA | NA | NA | ID=2_7;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.559 | NA +GTGTTCGACGGTGAGCTGAGTTTTGCCCTGAAACTGGCGCGTGAAATGGGGCGACCCGACTGGCGCGCCA +TGCTTGCCGGGATGTCATCCACGGAGTATGCCGACTGGCACCGCTTTTACAGTACCCATTATTTTCATGA +TGTTCTGCTGGATATGCACTTTTCCGGGCTGACGTACACCGTGCTCAGCCTGTTTTTCAGCGATCCGGAT +ATGCATCCGCTGGATTTCAGTCTGCTGAACCGGCGTGAGGCTGACGAAGAGCCTGAAGATGATGTGCTGA +TGCAGAAAGCGGCAGGGCTTGCCGGAGGCGTTCGTTTTGGCCCGGACGGGAATGAAGTTATCCCCGCTTC +CCCGGATGTGGCGGACATGACGGAGGATGACGTAATGCTGATGACAGTATCAGAAGGGATCGCAGGAGGA 
+GTCCGGTATGGCTGA +>test_runprokka_H299.0002i_00014 423 NA | NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA +ATGTTCCTGAAAACCGAATCATTTGAACATAACGGTGTGACCGTCACGCTTTCTGAACTGTCAGCCCTGC +AGCGTATTGAGCATCTTGCCTGGTTGAAAGAGCAGGAAAAAAAGGCTGAATCCAGTGGCAACCTGCAGGT +GTCTGTAGAGGATCTTATCAGAGGCGGGGCGTTTCTGGTGGCGATGTCTCTGTGGCATAACCATCCGCAG +AAGACAAAGCTGCCGTCCATGAATGAAGCCGTTAAACAGATTGAGCAGGAAGTGCTTACCACCTGGCCCA +CGGAGGCAATTGCTCAGGCTGAAAACGTGGTGTTACGTCTGTCCGGAATGTCTGAGTTTGTTGTGAATAA +TGCCCCTGAACAGGCAGATGATGCCGGGCCTGCAGAGCCTGTTTCTGCGGGAAAGTGTTCGACGGTGAGC +TGA +>test_runprokka_H299.0002i_00015 741 NA | NA | NA | ID=2_9;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.583 | NA +ATGCCTGTACCAAATCCTACAATGCCGGTGAAAGGTGCCGGGACCACCCTGTTGGTTTATAAGGGGAGCG +GTGACCCTTATGCGAACCCGCTTTCAGACGTTGACTGGTCGCGTCTGGCTAAAGTTAAAGACCTGACGCC +CGGCGAACTGACCGCTGAGTCCTATGACGACAGCTATCTCGATGATGAAGATGCGGACTGGGCTGCGACC +GGGCAGGGGCAGAAATCTGCCGGAGATACCAGCTTCACGCTGGCGTGGATGCCCGGAGAGCAGGGGCAGC +AGGCGCTGCTGGCGTGGTTTAATGAAGGGGATACCCGTGCCTATAAAATCCGCTTCCCGAACGGCACGGT +CGATGTGTTCCGCGGCTGGGTCAGCAGTATCGGTAAGGCGGTGACGGCGAAGGAAGTGATCACCCGCACG +GTGAAAGTCACCAACGTGGGACGTCCGTCGATGGCAGAAGATCGCAGCACGGTCACAGCGGCAACCGGCA +TGACCGTGACGCCTGCCAGCACTTCGGTGGTGAAAGGGCGGAGCACCACGCTGACCGTGGCATTCCAGCC +GGAAGGCGCAACCGACAAGAGCTTCCGTGCGGTGTCTGCGGATAAAACAAAAGCCACCGTGTCGGTCAGT +GGTATGACCATCACCGTGAAAGGTGTTGCTGCAGGCAAGGTCAACATTCCGGTCGTATCCGGTAATGGTG +AACTTGCTGCGGTTGCAGAAATCAACGTCACCAACAGCTAA +>test_runprokka_H299.0002b_00016 393 NA | NA | NA | ID=2_10;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.539 | NA +AAACATACTGAACTCCGTGCAGCCGTACTGGATGCACTGGAGAAGCATGACACCGGGGCGACGCTTTTTG +ATGGTCGCCCCGCTGTTTTTGATGAGGAAGATTTTCCGGCAATTGCCGTTTATCTCACCGGCGCTGAATA +CACGGGCGAAGAGCTGGACAGCGATACCTGGCAGGCAGAGCTGCATATTGAAGTTTTCCTGCCTGCTCAG +GTGCCGGATTCAGAGCTGGATTCGTGGATGGAGTCCCGGATTTATCCGGTGATGAGCGATATCCCGGCGC 
+TGTCAGATTTGATCACCAGTATGGTGGCCAGTGGCTATGACTACCGGCGCGACGATGATGCGGGCCTGTG +GAGTTCAGCCGATCTGACGTATGTCATTACCTATGAAATGTGA +>test_runprokka_H299.0003b_00017 870 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.303 | NA +ATCATACAGTCATTTGTTAATATCTGTCTGACAAGGTACCAAGCAGAAAATAGGGTTAAGATATTTGTAG +CCATAAATATCATATATACGTTAGCCTATTTTTTTGGGGTTTTATATTCCTTATTTATAGATCACTGGGA +TAATGTTTGGAAAAATATTATTTTGTTTTATGTGCTTACAACAATAACAATGTTTTTCTTCTATTTTATA +CGAAAAGGGAAGGTTGTTAAGCTATTTTTCTTTCATTATATCTCAAAAAATAAAGTTTACGAAACTTTTA +TTTTTGGCCTTTACCAGCTCCCTCATGTTTTAAGCTCTTGGGTAAGGCTTGGATATGATAGACTGGTATT +GGGGGAACTAATATCAATGAGCTATGTTGGCGGATATTCGGTTGCAGTTCAAATATCTCTTGTGTCTAGC +GTGATATTTCAATCATTAAATAGGTTTTGGACCCCTTTCTTTATTAAAAAATTAAAGGAGAATAGTAAAC +AAAAAAAAATTATTGTTCTTGGAGGTTTTGGAATTATCTGCATAACAATACTTAATATACTATTTGGTTA +CGCATATTTTATTTTTTTCTTGCCCACAAATTATTCATCATTCTCCAATGCTCTTCCTATATTATGTATG +GCATATATGTTTCAGGGGCTATATTTTTTGATTGTTAATTATATATATTATCATGATGGTAATAAATTGA +TATCAATTCCATCCGTTGCCTCGATCGCTATACATATAGCTGTTGCCCCAGTTTTGATAAAACATATGGG +ATATTATGGAGCTGCAATTTCCTTATTGATTAGTTGGATAGTTCTTTTTTTATTTACATGCGTCATTATA +TTTTATGTTAGAAGGGGGTATCGTGGGTAA +>test_runprokka_H299.0003i_00018 933 NA | NA | NA | ID=3_2;partial=00;start_type=GTG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.309 | NA +GTGGGTAATATATTTATTGTTGAGTCTCCGTTTCAGCTTTCAAATGCTTTACTTTATCATAAAAAAAATG +ATAGTGTTATTGTCAGGCTCAACGGAGAAAATAAAAATGATTTTCAAATTGAAAAAATGTTATCGTCGTT +TAATGGCAAGGTATATATAAAAAAAGCATCAAAAGAATCGAAATTCGATTTGATTAGATTTGTTTTATTT +TTTGCCGTCCCTGTATTGATTGCTAATTTAAATAAAAAAGTAATTATTGGGAATTATAATTCATTGTGGA +TGAGAGTCATGGGATATTTGTTTAACCCATTTCATTTTGCCGTCCTTGATGATGGGTTGATTACTATACG +AACAATAAAAAGGTTGGATGATAATATATCGCGTTCTGGATCAATTAAGAAACGGTTTTTATTACTGCTG +GCACCAAGATTTATAACGCAATATAAGATATATTCCAACTTTATTCAGATATACAACCAAGAGATCAATA +AGAGAAAAAGAACTACCCGAGCCATTAAGGCAGGGCGAGTTTGTTTTATTGGCTCTCCATTATTTGACAA +AAATGTTCTCACATTTGATTTCTATGTAAAGTGCTTGGCTGCGATAAGTGATAACCTTAAGCGTTGTGGA 
+TATAGCATTGAGTATTACCCTCATCGCTCAGAAAAAAACATCTCATATTTAAATGTTTTTTTTGACGATG +TAATAAAATCAGATGATAGCATTGAAGTCTATTATTCAGCCAGTAATGAGTTGCCAGAAATATTTGTATC +ATTTTATTCATCGGCCCTTTTAAATTTGAGAAGTGATTATCCAGAGTGTAAATTTATATCTTATAAGTTA +GATTGTAATGAAATCAATGGTAAGTTTAGGTATGAAATAATGGAGGCATATAACTTTTTGGCATTCTCTG +GTATTGAGGTTGTAACTATATAG +>test_runprokka_H299.0003b_00019 693 NA | NA | NA | ID=3_3;partial=01;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.289 | NA +ATGTTAACATATTCTGTCGTTAACTGGAAAGCAAAATTATTATATTTCATTCTTTTTCTGAGTTTCCTTA +ATGCTGTTTTGAGGTTATCAGAGGATGGATTGTCGATTTATCGATTATTTATCCCTTTGCAAATATTTTT +AATTTATACATTAAGTGTCACCGAGTTCAAAAAGTTTATCGTAATTCTACTACTTTTATTATTGTTTGGT +GCTACTGGATGTATGATATCCACTTATTCTCTTAATGAGAATAATCTTGTATTTCTAATACATTACTCTA +TACTTATACTCACTTTTTTCTCTTCTTCTGTGTTGATATCTATTACTGGTGAAACTTGTTTTTACAAATT +CACCGCGTTCTTTTTTGGTTTTTTAATTGTTACTGGTATTATGGATTTGTTTGGTGTTACATTTCCTAAT +ATAGAACATATACCAGACGCTATACGAGGAATACATAGAATAGAGAATGATTATTCACTTGCGCTGGTTT +CGTTTGTTTTTGTTGTGTTTTCCATCTCTAGGAAAAAAATAACTGCTTCAATCCTTACTTTTTTTACGTC +TGCGATTTGTTTTTATAATGACTCTAAAGTTGCATTACTTTTTGTCGTTGCTGGTTATTTTTGTTTTATA +TTTAAAAATATAAGGTTTAGACAAAAGGAATTCAGGTGGATATTATTTCTTTTTGTCATAATG diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test.0417.00002.lst b/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test.0417.00002.lst new file mode 100644 index 0000000000000000000000000000000000000000..c86fc36b9a0232778fb2b38b18cd18414c7da3f7 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test.0417.00002.lst @@ -0,0 +1,99 @@ + 287 787 D CDS test.0417.00002.0001b_00001 NA | NA | NA | ID=1_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.447 | NA + 846 2384 D CDS test.0417.00002.0001i_00002 NA | NA | NA | ID=1_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.511 | NA + 2404 3741 D CDS test.0417.00002.0001i_00003 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.594 
| NA + 3738 4403 D CDS test.0417.00002.0001i_00004 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.590 | NA + 4416 6068 D CDS test.0417.00002.0001i_00005 NA | NA | NA | ID=1_5;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.614 | NA + 6126 6617 D CDS test.0417.00002.0001i_00006 NA | NA | NA | ID=1_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.514 | NA + 6808 9444 D CDS test.0417.00002.0001i_00007 NA | NA | NA | ID=1_7;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.603 | NA + 9456 9602 D CDS test.0417.00002.0001b_00008 NA | NA | NA | ID=1_8;partial=01;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA + 2 1237 D CDS test.0417.00002.0002b_00009 NA | NA | NA | ID=2_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.468 | NA + 1279 2346 D CDS test.0417.00002.0002i_00010 NA | NA | NA | ID=2_2;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.547 | NA + 2419 2799 D CDS test.0417.00002.0002i_00011 NA | NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.357 | NA + 3130 3393 D CDS test.0417.00002.0002i_00012 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA + 3399 4538 D CDS test.0417.00002.0002i_00013 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.359 | NA + 4535 7888 D CDS test.0417.00002.0002i_00014 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.592 | NA + 7854 9491 D CDS test.0417.00002.0002i_00015 NA | NA | NA | ID=2_7;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.620 | NA + 9525 11285 D CDS test.0417.00002.0002i_00016 NA | NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.580 | NA + 11249 12328 D CDS test.0417.00002.0002i_00017 NA | NA | NA | 
ID=2_9;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=11-12bp;gc_cont=0.591 | NA + 12309 12845 D CDS test.0417.00002.0002i_00018 NA | NA | NA | ID=2_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.508 | NA + 12849 13277 D CDS test.0417.00002.0002i_00019 NA | NA | NA | ID=2_11;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.534 | NA + 13277 14653 D CDS test.0417.00002.0002i_00020 NA | NA | NA | ID=2_12;partial=00;start_type=ATG;rbs_motif=AGGAG/GGAGG;rbs_spacer=11-12bp;gc_cont=0.548 | NA + 14955 15902 C CDS test.0417.00002.0002i_00021 NA | NA | NA | ID=2_13;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.444 | NA + 15974 16570 C CDS test.0417.00002.0002i_00022 NA | NA | NA | ID=2_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA + 16573 17748 C CDS test.0417.00002.0002i_00023 NA | NA | NA | ID=2_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.378 | NA + 17748 19328 C CDS test.0417.00002.0002i_00024 NA | NA | NA | ID=2_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.441 | NA + 19360 20184 C CDS test.0417.00002.0002i_00025 NA | NA | NA | ID=2_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.336 | NA + 20442 21695 C CDS test.0417.00002.0002i_00026 NA | NA | NA | ID=2_18;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA + 21927 22445 D CDS test.0417.00002.0002b_00027 NA | NA | NA | ID=2_19;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.526 | NA + 3 812 D CDS test.0417.00002.0003b_00028 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.520 | NA + 874 2700 C CDS test.0417.00002.0003i_00029 NA | NA | NA | ID=3_2;partial=00;start_type=ATG;rbs_motif=AGGAGG;rbs_spacer=3-4bp;gc_cont=0.549 | NA + 2700 6242 C CDS test.0417.00002.0003i_00030 NA | NA | NA | 
ID=3_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.544 | NA + 6235 9123 C CDS test.0417.00002.0003i_00031 NA | NA | NA | ID=3_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.510 | NA + 9299 12667 C CDS test.0417.00002.0003i_00032 NA | NA | NA | ID=3_5;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.535 | NA + 12680 13003 C CDS test.0417.00002.0003i_00033 NA | NA | NA | ID=3_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.543 | NA + 12988 13395 C CDS test.0417.00002.0003i_00034 NA | NA | NA | ID=3_7;partial=00;start_type=GTG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.527 | NA + 13392 13955 C CDS test.0417.00002.0003i_00035 NA | NA | NA | ID=3_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.532 | NA + 13946 14449 C CDS test.0417.00002.0003i_00036 NA | NA | NA | ID=3_9;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.544 | NA + 14634 15428 C CDS test.0417.00002.0003i_00037 NA | NA | NA | ID=3_10;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.516 | NA + 15435 16310 C CDS test.0417.00002.0003i_00038 NA | NA | NA | ID=3_11;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.525 | NA + 16461 18707 C CDS test.0417.00002.0003i_00039 NA | NA | NA | ID=3_12;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.536 | NA + 18720 19250 C CDS test.0417.00002.0003i_00040 NA | NA | NA | ID=3_13;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.493 | NA + 19695 19856 D CDS test.0417.00002.0003i_00041 NA | NA | NA | ID=3_14;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.395 | NA + 19935 20624 D CDS test.0417.00002.0003i_00042 NA | NA | NA | ID=3_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA + 20693 21406 D CDS test.0417.00002.0003i_00043 NA | NA | NA | 
ID=3_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.503 | NA + 21544 21762 D CDS test.0417.00002.0003i_00044 NA | NA | NA | ID=3_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.434 | NA + 21870 22910 D CDS test.0417.00002.0003i_00045 NA | NA | NA | ID=3_18;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.544 | NA + 22942 24135 C CDS test.0417.00002.0003i_00046 NA | NA | NA | ID=3_19;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.553 | NA + 24128 26287 C CDS test.0417.00002.0003i_00047 NA | NA | NA | ID=3_20;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.522 | NA + 26873 27904 D CDS test.0417.00002.0003i_00048 NA | NA | NA | ID=3_21;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA + 27911 29173 C CDS test.0417.00002.0003i_00049 NA | NA | NA | ID=3_22;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA + 29295 30230 D CDS test.0417.00002.0003i_00050 NA | NA | NA | ID=3_23;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.533 | NA + 30217 30909 C CDS test.0417.00002.0003i_00051 NA | NA | NA | ID=3_24;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.506 | NA + 31038 32456 C CDS test.0417.00002.0003i_00052 NA | NA | NA | ID=3_25;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.517 | NA + 32771 33532 C CDS test.0417.00002.0003i_00053 NA | NA | NA | ID=3_26;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.521 | NA + 33562 34398 C CDS test.0417.00002.0003i_00054 NA | NA | NA | ID=3_27;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.495 | NA + 34685 35866 C CDS test.0417.00002.0003i_00055 NA | NA | NA | ID=3_28;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA + 36121 37350 D CDS test.0417.00002.0003i_00056 NA | NA | 
NA | ID=3_29;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.445 | NA + 37507 37758 C CDS test.0417.00002.0003i_00057 NA | NA | NA | ID=3_30;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.409 | NA + 37818 38168 C CDS test.0417.00002.0003i_00058 NA | NA | NA | ID=3_31;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA + 38987 41284 D CDS test.0417.00002.0003i_00059 NA | NA | NA | ID=3_32;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA + 41295 42173 D CDS test.0417.00002.0003i_00060 NA | NA | NA | ID=3_33;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA + 42170 42649 D CDS test.0417.00002.0003i_00061 NA | NA | NA | ID=3_34;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.512 | NA + 42689 44467 C CDS test.0417.00002.0003i_00062 NA | NA | NA | ID=3_35;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.459 | NA + 44946 46133 D CDS test.0417.00002.0003i_00063 NA | NA | NA | ID=3_36;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA + 46191 47387 D CDS test.0417.00002.0003i_00064 NA | NA | NA | ID=3_37;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.531 | NA + 47445 48656 D CDS test.0417.00002.0003i_00065 NA | NA | NA | ID=3_38;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.507 | NA + 48709 50094 D CDS test.0417.00002.0003i_00066 NA | NA | NA | ID=3_39;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.524 | NA + 50142 51011 D CDS test.0417.00002.0003b_00067 NA | NA | NA | ID=3_40;partial=01;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA + 103 1728 C CDS test.0417.00002.0004b_00068 NA | NA | NA | ID=4_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.523 | NA + 1776 2255 C CDS test.0417.00002.0004i_00069 NA | NA | NA | 
ID=4_2;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.504 | NA + 2650 3228 D CDS test.0417.00002.0004i_00070 NA | NA | NA | ID=4_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.430 | NA + 3550 6648 D CDS test.0417.00002.0004i_00071 NA | NA | NA | ID=4_4;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.526 | NA + 6651 7979 D CDS test.0417.00002.0004i_00072 NA | NA | NA | ID=4_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA + 8030 8809 D CDS test.0417.00002.0004i_00073 NA | NA | NA | ID=4_6;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.538 | NA + 8806 11676 D CDS test.0417.00002.0004i_00074 NA | NA | NA | ID=4_7;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.527 | NA + 11841 13241 D CDS test.0417.00002.0004i_00075 NA | NA | NA | ID=4_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.490 | NA + 13259 14575 D CDS test.0417.00002.0004i_00076 NA | NA | NA | ID=4_9;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.483 | NA + 14611 15978 D CDS test.0417.00002.0004i_00077 NA | NA | NA | ID=4_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA + 16014 16502 C CDS test.0417.00002.0004i_00078 NA | NA | NA | ID=4_11;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.554 | NA + 16502 18421 C CDS test.0417.00002.0004i_00079 NA | NA | NA | ID=4_12;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.528 | NA + 18857 20305 D CDS test.0417.00002.0004i_00080 NA | NA | NA | ID=4_13;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.500 | NA + 20307 20432 D CDS test.0417.00002.0004i_00081 NA | NA | NA | ID=4_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.357 | NA + 20555 21103 D CDS test.0417.00002.0004i_00082 NA | NA | NA | 
ID=4_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA + 21146 22663 C CDS test.0417.00002.0004i_00083 NA | NA | NA | ID=4_16;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA + 22673 23554 C CDS test.0417.00002.0004i_00084 NA | NA | NA | ID=4_17;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.533 | NA + 23862 25595 C CDS test.0417.00002.0004i_00085 NA | NA | NA | ID=4_18;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.565 | NA + 25601 26311 C CDS test.0417.00002.0004i_00086 NA | NA | NA | ID=4_19;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.482 | NA + 26336 27232 C CDS test.0417.00002.0004i_00087 NA | NA | NA | ID=4_20;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.530 | NA + 27344 27865 D CDS test.0417.00002.0004i_00088 NA | NA | NA | ID=4_21;partial=00;start_type=ATG;rbs_motif=AGxAG;rbs_spacer=5-10bp;gc_cont=0.517 | NA + 27905 28312 C CDS test.0417.00002.0004i_00089 NA | NA | NA | ID=4_22;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA + 28293 28559 C CDS test.0417.00002.0004i_00090 NA | NA | NA | ID=4_23;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.491 | NA + 28802 29782 D CDS test.0417.00002.0004i_00091 NA | NA | NA | ID=4_24;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.539 | NA + 29859 30518 C CDS test.0417.00002.0004i_00092 NA | NA | NA | ID=4_25;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.518 | NA + 30682 30993 C CDS test.0417.00002.0004i_00093 NA | NA | NA | ID=4_26;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.455 | NA + 31038 31457 D CDS test.0417.00002.0004b_00094 NA | NA | NA | ID=4_27;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.500 | NA + 2 1012 D CDS test.0417.00002.0005b_00095 NA | NA | NA | 
ID=5_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.515 | NA + 1178 4051 C CDS test.0417.00002.0005i_00096 NA | NA | NA | ID=5_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.554 | NA + 4169 4558 C CDS test.0417.00002.0005i_00097 NA | NA | NA | ID=5_3;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA + 4582 5745 C CDS test.0417.00002.0005i_00098 NA | NA | NA | ID=5_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.536 | NA + 5852 6007 C CDS test.0417.00002.0005b_00099 NA | NA | NA | ID=5_5;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.231 | NA diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test_runprokka_H299.lst b/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test_runprokka_H299.lst new file mode 100644 index 0000000000000000000000000000000000000000..0871ac277d23026f24e617ff4c91316af1dadb54 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/LSTINFO/test_runprokka_H299.lst @@ -0,0 +1,19 @@ + 3 140 C CDS test_runprokka_H299.0001b_00001 NA | NA | NA | ID=1_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.580 | NA + 201 743 C CDS test_runprokka_H299.0001i_00002 NA | NA | NA | ID=1_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.562 | NA + 740 1339 C CDS test_runprokka_H299.0001i_00003 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.593 | NA + 1489 2187 C CDS test_runprokka_H299.0001i_00004 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.558 | NA + 2187 2483 C CDS test_runprokka_H299.0001i_00005 NA | NA | NA | ID=1_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.404 | NA + 2518 3480 C CDS test_runprokka_H299.0001b_00006 NA | NA | NA | ID=1_6;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.442 | NA + 3 140 C 
CDS test_runprokka_H299.0002b_00007 NA | NA | NA | ID=2_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.572 | NA + 201 743 C CDS test_runprokka_H299.0002i_00008 NA | NA | NA | ID=2_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.547 | NA + 740 1483 C CDS test_runprokka_H299.0002i_00009 NA | NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.594 | NA + 1489 2187 C CDS test_runprokka_H299.0002i_00010 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.557 | NA + 2187 2516 C CDS test_runprokka_H299.0002i_00011 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGAGG;rbs_spacer=5-10bp;gc_cont=0.567 | NA + 2513 5092 C CDS test_runprokka_H299.0002i_00012 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.592 | NA + 5085 5519 C CDS test_runprokka_H299.0002i_00013 NA | NA | NA | ID=2_7;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.559 | NA + 5501 5923 C CDS test_runprokka_H299.0002i_00014 NA | NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA + 5939 6679 C CDS test_runprokka_H299.0002i_00015 NA | NA | NA | ID=2_9;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.583 | NA + 6687 7079 C CDS test_runprokka_H299.0002b_00016 NA | NA | NA | ID=2_10;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.539 | NA + 1 870 D CDS test_runprokka_H299.0003b_00017 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.303 | NA + 863 1795 D CDS test_runprokka_H299.0003i_00018 NA | NA | NA | ID=3_2;partial=00;start_type=GTG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.309 | NA + 1890 2582 D CDS test_runprokka_H299.0003b_00019 NA | NA | NA | ID=3_3;partial=01;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.289 | NA diff --git 
a/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test.0417.00002.prt b/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test.0417.00002.prt new file mode 100644 index 0000000000000000000000000000000000000000..840ff893a0a9e3c5bd411c96e2c57ba84e1c55f8 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test.0417.00002.prt @@ -0,0 +1,753 @@ +>test.0417.00002.0001b_00001 501 NA | NA | NA | ID=1_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.447 | NA +MADSFQNEVPAARVNIKLDLHTGNAKKKVELPLKLLAVGDYSNGKEQRPLSERDKVDINK +NNFNSVMAEFSPAVNLTVEDTLNGNGNEQNIALEFKSLKDFEPEQVAKNIPQLRVLLAMR +NLLRDLKSNLLDNATFRRELENILKDPTLSSELRDELAKIAPQENV* +>test.0417.00002.0001i_00002 1539 NA | NA | NA | ID=1_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.511 | NA +MSVQQEHATSETATLTTTESGGVYQSLFDKINLTPVSSIQEIDLWQNSETLADASPDERV +TAAIHVLLSCLAKSGEDVVKLDKSLLDFHIDDLDQKISKQLDAVMHHPEFQKVESLWRGT +WFVVQRTDFRKNVRIELLDISKEHLRQDFDDSPEIIQSGLYRHTYIQEYDTPGGEPVASL +ISSYEFDNSPQDIALLRNISRVSAASHMPFIGSVGPKFFLKNSMEEVAAIKDIGNYFDRA +EYIKWKSFRDTDDSRYVGLVMPRVLGRLPYGPDTVPVRSFNYVEEVKGPDHEKYLWTNAS +FAFAANMVKSFVNNGWCVQIRGPQAGGAVADLPIHLYDLGTGNQVKIPSEVMIPETREFE +FANLGFIPLSYYKNRDYACFFSANSAQKPALYDTADATANSRINARLPYIFLLSRIAHYL +KIIQRENIGTTKDRRVLELELNTWIRTLVTEMTDPGDELQASHPLRDGKVIVEDIEDNPG +FFRVRLFAVPHFQIEGMDINLSLVSQMPKAKA* +>test.0417.00002.0001i_00003 1338 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.594 | NA +MKICRPLWAEGTFLSSQQFQQQARWEAFSNDCIAQLCIRHPWGIANVLFDRDALTPGKLK +TQAVRLRFADGTLIDSDVSDVLPLACDLRALKNDSAIVLLALPLAHGNGGNLGQGEQTER +PLRYRQEWQKVQDIYGSDSEDMAVERHALSLRFAHDNNQDYITCPLARLVRDVQGNWTQD +ESYIPPLLAFNAHDGLVQRLDTLLLQLRAKCQRLMAMRRESNQRMADFAVADVSLFWLLN +ALNSAEPVLSDFLRYPAVHPELVWRELARLAGALLTFSLEHNVSAVPPYVHESPSTVFPP +LFSLLSELLEASLPSRVIALDLASLPGNRWKADLHDPRLREEADFYLSVRSSLPAHQVLH +QLPLVCKIGAPDDVTLLINVALNGVQLVPLTSVPAALPLRLENQYFALDMHSDAAKSMLE +SGSCMIYAPGTMGDLKPELFAVLRT* 
+>test.0417.00002.0001i_00004 666 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.590 | NA +MKKDMDINIDALLLDTFLTVVELRQGTTVRHGIELYRHCQRQVELVRERLKDAGFSRENV +EHITYAQCALLDETVLSRSGMDDGQAIWMKNPLQSHFFNTLQAGELLYERMKQVLQEPAP +AQAVLTCFHRVLLLGFRGRYQDPAAPERDQLISTLNGQVAPFGVLPETAVLNVPLSTRQH +PLLHSPFFWLVTLALLLAGVWWGLHHWLNVLVDELLPQSLR* +>test.0417.00002.0001i_00005 1653 NA | NA | NA | ID=1_5;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.614 | NA +MRNTLKQAIVLWGMVLLLVLWSVFISPSGVLRWAGAAAIVLAVAALLIYRRRQAWTEMTG +DAGLSSLPPETYRQPVVLVCGGLSAHLFTDSPVRQVSEGLYLHVPDEEQLVAQVERLLTL +RPAWASQLAVAYTVMPGIHRDVAVLAGRLRRFAHSMATVRRRAGVNVPWLLWSGLSGSPL +PERASSPWFICTGGEVQVATSTETTMPAQWIAQSGVQERSQRLCYLLKAESLMQWLNLNV +LTALNGPEAKCPPLAMAVGLVTSLPAVDNNLWQVWITARTGLTTDIADTGTDATLPFPDA +LLRQLPRQSDFTPLRRACVTMLGITTAAGITMLCLSATANRQLLRQVGDDLHRFYAVPVE +EFITKARHLSVLKDNATMLDGYYREGEPLRLGLGLYPGERIRQPVLRAIRDWRPPEQKME +VTASLQVQTVRLDSMSLFDVGQARLKDGSTKVLVDALVNIRAKPGWLILVAGYTDATGDE +KSNQQLSLRRAEAVRNWMLQTSDIPATCFAVQGLGESQPAATNDTPQGRAVNRRVEISLV +PRSDACQDVK* +>test.0417.00002.0001i_00006 492 NA | NA | NA | ID=1_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.514 | NA +MAIPAYLWLKDDGGADIKGSVDVQGREGSIEVVALDHDVYIPTDNNTGKLTGTRTHKPFT +FTKEIDASSPYLYKAVTTGQTLKTAEFKFYRINDAGQEVEYFNITLDNVKLVRVAPLMHD +IKDPSREKHNHLERIEFRYEKITWTYKDGNIIHSDSWNERPSA* +>test.0417.00002.0001i_00007 2637 NA | NA | NA | ID=1_7;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.603 | NA +MTGNHSAALLRRLNPYCARALDAAASLCQTRAHAEITIEHWLLKLLEQGEGDITVIARRY +EWDIDTLWQSLLAHLDTLPRPVRERPQLSEPLAALIRQAWLIASLEGDDPQIRSQHLLMA +LTEKPMLPACNDLWVLLSLSRVQLERLRPLLDAQSDECPARQPQVTEPLTSALPETATAD +APAKTLTEKQDDALLAVLNRFTEDVTEKARSGRIDPVFGRDTEIRQMVDILSRRRKNNPI +LVGEPGVGKTALVEGLALRITEGNVPDSLKTVHIRTLDLGLLQAGAGVKGEFEQRLKNVI +DAVQKSPEPVLLFIDEAHTIIGAGNQAGGADAANLLKPALARGELRTIAATTWSEYKQYF +ERDAALERRFQMVKVDEPDDDTACLMLRGLKARYAQHHGVHMLDSAIQTAVRLSRRYLTG 
+RQLPDKAVDLLDTAGARVRMSLDTLPEPLTQLHARLAALDIEREAIEQDSVFYPEASPER +LAELTDLRDELQAEAGHLEAQYQQEKALAQQIMTLRQEGTDSSELQQQLRTHQGFAPLLA +LDVDARAVATVVADWTGIPLSSLLKDEQSDLLSMEQSLENRVVGQSPALCAIAQRLRAAK +TGLTPENGPQGVFLLTGPSGTGKTETALTLADTLFGGEKSLITINLSEYQEPHTVSQLKG +SPPGYVGYGQGGVLTEAVRKRPYSVVLLDEVEKAHRDVMNLFYQVFDRGFMRDGEGREID +FRNTVILMTANLGSDHIMQLLEEKPDATDADLHELLYPLLRDHFQPALMARFQTVIYRPL +GQEAMRAIVEMKLAQVARRLHQHYGLETEISNSLYDALTAACLLPDTGARNIDSLLNQQI +LPVLSQQLLAQQAVHHKPARLRLDWDDEDGIVLEFDEK* +>test.0417.00002.0001b_00008 147 NA | NA | NA | ID=1_8;partial=01;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +MNVQFFDHAHHKLKIRGLKSPVDVLTFTGREQLSAPFRYDIEFTSTDKT +>test.0417.00002.0002b_00009 1236 NA | NA | NA | ID=2_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.468 | NA +DLIANCKKIKEGNDKNEDTTWAWVAMILTLVGLIPVAGSLIKGIFKVLFNSIRKAALSSR +DIVRAIDASVSLFNKFIDLPAVQATMKWMKIYNPYTYAEKQVRELMAQLNVSVLLSKLDE +LMDVTGSLLEKAKSWGPESIRQPIEVIWELLVSIRSQANTMLAKALAPLNDVLEKLAARL +HREGDDYYKAHTGANPHRPSRLKDAEEVELLATKKPDWADIGGKEKYPQLEKASAEQKRL +MDPENKEGGYPNIPDDKVQTFHQMAPVEFKEGEKLYRVLDPGSSDNSFCWMREAEFKALK +SKSQWRRRFAVWKSWNENGEYVVYTVPPGTTMKVWEGPAASQVREVTGKNGENIKVVLEG +GSLQIVIDPTVLNLDYLGKRQSTGWGYRDFSDEVDMYIGVPQLQTNIYVPK* +>test.0417.00002.0002i_00010 1068 NA | NA | NA | ID=2_2;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.547 | NA +MAILHPQECWLLERIMSPEYYRRRFEGWQAFVELCERQVAEWSKTIPLDVRRRPLYEQID +AVWGGRVLPNIRSTLKSVQYDFIQLQQGDLRVLQSGGNISSDMKGLIDYPPDWMSPAAQK +QYDRLKWRGAHYNNLIRRTSGGYWYDGELTYYYEESLHGPLALPMQLPLYELDSSVYLRE +DDPVTVAGLYLPDIPDASAQLLYRSEHIPEAWQGRVRTKYVNEAGIQEYYWESGAWAKCN +WKRIRRVANRFINVPPEGFFPQGMPEELYNWPQREAQYVTDRQRIAAYSGEACPHSGEWS +IFVEGRQATETLEQGEQMPEWTDRKMEGEYKRGEKFHVLWSLMNRHDGGSVWVEA* +>test.0417.00002.0002i_00011 381 NA | NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.357 | NA +MRISLASLFFLCCTVSDSVYADTDQTYDIFWGMLVKDKKDTIFVRCDSPLLKMKIVRMAD +ANTENIDKAYQIFNQKTKKSIYFAFIGNVTDAGSGKYIFNMLDVMETREGYCNLSDVLNA +IDEQFR* 
+>test.0417.00002.0002i_00012 264 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA +MKGIVVLGDKTTHGGQVISVSSSMVINGKKVALVGDKINCPVKGHGINTIIEGSFDWISD +GKQVVVNGCRCECGCVVISSIADALIG* +>test.0417.00002.0002i_00013 1140 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.359 | NA +MGWKRTYTEEIDRPQDIYFHKWLFSLFILCILLLVIYYFFHEFVVANNASLLAFFSPLLL +WVLILSVQVIFYSRAIQDYSIWLENRLSINREWEAWGSRYVSVMNSSLHLPGKVDVLFLS +GDELETQYGLVNKSDDITWKQHDWYACFQTLTNHLELYKLPYQLTQEFIILTDFDESMYS +QIEEDFFRTVEKTNRTEGHFLLHISPSMSFGELDLWLKDSEEKIYIVMVLQMEEQTSCSD +AMACLMFATDDVTAKYKLTEKARIYRPMVVNSNNFNSDLNIFIDTQKISKNAAGLVGDSQ +RLFSVSSNVLQCFNDNNAQLKIDNIHLLESLCGLPGGNAVWLTAALTISVVVHKNSDYLM +MSENNDDWIITTIHPMEHS* +>test.0417.00002.0002i_00014 3354 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.592 | NA +MKRINKKSVFISNVLLFLVIVAFVGGIIWRFGDHFGLKGDENNFFAWLICIMTLIFVRAS +WYFSRLYRLRKEQHHSEKERLRPEKEARIEYGKVITLNIELAEYLCALYGPFWRRKVRLL +LVTGEPEQAEAIAPGLTGQHWLEGDHKVLIYGGRPSAEPDVALLTALKKLRRSRPLDGII +WPLTEEQSRQTAQLDKGWRELINGGKRLGFQAPLYLWQVCDNGDYQTGRPLQSVGCLLPE +RCTPEQLAAMLEAQTLPLTEQGMSQLLADNRHDFLLRLAHTLAERGIAHWQSVLKPLLAG +GAFSSLRLRGLMFSPPLAAVPEAAPHAWLPSPVWAGVTGDNARGRAVGFPWLRAALITSI +CMLAIWGAGMTTSFFANRALVQETGIQTARALDTRLPLAEQLVALHTLQGELERLQYRIR +EGAPWYQRFGLERNQQLLAAAFPGYAQAANRLVRDVAVDHLQQQLNAFVALPPNSPQRTA +TGEQRYKQLKALLMTSRPEKADAAFFSTTLMADGLRYENIPEGVRQSVLPSLLTFWMANL +PEHPQWKTAPPPELTGAVRKILLRQIGVRNAENTLYQNVLQQVSRNYADMTLADMTGDTL +TESLFSTEQTVPGMFTRQAWEGQVREAIEQVVTARREEIDWVLSDRQQDTSADISPDTLR +NRLTSRYFTDFAGSWLAFLNSIRWKKEDSLSGILDQLTLMADARQSPLIALTDTLAWQAA +AGRENRGLSDSLAKSAQELFNGKEKTPQQSREGNEPVGPLDKTFAPLLRLLGDKAGGGDS +QLSLQTYLTRVTRVRLKLQQVTNAPDPQEMTQQLAQTVLQGKTVDLTDTRDYGRLIAASL +GEEWSGFGQALFVRPVEQSWRQVLTPAADSLNRQWHRAIVSHWNQDFAGRYPFKASQNDA +SLPLLAQYLRDDGRINQFIAANLSGVLKREGRYWVADAMNTQGLTVNPDFIRALNRLRDV +ADTAFASGDAGIHFELRAKPARDVMKTHLVIDGQELEYFNQKERWQRFNWPDEQWQPGAS 
+LSWTSTQAMERILADYRGSWSLIRLLEQAQVTPVDSSTFKVVWKAQDGLPLNYLLRVEQG +KGPLALLELKNFRLPGQVFLTGRSMKDAEEYGEDADE* +>test.0417.00002.0002i_00015 1638 NA | NA | NA | ID=2_7;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.620 | NA +MRKNTGKTPMSELLQKLTRSCFADRDALDVARTQAALWQTWLLPVTADTPVGEDPGYHDD +FLRIRDEMNKLSGADTDLICQLAESLLLTQAKDVRIATYYIWARLHRDGERGLAEGLALL +TGLVERFGTQLLPSRPASRKMALEWLAGEKMLDSLARYPEVAKEDFANIVAALNQLTVSF +AAWPEDQHSPSLMPLINALESRLAQSGGMNAVVPQNSSSVPAPSSPVDAPQVQTITSGRD +LLDQAKVLARYLNEQPQGWLSAHRLMKTLRWDTVHELPPDVDGKTRLAPPRTESRNQLKR +LYAQQNWTELLEQADLMFSTGVSHFWLDIQWYLHQALAKAGAPWDRWTAVIRQDLTLLLE +RLPGLENLAWNDGTPFADEVTRNWIAQQVMMREDGAWLAGKAAVPTDDATNDVLALEPEA +LAMADSQGVEAALGWIQTRPGITTARQRLLLRLLMARVAEQYGKNEMALLLLEELDTAAQ +GITLTQWEPELLFEVKARQLKLLRLRAHRHADKAALARKMDALLGSLVAIDPARTAVLCD +TQHKD* +>test.0417.00002.0002i_00016 1761 NA | NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.580 | NA +MDDLTQRYFEAEMRYLREAGKEFAQAYPDRAAMLNLDKPGARDPYVERLFEGFAFLMGRL +REKLDDDLPELTEGLVSLLWPHYLRTIPSLSVVELSTDHRQMKQSETLSDFQVLSRPVGE +RRTRCFYSATRDITLHPLALPDVSLQYEPDGRSVIRLRFECGPLVGDWSQIDLSRLPLYL +NADSPVACALHRALTLGTQQFWLRLPGQDRRMLGAHFSPMGFEDDDRLWPKGESAFSGYQ +LLLEYFTFREKFMFVALNGLEQVAWPEGITGFEIDVVLNENWPHDLPFDSDNIRLHCVPV +INLFPLEADPLHLSPLENEFLLRPMRIQDGHTEIYSVDNIISSRHTGSQAYVPFSSFRHR +GGMLRHDAPERYYHTRVKRGPSGLHDTWLILGGDAFDSDRMLEDETLSLSLTGTNGQLPR +KALQSTLLDTPVHASQNVLRVRNLCAPTQPCYPPARDRFHWRVLSHLGSNFLSMMDNAEI +LRGTLALYDWTESEMNRRRLEAIVDVQHSLIQRFERGFLLRGVDIQVTLDSNGFAGEGDI +TLFGELLHRFFALYADIHLFTQLTLILQPTGKCLQWTEHHSQRVPG* +>test.0417.00002.0002i_00017 1080 NA | NA | NA | ID=2_9;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=11-12bp;gc_cont=0.591 | NA +MDRASQPARTGLTDRLAPDIARINFYRFCQLLEQSQQKAPLGSTDNPAADAVRFRPHPGM +GFPVSELKNVERDVDNPDAPPTVRTTFLGLYGVDSPLPTAYLDYITQRHDGHDAVMAFLD +IFNHRFITQYYRIWRKYNYPASFEAGAVDDISRCLLGLIGLGIPGSENHIATPVSRFLAL +LSVMRLPTRTAEGVTALVGLLAPLTKATVVPHDPQPVILPAPAGLSKNSRISLKTRTLLG +RTGTDVNSQLLLKLYTEDAAEARGWLPGGQLHSDLLVLLRVYLGWRCQARLQLTLPVSLL 
+PAARLGKQRVQISRTGILLASFAAPATGTVTVSLGRYQGLIPAFSIRNRESMTHVSYSF* +>test.0417.00002.0002i_00018 537 NA | NA | NA | ID=2_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.508 | NA +MFPIRFKRPALLCMAMLTVVLSGCGLIQKVVDESKSVASAVFYKQIKILHLDFFSRSALN +TDAEDTPLSTMVHVWQLKTREDFDKADYDTLFMQEEKTLEKDVLAKHTVWVKPEGTASLN +VPLDKETQFVAIIGQFYHPDEKSDSWRLVIKRDELEADKPRSIELMRSDLRLLPLKDK* +>test.0417.00002.0002i_00019 429 NA | NA | NA | ID=2_11;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.534 | NA +MSTPSLYEMLTFSFSGELPLEQISERDQLILSVMDNMQRIINCRAGTLAHLPDYGLPDLS +LIHQGMAAGIHGLMRQIEETLLRYEPRLSQIQVELLPQPRPGHLNYLIHAQLPDTGWIRF +DGVFSPEGRIVLRHLKQQERAY* +>test.0417.00002.0002i_00020 1377 NA | NA | NA | ID=2_12;partial=00;start_type=ATG;rbs_motif=AGGAG/GGAGG;rbs_spacer=11-12bp;gc_cont=0.548 | NA +MASNANFISQFVMGGDPCTYKESGELQAEMSKLTHPARPDVDWRQVEKLCLALFRQNGVE +LQTLVCYVLAITRRQGLAGMADGLGSLDILLQRWADFWPVQVHSRISLLSWVTEKMQQAL +RTLDIQYQDLPQIYRCVQHLSAIETTLQQCELWHMTKLDLLAGQFRNTALRLERLAPQGA +ETTITPPELPRREMNQPKKSEESPQPVFATRSVQQNDKDASPPVPSPEISRQRTWPIFMA +GMVVMAGLGGTGLWGWSQLNQPDALIQRIQLSVMPLPQSLESGELAKLDVKDKALLAQDR +TIAASQMQLEQLNKLPARWPLEQGYRQLRQLDALWPDNPQVRALNAQWRKQRELSALSAE +ALNGYAQAQSQLQRLSAQLDALDERKGRYLTGSELKTAVYGIRQSLKEPPLEELLRQLEE +QKQTGEVSPTLLTQIDTRLNQLLNRYVILLDTKVEQSQ* +>test.0417.00002.0002i_00021 948 NA | NA | NA | ID=2_13;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.444 | NA +MKNVLVTVPSFSARCVSASKLLRENNFNLIIKNNVEHLLKSESTALRESICAVIAGKDGY +QADTLSLLPGVRIISRFGTGIDNIDLRAAQQSGIVVNNAVGINSNAVAEFIIGLIFASMR +NIPGSYHAMQNGYWGESHGCELQGKRIGLVGYGNIGKTLAKRLSGFDVELLAFDKQPDYQ +VADKAGVQFVSIEDIFMQSHVIIVLLPFSSELENFISHKYLSMMRNGALIINAARGKLLD +EGALLQVIEERNVFAALDVFSSEPLAQFSPLLHAKNIITTPHIAAATVESYQQTGIHVAQ +SIIDYFAGREIKNVL* +>test.0417.00002.0002i_00022 597 NA | NA | NA | ID=2_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424 | NA +MNNTDLIHLIKHFMRNEHKAVEEVIDSPLSEVANLIKVLQSCQGKVVFIGVGKSGIIARK 
+LAATFASTGTPSFFVHGTEAVHGDLGMVAKDDVVILISNSGETAEILATLPSLKKMGNYL +ISFTRSHHSSLAISCDLSVEIPVKSEADNLGLAPSCSSTVVLVVGDAVALALSELKKFTR +ADFGLYHPGGALGIKANS* +>test.0417.00002.0002i_00023 1176 NA | NA | NA | ID=2_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.378 | NA +MDVFNTPVSRKGTYCTQWDFCEDRFGVKDVLPFSISDMDLPIPDAITRALKKRLEHPILG +YSRWQHGEYLNAIVNWYYQQYQTDIKPEWITYSPSVMYSIAKAIELLTSHGDNILVFTPV +YNAFFDVIKHSERNILTASLIIKNEGGYAINWQDFDLKIKSAKMMLLCNPHNPTGTVWSE +EELHKIAASCTRHNVWLCSDEIHSDFVFNRSFTSALKIKKEKVVVFNSISKTFNVPALTG +SYMISTDDNFNHKFRTISRYRDFVNSPSVLNIIATIIAYNECEGWLKSLKAHIASNIQFT +QQYLNENIPELIVRPADGCYFSWIDCSAIGYPFDEFYSRLIHEGKVGIMAGHVYGTEGEG +YLRLNLACGREKLYMGLTRLVSVIKNINQGE* +>test.0417.00002.0002i_00024 1581 NA | NA | NA | ID=2_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.441 | NA +MKQKKAWSFFQSLGKAFMYPIALLSVCGMMLGLGSGLASDDMAKLIPFLAIPIIKTILDF +IVSLGLFAFVNLPVLFAIAIPLGLLKDKEDKAYGAFSGLIGFMAMHLGTNFYLKQHDLLV +VADQMSTHGQTIILGIQSYNTSVLGGIVAGLLVASMYKKIVNLRIPESLGFYSGPRLVPI +ITLIVMSGFGLIIPFIWPPFFNLFMLIGHWISTSGPVGYFFYAVAERVTIPFGLNHLVTS +VFRFTPIGGSAVIGGEEYYGTLNMFMAYVKENAVIPLDLAGKMEQGKLMIQYGLAGAALA +MYRTAHAQNRKAIKALLISGVLTVIIGGVSEPIEFLFLFVSPLLFVFHAFMNGFANMVLP +YMGVKMGFTGDLIQFISFGVLRGTRTGWPIAVCVEVAYFFIYYFVFRWTILKFNLMTVGR +EESSPVTLNAHEDTAIADIPTPDKSELQAAEQMVKALGGKENIKSLDNCVTRLRLTIADM +RLIDEVAIKRAGGIAVVKLDQNTLQVIIGTKVIALRRDMDNYMGIY* +>test.0417.00002.0002i_00025 825 NA | NA | NA | ID=2_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.336 | NA +MIIEKVMNNNCVQASMNGQEVIISGPGVGYNKKYGMSVPEHPANRIFYVRNEQKNKLYKL +IEHVDIEYVFVAEKIVQYAEKNLEKNLNPSLLLILADHISNAISRVVSGIQINNVFLDEI +KALYKAEYAISRDALTIINEQFSVQLPDDEIGFIALHILNNYENSVDYESVRIIELSQII +TELIEVVYNRKVDRSSFNYSRFMMHLKYFSSRVLCNEKIKQKDIGDIYEQFLEKDILLQR +AIHEIERYLYATFKYELILEEKLYLSIRTKVLMD* +>test.0417.00002.0002i_00026 1254 NA | NA | NA | ID=2_18;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA 
+MSGSNTAISRRRLLQGAGAMWLLSVSQVSLAAVSQVVAVRVWPASSYTRVTVESNRQLKY +KQFALSNPERVVVDIEDVNLNSVLKGMAAQIRADDPFIKSARVGQFDPQTVRMVFELKQN +VKPQLFALAPVAGFKERLVMDLYPANAQDMQDPLLALLEDYNKGDLEKQVPPAQSGPQPG +KAGRDRPIVIMLDPGHGGEDSGAVGKYKTREKDVVLQIARRLRSLIEKEGNMKVYMTRNE +DIFIPLQVRVAKAQKQRADLFVSIHADAFTSRQPSGSSVFALSTKGATSTAAKYLAQTQN +ASDLIGGVSKSGDRYVDHTMFDMVQSLTIADSLKFGKAVLNKLGKINKLHKNQVEQAGFA +VLKAPDIPSILVETAFISNVEEERKLKTATFQQEVAESILAGIKAYFADGATLARRG* +>test.0417.00002.0002b_00027 519 NA | NA | NA | ID=2_19;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.526 | NA +MVKERKTELVEGFRHSVPYINTHRGKTFVIMLGGEAIEHENFSSIVNDIGLLHSLGIRLV +VVYGARPQIDANLAAHHHEPLYHKNIRVTDAKTLELVKQAAGTLQLDITARLSMSLNNTP +LQGAHINVVSGNFIIAQPLGVDDGVDYCHSGRIRRIDEDAIHRQLDSGAIVLM +>test.0417.00002.0003b_00028 810 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.520 | NA +PVAVSVTGESFNLTSEEIATQLAIKLKAEKMIGFCSSQGVTNDDGDIVSELFPNEAQARV +EAQEEKGDYNSGTVRFLRGAVKACRSGVRRCHLISYQEDGALLQELFSRDGIGTQIVMES +AEQIRRATINDIGGILELIRPLEQQGILVRRSREQLEMEIDKFTIIQRDNTTIACAALYP +FPEEKIGEMACVAVHPDYRSSSRGEVLLERIAAQAKQSGLSKLFVLTTRSIHWFQERGFT +PVDIDLLPESKKQLYNYQRKSKVLMADLG* +>test.0417.00002.0003i_00029 1827 NA | NA | NA | ID=3_2;partial=00;start_type=ATG;rbs_motif=AGGAGG;rbs_spacer=3-4bp;gc_cont=0.549 | NA +MKLQKQLLEAVEHKQLRPLDVQFALTVAGDEHPAVTLAAALLSHDAGEGHVCLPLSRLEN +NEASHPLLATCVSEIGELQNWEECLLASQAVSRGDEPTPMILCGDRLYLNRMWCNERTVA +RFFNEVNHAIEVDEALLAQTLDKLFPVSDEINWQKVAAAVALTRRISVISGGPGTGKTTT +VAKLLAALIQMADGERCRIRLAAPTGKAAARLTESLGKALRQLPLTDEQKKRIPEDASTL +HRLLGAQPGSQRLRHHAGNPLHLDVLVVDEASMIDLPMMSRLIDALPDHARVIFLGDRDQ +LASVEAGAVLGDICAYANAGFTAERAGQLSRLTGSHVPAGTGTEAASLRDSLCLLQKSYR +FGSDSGIGQLAAAINRGDKTAVKTVFQQDFTDIEKRLLQSGEDYIAMLEEALAGYGRYLD +LLQARAEPDLIIQAFNEYQLLCALREGPFGVAGLNERIEQFMQQKRKIHRHPHSRWYEGR +PVMIARNDSALGLFNGDIGIALDRGQGTRVWFAMPDGNIKSVQPSRLPEHETTWAMTVHK +SQGSEFDHAALILPSQRTPVVTRELVYTAVTRARRRLSLYADERILSAAIATRTERRSGL +AALFSSRG* +>test.0417.00002.0003i_00030 3543 NA | NA | NA | 
ID=3_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.544 | NA +MSDVAETLDPLRLPLQGERLIEASAGTGKTFTIAALYLRLLLGLGGSAAFPRPLTVEELL +VVTFTEAATAELRGRIRSNIHELRIACLRETTDNPLYKRLLEEIDDKAQAAQWLLLAERQ +MDEAAVFTIHGFCQRMLNLNAFESGMLFEQQLIEDESLLRYQACADFWRRHCYPLPREIA +QVVFETWKGPQALLRDINRYLQGEAPVIKAPPPDDETLASRHAQIVARIDAVKQQWRDAV +GELDALIESSGIDRRKFNRSNQAKWIEKISAWAEEETNSYQLPESLEKFSQRFLEDRTKA +GGETPRHPLFEAIEQLLAEPLSIRDLVITRALAEIRETVAREKRRRGELGFDDMLSRLDS +ALRSESGEVLAAAIRTRFPVAMIDEFQDTDPQQYRIFRRIWHHQPETALLLIGDPKQAIY +AFRGADIFTYMKARSEVHAHYTLDTNWRSAPGMVNSVNKLFSQTDDAFMFREIPFIPVKS +AGKNQALRFVFKGETQPAMKMWLMEGESCGVGDYQSTMAQVCAAQIRDWLQAGQRGEALL +MNGDDARPVRASDISVLVRSRQEAAQVRDALTLLEIPSVYLSNRDSVFETLEAQEMLWLL +QAVMTPERENTLRSALATSMMGLNALDIETLNNDEHAWDAVVEEFDGYRQIWRKRGVMPM +LRALMSARNIAENLLATAGGERRLTDILHISELLQEAGTQLESEHALVRWLSQHILEPDS +NASSQQMRLESDKHLVQIVTIHKSKGLEYPLVWLPFITNFRVQDQAFYHDRHSFEAVLDL +NAAPESVDLAEAERLAEDLRLLYVALTRSVWHCSLGVAPLVRRRGDKKGDTDVHQSALGR +LLQKGEPQDAAGLRTCIEALCDDDIAWQTAQIGDNQPWQVNDALTAELNARTLQRLPGDN +WRVTSYSGLQQRGHGIAQDLMPRLDVDAAGVVSVVEEPTLTPHQFPRGASPGTFLHSLFE +DLDFTQPVDPNWVQEKLELGGFEPQWEPVLTEWITAVLQAPLNETGVSLNQLSDRDKQVE +MEFYLPISEPLIASQLDALIRQFDPLSAGCPPLEFMQVRGMLKGFIDLVFRHEGRYYLLD +YKSNWLGEDSSAYTQQAMAAAMQAHRYDLQYQLYTLALHRYLRHRIADYDYERHFGGVIY +LFLRGVDKEHPQQGIYATRPNAGLIDLMDEMFAGMTLEEA* +>test.0417.00002.0003i_00031 2889 NA | NA | NA | ID=3_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.510 | NA +MPRSIWFKALLLFVALWAPLSQAETGWQPIQETIRKSDKDNRQYQAIRLDNGMVVLLVSD +PQAVKSLSALVVPVGSLEDPEAYQGLAHYLEHMSLMGSKKYPQADSLAEYLKMHGGSHNA +STAPYRTAFYLEVENDALPGAVDRLADAIAEPLLDKKYAERERNAVNAELTMARTRDGMR +MAQVSAETINPAHPGSKFSGGNLETLSDKPGNPVQQALKDFHEKYYSANLMKAVIYSNKP +LPELAKMAADTFGRVPNKESKKPEITVPVVTDAQKGIIIHYVPALPRKVLRVEFRIDNNS +AKFRSKTDELITYLIGNRSPGTLSDWLQKQGLVEGISANSDPIVNGNSGVLAISASLTDK +GLANRDQVVAAIFSYLNLLREKGIDKQYFDELANVLDIDFRYPSITRDMDYVEWLADTMI +RVPVEHTLDAVNIADRYDAKAVKERLAMMTPQNARIWYISPKEPHNKTAYFVDAPYQVDK 
+ISAQTFADWQKKAANIALSLPELNPYIPDDFSLIKSEKKYDHPELIVDESNLRVVYAPSR +YFASEPKADVSLILRNPKAMDSARNQVMFALNDYLAGLALDQLSNQASVGGISFSTNANN +GLMVNANGYTQRLPQLFQALLEGYFSYTATEDQLEQAKSWYNQMMDSAEKGKAFEQAIMP +AQMLSQVPYFSRDERRKILPSITLKEVLAYRDALKSGARPEFMVIGNMTEAQATTLARHV +QKQLGADGSEWCRNKDVVVDKKQSVIFEKAGNSTDSALAAIFVPTGYDEYTSSAYSSLLG +QIVQPWFYNQLRTEEQLGYAVFAFPMSVGRQWGMGFLLQSNDKQPSFLWERYKAFFPTAE +AKLRAMKPEEFAQIQQAVITQMLQAPQTLGEEASKLSKDFDRGNMRFDSRDKIVAQIKLL +TPQKLADFFHQAVVEPQGMAILSQISGSQNGKAEYVHPEGWKVWENVSALQQTMPLMSEK +NE* +>test.0417.00002.0003i_00032 3369 NA | NA | NA | ID=3_5;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.535 | NA +MLRVYHSNRLDVLEALMEFIVERERLDDPFEPEMILVQSTGMAQWLQMTLSQKFGIAANI +DFPLPASFIWDMFVRVLPEIPKESAFNKQSMSWKLMTLLPQLLEREDFTLLRHYLTDDSD +KRKLFQLSSKAADLFDQYLVYRPDWLAQWETGHLVEGLGEAQAWQAPLWKALVEYTDELG +QPRWHRANLYQRFIETLESATTCPPGLPSRVFICGISALPPVYLQALQALGKHIEIHLLF +TNPCRYYWGDIKDPAYLAKLLTRQRRHSFEDRELPLFRDSENAGQLFNSDGEQDVGNPLL +ASWGKLGRDYIYLLSDLESSQELDAFVDVTPDNLLHNIQSDILELENRAVAGVNIEEFSR +SDNKRPLDPLDSSITFHVCHSPQREVEVLHDRLLAMLEEDPTLTPRDIIVMVADIDSYSP +FIQAVFGSAPADRYLPYAISDRRARQSHPVLEAFISLLSLPDSRFVSEDVLALLDVPVLA +ARFDITEEGLRYLRQWVNESGIRWGIDDDNVRELELPATGQHTWRFGLTRMLLGYAMESA +QGEWQSVLPYDESSGLIAELVGHLASLLMQLNIWRRGLAQERPLEEWLPVCRDMLNAFFL +PDAETEAAMTLIEQQWQAIISEGLGAQYGDAVPLSLLRDELALRLDQERISQRFLAGPVN +ICTLMPMRSIPFKVVCLLGMNDGVYPRQLAPLGFDLMSQKPKRGDRSRRDDDRYLFLEAL +ISAQQKLYISYIGRSIQDNSERFPSVLVQELIDYIGQSHYLPGDEALNCDESEARVKAHL +TCHHTRMPFDPQNYQPGNLQSYAREWLPAASQAGKAHSEFVQPLPFTLPETVPLETLQRF +WAHPVRAFFQMRLQVNFRTEDSEIPDTEPFILEGLSRYQINQQLLNVLVEQDDAERLFRR +FRAAGDLPYGAFGEIFWETQCQEMQQLADRVIACRQPGQSMEIDLACNGVQITGWLPQVQ +PDGLLRWCPSLLSVAQGMQLWLEHLVYCASGGNGESRLFLRKDGEWRFPPLAAEQALHYL +SQLIEGYREGMSAPLLVLPESGGAWLKTCYDAQNDAMLDDDSTLQKARTKFLQAYEGNMM +VRGEGDDIWYQRLWRQLTPETMEAIVEQSQRFLLPLFRFNQS* +>test.0417.00002.0003i_00033 324 NA | NA | NA | ID=3_6;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.543 | NA +MSASLRNQQGFSLPEVMLAMVLMVMIVTALSGFQRTLMNSLASRNQYQQLWRHGWQQTQL 
+RAISPPANWQVNRMQTSQAGCVSISVTLVSPGGREGEMTRLHCPNRQ* +>test.0417.00002.0003i_00034 408 NA | NA | NA | ID=3_7;partial=00;start_type=GTG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.527 | NA +MNREKGVSSLALVLMLLILGSLLLQGMSQQDRSFASRVSMESQSLSRQAIVQSALEWGKM +HSWQTQPAVQCLLYAATGARVCLRLLADNEALLIAGYEGVSLWRTGEVIDGNIVFSPRGW +SDFCPLKERALCQLP* +>test.0417.00002.0003i_00035 564 NA | NA | NA | ID=3_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.532 | NA +MPVKEQGFSLLEVLIAMAISSVLLLGAARFLPALQRESLTSTRKLALEDEIWLRVFTVAK +HLQRAGYCHGSCTGEGLEIVGQGDCVIVQWDANSNGIWDREPVKESDQIGFRLKEHVLET +LRGATSCEGKGWDKVTNPDAIIIDTFQVVRQDVSGFSPVLTVNIHAASKADPQTVVDASY +SVTGANL* +>test.0417.00002.0003i_00036 504 NA | NA | NA | ID=3_9;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.544 | NA +MKTQRGYTLIETLVAMLILVMLSASGLYGWQYWQQSQRLWQTASQARDYLLYLREDANWH +NRDHSISLIREGTLWCLVSSVAGANTCHGSSVAGANTCHGSSPLVFVPRWPEVEMSDLTP +SLAFFGLRNTAWAGHIRFKNSTGEWWLVVSPWGRLRLCQQGETEGCL* +>test.0417.00002.0003i_00037 795 NA | NA | NA | ID=3_10;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.516 | NA +MKQYLELMQKVLDEGTQKNDRTGTGTLSIFGHQMRFNLQDGFPLVTTKRCHLRSIIHELL +WFLQGDTNIAYLHENNVTIWDEWADENGDLGPVYGKQWRAWPTPDGRHIDQITTVLNQLK +NDPDSRRIIVSAWNVGELDKMALAPCHAFFQFYVADGKLSCQLYQRSCDVFLGLPFNIAS +YALLVHMMAQQCDLEVGDFVWTGGDTHLYSNHMDQTHLQLSREPRPLPKLIIKRKPESIF +DYRFEDFEIEGYDPHPGIKAPVAI* +>test.0417.00002.0003i_00038 876 NA | NA | NA | ID=3_11;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.525 | NA +MTSSYLHFPEFDPVIFSIGPVALHWYGLMYLVGFIFAMWLATRRANRPGSGWTKNEVENL +LYAGFLGVFLGGRIGYVLFYNFPQFMADPLYLFRVWDGGMSFHGGLIGVIVVMIIFARRT +KRSFFQVSDFIAPLIPFGLGAGRLGNFINGELWGRVDPNFPFAMLFPGSRTEDILLLQTN +PQWQSIFDTYGVLPRHPSQLYELLLEGVVLFIILNLYIRKPRPMGAVSGLFLIGYGAFRI +IVEFFRQPDAQFTGAWVQYISMGQILSIPMIVAGVIMMVWAYRRSPQQHVS* +>test.0417.00002.0003i_00039 2247 NA | NA | NA | ID=3_12;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.536 | NA 
+MLTRLREIVEKVASAPRLNEALNILVTDICLAMDTEVCSVYLADHDRRCYYLMATRGLKK +PRGRTVTLAFDEGIVGLVGRLAEPINLADAQKHPSFKYIPSVKEERFRAFLGVPIIQRRQ +LLGVLVVQQRELRQYDESEESFLVTLATQMAAILSQSQLTALFGQYRQTRIRALPAAPGV +AIAEGWQDATLPLMEQVYQASTLDPALERERLTGALEEAANEFRRYSKRFAAGAQKETAA +IFDLYSHLLSDTRLRRELFAEVDKGSVAEWAVKTVIEKFAEQFAALSDNYLKERAGDLRA +LGQRLLFHLDDANQGPNAWPERFILVADELSATTLAELPQDRLVGVVVRDGAANSHAAIM +VRALGIPTVMGADIQPSVLHRRTLIVDGYRGELLVDPEPVLLQEYQRLISEEIELSRLAE +DDVNLPAQLKSGERIKVMLNAGLSPEHEEKLGSRIDGIGLYRTEIPFMLQSGFPSEEEQV +AQYQGMLQMFNDKPVTLRTLDVGADKQLPYMPISEENPCLGWRGIRITLDQPEIFLIQVR +AMLRANAATGNLNILLPMVTSLDEVDEARRLIERAGREVEEMIGYEIPKPRIGIMLEVPS +MVFMLPHLAKRVDFISVGTNDLTQYILAVDRNNTRVANIYDSLHPAMLRALAMIAREAEI +HGIDLRLCGEMAGDPMCVAILIGLGYRHLSMNGRSVARVKYLLRRIDFAEAENLAQRSLE +AQLATEVRHQVAAFMERRGMGGLIRGGL* +>test.0417.00002.0003i_00040 531 NA | NA | NA | ID=3_13;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.493 | NA +MIDDDGYRPNVGIVICNRQGQVMWARRFGQHSWQFPQGGINPGESAEQAMYRELFEEVGL +SRKDVRILASTRNWLRYKLPKRLVRWDTKPVCIGQKQKWFLLQLVSGDAEINMQTSSTPE +FDGWRWVSYWYPVRQVVSFKRDVYRRVMKEFASVVMSLQENTPKPQNASAYRRKRG* +>test.0417.00002.0003i_00041 162 NA | NA | NA | ID=3_14;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.395 | NA +METVVEVFHSYPSFLWITWCKILFIFSDQIWKTRCSVAQLDYRKPKKQYKSEN* +>test.0417.00002.0003i_00042 690 NA | NA | NA | ID=3_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA +MSQPRPLLSPPETEEQLLAQAQQLSGYTLGELAALAGLVTPENLKRDKGWIGVLLEIWLG +ASAGSKPEQDFAALGVELKTIPVDSLGRPLETTFVCVAPLTGNSGVTWETSHVRHKLKRV +LWIPVEGERSIPLAKRRVGSPLLWSPNEEEDRQLREDWEELMDMIVLGQVERITARHGEY +LQIRPKAANAKALTEAIGARGERILTLPRGFYLKKNFTSALLARHFLIQ* +>test.0417.00002.0003i_00043 714 NA | NA | NA | ID=3_16;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.503 | NA +MLFAWITDPNAWLALGTLTLLEIVLGIDNIIFLSLVVAKLPTAQRAHARRLGLAGAMVMR +LALLASIAWVTRLTNPLFTIFSQEISARDLILLLGGLFLIWKASKEIHESIEGEEEGLKT 
+RVSSFLGAIVQIMLLDIIFSLDSVITAVGLSDHLFIMMAAVVIAVGVMMFAARSIGDFVE +RHPSVKMLALSFLILVGFTLILESFDIHVPKGYIYFAMFFSIAVESLNLIRNKKNPL* +>test.0417.00002.0003i_00044 219 NA | NA | NA | ID=3_17;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.434 | NA +MKKWAVIISAVGLAFAVSGCSSDYVMATKDGRMILTDGKPEIDDDTGLVSYHDQQGNAMQ +INRDDVSQIIER* +>test.0417.00002.0003i_00045 1041 NA | NA | NA | ID=3_18;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.544 | NA +MQYHRIPHSSLEVSTLGLGTMTFGEQNSEADAHAQLDYAVAQGINLIDVAEMYPVPPRPE +TQGLTETYVGNWLAKHGSREKLIIASKVSGPSRNNDKGIRPDQALDRKNIREALHDSLKR +LQTDYLDLYQVHWPQRPTNCFGKLGYSWTDSAPAVSLLDTLDALAEYQRAGKIRYIGVSN +ETAFGVMRYLHLADKHDLPRIVTIQNPYSLLNRSFEVGLAEVSQYEGVELLAYSCLGFGT +LTGKYLNGAKPAGARNTLFSRFTRYSGEQTQKAVAAYVDIARRHGLDPAQMALAFVRRQP +FVASTLLGATTMEQLKTNVESLHLELSEDVLAEIEAVHQVYTYPAP* +>test.0417.00002.0003i_00046 1194 NA | NA | NA | ID=3_19;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.553 | NA +MSESVHTNTSLWSKGMKAVIVAQFLSAFGDNALLFATLALLKAQFYPEWSQPILQMVFVG +AYILFAPFVGQVADSFAKGRVMMFANGLKLLGAASICFGINPFLGYTLVGVGAAAYSPAK +YGILGELTTGSKLVKANGLMEASTIAAILLGSVAGGVLADWHILVALVACALAYGGAVVA +NIYIPKLAAARPGQSWNLISMTRSFLNACTSLWRNGETRFSLVGTSLFWGAGVTLRFLLV +LWVPVALGITDNATPTYLNAMVAIGIVVGAGAAAKLVTLETVSRCMPAGILIGVVVLIFS +LQHELLPAYALLMLIGVLGGFFVVPLNALLQERGKKSVGAGNAIAVQNLGENSAMLLMLG +IYSLAVMVGIPVVPIGIGFGALFALAITALWIWQRRH* +>test.0417.00002.0003i_00047 2160 NA | NA | NA | ID=3_20;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.522 | NA +MLFSFFRNLCRVLYRVRVTGDTKALKGERVLITPNHVSFIDGILLALFLPVRPVFAVYTS +ISQQWYMRWLKSFIDFVPLDPTQPMAIKHLVRLVEQGRPVVIFPEGRITTTGSLMKIYDG +AGFVAAKSGATVIPVRIEGAELTHFSRLKGLVKRRLFPQITLHILPPTQVEMPDAPRARD +RRKIAGEMLHQIMMEARMAVRPRETLYESLLSAMYRFGAGKKCVEDVNFTPDSYRKLLTK +TLFVGRILEKYSVEGERIGLMLPNAGISAAVIFGAIARRRIPAMMNYTAGVKGLTSAITA +AEIKTIFTSRQFLDKGKLWHLPEQLTQVRWVYLEDLKADVTTADKVWIFAHLLMPRLAQV +KQQPEEEALILFTSGSEGHPKGVVHSHKSILANVEQIKTIADFTTNDRFMSALPLFHSFG 
+LTVGLFTPLLTGAEVFLYPSPLHYRIVPELVYDRSCTVLFGTSTFLGHYARFANPYDFYR +LRYVVAGAEKLQESTKQLWQDKFGLRILEGYGVTECAPVVSINVPMAAKPGTVGRILPGM +DARLLSVPGIEEGGRLQLKGPNIMNGYLRVEKPGVLEVPTAENIRGEMERDWYDTGDIVR +FDEQGFVQIQGRAKRFAKIAGEMVSLEMVEQLALGVSPDKVHATAIKSDASKGEALVLFT +TDNELTRDKLQQYAREHGVPELAVPRDIRYLKQMPLLGSGKPDFVTLKSWVDEAEQHDE* +>test.0417.00002.0003i_00048 1032 NA | NA | NA | ID=3_21;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +MATIKDVARLAGVSVATVSRVINNSPKASEASRLAVHSAMESLSYHPNANARALAQQTTE +TIGLVVGDVSDPFFGAMVKAVEQVAYHTGNFLLIGNGYHNEQKERQAIEQLIRHRCAALV +VHAKMIPDADLASLMKQMPGMVLINRILPGFENRCIALDDRYGAWLATRHLIQQGHTRIG +YLCSNHSISDAEDRLQGYYDALAESGIPANDRLVTFGEPDESGGEQAMTELLGRGRNFTA +VACYNDSMAAGAMGVLNDNGIDVPGEISLIGFDDVLVSRYVRPRLTTVRYPIVTMATQAA +ELALALADNRPLPEITNVFSPTLVRRHSVSTPSLEASHHATSD* +>test.0417.00002.0003i_00049 1263 NA | NA | NA | ID=3_22;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA +MPHSLFSTDTDLTAENLLRLPAEFGCPVWVYDAQIIRRQIAALKQFDVVRFAQKACSNIH +ILRLMREQGVKVDSVSLGEIERALAAGYNPQTHPDDIVFTADVIDQATLERVSELQIPVN +AGSVDMLDQLGQVSPGHRVWLRVNPGFGHGHSQKTNTGGENSKHGIWYTDLPAALDVIQR +HHLQLVGIHMHIGSGVDYAHLEQVCGAMVRQVLEFGQDLQAISAGGGLSIPYQQGEEAVD +TEHYYGLWNAAREQIARHLGHPVKLEIEPGRFLVAQAGVLITQVRSVKQMGSRHFVLVDA +GFNDLMRPAMYGSYHHISALAADGRSLEHAPTVETVVAGPLCESGDVFTQQEGGNVETRA +LPEVKACDYLVLHDTGAYGASMSSNYNSRPLLPEVLFDNGQARLIRRRQTIEELLALELL +* +>test.0417.00002.0003i_00050 936 NA | NA | NA | ID=3_23;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.533 | NA +MAAVNLRHIEIFHAVMTAGSLTEAAHLLHTSQPTVSRELARFEKVIGLKLFERIRGRLHP +TVQGLRLFEEVQRSWYGLDRIVSAAESLREFRQGELSIACLPVFSQSFLPQLLQPFLARY +PDVSLNIVPQESPLLEEWLSAQRHDLGLTETLHTPAGTERTELLSLDEVCVLPPGHPLAV +KKVLTPDDFHGENYISLSRTDSYRQLLDQLFTENQVKRRMIVETHSAASVCAMVRAGVGV +SVVNPLTALDYAASGLVVRRFSIAVPFTVSLIRPLHRPSSALVQAFSEHLQAGLPKLVTS +LDTILSSATTA* +>test.0417.00002.0003i_00051 693 NA | NA | NA | ID=3_24;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.506 | NA 
+MKTIGLLGGMSWESTIPYYRLINEGIKQRLGGLHSAQVLLHSVDFHEIEECQRRGEWDKT +GDILAEAALGLQRAGAEGIVLCTNTMHKVADAIESRCSLPFLHIADATGRAITGAGMTRV +ALLGTRYTMEQDFYRGRLTEQFSINCLIPEADERAKINQIIFEELCLGQFTEASRAYYAQ +VIARLAEQGAQGVIFGCTEIGLLVPEERSVLPVFDTAAIHAEDAVAFMLS* +>test.0417.00002.0003i_00052 1419 NA | NA | NA | ID=3_25;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.517 | NA +MVTINTESALTPRPLRDTRRMNMFVSVAAAVAGLLFGLDIGVIAGALPFITDHFVLTSRL +QEWVVSSMMLGAAIGALFNGWLSFRLGRKYSLMAGAILFVLGSIGSAFATSVEMLIAARV +VLGIAVGIASYTAPLYLSEMASENVRGKMISMYQLMVTLGIVLAFLSDTAFSYSGNWRAM +LGVLALPAVLLIILVVFLPNSPRWLAEKGRHIEAEEVLRMLRDTSEKAREELNEIRESLK +LKQGGWALFKINRNVRRAVFLGMLLQAMQQFTGMNIIMYYAPRIFKMAGFTTTEQQMIAT +LVVGLTFMFATFIAVFTVDKAGRKPALKIGFSVMALGTLVLGYCLMQFDNGTASSGLSWL +SVGMTMMCIAGYAMSAAPVVWILCSEIQPLKCRDFGITCSTTTNWVSNMIIGATFLTLLD +SIGAAGTFWLYTALNIAFVGITFWLIPETKNVTLEHIERKLMAGEKLRNIGV* +>test.0417.00002.0003i_00053 762 NA | NA | NA | ID=3_26;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.521 | NA +MILNAFSLEGKVAVVTGCDTGLGQGMALGLAQAGCDIVGINIVEPTETIKQVTAQGRRFL +SLTADLRKIDGIPGLLDRAVAEFGHIDILVNNAGLIRREDALEFSETDWDDVMNLNIKSV +FFMSQAAAKHFIAQGNGGKIINIASMLSFQGGIRVPSYTASKSGVMGVTRLMANEWAKHN +INVNAIAPGYMATNNTQQLRADEQRSAEILDRIPAGRWGLPSDLMGPVVFLASSASDYVN +GYTIAVDGGWLAR* +>test.0417.00002.0003i_00054 837 NA | NA | NA | ID=3_27;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.495 | NA +MDVRQSIHSAHAKTLDTQGLRNEFLVEKVFVADEYTMVYSHIDRIIVGGIMPVTKTVSVG +GEVGKQLGVSYFLERRELGVINIGGAGTITVDGQCYEIGHRDALYVGKGAKEVVFASIDT +ATPAKFYYNCAPAHTTYPTKKVTPDEVSPVTLGDNLTSNRRTINKYFVPDVLETCQLSMG +LTELAPGNLWNTMPCHTHERRMEVYFYFNMDDDACVFHMMGQPQETRHIVMHNEQAVISP +SWSIHSGVGTKAYTFIWGMVGENQVFDDMDHVAVKDLR* +>test.0417.00002.0003i_00055 1182 NA | NA | NA | ID=3_28;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +MKDVVIVGALRTPIGCFRGALAGHSAVELGSLVVKALIERTGVPAYAVDEVILGQVLTAG +AGQNPARQSAIKGGLPNSVSAITINDVCGSGLKALHLATQAIQCGEADIVIAGGQENMSR 
+APHVLTDSRTGAQLGNSQLVDSLVHDGLWDAFNDYHIGVTAENLAREYGISRQLQDAYAL +SSQQKARAAIDAGRFKDEIVPVITQSNGQTLVVDTDEQPRTDTSAEALARLNPSFDSLGS +VTAGNASSINYGAAAVMMMSEAKARALNLPVLARIRAFASVGVDPALMGIAPVYATRRCL +ERVGWQLADVDLIEANEAFAAQALSVGKMLEWDERRVNVNGGAIALGHPIGASGCRILVS +LVHEMVKRNARKGLATLCIGGGQGVALTIERDE* +>test.0417.00002.0003i_00056 1230 NA | NA | NA | ID=3_29;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.445 | NA +MSNIWSKEETLWSFALYGTAVGAGTLFLPIQLGSAGAVVLFITALVAWPLTYWPHKALCQ +FILSSKTSAGEGITGAVTHYYGKKIGNLITTLYFIAFFVVVLIYAVAITNSLTEQLAKHM +VIDLRIRMLVSLGVVLILNLIFLMGRHATIRVMGFLVFPLIAYFLFLSIYLVGSWQPDLL +TTQVEFNQNTLHQIWISIPVMVFAFSHTPIISTFAIDRREKYGEHAMDKCKKIMKVAYLI +ICISVLFFVFSCLLSIPPSYIEAAKEEGVTILSALSMLPNAPAWLSISGIIVAVVAMSKS +FLGTYFGVIEGATEVVKTTLQQVGVKKSRAFNRALSIMLVSLITFIVCCINPNAISMIYA +ISGPLIAMILFIMPTLSTYLIPALKPWRSIGNLITLIVGILCVSVMFFS* +>test.0417.00002.0003i_00057 252 NA | NA | NA | ID=3_30;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.409 | NA +MPYASRSGRSSMVERELPKLYTRVRFPSPAPIYLHIIYLPFLLYLIFYIILIQALQTFRN +RRNTSPFFVNKKRLRNAIVMYLK* +>test.0417.00002.0003i_00058 351 NA | NA | NA | ID=3_31;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA +MPYSTADGGNKGIDISAPRGTPIYAAGAGKVVYVGNQLRGYGNLIMIKHSEDYITAYAHN +DTMLVNNGQSVKAGQKIATMGSTDAASVRLHFQIRYRATAIDPLRYLPPQGSKPKC* +>test.0417.00002.0003i_00059 2298 NA | NA | NA | ID=3_32;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +MEAREATATGESCMRVDAIAKVTGRARYTDDYVMAGMCYAKYVRSPIAHGYAVSINDEQA +RSLPGVLAIFTWEDVPEIPFATAGHAWTLDENKRDTADRALLTRHVRHHGDAVAIVVARD +ELTAEKAAQLVSIEWQELPVITSPEAALAEDAAPIHNGGNLLKQSTMSTGNVQQTIDAAD +YQVQGHYQTPVIQHCHMESVTSLAWMEDDSRITIVSSTQIPHIVRRVVGQALDIPWSCVR +VIKPFIGGGFGNKQDVLEEPMAAFLTSKLGGIPVKVSLSREECFLATRTRHAFTIDGQMG +VNRDGTLKGYSLDVLSNTGAYASHGHSIASAGGNKVAYLYPRCAYAYSSKTCYTNLPSAG +AMRGYGAPQVVFAVESMLDDAATALGIDPVEIRLRNAAREGDANPLTGKRIYSAGLPECL +EKGRKIFEWEKRRAECQNQQGNLRRGVGVACFSYTSNTWPVGVEIAGARLLMNQDGTINV 
+QSGATEIGQGADTVFSQMVAETVGVPVSDVRVISTQDTDVTPFDPGAFASRQSYVAAPAL +RSAALLLKEKIIAHAAVMLHQSAMNLTLIKGHIVLIERPEEPLMSLKDLAMDAFYHPERG +GQLSAESSIKTTTNPPAFGCTFVDLTVDIALCKVTINRILNVHDSGHILNPLLAEGQVHG +GMGMGIGWALFEEMIIDAKSGVVRNPNLLDYKMPTMPDLPQLESAFVEINEPQSAYGHKS +LGEPPIIPVAAAIRNAVKMATGVAINTLPLTPKRLYEEFHLAGLI* +>test.0417.00002.0003i_00060 879 NA | NA | NA | ID=3_33;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.538 | NA +MFDFASYHRAATLADAITLLADNPQAKLLAGGTDVLIQLHHHNDRYRHIVDIHNLAELQG +ITQAEDGALRIGSATTFTQLIEDPVIQRNLPALCAAAASIAGPQIRNVATYGGNICNGAT +SADSATPTLIYDAKLELHSPRGVRFVPINGFHTGPGKVSLEHDEILVAFHFPPQPKEHAG +SAHFKYAMRDAMDISTIGCAAHCRLDNGNFSELRLAFGVAAPTPIRCQHAEQTAQNAPLN +LQTLEAISESVLQDVAPRSSWRASKEFRLHLIQTMTKKVISEAVAAAGGKLQ* +>test.0417.00002.0003i_00061 480 NA | NA | NA | ID=3_34;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.512 | NA +MNHSETITIECTINGMPFQLHAAPGMPLSELLREQGLLSVKQGCCVGECGACTVLVDGTA +IDSCLFLAAWAEGKEIRTLEGEAKGGKLSHVQLAYAKSGAVQCGFCTPGLIMATTAMLAK +PREKPLTITEIRRGLAGNLCRCTGYQMIVNTVLDCEKTK* +>test.0417.00002.0003i_00062 1779 NA | NA | NA | ID=3_35;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.459 | NA +MELATTQSVLMQIQPTIQRFARMLASVLQLEVEIVDENLCRVAGTGAYGKFLGRQLSGNS +RLLRHVLETKTEKVVTQSRFDPLCEGCDSKENCREKAFLGTPVILQDRCVGVISLIAVTH +EQQEHISDNLREFSDYVRHISTIFVSKLLEDQGPGDNISKIFATMIDNMDQGVLVVDADN +RVQFVNQTALKTLGVVQNNIIGKPVRFRPLTFESNFTHGHMQHIVSWDDKSELIIGQLHN +IQGRQLFLMAFHQSHTSFSVANAPDEPHIEQLVGECRVMRQLKRLISRIAPSPSSVMVVG +ESGTGKEVVARAIHKLSGRRNKPFIAINCAAIPEQLLESELFGYVKGAFTGASANGKTGL +IQAANTGTLFLDEIGDMPLMLQAKLLRAIEAREILPIGASSPIQVDIRIISATNQNLAQF +IAEGKFREDLFYRLNVIPITLPPLRERQEDIELLVHYFLHLHTRRLGSVYPGIAPDVVEI +LRKHRWPGNLRELSNLMEYLVNVVPSGEVIDSTLLPPNLLNNGTTEQSDVTEVSEAHLSL +DDAGGTALEEMEKQMIREALSRHNSKKEVADELGIGIATLYRKIKKYELLNT* +>test.0417.00002.0003i_00063 1188 NA | NA | NA | ID=3_36;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA 
+MKTVNELIKDINSLTSHLHEKDFLLTWEQTPDELKQVLDVAAALKALRAENISTKVFNSG +LGISVFRDNSTRTRFSYASALNLLGLAQQDLDEGKSQIAHGETVRETANMISFCADAIGI +RDDMYLGAGNAYMREVGAALDDGYKQGVLPQRPALVNLQCDIDHPTQSMADLAWLREHFG +SLENLKGKKIAMTWAYSPSYGKPLSVPQGIIGLMTRFGMDVTLAHPEGYDLIPDVVEVAK +NNAKASGGSFRQVTSMEEAFKDADIVYPKSWAPYKVMEERTELLRANDHEGLKALEKQCL +AQNAQHKDWHCTEEMMELTRDGEALYMHCLPADISGVSCKEGEVTEGVFEKYRIATYKEA +SWKPYIIAAMILSRKYAKPGALLEQLLKEAQERVK* +>test.0417.00002.0003i_00064 1197 NA | NA | NA | ID=3_37;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.531 | NA +MSVFSLKIDIADNKFFNGETSPLFSQSQAKLARQFHQKIAGYHPTPLCALDDLANLFGVK +KILVKDESKRFGLNAFKMLGGAYAIAQLLCEKYHLDIETLSFEHLKNAIGEKMTFATTTD +GNHGRGVAWAAQQLGQNAVIYMPKGSAQERVDAILNLGAECIVTDMNYDDTVRLTMQHAQ +QHGWEVVQDTAWEGYTKIPTWIMQGYATLADEAVEQMREMGVTPTHVLLQAGVGAMAGGV +LGYLVDVYSPQNLHSIIVEPDKADCIYRSGVKGDIVNVGGDMATIMAGLACGEPNPLGWE +ILRNCATQFISCQDSVAALGMRVLGNPYGNDPRIISGESGAVGLGVLAAVHYHPQRQSLM +EKLALNKDAVVLVISTEGDTDVKHYREVVWEGKHAVAP* +>test.0417.00002.0003i_00065 1212 NA | NA | NA | ID=3_38;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.507 | NA +MAKNIPFKLILEKAKDYQADMTRFLRDMVAIPSESCDEKRVVHRIKEEMEKVGFDKVEID +PMGNVLGYIGHGPRLVAMDAHIDTVGIGNIKNWDFDPYEGMETDELIGGRGTSDQEGGMA +SMVYAGKIIKDLGLEDEYTLLVTGTVQEEDCDGLCWQYIIEQSGIRPEFVVSTEPTDCQV +YRGQRGRMEIRIDVQGVSCHGSAPERGDNAIFKMGPILGELQELSQRLGYDEFLGKGTLT +VSEIFFTSPSRCAVADSCAVSIDRRLTWGETWEGALDEIRALPAVQKANAVVSMYNYDRP +SWTGLVYPTECYFPTWKVEEDHFTVKALVNAYEGLFGKAPVVDKWTFSTNGVSIMGRHGI +PVIGFGPGKEPEAHAPNEKTWKSHLVTCAAMYAAIPLSWLATE* +>test.0417.00002.0003i_00066 1386 NA | NA | NA | ID=3_39;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.524 | NA +MRVLIKNGIVVNADGQAKQDLLIESGIVRQLGTDISPQLPCEEIDASGCYVFPGGVDVHT +HFNIDVGIARSCDDFFTGTRAAACGGTTTIIDHMGFGPNGCRLRHQLEVYRGYAAHKAVI +DYSFHGVIQHINHAILDEIPMMVEEGLSSFKLYLTYQYKLNDDEVLQALRRLHESGALTT +VHPENDAAIASKRAEFIAAGLTAPRYHALSRPLECEAEAIARMINLAQIAGNAPLYIVHL +SNGLGLDYLRLARANHQPVWVETCPQYLLLDERSYDTEDGMKFILSPPLRNVREQDKLWC 
+GISDGAIDVVATDHCTFSMAQRLQISKGDFSRCPNGLPGVENRMQLLFSSGVMTGRISPE +RFVELTSAMPARLFGLWPQKGLLAPGSDGDVVIIDPRQSQQIQHRHLHDNADYSPWEGFT +CQGAIVRTLSRGETIFCDSTFTGKAGRGRFLRRKPFVPPVL* +>test.0417.00002.0003b_00067 870 NA | NA | NA | ID=3_40;partial=01;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501 | NA +MSKKIVLALGGNALGDDLAGQMKAVKITSQAIVDLIAQGHEVIVTHGNGPQVGMINQAFE +AAAKTEAHSPMLPMSVCVALSQGYIGYDLQNALREELLSRGINKPVATLVTQVEVDANDP +AFLTPTKPIGSFFTEQEAELLTKQGYTLKEDAGRGYRRVVASPKPVDIIEKETVKALVDA +GQVVITVGGGGIPVIREGNHLRGASAVIDKDWASARLAEMIDADMLIILTAVEKVAINFG +KENEQWLDRLSLSDAERFIEEGHFAKGSMLPKVEAAASFARSRAGREALI +>test.0417.00002.0004b_00068 1626 NA | NA | NA | ID=4_1;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.523 | NA +MNIFTEAAKLEEQNCPFAMAQIVDSRGSTPRHSAQMLVRADGSIVGTIGGGMVERKVIEE +SLQALQERKPRLFHGRMARNGADAVGSDCGGAMSVFISVHGMRPRLVLIGAGHVNRAIAQ +SAALLGFDIAVADIYRESLNPELFPPSTTLLHAESFGAAVEALDIRPDNFVLIATNNQDR +EALDKLIEQPIAWLGLLASRRKVQLFLRQLREKGVAEEHIARLHAPVGYNIGAETPQEIA +ISVLAEILQVKNNAPGGLMMKPSHPSGHQLVVIRGAGDIASGVALRLYHAGFKVIMLEVE +KPTVIRCTVAFAQAVFDGEMTVEGVTARLATSSAEAMKLTERGFIPVMVDPTCSLLDELK +PLCVVDAILAKQNLGTRADMAPVTIALGPGFTAGKDCHAVIETNRGHWLGQVIYSGCAQE +NTGVPGNIMGHTTRRVIRAPAAGIMRSNVKLGDLVKEGDVIAWIGEHEIKAPLTGMVRGL +LNDGLAVVGGFKIGDIDPRGETADFTSVSDKARAIGGGVLEALMMLMHQGVKATKEVLEV +A* +>test.0417.00002.0004i_00069 480 NA | NA | NA | ID=4_2;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.504 | NA +MQGFTPEAIDALVQRPECDVILIEADGSRGMPLKAPDEHEPCIPKSSCCVIAVMGGHILG +AKVSTENVHRWSQFADITGLTPAAPLQLSDLVALVRHPQGAFKNVPQGCRRVWFINRFSQ +CENAIAQSELLQPLQQHNVEAIWLGDIQEHPAIARRFVN* +>test.0417.00002.0004i_00070 579 NA | NA | NA | ID=4_3;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.430 | NA +MSAIDCIITAAGLSSRMGQWKMMLPWQQGTILDTSIKNALQFCSRIILVTGYRGNELHER +YANQSNITIIHNPDYAQGLLTSVKAAVPAVQTEHCFLTHGDMPTLTIDIFRKIWSLRNDG +AILPLHNGIPGHPILVSKPCLMQAIQRPNVTNMRQALLMGEHYSVEIENAEIILDIDTPD +DFITAKKRYTEI* +>test.0417.00002.0004i_00071 3099 NA 
| NA | NA | ID=4_4;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.526 | NA +MGDIMRPIPFEELLTRIFDEYQQQRSIFGIPEQQFYSPVKGKTVSVFGETCATPVGPAAG +PHTQLAQNIVTSWLTGGRFIELKTVQILDRLELEKPCIDAEDECFNTEWSTEFTLLKAWD +EYLKAWFALHLLEAMFQPSDSGKSFIFNMSVGYNLEGIKQPPMQQFIDNMMDASDHPKFA +QYRDALNKLLQNEAFLARHGLQEKRESLQALPARIPTSMVQGVTLSTMHGCPPHEIEAIC +RYMLEEKGLNTFVKLNPTLLGYARVREILDVCGFGYIGLKEESFDHDLKLTQALEMLERL +MALAKEKSLGFGVKLTNTLGTINNKGALPGEEMYMSGRALFPLSINVAAVLSRAFDGKLP +ISYSGGASQLTIRDIFDTGIRPITMATDLLKPGGYLRLSACMRELEGSDAWGLDHVDVER +LNRLAADALTMEYTQKHWKPEERIEVAEDLPLTDCYVAPCVTACAIKQDIPEYIRLLGEH +RYADALELIYQRNALPAITGHICDHQCQYNCTRLDYDSALNIRELKKVALEKGWEEYKQR +WHKPAGSGSRHPVAVIGAGPAGLAAGYFLARAGHPVTLFEREANAGGVVKNIIPQFRIPA +ELIQHDIDFVADHGVKFEYGCSPDLTVEQLKNQGFHYVLIATGTDKNSGVKLAGDNQNVW +KSLPFLREYNKGTALKLGKHVVVVGAGNTAMDCARAALRVPGVEKATVVYRRSLQEMPAW +REEYEEALHDGVEFRFLNNPERFDADGTLTLRVMSLGEPDEKGRRRPVETNETVTLHVDS +LITAIGEQQDTEALNAMGVPLDKNGWPDVDHNGETRLTDVFMIGDVQRGPSSIVAAVGTA +RRATDAILSRENIRSHQNDKYWNNVNPAEIYQRKGDISVTLVNSDDRDAFVAQEAARCLE +CNYVCSKCVDVCPNRANVSIAVPGFQNRFQTLHLDAYCNECGNCAQFCPWNGKPYKDKIT +VFSLSQDFDNSSNPGFLVEDCRVRVRLNNQSWVLNIDSEGQFNNVPPELNDMCRIISHVH +QHHHYLLGRVEV* +>test.0417.00002.0004i_00072 1329 NA | NA | NA | ID=4_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525 | NA +MLILKNVTAVQLHPAKVQEGVDIAIENDVIVAIDDALTQRYPDASYKEMHGRIVMPGIVC +SHNHFYSGLSRGIMANIAPCPDFISTLKNLWWRLDRALDEESLYYSGLICSLEAIKSGCT +SVIDHHASPAYIGGSLSTLRDAFLKVGLRAMTCFETTDRNSGIKELQEGVEENIRFARQI +DEAKKAATEPYLVEAHIGAHAPFTVPDAGLEMLCEAVKSTGRGLHIHAAEDLYDVSYSHH +WYGKDLLARLAQFDLIDSKTLVAHGLYLSKDDIALLNQRDAFLVHNARSNMNNHVGYNHH +LSDIRNLALGTDGIGSDMFEEMKFAFFKHRDAGGPLWPDSFAKALANGNELMSRNFGAKF +GLLEAGYKADLTICDYNSPTPLLADNIAGHIAFGMGSGSVHSVMVNGVMVYEDRQFNFDC +DSIYAQARKAAASMWRRMDALA* +>test.0417.00002.0004i_00073 780 NA | NA | NA | ID=4_6;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.538 | NA +MIEQFFRPDSVEQALELKRRYQDEAVWFAGGSKLNATPTRTDKKIAISLQDLELDWIDWD 
+NGALRIGAMSRLQPLRDARFIPAALREALGFVYSRHVRNQSTIGGEIAARQEESVLLPVL +LALDAELVFGNGETLSIEDYLACPCDRLLTEIIIKDPYRTCATRKISRSQAGLTVVTAAV +AITDHDGMRIALDGVASKALRLHDVETQNLEGNALEQAVANAIFPQEDLRGSVAYKRYIT +GVLVADLYADCQQAGEEAV* +>test.0417.00002.0004i_00074 2871 NA | NA | NA | ID=4_7;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.527 | NA +MIIHFTLNGAPQELTVNPGENVQKLLFNMGMHSVRNSDDGFGFAGSDAIIFNGNIVNASL +LIAAQLEKADIRTAESLGKWNELSLVQQAMVDVGVVQSGYNDPAAALIITDLLDRIDAPT +REEIDDALSGLFSRDAGWQQYYQVIELAVARKNNPQATIDIAPTFRDDLEVIGKHYPKTD +AAKMVQAKPCYVEDRVTADACVIKMLRSPHAHALITHLDVSKAEALPGVVHVITHLNCPD +IYYTPGGQSAPEPSPLDRRMFGKKMRHVGDRVAAVVAENEDIALEALKLIDVEYEVLKPV +MSIDEAMAEDAPVVHDEPVVYVAGAPDTLEDDNSHAAQRGEHMIINFPIGSRPRKNIAAS +IHGHIGDMDKGFADADVIIERTYNSTQAQQCPTETHICFTRMDGDRLVIHASTQVPWHLR +RQVARLVGMKQHKVHVIKERVGGGFGSKQDILLEEVCAWATCVTGRPVLFRYTREEEFIA +NTSRHVAKVTVKLGAKKDGRLTAVKMDFRANTGPYGNHSLTVPCNGPALSLPLYPCDNVD +FQVTTYYSNICPNGAYQGYGAPKGNFAITMALAELAEQLQIDQLEIIERNRVHEGQELKI +LGAIGEGKAPTSVPSAASCALEEILRQGREMIQWSSPKPQNGDWHIGRGVAIIMQKSGIP +DIDQANCMIKLESDGTFIVHSGGADIGTGLDTVVTKLAAEVLHCPPQDVHVISGDTDHAL +FDKGAYASSGTCFSGNAARLAAENLREKILFHGAQMLGEPVADVQLATPGVVRGKKGEVS +FGEIAHKGETGTGFGSLVGTGSYITPDFAFPYGANFAEVAVNTRTGEIRLDKFYALLDCG +TPVNPELALGQIYGATLRAIGHSMSEEIIYDAEGHPLTRDLRSYGAPKIGDIPRDFRAVL +VPSDDKVGPFGAKSISEIGVNGAAPAIATAIHDACGIWLREWHFTPEKILTALEKI* +>test.0417.00002.0004i_00075 1401 NA | NA | NA | ID=4_8;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.490 | NA +MSDINHAGSDLIFELEDRPPFHQALVGAITHLLAIFVPMVTPALIVGAALQLSAETTAYL +VSMAMIASGIGTWLQVNRYGIVGSGLLSIQSVNFSFVTVMIALGSSMKSDGFHEELIMSS +LLGVSFVGAFLVVGSSFILPYLRRVITPTVSGIVVLMIGLSLIKVGIIDFGGGFAAKSSG +TFGNYEHLGVGLLVLIVVIGFNCCSSPLLRMGGIAIGLCVGYIASLCLGMVDFSSVRNLP +LITIPHPFKYGFSFSFHQFLVVGTIYLLSVLEAVGDITATAMVSRRPIQGEEYQSRLKGG +VLADGLVSVIASAVGSLPLTTFAQNNGVIQMTGVASRYVGRTIAVMLVILGLFPMIGGFF +TTIPSAVLGGAMTLMFSMIAIAGIRIIITNGLKRRETLIVATSLGLGLGVSYDPEIFKIL +PASIYVLVENPICAGGLTAILLNIILPGGYRQENVLPGITSAEEMD* +>test.0417.00002.0004i_00076 1317 NA | NA 
| NA | ID=4_9;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.483 | NA +MSGEHTLKAVRGSFIDVTRTVDNPEEIASALRFIEDGLLLIKQGKVEWFGEWEDGKHQIP +DTIRVRDYRGKLIVPGFVDTHIHYPQSEMVGAYGEQLLEWLNKHTFPTERRYEDLEYARE +MSAFFIKQLLRNGTTTALVFGTVHPQSVDALFEAASHINMRMIAGKVMMDRNAPDYLLDT +AESSYHQSKELIERWHKNGRLLYAITPRFAPTSSPEQMAMAQRLKEEYPDTWVHTHLCEN +KDEIAWVKLLYPDHDGYLDVYHQYGLTGKNCVFAHCVHLEEKEWDRLSETKSSIAFCPTS +NLYLGSGLFNLKKAWQKKVKVGMGTDIGAGTTFNMLQTLNEAYKVLQLQGYRLSAYEAFY +LATLGGAKSLGLDDLIGNFLPGKEADFVVMEPTATPLQQLRYDNSVSLVDKLFVMMTLGD +DRSIYRTYVDGRLVYERN* +>test.0417.00002.0004i_00077 1368 NA | NA | NA | ID=4_10;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531 | NA +MSGDILQTPDAPKPQGALDNYFKITARGSTVRQEVLAGLTTFLAMVYSVIVVPGMLGKAG +FPPAAVFVATCLVAGFGSLLMGLWANLPMAIGCAISLTAFTAFSLVLGQQISVPVALGAV +FLMGVIFTAISVTGVRTWILRNLPMGIAHGTGIGIGLFLLLIAANGVGMVIKNPIEGLPV +ALGAFTSFPVMMSLLGLAVIFGLEKCRVPGGILLVIIAISIIGLIFDPAVKYHGLVAMPS +LTGEDGKSLIFSLDIMGALQPTVLPSVLALVMTAVFDATGTIRAVAGQANLLDKDNQIIN +GGKALTSDSVSSIFSGLVGAAPAAVYIESAAGTAAGGKTGLTATVVGVLFLMILFLSPLS +FLIPGYATAPALMYVGLLMLSNVSKLDFNDFIDAMAGLVCAVFIVLTCNIVTGIMLGFVT +LVVGRVFAREWQKLNIGTVIITAALVAFYAGGWAI* +>test.0417.00002.0004i_00078 489 NA | NA | NA | ID=4_11;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.554 | NA +MKSLIIVNPADCIGCRTCEVACVVAHPSEQELNADIFLPRLKVQRLDSISAPVMCHQCEN +APCVGACPVGALTMGEQVVQANSARCIGCQSCVSACPFGMITIQSLPGDPRQQIVKCDLC +ELREEGPACVESCPTQALQLLTERELRRIRQQRIAASSENPL* +>test.0417.00002.0004i_00079 1920 NA | NA | NA | ID=4_12;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.528 | NA +MNKFIAAEAAECIGCHACEIACAVAHNQENWPLSHSDFRPRIHVVGKGQAANPVACHHCN +NAPCVTACPVNALTFQSDSVQLDEQKCIGCKRCAIACPFGVVEMVDTIAQKCDLCNQRSS +GTQACIDVCPTQALRLMDDKGLQQIKVARQRKTAAGKASSDAQPSRSAALLPVNSRKGAD +KISASERKTHFGEIYCGLDPQQATYESDRCVYCAEKANCNWHCPLHNAIPDYIRLVQEGK +IIEAAELCHQTSSLPEICGRVCPQDRLCEGACTLKDHSGAVSIGNLERYITDTALAMGWR +PDVSKVVPRSEKVAVIGAGPAGLGCADILARAGVQVDVFDRHPEIGGMLTFGIPPFKLDK 
+TVLSQRREIFTAMGIDFHLNCEIGRDISFNELTAEYDAVFLGVGTYGMMRADLPHEDAPG +VIQALPFLTAHTRQLMGLPESAEYPLTDVEGKRVVVLGGGDTTMDCLRTSIRLNAASVTC +AYRRDEVSMPGSRKEVVNAREEGVEFQFNVQPQYIACDEDGRLTAVGLIRTAMGEPGPDG +RRRPRPVAGSEFELPADVLIMAFGFQAHTMPWLQGSGIKLDKWGLIQTGDVGYLPTQTHL +KKVFAGGDAVHGADLVVTAMAAGRQAARDMLTLFDTKAS* +>test.0417.00002.0004i_00080 1449 NA | NA | NA | ID=4_13;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.500 | NA +MSAIDSQLPSSSGQDRPTDEVDRILSPGKLIILGLQHVLVMYAGAVAVPLMIGDRLGLSK +EAIAMLISSDLFCCGIVTLLQCIGIGRFMGIRLPVIMSVTFAAVTPMIAIGMNPDIGLLG +IFGATIAAGFITTLLAPLIGRLMPLFPPLVTGVVITSIGLSIIQVGIDWAAGGKGNPQYG +NPVYLGISFAVLIFILLITRYAKGFMSNVAVLLGIVFGFLLSWMMNEVNLSGLHDASWFA +IVTPMSFGMPIFDPVSILTMTAVLIIVFIESMGMFLALGEIVGRKLSSQDIIRGLRVDGV +GTMIGGTFNSFPHTSFSQNVGLVSVTRVHSRWVCIASGIILILFGMVPKMAVLVASIPQF +VLGGAGLVMFGMVLATGIRILSRCNYTTNRYNLYIVAISLGVGMTPTLSHDFFSKLPAVL +QPLLHSGIMLATLSAVVLNVFFNGYQHHADLVKESVSDKDLKVRTVRMWLLMRKLKKNEH +GE* +>test.0417.00002.0004i_00081 126 NA | NA | NA | ID=4_14;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.357 | NA +MNLLMRAIFSLLLLFTLSIPVISDCVAMAIESRFKYMMLLF* +>test.0417.00002.0004i_00082 549 NA | NA | NA | ID=4_15;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506 | NA +MQTEHVILLNAQGVPTGTLEKYAAHTADTLLHLAFSSWLFNAKGQLLVTRRALSKKAWPG +VWTNSVCGHPQPGESNEEAVIRRCRYELGVEITPPESIYPDFRYRATDPNGIVENEVCPV +FAARTTSALQINDDEVMDYQWCDLAAVLRGIDATPWAFSPWMVMQATNREARKRLSAFTQ +LK* +>test.0417.00002.0004i_00083 1518 NA | NA | NA | ID=4_16;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529 | NA +MSEQHAQGADAVVDLNNELKTRREKLANLREQGIAFPNDFRRDHTSDQLHAEFDGKENEE +LEALNIEVAVAGRMMTRRIMGKASFVTLQDVGGRIQLYVARDDLPEGVYNEQFKKWDLGD +ILGAKGKLFKTKTGELSIHCTELRLLTKALRPLPDKFHGLQDQEARYRQRYLDLISNDES +RNTFKVRSQILSGIRQFMVNRGFMEVETPMMQVIPGGAAARPFITHHNALDLDMYLRIAP +ELYLKRLVVGGFERVFEINRNFRNEGISVRHNPEFTMMELYMAYADYKDLIELTESLFRT +LAQDILGKTEVTYGDVTLDFGKPFEKLTMREAIKKYRPETDMADLDNFDSAKAIAESIGI 
+HVEKSWGLGRIVTEIFEEVAEAHLIQPTFITEYPAEVSPLARRNDVNPEITDRFEFFIGG +REIGNGFSELNDAEDQAQRFLDQVAAKDAGDDEAMFYDEDYVTALEHGLPPTAGLGIGID +RMVMLFTNSHTIRDVILFPAMRPVK* +>test.0417.00002.0004i_00084 882 NA | NA | NA | ID=4_17;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.533 | NA +MKQGLEDVSGLLELAVEADDEETFNEAVAELDALEEKLAQLEFRRMFSGEYDSADCYLDI +QAGSGGTEAQDWASMLERMYLRWAESRGFKTEIIEESEGEVAGIKSVTIKISGDYAYGWL +RTETGVHRLVRKSPFDSGGRRHTSFSSAFVYPEVDDDIDIEINPADLRIDVYRASGAGGQ +HVNRTESAVRITHIPTGIVTQCQNDRSQHKNKDQAMKQMKAKLYELEMQKKNAEKQAMED +NKSDIGWGSQIRSYVLDDSRIKDLRTGVETRNTQAVLDGSLDQFIEASLKAGL* +>test.0417.00002.0004i_00085 1734 NA | NA | NA | ID=4_18;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.565 | NA +MKQQIQLRRREVDETADLPAELPPLLRRLYASRGVRSAQELERSVKGMLPWQQLSGVEKA +VEILYNAFREGTRIIVVGDFDADGATSTALSVLAMRSLGCSNIDYLVPNRFEDGYGLSPE +VVDQAHARGAQLIVTVDNGISSHAGVEHARSLGIPVIVTDHHLPGDTLPAAEAIINPNLR +DCNFPSKSLAGVGVAFYLMLALRTFLRDQGWFDERGIAIPNLAELLDLVALGTVADVVPL +DANNRILTWQGMSRIRAGKCRPGIKALLEVANRDPQKLAASDLGFALGPRLNAAGRLDDM +SVGVALLLCDNIGEARVLANELDALNQTRKEIEQGMQVEALTLCEKLERSRDTLPGGLAM +YHPEWHQGVVGILASRIKERFHRPVIAFAPAGDGTLKGSGRSIQGLHMRDALERLDTLYP +GMMLKFGGHAMAAGLSLEEEKFELFQQRFGELVTEWLDPSLLQGEVVSDGPLSAAEMTME +VAQLLRDAGPWGQMFPEPLFDGHFRLLQQRLVGERHLKVMVEPVGGGPLLDGIAFNVDTA +LWPDNGVREVQLAYKLDINEFRGNRSLQIIIDNIWPI* +>test.0417.00002.0004i_00086 711 NA | NA | NA | ID=4_19;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.482 | NA +MKKGFMLFTLLAAFSGFVQADDAAIQQTLAKMGIKSSDIQPAPVAGMKTVLTNSGVLYIT +DDGKHIIQGPMYDVSGTAPVNVTNKMLLKQLNALEKEMIVYKAPQEKHVITVFTDITCGY +CHKLHEQMADYNALGITVRYLAFPRQGLDSDAEKEMKAIWCAKDKNKAFDDVMAGKSVAP +ASCDVDIADHYALGVQLGVSGTPAVVLSNGTLVPGYQPPKDMKEFLDEHQKMTSGK* +>test.0417.00002.0004i_00087 897 NA | NA | NA | ID=4_20;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.530 | NA +MKQDLARIEQFLDALWLEKNLAENTLNAYRRDLSMMVEWLHHRGLTLATAQSDDLQALLA +ERLEGGYKATSSARLLSAVRRLFQYLYREKFREDDPSAHLASPKLPQRLPKDLSEAQVER 
+LLQAPLIDQPLELRDKAMLEVLYATGLRVSELVGLTMSDISLRQGVVRVIGKGNKERLVP +LGEEAVYWLETYLEHGRPWLLNGVSIDVLFPSQRAQQMTRQTFWHRIKHYAVLAGIDSEK +LSPHVLRHAFATHLLNHGADLRVVQMLLGHSDLSTTQIYTHVATERLRQLHQQHHPRA* +>test.0417.00002.0004i_00088 522 NA | NA | NA | ID=4_21;partial=00;start_type=ATG;rbs_motif=AGxAG;rbs_spacer=5-10bp;gc_cont=0.517 | NA +MNMGLFYGSSTCYTEMAAEKIRDIIGPELVTLHNLKDDSPKLMEQYDVLILGIPTWDFGE +IQEDWEAVWDQLDDLNLEGKIVALYGLGDQLGYGEWFLDALGMLHDKLSTKGVKFVGYWP +TEGYEFTSPKPVIADGQLFVGLALDETNQYDLSDERIQSWCEQILNEMAEHYA* +>test.0417.00002.0004i_00089 408 NA | NA | NA | ID=4_22;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539 | NA +MVLWQSDLRVSWRAQWLSLLIHGLVAAVILLMPWPLSYTPLWMVLLSLVVFDCVRSQRRI +NARQGEIRLLMDGRLRWQGQEWSIVKAPWMIKSGMMLRLRSDSGKRQHLWLAADSMDEAE +WRDLRRILLQQETQR* +>test.0417.00002.0004i_00090 267 NA | NA | NA | ID=4_23;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.491 | NA +MDINNKARIHWACRRGMRELDISIMPFFEHEYDSLSDDEKRIFIRLLECDDPDLFNWLMN +HGKPADAELEMMVRLIQTRNRERGPVAI* +>test.0417.00002.0004i_00091 981 NA | NA | NA | ID=4_24;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.539 | NA +MAFTPFPPRQPTASARLPLTLMTLDDWALATITGADSEKYMQGQVTADVSQMTEDQHLLA +AHCDAKGKMWSNLRLFRDGDGFAWIERRSVREPQLTELKKYAVFSKVTIAPDDERVLLGV +AGFQARAALANLFSELPSKEKQVVKEGATTLLWFEHPAERFLIVTDEATANMLTDKLRGE +AELNNSQQWLALNIEAGFPVIDAANSGQFIPQATNLQALGGISFKKGCYTGQEMVARAKF +RGANKRALWLLKGSASRLPEAGEDLELKMGENWRRTGTVLAAVKLEDGQVVVQVVMNNDM +EPDSIFRVRDDANTLRIEPLPYSLEE* +>test.0417.00002.0004i_00092 660 NA | NA | NA | ID=4_25;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.518 | NA +MVQKPLIKQGYSLAEEIANSVSHGIGLVFGIVGLVLLLVQAVDLNASATAITSYSLYGGS +MILLFLASTLYHAIPHQRAKMWLKKFDHCAIYLLIAGTYTPFLLVGLDSPLARGLMIVIW +SLALLGILFKLTIAHRFKILSLVTYLAMGWLSLVVIYEMAVKLAAGSVTLLAVGGVVYSL +GVIFYVCKRIPYNHAIWHGFVLGGSVCHFLAIYLYIGQA* +>test.0417.00002.0004i_00093 312 NA | NA | NA | ID=4_26;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.455 | NA 
+MQPNDITFFQRFQDDILAGRKTITIRDESESHFKTGDVLRVGRFEDDGYFCTIEVTATST +VTLDTLTEKHAEQENMTLTELKKVIADIYPDQTQFYVIEFKCL* +>test.0417.00002.0004b_00094 420 NA | NA | NA | ID=4_27;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.500 | NA +MKKLTLPKDFLWGGAVAAHQVEGGWNKGGKGPSICDVLTGGAHGVPREITKEVVPGKYYP +NHEAVDFYGHYKEDIKLFAEMGFKCFRTSIAWTRIFPKGDEAQPNEEGLKFYDDMIDELL +KYNIEPVITLSHFEMPLHLV +>test.0417.00002.0005b_00095 1011 NA | NA | NA | ID=5_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.515 | NA +QYGSWTNRKVVDFFVRFAEVVFERYKHKVKYWMTFNEINNQRNWRAPLFGYCCSGVVYTE +HENPEETMYQVLHHQFVASALAVKAAHRINPEMKVGCMLAMVPLYPYSCNPDDVMFAQES +MRERYVFTDVQLRGYYPSYVLNEWERRGFNIKMEDGDLDVLREGTCDYLGFSYYMTNAVK +AEGGTGDAISGFEGSVPNPYVKASDWGWQIDPVGLRYALCELYERYQKPLFIVENGFGAY +DKVEDDGSINDDYRIDYLRAHIEEMKKAVTYDGVDLMGYTPWGCIDCVSFTTGQYSKRYG +FIYVNKHDDGTGDMSRSRKKSFNWYKEVIASNGENL* +>test.0417.00002.0005i_00096 2874 NA | NA | NA | ID=5_2;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.554 | NA +MTQTLSQLENSGAFIERHIGPDAAQQQEMLNAVGAQSLNALTGQIVPKDIQLATPPQVGA +PATEYAALAELKAIASRNKRFTSYIGMGYTAVQLPPVILRNMLENPGWYTAYTPYQPEVS +QGRLEALLNFQQVTLDLTGLDMASASLLDEATAAAEAMAMAKRVSKLKNANRFFVASDVH +PQTLDVVRTRAETFGFEVIVDDAQKVLDHQDVFGVLLQQVGTTGEIHDYTALISELKSRK +IVVSVAADIMALVLLTAPGKQGADIVFGSAQRFGVPMGYGGPHAAFFAAKDEYKRSMPGR +IIGVSKDAAGNTALRMAMQTREQHIRREKANSNICTSQVLLANIASLYAVYHGPVGLKRI +ANRIHRLTDILAAGLQQKGLKLRHAHYFDTLCVEVADKAGVLARAEAAEINLRSDILNAV +GITLDETTTRENVMQLFSVLLGDNHGLDIDTLDKDVAHDSRSIQAAMLRDDEILTHPVFN +RYHSETEMMRYMHSLERKDLALNQAMIPLGSCTMKLNAAAEMIPITWPEFAELHPFCPPE +QAEGYQQMIAQLADWLVKLTGYDAVCMQPNSGAQGEYAGLLAIRHYHESRNEGHRDICLI +PASAHGTNPASAHMAGMQVVVVACDKNGNIDLTDLRAKAEQAGDNLSCIMVTYPSTHGVY +EETIREVCEVVHQFGGQVYLDGANMNAQVGITSPGFIGADVSHLNLHKTFCIPHGGGGPG +MGPIGVKAHLAPFVPGHSVVQIEGMLTRQGAVSAAPFGSASILPISWMYIRMMGAEGLKK +ASQVAILNANYIASRLQDAFPVLYTGRDGRVAHECILDIRPLKEETGISELDIAKRLIDY +GFHAPTMSFPVAGTLMVEPTESESKVELDRFIDAMLAIRAEIDQVKAGVWPLEDNPLVNA 
+PHIQSELVAEWAHPYSREVAVFPAGVADKYWPTVKRLDDVYGDRNLFCSCVPISEYQ* +>test.0417.00002.0005i_00097 390 NA | NA | NA | ID=5_3;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA +MSNIPAELKYSKEHEWLRKEADGTYTVGITEHAQELLGDMVFIDLPEVGATVSAGDDCAV +AESVKAASDIYAPVSGEIVAVNDALSDFPELVNSEPYAGGWIFKIKASDESELESLLDAT +AYEALLEDE* +>test.0417.00002.0005i_00098 1164 NA | NA | NA | ID=5_4;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.536 | NA +MLGFVVIISPWKSCQPRLFNEDKMAQQTPLYEQHTLCGARMVDFHGWMMPLHYGSQIDEH +HAVRTDAGMFDVSHMTIVDLRGSRTREFLRYLLANDVAKLTKSGKALYSGMLNASGGVID +DLIVYYFTEDFFRLVVNSATREKDLSWITQHAEPFGIEITVRDDLSMIAVQGPNAQAKAA +TLFNDAQRQAVEGMKPFFGVQAGDLFIATTGYTGEAGYEIALPNEKAADFWRALVEAGVK +PCGLGARDTLRLEAGMNLYSQEMDETISPLAANMGWTIAWEPADRDFIGREALEAQREHG +TEKLVGLVMTEKGVLRNELPVRFTDAQGNQHEGIITSGTFSPTLGYSIALARVPEGIGET +AIVQIRNREMPVKVTKPVFVRNGKAVA* +>test.0417.00002.0005b_00099 156 NA | NA | NA | ID=5_5;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.231 | NA +FLMPRIFDLVFFDIFLVLNVVLFKLTFSSIYLYIEICSFFGFLFCYDFGVF* diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test_runprokka_H299.prt b/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test_runprokka_H299.prt new file mode 100644 index 0000000000000000000000000000000000000000..4a4f994fab5f5e6e2a44d848f1f4a4622bdb4e00 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Proteins/test_runprokka_H299.prt @@ -0,0 +1,100 @@ +>test_runprokka_H299.0001b_00001 138 NA | NA | NA | ID=1_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.580 | NA +MGKGSSKGHTPREAKDNLKSTQLLSVIDAISEGPVEGPVDGLKSVL +>test_runprokka_H299.0001i_00002 543 NA | NA | NA | ID=1_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.562 | NA +MKTGSEAIRALAMQIPAFRQKLSDGWYQVRIAGRDAGETELSARLNEPLENGAVIHIVPR +LAGAKSGGVFQAVLGAAVMAVAIWMPGVGIMASNLLFSLGASMTLGGVAQMLAPKPKTPR +TQTTDNGKQNTYFSSLDNMVAQGNVLPVLYGEMRVGSRVVSQEISTADEGDGGQVVVIGR +* 
+>test_runprokka_H299.0001i_00003 600 NA | NA | NA | ID=1_3;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.593 | NA +MSPEDWLSAEMQREIVALVHSHPGGLPWLSEADRRLQVQSDLPWWLVCRGAIHKFRCVPH +LTGRRFEHGVTDCYTLFRDAYHLAGIEMPDFHRGDDWWRNGQNLYLDNLEATGLYQVPLS +AAQPGDVLLCCFGSSVPNHAAIYCGDSELLHHIPEQLSKRERYTDKWQRRTHSLWRHRAW +HASAFTGIYNDLAAASTFE* +>test_runprokka_H299.0001i_00004 699 NA | NA | NA | ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.558 | NA +MQDIQQETLNECIRAEQSASVVLWEIDLTEVGGDRYFFCNEQNEKGESVTWQSRQYQAYP +IQGSGFEMNGKGSAARPTLTVSNLHGMITGMAEDLQSLVGGTVVRRKVYARFLDAVNFVN +GNSEADPEQEVISRWRIEQCSELSAVSASFVLSTPTETDGAVFPGRIMLANTCTWTYRGD +ECGYSGPAVADEYDQPTSDITKDKCSKCLSGCKFRNNVGNFGSFLSINKLSQ* +>test_runprokka_H299.0001i_00005 297 NA | NA | NA | ID=1_5;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.404 | NA +MKTENKPSIKTVRFGDGYEQRSPNGLNHSLRVFTCDFKVEANERDSFEKFLARHEGYKSF +FWRPPGINRKIRVVCRTWSATEHITYTDFSCQFDEVVI* +>test_runprokka_H299.0001b_00006 963 NA | NA | NA | ID=1_6;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.442 | NA +AEITAWRDSLQASIDNRQQGYDIQIAGYGVGDKNQQRQQELLRIEHGYNNQRLQLERDYA +DKSRGMSDHVFQEKMQALNDALEREKEIVRQKNEQLDIQAGDWVSGASQGFNNWLDDTKD +ISEQIKSTTTQMFDGMTDALGDFVTTGKANFRSFATSVISDLSRIALKASITGIFDSISN +SSSGGILGTIGSAISKFIPNAKGGVYESPSLSTYSNGIYDSPQFFAFAKGAGVFGEAGPE +AIMPLTRTSDGSLGVRAINSKSGNGGGDITYAPVYQITIQNDGQNGEIGPQAIKALMGMV +DQRVQGNLLNMRRDGGMLSG* +>test_runprokka_H299.0002b_00007 138 NA | NA | NA | ID=2_1;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.572 | NA +MGKGSSKGHTPREAKDNLKSTQLLSVIDAISEGPVEGPVDGLKSVL +>test_runprokka_H299.0002i_00008 543 NA | NA | NA | ID=2_2;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.547 | NA +MKTGAEAIRALATQLPAFRQKLSDGWYQVRIAGRDTGETELSARLNEPLANGAVIHIVPR +LAGAKSGGVFQAVLGAAVMAVAIWMPGVGIMASNLLFSLGASMTLGGVAQMLAPKPKTPS +TQTTDNGKQNTYFSSLDNMVAQGNVLPVLYGEMRVGSRVVSQEISTADEGDGGQVVVIGR +* +>test_runprokka_H299.0002i_00009 744 NA | 
NA | NA | ID=2_3;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.594 | NA +MTETESAILAHARRCAPAESCGFVVRTPEGERYFPCVNISGEPEAYFRMSPEDWLRAEMQ +GEIVALVHSHPGGLPWLSEADRRLQVQSDLPWWLVCRGTIHKFRCVPHLTGRRFEHGVTD +CYTLFRDAYHLAGIEMPDFHREDDWWRHGQNLYLDNLEATGLYQVPLSSAQPGDVLLCCF +GSSVPNHAAIYCGDGELLHHIPEQLSKRERYTDKWQRRTHSLWRHRAWRASAFTGIYNDL +VAASTFV* +>test_runprokka_H299.0002i_00010 699 NA | NA | NA | ID=2_4;partial=00;start_type=ATG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.557 | NA +MQDIRQETLNECTRAEQSASVVLWEIDLTEVGGERYFFCNEQNEKGEPVTWQGRQYQPYP +IQGSGFELNGKGTSTRPTLTVSNLYGMVTGMAEDMQSLVGGTVVRRKVYARFLDAVNFVN +GNSDADPEQEVISRWRIEQCSELSAVSASFVLSTPTETDGAVFPGRIMLANTCTWTYRGD +ECGYHGPAVADEYDQPTSDITKDKCSKCLNGCKFRNNVGNFGGFLSINKLSQ* +>test_runprokka_H299.0002i_00011 330 NA | NA | NA | ID=2_5;partial=00;start_type=ATG;rbs_motif=GGAGG;rbs_spacer=5-10bp;gc_cont=0.567 | NA +MKTFRWKVKPGMDVASAPSVRKVRFGDGYSQRAPAGLNANLKTYSVTLSVPRWEATVLES +FLEEHGGWKAFLWTPPYEWRQIKVTCAKWSSRVSMLRVEFSAEFEQVVN* +>test_runprokka_H299.0002i_00012 2580 NA | NA | NA | ID=2_6;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.592 | NA +MAEPVGDLVVDLSLDAARFDEQMARVRRHFSGTESDAKKTAAVVEQSMSRQALAAQKAGI +SVGQYKAAMRMLPAQFTDVATQLAGGQSPWLILLQQGGQVKDSFGGMIPMFRGLAGAITL +PMVGATSLAVATGALAYAWYQGNSTLSDFNKTLVLSGNQAGLTADRMLVLSRAGQAAGLT +FNQTSESLTALVNAGVRGGEQFEAISQSVARFSSASGVEVDKVAEAFGKLTTDPTSGLTA +MARQFHNVTAEQIAYVAQLQRSGDEAGALQAANEAATKGFDDQTRRLKENMGTLETWADR +TARAFKSMWDSVLDIGRPDTAQGMLEKAEKAFDEADKKWQWYQSRSHRRGKTSAFLANLR +GAWEDRANAQLGLSAATLQADLEKAREMAAKDWAESEASRLKYTEEAQKAYERLQTPLEK +YTARQEELNKALKDGKILQADYNTLMAAAKKDYEATLKKPKQSGVKVSAGDRQEDSAHAA +LLTLQAELRTLEKHAGANEKISQQRRDLWKAESQFAVLEEAAQRRQLSAQEKSLLAHKDE +TLEYKRQLAALGDKVTYQERLNALAQQADKFAQQQRAKRAAIDAKSRGLTDRQAEREATE +QRLKERYGDNPLALNNVMSEQKKTWAAEDQLRGSWMAGLKSGWSEWEESATDSMSQVKSA +ATQTFDGIAQNMAAMLTGSEQNWRSFTRSVLSMMTEILLKQAMVGIVGSIGSAIGGAVGG +GASASGGTAIQAAAAKFHFATGGFTGTGGKYEPAGIVHRGEFVFTKEATSRIGVGNLYRL +MRGYATGGYVGTPGSMADSRSQASGTFEQNNHVVINNDGTNGQIGPQALKAVYDVARKAA 
+MDVVTGQMRDGGLFSGGGR* +>test_runprokka_H299.0002i_00013 435 NA | NA | NA | ID=2_7;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.559 | NA +MFDGELSFALKLAREMGRPDWRAMLAGMSSTEYADWHRFYSTHYFHDVLLDMHFSGLTYT +VLSLFFSDPDMHPLDFSLLNRREADEEPEDDVLMQKAAGLAGGVRFGPDGNEVIPASPDV +ADMTEDDVMLMTVSEGIAGGVRYG* +>test_runprokka_H299.0002i_00014 423 NA | NA | NA | ID=2_8;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515 | NA +MFLKTESFEHNGVTVTLSELSALQRIEHLAWLKEQEKKAESSGNLQVSVEDLIRGGAFLV +AMSLWHNHPQKTKLPSMNEAVKQIEQEVLTTWPTEAIAQAENVVLRLSGMSEFVVNNAPE +QADDAGPAEPVSAGKCSTVS* +>test_runprokka_H299.0002i_00015 741 NA | NA | NA | ID=2_9;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.583 | NA +MPVPNPTMPVKGAGTTLLVYKGSGDPYANPLSDVDWSRLAKVKDLTPGELTAESYDDSYL +DDEDADWAATGQGQKSAGDTSFTLAWMPGEQGQQALLAWFNEGDTRAYKIRFPNGTVDVF +RGWVSSIGKAVTAKEVITRTVKVTNVGRPSMAEDRSTVTAATGMTVTPASTSVVKGRSTT +LTVAFQPEGATDKSFRAVSADKTKATVSVSGMTITVKGVAAGKVNIPVVSGNGELAAVAE +INVTNS* +>test_runprokka_H299.0002b_00016 393 NA | NA | NA | ID=2_10;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.539 | NA +KHTELRAAVLDALEKHDTGATLFDGRPAVFDEEDFPAIAVYLTGAEYTGEELDSDTWQAE +LHIEVFLPAQVPDSELDSWMESRIYPVMSDIPALSDLITSMVASGYDYRRDDDAGLWSSA +DLTYVITYEM* +>test_runprokka_H299.0003b_00017 870 NA | NA | NA | ID=3_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.303 | NA +IIQSFVNICLTRYQAENRVKIFVAINIIYTLAYFFGVLYSLFIDHWDNVWKNIILFYVLT +TITMFFFYFIRKGKVVKLFFFHYISKNKVYETFIFGLYQLPHVLSSWVRLGYDRLVLGEL +ISMSYVGGYSVAVQISLVSSVIFQSLNRFWTPFFIKKLKENSKQKKIIVLGGFGIICITI +LNILFGYAYFIFFLPTNYSSFSNALPILCMAYMFQGLYFLIVNYIYYHDGNKLISIPSVA +SIAIHIAVAPVLIKHMGYYGAAISLLISWIVLFLFTCVIIFYVRRGYRG* +>test_runprokka_H299.0003i_00018 933 NA | NA | NA | ID=3_2;partial=00;start_type=GTG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.309 | NA +MGNIFIVESPFQLSNALLYHKKNDSVIVRLNGENKNDFQIEKMLSSFNGKVYIKKASKES +KFDLIRFVLFFAVPVLIANLNKKVIIGNYNSLWMRVMGYLFNPFHFAVLDDGLITIRTIK 
+RLDDNISRSGSIKKRFLLLLAPRFITQYKIYSNFIQIYNQEINKRKRTTRAIKAGRVCFI +GSPLFDKNVLTFDFYVKCLAAISDNLKRCGYSIEYYPHRSEKNISYLNVFFDDVIKSDDS +IEVYYSASNELPEIFVSFYSSALLNLRSDYPECKFISYKLDCNEINGKFRYEIMEAYNFL +AFSGIEVVTI* +>test_runprokka_H299.0003b_00019 693 NA | NA | NA | ID=3_3;partial=01;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.289 | NA +MLTYSVVNWKAKLLYFILFLSFLNAVLRLSEDGLSIYRLFIPLQIFLIYTLSVTEFKKFI +VILLLLLLFGATGCMISTYSLNENNLVFLIHYSILILTFFSSSVLISITGETCFYKFTAF +FFGFLIVTGIMDLFGVTFPNIEHIPDAIRGIHRIENDYSLALVSFVFVVFSISRKKITAS +ILTFFTSAICFYNDSKVALLFVVAGYFCFIFKNIRFRQKEFRWILFLFVIM diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test.0417.00002.fna b/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test.0417.00002.fna new file mode 100644 index 0000000000000000000000000000000000000000..6ffef978095cbd9caa8970fe901231a92e625ee2 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test.0417.00002.fna @@ -0,0 +1,10 @@ +>test.0417.00002.0001 9603 
+TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTTAAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGAGGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCATTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATAATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTTCCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGCTAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAAAGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAGCGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAACGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACAGGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGACCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAAAGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAACGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAATGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTGAGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCATTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGCGCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGGTTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTAAACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTGGTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGGATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTGGTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCTCATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATATTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCTTCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACCGCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGATTAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCAGCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACGCCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGCAGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATCTCGGCACCGGCAATCAGGTCAAAATTCCGTCCGAAGTGATGATCCCGGAAACCCGCGAATTTGAATTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGAATCGCGATTACGCCTGCTTCTTCTCGGCGAACTC
TGCCCAGAAACCGGCGTTGTACGATACCGCTGACGCCACCGCCAACAGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATTACCTGAAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAACTGGAGCTGAATACCTGGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAACTTCAGGCTTCGCATCCACTGCGCGACGGGAAAGTTATCGTCGAGGACATAGAGGACAATCCGGGCTTCTTCCGCGTCAGACTCTTTGCCGTGCCGCATTTCCAGATTGAAGGGATGGATATCAACCTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGATCGGGCGGTGGTGTGATGTATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTTCAGCAGCAGGCCCGCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGCCATCCGTGGGGGATCGCAAACGTGCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTGAAAACGCAGGCAGTACGCCTGCGTTTTGCTGATGGCACGCTGATCGATTCAGACGTGAGTGACGTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACGACAGCGCGATTGTTTTGCTGGCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCAGACTGAAAGACCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGTGAAGATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAGGATTACATCACCTGCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAGGATGAGAGCTATATTCCGCCGTTACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGTCTGGACACATTGCTGTTGCAGCTACGGGCGAAGTGCCAGCGTCTGATGGCGATGCGCCGGGAAAGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCTCCCTGTTCTGGCTGCTTAACGCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGCTGTCCACCCCGAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTTGAGCATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCGCCCCTGTTCTCCCTGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCGCTGGATCTGGCGTCCCTGCCGGGCAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTGCGGGAAGAGGCCGATTTTTATCTGTCCGTTCGTTCCTCACTGCCTGCGCATCAGGTACTGCATCAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATGTCACGCTGCTTATCAACGTGGCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCTGCCGCTGCGGCTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTGGAGTCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTGTTTGCGGTGCTGCGCACATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCGACACGTTTCTGACGGTGGTGGAACTGCGTCAGGGAACCACCGTGCGTCACGGTATCGAGCTGTATCGCCACTGTCAGCGGCAGGTGGAACTGGTCCGCGAACGTCTGAAAGATGCCGGATTCAGTCGGGAGAACGTGGAGCACATAACTTACGCGCAGTGCGCCCTGCTGGACGAAACGGTGCTCAGCCGTAGTGGCATGGACGACGGTCAGGCCATCT
GGATGAAAAACCCACTCCAGTCGCATTTCTTCAACACCCTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGCTACAGGAACCCGCCCCCGCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGGGATTTCGCGGGCGTTATCAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGCTCAACGGGCAGGTCGCGCCATTTGGTGTGCTGCCGGAAACGGCGGTACTGAACGTGCCGTTATCCACCCGTCAGCACCCTTTGCTGCATTCGCCATTTTTCTGGCTGGTAACACTGGCGCTGCTACTGGCGGGCGTCTGGTGGGGGCTACACCACTGGCTGAACGTGCTGGTGGATGAACTGCTGCCGCAAAGCCTGCGTTAAAGGGAGTCGTGAGTGAGGAACACGCTGAAACAGGCCATCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTGTGGTCAGTGTTTATCAGTCCGTCTGGCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTTCTGGCGGTTGCTGCGTTGTTGATTTATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGCGATGCCGGGTTGTCATCGCTGCCGCCGGAAACCTACCGGCAGCCGGTAGTGCTGGTCTGCGGCGGTCTGTCGGCGCACCTGTTCACTGACAGCCCGGTCCGGCAGGTTTCAGAAGGGCTGTATCTGCATGTTCCTGATGAAGAACAGCTTGTGGCGCAGGTGGAGCGATTGCTGACCCTTCGCCCGGCGTGGGCATCGCAGCTTGCCGTGGCGTATACCGTCATGCCCGGCATACACCGGGATGTGGCGGTTCTGGCCGGACGGCTGCGACGGTTTGCCCACAGTATGGCGACGGTGCGTCGCCGGGCGGGCGTAAACGTCCCCTGGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTGCCGGAAAGAGCGAGTTCACCGTGGTTTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACATCCACAGAGACCACCATGCCCGCGCAGTGGATTGCACAATCCGGCGTACAGGAGCGCAGTCAGCGACTCTGTTACCTGCTGAAAGCTGAAAGCCTGATGCAGTGGCTGAATCTTAATGTGCTGACGGCACTGAACGGCCCGGAGGCGAAATGCCCGCCACTGGCGATGGCCGTGGGGCTGGTCACCTCGTTGCCAGCGGTGGATAACAACCTGTGGCAAGTGTGGATCACCGCCAGAACCGGCCTGACGACGGATATCGCGGACACCGGCACAGACGCCACGCTGCCGTTTCCGGATGCTCTGTTACGGCAGTTGCCGCGTCAGTCGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACCATGCTGGGCATTACCACCGCGGCGGGTATCACCATGTTGTGCCTGTCAGCCACGGCAAATCGCCAGTTATTACGGCAGGTCGGTGACGATCTGCACCGGTTTTATGCCGTCCCGGTGGAGGAATTTATCACCAAAGCCCGTCACCTGTCGGTGCTGAAAGACAATGCGACCATGCTCGATGGGTATTACCGGGAAGGAGAACCACTGCGCCTCGGTCTGGGGTTATACCCCGGCGAACGCATCCGCCAGCCGGTATTACGCGCCATTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAGGTGACGGCTTCGCTTCAGGTTCAGACCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTCGGACAGGCCCGCCTGAAAGACGGCTCGACAAAAGTGCTGGTGGATGCGCTGGTGAACATCCGGGCAAAACCGGGCTGGCTGATCCTCGTGGCCGGATATACCGACGCCACCGGCGATGAAAAAAGCAATCAGCAGTTATCGCTGCGGCGTGCCGAAGCGGTGCGCAACTGGATGCTGCAGACCAGCGACATCCCGGCCACCTGTTTTGCCGTACAGGGACTGGGCGAGAGCCAGCCTGCGGCGACCAACGACACGCCACAGGGC
CGGGCAGTCAACCGGCGTGTCGAAATCAGTCTTGTTCCGCGTTCTGACGCCTGTCAGGACGTGAAATAAAACATACCGCCGGAAGAAGGCGGTGCTTCAATCACACTAACAAGGAGAGTAATTCTCATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAGGTTCCGTGGACGTTCAGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATGTGTACATCCCGACCGACAATAACACCGGCAAACTGACCGGTACCCGTACTCACAAGCCCTTTACGTTTACCAAAGAAATCGATGCCTCCAGCCCGTATCTCTACAAAGCTGTGACCACCGGACAGACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACGATGCCGGTCAGGAAGTGGAGTACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCTTATGCACGACATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCTACGAGAAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATGAGCGTCCTTCCGCCTGATAACTGCGGCAGACAGGAAACTGTCTGCCTTTTTGTTGTGTGCTTTGTCCAGTGCCGCAGGCACCGGTACTGAGCAAAGCATACCCACAATCTGGTGAAACCTGATGGGCCTGAGTGAGGTAACGGCTATGGGCGGTAGCGTGCCTGAACGCGGATCGCAGGAATACAGAACACGATAAGGAACCCTTCTATGACAGGAAATCACTCCGCCGCGCTGCTGCGTCGCCTTAACCCATACTGTGCACGGGCGCTGGACGCTGCCGCCTCACTGTGTCAGACCCGCGCCCATGCGGAAATAACCATTGAACACTGGCTGCTGAAACTGCTGGAGCAGGGAGAAGGCGATATCACGGTGATTGCCCGCCGCTATGAATGGGATATCGACACGCTCTGGCAGTCTCTGCTGGCACATCTGGACACCTTACCCCGCCCGGTCCGCGAACGTCCTCAACTTTCTGAACCGCTGGCAGCGCTTATCCGACAGGCGTGGCTGATAGCGTCACTGGAAGGCGACGATCCACAAATCCGCAGCCAGCATCTGCTGATGGCGCTGACAGAAAAACCGATGCTGCCCGCCTGTAATGACCTGTGGGTATTGCTGAGTCTGAGCCGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTGGATGCGCAGTCGGATGAATGTCCGGCACGTCAGCCACAGGTCACCGAACCGCTGACCTCTGCACTGCCGGAGACGGCAACGGCGGACGCACCGGCAAAAACGCTGACGGAGAAACAGGATGACGCCCTGCTGGCGGTGCTTAACCGCTTTACCGAAGACGTGACGGAAAAAGCCCGCAGCGGGCGAATCGACCCGGTATTCGGGCGCGACACGGAAATTCGCCAGATGGTCGATATCCTCTCCCGTCGCCGCAAAAACAACCCGATTCTGGTGGGAGAACCGGGGGTGGGCAAAACCGCGCTGGTGGAAGGGCTGGCGCTGCGTATCACCGAAGGCAACGTGCCGGACAGCCTGAAAACGGTGCATATCCGCACACTGGACCTCGGTCTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAATTTGAACAGCGGCTGAAAAATGTCATCGATGCAGTGCAGAAATCACCGGAGCCGGTACTGCTGTTTATTGATGAAGCCCATACCATTATCGGTGCGGGTAATCAGGCAGGCGGCGCGGATGCGGCGAACCTGCTGAAACCGGCACTGGCAAGGGGCGAACTGCGCACCATCGCGGCGACCACGTGGAGCGAATACAAACAGTATTTTGAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAGATGGTTAAGGTTGACGAGCCGGATGATGACACCGCCTGTCTGATGCTGCGGGGACTGAAGGCTCGCTATGCACAGCACC
ACGGCGTGCATATGCTGGACAGCGCCATTCAGACCGCCGTGCGCCTGTCGCGCCGCTATCTGACCGGACGCCAGCTGCCGGACAAGGCGGTTGATTTGCTGGATACCGCCGGGGCAAGAGTCCGCATGAGCCTTGACACCCTGCCGGAACCGTTGACGCAGCTTCATGCGCGACTGGCGGCACTGGATATTGAGCGGGAAGCGATTGAGCAGGACAGCGTATTTTATCCCGAAGCCAGCCCGGAGCGGCTGGCGGAACTGACCGATTTGCGTGATGAGCTACAGGCAGAAGCCGGGCATCTGGAAGCGCAGTATCAGCAAGAAAAGGCACTGGCGCAGCAGATTATGACGTTGCGTCAGGAAGGAACAGACAGCTCTGAACTGCAACAGCAACTGCGGACGCATCAGGGCTTTGCACCGCTGCTGGCGCTGGATGTGGACGCCCGCGCCGTCGCCACGGTGGTGGCGGACTGGACCGGCATCCCGCTCTCTTCCTTGCTCAAGGACGAGCAGAGCGACCTGCTCAGTATGGAACAGAGTCTTGAAAACCGCGTTGTCGGGCAAAGCCCGGCGCTCTGCGCCATCGCACAGCGGCTGCGGGCGGCTAAGACCGGCCTCACGCCGGAGAACGGCCCGCAGGGGGTATTCCTGCTGACCGGCCCCAGCGGCACCGGTAAAACCGAAACTGCGCTCACACTGGCCGACACTCTGTTTGGCGGTGAAAAATCCCTTATCACCATTAATCTTTCGGAATATCAGGAACCGCATACCGTTTCCCAGTTGAAAGGTTCGCCTCCGGGCTATGTCGGCTACGGTCAGGGCGGCGTGCTGACCGAAGCGGTACGCAAACGCCCTTACAGCGTGGTGCTGCTCGACGAAGTGGAAAAGGCGCATCGCGACGTGATGAACCTGTTCTATCAGGTGTTCGACCGGGGCTTTATGCGCGACGGCGAAGGGCGGGAAATCGACTTCCGTAACACCGTGATTCTGATGACCGCCAATCTGGGCAGCGACCACATCATGCAGCTGCTGGAGGAAAAACCGGACGCCACGGACGCAGACCTGCATGAACTGCTGTACCCCCTGCTGCGAGACCATTTTCAGCCTGCACTGATGGCGCGCTTTCAGACGGTGATTTACCGCCCGCTGGGACAGGAGGCGATGCGCGCCATTGTGGAAATGAAACTGGCGCAGGTGGCCCGCCGTCTTCACCAGCACTATGGGCTGGAAACGGAAATCAGTAACAGCCTGTACGACGCCCTGACCGCCGCCTGCCTGCTGCCGGACACCGGTGCGCGTAATATCGACAGCCTGCTGAACCAGCAAATCCTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAGCAGGCCGTGCATCATAAGCCTGCCCGACTGCGGCTTGACTGGGATGATGAAGACGGGATTGTGCTGGAATTTGATGAGAAATAATGGAGGCTCTTATGAACGTACAGTTCTTCGACCACGCACACCACAAGCTCAAAATTCGCGGCCTGAAAAGCCCGGTGGACGTGCTGACGTTTACGGGCCGGGAACAACTCAGCGCACCCTTCCGCTACGACATTGAATTTACCAGTACCGATAAAACCA +>test.0417.00002.0002 22446 
+CGATCTGATAGCTAATTGTAAGAAGATAAAGGAAGGCAACGATAAAAACGAGGACACCACCTGGGCATGGGTAGCGATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTTAATTAAAGGGATCTTCAAAGTGCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAGGGATATTGTACGAGCGATTGATGCTTCCGTTTCCCTGTTTAATAAATTTATCGATTTGCCAGCCGTGCAGGCGACAATGAAGTGGATGAAGATTTATAACCCGTATACGTATGCTGAGAAGCAGGTCAGGGAACTGATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAAGCTGGATGAGTTAATGGACGTCACTGGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCATTCGCCAGCCGATAGAGGTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACACCATGCTTGCAAAAGCGCTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCTGCACCGGGAAGGGGACGATTATTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTCTCGCCTGAAAGATGCTGAAGAGGTGGAATTGCTGGCTACCAAAAAGCCAGACTGGGCGGATATTGGGGGTAAAGAAAAATATCCACAACTGGAAAAAGCCAGTGCGGAACAGAAAAGATTAATGGACCCGGAGAATAAGGAGGGCGGCTACCCGAATATTCCTGATGATAAAGTGCAGACTTTTCATCAGATGGCTCCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGACCCTGGCAGTAGCGATAATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAAGAGTAAGTCTCAGTGGCGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGAGTATGTAGTTTATACCGTGCCACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGCCTCTCAGGTGCGTGAAGTCACAGGTAAGAATGGAGAGAACATTAAAGTCGTGCTGGAAGGCGGATCACTTCAGATAGTGATAGATCCGACCGTTCTGAATTTGGACTATTTGGGGAAACGTCAGTCTACAGGATGGGGGTATAGAGATTTTTCTGATGAAGTGGATATGTATATAGGTGTGCCTCAGTTGCAAACAAATATTTATGTACCTAAATAAAAAGTATCAACAGACAATTAATTGATAAATCAGGAGATAAAATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGAATAATGTCGCCGGAATATTATCGGCGCCGTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTGTGCGAACGGCAAGTGGCGGAGTGGAGCAAGACCATTCCGCTGGATGTGCGCCGTCGTCCGCTGTACGAGCAGATTGACGCCGTCTGGGGCGGGCGGGTGTTGCCCAATATCCGCAGCACTTTAAAGTCGGTACAGTATGACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGCAATCCGGGGGCAATATTAGCAGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATGTCACCCGCCGCGCAAAAACAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAATCTAATCAGACGTACCTCGGGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAGGAAAGTCTGCACGGCCCGCTGGCCCTGCCGATGCAATTACCGTTGTATGAGCTGGATAGCAGCGTATACCTGCGTGAGGATGACCCGGTAACGGTGGCTGGCCTGTATCTGCCGGATATCCCAGATGCCAGCGCCCAACTGTTGTACCGGAGTGAACATATTCCCGAGGCTTGGCAGGGGCGGGTACGAACGAAGTATGTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCGGGGCGTGGGCAAAATGCAACT
GGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTGCCGCCGGAGGGATTTTTCCCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGCGAAGCGCAGTATGTAACAGACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCTCATAGCGGGGAGTGGTCGATTTTTGTAGAAGGTAGACAAGCGACGGAGACGCTGGAGCAGGGAGAGCAGATGCCGGAATGGACGGACAGGAAAATGGAGGGGGAGTATAAAAGAGGTGAGAAATTCCATGTGCTGTGGTCGCTGATGAACCGCCACGATGGCGGGTCGGTGTGGGTGGAAGCGTAGCGGTAGCTGGATGTACACGTAAAAACCGGGGAATGGGTGATTTTATTCTGGTTTATACAGGAGAGATGAATAATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACAGTATCAGACAGTGTTTATGCGGATACAGATCAAACATATGATATTTTTTGGGGAATGCTGGTAAAGGATAAAAAGGATACTATATTTGTTCGCTGTGACAGTCCGTTATTGAAAATGAAAATTGTGAGAATGGCGGATGCAAATACAGAAAACATTGATAAGGCATACCAGATATTTAATCAGAAAACGAAAAAATCAATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGAGTGGAAAGTATATTTTCAATATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTGTCCGATGTGCTTAATGCAATAGATGAACAGTTTCGATAGTTTCGGATAAAATTGTTATTTTATGCTTTCTTTTTTGATACGTTACGTCAGGTCGTTGTTTTTATAAATCAACAACCTCATTTATTAAATAACATAAATCAAAAGCAATGCCATTATGGCCAATGAATTTCAAGTGGATATTAAATCTGTTTATTATAAATTTTCCTATTTGTGTTGAAACACCTCTTAAGACTGAATGCTGAATTACTATATCAAGAGTCACATCAATTCATTATTTCTGATATTAAATTTAATGTTTTATTATTTTTATAATATTTAATATTAAAACTGCAATTTCCGTAAAATTATAACATTATGGAGGACTCAACCATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTTATATCTGTGTCATCTTCGATGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAGATAAACTGCCCTGTTAAAGGGCATGGTATTAATACCATCATCGAGGGGAGTTTTGATTGGATTTCTGATGGCAAACAGGTCGTCGTGAATGGCTGCAGGTGTGAATGTGGCTGTGTTGTTATATCCAGTATTGCTGATGCCTTGATTGGATGAATATTATGGGATGGAAACGGACGTATACAGAAGAAATAGACAGGCCACAGGATATTTACTTTCATAAGTGGTTATTTTCTTTATTTATTTTATGTATATTATTACTCGTTATTTATTATTTTTTCCATGAATTTGTTGTAGCTAATAACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTGTGGGTATTGATTCTTTCAGTACAGGTAATATTTTATTCCAGAGCTATTCAGGATTATTCAATTTGGCTGGAGAACAGACTTAGTATCAACAGAGAGTGGGAGGCATGGGGATCAAGATATGTTTCTGTTATGAATAGTAGTCTTCATCTTCCTGGAAAAGTCGATGTTTTATTCTTGTCTGGTGATGAATTAGAAACTCAGTATGGACTTGTCAATAAGTCAGATGATATCACATGGAAGCAACATGATTGGTATGCCTGCTTTCAGACCCTTACTAATCATCTTGAACTTTATAAACTCCCATATCAACTTACACAAGAATTTATTATTCTTACTGATTTTGATGAAAGTATGTACTCTCAGATTGAAGAGGACTTTTTCAGAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTTT
TGTTGCATATTTCCCCTTCAATGTCCTTTGGAGAGCTTGATTTATGGTTAAAGGATTCCGAAGAGAAAATATATATTGTCATGGTGTTGCAGATGGAGGAGCAAACATCCTGTTCGGACGCTATGGCTTGCCTTATGTTTGCAACTGATGATGTTACTGCTAAGTACAAACTCACTGAAAAGGCCAGAATTTATCGCCCAATGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAATATTTTTATTGACACACAAAAAATATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAGCGTCTGTTTTCTGTGAGTAGTAATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTGAAAATTGATAATATCCATCTTTTAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTCTGGTTAACGGCAGCGCTGACTATTTCGGTGGTTGTTCACAAAAATTCAGATTACTTGATGATGTCCGAAAATAATGATGACTGGATCATTACCACCATTCATCCTATGGAGCATTCATGAAGAGAATAAATAAAAAAAGTGTTTTTATATCTAATGTACTTTTATTCTTGGTTATTGTGGCCTTCGTGGGGGGGATCATCTGGCGTTTTGGTGATCATTTTGGACTGAAAGGGGATGAAAATAATTTTTTTGCGTGGTTGATATGCATTATGACCCTCATTTTTGTACGGGCATCCTGGTATTTCTCTCGATTGTATCGCCTACGAAAGGAACAACATCACTCCGAAAAGGAAAGATTACGCCCGGAGAAAGAGGCTCGTATTGAATATGGCAAGGTCATAACCCTGAACATTGAGCTAGCTGAGTATTTATGTGCCCTATACGGCCCATTCTGGCGGCGTAAAGTCCGCCTGCTGCTGGTGACCGGCGAGCCTGAACAGGCAGAGGCCATCGCGCCGGGGCTGACCGGGCAACACTGGCTGGAGGGCGACCACAAGGTGCTGATATATGGCGGCAGGCCATCAGCGGAGCCTGATGTCGCGCTACTGACCGCCTTAAAAAAACTGCGCCGCAGCCGCCCGCTGGACGGCATCATCTGGCCGCTGACAGAAGAACAGAGCCGCCAGACAGCGCAACTCGACAAAGGCTGGCGCGAACTGATAAACGGCGGTAAGCGACTCGGTTTTCAGGCTCCACTCTATTTGTGGCAGGTCTGTGACAACGGTGATTATCAGACCGGACGCCCCCTGCAAAGCGTCGGCTGCCTGCTGCCGGAACGCTGTACCCCGGAACAACTGGCTGCAATGCTGGAAGCACAAACCCTGCCGCTGACGGAACAGGGCATGTCGCAACTGCTGGCAGATAACCGCCATGATTTCCTGCTGCGTCTGGCCCATACCCTTGCAGAGCGGGGTATCGCTCACTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGCGGCGCATTTTCTTCCCTGCGCCTGCGTGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTGCCGGAGGCCGCACCTCATGCGTGGCTGCCGTCACCGGTCTGGGCGGGCGTGACGGGTGATAACGCGCGCGGGCGTGCAGTGGGCTTTCCGTGGCTACGCGCCGCGCTGATAACCAGCATCTGCATGCTGGCGATATGGGGGGCCGGAATGACGACCTCGTTCTTCGCCAACCGCGCGCTTGTTCAGGAAACCGGTATCCAGACGGCACGTGCGCTTGATACCCGCCTGCCGCTGGCAGAACAACTGGTGGCGCTGCATACCCTGCAGGGCGAACTGGAACGCCTGCAATATCGTATCCGCGAAGGTGCGCCGTGGTATCAGCGTTTTGGCCTTGAACGTAACCAACAACTGCTCGCCGCCGCTTTTCCCGGCTATGCGCAGGCGGCAAACCGGCTGGTGCGCGACGTGGCCGTTGACCATCTGCAACAGCAACTGAACGCCTTTGTCGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCCACCGGTGAACAACGCTATAAGCAGC
TTAAGGCATTGCTGATGACTTCCCGCCCGGAAAAGGCCGACGCTGCCTTTTTCAGTACCACGCTGATGGCGGACGGTCTGCGCTACGAGAATATCCCGGAAGGTGTGCGGCAGAGCGTGTTGCCGTCACTGCTGACCTTCTGGATGGCGAACCTGCCGGAACACCCGCAGTGGAAAACCGCACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAAATCCTGCTGCGCCAGATTGGTGTGCGTAATGCTGAAAACACCCTCTACCAGAACGTGCTGCAACAGGTGTCCCGCAACTACGCCGATATGACGCTGGCGGACATGACCGGGGATACGCTCACCGAATCTCTTTTCAGTACGGAACAGACAGTGCCGGGGATGTTCACCCGTCAGGCGTGGGAAGGACAGGTCAGGGAAGCCATCGAGCAGGTAGTGACGGCGCGGCGCGAGGAAATCGACTGGGTACTCAGCGACCGCCAGCAGGATACCTCTGCGGATATCTCGCCGGATACGCTGCGTAACCGTCTCACCTCACGCTACTTTACCGACTTTGCCGGAAGCTGGCTGGCGTTTCTCAACAGCATTCGCTGGAAAAAGGAAGACTCGCTCTCCGGCATTCTCGACCAGCTGACACTGATGGCCGATGCCCGTCAGTCGCCGCTGATTGCGCTGACCGATACCCTCGCGTGGCAGGCGGCGGCTGGCAGGGAAAACCGTGGCCTGTCAGACTCGCTGGCGAAATCGGCACAGGAACTGTTTAACGGCAAGGAGAAAACGCCGCAGCAATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTGGATAAAACCTTCGCGCCGCTGCTGCGGTTGCTGGGCGATAAAGCCGGAGGCGGAGACAGCCAGCTGAGTCTGCAGACCTACCTTACCCGCGTTACCCGCGTGCGCCTCAAACTGCAACAGGTGACCAACGCTCCCGACCCACAGGAGATGACCCAACAACTGGCGCAGACAGTCTTGCAGGGCAAAACCGTTGACCTCACCGACACCCGCGACTACGGACGGTTAATCGCCGCCAGTCTGGGCGAGGAATGGAGTGGCTTCGGTCAGGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGGCGGCAGGTGCTGACGCCTGCAGCGGACAGCCTGAACCGCCAGTGGCACCGGGCGATTGTCAGCCACTGGAATCAGGACTTCGCCGGGCGCTATCCGTTCAAAGCCTCACAGAATGACGCTTCCCTCCCCCTGCTGGCGCAGTACCTGCGCGATGACGGGCGCATCAACCAGTTTATTGCCGCCAACCTTTCCGGCGTTCTGAAACGTGAAGGCCGCTACTGGGTGGCTGACGCCATGAACACGCAGGGGCTGACGGTCAATCCGGACTTTATCCGCGCCCTGAACCGCCTGCGCGACGTGGCCGATACCGCCTTTGCCAGCGGCGATGCCGGGATACATTTTGAACTGCGGGCAAAACCGGCCCGAGACGTGATGAAAACACATCTGGTGATTGACGGGCAGGAACTGGAATATTTCAACCAGAAAGAACGCTGGCAGCGTTTTAACTGGCCGGATGAACAGTGGCAGCCCGGCGCATCGCTGAGCTGGACCAGTACGCAGGCGATGGAGCGCATACTGGCGGATTATCGGGGAAGCTGGAGCCTAATTCGTCTGCTGGAACAGGCGCAGGTGACACCGGTGGACAGCAGCACCTTTAAAGTGGTGTGGAAAGCGCAGGACGGCCTGCCACTGAATTACCTGCTGCGGGTTGAACAGGGAAAAGGGCCGCTGGCGCTGCTGGAACTGAAAAACTTCCGCCTGCCGGGACAGGTATTTCTGACCGGCAGGAGTATGAAGGATGCGGAAGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGCTGTTTTGCCGACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACATGGCTGCTGCCGGTGACGGCAGACAC
GCCGGTCGGGGAAGACCCCGGCTACCACGACGATTTCCTGCGTATCCGCGACGAGATGAACAAACTTTCCGGCGCGGATACGGACCTCATCTGCCAGCTTGCCGAATCCCTGCTGCTGACGCAGGCAAAAGACGTGCGCATCGCCACTTACTACATCTGGGCGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACTGGCGCTGCTGACCGGACTGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAAATGGCGCTGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAAGTGGCAAAAGAGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTCGCCGCATGGCCCGAAGACCAGCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAATCACGTCTGGCGCAGTCGGGTGGGATGAATGCGGTGGTGCCGCAAAACAGCAGCAGCGTTCCTGCACCGTCATCCCCGGTGGATGCGCCACAGGTACAGACCATCACCTCCGGGCGCGACCTGCTCGACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCAGGGCTGGCTTTCAGCACACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGATGTGGACGGCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGGCTGTATGCCCAGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACCGGTGTCAGCCATTTCTGGCTGGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCGGGCGCACCGTGGGACAGGTGGACAGCCGTTATCCGTCAGGACCTGACGTTACTGCTGGAGCGCCTGCCGGGACTGGAAAATCTGGCATGGAACGACGGCACACCGTTCGCCGACGAGGTGACGCGCAACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATGGCTTGCGGGGAAAGCCGCTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCACTGGCGATGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCGGGCATCACCACGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAACAGTACGGTAAAAACGAGATGGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAGGGAATAACGCTGACGCAGTGGGAGCCAGAACTGCTGTTTGAAGTAAAAGCCCGGCAACTGAAACTGCTGCGCCTGCGGGCACATCGCCACGCGGACAAGGCGGCGCTTGCCCGGAAAATGGACGCTCTGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGTACTGTGTGATACGCAGCATAAGGACTGATTTCTTATTTGTATTTCAGATTAAAGGACTTTGATGGACGACCTGACCCAACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGTAAAGAATTTGCGCAGGCTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGCGCACGCGATCCCTATGTGGAGCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTGCGCGAAAAGCTGGACGACGATCTGCCGGAACTGACTGAAGGGCTGGTCAGCCTGCTGTGGCCCCACTACCTGCGAACCATCCCGTCACTTTCCGTGGTTGAACTGTCGACAGATCACCGGCAAATGAAGCAGAGCGAAACGCTGAGCGATTTTCAGGTATTGTCGCGCCCTGTTGGCGAGCGCAGAACCCGCTGTTTCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTGCCGGACGTGTCATTGCAATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCT
TTGAATGCGGCCCGCTGGTCGGCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTCAATGCCGACAGCCCGGTAGCCTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAGTTCTGGCTGCGTCTGCCGGGGCAGGATCGCCGGATGCTTGGCGCACACTTTTCCCCGATGGGCTTTGAGGATGATGACAGGCTCTGGCCAAAAGGTGAGTCAGCCTTCAGCGGTTACCAGTTGCTGCTGGAGTATTTCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCTGAACGGGCTGGAGCAGGTTGCATGGCCGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAGAACTGGCCTCACGACCTGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTCATCAACCTGTTCCCGCTCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTTCTGCTGCGCCCGATGCGCATTCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATTATTTCTTCGCGCCATACCGGCAGTCAGGCATATGTCCCCTTTTCCAGCTTTCGTCACCGGGGCGGGATGCTGCGCCACGATGCGCCGGAACGCTATTACCACACGCGGGTAAAGCGCGGCCCTTCCGGCTTGCACGACACATGGCTGATTCTGGGCGGCGATGCGTTTGATTCCGACCGGATGCTGGAGGATGAAACCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGTAAAGCCTTACAGAGCACCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGGGTGCGCAACCTGTGCGCCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCACTGGCGGGTGCTCAGCCACCTCGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATTCTGCGCGGCACGCTGGCGCTGTACGACTGGACCGAAAGCGAGATGAACCGCCGTCGTCTGGAGGCGATTGTCGACGTTCAGCACAGCCTGATACAGCGTTTTGAAAGAGGCTTTCTGCTGCGTGGCGTGGATATTCAGGTGACGCTGGACAGTAACGGCTTTGCCGGAGAAGGTGATATCACGCTGTTTGGTGAACTGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTCACTCAACTGACCTTAATTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCACAGCCAGCGCGTACCGGGCTGACCGACCGGCTGGCCCCGGATATTGCGCGGATCAATTTTTACCGTTTTTGCCAGTTGCTGGAACAGAGCCAGCAGAAAGCGCCGCTGGGCAGTACCGACAACCCCGCCGCCGATGCGGTGCGTTTTCGCCCCCATCCCGGAATGGGCTTTCCGGTCAGCGAGTTAAAGAACGTTGAACGTGACGTGGACAATCCCGACGCGCCACCCACGGTGCGCACCACCTTTCTCGGCCTGTACGGCGTGGATTCACCGCTGCCCACCGCCTATCTGGACTACATTACCCAGCGTCATGACGGACATGACGCAGTGATGGCGTTTCTCGATATTTTTAACCATCGCTTTATCACCCAGTATTACCGCATCTGGCGCAAATATAACTACCCGGCGTCGTTTGAAGCAGGTGCCGTGGATGACATTTCCCGTTGTCTGCTGGGGTTAATCGGGCTGGGTATTCCCGGCAGCGAGAACCATATCGCCACGCCTGTATCCCGTTTTCTGGCCCTGCTCAGCGTGATGCGCCTGCCCACCCGCACGGCTGAAGGCGTCACGGCACTGGTGGGGCTGCTTGCCCCGCTGACGAAAGCCACGGTGGTGCCTCACGATCCGCAGCCTGTAATTCTCCCGGCCCCTGCGGGTCTGTCAAAAAATTCACGCATCAGCCTGAAAACGCGAACGCTGCTGGGGCGTACCGGTACCGACGTCAACAGCCAGTTGC
TGCTGAAACTGTATACCGAAGATGCCGCAGAAGCACGTGGCTGGCTGCCCGGCGGGCAACTGCACAGCGATTTGCTGGTGCTGCTGCGCGTTTATCTGGGCTGGCGCTGTCAGGCCCGTCTGCAACTGACGCTGCCCGTCAGCCTGTTGCCTGCTGCCCGGCTGGGAAAACAGCGTGTACAGATTAGCCGTACCGGCATCCTTCTCGCCTCCTTTGCCGCGCCCGCGACCGGAACAGTGACGGTCAGTCTGGGGCGTTATCAGGGATTAATACCCGCTTTTTCCATTCGTAACAGGGAGAGTATGACTCATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGACGGTTGTTCTGAGTGGCTGCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGGCCTCAGCCGTTTTCTACAAACAAATCAAAATACTGCATCTCGATTTCTTCTCCCGCAGCGCCCTGAATACGGATGCGGAAGATACGCCGCTTTCCACGATGGTGCATGTCTGGCAACTGAAAACCCGCGAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGCAGGAAGAGAAGACGCTGGAGAAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGCATCCCTGAATGTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATCACCCTGATGAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCGACAAGCCGCGCTCGATTGAACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATAAATAACCGATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGTTACCGCTGGAACAGATCAGCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGCAACGCATTATCAACTGCCGGGCAGGCACGCTGGCGCATTTGCCGGATTACGGTCTGCCGGATCTCAGTCTGATCCATCAGGGGATGGCTGCGGGTATTCATGGCCTGATGCGTCAGATTGAAGAAACACTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGGAATTACTCCCCCAGCCCCGTCCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTGGATACGCTTTGATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAACAGGAGCGGGCGTACTGATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGGCGATCCCTGTACTTATAAGGAATCCGGTGAACTGCAGGCTGAAATGAGTAAACTGACTCACCCGGCCCGACCGGATGTGGACTGGCGTCAGGTGGAAAAACTCTGCCTCGCGCTGTTCCGGCAAAATGGCGTGGAACTACAGACGCTGGTCTGTTACGTACTGGCGATAACCAGACGGCAGGGGCTGGCAGGGATGGCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCTGGGCTGACTTCTGGCCGGTACAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAAAATGCAGCAGGCACTGAGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCGTTGTGTACAGCATCTTTCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATATGACGAAACTGGATCTACTGGCCGGGCAGTTTCGCAATACCGCATTGCGTCTGGAACGGCTGGCGCCTCAGGGAGCGGAAACCACTATCACTCCCCCTGAATTACCCCGCCGGGAAATGAATCAACCGAAAAAGTCAGAGGAAAGTCCACAGCCGGTTTTTGCAACCAGATCCGTTCAGCAAAACGATAAGGATGCCAGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGACATGGCCGATATTTATGGCCGGA
ATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGGCTGGTCGCAGCTTAATCAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCCATTACCGCAGTCGCTGGAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCTGCTGGCTCAGGACAGAACAATTGCGGCAAGTCAGATGCAACTGGAGCAGTTAAACAAATTGCCTGCCCGCTGGCCACTGGAGCAGGGATATCGCCAGCTACGCCAGCTTGATGCCCTGTGGCCGGATAATCCTCAGGTCAGGGCGCTGAACGCGCAGTGGCGCAAACAGCGGGAGCTGAGCGCCCTGTCTGCTGAGGCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGCGCCTGTCGGCGCAGCTGGATGCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACTAAAAACGGCGGTGTACGGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCTTCGGCAACTGGAAGAGCAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAATTGATACCCGGTTAAATCAGTTGTTGAATCGCTATGTCATTTTACTGGATACGAAGGTGGAACAAAGTCAGTAAACATCGGGGGATTTATGTACCAATAAGGGATATGTGACCTTGCCATTTTTTAAAATGGAGTCTCTGTGTACAAAAAAAGAGAGGAACAGGCCATTCGATCTACTCGTTGATTCACATCAGATAATGAGTGTATATTTCGGTAGATAGCTTGGGTTCGGGAACAGTGAATACCTTAAGTTTCAAAAGATTGGATTAACCTCTTGACTGTGGCCCCCGCAACCAATTTATTAGAATGCTGACAAACCGCAATGTGTTCTACAAATTGCGGTTTTTTTGTATTTAAAATCTTTGTTCGCTGAACTCACAACACGTTTTTTATCTCCCTTCCTGCGAAGTAATCAATTATCGACTGGGCAACGTGTATCCCGGTTTGCTGGTATGACTCAACGGTGGCGGCCGCGATATGCGGCGTTGTAATGATATTTTTGGCATGTAGCAGTGGGCTAAATTGCGCCAACGGTTCAGAGCTAAACACATCCAGCGCCGCAAACACATTTCGTTCTTCAATCACCTGAAGTAAAGCGCCCTCATCCAGCAACTTTCCCCTTGCGGCATTGATGATTAGAGCACCATTGCGCATCATCGACAAATATTTATGACTAATGAAGTTCTCCAGCTCAGAAGAAAAAGGCAAAAGAACAATGATGACATGCGACTGCATAAAGATATCTTCAATTGATACAAACTGAACTCCAGCTTTGTCAGCAACCTGATAGTCGGGTTGTTTGTCAAAAGCTAAAAGCTCAACATCAAAACCGGATAACCTTTTCGCCAGAGTTTTACCTATATTACCGTAGCCAACCAGGCCAATCCGTTTCCCTTGTAATTCACAGCCATGCGACTCACCCCAGTAGCCATTTTGCATCGCATGATAGCTGCCAGGGATATTTCTCATGCTCGCGAAGATAAGTCCAATGATAAATTCCGCAACCGCATTTGAATTAATCCCAACCGCATTATTGACAACAATACCGGATTGCTGTGCCGCACGAAGATCAATATTGTCTATCCCCGTCCCGAATCTCGATATTATTCTCACACCAGGCAGCAATGATAGCGTGTCCGCCTGATAACCATCTTTTCCGGCGATGACCGCGCAAATAGATTCTCGTAATGCAGTGGATTCTGATTTAAGCAGATGCTCCACATTATTCTTAATAATAAGATTAAAATTATTCTCTCTTAGCAACTTGCTGGCGGAAACACAGCGTGCTGAAAAGCTGGGGACGGTGACCAGAACATTTTTCATAGCGGACACTCACTTCAAAGAACGCCACCCCAAAAGATGGCGTGACCGGTTACTGTATTTATATTTTGAAATTATGAATTTGCTTTAATGCCGAGTG
CACCTCCTGGATGATATAAGCCGAAATCAGCACGAGTAAATTTTTTCAATTCAGAGAGTGCAAGCGCCACCGCATCACCAACAACCAGAACAACAGTCGACGAGCATGACGGTGCTAAACCTAAATTATCCGCCTCACTTTTGACGGGGATTTCAACAGATAAATCACAACTTATCGCAAGCGATGAGTGATGACTGCGGGTAAAAGAGATCAAATAATTACCCATTTTTTTCAGACTAGGCAGTGTCGCCAGGATTTCCGCCGTCTCACCACTGTTTGAAATAAGAATAACAACATCGTCTTTCGCCACCATTCCAAGGTCGCCGTGTACCGCTTCCGTACCGTGAACAAAAAACGAGGGAGTTCCGGTGCTGGCAAATGTTGCGGCGAGTTTCCTGGCAATAATACCAGACTTACCAACACCAATAAAAACAACTTTCCCCTGACAAGATTGTAATACTTTAATTAAATTTGCGACCTCCGAAAGAGGGGAATCAATAACTTCTTCAACTGCTTTATGTTCGTTACGCATAAAATGTTTAATGAGATGGATAAGATCCGTGTTATTCATTTTTATTCTCCCTGATTAATATTTTTAATTACACTCACAAGACGCGTAAGCCCCATATATAATTTTTCTCGACCGCAGGCCAGGTTCAGACGAAGGTAGCCCTCCCCCTCCGTTCCATAGACATGCCCCGCCATAATGCCCACTTTGCCTTCATGAATTAATCGACTGTAGAATTCATCAAAAGGATAACCAATAGCAGAACAATCTATCCAGGAAAAATAGCAACCATCAGCTGGCCTTACGATCAATTCTGGAATATTTTCATTCAGATACTGCTGGGTGAATTGAATGTTAGAGGCTATATGTGCCTTTAATGACTTTAACCATCCCTCACATTCGTTGTAGGCAATAATAGTTGCAATTATATTCAGTACTGATGGGGAGTTTACAAAATCGCGATACCTCGATATCGTTCTGAACTTATGATTAAAATTATCGTCAGTTGAAATCATATACGATCCTGTTAGTGCAGGAACATTAAATGTTTTCGATATCGAGTTAAATACTACTACTTTTTCTTTTTTTATTTTAAGCGCGGATGTAAAGCTACGATTAAAAACAAAATCACTATGGATTTCATCTGAACATAACCAGACATTATGCCTTGTACAGCTTGCAGCGATTTTATGCAGTTCTTCTTCCGACCAGACTGTTCCTGTCGGGTTATGAGGATTACATAATAACATCATCTTTGCGCTTTTAATCTTAAGATCAAAATCTTGCCAGTTGATAGCGTAGCCCCCCTCATTTTTTATAATCAAAGAGGCTGTCAGAATATTTCGCTCGCTATGTTTAATTACATCAAAAAATGCATTATAGACAGGTGTAAAAACGAGAATATTATCACCATGCGATGTCAATAACTCTATTGCTTTTGCAATAGAGTACATCACACTGGGGCTATAGGTTATCCATTCAGGTTTAATATCTGTTTGATATTGTTGATAATACCAGTTTACTATCGCATTCAGATATTCACCATGTTGCCAACGACTGTACCCTAAAATCGGGTGTTCCAGGCGTTTTTTTAATGCTCTGGTGATAGCGTCTGGTATCGGAAGATCCATATCTGAAATAGAGAATGGTAGTACATCTTTTACACCAAATCTGTCCTCGCAAAAGTCCCATTGGGTACAATATGTTCCTTTGCGGGAAACAGGAGTATTAAAAACATCCATCAGTATATCCCCATATAGTTATCCATATCCCGACGCAGGGCGATGACTTTAGTGCCGATAATGACTTGTAGGGTATTTTGATCAAGTTTTACAACCGCAATCCCGCCAGCTCTTTTTATTGCAACTTCGTCAATCAATCTCATATCTGCGATTGTTAAACGTAAACGAGTTACGCAATTATCCAGTGACTTAATATTCTCTTTACCACCAAGTGCCTTAACCATCTGCTCCGCCGCTTGCAGCTCTGATTT
ATCAGGAGTTGGGATATCCGCTATAGCCGTATCTTCGTGAGCGTTCAGCGTAACAGGACTGGACTCTTCACGGCCTACGGTCATCAGGTTAAATTTAAGGATGGTCCAACGGAACACAAAGTAATAAATGAAGAAATAGGCCACTTCGACACACACCGCGATCGGCCAACCTGTTCTTGTGCCACGCAATACGCCAAAGCTAATAAATTGAATCAGATCACCAGTAAATCCCATCTTCACCCCCATATATGGCAGAACCATGTTAGCGAATCCATTCATAAAGGCATGGAAGACAAACAGCAGTGGACTGACAAATAAGAACAGAAACTCAATCGGTTCGCTGACGCCGCCAATAATCACCGTAAGCACCCCGGAAATAAGCAATGCTTTGATAGCCTTTCTGTTTTGAGCATGAGCAGTGCGATACATCGCCAGCGCGGCACCAGCCAGACCATACTGAATCATCAGTTTGCCCTGCTCCATTTTCCCCGCCAAATCCAGCGGAATGACCGCATTCTCTTTGACGTATGCCATAAACATGTTCAGGGTGCCGTAATATTCTTCGCCGCCAATCACAGCCGAACCGCCGATTGGCGTAAAGCGGAAAACTGACGTCACCAGATGGTTTAAGCCAAAAGGAATCGTCACGCGTTCGGCAACTGCATAGAAGAAATAACCAACAGGACCGGAAGTTGAAATCCAGTGGCCAATGAGCATGAAAAGATTGAAAAACGGCGGCCAGATAAAAGGAATGATCAGACCAAATCCACTCATCACAATCAGTGTAATGATAGGCACCAGACGTGGGCCGCTATAAAAACCTAACGATTCAGGAATGCGTAAATTAACGATCTTTTTATACATGCTGGCGACTAATAACCCAGCAACAATTCCCCCCAACACGCTGGTATTGTAGGACTGGATCCCCAGAATGATGGTTTGCCCATGTGTCGACATTTGGTCAGCAACGACCAATAAGTCGTGCTGTTTAAGATAAAAGTTCGTTCCCAAATGCATCGCCATAAAACCAATTAAGCCAGAAAAAGCACCATAGGCTTTATCCTCTTTATCTTTTAATAATCCTAAGGGAATCGCTATCGCAAACAATACAGGTAAATTAACAAAGGCAAACAAACCAAGACTAACAATGAAATCAAGTATGGTTTTAATTATTGGAATAGCCAGAAATGGAATTAACTTTGCCATATCATCACTGGCTAAACCACTTCCCAGCCCTAGCATCATGCCACATACACTTAGCAGAGCAATGGGATACATAAATGCCTTCCCCAGGCTCTGAAAAAAACTCCAGGCTTTCTTTTGTTTCATGTGGGTTATCTCATATAAATGTTATATATAATTAGTCCATTAATACTTTGGTACGAATAGAGAGATATAATTTTTCTTCTAAAATTAATTCATATTTAAAAGTGGCATACAGATACCGTTCAATTTCATGAATTGCGCGCTGTAACAGGATGTCCTTTTCAAGAAACTGTTCATAGATATCACCAATATCTTTCTGTTTTATTTTTTCATTGCATAACACGCGACTTGAAAAATATTTAAGGTGCATCATAAATCTGGAATAGTTAAATGAACTTCTGTCCACCTTTCTGTTATAAACAACTTCAATAAGCTCCGTGATTATTTGCGACAACTCAATAATCCGTACTGATTCATAATCAACTGAATTTTCATAATTATTTAAAATATGCAATGCTATAAAACCAATCTCATCATCAGGAAGTTGAACGCTGAATTGCTCATTAATGATAGTTAATGCATCGCGACTTATCGCATACTCTGCTTTGTACAACGCTTTGATTTCATCAAGGAAAACATTATTAATTTGTATACCTGAAACGACTCGGGATATTGCATTCGAAATGTGATCCGCAAGAATCAATAGTAGCGATGGATTGAGATTTTTTTCGAGATTTTTCTCCGCATATTGCACTATTTTTTCGGCAACAAACACATACTCAATATCTACATGT
TCAATCAATTTATAAAGTTTGTTTTTTTGTTCATTTCTGACATAAAAAATCCGGTTAGCCGGATGCTCAGGGACCGACATTCCATATTTTTTGTTGTAACCGACGCCAGGCCCAGAAATGATAACCTCCTGTCCATTCATCGATGCCTGTACACAATTATTGTTCATGACTTTTTCGATGATCATTCCATGGCTCCAAAAAAAAAGGCAAGGCACGTCAGAAGTAATAACTACTTCAAACATTGCCTTGCCTGATTTAACAGTTACAAGATGATTAACTAATGCGTATACATTACACGGAATTGTGCTTAATTAAAGAGATGGTCGGCTTATTTTTCAAGCCGACATTCAAATATCCGACATCAGTCACAAAACCAGCGTCTAATATTCAGGTAAATGTTATCTATTCAACGAAATATAAATTCATTGAATAAATAAAAACATTATCCCCTTCTCGCCAGCGTCGCCCCATCGGCAAAATACGCTTTAATTCCCGCAAGAATAGACTCCGCAACTTCCTGCTGGAAAGTCGCCGTTTTCAGTTTACGCTCTTCCTCAACGTTACTGATAAACGCCGTTTCGACCAGAATGGAGGGAATATCTGGTGCCTTTAGTACGGCAAACCCGGCCTGTTCAACTTGATTTTTATGCAGCTTGTTGATTTTACCGAGCTTATTCAGCACCGCTTTACCAAACTTAAGGCTGTCGGCAATGGTCAGCGACTGCACCATATCGAACATGGTGTGGTCGACATAGCGGTCACCGCTTTTGCTTACGCCACCAATCAAGTCCGAGGCGTTCTGGGTTTGTGCCAGATATTTTGCCGCAGTACTGGTTGCGCCTTTGGTTGAGAGCGCAAACACCGAGGAACCGCTCGGCTGGCGACTGGTAAAGGCGTCGGCATGGATAGAAACAAACAAGTCAGCGCGCTGTTTCTGGGCTTTTGCTACGCGCACTTGCAACGGAATGAAGATGTCTTCATTGCGCGTCATGTACACCTTCATATTGCCCTCTTTCTCGATCAGAGAGCGCAGACGGCGAGCTATTTGCAATACCACGTCTTTTTCGCGCGTTTTGTATTTCCCCACCGCACCGGAGTCTTCGCCACCGTGGCCAGGGTCAAGCATAATGACAATCGGACGATCCCGCCCAGCTTTACCCGGTTGTGGACCACTTTGTGCTGGCGGCACCTGCTTTTCGAGGTCGCCTTTGTTGTAATCCTCCAGCAGCGCCAGCAGCGGGTCCTGCATATCCTGTGCATTGGCCGGATAGAGGTCCATCACCAGACGCTCTTTAAACCCGGCGACCGGCGCAAGGGCAAACAGCTGCGGTTTTACGTTTTGCTTTAATTCAAAAACCATACGTACGGTTTGCGGGTCAAATTGCCCGACGCGCGCCGACTTGATGAACGGGTCGTCAGCGCGGATTTGCGCAGCCATCCCCTTGAGCACCGAGTTCAGGTTTACATCTTCGATATCCACCACCACGCGTTCAGGATTACTCAACGCGAACTGCTTATATTTCAGCTGACGATTTGATTCTACCGTCACGCGGGTGTAGCTGGACGCAGGCCAGACGCGCACCGCCACGACCTGGCTGACCGCAGCCAGGCTGACCTGACTTACGCTCAATAGCCACATGGCACCCGCGCCTTGCAGTAAACGACGACGGCTGATTGCAGTGTTGGATCCTGACATGCCTCTCCCGAGCAAAAGAAATCTAAGCTGTGTAACAAGTAAACGACCAATTTGACCGGAAACTTTAGCGAAAGACGCATAATCTGTCATCTATAAAACGGTAAACATTCTTTTTATATTCACGGTATTACTGATAAAAAACTCGCTCCCGCATAAAATTTACACTTGCACCCTGCGAAAAAACAGAATAAAAATACAATAATTTCGAATAATCATGCAAAGAGGTGTACCGTGGTAAAGGAACGTAAAACCGAGCTGGTCGAGGGATTCCGCCATTCGGTTCCCTATATCAATACCCACCGGG
GAAAAACGTTTGTCATCATGCTCGGCGGTGAAGCCATTGAGCATGAGAATTTCTCCAGTATCGTTAATGATATCGGGTTGTTGCACAGCCTCGGCATCCGTCTGGTGGTGGTCTATGGCGCACGTCCGCAGATCGACGCAAATCTGGCTGCACATCACCACGAACCGCTGTATCACAAGAATATACGTGTGACCGACGCCAAAACACTGGAACTGGTGAAGCAGGCAGCGGGAACATTGCAACTGGATATTACTGCTCGCCTGTCGATGAGTCTCAATAACACACCGCTGCAGGGCGCGCATATCAACGTCGTCAGTGGTAATTTTATTATTGCCCAGCCGCTGGGCGTCGATGACGGCGTGGATTACTGTCATAGCGGGCGTATCCGGCGGATTGATGAAGACGCGATCCATCGTCAACTGGACAGCGGTGCAATAGTGCTAATGG +>test.0417.00002.0003 51012 +GGCCGGTCGCTGTTTCGGTCACTGGCGAGAGCTTTAATCTGACCTCGGAAGAGATTGCCACTCAACTGGCCATCAAACTGAAAGCTGAAAAAATGATTGGTTTTTGCTCTTCCCAGGGCGTCACTAATGACGACGGTGATATTGTCTCCGAACTTTTCCCTAACGAAGCGCAAGCACGGGTAGAAGCCCAGGAAGAGAAAGGCGATTACAACTCCGGTACGGTGCGCTTTTTGCGTGGCGCAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGCTGTCATTTAATCAGTTATCAGGAAGATGGCGCGCTGTTGCAAGAGTTGTTCTCACGCGACGGTATCGGTACGCAGATTGTGATGGAAAGCGCCGAGCAGATTCGTCGCGCAACAATCAACGATATTGGCGGTATTCTGGAGTTGATTCGCCCGCTGGAGCAACAAGGTATTCTGGTACGCCGTTCTCGCGAGCAGCTGGAGATGGAAATCGACAAATTCACCATTATTCAGCGCGATAACACGACTATTGCCTGCGCCGCGCTCTATCCGTTCCCGGAAGAGAAGATTGGGGAAATGGCCTGTGTGGCAGTTCACCCGGATTACCGCAGTTCATCACGGGGCGAGGTTCTGCTGGAACGCATTGCCGCTCAGGCGAAGCAGAGCGGCTTAAGCAAATTGTTTGTGCTGACCACGCGCAGTATTCACTGGTTCCAGGAACGTGGATTTACCCCAGTGGATATTGATTTACTGCCCGAGAGCAAAAAGCAGTTGTACAACTACCAGCGTAAATCCAAAGTTTTGATGGCGGATTTAGGGTAAGCGATGAAAATCGCCGGATGCGACATGCGTAACACTCGTGCGTCGCATCAGGCAATTACGTTTATCCCCGTGAACTAAACAACGCCGCCAGACCACTGCGCCGCTCAGTACGAGTGGCGATTGCCGCACTTAATATGCGCTCATCGGCATACAGCGACAGACGGCGACGCGCGCGGGTCACCGCGGTGTAAACCAGCTCTCGCGTTACTACCGGCGTGCGTTGACTCGGTAAAATCAACGCCGCATGGTCGAACTCCGATCCCTGCGATTTATGTACCGTCATCGCCCACGTCGTTTCGTGCTCTGGCAGGCGACTCGGTTGCACAGACTTAATATTGCCGTCCGGCATCGCAAACCAGACGCGCGTCCCCTGCCCGCGATCCAGCGCAATACCAATATCGCCATTAAACAACCCAAGCGCGCTGTCATTACGGGCAATCATCACTGGTCGGCCTTCGTACCAACGAGAGTGCGGATGACGATGAATTTTGCGCTTCTGTTGCATAAACTGCTCAATTCGCTCATTCAGTCCAGCCACGCCAAACGGCCCTTCCCGCAGGGCGCACAAAAGCTGGTACTCATTGAACGCCTGAATGATTAAATCCGGCTCGGCACGCGCTTGCAGCAGATCCAGATAACGCCCGTAACCCGCAAGAGCTTCCTCAAGCATCGCAATATAATCTTCGCCACTCTGTAAAAGCCGTTTTTCG
ATATCAGTAAAATCCTGCTGAAAAACGGTTTTCACTGCCGTTTTATCACCACGGTTAATCGCCGCAGCTAACTGACCAATGCCAGAATCGCTGCCGAAACGATAGCTTTTTTGCAGCAGGCAGAGGCTGTCGCGCAAAGATGCCGCTTCTGTGCCAGTTCCTGCCGGAACGTGGCTTCCCGTCAGGCGGCTCAACTGCCCGGCACGCTCGGCGGTAAAGCCCGCGTTGGCATAAGCGCAGATATCGCCCAGCACAGCCCCAGCCTCAACCGAGGCCAGTTGATCACGATCGCCGAGAAAGATCACTCGCGCATGATCGGGCAAGGCGTCGATCAGTCTCGACATCATAGGAAGATCGATCATTGACGCTTCATCTACCACCAGCACATCAAGATGCAGCGGGTTACCGGCATGATGACGTAAACGCTGGCTACCCGGCTGCGCACCCAGCAATCGGTGCAAAGTGCTGGCATCTTCCGGAATGCGTTTCTTTTGTTCATCGGTCAGCGGTAATTGTCGCAAAGCCTTGCCGAGAGATTCGGTTAAGCGCGCGGCAGCTTTACCCGTTGGTGCAGCCAGACGGATACGGCAGCGTTCGCCGTCGGCCATTTGAATTAACGCTGCCAGTAACTTCGCTACGGTGGTCGTTTTACCGGTGCCAGGACCACCGGAAATCACCGAGATCCGCCGTGTCAGCGCCACTGCCGCCGCAACTTTTTGCCAGTTAATTTCATCGCTTACTGGAAAAAGTTTGTCCAGGGTTTGCGCCAGTAGAGCTTCATCAACCTCAATGGCATGATTCACTTCGTTGAAAAAGCGTGCCACTGTGCGCTCGTTACACCACATGCGATTCAAATAAAGACGATCGCCACAGAGGATCATCGGCGTTGGTTCATCTCCCCGGCTGACCGCTTGTGAAGCCAGCAAGCATTCTTCCCAATTTTGTAGCTCACCGATTTCACTGACACAGGTCGCCAACAGCGGATGCGATGCCTCGTTATTTTCCAGTCGTGAAAGCGGCAAACAAACGTGTCCCTCTCCGGCATCATGACTTAATAGTGCCGCCGCGAGGGTGACGGCAGGATGTTCATCTCCCGCCACGGTCAGGGCAAACTGCACGTCCAGCGGGCGTAGCTGTTTGTGCTCCACAGCTTCCAGTAATTGCTTTTGCAATTTCATTACGCCTCCTCCAGGGTCATACCGGCAAACATCTCATCCATCAGGTCAATCAACCCGGCGTTGGGTCGGGTCGCGTAGATCCCTTGTTGCGGATGTTCTTTATCAACGCCACGCAGGAACAGATAAATAACGCCGCCAAAGTGGCGCTCATAGTCGTAATCAGCAATACGATGGCGCAGATAACGGTGCAGCGCCAGGGTATAAAGCTGATATTGCAGATCATAGCGGTGTGCCTGCATTGCCGCTGCCATAGCCTGTTGGGTGTAAGCCGAACTGTCTTCACCCAACCAGTTGGATTTATAGTCGAGCAGGTAATAACGCCCTTCGTGGCGGAACACCAGATCGATAAAGCCTTTTAACATGCCACGTACCTGCATGAACTCCAGCGGCGGGCAGCCAGCGGATAGCGGGTCAAACTGGCGAATTAGTGCATCAAGCTGGCTGGCGATGAGCGGTTCGCTAATTGGCAGGTAAAACTCCATCTCCACCTGTTTATCGCGATCGGAAAGCTGATTCAGGCTAACACCCGTTTCATTGAGAGGTGCCTGGAGGACAGCCGTGATCCACTCAGTCAACACCGGTTCCCACTGCGGTTCAAAGCCACCGAGCTCCAGTTTTTCCTGTACCCAGTTCGGGTCAACCGGCTGGGTAAAATCGAGGTCTTCAAACAAACTGTGCAAGAATGTCCCCGGTGACGCACCGCGCGGGAACTGATGCGGTGTTAACGTCGGTTCTTCAACGACGCTGACCACGCCTGCGGCATCAACATCCAGCCGTGGCATCAGATCCTGAGCGATACCGTGACCACGCTGCTGCAAACCG
GAGTAGCTGGTGACACGCCAGTTATCGCCGGGCAATCGTTGTAGCGTCCTCGCATTCAGTTCTGCAGTTAATGCATCATTAACCTGCCAGGGCTGGTTATCACCAATTTGTGCCGTTTGCCAGGCAATATCATCATCGCACAACGCTTCAATGCAGGTACGAAGCCCTGCCGCATCTTGCGGTTCTCCTTTTTGCAGCAAACGCCCGAGCGCACTTTGGTGGACGTCGGTATCACCTTTTTTATCGCCACGACGGCGCACCAGCGGTGCAACGCCGAGACTGCAATGCCAAACCGAACGCGTCAGCGCCACGTAAAGTAAACGCAGATCTTCCGCCAGACGTTCGGCCTCCGCGAGGTCGACGCTTTCTGGCGCAGCATTAAGATCCAGAACGGCCTCAAACGAGTGGCGATCGTGATAAAACGCCTGATCCTGGACGCGGAAATTGGTAATAAATGGCAACCAGACCAGCGGATATTCCAGCCCTTTTGATTTGTGTATCGTGACAATCTGCACCAGATGTTTATCACTTTCGAGGCGCATTTGTTGGCTGGAGGCATTACTGTCTGGCTCGAGGATATGTTGCGATAACCAGCGTACCAGCGCATGTTCACTTTCCAGCTGCGTTCCGGCTTCTTGTAGCAGTTCGCTGATATGCAAGATATCGGTAAGACGCCGCTCACCGCCTGCCGTTGCCAGCAAGTTTTCTGCAATGTTACGCGCCGACATCAGCGCCCGCAGCATCGGCATAACGCCACGTTTGCGCCAGATTTGCCGATAACCATCGAACTCTTCGACGACCGCATCCCACGCATGTTCGTCATTATTCAGCGTTTCAATATCCAGCGCATTCAGCCCCATCATTGACGTTGCCAGCGCACTGCGCAGGGTGTTCTCACGTTCGGGCGTCATCACCGCCTGCAACAGCCAAAGCATCTCCTGTGCTTCCAGAGTTTCAAAAACACTGTCGCGGTTCGAAAGGTAAACGGAAGGGATTTCCAGCAGCGTTAAGGCATCGCGCACCTGAGCGGCCTCCTGGCGGCTGCGCACCAGCACACTGATGTCCGAAGCACGCACCGGACGCGCATCGTCGCCGTTCATCAGCAACGCTTCGCCGCGTTGCCCGGCTTGTAGCCAGTCGCGGATTTGCGCAGCACATACCTGCGCCATGGTACTTTGATAGTCGCCAACGCCGCAGCTTTCGCCTTCCATCAGCCACATTTTCATCGCAGGCTGCGTTTCACCTTTAAATACAAAACGTAACGCCTGATTTTTGCCGGCAGATTTCACAGGAATAAACGGTATTTCACGAAACATGAACGCGTCATCAGTCTGGCTGAAAAGTTTGTTAACGCTGTTCACCATTCCCGGTGCGGAACGCCAGTTGGTATCTAAGGTGTAGTGAGCATGAACTTCGCTACGCGCCTTCATATAAGTGAAGATATCCGCACCCCGGAATGCATATATGGCCTGTTTCGGGTCGCCAATCAGCAACAATGCGGTTTCCGGCTGATGGTGCCAGATACGGCGAAAAATTCGATACTGTTGGGGGTCGGTATCCTGAAATTCATCGATCATTGCCACCGGGAATCGCGTACGGATCGCCGCTGCCAATACCTCGCCGCTTTCACTACGCAGCGCGGAATCGAGCCGACTTAACATGTCATCAAAACCCAATTCGCCACGGCGGCGTTTTTCACGCGCTACTGTTTCGCGGATCTCAGCCAATGCGCGAGTGATCACCAGATCGCGGATCGACAATGGTTCTGCAAGCAGTTGTTCGATCGCCTCAAACAGTGGATGTCGCGGGGTTTCCCCCCCGGCTTTCGTGCGATCTTCTAAGAAACGCTGAGAGAATTTTTCCAGCGACTCCGGCAACTGATAGCTGTTGGTCTCTTCTTCTGCCCAGGCGCTGATCTTCTCGATCCATTTAGCCTGATTGCTACGGTTAAACTTGCGTCGATCAATACCAGAAGATTCGATCAGCGCATCCAGTTCACC
CACTGCGTCGCGCCACTGCTGTTTTACGGCATCAATACGCGCCACAATTTGCGCGTGGCGGGAAGCCAGCGTTTCATCATCGGGGGGCGGTGCTTTGATAACCGGCGCTTCGCCTTGCAGATAACGATTAATATCGCGCAGCAACGCCTGCGGCCCTTTCCAGGTTTCAAAGACGACCTGGGCAATTTCACGCGGCAGCGGGTAGCAGTGGCGACGCCAGAAATCGGCGCAGGCCTGGTAGCGTAGCAGAGACTCATCTTCAATCAGCTGCTGCTCAAACAGCATGCCGGATTCAAAGGCATTCAGGTTGAGCATGCGCTGGCAAAAGCCGTGAATAGTAAAGACTGCCGCTTCATCCATCTGCCGCTCGGCTAACAACAACCACTGCGCGGCTTGCGCTTTATCGTCGATCTCTTCCAGCAGGCGTTTGTACAGTGGATTGTCGGTGGTTTCACGCAGACAGGCGATGCGCAACTCGTGGATATTGCTACGGATACGACCACGCAATTCTGCCGTAGCAGCCTCGGTAAAGGTCACCACCAGCAGTTCTTCAACGGTCAGCGGGCGGGGAAAGGCGGCAGAACCGCCTAGTCCAAGTAACAGGCGCAAATAGAGCGCCGCAATCGTAAAGGTTTTGCCTGTGCCGGCAGAGGCTTCAATCAGGCGCTCGCCCTGTAAGGGCAAGCGCAAAGGATCTAGTGTCTCGGCGACATCACTCATTCTTTTCACTCATCAGGGGCATTGTTTGCTGCAACGCGCTGACGTTCTCCCACACTTTCCAGCCTTCAGGATGCACATATTCGGCTTTCCCGTTCTGGCTGCCGGAAATCTGCGACAGAATAGCCATACCTTGCGGCTCGACCACCGCCTGATGGAAGAAATCAGCAAGTTTTTGCGGCGTCAGCAGTTTTATCTGGGCCACGATTTTATCACGCGAATCGAAGCGCATATTGCCGCGATCGAAATCTTTACTTAACTTCGATGCTTCTTCGCCGAGCGTTTGCGGTGCCTGCAGCATCTGAGTAATTACCGCCTGCTGGATTTGCGCAAACTCCTCTGGCTTCATCGCCCGCAATTTTGCCTCTGCGGTTGGGAAAAACGCCTTGTAACGCTCCCACAAGAATGAAGGCTGTTTATCATTGCTTTGCAAAAGGAAGCCCATGCCCCACTGACGCCCCACGCTCATTGGAAACGCAAACACGGCATAGCCCAACTGTTCTTCGGTACGCAACTGATTGTAGAACCACGGCTGTACGATCTGCCCCAACAGAGAGCTATAGGCTGAGCTGGTGTATTCATCGTAGCCAGTCGGTACAAATATCGCTGCCAGTGCGGAGTCGGTGCTGTTACCAGCTTTTTCAAAGATGACGGATTGTTTTTTATCGACCACGACATCTTTGTTACGACACCACTCTGAACCATCAGCGCCCAACTGTTTTTGCACATGGCGTGCCAGCGTTGTTGCCTGGGCTTCAGTCATGTTGCCGATAACCATAAACTCTGGTCTAGCCCCTGATTTTAAGGCGTCGCGATAGGCCAGCACCTCTTTCAACGTAATGGAGGGCAAAATTTTGCGCCGTTCATCTCGCGAGAAGTACGGCACTTGCGAGAGCATCTGCGCGGGCATAATCGCCTGCTCAAACGCTTTGCCCTTTTCTGCGGAATCCATCATCTGGTTATACCAGGACTTCGCCTGCTCAAGCTGATCTTCCGTAGCGGTATAGCTAAAGTAGCCCTCCAGCAGAGCCTGGAACAGCTGCGGCAGGCGCTGAGTGTAACCATTGGCATTAACCATAAGGCCGTTGTTAGCATTGGTGGAAAAACTTATGCCACCAACCGACGCCTGGTTGCTTAACTGATCAAGCGCCAGCCCTGCGAGATAATCATTGAGCGCAAACATCACCTGATTGCGGGCGCTGTCCATGGCTTTCGGATTACGCAAAATCAGGCTGACATCAGCTTTGGGCTCACTGGCAAAATAACGGCTTGGCGCATACACC
ACGCGCAGATTCGACTCATCAACAATCAACTCTGGATGGTCGTATTTCTTCTCTGACTTAATCAGCGAGAAATCGTCAGGAATATAGGGGTTAAGCTCCGGTAAGGAGAGCGCAATATTGGCGGCTTTTTTCTGCCAGTCCGCGAAAGTTTGTGCGCTAATTTTATCGACCTGATACGGCGCATCGACAAAGTAAGCCGTTTTGTTGTGCGGCTCTTTCGGGCTGATATACCAGATACGCGCATTCTGCGGCGTCATCATCGCCAGACGTTCTTTTACTGCTTTAGCATCGTACCGATCGGCAATATTGACTGCATCCAGTGTATGCTCAACAGGAACGCGAATCATGGTATCAGCCAGCCATTCGACGTAATCCATATCACGGGTGATTGACGGATAACGGAAGTCGATATCCAGCACATTCGCCAGTTCATCGAAGTATTGTTTATCGATCCCTTTTTCACGTAACAGATTGAGGTAGCTAAAAATGGCCGCCACAACCTGATCGCGATTCGCCAGACCTTTATCGGTTAAAGACGCAGAGATCGCTAATACGCCGCTGTTGCCGTTGACGATAGGATCGGAATTGGCGCTAATGCCCTCAACTAATCCCTGCTTTTGCAGCCAGTCAGAAAGTGTACCAGGGCTGCGATTACCAATCAGATAGGTAATCAATTCATCCGTTTTACTACGGAACTTCGCTGAATTGTTATCGATGCGAAACTCAACGCGCAGAACTTTACGCGGCAACGCCGGGACGTAATGAATGATAATGCCCTTTTGCGCGTCGGTGACTACCGGCACGGTGATTTCCGGTTTTTTGCTCTCTTTGTTCGGCACGCGACCAAAGGTGTCCGCCGCCATTTTCGCCAACTCCGGCAACGGTTTATTGCTGTAAATAACCGCCTTCATCAGATTGGCGGAATAGTACTTCTCGTGGAAATCTTTCAGCGCCTGCTGTACCGGATTACCTGGTTTGTCGCTTAAAGTTTCGAGGTTACCACCAGAAAACTTTGAACCGGGGTGTGCCGGGTTAATGGTTTCTGCGCTGACCTGTGCCATGCGCATCCCGTCACGCGTACGCGCCATGGTTAATTCGGCATTCACTGCATTACGTTCACGTTCGGCGTATTTCTTGTCGAGCAAGGGTTCTGCAATAGCATCGGCCAGGCGGTCTACCGCACCGGGCAAGGCGTCGTTCTCAACTTCCAGATAGAAAGCCGTGCGATACGGTGCCGTGCTGGCATTGTGACTGCCGCCGTGCATTTTGAGATATTCGGCCAGACTGTCAGCCTGCGGATACTTTTTCGACCCCATCAGACTCATATGTTCAAGGTAATGTGCCAGCCCCTGGTACGCCTCAGGATCTTCCAGCGACCCAACGGGCACCACCAGCGCCGAGAGCGATTTAACTGCCTGCGGATCAGAAACCAGTAAGACCACCATACCGTTATCCAGACGTATAGCCTGATACTGGCGGTTATCTTTATCACTTTTACGGATGGTTTCCTGAATCGGCTGCCATCCCGTTTCTGCCTGACTTAAGGGTGCCCAGAGGGCAACAAACAACAATAATGCTTTGAACCAGATGCTGCGGGGCATTCACGGACCTCATAATCAACTTTATTTTCTGGCCAGATTCAACACGTTAACGCAAATCATCTGCCAGAATTTAATCTTGTGCTGCACGAGTCAGCCTATGTCTATATAACCATCAGTCCGTGACTGGTGCGCATCATAAAGTAAGCGGATAGATTGCGCAATTTTTATACAATACTCATGACTGATTAAAGCGAAACAGCGGTAACAGGAAACGTTGCGACTGTTCAACGATAGCCTCCATTGTCTCTGGTGTTAATTGCCGCCAGAGCCGTTGATACCAGATATCATCACCTTCGCCACGCACCATCATGTTGCCTTCGTAAGCCTGAAGGAATTTCGTACGGGCTTTTTGCAACGTGGAATCGTCATCCAGCATGGCATCGTTTTGCGCGTCATAAC
AGGTTTTTAGCCACGCGCCGCCACTTTCAGGTAACACCAGCAATGGCGCGGACATTCCTTCACGATACCCCTCAATCAGTTGTGAGAGGTAATGCAAAGCCTGTTCGGCTGCAAGCGGCGGAAAACGCCACTCGCCGTCTTTGCGTAGAAAAAGGCGACTTTCACCATTACCACCGCTGGCACAGTAGACAAGGTGTTCCAGCCAAAGTTGCATTCCCTGCGCCACACTTAATAAAGAGGGACACCAGCGCAACAGGCCATCCGGCTGCACCTGCGGCAACCAGCCAGTTATCTGCACACCGTTGCAGGCGAGATCAATCTCCATACTCTGCCCTGGCTGGCGACAGGCAATGACTCTGTCGGCAAGCTGCTGCATCTCCTGACACTGCGTTTCCCAGAAAATTTCACCAAAGGCACCATACGGCAAATCACCTGCCGCCCGGAATCGGCGGAACAAGCGTTCGGCATCATCCTGCTCAACCAGTACATTTAATAACTGCTGGTTGATTTGATAACGACTAAGCCCTTCAAGAATAAAAGGTTCAGTGTCGGGAATTTCGCTGTCTTCGGTACGGAAGTTCACCTGCAAACGCATCTGGAAAAACGCCCGCACCGGATGTGCCCAGAATCGTTGTAGCGTTTCCAGCGGCACGGTTTCCGGTAAGGTAAATGGCAGCGGCTGAACAAATTCAGAATGTGCTTTACCAGCCTGGCTGGCCGCAGGTAGCCACTCGCGCGCATAGCTTTGTAAGTTACCGGGCTGGTAGTTTTGCGGGTCAAACGGCATCCGGGTATGGTGGCAAGTAAGATGCGCTTTTACCCTTGCCTCGCTTTCATCACAGTTAAGCGCTTCATCGCCCGGTAGATAATGGCTTTGCCCGATGTAGTCGATCAGTTCCTGCACCAGTACCGACGGGAAACGTTCACTGTTATCCTGAATGGAACGCCCAATATAGCTGATATAGAGTTTTTGCTGCGCGGAAATTAACGCTTCCAGGAACAGATAGCGGTCGTCATCGCGACGGCTACGGTCGCCACGCTTCGGTTTCTGGCTCATCAGATCAAAGCCCAATGGCGCAAGCTGACGTGGATAAACGCCGTCGTTCATTCCCAGCAGGCAAACCACTTTGAACGGAATTGAACGCATTGGCATCAGAGTACAAATGTTAACCGGTCCGGCGAGAAAACGCTGGCTGATACGTTCTTGATCCAGGCGCAGTGCCAGTTCATCACGCAATAGTGACAGCGGCACCGCGTCGCCATACTGCGCGCCTAAACCTTCGGAGATAATCGCCTGCCATTGTTGTTCGATCAGCGTCATCGCCGCTTCGGTTTCCGCATCCGGCAGGAAAAAGGCGTTGAGCATATCGCGACAAACCGGCAACCACTCTTCCAGCGGACGCTCCTGCGCCAGCCCGCGACGCCAGATATTTAGCTGCATTAGCAGTGAAGCCAGATGCCCCACCAGTTCTGCAATTAAGCCGCTCGATTCATCATAAGGTAGAACCGATTGCCACTCGCCCTGCGCGCTCTCCATCGCGTAGCCCAGCAACATGCGCGTCAGGCCAAACCGCCAGGTGTGTTGACCGGTAGCGGGAAGTTCCAGCTCGCGAACGTTGTCGTCATCTATCCCCCAACGAATGCCGGATTCGTTGACCCACTGACGTAAATAACGCAGCCCTTCTTCGGTGATGTCAAACCGCGCTGCCAGCACCGGCACATCCAGTAATGCCAGCACGTCTTCCGACACAAAGCGGCTGTCTGGCAGCGATAACAGGCTGATAAACGCTTCAAGTACAGGATGCGACTGCCGCGCCCGACGGTCGGAAATGGCGTAAGGCAGGTAACGATCCGCAGGTGCACTACCAAACACAGCCTGAATAAACGGACTGTAGCTGTCGATATCAGCCACCATCACGATGATGTCGCGCGGAGTAAGTGTCGGGTCTTCCTCCAGCATCGCCAGCAGGCGATCGTGTAAAACTTCAACTTCACGCTGC
GGGCTATGGCAAACGTGGAAGGTGATACTGCTATCCAGTGGATCAAGCGGGCGTTTGTTATCGCTACGGGAAAACTCTTCGATGTTCACACCAGCAACGGCGCGGTTTTCCAGTTCCAGAATGTCAGACTGAATATTATGCAGCAGGTTATCTGGCGTCACATCGACAAAAGCGTCCAGCTCCTGGCTGCTCTCCAGGTCAGAAAGGAGATAAATGTAGTCGCGCCCAAGCTTGCCCCATGAAGCCAGCAGCGGGTTGCCGACATCCTGTTCACCATCGCTGTTAAAGAGCTGCCCGGCATTTTCGCTGTCGCGAAATAGCGGTAATTCGCGATCTTCAAAACTGTGTCGGCGCTGGCGAGTCAGTAGTTTCGCCAGATAAGCTGGATCTTTAATGTCGCCCCAGTAATAACGGCAGGGGTTGGTAAACAGGAGATGGATTTCAATATGTTTACCCAGCGCCTGTAGCGCCTGGAGATAAACAGGCGGTAACGCGGAAATACCGCATATAAAGACGCGCGAAGGTAACCCCGGCGGGCAGGTCGTCGCGGACTCCAGCGTTTCGATAAAGCGCTGATAGAGATTGGCGCGGTGCCAGCGCGGTTGCCCAAGTTCGTCGGTATATTCCACCAACGCCTTCCACAACGGCGCTTGCCAGGCCTGTGCTTCTCCCAACCCTTCTACCAGATGTCCTGTTTCCCACTGTGCCAGCCAGTCCGGACGATAGACCAGATACTGGTCAAACAGGTCCGCCGCTTTTGAAGAAAGCTGGAACAGTTTTCGCTTGTCACTATCGTCAGTCAGATAATGCCGCAACAGGGTAAAGTCTTCGCGCTCCAACAGTTGCGGCAGCAGAGTCATCAGTTTCCAGCTCATGCTCTGTTTGTTAAAGGCGCTCTCTTTGGGGATCTCCGGTAACACCCGGACGAACATATCCCAGATAAAGCTCGCTGGCAGCGGAAAATCAATGTTTGCCGCAATACCAAACTTTTGCGACAGGGTCATTTGCAGCCACTGTGCCATACCGGTACTTTGCACCAGAATCATCTCTGGTTCGAAAGGATCGTCCAGCCGTTCGCGTTCGACAATAAACTCCATCAACGCTTCCAGCACGTCCAGACGATTGGAATGGTAGACCCTTAACATAGCGGCTCCTGACTACTGACGATTCGGGCAATGCAGGCGGGTCATCTCGCCTTCTCTGCCCCCGGGTGAAACTAGCGTAACGCTGATGCTGACACATCCCGCCTGCGATGTCTGCATTCGGTTGACCTGCCAGTTAGCAGGTGGCGAAATCGCGCGCAGTTGCGTTTGCTGCCAGCCATGCCGCCAGAGCTGTTGGTACTGGTTTCTGCTGGCAAGACTGTTCATTAATGTTCGCTGGAAACCCGATAACGCAGTGACAATCATCACCATCAACACCATCGCCAACATTACCTCCGGCAGACTAAAGCCTTGTTGATTCCTCAGGGAAGCTGACATAACGCCCTCTCTTTCAGCGGACAAAAATCGCTCCAGCCGCGTGGCGAAAAAACAATGTTTCCATCGATGACTTCGCCTGTTCGCCACAACGAAACGCCTTCATAACCAGCAATCAATAAGGCTTCATTATCTGCCAGTAAACGCAGACAAACCCGGGCACCGGTGGCAGCATACAGTAAGCACTGAACTGCGGGCTGCGTCTGCCAGGAGTGCATTTTTCCCCACTCCAGCGCCGACTGAACGATGGCCTGGCGGCTCAATGACTGACTTTCCATGCTCACGCGAGAAGCAAAACTGCGATCCTGCTGACTCATTCCTTGCAATAGCAAGCTACCCAAAATCAGCAGCATCAGGACCAGAGCCAGTGACGAAACTCCCTTTTCGCGGTTCACAGGTTGGCTCCTGTCACGCTATAGCTGGCATCCACCACGGTTTGCGGATCAGCCTTGCTGGCAGCGTGTATATTAACCGTCAACACCGGCGAGAAGCCGCTGACATCCTGACGTACGACCTGAAAAG
TGTCGATAATGATGGCATCCGGATTAGTGACTTTATCCCAGCCCTTACCTTCACAGGATGTCGCACCGCGTAGCGTTTCCAGCACATGCTCCTTCAGACGAAATCCAATCTGGTCGGACTCTTTTACCGGTTCGCGATCCCAGATACCGTTACTGTTCGCATCCCACTGCACAATGACACAGTCACCCTGTCCGACAATTTCCAGCCCTTCGCCCGTACAGCTGCCATGGCAATAACCCGCCCTCTGGAGATGCTTCGCGACGGTAAATACCCGCAGCCAGATTTCATCTTCCAGCGCCAGTTTACGGGTGCTCGTTAAACTTTCACGCTGTAACGCAGGCAGAAAGCGTGCAGCCCCCAGCAACAATACGCTACTGATCGCCATAGCAATCAACACTTCCAGCAGAGAAAAACCTTGCTCTTTTACAGGCATCCTTCTGTTTCTCCTTGCTGACAAAGCCGGAGTCTTCCCCACGGCGAAACCACTAGCCACCACTCGCCCGTTGAGTTTTTGAAGCGAATATGCCCGGCCCATGCGGTATTGCGCAGGCCAAAGAAAGCAAGCGAAGGTGTCAGGTCGCTCATTTCGACTTCGGGCCAGCGCGGCACAAAGACCAATGGTGAACTGCCATGACAGGTATTCGCCCCAGCAACGGAACTGCCATGACAGGTATTCGCCCCAGCAACGGAACTCACAAGGCACCATAACGTCCCCTCCCTGATAAGACTGATACTGTGGTCGCGGTTATGCCAGTTGGCATCTTCACGTAAATAGAGCAAATAGTCCCGCGCCTGGCTGGCGGTTTGCCAAAGCCGTTGCGACTGCTGCCAGTATTGCCAGCCATAGAGCCCACTTGCGCTTAGCATGACCAGAATAAGCATCGCGACCAGCGTTTCAATCAGCGTATAACCACGTTGTGTTTTCATGCCGGCAGTATGGAGCGAGGAGAAAAAAAGACGAGGGCCAGTTTCTATTTCTTCGGCGCATCTTCCGGACTATTTACGCCGTTGCAGGACGTTGCAAAATTTCGGGAAGGTGTCTCGAAGAATTTAACGGAGGGCAAAAAAAACCGACGCACACTGGCGTCGGCTCTGGCAGGATGTTTCGTAATTAGATAGCCACCGGCGCTTTAATGCCCGGATGTGGATCGTATCCTTCAATCTCAAAGTCTTCGAAACGGTAGTCGAAGATGGATTCGGGTTTACGTTTGATAATCAACTTCGGCAGCGGACGCGGTTCGCGGCTTAATTGCAGATGAGTTTGATCCATATGGTTGCTGTAGAGATGCGTGTCGCCACCGGTCCAGACAAAATCACCCACTTCCAGATCGCACTGCTGCGCCATCATATGCACCAGTAACGCGTAGCTGGCAATGTTGAACGGCAGGCCGAGGAAGACGTCACAGGAGCGCTGATAAAGCTGGCAAGAGAGTTTGCCGTCTGCCACATAGAACTGGAAGAATGCATGGCACGGTGCCAGCGCCATTTTATCCAGTTCGCCTACGTTCCACGCTGAAACAATAATGCGGCGGGAATCCGGGTCGTTTTTCAGCTGGTTCAGTACCGTAGTGATCTGGTCAATATGACGACCATCCGGCGTTGGCCAGGCGCGCCACTGTTTACCATACACTGGCCCGAGGTCGCCGTTTTCATCGGCCCATTCGTCCCAGATGGTGACATTGTTTTCGTGTAGATAAGCAATGTTAGTGTCGCCCTGCAGGAACCACAGCAGTTCGTGGATGATGGAACGCAGGTGGCAACGTTTAGTTGTCACCAGCGGGAATCCATCCTGCAGGTTAAAACGCATCTGATGACCAAAAATGGAAAGCGTTCCGGTTCCGGTACGGTCGTTTTTCTGTGTGCCTTCGTCGAGCACTTTTTGCATCAGTTCTAAATACTGTTTCATGGTTCCTCAGGAAACGTGTTGCTGTGGGCTGCGACGATATGCCCAGACCATCATGATCACACCCGCGACAATCATCGGGATGGAAAGAATTTGC
CCCATGCTGATGTACTGCACCCAGGCACCAGTAAACTGCGCGTCGGGCTGGCGGAAAAACTCAACAATGATGCGAAACGCGCCGTAACCAATCAGGAACAAGCCTGAGACAGCTCCCATTGGGCGCGGTTTACGAATATACAGGTTGAGGATAATAAACAGCACCACACCTTCCAGCAGCAGCTCGTAAAGCTGTGATGGGTGGCGCGGCAGCACACCGTAAGTGTCGAAAATGGATTGCCACTGCGGGTTGGTTTGCAGCAGCAAAATATCTTCTGTACGGGAGCCAGGGAACAGCATGGCAAACGGGAAGTTCGGGTCAACGCGGCCCCACAATTCACCGTTAATAAAGTTGCCCAGACGCCCGGCACCAAGACCAAACGGAATGAGTGGGGCAATAAAATCAGAGACCTGGAAGAAGGAACGTTTAGTACGGCGGGCGAAGATAATCATCACCACGATAACGCCAATCAGGCCGCCGTGGAAGGACATGCCGCCGTCCCATACACGGAAAAGATACAGCGGATCGGCCATAAACTGCGGGAAATTGTAGAACAGAACATAACCAATACGTCCACCGAGGAAGACGCCGAGGAAGCCCGCATAGAGTAAGTTTTCAACTTCATTTTTGGTCCAGCCACTGCCCGGACGATTCGCCCGTCGTGTTGCCAGCCACATTGCAAAAATGAAACCCACCAGATACATCAGGCCGTACCAGTGAAGCGCCACGGGTCCTATTGAGAAAATGACCGGATCAAACTCCGGAAAATGCAGATAGCTACTGGTCATCTGTCACCACAAGTTCTTGTTATTTCGCTGAAAGAGAACAGCGATTGAAATGCGCGCCGCAGGTTTCAGGCGCTCCAAAGGTGCGAATAATAGCACAAGGGGACCTGGCTGGTTGCCGGATACCGTTAAAAGATATGTATATGATCCGCGCTATAACCCCCCGCGAATCAACCCGCCCATGCCGCGACGCTCCATAAAGGCTGCAACCTGATGGCGAACTTCGGTCGCCAGTTGCGCTTCCAGACTACGCTGCGCAAGATTTTCTGCTTCAGCAAAATCAATGCGCCGCAGCAGGTATTTTACGCGCGCTACAGAACGTCCGTTCATAGACAGATGGCGATACCCAAGCCCAATGAGGATTGCCACGCACATCGGATCGCCCGCCATTTCACCGCACAAACGGAGATCGATTCCATGTATTTCCGCTTCCCGGGCGATCATCGCCAGAGCTCGTAACATTGCAGGATGAAGACTGTCATAAATGTTCGCCACCCGGGTATTGTTGCGATCAACGGCCAGGATGTATTGAGTCAGATCGTTGGTGCCAACAGAGATGAAATCGACCCGCTTTGCCAGATGCGGCAGCATAAATACCATTGACGGCACTTCCAGCATGATGCCGATACGTGGTTTGGGAATTTCGTAACCGATCATCTCCTCGACTTCACGTCCGGCACGTTCAATCAGGCGGCGTGCTTCGTCAACTTCATCGAGGCTTGTGACCATCGGCAACAGAATATTCAGGTTGCCCGTAGCGGCATTAGCACGCAGCATCGCCCGCACCTGGATCAAGAAGATCTCCGGCTGATCGAGCGTAATGCGAATCCCACGCCAACCCAGGCATGGATTCTCTTCGCTGATCGGCATGTAAGGCAGCTGCTTATCTGCTCCGACATCCAGCGTACGCAAGGTGACGGGTTTATCATTAAACATTTGCAGCATCCCCTGATACTGCGCCACCTGTTCTTCTTCCGACGGAAAACCACTTTGCAGCATGAATGGGATTTCAGTGCGATAAAGTCCTATGCCATCAATACGGCTGCCCAGTTTTTCTTCATGTTCCGGGCTTAAACCGGCATTGAGCATGACTTTAATGCGTTCGCCGCTTTTTAACTGGGCGGGTAAATTGACGTCATCTTCCGCCAGACGGCTAAGCTCGATCTCTTCACTAATTAGCCGCTGATATTCTTGCAGCAGTACCGGTTCCGGATC
GACCAGCAATTCACCGCGATAACCATCGACGATCAGCGTCCGACGATGCAGTACCGAAGGCTGAATATCCGCGCCCATCACGGTAGGTATCCCCAGCGCACGTACCATGATCGCAGCATGGGAGTTGGCAGCGCCATCGCGCACGACAACACCGACTAAGCGATCCTGGGGCAGCTCAGCAAGCGTTGTCGCTGACAGTTCATCTGCCACCAGAATGAAACGTTCCGGCCAGGCGTTCGGCCCTTGATTAGCGTCATCAAGATGAAACAGCAATCGCTGACCCAGCGCACGTAAATCGCCAGCCCGCTCTTTGAGATAGTTATCGCTTAGCGCGGCAAACTGTTCGGCAAATTTTTCAATGACCGTTTTTACCGCCCACTCTGCCACCGAGCCTTTATCAACCTCGGCAAACAATTCGCGACGCAGCCGGGTATCCGAAAGCAGGTGTGAGTAAAGATCGAAAATAGCCGCCGTTTCTTTTTGTGCACCGGCAGCAAAGCGTTTGCTATAGCGGCGAAACTCGTTAGCCGCCTCTTCCAACGCCCCGGTCAGTCGTTCGCGTTCCAGAGCCGGATCCAGCGTTGATGCCTGATACACCTGTTCCATTAAAGGTAACGTGGCATCCTGCCAGCCTTCGGCAATCGCCACACCAGGTGCTGCCGGTAATGCACGGATTCGCGTCTGGCGATATTGCCCAAACAAGGCAGTCAACTGCGACTGAGAAAGAATAGCTGCCATCTGGGTGGCAAGCGTCACCAGGAAGGATTCTTCACTTTCGTCATACTGGCGCAACTCTCGTTGCTGTACCACCAGTACACCAAGCAACTGGCGACGTTGAATAATTGGTACGCCTAAAAACGCGCGGAAACGTTCTTCTTTTACGGAGGGGATGTATTTGAAGCTGGGGTGCTTTTGCGCATCTGCAAGGTTTATCGGTTCCGCCAGCCTGCCAACCAGGCCGACGATCCCTTCATCAAACGCGAGCGTTACAGTGCGACCGCGTGGTTTTTTCAGTCCCCGGGTCGCCATCAGGTAGTAACAACGTCGATCATGATCGGCCAGGTAGACCGAACAGACCTCGGTATCCATCGCAAGACAGATGTCGGTAACCAGAATATTTAACGCCTCATTCAGGCGTGGTGCGCTGGCTACCTTTTCGACTATTTCGCGCAGGCGAGTGAGCATAATTGGCGTGACTTAACCTCTTTTACGTCGATAAGCAGATGCGTTTTGTGGTTTTGGCGTATTTTCCTGCAGTGACATCACCACACTCGCGAACTCTTTCATTACCCTACGGTAGACATCACGTTTAAATGACACCACCTGTCTGACTGGATACCAGTAACTTACCCATCGCCAGCCGTCAAACTCTGGTGTACTGCTGGTTTGCATATTGATTTCTGCATCGCCGCTCACCAGCTGCAAGAGAAACCATTTTTGTTTTTGGCCGATACAAACCGGCTTCGTGTCCCAACGCACCAAACGTTTCGGTAATTTGTAGCGCAACCAGTTACGCGTTGAAGCAAGGATTCGAACGTCTTTGCGGCTTAATCCTACTTCTTCAAACAATTCACGGTACATCGCCTGCTCTGCGGATTCTCCGGGGTTGATTCCGCCTTGCGGAAATTGCCAGGAGTGCTGACCAAATCGCCGGGCCCACATTACCTGCCCCTGGCGATTACAAATCACGATACCTACGTTTGGGCGGTAGCCATCGTCATCAATCACCGGACTACCTCAAAATAAAGCTTTATATACGAATGATTGTTTCATACTCCAGGAAGACGGTAAACCACTCTCTGCAGGGCATTACACACTAATAACAATTGAATAACTCACAGTTATGTGCAGAGTTATAAACAGAGGAAGGGGTGGATAGCCGTTTTTATTCACCTTTTCTGTGGATAGAGTTGTGAAGAACTACGGAATTACTGCGGGAAAACCCGGAGCATTCTGAATAAGACAGATATAGAGATTTTAAAATATTCATTATCAGTCAA
TGCATTACATGTGATTTGAGTAATAAAAAAGAGTAATTCGTGACCCAGGTCACACCTCTCATTTACGGGTTGGCGAAAGATCAACCAATGCCGTATTTATCCACAGAATGTGCCACTAAGTTAAGCACTGAACCACTAAAAACTGGAGTTTCGTCGCACGTCAAGGCTGTAAATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGTGGATAACATGGTGTAAGATCCTGTTTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCAGTGTTGCGCAACTCGATTACCGGAAACCTAAAAAGCAATATAAATCAGAGAATTGAACAACGCATGTGGAAAAAGTTACACTGCGAATATTCGGCACATAATTGCTGTTTGTTTTTTAACCAAGGTATCATGACATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAACAATTGTTAGCGCAAGCACAACAACTTTCTGGTTATACATTGGGAGAACTGGCGGCACTTGCCGGGCTGGTTACGCCGGAGAATTTAAAACGCGATAAGGGCTGGATTGGCGTGTTACTGGAGATCTGGCTAGGTGCCAGCGCAGGGAGTAAACCTGAGCAAGATTTTGCTGCTCTGGGCGTGGAACTTAAAACTATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACATTCGTTTGTGTTGCCCCGTTAACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACAAGCTCAAACGCGTGCTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGCGTCGCGTAGGATCACCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCGAAGACTGGGAAGAATTAATGGATATGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTCGGCACGGGGAATATTTACAGATACGACCGAAAGCAGCGAATGCGAAAGCGCTGACCGAAGCTATTGGTGCCCGGGGCGAACGGATTCTGACGCTGCCGCGCGGATTTTATTTGAAGAAGAATTTCACCAGTGCGCTACTGGCCCGTCATTTTCTGATCCAGTAGCCATCGCTTTGACCTGCCGCTTTCCGGGCATATAATTACCGCTTCATTTTTTTGGCAGGGCTTTTTAGATGTTATTTGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTGCTGGAGATCGTTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTTCCCACAGCACAACGTGCTCATGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGTCTGGCGCTGCTGGCATCCATCGCCTGGGTTACGCGCCTGACGAATCCGCTTTTTACAATATTCAGTCAGGAAATTTCCGCCCGTGATTTGATTCTGCTTCTGGGTGGCTTGTTCCTTATCTGGAAAGCCAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGGGCTGAAAACACGCGTTTCATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGCCTCGACTCGGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCCGTGGTAATTGCCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAGCGCCATCCTTCGGTAAAAATGCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTGATTCTGGAAAGTTTCGACATCCACGTACCGAAAGGTTACATCTACTTCGCGATGTTCTTCTCTATTGCGGTTGAAAGCCTCAACCTGATTCGCAACAAAAAGAATCCGCTCTGATACTCCGTACGCTCTCCTGCGGGAGGGCGTACTCACTCCTGTTACCCTCACAGTTTAAGATTTTCCTGCTTTCAAGATATATAACGTCGGTTTATAAACAGACTATTATCATAGGT
GGGCCAAATGAGGATAACCGGATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGGTGTTCCAGTGATTACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAACCTGAAATTGATGATGATACCGGGCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATGCAAATTAACCGTGATGATGTTTCGCAAATTATTGAACGTTAACAAATAAGGTCAGCATCCGGCTGGCCTTAAGATTTTTCTCTTTCCCTTTTCCCTTCCCTCTGCCATTTTTATATTCCTTATGTCGTGATTATAAAAAGGAAACGGCTATGCAATATCACCGTATACCCCACAGTTCGCTGGAAGTCAGCACGCTGGGGCTTGGCACGATGACGTTTGGTGAACAGAACAGCGAAGCCGACGCCCACGCACAACTCGACTATGCCGTCGCTCAGGGCATTAACCTTATCGACGTTGCCGAAATGTACCCAGTACCTCCGCGCCCCGAAACTCAAGGGCTAACCGAAACCTACGTCGGCAACTGGCTGGCGAAACATGGCAGCCGCGAAAAGTTAATTATCGCCTCCAAAGTGAGCGGACCGTCGCGCAATAATGACAAAGGCATCCGCCCGGATCAGGCGCTGGATCGGAAGAATATCCGCGAAGCGCTGCATGACAGCCTCAAGCGTCTGCAGACTGATTACCTCGATCTTTATCAGGTGCACTGGCCGCAGCGCCCAACCAACTGCTTCGGCAAACTCGGTTATAGCTGGACAGATTCTGCGCCTGCGGTTTCGCTGCTGGATACACTGGACGCACTGGCAGAGTACCAACGCGCGGGAAAAATTCGTTATATCGGCGTGTCGAACGAAACTGCATTTGGCGTAATGCGCTACCTGCATCTGGCGGACAAACACGATCTGCCGCGTATTGTCACCATTCAGAACCCCTACAGTCTGTTAAACCGCAGTTTTGAAGTAGGTCTGGCAGAAGTCAGCCAGTATGAAGGGGTCGAACTGCTGGCCTATTCGTGCCTGGGTTTCGGCACGCTGACCGGGAAATATCTCAACGGTGCAAAACCCGCTGGCGCACGTAATACGCTCTTTAGTCGGTTCACCCGCTATAGCGGTGAGCAAACGCAAAAAGCCGTCGCGGCGTATGTTGATATAGCCAGACGTCATGGCCTGGATCCTGCACAGATGGCGCTCGCTTTTGTACGCCGTCAACCGTTTGTTGCCAGCACTCTGCTGGGCGCAACCACGATGGAGCAGCTGAAAACTAACGTCGAAAGTTTGCATCTGGAGTTAAGCGAAGACGTGTTGGCAGAAATTGAAGCGGTGCATCAGGTTTACACTTATCCGGCACCATAAGATTAACGCCGGTTAAAACCGGCGTTAAATATTAATGACGGCGCTGCCAGATCCACAGCGCCGTTATTGCCAGCGCAAACAGCGCACCGAAGCCAATGCCAATGGGCACGACCGGGATGCCTACCATTACCGCCAGCGAGTAAATGCCCAGCATCAACAACATGGCGCTGTTTTCGCCAAGGTTTTGTACTGCAATCGCATTCCCCGCCCCGACGCTTTTTTTGCCCCGCTCCTGTAGCAACGCATTGAGCGGAACGACAAAAAAGCCCCCCAGCACGCCAATCAGCATCAACAAAGCATAGGCTGGCAGCAGCTCGTGTTGCAGGGAGAAAATCAGTACCACCACGCCAATCAAAATCCCGGCTGGCATACAGCGTGACACGGTTTCCAGCGTAACTAACTTCGCTGCCGCACCTGCACCAACCACGATACCAATCGCTACCATCGCGTTGAGATAGGTCGGCGTAGCGTTATCGGTAATACCCAGCGCCACCGGTACCCACAGCACCAACAGGAAACGCAGCGTGACACCCGCTCCCCAGAATAAACTGGTGCCCACCAGCGAAAAACGCGTTTCACCATTGCGCCATAGCGAGGTGCAGGCATTCAGGA
AACTGCGGGTCATGCTGATGAGATTCCAGGACTGCCCCGGACGCGCCGCCGCCAGTTTGGGAATGTAGATATTGGCAACGACCGCGCCACCGTAGGCCAGTGCGCATGCGACCAGGGCAACCAGAATATGCCAGTCAGCCAGAACACCACCAGCTACGGAACCGAGCAAAATCGCCGCTATGGTAGACGCTTCCATTAAACCGTTAGCTTTTACTAACTTACTACCCGTGGTTAATTCGCCGAGAATACCGTATTTCGCCGGTGAATAGGCTGCAGCACCAACACCCACCAACGTATAGCCGAGAAACGGATTGATACCAAAGCAGATACTGGCTGCGCCCAGTAGCTTCAGGCCGTTGGCAAACATCATCACCCGGCCTTTGGCGAAGCTATCCGCCACCTGCCCGACAAACGGCGCAAAAAGAATGTAAGCACCTACAAACACCATTTGCAGGATGGGCTGGCTCCACTCCGGATAGAACTGCGCTTTCAGTAACGCCAGAGTGGCAAACAGTAGCGCATTATCGCCAAACGCAGAGAGAAACTGCGCCACGATAACCGCTTTCATCCCCTTCGACCACAACGAAGTGTTAGTGTGCACTGACTCACTCATCGTGTTGTTCCGCTTCGTCTACCCAGCTTTTCAAAGTGACAAAGTCAGGTTTGCCGCTGCCAAGTAATGGCATCTGTTTCAGATAGCGAATATCGCGCGGTACAGCAAGCTCCGGCACGCCGTGCTCGCGGGCATACTGTTGTAACTTATCGCGCGTCAGTTCGTTATCTGTGGTGAAAAGCACCAGTGCCTCGCCTTTGCTGGCATCGCTCTTAATCGCAGTGGCATGGACTTTATCTGGCGAAACACCAAGTGCCAGTTGTTCCACCATTTCCAGCGACACCATTTCGCCTGCAATTTTGGCAAAGCGTTTTGCGCGGCCCTGAATCTGCACAAAGCCCTGCTCGTCAAAACGCACAATATCGCCAGTGTCATACCAGTCGCGCTCCATTTCGCCGCGAATATTCTCGGCGGTGGGCACTTCCAGTACACCAGGCTTCTCCACCCGCAGATAGCCGTTCATTATGTTCGGCCCTTTCAGTTGCAGGCGTCCGCCCTCTTCGATACCAGGAACCGACAACAGGCGCGCATCCATTCCTGGTAGAATACGCCCTACCGTACCGGGTTTCGCCGCCATCGGTACGTTGATAGAAACGACAGGCGCGCATTCGGTCACACCGTAGCCTTCAAGGATGCGCAGGCCAAATTTATCCTGCCAAAGCTGTTTAGTACTTTCTTGTAGTTTTTCTGCGCCTGCCACCACATAGCGTAGACGATAGAAGTCATACGGGTTGGCGAAACGCGCGTAGTGACCGAGGAAAGTGGAGGTACCGAACAACACGGTGCAACTGCGGTCATACACCAACTCCGGCACAATACGGTAGTGCAGCGGGCTTGGATAAAGGAACACTTCTGCACCTGTGAGCAGTGGCGTAAACAGGCCTACCGTCAGCCCAAAGGAGTGAAACAGCGGTAACGCCGACATAAAGCGATCGTTGGTGGTGAAGTCGGCAATCGTTTTAATCTGCTCGACATTCGCCAGAATGCTTTTATGGCTATGGACGACGCCTTTCGGATGGCCTTCAGAACCGGAGGTAAAAAGGATCAGCGCCTCTTCTTCCGGCTGCTGTTTAACCTGTGCCAGACGCGGCATCAGCAAATGAGCGAAGATCCATACTTTGTCGGCAGTGGTGACATCTGCTTTTAAATCTTCCAGATAGACCCAGCGCACCTGAGTAAGTTGCTCCGGCAGATGCCAGAGTTTGCCTTTATCGAGAAACTGACGGGAAGTGAAAATGGTTTTGATTTCAGCCGCCGTAATAGCACTGGTCAACCCTTTTACCCCGGCGGTGTAGTTCATCATTGCGGGAATGCGGCGACGGGCGATGGCCCCAAAAATCACTGCAGCACTGATGCCTGCATTGGGCAGCATTAAGCCGATGCGTTC
GCCTTCAACACTGTATTTTTCAAGGATGCGTCCAACAAACAGCGTTTTCGTAAGCAATTTGCGATAGGAGTCCGGGGTAAAGTTAACGTCTTCGACACATTTCTTCCCGGCTCCGAAGCGGTACATTGCGCTCAGTAAAGATTCGTACAGCGTTTCACGCGGGCGCACCGCCATACGCGCTTCCATCATTATTTGATGCAGCATTTCGCCAGCGATTTTGCGACGGTCACGGGCACGCGGCGCATCCGGCATCTCCACCTGCGTTGGTGGCAAAATATGCAGAGTAATTTGCGGGAACAAGCGACGTTTAACCAGACCTTTCAGGCGGCTGAAGTGCGTAAGTTCCGCCCCTTCAATACGCACAGGAATAACCGTTGCACCAGACTTCGCCGCGACAAATCCCGCGCCATCGTAGATTTTCATCAGCGAGCCAGTGGTGGTGATGCGTCCTTCAGGGAAAATCACCACTGGTCGGCCCTGTTCCACCAGACGTACCAGATGTTTAATCGCCATAGGTTGCGTCGGGTCGAGAGGAACAAAGTCGATAAATGATTTCAGCCAACGCATATACCACTGTTGGCTTATTGAGGTGTAAACGGCAAATACCGGACGTACGGGTAAAAACAATGCCAGCAGTATGCCATCAATAAAAGAGACGTGATTAGGCGTAATTAGAACGCGCTCGCCCTTCAGTGCCTTGGTGTCACCCGTAACGCGAACGCGATACAAAACACGGCACAAATTTCGAAAAAAGCTAAAAAGCATTCCAACTCCCTTTGCTCTGATTCAGTAAAAGCGAATGGAGGGAGATTACACGAGATAAAGAACGCGAGCGACAGTAAATTAGGTGCGAAAAAAAACCTGCGCATCCGCGCAGGTTGGTGCAAGAGACTGGGTACGAAGAGCGTACCGAATAATCTCACCAATCAATACCTCTGGGATCTTGATTGTGGTCTGCACAACGACTCTTCGCCAGCGAGAAAACGCAAAGGAATGAAGGGAAATGCAACGAGGTGTGTAAATTGTCGGTTACTGTTACAGATTGATGACCGGCAAAAAAAAACCTGCGCATCTGCGCAGGCTGGTGTAATTCATGTGCTCAACCCGAAGTTGACTTCACCTATCAATACCTCTGGGATCACCACTTTAGCAACCTGAAGCCAAACGCCACCAGCGGTCAATCGCAACAGCGTTTCGCAAAGTGTAACCAAAGGTTTGCAATCTCTTTTTTTGTCTTACTTATTTGCGTTTGGCTCACATTCCCACAATGAAAACACGCCGCCCCTTGAACCAACGGGCGTTTTCCGTAACACTGAAAGAATGTAAGCGTTTACCCACTAAGGTATTTTCATGGCGACCATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGCGTCATTAATAATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATGGAGTCTCTTAGCTATCACCCGAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAAACGATCGGTCTGGTCGTTGGTGATGTTTCCGATCCGTTTTTCGGCGCAATGGTGAAAGCGGTCGAACAGGTGGCTTATCACACTGGTAATTTTTTATTGATTGGCAACGGTTACCACAACGAACAAAAAGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGCTGCGCTGGTTGTCCATGCCAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGTATGGTGCTGATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGATCGTTACGGTGCCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGTTATCTGTGCTCTAACCACTCTATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGATGCCCTTGCTGAAAGTGGTATTCCGGCCAATGACCGGCTGGTGACATTTGG
CGAACCAGACGAAAGCGGCGGCGAACAGGCAATGACCGAGCTTTTGGGACGAGGCAGAAATTTCACTGCGGTAGCCTGTTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAATGATAATGGTATTGATGTACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTATGTGCGTCCGCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCCGAACTGGCTTTGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGTCCGACGCTGGTACGTCGCCATTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCAACCAGCGACTAACCGCAGTTAAAGCAATTCCAGCGCCAGTAATTCTTCAATGGTCTGGCGACGGCGAATCAACCGCGCCTGACCATTATCAAACAGAACTTCTGGTAACAGCGGACGGCTGTTGTAGTTGGATGACATTGATGCGCCATATGCCCCTGTATCATGCAGTACCAGATAATCACACGCCTTCACTTCCGGCAAGGCGCGGGTTTCAACATTTCCCCCTTCCTGCTGGGTAAAGACATCGCCCGATTCACATAACGGCCCGGCGACGACGGTTTCCACCGTTGGTGCGTGTTCCAGAGAACGACCATCAGCTGCCAGGGCACTGATATGGTGGTAACTACCGTACATTGCCGGGCGCATCAGATCGTTGAACCCGGCATCAACCAGCACAAAGTGGCGGCTACCCATTTGTTTGACGCTCCGCACTTGAGTAATTAATACGCCAGCCTGCGCTACCAGAAAGCGACCCGGTTCAATTTCCAGTTTCACAGGATGGCCCAAATGGCGGGCGATTTGCTCACGCGCGGCATTCCACAGACCATAATAATGTTCGGTATCAACCGCCTCTTCACCCTGTTGATAAGGAATAGAAAGCCCACCGCCCGCAGAAATAGCCTGTAAATCCTGACCGAATTCGAGGACCTGACGCACCATAGCACCACATACCTGTTCCAGATGGGCATAATCGACGCCAGAACCAATGTGCATGTGAATGCCGACCAGCTGTAGATGATGACGTTGTATCACGTCCAGTGCGGCGGGCAGATCGGTGTACCAGATACCGTGCTTGCTGTTTTCGCCACCGGTATTGGTTTTTTGGCTATGCCCGTGACCAAACCCCGGATTAACACGCAGCCATACCCGATGCCCTGGCGAAACCTGACCCAGTTGGTCGAGCATATCAACAGAACCCGCATTCACCGGAATTTGCAATTCACTGACGCGTTCAAGCGTCGCCTGATCGATAACATCTGCCGTAAAAACAATATCATCGGGGTGCGTTTGCGGATTGTAACCCGCCGCCAGTGCACGCTCTATTTCGCCTAACGAGACGGAATCCACTTTTACGCCCTGCTCACGCATTAAGCGCAAAATATGAATATTGGAACAGGCTTTCTGTGCAAAGCGCACCACATCAAACTGTTTCAGCGCTGCAATCTGCCGACGAATAATTTGCGCATCGTAGACCCACACCGGGCAGCCAAATTCTGCGGGCAAACGCAGCAGATTTTCGGCGGTGAGATCGGTATCAGTGCTGAACAGTGAATGTGGCATAACAAACTCCAGATAAGTGCTTTTTTATGATTACGCCACATCATAAAAAGAATAAAAAATATCGATTTATGTCGAGTCTATGCAAAAATGATATGGATTACCGGATTGCGAGAGAGCGCTAATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAATGACCGCCGGAAGCCTGACTGAGGCGGCACACCTGCTACACACCTCACAGCCAACCGTCAGCCGCGAACTGGCGCGCTTTGAGAAGGTGATCGGGCTGAAATTGTTTGAGCGCATACGTGGACGATTACATCCTACCGTGCAAGGACTGCGTCTGTTTGAAGAAGTGCAACGATCCTGGTAC
GGACTGGATCGCATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGGGAGAACTGTCTATTGCCTGCCTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCTTTCTGGCACGTTATCCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTGAAGAGTGGCTCTCGGCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTGCGGGAACAGAACGTACCGAATTACTCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCCATCCGCTGGCGGTAAAAAAGGTATTAACGCCGGATGATTTTCACGGTGAGAACTACATCAGCCTTTCCCGTACTGACAGCTATCGCCAGTTGCTGGATCAATTGTTTACTGAGAATCAGGTTAAACGACGCATGATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGGTACGGGCGGGGGTAGGCGTTTCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTTTAGTGGTGCGGCGGTTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGCACCGCCCGTCATCAGCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGAAACTGGTCACTTCTCTTGACACTATTTTGTCGTCAGCTACGACAGCATAAAAGCGACAGCATCCTCGGCATGGATCGCCGCGGTATCAAACACAGGCAGAACACTGCGCTCTTCTGGCACCAGTAAACCAATTTCTGTGCAGCCAAAAATGACGCCCTGTGCGCCCTGTTCTGCAAGGCGAGCAATCACTTGCGCATAATAAGCGCGTGACGCTTCGGTAAATTGCCCCAGACACAGTTCTTCAAAAATAATCTGATTAATTTTCGCCCGTTCATCCGCTTCAGGAATAAGACAGTTGATGGAAAATTGTTCCGTCAGCCGCCCGCGATAAAAATCCTGTTCCATGGTGTAACGTGTACCCAGCAGCGCCACACGAGTCATTCCTGCCCCGGTAATTGCACGTCCAGTGGCATCCGCTATGTGTAAGAAAGGCAGAGAGCAACGAGACTCAATGGCATCCGCCACTTTGTGCATCGTATTGGTGCATAACACAATACCTTCTGCGCCCGCCCGCTGTAAGCCAAGCGCCGCCTCAGCCAGAATATCCCCGGTTTTGTCCCACTCACCGCGACGCTGGCACTCTTCTATTTCATGAAAATCGACGCTATGTAGCAGCACTTGCGCAGAGTGAAGCCCACCAAGCCGCTGTTTAATGCCTTCATTTATCAGACGATAGTAAGGAATAGTGGATTCCCAGCTCATTCCTCCCAGCAAACCAATTGTTTTCATTCCTCTCTCCTGATGTGTGTTACCGCAACAAGGCTGAATAAGGAACGAGACAAACGCCTCAACGGCCAGGTGCCCAATCTCTATTAACGAAAAAAGGGCCGGATGTACAGCACATCCGGCCCGTGAAATCAGACGCCGATATTTCTCAACTTTTCGCCTGCCATCAGTTTGCGCTCGATATGTTCCAGCGTGACATTTTTGGTTTCCGGAATGAGCCAGAAAGTGATGCCCACAAACGCAATGTTCAGCGCAGTGTAGAGCCAGAACGTACCGGCAGCGCCAATGCTATCAAGCAGTGTCAGGAAGGTCGCGCCGATAATCATATTCGACACCCAGTTTGTCGTCGTTGAGCAGGTGATGCCAAAATCGCGGCATTTCAGCGGCTGAATTTCAGAGCACAAGATCCACACCACTGGCGCGGCGCTCATCGCATAACCGGCAATACACATCATCGTCATGCCAACAGAGAGCCAGGACAAGCCACTGGAAGCCGTACCGTTATCAAACTGCATCAGGCAGTAACCCAGCACCAGAGTGCCTAACGCCATCACGCTGAAACCAATTTTCAGAGCCGGCTTACGCCCTGCTTTATCTACCGTAAAGACCGCAATGA
AGGTAGCGAACATAAAGGTCAGCCCCACGACCAGAGTCGCAATCATCTGTTGTTCTGTGGTCGTAAAGCCCGCCATTTTGAAGATACGTGGCGCGTAGTACATGATGATGTTCATACCGGTAAACTGCTGCATCGCCTGCAACAACATACCGAGAAATACAGCACGACGGACGTTACGGTTGATCTTAAACAGTGCCCAACCGCCCTGTTTTAACTTCAGGCTTTCACGAATTTCGTTGAGTTCTTCTCGCGCTTTTTCCGACGTATCGCGCAGCATACGCAACACTTCTTCCGCCTCAATATGACGCCCCTTTTCCGCCAGCCAGCGCGGGCTATTTGGCAGGAAGACCACCAGAATAATCAGCAGGACTGCTGGTAAAGCAAGAACCCCCAACATTGCGCGCCAGTTACCGCTATAACTGAACGCTGTATCGGATAAAAACGCCAGCACGATGCCGAGTGTGACCATCAACTGGTACATGCTGATCATCTTACCGCGAACGTTTTCACTTGCCATTTCAGAAAGATATAGAGGAGCGGTGTAAGACGCGATCCCAACAGCAATGCCCAACACCACACGAGCGGCGATTAACATCTCTACGCTGGTCGCAAAAGCGGACCCTATCGAACCGAGTACAAACAGGATGGCCCCCGCCATCAGGCTGTATTTACGCCCCAGGCGGAACGACAGCCACCCATTAAACAGCGCACCAATTGCTGCGCCGAGCATCATGCTACTGACCACCCATTCCTGCAAACGGCTGGTCAGCACAAAGTGATCGGTAATGAACGGCAACGCTCCGGCGATTACGCCGATATCAAGACCAAATAACAATCCTGCGACCGCAGCAGCTACCGAAACAAACATATTCATACGCCGCGTATCCCGCAGAGGACGTGGCGTTAAAGCAGATTCCGTATTGATAGTAACCATTTTTTCCTGCCAGCAGAGAGTAAGACATAGTGAAAAAATACGTGAACAATTCACACAGGTGTCAGGTCGGAAATAGCATAAATATGGATTAAATTGCTACGACATGTCGTTATGTGATGGATATTCCAATTTTCAAATTAAGTTGAATTATTGAGATTATTATTAACTACCTAATTTTAAAGCAGATAAAATTCATAAAGTTCATTAATTGATAATTGATATGGATTATTTCATAACCATGATATGGATTATGATGATCTACAGGTATAAAAAACCCTGCCATGCGGCAGGGTCATAAAAGTAAGAGGAATGAATTAACGCGCCAGCCAACCGCCATCCACAGCAATGGTATAACCATTTACATAATCTGAAGCGCTGGAGGCAAGAAACACTACCGGCCCCATCAGGTCACTCGGCAGTCCCCAACGGCCAGCTGGAATGCGGTCGAGAATTTCCGCGCTACGTTGTTCATCTGCCCGCAGTTGTTGAGTATTGTTGGTCGCCATGTAACCCGGAGCTATCGCATTAACATTAATGTTGTGTTTAGCCCATTCGTTCGCCATCAATCGCGTCACACCCATCACGCCGCTTTTTGATGCGGTATAAGAAGGCACACGGATCCCGCCCTGGAAGGAGAGCATTGACGCGATATTGATAATCTTGCCGCCATTGCCTTGCGCGATAAAGTGTTTCGCCGCTGCCTGAGACATGAAGAATACGCTCTTGATATTCAGGTTCATGACATCGTCCCAGTCTGTTTCGCTGAACTCGAGAGCGTCTTCGCGGCGAATCAATCCGGCGTTATTCACCAGGATATCAATATGACCAAACTCCGCTACCGCGCGATCCAGCAGTCCAGGAATGCCATCAATCTTTCGCAGATCGGCGGTCAGGCTTAAAAAACGACGCCCCTGCGCCGTGACCTGCTTGATGGTTTCAGTCGGTTCAACGATGTTAATGCCAACAATGTCACAGCCCGCTTGCGCCAGCCCCAACGCCATCCCCTGGCCCAGCCCAGTATCACAACCAGTGACGACCGCAACTTTACCTTCGAGAGAAAATGCAT
TTAAAATCATAACAATACCTTATTCGTTTATGCCCACAACTAGCGCAAATCTTTAACGGCCACATGGTCCATATCATCAAAAACCTGGTTTTCACCGACCATGCCCCAGATAAAGGTATAAGCTTTGGTTCCGACGCCGGAATGGATCGACCAGCTCGGGGAGATCACCGCCTGCTCGTTATGCATCACAATGTGACGCGTTTCTTGCGGTTGCCCCATCATGTGGAAAACGCAGGCGTCATCATCCATATTGAAATAGAAATAAACTTCCATCCGGCGCTCGTGGGTGTGACACGGCATGGTGTTCCACAAGTTACCTGGAGCCAGCTCCGTCAGCCCCATACTCAATTGGCAGGTTTCCAGCACATCCGGGACAAAATATTTGTTAATCGTGCGACGGTTACTGGTGAGGTTATCGCCTAACGTGACTGGAGATACTTCGTCCGGTGTGACTTTTTTGGTGGGATACGTCGTATGCGCGGGTGCGCAATTGTAATAAAACTTCGCCGGAGTGGCGGTATCAATACTGGCAAAGACAACTTCTTTTGCACCTTTACCAACATACAGGGCGTCGCGGTGACCGATTTCATAGCATTGACCATCGACAGTAATCGTACCGGCACCGCCAATATTGATAACACCTAACTCGCGACGTTCAAGGAAATAGCTTACGCCGAGTTGTTTACCAACTTCCCCGCCAACGGAAACCGTTTTAGTTACCGGCATAATGCCGCCAACAATAATACGGTCAATGTGGCTGTAAACCATGGTGTACTCATCGGCGACAAATACCTTTTCAACCAAAAATTCATTGCGCAGCCCCTGGGTATCCAGCGTTTTTGCGTGCGCACTGTGGATGCTCTGTCTTACGTCCACATCAACCTCCGATAATCAGTGAAGCGTGAAAATAGAAAACAATAATAAAACACTGTTTCGTTTTCTCTATGAGGGGATGATATGCCCATGGGATAGGGTTTTCAATTAAAAATAAAACAATGTTTCATTTTCAAGTTAAGGATTAAAAAAAGTGCAGTGTCGATCACGAATATGTCATGAGAATGGAAAAATCAGGGAGCCCTGAAAAGGTATGTCGACTCACCAGCCATCATTATTCAACAGATTAATGACGGCAGATATTTATCGGTAAGGAGGAAATGCAGAGCTACTCGTCACGTTCAATGGTCAATGCCACACCCTGGCCCCCGCCGATACAAAGCGTTGCCAGTCCTTTGCGGGCATTACGTTTCACCATTTCATGAACAAGAGAAACCAGGATTCGGCAACCGGAAGCGCCTATCGGATGACCGAGTGCGATCGCACCACCATTGACATTGACCCGACGCTCATCCCATTCAAGCATCTTGCCAACCGAAAGCGCCTGTGCAGCAAACGCTTCATTAGCCTCGATAAGATCGACATCAGCCAACTGCCAGCCAACACGCTCCAGGCAACGGCGGGTCGCATACACCGGCGCAATTCCCATCAATGCCGGATCCACACCAACGCTGGCAAATGCGCGGATGCGGGCCAGCACGGGTAAATTCAACGCTCGTGCTTTGGCTTCGCTCATCATCATTACTGCAGCTGCCCCATAGTTTATGGATGATGCATTACCCGCTGTCACAGAACCGAGACTATCAAATGAAGGATTTAAACGGGCTAAGGCTTCTGCGCTGGTGTCAGTGCGTGGCTGTTCATCGGTATCAACAACCAACGTCTGACCGTTACTTTGGGTTATTACCGGGACGATCTCATCTTTAAATCGTCCGGCGTCAATCGCCGCTCGCGCTTTTTGTTGCGAGCTAAGTGCGTAAGCATCCTGCAACTGACGGCTGATGCCATATTCGCGAGCCAGATTTTCGGCGGTGACACCAATATGATAATCATTGAAGGCATCCCACAACCCATCATGCACAAGACTATCAACCAACTGGCTATTGCCAAGCTGTGCGCCGGTGCGGCTATCAGTCAGAACATGTGGTGCGCGGCTCATGTTTTCC
TGGCCACCGGCGATGACAATATCAGCCTCGCCACACTGTATCGCCTGAGTAGCCAGATGCAGTGCTTTAAGCCCGGAACCACAAACGTCATTAATAGTGATTGCAGAAACGCTATTAGGAAGACCACCTTTAATAGCCGATTGCCTTGCCGGATTCTGCCCTGCCCCTGCAGTCAACACCTGACCAAGAATCACTTCATCCACCGCATATGCAGGAACGCCGGTACGTTCTATTAACGCTTTGACGACCAGGCTGCCAAGTTCCACGGCGGAATGACCCGCTAACGCACCACGAAAGCAGCCGATAGGTGTCCGTAACGCCCCGACAATCACAACGTCTTTCATCACAACCTCGCACCAATTAACAGTGCAATAGTAAATGATTGTTAATTACAGTTATCTTAATTGTTTAAAAAAGGTGATTTTTATCACAAAGGAAATACGCCTGAGTAGCAGTCAGAGACATAACTGGCACGTAAGGTTTGCAACCACTAACCCACCAATAGAGAGGTAGATAGGGCGTTAATCTCCCATACTTAACCTGGTTTATGGTAAATTGCCCTCCATTTTGTTTAATTTGTAGATGATACGTTCAGATAATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCCGTTGGTGCAGGCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTGTTTATTACTGCTCTGGTCGCCTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAGTTCATCCTCTCATCGAAAACATCAGCAGGTGAAGGGATAACGGGCGCGGTAACACACTACTATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACTTCATCGCCTTTTTTGTCGTCGTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGCAAAGCATATGGTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTCATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTGATTGCCTATTTCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTAACAACCCAGGTAGAGTTCAATCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTGATGGTTTTCGCTTTTAGCCATACGCCCATTATTTCTACGTTTGCCATAGACAGACGTGAAAAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTATGAAAGTCGCTTATCTCATCATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCCACCTTCGTATATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAACGCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCATTCCTGGGTACGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTACAGCAGGTTGGTGTAAAGAAAAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTATCGCTGATTACCTTCATTGTTTGTTGCATTAACCCGAACGCGATTTCGATGATTTACGCGATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGCCTACGCTGTCAACGTATCTCATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGATCGTGGGTATCCTGTGCGTATCGGTAATGTTCTTTAGCTAATATCCGTTGTGGATGGTTCAAAATTGCTTCAATTTTGAACCATCCCAGTTTTCATAATGTTCATTTGTTATTATTCCGCCCTATCACTTCTCTCGTAATATTATATAATTATCAGCTAGTTAAACACACAAAGAGTTCTGAACATCTTAAATAAGACTATTTAAGATACATG
ACGATTGCATTGCGTAAACGCTTTTTATTTACAAAAAATGGGGAAGTATTACGGCGATTGCGAAAAGTCTGAAGCGCTTGAATTAAGATAATATAGAAAATCAGATACAACAAAAATGGCAGGTAGATGATGTGAAGATAAATTGGAGCGGGCGAAGGGAATCGAACCCTCGTATAGAGCTTGGGAAGCTCTCGTTCTACCATTGAACTACGCCCGCTTCGAGATGCGTAAGGCATTATAAACCTTACGCTCTCCTTAGCAAGTACCACGCTGCTGACTGCTGATTAATTCACCATCAGCATTTTGGCTTGCTGCCCTGAGGCGGCAAGTAACGTAGCGGATCAATTGCCGTTGCACGGTAACGAATCTGGAAATGCAGGCGAACAGATGCCGCATCAGTGCTCCCCATGGTGGCGATTTTTTGCCCAGCTTTCACGCTTTGCCCATTATTTACCAGCATCGTGTCATTATGAGCGTAAGCCGTAATGTAATCTTCACTGTGTTTAATCATGATGAGATTACCGTAGCCACGCAGCTGGTTGCCCACATACACCACCTTTCCTGCACCCGCGGCGTAAATAGGTGTACCCCGTGGAGCTGAGATATCAATTCCTTTATTGCCGCCATCTGCTGTCGAATACGGCATGATAACTTTCCCTGTCGTTGGCCATAACCAACAACGTTGCCCTACTGGCGGCCAGGAAGATTTCGGTACCGCTGATGACGGTGTAACCGATGCGGTTTTGGTCGTTGATTTGGCGGTTGATTTACGTGTACTACTGCTACTTTTCGCCCCACCCAGTTTTAGTTTCTGACCTACTTCAATGGTGTAAGGGGGGGAAATGCCGTTCAGTCGCGCCAGTTCTTTTACGCTGGTTCCCGTGGTGCGCGAAATACGATATAGCGTATCCCCCCGTTTCACGGTGTAAACGGAGCCGGAATACGTTCCTGTATCGGATGATTTGCTACCCGAACAGCCCGCCAAAAGCAGTCCAACCGATAACAACATCACGATACCCAGAGATTTTTTATTCAGGCGTCCCGCACTCAAAATCTTTCCTCGCTTAAAAAACAAGACGCCATATCATAGCAGCCGGCTTCTGGATACCCAATCTCTTGCTTCTGGAAAAGCGATGTAATAGAGAAAGAGGTTAATTTCATTTGGCAAAGGGAAGTATCATCAGCAAAATATTTGCTGTAGTGGTATCGAAGTTCCTGACTTTTACCCTATTTCCCACCTTGATGCGTAATAATCCTAATTTATCACATTGATTTTATCGCCACTCATATTGATACGTATCACTGTCCCTATTCAGAGTCCTGTTTCGTATCATATCTGTGTTTTTTTAACGTCATCACACTTCCTTCCTCCCCTCACGCATATAGTCGTTTCTGGCGTAATTCTTGCCTGCTAAGACTAAATCTTTGCCATAAGAACCAAATGTTCAAACCGAGGGGATTTCTATGGAAGCGCGGGAAGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCTAAGGTCACCGGGCGGGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCGAAATATGTACGTAGCCCTATCGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCCAGGAGTTTGCCGGGCGTCCTGGCGATTTTTACCTGGGAAGATGTGCCAGAAATCCCATTCGCCACGGCAGGGCATGCCTGGACACTTGACGAAAACAAGCGCGATACCGCCGATCGCGCACTGCTAACTCGCCATGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGTGGCCCGCGATGAACTCACGGCAGAAAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTTATCACCTCGCCAGAAGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAATTTACTGAAACAAAGCACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGC
CGACTACCAGGTACAGGGGCACTATCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTGACATCGCTGGCATGGATGGAGGATGACTCGCGAATTACCATCGTTTCCAGCACCCAGATCCCGCACATTGTTCGCCGCGTGGTTGGTCAGGCGCTGGATATTCCCTGGTCATGCGTACGAGTCATCAAACCGTTTATCGGTGGCGGTTTTGGTAATAAACAGGATGTACTGGAAGAGCCAATGGCGGCATTCCTGACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGTGAAGAGTGTTTCCTCGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGCGTGAACCGCGACGGAACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCTTATGCATCTCACGGGCACTCCATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTATCCTCGTTGTGCCTACGCTTACAGTTCAAAGACCTGCTATACCAACCTCCCCTCGGCTGGTGCGATGCGTGGTTATGGCGCGCCACAAGTCGTATTTGCCGTTGAGTCTATGCTTGATGATGCCGCGACAGCGTTAGGTATTGATCCTGTTGAAATTCGTTTACGCAACGCCGCCCGCGAAGGAGATGCTAATCCGCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTTGAAAAAGGCCGGAAAATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAAGGCAATTTACGTCGTGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCTGTCGGCGTAGAAATAGCAGGCGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTGCAAAGCGGCGCGACGGAAATCGGTCAGGGTGCCGACACCGTCTTCTCGCAAATGGTGGCAGAAACCGTGGGGGTTCCGGTCAGCGACGTTCGCGTTATTTCAACACAAGATACCGATGTTACGCCGTTCGATCCCGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGCGCCTGCGCTGCGCAGTGCGGCACTGTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACATCAGTCAGCGATGAATCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAAGAACCGTTAATGTCGTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGCGGGCAGCTCTCTGCTGAAAGCTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGTACATTTGTTGATCTGACGGTCGATATTGCACTGTGCAAAGTCACCATCAACCGCATCCTCAACGTTCATGATTCGGGGCATATTCTAAATCCGCTGCTGGCAGAAGGTCAGGTACACGGCGGAATGGGAATGGGCATTGGCTGGGCGCTATTTGAAGAGATGATCATCGATGCGAAAAGCGGCGTGGTCCGTAACCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCACAACTGGAAAGCGCGTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCACTGGGTGAGCCACCAATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCTACCGGTGTTGCAATCAATACACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCATCTGGCAGGATTGATTTGAGGATAACATCATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATGCCATCACCCTGCTGGCTGACAATCCGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTACTGATACAGCTTCACCATCACAATGACCGCTATCGCCATATTGTTGATATCCACAATCTGGCAGAGCTTCAGGGAATAACACAGGCGGAAGATGGCGCGCTGCGAATCGGCTCCGCGACAACA
TTTACTCAGCTCATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTATGTGCTGCGGCTGCATCAATCGCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTTGCAACGGTGCCACCAGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGGAGCTCCACTCCCCACGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGGGCAAAGTGTCTCTTGAGCATGACGAAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGAAAGAACACGCGGGCAGCGCACATTTTAAATATGCCATGCGCGACGCAATGGATATTTCAACAATTGGCTGCGCCGCACATTGCCGACTGGATAACGGCAATTTCAGCGAATTACGCCTGGCATTTGGTGTTGCCGCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTGCACAAAATGCGCCATTAAACCTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCGCCCCGCGTTCTTCATGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGACCAAAAAAGTGATTAGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGAATCACAGCGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTTCACGCCGCGCCAGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTCAAACAAGGTTGCTGCGTAGGCGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCGATAGACAGTTGCTTATTCCTTGCGGCCTGGGCTGAAGGAAAAGAGATCCGCACGCTGGAAGGTGAAGCGAAAGGCGGTAAACTTTCTCATGTCCAACTGGCTTATGCGAAATCTGGTGCAGTGCAATGCGGGTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAATGCTGGCGAAACCACGCGAGAAGCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGTCGCTGCACAGGGTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAAAAGGATATCCGGCCTGAATTCAGGCCGGATTCTCAGAGGTTATGTGTTTAACAACTCATATTTCTTAATCTTGCGATAGAGCGTAGCAATGCCGATGCCCAGTTCATCAGCAACTTCCTTCTTGCTGTTATGACGTGAAAGCGCCTCGCGGATCATTTGCTTTTCCATCTCCTCCAGCGCCGTGCCGCCCGCATCATCGAGTGACAGGTGCGCCTCACTGACCTCTGTTACATCACTTTGCTCCGTTGTGCCATTATTCAGCAGATTTGGCGGCAATAGCGTGCTGTCGATAACTTCACCTGAAGGAACAACGTTAACCAGATATTCCATCAAATTGCTTAACTCGCGCAGGTTTCCGGGCCAACGATGCTTACGCAATATTTCGACGACATCAGGAGCAATGCCAGGATAAACCGATCCCAGACGACGGGTATGCAGATGTAAAAAGTAATGCACCAGTAATTCAATATCTTCCTGACGTTCACGCAGCGGTGGAAGAGTTATCGGGATAACATTAAGTCGGTAGAAGAGATCTTCGCGGAATTTACCTTCGGCAATGAACTGGGCCAAATTCTGATTAGTTGCAGAAATGATGCGGATGTCGACTTGTATTGGGCTACTGGCACCAATCGGCAGAATTTCACGCGCCTCAATAGCGCGCAGTAATTTAGCCTGCAACATTAATGGCATATCACCAATTTCATCGAGAAACAGCGTGCCCGTATTCGCCGCCTGAATCAACCCTGTTTTACCGTTGGCAGAAGCGCCAGTAAATGCGCCTTTAACATAACCGAACAGTTCGCTCTCCAGAAGCTGTTCCGGAATCGCAGCACAGTTGATAGCAATAAAGGGTTTATTCCGTCTTCCGCTCAA
CTTATGGATTGCACGGGCGACGACTTCTTTACCCGTGCCGCTTTCACCAACCACCATAACGCTGGATGGGCTGGGTGCAATACGGCTAATGAGTCGTTTTAATTGCCGCATAACACGGCACTCGCCAACCAATTGTTCAATATGCGGTTCATCAGGTGCATTTGCTACAGAAAAACTGGTATGCGATTGGTGAAACGCCATTAAAAATAGTTGTCGGCCCTGGATGTTATGCAACTGACCAATGATTAATTCACTTTTATCATCCCACGAAACAATATGTTGCATATGACCATGGGTAAAATTACTCTCAAATGTTAATGGTCTGAAACGAACAGGTTTTCCAATAATATTATTTTGTACAACACCGAGTGTTTTTAAAGCTGTCTGATTAACAAACTGAACCCGATTATCAGCATCAACCACTAACACGCCCTGATCCATATTATCGATCATGGTCGCGAATATTTTACTGATGTTATCTCCTGGTCCCTGATCCTCCAGAAGTTTAGAAACAAAAATGGTGGATATATGGCGAACGTAATCGGAAAATTCGCGTAAATTATCACTGATATGTTCTTGTTGCTCGTGGGTAACGGCAATCAAACTTATCACCCCAACACAACGATCCTGTAAAATGACAGGCGTACCCAGAAATGCTTTTTCGCGGCAATTTTCTTTACTATCGCAACCTTCACAAAGGGGATCGAAGCGAGACTGTGTCACAACTTTTTCAGTTTTCGTTTCCAGGACGTGGCGGAGCAGGCGTGAGTTGCCGCTCAACTGGCGGCCAAGAAACTTCCCATACGCGCCCGTTCCGGCGACGCGACACAAGTTTTCATCAACGATCTCAACCTCAAGCTGCAAAACGCTGGCAAGCATTCTGGCAAAACGCTGAATTGTCGGTTGAATTTGCATCAATACTGACTGCGTAGTCGCAAGCTCCATAGCTTTACCTTCCAGACTTACTTAAAAGTCGATCATTGAAGACGTTGATGGTTCACAGATCATGATGATATTAACTCAGGCGAAATTGGCTTTGATAAAAACATAAGATTTTTATCACTTTCTAATAAAATTATGGAAGAGATATCACATTTCTATATCAATATGAGAATTACAGCGGCAAGTTTATCAAACTGAAGAGAGATAGCCTGCCTCTTTATCTTATTTCTGATACTTAGCAGCAAATAAATAACGTGATAAAAAAAGCCAAACGTTTTCGTATTTTACAAACAACCGGAAACTGGCATCAATATGTGATCAACCCCACACATTATCCGTCAAATTAGCCTTTCGCAGCCGCGTGGATAATTCTGGCACACTTATTGTTAGTCCCAGGTATAGCTGTGAAAACACCAATCACTTTGGCACGTCACAGTGAAATAAACCACTTTGCCTGTCATTCCACTATCGGGACTTTATGATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGCATGAAAAAGATTTTTTGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGGACGTTGCCGCCGCGTTAAAAGCACTGCGTGCTGAAAACATCTCAACCAAAGTCTTTAATAGTGGATTAGGTATTTCCGTCTTCCGCGACAACTCCACCCGTACCCGCTTCTCTTATGCTTCCGCGCTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAGGTAAATCACAAATCGCTCACGGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGCTATCGGTATTCGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGGCACTTGATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGCAATGCGATATTGACCACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACTTTGGTTCGCTGGAAAACCTGAAAGGCAAAAAAATCGCCATGA
CCTGGGCCTACTCCCCAAGCTATGGCAAACCGCTCTCTGTACCACAAGGCATCATAGGTCTGATGACCCGCTTCGGTATGGATGTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGGATGTCGTTGAAGTTGCTAAAAACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGAAGAAGCCTTCAAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAGAGCGTACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGTGTCTGGCACAGAACGCGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGACCCGTGATGGCGAAGCCCTGTACATGCACTGCCTGCCAGCTGATATCAGCGGCGTATCCTGCAAAGAAGGTGAAGTGACTGAAGGCGTATTCGAAAAATACCGTATCGCTACCTACAAAGAAGCCAGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCCGTAAATACGCCAAACCAGGTGCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAACCCCTCGGGCCGATCAGCTGGTCGGCCCTCTATTTCCAGAGGCCAAAAGGATAGGATATGTCCGTTTTCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACATCACCGCTTTTTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCTGGTTATCACCCAACACCGCTTTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAGAAAATTCTCGTCAAAGACGAATCAAAACGATTCGGTCTGAACGCCTTCAAAATGCTCGGCGGTGCGTACGCCATCGCTCAATTATTGTGTGAAAAATATCATCTTGATATCGAAACGCTGTCATTTGAGCACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGACTACCACCGACGGCAACCACGGGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATTTACATGCCGAAAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAGTGCATCGTCACGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAGCAGCACGGCTGGGAAGTGGTACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACCTGGATCATGCAAGGCTACGCAACACTGGCGGATGAAGCCGTCGAGCAAATGCGTGAAATGGGCGTAACCCCGACACACGTTCTGCTACAAGCCGGTGTCGGTGCAATGGCCGGTGGTGTGCTGGGTTATCTGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTATTGTTGAACCTGACAAAGCTGACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGTGATATGGCCACCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAAATCCTACGTAACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGTATGCGCGTGCTGGGTAATCCGTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGCGCTGTCGGTTTGGGCGTTCTCGCAGCGGTTCATTATCACCCGCAACGTCAAAGCCTGATGGAAAAACTGGCGCTGAACAAAGATGCCGTGGTGCTGGTTATCAGCACTGAAGGCGACACCGACGTGAAGCACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGCACCTTAATCACCCTATTGGAACTGCTCCCTGCAAAACGGGGAGTAAAAAATCTGGAGAAAAATAATGGCTAAGAATATTCCATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGACATGACTCGCTTCCTACGC
GATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGCGTAGTACATCGTATTAAAGAAGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGACCCAATGGGCAACGTTCTCGGTTATATCGGCCACGGCCCGCGTCTGGTGGCAATGGACGCTCATATCGACACCGTCGGCATTGGCAACATCAAAAACTGGGACTTCGATCCGTATGAAGGCATGGAAACCGACGAGCTGATCGGTGGTCGCGGTACTTCCGACCAGGAAGGCGGCATGGCATCTATGGTTTATGCCGGTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTGCTGGTTACCGGTACTGTGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATTGAACAATCCGGCATTCGCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTATACCGTGGTCAACGCGGTCGTATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCACGGTTCGGCACCAGAACGTGGTGATAACGCCATTTTCAAAATGGGTCCAATTCTTGGCGAATTACAGGAACTGTCTCAACGTCTGGGCTATGACGAATTCCTCGGCAAAGGTACGCTGACTGTTTCCGAAATTTTCTTCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAGCTGCGCAGTTTCTATTGACCGCCGTCTCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGTGCCCTGCCTGCAGTACAAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCGTCCTGGACTGGCCTGGTTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAAGATCACTTCACCGTTAAAGCACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCTGTCGTTGATAAGTGGACCTTCTCAACTAACGGCGTATCCATCATGGGTCGCCACGGCATTCCGGTCATCGGTTTTGGCCCTGGTAAAGAACCGGAAGCGCACGCGCCAAACGAAAAAACCTGGAAATCTCACCTGGTAACCTGTGCCGCTATGTACGCTGCAATCCCATTAAGCTGGCTGGCAACCGAATAATTACTCTTCACTTATTCCCCTCCGGTTCGCCGGAGGGTTTTTGGAGTTTGCTATGCGCGTATTGATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGATTTGCTGATTGAAAGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCTTGCGAAGAAATTGATGCCTCTGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACGCATTTCAATATTGATGTCGGCATCGCGCGCAGTTGTGATGATTTTTTTACCGGTACCCGCGCTGCTGCGTGTGGCGGTACAACAACCATTATTGACCATATGGGATTTGGCCCAAATGGCTGCCGGTTACGCCATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAAAGCAGTCATCGACTACAGCTTTCACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCGATGATGGTTGAGGAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTCAACGATGATGAAGTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACCGTACACCCGGAAAATGACGCAGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGGTTAACCGCGCCGCGTTATCATGCCTTGAGTCGACCTCTGGAATGCGAAGCGGAAGCCATCGCCCGCATGATTAACCTGGCACAAATTGCCGGTAACGCCCCGCTCTATATCGTGCACCTGTCTAACGGCTTAGGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCAGCCAGTCTGGGTTGAAACCTGCCCACAATATCTCCTGTTGGACG
AACGCAGTTACGATACAGAAGATGGCATGAAGTTCATTCTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGTGGCATCAGCGATGGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCTCAACGCCTGCAAATTTCTAAAGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTGGAGAACCGCATGCAACTGCTGTTCTCCAGTGGCGTGATGACGGGACGTATCTCACCGGAGCGTTTTGTTGAGTTAACCAGTGCAATGCCCGCCAGGCTGTTTGGCCTGTGGCCACAAAAAGGATTATTAGCGCCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACGTCAGAGCCAACAAATTCAGCATCGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACCTGTCAGGGCGCGATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACCTTTACAGGCAAAGCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTGCTCTAACCACTGCCAGGGATCTATACACAATCAAGAATGATGAGTGAGGAAAAATGAGTAAGAAAATTGTTCTCGCCCTGGGCGGGAATGCGCTGGGCGATGACCTGGCTGGGCAAATGAAAGCGGTAAAAATTACTTCTCAGGCAATTGTTGATTTAATTGCCCAGGGACATGAGGTCATCGTCACTCATGGCAACGGGCCACAGGTGGGCATGATTAACCAGGCCTTTGAAGCTGCAGCAAAAACTGAAGCGCACTCGCCAATGCTGCCGATGTCTGTCTGTGTTGCCTTAAGCCAGGGTTATATTGGTTACGATCTACAAAACGCCTTAAGAGAAGAACTGCTTTCTCGTGGCATTAATAAACCTGTAGCAACGCTGGTTACCCAGGTCGAAGTCGATGCTAACGATCCGGCATTCCTCACCCCGACCAAGCCGATCGGTTCGTTCTTTACCGAGCAAGAAGCAGAGCTACTGACAAAACAGGGTTACACTCTGAAAGAAGATGCGGGTCGCGGCTATCGCCGTGTCGTTGCTTCGCCAAAACCGGTTGATATCATTGAAAAAGAAACGGTTAAAGCTCTGGTAGATGCCGGACAGGTGGTGATCACCGTTGGCGGTGGTGGTATCCCTGTTATTCGTGAAGGTAACCATCTGCGTGGTGCCAGCGCGGTTATCGATAAAGACTGGGCCAGCGCCCGTTTAGCAGAAATGATTGATGCCGATATGCTGATCATTCTGACTGCGGTAGAAAAAGTGGCCATTAACTTCGGAAAAGAGAATGAACAGTGGCTCGATCGCCTGTCGTTAAGTGATGCTGAACGCTTTATCGAAGAAGGTCATTTTGCGAAAGGTTCTATGCTGCCTAAAGTGGAAGCTGCCGCCTCGTTTGCTCGCTCTCGCGCAGGTCGTGAAGCACTGATTA +>test.0417.00002.0004 31459 
+CCGTATTGAGCAAAGCGAAAGAGGGGATTGAAGGCAAAACCGGAACGGTGATTTGTCAGTAATTTAAAGGCCGGATGGGTAATACCATCCGGCCATTTTCATTTAAGCCACTTCCAGCACTTCTTTTGTCGCTTTAACGCCCTGATGCATCAACATCATTAACGCCTCAAGTACGCCGCCGCCAATCGCCCGGGCTTTATCAGAAACGCTGGTGAAATCAGCCGTTTCACCACGAGGATCGATATCACCAATTTTAAAACCACCGACCACGGCCAGTCCGTCGTTCAACAAGCCACGCACCATCCCCGTCAACGGTGCTTTAATTTCATGCTCACCAATCCAGGCAATGACATCGCCCTCTTTCACCAGATCGCCTAATTTCACGTTGGATCGCATAATGCCTGCAGCAGGAGCGCGGATCACTCGTCGGGTGGTATGCCCCATAATATTGCCGGGAACACCGGTATTCTCCTGCGCACAACCTGAGTAAATCACCTGACCGAGCCAGTGCCCGCGATTTGTTTCAATTACCGCATGACAATCCTTCCCTGCAGTAAAGCCCGGCCCAAGCGCGATTGTTACTGGTGCCATATCTGCCCGCGTTCCCAAATTCTGTTTCGCCAGAATAGCGTCCACCACGCAAAGCGGTTTCAGTTCATCAAGCAATGAACAGGTGGGATCTACCATCACAGGGATAAATCCGCGTTCGGTAAGTTTCATCGCTTCCGCAGAGCTGGTTGCCAGGCGGGCGGTGACGCCTTCGACCGTCATTTCGCCATCGAACACGGCCTGGGCAAACGCCACGGTACAACGAATCACTGTCGGTTTTTCCACTTCCAACATGATCACTTTAAAACCCGCATGATACAGACGTAGCGCTACACCACTGGCGATATCCCCCGCACCGCGAATCACCACCAGCTGGTGTCCGGAAGGATGAGAAGGCTTCATCATCAGCCCACCCGGCGCGTTATTTTTCACCTGTAATATTTCTGCCAGCACGCTGATGGCGATCTCTTGCGGCGTTTCCGCACCTATATTGTAACCAACGGGCGCATGTAAACGGGCAATATGTTCTTCAGCCACGCCTTTCTCACGCAATTGGCGCAGGAAAAGCTGAACCTTGCGGCGACTTGCCAGCAACCCCAGCCATGCAATGGGTTGTTCAATGAGTTTGTCGAGGGCTTCACGATCCTGATTATTCGTGGCAATCAGGACAAAATTATCAGGGCGAATATCCAGTGCTTCCACTGCCGCACCAAACGACTCAGCATGGAGAAGCGTGGTTGATGGTGGGAATAGTTCAGGATTGAGGCTTTCGCGATAAATATCAGCAACGGCGATATCAAATCCTAATAGCGCCGCACTCTGGGCTATCGCCCGGTTGACATGCCCCGCACCAATCAACACCAGACGTGGACGCATACCATGGACGCTGATAAATACTGACATTGCACCTCCACAATCTGACCCGACAGCATCCGCACCGTTACGAGCCATACGTCCATGGAATAATCGCGGCTTACGTTCCTGCAATGCCTGAAGCGACTCTTCAATCACCTTCCGTTCAACCATTCCGCCACCAATTGTACCGACGATAGAACCATCGGCGCGCACTAACATTTGTGCAGAATGGCGGGGGGTTGAGCCTCGGCTATCAACAATTTGCGCCATCGCAAACGGACAATTTTGCTCTTCGAGTTTTGCAGCCTCTGTGAAAATATTCATACCAACCTCAATGGATATCCTTTCAGTAACCCGGAATACCCGGGCCGCTAATTCACAAATCTGCGCGCGATTGCAGGATGTTCTTGTATATCGCCCAGCCAGATTGCCTCTACGTTGTGTTGTTGCAGCGGTTGAAGGAGCTCGCTTTGCGCAATCGCATTCTCACATTGAGAAAAACGGTTAATGAACCAGACTCGCCGACAACCTTGTGGTACGTTTTTAAACGCCCCCTGAGGGTGGCGAACCAGCGCAACGAGATCGCTCAGTTGCA
AGGGTGCAGCAGGTGTTAACCCAGTAATATCAGCAAACTGCGACCAGCGATGGACATTTTCTGTGCTCACTTTCGCACCCAAAATATGTCCTCCCATCACAGCAATCACGCAGCAACTGCTTTTAGGTATGCAAGGTTCGTGCTCATCAGGCGCTTTTAACGGCATTCCACGCGAGCCATCTGCCTCAATGAGAATTACGTCACACTCTGGTCGTTGTACCAGTGCATCAATCGCTTCTGGCGTAAATCCCTGCACTTTTCCCTGGTTCGCTTTCCAGCAGTGAAAACAAAATGAAATGGGGGATATAAAAGACGCATGAGGAAGCATGGCGGGATCACGACAGAAAACCACGGGCCAGTGAGATGTTGGCATAAACATATGTGTCGTCGTAGTGATTAATACACGCCTGCCACTCGCCTGGAACAGTTCTGCCAGCCAAAAAAGCAAGCTGGTTTTCCCCCCAGCACCAACAATAGAAATCACAGTGGGACGTTTCTGCGCGCCTAAATCAATGAATAATGCCGATGGGTCAATTATACTTTTCACGCGTCTTTATGGACCTCTCTGGGATAAATTACCCTCAACGTAATCCATCAGGAAGTAACGCAATTATCAGGCGTTATTAGCTCCTGTAAATAATGGAATCACTATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATGGGGCAATGGAAAATGATGTTACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAAAATGCGTTGCAGTTTTGTAGCCGAATTATTTTAGTCACCGGCTATCGTGGTAATGAACTGCACGAACGTTATGCGAACCAGAGCAATATCACTATTATCCACAACCCAGATTATGCGCAGGGTTTACTGACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAACATTGTTTTCTCACCCACGGAGATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACGAAATGATGGCGCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCAAAACCATGCCTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTCCTTATGGGAGAACATTATTCCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGATACTCCGGACGACTTTATTACAGCGAAGAAAAGGTATACTGAAATTTAGAAAACGTAGTTAAACGATTGCGTTCAAATATCTAATCCCTCCAGCACTCTTTATCATAATGATAAGGAATCACTGATTTTGAGAAAAGAGAAAAAGTGATAAATGGGCTGGCAATAATAATTTTCAGGAGTGATTTTAATTCTCATTTGGCACCTGTGAGTTCATTCACAAAAAGCCATTAAGTTTCGAGCCGCCTCACATTTTTTTATATTTCCCGCCAAACCTGGCAAGAGTGGTGCGATTGTTGCTCTATCCCCCTAAACCACCGGATTTCTCAACACCGGTCACTCAATGATATCTGTATAAGCTAAGGAGAGGGTTATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATATTTGATGAATACCAACAACAACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCACCCGTAAAAGGTAAAACTGTTAGCGTCTTCGGTGAAACCTGTGCCACTCCCGTCGGCCCTGCCGCTGGCCCGCACACGCAACTTGCGCAAAACATCGTCACCTCCTGGCTGACTGGCGGACGCTTCATCGAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGGAAAAGCCCTGTATCGATGCCGAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAAAGCCTGGGATGAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAGCCTTCTGATTCCGGTAAATCGTTCATCTTTAATATGAGC
GTCGGTTACAACCTCGAAGGTATTAAGCAACCGCCGATGCAGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCGAAATTCGCTCAATACCGCGATGCACTTAATAAGCTACTCCAGAATGAGGCATTTTTAGCCCGCCACGGATTGCAGGAAAAACGCGAAAGCTTGCAAGCCTTACCCGCTCGCATCCCCACCAGCATGGTACAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGCATGAAATCGAAGCCATTTGCCGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCCGACCTTACTGGGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATCGGCTTAAAAGAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTGGAACGCCTGATGGCACTGGCAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAACACTCTCGGCACCATTAATAACAAAGGCGCACTGCCTGGTGAAGAGATGTATATGTCAGGCCGTGCGCTGTTCCCGCTCTCCATCAACGTTGCAGCAGTTCTCTCTCGCGCCTTTGACGGCAAACTGCCCATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCGATATTTTTGATACTGGTATTCGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCGCTTAAGTGCCTGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGACGTCGAACGACTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACACTGGAAGCCAGAAGAGCGTATTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTTGCCCCCTGTGTTACTGCCTGCGCTATCAAGCAAGATATTCCGGAATACATCCGTCTGCTTGGCGAACACCGCTATGCCGACGCGCTGGAACTCATCTATCAACGCAACGCCCTGCCCGCCATTACCGGTCATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCCTGGATTACGACAGTGCGCTGAATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATATAAGCAACGCTGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGTGCAGGTCCGGCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACGCTGTTTGAACGCGAAGCCAATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGTATTCCTGCAGAGTTAATTCAGCACGATATCGATTTTGTTGCCGATCACGGCGTGAAATTTGAGTACGGTTGCTCACCCGATTTGACCGTTGAACAGTTAAAAAATCAGGGCTTCCACTATGTTCTGATTGCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGGGCGACAACCAAAATGTCTGGAAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCTGGGCAAACATGTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCGTTACGCGTTCCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATGCCAGCATGGCGCGAAGAGTATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTGAATAATCCGGAACGTTTCGATGCTGATGGCACCTTAACCTTGCGCGTTATGTCGCTTGGCGAACCTGATGAGAAAGGTCGTCGCCGTCCGGTTGAAACCAACGAAACAGTAACGCTGCATGTAGACAGCCTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCCTGAATGCAATGGGCGTGCCGCTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCT
GACTGACGTCTTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTCGGAACCGCGCGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAGAACGATAAATACTGGAATAACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATCTCTGTCACTCTGGTGAACAGTGACGATCGTGATGCGTTTGTCGCGCAGGAAGCCGCTCGCTGCCTTGAATGTAACTACGTTTGCAGCAAGTGTGTGGATGTCTGCCCGAACCGCGCCAACGTATCCATTGCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACCTCGACGCTTACTGTAACGAATGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGACAAAATCACCGTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTTGTGGAAGATTGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGACAGCGAAGGTCAGTTCAACAACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGCCATGTCCACCAGCATCATCATTATCTGCTGGGCCGCGTGGAGGTGTAATCATGTTGATTCTGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGCGTTGATATCGCCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGCTATCCCGATGCCAGCTACAAAGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGCTCGCATAACCATTTTTACTCGGGGCTTTCCCGCGGAATTATGGCAAACATCGCCCCCTGCCCGGATTTCATCTCAACGCTGAAAAATCTCTGGTGGCGGCTCGATCGCGCCCTTGATGAAGAGTCGCTCTATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAGCGGATGTACATCGGTTATCGATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGCGACGCATTTTTAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAACAGCGGCATCAAAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATTGATGAGGCGAAGAAAGCAGCAACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCACGCGCCGTTTACCGTACCGGATGCCGGTCTGGAGATGCTGTGTGAAGCCGTGAAAAGCACAGGTCGTGGTTTGCATATTCACGCTGCGGAAGACCTTTACGACGTTTCCTACAGTCACCATTGGTACGGCAAAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGACAGCAAAACGCTGGTCGCTCATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGATGCGTTCCTGGTGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCACCTTAGCGACATCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAAGAGATGAAATTTGCCTTCTTTAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGTTTTGCCAAAGCACTGGCTAACGGCAACGAACTGATGAGCCGCAACTTTGGCGCGAAATTTGGGCTTCTGGAAGCCGGTTACAAAGCCGATTTAACCATTTGCGATTACAACTCGCCGACGCCGCTGCTGGCAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTCAGGCAGCGTTCACAGCGTGATGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGCGATTCCATTTATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCGCTGGCATAAATAACAGCTCCCCTCTTCTT
TCAGAGAAGAGGGGAAATTAAGGAAAGACGATGATTGAACAATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGCTACCAGGATGAAGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGTACCGATAAAAAGATTGCCATTTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGATAACGGTGCACTACGAATTGGCGCAATGTCTCGCTTGCAGCCACTGCGTGATGCGCGATTTATTCCTGCAGCACTGCGTGAAGCCCTCGGTTTTGTTTACTCACGCCATGTTCGTAATCAGTCGACCATTGGTGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCTTCCCGTCCTGCTGGCACTGGATGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTACCTGGCCTGCCCATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACCTGTGCGACTCGCAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTTGCAATAACAGACCACGACGGTATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTGCGTCTGCACGATGTCGAAACTCAAAATCTGGAAGGCAATGCACTTGAACAGGCTGTCGCCAACGCCATTTTCCCGCAGGAAGATTTGCGGGGCAGCGTGGCCTATAAACGCTATATCACGGGAGTTCTGGTAGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGAAGCCGTATGATCATCCACTTTACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAAAACGTGCAAAAGCTGTTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGTTTTGGGTTTGCCGGTTCTGACGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTGCTTATCGCCGCACAGTTAGAGAAGGCAGATATTCGTACCGCAGAATCTCTGGGCAAATGGAATGAGTTAAGTCTGGTTCAACAGGCCATGGTTGATGTTGGCGTGGTGCAGTCTGGTTATAACGATCCAGCTGCGGCTCTGATTATCACCGATCTTCTCGATCGCATCGACGCACCTACCCGCGAAGAGATCGACGACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAATACTATCAGGTCATTGAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGATATCGCTCCGACTTTCCGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGATGCCGCGAAAATGGTGCAGGCGAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCCTGCGTCATTAAAATGTTACGTAGCCCACACGCTCACGCACTGATTACTCATCTGGATGTCAGCAAAGCTGAAGCCTTACCGGGCGTCGTTCACGTTATTACTCACCTGAATTGCCCGGATATTTACTATACCCCGGGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGACCGCCGAATGTTCGGCAAGAAAATGCGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAAGACATTGCGCTCGAAGCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTAATGTCGATTGACGAGGCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTGTATGTTGCTGGTGCGCCAGATACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGCGAGCATATGATCATCAACTTCCCGATCGGTTCTCGCCCACGCAAAAATATCGCTGCCAGTATTCATGGTCATATTGGCGATATGGACAAAGGCTTTGCCGATGCCGATGTGATCATTGAGCGAACCTATAACTCAACGCAGGCGCAGCAGTGCCCGACTGAAACACATATCTGC
TTTACCCGTATGGACGGCGATCGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGCCGCCAGGTCGCGCGCCTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGTGTAGGCGGCGGTTTTGGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCAACCTGCGTGACCGGGCGTCCGGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCTAACACCTCTCGTCACGTCGCGAAAGTCACCGTCAAACTGGGCGCGAAAAAAGATGGTCGCCTGACGGCAGTGAAGATGGATTTCCGCGCCAACACGGGTCCTTACGGTAACCACTCACTCACCGTACCGTGTAACGGACCGGCGCTGTCGCTGCCGTTATATCCATGCGATAACGTCGATTTTCAGGTCACCACCTACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGCGCGCCGAAAGGTAACTTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAGATCGACCAACTGGAAATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATTCTCGGTGCGATTGGTGAAGGTAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCACTGGAAGAGATCCTGCGTCAGGGTCGCGAGATGATCCAATGGTCTTCACCAAAACCACAAAACGGTGACTGGCACATCGGTCGTGGCGTCGCCATTATCATGCAGAAATCGGGTATCCCGGATATCGATCAGGCTAACTGCATGATCAAACTGGAATCAGACGGTACCTTTATCGTTCATTCTGGCGGTGCGGATATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAAGTGCTGCACTGCCCCCCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTGTTTGATAAAGGCGCATATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTGGCAGCGGAAAATCTGCGGGAGAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCAGTGGCAGATGTTCAACTAGCAACGCCGGGCGTCGTTCGCGGCAAGAAAGGCGAAGTTAGTTTCGGAGAGATAGCCCATAAAGGCGAAACCGGCACCGGCTTTGGTTCACTGGTGGGAACTGGCAGTTATATCACGCCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGCTGAAGTTGCCGTCAACACGCGTACGGGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGTACACCGGTCAATCCAGAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATCGGCCACAGTATGAGCGAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGATTTACGCAGTTACGGCGCACCGAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTGGTGCCGAGCGACGATAAAGTCGGCCCATTCGGGGCGAAATCGATCTCGGAAATCGGTGTAAATGGCGCCGCTCCGGCGATTGCTACCGCAATTCACGATGCCTGCGGCATCTGGTTACGCGAATGGCATTTCACACCGGAGAAAATACTCACCGCGCTGGAAAAAATATAAGTAATAAATGGCCGCTTCGGCGGCCTGTTTCTCTGTTTGAACGATGACTAAATAGTGACTGCGAAAATGAGATAAGCCGTTCTCAAGGCGTCCTGCGCCCCAAATTCGTGGGAATTTATTTTACTAATTCAGATGATCAAATTTACTTTAAAAGGAGTGAAGGGATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTGAACTGGAGGATCGCCCTCCCTTTCATCAGGCTCTCGTAGGTGCCATTACCCATCTGTTGGCAATTTTCGTTCCGATGGTAACCCCCGCGTTAATCGTGGGTGCGGCCTTACAGCTTTCC
GCTGAAACAACTGCCTATCTTGTTTCTATGGCGATGATCGCCTCTGGTATTGGTACCTGGTTACAAGTAAACCGCTACGGCATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATTTTTCATTTGTTACGGTCATGATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACGAAGAGTTAATCATGTCGTCGCTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCGGCTCTTCTTTTATCCTGCCCTATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTGTGGTGCTGATGATCGGCTTAAGCCTGATTAAAGTTGGCATTATTGATTTTGGCGGTGGTTTTGCAGCTAAAAGCAGCGGTACGTTCGGCAATTACGAGCATCTCGGCGTTGGCTTATTGGTTTTGATTGTGGTGATCGGCTTTAACTGCTGCAGCAGTCCGTTGCTACGCATGGGTGGGATCGCCATTGGGCTATGTGTCGGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCAGCAGTGTGCGCAATTTGCCGTTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTTTTAGCTTCCATCAGTTCCTGGTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTGTCGGCGATATCACCGCCACGGCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATCAGTCCCGACTGAAAGGCGGCGTGCTGGCAGATGGTCTGGTTTCTGTTATCGCCTCCGCTGTCGGTTCATTACCATTAACCACGTTTGCGCAAAATAATGGGGTTATTCAGATGACTGGCGTCGCTTCACGTTATGTCGGGCGAACCATCGCGGTAATGCTGGTTATCCTCGGCTTATTTCCGATGATTGGCGGCTTCTTCACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGTTGATGTTTTCCATGATTGCCATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGCGCCGAGAAACACTTATTGTCGCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATCCCGAAATTTTTAAAATATTGCCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTGCTGGCGGGTTAACTGCGATTTTATTAAATATTATCCTCCCTGGTGGCTACCGACAGGAAAACGTTCTGCCTGGTATTACCTCAGCGGAAGAGATGGATTAACAGTAAAGGAGTCAATGATGTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACGGTCGATAACCCGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTCATTAAACAGGGAAAAGTGGAATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCTGACACCATTCGCGTGCGCGACTATCGCGGCAAACTGATAGTACCGGGCTTTGTCGATACACATATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATGGTGAACAATTGCTGGAGTGGTTGAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTACGCCCGCGAGATGTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTTGGCACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATGCGTATGATTGCCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACTGCCGAAAGCAGCTATCACCAAAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGTCTGTTGTATGCGATTACGCCACGCTTCGCCCCTACCTCATCTCCTGAACAGATGGCGATGGCGCAACGCCTGAAAGAAGAATATCCGGATACATGGGTACATACCCATCTCTGTGAAAACAAAGATGAAATTGCCTGGGTG
AAATTGCTTTATCCTGACCATGATGGTTATCTTGATGTTTACCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAAGAAAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCCAACCTTTACCTCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAAGTGGGCATGGGAACAGATATCGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAACGAAGCCTACAAGGTATTGCAATTACAAGGCTATCGCCTCTCGGCATATGAAGCGTTTTACCTGGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACGATTTGATTGGCAACTTTTTACCTGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCTACAGCAGCTGCGCTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGATGACCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAATAATAAAACTTTAACATCCTCGTGAGGACATCATTATGTCTGGAGACATCCTACAAACACCGGACGCACCAAAGCCACAGGGCGCGCTGGATAATTATTTTAAAATTACCGCTCGTGGCAGTACCGTTCGTCAGGAAGTACTGGCTGGCTTAACGACCTTTCTGGCCATGGTTTATTCCGTTATCGTCGTTCCGGGAATGCTGGGCAAAGCAGGTTTTCCTCCCGCAGCTGTGTTTGTTGCCACCTGTCTGGTCGCGGGCTTCGGCTCGTTGCTGATGGGGTTATGGGCCAATTTGCCAATGGCGATTGGTTGCGCTATTTCCTTGACGGCGTTTACCGCATTCAGTCTGGTACTCGGGCAACAAATTAGCGTTCCTGTCGCACTGGGCGCAGTCTTTCTGATGGGCGTCATCTTCACCGCTATTTCCGTAACCGGTGTGCGTACCTGGATCTTACGTAATTTGCCGATGGGGATCGCTCACGGTACAGGTATCGGTATCGGCCTGTTTCTGCTGCTGATTGCTGCTAACGGTGTGGGAATGGTTATCAAAAACCCGATTGAAGGCTTGCCAGTGGCGCTCGGTGCGTTTACCTCCTTCCCGGTGATGATGAGCTTACTGGGGCTGGCGGTCATCTTCGGTCTGGAAAAGTGCCGCGTACCCGGCGGGATCTTGTTGGTGATTATTGCAATTTCGATCATCGGCTTAATCTTTGACCCAGCGGTGAAGTACCACGGTCTGGTGGCAATGCCAAGCCTGACTGGCGAAGATGGTAAGTCTCTGATTTTCAGCCTCGATATTATGGGCGCACTCCAGCCAACTGTACTTCCGAGTGTACTGGCATTGGTGATGACCGCAGTGTTCGACGCCACTGGCACCATCCGTGCCGTCGCCGGTCAGGCGAATTTGTTGGATAAAGACAACCAGATCATCAACGGCGGCAAAGCCCTGACCAGTGACTCAGTAAGTTCAATATTCTCCGGCCTGGTGGGCGCAGCGCCCGCGGCGGTTTATATCGAATCAGCGGCAGGAACCGCCGCCGGGGGGAAAACCGGTTTAACCGCAACCGTGGTTGGTGTGTTGTTCCTGATGATTCTGTTTTTATCACCGTTATCGTTTCTGATCCCCGGTTATGCCACAGCTCCCGCACTGATGTACGTGGGTTTGCTGATGTTAAGCAACGTCTCGAAGCTGGATTTCAACGATTTTATTGACGCAATGGCTGGCCTGGTGTGTGCCGTGTTCATCGTTCTGACTTGTAATATCGTTACCGGTATTATGCTGGGCTTTGTAACACTGGTGGTGGGTCGCGTCTTTGCGCGCGAATGGCAAAAGCTGAATATTGGTACGGTGATCATTACTGCCGCACTGGTCGCGTTTTACGCGGGTGGTTGGGCAATCTAATAGATTCTCCGCGCCTTTCCG
CGCGGAGATTTCTTTCAGAGAGGATTCTCACTGCTGGCAGCAATACGCTGCTGGCGGATACGCCTGAGTTCTCTTTCAGTCAGCAACTGCAGCGCCTGTGTCGGGCAAGATTCAACGCAGGCTGGCCCCTCTTCCCGCAGTTCACAGAGATCGCATTTCACGATTTGTTGCCGGGGATCACCCGGCAATGACTGAATGGTGATCATCCCAAACGGGCACGCGCTAACGCAACTCTGACAGCCAATACAACGGGCAGAATTGGCCTGCACCACCTGCTCGCCCATCGTCAGCGCCCCCACGGGGCAAGCGCCAACACAAGGGGCGTTTTCACACTGATGGCACATCACCGGCGCACTGATGCTATCCAGCCGTTGTACCTTCAGCCGGGGTAAAAAGATATCGGCATTCAACTCCTGTTCTGAAGGGTGAGCGACCACACAGGCCACTTCACAAGTACGGCAGCCAATACAGTCAGCCGGATTAACGATAATTAACGATTTCATCACGATGCCTTCGTATCAAACAGAGTTAACATATCGCGCGCCGCCTGCCTTCCTGCGGCCATTGCAGTGACAACCAGATCCGCGCCATGAACTGCATCACCACCAGCAAAGACTTTTTTCAGATGCGTCTGGGTAGGTAAATACCCGACGTCGCCGGTTTGAATCAGGCCCCATTTATCGAGTTTAATTCCGCTGCCCTGCAACCACGGCATGGTATGTGCCTGGAAACCAAAGGCCATAATGAGAACATCGGCGGGCAATTCAAACTCTGAACCCGCAACCGGACGAGGACGACGGCGACCATCCGGCCCCGGCTCACCCATAGCGGTACGAATCAGGCCCACCGCCGTTAAGCGTCCATCTTCATCACAAGCGATATATTGCGGCTGAACATTGAACTGAAACTCAACACCTTCCTCGCGGGCATTGACCACCTCTTTGCGCGAACCCGGCATACTGACTTCATCACGACGATACGCACAGGTCACGCTGGCAGCATTAAGGCGGATGGAAGTCCGCAAACAATCCATTGTCGTATCGCCACCGCCCAATACCACGACTCGCTTCCCTTCCACATCCGTCAGCGGATACTCTGCAGACTCCGGCAATCCCATGAGCTGGCGGGTATGGGCGGTCAGGAACGGTAACGCCTGAATGACACCAGGCGCATCTTCATGCGGCAGATCTGCTCGCATCATCCCGTAAGTCCCCACGCCGAGGAAAACAGCATCATATTCCGCCGTTAATTCGTTGAAAGAGATATCGCGGCCAATTTCACAGTTGAGATGGAAATCGATTCCCATTGCGGTGAATATCTCTCGCCGCTGGCTTAATACCGTTTTATCGAGTTTGAAAGGAGGAATGCCAAAAGTCAGCATACCGCCAATTTCTGGATGGCGATCAAAGACATCAACCTGAACTCCCGCGCGCGCCAGAATATCAGCACACCCTAATCCTGCAGGTCCAGCGCCAATCACCGCCACTTTTTCGCTACGGGGAACAACTTTGCTGACATCGGGACGCCAGCCCATCGCCAGCGCAGTATCGGTGATGTAGCGTTCCAGATTACCGATAGAGACTGCGCCAGAGTGATCTTTCAAAGTACATGCACCTTCACAAAGACGGTCCTGTGGACATACCCTGCCGCAGATTTCGGGTAAGGAACTGGTCTGGTGGCAAAGTTCTGCCGCTTCAATAATCTTTCCTTCCTGTACCAGACGGATGTAATCCGGAATAGCGTTATGCAGCGGACAATGCCAGTTGCAGTTAGCTTTTTCGGCACAATAAACACAGCGGTCACTCTCATAAGTCGCTTGTTGTGGATCCAGCCCGCAATAGATTTCGCCAAAGTGGGTTTTCCGTTCACTCGCTGAAATTTTATCTGCGCCTTTACGCGAGTTAACGGGGAGCAACGCTGCACTGCGAGATGGCTGAGCGTCTGATGACGCTTTTCCTGCTGCCGTTTTGCGCTGGCGGGCCACCTTTATCTGCTGCAAC
CCTTTATCGTCCATCAGCCGTAACGCCTGTGTTGGGCAGACGTCAATACAGGCTTGCGTGCCGGAACTGCGCTGGTTACAAAGGTCGCATTTCTGTGCAATCGTATCGACCATCTCAACGACGCCAAAGGGGCAAGCGATTGCGCATCTTTTACAACCAATACATTTTTGCTCGTCCAGTTGTACGCTATCGGACTGGAAAGTCAGAGCATTAACCGGACAAGCCGTAACGCAAGGGGCATTGTTGCAGTGATGGCAGGCCACCGGATTCGCAGCCTGGCCTTTCCCTACAACGTGGATACGCGGTCGAAAGTCACTGTGACTCAGCGGCCAGTTTTCTTGATTATGTGCCACCGCACAGGCAATTTCACAAGCATGGCAGCCTATACATTCCGCAGCTTCAGCAGCGATAAACTTATTCATTTGCATCCCTTTCATTTAATGAGTTATGTCTTCTCAAATTTCGCGATGCAATAAACGGGCATATATTAGGTAGCATGACCGTTTTAATTATAATTTTGCAACTGAGTTCAAATTATTGCCCCTCAATCTATGCCGCTTTCATTATTTCAACATTGCCGATCAAAAGAATGCTATCCAGATAAAAACGATTAAATGCGAGAGTGCGACATGCCAGAATGATTAATGAAATATCAATATGAGAAAATTACAGATAATTCCATTGTCAGGTTCTCTTCTCATAATCGTGGTTTAACCACGATTATGTGATTGCCTCCGCAATTCCTGTCTCTAACTCCCCTTCCTCGCAAAAACTGGCACTCCACGAGCATGTGTTTAGACAGTTTCATGAACATAAACGGTTGCTTTTTACTCTGGCGGGCGAAAGGAGAAACACTGATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGACCGCCCAACTGATGAGGTTGACCGCATATTATCACCAGGAAAGCTGATCATACTCGGTCTGCAACACGTCCTTGTCATGTACGCAGGTGCAGTCGCTGTTCCTCTTATGATTGGTGACCGACTCGGCCTATCAAAAGAAGCTATTGCGATGCTCATCAGCTCGGATCTCTTTTGCTGCGGGATCGTCACATTATTGCAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGCCGGTGATTATGTCGGTGACCTTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGATATCGGCCTGCTGGGGATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATTAGCGCCACTTATCGGTCGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGATTACTTCTATCGGGCTTAGCATCATTCAGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGGGAATCCGCAATATGGTAATCCCGTTTATTTAGGTATCTCCTTTGCCGTCTTAATTTTTATCTTGCTCATTACTCGCTATGCGAAAGGATTTATGTCCAACGTCGCCGTATTACTGGGGATTGTATTTGGCTTTTTACTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTACATGATGCTTCATGGTTTGCGATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGTTTCCATTCTGACCATGACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTTCCTGGCACTGGGTGAAATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTTACGCGTAGATGGGGTTGGGACAATGATTGGAGGCACGTTTAACAGCTTCCCACATACGTCATTTTCGCAGAACGTCGGGCTGGTCAGCGTGACGCGCGTCCACAGCCGCTGGGTGTGCATTGCTTCCGGTATCATTTTGATCCTGTTCGGCATGGTGCCCAAAATGGCGGTGCTGGTGGCCTCGATTCCGCAATTTGTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTACTGGCGACAGGGATTCGAATTCTG
TCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATATTGTGGCGATCAGTCTCGGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAAGTTACCGGCCGTACTGCAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGCCGTTGTGCTGAACGTCTTCTTTAATGGCTACCAGCATCATGCTGACCTGGTGAAGGAATCCGTCTCTGATAAAGATTTAAAAGTCAGGACAGTACGTATGTGGCTTCTGATGCGCAAGCTGAAGAAAAATGAGCATGGAGAATAATATGAATCTTTTAATGCGCGCTATATTCAGTCTGCTGTTGCTTTTTACTCTCTCTATTCCTGTCATTTCTGATTGTGTTGCAATGGCCATTGAAAGTCGCTTCAAATATATGATGCTGCTTTTTTAAATGGTTTTTACCTGTCGACATCCGCTCAAAACGGGCGGTTGTCGATAAACGCTCACTTGGTTAATCATTTCACTCTTCTATTATCTATAATGATGAGTGATCAGAATTACATGTGAGAAATTATGCAAACGGAACACGTCATTTTATTGAATGCACAGGGAGTTCCCACGGGTACGCTGGAAAAGTATGCCGCACACACGGCAGACACCCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTTAATGCCAAAGGGCAATTATTAGTTACCCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGCGTGTGGACTAACTCGGTTTGTGGGCACCCACAACCGGGAGAAAGCAACGAAGAGGCGGTGATCCGCCGTTGCCGTTATGAGCTTGGCGTAGAAATTACGCCTCCTGAATCTATCTATCCTGACTTTCGCTACCGCGCCACCGATCCGAATGGCATTGTGGAAAATGAAGTGTGTCCGGTATTTGCCGCACGCACGACCAGTGCGTTACAGATCAACGATGATGAAGTGATGGATTATCAATGGTGTGATTTAGCAGCGGTTTTACGCGGTATTGATGCTACGCCGTGGGCGTTCAGTCCGTGGATGGTGATGCAGGCGACAAATCGCGAAGCCAGAAAACGATTATCTGCATTTACCCAGCTTAAATAAAAAACCCCGACGGTTGCCGGGGTTGTGAGCATAACGTAATGCTTATTTTACCGGACGCATCGCCGGGAACAGAATAACGTCGCGGATGGTATGGCTGTTGGTGAACAGCATTACCATACGGTCGATACCAATTCCCAGACCGGCTGTCGGTGGTAAGCCATGTTCCAGTGCGGTGACATAATCTTCGTCGTAGAACATCGCTTCGTCGTCACCTGCATCTTTCGCGGCAACCTGATCCAGGAAGCGCTGCGCCTGATCTTCCGCGTCATTCAGCTCGCTAAAGCCGTTACCGATTTCACGCCCACCAATGAAGAACTCAAAGCGGTCTGTGATTTCCGGGTTAACGTCGTTACGACGCGCCAGAGGAGAAACTTCTGCCGGATATTCAGTAATGAAGGTCGGCTGGATCAGATGTGCTTCTGCCACTTCTTCGAAGATCTCGGTAACGATACGGCCCAGACCCCAGCTCTTCTCAACGTGGATGCCGATAGATTCAGCAATCGCTTTCGCAGAGTCGAAGTTGTCCAGATCTGCCATGTCGGTTTCCGGGCGATATTTCTTGATCGCTTCACGCATGGTCAGTTTTTCGAACGGCTTACCGAAGTCCAGCGTTACGTCGCCGTAGGTCACTTCCGTCTTACCGAGAATATCCTGTGCCAGAGTACGGAACAGCGATTCGGTCAGCTCGATCAGATCTTTGTAATCTGCGTAAGCCATATAGAGTTCCATCATGGTGAACTCTGGGTTATGACGTACGGAAATACCTTCGTTACGGAAGTTACGGTTGATTTCGAATACACGCTCGAAGCCACCGACCACCAGACGCTTGAGGTACAGTTCCGGCGCGATACGCAGGTACATGTCGAGATCCAGCGCGTTATGGTGGGTGATGAACG
GACGCGCAGCGGCACCGCCAGGGATCACCTGCATCATCGGCGTTTCAACTTCCATAAAGCCGCGATTCACCATGAACTGGCGAATACCAGAGAGGATCTGCGAGCGCACTTTAAAGGTGTTGCGGGATTCATCGTTAGAGATGAGATCCAGATAACGCTGACGATAGCGCGCTTCCTGATCCTGCAAGCCGTGGAATTTATCCGGCAGCGGACGCAGTGCTTTGGTCAGCAGACGCAGCTCGGTACAGTGGATAGACAGTTCGCCGGTTTTGGTTTTGAACAGTTTACCTTTCGCGCCGAGGATATCGCCGAGGTCCCATTTTTTGAACTGCTCGTTGTAAACGCCTTCCGGCAGATCGTCACGGGCAACGTACAACTGAATGCGACCGCCAACGTCCTGCAGGGTAACGAAAGACGCTTTACCCATAATACGACGGGTCATCATGCGGCCAGCAACGGCGACTTCGATGTTCAGCGCTTCCAGTTCTTCGTTCTCTTTACCGTCGAATTCTGCGTGCAATTGGTCAGAGGTATGATCGCGACGGAAATCGTTCGGGAAGGCAATCCCCTGCTCACGCAGGTTCGCCAGCTTCTCACGACGCGTTTTCAGTTCATTGTTAAGATCGACTACCGCGTCAGCGCCCTGTGCGTGTTGTTCAGACATGTTGGTTCCTCATAACCCTGCTTTCAAACTTGCTTCGATAAATTGATCCAGGCTGCCGTCCAGCACGGCCTGCGTGTTGCGGGTTTCTACCCCGGTACGCAGATCTTTAATGCGGGAGTCATCAAGGACATAAGAACGAATCTGGCTGCCCCAGCCGATGTCGGATTTGTTATCTTCCATCGCCTGTTTCTCGGCATTTTTCTTCTGCATCTCCAGTTCATAAAGCTTCGCTTTCATCTGCTTCATGGCCTGGTCTTTGTTCTTGTGCTGGGAACGGTCGTTCTGGCATTGGGTCACGATCCCGGTTGGGATGTGAGTAATACGCACCGCAGATTCGGTACGGTTAACGTGCTGACCGCCCGCGCCGGATGCGCGATAAACGTCGATGCGCAGATCCGCCGGATTGATTTCGATATCGATATCATCATCAACTTCCGGGTAAACAAACGCGGAGCTGAACGACGTGTGGCGACGACCACCGGAGTCAAACGGGCTCTTACGCACCAGGCGGTGAACGCCGGTTTCTGTACGCAGCCAGCCATAAGCGTAATCGCCGGAGATTTTGATCGTCACGGATTTAATACCCGCCACTTCACCTTCCGACTCTTCGATGATTTCAGTTTTGAAACCACGCGATTCAGCCCAGCGCAGATACATACGCTCAAGCATGCTCGCCCAGTCCTGTGCTTCCGTACCGCCAGACCCCGCCTGAATATCGAGGTAGCAGTCGGCGCTGTCATATTCGCCAGAGAACATACGGCGGAACTCAAGCTGCGCCAGTTTTTCTTCCAGGGCGTCGAGTTCAGCAACGGCTTCGTTAAAGGTTTCTTCGTCGTCAGCTTCTACAGCCAGTTCCAGCAGACCAGAAACATCTTCCAGCCCCTGTTTCATTTGGTCGAGGGTGTCGACAACGGCTTCGAGGGAGGAACGCTCTTTACCCAGCGCCTGTGCGCGTTCGGGTTCGTTCCAGACATCCGGCTGTTCCAGCTCGGCGTTTACTTCTTCCAGACGCTCTTTCTTGGCGTCATAGTCAAAGATACCCCCTAAGAACGTCGGAGCGTTCCGTGAGGTCCTGAATGCGATTATTTACCGGATTAATTTCAAACATGGTCTGATTTCTTTTATTGAGCTAGTCAAAATGCGGTGATTAGAGCGGGATTGTACCCAATCCACGCTCTTTTTTATAGAGAAGATGACGCTAAATTGGCCAGATATTGTCGATGATAATTTGCAGGCTGCGGTTGCCGCGAAACTCGTTGATATCGAGCTTGTAAGCCAGTTGCACTTCGCGCACGCCGTTATCCGGCCAGAGGGCGGTATCGACATTAAAAGCAAT
ACCATCCAGCAGCGGACCGCCGCCGACCGGCTCGACCATGACTTTCAAATGACGCTCGCCCACCAGCCGCTGTTGCAGCAGACGGAAATGACCGTCAAACAACGGTTCCGGGAACATTTGTCCCCACGGGCCAGCATCACGCAGCAGTTGCGCCACTTCCATGGTCATCTCTGCCGCACTTAATGGGCCGTCTGATACCACTTCCCCTTGCAATAAAGAAGGATCTAACCACTCGGTAACCAGTTCGCCAAAGCGTTGCTGAAAGAGTTCGAATTTCTCCTCTTCCAGCGACAAACCCGCCGCCATCGCATGGCCGCCAAACTTGAGCATCATGCCGGGGTAAAGCGTGTCTAGCCGCTCCAGCGCATCGCGCATATGCAGCCCCTGAATGGAGCGACCGGAACCTTTCAGCGTACCGTCGCCCGCAGGCGCAAAGGCGATAACCGGACGGTGAAAACGCTCTTTGATACGCGATGCCAGAATGCCAACAACGCCCTGATGCCATTCAGGGTGATACATTGCCAGCCCACCTGGCAGCGTGTCGCGGCTACGTTCCAGCTTCTCGCACAGAGTGAGCGCTTCAACCTGCATTCCCTGTTCGATCTCTTTACGTGTTTGGTTTAGTGCATCGAGTTCATTCGCCAGCACACGCGCTTCGCCAATGTTGTCACACAACAACAGCGCCACGCCAACGGACATATCGTCCAGTCGCCCGGCAGCATTGAGACGTGGCCCCAGCGCAAAACCTAAATCGCTGGCGGCGAGTTTTTGTGGATCGCGATTGGCCACTTCCAGCAGCGCTTTAATCCCCGGACGGCACTTTCCGGCACGGATGCGACTCATCCCCTGCCAGGTCAGAATGCGATTATTAGCGTCCAGCGGCACGACGTCCGCCACTGTCCCCAACGCTACCAGATCCAGCAGTTCTGCCAGATTAGGAATTGCGATGCCGCGCTCATCAAACCAGCCCTGATCGCGCAAAAAGGTGCGCAGCGCCAGCATCAGATAAAACGCCACACCCACGCCTGCCAGTGATTTCGACGGGAAATTACAGTCGCGCAAGTTAGGGTTAATGATCGCTTCCGCTGCGGGTAATGTGTCGCCTGGCAAATGGTGATCGGTAACAATAACCGGAATGCCCAACGAACGAGCGTGTTCAACCCCCGCATGGGAGGAAATACCGTTATCCACCGTGACAATTAACTGCGCGCCACGGGCATGAGCCTGATCGACTACTTCCGGGCTTAAGCCGTAACCGTCTTCGAAACGGTTTGGAACCAGGTAGTCGATATTGCTGCAACCAAGCGAGCGCATCGCCAGCACGCTTAGAGCCGTGCTGGTCGCACCGTCGGCGTCGAAATCACCGACCACAATAATCCGCGTTCCTTCGCGAAAAGCGTTGTAAAGGATCTCAACGGCCTTTTCGACGCCGCTCAGTTGCTGCCAGGGCAGCATGCCTTTAACACTGCGTTCCAGTTCCTGCGCGCTACGCACACCCCGGCTGGCATATAAACGGCGCAGCAAGGGAGGCAATTCAGCGGGCAAGTCGGCCGTTTCATCGACTTCTCGGCGACGAAGTTGTATCTGTTGTTTCACGCGAATTATTTACCGCTGGTCATTTTTTGGTGTTCGTCGAGGAATTCTTTCATGTCTTTCGGCGGCTGGTAACCCGGAACAAGTGTGCCATTGCTCAGCACAACTGCCGGAGTACCGCTAACGCCAAGCTGGACGCCAAGTGCGTAATGGTCGGCAATATCCACGTCGCAGCTGGCTGGTGCGACGCTTTTACCTGCCATCACATCATCAAACGCTTTGTTTTTATCTTTCGCACACCAGATAGCTTTCATTTCTTTCTCTGCATCGCTGTCCAGCCCCTGGCGCGGGAAAGCAAGATAACGCACGGTGATCCCCAGCGCGTTATAGTCTGCCATTTGCTCATGCAGTTTGTGGCAGTAACCACAGGTAATATCAGTAAACACGGTGATGACGTGTTTTTCCTG
CGGCGCTTTATAAACGATCATCTCTTTTTCAAGCGCATTCAACTGCTTTAACAGCATCTTATTGGTGACATTGACCGGAGCCGTGCCACTAACGTCATACATTGGCCCCTGAATGATATGTTTACCATCATCGGTGATGTACAACACACCGCTGTTAGTCAGAACTGTCTTCATGCCAGCTACGGGCGCGGGCTGAATATCGCTGCTTTTGATGCCCATTTTGGCTAACGTTTGTTGAATTGCCGCGTCATCAGCCTGAACAAAGCCTGAAAACGCTGCCAACAAGGTAAATAACATAAAACCTTTCTTCATAAATTTTCCTGTTCTTTTCAGACATCACGCCCGCGGGTGATGCTGTTGATGAAGTTGTCGCAGACGCTCGGTAGCGACATGCGTATAAATTTGCGTGGTGGAGAGATCGCTGTGGCCCAGTAGCATCTGCACCACGCGTAAATCCGCACCATGATTTAATAAGTGAGTGGCAAAAGCGTGACGCAACACATGCGGTGACAGCTTTTCGCTGTCGATACCCGCCAGCACGGCATAATGTTTAATGCGGTGCCAGAAGGTCTGTCGCGTCATCTGCTGCGCACGCTGGCTGGGAAACAACACGTCAATTGACACACCATTCAACAGCCACGGACGCCCATGTTCCAGATAGGTTTCCAGCCAGTAAACCGCCTCTTCACCTAACGGCACCAGGCGCTCTTTGTTGCCTTTACCAATGACCCGCACCACGCCCTGACGCAGGCTGATATCACTCATTGTCAGCCCGACCAGTTCAGAGACACGCAGTCCGGTAGCATACAACACTTCAAGCATGGCTTTATCGCGTAGCTCCAGTGGCTGATCAATTAATGGTGCCTGTAATAAACGTTCGACCTGCGCTTCGCTTAAATCTTTTGGCAAACGCTGGGGCAATTTCGGTGAAGCGAGATGCGCACTGGGATCATCTTCACGAAACTTTTCGCGATAAAGATACTGGAACAATCGGCGCACTGCACTCAGCAAACGCGCTGAGCTGGTGGCTTTATACCCGCCCTCCAGCCGTTCTGCCAGTAATGCCTGCAAATCGTCACTTTGCGCCGTCGCCAGCGTCAACCCGCGGTGATGCAACCACTCCACCATCATTGACAGATCGCGACGGTAAGCGTTCAACGTATTTTCAGCCAGATTTTTTTCCAGCCACAGAGCATCAAGAAACTGCTCGATGCGTGCCAGATCCTGTTTCACTTGCGCCCCTTATGGTCACTCATTTGATCCATTATGCCTTATTGTGCCGTGACTAAAGCGATTCTGATACACTAGCCGCAAAAGCCACAGCAGAATCGAGAAGCTTACGTTATGAATATGGGTCTTTTTTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAAATCCGCGATATTATCGGCCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCGAAATTAATGGAGCAGTACGATGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAAATCCAGGAAGACTGGGAAGCCGTCTGGGATCAGCTCGACGACCTGAACCTCGAAGGTAAAATTGTTGCGCTGTATGGGCTTGGCGATCAACTGGGATACGGCGAGTGGTTCCTCGATGCGCTCGGTATGCTGCATGACAAACTCTCGACCAAAGGCGTGAAGTTCGTCGGCTACTGGCCAACGGAAGGATATGAATTTACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTGGGTCTGGCGCTGGATGAAACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGGTGCGAGCAAATCCTCAACGAAATGGCAGAGCATTACGCCTGATGTCACTGACGGCTTAGCACATATGCTTTGCCGTCATCTTTATCTTTGCGTCTCTTGTTGTAACAATATCCGCCGTAAATCCCGCCATTCGGCTTCGTCCATGCTGTCAGCTGCCAGCCATAAATGTTGCCGTT
TTCCGCTGTCAGAACGTAAACGCAGCATCATGCCGCTCTTAATCATCCACGGCGCTTTGACGATGCTCCACTCCTGCCCTTGCCAACGCAAACGCCCGTCCATCAACAAGCGAATTTCCCCCTGGCGAGCATTAATGCGCCGCTGGCTGCGAACGCAATCAAACACCACCAGCGAAAGTAACACCATCCATAACGGGGTGTAACTGAGCGGCCAGGGCATGAGTAAAATAACAGCGGCAACCAGCCCATGAATCAGCAAGGAAAGCCACTGTGCGCGCCAGGAGACGCGCAAATCAGATTGCCACAGGACCACGTTCCCGGTTCCGTGTCTGGATGAGTCGGACCATCATTTCCAGTTCTGCATCGGCTGGTTTACCGTGATTCATCAGCCAGTTAAACAGGTCCGGATCGTCACATTCCAGCAGACGAATAAAGATGCGTTTTTCGTCATCGCTTAAGCTGTCGTACTCATGTTCGAAAAACGGCATGATTGAAATATCGAGTTCGCGCATACCACGGCGGCATGCCCAATGAATGCGGGCTTTGTTGTTAATGTCCATCTTCTTCCTGTCTCACGAAAATCCAGTACCCGGCTATTGTAACGTGTTTTTCGACTTCTTTTACGGGAATATCAGTAAACACAATCGCGATCGCGAAATTAATTCACAACAATTCAAGGGCTTCATTTTTTTGGAAGTCGCCTCGCAGAAGGCACAGATCGCGTAGTGAAAGCACTTGCATTGCCTCATAGCTCTTTTACCATTAGTTATTAATACGCCGTTAAGCAACTCAGGACTCTATTATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGACGCTGATGACGCTTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATATATGCAAGGCCAGGTGACAGCAGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGCCGCCCATTGCGACGCCAAAGGTAAAATGTGGAGCAATTTACGTCTGTTCCGCGACGGCGATGGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCACAGCTGACTGAACTGAAAAAATATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCTGCTTGGTGTTGCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGAAAAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACGTTTCCTGATCGTAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGAAGCGGAACTGAACAATAGCCAACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGTGATTGATGCCGCCAACAGCGGGCAGTTTATCCCCCAGGCGACCAACCTCCAGGCGCTGGGCGGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGATGGTGGCGCGAGCAAAATTCCGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCGACTGCCGGAAGCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCTGGCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATATGGAACCGGACAGCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACTGCCATATTCGCTGGAAGAGTAAATCTCTGTATCGCATCAGGCATTTATCGCCTGATGCGACACTGGTGTGTCTTTTCAGGCCTACAAAGGCACGCCAATTACGCCTGCCCAATATACAAATAGATCGCCAGAAAGTGGCACACACTACCGCCGAGCACAAAGCCGTGCCAGATGGCATGATTGTATGGAATGCGCTTGCAGACGTAGAAAATCACCCCGAGCGAATAAACCACACCGCC
TACCGCCAGTAAGGTAACGCTGCCCGCCGCGAGCTTAACTGCCATTTCATAAATTACCACCAGCGACAGCCAGCCCATCGCCAGATAGGTCACCAGAGATAAAATTTTGAATCGGTGCGCGATGGTCAGTTTAAACAGAATACCCAGCAATGCCAGGCTCCAGATAACAATCATCAACCCGCGCGCTAACGGAGAATCCAGCCCCACCAGCAAAAACGGCGTATAGGTTCCGGCAATCAACAGATAAATGGCACAGTGGTCAAATTTCTTCAGCCACATTTTTGCCCGTTGATGGGGAATGGCGTGATAGAGCGTCGAAGCGAGGAACAGCAGGATCATACTGCCGCCATAGAGGCTGTAACTGGTTATCGCCGTGGCGCTGGCATTGAGATCCACCGCCTGAACCAGTAGCAACACCAGCCCAACGATACCAAACACCAGCCCAATGCCGTGACTGACGCTGTTGGCAATTTCCTCTGCCAGCGAATATCCCTGCTTAATGAGGGGCTTCTGAACCATAACTTACTCCGGAAAAACGTACACGCACATGTATACCTCTCCAGCGTAACTGAGAATAGTTCCAGTGAACACCTGTTAGCTAAAATAAATTCTGATTTGAGATTAATCTCCGAAAAATCATGAAATTAAATGCGAAATTTCAACTAACAGGCGTGAGTTCAATTTAAAGACATTTAAATTCAATCACATAAAACTGTGTCTGGTCGGGATAGATGTCGGCAATGACCTTTTTCAGTTCAGTCAGGGTCATATTTTCCTGCTCTGCATGTTTTTCCGTCAGCGTATCCAGCGTTACGGTTGAGGTTGCGGTGACTTCAATCGTGCAAAAATAACCGTCATCTTCAAAACGTCCGACACGAAGCACATCACCCGTTTTGAAGTGCGATTCAGACTCGTCGCGGATGGTGATGGTTTTACGCCCAGCCAGAATGTCATCCTGGAAACGTTGAAAAAAAGTGATGTCGTTTGGCTGCATGGTAATATTTCCTGTAAGAATTGACTCATCTGGAGCCTATGATAGTGAAAAAACTCACCTTACCGAAAGATTTCTTATGGGGCGGCGCAGTTGCCGCTCATCAGGTCGAAGGCGGCTGGAACAAAGGCGGCAAAGGGCCGAGCATTTGTGACGTTTTGACCGGTGGCGCACACGGCGTGCCGCGCGAAATCACCAAAGAAGTTGTGCCTGGCAAATACTATCCAAACCATGAAGCCGTTGATTTTTATGGTCACTACAAGGAGGACATCAAGCTATTTGCCGAAATGGGCTTCAAATGTTTTCGTACTTCCATCGCCTGGACGCGCATTTTTCCAAAAGGCGATGAAGCTCAGCCAAACGAAGAAGGGCTGAAGTTCTACGATGATATGATCGATGAACTGCTGAAATACAACATCGAACCGGTGATCACCCTCTCCCACTTTGAAATGCCGCTGCATCTGGTGCA +>test.0417.00002.0005 6009 
+GCAATATGGTAGCTGGACCAACCGTAAAGTGGTTGATTTCTTTGTCCGTTTCGCGGAAGTGGTATTTGAACGCTATAAGCATAAAGTCAAATACTGGATGACTTTCAACGAAATTAACAACCAGCGTAACTGGCGTGCACCGCTGTTCGGTTACTGCTGCTCCGGCGTGGTGTATACCGAGCATGAAAACCCGGAAGAGACGATGTATCAGGTGCTGCATCACCAGTTTGTCGCCAGCGCCCTGGCGGTGAAAGCCGCGCATCGCATCAACCCGGAGATGAAAGTCGGTTGTATGCTGGCGATGGTGCCGCTCTATCCTTACTCCTGTAACCCGGACGATGTGATGTTTGCCCAGGAGTCGATGCGCGAACGTTACGTCTTTACCGATGTGCAGTTGCGTGGCTATTACCCGTCCTATGTGTTGAACGAGTGGGAACGCCGCGGATTTAACATCAAAATGGAAGACGGCGATCTGGATGTACTGCGCGAAGGCACCTGCGATTATCTCGGCTTCAGCTATTACATGACCAACGCGGTGAAGGCCGAAGGTGGCACCGGCGATGCGATTTCTGGTTTCGAAGGCAGCGTACCGAATCCGTATGTTAAAGCGTCTGACTGGGGCTGGCAGATTGATCCGGTTGGTCTGCGCTACGCACTTTGCGAGCTGTATGAGCGTTACCAGAAGCCGCTGTTTATTGTCGAAAACGGTTTTGGCGCTTACGACAAAGTGGAAGATGATGGCAGCATCAATGACGATTACCGCATTGATTACCTGCGTGCCCATATTGAAGAGATGAAAAAAGCGGTGACTTACGATGGCGTGGACCTGATGGGCTACACGCCGTGGGGCTGCATCGACTGTGTGTCGTTCACCACCGGGCAGTACAGCAAACGCTACGGCTTTATCTATGTGAATAAACATGACGACGGTACTGGCGATATGTCGCGTTCACGTAAGAAGAGCTTTAACTGGTACAAAGAGGTGATTGCCAGCAACGGCGAGAATCTGTAATTAGCCGATGTGCCTGATGTGCTCCGCTCATCAGGCCTGGCACTCTTTTAATATATTGAGCTCGCAATATTTTATATTACGCCTCAGCCGAAACACACAAAGCGCACTTTATTAACAAGCGAAAAAGGCGCCGAAGCGCCTTTATAAGATAGTCGAATCAGTAAATTACTGGTATTCGCTAATCGGTACGCAGGAGCAGAACAGGTTACGGTCGCCGTAAACATCATCCAGACGTTTCACGGTCGGCCAGTATTTGTCTGCCACACCTGCCGGGAATACTGCAACTTCACGGCTGTACGGATGCGCCCACTCGGCGACCAGTTCGCTTTGAATGTGCGGCGCATTCACCAGCGGGTTATCTTCCAGCGGCCAGACACCGGCTTTCACCTGATCAATTTCTGCGCGGATAGCCAGCATCGCATCGATAAAGCGATCCAGTTCCACTTTGCTTTCAGATTCAGTCGGTTCAACCATCAGCGTACCCGCCACCGGGAACGACATGGTCGGCGCGTGGAAACCGTAGTCGATCAGGCGCTTGGCAATATCCAGCTCGCTGATGCCGGTTTCTTCTTTCAGCGGGCGAATATCGAGAATACATTCGTGCGCCACGCGACCGTCGCGACCGGTATACAGCACCGGGAAGGCATCCTGCAGACGGCTGGCAATATAGTTGGCGTTAAGAATTGCCACCTGGCTTGCTTTTTTCAGCCCTTCTGCGCCCATCATGCGGATGTACATCCAGCTGATTGGCAGGATAGAGGCACTACCGAACGGTGCCGCAGAAACCGCGCCCTGACGGGTTAACATGCCTTCGATTTGCACCACGCTATGACCCGGTACAAACGGAGCCAGATGCGCTTTCACACCGATCGGTCCCATACCCGGACCACCACCGCCATGCGGAATGCAGAAAGTTTTATGCAGGTTAAGGTGGGAAACGTCCGCACCAATAAAGCCCGGCGAGGTGATGCCAACCTGAGCGTTCAT
GTTCGCGCCATCAAGGTAAACCTGACCGCCGAACTGATGCACGACTTCACACACTTCACGGATCGTTTCTTCATACACGCCGTGGGTAGAAGGATAGGTCACCATGATACAGGAGAGGTTATCGCCCGCCTGTTCCGCTTTCGCGCGCAGATCAGTCAGATCGATGTTGCCGTTTTTATCACACGCCACAACCACCACCTGCATTCCTGCCATATGCGCGGAAGCCGGGTTAGTGCCGTGCGCAGAAGCCGGGATCAGGCAGATATCGCGATGCCCTTCGTTGCGGCTTTCATGATAATGACGAATCGCCAGCAGGCCCGCGTATTCGCCCTGTGCGCCAGAGTTCGGCTGCATACAAACGGCGTCGTAACCGGTCAGTTTCACCAGCCAGTCAGCCAGCTGCGCGATCATCTGCTGATAACCTTCAGCCTGTTCTGGCGGGCAAAACGGGTGCAGTTCGGCAAATTCCGGCCAGGTGATCGGGATCATCTCGGCGGCGGCGTTCAGTTTCATGGTGCAGGAACCCAGCGGGATCATCGCCTGATTCAGCGCCAGATCTTTACGCTCCAGCGAGTGCATATAGCGCATCATTTCGGTTTCGCTGTGGTAGCGATTAAACACCGGATGGGTGAGGATTTCGTCGTCGCGCAGCATCGCAGCCTGAATAGAGCGACTGTCGTGAGCCACGTCTTTGTCCAGTGTGTCGATGTCCAGCCCGTGGTTATCGCCCAACAGCACGCTGAAAAGCTGCATCACGTTTTCGCGCGTGGTTGTTTCATCAAGGGTGATCCCAACCGCGTTCAGAATATCGCTACGCAGGTTGATTTCAGCCGCTTCGGCACGCGCCAGCACGCCCGCTTTGTCGGCCACTTCCACACACAAAGTATCGAAATAGTGCGCATGGCGCAGCTTCAGACCTTTTTGTTGCAGGCCCGCCGCCAGGATATCGGTCAGACGGTGGATGCGATTAGCGATACGTTTCAGGCCAACCGGACCGTGATAAACGGCATACAGGCTGGCAATGTTTGCCAGCAGTACCTGGGAAGTACAAATGTTGGAGTTCGCTTTCTCACGACGAATATGTTGCTCGCGAGTCTGCATCGCCATGCGCAGAGCGGTGTTGCCAGCTGCATCTTTCGATACACCGATAATACGGCCCGGCATTGAGCGTTTGTATTCGTCTTTCGCCGCAAAGAATGCCGCGTGTGGGCCACCATAGCCCATCGGTACGCCAAAGCGTTGCGCCGAACCAAAAACAATATCCGCGCCCTGTTTACCTGGCGCAGTTAACAGCACCAGCGCCATAATATCGGCGGCAACGCTGACCACAATTTTGCGTGATTTCAGTTCGCTAATAAGCGCGGTGTAGTCGTGAATTTCACCAGTAGTGCCGACCTGCTGTAACAGCACGCCGAAAACGTCCTGATGGTCGAGCACTTTTTGCGCGTCATCGACAATCACTTCAAAACCAAAGGTTTCGGCACGAGTACGGACCACATCCAGCGTTTGCGGATGAACGTCAGAAGCAACAAAGAAGCGGTTGGCATTTTTCAGTTTGCTGACGCGTTTCGCCATCGCCATTGCTTCGGCGGCAGCGGTGGCTTCGTCAAGAAGAGAAGCAGAGGCCATATCCAGCCCGGTTAAATCCAGCGTTACCTGCTGGAAGTTGAGCAGTGCTTCAAGGCGGCCCTGGGAGACTTCAGGTTGATACGGAGTATACGCGGTATACCAGCCCGGATTTTCCAGCATGTTACGCAGGATAACCGGCGGTAGCTGCACGGCGGTGTAACCCATGCCGATGTAAGACGTGAAGCGTTTATTGCGACTGGCAATAGCCTTGAGTTCTGCCAGTGCGGCGTATTCGGTCGCCGGTGCGCCAACCTGCGGCGGAGTCGCAAGCTGAATATCTTTCGGCACAATCTGGCCGGTCAGCGCGTTTAACGATTGTGCGCCAACGGCATTCAGCATTTCTTGCTGTTGCGCGGCGTCCGGTCCGATAT
GGCGTTCAATAAAAGCGCCGCTGTTTTCAAGCTGGCTTAACGTCTGTGTCATGAGCGATGGTTCCTGAAACGTGCAGTGAATTGTGAACCTCTCTCCTTGCGAAGAGAGTGAGGGTGAGGCGTAAATTTCCTCACCCTGATCCTCTCCCGCAGAAGAGGAATAAAGCCGTTACTCGTCTTCTAACAATGCTTCGTATGCGGTTGCATCCAGCAGTGATTCCAGTTCGCTTTCATCGCTGGCTTTGATTTTGAAAATCCAGCCGCCTGCATACGGTTCGCTGTTCACCAGTTCCGGGAAATCGCTCAGTGCATCGTTTACCGCCACGATTTCACCGCTTACTGGCGCATAAATGTCTGACGCCGCTTTTACCGATTCGGCAACCGCGCAGTCATCGCCCGCGCTAACCGTTGCGCCCACTTCCGGTAGGTCAATAAACACCATATCGCCTAACAGCTCCTGAGCGTGTTCGGTGATGCCAACGGTGTAAGTGCCGTCGGCTTCTTTACGCAACCATTCGTGTTCTTTGCTGTATTTCAGTTCTGCTGGTATGTTGCTCATCAATCAATCTCCAAAAAAGTAAATCACGCGACGGCTTTGCCGTTACGCACAAAAACAGGTTTCGTCACTTTAACCGGCATTTCACGGTTGCGAATTTGCACAATCGCCGTTTCACCAATACCTTCCGGCACGCGCGCCAGCGCAATGCTATAACCCAGCGTTGGGGAGAAAGTACCGCTGGTGATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACGCAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTGCGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCAGCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCATGCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTCCACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGCTTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGGTTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTGCGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCCGAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAACAACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCCAGAGGCATTCAACATCCCCGAGTAAAGGGCTTTGCCGCTTTTGGTGAGCTTCGCCACATCGTTCGCCAGCAGATAACGTAGAAACTCCCGGGTGCGGCTGCCGCGAAGATCGACGATGGTCATATGTGACACATCAAACATTCCGGCATCGGTACGTACCGCATGATGTTCGTCGATTTGCGAACCGTAATGCAGCGGCATCATCCAGCCGTGGAAATCCACCATGCGAGCGCCGCAAAGCGTGTGTTGTTCGTACAAAGGAGTCTGTTGTGCCATCTTGTCCTCATTGAATAAGCGGGGCTGACAACTTTTCCATGGCGAAATTATCACCACGAAACCCAGCATCGGAGCCACTCCCGGTCCCCAACGCAATCGTTCTCTTTTGCCTGAACTTACCACCGAAACAGACTGTTAACCATAAGGTAAAATTGATCATCACATTAGCTTATGGTTAAAAAACGCCAAAATCGTAACAGAATAAAAAACCAAAAAATGAACAAATCTCTATATAAAGATAAATAGATGAGAAAGTTAATTTGAATAAGACAACATTAAGAACTAAAAAAATGTCAAAAAACACTAAATCAAAAATTCGTGGC
ATTAGAAAAT diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test_runprokka_H299.fna b/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test_runprokka_H299.fna new file mode 100644 index 0000000000000000000000000000000000000000..d3a4a1981ef3c007d131cf5d3b708a7a239ec122 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/Replicons/test_runprokka_H299.fna @@ -0,0 +1,223 @@ +>test_runprokka_H299.0001 3480 +AGCAGCACGCTTTTTAATCCGTCCACCGGACCTTCAACCGGCCCTTCGCTGATGGCATCG +ATCACACTCAGCAGCTGCGTGGACTTCAGGTTGTCCTTCGCTTCGCGCGGGGTATGCCCC +TTACTGCTGCCTTTACCCATTCGTCATGCTCCATAAACGATAAAACCGCCCGGAGGCGGT +TTCACATAAAACATTTTGCATCAGCGACCAATCACCACAACCTGACCACCATCCCCTTCG +TCTGCCGTGCTGATCTCCTGAGAAACCACGCGTGACCCCACGCGCATTTCACCGTACAGA +ACCGGCAGAACATTGCCCTGGGCAACCATGTTATCCAGTGAAGAAAAATAGGTATTCTGT +TTGCCGTTATCCGTTGTCTGTGTGCGGGGGGTTTTGGGTTTAGGGGCCAGCATCTGTGCA +ACACCGCCAAGCGTCATACTGGCACCGAGAGAAAACAGCAGATTACTCGCCATAATTCCT +ACCCCCGGCATCCATATAGCAACCGCCATAACAGCCGCCCCCAGCACAGCCTGAAACACA +CCGCCACTTTTGGCTCCTGCCAGACGCGGCACGATATGGATCACGGCACCATTTTCCAGC +GGCTCATTAAGACGGGCAGACAATTCGGTTTCACCTGCATCACGCCCGGCAATGCGTACC +TGGTACCAGCCGTCGCTCAGTTTCTGACGAAATGCCGGGATCTGCATGGCCAGCGCCCGG +ATGGCTTCGGACCCCGTTTTCACTCGAAGGTCGATGCGGCGGCCAAATCGTTGTAAATCC +CCGTAAAGGCAGATGCGTGCCATGCCCGGTGACGCCAGAGGGAGTGTGTGCGTCGCTGCC +ATTTGTCGGTGTACCTCTCTCGTTTGCTCAGTTGTTCAGGAATATGGTGCAGCAGCTCGC +TGTCACCACAGTAAATGGCGGCATGATTCGGCACCGATGAACCAAAACAGCACAGCAGCA +CATCGCCCGGCTGCGCCGCTGACAACGGCACCTGATACAGCCCTGTGGCCTCCAGATTAT +CCAGATAGAGATTCTGACCGTTACGCCACCAGTCATCCCCGCGATGAAAATCCGGCATCT +CAATTCCCGCCAGATGGTAAGCGTCCCGGAACAGCGTGTAACAGTCCGTTACCCCGTGCT +CAAAGCGCCGCCCGGTGAGATGCGGCACACAGCGGAATTTATGAATCGCCCCCCGGCAGA +CCAGCCACCACGGCAAATCACTCTGTACCTGCAGCCGCCGGTCGGCCTCACTCAGCCAGG +GCAGACCACCGGGGTGGCTGTGGACCAGCGCCACAATCTCTCTCTGCATTTCTGCACTCA +GCCAGTCCTCCGGCGACATCCGGAAATACTCCTCCGGCTCACTGGAGATATTCACGCAGG +GAAAATATCTTTCCTCCTCCGGCGTTCTCACCACGAAGCCGCACGACTCCGCTGGCGCAC 
+ATCGCCGGGCGTGCGCCAGAATCGCTGATTCTGTCTCTGTCATGGGATTTACTGCGAAAG +TTTGTTAATGGAAAGGAAGCTGCCAAAGTTGCCGACATTATTGCGAAACTTACAGCCACT +CAGGCATTTGCTGCATTTATCCTTCGTGATATCGGACGTCGGCTGGTCATATTCATCCGC +GACCGCCGGACCGCTATAACCGCACTCATCGCCGCGATAGGTCCAGGTGCAGGTGTTGGC +CAGCATGATACGTCCCGGAAAAACAGCGCCATCCGTTTCAGTCGGCGTGGACAGTACAAA +AGAGGCACTGACCGCGCTCAGTTCGCTGCACTGCTCGATGCGCCAGCGGCTGATCACCTC +CTGCTCCGGATCGGCTTCGCTGTTTCCGTTGACGAAGTTCACCGCATCCAGAAAGCGGGC +GTAAACCTTACGCCGGACCACCGTTCCGCCGACCAGACTCTGCAGATCTTCCGCCATCCC +GGTGATCATGCCGTGCAGGTTAGAGACCGTCAGTGTCGGACGGGCAGCACTGCCCTTGCC +GTTCATCTCAAATCCACTCCCCTGAATGGGATAGGCCTGATACTGCCGACTCTGCCAGGT +GACAGACTCACCTTTTTCGTTCTGCTCATTACAGAAAAAGTAGCGATCCCCGCCTACCTC +GGTCAGGTCGATTTCCCAGAGCACCACGCTGGCCGACTGCTCCGCACGAATGCATTCATT +CAGCGTTTCCTGTTGTATGTCCTGCATCAGATCACCACTTCGTCAAACTGACACGAAAAA +TCGGTATAGGTGATATGTTCTGTCGCTGACCACGTTCGACACACCACTCTGATTTTTCTG +TTAATACCCGGCGGGCGCCAAAAAAAAGATTTATAGCCTTCATGCCGGGCTAAAAATTTT +TCAAATGAATCACGTTCATTCGCCTCAACTTTGAAATCACAGGTGAAAACGCGCAGAGAA +TGATTAAGTCCATTTGGACTTCGTTGCTCATAACCATCGCCAAATCTTACAGTTTTTATC +GATGGTTTATTTTCTGTTTTCATTCCATCCTCTGGTAACCAGTGAAATTCTTCCGTATTA +GCCACTTAACATTCCCCCATCACGTCGCATATTTAACAGATTGCCCTGCACCCGCTGATC +AACCATCCCCATAAGTGCTTTTATTGCCTGAGGGCCAATCTCTCCATTCTGGCCGTCATT +TTGAATAGTGATTTGGTATACAGGGGCATAGGTAATATCTCCGCCTCCATTACCACTTTT +ACTATTAATAGCTCTGACACCAAGAGAACCATCGGAAGTTCGTGTTAATGGCATAATGGC +TTCCGGTCCAGCCTCACCAAAAACACCAGCCCCTTTTGCAAAAGCAAAAAATTGCGGGGA +ATCATAAATACCGTTCGAATACGTGCTCAATGACGGAGACTCATAAACACCGCCCTTTGC +ATTCGGAATAAATTTACTAATAGCACTCCCGATAGTTCCTAAAATCCCCCCAGAAGAACT +GTTACTAATGCTGTCGAAAATCCCAGTAATTGAAGCCTTTAATGCTATTCGACTAAGATC +CGAAATCACGGAAGTAGCGAAAGAACGAAAATTTGCCTTGCCTGTCGTGACAAAATCACC +CAGCGCATCGGTCATCCCATCAAACATCTGAGTCGTGGTTGATTTTATCTGCTCACTGAT +ATCCTTAGTGTCATCCAGCCAGTTATTGAATCCCTGGGAGGCACCACTAACCCAGTCTCC +TGCCTGAATATCGAGCTGCTCGTTTTTCTGTCTGACAATTTCTTTTTCCCGTTCCAGAGC +ATCATTCAGAGCCTGCATTTTCTCTTGAAAAACATGATCTGACATTCCACGGGATTTATC +TGCATAGTCACGTTCAAGTTGCAGACGCTGATTGTTATATCCATGTTCAATCCGCAGTAA 
+TTCCTGCTGGCGTTGCTGATTTTTATCGCCAACCCCATAACCAGCAATCTGAATATCATA +CCCCTGCTGACGATTATCAATCGAAGCCTGCAATGAATCACGCCATGCTGTTATTTCGGC +>test_runprokka_H299.0002 7080 +AGCAGCACGCTTTTTAATCCATCCACCGGACCTTCAACCGGCCCTTCGCTGATGGCATCG +ATCACACTCAGCAGCTGCGTGGACTTCAGGTTGTCCTTCGCTTCGCGCGGGGTATGCCCC +TTACTGCTGCCTTTACCCATTCGTCATGCTCCATAAACGATAAAACCGCCCGGAGGCGGT +TTCACATAAAACGTTTTTCATCAGCGACCAATCACCACAACCTGACCACCATCACCTTCA +TCTGCTGTGCTGATCTCCTGAGATACCACACGTGATCCCACGCGCATTTCACCGTACAGA +ACGGGCAGAACATTGCCCTGGGCAACCATATTATCCAGTGAAGAAAAATAGGTGTTCTGT +TTGCCGTTATCCGTTGTCTGTGTGCTGGGGGTTTTGGGTTTAGGGGCCAGCATCTGTGCA +ACACCGCCAAGCGTCATACTGGCACCGAGAGAAAACAGCAGATTACTCGCCATAATTCCT +ACCCCCGGCATCCATATAGCAACCGCCATAACAGCCGCCCCCAGCACAGCCTGAAACACA +CCGCCACTTTTGGCTCCTGCCAGACGCGGCACGATATGGATCACAGCACCATTTGCCAGC +GGTTCATTAAGACGGGCTGATAATTCCGTTTCACCTGTATCACGCCCGGCAATCCGTACC +TGATACCAGCCGTCGCTCAGTTTCTGACGAAACGCCGGGAGCTGTGTGGCCAGCGCCCGG +ATGGCTTCAGCCCCCGTTTTCACACGAAGGTCGATGCGGCGACCAAATCGTTGTAAATCC +CCGTAAAGGCAGATGCGCGCCATGCCCGGTGACGCCAGAGGGAGTGTGTGCGTCGCTGCC +ATTTGTCGGTATACCTCTCTCGTTTGCTCAGTTGTTCAGGAATATGGTGCAGCAGCTCGC +CATCACCACAGTAAATGGCGGCATGATTCGGCACCGATGAACCAAAACAGCACAGCAGCA +CATCGCCCGGTTGTGCTGATGACAACGGCACCTGATACAACCCTGTGGCCTCCAGATTAT +CCAGATAGAGATTCTGACCGTGACGCCACCAGTCATCCTCGCGATGAAAATCCGGCATCT +CAATCCCCGCCAGATGATAAGCATCCCGGAACAGCGTGTAACAGTCCGTCACCCCGTGCT +CAAAGCGCCGCCCGGTGAGATGCGGCACACAGCGGAACTTATGAATCGTCCCCCGGCAGA +CCAGCCACCACGGCAAATCACTCTGCACCTGCAGCCGCCGGTCGGCCTCACTCAGCCAGG +GCAGACCACCGGGGTGGCTGTGGACCAGCGCCACAATCTCACCCTGCATCTCTGCCCGCA +GCCAGTCCTCCGGCGACATCCGGAAATACGCCTCCGGCTCACCGGAGATATTCACGCAGG +GGAAATATCTTTCCCCTTCCGGCGTTCTCACCACGAAGCCGCACGACTCCGCTGGCGCAC +ATCGCCGGGCGTGCGCCAGAATCGCTGATTCTGTCTCTGTCATGGGATTCACTGCGAAAG +TTTGTTAATGGAAAGGAAGCCGCCAAAGTTGCCGACGTTATTGCGAAACTTACAGCCATT +CAGGCATTTGCTGCATTTATCCTTCGTGATATCGGACGTCGGCTGATCATATTCATCCGC +GACAGCCGGACCGTGATAACCGCACTCATCACCGCGATAGGTCCAGGTGCAGGTATTAGC +CAGCATGATGCGCCCCGGAAAAACGGCACCATCCGTTTCCGTCGGCGTGGACAGTACAAA 
+GGAGGCACTGACCGCGCTCAGTTCGCTGCACTGCTCGATGCGCCAGCGGCTGATCACCTC +CTGCTCCGGATCGGCGTCGCTGTTTCCGTTGACGAAGTTCACCGCATCCAGAAAACGGGC +GTAAACCTTACGCCGGACCACCGTTCCGCCGACCAGACTCTGCATATCTTCCGCCATCCC +GGTGACCATACCGTACAGGTTAGAAACCGTCAGCGTGGGGCGTGTACTGGTGCCTTTGCC +ATTCAGTTCAAAACCGCTCCCCTGAATGGGATACGGCTGATACTGTCGCCCCTGCCAGGT +GACCGGCTCACCTTTTTCGTTCTGCTCATTACAGAAAAAATAACGTTCTCCACCGACCTC +TGTCAGGTCGATTTCCCAGAGCACCACGCTGGCCGACTGCTCCGCACGGGTGCATTCATT +CAGTGTTTCCTGCCGGATATCCTGCATCAGTTCACCACCTGTTCAAACTCTGCGCTGAAC +TCAACACGCAGCATACTGACCCGCGACGACCATTTTGCGCAGGTCACCTTTATCTGCCGC +CACTCATAAGGCGGCGTCCACAGAAAGGCTTTCCAGCCCCCGTGCTCTTCCAGAAACGAC +TCCAGTACCGTGGCCTCCCAACGGGGGACAGAAAGCGTCACGCTGTACGTTTTCAGGTTG +GCATTCAGCCCGGCAGGCGCTCGCTGGGAATAGCCATCACCAAAGCGCACCTTTCTTACA +GAAGGGGCCGAAGCCACATCCATACCGGGTTTCACTTTCCAGCGGAAGGTTTTCATCGTC +CACCTCCGGAGAACAGGCCACCATCGCGCATCTGCCCGGTCACAACATCCATTGCCGCCT +TACGGGCTACGTCATAAACAGCCTTCAGCGCCTGTGGCCCTATCTGCCCGTTCGTGCCGT +CGTTGTTAATCACCACATGGTTATTCTGCTCAAACGTCCCGGACGCCTGCGACCGGCTGT +CTGCCATGCTGCCCGGTGTACCGACATAACCGCCGGTGGCATAGCCGCGCATCAGCCGGT +AAAGATTCCCCACGCCAATCCGGCTGGTTGCCTCCTTCGTGAAGACAAACTCACCACGGT +GAACAATCCCCGCTGGCTCATATTTGCCGCCGGTTCCCGTAAATCCCCCAGTCGCAAAAT +GGAATTTCGCCGCAGCGGCCTGAATGGCTGTACCGCCTGACGCGGATGCGCCGCCACCAA +CAGCCCCGCCAATGGCGCTGCCGATACTCCCGACAATCCCCACCATTGCCTGCTTAAGCA +GAATTTCTGTCATCATGGACAGCACGGAACGGGTGAAGCTGCGCCAGTTCTGCTCACTGC +CGGTCAGCATCGCCGCCATATTCTGTGCAATACCATCAAAGGTCTGCGTGGCTGCACTTT +TTACCTGCGACATACTGTCCGTGGCGCTCTCTTCCCACTCACTCCAGCCGGACTTCAGGC +CTGCCATCCAGCTCCCGCGAAGCTGGTCTTCAGCCGCCCAGGTCTTTTTCTGCTCTGACA +TGACGTTATTCAGCGCCAGCGGATTATCGCCATACCGTTCCTTCAGGCGCTGTTCCGTGG +CTTCCCGTTCTGCCTGCCGGTCAGTCAGCCCCCGGCTTTTCGCATCAATGGCGGCCCGTT +TTGCCCGTTGCTGCTGTGCGAATTTATCCGCCTGCTGCGCCAGCGCGTTCAGGCGCTCCT +GATACGTAACCTTGTCGCCAAGTGCAGCCAGCTGGCGTTTGTACTCCAGCGTCTCATCTT +TATGCGCCAGCAGGGATTTCTCCTGTGCGGACAGCTGGCGACGTTGTGCCGCCTCCTCCA +GTACCGCGAACTGACTTTCTGCCTTCCACAAATCCCGGCGCTGCTGGCTGATTTTCTCAT +TCGCTCCGGCATGCTTCTCCAGCGTCCGGAGTTCTGCCTGAAGCGTCAGCAGGGCAGCAT 
+GAGCACTGTCTTCCTGACGATCGCCCGCAGACACCTTCACGCCGGACTGTTTCGGCTTTT +TCAGCGTCGCTTCATAATCCTTTTTCGCCGCCGCCATCAGCGTGTTGTAATCTGCCTGCA +GGATTTTCCCGTCTTTCAGTGCCTTGTTCAGTTCTTCCTGACGGGCGGTATATTTCTCCA +GCGGCGTCTGCAGGCGTTCGTAAGCCTTCTGCGCCTCTTCGGTATATTTCAGCCGTGATG +CCTCAGACTCGGCCCAGTCCTTTGCTGCCATCTCTCTGGCCTTTTCAAGATCGGCCTGCA +ACGTGGCGGCGGAAAGCCCAAGTTGCGCATTCGCTCTGTCCTCCCATGCTCCCCGGAGAT +TGGCAAGAAATGCTGAGGTTTTACCGCGCCGGTGGCTCCGGCTCTGATACCACTGCCATT +TTTTGTCCGCCTCATCAAAAGCCTTTTCTGCTTTCTCCAGCATTCCCTGGGCAGTGTCCG +GGCGACCAATATCCAGCACCGAATCCCACATGGATTTGAATGCCCGTGCTGTCCTGTCTG +CCCAGGTCTCCAGCGTGCCCATGTTCTCTTTCAGGCGTCGGGTCTGGTCATCAAACCCTT +TCGTTGCGGCCTCGTTCGCCGCCTGCAATGCCCCGGCTTCATCGCCGGAACGCTGCAACT +GAGCAACATACGCAATCTGTTCCGCCGTCACGTTATGGAACTGGCGTGCCATCGCCGTCA +ACCCCGACGTCGGGTCTGTGGTCAGCTTCCCGAAGGCTTCAGCGACCTTGTCCACCTCCA +CACCGGATGCAGAGGAGAAACGCGCCACACTCTGGCTGATCGCCTCAAACTGCTCACCAC +CACGCACACCGGCATTCACCAGCGCCGTCAGTGACTCGCTGGTCTGGTTAAACGTCAGCC +CTGCCGCCTGCCCGGCTCTGGACAGGACCAGCATACGATCTGCCGTCAGTCCCGCCTGAT +TGCCGGAAAGGACCAGCGTTTTGTTGAAATCGGACAGGGTTGAGTTACCCTGATACCAGG +CATACGCCAGCGCACCGGTCGCCACCGCCAGCGAGGTGGCCCCCACCATCGGCAGGGTGA +TCGCACCGGCAAGCCCCCTGAACATGGGGATCATCCCGCCGAAGGAGTCCTTCACCTGAC +CACCCTGTTGCAGCAGGATCAGCCACGGACTCTGCCCGCCTGCAAGCTGCGTGGCCACGT +CGGTGAACTGCGCAGGCAGCATACGCATGGCGGCTTTATACTGCCCGACGGAAATCCCCG +CTTTCTGTGCAGCCAGCGCCTGCCGGCTCATCGACTGTTCAACGACTGCCGCTGTTTTTT +TCGCATCACTTTCCGTACCGGAAAAATGACGCCTGACTCTGGCCATCTGCTCGTCAAATC +TGGCCGCATCCAGACTCAAATCAACGACCAGATCGCCTACCGGTTCAGCCATACCGGACT +CCTCCTGCGATCCCTTCTGATACTGTCATCAGCATTACGTCATCCTCCGTCATGTCCGCC +ACATCCGGGGAAGCGGGGATAACTTCATTCCCGTCCGGGCCAAAACGAACGCCTCCGGCA +AGCCCTGCCGCTTTCTGCATCAGCACATCATCTTCAGGCTCTTCGTCAGCCTCACGCCGG +TTCAGCAGACTGAAATCCAGCGGATGCATATCCGGATCGCTGAAAAACAGGCTGAGCACG +GTGTACGTCAGCCCGGAAAAGTGCATATCCAGCAGAACATCATGAAAATAATGGGTACTG +TAAAAGCGGTGCCAGTCGGCATACTCCGTGGATGACATCCCGGCAAGCATGGCGCGCCAG +TCGGGTCGCCCCATTTCACGCGCCAGTTTCAGGGCAAAACTCAGCTCACCGTCGAACACT +TTCCCGCAGAAACAGGCTCTGCAGGCCCGGCATCATCTGCCTGTTCAGGGGCATTATTCA 
+CAACAAACTCAGACATTCCGGACAGACGTAACACCACGTTTTCAGCCTGAGCAATTGCCT +CCGTGGGCCAGGTGGTAAGCACTTCCTGCTCAATCTGTTTAACGGCTTCATTCATGGACG +GCAGCTTTGTCTTCTGCGGATGGTTATGCCACAGAGACATCGCCACCAGAAACGCCCCGC +CTCTGATAAGATCCTCTACAGACACCTGCAGGTTGCCACTGGATTCAGCCTTTTTTTCCT +GCTCTTTCAACCAGGCAAGATGCTCAATACGCTGCAGGGCTGACAGTTCAGAAAGCGTGA +CGGTCACACCGTTATGTTCAAATGATTCGGTTTTCAGGAACATCGCTGACTCTCCGGATT +AGCTGTTGGTGACGTTGATTTCTGCAACCGCAGCAAGTTCACCATTACCGGATACGACCG +GAATGTTGACCTTGCCTGCAGCAACACCTTTCACGGTGATGGTCATACCACTGACCGACA +CGGTGGCTTTTGTTTTATCCGCAGACACCGCACGGAAGCTCTTGTCGGTTGCGCCTTCCG +GCTGGAATGCCACGGTCAGCGTGGTGCTCCGCCCTTTCACCACCGAAGTGCTGGCAGGCG +TCACGGTCATGCCGGTTGCCGCTGTGACCGTGCTGCGATCTTCTGCCATCGACGGACGTC +CCACGTTGGTGACTTTCACCGTGCGGGTGATCACTTCCTTCGCCGTCACCGCCTTACCGA +TACTGCTGACCCAGCCGCGGAACACATCGACCGTGCCGTTCGGGAAGCGGATTTTATAGG +CACGGGTATCCCCTTCATTAAACCACGCCAGCAGCGCCTGCTGCCCCTGCTCTCCGGGCA +TCCACGCCAGCGTGAAGCTGGTATCTCCGGCAGATTTCTGCCCCTGCCCGGTCGCAGCCC +AGTCCGCATCTTCATCATCGAGATAGCTGTCGTCATAGGACTCAGCGGTCAGTTCGCCGG +GCGTCAGGTCTTTAACTTTAGCCAGACGCGACCAGTCAACGTCTGAAAGCGGGTTCGCAT +AAGGGTCACCGCTCCCCTTATAAACCAACAGGGTGGTCCCGGCACCTTTCACCGGCATTG +TAGGATTTGGTACAGGCATAGCGTCCTCACATTTCATAGGTAATGACATACGTCAGATCG +GCTGAACTCCACAGGCCCGCATCATCGTCGCGCCGGTAGTCATAGCCACTGGCCACCATA +CTGGTGATCAAATCTGACAGCGCCGGGATATCGCTCATCACCGGATAAATCCGGGACTCC +ATCCACGAATCCAGCTCTGAATCCGGCACCTGAGCAGGCAGGAAAACTTCAATATGCAGC +TCTGCCTGCCAGGTATCGCTGTCCAGCTCTTCGCCCGTGTATTCAGCGCCGGTGAGATAA +ACGGCAATTGCCGGAAAATCTTCCTCATCAAAAACAGCGGGGCGACCATCAAAAAGCGTC +GCCCCGGTGTCATGCTTCTCCAGTGCATCCAGTACGGCTGCACGGAGTTCAGTATGTTTC +>test_runprokka_H299.0003 2583 +ATCATACAGTCATTTGTTAATATCTGTCTGACAAGGTACCAAGCAGAAAATAGGGTTAAG +ATATTTGTAGCCATAAATATCATATATACGTTAGCCTATTTTTTTGGGGTTTTATATTCC +TTATTTATAGATCACTGGGATAATGTTTGGAAAAATATTATTTTGTTTTATGTGCTTACA +ACAATAACAATGTTTTTCTTCTATTTTATACGAAAAGGGAAGGTTGTTAAGCTATTTTTC +TTTCATTATATCTCAAAAAATAAAGTTTACGAAACTTTTATTTTTGGCCTTTACCAGCTC +CCTCATGTTTTAAGCTCTTGGGTAAGGCTTGGATATGATAGACTGGTATTGGGGGAACTA 
+ATATCAATGAGCTATGTTGGCGGATATTCGGTTGCAGTTCAAATATCTCTTGTGTCTAGC +GTGATATTTCAATCATTAAATAGGTTTTGGACCCCTTTCTTTATTAAAAAATTAAAGGAG +AATAGTAAACAAAAAAAAATTATTGTTCTTGGAGGTTTTGGAATTATCTGCATAACAATA +CTTAATATACTATTTGGTTACGCATATTTTATTTTTTTCTTGCCCACAAATTATTCATCA +TTCTCCAATGCTCTTCCTATATTATGTATGGCATATATGTTTCAGGGGCTATATTTTTTG +ATTGTTAATTATATATATTATCATGATGGTAATAAATTGATATCAATTCCATCCGTTGCC +TCGATCGCTATACATATAGCTGTTGCCCCAGTTTTGATAAAACATATGGGATATTATGGA +GCTGCAATTTCCTTATTGATTAGTTGGATAGTTCTTTTTTTATTTACATGCGTCATTATA +TTTTATGTTAGAAGGGGGTATCGTGGGTAATATATTTATTGTTGAGTCTCCGTTTCAGCT +TTCAAATGCTTTACTTTATCATAAAAAAAATGATAGTGTTATTGTCAGGCTCAACGGAGA +AAATAAAAATGATTTTCAAATTGAAAAAATGTTATCGTCGTTTAATGGCAAGGTATATAT +AAAAAAAGCATCAAAAGAATCGAAATTCGATTTGATTAGATTTGTTTTATTTTTTGCCGT +CCCTGTATTGATTGCTAATTTAAATAAAAAAGTAATTATTGGGAATTATAATTCATTGTG +GATGAGAGTCATGGGATATTTGTTTAACCCATTTCATTTTGCCGTCCTTGATGATGGGTT +GATTACTATACGAACAATAAAAAGGTTGGATGATAATATATCGCGTTCTGGATCAATTAA +GAAACGGTTTTTATTACTGCTGGCACCAAGATTTATAACGCAATATAAGATATATTCCAA +CTTTATTCAGATATACAACCAAGAGATCAATAAGAGAAAAAGAACTACCCGAGCCATTAA +GGCAGGGCGAGTTTGTTTTATTGGCTCTCCATTATTTGACAAAAATGTTCTCACATTTGA +TTTCTATGTAAAGTGCTTGGCTGCGATAAGTGATAACCTTAAGCGTTGTGGATATAGCAT +TGAGTATTACCCTCATCGCTCAGAAAAAAACATCTCATATTTAAATGTTTTTTTTGACGA +TGTAATAAAATCAGATGATAGCATTGAAGTCTATTATTCAGCCAGTAATGAGTTGCCAGA +AATATTTGTATCATTTTATTCATCGGCCCTTTTAAATTTGAGAAGTGATTATCCAGAGTG +TAAATTTATATCTTATAAGTTAGATTGTAATGAAATCAATGGTAAGTTTAGGTATGAAAT +AATGGAGGCATATAACTTTTTGGCATTCTCTGGTATTGAGGTTGTAACTATATAGGAAAA +TAAGATAGAAAAGGGATATTGTTGGAGTCAATATAGAACAGAAATTATAGTCTAAACTAA +TTAATCACTATGAAGGTCTATGTAATTAAATGTTAACATATTCTGTCGTTAACTGGAAAG +CAAAATTATTATATTTCATTCTTTTTCTGAGTTTCCTTAATGCTGTTTTGAGGTTATCAG +AGGATGGATTGTCGATTTATCGATTATTTATCCCTTTGCAAATATTTTTAATTTATACAT +TAAGTGTCACCGAGTTCAAAAAGTTTATCGTAATTCTACTACTTTTATTATTGTTTGGTG +CTACTGGATGTATGATATCCACTTATTCTCTTAATGAGAATAATCTTGTATTTCTAATAC +ATTACTCTATACTTATACTCACTTTTTTCTCTTCTTCTGTGTTGATATCTATTACTGGTG +AAACTTGTTTTTACAAATTCACCGCGTTCTTTTTTGGTTTTTTAATTGTTACTGGTATTA 
+TGGATTTGTTTGGTGTTACATTTCCTAATATAGAACATATACCAGACGCTATACGAGGAA +TACATAGAATAGAGAATGATTATTCACTTGCGCTGGTTTCGTTTGTTTTTGTTGTGTTTT +CCATCTCTAGGAAAAAAATAACTGCTTCAATCCTTACTTTTTTTACGTCTGCGATTTGTT +TTTATAATGACTCTAAAGTTGCATTACTTTTTGTCGTTGCTGGTTATTTTTGTTTTATAT +TTAAAAATATAAGGTTTAGACAAAAGGAATTCAGGTGGATATTATTTCTTTTTGTCATAA +TGC diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test.0417.00002.gff b/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test.0417.00002.gff new file mode 100644 index 0000000000000000000000000000000000000000..1529acfc565707d29e3a7751e2bb78a9509401d4 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test.0417.00002.gff @@ -0,0 +1,105 @@ +##gff-version 3 +##sequence-region test.0417.00002.0001 1 9603 +##sequence-region test.0417.00002.0002 1 22446 +##sequence-region test.0417.00002.0003 1 51012 +##sequence-region test.0417.00002.0004 1 31459 +##sequence-region test.0417.00002.0005 1 6009 +test.0417.00002.0001 Prodigal_v2.6.3 CDS 287 787 74.7 + 0 ID=test.0417.00002.0001b_00001;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.447;conf=100.00;score=74.71;cscore=55.73;sscore=18.98;rscore=11.74;uscore=3.46;tscore=3.78; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 846 2384 201.9 + 0 ID=test.0417.00002.0001i_00002;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.511;conf=99.99;score=201.85;cscore=183.11;sscore=18.74;rscore=10.97;uscore=3.99;tscore=3.78; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 2404 3741 183.3 + 0 ID=test.0417.00002.0001i_00003;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.594;conf=99.99;score=183.29;cscore=176.07;sscore=7.22;rscore=3.07;uscore=-0.69;tscore=3.78; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 3738 4403 99.5 + 0 ID=test.0417.00002.0001i_00004;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.590;conf=100.00;score=99.49;cscore=92.74;sscore=6.75;rscore=-7.85;uscore=1.68;tscore=3.78; 
+test.0417.00002.0001 Prodigal_v2.6.3 CDS 4416 6068 155.5 + 0 ID=test.0417.00002.0001i_00005;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.614;conf=100.00;score=155.52;cscore=148.73;sscore=6.79;rscore=11.74;uscore=-0.97;tscore=-5.12; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 6126 6617 71.5 + 0 ID=test.0417.00002.0001i_00006;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.514;conf=100.00;score=71.54;cscore=51.54;sscore=20.00;rscore=16.41;uscore=-0.84;tscore=3.78; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 6808 9444 460.8 + 0 ID=test.0417.00002.0001i_00007;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.603;conf=99.99;score=460.82;cscore=447.08;sscore=13.74;rscore=10.97;uscore=-0.35;tscore=3.78; +test.0417.00002.0001 Prodigal_v2.6.3 CDS 9456 9602 25.8 + 0 ID=test.0417.00002.0001b_00008;partial=01;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531;conf=99.73;score=25.79;cscore=9.58;sscore=16.21;rscore=11.74;uscore=-0.45;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 2 1237 117.8 + 0 ID=test.0417.00002.0002b_00009;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.468;conf=100.00;score=117.78;cscore=114.56;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 1279 2346 121.8 + 0 ID=test.0417.00002.0002i_00010;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.547;conf=100.00;score=121.76;cscore=94.14;sscore=27.63;rscore=16.41;uscore=6.61;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 2419 2799 43.1 + 0 ID=test.0417.00002.0002i_00011;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.357;conf=100.00;score=43.08;cscore=18.83;sscore=24.25;rscore=16.41;uscore=4.06;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 3130 3393 18.9 + 0 
ID=test.0417.00002.0002i_00012;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424;conf=98.73;score=18.94;cscore=1.36;sscore=17.57;rscore=11.74;uscore=2.71;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 3399 4538 75.7 + 0 ID=test.0417.00002.0002i_00013;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.359;conf=100.00;score=75.70;cscore=65.66;sscore=10.04;rscore=3.05;uscore=2.00;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 4535 7888 489.9 + 0 ID=test.0417.00002.0002i_00014;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.592;conf=99.99;score=489.87;cscore=467.39;sscore=22.48;rscore=11.74;uscore=5.68;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 7854 9491 253.5 + 0 ID=test.0417.00002.0002i_00015;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.620;conf=99.99;score=253.49;cscore=237.24;sscore=16.25;rscore=16.41;uscore=-3.94;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 9525 11285 265.8 + 0 ID=test.0417.00002.0002i_00016;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.580;conf=99.99;score=265.85;cscore=245.51;sscore=20.33;rscore=10.97;uscore=4.68;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 11249 12328 117.6 + 0 ID=test.0417.00002.0002i_00017;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=11-12bp;gc_cont=0.591;conf=100.00;score=117.64;cscore=119.16;sscore=-1.52;rscore=-4.46;uscore=-0.83;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 12309 12845 91.7 + 0 ID=test.0417.00002.0002i_00018;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.508;conf=100.00;score=91.73;cscore=72.96;sscore=18.77;rscore=11.74;uscore=3.26;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 12849 13277 62.2 + 0 
ID=test.0417.00002.0002i_00019;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.534;conf=100.00;score=62.20;cscore=50.13;sscore=12.07;rscore=10.97;uscore=-3.91;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 13277 14653 164.8 + 0 ID=test.0417.00002.0002i_00020;partial=00;start_type=ATG;rbs_motif=AGGAG/GGAGG;rbs_spacer=11-12bp;gc_cont=0.548;conf=100.00;score=164.84;cscore=146.97;sscore=17.86;rscore=9.87;uscore=2.93;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 14955 15902 78.5 - 0 ID=test.0417.00002.0002i_00021;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.444;conf=100.00;score=78.46;cscore=70.44;sscore=8.03;rscore=3.05;uscore=1.21;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 15974 16570 75.3 - 0 ID=test.0417.00002.0002i_00022;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.424;conf=100.00;score=75.28;cscore=50.53;sscore=24.75;rscore=11.74;uscore=7.99;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 16573 17748 86.1 - 0 ID=test.0417.00002.0002i_00023;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.378;conf=100.00;score=86.08;cscore=74.74;sscore=11.34;rscore=3.05;uscore=3.23;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 17748 19328 203.7 - 0 ID=test.0417.00002.0002i_00024;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.441;conf=99.99;score=203.65;cscore=190.82;sscore=12.83;rscore=3.05;uscore=5.07;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 19360 20184 84.5 - 0 ID=test.0417.00002.0002i_00025;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.336;conf=100.00;score=84.53;cscore=69.29;sscore=15.24;rscore=11.74;uscore=0.38;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 20442 21695 164.1 - 0 
ID=test.0417.00002.0002i_00026;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.538;conf=100.00;score=164.07;cscore=156.88;sscore=7.19;rscore=3.05;uscore=1.02;tscore=3.78; +test.0417.00002.0002 Prodigal_v2.6.3 CDS 21927 22445 72.6 + 0 ID=test.0417.00002.0002b_00027;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.526;conf=100.00;score=72.59;cscore=60.60;sscore=11.99;rscore=11.74;uscore=5.37;tscore=-5.12; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 3 812 115.2 + 0 ID=test.0417.00002.0003b_00028;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.520;conf=100.00;score=115.22;cscore=112.00;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 874 2700 231.4 - 0 ID=test.0417.00002.0003i_00029;partial=00;start_type=ATG;rbs_motif=AGGAGG;rbs_spacer=3-4bp;gc_cont=0.549;conf=99.99;score=231.42;cscore=206.60;sscore=24.83;rscore=17.40;uscore=2.37;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 2700 6242 545.6 - 0 ID=test.0417.00002.0003i_00030;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.544;conf=99.99;score=545.58;cscore=539.18;sscore=6.40;rscore=3.05;uscore=-1.67;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 6235 9123 425.3 - 0 ID=test.0417.00002.0003i_00031;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.510;conf=99.99;score=425.32;cscore=406.23;sscore=19.09;rscore=11.74;uscore=3.58;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 9299 12667 478.5 - 0 ID=test.0417.00002.0003i_00032;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.535;conf=99.99;score=478.50;cscore=456.96;sscore=21.54;rscore=16.41;uscore=0.20;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 12680 13003 15.4 - 0 
ID=test.0417.00002.0003i_00033;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.543;conf=97.20;score=15.42;cscore=0.02;sscore=15.40;rscore=11.74;uscore=-1.28;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 12988 13395 39.6 - 0 ID=test.0417.00002.0003i_00034;partial=00;start_type=GTG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.527;conf=99.99;score=39.62;cscore=25.80;sscore=13.81;rscore=16.41;uscore=1.22;tscore=-5.12; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 13392 13955 82.2 - 0 ID=test.0417.00002.0003i_00035;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.532;conf=100.00;score=82.15;cscore=67.70;sscore=14.45;rscore=16.41;uscore=-6.97;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 13946 14449 19.0 - 0 ID=test.0417.00002.0003i_00036;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.544;conf=98.75;score=19.02;cscore=25.85;sscore=-6.83;rscore=-7.85;uscore=-2.11;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 14634 15428 116.3 - 0 ID=test.0417.00002.0003i_00037;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.516;conf=100.00;score=116.29;cscore=110.07;sscore=6.22;rscore=3.05;uscore=-1.81;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 15435 16310 123.2 - 0 ID=test.0417.00002.0003i_00038;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.525;conf=100.00;score=123.17;cscore=124.01;sscore=-0.84;rscore=-7.85;uscore=3.23;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 16461 18707 329.5 - 0 ID=test.0417.00002.0003i_00039;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.536;conf=99.99;score=329.51;cscore=328.26;sscore=1.25;rscore=-7.85;uscore=4.18;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 18720 19250 21.4 - 0 ID=test.0417.00002.0003i_00040;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.493;conf=99.28;score=21.44;cscore=11.52;sscore=9.93;rscore=11.74;uscore=3.96;tscore=-5.12; 
+test.0417.00002.0003 Prodigal_v2.6.3 CDS 19695 19856 0.8 + 0 ID=test.0417.00002.0003i_00041;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.395;conf=54.65;score=0.81;cscore=-1.33;sscore=2.14;rscore=1.94;uscore=-1.70;tscore=2.40; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 19935 20624 78.6 + 0 ID=test.0417.00002.0003i_00042;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539;conf=100.00;score=78.61;cscore=70.83;sscore=7.78;rscore=3.05;uscore=0.95;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 20693 21406 109.2 + 0 ID=test.0417.00002.0003i_00043;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.503;conf=100.00;score=109.25;cscore=99.93;sscore=9.32;rscore=3.05;uscore=2.49;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 21544 21762 30.5 + 0 ID=test.0417.00002.0003i_00044;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.434;conf=99.91;score=30.51;cscore=17.61;sscore=12.90;rscore=10.14;uscore=-0.50;tscore=3.26; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 21870 22910 145.1 + 0 ID=test.0417.00002.0003i_00045;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.544;conf=100.00;score=145.07;cscore=124.82;sscore=20.26;rscore=10.97;uscore=5.52;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 22942 24135 159.5 - 0 ID=test.0417.00002.0003i_00046;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.553;conf=100.00;score=159.48;cscore=151.46;sscore=8.03;rscore=3.05;uscore=-0.05;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 24128 26287 327.5 - 0 ID=test.0417.00002.0003i_00047;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.522;conf=99.99;score=327.54;cscore=311.41;sscore=16.12;rscore=11.74;uscore=1.26;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 26873 27904 140.4 + 0 
ID=test.0417.00002.0003i_00048;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.529;conf=100.00;score=140.40;cscore=133.05;sscore=7.35;rscore=3.05;uscore=0.52;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 27911 29173 190.3 - 0 ID=test.0417.00002.0003i_00049;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525;conf=99.99;score=190.33;cscore=170.13;sscore=20.19;rscore=11.74;uscore=5.33;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 29295 30230 108.2 + 0 ID=test.0417.00002.0003i_00050;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.533;conf=100.00;score=108.23;cscore=100.48;sscore=7.75;rscore=3.05;uscore=0.92;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 30217 30909 102.7 - 0 ID=test.0417.00002.0003i_00051;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.506;conf=100.00;score=102.70;cscore=80.53;sscore=22.17;rscore=16.41;uscore=1.98;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 31038 32456 180.5 - 0 ID=test.0417.00002.0003i_00052;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.517;conf=99.99;score=180.47;cscore=168.51;sscore=11.95;rscore=3.05;uscore=5.78;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 32771 33532 108.0 - 0 ID=test.0417.00002.0003i_00053;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.521;conf=100.00;score=108.00;cscore=97.36;sscore=10.64;rscore=3.05;uscore=2.86;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 33562 34398 81.6 - 0 ID=test.0417.00002.0003i_00054;partial=00;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.495;conf=100.00;score=81.59;cscore=74.05;sscore=7.53;rscore=11.74;uscore=1.57;tscore=-5.12; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 34685 35866 141.4 - 0 
ID=test.0417.00002.0003i_00055;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531;conf=100.00;score=141.44;cscore=122.29;sscore=19.15;rscore=11.74;uscore=4.29;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 36121 37350 91.5 + 0 ID=test.0417.00002.0003i_00056;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.445;conf=100.00;score=91.51;cscore=88.23;sscore=3.28;rscore=-7.85;uscore=7.35;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 37507 37758 3.1 - 0 ID=test.0417.00002.0003i_00057;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.409;conf=66.99;score=3.08;cscore=-1.58;sscore=4.66;rscore=3.03;uscore=-1.63;tscore=3.76; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 37818 38168 23.0 - 0 ID=test.0417.00002.0003i_00058;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501;conf=99.50;score=22.99;cscore=17.53;sscore=5.46;rscore=3.05;uscore=-0.71;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 38987 41284 296.5 + 0 ID=test.0417.00002.0003i_00059;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529;conf=99.99;score=296.51;cscore=273.51;sscore=23.00;rscore=11.74;uscore=7.49;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 41295 42173 95.6 + 0 ID=test.0417.00002.0003i_00060;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.538;conf=100.00;score=95.62;cscore=77.05;sscore=18.58;rscore=11.74;uscore=1.90;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 42170 42649 39.7 + 0 ID=test.0417.00002.0003i_00061;partial=00;start_type=ATG;rbs_motif=GGxGG;rbs_spacer=5-10bp;gc_cont=0.512;conf=99.99;score=39.67;cscore=31.53;sscore=8.14;rscore=3.07;uscore=-0.55;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 42689 44467 193.4 - 0 
ID=test.0417.00002.0003i_00062;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.459;conf=99.99;score=193.36;cscore=186.19;sscore=7.18;rscore=3.05;uscore=1.01;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 44946 46133 205.5 + 0 ID=test.0417.00002.0003i_00063;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506;conf=99.99;score=205.51;cscore=195.16;sscore=10.35;rscore=3.05;uscore=3.53;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 46191 47387 171.5 + 0 ID=test.0417.00002.0003i_00064;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.531;conf=100.00;score=171.46;cscore=157.55;sscore=13.91;rscore=10.97;uscore=-1.48;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 47445 48656 208.4 + 0 ID=test.0417.00002.0003i_00065;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.507;conf=99.99;score=208.43;cscore=189.99;sscore=18.43;rscore=11.74;uscore=2.27;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 48709 50094 166.6 + 0 ID=test.0417.00002.0003i_00066;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.524;conf=100.00;score=166.59;cscore=153.37;sscore=13.22;rscore=11.74;uscore=-3.00;tscore=3.78; +test.0417.00002.0003 Prodigal_v2.6.3 CDS 50142 51011 154.4 + 0 ID=test.0417.00002.0003b_00067;partial=01;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.501;conf=100.00;score=154.44;cscore=146.98;sscore=7.46;rscore=3.05;uscore=-0.12;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 103 1728 218.8 - 0 ID=test.0417.00002.0004b_00068;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.523;conf=99.99;score=218.81;cscore=204.96;sscore=13.85;rscore=11.74;uscore=-2.43;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 1776 2255 20.3 - 0 
ID=test.0417.00002.0004i_00069;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.504;conf=99.07;score=20.30;cscore=20.50;sscore=-0.20;rscore=3.05;uscore=2.52;tscore=-5.12; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 2650 3228 33.5 + 0 ID=test.0417.00002.0004i_00070;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.430;conf=99.95;score=33.50;cscore=25.82;sscore=7.68;rscore=3.05;uscore=0.86;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 3550 6648 419.0 + 0 ID=test.0417.00002.0004i_00071;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.526;conf=99.99;score=419.01;cscore=395.71;sscore=23.31;rscore=16.41;uscore=3.77;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 6651 7979 185.2 + 0 ID=test.0417.00002.0004i_00072;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.525;conf=99.99;score=185.17;cscore=167.95;sscore=17.22;rscore=11.74;uscore=0.46;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 8030 8809 122.1 + 0 ID=test.0417.00002.0004i_00073;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.538;conf=100.00;score=122.05;cscore=108.66;sscore=13.39;rscore=10.97;uscore=-2.08;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 8806 11676 402.0 + 0 ID=test.0417.00002.0004i_00074;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.527;conf=99.99;score=402.00;cscore=385.20;sscore=16.81;rscore=11.74;uscore=-2.65;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 11841 13241 176.3 + 0 ID=test.0417.00002.0004i_00075;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.490;conf=100.00;score=176.30;cscore=152.28;sscore=24.02;rscore=16.41;uscore=3.83;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 13259 14575 197.7 + 0 
ID=test.0417.00002.0004i_00076;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.483;conf=99.99;score=197.74;cscore=175.68;sscore=22.06;rscore=16.41;uscore=0.78;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 14611 15978 180.7 + 0 ID=test.0417.00002.0004i_00077;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.531;conf=99.99;score=180.68;cscore=159.04;sscore=21.64;rscore=11.74;uscore=5.24;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 16014 16502 41.2 - 0 ID=test.0417.00002.0004i_00078;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.554;conf=99.99;score=41.17;cscore=32.25;sscore=8.92;rscore=3.05;uscore=0.81;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 16502 18421 189.2 - 0 ID=test.0417.00002.0004i_00079;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.528;conf=99.99;score=189.22;cscore=181.38;sscore=7.84;rscore=3.05;uscore=1.67;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 18857 20305 166.6 + 0 ID=test.0417.00002.0004i_00080;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.500;conf=100.00;score=166.60;cscore=145.19;sscore=21.41;rscore=16.41;uscore=1.22;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 20307 20432 10.8 + 0 ID=test.0417.00002.0004i_00081;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.357;conf=92.33;score=10.82;cscore=2.09;sscore=8.73;rscore=5.77;uscore=-0.16;tscore=1.86; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 20555 21103 63.0 + 0 ID=test.0417.00002.0004i_00082;partial=00;start_type=ATG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.506;conf=100.00;score=63.02;cscore=52.91;sscore=10.11;rscore=3.05;uscore=3.28;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 21146 22663 280.5 - 0 
ID=test.0417.00002.0004i_00083;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.529;conf=99.99;score=280.49;cscore=263.97;sscore=16.51;rscore=11.74;uscore=-0.17;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 22673 23554 107.3 - 0 ID=test.0417.00002.0004i_00084;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.533;conf=100.00;score=107.32;cscore=112.92;sscore=-5.60;rscore=-7.85;uscore=-0.87;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 23862 25595 265.1 - 0 ID=test.0417.00002.0004i_00085;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.565;conf=99.99;score=265.09;cscore=277.76;sscore=-12.67;rscore=-7.85;uscore=-0.92;tscore=-5.12; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 25601 26311 106.2 - 0 ID=test.0417.00002.0004i_00086;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.482;conf=100.00;score=106.16;cscore=90.08;sscore=16.09;rscore=10.97;uscore=0.33;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 26336 27232 124.9 - 0 ID=test.0417.00002.0004i_00087;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.530;conf=100.00;score=124.93;cscore=123.85;sscore=1.08;rscore=3.05;uscore=3.80;tscore=-5.12; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 27344 27865 100.1 + 0 ID=test.0417.00002.0004i_00088;partial=00;start_type=ATG;rbs_motif=AGxAG;rbs_spacer=5-10bp;gc_cont=0.517;conf=100.00;score=100.10;cscore=91.65;sscore=8.45;rscore=0.31;uscore=4.36;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 27905 28312 18.1 - 0 ID=test.0417.00002.0004i_00089;partial=00;start_type=GTG;rbs_motif=GGA/GAG/AGG;rbs_spacer=5-10bp;gc_cont=0.539;conf=98.48;score=18.14;cscore=24.46;sscore=-6.32;rscore=3.05;uscore=-4.25;tscore=-5.12; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 28293 28559 41.4 - 0 
ID=test.0417.00002.0004i_00090;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.491;conf=99.99;score=41.40;cscore=27.75;sscore=13.65;rscore=10.97;uscore=-0.44;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 28802 29782 160.3 + 0 ID=test.0417.00002.0004i_00091;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.539;conf=100.00;score=160.28;cscore=138.46;sscore=21.82;rscore=10.97;uscore=7.08;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 29859 30518 82.0 - 0 ID=test.0417.00002.0004i_00092;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.518;conf=100.00;score=82.01;cscore=64.74;sscore=17.27;rscore=11.74;uscore=1.76;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 30682 30993 51.1 - 0 ID=test.0417.00002.0004i_00093;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.455;conf=100.00;score=51.07;cscore=34.31;sscore=16.76;rscore=10.97;uscore=2.67;tscore=3.78; +test.0417.00002.0004 Prodigal_v2.6.3 CDS 31038 31457 69.8 + 0 ID=test.0417.00002.0004b_00094;partial=01;start_type=GTG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.500;conf=100.00;score=69.76;cscore=61.44;sscore=8.32;rscore=11.74;uscore=1.71;tscore=-5.12; +test.0417.00002.0005 Prodigal_v2.6.3 CDS 2 1012 128.5 + 0 ID=test.0417.00002.0005b_00095;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.515;conf=100.00;score=128.52;cscore=125.30;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test.0417.00002.0005 Prodigal_v2.6.3 CDS 1178 4051 498.0 - 0 ID=test.0417.00002.0005i_00096;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.554;conf=99.99;score=497.95;cscore=482.69;sscore=15.26;rscore=10.97;uscore=0.52;tscore=3.78; +test.0417.00002.0005 Prodigal_v2.6.3 CDS 4169 4558 70.2 - 0 ID=test.0417.00002.0005i_00097;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515;conf=100.00;score=70.24;cscore=54.10;sscore=16.14;rscore=11.74;uscore=-0.40;tscore=3.78; 
+test.0417.00002.0005 Prodigal_v2.6.3 CDS 4582 5745 199.4 - 0 ID=test.0417.00002.0005i_00098;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.536;conf=99.99;score=199.43;cscore=182.40;sscore=17.03;rscore=11.74;uscore=1.52;tscore=3.78; +test.0417.00002.0005 Prodigal_v2.6.3 CDS 5852 6007 5.4 - 0 ID=test.0417.00002.0005b_00099;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.231;conf=77.53;score=5.39;cscore=2.17;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; diff --git a/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test_runprokka_H299.gff b/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test_runprokka_H299.gff new file mode 100644 index 0000000000000000000000000000000000000000..dce3b0bc4a2d66000effce333ddf364d9761926f --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prodigal/gff3/test_runprokka_H299.gff @@ -0,0 +1,23 @@ +##gff-version 3 +##sequence-region test_runprokka_H299.0001 1 3480 +##sequence-region test_runprokka_H299.0002 1 7080 +##sequence-region test_runprokka_H299.0003 1 2583 +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 3 140 31.2 - 0 ID=test_runprokka_H299.0001b_00001;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.580;conf=99.92;score=31.21;cscore=19.39;sscore=11.82;rscore=11.19;uscore=-3.31;tscore=3.95; +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 201 743 46.5 - 0 ID=test_runprokka_H299.0001i_00002;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.562;conf=100.00;score=58.53;cscore=63.87;sscore=-5.34;rscore=-8.50;uscore=-2.24;tscore=-6.63; +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 740 1339 47.1 - 0 ID=test_runprokka_H299.0001i_00003;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.593;conf=100.00;score=47.14;cscore=32.42;sscore=14.72;rscore=14.84;uscore=-4.07;tscore=3.95; +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 1489 2187 74.7 - 0 
ID=test_runprokka_H299.0001i_00004;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.558;conf=100.00;score=84.47;cscore=78.63;sscore=5.84;rscore=-8.50;uscore=0.61;tscore=3.95; +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 2187 2483 13.5 - 0 ID=test_runprokka_H299.0001i_00005;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.404;conf=96.46;score=14.38;cscore=-0.78;sscore=15.17;rscore=11.19;uscore=-0.37;tscore=3.95; +test_runprokka_H299.0001 Prodigal_v2.6.3 CDS 2518 3480 73.0 - 0 ID=test_runprokka_H299.0001b_00006;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.442;conf=100.00;score=72.99;cscore=69.77;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 3 140 31.2 - 0 ID=test_runprokka_H299.0002b_00007;partial=10;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.572;conf=99.92;score=31.21;cscore=19.39;sscore=11.82;rscore=11.19;uscore=-3.31;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 201 743 37.1 - 0 ID=test_runprokka_H299.0002i_00008;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.547;conf=100.00;score=48.29;cscore=53.62;sscore=-5.34;rscore=-8.50;uscore=-1.36;tscore=-6.63; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 740 1483 38.0 - 0 ID=test_runprokka_H299.0002i_00009;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.594;conf=99.99;score=39.20;cscore=39.82;sscore=-0.63;rscore=-8.50;uscore=2.70;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 1489 2187 85.4 - 0 ID=test_runprokka_H299.0002i_00010;partial=00;start_type=ATG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.557;conf=100.00;score=86.66;cscore=77.16;sscore=9.50;rscore=3.78;uscore=0.49;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 2187 2516 31.9 - 0 
ID=test_runprokka_H299.0002i_00011;partial=00;start_type=ATG;rbs_motif=GGAGG;rbs_spacer=5-10bp;gc_cont=0.567;conf=99.98;score=36.67;cscore=18.74;sscore=17.93;rscore=12.68;uscore=-3.44;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 2513 5092 332.4 - 0 ID=test_runprokka_H299.0002i_00012;partial=00;start_type=ATG;rbs_motif=AGGAG;rbs_spacer=5-10bp;gc_cont=0.592;conf=99.99;score=333.66;cscore=315.29;sscore=18.37;rscore=14.84;uscore=-1.67;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 5085 5519 30.7 - 0 ID=test_runprokka_H299.0002i_00013;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.559;conf=99.91;score=30.69;cscore=48.16;sscore=-17.47;rscore=-8.50;uscore=-2.34;tscore=-6.63; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 5501 5923 58.7 - 0 ID=test_runprokka_H299.0002i_00014;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.515;conf=100.00;score=59.78;cscore=42.44;sscore=17.34;rscore=11.19;uscore=1.09;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 5939 6679 106.6 - 0 ID=test_runprokka_H299.0002i_00015;partial=00;start_type=ATG;rbs_motif=GGAG/GAGG;rbs_spacer=5-10bp;gc_cont=0.583;conf=100.00;score=107.81;cscore=90.18;sscore=17.62;rscore=11.19;uscore=1.29;tscore=3.95; +test_runprokka_H299.0002 Prodigal_v2.6.3 CDS 6687 7079 53.2 - 0 ID=test_runprokka_H299.0002b_00016;partial=01;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.539;conf=100.00;score=53.16;cscore=49.94;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test_runprokka_H299.0003 Prodigal_v2.6.3 CDS 1 870 40.8 + 0 ID=test_runprokka_H299.0003b_00017;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.303;conf=99.99;score=40.81;cscore=37.59;sscore=3.22;rscore=0.00;uscore=0.00;tscore=3.22; +test_runprokka_H299.0003 Prodigal_v2.6.3 CDS 863 1795 65.9 + 0 
ID=test_runprokka_H299.0003i_00018;partial=00;start_type=GTG;rbs_motif=AGxAGG/AGGxGG;rbs_spacer=5-10bp;gc_cont=0.309;conf=100.00;score=67.18;cscore=59.30;sscore=7.89;rscore=6.89;uscore=1.58;tscore=-1.84; +test_runprokka_H299.0003 Prodigal_v2.6.3 CDS 1890 2582 21.9 + 0 ID=test_runprokka_H299.0003b_00019;partial=01;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.289;conf=99.36;score=21.95;cscore=23.44;sscore=-1.49;rscore=-2.97;uscore=-0.41;tscore=1.88; diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test.0417.00002.gen b/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test.0417.00002.gen new file mode 100644 index 0000000000000000000000000000000000000000..60062379692163fccdeaa2a0ab64d671cfa5a47f --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test.0417.00002.gen @@ -0,0 +1,1940 @@ +>test.0417.00002.0001b_00001 501 NA | hypothetical protein | NA | NA | NA +ATGGCCGACAGTTTCCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTG +CATACAGGCAATGCTAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGAT +TACAGTAACGGAAAAGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAA +AACAACTTCAACAGCGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGAT +ACGCTAAACGGAAACGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGAT +TTTGAACCCGAACAGGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGC +AATTTACTACGTGACCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTG +GAAAATATCCTGAAAGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATT +GCGCCGCAGGAGAACGTTTAA +>test.0417.00002.0001i_00002 1539 NA | hypothetical protein | NA | NA | NA +ATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTGAGTCC +GGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCATTCAG +GAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGCGCGTG +ACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGGTTAAG +CTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTAAACAG +CTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTGGTACA +TGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGGATATC 
+AGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTGGTTTA +TATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCTCATTA +ATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATATTTCC +AGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCTTCCTT +AAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACCGCGCA +GAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGATTAGTG +ATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCAGCTTT +AACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACGCCTCG +TTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGCAGATC +CGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATCTCGGC +ACCGGCAATCAGGTCAAAATTCCGTCCGAAGTGATGATCCCGGAAACCCGCGAATTTGAA +TTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGAATCGCGATTACGCCTGCTTC +TTCTCGGCGAACTCTGCCCAGAAACCGGCGTTGTACGATACCGCTGACGCCACCGCCAAC +AGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATTACCTG +AAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAACTGGAG +CTGAATACCTGGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAACTTCAG +GCTTCGCATCCACTGCGCGACGGGAAAGTTATCGTCGAGGACATAGAGGACAATCCGGGC +TTCTTCCGCGTCAGACTCTTTGCCGTGCCGCATTTCCAGATTGAAGGGATGGATATCAAC +CTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGA +>test.0417.00002.0001i_00003 1338 NA | hypothetical protein | NA | NA | NA +ATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTTCAG +CAGCAGGCCCGCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGCCAT +CCGTGGGGGATCGCAAACGTGCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTGAAA +ACGCAGGCAGTACGCCTGCGTTTTGCTGATGGCACGCTGATCGATTCAGACGTGAGTGAC +GTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACGACAGCGCGATTGTTTTGCTG +GCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCAGACTGAAAGA +CCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGTGAA +GATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAGGAT +TACATCACCTGCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAGGAT +GAGAGCTATATTCCGCCGTTACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGTCTG +GACACATTGCTGTTGCAGCTACGGGCGAAGTGCCAGCGTCTGATGGCGATGCGCCGGGAA +AGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCTCCCTGTTCTGGCTGCTTAAC 
+GCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGCTGTCCACCCC +GAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTTGAG +CATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCGCCC +CTGTTCTCCCTGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCGCTG +GATCTGGCGTCCCTGCCGGGCAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTGCGG +GAAGAGGCCGATTTTTATCTGTCCGTTCGTTCCTCACTGCCTGCGCATCAGGTACTGCAT +CAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATGTCACGCTGCTTATCAACGTG +GCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCTGCCGCTGCGG +CTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTGGAG +TCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTGTTT +GCGGTGCTGCGCACATGA +>test.0417.00002.0001i_00004 666 NA | hypothetical protein | NA | NA | NA +ATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCGACACGTTTCTGACGGTG +GTGGAACTGCGTCAGGGAACCACCGTGCGTCACGGTATCGAGCTGTATCGCCACTGTCAG +CGGCAGGTGGAACTGGTCCGCGAACGTCTGAAAGATGCCGGATTCAGTCGGGAGAACGTG +GAGCACATAACTTACGCGCAGTGCGCCCTGCTGGACGAAACGGTGCTCAGCCGTAGTGGC +ATGGACGACGGTCAGGCCATCTGGATGAAAAACCCACTCCAGTCGCATTTCTTCAACACC +CTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGCTACAGGAACCCGCCCCC +GCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGGGATTTCGCGGGCGTTAT +CAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGCTCAACGGGCAGGTCGCG +CCATTTGGTGTGCTGCCGGAAACGGCGGTACTGAACGTGCCGTTATCCACCCGTCAGCAC +CCTTTGCTGCATTCGCCATTTTTCTGGCTGGTAACACTGGCGCTGCTACTGGCGGGCGTC +TGGTGGGGGCTACACCACTGGCTGAACGTGCTGGTGGATGAACTGCTGCCGCAAAGCCTG +CGTTAA +>test.0417.00002.0001i_00005 1653 ompA | Outer membrane protein A | NA | protein motif:HAMAP:MF_00842 | NA +GTGAGGAACACGCTGAAACAGGCCATCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTG +TGGTCAGTGTTTATCAGTCCGTCTGGCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTT +CTGGCGGTTGCTGCGTTGTTGATTTATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGC +GATGCCGGGTTGTCATCGCTGCCGCCGGAAACCTACCGGCAGCCGGTAGTGCTGGTCTGC +GGCGGTCTGTCGGCGCACCTGTTCACTGACAGCCCGGTCCGGCAGGTTTCAGAAGGGCTG +TATCTGCATGTTCCTGATGAAGAACAGCTTGTGGCGCAGGTGGAGCGATTGCTGACCCTT +CGCCCGGCGTGGGCATCGCAGCTTGCCGTGGCGTATACCGTCATGCCCGGCATACACCGG 
+GATGTGGCGGTTCTGGCCGGACGGCTGCGACGGTTTGCCCACAGTATGGCGACGGTGCGT +CGCCGGGCGGGCGTAAACGTCCCCTGGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTG +CCGGAAAGAGCGAGTTCACCGTGGTTTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACA +TCCACAGAGACCACCATGCCCGCGCAGTGGATTGCACAATCCGGCGTACAGGAGCGCAGT +CAGCGACTCTGTTACCTGCTGAAAGCTGAAAGCCTGATGCAGTGGCTGAATCTTAATGTG +CTGACGGCACTGAACGGCCCGGAGGCGAAATGCCCGCCACTGGCGATGGCCGTGGGGCTG +GTCACCTCGTTGCCAGCGGTGGATAACAACCTGTGGCAAGTGTGGATCACCGCCAGAACC +GGCCTGACGACGGATATCGCGGACACCGGCACAGACGCCACGCTGCCGTTTCCGGATGCT +CTGTTACGGCAGTTGCCGCGTCAGTCGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACC +ATGCTGGGCATTACCACCGCGGCGGGTATCACCATGTTGTGCCTGTCAGCCACGGCAAAT +CGCCAGTTATTACGGCAGGTCGGTGACGATCTGCACCGGTTTTATGCCGTCCCGGTGGAG +GAATTTATCACCAAAGCCCGTCACCTGTCGGTGCTGAAAGACAATGCGACCATGCTCGAT +GGGTATTACCGGGAAGGAGAACCACTGCGCCTCGGTCTGGGGTTATACCCCGGCGAACGC +ATCCGCCAGCCGGTATTACGCGCCATTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAG +GTGACGGCTTCGCTTCAGGTTCAGACCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTC +GGACAGGCCCGCCTGAAAGACGGCTCGACAAAAGTGCTGGTGGATGCGCTGGTGAACATC +CGGGCAAAACCGGGCTGGCTGATCCTCGTGGCCGGATATACCGACGCCACCGGCGATGAA +AAAAGCAATCAGCAGTTATCGCTGCGGCGTGCCGAAGCGGTGCGCAACTGGATGCTGCAG +ACCAGCGACATCCCGGCCACCTGTTTTGCCGTACAGGGACTGGGCGAGAGCCAGCCTGCG +GCGACCAACGACACGCCACAGGGCCGGGCAGTCAACCGGCGTGTCGAAATCAGTCTTGTT +CCGCGTTCTGACGCCTGTCAGGACGTGAAATAA +>test.0417.00002.0001i_00006 492 hcpA | Major exported protein | NA | similar to AA sequence:UniProtKB:Q9HI36 | COG:COG3157 +ATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAGGTTCC +GTGGACGTTCAGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATGTGTAC +ATCCCGACCGACAATAACACCGGCAAACTGACCGGTACCCGTACTCACAAGCCCTTTACG +TTTACCAAAGAAATCGATGCCTCCAGCCCGTATCTCTACAAAGCTGTGACCACCGGACAG +ACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACGATGCCGGTCAGGAAGTGGAG +TACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCTTATGCACGAC +ATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCTACGAG +AAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATGAGCGT +CCTTCCGCCTGA +>test.0417.00002.0001b_00007 2637 clpV1 | Protein ClpV1 | NA | similar to AA 
sequence:UniProtKB:Q9I742 | COG:COG0542 +ATGACAGGAAATCACTCCGCCGCGCTGCTGCGTCGCCTTAACCCATACTGTGCACGGGCG +CTGGACGCTGCCGCCTCACTGTGTCAGACCCGCGCCCATGCGGAAATAACCATTGAACAC +TGGCTGCTGAAACTGCTGGAGCAGGGAGAAGGCGATATCACGGTGATTGCCCGCCGCTAT +GAATGGGATATCGACACGCTCTGGCAGTCTCTGCTGGCACATCTGGACACCTTACCCCGC +CCGGTCCGCGAACGTCCTCAACTTTCTGAACCGCTGGCAGCGCTTATCCGACAGGCGTGG +CTGATAGCGTCACTGGAAGGCGACGATCCACAAATCCGCAGCCAGCATCTGCTGATGGCG +CTGACAGAAAAACCGATGCTGCCCGCCTGTAATGACCTGTGGGTATTGCTGAGTCTGAGC +CGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTGGATGCGCAGTCGGATGAATGTCCGGCA +CGTCAGCCACAGGTCACCGAACCGCTGACCTCTGCACTGCCGGAGACGGCAACGGCGGAC +GCACCGGCAAAAACGCTGACGGAGAAACAGGATGACGCCCTGCTGGCGGTGCTTAACCGC +TTTACCGAAGACGTGACGGAAAAAGCCCGCAGCGGGCGAATCGACCCGGTATTCGGGCGC +GACACGGAAATTCGCCAGATGGTCGATATCCTCTCCCGTCGCCGCAAAAACAACCCGATT +CTGGTGGGAGAACCGGGGGTGGGCAAAACCGCGCTGGTGGAAGGGCTGGCGCTGCGTATC +ACCGAAGGCAACGTGCCGGACAGCCTGAAAACGGTGCATATCCGCACACTGGACCTCGGT +CTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAATTTGAACAGCGGCTGAAAAATGTCATC +GATGCAGTGCAGAAATCACCGGAGCCGGTACTGCTGTTTATTGATGAAGCCCATACCATT +ATCGGTGCGGGTAATCAGGCAGGCGGCGCGGATGCGGCGAACCTGCTGAAACCGGCACTG +GCAAGGGGCGAACTGCGCACCATCGCGGCGACCACGTGGAGCGAATACAAACAGTATTTT +GAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAGATGGTTAAGGTTGACGAGCCGGATGAT +GACACCGCCTGTCTGATGCTGCGGGGACTGAAGGCTCGCTATGCACAGCACCACGGCGTG +CATATGCTGGACAGCGCCATTCAGACCGCCGTGCGCCTGTCGCGCCGCTATCTGACCGGA +CGCCAGCTGCCGGACAAGGCGGTTGATTTGCTGGATACCGCCGGGGCAAGAGTCCGCATG +AGCCTTGACACCCTGCCGGAACCGTTGACGCAGCTTCATGCGCGACTGGCGGCACTGGAT +ATTGAGCGGGAAGCGATTGAGCAGGACAGCGTATTTTATCCCGAAGCCAGCCCGGAGCGG +CTGGCGGAACTGACCGATTTGCGTGATGAGCTACAGGCAGAAGCCGGGCATCTGGAAGCG +CAGTATCAGCAAGAAAAGGCACTGGCGCAGCAGATTATGACGTTGCGTCAGGAAGGAACA +GACAGCTCTGAACTGCAACAGCAACTGCGGACGCATCAGGGCTTTGCACCGCTGCTGGCG +CTGGATGTGGACGCCCGCGCCGTCGCCACGGTGGTGGCGGACTGGACCGGCATCCCGCTC +TCTTCCTTGCTCAAGGACGAGCAGAGCGACCTGCTCAGTATGGAACAGAGTCTTGAAAAC +CGCGTTGTCGGGCAAAGCCCGGCGCTCTGCGCCATCGCACAGCGGCTGCGGGCGGCTAAG +ACCGGCCTCACGCCGGAGAACGGCCCGCAGGGGGTATTCCTGCTGACCGGCCCCAGCGGC 
+ACCGGTAAAACCGAAACTGCGCTCACACTGGCCGACACTCTGTTTGGCGGTGAAAAATCC +CTTATCACCATTAATCTTTCGGAATATCAGGAACCGCATACCGTTTCCCAGTTGAAAGGT +TCGCCTCCGGGCTATGTCGGCTACGGTCAGGGCGGCGTGCTGACCGAAGCGGTACGCAAA +CGCCCTTACAGCGTGGTGCTGCTCGACGAAGTGGAAAAGGCGCATCGCGACGTGATGAAC +CTGTTCTATCAGGTGTTCGACCGGGGCTTTATGCGCGACGGCGAAGGGCGGGAAATCGAC +TTCCGTAACACCGTGATTCTGATGACCGCCAATCTGGGCAGCGACCACATCATGCAGCTG +CTGGAGGAAAAACCGGACGCCACGGACGCAGACCTGCATGAACTGCTGTACCCCCTGCTG +CGAGACCATTTTCAGCCTGCACTGATGGCGCGCTTTCAGACGGTGATTTACCGCCCGCTG +GGACAGGAGGCGATGCGCGCCATTGTGGAAATGAAACTGGCGCAGGTGGCCCGCCGTCTT +CACCAGCACTATGGGCTGGAAACGGAAATCAGTAACAGCCTGTACGACGCCCTGACCGCC +GCCTGCCTGCTGCCGGACACCGGTGCGCGTAATATCGACAGCCTGCTGAACCAGCAAATC +CTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAGCAGGCCGTGCATCATAAGCCTGCCCGA +CTGCGGCTTGACTGGGATGATGAAGACGGGATTGTGCTGGAATTTGATGAGAAATAA +>test.0417.00002.0002b_00008 1161 NA | hypothetical protein | NA | NA | NA +ATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTTAATTAAAGGGATCTTC +AAAGTGCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAGGGATATTGTACGAGCG +ATTGATGCTTCCGTTTCCCTGTTTAATAAATTTATCGATTTGCCAGCCGTGCAGGCGACA +ATGAAGTGGATGAAGATTTATAACCCGTATACGTATGCTGAGAAGCAGGTCAGGGAACTG +ATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAAGCTGGATGAGTTAATGGACGTCACT +GGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCATTCGCCAGCCGATAGAG +GTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACACCATGCTTGCAAAAGCG +CTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCTGCACCGGGAAGGGGAC +GATTATTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTCTCGCCTGAAAGATGCT +GAAGAGGTGGAATTGCTGGCTACCAAAAAGCCAGACTGGGCGGATATTGGGGGTAAAGAA +AAATATCCACAACTGGAAAAAGCCAGTGCGGAACAGAAAAGATTAATGGACCCGGAGAAT +AAGGAGGGCGGCTACCCGAATATTCCTGATGATAAAGTGCAGACTTTTCATCAGATGGCT +CCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGACCCTGGCAGTAGCGAT +AATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAAGAGTAAGTCTCAGTGG +CGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGAGTATGTAGTTTATACC +GTGCCACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGCCTCTCAGGTGCGTGAA +GTCACAGGTAAGAATGGAGAGAACATTAAAGTCGTGCTGGAAGGCGGATCACTTCAGATA +GTGATAGATCCGACCGTTCTGAATTTGGACTATTTGGGGAAACGTCAGTCTACAGGATGG 
+GGGTATAGAGATTTTTCTGATGAAGTGGATATGTATATAGGTGTGCCTCAGTTGCAAACA +AATATTTATGTACCTAAATAA +>test.0417.00002.0002i_00009 1068 NA | hypothetical protein | NA | NA | NA +ATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGAATAATGTCGCCGGAATAT +TATCGGCGCCGTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTGTGCGAACGGCAAGTGGCG +GAGTGGAGCAAGACCATTCCGCTGGATGTGCGCCGTCGTCCGCTGTACGAGCAGATTGAC +GCCGTCTGGGGCGGGCGGGTGTTGCCCAATATCCGCAGCACTTTAAAGTCGGTACAGTAT +GACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGCAATCCGGGGGCAATATTAGC +AGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATGTCACCCGCCGCGCAAAAA +CAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAATCTAATCAGACGTACCTCG +GGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAGGAAAGTCTGCACGGCCCG +CTGGCCCTGCCGATGCAATTACCGTTGTATGAGCTGGATAGCAGCGTATACCTGCGTGAG +GATGACCCGGTAACGGTGGCTGGCCTGTATCTGCCGGATATCCCAGATGCCAGCGCCCAA +CTGTTGTACCGGAGTGAACATATTCCCGAGGCTTGGCAGGGGCGGGTACGAACGAAGTAT +GTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCGGGGCGTGGGCAAAATGCAAC +TGGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTGCCGCCGGAGGGATTTTTC +CCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGCGAAGCGCAGTATGTAACA +GACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCTCATAGCGGGGAGTGGTCG +ATTTTTGTAGAAGGTAGACAAGCGACGGAGACGCTGGAGCAGGGAGAGCAGATGCCGGAA +TGGACGGACAGGAAAATGGAGGGGGAGTATAAAAGAGGTGAGAAATTCCATGTGCTGTGG +TCGCTGATGAACCGCCACGATGGCGGGTCGGTGTGGGTGGAAGCGTAG +>test.0417.00002.0002i_00010 381 NA | hypothetical protein | NA | NA | NA +ATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACAGTATCAGACAGTGTTTAT +GCGGATACAGATCAAACATATGATATTTTTTGGGGAATGCTGGTAAAGGATAAAAAGGAT +ACTATATTTGTTCGCTGTGACAGTCCGTTATTGAAAATGAAAATTGTGAGAATGGCGGAT +GCAAATACAGAAAACATTGATAAGGCATACCAGATATTTAATCAGAAAACGAAAAAATCA +ATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGAGTGGAAAGTATATTTTCAAT +ATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTGTCCGATGTGCTTAATGCA +ATAGATGAACAGTTTCGATAG +>test.0417.00002.0002i_00011 264 NA | hypothetical protein | NA | NA | NA +ATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTTATATCTGTG +TCATCTTCGATGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAGATAAACTGC +CCTGTTAAAGGGCATGGTATTAATACCATCATCGAGGGGAGTTTTGATTGGATTTCTGAT 
+GGCAAACAGGTCGTCGTGAATGGCTGCAGGTGTGAATGTGGCTGTGTTGTTATATCCAGT +ATTGCTGATGCCTTGATTGGATGA +>test.0417.00002.0002i_00012 1140 NA | hypothetical protein | NA | NA | NA +ATGGGATGGAAACGGACGTATACAGAAGAAATAGACAGGCCACAGGATATTTACTTTCAT +AAGTGGTTATTTTCTTTATTTATTTTATGTATATTATTACTCGTTATTTATTATTTTTTC +CATGAATTTGTTGTAGCTAATAACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTG +TGGGTATTGATTCTTTCAGTACAGGTAATATTTTATTCCAGAGCTATTCAGGATTATTCA +ATTTGGCTGGAGAACAGACTTAGTATCAACAGAGAGTGGGAGGCATGGGGATCAAGATAT +GTTTCTGTTATGAATAGTAGTCTTCATCTTCCTGGAAAAGTCGATGTTTTATTCTTGTCT +GGTGATGAATTAGAAACTCAGTATGGACTTGTCAATAAGTCAGATGATATCACATGGAAG +CAACATGATTGGTATGCCTGCTTTCAGACCCTTACTAATCATCTTGAACTTTATAAACTC +CCATATCAACTTACACAAGAATTTATTATTCTTACTGATTTTGATGAAAGTATGTACTCT +CAGATTGAAGAGGACTTTTTCAGAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTT +TTGTTGCATATTTCCCCTTCAATGTCCTTTGGAGAGCTTGATTTATGGTTAAAGGATTCC +GAAGAGAAAATATATATTGTCATGGTGTTGCAGATGGAGGAGCAAACATCCTGTTCGGAC +GCTATGGCTTGCCTTATGTTTGCAACTGATGATGTTACTGCTAAGTACAAACTCACTGAA +AAGGCCAGAATTTATCGCCCAATGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAAT +ATTTTTATTGACACACAAAAAATATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAG +CGTCTGTTTTCTGTGAGTAGTAATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTG +AAAATTGATAATATCCATCTTTTAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTC +TGGTTAACGGCAGCGCTGACTATTTCGGTGGTTGTTCACAAAAATTCAGATTACTTGATG +ATGTCCGAAAATAATGATGACTGGATCATTACCACCATTCATCCTATGGAGCATTCATGA +>test.0417.00002.0002i_00013 3354 NA | hypothetical protein | NA | NA | NA +ATGAAGAGAATAAATAAAAAAAGTGTTTTTATATCTAATGTACTTTTATTCTTGGTTATT +GTGGCCTTCGTGGGGGGGATCATCTGGCGTTTTGGTGATCATTTTGGACTGAAAGGGGAT +GAAAATAATTTTTTTGCGTGGTTGATATGCATTATGACCCTCATTTTTGTACGGGCATCC +TGGTATTTCTCTCGATTGTATCGCCTACGAAAGGAACAACATCACTCCGAAAAGGAAAGA +TTACGCCCGGAGAAAGAGGCTCGTATTGAATATGGCAAGGTCATAACCCTGAACATTGAG +CTAGCTGAGTATTTATGTGCCCTATACGGCCCATTCTGGCGGCGTAAAGTCCGCCTGCTG +CTGGTGACCGGCGAGCCTGAACAGGCAGAGGCCATCGCGCCGGGGCTGACCGGGCAACAC +TGGCTGGAGGGCGACCACAAGGTGCTGATATATGGCGGCAGGCCATCAGCGGAGCCTGAT +GTCGCGCTACTGACCGCCTTAAAAAAACTGCGCCGCAGCCGCCCGCTGGACGGCATCATC 
+TGGCCGCTGACAGAAGAACAGAGCCGCCAGACAGCGCAACTCGACAAAGGCTGGCGCGAA +CTGATAAACGGCGGTAAGCGACTCGGTTTTCAGGCTCCACTCTATTTGTGGCAGGTCTGT +GACAACGGTGATTATCAGACCGGACGCCCCCTGCAAAGCGTCGGCTGCCTGCTGCCGGAA +CGCTGTACCCCGGAACAACTGGCTGCAATGCTGGAAGCACAAACCCTGCCGCTGACGGAA +CAGGGCATGTCGCAACTGCTGGCAGATAACCGCCATGATTTCCTGCTGCGTCTGGCCCAT +ACCCTTGCAGAGCGGGGTATCGCTCACTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGC +GGCGCATTTTCTTCCCTGCGCCTGCGTGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTG +CCGGAGGCCGCACCTCATGCGTGGCTGCCGTCACCGGTCTGGGCGGGCGTGACGGGTGAT +AACGCGCGCGGGCGTGCAGTGGGCTTTCCGTGGCTACGCGCCGCGCTGATAACCAGCATC +TGCATGCTGGCGATATGGGGGGCCGGAATGACGACCTCGTTCTTCGCCAACCGCGCGCTT +GTTCAGGAAACCGGTATCCAGACGGCACGTGCGCTTGATACCCGCCTGCCGCTGGCAGAA +CAACTGGTGGCGCTGCATACCCTGCAGGGCGAACTGGAACGCCTGCAATATCGTATCCGC +GAAGGTGCGCCGTGGTATCAGCGTTTTGGCCTTGAACGTAACCAACAACTGCTCGCCGCC +GCTTTTCCCGGCTATGCGCAGGCGGCAAACCGGCTGGTGCGCGACGTGGCCGTTGACCAT +CTGCAACAGCAACTGAACGCCTTTGTCGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCC +ACCGGTGAACAACGCTATAAGCAGCTTAAGGCATTGCTGATGACTTCCCGCCCGGAAAAG +GCCGACGCTGCCTTTTTCAGTACCACGCTGATGGCGGACGGTCTGCGCTACGAGAATATC +CCGGAAGGTGTGCGGCAGAGCGTGTTGCCGTCACTGCTGACCTTCTGGATGGCGAACCTG +CCGGAACACCCGCAGTGGAAAACCGCACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAA +ATCCTGCTGCGCCAGATTGGTGTGCGTAATGCTGAAAACACCCTCTACCAGAACGTGCTG +CAACAGGTGTCCCGCAACTACGCCGATATGACGCTGGCGGACATGACCGGGGATACGCTC +ACCGAATCTCTTTTCAGTACGGAACAGACAGTGCCGGGGATGTTCACCCGTCAGGCGTGG +GAAGGACAGGTCAGGGAAGCCATCGAGCAGGTAGTGACGGCGCGGCGCGAGGAAATCGAC +TGGGTACTCAGCGACCGCCAGCAGGATACCTCTGCGGATATCTCGCCGGATACGCTGCGT +AACCGTCTCACCTCACGCTACTTTACCGACTTTGCCGGAAGCTGGCTGGCGTTTCTCAAC +AGCATTCGCTGGAAAAAGGAAGACTCGCTCTCCGGCATTCTCGACCAGCTGACACTGATG +GCCGATGCCCGTCAGTCGCCGCTGATTGCGCTGACCGATACCCTCGCGTGGCAGGCGGCG +GCTGGCAGGGAAAACCGTGGCCTGTCAGACTCGCTGGCGAAATCGGCACAGGAACTGTTT +AACGGCAAGGAGAAAACGCCGCAGCAATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTG +GATAAAACCTTCGCGCCGCTGCTGCGGTTGCTGGGCGATAAAGCCGGAGGCGGAGACAGC +CAGCTGAGTCTGCAGACCTACCTTACCCGCGTTACCCGCGTGCGCCTCAAACTGCAACAG +GTGACCAACGCTCCCGACCCACAGGAGATGACCCAACAACTGGCGCAGACAGTCTTGCAG 
+GGCAAAACCGTTGACCTCACCGACACCCGCGACTACGGACGGTTAATCGCCGCCAGTCTG +GGCGAGGAATGGAGTGGCTTCGGTCAGGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGG +CGGCAGGTGCTGACGCCTGCAGCGGACAGCCTGAACCGCCAGTGGCACCGGGCGATTGTC +AGCCACTGGAATCAGGACTTCGCCGGGCGCTATCCGTTCAAAGCCTCACAGAATGACGCT +TCCCTCCCCCTGCTGGCGCAGTACCTGCGCGATGACGGGCGCATCAACCAGTTTATTGCC +GCCAACCTTTCCGGCGTTCTGAAACGTGAAGGCCGCTACTGGGTGGCTGACGCCATGAAC +ACGCAGGGGCTGACGGTCAATCCGGACTTTATCCGCGCCCTGAACCGCCTGCGCGACGTG +GCCGATACCGCCTTTGCCAGCGGCGATGCCGGGATACATTTTGAACTGCGGGCAAAACCG +GCCCGAGACGTGATGAAAACACATCTGGTGATTGACGGGCAGGAACTGGAATATTTCAAC +CAGAAAGAACGCTGGCAGCGTTTTAACTGGCCGGATGAACAGTGGCAGCCCGGCGCATCG +CTGAGCTGGACCAGTACGCAGGCGATGGAGCGCATACTGGCGGATTATCGGGGAAGCTGG +AGCCTAATTCGTCTGCTGGAACAGGCGCAGGTGACACCGGTGGACAGCAGCACCTTTAAA +GTGGTGTGGAAAGCGCAGGACGGCCTGCCACTGAATTACCTGCTGCGGGTTGAACAGGGA +AAAGGGCCGCTGGCGCTGCTGGAACTGAAAAACTTCCGCCTGCCGGGACAGGTATTTCTG +ACCGGCAGGAGTATGAAGGATGCGGAAGAATACGGGGAAGACGCCGATGAGTGA +>test.0417.00002.0002i_00014 1638 NA | hypothetical protein | NA | NA | NA +ATGCGGAAGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGC +TGTTTTGCCGACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACA +TGGCTGCTGCCGGTGACGGCAGACACGCCGGTCGGGGAAGACCCCGGCTACCACGACGAT +TTCCTGCGTATCCGCGACGAGATGAACAAACTTTCCGGCGCGGATACGGACCTCATCTGC +CAGCTTGCCGAATCCCTGCTGCTGACGCAGGCAAAAGACGTGCGCATCGCCACTTACTAC +ATCTGGGCGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACTGGCGCTGCTG +ACCGGACTGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAA +ATGGCGCTGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAA +GTGGCAAAAGAGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTC +GCCGCATGGCCCGAAGACCAGCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAA +TCACGTCTGGCGCAGTCGGGTGGGATGAATGCGGTGGTGCCGCAAAACAGCAGCAGCGTT +CCTGCACCGTCATCCCCGGTGGATGCGCCACAGGTACAGACCATCACCTCCGGGCGCGAC +CTGCTCGACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCAGGGCTGGCTT +TCAGCACACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGAT +GTGGACGGCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGG +CTGTATGCCCAGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACC 
+GGTGTCAGCCATTTCTGGCTGGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCG +GGCGCACCGTGGGACAGGTGGACAGCCGTTATCCGTCAGGACCTGACGTTACTGCTGGAG +CGCCTGCCGGGACTGGAAAATCTGGCATGGAACGACGGCACACCGTTCGCCGACGAGGTG +ACGCGCAACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATGGCTTGCGGGG +AAAGCCGCTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCA +CTGGCGATGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCG +GGCATCACCACGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAA +CAGTACGGTAAAAACGAGATGGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAG +GGAATAACGCTGACGCAGTGGGAGCCAGAACTGCTGTTTGAAGTAAAAGCCCGGCAACTG +AAACTGCTGCGCCTGCGGGCACATCGCCACGCGGACAAGGCGGCGCTTGCCCGGAAAATG +GACGCTCTGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGTACTGTGTGAT +ACGCAGCATAAGGACTGA +>test.0417.00002.0002i_00015 1761 NA | hypothetical protein | NA | NA | NA +ATGGACGACCTGACCCAACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGT +AAAGAATTTGCGCAGGCTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGC +GCACGCGATCCCTATGTGGAGCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTG +CGCGAAAAGCTGGACGACGATCTGCCGGAACTGACTGAAGGGCTGGTCAGCCTGCTGTGG +CCCCACTACCTGCGAACCATCCCGTCACTTTCCGTGGTTGAACTGTCGACAGATCACCGG +CAAATGAAGCAGAGCGAAACGCTGAGCGATTTTCAGGTATTGTCGCGCCCTGTTGGCGAG +CGCAGAACCCGCTGTTTCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTG +CCGGACGTGTCATTGCAATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCTTTGAA +TGCGGCCCGCTGGTCGGCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTC +AATGCCGACAGCCCGGTAGCCTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAG +TTCTGGCTGCGTCTGCCGGGGCAGGATCGCCGGATGCTTGGCGCACACTTTTCCCCGATG +GGCTTTGAGGATGATGACAGGCTCTGGCCAAAAGGTGAGTCAGCCTTCAGCGGTTACCAG +TTGCTGCTGGAGTATTTCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCTGAACGGGCTG +GAGCAGGTTGCATGGCCGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAG +AACTGGCCTCACGACCTGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTC +ATCAACCTGTTCCCGCTCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTT +CTGCTGCGCCCGATGCGCATTCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATT +ATTTCTTCGCGCCATACCGGCAGTCAGGCATATGTCCCCTTTTCCAGCTTTCGTCACCGG +GGCGGGATGCTGCGCCACGATGCGCCGGAACGCTATTACCACACGCGGGTAAAGCGCGGC 
+CCTTCCGGCTTGCACGACACATGGCTGATTCTGGGCGGCGATGCGTTTGATTCCGACCGG +ATGCTGGAGGATGAAACCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGT +AAAGCCTTACAGAGCACCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGG +GTGCGCAACCTGTGCGCCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCAC +TGGCGGGTGCTCAGCCACCTCGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATT +CTGCGCGGCACGCTGGCGCTGTACGACTGGACCGAAAGCGAGATGAACCGCCGTCGTCTG +GAGGCGATTGTCGACGTTCAGCACAGCCTGATACAGCGTTTTGAAAGAGGCTTTCTGCTG +CGTGGCGTGGATATTCAGGTGACGCTGGACAGTAACGGCTTTGCCGGAGAAGGTGATATC +ACGCTGTTTGGTGAACTGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTC +ACTCAACTGACCTTAATTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCAC +AGCCAGCGCGTACCGGGCTGA +>test.0417.00002.0002i_00016 1080 NA | hypothetical protein | NA | NA | NA +ATGGACAGAGCATCACAGCCAGCGCGTACCGGGCTGACCGACCGGCTGGCCCCGGATATT +GCGCGGATCAATTTTTACCGTTTTTGCCAGTTGCTGGAACAGAGCCAGCAGAAAGCGCCG +CTGGGCAGTACCGACAACCCCGCCGCCGATGCGGTGCGTTTTCGCCCCCATCCCGGAATG +GGCTTTCCGGTCAGCGAGTTAAAGAACGTTGAACGTGACGTGGACAATCCCGACGCGCCA +CCCACGGTGCGCACCACCTTTCTCGGCCTGTACGGCGTGGATTCACCGCTGCCCACCGCC +TATCTGGACTACATTACCCAGCGTCATGACGGACATGACGCAGTGATGGCGTTTCTCGAT +ATTTTTAACCATCGCTTTATCACCCAGTATTACCGCATCTGGCGCAAATATAACTACCCG +GCGTCGTTTGAAGCAGGTGCCGTGGATGACATTTCCCGTTGTCTGCTGGGGTTAATCGGG +CTGGGTATTCCCGGCAGCGAGAACCATATCGCCACGCCTGTATCCCGTTTTCTGGCCCTG +CTCAGCGTGATGCGCCTGCCCACCCGCACGGCTGAAGGCGTCACGGCACTGGTGGGGCTG +CTTGCCCCGCTGACGAAAGCCACGGTGGTGCCTCACGATCCGCAGCCTGTAATTCTCCCG +GCCCCTGCGGGTCTGTCAAAAAATTCACGCATCAGCCTGAAAACGCGAACGCTGCTGGGG +CGTACCGGTACCGACGTCAACAGCCAGTTGCTGCTGAAACTGTATACCGAAGATGCCGCA +GAAGCACGTGGCTGGCTGCCCGGCGGGCAACTGCACAGCGATTTGCTGGTGCTGCTGCGC +GTTTATCTGGGCTGGCGCTGTCAGGCCCGTCTGCAACTGACGCTGCCCGTCAGCCTGTTG +CCTGCTGCCCGGCTGGGAAAACAGCGTGTACAGATTAGCCGTACCGGCATCCTTCTCGCC +TCCTTTGCCGCGCCCGCGACCGGAACAGTGACGGTCAGTCTGGGGCGTTATCAGGGATTA +ATACCCGCTTTTTCCATTCGTAACAGGGAGAGTATGACTCATGTTTCCTATTCGTTTTAA +>test.0417.00002.0002i_00017 537 NA | hypothetical protein | NA | NA | NA +ATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGACGGTTGTT 
+CTGAGTGGCTGCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGGCCTCAGCC +GTTTTCTACAAACAAATCAAAATACTGCATCTCGATTTCTTCTCCCGCAGCGCCCTGAAT +ACGGATGCGGAAGATACGCCGCTTTCCACGATGGTGCATGTCTGGCAACTGAAAACCCGC +GAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGCAGGAAGAGAAGACGCTGGAG +AAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGCATCCCTGAAT +GTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATCACCCTGAT +GAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCGACAAGCCG +CGCTCGATTGAACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATAAATAA +>test.0417.00002.0002i_00018 429 NA | hypothetical protein | NA | NA | NA +ATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGTTACCGCTG +GAACAGATCAGCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGCAACGCATT +ATCAACTGCCGGGCAGGCACGCTGGCGCATTTGCCGGATTACGGTCTGCCGGATCTCAGT +CTGATCCATCAGGGGATGGCTGCGGGTATTCATGGCCTGATGCGTCAGATTGAAGAAACA +CTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGGAATTACTCCCCCAGCCCCGT +CCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTGGATACGCTTT +GATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAACAGGAGCGG +GCGTACTGA +>test.0417.00002.0002i_00019 1377 NA | hypothetical protein | NA | NA | NA +ATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGGCGATCCCTGTACTTAT +AAGGAATCCGGTGAACTGCAGGCTGAAATGAGTAAACTGACTCACCCGGCCCGACCGGAT +GTGGACTGGCGTCAGGTGGAAAAACTCTGCCTCGCGCTGTTCCGGCAAAATGGCGTGGAA +CTACAGACGCTGGTCTGTTACGTACTGGCGATAACCAGACGGCAGGGGCTGGCAGGGATG +GCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCTGGGCTGACTTCTGGCCGGTA +CAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAAAATGCAGCAGGCACTG +AGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCGTTGTGTACAGCATCTT +TCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATATGACGAAACTGGATCTA +CTGGCCGGGCAGTTTCGCAATACCGCATTGCGTCTGGAACGGCTGGCGCCTCAGGGAGCG +GAAACCACTATCACTCCCCCTGAATTACCCCGCCGGGAAATGAATCAACCGAAAAAGTCA +GAGGAAAGTCCACAGCCGGTTTTTGCAACCAGATCCGTTCAGCAAAACGATAAGGATGCC +AGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGACATGGCCGATATTTATGGCC +GGAATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGGCTGGTCGCAGCTTAAT +CAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCCATTACCGCAGTCGCTG 
+GAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCTGCTGGCTCAGGACAGA +ACAATTGCGGCAAGTCAGATGCAACTGGAGCAGTTAAACAAATTGCCTGCCCGCTGGCCA +CTGGAGCAGGGATATCGCCAGCTACGCCAGCTTGATGCCCTGTGGCCGGATAATCCTCAG +GTCAGGGCGCTGAACGCGCAGTGGCGCAAACAGCGGGAGCTGAGCGCCCTGTCTGCTGAG +GCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGCGCCTGTCGGCGCAGCTGGAT +GCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACTAAAAACGGCGGTGTAC +GGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCTTCGGCAACTGGAAGAG +CAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAATTGATACCCGGTTAAAT +CAGTTGTTGAATCGCTATGTCATTTTACTGGATACGAAGGTGGAACAAAGTCAGTAA +>test.0417.00002.0002i_00020 948 NA | Hydroxypyruvate reductase | 1.1.1.81 | similar to AA sequence:UniProtKB:Q9X1C1 | COG:COG0111 +ATGAAAAATGTTCTGGTCACCGTCCCCAGCTTTTCAGCACGCTGTGTTTCCGCCAGCAAG +TTGCTAAGAGAGAATAATTTTAATCTTATTATTAAGAATAATGTGGAGCATCTGCTTAAA +TCAGAATCCACTGCATTACGAGAATCTATTTGCGCGGTCATCGCCGGAAAAGATGGTTAT +CAGGCGGACACGCTATCATTGCTGCCTGGTGTGAGAATAATATCGAGATTCGGGACGGGG +ATAGACAATATTGATCTTCGTGCGGCACAGCAATCCGGTATTGTTGTCAATAATGCGGTT +GGGATTAATTCAAATGCGGTTGCGGAATTTATCATTGGACTTATCTTCGCGAGCATGAGA +AATATCCCTGGCAGCTATCATGCGATGCAAAATGGCTACTGGGGTGAGTCGCATGGCTGT +GAATTACAAGGGAAACGGATTGGCCTGGTTGGCTACGGTAATATAGGTAAAACTCTGGCG +AAAAGGTTATCCGGTTTTGATGTTGAGCTTTTAGCTTTTGACAAACAACCCGACTATCAG +GTTGCTGACAAAGCTGGAGTTCAGTTTGTATCAATTGAAGATATCTTTATGCAGTCGCAT +GTCATCATTGTTCTTTTGCCTTTTTCTTCTGAGCTGGAGAACTTCATTAGTCATAAATAT +TTGTCGATGATGCGCAATGGTGCTCTAATCATCAATGCCGCAAGGGGAAAGTTGCTGGAT +GAGGGCGCTTTACTTCAGGTGATTGAAGAACGAAATGTGTTTGCGGCGCTGGATGTGTTT +AGCTCTGAACCGTTGGCGCAATTTAGCCCACTGCTACATGCCAAAAATATCATTACAACG +CCGCATATCGCGGCCGCCACCGTTGAGTCATACCAGCAAACCGGGATACACGTTGCCCAG +TCGATAATTGATTACTTCGCAGGAAGGGAGATAAAAAACGTGTTGTGA +>test.0417.00002.0002i_00021 597 kdsD | Arabinose 5-phosphate isomerase KdsD | 5.3.1.13 | similar to AA sequence:UniProtKB:Q9HVW0 | COG:COG0517 +ATGAATAACACGGATCTTATCCATCTCATTAAACATTTTATGCGTAACGAACATAAAGCA +GTTGAAGAAGTTATTGATTCCCCTCTTTCGGAGGTCGCAAATTTAATTAAAGTATTACAA +TCTTGTCAGGGGAAAGTTGTTTTTATTGGTGTTGGTAAGTCTGGTATTATTGCCAGGAAA 
+CTCGCCGCAACATTTGCCAGCACCGGAACTCCCTCGTTTTTTGTTCACGGTACGGAAGCG +GTACACGGCGACCTTGGAATGGTGGCGAAAGACGATGTTGTTATTCTTATTTCAAACAGT +GGTGAGACGGCGGAAATCCTGGCGACACTGCCTAGTCTGAAAAAAATGGGTAATTATTTG +ATCTCTTTTACCCGCAGTCATCACTCATCGCTTGCGATAAGTTGTGATTTATCTGTTGAA +ATCCCCGTCAAAAGTGAGGCGGATAATTTAGGTTTAGCACCGTCATGCTCGTCGACTGTT +GTTCTGGTTGTTGGTGATGCGGTGGCGCTTGCACTCTCTGAATTGAAAAAATTTACTCGT +GCTGATTTCGGCTTATATCATCCAGGAGGTGCACTCGGCATTAAAGCAAATTCATAA +>test.0417.00002.0002i_00022 1176 malY | Protein MalY | NA | similar to AA sequence:UniProtKB:P23256 | COG:COG1168 +ATGGATGTTTTTAATACTCCTGTTTCCCGCAAAGGAACATATTGTACCCAATGGGACTTT +TGCGAGGACAGATTTGGTGTAAAAGATGTACTACCATTCTCTATTTCAGATATGGATCTT +CCGATACCAGACGCTATCACCAGAGCATTAAAAAAACGCCTGGAACACCCGATTTTAGGG +TACAGTCGTTGGCAACATGGTGAATATCTGAATGCGATAGTAAACTGGTATTATCAACAA +TATCAAACAGATATTAAACCTGAATGGATAACCTATAGCCCCAGTGTGATGTACTCTATT +GCAAAAGCAATAGAGTTATTGACATCGCATGGTGATAATATTCTCGTTTTTACACCTGTC +TATAATGCATTTTTTGATGTAATTAAACATAGCGAGCGAAATATTCTGACAGCCTCTTTG +ATTATAAAAAATGAGGGGGGCTACGCTATCAACTGGCAAGATTTTGATCTTAAGATTAAA +AGCGCAAAGATGATGTTATTATGTAATCCTCATAACCCGACAGGAACAGTCTGGTCGGAA +GAAGAACTGCATAAAATCGCTGCAAGCTGTACAAGGCATAATGTCTGGTTATGTTCAGAT +GAAATCCATAGTGATTTTGTTTTTAATCGTAGCTTTACATCCGCGCTTAAAATAAAAAAA +GAAAAAGTAGTAGTATTTAACTCGATATCGAAAACATTTAATGTTCCTGCACTAACAGGA +TCGTATATGATTTCAACTGACGATAATTTTAATCATAAGTTCAGAACGATATCGAGGTAT +CGCGATTTTGTAAACTCCCCATCAGTACTGAATATAATTGCAACTATTATTGCCTACAAC +GAATGTGAGGGATGGTTAAAGTCATTAAAGGCACATATAGCCTCTAACATTCAATTCACC +CAGCAGTATCTGAATGAAAATATTCCAGAATTGATCGTAAGGCCAGCTGATGGTTGCTAT +TTTTCCTGGATAGATTGTTCTGCTATTGGTTATCCTTTTGATGAATTCTACAGTCGATTA +ATTCATGAAGGCAAAGTGGGCATTATGGCGGGGCATGTCTATGGAACGGAGGGGGAGGGC +TACCTTCGTCTGAACCTGGCCTGCGGTCGAGAAAAATTATATATGGGGCTTACGCGTCTT +GTGAGTGTAATTAAAAATATTAATCAGGGAGAATAA +>test.0417.00002.0002i_00023 1581 malX | PTS system maltose-specific EIICB component | NA | similar to AA sequence:UniProtKB:P19642 | COG:COG1263 +ATGAAACAAAAGAAAGCCTGGAGTTTTTTTCAGAGCCTGGGGAAGGCATTTATGTATCCC 
+ATTGCTCTGCTAAGTGTATGTGGCATGATGCTAGGGCTGGGAAGTGGTTTAGCCAGTGAT +GATATGGCAAAGTTAATTCCATTTCTGGCTATTCCAATAATTAAAACCATACTTGATTTC +ATTGTTAGTCTTGGTTTGTTTGCCTTTGTTAATTTACCTGTATTGTTTGCGATAGCGATT +CCCTTAGGATTATTAAAAGATAAAGAGGATAAAGCCTATGGTGCTTTTTCTGGCTTAATT +GGTTTTATGGCGATGCATTTGGGAACGAACTTTTATCTTAAACAGCACGACTTATTGGTC +GTTGCTGACCAAATGTCGACACATGGGCAAACCATCATTCTGGGGATCCAGTCCTACAAT +ACCAGCGTGTTGGGGGGAATTGTTGCTGGGTTATTAGTCGCCAGCATGTATAAAAAGATC +GTTAATTTACGCATTCCTGAATCGTTAGGTTTTTATAGCGGCCCACGTCTGGTGCCTATC +ATTACACTGATTGTGATGAGTGGATTTGGTCTGATCATTCCTTTTATCTGGCCGCCGTTT +TTCAATCTTTTCATGCTCATTGGCCACTGGATTTCAACTTCCGGTCCTGTTGGTTATTTC +TTCTATGCAGTTGCCGAACGCGTGACGATTCCTTTTGGCTTAAACCATCTGGTGACGTCA +GTTTTCCGCTTTACGCCAATCGGCGGTTCGGCTGTGATTGGCGGCGAAGAATATTACGGC +ACCCTGAACATGTTTATGGCATACGTCAAAGAGAATGCGGTCATTCCGCTGGATTTGGCG +GGGAAAATGGAGCAGGGCAAACTGATGATTCAGTATGGTCTGGCTGGTGCCGCGCTGGCG +ATGTATCGCACTGCTCATGCTCAAAACAGAAAGGCTATCAAAGCATTGCTTATTTCCGGG +GTGCTTACGGTGATTATTGGCGGCGTCAGCGAACCGATTGAGTTTCTGTTCTTATTTGTC +AGTCCACTGCTGTTTGTCTTCCATGCCTTTATGAATGGATTCGCTAACATGGTTCTGCCA +TATATGGGGGTGAAGATGGGATTTACTGGTGATCTGATTCAATTTATTAGCTTTGGCGTA +TTGCGTGGCACAAGAACAGGTTGGCCGATCGCGGTGTGTGTCGAAGTGGCCTATTTCTTC +ATTTATTACTTTGTGTTCCGTTGGACCATCCTTAAATTTAACCTGATGACCGTAGGCCGT +GAAGAGTCCAGTCCTGTTACGCTGAACGCTCACGAAGATACGGCTATAGCGGATATCCCA +ACTCCTGATAAATCAGAGCTGCAAGCGGCGGAGCAGATGGTTAAGGCACTTGGTGGTAAA +GAGAATATTAAGTCACTGGATAATTGCGTAACTCGTTTACGTTTAACAATCGCAGATATG +AGATTGATTGACGAAGTTGCAATAAAAAGAGCTGGCGGGATTGCGGTTGTAAAACTTGAT +CAAAATACCCTACAAGTCATTATCGGCACTAAAGTCATCGCCCTGCGTCGGGATATGGAT +AACTATATGGGGATATACTGA +>test.0417.00002.0002i_00024 825 licT | Transcription antiterminator LicT | NA | similar to AA sequence:UniProtKB:P39805 | COG:COG3711 +ATGATCATCGAAAAAGTCATGAACAATAATTGTGTACAGGCATCGATGAATGGACAGGAG +GTTATCATTTCTGGGCCTGGCGTCGGTTACAACAAAAAATATGGAATGTCGGTCCCTGAG +CATCCGGCTAACCGGATTTTTTATGTCAGAAATGAACAAAAAAACAAACTTTATAAATTG +ATTGAACATGTAGATATTGAGTATGTGTTTGTTGCCGAAAAAATAGTGCAATATGCGGAG 
+AAAAATCTCGAAAAAAATCTCAATCCATCGCTACTATTGATTCTTGCGGATCACATTTCG +AATGCAATATCCCGAGTCGTTTCAGGTATACAAATTAATAATGTTTTCCTTGATGAAATC +AAAGCGTTGTACAAAGCAGAGTATGCGATAAGTCGCGATGCATTAACTATCATTAATGAG +CAATTCAGCGTTCAACTTCCTGATGATGAGATTGGTTTTATAGCATTGCATATTTTAAAT +AATTATGAAAATTCAGTTGATTATGAATCAGTACGGATTATTGAGTTGTCGCAAATAATC +ACGGAGCTTATTGAAGTTGTTTATAACAGAAAGGTGGACAGAAGTTCATTTAACTATTCC +AGATTTATGATGCACCTTAAATATTTTTCAAGTCGCGTGTTATGCAATGAAAAAATAAAA +CAGAAAGATATTGGTGATATCTATGAACAGTTTCTTGAAAAGGACATCCTGTTACAGCGC +GCAATTCATGAAATTGAACGGTATCTGTATGCCACTTTTAAATATGAATTAATTTTAGAA +GAAAAATTATATCTCTCTATTCGTACCAAAGTATTAATGGACTAA +>test.0417.00002.0002i_00025 1254 amiC | N-acetylmuramoyl-L-alanine amidase AmiC | 3.5.1.28 | similar to AA sequence:UniProtKB:P63883 | COG:COG0860 +ATGTCAGGATCCAACACTGCAATCAGCCGTCGTCGTTTACTGCAAGGCGCGGGTGCCATG +TGGCTATTGAGCGTAAGTCAGGTCAGCCTGGCTGCGGTCAGCCAGGTCGTGGCGGTGCGC +GTCTGGCCTGCGTCCAGCTACACCCGCGTGACGGTAGAATCAAATCGTCAGCTGAAATAT +AAGCAGTTCGCGTTGAGTAATCCTGAACGCGTGGTGGTGGATATCGAAGATGTAAACCTG +AACTCGGTGCTCAAGGGGATGGCTGCGCAAATCCGCGCTGACGACCCGTTCATCAAGTCG +GCGCGCGTCGGGCAATTTGACCCGCAAACCGTACGTATGGTTTTTGAATTAAAGCAAAAC +GTAAAACCGCAGCTGTTTGCCCTTGCGCCGGTCGCCGGGTTTAAAGAGCGTCTGGTGATG +GACCTCTATCCGGCCAATGCACAGGATATGCAGGACCCGCTGCTGGCGCTGCTGGAGGAT +TACAACAAAGGCGACCTCGAAAAGCAGGTGCCGCCAGCACAAAGTGGTCCACAACCGGGT +AAAGCTGGGCGGGATCGTCCGATTGTCATTATGCTTGACCCTGGCCACGGTGGCGAAGAC +TCCGGTGCGGTGGGGAAATACAAAACGCGCGAAAAAGACGTGGTATTGCAAATAGCTCGC +CGTCTGCGCTCTCTGATCGAGAAAGAGGGCAATATGAAGGTGTACATGACGCGCAATGAA +GACATCTTCATTCCGTTGCAAGTGCGCGTAGCAAAAGCCCAGAAACAGCGCGCTGACTTG +TTTGTTTCTATCCATGCCGACGCCTTTACCAGTCGCCAGCCGAGCGGTTCCTCGGTGTTT +GCGCTCTCAACCAAAGGCGCAACCAGTACTGCGGCAAAATATCTGGCACAAACCCAGAAC +GCCTCGGACTTGATTGGTGGCGTAAGCAAAAGCGGTGACCGCTATGTCGACCACACCATG +TTCGATATGGTGCAGTCGCTGACCATTGCCGACAGCCTTAAGTTTGGTAAAGCGGTGCTG +AATAAGCTCGGTAAAATCAACAAGCTGCATAAAAATCAAGTTGAACAGGCCGGGTTTGCC +GTACTAAAGGCACCAGATATTCCCTCCATTCTGGTCGAAACGGCGTTTATCAGTAACGTT +GAGGAAGAGCGTAAACTGAAAACGGCGACTTTCCAGCAGGAAGTTGCGGAGTCTATTCTT 
+GCGGGAATTAAAGCGTATTTTGCCGATGGGGCGACGCTGGCGAGAAGGGGATAA +>test.0417.00002.0002b_00026 189 NA | hypothetical protein | NA | NA | NA +ATGCTCAATGGCTTCACCGCCGAGCATGATGACAAACGTTTTTCCCCGGTGGGTATTGAT +ATAGGGAACCGAATGGCGGAATCCCTCGACCAGCTCGGTTTTACGTTCCTTTACCACGGT +ACACCTCTTTGCATGATTATTCGAAATTATTGTATTTTTATTCTGTTTTTTCGCAGGGTG +CAAGTGTAA +>test.0417.00002.0003b_00027 720 argA | Amino-acid acetyltransferase | 2.3.1.1 | similar to AA sequence:UniProtKB:P0A6C5 | COG:COG0548 +ATGATTGGTTTTTGCTCTTCCCAGGGCGTCACTAATGACGACGGTGATATTGTCTCCGAA +CTTTTCCCTAACGAAGCGCAAGCACGGGTAGAAGCCCAGGAAGAGAAAGGCGATTACAAC +TCCGGTACGGTGCGCTTTTTGCGTGGCGCAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGC +TGTCATTTAATCAGTTATCAGGAAGATGGCGCGCTGTTGCAAGAGTTGTTCTCACGCGAC +GGTATCGGTACGCAGATTGTGATGGAAAGCGCCGAGCAGATTCGTCGCGCAACAATCAAC +GATATTGGCGGTATTCTGGAGTTGATTCGCCCGCTGGAGCAACAAGGTATTCTGGTACGC +CGTTCTCGCGAGCAGCTGGAGATGGAAATCGACAAATTCACCATTATTCAGCGCGATAAC +ACGACTATTGCCTGCGCCGCGCTCTATCCGTTCCCGGAAGAGAAGATTGGGGAAATGGCC +TGTGTGGCAGTTCACCCGGATTACCGCAGTTCATCACGGGGCGAGGTTCTGCTGGAACGC +ATTGCCGCTCAGGCGAAGCAGAGCGGCTTAAGCAAATTGTTTGTGCTGACCACGCGCAGT +ATTCACTGGTTCCAGGAACGTGGATTTACCCCAGTGGATATTGATTTACTGCCCGAGAGC +AAAAAGCAGTTGTACAACTACCAGCGTAAATCCAAAGTTTTGATGGCGGATTTAGGGTAA +>test.0417.00002.0003i_00028 1827 recD | RecBCD enzyme subunit RecD | 3.1.11.5 | similar to AA sequence:UniProtKB:P04993 | COG:COG0507 +ATGAAATTGCAAAAGCAATTACTGGAAGCTGTGGAGCACAAACAGCTACGCCCGCTGGAC +GTGCAGTTTGCCCTGACCGTGGCGGGAGATGAACATCCTGCCGTCACCCTCGCGGCGGCA +CTATTAAGTCATGATGCCGGAGAGGGACACGTTTGTTTGCCGCTTTCACGACTGGAAAAT +AACGAGGCATCGCATCCGCTGTTGGCGACCTGTGTCAGTGAAATCGGTGAGCTACAAAAT +TGGGAAGAATGCTTGCTGGCTTCACAAGCGGTCAGCCGGGGAGATGAACCAACGCCGATG +ATCCTCTGTGGCGATCGTCTTTATTTGAATCGCATGTGGTGTAACGAGCGCACAGTGGCA +CGCTTTTTCAACGAAGTGAATCATGCCATTGAGGTTGATGAAGCTCTACTGGCGCAAACC +CTGGACAAACTTTTTCCAGTAAGCGATGAAATTAACTGGCAAAAAGTTGCGGCGGCAGTG +GCGCTGACACGGCGGATCTCGGTGATTTCCGGTGGTCCTGGCACCGGTAAAACGACCACC +GTAGCGAAGTTACTGGCAGCGTTAATTCAAATGGCCGACGGCGAACGCTGCCGTATCCGT 
+CTGGCTGCACCAACGGGTAAAGCTGCCGCGCGCTTAACCGAATCTCTCGGCAAGGCTTTG +CGACAATTACCGCTGACCGATGAACAAAAGAAACGCATTCCGGAAGATGCCAGCACTTTG +CACCGATTGCTGGGTGCGCAGCCGGGTAGCCAGCGTTTACGTCATCATGCCGGTAACCCG +CTGCATCTTGATGTGCTGGTGGTAGATGAAGCGTCAATGATCGATCTTCCTATGATGTCG +AGACTGATCGACGCCTTGCCCGATCATGCGCGAGTGATCTTTCTCGGCGATCGTGATCAA +CTGGCCTCGGTTGAGGCTGGGGCTGTGCTGGGCGATATCTGCGCTTATGCCAACGCGGGC +TTTACCGCCGAGCGTGCCGGGCAGTTGAGCCGCCTGACGGGAAGCCACGTTCCGGCAGGA +ACTGGCACAGAAGCGGCATCTTTGCGCGACAGCCTCTGCCTGCTGCAAAAAAGCTATCGT +TTCGGCAGCGATTCTGGCATTGGTCAGTTAGCTGCGGCGATTAACCGTGGTGATAAAACG +GCAGTGAAAACCGTTTTTCAGCAGGATTTTACTGATATCGAAAAACGGCTTTTACAGAGT +GGCGAAGATTATATTGCGATGCTTGAGGAAGCTCTTGCGGGTTACGGGCGTTATCTGGAT +CTGCTGCAAGCGCGTGCCGAGCCGGATTTAATCATTCAGGCGTTCAATGAGTACCAGCTT +TTGTGCGCCCTGCGGGAAGGGCCGTTTGGCGTGGCTGGACTGAATGAGCGAATTGAGCAG +TTTATGCAACAGAAGCGCAAAATTCATCGTCATCCGCACTCTCGTTGGTACGAAGGCCGA +CCAGTGATGATTGCCCGTAATGACAGCGCGCTTGGGTTGTTTAATGGCGATATTGGTATT +GCGCTGGATCGCGGGCAGGGGACGCGCGTCTGGTTTGCGATGCCGGACGGCAATATTAAG +TCTGTGCAACCGAGTCGCCTGCCAGAGCACGAAACGACGTGGGCGATGACGGTACATAAA +TCGCAGGGATCGGAGTTCGACCATGCGGCGTTGATTTTACCGAGTCAACGCACGCCGGTA +GTAACGCGAGAGCTGGTTTACACCGCGGTGACCCGCGCGCGTCGCCGTCTGTCGCTGTAT +GCCGATGAGCGCATATTAAGTGCGGCAATCGCCACTCGTACTGAGCGGCGCAGTGGTCTG +GCGGCGTTGTTTAGTTCACGGGGATAA +>test.0417.00002.0003i_00029 3543 recB | RecBCD enzyme subunit RecB | 3.1.11.5 | similar to AA sequence:UniProtKB:P08394 | COG:COG1074 +ATGAGTGATGTCGCCGAGACACTAGATCCTTTGCGCTTGCCCTTACAGGGCGAGCGCCTG +ATTGAAGCCTCTGCCGGCACAGGCAAAACCTTTACGATTGCGGCGCTCTATTTGCGCCTG +TTACTTGGACTAGGCGGTTCTGCCGCCTTTCCCCGCCCGCTGACCGTTGAAGAACTGCTG +GTGGTGACCTTTACCGAGGCTGCTACGGCAGAATTGCGTGGTCGTATCCGTAGCAATATC +CACGAGTTGCGCATCGCCTGTCTGCGTGAAACCACCGACAATCCACTGTACAAACGCCTG +CTGGAAGAGATCGACGATAAAGCGCAAGCCGCGCAGTGGTTGTTGTTAGCCGAGCGGCAG +ATGGATGAAGCGGCAGTCTTTACTATTCACGGCTTTTGCCAGCGCATGCTCAACCTGAAT +GCCTTTGAATCCGGCATGCTGTTTGAGCAGCAGCTGATTGAAGATGAGTCTCTGCTACGC +TACCAGGCCTGCGCCGATTTCTGGCGTCGCCACTGCTACCCGCTGCCGCGTGAAATTGCC 
+CAGGTCGTCTTTGAAACCTGGAAAGGGCCGCAGGCGTTGCTGCGCGATATTAATCGTTAT +CTGCAAGGCGAAGCGCCGGTTATCAAAGCACCGCCCCCCGATGATGAAACGCTGGCTTCC +CGCCACGCGCAAATTGTGGCGCGTATTGATGCCGTAAAACAGCAGTGGCGCGACGCAGTG +GGTGAACTGGATGCGCTGATCGAATCTTCTGGTATTGATCGACGCAAGTTTAACCGTAGC +AATCAGGCTAAATGGATCGAGAAGATCAGCGCCTGGGCAGAAGAAGAGACCAACAGCTAT +CAGTTGCCGGAGTCGCTGGAAAAATTCTCTCAGCGTTTCTTAGAAGATCGCACGAAAGCC +GGGGGGGAAACCCCGCGACATCCACTGTTTGAGGCGATCGAACAACTGCTTGCAGAACCA +TTGTCGATCCGCGATCTGGTGATCACTCGCGCATTGGCTGAGATCCGCGAAACAGTAGCG +CGTGAAAAACGCCGCCGTGGCGAATTGGGTTTTGATGACATGTTAAGTCGGCTCGATTCC +GCGCTGCGTAGTGAAAGCGGCGAGGTATTGGCAGCGGCGATCCGTACGCGATTCCCGGTG +GCAATGATCGATGAATTTCAGGATACCGACCCCCAACAGTATCGAATTTTTCGCCGTATC +TGGCACCATCAGCCGGAAACCGCATTGTTGCTGATTGGCGACCCGAAACAGGCCATATAT +GCATTCCGGGGTGCGGATATCTTCACTTATATGAAGGCGCGTAGCGAAGTTCATGCTCAC +TACACCTTAGATACCAACTGGCGTTCCGCACCGGGAATGGTGAACAGCGTTAACAAACTT +TTCAGCCAGACTGATGACGCGTTCATGTTTCGTGAAATACCGTTTATTCCTGTGAAATCT +GCCGGCAAAAATCAGGCGTTACGTTTTGTATTTAAAGGTGAAACGCAGCCTGCGATGAAA +ATGTGGCTGATGGAAGGCGAAAGCTGCGGCGTTGGCGACTATCAAAGTACCATGGCGCAG +GTATGTGCTGCGCAAATCCGCGACTGGCTACAAGCCGGGCAACGCGGCGAAGCGTTGCTG +ATGAACGGCGACGATGCGCGTCCGGTGCGTGCTTCGGACATCAGTGTGCTGGTGCGCAGC +CGCCAGGAGGCCGCTCAGGTGCGCGATGCCTTAACGCTGCTGGAAATCCCTTCCGTTTAC +CTTTCGAACCGCGACAGTGTTTTTGAAACTCTGGAAGCACAGGAGATGCTTTGGCTGTTG +CAGGCGGTGATGACGCCCGAACGTGAGAACACCCTGCGCAGTGCGCTGGCAACGTCAATG +ATGGGGCTGAATGCGCTGGATATTGAAACGCTGAATAATGACGAACATGCGTGGGATGCG +GTCGTCGAAGAGTTCGATGGTTATCGGCAAATCTGGCGCAAACGTGGCGTTATGCCGATG +CTGCGGGCGCTGATGTCGGCGCGTAACATTGCAGAAAACTTGCTGGCAACGGCAGGCGGT +GAGCGGCGTCTTACCGATATCTTGCATATCAGCGAACTGCTACAAGAAGCCGGAACGCAG +CTGGAAAGTGAACATGCGCTGGTACGCTGGTTATCGCAACATATCCTCGAGCCAGACAGT +AATGCCTCCAGCCAACAAATGCGCCTCGAAAGTGATAAACATCTGGTGCAGATTGTCACG +ATACACAAATCAAAAGGGCTGGAATATCCGCTGGTCTGGTTGCCATTTATTACCAATTTC +CGCGTCCAGGATCAGGCGTTTTATCACGATCGCCACTCGTTTGAGGCCGTTCTGGATCTT +AATGCTGCGCCAGAAAGCGTCGACCTCGCGGAGGCCGAACGTCTGGCGGAAGATCTGCGT +TTACTTTACGTGGCGCTGACGCGTTCGGTTTGGCATTGCAGTCTCGGCGTTGCACCGCTG 
+GTGCGCCGTCGTGGCGATAAAAAAGGTGATACCGACGTCCACCAAAGTGCGCTCGGGCGT +TTGCTGCAAAAAGGAGAACCGCAAGATGCGGCAGGGCTTCGTACCTGCATTGAAGCGTTG +TGCGATGATGATATTGCCTGGCAAACGGCACAAATTGGTGATAACCAGCCCTGGCAGGTT +AATGATGCATTAACTGCAGAACTGAATGCGAGGACGCTACAACGATTGCCCGGCGATAAC +TGGCGTGTCACCAGCTACTCCGGTTTGCAGCAGCGTGGTCACGGTATCGCTCAGGATCTG +ATGCCACGGCTGGATGTTGATGCCGCAGGCGTGGTCAGCGTCGTTGAAGAACCGACGTTA +ACACCGCATCAGTTCCCGCGCGGTGCGTCACCGGGGACATTCTTGCACAGTTTGTTTGAA +GACCTCGATTTTACCCAGCCGGTTGACCCGAACTGGGTACAGGAAAAACTGGAGCTCGGT +GGCTTTGAACCGCAGTGGGAACCGGTGTTGACTGAGTGGATCACGGCTGTCCTCCAGGCA +CCTCTCAATGAAACGGGTGTTAGCCTGAATCAGCTTTCCGATCGCGATAAACAGGTGGAG +ATGGAGTTTTACCTGCCAATTAGCGAACCGCTCATCGCCAGCCAGCTTGATGCACTAATT +CGCCAGTTTGACCCGCTATCCGCTGGCTGCCCGCCGCTGGAGTTCATGCAGGTACGTGGC +ATGTTAAAAGGCTTTATCGATCTGGTGTTCCGCCACGAAGGGCGTTATTACCTGCTCGAC +TATAAATCCAACTGGTTGGGTGAAGACAGTTCGGCTTACACCCAACAGGCTATGGCAGCG +GCAATGCAGGCACACCGCTATGATCTGCAATATCAGCTTTATACCCTGGCGCTGCACCGT +TATCTGCGCCATCGTATTGCTGATTACGACTATGAGCGCCACTTTGGCGGCGTTATTTAT +CTGTTCCTGCGTGGCGTTGATAAAGAACATCCGCAACAAGGGATCTACGCGACCCGACCC +AACGCCGGGTTGATTGACCTGATGGATGAGATGTTTGCCGGTATGACCCTGGAGGAGGCG +TAA +>test.0417.00002.0003i_00030 2889 ptrA | Protease 3 | 3.4.24.55 | similar to AA sequence:UniProtKB:P05458 | COG:COG1025 +ATGCCCCGCAGCATCTGGTTCAAAGCATTATTGTTGTTTGTTGCCCTCTGGGCACCCTTA +AGTCAGGCAGAAACGGGATGGCAGCCGATTCAGGAAACCATCCGTAAAAGTGATAAAGAT +AACCGCCAGTATCAGGCTATACGTCTGGATAACGGTATGGTGGTCTTACTGGTTTCTGAT +CCGCAGGCAGTTAAATCGCTCTCGGCGCTGGTGGTGCCCGTTGGGTCGCTGGAAGATCCT +GAGGCGTACCAGGGGCTGGCACATTACCTTGAACATATGAGTCTGATGGGGTCGAAAAAG +TATCCGCAGGCTGACAGTCTGGCCGAATATCTCAAAATGCACGGCGGCAGTCACAATGCC +AGCACGGCACCGTATCGCACGGCTTTCTATCTGGAAGTTGAGAACGACGCCTTGCCCGGT +GCGGTAGACCGCCTGGCCGATGCTATTGCAGAACCCTTGCTCGACAAGAAATACGCCGAA +CGTGAACGTAATGCAGTGAATGCCGAATTAACCATGGCGCGTACGCGTGACGGGATGCGC +ATGGCACAGGTCAGCGCAGAAACCATTAACCCGGCACACCCCGGTTCAAAGTTTTCTGGT +GGTAACCTCGAAACTTTAAGCGACAAACCAGGTAATCCGGTACAGCAGGCGCTGAAAGAT +TTCCACGAGAAGTACTATTCCGCCAATCTGATGAAGGCGGTTATTTACAGCAATAAACCG 
+TTGCCGGAGTTGGCGAAAATGGCGGCGGACACCTTTGGTCGCGTGCCGAACAAAGAGAGC +AAAAAACCGGAAATCACCGTGCCGGTAGTCACCGACGCGCAAAAGGGCATTATCATTCAT +TACGTCCCGGCGTTGCCGCGTAAAGTTCTGCGCGTTGAGTTTCGCATCGATAACAATTCA +GCGAAGTTCCGTAGTAAAACGGATGAATTGATTACCTATCTGATTGGTAATCGCAGCCCT +GGTACACTTTCTGACTGGCTGCAAAAGCAGGGATTAGTTGAGGGCATTAGCGCCAATTCC +GATCCTATCGTCAACGGCAACAGCGGCGTATTAGCGATCTCTGCGTCTTTAACCGATAAA +GGTCTGGCGAATCGCGATCAGGTTGTGGCGGCCATTTTTAGCTACCTCAATCTGTTACGT +GAAAAAGGGATCGATAAACAATACTTCGATGAACTGGCGAATGTGCTGGATATCGACTTC +CGTTATCCGTCAATCACCCGTGATATGGATTACGTCGAATGGCTGGCTGATACCATGATT +CGCGTTCCTGTTGAGCATACACTGGATGCAGTCAATATTGCCGATCGGTACGATGCTAAA +GCAGTAAAAGAACGTCTGGCGATGATGACGCCGCAGAATGCGCGTATCTGGTATATCAGC +CCGAAAGAGCCGCACAACAAAACGGCTTACTTTGTCGATGCGCCGTATCAGGTCGATAAA +ATTAGCGCACAAACTTTCGCGGACTGGCAGAAAAAAGCCGCCAATATTGCGCTCTCCTTA +CCGGAGCTTAACCCCTATATTCCTGACGATTTCTCGCTGATTAAGTCAGAGAAGAAATAC +GACCATCCAGAGTTGATTGTTGATGAGTCGAATCTGCGCGTGGTGTATGCGCCAAGCCGT +TATTTTGCCAGTGAGCCCAAAGCTGATGTCAGCCTGATTTTGCGTAATCCGAAAGCCATG +GACAGCGCCCGCAATCAGGTGATGTTTGCGCTCAATGATTATCTCGCAGGGCTGGCGCTT +GATCAGTTAAGCAACCAGGCGTCGGTTGGTGGCATAAGTTTTTCCACCAATGCTAACAAC +GGCCTTATGGTTAATGCCAATGGTTACACTCAGCGCCTGCCGCAGCTGTTCCAGGCTCTG +CTGGAGGGCTACTTTAGCTATACCGCTACGGAAGATCAGCTTGAGCAGGCGAAGTCCTGG +TATAACCAGATGATGGATTCCGCAGAAAAGGGCAAAGCGTTTGAGCAGGCGATTATGCCC +GCGCAGATGCTCTCGCAAGTGCCGTACTTCTCGCGAGATGAACGGCGCAAAATTTTGCCC +TCCATTACGTTGAAAGAGGTGCTGGCCTATCGCGACGCCTTAAAATCAGGGGCTAGACCA +GAGTTTATGGTTATCGGCAACATGACTGAAGCCCAGGCAACAACGCTGGCACGCCATGTG +CAAAAACAGTTGGGCGCTGATGGTTCAGAGTGGTGTCGTAACAAAGATGTCGTGGTCGAT +AAAAAACAATCCGTCATCTTTGAAAAAGCTGGTAACAGCACCGACTCCGCACTGGCAGCG +ATATTTGTACCGACTGGCTACGATGAATACACCAGCTCAGCCTATAGCTCTCTGTTGGGG +CAGATCGTACAGCCGTGGTTCTACAATCAGTTGCGTACCGAAGAACAGTTGGGCTATGCC +GTGTTTGCGTTTCCAATGAGCGTGGGGCGTCAGTGGGGCATGGGCTTCCTTTTGCAAAGC +AATGATAAACAGCCTTCATTCTTGTGGGAGCGTTACAAGGCGTTTTTCCCAACCGCAGAG +GCAAAATTGCGGGCGATGAAGCCAGAGGAGTTTGCGCAAATCCAGCAGGCGGTAATTACT +CAGATGCTGCAGGCACCGCAAACGCTCGGCGAAGAAGCATCGAAGTTAAGTAAAGATTTC 
+GATCGCGGCAATATGCGCTTCGATTCGCGTGATAAAATCGTGGCCCAGATAAAACTGCTG +ACGCCGCAAAAACTTGCTGATTTCTTCCATCAGGCGGTGGTCGAGCCGCAAGGTATGGCT +ATTCTGTCGCAGATTTCCGGCAGCCAGAACGGGAAAGCCGAATATGTGCATCCTGAAGGC +TGGAAAGTGTGGGAGAACGTCAGCGCGTTGCAGCAAACAATGCCCCTGATGAGTGAAAAG +AATGAGTGA +>test.0417.00002.0003i_00031 3369 recC | RecBCD enzyme subunit RecC | 3.1.11.5 | similar to AA sequence:UniProtKB:P07648 | COG:COG1330 +ATGTTAAGGGTCTACCATTCCAATCGTCTGGACGTGCTGGAAGCGTTGATGGAGTTTATT +GTCGAACGCGAACGGCTGGACGATCCTTTCGAACCAGAGATGATTCTGGTGCAAAGTACC +GGTATGGCACAGTGGCTGCAAATGACCCTGTCGCAAAAGTTTGGTATTGCGGCAAACATT +GATTTTCCGCTGCCAGCGAGCTTTATCTGGGATATGTTCGTCCGGGTGTTACCGGAGATC +CCCAAAGAGAGCGCCTTTAACAAACAGAGCATGAGCTGGAAACTGATGACTCTGCTGCCG +CAACTGTTGGAGCGCGAAGACTTTACCCTGTTGCGGCATTATCTGACTGACGATAGTGAC +AAGCGAAAACTGTTCCAGCTTTCTTCAAAAGCGGCGGACCTGTTTGACCAGTATCTGGTC +TATCGTCCGGACTGGCTGGCACAGTGGGAAACAGGACATCTGGTAGAAGGGTTGGGAGAA +GCACAGGCCTGGCAAGCGCCGTTGTGGAAGGCGTTGGTGGAATATACCGACGAACTTGGG +CAACCGCGCTGGCACCGCGCCAATCTCTATCAGCGCTTTATCGAAACGCTGGAGTCCGCG +ACGACCTGCCCGCCGGGGTTACCTTCGCGCGTCTTTATATGCGGTATTTCCGCGTTACCG +CCTGTTTATCTCCAGGCGCTACAGGCGCTGGGTAAACATATTGAAATCCATCTCCTGTTT +ACCAACCCCTGCCGTTATTACTGGGGCGACATTAAAGATCCAGCTTATCTGGCGAAACTA +CTGACTCGCCAGCGCCGACACAGTTTTGAAGATCGCGAATTACCGCTATTTCGCGACAGC +GAAAATGCCGGGCAGCTCTTTAACAGCGATGGTGAACAGGATGTCGGCAACCCGCTGCTG +GCTTCATGGGGCAAGCTTGGGCGCGACTACATTTATCTCCTTTCTGACCTGGAGAGCAGC +CAGGAGCTGGACGCTTTTGTCGATGTGACGCCAGATAACCTGCTGCATAATATTCAGTCT +GACATTCTGGAACTGGAAAACCGCGCCGTTGCTGGTGTGAACATCGAAGAGTTTTCCCGT +AGCGATAACAAACGCCCGCTTGATCCACTGGATAGCAGTATCACCTTCCACGTTTGCCAT +AGCCCGCAGCGTGAAGTTGAAGTTTTACACGATCGCCTGCTGGCGATGCTGGAGGAAGAC +CCGACACTTACTCCGCGCGACATCATCGTGATGGTGGCTGATATCGACAGCTACAGTCCG +TTTATTCAGGCTGTGTTTGGTAGTGCACCTGCGGATCGTTACCTGCCTTACGCCATTTCC +GACCGTCGGGCGCGGCAGTCGCATCCTGTACTTGAAGCGTTTATCAGCCTGTTATCGCTG +CCAGACAGCCGCTTTGTGTCGGAAGACGTGCTGGCATTACTGGATGTGCCGGTGCTGGCA +GCGCGGTTTGACATCACCGAAGAAGGGCTGCGTTATTTACGTCAGTGGGTCAACGAATCC 
+GGCATTCGTTGGGGGATAGATGACGACAACGTTCGCGAGCTGGAACTTCCCGCTACCGGT +CAACACACCTGGCGGTTTGGCCTGACGCGCATGTTGCTGGGCTACGCGATGGAGAGCGCG +CAGGGCGAGTGGCAATCGGTTCTACCTTATGATGAATCGAGCGGCTTAATTGCAGAACTG +GTGGGGCATCTGGCTTCACTGCTAATGCAGCTAAATATCTGGCGTCGCGGGCTGGCGCAG +GAGCGTCCGCTGGAAGAGTGGTTGCCGGTTTGTCGCGATATGCTCAACGCCTTTTTCCTG +CCGGATGCGGAAACCGAAGCGGCGATGACGCTGATCGAACAACAATGGCAGGCGATTATC +TCCGAAGGTTTAGGCGCGCAGTATGGCGACGCGGTGCCGCTGTCACTATTGCGTGATGAA +CTGGCACTGCGCCTGGATCAAGAACGTATCAGCCAGCGTTTTCTCGCCGGACCGGTTAAC +ATTTGTACTCTGATGCCAATGCGTTCAATTCCGTTCAAAGTGGTTTGCCTGCTGGGAATG +AACGACGGCGTTTATCCACGTCAGCTTGCGCCATTGGGCTTTGATCTGATGAGCCAGAAA +CCGAAGCGTGGCGACCGTAGCCGTCGCGATGACGACCGCTATCTGTTCCTGGAAGCGTTA +ATTTCCGCGCAGCAAAAACTCTATATCAGCTATATTGGGCGTTCCATTCAGGATAACAGT +GAACGTTTCCCGTCGGTACTGGTGCAGGAACTGATCGACTACATCGGGCAAAGCCATTAT +CTACCGGGCGATGAAGCGCTTAACTGTGATGAAAGCGAGGCAAGGGTAAAAGCGCATCTT +ACTTGCCACCATACCCGGATGCCGTTTGACCCGCAAAACTACCAGCCCGGTAACTTACAA +AGCTATGCGCGCGAGTGGCTACCTGCGGCCAGCCAGGCTGGTAAAGCACATTCTGAATTT +GTTCAGCCGCTGCCATTTACCTTACCGGAAACCGTGCCGCTGGAAACGCTACAACGATTC +TGGGCACATCCGGTGCGGGCGTTTTTCCAGATGCGTTTGCAGGTGAACTTCCGTACCGAA +GACAGCGAAATTCCCGACACTGAACCTTTTATTCTTGAAGGGCTTAGTCGTTATCAAATC +AACCAGCAGTTATTAAATGTACTGGTTGAGCAGGATGATGCCGAACGCTTGTTCCGCCGA +TTCCGGGCGGCAGGTGATTTGCCGTATGGTGCCTTTGGTGAAATTTTCTGGGAAACGCAG +TGTCAGGAGATGCAGCAGCTTGCCGACAGAGTCATTGCCTGTCGCCAGCCAGGGCAGAGT +ATGGAGATTGATCTCGCCTGCAACGGTGTGCAGATAACTGGCTGGTTGCCGCAGGTGCAG +CCGGATGGCCTGTTGCGCTGGTGTCCCTCTTTATTAAGTGTGGCGCAGGGAATGCAACTT +TGGCTGGAACACCTTGTCTACTGTGCCAGCGGTGGTAATGGTGAAAGTCGCCTTTTTCTA +CGCAAAGACGGCGAGTGGCGTTTTCCGCCGCTTGCAGCCGAACAGGCTTTGCATTACCTC +TCACAACTGATTGAGGGGTATCGTGAAGGAATGTCCGCGCCATTGCTGGTGTTACCTGAA +AGTGGCGGCGCGTGGCTAAAAACCTGTTATGACGCGCAAAACGATGCCATGCTGGATGAC +GATTCCACGTTGCAAAAAGCCCGTACGAAATTCCTTCAGGCTTACGAAGGCAACATGATG +GTGCGTGGCGAAGGTGATGATATCTGGTATCAACGGCTCTGGCGGCAATTAACACCAGAG +ACAATGGAGGCTATCGTTGAACAGTCGCAACGTTTCCTGTTACCGCTGTTTCGCTTTAAT +CAGTCATGA +>test.0417.00002.0003i_00032 324 NA | hypothetical protein | NA | 
NA | NA +ATGTCAGCTTCCCTGAGGAATCAACAAGGCTTTAGTCTGCCGGAGGTAATGTTGGCGATG +GTGTTGATGGTGATGATTGTCACTGCGTTATCGGGTTTCCAGCGAACATTAATGAACAGT +CTTGCCAGCAGAAACCAGTACCAACAGCTCTGGCGGCATGGCTGGCAGCAAACGCAACTG +CGCGCGATTTCGCCACCTGCTAACTGGCAGGTCAACCGAATGCAGACATCGCAGGCGGGA +TGTGTCAGCATCAGCGTTACGCTAGTTTCACCCGGGGGCAGAGAAGGCGAGATGACCCGC +CTGCATTGCCCGAATCGTCAGTAG +>test.0417.00002.0003i_00033 408 NA | hypothetical protein | NA | NA | NA +GTGAACCGCGAAAAGGGAGTTTCGTCACTGGCTCTGGTCCTGATGCTGCTGATTTTGGGT +AGCTTGCTATTGCAAGGAATGAGTCAGCAGGATCGCAGTTTTGCTTCTCGCGTGAGCATG +GAAAGTCAGTCATTGAGCCGCCAGGCCATCGTTCAGTCGGCGCTGGAGTGGGGAAAAATG +CACTCCTGGCAGACGCAGCCCGCAGTTCAGTGCTTACTGTATGCTGCCACCGGTGCCCGG +GTTTGTCTGCGTTTACTGGCAGATAATGAAGCCTTATTGATTGCTGGTTATGAAGGCGTT +TCGTTGTGGCGAACAGGCGAAGTCATCGATGGAAACATTGTTTTTTCGCCACGCGGCTGG +AGCGATTTTTGTCCGCTGAAAGAGAGGGCGTTATGTCAGCTTCCCTGA +>test.0417.00002.0003i_00034 564 NA | hypothetical protein | NA | NA | NA +ATGCCTGTAAAAGAGCAAGGTTTTTCTCTGCTGGAAGTGTTGATTGCTATGGCGATCAGT +AGCGTATTGTTGCTGGGGGCTGCACGCTTTCTGCCTGCGTTACAGCGTGAAAGTTTAACG +AGCACCCGTAAACTGGCGCTGGAAGATGAAATCTGGCTGCGGGTATTTACCGTCGCGAAG +CATCTCCAGAGGGCGGGTTATTGCCATGGCAGCTGTACGGGCGAAGGGCTGGAAATTGTC +GGACAGGGTGACTGTGTCATTGTGCAGTGGGATGCGAACAGTAACGGTATCTGGGATCGC +GAACCGGTAAAAGAGTCCGACCAGATTGGATTTCGTCTGAAGGAGCATGTGCTGGAAACG +CTACGCGGTGCGACATCCTGTGAAGGTAAGGGCTGGGATAAAGTCACTAATCCGGATGCC +ATCATTATCGACACTTTTCAGGTCGTACGTCAGGATGTCAGCGGCTTCTCGCCGGTGTTG +ACGGTTAATATACACGCTGCCAGCAAGGCTGATCCGCAAACCGTGGTGGATGCCAGCTAT +AGCGTGACAGGAGCCAACCTGTGA +>test.0417.00002.0003i_00035 504 NA | hypothetical protein | NA | NA | NA +ATGAAAACACAACGTGGTTATACGCTGATTGAAACGCTGGTCGCGATGCTTATTCTGGTC +ATGCTAAGCGCAAGTGGGCTCTATGGCTGGCAATACTGGCAGCAGTCGCAACGGCTTTGG +CAAACCGCCAGCCAGGCGCGGGACTATTTGCTCTATTTACGTGAAGATGCCAACTGGCAT +AACCGCGACCACAGTATCAGTCTTATCAGGGAGGGGACGTTATGGTGCCTTGTGAGTTCC +GTTGCTGGGGCGAATACCTGTCATGGCAGTTCCGTTGCTGGGGCGAATACCTGTCATGGC +AGTTCACCATTGGTCTTTGTGCCGCGCTGGCCCGAAGTCGAAATGAGCGACCTGACACCT 
+TCGCTTGCTTTCTTTGGCCTGCGCAATACCGCATGGGCCGGGCATATTCGCTTCAAAAAC +TCAACGGGCGAGTGGTGGCTAGTGGTTTCGCCGTGGGGAAGACTCCGGCTTTGTCAGCAA +GGAGAAACAGAAGGATGCCTGTAA +>test.0417.00002.0003i_00036 795 thyA | Thymidylate synthase | 2.1.1.45 | similar to AA sequence:UniProtKB:P48464 | COG:COG0207 +ATGAAACAGTATTTAGAACTGATGCAAAAAGTGCTCGACGAAGGCACACAGAAAAACGAC +CGTACCGGAACCGGAACGCTTTCCATTTTTGGTCATCAGATGCGTTTTAACCTGCAGGAT +GGATTCCCGCTGGTGACAACTAAACGTTGCCACCTGCGTTCCATCATCCACGAACTGCTG +TGGTTCCTGCAGGGCGACACTAACATTGCTTATCTACACGAAAACAATGTCACCATCTGG +GACGAATGGGCCGATGAAAACGGCGACCTCGGGCCAGTGTATGGTAAACAGTGGCGCGCC +TGGCCAACGCCGGATGGTCGTCATATTGACCAGATCACTACGGTACTGAACCAGCTGAAA +AACGACCCGGATTCCCGCCGCATTATTGTTTCAGCGTGGAACGTAGGCGAACTGGATAAA +ATGGCGCTGGCACCGTGCCATGCATTCTTCCAGTTCTATGTGGCAGACGGCAAACTCTCT +TGCCAGCTTTATCAGCGCTCCTGTGACGTCTTCCTCGGCCTGCCGTTCAACATTGCCAGC +TACGCGTTACTGGTGCATATGATGGCGCAGCAGTGCGATCTGGAAGTGGGTGATTTTGTC +TGGACCGGTGGCGACACGCATCTCTACAGCAACCATATGGATCAAACTCATCTGCAATTA +AGCCGCGAACCGCGTCCGCTGCCGAAGTTGATTATCAAACGTAAACCCGAATCCATCTTC +GACTACCGTTTCGAAGACTTTGAGATTGAAGGATACGATCCACATCCGGGCATTAAAGCG +CCGGTGGCTATCTAA +>test.0417.00002.0003i_00037 876 lgt | Phosphatidylglycerol--prolipoprotein diacylglyceryl transferase | 2.5.1.145 | similar to AA sequence:UniProtKB:P60955 | COG:COG0682 +ATGACCAGTAGCTATCTGCATTTTCCGGAGTTTGATCCGGTCATTTTCTCAATAGGACCC +GTGGCGCTTCACTGGTACGGCCTGATGTATCTGGTGGGTTTCATTTTTGCAATGTGGCTG +GCAACACGACGGGCGAATCGTCCGGGCAGTGGCTGGACCAAAAATGAAGTTGAAAACTTA +CTCTATGCGGGCTTCCTCGGCGTCTTCCTCGGTGGACGTATTGGTTATGTTCTGTTCTAC +AATTTCCCGCAGTTTATGGCCGATCCGCTGTATCTTTTCCGTGTATGGGACGGCGGCATG +TCCTTCCACGGCGGCCTGATTGGCGTTATCGTGGTGATGATTATCTTCGCCCGCCGTACT +AAACGTTCCTTCTTCCAGGTCTCTGATTTTATTGCCCCACTCATTCCGTTTGGTCTTGGT +GCCGGGCGTCTGGGCAACTTTATTAACGGTGAATTGTGGGGCCGCGTTGACCCGAACTTC +CCGTTTGCCATGCTGTTCCCTGGCTCCCGTACAGAAGATATTTTGCTGCTGCAAACCAAC +CCGCAGTGGCAATCCATTTTCGACACTTACGGTGTGCTGCCGCGCCACCCATCACAGCTT +TACGAGCTGCTGCTGGAAGGTGTGGTGCTGTTTATTATCCTCAACCTGTATATTCGTAAA 
+CCGCGCCCAATGGGAGCTGTCTCAGGCTTGTTCCTGATTGGTTACGGCGCGTTTCGCATC +ATTGTTGAGTTTTTCCGCCAGCCCGACGCGCAGTTTACTGGTGCCTGGGTGCAGTACATC +AGCATGGGGCAAATTCTTTCCATCCCGATGATTGTCGCGGGTGTGATCATGATGGTCTGG +GCATATCGTCGCAGCCCACAGCAACACGTTTCCTGA +>test.0417.00002.0003i_00038 2247 ptsP | Phosphoenolpyruvate-dependent phosphotransferase system | 2.7.3.9 | similar to AA sequence:UniProtKB:P37177 | COG:COG3605 +ATGCTCACTCGCCTGCGCGAAATAGTCGAAAAGGTAGCCAGCGCACCACGCCTGAATGAG +GCGTTAAATATTCTGGTTACCGACATCTGTCTTGCGATGGATACCGAGGTCTGTTCGGTC +TACCTGGCCGATCATGATCGACGTTGTTACTACCTGATGGCGACCCGGGGACTGAAAAAA +CCACGCGGTCGCACTGTAACGCTCGCGTTTGATGAAGGGATCGTCGGCCTGGTTGGCAGG +CTGGCGGAACCGATAAACCTTGCAGATGCGCAAAAGCACCCCAGCTTCAAATACATCCCC +TCCGTAAAAGAAGAACGTTTCCGCGCGTTTTTAGGCGTACCAATTATTCAACGTCGCCAG +TTGCTTGGTGTACTGGTGGTACAGCAACGAGAGTTGCGCCAGTATGACGAAAGTGAAGAA +TCCTTCCTGGTGACGCTTGCCACCCAGATGGCAGCTATTCTTTCTCAGTCGCAGTTGACT +GCCTTGTTTGGGCAATATCGCCAGACGCGAATCCGTGCATTACCGGCAGCACCTGGTGTG +GCGATTGCCGAAGGCTGGCAGGATGCCACGTTACCTTTAATGGAACAGGTGTATCAGGCA +TCAACGCTGGATCCGGCTCTGGAACGCGAACGACTGACCGGGGCGTTGGAAGAGGCGGCT +AACGAGTTTCGCCGCTATAGCAAACGCTTTGCTGCCGGTGCACAAAAAGAAACGGCGGCT +ATTTTCGATCTTTACTCACACCTGCTTTCGGATACCCGGCTGCGTCGCGAATTGTTTGCC +GAGGTTGATAAAGGCTCGGTGGCAGAGTGGGCGGTAAAAACGGTCATTGAAAAATTTGCC +GAACAGTTTGCCGCGCTAAGCGATAACTATCTCAAAGAGCGGGCTGGCGATTTACGTGCG +CTGGGTCAGCGATTGCTGTTTCATCTTGATGACGCTAATCAAGGGCCGAACGCCTGGCCG +GAACGTTTCATTCTGGTGGCAGATGAACTGTCAGCGACAACGCTTGCTGAGCTGCCCCAG +GATCGCTTAGTCGGTGTTGTCGTGCGCGATGGCGCTGCCAACTCCCATGCTGCGATCATG +GTACGTGCGCTGGGGATACCTACCGTGATGGGCGCGGATATTCAGCCTTCGGTACTGCAT +CGTCGGACGCTGATCGTCGATGGTTATCGCGGTGAATTGCTGGTCGATCCGGAACCGGTA +CTGCTGCAAGAATATCAGCGGCTAATTAGTGAAGAGATCGAGCTTAGCCGTCTGGCGGAA +GATGACGTCAATTTACCCGCCCAGTTAAAAAGCGGCGAACGCATTAAAGTCATGCTCAAT +GCCGGTTTAAGCCCGGAACATGAAGAAAAACTGGGCAGCCGTATTGATGGCATAGGACTT +TATCGCACTGAAATCCCATTCATGCTGCAAAGTGGTTTTCCGTCGGAAGAAGAACAGGTG +GCGCAGTATCAGGGGATGCTGCAAATGTTTAATGATAAACCCGTCACCTTGCGTACGCTG +GATGTCGGAGCAGATAAGCAGCTGCCTTACATGCCGATCAGCGAAGAGAATCCATGCCTG 
+GGTTGGCGTGGGATTCGCATTACGCTCGATCAGCCGGAGATCTTCTTGATCCAGGTGCGG +GCGATGCTGCGTGCTAATGCCGCTACGGGCAACCTGAATATTCTGTTGCCGATGGTCACA +AGCCTCGATGAAGTTGACGAAGCACGCCGCCTGATTGAACGTGCCGGACGTGAAGTCGAG +GAGATGATCGGTTACGAAATTCCCAAACCACGTATCGGCATCATGCTGGAAGTGCCGTCA +ATGGTATTTATGCTGCCGCATCTGGCAAAGCGGGTCGATTTCATCTCTGTTGGCACCAAC +GATCTGACTCAATACATCCTGGCCGTTGATCGCAACAATACCCGGGTGGCGAACATTTAT +GACAGTCTTCATCCTGCAATGTTACGAGCTCTGGCGATGATCGCCCGGGAAGCGGAAATA +CATGGAATCGATCTCCGTTTGTGCGGTGAAATGGCGGGCGATCCGATGTGCGTGGCAATC +CTCATTGGGCTTGGGTATCGCCATCTGTCTATGAACGGACGTTCTGTAGCGCGCGTAAAA +TACCTGCTGCGGCGCATTGATTTTGCTGAAGCAGAAAATCTTGCGCAGCGTAGTCTGGAA +GCGCAACTGGCGACCGAAGTTCGCCATCAGGTTGCAGCCTTTATGGAGCGTCGCGGCATG +GGCGGGTTGATTCGCGGGGGGTTATAG +>test.0417.00002.0003i_00039 531 rppH | RNA pyrophosphohydrolase | 3.6.1.- | similar to AA sequence:UniProtKB:P0A776 | COG:COG0494 +GTGATTGATGACGATGGCTACCGCCCAAACGTAGGTATCGTGATTTGTAATCGCCAGGGG +CAGGTAATGTGGGCCCGGCGATTTGGTCAGCACTCCTGGCAATTTCCGCAAGGCGGAATC +AACCCCGGAGAATCCGCAGAGCAGGCGATGTACCGTGAATTGTTTGAAGAAGTAGGATTA +AGCCGCAAAGACGTTCGAATCCTTGCTTCAACGCGTAACTGGTTGCGCTACAAATTACCG +AAACGTTTGGTGCGTTGGGACACGAAGCCGGTTTGTATCGGCCAAAAACAAAAATGGTTT +CTCTTGCAGCTGGTGAGCGGCGATGCAGAAATCAATATGCAAACCAGCAGTACACCAGAG +TTTGACGGCTGGCGATGGGTAAGTTACTGGTATCCAGTCAGACAGGTGGTGTCATTTAAA +CGTGATGTCTACCGTAGGGTAATGAAAGAGTTCGCGAGTGTGGTGATGTCACTGCAGGAA +AATACGCCAAAACCACAAAACGCATCTGCTTATCGACGTAAAAGAGGTTAA +>test.0417.00002.0003i_00040 162 NA | hypothetical protein | NA | NA | NA +ATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGTGGATAACATGGTGT +AAGATCCTGTTTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCAGTGTTGCGCAACTC +GATTACCGGAAACCTAAAAAGCAATATAAATCAGAGAATTGA +>test.0417.00002.0003i_00041 690 mutH | DNA mismatch repair protein MutH | NA | similar to AA sequence:UniProtKB:P06722 | COG:COG3066 +ATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAACAATTGTTAGCGCAA +GCACAACAACTTTCTGGTTATACATTGGGAGAACTGGCGGCACTTGCCGGGCTGGTTACG +CCGGAGAATTTAAAACGCGATAAGGGCTGGATTGGCGTGTTACTGGAGATCTGGCTAGGT 
+GCCAGCGCAGGGAGTAAACCTGAGCAAGATTTTGCTGCTCTGGGCGTGGAACTTAAAACT +ATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACATTCGTTTGTGTTGCCCCGTTA +ACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACAAGCTCAAACGCGTG +CTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGCGTCGCGTAGGATCA +CCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCGAAGACTGGGAAGAA +TTAATGGATATGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTCGGCACGGGGAATAT +TTACAGATACGACCGAAAGCAGCGAATGCGAAAGCGCTGACCGAAGCTATTGGTGCCCGG +GGCGAACGGATTCTGACGCTGCCGCGCGGATTTTATTTGAAGAAGAATTTCACCAGTGCG +CTACTGGCCCGTCATTTTCTGATCCAGTAG +>test.0417.00002.0003i_00042 714 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67127 | NA +ATGTTATTTGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTG +CTGGAGATCGTTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTT +CCCACAGCACAACGTGCTCATGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGT +CTGGCGCTGCTGGCATCCATCGCCTGGGTTACGCGCCTGACGAATCCGCTTTTTACAATA +TTCAGTCAGGAAATTTCCGCCCGTGATTTGATTCTGCTTCTGGGTGGCTTGTTCCTTATC +TGGAAAGCCAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGGGCTGAAAACA +CGCGTTTCATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGC +CTCGACTCGGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCC +GTGGTAATTGCCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAG +CGCCATCCTTCGGTAAAAATGCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTG +ATTCTGGAAAGTTTCGACATCCACGTACCGAAAGGTTACATCTACTTCGCGATGTTCTTC +TCTATTGCGGTTGAAAGCCTCAACCTGATTCGCAACAAAAAGAATCCGCTCTGA +>test.0417.00002.0003i_00043 219 ygdR | putative lipoprotein YgdR | NA | similar to AA sequence:UniProtKB:P65294 | NA +ATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGGTGT +TCCAGTGATTACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAACCT +GAAATTGATGATGATACCGGGCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATGCAA +ATTAACCGTGATGATGTTTCGCAAATTATTGAACGTTAA +>test.0417.00002.0003i_00044 1041 tas | Protein tas | NA | similar to AA sequence:UniProtKB:P0A9T4 | COG:COG0667 +ATGCAATATCACCGTATACCCCACAGTTCGCTGGAAGTCAGCACGCTGGGGCTTGGCACG +ATGACGTTTGGTGAACAGAACAGCGAAGCCGACGCCCACGCACAACTCGACTATGCCGTC 
+GCTCAGGGCATTAACCTTATCGACGTTGCCGAAATGTACCCAGTACCTCCGCGCCCCGAA +ACTCAAGGGCTAACCGAAACCTACGTCGGCAACTGGCTGGCGAAACATGGCAGCCGCGAA +AAGTTAATTATCGCCTCCAAAGTGAGCGGACCGTCGCGCAATAATGACAAAGGCATCCGC +CCGGATCAGGCGCTGGATCGGAAGAATATCCGCGAAGCGCTGCATGACAGCCTCAAGCGT +CTGCAGACTGATTACCTCGATCTTTATCAGGTGCACTGGCCGCAGCGCCCAACCAACTGC +TTCGGCAAACTCGGTTATAGCTGGACAGATTCTGCGCCTGCGGTTTCGCTGCTGGATACA +CTGGACGCACTGGCAGAGTACCAACGCGCGGGAAAAATTCGTTATATCGGCGTGTCGAAC +GAAACTGCATTTGGCGTAATGCGCTACCTGCATCTGGCGGACAAACACGATCTGCCGCGT +ATTGTCACCATTCAGAACCCCTACAGTCTGTTAAACCGCAGTTTTGAAGTAGGTCTGGCA +GAAGTCAGCCAGTATGAAGGGGTCGAACTGCTGGCCTATTCGTGCCTGGGTTTCGGCACG +CTGACCGGGAAATATCTCAACGGTGCAAAACCCGCTGGCGCACGTAATACGCTCTTTAGT +CGGTTCACCCGCTATAGCGGTGAGCAAACGCAAAAAGCCGTCGCGGCGTATGTTGATATA +GCCAGACGTCATGGCCTGGATCCTGCACAGATGGCGCTCGCTTTTGTACGCCGTCAACCG +TTTGTTGCCAGCACTCTGCTGGGCGCAACCACGATGGAGCAGCTGAAAACTAACGTCGAA +AGTTTGCATCTGGAGTTAAGCGAAGACGTGTTGGCAGAAATTGAAGCGGTGCATCAGGTT +TACACTTATCCGGCACCATAA +>test.0417.00002.0003i_00045 1194 lplT | Lysophospholipid transporter LplT | NA | similar to AA sequence:UniProtKB:P39196 | NA +ATGAGTGAGTCAGTGCACACTAACACTTCGTTGTGGTCGAAGGGGATGAAAGCGGTTATC +GTGGCGCAGTTTCTCTCTGCGTTTGGCGATAATGCGCTACTGTTTGCCACTCTGGCGTTA +CTGAAAGCGCAGTTCTATCCGGAGTGGAGCCAGCCCATCCTGCAAATGGTGTTTGTAGGT +GCTTACATTCTTTTTGCGCCGTTTGTCGGGCAGGTGGCGGATAGCTTCGCCAAAGGCCGG +GTGATGATGTTTGCCAACGGCCTGAAGCTACTGGGCGCAGCCAGTATCTGCTTTGGTATC +AATCCGTTTCTCGGCTATACGTTGGTGGGTGTTGGTGCTGCAGCCTATTCACCGGCGAAA +TACGGTATTCTCGGCGAATTAACCACGGGTAGTAAGTTAGTAAAAGCTAACGGTTTAATG +GAAGCGTCTACCATAGCGGCGATTTTGCTCGGTTCCGTAGCTGGTGGTGTTCTGGCTGAC +TGGCATATTCTGGTTGCCCTGGTCGCATGCGCACTGGCCTACGGTGGCGCGGTCGTTGCC +AATATCTACATTCCCAAACTGGCGGCGGCGCGTCCGGGGCAGTCCTGGAATCTCATCAGC +ATGACCCGCAGTTTCCTGAATGCCTGCACCTCGCTATGGCGCAATGGTGAAACGCGTTTT +TCGCTGGTGGGCACCAGTTTATTCTGGGGAGCGGGTGTCACGCTGCGTTTCCTGTTGGTG +CTGTGGGTACCGGTGGCGCTGGGTATTACCGATAACGCTACGCCGACCTATCTCAACGCG +ATGGTAGCGATTGGTATCGTGGTTGGTGCAGGTGCGGCAGCGAAGTTAGTTACGCTGGAA 
+ACCGTGTCACGCTGTATGCCAGCCGGGATTTTGATTGGCGTGGTGGTACTGATTTTCTCC +CTGCAACACGAGCTGCTGCCAGCCTATGCTTTGTTGATGCTGATTGGCGTGCTGGGGGGC +TTTTTTGTCGTTCCGCTCAATGCGTTGCTACAGGAGCGGGGCAAAAAAAGCGTCGGGGCG +GGGAATGCGATTGCAGTACAAAACCTTGGCGAAAACAGCGCCATGTTGTTGATGCTGGGC +ATTTACTCGCTGGCGGTAATGGTAGGCATCCCGGTCGTGCCCATTGGCATTGGCTTCGGT +GCGCTGTTTGCGCTGGCAATAACGGCGCTGTGGATCTGGCAGCGCCGTCATTAA +>test.0417.00002.0003i_00046 2160 aas | Bifunctional protein Aas | NA | similar to AA sequence:UniProtKB:P31119 | COG:COG0204 +ATGCTTTTTAGCTTTTTTCGAAATTTGTGCCGTGTTTTGTATCGCGTTCGCGTTACGGGT +GACACCAAGGCACTGAAGGGCGAGCGCGTTCTAATTACGCCTAATCACGTCTCTTTTATT +GATGGCATACTGCTGGCATTGTTTTTACCCGTACGTCCGGTATTTGCCGTTTACACCTCA +ATAAGCCAACAGTGGTATATGCGTTGGCTGAAATCATTTATCGACTTTGTTCCTCTCGAC +CCGACGCAACCTATGGCGATTAAACATCTGGTACGTCTGGTGGAACAGGGCCGACCAGTG +GTGATTTTCCCTGAAGGACGCATCACCACCACTGGCTCGCTGATGAAAATCTACGATGGC +GCGGGATTTGTCGCGGCGAAGTCTGGTGCAACGGTTATTCCTGTGCGTATTGAAGGGGCG +GAACTTACGCACTTCAGCCGCCTGAAAGGTCTGGTTAAACGTCGCTTGTTCCCGCAAATT +ACTCTGCATATTTTGCCACCAACGCAGGTGGAGATGCCGGATGCGCCGCGTGCCCGTGAC +CGTCGCAAAATCGCTGGCGAAATGCTGCATCAAATAATGATGGAAGCGCGTATGGCGGTG +CGCCCGCGTGAAACGCTGTACGAATCTTTACTGAGCGCAATGTACCGCTTCGGAGCCGGG +AAGAAATGTGTCGAAGACGTTAACTTTACCCCGGACTCCTATCGCAAATTGCTTACGAAA +ACGCTGTTTGTTGGACGCATCCTTGAAAAATACAGTGTTGAAGGCGAACGCATCGGCTTA +ATGCTGCCCAATGCAGGCATCAGTGCTGCAGTGATTTTTGGGGCCATCGCCCGTCGCCGC +ATTCCCGCAATGATGAACTACACCGCCGGGGTAAAAGGGTTGACCAGTGCTATTACGGCG +GCTGAAATCAAAACCATTTTCACTTCCCGTCAGTTTCTCGATAAAGGCAAACTCTGGCAT +CTGCCGGAGCAACTTACTCAGGTGCGCTGGGTCTATCTGGAAGATTTAAAAGCAGATGTC +ACCACTGCCGACAAAGTATGGATCTTCGCTCATTTGCTGATGCCGCGTCTGGCACAGGTT +AAACAGCAGCCGGAAGAAGAGGCGCTGATCCTTTTTACCTCCGGTTCTGAAGGCCATCCG +AAAGGCGTCGTCCATAGCCATAAAAGCATTCTGGCGAATGTCGAGCAGATTAAAACGATT +GCCGACTTCACCACCAACGATCGCTTTATGTCGGCGTTACCGCTGTTTCACTCCTTTGGG +CTGACGGTAGGCCTGTTTACGCCACTGCTCACAGGTGCAGAAGTGTTCCTTTATCCAAGC +CCGCTGCACTACCGTATTGTGCCGGAGTTGGTGTATGACCGCAGTTGCACCGTGTTGTTC +GGTACCTCCACTTTCCTCGGTCACTACGCGCGTTTCGCCAACCCGTATGACTTCTATCGT 
+CTACGCTATGTGGTGGCAGGCGCAGAAAAACTACAAGAAAGTACTAAACAGCTTTGGCAG +GATAAATTTGGCCTGCGCATCCTTGAAGGCTACGGTGTGACCGAATGCGCGCCTGTCGTT +TCTATCAACGTACCGATGGCGGCGAAACCCGGTACGGTAGGGCGTATTCTACCAGGAATG +GATGCGCGCCTGTTGTCGGTTCCTGGTATCGAAGAGGGCGGACGCCTGCAACTGAAAGGG +CCGAACATAATGAACGGCTATCTGCGGGTGGAGAAGCCTGGTGTACTGGAAGTGCCCACC +GCCGAGAATATTCGCGGCGAAATGGAGCGCGACTGGTATGACACTGGCGATATTGTGCGT +TTTGACGAGCAGGGCTTTGTGCAGATTCAGGGCCGCGCAAAACGCTTTGCCAAAATTGCA +GGCGAAATGGTGTCGCTGGAAATGGTGGAACAACTGGCACTTGGTGTTTCGCCAGATAAA +GTCCATGCCACTGCGATTAAGAGCGATGCCAGCAAAGGCGAGGCACTGGTGCTTTTCACC +ACAGATAACGAACTGACGCGCGATAAGTTACAACAGTATGCCCGCGAGCACGGCGTGCCG +GAGCTTGCTGTACCGCGCGATATTCGCTATCTGAAACAGATGCCATTACTTGGCAGCGGC +AAACCTGACTTTGTCACTTTGAAAAGCTGGGTAGACGAAGCGGAACAACACGATGAGTGA +>test.0417.00002.0003i_00047 1032 galR | HTH-type transcriptional regulator GalR | NA | similar to AA sequence:UniProtKB:P03024 | COG:COG1609 +ATGGCGACCATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGC +GTCATTAATAATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATG +GAGTCTCTTAGCTATCACCCGAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAA +ACGATCGGTCTGGTCGTTGGTGATGTTTCCGATCCGTTTTTCGGCGCAATGGTGAAAGCG +GTCGAACAGGTGGCTTATCACACTGGTAATTTTTTATTGATTGGCAACGGTTACCACAAC +GAACAAAAAGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGCTGCGCTGGTT +GTCCATGCCAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGT +ATGGTGCTGATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGAT +CGTTACGGTGCCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGT +TATCTGTGCTCTAACCACTCTATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGAT +GCCCTTGCTGAAAGTGGTATTCCGGCCAATGACCGGCTGGTGACATTTGGCGAACCAGAC +GAAAGCGGCGGCGAACAGGCAATGACCGAGCTTTTGGGACGAGGCAGAAATTTCACTGCG +GTAGCCTGTTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAATGATAATGGT +ATTGATGTACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTAT +GTGCGTCCGCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCC +GAACTGGCTTTGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGT +CCGACGCTGGTACGTCGCCATTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCA +ACCAGCGACTAA +>test.0417.00002.0003i_00048 1263 lysA | 
Diaminopimelate decarboxylase | 4.1.1.20 | similar to AA sequence:UniProtKB:E0IWI3 | NA +ATGCCACATTCACTGTTCAGCACTGATACCGATCTCACCGCCGAAAATCTGCTGCGTTTG +CCCGCAGAATTTGGCTGCCCGGTGTGGGTCTACGATGCGCAAATTATTCGTCGGCAGATT +GCAGCGCTGAAACAGTTTGATGTGGTGCGCTTTGCACAGAAAGCCTGTTCCAATATTCAT +ATTTTGCGCTTAATGCGTGAGCAGGGCGTAAAAGTGGATTCCGTCTCGTTAGGCGAAATA +GAGCGTGCACTGGCGGCGGGTTACAATCCGCAAACGCACCCCGATGATATTGTTTTTACG +GCAGATGTTATCGATCAGGCGACGCTTGAACGCGTCAGTGAATTGCAAATTCCGGTGAAT +GCGGGTTCTGTTGATATGCTCGACCAACTGGGTCAGGTTTCGCCAGGGCATCGGGTATGG +CTGCGTGTTAATCCGGGGTTTGGTCACGGGCATAGCCAAAAAACCAATACCGGTGGCGAA +AACAGCAAGCACGGTATCTGGTACACCGATCTGCCCGCCGCACTGGACGTGATACAACGT +CATCATCTACAGCTGGTCGGCATTCACATGCACATTGGTTCTGGCGTCGATTATGCCCAT +CTGGAACAGGTATGTGGTGCTATGGTGCGTCAGGTCCTCGAATTCGGTCAGGATTTACAG +GCTATTTCTGCGGGCGGTGGGCTTTCTATTCCTTATCAACAGGGTGAAGAGGCGGTTGAT +ACCGAACATTATTATGGTCTGTGGAATGCCGCGCGTGAGCAAATCGCCCGCCATTTGGGC +CATCCTGTGAAACTGGAAATTGAACCGGGTCGCTTTCTGGTAGCGCAGGCTGGCGTATTA +ATTACTCAAGTGCGGAGCGTCAAACAAATGGGTAGCCGCCACTTTGTGCTGGTTGATGCC +GGGTTCAACGATCTGATGCGCCCGGCAATGTACGGTAGTTACCACCATATCAGTGCCCTG +GCAGCTGATGGTCGTTCTCTGGAACACGCACCAACGGTGGAAACCGTCGTCGCCGGGCCG +TTATGTGAATCGGGCGATGTCTTTACCCAGCAGGAAGGGGGAAATGTTGAAACCCGCGCC +TTGCCGGAAGTGAAGGCGTGTGATTATCTGGTACTGCATGATACAGGGGCATATGGCGCA +TCAATGTCATCCAACTACAACAGCCGTCCGCTGTTACCAGAAGTTCTGTTTGATAATGGT +CAGGCGCGGTTGATTCGCCGTCGCCAGACCATTGAAGAATTACTGGCGCTGGAATTGCTT +TAA +>test.0417.00002.0003i_00049 936 occR | Octopine catabolism/uptake operon regulatory protein OccR | NA | similar to AA sequence:UniProtKB:P0A4T3 | NA +ATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAATGACCGCCGGAAGC +CTGACTGAGGCGGCACACCTGCTACACACCTCACAGCCAACCGTCAGCCGCGAACTGGCG +CGCTTTGAGAAGGTGATCGGGCTGAAATTGTTTGAGCGCATACGTGGACGATTACATCCT +ACCGTGCAAGGACTGCGTCTGTTTGAAGAAGTGCAACGATCCTGGTACGGACTGGATCGC +ATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGGGAGAACTGTCTATTGCCTGC +CTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCTTTCTGGCACGTTAT +CCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTGAAGAGTGGCTCTCG 
+GCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTGCGGGAACAGAACGT +ACCGAATTACTCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCCATCCGCTGGCGGTA +AAAAAGGTATTAACGCCGGATGATTTTCACGGTGAGAACTACATCAGCCTTTCCCGTACT +GACAGCTATCGCCAGTTGCTGGATCAATTGTTTACTGAGAATCAGGTTAAACGACGCATG +ATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGGTACGGGCGGGGGTAGGCGTT +TCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTTTAGTGGTGCGGCGG +TTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGCACCGCCCGTCATCA +GCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGAAACTGGTCACTTCT +CTTGACACTATTTTGTCGTCAGCTACGACAGCATAA +>test.0417.00002.0003i_00050 693 ygeA | L-aspartate/glutamate-specific racemase | 5.1.1.13 | similar to AA sequence:UniProtKB:A0A140N890 | NA +ATGAAAACAATTGGTTTGCTGGGAGGAATGAGCTGGGAATCCACTATTCCTTACTATCGT +CTGATAAATGAAGGCATTAAACAGCGGCTTGGTGGGCTTCACTCTGCGCAAGTGCTGCTA +CATAGCGTCGATTTTCATGAAATAGAAGAGTGCCAGCGTCGCGGTGAGTGGGACAAAACC +GGGGATATTCTGGCTGAGGCGGCGCTTGGCTTACAGCGGGCGGGCGCAGAAGGTATTGTG +TTATGCACCAATACGATGCACAAAGTGGCGGATGCCATTGAGTCTCGTTGCTCTCTGCCT +TTCTTACACATAGCGGATGCCACTGGACGTGCAATTACCGGGGCAGGAATGACTCGTGTG +GCGCTGCTGGGTACACGTTACACCATGGAACAGGATTTTTATCGCGGGCGGCTGACGGAA +CAATTTTCCATCAACTGTCTTATTCCTGAAGCGGATGAACGGGCGAAAATTAATCAGATT +ATTTTTGAAGAACTGTGTCTGGGGCAATTTACCGAAGCGTCACGCGCTTATTATGCGCAA +GTGATTGCTCGCCTTGCAGAACAGGGCGCACAGGGCGTCATTTTTGGCTGCACAGAAATT +GGTTTACTGGTGCCAGAAGAGCGCAGTGTTCTGCCTGTGTTTGATACCGCGGCGATCCAT +GCCGAGGATGCTGTCGCTTTTATGCTGTCGTAG +>test.0417.00002.0003i_00051 1419 araE | Arabinose-proton symporter | NA | similar to AA sequence:UniProtKB:P0AE24 | NA +ATGGTTACTATCAATACGGAATCTGCTTTAACGCCACGTCCTCTGCGGGATACGCGGCGT +ATGAATATGTTTGTTTCGGTAGCTGCTGCGGTCGCAGGATTGTTATTTGGTCTTGATATC +GGCGTAATCGCCGGAGCGTTGCCGTTCATTACCGATCACTTTGTGCTGACCAGCCGTTTG +CAGGAATGGGTGGTCAGTAGCATGATGCTCGGCGCAGCAATTGGTGCGCTGTTTAATGGG +TGGCTGTCGTTCCGCCTGGGGCGTAAATACAGCCTGATGGCGGGGGCCATCCTGTTTGTA +CTCGGTTCGATAGGGTCCGCTTTTGCGACCAGCGTAGAGATGTTAATCGCCGCTCGTGTG +GTGTTGGGCATTGCTGTTGGGATCGCGTCTTACACCGCTCCTCTATATCTTTCTGAAATG 
+GCAAGTGAAAACGTTCGCGGTAAGATGATCAGCATGTACCAGTTGATGGTCACACTCGGC +ATCGTGCTGGCGTTTTTATCCGATACAGCGTTCAGTTATAGCGGTAACTGGCGCGCAATG +TTGGGGGTTCTTGCTTTACCAGCAGTCCTGCTGATTATTCTGGTGGTCTTCCTGCCAAAT +AGCCCGCGCTGGCTGGCGGAAAAGGGGCGTCATATTGAGGCGGAAGAAGTGTTGCGTATG +CTGCGCGATACGTCGGAAAAAGCGCGAGAAGAACTCAACGAAATTCGTGAAAGCCTGAAG +TTAAAACAGGGCGGTTGGGCACTGTTTAAGATCAACCGTAACGTCCGTCGTGCTGTATTT +CTCGGTATGTTGTTGCAGGCGATGCAGCAGTTTACCGGTATGAACATCATCATGTACTAC +GCGCCACGTATCTTCAAAATGGCGGGCTTTACGACCACAGAACAACAGATGATTGCGACT +CTGGTCGTGGGGCTGACCTTTATGTTCGCTACCTTCATTGCGGTCTTTACGGTAGATAAA +GCAGGGCGTAAGCCGGCTCTGAAAATTGGTTTCAGCGTGATGGCGTTAGGCACTCTGGTG +CTGGGTTACTGCCTGATGCAGTTTGATAACGGTACGGCTTCCAGTGGCTTGTCCTGGCTC +TCTGTTGGCATGACGATGATGTGTATTGCCGGTTATGCGATGAGCGCCGCGCCAGTGGTG +TGGATCTTGTGCTCTGAAATTCAGCCGCTGAAATGCCGCGATTTTGGCATCACCTGCTCA +ACGACGACAAACTGGGTGTCGAATATGATTATCGGCGCGACCTTCCTGACACTGCTTGAT +AGCATTGGCGCTGCCGGTACGTTCTGGCTCTACACTGCGCTGAACATTGCGTTTGTGGGC +ATCACTTTCTGGCTCATTCCGGAAACCAAAAATGTCACGCTGGAACATATCGAGCGCAAA +CTGATGGCAGGCGAAAAGTTGAGAAATATCGGCGTCTGA +>test.0417.00002.0003i_00052 762 kduD | 2-dehydro-3-deoxy-D-gluconate 5-dehydrogenase | 1.1.1.127 | similar to AA sequence:UniProtKB:P37769 | NA +ATGATTTTAAATGCATTTTCTCTCGAAGGTAAAGTTGCGGTCGTCACTGGTTGTGATACT +GGGCTGGGCCAGGGGATGGCGTTGGGGCTGGCGCAAGCGGGCTGTGACATTGTTGGCATT +AACATCGTTGAACCGACTGAAACCATCAAGCAGGTCACGGCGCAGGGGCGTCGTTTTTTA +AGCCTGACCGCCGATCTGCGAAAGATTGATGGCATTCCTGGACTGCTGGATCGCGCGGTA +GCGGAGTTTGGTCATATTGATATCCTGGTGAATAACGCCGGATTGATTCGCCGCGAAGAC +GCTCTCGAGTTCAGCGAAACAGACTGGGACGATGTCATGAACCTGAATATCAAGAGCGTA +TTCTTCATGTCTCAGGCAGCGGCGAAACACTTTATCGCGCAAGGCAATGGCGGCAAGATT +ATCAATATCGCGTCAATGCTCTCCTTCCAGGGCGGGATCCGTGTGCCTTCTTATACCGCA +TCAAAAAGCGGCGTGATGGGTGTGACGCGATTGATGGCGAACGAATGGGCTAAACACAAC +ATTAATGTTAATGCGATAGCTCCGGGTTACATGGCGACCAACAATACTCAACAACTGCGG +GCAGATGAACAACGTAGCGCGGAAATTCTCGACCGCATTCCAGCTGGCCGTTGGGGACTG +CCGAGTGACCTGATGGGGCCGGTAGTGTTTCTTGCCTCCAGCGCTTCAGATTATGTAAAT +GGTTATACCATTGCTGTGGATGGCGGTTGGCTGGCGCGTTAA +>test.0417.00002.0003i_00053 
837 kduI | 4-deoxy-L-threo-5-hexosulose-uronate ketol-isomerase | 5.3.1.17 | similar to AA sequence:UniProtKB:Q46938 | COG:COG3717 +GTGGACGTAAGACAGAGCATCCACAGTGCGCACGCAAAAACGCTGGATACCCAGGGGCTG +CGCAATGAATTTTTGGTTGAAAAGGTATTTGTCGCCGATGAGTACACCATGGTTTACAGC +CACATTGACCGTATTATTGTTGGCGGCATTATGCCGGTAACTAAAACGGTTTCCGTTGGC +GGGGAAGTTGGTAAACAACTCGGCGTAAGCTATTTCCTTGAACGTCGCGAGTTAGGTGTT +ATCAATATTGGCGGTGCCGGTACGATTACTGTCGATGGTCAATGCTATGAAATCGGTCAC +CGCGACGCCCTGTATGTTGGTAAAGGTGCAAAAGAAGTTGTCTTTGCCAGTATTGATACC +GCCACTCCGGCGAAGTTTTATTACAATTGCGCACCCGCGCATACGACGTATCCCACCAAA +AAAGTCACACCGGACGAAGTATCTCCAGTCACGTTAGGCGATAACCTCACCAGTAACCGT +CGCACGATTAACAAATATTTTGTCCCGGATGTGCTGGAAACCTGCCAATTGAGTATGGGG +CTGACGGAGCTGGCTCCAGGTAACTTGTGGAACACCATGCCGTGTCACACCCACGAGCGC +CGGATGGAAGTTTATTTCTATTTCAATATGGATGATGACGCCTGCGTTTTCCACATGATG +GGGCAACCGCAAGAAACGCGTCACATTGTGATGCATAACGAGCAGGCGGTGATCTCCCCG +AGCTGGTCGATCCATTCCGGCGTCGGAACCAAAGCTTATACCTTTATCTGGGGCATGGTC +GGTGAAAACCAGGTTTTTGATGATATGGACCATGTGGCCGTTAAAGATTTGCGCTAG +>test.0417.00002.0003i_00054 1182 thlA | Acetyl-CoA acetyltransferase | 2.3.1.9 | similar to AA sequence:UniProtKB:P45359 | COG:COG0183 +ATGAAAGACGTTGTGATTGTCGGGGCGTTACGGACACCTATCGGCTGCTTTCGTGGTGCG +TTAGCGGGTCATTCCGCCGTGGAACTTGGCAGCCTGGTCGTCAAAGCGTTAATAGAACGT +ACCGGCGTTCCTGCATATGCGGTGGATGAAGTGATTCTTGGTCAGGTGTTGACTGCAGGG +GCAGGGCAGAATCCGGCAAGGCAATCGGCTATTAAAGGTGGTCTTCCTAATAGCGTTTCT +GCAATCACTATTAATGACGTTTGTGGTTCCGGGCTTAAAGCACTGCATCTGGCTACTCAG +GCGATACAGTGTGGCGAGGCTGATATTGTCATCGCCGGTGGCCAGGAAAACATGAGCCGC +GCACCACATGTTCTGACTGATAGCCGCACCGGCGCACAGCTTGGCAATAGCCAGTTGGTT +GATAGTCTTGTGCATGATGGGTTGTGGGATGCCTTCAATGATTATCATATTGGTGTCACC +GCCGAAAATCTGGCTCGCGAATATGGCATCAGCCGTCAGTTGCAGGATGCTTACGCACTT +AGCTCGCAACAAAAAGCGCGAGCGGCGATTGACGCCGGACGATTTAAAGATGAGATCGTC +CCGGTAATAACCCAAAGTAACGGTCAGACGTTGGTTGTTGATACCGATGAACAGCCACGC +ACTGACACCAGCGCAGAAGCCTTAGCCCGTTTAAATCCTTCATTTGATAGTCTCGGTTCT +GTGACAGCGGGTAATGCATCATCCATAAACTATGGGGCAGCTGCAGTAATGATGATGAGC 
+GAAGCCAAAGCACGAGCGTTGAATTTACCCGTGCTGGCCCGCATCCGCGCATTTGCCAGC +GTTGGTGTGGATCCGGCATTGATGGGAATTGCGCCGGTGTATGCGACCCGCCGTTGCCTG +GAGCGTGTTGGCTGGCAGTTGGCTGATGTCGATCTTATCGAGGCTAATGAAGCGTTTGCT +GCACAGGCGCTTTCGGTTGGCAAGATGCTTGAATGGGATGAGCGTCGGGTCAATGTCAAT +GGTGGTGCGATCGCACTCGGTCATCCGATAGGCGCTTCCGGTTGCCGAATCCTGGTTTCT +CTTGTTCATGAAATGGTGAAACGTAATGCCCGCAAAGGACTGGCAACGCTTTGTATCGGC +GGGGGCCAGGGTGTGGCATTGACCATTGAACGTGACGAGTAG +>test.0417.00002.0003i_00055 1230 yqeG | Inner membrane transport protein YqeG | NA | similar to AA sequence:UniProtKB:P63340 | COG:COG0814 +ATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCC +GTTGGTGCAGGCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTG +TTTATTACTGCTCTGGTCGCCTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAG +TTCATCCTCTCATCGAAAACATCAGCAGGTGAAGGGATAACGGGCGCGGTAACACACTAC +TATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACTTCATCGCCTTTTTTGTCGTC +GTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGCAAAGCATATG +GTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTC +ATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTG +ATTGCCTATTTCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTA +ACAACCCAGGTAGAGTTCAATCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTG +ATGGTTTTCGCTTTTAGCCATACGCCCATTATTTCTACGTTTGCCATAGACAGACGTGAA +AAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTATGAAAGTCGCTTATCTCATC +ATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCCACCTTCGTAT +ATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAAC +GCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCA +TTCCTGGGTACGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTA +CAGCAGGTTGGTGTAAAGAAAAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTA +TCGCTGATTACCTTCATTGTTTGTTGCATTAACCCGAACGCGATTTCGATGATTTACGCG +ATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGCCTACGCTGTCAACGTATCTC +ATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGATCGTGGGTATC +CTGTGCGTATCGGTAATGTTCTTTAGCTAA +>test.0417.00002.0003i_00056 74 NA | tRNA-Gly(ccc) | NA | COORDINATES:profile:Aragorn:001002 | NA +GCGGGCGTAGTTCAATGGTAGAACGAGAGCTTCCCAAGCTCTATACGAGGGTTCGATTCC 
+CTTCGCCCGCTCCA +>test.0417.00002.0003i_00057 351 nlpD | Murein hydrolase activator NlpD | NA | similar to AA sequence:UniProtKB:P39700 | NA +ATGCCGTATTCGACAGCAGATGGCGGCAATAAAGGAATTGATATCTCAGCTCCACGGGGT +ACACCTATTTACGCCGCGGGTGCAGGAAAGGTGGTGTATGTGGGCAACCAGCTGCGTGGC +TACGGTAATCTCATCATGATTAAACACAGTGAAGATTACATTACGGCTTACGCTCATAAT +GACACGATGCTGGTAAATAATGGGCAAAGCGTGAAAGCTGGGCAAAAAATCGCCACCATG +GGGAGCACTGATGCGGCATCTGTTCGCCTGCATTTCCAGATTCGTTACCGTGCAACGGCA +ATTGATCCGCTACGTTACTTGCCGCCTCAGGGCAGCAAGCCAAAATGCTGA +>test.0417.00002.0003i_00058 2298 xdhA_1 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +ATGGAAGCGCGGGAAGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCT +AAGGTCACCGGGCGGGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCG +AAATATGTACGTAGCCCTATCGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCC +AGGAGTTTGCCGGGCGTCCTGGCGATTTTTACCTGGGAAGATGTGCCAGAAATCCCATTC +GCCACGGCAGGGCATGCCTGGACACTTGACGAAAACAAGCGCGATACCGCCGATCGCGCA +CTGCTAACTCGCCATGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGTGGCCCGCGAT +GAACTCACGGCAGAAAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTT +ATCACCTCGCCAGAAGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAAT +TTACTGAAACAAAGCACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGCCGAC +TACCAGGTACAGGGGCACTATCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTG +ACATCGCTGGCATGGATGGAGGATGACTCGCGAATTACCATCGTTTCCAGCACCCAGATC +CCGCACATTGTTCGCCGCGTGGTTGGTCAGGCGCTGGATATTCCCTGGTCATGCGTACGA +GTCATCAAACCGTTTATCGGTGGCGGTTTTGGTAATAAACAGGATGTACTGGAAGAGCCA +ATGGCGGCATTCCTGACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGT +GAAGAGTGTTTCCTCGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGC +GTGAACCGCGACGGAACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCT +TATGCATCTCACGGGCACTCCATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTAT +CCTCGTTGTGCCTACGCTTACAGTTCAAAGACCTGCTATACCAACCTCCCCTCGGCTGGT +GCGATGCGTGGTTATGGCGCGCCACAAGTCGTATTTGCCGTTGAGTCTATGCTTGATGAT +GCCGCGACAGCGTTAGGTATTGATCCTGTTGAAATTCGTTTACGCAACGCCGCCCGCGAA +GGAGATGCTAATCCGCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTT 
+GAAAAAGGCCGGAAAATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAA +GGCAATTTACGTCGTGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCT +GTCGGCGTAGAAATAGCAGGCGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTG +CAAAGCGGCGCGACGGAAATCGGTCAGGGTGCCGACACCGTCTTCTCGCAAATGGTGGCA +GAAACCGTGGGGGTTCCGGTCAGCGACGTTCGCGTTATTTCAACACAAGATACCGATGTT +ACGCCGTTCGATCCCGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGCGCCTGCGCTG +CGCAGTGCGGCACTGTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACAT +CAGTCAGCGATGAATCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAA +GAACCGTTAATGTCGTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGC +GGGCAGCTCTCTGCTGAAAGCTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGT +ACATTTGTTGATCTGACGGTCGATATTGCACTGTGCAAAGTCACCATCAACCGCATCCTC +AACGTTCATGATTCGGGGCATATTCTAAATCCGCTGCTGGCAGAAGGTCAGGTACACGGC +GGAATGGGAATGGGCATTGGCTGGGCGCTATTTGAAGAGATGATCATCGATGCGAAAAGC +GGCGTGGTCCGTAACCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCA +CAACTGGAAAGCGCGTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCA +CTGGGTGAGCCACCAATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCT +ACCGGTGTTGCAATCAATACACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCAT +CTGGCAGGATTGATTTGA +>test.0417.00002.0003i_00059 879 ndhF | Nicotinate dehydrogenase FAD-subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF4 | NA +ATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATGCCATCACCCTGCTG +GCTGACAATCCGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTACTGATACAGCTTCAC +CATCACAATGACCGCTATCGCCATATTGTTGATATCCACAATCTGGCAGAGCTTCAGGGA +ATAACACAGGCGGAAGATGGCGCGCTGCGAATCGGCTCCGCGACAACATTTACTCAGCTC +ATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTATGTGCTGCGGCTGCATCAATC +GCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTTGCAACGGTGCCACC +AGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGGAGCTCCACTCCCCA +CGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGGGCAAAGTGTCTCTT +GAGCATGACGAAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGAAAGAACACGCGGGC +AGCGCACATTTTAAATATGCCATGCGCGACGCAATGGATATTTCAACAATTGGCTGCGCC +GCACATTGCCGACTGGATAACGGCAATTTCAGCGAATTACGCCTGGCATTTGGTGTTGCC +GCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTGCACAAAATGCGCCATTAAAC 
+CTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCGCCCCGCGTTCTTCA +TGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGACCAAAAAAGTGATT +AGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGA +>test.0417.00002.0003i_00060 480 ndhS | Nicotinate dehydrogenase small FeS subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF3 | NA +ATGAATCACAGCGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTT +CACGCCGCGCCAGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTC +AAACAAGGTTGCTGCGTAGGCGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCG +ATAGACAGTTGCTTATTCCTTGCGGCCTGGGCTGAAGGAAAAGAGATCCGCACGCTGGAA +GGTGAAGCGAAAGGCGGTAAACTTTCTCATGTCCAACTGGCTTATGCGAAATCTGGTGCA +GTGCAATGCGGGTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAATGCTGGCGAAA +CCACGCGAGAAGCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGT +CGCTGCACAGGGTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAA +>test.0417.00002.0003i_00061 1779 norR | Anaerobic nitric oxide reductase transcription regulator NorR | NA | protein motif:HAMAP:MF_01314 | NA +ATGGAGCTTGCGACTACGCAGTCAGTATTGATGCAAATTCAACCGACAATTCAGCGTTTT +GCCAGAATGCTTGCCAGCGTTTTGCAGCTTGAGGTTGAGATCGTTGATGAAAACTTGTGT +CGCGTCGCCGGAACGGGCGCGTATGGGAAGTTTCTTGGCCGCCAGTTGAGCGGCAACTCA +CGCCTGCTCCGCCACGTCCTGGAAACGAAAACTGAAAAAGTTGTGACACAGTCTCGCTTC +GATCCCCTTTGTGAAGGTTGCGATAGTAAAGAAAATTGCCGCGAAAAAGCATTTCTGGGT +ACGCCTGTCATTTTACAGGATCGTTGTGTTGGGGTGATAAGTTTGATTGCCGTTACCCAC +GAGCAACAAGAACATATCAGTGATAATTTACGCGAATTTTCCGATTACGTTCGCCATATA +TCCACCATTTTTGTTTCTAAACTTCTGGAGGATCAGGGACCAGGAGATAACATCAGTAAA +ATATTCGCGACCATGATCGATAATATGGATCAGGGCGTGTTAGTGGTTGATGCTGATAAT +CGGGTTCAGTTTGTTAATCAGACAGCTTTAAAAACACTCGGTGTTGTACAAAATAATATT +ATTGGAAAACCTGTTCGTTTCAGACCATTAACATTTGAGAGTAATTTTACCCATGGTCAT +ATGCAACATATTGTTTCGTGGGATGATAAAAGTGAATTAATCATTGGTCAGTTGCATAAC +ATCCAGGGCCGACAACTATTTTTAATGGCGTTTCACCAATCGCATACCAGTTTTTCTGTA +GCAAATGCACCTGATGAACCGCATATTGAACAATTGGTTGGCGAGTGCCGTGTTATGCGG +CAATTAAAACGACTCATTAGCCGTATTGCACCCAGCCCATCCAGCGTTATGGTGGTTGGT +GAAAGCGGCACGGGTAAAGAAGTCGTCGCCCGTGCAATCCATAAGTTGAGCGGAAGACGG 
+AATAAACCCTTTATTGCTATCAACTGTGCTGCGATTCCGGAACAGCTTCTGGAGAGCGAA +CTGTTCGGTTATGTTAAAGGCGCATTTACTGGCGCTTCTGCCAACGGTAAAACAGGGTTG +ATTCAGGCGGCGAATACGGGCACGCTGTTTCTCGATGAAATTGGTGATATGCCATTAATG +TTGCAGGCTAAATTACTGCGCGCTATTGAGGCGCGTGAAATTCTGCCGATTGGTGCCAGT +AGCCCAATACAAGTCGACATCCGCATCATTTCTGCAACTAATCAGAATTTGGCCCAGTTC +ATTGCCGAAGGTAAATTCCGCGAAGATCTCTTCTACCGACTTAATGTTATCCCGATAACT +CTTCCACCGCTGCGTGAACGTCAGGAAGATATTGAATTACTGGTGCATTACTTTTTACAT +CTGCATACCCGTCGTCTGGGATCGGTTTATCCTGGCATTGCTCCTGATGTCGTCGAAATA +TTGCGTAAGCATCGTTGGCCCGGAAACCTGCGCGAGTTAAGCAATTTGATGGAATATCTG +GTTAACGTTGTTCCTTCAGGTGAAGTTATCGACAGCACGCTATTGCCGCCAAATCTGCTG +AATAATGGCACAACGGAGCAAAGTGATGTAACAGAGGTCAGTGAGGCGCACCTGTCACTC +GATGATGCGGGCGGCACGGCGCTGGAGGAGATGGAAAAGCAAATGATCCGCGAGGCGCTT +TCACGTCATAACAGCAAGAAGGAAGTTGCTGATGAACTGGGCATCGGCATTGCTACGCTC +TATCGCAAGATTAAGAAATATGAGTTGTTAAACACATAA +>test.0417.00002.0003i_00062 1188 ygeW | Putative carbamoyltransferase YgeW | 2.1.3.- | similar to AA sequence:UniProtKB:Q46803 | COG:COG0078 +ATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGCATGAA +AAAGATTTTTTGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGGACGTT +GCCGCCGCGTTAAAAGCACTGCGTGCTGAAAACATCTCAACCAAAGTCTTTAATAGTGGA +TTAGGTATTTCCGTCTTCCGCGACAACTCCACCCGTACCCGCTTCTCTTATGCTTCCGCG +CTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAGGTAAATCACAAATCGCTCAC +GGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGCTATCGGTATT +CGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGGCACTT +GATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGCAATGC +GATATTGACCACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACTTTGGT +TCGCTGGAAAACCTGAAAGGCAAAAAAATCGCCATGACCTGGGCCTACTCCCCAAGCTAT +GGCAAACCGCTCTCTGTACCACAAGGCATCATAGGTCTGATGACCCGCTTCGGTATGGAT +GTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGGATGTCGTTGAAGTTGCTAAA +AACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGAAGAAGCCTTC +AAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAGAGCGT +ACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGTGTCTG +GCACAGAACGCGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGACCCGT 
+GATGGCGAAGCCCTGTACATGCACTGCCTGCCAGCTGATATCAGCGGCGTATCCTGCAAA +GAAGGTGAAGTGACTGAAGGCGTATTCGAAAAATACCGTATCGCTACCTACAAAGAAGCC +AGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCCGTAAATACGCCAAACCAGGT +GCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAA +>test.0417.00002.0003i_00063 1197 ygeX | Diaminopropionate ammonia-lyase | 4.3.1.15 | similar to AA sequence:UniProtKB:P66899 | COG:COG1171 +ATGTCCGTTTTCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACA +TCACCGCTTTTTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCT +GGTTATCACCCAACACCGCTTTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAG +AAAATTCTCGTCAAAGACGAATCAAAACGATTCGGTCTGAACGCCTTCAAAATGCTCGGC +GGTGCGTACGCCATCGCTCAATTATTGTGTGAAAAATATCATCTTGATATCGAAACGCTG +TCATTTGAGCACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGACTACCACCGAC +GGCAACCACGGGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATT +TACATGCCGAAAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAG +TGCATCGTCACGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAG +CAGCACGGCTGGGAAGTGGTACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACC +TGGATCATGCAAGGCTACGCAACACTGGCGGATGAAGCCGTCGAGCAAATGCGTGAAATG +GGCGTAACCCCGACACACGTTCTGCTACAAGCCGGTGTCGGTGCAATGGCCGGTGGTGTG +CTGGGTTATCTGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTATTGTTGAACCT +GACAAAGCTGACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGT +GATATGGCCACCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAA +ATCCTACGTAACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGT +ATGCGCGTGCTGGGTAATCCGTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGC +GCTGTCGGTTTGGGCGTTCTCGCAGCGGTTCATTATCACCCGCAACGTCAAAGCCTGATG +GAAAAACTGGCGCTGAACAAAGATGCCGTGGTGCTGGTTATCAGCACTGAAGGCGACACC +GACGTGAAGCACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGCACCTTAA +>test.0417.00002.0003i_00064 1212 argE | Acetylornithine deacetylase | 3.5.1.16 | similar to AA sequence:UniProtKB:P23908 | COG:COG0624 +ATGGCTAAGAATATTCCATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGAC +ATGACTCGCTTCCTACGCGATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGC +GTAGTACATCGTATTAAAGAAGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGAC +CCAATGGGCAACGTTCTCGGTTATATCGGCCACGGCCCGCGTCTGGTGGCAATGGACGCT 
+CATATCGACACCGTCGGCATTGGCAACATCAAAAACTGGGACTTCGATCCGTATGAAGGC +ATGGAAACCGACGAGCTGATCGGTGGTCGCGGTACTTCCGACCAGGAAGGCGGCATGGCA +TCTATGGTTTATGCCGGTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTG +CTGGTTACCGGTACTGTGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATT +GAACAATCCGGCATTCGCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTA +TACCGTGGTCAACGCGGTCGTATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCAC +GGTTCGGCACCAGAACGTGGTGATAACGCCATTTTCAAAATGGGTCCAATTCTTGGCGAA +TTACAGGAACTGTCTCAACGTCTGGGCTATGACGAATTCCTCGGCAAAGGTACGCTGACT +GTTTCCGAAATTTTCTTCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAGCTGCGCAGTT +TCTATTGACCGCCGTCTCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGT +GCCCTGCCTGCAGTACAAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCG +TCCTGGACTGGCCTGGTTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAA +GATCACTTCACCGTTAAAGCACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCT +GTCGTTGATAAGTGGACCTTCTCAACTAACGGCGTATCCATCATGGGTCGCCACGGCATT +CCGGTCATCGGTTTTGGCCCTGGTAAAGAACCGGAAGCGCACGCGCCAAACGAAAAAACC +TGGAAATCTCACCTGGTAACCTGTGCCGCTATGTACGCTGCAATCCCATTAAGCTGGCTG +GCAACCGAATAA +>test.0417.00002.0003b_00065 1386 hyuA | D-phenylhydantoinase | 3.5.2.- | similar to AA sequence:UniProtKB:Q46806 | COG:COG0044 +ATGCGCGTATTGATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGAT +TTGCTGATTGAAAGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCT +TGCGAAGAAATTGATGCCTCTGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACG +CATTTCAATATTGATGTCGGCATCGCGCGCAGTTGTGATGATTTTTTTACCGGTACCCGC +GCTGCTGCGTGTGGCGGTACAACAACCATTATTGACCATATGGGATTTGGCCCAAATGGC +TGCCGGTTACGCCATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAAAGCAGTCATC +GACTACAGCTTTCACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCG +ATGATGGTTGAGGAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTC +AACGATGATGAAGTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACC +GTACACCCGGAAAATGACGCAGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGG +TTAACCGCGCCGCGTTATCATGCCTTGAGTCGACCTCTGGAATGCGAAGCGGAAGCCATC +GCCCGCATGATTAACCTGGCACAAATTGCCGGTAACGCCCCGCTCTATATCGTGCACCTG +TCTAACGGCTTAGGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCAGCCAGTCTGG 
+GTTGAAACCTGCCCACAATATCTCCTGTTGGACGAACGCAGTTACGATACAGAAGATGGC +ATGAAGTTCATTCTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGT +GGCATCAGCGATGGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCT +CAACGCCTGCAAATTTCTAAAGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTG +GAGAACCGCATGCAACTGCTGTTCTCCAGTGGCGTGATGACGGGACGTATCTCACCGGAG +CGTTTTGTTGAGTTAACCAGTGCAATGCCCGCCAGGCTGTTTGGCCTGTGGCCACAAAAA +GGATTATTAGCGCCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACGTCAGAGCCAA +CAAATTCAGCATCGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACC +TGTCAGGGCGCGATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACC +TTTACAGGCAAAGCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTG +CTCTAA +>test.0417.00002.0004b_00066 1626 NA | hypothetical protein | NA | NA | NA +ATGAATATTTTCACAGAGGCTGCAAAACTCGAAGAGCAAAATTGTCCGTTTGCGATGGCG +CAAATTGTTGATAGCCGAGGCTCAACCCCCCGCCATTCTGCACAAATGTTAGTGCGCGCC +GATGGTTCTATCGTCGGTACAATTGGTGGCGGAATGGTTGAACGGAAGGTGATTGAAGAG +TCGCTTCAGGCATTGCAGGAACGTAAGCCGCGATTATTCCATGGACGTATGGCTCGTAAC +GGTGCGGATGCTGTCGGGTCAGATTGTGGAGGTGCAATGTCAGTATTTATCAGCGTCCAT +GGTATGCGTCCACGTCTGGTGTTGATTGGTGCGGGGCATGTCAACCGGGCGATAGCCCAG +AGTGCGGCGCTATTAGGATTTGATATCGCCGTTGCTGATATTTATCGCGAAAGCCTCAAT +CCTGAACTATTCCCACCATCAACCACGCTTCTCCATGCTGAGTCGTTTGGTGCGGCAGTG +GAAGCACTGGATATTCGCCCTGATAATTTTGTCCTGATTGCCACGAATAATCAGGATCGT +GAAGCCCTCGACAAACTCATTGAACAACCCATTGCATGGCTGGGGTTGCTGGCAAGTCGC +CGCAAGGTTCAGCTTTTCCTGCGCCAATTGCGTGAGAAAGGCGTGGCTGAAGAACATATT +GCCCGTTTACATGCGCCCGTTGGTTACAATATAGGTGCGGAAACGCCGCAAGAGATCGCC +ATCAGCGTGCTGGCAGAAATATTACAGGTGAAAAATAACGCGCCGGGTGGGCTGATGATG +AAGCCTTCTCATCCTTCCGGACACCAGCTGGTGGTGATTCGCGGTGCGGGGGATATCGCC +AGTGGTGTAGCGCTACGTCTGTATCATGCGGGTTTTAAAGTGATCATGTTGGAAGTGGAA +AAACCGACAGTGATTCGTTGTACCGTGGCGTTTGCCCAGGCCGTGTTCGATGGCGAAATG +ACGGTCGAAGGCGTCACCGCCCGCCTGGCAACCAGCTCTGCGGAAGCGATGAAACTTACC +GAACGCGGATTTATCCCTGTGATGGTAGATCCCACCTGTTCATTGCTTGATGAACTGAAA +CCGCTTTGCGTGGTGGACGCTATTCTGGCGAAACAGAATTTGGGAACGCGGGCAGATATG +GCACCAGTAACAATCGCGCTTGGGCCGGGCTTTACTGCAGGGAAGGATTGTCATGCGGTA 
+ATTGAAACAAATCGCGGGCACTGGCTCGGTCAGGTGATTTACTCAGGTTGTGCGCAGGAG +AATACCGGTGTTCCCGGCAATATTATGGGGCATACCACCCGACGAGTGATCCGCGCTCCT +GCTGCAGGCATTATGCGATCCAACGTGAAATTAGGCGATCTGGTGAAAGAGGGCGATGTC +ATTGCCTGGATTGGTGAGCATGAAATTAAAGCACCGTTGACGGGGATGGTGCGTGGCTTG +TTGAACGACGGACTGGCCGTGGTCGGTGGTTTTAAAATTGGTGATATCGATCCTCGTGGT +GAAACGGCTGATTTCACCAGCGTTTCTGATAAAGCCCGGGCGATTGGCGGCGGCGTACTT +GAGGCGTTAATGATGTTGATGCATCAGGGCGTTAAAGCGACAAAAGAAGTGCTGGAAGTG +GCTTAA +>test.0417.00002.0004i_00067 480 NA | hypothetical protein | NA | NA | NA +GTGCAGGGATTTACGCCAGAAGCGATTGATGCACTGGTACAACGACCAGAGTGTGACGTA +ATTCTCATTGAGGCAGATGGCTCGCGTGGAATGCCGTTAAAAGCGCCTGATGAGCACGAA +CCTTGCATACCTAAAAGCAGTTGCTGCGTGATTGCTGTGATGGGAGGACATATTTTGGGT +GCGAAAGTGAGCACAGAAAATGTCCATCGCTGGTCGCAGTTTGCTGATATTACTGGGTTA +ACACCTGCTGCACCCTTGCAACTGAGCGATCTCGTTGCGCTGGTTCGCCACCCTCAGGGG +GCGTTTAAAAACGTACCACAAGGTTGTCGGCGAGTCTGGTTCATTAACCGTTTTTCTCAA +TGTGAGAATGCGATTGCGCAAAGCGAGCTCCTTCAACCGCTGCAACAACACAACGTAGAG +GCAATCTGGCTGGGCGATATACAAGAACATCCTGCAATCGCGCGCAGATTTGTGAATTAG +>test.0417.00002.0004i_00068 579 mocA | Molybdenum cofactor cytidylyltransferase | 2.7.7.76 | similar to AA sequence:UniProtKB:Q46810 | COG:COG2068 +ATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATGGGGCAATGG +AAAATGATGTTACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAAAATGCGTTG +CAGTTTTGTAGCCGAATTATTTTAGTCACCGGCTATCGTGGTAATGAACTGCACGAACGT +TATGCGAACCAGAGCAATATCACTATTATCCACAACCCAGATTATGCGCAGGGTTTACTG +ACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAACATTGTTTTCTCACCCACGGA +GATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACGAAATGATGGC +GCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCAAAACCATGC +CTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTCCTTATGGGA +GAACATTATTCCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGATACTCCGGAC +GACTTTATTACAGCGAAGAAAAGGTATACTGAAATTTAG +>test.0417.00002.0004i_00069 3099 ygfK | Putative oxidoreductase YgfK | NA | similar to AA sequence:UniProtKB:Q46811 | COG:COG0493 +ATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATATTTGATGAA 
+TACCAACAACAACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCACCCGTAAAA +GGTAAAACTGTTAGCGTCTTCGGTGAAACCTGTGCCACTCCCGTCGGCCCTGCCGCTGGC +CCGCACACGCAACTTGCGCAAAACATCGTCACCTCCTGGCTGACTGGCGGACGCTTCATC +GAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGGAAAAGCCCTGTATCGATGCC +GAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAAAGCCTGGGAT +GAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAGCCTTCTGAT +TCCGGTAAATCGTTCATCTTTAATATGAGCGTCGGTTACAACCTCGAAGGTATTAAGCAA +CCGCCGATGCAGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCGAAATTCGCT +CAATACCGCGATGCACTTAATAAGCTACTCCAGAATGAGGCATTTTTAGCCCGCCACGGA +TTGCAGGAAAAACGCGAAAGCTTGCAAGCCTTACCCGCTCGCATCCCCACCAGCATGGTA +CAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGCATGAAATCGAAGCCATTTGC +CGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCCGACCTTACTG +GGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATCGGCTTAAAA +GAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTGGAACGCCTG +ATGGCACTGGCAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAACACTCTCGGC +ACCATTAATAACAAAGGCGCACTGCCTGGTGAAGAGATGTATATGTCAGGCCGTGCGCTG +TTCCCGCTCTCCATCAACGTTGCAGCAGTTCTCTCTCGCGCCTTTGACGGCAAACTGCCC +ATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCGATATTTTTGATACTGGTATT +CGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCGCTTAAGTGCC +TGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGACGTCGAACGA +CTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACACTGGAAGCCA +GAAGAGCGTATTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTTGCCCCCTGT +GTTACTGCCTGCGCTATCAAGCAAGATATTCCGGAATACATCCGTCTGCTTGGCGAACAC +CGCTATGCCGACGCGCTGGAACTCATCTATCAACGCAACGCCCTGCCCGCCATTACCGGT +CATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCCTGGATTACGACAGTGCGCTG +AATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATATAAGCAACGC +TGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGTGCAGGTCCG +GCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACGCTGTTTGAA +CGCGAAGCCAATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGTATTCCTGCA +GAGTTAATTCAGCACGATATCGATTTTGTTGCCGATCACGGCGTGAAATTTGAGTACGGT +TGCTCACCCGATTTGACCGTTGAACAGTTAAAAAATCAGGGCTTCCACTATGTTCTGATT +GCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGGGCGACAACCAAAATGTCTGG 
+AAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCTGGGCAAACAT +GTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCGTTACGCGTT +CCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATGCCAGCATGG +CGCGAAGAGTATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTGAATAATCCG +GAACGTTTCGATGCTGATGGCACCTTAACCTTGCGCGTTATGTCGCTTGGCGAACCTGAT +GAGAAAGGTCGTCGCCGTCCGGTTGAAACCAACGAAACAGTAACGCTGCATGTAGACAGC +CTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCCTGAATGCAATGGGCGTGCCG +CTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCTGACTGACGTC +TTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTCGGAACCGCG +CGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAGAACGATAAA +TACTGGAATAACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATCTCTGTCACT +CTGGTGAACAGTGACGATCGTGATGCGTTTGTCGCGCAGGAAGCCGCTCGCTGCCTTGAA +TGTAACTACGTTTGCAGCAAGTGTGTGGATGTCTGCCCGAACCGCGCCAACGTATCCATT +GCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACCTCGACGCTTACTGTAACGAA +TGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGACAAAATCACC +GTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTTGTGGAAGAT +TGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGACAGCGAAGGT +CAGTTCAACAACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGCCATGTCCAC +CAGCATCATCATTATCTGCTGGGCCGCGTGGAGGTGTAA +>test.0417.00002.0004i_00070 1329 ssnA | Putative aminohydrolase SsnA | 3.-.-.- | similar to AA sequence:UniProtKB:Q46812 | COG:COG0402 +ATGTTGATTCTGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGC +GTTGATATCGCCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGC +TATCCCGATGCCAGCTACAAAGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGC +TCGCATAACCATTTTTACTCGGGGCTTTCCCGCGGAATTATGGCAAACATCGCCCCCTGC +CCGGATTTCATCTCAACGCTGAAAAATCTCTGGTGGCGGCTCGATCGCGCCCTTGATGAA +GAGTCGCTCTATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAGCGGATGTACA +TCGGTTATCGATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGC +GACGCATTTTTAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAAC +AGCGGCATCAAAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATT +GATGAGGCGAAGAAAGCAGCAACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCAC +GCGCCGTTTACCGTACCGGATGCCGGTCTGGAGATGCTGTGTGAAGCCGTGAAAAGCACA 
+GGTCGTGGTTTGCATATTCACGCTGCGGAAGACCTTTACGACGTTTCCTACAGTCACCAT +TGGTACGGCAAAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGACAGCAAAACG +CTGGTCGCTCATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGAT +GCGTTCCTGGTGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCAC +CTTAGCGACATCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAA +GAGATGAAATTTGCCTTCTTTAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGT +TTTGCCAAAGCACTGGCTAACGGCAACGAACTGATGAGCCGCAACTTTGGCGCGAAATTT +GGGCTTCTGGAAGCCGGTTACAAAGCCGATTTAACCATTTGCGATTACAACTCGCCGACG +CCGCTGCTGGCAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTCAGGCAGCGTT +CACAGCGTGATGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGC +GATTCCATTTATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCG +CTGGCATAA +>test.0417.00002.0004i_00071 780 NA | hypothetical protein | NA | NA | NA +ATGATTGAACAATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGC +TACCAGGATGAAGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGT +ACCGATAAAAAGATTGCCATTTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGAT +AACGGTGCACTACGAATTGGCGCAATGTCTCGCTTGCAGCCACTGCGTGATGCGCGATTT +ATTCCTGCAGCACTGCGTGAAGCCCTCGGTTTTGTTTACTCACGCCATGTTCGTAATCAG +TCGACCATTGGTGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCTTCCCGTCCTG +CTGGCACTGGATGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTAC +CTGGCCTGCCCATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACC +TGTGCGACTCGCAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTT +GCAATAACAGACCACGACGGTATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTG +CGTCTGCACGATGTCGAAACTCAAAATCTGGAAGGCAATGCACTTGAACAGGCTGTCGCC +AACGCCATTTTCCCGCAGGAAGATTTGCGGGGCAGCGTGGCCTATAAACGCTATATCACG +GGAGTTCTGGTAGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGAAGCCGTATGA +>test.0417.00002.0004i_00072 2871 xdhA_2 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +ATGATCATCCACTTTACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAA +AACGTGCAAAAGCTGTTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGT +TTTGGGTTTGCCGGTTCTGACGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTG +CTTATCGCCGCACAGTTAGAGAAGGCAGATATTCGTACCGCAGAATCTCTGGGCAAATGG 
+AATGAGTTAAGTCTGGTTCAACAGGCCATGGTTGATGTTGGCGTGGTGCAGTCTGGTTAT +AACGATCCAGCTGCGGCTCTGATTATCACCGATCTTCTCGATCGCATCGACGCACCTACC +CGCGAAGAGATCGACGACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAA +TACTATCAGGTCATTGAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGAT +ATCGCTCCGACTTTCCGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGAT +GCCGCGAAAATGGTGCAGGCGAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCC +TGCGTCATTAAAATGTTACGTAGCCCACACGCTCACGCACTGATTACTCATCTGGATGTC +AGCAAAGCTGAAGCCTTACCGGGCGTCGTTCACGTTATTACTCACCTGAATTGCCCGGAT +ATTTACTATACCCCGGGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGACCGCCGAATG +TTCGGCAAGAAAATGCGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAA +GACATTGCGCTCGAAGCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTA +ATGTCGATTGACGAGGCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTG +TATGTTGCTGGTGCGCCAGATACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGC +GAGCATATGATCATCAACTTCCCGATCGGTTCTCGCCCACGCAAAAATATCGCTGCCAGT +ATTCATGGTCATATTGGCGATATGGACAAAGGCTTTGCCGATGCCGATGTGATCATTGAG +CGAACCTATAACTCAACGCAGGCGCAGCAGTGCCCGACTGAAACACATATCTGCTTTACC +CGTATGGACGGCGATCGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGC +CGCCAGGTCGCGCGCCTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGT +GTAGGCGGCGGTTTTGGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCA +ACCTGCGTGACCGGGCGTCCGGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCT +AACACCTCTCGTCACGTCGCGAAAGTCACCGTCAAACTGGGCGCGAAAAAAGATGGTCGC +CTGACGGCAGTGAAGATGGATTTCCGCGCCAACACGGGTCCTTACGGTAACCACTCACTC +ACCGTACCGTGTAACGGACCGGCGCTGTCGCTGCCGTTATATCCATGCGATAACGTCGAT +TTTCAGGTCACCACCTACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGC +GCGCCGAAAGGTAACTTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAG +ATCGACCAACTGGAAATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATT +CTCGGTGCGATTGGTGAAGGTAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCA +CTGGAAGAGATCCTGCGTCAGGGTCGCGAGATGATCCAATGGTCTTCACCAAAACCACAA +AACGGTGACTGGCACATCGGTCGTGGCGTCGCCATTATCATGCAGAAATCGGGTATCCCG +GATATCGATCAGGCTAACTGCATGATCAAACTGGAATCAGACGGTACCTTTATCGTTCAT +TCTGGCGGTGCGGATATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAA +GTGCTGCACTGCCCCCCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTG 
+TTTGATAAAGGCGCATATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTG +GCAGCGGAAAATCTGCGGGAGAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCA +GTGGCAGATGTTCAACTAGCAACGCCGGGCGTCGTTCGCGGCAAGAAAGGCGAAGTTAGT +TTCGGAGAGATAGCCCATAAAGGCGAAACCGGCACCGGCTTTGGTTCACTGGTGGGAACT +GGCAGTTATATCACGCCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGCTGAAGTTGCC +GTCAACACGCGTACGGGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGT +ACACCGGTCAATCCAGAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATC +GGCCACAGTATGAGCGAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGAT +TTACGCAGTTACGGCGCACCGAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTG +GTGCCGAGCGACGATAAAGTCGGCCCATTCGGGGCGAAATCGATCTCGGAAATCGGTGTA +AATGGCGCCGCTCCGGCGATTGCTACCGCAATTCACGATGCCTGCGGCATCTGGTTACGC +GAATGGCATTTCACACCGGAGAAAATACTCACCGCGCTGGAAAAAATATAA +>test.0417.00002.0004i_00073 1401 xanQ | Xanthine permease XanQ | NA | similar to AA sequence:UniProtKB:P67444 | COG:COG2233 +ATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTGAACTGGAGGATCGCCCTCCC +TTTCATCAGGCTCTCGTAGGTGCCATTACCCATCTGTTGGCAATTTTCGTTCCGATGGTA +ACCCCCGCGTTAATCGTGGGTGCGGCCTTACAGCTTTCCGCTGAAACAACTGCCTATCTT +GTTTCTATGGCGATGATCGCCTCTGGTATTGGTACCTGGTTACAAGTAAACCGCTACGGC +ATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATTTTTCATTTGTTACGGTCATG +ATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACGAAGAGTTAATCATGTCGTCG +CTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCGGCTCTTCTTTTATCCTGCCC +TATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTGTGGTGCTGATGATCGGCTTA +AGCCTGATTAAAGTTGGCATTATTGATTTTGGCGGTGGTTTTGCAGCTAAAAGCAGCGGT +ACGTTCGGCAATTACGAGCATCTCGGCGTTGGCTTATTGGTTTTGATTGTGGTGATCGGC +TTTAACTGCTGCAGCAGTCCGTTGCTACGCATGGGTGGGATCGCCATTGGGCTATGTGTC +GGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCAGCAGTGTGCGCAATTTGCCG +TTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTTTTAGCTTCCATCAGTTCCTG +GTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTGTCGGCGATATCACCGCCACG +GCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATCAGTCCCGACTGAAAGGCGGC +GTGCTGGCAGATGGTCTGGTTTCTGTTATCGCCTCCGCTGTCGGTTCATTACCATTAACC +ACGTTTGCGCAAAATAATGGGGTTATTCAGATGACTGGCGTCGCTTCACGTTATGTCGGG +CGAACCATCGCGGTAATGCTGGTTATCCTCGGCTTATTTCCGATGATTGGCGGCTTCTTC 
+ACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGTTGATGTTTTCCATGATTGCC +ATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGCGCCGAGAAACACTTATTGTC +GCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATCCCGAAATTTTTAAAATATTG +CCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTGCTGGCGGGTTAACTGCGATT +TTATTAAATATTATCCTCCCTGGTGGCTACCGACAGGAAAACGTTCTGCCTGGTATTACC +TCAGCGGAAGAGATGGATTAA +>test.0417.00002.0004i_00074 1317 guaD | Guanine deaminase | 3.5.4.3 | similar to AA sequence:UniProtKB:P76641 | COG:COG0402 +ATGTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACG +GTCGATAACCCGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTC +ATTAAACAGGGAAAAGTGGAATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCT +GACACCATTCGCGTGCGCGACTATCGCGGCAAACTGATAGTACCGGGCTTTGTCGATACA +CATATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATGGTGAACAATTGCTGGAGTGG +TTGAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTACGCCCGCGAG +ATGTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTT +GGCACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATG +CGTATGATTGCCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACT +GCCGAAAGCAGCTATCACCAAAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGT +CTGTTGTATGCGATTACGCCACGCTTCGCCCCTACCTCATCTCCTGAACAGATGGCGATG +GCGCAACGCCTGAAAGAAGAATATCCGGATACATGGGTACATACCCATCTCTGTGAAAAC +AAAGATGAAATTGCCTGGGTGAAATTGCTTTATCCTGACCATGATGGTTATCTTGATGTT +TACCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAA +GAAAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCC +AACCTTTACCTCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAA +GTGGGCATGGGAACAGATATCGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAAC +GAAGCCTACAAGGTATTGCAATTACAAGGCTATCGCCTCTCGGCATATGAAGCGTTTTAC +CTGGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACGATTTGATTGGCAACTTTTTA +CCTGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCTACAGCAGCTG +CGCTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGAT +GACCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAA +>test.0417.00002.0004i_00075 1368 ghxQ | Guanine/hypoxanthine permease GhxQ | NA | similar to AA sequence:UniProtKB:Q46817 | COG:COG2252 
+ATGTCTGGAGACATCCTACAAACACCGGACGCACCAAAGCCACAGGGCGCGCTGGATAAT +TATTTTAAAATTACCGCTCGTGGCAGTACCGTTCGTCAGGAAGTACTGGCTGGCTTAACG +ACCTTTCTGGCCATGGTTTATTCCGTTATCGTCGTTCCGGGAATGCTGGGCAAAGCAGGT +TTTCCTCCCGCAGCTGTGTTTGTTGCCACCTGTCTGGTCGCGGGCTTCGGCTCGTTGCTG +ATGGGGTTATGGGCCAATTTGCCAATGGCGATTGGTTGCGCTATTTCCTTGACGGCGTTT +ACCGCATTCAGTCTGGTACTCGGGCAACAAATTAGCGTTCCTGTCGCACTGGGCGCAGTC +TTTCTGATGGGCGTCATCTTCACCGCTATTTCCGTAACCGGTGTGCGTACCTGGATCTTA +CGTAATTTGCCGATGGGGATCGCTCACGGTACAGGTATCGGTATCGGCCTGTTTCTGCTG +CTGATTGCTGCTAACGGTGTGGGAATGGTTATCAAAAACCCGATTGAAGGCTTGCCAGTG +GCGCTCGGTGCGTTTACCTCCTTCCCGGTGATGATGAGCTTACTGGGGCTGGCGGTCATC +TTCGGTCTGGAAAAGTGCCGCGTACCCGGCGGGATCTTGTTGGTGATTATTGCAATTTCG +ATCATCGGCTTAATCTTTGACCCAGCGGTGAAGTACCACGGTCTGGTGGCAATGCCAAGC +CTGACTGGCGAAGATGGTAAGTCTCTGATTTTCAGCCTCGATATTATGGGCGCACTCCAG +CCAACTGTACTTCCGAGTGTACTGGCATTGGTGATGACCGCAGTGTTCGACGCCACTGGC +ACCATCCGTGCCGTCGCCGGTCAGGCGAATTTGTTGGATAAAGACAACCAGATCATCAAC +GGCGGCAAAGCCCTGACCAGTGACTCAGTAAGTTCAATATTCTCCGGCCTGGTGGGCGCA +GCGCCCGCGGCGGTTTATATCGAATCAGCGGCAGGAACCGCCGCCGGGGGGAAAACCGGT +TTAACCGCAACCGTGGTTGGTGTGTTGTTCCTGATGATTCTGTTTTTATCACCGTTATCG +TTTCTGATCCCCGGTTATGCCACAGCTCCCGCACTGATGTACGTGGGTTTGCTGATGTTA +AGCAACGTCTCGAAGCTGGATTTCAACGATTTTATTGACGCAATGGCTGGCCTGGTGTGT +GCCGTGTTCATCGTTCTGACTTGTAATATCGTTACCGGTATTATGCTGGGCTTTGTAACA +CTGGTGGTGGGTCGCGTCTTTGCGCGCGAATGGCAAAAGCTGAATATTGGTACGGTGATC +ATTACTGCCGCACTGGTCGCGTTTTACGCGGGTGGTTGGGCAATCTAA +>test.0417.00002.0004i_00076 489 hyfA | Hydrogenase-4 component A | 1.-.-.- | similar to AA sequence:UniProtKB:P23481 | COG:COG1142 +ATGAAATCGTTAATTATCGTTAATCCGGCTGACTGTATTGGCTGCCGTACTTGTGAAGTG +GCCTGTGTGGTCGCTCACCCTTCAGAACAGGAGTTGAATGCCGATATCTTTTTACCCCGG +CTGAAGGTACAACGGCTGGATAGCATCAGTGCGCCGGTGATGTGCCATCAGTGTGAAAAC +GCCCCTTGTGTTGGCGCTTGCCCCGTGGGGGCGCTGACGATGGGCGAGCAGGTGGTGCAG +GCCAATTCTGCCCGTTGTATTGGCTGTCAGAGTTGCGTTAGCGCGTGCCCGTTTGGGATG +ATCACCATTCAGTCATTGCCGGGTGATCCCCGGCAACAAATCGTGAAATGCGATCTCTGT +GAACTGCGGGAAGAGGGGCCAGCCTGCGTTGAATCTTGCCCGACACAGGCGCTGCAGTTG 
+CTGACTGAAAGAGAACTCAGGCGTATCCGCCAGCAGCGTATTGCTGCCAGCAGTGAGAAT +CCTCTCTGA +>test.0417.00002.0004i_00077 1920 NA | Ferredoxin--NADP reductase | 1.18.1.2 | protein motif:HAMAP:MF_01685 | NA +ATGAATAAGTTTATCGCTGCTGAAGCTGCGGAATGTATAGGCTGCCATGCTTGTGAAATT +GCCTGTGCGGTGGCACATAATCAAGAAAACTGGCCGCTGAGTCACAGTGACTTTCGACCG +CGTATCCACGTTGTAGGGAAAGGCCAGGCTGCGAATCCGGTGGCCTGCCATCACTGCAAC +AATGCCCCTTGCGTTACGGCTTGTCCGGTTAATGCTCTGACTTTCCAGTCCGATAGCGTA +CAACTGGACGAGCAAAAATGTATTGGTTGTAAAAGATGCGCAATCGCTTGCCCCTTTGGC +GTCGTTGAGATGGTCGATACGATTGCACAGAAATGCGACCTTTGTAACCAGCGCAGTTCC +GGCACGCAAGCCTGTATTGACGTCTGCCCAACACAGGCGTTACGGCTGATGGACGATAAA +GGGTTGCAGCAGATAAAGGTGGCCCGCCAGCGCAAAACGGCAGCAGGAAAAGCGTCATCA +GACGCTCAGCCATCTCGCAGTGCAGCGTTGCTCCCCGTTAACTCGCGTAAAGGCGCAGAT +AAAATTTCAGCGAGTGAACGGAAAACCCACTTTGGCGAAATCTATTGCGGGCTGGATCCA +CAACAAGCGACTTATGAGAGTGACCGCTGTGTTTATTGTGCCGAAAAAGCTAACTGCAAC +TGGCATTGTCCGCTGCATAACGCTATTCCGGATTACATCCGTCTGGTACAGGAAGGAAAG +ATTATTGAAGCGGCAGAACTTTGCCACCAGACCAGTTCCTTACCCGAAATCTGCGGCAGG +GTATGTCCACAGGACCGTCTTTGTGAAGGTGCATGTACTTTGAAAGATCACTCTGGCGCA +GTCTCTATCGGTAATCTGGAACGCTACATCACCGATACTGCGCTGGCGATGGGCTGGCGT +CCCGATGTCAGCAAAGTTGTTCCCCGTAGCGAAAAAGTGGCGGTGATTGGCGCTGGACCT +GCAGGATTAGGGTGTGCTGATATTCTGGCGCGCGCGGGAGTTCAGGTTGATGTCTTTGAT +CGCCATCCAGAAATTGGCGGTATGCTGACTTTTGGCATTCCTCCTTTCAAACTCGATAAA +ACGGTATTAAGCCAGCGGCGAGAGATATTCACCGCAATGGGAATCGATTTCCATCTCAAC +TGTGAAATTGGCCGCGATATCTCTTTCAACGAATTAACGGCGGAATATGATGCTGTTTTC +CTCGGCGTGGGGACTTACGGGATGATGCGAGCAGATCTGCCGCATGAAGATGCGCCTGGT +GTCATTCAGGCGTTACCGTTCCTGACCGCCCATACCCGCCAGCTCATGGGATTGCCGGAG +TCTGCAGAGTATCCGCTGACGGATGTGGAAGGGAAGCGAGTCGTGGTATTGGGCGGTGGC +GATACGACAATGGATTGTTTGCGGACTTCCATCCGCCTTAATGCTGCCAGCGTGACCTGT +GCGTATCGTCGTGATGAAGTCAGTATGCCGGGTTCGCGCAAAGAGGTGGTCAATGCCCGC +GAGGAAGGTGTTGAGTTTCAGTTCAATGTTCAGCCGCAATATATCGCTTGTGATGAAGAT +GGACGCTTAACGGCGGTGGGCCTGATTCGTACCGCTATGGGTGAGCCGGGGCCGGATGGT +CGCCGTCGTCCTCGTCCGGTTGCGGGTTCAGAGTTTGAATTGCCCGCCGATGTTCTCATT +ATGGCCTTTGGTTTCCAGGCACATACCATGCCGTGGTTGCAGGGCAGCGGAATTAAACTC 
+GATAAATGGGGCCTGATTCAAACCGGCGACGTCGGGTATTTACCTACCCAGACGCATCTG +AAAAAAGTCTTTGCTGGTGGTGATGCAGTTCATGGCGCGGATCTGGTTGTCACTGCAATG +GCCGCAGGAAGGCAGGCGGCGCGCGATATGTTAACTCTGTTTGATACGAAGGCATCGTGA +>test.0417.00002.0004i_00078 1449 uacT | Uric acid transporter UacT | NA | similar to AA sequence:UniProtKB:Q46821 | COG:COG2233 +ATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGACCGCCCAACTGATGAG +GTTGACCGCATATTATCACCAGGAAAGCTGATCATACTCGGTCTGCAACACGTCCTTGTC +ATGTACGCAGGTGCAGTCGCTGTTCCTCTTATGATTGGTGACCGACTCGGCCTATCAAAA +GAAGCTATTGCGATGCTCATCAGCTCGGATCTCTTTTGCTGCGGGATCGTCACATTATTG +CAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGCCGGTGATTATGTCGGTGACC +TTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGATATCGGCCTGCTGGGG +ATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATTAGCGCCACTTATCGGT +CGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGATTACTTCTATCGGGCTT +AGCATCATTCAGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGGGAATCCGCAATATGGT +AATCCCGTTTATTTAGGTATCTCCTTTGCCGTCTTAATTTTTATCTTGCTCATTACTCGC +TATGCGAAAGGATTTATGTCCAACGTCGCCGTATTACTGGGGATTGTATTTGGCTTTTTA +CTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTACATGATGCTTCATGGTTTGCG +ATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGTTTCCATTCTGACCATG +ACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTTCCTGGCACTGGGTGAA +ATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTTACGCGTAGATGGGGTT +GGGACAATGATTGGAGGCACGTTTAACAGCTTCCCACATACGTCATTTTCGCAGAACGTC +GGGCTGGTCAGCGTGACGCGCGTCCACAGCCGCTGGGTGTGCATTGCTTCCGGTATCATT +TTGATCCTGTTCGGCATGGTGCCCAAAATGGCGGTGCTGGTGGCCTCGATTCCGCAATTT +GTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTACTGGCGACAGGGATTCGAATT +CTGTCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATATTGTGGCGATCAGTCTC +GGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAAGTTACCGGCCGTACTG +CAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGCCGTTGTGCTGAACGTC +TTCTTTAATGGCTACCAGCATCATGCTGACCTGGTGAAGGAATCCGTCTCTGATAAAGAT +TTAAAAGTCAGGACAGTACGTATGTGGCTTCTGATGCGCAAGCTGAAGAAAAATGAGCAT +GGAGAATAA +>test.0417.00002.0004i_00079 126 yqfG | putative protein YqfG | NA | similar to AA sequence:UniProtKB:C1P614 | NA +ATGAATCTTTTAATGCGCGCTATATTCAGTCTGCTGTTGCTTTTTACTCTCTCTATTCCT 
+GTCATTTCTGATTGTGTTGCAATGGCCATTGAAAGTCGCTTCAAATATATGATGCTGCTT +TTTTAA +>test.0417.00002.0004i_00080 549 idi | Isopentenyl-diphosphate Delta-isomerase | 5.3.3.2 | similar to AA sequence:UniProtKB:Q46822 | COG:COG1443 +ATGCAAACGGAACACGTCATTTTATTGAATGCACAGGGAGTTCCCACGGGTACGCTGGAA +AAGTATGCCGCACACACGGCAGACACCCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTT +AATGCCAAAGGGCAATTATTAGTTACCCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGC +GTGTGGACTAACTCGGTTTGTGGGCACCCACAACCGGGAGAAAGCAACGAAGAGGCGGTG +ATCCGCCGTTGCCGTTATGAGCTTGGCGTAGAAATTACGCCTCCTGAATCTATCTATCCT +GACTTTCGCTACCGCGCCACCGATCCGAATGGCATTGTGGAAAATGAAGTGTGTCCGGTA +TTTGCCGCACGCACGACCAGTGCGTTACAGATCAACGATGATGAAGTGATGGATTATCAA +TGGTGTGATTTAGCAGCGGTTTTACGCGGTATTGATGCTACGCCGTGGGCGTTCAGTCCG +TGGATGGTGATGCAGGCGACAAATCGCGAAGCCAGAAAACGATTATCTGCATTTACCCAG +CTTAAATAA +>test.0417.00002.0004i_00081 1518 lysS | Lysine--tRNA ligase | 6.1.1.6 | similar to AA sequence:UniProtKB:P0A8N3 | COG:COG1190 +ATGTCTGAACAACACGCACAGGGCGCTGACGCGGTAGTCGATCTTAACAATGAACTGAAA +ACGCGTCGTGAGAAGCTGGCGAACCTGCGTGAGCAGGGGATTGCCTTCCCGAACGATTTC +CGTCGCGATCATACCTCTGACCAATTGCACGCAGAATTCGACGGTAAAGAGAACGAAGAA +CTGGAAGCGCTGAACATCGAAGTCGCCGTTGCTGGCCGCATGATGACCCGTCGTATTATG +GGTAAAGCGTCTTTCGTTACCCTGCAGGACGTTGGCGGTCGCATTCAGTTGTACGTTGCC +CGTGACGATCTGCCGGAAGGCGTTTACAACGAGCAGTTCAAAAAATGGGACCTCGGCGAT +ATCCTCGGCGCGAAAGGTAAACTGTTCAAAACCAAAACCGGCGAACTGTCTATCCACTGT +ACCGAGCTGCGTCTGCTGACCAAAGCACTGCGTCCGCTGCCGGATAAATTCCACGGCTTG +CAGGATCAGGAAGCGCGCTATCGTCAGCGTTATCTGGATCTCATCTCTAACGATGAATCC +CGCAACACCTTTAAAGTGCGCTCGCAGATCCTCTCTGGTATTCGCCAGTTCATGGTGAAT +CGCGGCTTTATGGAAGTTGAAACGCCGATGATGCAGGTGATCCCTGGCGGTGCCGCTGCG +CGTCCGTTCATCACCCACCATAACGCGCTGGATCTCGACATGTACCTGCGTATCGCGCCG +GAACTGTACCTCAAGCGTCTGGTGGTCGGTGGCTTCGAGCGTGTATTCGAAATCAACCGT +AACTTCCGTAACGAAGGTATTTCCGTACGTCATAACCCAGAGTTCACCATGATGGAACTC +TATATGGCTTACGCAGATTACAAAGATCTGATCGAGCTGACCGAATCGCTGTTCCGTACT +CTGGCACAGGATATTCTCGGTAAGACGGAAGTGACCTACGGCGACGTAACGCTGGACTTC +GGTAAGCCGTTCGAAAAACTGACCATGCGTGAAGCGATCAAGAAATATCGCCCGGAAACC 
+GACATGGCAGATCTGGACAACTTCGACTCTGCGAAAGCGATTGCTGAATCTATCGGCATC +CACGTTGAGAAGAGCTGGGGTCTGGGCCGTATCGTTACCGAGATCTTCGAAGAAGTGGCA +GAAGCACATCTGATCCAGCCGACCTTCATTACTGAATATCCGGCAGAAGTTTCTCCTCTG +GCGCGTCGTAACGACGTTAACCCGGAAATCACAGACCGCTTTGAGTTCTTCATTGGTGGG +CGTGAAATCGGTAACGGCTTTAGCGAGCTGAATGACGCGGAAGATCAGGCGCAGCGCTTC +CTGGATCAGGTTGCCGCGAAAGATGCAGGTGACGACGAAGCGATGTTCTACGACGAAGAT +TATGTCACCGCACTGGAACATGGCTTACCACCGACAGCCGGTCTGGGAATTGGTATCGAC +CGTATGGTAATGCTGTTCACCAACAGCCATACCATCCGCGACGTTATTCTGTTCCCGGCG +ATGCGTCCGGTAAAATAA +>test.0417.00002.0004i_00082 882 prfB | Peptide chain release factor RF2 | NA | similar to AA sequence:UniProtKB:P07012 | COG:COG1186 +ATGAAACAGGGGCTGGAAGATGTTTCTGGTCTGCTGGAACTGGCTGTAGAAGCTGACGAC +GAAGAAACCTTTAACGAAGCCGTTGCTGAACTCGACGCCCTGGAAGAAAAACTGGCGCAG +CTTGAGTTCCGCCGTATGTTCTCTGGCGAATATGACAGCGCCGACTGCTACCTCGATATT +CAGGCGGGGTCTGGCGGTACGGAAGCACAGGACTGGGCGAGCATGCTTGAGCGTATGTAT +CTGCGCTGGGCTGAATCGCGTGGTTTCAAAACTGAAATCATCGAAGAGTCGGAAGGTGAA +GTGGCGGGTATTAAATCCGTGACGATCAAAATCTCCGGCGATTACGCTTATGGCTGGCTG +CGTACAGAAACCGGCGTTCACCGCCTGGTGCGTAAGAGCCCGTTTGACTCCGGTGGTCGT +CGCCACACGTCGTTCAGCTCCGCGTTTGTTTACCCGGAAGTTGATGATGATATCGATATC +GAAATCAATCCGGCGGATCTGCGCATCGACGTTTATCGCGCATCCGGCGCGGGCGGTCAG +CACGTTAACCGTACCGAATCTGCGGTGCGTATTACTCACATCCCAACCGGGATCGTGACC +CAATGCCAGAACGACCGTTCCCAGCACAAGAACAAAGACCAGGCCATGAAGCAGATGAAA +GCGAAGCTTTATGAACTGGAGATGCAGAAGAAAAATGCCGAGAAACAGGCGATGGAAGAT +AACAAATCCGACATCGGCTGGGGCAGCCAGATTCGTTCTTATGTCCTTGATGACTCCCGC +ATTAAAGATCTGCGTACCGGGGTAGAAACCCGCAACACGCAGGCCGTGCTGGACGGCAGC +CTGGATCAATTTATCGAAGCAAGTTTGAAAGCAGGGTTATGA +>test.0417.00002.0004i_00083 1734 recJ | Single-stranded-DNA-specific exonuclease RecJ | 3.1.-.- | similar to AA sequence:UniProtKB:P21893 | COG:COG0608 +GTGAAACAACAGATACAACTTCGTCGCCGAGAAGTCGATGAAACGGCCGACTTGCCCGCT +GAATTGCCTCCCTTGCTGCGCCGTTTATATGCCAGCCGGGGTGTGCGTAGCGCGCAGGAA +CTGGAACGCAGTGTTAAAGGCATGCTGCCCTGGCAGCAACTGAGCGGCGTCGAAAAGGCC +GTTGAGATCCTTTACAACGCTTTTCGCGAAGGAACGCGGATTATTGTGGTCGGTGATTTC 
+GACGCCGACGGTGCGACCAGCACGGCTCTAAGCGTGCTGGCGATGCGCTCGCTTGGTTGC +AGCAATATCGACTACCTGGTTCCAAACCGTTTCGAAGACGGTTACGGCTTAAGCCCGGAA +GTAGTCGATCAGGCTCATGCCCGTGGCGCGCAGTTAATTGTCACGGTGGATAACGGTATT +TCCTCCCATGCGGGGGTTGAACACGCTCGTTCGTTGGGCATTCCGGTTATTGTTACCGAT +CACCATTTGCCAGGCGACACATTACCCGCAGCGGAAGCGATCATTAACCCTAACTTGCGC +GACTGTAATTTCCCGTCGAAATCACTGGCAGGCGTGGGTGTGGCGTTTTATCTGATGCTG +GCGCTGCGCACCTTTTTGCGCGATCAGGGCTGGTTTGATGAGCGCGGCATCGCAATTCCT +AATCTGGCAGAACTGCTGGATCTGGTAGCGTTGGGGACAGTGGCGGACGTCGTGCCGCTG +GACGCTAATAATCGCATTCTGACCTGGCAGGGGATGAGTCGCATCCGTGCCGGAAAGTGC +CGTCCGGGGATTAAAGCGCTGCTGGAAGTGGCCAATCGCGATCCACAAAAACTCGCCGCC +AGCGATTTAGGTTTTGCGCTGGGGCCACGTCTCAATGCTGCCGGGCGACTGGACGATATG +TCCGTTGGCGTGGCGCTGTTGTTGTGTGACAACATTGGCGAAGCGCGTGTGCTGGCGAAT +GAACTCGATGCACTAAACCAAACACGTAAAGAGATCGAACAGGGAATGCAGGTTGAAGCG +CTCACTCTGTGCGAGAAGCTGGAACGTAGCCGCGACACGCTGCCAGGTGGGCTGGCAATG +TATCACCCTGAATGGCATCAGGGCGTTGTTGGCATTCTGGCATCGCGTATCAAAGAGCGT +TTTCACCGTCCGGTTATCGCCTTTGCGCCTGCGGGCGACGGTACGCTGAAAGGTTCCGGT +CGCTCCATTCAGGGGCTGCATATGCGCGATGCGCTGGAGCGGCTAGACACGCTTTACCCC +GGCATGATGCTCAAGTTTGGCGGCCATGCGATGGCGGCGGGTTTGTCGCTGGAAGAGGAG +AAATTCGAACTCTTTCAGCAACGCTTTGGCGAACTGGTTACCGAGTGGTTAGATCCTTCT +TTATTGCAAGGGGAAGTGGTATCAGACGGCCCATTAAGTGCGGCAGAGATGACCATGGAA +GTGGCGCAACTGCTGCGTGATGCTGGCCCGTGGGGACAAATGTTCCCGGAACCGTTGTTT +GACGGTCATTTCCGTCTGCTGCAACAGCGGCTGGTGGGCGAGCGTCATTTGAAAGTCATG +GTCGAGCCGGTCGGCGGCGGTCCGCTGCTGGATGGTATTGCTTTTAATGTCGATACCGCC +CTCTGGCCGGATAACGGCGTGCGCGAAGTGCAACTGGCTTACAAGCTCGATATCAACGAG +TTTCGCGGCAACCGCAGCCTGCAAATTATCATCGACAATATCTGGCCAATTTAG +>test.0417.00002.0004i_00084 711 dsbC | Thiol:disulfide interchange protein DsbC | NA | similar to AA sequence:UniProtKB:P0AEG6 | COG:COG1651 +ATGAAGAAAGGTTTTATGTTATTTACCTTGTTGGCAGCGTTTTCAGGCTTTGTTCAGGCT +GATGACGCGGCAATTCAACAAACGTTAGCCAAAATGGGCATCAAAAGCAGCGATATTCAG +CCCGCGCCCGTAGCTGGCATGAAGACAGTTCTGACTAACAGCGGTGTGTTGTACATCACC +GATGATGGTAAACATATCATTCAGGGGCCAATGTATGACGTTAGTGGCACGGCTCCGGTC +AATGTCACCAATAAGATGCTGTTAAAGCAGTTGAATGCGCTTGAAAAAGAGATGATCGTT 
+TATAAAGCGCCGCAGGAAAAACACGTCATCACCGTGTTTACTGATATTACCTGTGGTTAC +TGCCACAAACTGCATGAGCAAATGGCAGACTATAACGCGCTGGGGATCACCGTGCGTTAT +CTTGCTTTCCCGCGCCAGGGGCTGGACAGCGATGCAGAGAAAGAAATGAAAGCTATCTGG +TGTGCGAAAGATAAAAACAAAGCGTTTGATGATGTGATGGCAGGTAAAAGCGTCGCACCA +GCCAGCTGCGACGTGGATATTGCCGACCATTACGCACTTGGCGTCCAGCTTGGCGTTAGC +GGTACTCCGGCAGTTGTGCTGAGCAATGGCACACTTGTTCCGGGTTACCAGCCGCCGAAA +GACATGAAAGAATTCCTCGACGAACACCAAAAAATGACCAGCGGTAAATAA +>test.0417.00002.0004i_00085 897 xerD | Tyrosine recombinase XerD | NA | similar to AA sequence:UniProtKB:P0A8P8 | COG:COG4974 +GTGAAACAGGATCTGGCACGCATCGAGCAGTTTCTTGATGCTCTGTGGCTGGAAAAAAAT +CTGGCTGAAAATACGTTGAACGCTTACCGTCGCGATCTGTCAATGATGGTGGAGTGGTTG +CATCACCGCGGGTTGACGCTGGCGACGGCGCAAAGTGACGATTTGCAGGCATTACTGGCA +GAACGGCTGGAGGGCGGGTATAAAGCCACCAGCTCAGCGCGTTTGCTGAGTGCAGTGCGC +CGATTGTTCCAGTATCTTTATCGCGAAAAGTTTCGTGAAGATGATCCCAGTGCGCATCTC +GCTTCACCGAAATTGCCCCAGCGTTTGCCAAAAGATTTAAGCGAAGCGCAGGTCGAACGT +TTATTACAGGCACCATTAATTGATCAGCCACTGGAGCTACGCGATAAAGCCATGCTTGAA +GTGTTGTATGCTACCGGACTGCGTGTCTCTGAACTGGTCGGGCTGACAATGAGTGATATC +AGCCTGCGTCAGGGCGTGGTGCGGGTCATTGGTAAAGGCAACAAAGAGCGCCTGGTGCCG +TTAGGTGAAGAGGCGGTTTACTGGCTGGAAACCTATCTGGAACATGGGCGTCCGTGGCTG +TTGAATGGTGTGTCAATTGACGTGTTGTTTCCCAGCCAGCGTGCGCAGCAGATGACGCGA +CAGACCTTCTGGCACCGCATTAAACATTATGCCGTGCTGGCGGGTATCGACAGCGAAAAG +CTGTCACCGCATGTGTTGCGTCACGCTTTTGCCACTCACTTATTAAATCATGGTGCGGAT +TTACGCGTGGTGCAGATGCTACTGGGCCACAGCGATCTCTCCACCACGCAAATTTATACG +CATGTCGCTACCGAGCGTCTGCGACAACTTCATCAACAGCATCACCCGCGGGCGTGA +>test.0417.00002.0004i_00086 522 fldB | Flavodoxin 2 | NA | similar to AA sequence:UniProtKB:P0ABY4 | COG:COG0716 +ATGAATATGGGTCTTTTTTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAA +ATCCGCGATATTATCGGCCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCG +AAATTAATGGAGCAGTACGATGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAA +ATCCAGGAAGACTGGGAAGCCGTCTGGGATCAGCTCGACGACCTGAACCTCGAAGGTAAA +ATTGTTGCGCTGTATGGGCTTGGCGATCAACTGGGATACGGCGAGTGGTTCCTCGATGCG +CTCGGTATGCTGCATGACAAACTCTCGACCAAAGGCGTGAAGTTCGTCGGCTACTGGCCA 
+ACGGAAGGATATGAATTTACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTG +GGTCTGGCGCTGGATGAAACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGG +TGCGAGCAAATCCTCAACGAAATGGCAGAGCATTACGCCTGA +>test.0417.00002.0004i_00087 408 ygfX | Inner membrane protein YgfX | NA | similar to AA sequence:UniProtKB:Q46824 | NA +GTGGTCCTGTGGCAATCTGATTTGCGCGTCTCCTGGCGCGCACAGTGGCTTTCCTTGCTG +ATTCATGGGCTGGTTGCCGCTGTTATTTTACTCATGCCCTGGCCGCTCAGTTACACCCCG +TTATGGATGGTGTTACTTTCGCTGGTGGTGTTTGATTGCGTTCGCAGCCAGCGGCGCATT +AATGCTCGCCAGGGGGAAATTCGCTTGTTGATGGACGGGCGTTTGCGTTGGCAAGGGCAG +GAGTGGAGCATCGTCAAAGCGCCGTGGATGATTAAGAGCGGCATGATGCTGCGTTTACGT +TCTGACAGCGGAAAACGGCAACATTTATGGCTGGCAGCTGACAGCATGGACGAAGCCGAA +TGGCGGGATTTACGGCGGATATTGTTACAACAAGAGACGCAAAGATAA +>test.0417.00002.0004i_00088 267 sdhE | FAD assembly factor SdhE | NA | similar to AA sequence:UniProtKB:P64559 | COG:COG2938 +ATGGACATTAACAACAAAGCCCGCATTCATTGGGCATGCCGCCGTGGTATGCGCGAACTC +GATATTTCAATCATGCCGTTTTTCGAACATGAGTACGACAGCTTAAGCGATGACGAAAAA +CGCATCTTTATTCGTCTGCTGGAATGTGACGATCCGGACCTGTTTAACTGGCTGATGAAT +CACGGTAAACCAGCCGATGCAGAACTGGAAATGATGGTCCGACTCATCCAGACACGGAAC +CGGGAACGTGGTCCTGTGGCAATCTGA +>test.0417.00002.0004i_00089 981 ygfZ | tRNA-modifying protein YgfZ | NA | similar to AA sequence:UniProtKB:P0ADE8 | COG:COG0354 +ATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGACG +CTGATGACGCTTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATAT +ATGCAAGGCCAGGTGACAGCAGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGCC +GCCCATTGCGACGCCAAAGGTAAAATGTGGAGCAATTTACGTCTGTTCCGCGACGGCGAT +GGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCACAGCTGACTGAACTGAAAAAA +TATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCTGCTTGGTGTT +GCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGAA +AAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACGT +TTCCTGATCGTAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGAA +GCGGAACTGAACAATAGCCAACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGTG +ATTGATGCCGCCAACAGCGGGCAGTTTATCCCCCAGGCGACCAACCTCCAGGCGCTGGGC +GGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGATGGTGGCGCGAGCAAAATTC 
+CGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCGACTGCCGGAA +GCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCTG +GCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATATG +GAACCGGACAGCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACTG +CCATATTCGCTGGAAGAGTAA +>test.0417.00002.0004i_00090 660 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67153 | NA +ATGGTTCAGAAGCCCCTCATTAAGCAGGGATATTCGCTGGCAGAGGAAATTGCCAACAGC +GTCAGTCACGGCATTGGGCTGGTGTTTGGTATCGTTGGGCTGGTGTTGCTACTGGTTCAG +GCGGTGGATCTCAATGCCAGCGCCACGGCGATAACCAGTTACAGCCTCTATGGCGGCAGT +ATGATCCTGCTGTTCCTCGCTTCGACGCTCTATCACGCCATTCCCCATCAACGGGCAAAA +ATGTGGCTGAAGAAATTTGACCACTGTGCCATTTATCTGTTGATTGCCGGAACCTATACG +CCGTTTTTGCTGGTGGGGCTGGATTCTCCGTTAGCGCGCGGGTTGATGATTGTTATCTGG +AGCCTGGCATTGCTGGGTATTCTGTTTAAACTGACCATCGCGCACCGATTCAAAATTTTA +TCTCTGGTGACCTATCTGGCGATGGGCTGGCTGTCGCTGGTGGTAATTTATGAAATGGCA +GTTAAGCTCGCGGCGGGCAGCGTTACCTTACTGGCGGTAGGCGGTGTGGTTTATTCGCTC +GGGGTGATTTTCTACGTCTGCAAGCGCATTCCATACAATCATGCCATCTGGCACGGCTTT +GTGCTCGGCGGTAGTGTGTGCCACTTTCTGGCGATCTATTTGTATATTGGGCAGGCGTAA +>test.0417.00002.0004b_00091 312 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67603 | NA +ATGCAGCCAAACGACATCACTTTTTTTCAACGTTTCCAGGATGACATTCTGGCTGGGCGT +AAAACCATCACCATCCGCGACGAGTCTGAATCGCACTTCAAAACGGGTGATGTGCTTCGT +GTCGGACGTTTTGAAGATGACGGTTATTTTTGCACGATTGAAGTCACCGCAACCTCAACC +GTAACGCTGGATACGCTGACGGAAAAACATGCAGAGCAGGAAAATATGACCCTGACTGAA +CTGAAAAAGGTCATTGCCGACATCTATCCCGACCAGACACAGTTTTATGTGATTGAATTT +AAATGTCTTTAA +>test.0417.00002.0005b_00092 984 bglA | 6-phospho-beta-glucosidase BglA | 3.2.1.86 | similar to AA sequence:UniProtKB:Q46829 | COG:COG2723 +GTGGTTGATTTCTTTGTCCGTTTCGCGGAAGTGGTATTTGAACGCTATAAGCATAAAGTC +AAATACTGGATGACTTTCAACGAAATTAACAACCAGCGTAACTGGCGTGCACCGCTGTTC +GGTTACTGCTGCTCCGGCGTGGTGTATACCGAGCATGAAAACCCGGAAGAGACGATGTAT +CAGGTGCTGCATCACCAGTTTGTCGCCAGCGCCCTGGCGGTGAAAGCCGCGCATCGCATC +AACCCGGAGATGAAAGTCGGTTGTATGCTGGCGATGGTGCCGCTCTATCCTTACTCCTGT 
+AACCCGGACGATGTGATGTTTGCCCAGGAGTCGATGCGCGAACGTTACGTCTTTACCGAT +GTGCAGTTGCGTGGCTATTACCCGTCCTATGTGTTGAACGAGTGGGAACGCCGCGGATTT +AACATCAAAATGGAAGACGGCGATCTGGATGTACTGCGCGAAGGCACCTGCGATTATCTC +GGCTTCAGCTATTACATGACCAACGCGGTGAAGGCCGAAGGTGGCACCGGCGATGCGATT +TCTGGTTTCGAAGGCAGCGTACCGAATCCGTATGTTAAAGCGTCTGACTGGGGCTGGCAG +ATTGATCCGGTTGGTCTGCGCTACGCACTTTGCGAGCTGTATGAGCGTTACCAGAAGCCG +CTGTTTATTGTCGAAAACGGTTTTGGCGCTTACGACAAAGTGGAAGATGATGGCAGCATC +AATGACGATTACCGCATTGATTACCTGCGTGCCCATATTGAAGAGATGAAAAAAGCGGTG +ACTTACGATGGCGTGGACCTGATGGGCTACACGCCGTGGGGCTGCATCGACTGTGTGTCG +TTCACCACCGGGCAGTACAGCAAACGCTACGGCTTTATCTATGTGAATAAACATGACGAC +GGTACTGGCGATATGTCGCGTTCACGTAAGAAGAGCTTTAACTGGTACAAAGAGGTGATT +GCCAGCAACGGCGAGAATCTGTAA +>test.0417.00002.0005i_00093 2874 gcvP | Glycine dehydrogenase (decarboxylating) | 1.4.4.2 | similar to AA sequence:UniProtKB:P33195 | COG:COG0403 +ATGACACAGACGTTAAGCCAGCTTGAAAACAGCGGCGCTTTTATTGAACGCCATATCGGA +CCGGACGCCGCGCAACAGCAAGAAATGCTGAATGCCGTTGGCGCACAATCGTTAAACGCG +CTGACCGGCCAGATTGTGCCGAAAGATATTCAGCTTGCGACTCCGCCGCAGGTTGGCGCA +CCGGCGACCGAATACGCCGCACTGGCAGAACTCAAGGCTATTGCCAGTCGCAATAAACGC +TTCACGTCTTACATCGGCATGGGTTACACCGCCGTGCAGCTACCGCCGGTTATCCTGCGT +AACATGCTGGAAAATCCGGGCTGGTATACCGCGTATACTCCGTATCAACCTGAAGTCTCC +CAGGGCCGCCTTGAAGCACTGCTCAACTTCCAGCAGGTAACGCTGGATTTAACCGGGCTG +GATATGGCCTCTGCTTCTCTTCTTGACGAAGCCACCGCTGCCGCCGAAGCAATGGCGATG +GCGAAACGCGTCAGCAAACTGAAAAATGCCAACCGCTTCTTTGTTGCTTCTGACGTTCAT +CCGCAAACGCTGGATGTGGTCCGTACTCGTGCCGAAACCTTTGGTTTTGAAGTGATTGTC +GATGACGCGCAAAAAGTGCTCGACCATCAGGACGTTTTCGGCGTGCTGTTACAGCAGGTC +GGCACTACTGGTGAAATTCACGACTACACCGCGCTTATTAGCGAACTGAAATCACGCAAA +ATTGTGGTCAGCGTTGCCGCCGATATTATGGCGCTGGTGCTGTTAACTGCGCCAGGTAAA +CAGGGCGCGGATATTGTTTTTGGTTCGGCGCAACGCTTTGGCGTACCGATGGGCTATGGT +GGCCCACACGCGGCATTCTTTGCGGCGAAAGACGAATACAAACGCTCAATGCCGGGCCGT +ATTATCGGTGTATCGAAAGATGCAGCTGGCAACACCGCTCTGCGCATGGCGATGCAGACT +CGCGAGCAACATATTCGTCGTGAGAAAGCGAACTCCAACATTTGTACTTCCCAGGTACTG +CTGGCAAACATTGCCAGCCTGTATGCCGTTTATCACGGTCCGGTTGGCCTGAAACGTATC 
+GCTAATCGCATCCACCGTCTGACCGATATCCTGGCGGCGGGCCTGCAACAAAAAGGTCTG +AAGCTGCGCCATGCGCACTATTTCGATACTTTGTGTGTGGAAGTGGCCGACAAAGCGGGC +GTGCTGGCGCGTGCCGAAGCGGCTGAAATCAACCTGCGTAGCGATATTCTGAACGCGGTT +GGGATCACCCTTGATGAAACAACCACGCGCGAAAACGTGATGCAGCTTTTCAGCGTGCTG +TTGGGCGATAACCACGGGCTGGACATCGACACACTGGACAAAGACGTGGCTCACGACAGT +CGCTCTATTCAGGCTGCGATGCTGCGCGACGACGAAATCCTCACCCATCCGGTGTTTAAT +CGCTACCACAGCGAAACCGAAATGATGCGCTATATGCACTCGCTGGAGCGTAAAGATCTG +GCGCTGAATCAGGCGATGATCCCGCTGGGTTCCTGCACCATGAAACTGAACGCCGCCGCC +GAGATGATCCCGATCACCTGGCCGGAATTTGCCGAACTGCACCCGTTTTGCCCGCCAGAA +CAGGCTGAAGGTTATCAGCAGATGATCGCGCAGCTGGCTGACTGGCTGGTGAAACTGACC +GGTTACGACGCCGTTTGTATGCAGCCGAACTCTGGCGCACAGGGCGAATACGCGGGCCTG +CTGGCGATTCGTCATTATCATGAAAGCCGCAACGAAGGGCATCGCGATATCTGCCTGATC +CCGGCTTCTGCGCACGGCACTAACCCGGCTTCCGCGCATATGGCAGGAATGCAGGTGGTG +GTTGTGGCGTGTGATAAAAACGGCAACATCGATCTGACTGATCTGCGCGCGAAAGCGGAA +CAGGCGGGCGATAACCTCTCCTGTATCATGGTGACCTATCCTTCTACCCACGGCGTGTAT +GAAGAAACGATCCGTGAAGTGTGTGAAGTCGTGCATCAGTTCGGCGGTCAGGTTTACCTT +GATGGCGCGAACATGAACGCTCAGGTTGGCATCACCTCGCCGGGCTTTATTGGTGCGGAC +GTTTCCCACCTTAACCTGCATAAAACTTTCTGCATTCCGCATGGCGGTGGTGGTCCGGGT +ATGGGACCGATCGGTGTGAAAGCGCATCTGGCTCCGTTTGTACCGGGTCATAGCGTGGTG +CAAATCGAAGGCATGTTAACCCGTCAGGGCGCGGTTTCTGCGGCACCGTTCGGTAGTGCC +TCTATCCTGCCAATCAGCTGGATGTACATCCGCATGATGGGCGCAGAAGGGCTGAAAAAA +GCAAGCCAGGTGGCAATTCTTAACGCCAACTATATTGCCAGCCGTCTGCAGGATGCCTTC +CCGGTGCTGTATACCGGTCGCGACGGTCGCGTGGCGCACGAATGTATTCTCGATATTCGC +CCGCTGAAAGAAGAAACCGGCATCAGCGAGCTGGATATTGCCAAGCGCCTGATCGACTAC +GGTTTCCACGCGCCGACCATGTCGTTCCCGGTGGCGGGTACGCTGATGGTTGAACCGACT +GAATCTGAAAGCAAAGTGGAACTGGATCGCTTTATCGATGCGATGCTGGCTATCCGCGCA +GAAATTGATCAGGTGAAAGCCGGTGTCTGGCCGCTGGAAGATAACCCGCTGGTGAATGCG +CCGCACATTCAAAGCGAACTGGTCGCCGAGTGGGCGCATCCGTACAGCCGTGAAGTTGCA +GTATTCCCGGCAGGTGTGGCAGACAAATACTGGCCGACCGTGAAACGTCTGGATGATGTT +TACGGCGACCGTAACCTGTTCTGCTCCTGCGTACCGATTAGCGAATACCAGTAA +>test.0417.00002.0005i_00094 390 gcvH | Glycine cleavage system H protein | NA | similar to AA sequence:UniProtKB:P0A6T9 | COG:COG0509 
+ATGAGCAACATACCAGCAGAACTGAAATACAGCAAAGAACACGAATGGTTGCGTAAAGAA +GCCGACGGCACTTACACCGTTGGCATCACCGAACACGCTCAGGAGCTGTTAGGCGATATG +GTGTTTATTGACCTACCGGAAGTGGGCGCAACGGTTAGCGCGGGCGATGACTGCGCGGTT +GCCGAATCGGTAAAAGCGGCGTCAGACATTTATGCGCCAGTAAGCGGTGAAATCGTGGCG +GTAAACGATGCACTGAGCGATTTCCCGGAACTGGTGAACAGCGAACCGTATGCAGGCGGC +TGGATTTTCAAAATCAAAGCCAGCGATGAAAGCGAACTGGAATCACTGCTGGATGCAACC +GCATACGAAGCATTGTTAGAAGACGAGTAA +>test.0417.00002.0005b_00095 1164 gcvT | Aminomethyltransferase | 2.1.2.10 | similar to AA sequence:UniProtKB:P27248 | COG:COG0404 +ATGCTGGGTTTCGTGGTGATAATTTCGCCATGGAAAAGTTGTCAGCCCCGCTTATTCAAT +GAGGACAAGATGGCACAACAGACTCCTTTGTACGAACAACACACGCTTTGCGGCGCTCGC +ATGGTGGATTTCCACGGCTGGATGATGCCGCTGCATTACGGTTCGCAAATCGACGAACAT +CATGCGGTACGTACCGATGCCGGAATGTTTGATGTGTCACATATGACCATCGTCGATCTT +CGCGGCAGCCGCACCCGGGAGTTTCTACGTTATCTGCTGGCGAACGATGTGGCGAAGCTC +ACCAAAAGCGGCAAAGCCCTTTACTCGGGGATGTTGAATGCCTCTGGCGGTGTGATAGAT +GATCTCATCGTCTACTACTTTACTGAAGATTTCTTCCGCCTCGTTGTTAACTCCGCCACC +CGCGAAAAAGACCTCTCCTGGATTACCCAACACGCTGAACCTTTCGGCATCGAAATTACT +GTTCGTGATGACCTTTCCATGATCGCCGTACAAGGGCCGAATGCGCAGGCAAAAGCTGCC +ACACTGTTTAATGACGCCCAGCGTCAGGCGGTGGAAGGGATGAAACCGTTCTTTGGCGTG +CAGGCGGGCGATCTGTTTATTGCCACCACCGGTTACACCGGTGAAGCGGGCTACGAAATT +GCGCTGCCCAATGAAAAAGCGGCCGATTTCTGGCGCGCGCTGGTGGAAGCTGGCGTTAAG +CCATGTGGCCTGGGCGCGCGTGACACGCTGCGTCTGGAAGCGGGCATGAATTTGTATAGC +CAGGAGATGGACGAAACTATTTCTCCTTTAGCCGCCAATATGGGCTGGACTATCGCCTGG +GAACCGGCAGATCGTGACTTTATCGGTCGTGAAGCTCTGGAAGCGCAGCGTGAACATGGC +ACAGAAAAACTGGTTGGTCTGGTGATGACCGAAAAAGGCGTGCTGCGTAATGAACTGCCG +GTACGTTTTACTGATGCGCAGGGCAACCAGCATGAAGGCATTATCACCAGCGGTACTTTC +TCCCCAACGCTGGGTTATAGCATTGCGCTGGCGCGCGTGCCGGAAGGTATTGGTGAAACG +GCGATTGTGCAAATTCGCAACCGTGAAATGCCGGTTAAAGTGACGAAACCTGTTTTTGTG +CGTAACGGCAAAGCCGTCGCGTGA diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test_runprokka_H299.gen b/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test_runprokka_H299.gen new file mode 100644 index 
0000000000000000000000000000000000000000..63213ba8c0e58ae157f95eafbe54438464d4209f --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Genes/test_runprokka_H299.gen @@ -0,0 +1,213 @@ +>test_runprokka_H299.0001b_00001 543 NA | hypothetical protein | NA | NA | NA +GTGAAAACGGGGTCCGAAGCCATCCGGGCGCTGGCCATGCAGATCCCGGCATTTCGTCAG +AAACTGAGCGACGGCTGGTACCAGGTACGCATTGCCGGGCGTGATGCAGGTGAAACCGAA +TTGTCTGCCCGTCTTAATGAGCCGCTGGAAAATGGTGCCGTGATCCATATCGTGCCGCGT +CTGGCAGGAGCCAAAAGTGGCGGTGTGTTTCAGGCTGTGCTGGGGGCGGCTGTTATGGCG +GTTGCTATATGGATGCCGGGGGTAGGAATTATGGCGAGTAATCTGCTGTTTTCTCTCGGT +GCCAGTATGACGCTTGGCGGTGTTGCACAGATGCTGGCCCCTAAACCCAAAACCCCCCGC +ACACAGACAACGGATAACGGCAAACAGAATACCTATTTTTCTTCACTGGATAACATGGTT +GCCCAGGGCAATGTTCTGCCGGTTCTGTACGGTGAAATGCGCGTGGGGTCACGCGTGGTT +TCTCAGGAGATCAGCACGGCAGACGAAGGGGATGGTGGTCAGGTTGTGGTGATTGGTCGC +TGA +>test_runprokka_H299.0001i_00002 600 NA | hypothetical protein | NA | NA | NA +ATGTCGCCGGAGGACTGGCTGAGTGCAGAAATGCAGAGAGAGATTGTGGCGCTGGTCCAC +AGCCACCCCGGTGGTCTGCCCTGGCTGAGTGAGGCCGACCGGCGGCTGCAGGTACAGAGT +GATTTGCCGTGGTGGCTGGTCTGCCGGGGGGCGATTCATAAATTCCGCTGTGTGCCGCAT +CTCACCGGGCGGCGCTTTGAGCACGGGGTAACGGACTGTTACACGCTGTTCCGGGACGCT +TACCATCTGGCGGGAATTGAGATGCCGGATTTTCATCGCGGGGATGACTGGTGGCGTAAC +GGTCAGAATCTCTATCTGGATAATCTGGAGGCCACAGGGCTGTATCAGGTGCCGTTGTCA +GCGGCGCAGCCGGGCGATGTGCTGCTGTGCTGTTTTGGTTCATCGGTGCCGAATCATGCC +GCCATTTACTGTGGTGACAGCGAGCTGCTGCACCATATTCCTGAACAACTGAGCAAACGA +GAGAGGTACACCGACAAATGGCAGCGACGCACACACTCCCTCTGGCGTCACCGGGCATGG +CACGCATCTGCCTTTACGGGGATTTACAACGATTTGGCCGCCGCATCGACCTTCGAGTGA +>test_runprokka_H299.0001i_00003 699 NA | hypothetical protein | NA | NA | NA +ATGCAGGACATACAACAGGAAACGCTGAATGAATGCATTCGTGCGGAGCAGTCGGCCAGC +GTGGTGCTCTGGGAAATCGACCTGACCGAGGTAGGCGGGGATCGCTACTTTTTCTGTAAT +GAGCAGAACGAAAAAGGTGAGTCTGTCACCTGGCAGAGTCGGCAGTATCAGGCCTATCCC +ATTCAGGGGAGTGGATTTGAGATGAACGGCAAGGGCAGTGCTGCCCGTCCGACACTGACG +GTCTCTAACCTGCACGGCATGATCACCGGGATGGCGGAAGATCTGCAGAGTCTGGTCGGC +GGAACGGTGGTCCGGCGTAAGGTTTACGCCCGCTTTCTGGATGCGGTGAACTTCGTCAAC 
+GGAAACAGCGAAGCCGATCCGGAGCAGGAGGTGATCAGCCGCTGGCGCATCGAGCAGTGC +AGCGAACTGAGCGCGGTCAGTGCCTCTTTTGTACTGTCCACGCCGACTGAAACGGATGGC +GCTGTTTTTCCGGGACGTATCATGCTGGCCAACACCTGCACCTGGACCTATCGCGGCGAT +GAGTGCGGTTATAGCGGTCCGGCGGTCGCGGATGAATATGACCAGCCGACGTCCGATATC +ACGAAGGATAAATGCAGCAAATGCCTGAGTGGCTGTAAGTTTCGCAATAATGTCGGCAAC +TTTGGCAGCTTCCTTTCCATTAACAAACTTTCGCAGTAA +>test_runprokka_H299.0001i_00004 297 NA | hypothetical protein | NA | NA | NA +ATGAAAACAGAAAATAAACCATCGATAAAAACTGTAAGATTTGGCGATGGTTATGAGCAA +CGAAGTCCAAATGGACTTAATCATTCTCTGCGCGTTTTCACCTGTGATTTCAAAGTTGAG +GCGAATGAACGTGATTCATTTGAAAAATTTTTAGCCCGGCATGAAGGCTATAAATCTTTT +TTTTGGCGCCCGCCGGGTATTAACAGAAAAATCAGAGTGGTGTGTCGAACGTGGTCAGCG +ACAGAACATATCACCTATACCGATTTTTCGTGTCAGTTTGACGAAGTGGTGATCTGA +>test_runprokka_H299.0001b_00005 936 NA | hypothetical protein | NA | NA | NA +TTGCAGGCTTCGATTGATAATCGTCAGCAGGGGTATGATATTCAGATTGCTGGTTATGGG +GTTGGCGATAAAAATCAGCAACGCCAGCAGGAATTACTGCGGATTGAACATGGATATAAC +AATCAGCGTCTGCAACTTGAACGTGACTATGCAGATAAATCCCGTGGAATGTCAGATCAT +GTTTTTCAAGAGAAAATGCAGGCTCTGAATGATGCTCTGGAACGGGAAAAAGAAATTGTC +AGACAGAAAAACGAGCAGCTCGATATTCAGGCAGGAGACTGGGTTAGTGGTGCCTCCCAG +GGATTCAATAACTGGCTGGATGACACTAAGGATATCAGTGAGCAGATAAAATCAACCACG +ACTCAGATGTTTGATGGGATGACCGATGCGCTGGGTGATTTTGTCACGACAGGCAAGGCA +AATTTTCGTTCTTTCGCTACTTCCGTGATTTCGGATCTTAGTCGAATAGCATTAAAGGCT +TCAATTACTGGGATTTTCGACAGCATTAGTAACAGTTCTTCTGGGGGGATTTTAGGAACT +ATCGGGAGTGCTATTAGTAAATTTATTCCGAATGCAAAGGGCGGTGTTTATGAGTCTCCG +TCATTGAGCACGTATTCGAACGGTATTTATGATTCCCCGCAATTTTTTGCTTTTGCAAAA +GGGGCTGGTGTTTTTGGTGAGGCTGGACCGGAAGCCATTATGCCATTAACACGAACTTCC +GATGGTTCTCTTGGTGTCAGAGCTATTAATAGTAAAAGTGGTAATGGAGGCGGAGATATT +ACCTATGCCCCTGTATACCAAATCACTATTCAAAATGACGGCCAGAATGGAGAGATTGGC +CCTCAGGCAATAAAAGCACTTATGGGGATGGTTGATCAGCGGGTGCAGGGCAATCTGTTA +AATATGCGACGTGATGGGGGAATGTTAAGTGGCTAA +>test_runprokka_H299.0002b_00006 543 NA | hypothetical protein | NA | NA | NA +GTGAAAACGGGGGCTGAAGCCATCCGGGCGCTGGCCACACAGCTCCCGGCGTTTCGTCAG +AAACTGAGCGACGGCTGGTATCAGGTACGGATTGCCGGGCGTGATACAGGTGAAACGGAA 
+TTATCAGCCCGTCTTAATGAACCGCTGGCAAATGGTGCTGTGATCCATATCGTGCCGCGT +CTGGCAGGAGCCAAAAGTGGCGGTGTGTTTCAGGCTGTGCTGGGGGCGGCTGTTATGGCG +GTTGCTATATGGATGCCGGGGGTAGGAATTATGGCGAGTAATCTGCTGTTTTCTCTCGGT +GCCAGTATGACGCTTGGCGGTGTTGCACAGATGCTGGCCCCTAAACCCAAAACCCCCAGC +ACACAGACAACGGATAACGGCAAACAGAACACCTATTTTTCTTCACTGGATAATATGGTT +GCCCAGGGCAATGTTCTGCCCGTTCTGTACGGTGAAATGCGCGTGGGATCACGTGTGGTA +TCTCAGGAGATCAGCACAGCAGATGAAGGTGATGGTGGTCAGGTTGTGGTGATTGGTCGC +TGA +>test_runprokka_H299.0002i_00007 744 NA | hypothetical protein | NA | NA | NA +ATGACAGAGACAGAATCAGCGATTCTGGCGCACGCCCGGCGATGTGCGCCAGCGGAGTCG +TGCGGCTTCGTGGTGAGAACGCCGGAAGGGGAAAGATATTTCCCCTGCGTGAATATCTCC +GGTGAGCCGGAGGCGTATTTCCGGATGTCGCCGGAGGACTGGCTGCGGGCAGAGATGCAG +GGTGAGATTGTGGCGCTGGTCCACAGCCACCCCGGTGGTCTGCCCTGGCTGAGTGAGGCC +GACCGGCGGCTGCAGGTGCAGAGTGATTTGCCGTGGTGGCTGGTCTGCCGGGGGACGATT +CATAAGTTCCGCTGTGTGCCGCATCTCACCGGGCGGCGCTTTGAGCACGGGGTGACGGAC +TGTTACACGCTGTTCCGGGATGCTTATCATCTGGCGGGGATTGAGATGCCGGATTTTCAT +CGCGAGGATGACTGGTGGCGTCACGGTCAGAATCTCTATCTGGATAATCTGGAGGCCACA +GGGTTGTATCAGGTGCCGTTGTCATCAGCACAACCGGGCGATGTGCTGCTGTGCTGTTTT +GGTTCATCGGTGCCGAATCATGCCGCCATTTACTGTGGTGATGGCGAGCTGCTGCACCAT +ATTCCTGAACAACTGAGCAAACGAGAGAGGTATACCGACAAATGGCAGCGACGCACACAC +TCCCTCTGGCGTCACCGGGCATGGCGCGCATCTGCCTTTACGGGGATTTACAACGATTTG +GTCGCCGCATCGACCTTCGTGTGA +>test_runprokka_H299.0002i_00008 699 NA | hypothetical protein | NA | NA | NA +ATGCAGGATATCCGGCAGGAAACACTGAATGAATGCACCCGTGCGGAGCAGTCGGCCAGC +GTGGTGCTCTGGGAAATCGACCTGACAGAGGTCGGTGGAGAACGTTATTTTTTCTGTAAT +GAGCAGAACGAAAAAGGTGAGCCGGTCACCTGGCAGGGGCGACAGTATCAGCCGTATCCC +ATTCAGGGGAGCGGTTTTGAACTGAATGGCAAAGGCACCAGTACACGCCCCACGCTGACG +GTTTCTAACCTGTACGGTATGGTCACCGGGATGGCGGAAGATATGCAGAGTCTGGTCGGC +GGAACGGTGGTCCGGCGTAAGGTTTACGCCCGTTTTCTGGATGCGGTGAACTTCGTCAAC +GGAAACAGCGACGCCGATCCGGAGCAGGAGGTGATCAGCCGCTGGCGCATCGAGCAGTGC +AGCGAACTGAGCGCGGTCAGTGCCTCCTTTGTACTGTCCACGCCGACGGAAACGGATGGT +GCCGTTTTTCCGGGGCGCATCATGCTGGCTAATACCTGCACCTGGACCTATCGCGGTGAT +GAGTGCGGTTATCACGGTCCGGCTGTCGCGGATGAATATGATCAGCCGACGTCCGATATC 
+ACGAAGGATAAATGCAGCAAATGCCTGAATGGCTGTAAGTTTCGCAATAACGTCGGCAAC +TTTGGCGGCTTCCTTTCCATTAACAAACTTTCGCAGTGA +>test_runprokka_H299.0002i_00009 330 NA | hypothetical protein | NA | NA | NA +ATGAAAACCTTCCGCTGGAAAGTGAAACCCGGTATGGATGTGGCTTCGGCCCCTTCTGTA +AGAAAGGTGCGCTTTGGTGATGGCTATTCCCAGCGAGCGCCTGCCGGGCTGAATGCCAAC +CTGAAAACGTACAGCGTGACGCTTTCTGTCCCCCGTTGGGAGGCCACGGTACTGGAGTCG +TTTCTGGAAGAGCACGGGGGCTGGAAAGCCTTTCTGTGGACGCCGCCTTATGAGTGGCGG +CAGATAAAGGTGACCTGCGCAAAATGGTCGTCGCGGGTCAGTATGCTGCGTGTTGAGTTC +AGCGCAGAGTTTGAACAGGTGGTGAACTGA +>test_runprokka_H299.0002i_00010 2580 NA | hypothetical protein | NA | NA | NA +ATGGCTGAACCGGTAGGCGATCTGGTCGTTGATTTGAGTCTGGATGCGGCCAGATTTGAC +GAGCAGATGGCCAGAGTCAGGCGTCATTTTTCCGGTACGGAAAGTGATGCGAAAAAAACA +GCGGCAGTCGTTGAACAGTCGATGAGCCGGCAGGCGCTGGCTGCACAGAAAGCGGGGATT +TCCGTCGGGCAGTATAAAGCCGCCATGCGTATGCTGCCTGCGCAGTTCACCGACGTGGCC +ACGCAGCTTGCAGGCGGGCAGAGTCCGTGGCTGATCCTGCTGCAACAGGGTGGTCAGGTG +AAGGACTCCTTCGGCGGGATGATCCCCATGTTCAGGGGGCTTGCCGGTGCGATCACCCTG +CCGATGGTGGGGGCCACCTCGCTGGCGGTGGCGACCGGTGCGCTGGCGTATGCCTGGTAT +CAGGGTAACTCAACCCTGTCCGATTTCAACAAAACGCTGGTCCTTTCCGGCAATCAGGCG +GGACTGACGGCAGATCGTATGCTGGTCCTGTCCAGAGCCGGGCAGGCGGCAGGGCTGACG +TTTAACCAGACCAGCGAGTCACTGACGGCGCTGGTGAATGCCGGTGTGCGTGGTGGTGAG +CAGTTTGAGGCGATCAGCCAGAGTGTGGCGCGTTTCTCCTCTGCATCCGGTGTGGAGGTG +GACAAGGTCGCTGAAGCCTTCGGGAAGCTGACCACAGACCCGACGTCGGGGTTGACGGCG +ATGGCACGCCAGTTCCATAACGTGACGGCGGAACAGATTGCGTATGTTGCTCAGTTGCAG +CGTTCCGGCGATGAAGCCGGGGCATTGCAGGCGGCGAACGAGGCCGCAACGAAAGGGTTT +GATGACCAGACCCGACGCCTGAAAGAGAACATGGGCACGCTGGAGACCTGGGCAGACAGG +ACAGCACGGGCATTCAAATCCATGTGGGATTCGGTGCTGGATATTGGTCGCCCGGACACT +GCCCAGGGAATGCTGGAGAAAGCAGAAAAGGCTTTTGATGAGGCGGACAAAAAATGGCAG +TGGTATCAGAGCCGGAGCCACCGGCGCGGTAAAACCTCAGCATTTCTTGCCAATCTCCGG +GGAGCATGGGAGGACAGAGCGAATGCGCAACTTGGGCTTTCCGCCGCCACGTTGCAGGCC +GATCTTGAAAAGGCCAGAGAGATGGCAGCAAAGGACTGGGCCGAGTCTGAGGCATCACGG +CTGAAATATACCGAAGAGGCGCAGAAGGCTTACGAACGCCTGCAGACGCCGCTGGAGAAA +TATACCGCCCGTCAGGAAGAACTGAACAAGGCACTGAAAGACGGGAAAATCCTGCAGGCA 
+GATTACAACACGCTGATGGCGGCGGCGAAAAAGGATTATGAAGCGACGCTGAAAAAGCCG +AAACAGTCCGGCGTGAAGGTGTCTGCGGGCGATCGTCAGGAAGACAGTGCTCATGCTGCC +CTGCTGACGCTTCAGGCAGAACTCCGGACGCTGGAGAAGCATGCCGGAGCGAATGAGAAA +ATCAGCCAGCAGCGCCGGGATTTGTGGAAGGCAGAAAGTCAGTTCGCGGTACTGGAGGAG +GCGGCACAACGTCGCCAGCTGTCCGCACAGGAGAAATCCCTGCTGGCGCATAAAGATGAG +ACGCTGGAGTACAAACGCCAGCTGGCTGCACTTGGCGACAAGGTTACGTATCAGGAGCGC +CTGAACGCGCTGGCGCAGCAGGCGGATAAATTCGCACAGCAGCAACGGGCAAAACGGGCC +GCCATTGATGCGAAAAGCCGGGGGCTGACTGACCGGCAGGCAGAACGGGAAGCCACGGAA +CAGCGCCTGAAGGAACGGTATGGCGATAATCCGCTGGCGCTGAATAACGTCATGTCAGAG +CAGAAAAAGACCTGGGCGGCTGAAGACCAGCTTCGCGGGAGCTGGATGGCAGGCCTGAAG +TCCGGCTGGAGTGAGTGGGAAGAGAGCGCCACGGACAGTATGTCGCAGGTAAAAAGTGCA +GCCACGCAGACCTTTGATGGTATTGCACAGAATATGGCGGCGATGCTGACCGGCAGTGAG +CAGAACTGGCGCAGCTTCACCCGTTCCGTGCTGTCCATGATGACAGAAATTCTGCTTAAG +CAGGCAATGGTGGGGATTGTCGGGAGTATCGGCAGCGCCATTGGCGGGGCTGTTGGTGGC +GGCGCATCCGCGTCAGGCGGTACAGCCATTCAGGCCGCTGCGGCGAAATTCCATTTTGCG +ACTGGGGGATTTACGGGAACCGGCGGCAAATATGAGCCAGCGGGGATTGTTCACCGTGGT +GAGTTTGTCTTCACGAAGGAGGCAACCAGCCGGATTGGCGTGGGGAATCTTTACCGGCTG +ATGCGCGGCTATGCCACCGGCGGTTATGTCGGTACACCGGGCAGCATGGCAGACAGCCGG +TCGCAGGCGTCCGGGACGTTTGAGCAGAATAACCATGTGGTGATTAACAACGACGGCACG +AACGGGCAGATAGGGCCACAGGCGCTGAAGGCTGTTTATGACGTAGCCCGTAAGGCGGCA +ATGGATGTTGTGACCGGGCAGATGCGCGATGGTGGCCTGTTCTCCGGAGGTGGACGATGA +>test_runprokka_H299.0002i_00011 435 NA | hypothetical protein | NA | NA | NA +GTGTTCGACGGTGAGCTGAGTTTTGCCCTGAAACTGGCGCGTGAAATGGGGCGACCCGAC +TGGCGCGCCATGCTTGCCGGGATGTCATCCACGGAGTATGCCGACTGGCACCGCTTTTAC +AGTACCCATTATTTTCATGATGTTCTGCTGGATATGCACTTTTCCGGGCTGACGTACACC +GTGCTCAGCCTGTTTTTCAGCGATCCGGATATGCATCCGCTGGATTTCAGTCTGCTGAAC +CGGCGTGAGGCTGACGAAGAGCCTGAAGATGATGTGCTGATGCAGAAAGCGGCAGGGCTT +GCCGGAGGCGTTCGTTTTGGCCCGGACGGGAATGAAGTTATCCCCGCTTCCCCGGATGTG +GCGGACATGACGGAGGATGACGTAATGCTGATGACAGTATCAGAAGGGATCGCAGGAGGA +GTCCGGTATGGCTGA +>test_runprokka_H299.0002i_00012 423 NA | hypothetical protein | NA | NA | NA +ATGTTCCTGAAAACCGAATCATTTGAACATAACGGTGTGACCGTCACGCTTTCTGAACTG 
+TCAGCCCTGCAGCGTATTGAGCATCTTGCCTGGTTGAAAGAGCAGGAAAAAAAGGCTGAA +TCCAGTGGCAACCTGCAGGTGTCTGTAGAGGATCTTATCAGAGGCGGGGCGTTTCTGGTG +GCGATGTCTCTGTGGCATAACCATCCGCAGAAGACAAAGCTGCCGTCCATGAATGAAGCC +GTTAAACAGATTGAGCAGGAAGTGCTTACCACCTGGCCCACGGAGGCAATTGCTCAGGCT +GAAAACGTGGTGTTACGTCTGTCCGGAATGTCTGAGTTTGTTGTGAATAATGCCCCTGAA +CAGGCAGATGATGCCGGGCCTGCAGAGCCTGTTTCTGCGGGAAAGTGTTCGACGGTGAGC +TGA +>test_runprokka_H299.0002i_00013 741 NA | hypothetical protein | NA | NA | NA +ATGCCTGTACCAAATCCTACAATGCCGGTGAAAGGTGCCGGGACCACCCTGTTGGTTTAT +AAGGGGAGCGGTGACCCTTATGCGAACCCGCTTTCAGACGTTGACTGGTCGCGTCTGGCT +AAAGTTAAAGACCTGACGCCCGGCGAACTGACCGCTGAGTCCTATGACGACAGCTATCTC +GATGATGAAGATGCGGACTGGGCTGCGACCGGGCAGGGGCAGAAATCTGCCGGAGATACC +AGCTTCACGCTGGCGTGGATGCCCGGAGAGCAGGGGCAGCAGGCGCTGCTGGCGTGGTTT +AATGAAGGGGATACCCGTGCCTATAAAATCCGCTTCCCGAACGGCACGGTCGATGTGTTC +CGCGGCTGGGTCAGCAGTATCGGTAAGGCGGTGACGGCGAAGGAAGTGATCACCCGCACG +GTGAAAGTCACCAACGTGGGACGTCCGTCGATGGCAGAAGATCGCAGCACGGTCACAGCG +GCAACCGGCATGACCGTGACGCCTGCCAGCACTTCGGTGGTGAAAGGGCGGAGCACCACG +CTGACCGTGGCATTCCAGCCGGAAGGCGCAACCGACAAGAGCTTCCGTGCGGTGTCTGCG +GATAAAACAAAAGCCACCGTGTCGGTCAGTGGTATGACCATCACCGTGAAAGGTGTTGCT +GCAGGCAAGGTCAACATTCCGGTCGTATCCGGTAATGGTGAACTTGCTGCGGTTGCAGAA +ATCAACGTCACCAACAGCTAA +>test_runprokka_H299.0002b_00014 156 NA | hypothetical protein | NA | NA | NA +ATGGAGTCCCGGATTTATCCGGTGATGAGCGATATCCCGGCGCTGTCAGATTTGATCACC +AGTATGGTGGCCAGTGGCTATGACTACCGGCGCGACGATGATGCGGGCCTGTGGAGTTCA +GCCGATCTGACGTATGTCATTACCTATGAAATGTGA +>test_runprokka_H299.0003b_00015 708 NA | hypothetical protein | NA | NA | NA +TTGTTTTATGTGCTTACAACAATAACAATGTTTTTCTTCTATTTTATACGAAAAGGGAAG +GTTGTTAAGCTATTTTTCTTTCATTATATCTCAAAAAATAAAGTTTACGAAACTTTTATT +TTTGGCCTTTACCAGCTCCCTCATGTTTTAAGCTCTTGGGTAAGGCTTGGATATGATAGA +CTGGTATTGGGGGAACTAATATCAATGAGCTATGTTGGCGGATATTCGGTTGCAGTTCAA +ATATCTCTTGTGTCTAGCGTGATATTTCAATCATTAAATAGGTTTTGGACCCCTTTCTTT +ATTAAAAAATTAAAGGAGAATAGTAAACAAAAAAAAATTATTGTTCTTGGAGGTTTTGGA +ATTATCTGCATAACAATACTTAATATACTATTTGGTTACGCATATTTTATTTTTTTCTTG 
+CCCACAAATTATTCATCATTCTCCAATGCTCTTCCTATATTATGTATGGCATATATGTTT +CAGGGGCTATATTTTTTGATTGTTAATTATATATATTATCATGATGGTAATAAATTGATA +TCAATTCCATCCGTTGCCTCGATCGCTATACATATAGCTGTTGCCCCAGTTTTGATAAAA +CATATGGGATATTATGGAGCTGCAATTTCCTTATTGATTAGTTGGATAGTTCTTTTTTTA +TTTACATGCGTCATTATATTTTATGTTAGAAGGGGGTATCGTGGGTAA +>test_runprokka_H299.0003b_00016 933 NA | hypothetical protein | NA | NA | NA +GTGGGTAATATATTTATTGTTGAGTCTCCGTTTCAGCTTTCAAATGCTTTACTTTATCAT +AAAAAAAATGATAGTGTTATTGTCAGGCTCAACGGAGAAAATAAAAATGATTTTCAAATT +GAAAAAATGTTATCGTCGTTTAATGGCAAGGTATATATAAAAAAAGCATCAAAAGAATCG +AAATTCGATTTGATTAGATTTGTTTTATTTTTTGCCGTCCCTGTATTGATTGCTAATTTA +AATAAAAAAGTAATTATTGGGAATTATAATTCATTGTGGATGAGAGTCATGGGATATTTG +TTTAACCCATTTCATTTTGCCGTCCTTGATGATGGGTTGATTACTATACGAACAATAAAA +AGGTTGGATGATAATATATCGCGTTCTGGATCAATTAAGAAACGGTTTTTATTACTGCTG +GCACCAAGATTTATAACGCAATATAAGATATATTCCAACTTTATTCAGATATACAACCAA +GAGATCAATAAGAGAAAAAGAACTACCCGAGCCATTAAGGCAGGGCGAGTTTGTTTTATT +GGCTCTCCATTATTTGACAAAAATGTTCTCACATTTGATTTCTATGTAAAGTGCTTGGCT +GCGATAAGTGATAACCTTAAGCGTTGTGGATATAGCATTGAGTATTACCCTCATCGCTCA +GAAAAAAACATCTCATATTTAAATGTTTTTTTTGACGATGTAATAAAATCAGATGATAGC +ATTGAAGTCTATTATTCAGCCAGTAATGAGTTGCCAGAAATATTTGTATCATTTTATTCA +TCGGCCCTTTTAAATTTGAGAAGTGATTATCCAGAGTGTAAATTTATATCTTATAAGTTA +GATTGTAATGAAATCAATGGTAAGTTTAGGTATGAAATAATGGAGGCATATAACTTTTTG +GCATTCTCTGGTATTGAGGTTGTAACTATATAG diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test.0417.00002.lst b/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test.0417.00002.lst new file mode 100644 index 0000000000000000000000000000000000000000..b97a58eb455664c353ca952a0fc904eee9ee32d5 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test.0417.00002.lst @@ -0,0 +1,95 @@ +287 787 D CDS test.0417.00002.0001b_00001 NA | hypothetical protein | NA | NA | NA +846 2384 D CDS test.0417.00002.0001i_00002 NA | hypothetical protein | NA | NA | NA +2404 3741 D CDS test.0417.00002.0001i_00003 NA | hypothetical protein | NA | NA | NA +3738 
4403 D CDS test.0417.00002.0001i_00004 NA | hypothetical protein | NA | NA | NA +4416 6068 D CDS test.0417.00002.0001i_00005 ompA | Outer membrane protein A | NA | protein motif:HAMAP:MF_00842 | NA +6126 6617 D CDS test.0417.00002.0001i_00006 hcpA | Major exported protein | NA | similar to AA sequence:UniProtKB:Q9HI36 | COG:COG3157 +6808 9444 D CDS test.0417.00002.0001b_00007 clpV1 | Protein ClpV1 | NA | similar to AA sequence:UniProtKB:Q9I742 | COG:COG0542 +77 1237 D CDS test.0417.00002.0002b_00008 NA | hypothetical protein | NA | NA | NA +1279 2346 D CDS test.0417.00002.0002i_00009 NA | hypothetical protein | NA | NA | NA +2419 2799 D CDS test.0417.00002.0002i_00010 NA | hypothetical protein | NA | NA | NA +3130 3393 D CDS test.0417.00002.0002i_00011 NA | hypothetical protein | NA | NA | NA +3399 4538 D CDS test.0417.00002.0002i_00012 NA | hypothetical protein | NA | NA | NA +4535 7888 D CDS test.0417.00002.0002i_00013 NA | hypothetical protein | NA | NA | NA +7854 9491 D CDS test.0417.00002.0002i_00014 NA | hypothetical protein | NA | NA | NA +9525 11285 D CDS test.0417.00002.0002i_00015 NA | hypothetical protein | NA | NA | NA +11249 12328 D CDS test.0417.00002.0002i_00016 NA | hypothetical protein | NA | NA | NA +12309 12845 D CDS test.0417.00002.0002i_00017 NA | hypothetical protein | NA | NA | NA +12849 13277 D CDS test.0417.00002.0002i_00018 NA | hypothetical protein | NA | NA | NA +13277 14653 D CDS test.0417.00002.0002i_00019 NA | hypothetical protein | NA | NA | NA +14955 15902 C CDS test.0417.00002.0002i_00020 NA | Hydroxypyruvate reductase | 1.1.1.81 | similar to AA sequence:UniProtKB:Q9X1C1 | COG:COG0111 +15974 16570 C CDS test.0417.00002.0002i_00021 kdsD | Arabinose 5-phosphate isomerase KdsD | 5.3.1.13 | similar to AA sequence:UniProtKB:Q9HVW0 | COG:COG0517 +16573 17748 C CDS test.0417.00002.0002i_00022 malY | Protein MalY | NA | similar to AA sequence:UniProtKB:P23256 | COG:COG1168 +17748 19328 C CDS test.0417.00002.0002i_00023 malX | PTS system 
maltose-specific EIICB component | NA | similar to AA sequence:UniProtKB:P19642 | COG:COG1263 +19360 20184 C CDS test.0417.00002.0002i_00024 licT | Transcription antiterminator LicT | NA | similar to AA sequence:UniProtKB:P39805 | COG:COG3711 +20442 21695 C CDS test.0417.00002.0002i_00025 amiC | N-acetylmuramoyl-L-alanine amidase AmiC | 3.5.1.28 | similar to AA sequence:UniProtKB:P63883 | COG:COG0860 +21855 22043 C CDS test.0417.00002.0002b_00026 NA | hypothetical protein | NA | NA | NA +93 812 D CDS test.0417.00002.0003b_00027 argA | Amino-acid acetyltransferase | 2.3.1.1 | similar to AA sequence:UniProtKB:P0A6C5 | COG:COG0548 +874 2700 C CDS test.0417.00002.0003i_00028 recD | RecBCD enzyme subunit RecD | 3.1.11.5 | similar to AA sequence:UniProtKB:P04993 | COG:COG0507 +2700 6242 C CDS test.0417.00002.0003i_00029 recB | RecBCD enzyme subunit RecB | 3.1.11.5 | similar to AA sequence:UniProtKB:P08394 | COG:COG1074 +6235 9123 C CDS test.0417.00002.0003i_00030 ptrA | Protease 3 | 3.4.24.55 | similar to AA sequence:UniProtKB:P05458 | COG:COG1025 +9299 12667 C CDS test.0417.00002.0003i_00031 recC | RecBCD enzyme subunit RecC | 3.1.11.5 | similar to AA sequence:UniProtKB:P07648 | COG:COG1330 +12680 13003 C CDS test.0417.00002.0003i_00032 NA | hypothetical protein | NA | NA | NA +12988 13395 C CDS test.0417.00002.0003i_00033 NA | hypothetical protein | NA | NA | NA +13392 13955 C CDS test.0417.00002.0003i_00034 NA | hypothetical protein | NA | NA | NA +13946 14449 C CDS test.0417.00002.0003i_00035 NA | hypothetical protein | NA | NA | NA +14634 15428 C CDS test.0417.00002.0003i_00036 thyA | Thymidylate synthase | 2.1.1.45 | similar to AA sequence:UniProtKB:P48464 | COG:COG0207 +15435 16310 C CDS test.0417.00002.0003i_00037 lgt | Phosphatidylglycerol--prolipoprotein diacylglyceryl transferase | 2.5.1.145 | similar to AA sequence:UniProtKB:P60955 | COG:COG0682 +16461 18707 C CDS test.0417.00002.0003i_00038 ptsP | Phosphoenolpyruvate-dependent phosphotransferase system | 
2.7.3.9 | similar to AA sequence:UniProtKB:P37177 | COG:COG3605 +18720 19250 C CDS test.0417.00002.0003i_00039 rppH | RNA pyrophosphohydrolase | 3.6.1.- | similar to AA sequence:UniProtKB:P0A776 | COG:COG0494 +19695 19856 D CDS test.0417.00002.0003i_00040 NA | hypothetical protein | NA | NA | NA +19935 20624 D CDS test.0417.00002.0003i_00041 mutH | DNA mismatch repair protein MutH | NA | similar to AA sequence:UniProtKB:P06722 | COG:COG3066 +20693 21406 D CDS test.0417.00002.0003i_00042 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67127 | NA +21544 21762 D CDS test.0417.00002.0003i_00043 ygdR | putative lipoprotein YgdR | NA | similar to AA sequence:UniProtKB:P65294 | NA +21870 22910 D CDS test.0417.00002.0003i_00044 tas | Protein tas | NA | similar to AA sequence:UniProtKB:P0A9T4 | COG:COG0667 +22942 24135 C CDS test.0417.00002.0003i_00045 lplT | Lysophospholipid transporter LplT | NA | similar to AA sequence:UniProtKB:P39196 | NA +24128 26287 C CDS test.0417.00002.0003i_00046 aas | Bifunctional protein Aas | NA | similar to AA sequence:UniProtKB:P31119 | COG:COG0204 +26873 27904 D CDS test.0417.00002.0003i_00047 galR | HTH-type transcriptional regulator GalR | NA | similar to AA sequence:UniProtKB:P03024 | COG:COG1609 +27911 29173 C CDS test.0417.00002.0003i_00048 lysA | Diaminopimelate decarboxylase | 4.1.1.20 | similar to AA sequence:UniProtKB:E0IWI3 | NA +29295 30230 D CDS test.0417.00002.0003i_00049 occR | Octopine catabolism/uptake operon regulatory protein OccR | NA | similar to AA sequence:UniProtKB:P0A4T3 | NA +30217 30909 C CDS test.0417.00002.0003i_00050 ygeA | L-aspartate/glutamate-specific racemase | 5.1.1.13 | similar to AA sequence:UniProtKB:A0A140N890 | NA +31038 32456 C CDS test.0417.00002.0003i_00051 araE | Arabinose-proton symporter | NA | similar to AA sequence:UniProtKB:P0AE24 | NA +32771 33532 C CDS test.0417.00002.0003i_00052 kduD | 2-dehydro-3-deoxy-D-gluconate 5-dehydrogenase | 1.1.1.127 | similar to AA 
sequence:UniProtKB:P37769 | NA +33562 34398 C CDS test.0417.00002.0003i_00053 kduI | 4-deoxy-L-threo-5-hexosulose-uronate ketol-isomerase | 5.3.1.17 | similar to AA sequence:UniProtKB:Q46938 | COG:COG3717 +34685 35866 C CDS test.0417.00002.0003i_00054 thlA | Acetyl-CoA acetyltransferase | 2.3.1.9 | similar to AA sequence:UniProtKB:P45359 | COG:COG0183 +36121 37350 D CDS test.0417.00002.0003i_00055 yqeG | Inner membrane transport protein YqeG | NA | similar to AA sequence:UniProtKB:P63340 | COG:COG0814 +37666 37739 C tRNA test.0417.00002.0003i_00056 NA | tRNA-Gly(ccc) | NA | COORDINATES:profile:Aragorn:001002 | NA +37818 38168 C CDS test.0417.00002.0003i_00057 nlpD | Murein hydrolase activator NlpD | NA | similar to AA sequence:UniProtKB:P39700 | NA +38987 41284 D CDS test.0417.00002.0003i_00058 xdhA_1 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +41295 42173 D CDS test.0417.00002.0003i_00059 ndhF | Nicotinate dehydrogenase FAD-subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF4 | NA +42170 42649 D CDS test.0417.00002.0003i_00060 ndhS | Nicotinate dehydrogenase small FeS subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF3 | NA +42689 44467 C CDS test.0417.00002.0003i_00061 norR | Anaerobic nitric oxide reductase transcription regulator NorR | NA | protein motif:HAMAP:MF_01314 | NA +44946 46133 D CDS test.0417.00002.0003i_00062 ygeW | Putative carbamoyltransferase YgeW | 2.1.3.- | similar to AA sequence:UniProtKB:Q46803 | COG:COG0078 +46191 47387 D CDS test.0417.00002.0003i_00063 ygeX | Diaminopropionate ammonia-lyase | 4.3.1.15 | similar to AA sequence:UniProtKB:P66899 | COG:COG1171 +47445 48656 D CDS test.0417.00002.0003i_00064 argE | Acetylornithine deacetylase | 3.5.1.16 | similar to AA sequence:UniProtKB:P23908 | COG:COG0624 +48709 50094 D CDS test.0417.00002.0003b_00065 hyuA | D-phenylhydantoinase | 3.5.2.- | similar to AA sequence:UniProtKB:Q46806 | 
COG:COG0044 +103 1728 C CDS test.0417.00002.0004b_00066 NA | hypothetical protein | NA | NA | NA +1776 2255 C CDS test.0417.00002.0004i_00067 NA | hypothetical protein | NA | NA | NA +2650 3228 D CDS test.0417.00002.0004i_00068 mocA | Molybdenum cofactor cytidylyltransferase | 2.7.7.76 | similar to AA sequence:UniProtKB:Q46810 | COG:COG2068 +3550 6648 D CDS test.0417.00002.0004i_00069 ygfK | Putative oxidoreductase YgfK | NA | similar to AA sequence:UniProtKB:Q46811 | COG:COG0493 +6651 7979 D CDS test.0417.00002.0004i_00070 ssnA | Putative aminohydrolase SsnA | 3.-.-.- | similar to AA sequence:UniProtKB:Q46812 | COG:COG0402 +8030 8809 D CDS test.0417.00002.0004i_00071 NA | hypothetical protein | NA | NA | NA +8806 11676 D CDS test.0417.00002.0004i_00072 xdhA_2 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +11841 13241 D CDS test.0417.00002.0004i_00073 xanQ | Xanthine permease XanQ | NA | similar to AA sequence:UniProtKB:P67444 | COG:COG2233 +13259 14575 D CDS test.0417.00002.0004i_00074 guaD | Guanine deaminase | 3.5.4.3 | similar to AA sequence:UniProtKB:P76641 | COG:COG0402 +14611 15978 D CDS test.0417.00002.0004i_00075 ghxQ | Guanine/hypoxanthine permease GhxQ | NA | similar to AA sequence:UniProtKB:Q46817 | COG:COG2252 +16014 16502 C CDS test.0417.00002.0004i_00076 hyfA | Hydrogenase-4 component A | 1.-.-.- | similar to AA sequence:UniProtKB:P23481 | COG:COG1142 +16502 18421 C CDS test.0417.00002.0004i_00077 NA | Ferredoxin--NADP reductase | 1.18.1.2 | protein motif:HAMAP:MF_01685 | NA +18857 20305 D CDS test.0417.00002.0004i_00078 uacT | Uric acid transporter UacT | NA | similar to AA sequence:UniProtKB:Q46821 | COG:COG2233 +20307 20432 D CDS test.0417.00002.0004i_00079 yqfG | putative protein YqfG | NA | similar to AA sequence:UniProtKB:C1P614 | NA +20555 21103 D CDS test.0417.00002.0004i_00080 idi | Isopentenyl-diphosphate Delta-isomerase | 5.3.3.2 | similar to AA 
sequence:UniProtKB:Q46822 | COG:COG1443 +21146 22663 C CDS test.0417.00002.0004i_00081 lysS | Lysine--tRNA ligase | 6.1.1.6 | similar to AA sequence:UniProtKB:P0A8N3 | COG:COG1190 +22673 23554 C CDS test.0417.00002.0004i_00082 prfB | Peptide chain release factor RF2 | NA | similar to AA sequence:UniProtKB:P07012 | COG:COG1186 +23862 25595 C CDS test.0417.00002.0004i_00083 recJ | Single-stranded-DNA-specific exonuclease RecJ | 3.1.-.- | similar to AA sequence:UniProtKB:P21893 | COG:COG0608 +25601 26311 C CDS test.0417.00002.0004i_00084 dsbC | Thiol:disulfide interchange protein DsbC | NA | similar to AA sequence:UniProtKB:P0AEG6 | COG:COG1651 +26336 27232 C CDS test.0417.00002.0004i_00085 xerD | Tyrosine recombinase XerD | NA | similar to AA sequence:UniProtKB:P0A8P8 | COG:COG4974 +27344 27865 D CDS test.0417.00002.0004i_00086 fldB | Flavodoxin 2 | NA | similar to AA sequence:UniProtKB:P0ABY4 | COG:COG0716 +27905 28312 C CDS test.0417.00002.0004i_00087 ygfX | Inner membrane protein YgfX | NA | similar to AA sequence:UniProtKB:Q46824 | NA +28293 28559 C CDS test.0417.00002.0004i_00088 sdhE | FAD assembly factor SdhE | NA | similar to AA sequence:UniProtKB:P64559 | COG:COG2938 +28802 29782 D CDS test.0417.00002.0004i_00089 ygfZ | tRNA-modifying protein YgfZ | NA | similar to AA sequence:UniProtKB:P0ADE8 | COG:COG0354 +29859 30518 C CDS test.0417.00002.0004i_00090 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67153 | NA +30682 30993 C CDS test.0417.00002.0004b_00091 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67603 | NA +29 1012 D CDS test.0417.00002.0005b_00092 bglA | 6-phospho-beta-glucosidase BglA | 3.2.1.86 | similar to AA sequence:UniProtKB:Q46829 | COG:COG2723 +1178 4051 C CDS test.0417.00002.0005i_00093 gcvP | Glycine dehydrogenase (decarboxylating) | 1.4.4.2 | similar to AA sequence:UniProtKB:P33195 | COG:COG0403 +4169 4558 C CDS test.0417.00002.0005i_00094 gcvH | Glycine cleavage system H protein | NA | similar to AA 
sequence:UniProtKB:P0A6T9 | COG:COG0509 +4582 5745 C CDS test.0417.00002.0005b_00095 gcvT | Aminomethyltransferase | 2.1.2.10 | similar to AA sequence:UniProtKB:P27248 | COG:COG0404 diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test_runprokka_H299.lst b/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test_runprokka_H299.lst new file mode 100644 index 0000000000000000000000000000000000000000..3591eaf3fdd79fe7e21304f949730d51558cc622 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/LSTINFO/test_runprokka_H299.lst @@ -0,0 +1,16 @@ +201 743 C CDS test_runprokka_H299.0001b_00001 NA | hypothetical protein | NA | NA | NA +740 1339 C CDS test_runprokka_H299.0001i_00002 NA | hypothetical protein | NA | NA | NA +1489 2187 C CDS test_runprokka_H299.0001i_00003 NA | hypothetical protein | NA | NA | NA +2187 2483 C CDS test_runprokka_H299.0001i_00004 NA | hypothetical protein | NA | NA | NA +2518 3453 C CDS test_runprokka_H299.0001b_00005 NA | hypothetical protein | NA | NA | NA +201 743 C CDS test_runprokka_H299.0002b_00006 NA | hypothetical protein | NA | NA | NA +740 1483 C CDS test_runprokka_H299.0002i_00007 NA | hypothetical protein | NA | NA | NA +1489 2187 C CDS test_runprokka_H299.0002i_00008 NA | hypothetical protein | NA | NA | NA +2187 2516 C CDS test_runprokka_H299.0002i_00009 NA | hypothetical protein | NA | NA | NA +2513 5092 C CDS test_runprokka_H299.0002i_00010 NA | hypothetical protein | NA | NA | NA +5085 5519 C CDS test_runprokka_H299.0002i_00011 NA | hypothetical protein | NA | NA | NA +5501 5923 C CDS test_runprokka_H299.0002i_00012 NA | hypothetical protein | NA | NA | NA +5939 6679 C CDS test_runprokka_H299.0002i_00013 NA | hypothetical protein | NA | NA | NA +6687 6842 C CDS test_runprokka_H299.0002b_00014 NA | hypothetical protein | NA | NA | NA +163 870 D CDS test_runprokka_H299.0003b_00015 NA | hypothetical protein | NA | NA | NA +863 1795 D CDS test_runprokka_H299.0003b_00016 NA | hypothetical 
protein | NA | NA | NA diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test.0417.00002.prt b/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test.0417.00002.prt new file mode 100644 index 0000000000000000000000000000000000000000..c44ff5656428c3ad88dc6ec227d88886c21ab74e --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test.0417.00002.prt @@ -0,0 +1,733 @@ +>test.0417.00002.0001b_00001 501 NA | hypothetical protein | NA | NA | NA +MADSFQNEVPAARVNIKLDLHTGNAKKKVELPLKLLAVGDYSNGKEQRPLSERDKVDINK +NNFNSVMAEFSPAVNLTVEDTLNGNGNEQNIALEFKSLKDFEPEQVAKNIPQLRVLLAMR +NLLRDLKSNLLDNATFRRELENILKDPTLSSELRDELAKIAPQENV +>test.0417.00002.0001i_00002 1539 NA | hypothetical protein | NA | NA | NA +MSVQQEHATSETATLTTTESGGVYQSLFDKINLTPVSSIQEIDLWQNSETLADASPDERV +TAAIHVLLSCLAKSGEDVVKLDKSLLDFHIDDLDQKISKQLDAVMHHPEFQKVESLWRGT +WFVVQRTDFRKNVRIELLDISKEHLRQDFDDSPEIIQSGLYRHTYIQEYDTPGGEPVASL +ISSYEFDNSPQDIALLRNISRVSAASHMPFIGSVGPKFFLKNSMEEVAAIKDIGNYFDRA +EYIKWKSFRDTDDSRYVGLVMPRVLGRLPYGPDTVPVRSFNYVEEVKGPDHEKYLWTNAS +FAFAANMVKSFVNNGWCVQIRGPQAGGAVADLPIHLYDLGTGNQVKIPSEVMIPETREFE +FANLGFIPLSYYKNRDYACFFSANSAQKPALYDTADATANSRINARLPYIFLLSRIAHYL +KIIQRENIGTTKDRRVLELELNTWIRTLVTEMTDPGDELQASHPLRDGKVIVEDIEDNPG +FFRVRLFAVPHFQIEGMDINLSLVSQMPKAKA +>test.0417.00002.0001i_00003 1338 NA | hypothetical protein | NA | NA | NA +MKICRPLWAEGTFLSSQQFQQQARWEAFSNDCIAQLCIRHPWGIANVLFDRDALTPGKLK +TQAVRLRFADGTLIDSDVSDVLPLACDLRALKNDSAIVLLALPLAHGNGGNLGQGEQTER +PLRYRQEWQKVQDIYGSDSEDMAVERHALSLRFAHDNNQDYITCPLARLVRDVQGNWTQD +ESYIPPLLAFNAHDGLVQRLDTLLLQLRAKCQRLMAMRRESNQRMADFAVADVSLFWLLN +ALNSAEPVLSDFLRYPAVHPELVWRELARLAGALLTFSLEHNVSAVPPYVHESPSTVFPP +LFSLLSELLEASLPSRVIALDLASLPGNRWKADLHDPRLREEADFYLSVRSSLPAHQVLH +QLPLVCKIGAPDDVTLLINVALNGVQLVPLTSVPAALPLRLENQYFALDMHSDAAKSMLE +SGSCMIYAPGTMGDLKPELFAVLRT +>test.0417.00002.0001i_00004 666 NA | hypothetical protein | NA | NA | NA +MKKDMDINIDALLLDTFLTVVELRQGTTVRHGIELYRHCQRQVELVRERLKDAGFSRENV 
+EHITYAQCALLDETVLSRSGMDDGQAIWMKNPLQSHFFNTLQAGELLYERMKQVLQEPAP +AQAVLTCFHRVLLLGFRGRYQDPAAPERDQLISTLNGQVAPFGVLPETAVLNVPLSTRQH +PLLHSPFFWLVTLALLLAGVWWGLHHWLNVLVDELLPQSLR +>test.0417.00002.0001i_00005 1653 ompA | Outer membrane protein A | NA | protein motif:HAMAP:MF_00842 | NA +MRNTLKQAIVLWGMVLLLVLWSVFISPSGVLRWAGAAAIVLAVAALLIYRRRQAWTEMTG +DAGLSSLPPETYRQPVVLVCGGLSAHLFTDSPVRQVSEGLYLHVPDEEQLVAQVERLLTL +RPAWASQLAVAYTVMPGIHRDVAVLAGRLRRFAHSMATVRRRAGVNVPWLLWSGLSGSPL +PERASSPWFICTGGEVQVATSTETTMPAQWIAQSGVQERSQRLCYLLKAESLMQWLNLNV +LTALNGPEAKCPPLAMAVGLVTSLPAVDNNLWQVWITARTGLTTDIADTGTDATLPFPDA +LLRQLPRQSDFTPLRRACVTMLGITTAAGITMLCLSATANRQLLRQVGDDLHRFYAVPVE +EFITKARHLSVLKDNATMLDGYYREGEPLRLGLGLYPGERIRQPVLRAIRDWRPPEQKME +VTASLQVQTVRLDSMSLFDVGQARLKDGSTKVLVDALVNIRAKPGWLILVAGYTDATGDE +KSNQQLSLRRAEAVRNWMLQTSDIPATCFAVQGLGESQPAATNDTPQGRAVNRRVEISLV +PRSDACQDVK +>test.0417.00002.0001i_00006 492 hcpA | Major exported protein | NA | similar to AA sequence:UniProtKB:Q9HI36 | COG:COG3157 +MAIPAYLWLKDDGGADIKGSVDVQGREGSIEVVALDHDVYIPTDNNTGKLTGTRTHKPFT +FTKEIDASSPYLYKAVTTGQTLKTAEFKFYRINDAGQEVEYFNITLDNVKLVRVAPLMHD +IKDPSREKHNHLERIEFRYEKITWTYKDGNIIHSDSWNERPSA +>test.0417.00002.0001b_00007 2637 clpV1 | Protein ClpV1 | NA | similar to AA sequence:UniProtKB:Q9I742 | COG:COG0542 +MTGNHSAALLRRLNPYCARALDAAASLCQTRAHAEITIEHWLLKLLEQGEGDITVIARRY +EWDIDTLWQSLLAHLDTLPRPVRERPQLSEPLAALIRQAWLIASLEGDDPQIRSQHLLMA +LTEKPMLPACNDLWVLLSLSRVQLERLRPLLDAQSDECPARQPQVTEPLTSALPETATAD +APAKTLTEKQDDALLAVLNRFTEDVTEKARSGRIDPVFGRDTEIRQMVDILSRRRKNNPI +LVGEPGVGKTALVEGLALRITEGNVPDSLKTVHIRTLDLGLLQAGAGVKGEFEQRLKNVI +DAVQKSPEPVLLFIDEAHTIIGAGNQAGGADAANLLKPALARGELRTIAATTWSEYKQYF +ERDAALERRFQMVKVDEPDDDTACLMLRGLKARYAQHHGVHMLDSAIQTAVRLSRRYLTG +RQLPDKAVDLLDTAGARVRMSLDTLPEPLTQLHARLAALDIEREAIEQDSVFYPEASPER +LAELTDLRDELQAEAGHLEAQYQQEKALAQQIMTLRQEGTDSSELQQQLRTHQGFAPLLA +LDVDARAVATVVADWTGIPLSSLLKDEQSDLLSMEQSLENRVVGQSPALCAIAQRLRAAK +TGLTPENGPQGVFLLTGPSGTGKTETALTLADTLFGGEKSLITINLSEYQEPHTVSQLKG 
+SPPGYVGYGQGGVLTEAVRKRPYSVVLLDEVEKAHRDVMNLFYQVFDRGFMRDGEGREID +FRNTVILMTANLGSDHIMQLLEEKPDATDADLHELLYPLLRDHFQPALMARFQTVIYRPL +GQEAMRAIVEMKLAQVARRLHQHYGLETEISNSLYDALTAACLLPDTGARNIDSLLNQQI +LPVLSQQLLAQQAVHHKPARLRLDWDDEDGIVLEFDEK +>test.0417.00002.0002b_00008 1161 NA | hypothetical protein | NA | NA | NA +MILTLVGLIPVAGSLIKGIFKVLFNSIRKAALSSRDIVRAIDASVSLFNKFIDLPAVQAT +MKWMKIYNPYTYAEKQVRELMAQLNVSVLLSKLDELMDVTGSLLEKAKSWGPESIRQPIE +VIWELLVSIRSQANTMLAKALAPLNDVLEKLAARLHREGDDYYKAHTGANPHRPSRLKDA +EEVELLATKKPDWADIGGKEKYPQLEKASAEQKRLMDPENKEGGYPNIPDDKVQTFHQMA +PVEFKEGEKLYRVLDPGSSDNSFCWMREAEFKALKSKSQWRRRFAVWKSWNENGEYVVYT +VPPGTTMKVWEGPAASQVREVTGKNGENIKVVLEGGSLQIVIDPTVLNLDYLGKRQSTGW +GYRDFSDEVDMYIGVPQLQTNIYVPK +>test.0417.00002.0002i_00009 1068 NA | hypothetical protein | NA | NA | NA +MAILHPQECWLLERIMSPEYYRRRFEGWQAFVELCERQVAEWSKTIPLDVRRRPLYEQID +AVWGGRVLPNIRSTLKSVQYDFIQLQQGDLRVLQSGGNISSDMKGLIDYPPDWMSPAAQK +QYDRLKWRGAHYNNLIRRTSGGYWYDGELTYYYEESLHGPLALPMQLPLYELDSSVYLRE +DDPVTVAGLYLPDIPDASAQLLYRSEHIPEAWQGRVRTKYVNEAGIQEYYWESGAWAKCN +WKRIRRVANRFINVPPEGFFPQGMPEELYNWPQREAQYVTDRQRIAAYSGEACPHSGEWS +IFVEGRQATETLEQGEQMPEWTDRKMEGEYKRGEKFHVLWSLMNRHDGGSVWVEA +>test.0417.00002.0002i_00010 381 NA | hypothetical protein | NA | NA | NA +MRISLASLFFLCCTVSDSVYADTDQTYDIFWGMLVKDKKDTIFVRCDSPLLKMKIVRMAD +ANTENIDKAYQIFNQKTKKSIYFAFIGNVTDAGSGKYIFNMLDVMETREGYCNLSDVLNA +IDEQFR +>test.0417.00002.0002i_00011 264 NA | hypothetical protein | NA | NA | NA +MKGIVVLGDKTTHGGQVISVSSSMVINGKKVALVGDKINCPVKGHGINTIIEGSFDWISD +GKQVVVNGCRCECGCVVISSIADALIG +>test.0417.00002.0002i_00012 1140 NA | hypothetical protein | NA | NA | NA +MGWKRTYTEEIDRPQDIYFHKWLFSLFILCILLLVIYYFFHEFVVANNASLLAFFSPLLL +WVLILSVQVIFYSRAIQDYSIWLENRLSINREWEAWGSRYVSVMNSSLHLPGKVDVLFLS +GDELETQYGLVNKSDDITWKQHDWYACFQTLTNHLELYKLPYQLTQEFIILTDFDESMYS +QIEEDFFRTVEKTNRTEGHFLLHISPSMSFGELDLWLKDSEEKIYIVMVLQMEEQTSCSD +AMACLMFATDDVTAKYKLTEKARIYRPMVVNSNNFNSDLNIFIDTQKISKNAAGLVGDSQ +RLFSVSSNVLQCFNDNNAQLKIDNIHLLESLCGLPGGNAVWLTAALTISVVVHKNSDYLM +MSENNDDWIITTIHPMEHS 
+>test.0417.00002.0002i_00013 3354 NA | hypothetical protein | NA | NA | NA +MKRINKKSVFISNVLLFLVIVAFVGGIIWRFGDHFGLKGDENNFFAWLICIMTLIFVRAS +WYFSRLYRLRKEQHHSEKERLRPEKEARIEYGKVITLNIELAEYLCALYGPFWRRKVRLL +LVTGEPEQAEAIAPGLTGQHWLEGDHKVLIYGGRPSAEPDVALLTALKKLRRSRPLDGII +WPLTEEQSRQTAQLDKGWRELINGGKRLGFQAPLYLWQVCDNGDYQTGRPLQSVGCLLPE +RCTPEQLAAMLEAQTLPLTEQGMSQLLADNRHDFLLRLAHTLAERGIAHWQSVLKPLLAG +GAFSSLRLRGLMFSPPLAAVPEAAPHAWLPSPVWAGVTGDNARGRAVGFPWLRAALITSI +CMLAIWGAGMTTSFFANRALVQETGIQTARALDTRLPLAEQLVALHTLQGELERLQYRIR +EGAPWYQRFGLERNQQLLAAAFPGYAQAANRLVRDVAVDHLQQQLNAFVALPPNSPQRTA +TGEQRYKQLKALLMTSRPEKADAAFFSTTLMADGLRYENIPEGVRQSVLPSLLTFWMANL +PEHPQWKTAPPPELTGAVRKILLRQIGVRNAENTLYQNVLQQVSRNYADMTLADMTGDTL +TESLFSTEQTVPGMFTRQAWEGQVREAIEQVVTARREEIDWVLSDRQQDTSADISPDTLR +NRLTSRYFTDFAGSWLAFLNSIRWKKEDSLSGILDQLTLMADARQSPLIALTDTLAWQAA +AGRENRGLSDSLAKSAQELFNGKEKTPQQSREGNEPVGPLDKTFAPLLRLLGDKAGGGDS +QLSLQTYLTRVTRVRLKLQQVTNAPDPQEMTQQLAQTVLQGKTVDLTDTRDYGRLIAASL +GEEWSGFGQALFVRPVEQSWRQVLTPAADSLNRQWHRAIVSHWNQDFAGRYPFKASQNDA +SLPLLAQYLRDDGRINQFIAANLSGVLKREGRYWVADAMNTQGLTVNPDFIRALNRLRDV +ADTAFASGDAGIHFELRAKPARDVMKTHLVIDGQELEYFNQKERWQRFNWPDEQWQPGAS +LSWTSTQAMERILADYRGSWSLIRLLEQAQVTPVDSSTFKVVWKAQDGLPLNYLLRVEQG +KGPLALLELKNFRLPGQVFLTGRSMKDAEEYGEDADE +>test.0417.00002.0002i_00014 1638 NA | hypothetical protein | NA | NA | NA +MRKNTGKTPMSELLQKLTRSCFADRDALDVARTQAALWQTWLLPVTADTPVGEDPGYHDD +FLRIRDEMNKLSGADTDLICQLAESLLLTQAKDVRIATYYIWARLHRDGERGLAEGLALL +TGLVERFGTQLLPSRPASRKMALEWLAGEKMLDSLARYPEVAKEDFANIVAALNQLTVSF +AAWPEDQHSPSLMPLINALESRLAQSGGMNAVVPQNSSSVPAPSSPVDAPQVQTITSGRD +LLDQAKVLARYLNEQPQGWLSAHRLMKTLRWDTVHELPPDVDGKTRLAPPRTESRNQLKR +LYAQQNWTELLEQADLMFSTGVSHFWLDIQWYLHQALAKAGAPWDRWTAVIRQDLTLLLE +RLPGLENLAWNDGTPFADEVTRNWIAQQVMMREDGAWLAGKAAVPTDDATNDVLALEPEA +LAMADSQGVEAALGWIQTRPGITTARQRLLLRLLMARVAEQYGKNEMALLLLEELDTAAQ +GITLTQWEPELLFEVKARQLKLLRLRAHRHADKAALARKMDALLGSLVAIDPARTAVLCD +TQHKD +>test.0417.00002.0002i_00015 1761 NA | hypothetical protein | NA | NA | NA 
+MDDLTQRYFEAEMRYLREAGKEFAQAYPDRAAMLNLDKPGARDPYVERLFEGFAFLMGRL +REKLDDDLPELTEGLVSLLWPHYLRTIPSLSVVELSTDHRQMKQSETLSDFQVLSRPVGE +RRTRCFYSATRDITLHPLALPDVSLQYEPDGRSVIRLRFECGPLVGDWSQIDLSRLPLYL +NADSPVACALHRALTLGTQQFWLRLPGQDRRMLGAHFSPMGFEDDDRLWPKGESAFSGYQ +LLLEYFTFREKFMFVALNGLEQVAWPEGITGFEIDVVLNENWPHDLPFDSDNIRLHCVPV +INLFPLEADPLHLSPLENEFLLRPMRIQDGHTEIYSVDNIISSRHTGSQAYVPFSSFRHR +GGMLRHDAPERYYHTRVKRGPSGLHDTWLILGGDAFDSDRMLEDETLSLSLTGTNGQLPR +KALQSTLLDTPVHASQNVLRVRNLCAPTQPCYPPARDRFHWRVLSHLGSNFLSMMDNAEI +LRGTLALYDWTESEMNRRRLEAIVDVQHSLIQRFERGFLLRGVDIQVTLDSNGFAGEGDI +TLFGELLHRFFALYADIHLFTQLTLILQPTGKCLQWTEHHSQRVPG +>test.0417.00002.0002i_00016 1080 NA | hypothetical protein | NA | NA | NA +MDRASQPARTGLTDRLAPDIARINFYRFCQLLEQSQQKAPLGSTDNPAADAVRFRPHPGM +GFPVSELKNVERDVDNPDAPPTVRTTFLGLYGVDSPLPTAYLDYITQRHDGHDAVMAFLD +IFNHRFITQYYRIWRKYNYPASFEAGAVDDISRCLLGLIGLGIPGSENHIATPVSRFLAL +LSVMRLPTRTAEGVTALVGLLAPLTKATVVPHDPQPVILPAPAGLSKNSRISLKTRTLLG +RTGTDVNSQLLLKLYTEDAAEARGWLPGGQLHSDLLVLLRVYLGWRCQARLQLTLPVSLL +PAARLGKQRVQISRTGILLASFAAPATGTVTVSLGRYQGLIPAFSIRNRESMTHVSYSF +>test.0417.00002.0002i_00017 537 NA | hypothetical protein | NA | NA | NA +MFPIRFKRPALLCMAMLTVVLSGCGLIQKVVDESKSVASAVFYKQIKILHLDFFSRSALN +TDAEDTPLSTMVHVWQLKTREDFDKADYDTLFMQEEKTLEKDVLAKHTVWVKPEGTASLN +VPLDKETQFVAIIGQFYHPDEKSDSWRLVIKRDELEADKPRSIELMRSDLRLLPLKDK +>test.0417.00002.0002i_00018 429 NA | hypothetical protein | NA | NA | NA +MSTPSLYEMLTFSFSGELPLEQISERDQLILSVMDNMQRIINCRAGTLAHLPDYGLPDLS +LIHQGMAAGIHGLMRQIEETLLRYEPRLSQIQVELLPQPRPGHLNYLIHAQLPDTGWIRF +DGVFSPEGRIVLRHLKQQERAY +>test.0417.00002.0002i_00019 1377 NA | hypothetical protein | NA | NA | NA +MASNANFISQFVMGGDPCTYKESGELQAEMSKLTHPARPDVDWRQVEKLCLALFRQNGVE +LQTLVCYVLAITRRQGLAGMADGLGSLDILLQRWADFWPVQVHSRISLLSWVTEKMQQAL +RTLDIQYQDLPQIYRCVQHLSAIETTLQQCELWHMTKLDLLAGQFRNTALRLERLAPQGA +ETTITPPELPRREMNQPKKSEESPQPVFATRSVQQNDKDASPPVPSPEISRQRTWPIFMA +GMVVMAGLGGTGLWGWSQLNQPDALIQRIQLSVMPLPQSLESGELAKLDVKDKALLAQDR +TIAASQMQLEQLNKLPARWPLEQGYRQLRQLDALWPDNPQVRALNAQWRKQRELSALSAE 
+ALNGYAQAQSQLQRLSAQLDALDERKGRYLTGSELKTAVYGIRQSLKEPPLEELLRQLEE +QKQTGEVSPTLLTQIDTRLNQLLNRYVILLDTKVEQSQ +>test.0417.00002.0002i_00020 948 NA | Hydroxypyruvate reductase | 1.1.1.81 | similar to AA sequence:UniProtKB:Q9X1C1 | COG:COG0111 +MKNVLVTVPSFSARCVSASKLLRENNFNLIIKNNVEHLLKSESTALRESICAVIAGKDGY +QADTLSLLPGVRIISRFGTGIDNIDLRAAQQSGIVVNNAVGINSNAVAEFIIGLIFASMR +NIPGSYHAMQNGYWGESHGCELQGKRIGLVGYGNIGKTLAKRLSGFDVELLAFDKQPDYQ +VADKAGVQFVSIEDIFMQSHVIIVLLPFSSELENFISHKYLSMMRNGALIINAARGKLLD +EGALLQVIEERNVFAALDVFSSEPLAQFSPLLHAKNIITTPHIAAATVESYQQTGIHVAQ +SIIDYFAGREIKNVL +>test.0417.00002.0002i_00021 597 kdsD | Arabinose 5-phosphate isomerase KdsD | 5.3.1.13 | similar to AA sequence:UniProtKB:Q9HVW0 | COG:COG0517 +MNNTDLIHLIKHFMRNEHKAVEEVIDSPLSEVANLIKVLQSCQGKVVFIGVGKSGIIARK +LAATFASTGTPSFFVHGTEAVHGDLGMVAKDDVVILISNSGETAEILATLPSLKKMGNYL +ISFTRSHHSSLAISCDLSVEIPVKSEADNLGLAPSCSSTVVLVVGDAVALALSELKKFTR +ADFGLYHPGGALGIKANS +>test.0417.00002.0002i_00022 1176 malY | Protein MalY | NA | similar to AA sequence:UniProtKB:P23256 | COG:COG1168 +MDVFNTPVSRKGTYCTQWDFCEDRFGVKDVLPFSISDMDLPIPDAITRALKKRLEHPILG +YSRWQHGEYLNAIVNWYYQQYQTDIKPEWITYSPSVMYSIAKAIELLTSHGDNILVFTPV +YNAFFDVIKHSERNILTASLIIKNEGGYAINWQDFDLKIKSAKMMLLCNPHNPTGTVWSE +EELHKIAASCTRHNVWLCSDEIHSDFVFNRSFTSALKIKKEKVVVFNSISKTFNVPALTG +SYMISTDDNFNHKFRTISRYRDFVNSPSVLNIIATIIAYNECEGWLKSLKAHIASNIQFT +QQYLNENIPELIVRPADGCYFSWIDCSAIGYPFDEFYSRLIHEGKVGIMAGHVYGTEGEG +YLRLNLACGREKLYMGLTRLVSVIKNINQGE +>test.0417.00002.0002i_00023 1581 malX | PTS system maltose-specific EIICB component | NA | similar to AA sequence:UniProtKB:P19642 | COG:COG1263 +MKQKKAWSFFQSLGKAFMYPIALLSVCGMMLGLGSGLASDDMAKLIPFLAIPIIKTILDF +IVSLGLFAFVNLPVLFAIAIPLGLLKDKEDKAYGAFSGLIGFMAMHLGTNFYLKQHDLLV +VADQMSTHGQTIILGIQSYNTSVLGGIVAGLLVASMYKKIVNLRIPESLGFYSGPRLVPI +ITLIVMSGFGLIIPFIWPPFFNLFMLIGHWISTSGPVGYFFYAVAERVTIPFGLNHLVTS +VFRFTPIGGSAVIGGEEYYGTLNMFMAYVKENAVIPLDLAGKMEQGKLMIQYGLAGAALA +MYRTAHAQNRKAIKALLISGVLTVIIGGVSEPIEFLFLFVSPLLFVFHAFMNGFANMVLP 
+YMGVKMGFTGDLIQFISFGVLRGTRTGWPIAVCVEVAYFFIYYFVFRWTILKFNLMTVGR +EESSPVTLNAHEDTAIADIPTPDKSELQAAEQMVKALGGKENIKSLDNCVTRLRLTIADM +RLIDEVAIKRAGGIAVVKLDQNTLQVIIGTKVIALRRDMDNYMGIY +>test.0417.00002.0002i_00024 825 licT | Transcription antiterminator LicT | NA | similar to AA sequence:UniProtKB:P39805 | COG:COG3711 +MIIEKVMNNNCVQASMNGQEVIISGPGVGYNKKYGMSVPEHPANRIFYVRNEQKNKLYKL +IEHVDIEYVFVAEKIVQYAEKNLEKNLNPSLLLILADHISNAISRVVSGIQINNVFLDEI +KALYKAEYAISRDALTIINEQFSVQLPDDEIGFIALHILNNYENSVDYESVRIIELSQII +TELIEVVYNRKVDRSSFNYSRFMMHLKYFSSRVLCNEKIKQKDIGDIYEQFLEKDILLQR +AIHEIERYLYATFKYELILEEKLYLSIRTKVLMD +>test.0417.00002.0002i_00025 1254 amiC | N-acetylmuramoyl-L-alanine amidase AmiC | 3.5.1.28 | similar to AA sequence:UniProtKB:P63883 | COG:COG0860 +MSGSNTAISRRRLLQGAGAMWLLSVSQVSLAAVSQVVAVRVWPASSYTRVTVESNRQLKY +KQFALSNPERVVVDIEDVNLNSVLKGMAAQIRADDPFIKSARVGQFDPQTVRMVFELKQN +VKPQLFALAPVAGFKERLVMDLYPANAQDMQDPLLALLEDYNKGDLEKQVPPAQSGPQPG +KAGRDRPIVIMLDPGHGGEDSGAVGKYKTREKDVVLQIARRLRSLIEKEGNMKVYMTRNE +DIFIPLQVRVAKAQKQRADLFVSIHADAFTSRQPSGSSVFALSTKGATSTAAKYLAQTQN +ASDLIGGVSKSGDRYVDHTMFDMVQSLTIADSLKFGKAVLNKLGKINKLHKNQVEQAGFA +VLKAPDIPSILVETAFISNVEEERKLKTATFQQEVAESILAGIKAYFADGATLARRG +>test.0417.00002.0002b_00026 189 NA | hypothetical protein | NA | NA | NA +MLNGFTAEHDDKRFSPVGIDIGNRMAESLDQLGFTFLYHGTPLCMIIRNYCIFILFFRRV +QV +>test.0417.00002.0003b_00027 720 argA | Amino-acid acetyltransferase | 2.3.1.1 | similar to AA sequence:UniProtKB:P0A6C5 | COG:COG0548 +MIGFCSSQGVTNDDGDIVSELFPNEAQARVEAQEEKGDYNSGTVRFLRGAVKACRSGVRR +CHLISYQEDGALLQELFSRDGIGTQIVMESAEQIRRATINDIGGILELIRPLEQQGILVR +RSREQLEMEIDKFTIIQRDNTTIACAALYPFPEEKIGEMACVAVHPDYRSSSRGEVLLER +IAAQAKQSGLSKLFVLTTRSIHWFQERGFTPVDIDLLPESKKQLYNYQRKSKVLMADLG +>test.0417.00002.0003i_00028 1827 recD | RecBCD enzyme subunit RecD | 3.1.11.5 | similar to AA sequence:UniProtKB:P04993 | COG:COG0507 +MKLQKQLLEAVEHKQLRPLDVQFALTVAGDEHPAVTLAAALLSHDAGEGHVCLPLSRLEN +NEASHPLLATCVSEIGELQNWEECLLASQAVSRGDEPTPMILCGDRLYLNRMWCNERTVA 
+RFFNEVNHAIEVDEALLAQTLDKLFPVSDEINWQKVAAAVALTRRISVISGGPGTGKTTT +VAKLLAALIQMADGERCRIRLAAPTGKAAARLTESLGKALRQLPLTDEQKKRIPEDASTL +HRLLGAQPGSQRLRHHAGNPLHLDVLVVDEASMIDLPMMSRLIDALPDHARVIFLGDRDQ +LASVEAGAVLGDICAYANAGFTAERAGQLSRLTGSHVPAGTGTEAASLRDSLCLLQKSYR +FGSDSGIGQLAAAINRGDKTAVKTVFQQDFTDIEKRLLQSGEDYIAMLEEALAGYGRYLD +LLQARAEPDLIIQAFNEYQLLCALREGPFGVAGLNERIEQFMQQKRKIHRHPHSRWYEGR +PVMIARNDSALGLFNGDIGIALDRGQGTRVWFAMPDGNIKSVQPSRLPEHETTWAMTVHK +SQGSEFDHAALILPSQRTPVVTRELVYTAVTRARRRLSLYADERILSAAIATRTERRSGL +AALFSSRG +>test.0417.00002.0003i_00029 3543 recB | RecBCD enzyme subunit RecB | 3.1.11.5 | similar to AA sequence:UniProtKB:P08394 | COG:COG1074 +MSDVAETLDPLRLPLQGERLIEASAGTGKTFTIAALYLRLLLGLGGSAAFPRPLTVEELL +VVTFTEAATAELRGRIRSNIHELRIACLRETTDNPLYKRLLEEIDDKAQAAQWLLLAERQ +MDEAAVFTIHGFCQRMLNLNAFESGMLFEQQLIEDESLLRYQACADFWRRHCYPLPREIA +QVVFETWKGPQALLRDINRYLQGEAPVIKAPPPDDETLASRHAQIVARIDAVKQQWRDAV +GELDALIESSGIDRRKFNRSNQAKWIEKISAWAEEETNSYQLPESLEKFSQRFLEDRTKA +GGETPRHPLFEAIEQLLAEPLSIRDLVITRALAEIRETVAREKRRRGELGFDDMLSRLDS +ALRSESGEVLAAAIRTRFPVAMIDEFQDTDPQQYRIFRRIWHHQPETALLLIGDPKQAIY +AFRGADIFTYMKARSEVHAHYTLDTNWRSAPGMVNSVNKLFSQTDDAFMFREIPFIPVKS +AGKNQALRFVFKGETQPAMKMWLMEGESCGVGDYQSTMAQVCAAQIRDWLQAGQRGEALL +MNGDDARPVRASDISVLVRSRQEAAQVRDALTLLEIPSVYLSNRDSVFETLEAQEMLWLL +QAVMTPERENTLRSALATSMMGLNALDIETLNNDEHAWDAVVEEFDGYRQIWRKRGVMPM +LRALMSARNIAENLLATAGGERRLTDILHISELLQEAGTQLESEHALVRWLSQHILEPDS +NASSQQMRLESDKHLVQIVTIHKSKGLEYPLVWLPFITNFRVQDQAFYHDRHSFEAVLDL +NAAPESVDLAEAERLAEDLRLLYVALTRSVWHCSLGVAPLVRRRGDKKGDTDVHQSALGR +LLQKGEPQDAAGLRTCIEALCDDDIAWQTAQIGDNQPWQVNDALTAELNARTLQRLPGDN +WRVTSYSGLQQRGHGIAQDLMPRLDVDAAGVVSVVEEPTLTPHQFPRGASPGTFLHSLFE +DLDFTQPVDPNWVQEKLELGGFEPQWEPVLTEWITAVLQAPLNETGVSLNQLSDRDKQVE +MEFYLPISEPLIASQLDALIRQFDPLSAGCPPLEFMQVRGMLKGFIDLVFRHEGRYYLLD +YKSNWLGEDSSAYTQQAMAAAMQAHRYDLQYQLYTLALHRYLRHRIADYDYERHFGGVIY +LFLRGVDKEHPQQGIYATRPNAGLIDLMDEMFAGMTLEEA +>test.0417.00002.0003i_00030 2889 ptrA | Protease 3 | 3.4.24.55 | similar to AA sequence:UniProtKB:P05458 | COG:COG1025 
+MPRSIWFKALLLFVALWAPLSQAETGWQPIQETIRKSDKDNRQYQAIRLDNGMVVLLVSD +PQAVKSLSALVVPVGSLEDPEAYQGLAHYLEHMSLMGSKKYPQADSLAEYLKMHGGSHNA +STAPYRTAFYLEVENDALPGAVDRLADAIAEPLLDKKYAERERNAVNAELTMARTRDGMR +MAQVSAETINPAHPGSKFSGGNLETLSDKPGNPVQQALKDFHEKYYSANLMKAVIYSNKP +LPELAKMAADTFGRVPNKESKKPEITVPVVTDAQKGIIIHYVPALPRKVLRVEFRIDNNS +AKFRSKTDELITYLIGNRSPGTLSDWLQKQGLVEGISANSDPIVNGNSGVLAISASLTDK +GLANRDQVVAAIFSYLNLLREKGIDKQYFDELANVLDIDFRYPSITRDMDYVEWLADTMI +RVPVEHTLDAVNIADRYDAKAVKERLAMMTPQNARIWYISPKEPHNKTAYFVDAPYQVDK +ISAQTFADWQKKAANIALSLPELNPYIPDDFSLIKSEKKYDHPELIVDESNLRVVYAPSR +YFASEPKADVSLILRNPKAMDSARNQVMFALNDYLAGLALDQLSNQASVGGISFSTNANN +GLMVNANGYTQRLPQLFQALLEGYFSYTATEDQLEQAKSWYNQMMDSAEKGKAFEQAIMP +AQMLSQVPYFSRDERRKILPSITLKEVLAYRDALKSGARPEFMVIGNMTEAQATTLARHV +QKQLGADGSEWCRNKDVVVDKKQSVIFEKAGNSTDSALAAIFVPTGYDEYTSSAYSSLLG +QIVQPWFYNQLRTEEQLGYAVFAFPMSVGRQWGMGFLLQSNDKQPSFLWERYKAFFPTAE +AKLRAMKPEEFAQIQQAVITQMLQAPQTLGEEASKLSKDFDRGNMRFDSRDKIVAQIKLL +TPQKLADFFHQAVVEPQGMAILSQISGSQNGKAEYVHPEGWKVWENVSALQQTMPLMSEK +NE +>test.0417.00002.0003i_00031 3369 recC | RecBCD enzyme subunit RecC | 3.1.11.5 | similar to AA sequence:UniProtKB:P07648 | COG:COG1330 +MLRVYHSNRLDVLEALMEFIVERERLDDPFEPEMILVQSTGMAQWLQMTLSQKFGIAANI +DFPLPASFIWDMFVRVLPEIPKESAFNKQSMSWKLMTLLPQLLEREDFTLLRHYLTDDSD +KRKLFQLSSKAADLFDQYLVYRPDWLAQWETGHLVEGLGEAQAWQAPLWKALVEYTDELG +QPRWHRANLYQRFIETLESATTCPPGLPSRVFICGISALPPVYLQALQALGKHIEIHLLF +TNPCRYYWGDIKDPAYLAKLLTRQRRHSFEDRELPLFRDSENAGQLFNSDGEQDVGNPLL +ASWGKLGRDYIYLLSDLESSQELDAFVDVTPDNLLHNIQSDILELENRAVAGVNIEEFSR +SDNKRPLDPLDSSITFHVCHSPQREVEVLHDRLLAMLEEDPTLTPRDIIVMVADIDSYSP +FIQAVFGSAPADRYLPYAISDRRARQSHPVLEAFISLLSLPDSRFVSEDVLALLDVPVLA +ARFDITEEGLRYLRQWVNESGIRWGIDDDNVRELELPATGQHTWRFGLTRMLLGYAMESA +QGEWQSVLPYDESSGLIAELVGHLASLLMQLNIWRRGLAQERPLEEWLPVCRDMLNAFFL +PDAETEAAMTLIEQQWQAIISEGLGAQYGDAVPLSLLRDELALRLDQERISQRFLAGPVN +ICTLMPMRSIPFKVVCLLGMNDGVYPRQLAPLGFDLMSQKPKRGDRSRRDDDRYLFLEAL +ISAQQKLYISYIGRSIQDNSERFPSVLVQELIDYIGQSHYLPGDEALNCDESEARVKAHL +TCHHTRMPFDPQNYQPGNLQSYAREWLPAASQAGKAHSEFVQPLPFTLPETVPLETLQRF 
+WAHPVRAFFQMRLQVNFRTEDSEIPDTEPFILEGLSRYQINQQLLNVLVEQDDAERLFRR +FRAAGDLPYGAFGEIFWETQCQEMQQLADRVIACRQPGQSMEIDLACNGVQITGWLPQVQ +PDGLLRWCPSLLSVAQGMQLWLEHLVYCASGGNGESRLFLRKDGEWRFPPLAAEQALHYL +SQLIEGYREGMSAPLLVLPESGGAWLKTCYDAQNDAMLDDDSTLQKARTKFLQAYEGNMM +VRGEGDDIWYQRLWRQLTPETMEAIVEQSQRFLLPLFRFNQS +>test.0417.00002.0003i_00032 324 NA | hypothetical protein | NA | NA | NA +MSASLRNQQGFSLPEVMLAMVLMVMIVTALSGFQRTLMNSLASRNQYQQLWRHGWQQTQL +RAISPPANWQVNRMQTSQAGCVSISVTLVSPGGREGEMTRLHCPNRQ +>test.0417.00002.0003i_00033 408 NA | hypothetical protein | NA | NA | NA +MNREKGVSSLALVLMLLILGSLLLQGMSQQDRSFASRVSMESQSLSRQAIVQSALEWGKM +HSWQTQPAVQCLLYAATGARVCLRLLADNEALLIAGYEGVSLWRTGEVIDGNIVFSPRGW +SDFCPLKERALCQLP +>test.0417.00002.0003i_00034 564 NA | hypothetical protein | NA | NA | NA +MPVKEQGFSLLEVLIAMAISSVLLLGAARFLPALQRESLTSTRKLALEDEIWLRVFTVAK +HLQRAGYCHGSCTGEGLEIVGQGDCVIVQWDANSNGIWDREPVKESDQIGFRLKEHVLET +LRGATSCEGKGWDKVTNPDAIIIDTFQVVRQDVSGFSPVLTVNIHAASKADPQTVVDASY +SVTGANL +>test.0417.00002.0003i_00035 504 NA | hypothetical protein | NA | NA | NA +MKTQRGYTLIETLVAMLILVMLSASGLYGWQYWQQSQRLWQTASQARDYLLYLREDANWH +NRDHSISLIREGTLWCLVSSVAGANTCHGSSVAGANTCHGSSPLVFVPRWPEVEMSDLTP +SLAFFGLRNTAWAGHIRFKNSTGEWWLVVSPWGRLRLCQQGETEGCL +>test.0417.00002.0003i_00036 795 thyA | Thymidylate synthase | 2.1.1.45 | similar to AA sequence:UniProtKB:P48464 | COG:COG0207 +MKQYLELMQKVLDEGTQKNDRTGTGTLSIFGHQMRFNLQDGFPLVTTKRCHLRSIIHELL +WFLQGDTNIAYLHENNVTIWDEWADENGDLGPVYGKQWRAWPTPDGRHIDQITTVLNQLK +NDPDSRRIIVSAWNVGELDKMALAPCHAFFQFYVADGKLSCQLYQRSCDVFLGLPFNIAS +YALLVHMMAQQCDLEVGDFVWTGGDTHLYSNHMDQTHLQLSREPRPLPKLIIKRKPESIF +DYRFEDFEIEGYDPHPGIKAPVAI +>test.0417.00002.0003i_00037 876 lgt | Phosphatidylglycerol--prolipoprotein diacylglyceryl transferase | 2.5.1.145 | similar to AA sequence:UniProtKB:P60955 | COG:COG0682 +MTSSYLHFPEFDPVIFSIGPVALHWYGLMYLVGFIFAMWLATRRANRPGSGWTKNEVENL +LYAGFLGVFLGGRIGYVLFYNFPQFMADPLYLFRVWDGGMSFHGGLIGVIVVMIIFARRT +KRSFFQVSDFIAPLIPFGLGAGRLGNFINGELWGRVDPNFPFAMLFPGSRTEDILLLQTN 
+PQWQSIFDTYGVLPRHPSQLYELLLEGVVLFIILNLYIRKPRPMGAVSGLFLIGYGAFRI +IVEFFRQPDAQFTGAWVQYISMGQILSIPMIVAGVIMMVWAYRRSPQQHVS +>test.0417.00002.0003i_00038 2247 ptsP | Phosphoenolpyruvate-dependent phosphotransferase system | 2.7.3.9 | similar to AA sequence:UniProtKB:P37177 | COG:COG3605 +MLTRLREIVEKVASAPRLNEALNILVTDICLAMDTEVCSVYLADHDRRCYYLMATRGLKK +PRGRTVTLAFDEGIVGLVGRLAEPINLADAQKHPSFKYIPSVKEERFRAFLGVPIIQRRQ +LLGVLVVQQRELRQYDESEESFLVTLATQMAAILSQSQLTALFGQYRQTRIRALPAAPGV +AIAEGWQDATLPLMEQVYQASTLDPALERERLTGALEEAANEFRRYSKRFAAGAQKETAA +IFDLYSHLLSDTRLRRELFAEVDKGSVAEWAVKTVIEKFAEQFAALSDNYLKERAGDLRA +LGQRLLFHLDDANQGPNAWPERFILVADELSATTLAELPQDRLVGVVVRDGAANSHAAIM +VRALGIPTVMGADIQPSVLHRRTLIVDGYRGELLVDPEPVLLQEYQRLISEEIELSRLAE +DDVNLPAQLKSGERIKVMLNAGLSPEHEEKLGSRIDGIGLYRTEIPFMLQSGFPSEEEQV +AQYQGMLQMFNDKPVTLRTLDVGADKQLPYMPISEENPCLGWRGIRITLDQPEIFLIQVR +AMLRANAATGNLNILLPMVTSLDEVDEARRLIERAGREVEEMIGYEIPKPRIGIMLEVPS +MVFMLPHLAKRVDFISVGTNDLTQYILAVDRNNTRVANIYDSLHPAMLRALAMIAREAEI +HGIDLRLCGEMAGDPMCVAILIGLGYRHLSMNGRSVARVKYLLRRIDFAEAENLAQRSLE +AQLATEVRHQVAAFMERRGMGGLIRGGL +>test.0417.00002.0003i_00039 531 rppH | RNA pyrophosphohydrolase | 3.6.1.- | similar to AA sequence:UniProtKB:P0A776 | COG:COG0494 +MIDDDGYRPNVGIVICNRQGQVMWARRFGQHSWQFPQGGINPGESAEQAMYRELFEEVGL +SRKDVRILASTRNWLRYKLPKRLVRWDTKPVCIGQKQKWFLLQLVSGDAEINMQTSSTPE +FDGWRWVSYWYPVRQVVSFKRDVYRRVMKEFASVVMSLQENTPKPQNASAYRRKRG +>test.0417.00002.0003i_00040 162 NA | hypothetical protein | NA | NA | NA +METVVEVFHSYPSFLWITWCKILFIFSDQIWKTRCSVAQLDYRKPKKQYKSEN +>test.0417.00002.0003i_00041 690 mutH | DNA mismatch repair protein MutH | NA | similar to AA sequence:UniProtKB:P06722 | COG:COG3066 +MSQPRPLLSPPETEEQLLAQAQQLSGYTLGELAALAGLVTPENLKRDKGWIGVLLEIWLG +ASAGSKPEQDFAALGVELKTIPVDSLGRPLETTFVCVAPLTGNSGVTWETSHVRHKLKRV +LWIPVEGERSIPLAKRRVGSPLLWSPNEEEDRQLREDWEELMDMIVLGQVERITARHGEY +LQIRPKAANAKALTEAIGARGERILTLPRGFYLKKNFTSALLARHFLIQ +>test.0417.00002.0003i_00042 714 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67127 | NA 
+MLFAWITDPNAWLALGTLTLLEIVLGIDNIIFLSLVVAKLPTAQRAHARRLGLAGAMVMR +LALLASIAWVTRLTNPLFTIFSQEISARDLILLLGGLFLIWKASKEIHESIEGEEEGLKT +RVSSFLGAIVQIMLLDIIFSLDSVITAVGLSDHLFIMMAAVVIAVGVMMFAARSIGDFVE +RHPSVKMLALSFLILVGFTLILESFDIHVPKGYIYFAMFFSIAVESLNLIRNKKNPL +>test.0417.00002.0003i_00043 219 ygdR | putative lipoprotein YgdR | NA | similar to AA sequence:UniProtKB:P65294 | NA +MKKWAVIISAVGLAFAVSGCSSDYVMATKDGRMILTDGKPEIDDDTGLVSYHDQQGNAMQ +INRDDVSQIIER +>test.0417.00002.0003i_00044 1041 tas | Protein tas | NA | similar to AA sequence:UniProtKB:P0A9T4 | COG:COG0667 +MQYHRIPHSSLEVSTLGLGTMTFGEQNSEADAHAQLDYAVAQGINLIDVAEMYPVPPRPE +TQGLTETYVGNWLAKHGSREKLIIASKVSGPSRNNDKGIRPDQALDRKNIREALHDSLKR +LQTDYLDLYQVHWPQRPTNCFGKLGYSWTDSAPAVSLLDTLDALAEYQRAGKIRYIGVSN +ETAFGVMRYLHLADKHDLPRIVTIQNPYSLLNRSFEVGLAEVSQYEGVELLAYSCLGFGT +LTGKYLNGAKPAGARNTLFSRFTRYSGEQTQKAVAAYVDIARRHGLDPAQMALAFVRRQP +FVASTLLGATTMEQLKTNVESLHLELSEDVLAEIEAVHQVYTYPAP +>test.0417.00002.0003i_00045 1194 lplT | Lysophospholipid transporter LplT | NA | similar to AA sequence:UniProtKB:P39196 | NA +MSESVHTNTSLWSKGMKAVIVAQFLSAFGDNALLFATLALLKAQFYPEWSQPILQMVFVG +AYILFAPFVGQVADSFAKGRVMMFANGLKLLGAASICFGINPFLGYTLVGVGAAAYSPAK +YGILGELTTGSKLVKANGLMEASTIAAILLGSVAGGVLADWHILVALVACALAYGGAVVA +NIYIPKLAAARPGQSWNLISMTRSFLNACTSLWRNGETRFSLVGTSLFWGAGVTLRFLLV +LWVPVALGITDNATPTYLNAMVAIGIVVGAGAAAKLVTLETVSRCMPAGILIGVVVLIFS +LQHELLPAYALLMLIGVLGGFFVVPLNALLQERGKKSVGAGNAIAVQNLGENSAMLLMLG +IYSLAVMVGIPVVPIGIGFGALFALAITALWIWQRRH +>test.0417.00002.0003i_00046 2160 aas | Bifunctional protein Aas | NA | similar to AA sequence:UniProtKB:P31119 | COG:COG0204 +MLFSFFRNLCRVLYRVRVTGDTKALKGERVLITPNHVSFIDGILLALFLPVRPVFAVYTS +ISQQWYMRWLKSFIDFVPLDPTQPMAIKHLVRLVEQGRPVVIFPEGRITTTGSLMKIYDG +AGFVAAKSGATVIPVRIEGAELTHFSRLKGLVKRRLFPQITLHILPPTQVEMPDAPRARD +RRKIAGEMLHQIMMEARMAVRPRETLYESLLSAMYRFGAGKKCVEDVNFTPDSYRKLLTK +TLFVGRILEKYSVEGERIGLMLPNAGISAAVIFGAIARRRIPAMMNYTAGVKGLTSAITA +AEIKTIFTSRQFLDKGKLWHLPEQLTQVRWVYLEDLKADVTTADKVWIFAHLLMPRLAQV 
+KQQPEEEALILFTSGSEGHPKGVVHSHKSILANVEQIKTIADFTTNDRFMSALPLFHSFG +LTVGLFTPLLTGAEVFLYPSPLHYRIVPELVYDRSCTVLFGTSTFLGHYARFANPYDFYR +LRYVVAGAEKLQESTKQLWQDKFGLRILEGYGVTECAPVVSINVPMAAKPGTVGRILPGM +DARLLSVPGIEEGGRLQLKGPNIMNGYLRVEKPGVLEVPTAENIRGEMERDWYDTGDIVR +FDEQGFVQIQGRAKRFAKIAGEMVSLEMVEQLALGVSPDKVHATAIKSDASKGEALVLFT +TDNELTRDKLQQYAREHGVPELAVPRDIRYLKQMPLLGSGKPDFVTLKSWVDEAEQHDE +>test.0417.00002.0003i_00047 1032 galR | HTH-type transcriptional regulator GalR | NA | similar to AA sequence:UniProtKB:P03024 | COG:COG1609 +MATIKDVARLAGVSVATVSRVINNSPKASEASRLAVHSAMESLSYHPNANARALAQQTTE +TIGLVVGDVSDPFFGAMVKAVEQVAYHTGNFLLIGNGYHNEQKERQAIEQLIRHRCAALV +VHAKMIPDADLASLMKQMPGMVLINRILPGFENRCIALDDRYGAWLATRHLIQQGHTRIG +YLCSNHSISDAEDRLQGYYDALAESGIPANDRLVTFGEPDESGGEQAMTELLGRGRNFTA +VACYNDSMAAGAMGVLNDNGIDVPGEISLIGFDDVLVSRYVRPRLTTVRYPIVTMATQAA +ELALALADNRPLPEITNVFSPTLVRRHSVSTPSLEASHHATSD +>test.0417.00002.0003i_00048 1263 lysA | Diaminopimelate decarboxylase | 4.1.1.20 | similar to AA sequence:UniProtKB:E0IWI3 | NA +MPHSLFSTDTDLTAENLLRLPAEFGCPVWVYDAQIIRRQIAALKQFDVVRFAQKACSNIH +ILRLMREQGVKVDSVSLGEIERALAAGYNPQTHPDDIVFTADVIDQATLERVSELQIPVN +AGSVDMLDQLGQVSPGHRVWLRVNPGFGHGHSQKTNTGGENSKHGIWYTDLPAALDVIQR +HHLQLVGIHMHIGSGVDYAHLEQVCGAMVRQVLEFGQDLQAISAGGGLSIPYQQGEEAVD +TEHYYGLWNAAREQIARHLGHPVKLEIEPGRFLVAQAGVLITQVRSVKQMGSRHFVLVDA +GFNDLMRPAMYGSYHHISALAADGRSLEHAPTVETVVAGPLCESGDVFTQQEGGNVETRA +LPEVKACDYLVLHDTGAYGASMSSNYNSRPLLPEVLFDNGQARLIRRRQTIEELLALELL +>test.0417.00002.0003i_00049 936 occR | Octopine catabolism/uptake operon regulatory protein OccR | NA | similar to AA sequence:UniProtKB:P0A4T3 | NA +MAAVNLRHIEIFHAVMTAGSLTEAAHLLHTSQPTVSRELARFEKVIGLKLFERIRGRLHP +TVQGLRLFEEVQRSWYGLDRIVSAAESLREFRQGELSIACLPVFSQSFLPQLLQPFLARY +PDVSLNIVPQESPLLEEWLSAQRHDLGLTETLHTPAGTERTELLSLDEVCVLPPGHPLAV +KKVLTPDDFHGENYISLSRTDSYRQLLDQLFTENQVKRRMIVETHSAASVCAMVRAGVGV +SVVNPLTALDYAASGLVVRRFSIAVPFTVSLIRPLHRPSSALVQAFSEHLQAGLPKLVTS +LDTILSSATTA +>test.0417.00002.0003i_00050 693 ygeA | L-aspartate/glutamate-specific racemase | 5.1.1.13 
| similar to AA sequence:UniProtKB:A0A140N890 | NA +MKTIGLLGGMSWESTIPYYRLINEGIKQRLGGLHSAQVLLHSVDFHEIEECQRRGEWDKT +GDILAEAALGLQRAGAEGIVLCTNTMHKVADAIESRCSLPFLHIADATGRAITGAGMTRV +ALLGTRYTMEQDFYRGRLTEQFSINCLIPEADERAKINQIIFEELCLGQFTEASRAYYAQ +VIARLAEQGAQGVIFGCTEIGLLVPEERSVLPVFDTAAIHAEDAVAFMLS +>test.0417.00002.0003i_00051 1419 araE | Arabinose-proton symporter | NA | similar to AA sequence:UniProtKB:P0AE24 | NA +MVTINTESALTPRPLRDTRRMNMFVSVAAAVAGLLFGLDIGVIAGALPFITDHFVLTSRL +QEWVVSSMMLGAAIGALFNGWLSFRLGRKYSLMAGAILFVLGSIGSAFATSVEMLIAARV +VLGIAVGIASYTAPLYLSEMASENVRGKMISMYQLMVTLGIVLAFLSDTAFSYSGNWRAM +LGVLALPAVLLIILVVFLPNSPRWLAEKGRHIEAEEVLRMLRDTSEKAREELNEIRESLK +LKQGGWALFKINRNVRRAVFLGMLLQAMQQFTGMNIIMYYAPRIFKMAGFTTTEQQMIAT +LVVGLTFMFATFIAVFTVDKAGRKPALKIGFSVMALGTLVLGYCLMQFDNGTASSGLSWL +SVGMTMMCIAGYAMSAAPVVWILCSEIQPLKCRDFGITCSTTTNWVSNMIIGATFLTLLD +SIGAAGTFWLYTALNIAFVGITFWLIPETKNVTLEHIERKLMAGEKLRNIGV +>test.0417.00002.0003i_00052 762 kduD | 2-dehydro-3-deoxy-D-gluconate 5-dehydrogenase | 1.1.1.127 | similar to AA sequence:UniProtKB:P37769 | NA +MILNAFSLEGKVAVVTGCDTGLGQGMALGLAQAGCDIVGINIVEPTETIKQVTAQGRRFL +SLTADLRKIDGIPGLLDRAVAEFGHIDILVNNAGLIRREDALEFSETDWDDVMNLNIKSV +FFMSQAAAKHFIAQGNGGKIINIASMLSFQGGIRVPSYTASKSGVMGVTRLMANEWAKHN +INVNAIAPGYMATNNTQQLRADEQRSAEILDRIPAGRWGLPSDLMGPVVFLASSASDYVN +GYTIAVDGGWLAR +>test.0417.00002.0003i_00053 837 kduI | 4-deoxy-L-threo-5-hexosulose-uronate ketol-isomerase | 5.3.1.17 | similar to AA sequence:UniProtKB:Q46938 | COG:COG3717 +MDVRQSIHSAHAKTLDTQGLRNEFLVEKVFVADEYTMVYSHIDRIIVGGIMPVTKTVSVG +GEVGKQLGVSYFLERRELGVINIGGAGTITVDGQCYEIGHRDALYVGKGAKEVVFASIDT +ATPAKFYYNCAPAHTTYPTKKVTPDEVSPVTLGDNLTSNRRTINKYFVPDVLETCQLSMG +LTELAPGNLWNTMPCHTHERRMEVYFYFNMDDDACVFHMMGQPQETRHIVMHNEQAVISP +SWSIHSGVGTKAYTFIWGMVGENQVFDDMDHVAVKDLR +>test.0417.00002.0003i_00054 1182 thlA | Acetyl-CoA acetyltransferase | 2.3.1.9 | similar to AA sequence:UniProtKB:P45359 | COG:COG0183 +MKDVVIVGALRTPIGCFRGALAGHSAVELGSLVVKALIERTGVPAYAVDEVILGQVLTAG 
+AGQNPARQSAIKGGLPNSVSAITINDVCGSGLKALHLATQAIQCGEADIVIAGGQENMSR +APHVLTDSRTGAQLGNSQLVDSLVHDGLWDAFNDYHIGVTAENLAREYGISRQLQDAYAL +SSQQKARAAIDAGRFKDEIVPVITQSNGQTLVVDTDEQPRTDTSAEALARLNPSFDSLGS +VTAGNASSINYGAAAVMMMSEAKARALNLPVLARIRAFASVGVDPALMGIAPVYATRRCL +ERVGWQLADVDLIEANEAFAAQALSVGKMLEWDERRVNVNGGAIALGHPIGASGCRILVS +LVHEMVKRNARKGLATLCIGGGQGVALTIERDE +>test.0417.00002.0003i_00055 1230 yqeG | Inner membrane transport protein YqeG | NA | similar to AA sequence:UniProtKB:P63340 | COG:COG0814 +MSNIWSKEETLWSFALYGTAVGAGTLFLPIQLGSAGAVVLFITALVAWPLTYWPHKALCQ +FILSSKTSAGEGITGAVTHYYGKKIGNLITTLYFIAFFVVVLIYAVAITNSLTEQLAKHM +VIDLRIRMLVSLGVVLILNLIFLMGRHATIRVMGFLVFPLIAYFLFLSIYLVGSWQPDLL +TTQVEFNQNTLHQIWISIPVMVFAFSHTPIISTFAIDRREKYGEHAMDKCKKIMKVAYLI +ICISVLFFVFSCLLSIPPSYIEAAKEEGVTILSALSMLPNAPAWLSISGIIVAVVAMSKS +FLGTYFGVIEGATEVVKTTLQQVGVKKSRAFNRALSIMLVSLITFIVCCINPNAISMIYA +ISGPLIAMILFIMPTLSTYLIPALKPWRSIGNLITLIVGILCVSVMFFS +>test.0417.00002.0003i_00057 351 nlpD | Murein hydrolase activator NlpD | NA | similar to AA sequence:UniProtKB:P39700 | NA +MPYSTADGGNKGIDISAPRGTPIYAAGAGKVVYVGNQLRGYGNLIMIKHSEDYITAYAHN +DTMLVNNGQSVKAGQKIATMGSTDAASVRLHFQIRYRATAIDPLRYLPPQGSKPKC +>test.0417.00002.0003i_00058 2298 xdhA_1 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +MEAREATATGESCMRVDAIAKVTGRARYTDDYVMAGMCYAKYVRSPIAHGYAVSINDEQA +RSLPGVLAIFTWEDVPEIPFATAGHAWTLDENKRDTADRALLTRHVRHHGDAVAIVVARD +ELTAEKAAQLVSIEWQELPVITSPEAALAEDAAPIHNGGNLLKQSTMSTGNVQQTIDAAD +YQVQGHYQTPVIQHCHMESVTSLAWMEDDSRITIVSSTQIPHIVRRVVGQALDIPWSCVR +VIKPFIGGGFGNKQDVLEEPMAAFLTSKLGGIPVKVSLSREECFLATRTRHAFTIDGQMG +VNRDGTLKGYSLDVLSNTGAYASHGHSIASAGGNKVAYLYPRCAYAYSSKTCYTNLPSAG +AMRGYGAPQVVFAVESMLDDAATALGIDPVEIRLRNAAREGDANPLTGKRIYSAGLPECL +EKGRKIFEWEKRRAECQNQQGNLRRGVGVACFSYTSNTWPVGVEIAGARLLMNQDGTINV +QSGATEIGQGADTVFSQMVAETVGVPVSDVRVISTQDTDVTPFDPGAFASRQSYVAAPAL +RSAALLLKEKIIAHAAVMLHQSAMNLTLIKGHIVLIERPEEPLMSLKDLAMDAFYHPERG 
+GQLSAESSIKTTTNPPAFGCTFVDLTVDIALCKVTINRILNVHDSGHILNPLLAEGQVHG +GMGMGIGWALFEEMIIDAKSGVVRNPNLLDYKMPTMPDLPQLESAFVEINEPQSAYGHKS +LGEPPIIPVAAAIRNAVKMATGVAINTLPLTPKRLYEEFHLAGLI +>test.0417.00002.0003i_00059 879 ndhF | Nicotinate dehydrogenase FAD-subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF4 | NA +MFDFASYHRAATLADAITLLADNPQAKLLAGGTDVLIQLHHHNDRYRHIVDIHNLAELQG +ITQAEDGALRIGSATTFTQLIEDPVIQRNLPALCAAAASIAGPQIRNVATYGGNICNGAT +SADSATPTLIYDAKLELHSPRGVRFVPINGFHTGPGKVSLEHDEILVAFHFPPQPKEHAG +SAHFKYAMRDAMDISTIGCAAHCRLDNGNFSELRLAFGVAAPTPIRCQHAEQTAQNAPLN +LQTLEAISESVLQDVAPRSSWRASKEFRLHLIQTMTKKVISEAVAAAGGKLQ +>test.0417.00002.0003i_00060 480 ndhS | Nicotinate dehydrogenase small FeS subunit | 1.17.1.5 | similar to AA sequence:UniProtKB:Q0QLF3 | NA +MNHSETITIECTINGMPFQLHAAPGMPLSELLREQGLLSVKQGCCVGECGACTVLVDGTA +IDSCLFLAAWAEGKEIRTLEGEAKGGKLSHVQLAYAKSGAVQCGFCTPGLIMATTAMLAK +PREKPLTITEIRRGLAGNLCRCTGYQMIVNTVLDCEKTK +>test.0417.00002.0003i_00061 1779 norR | Anaerobic nitric oxide reductase transcription regulator NorR | NA | protein motif:HAMAP:MF_01314 | NA +MELATTQSVLMQIQPTIQRFARMLASVLQLEVEIVDENLCRVAGTGAYGKFLGRQLSGNS +RLLRHVLETKTEKVVTQSRFDPLCEGCDSKENCREKAFLGTPVILQDRCVGVISLIAVTH +EQQEHISDNLREFSDYVRHISTIFVSKLLEDQGPGDNISKIFATMIDNMDQGVLVVDADN +RVQFVNQTALKTLGVVQNNIIGKPVRFRPLTFESNFTHGHMQHIVSWDDKSELIIGQLHN +IQGRQLFLMAFHQSHTSFSVANAPDEPHIEQLVGECRVMRQLKRLISRIAPSPSSVMVVG +ESGTGKEVVARAIHKLSGRRNKPFIAINCAAIPEQLLESELFGYVKGAFTGASANGKTGL +IQAANTGTLFLDEIGDMPLMLQAKLLRAIEAREILPIGASSPIQVDIRIISATNQNLAQF +IAEGKFREDLFYRLNVIPITLPPLRERQEDIELLVHYFLHLHTRRLGSVYPGIAPDVVEI +LRKHRWPGNLRELSNLMEYLVNVVPSGEVIDSTLLPPNLLNNGTTEQSDVTEVSEAHLSL +DDAGGTALEEMEKQMIREALSRHNSKKEVADELGIGIATLYRKIKKYELLNT +>test.0417.00002.0003i_00062 1188 ygeW | Putative carbamoyltransferase YgeW | 2.1.3.- | similar to AA sequence:UniProtKB:Q46803 | COG:COG0078 +MKTVNELIKDINSLTSHLHEKDFLLTWEQTPDELKQVLDVAAALKALRAENISTKVFNSG +LGISVFRDNSTRTRFSYASALNLLGLAQQDLDEGKSQIAHGETVRETANMISFCADAIGI 
+RDDMYLGAGNAYMREVGAALDDGYKQGVLPQRPALVNLQCDIDHPTQSMADLAWLREHFG +SLENLKGKKIAMTWAYSPSYGKPLSVPQGIIGLMTRFGMDVTLAHPEGYDLIPDVVEVAK +NNAKASGGSFRQVTSMEEAFKDADIVYPKSWAPYKVMEERTELLRANDHEGLKALEKQCL +AQNAQHKDWHCTEEMMELTRDGEALYMHCLPADISGVSCKEGEVTEGVFEKYRIATYKEA +SWKPYIIAAMILSRKYAKPGALLEQLLKEAQERVK +>test.0417.00002.0003i_00063 1197 ygeX | Diaminopropionate ammonia-lyase | 4.3.1.15 | similar to AA sequence:UniProtKB:P66899 | COG:COG1171 +MSVFSLKIDIADNKFFNGETSPLFSQSQAKLARQFHQKIAGYHPTPLCALDDLANLFGVK +KILVKDESKRFGLNAFKMLGGAYAIAQLLCEKYHLDIETLSFEHLKNAIGEKMTFATTTD +GNHGRGVAWAAQQLGQNAVIYMPKGSAQERVDAILNLGAECIVTDMNYDDTVRLTMQHAQ +QHGWEVVQDTAWEGYTKIPTWIMQGYATLADEAVEQMREMGVTPTHVLLQAGVGAMAGGV +LGYLVDVYSPQNLHSIIVEPDKADCIYRSGVKGDIVNVGGDMATIMAGLACGEPNPLGWE +ILRNCATQFISCQDSVAALGMRVLGNPYGNDPRIISGESGAVGLGVLAAVHYHPQRQSLM +EKLALNKDAVVLVISTEGDTDVKHYREVVWEGKHAVAP +>test.0417.00002.0003i_00064 1212 argE | Acetylornithine deacetylase | 3.5.1.16 | similar to AA sequence:UniProtKB:P23908 | COG:COG0624 +MAKNIPFKLILEKAKDYQADMTRFLRDMVAIPSESCDEKRVVHRIKEEMEKVGFDKVEID +PMGNVLGYIGHGPRLVAMDAHIDTVGIGNIKNWDFDPYEGMETDELIGGRGTSDQEGGMA +SMVYAGKIIKDLGLEDEYTLLVTGTVQEEDCDGLCWQYIIEQSGIRPEFVVSTEPTDCQV +YRGQRGRMEIRIDVQGVSCHGSAPERGDNAIFKMGPILGELQELSQRLGYDEFLGKGTLT +VSEIFFTSPSRCAVADSCAVSIDRRLTWGETWEGALDEIRALPAVQKANAVVSMYNYDRP +SWTGLVYPTECYFPTWKVEEDHFTVKALVNAYEGLFGKAPVVDKWTFSTNGVSIMGRHGI +PVIGFGPGKEPEAHAPNEKTWKSHLVTCAAMYAAIPLSWLATE +>test.0417.00002.0003b_00065 1386 hyuA | D-phenylhydantoinase | 3.5.2.- | similar to AA sequence:UniProtKB:Q46806 | COG:COG0044 +MRVLIKNGIVVNADGQAKQDLLIESGIVRQLGTDISPQLPCEEIDASGCYVFPGGVDVHT +HFNIDVGIARSCDDFFTGTRAAACGGTTTIIDHMGFGPNGCRLRHQLEVYRGYAAHKAVI +DYSFHGVIQHINHAILDEIPMMVEEGLSSFKLYLTYQYKLNDDEVLQALRRLHESGALTT +VHPENDAAIASKRAEFIAAGLTAPRYHALSRPLECEAEAIARMINLAQIAGNAPLYIVHL +SNGLGLDYLRLARANHQPVWVETCPQYLLLDERSYDTEDGMKFILSPPLRNVREQDKLWC +GISDGAIDVVATDHCTFSMAQRLQISKGDFSRCPNGLPGVENRMQLLFSSGVMTGRISPE +RFVELTSAMPARLFGLWPQKGLLAPGSDGDVVIIDPRQSQQIQHRHLHDNADYSPWEGFT +CQGAIVRTLSRGETIFCDSTFTGKAGRGRFLRRKPFVPPVL 
+>test.0417.00002.0004b_00066 1626 NA | hypothetical protein | NA | NA | NA +MNIFTEAAKLEEQNCPFAMAQIVDSRGSTPRHSAQMLVRADGSIVGTIGGGMVERKVIEE +SLQALQERKPRLFHGRMARNGADAVGSDCGGAMSVFISVHGMRPRLVLIGAGHVNRAIAQ +SAALLGFDIAVADIYRESLNPELFPPSTTLLHAESFGAAVEALDIRPDNFVLIATNNQDR +EALDKLIEQPIAWLGLLASRRKVQLFLRQLREKGVAEEHIARLHAPVGYNIGAETPQEIA +ISVLAEILQVKNNAPGGLMMKPSHPSGHQLVVIRGAGDIASGVALRLYHAGFKVIMLEVE +KPTVIRCTVAFAQAVFDGEMTVEGVTARLATSSAEAMKLTERGFIPVMVDPTCSLLDELK +PLCVVDAILAKQNLGTRADMAPVTIALGPGFTAGKDCHAVIETNRGHWLGQVIYSGCAQE +NTGVPGNIMGHTTRRVIRAPAAGIMRSNVKLGDLVKEGDVIAWIGEHEIKAPLTGMVRGL +LNDGLAVVGGFKIGDIDPRGETADFTSVSDKARAIGGGVLEALMMLMHQGVKATKEVLEV +A +>test.0417.00002.0004i_00067 480 NA | hypothetical protein | NA | NA | NA +MQGFTPEAIDALVQRPECDVILIEADGSRGMPLKAPDEHEPCIPKSSCCVIAVMGGHILG +AKVSTENVHRWSQFADITGLTPAAPLQLSDLVALVRHPQGAFKNVPQGCRRVWFINRFSQ +CENAIAQSELLQPLQQHNVEAIWLGDIQEHPAIARRFVN +>test.0417.00002.0004i_00068 579 mocA | Molybdenum cofactor cytidylyltransferase | 2.7.7.76 | similar to AA sequence:UniProtKB:Q46810 | COG:COG2068 +MSAIDCIITAAGLSSRMGQWKMMLPWQQGTILDTSIKNALQFCSRIILVTGYRGNELHER +YANQSNITIIHNPDYAQGLLTSVKAAVPAVQTEHCFLTHGDMPTLTIDIFRKIWSLRNDG +AILPLHNGIPGHPILVSKPCLMQAIQRPNVTNMRQALLMGEHYSVEIENAEIILDIDTPD +DFITAKKRYTEI +>test.0417.00002.0004i_00069 3099 ygfK | Putative oxidoreductase YgfK | NA | similar to AA sequence:UniProtKB:Q46811 | COG:COG0493 +MGDIMRPIPFEELLTRIFDEYQQQRSIFGIPEQQFYSPVKGKTVSVFGETCATPVGPAAG +PHTQLAQNIVTSWLTGGRFIELKTVQILDRLELEKPCIDAEDECFNTEWSTEFTLLKAWD +EYLKAWFALHLLEAMFQPSDSGKSFIFNMSVGYNLEGIKQPPMQQFIDNMMDASDHPKFA +QYRDALNKLLQNEAFLARHGLQEKRESLQALPARIPTSMVQGVTLSTMHGCPPHEIEAIC +RYMLEEKGLNTFVKLNPTLLGYARVREILDVCGFGYIGLKEESFDHDLKLTQALEMLERL +MALAKEKSLGFGVKLTNTLGTINNKGALPGEEMYMSGRALFPLSINVAAVLSRAFDGKLP +ISYSGGASQLTIRDIFDTGIRPITMATDLLKPGGYLRLSACMRELEGSDAWGLDHVDVER +LNRLAADALTMEYTQKHWKPEERIEVAEDLPLTDCYVAPCVTACAIKQDIPEYIRLLGEH +RYADALELIYQRNALPAITGHICDHQCQYNCTRLDYDSALNIRELKKVALEKGWEEYKQR +WHKPAGSGSRHPVAVIGAGPAGLAAGYFLARAGHPVTLFEREANAGGVVKNIIPQFRIPA 
+ELIQHDIDFVADHGVKFEYGCSPDLTVEQLKNQGFHYVLIATGTDKNSGVKLAGDNQNVW +KSLPFLREYNKGTALKLGKHVVVVGAGNTAMDCARAALRVPGVEKATVVYRRSLQEMPAW +REEYEEALHDGVEFRFLNNPERFDADGTLTLRVMSLGEPDEKGRRRPVETNETVTLHVDS +LITAIGEQQDTEALNAMGVPLDKNGWPDVDHNGETRLTDVFMIGDVQRGPSSIVAAVGTA +RRATDAILSRENIRSHQNDKYWNNVNPAEIYQRKGDISVTLVNSDDRDAFVAQEAARCLE +CNYVCSKCVDVCPNRANVSIAVPGFQNRFQTLHLDAYCNECGNCAQFCPWNGKPYKDKIT +VFSLSQDFDNSSNPGFLVEDCRVRVRLNNQSWVLNIDSEGQFNNVPPELNDMCRIISHVH +QHHHYLLGRVEV +>test.0417.00002.0004i_00070 1329 ssnA | Putative aminohydrolase SsnA | 3.-.-.- | similar to AA sequence:UniProtKB:Q46812 | COG:COG0402 +MLILKNVTAVQLHPAKVQEGVDIAIENDVIVAIDDALTQRYPDASYKEMHGRIVMPGIVC +SHNHFYSGLSRGIMANIAPCPDFISTLKNLWWRLDRALDEESLYYSGLICSLEAIKSGCT +SVIDHHASPAYIGGSLSTLRDAFLKVGLRAMTCFETTDRNSGIKELQEGVEENIRFARQI +DEAKKAATEPYLVEAHIGAHAPFTVPDAGLEMLCEAVKSTGRGLHIHAAEDLYDVSYSHH +WYGKDLLARLAQFDLIDSKTLVAHGLYLSKDDIALLNQRDAFLVHNARSNMNNHVGYNHH +LSDIRNLALGTDGIGSDMFEEMKFAFFKHRDAGGPLWPDSFAKALANGNELMSRNFGAKF +GLLEAGYKADLTICDYNSPTPLLADNIAGHIAFGMGSGSVHSVMVNGVMVYEDRQFNFDC +DSIYAQARKAAASMWRRMDALA +>test.0417.00002.0004i_00071 780 NA | hypothetical protein | NA | NA | NA +MIEQFFRPDSVEQALELKRRYQDEAVWFAGGSKLNATPTRTDKKIAISLQDLELDWIDWD +NGALRIGAMSRLQPLRDARFIPAALREALGFVYSRHVRNQSTIGGEIAARQEESVLLPVL +LALDAELVFGNGETLSIEDYLACPCDRLLTEIIIKDPYRTCATRKISRSQAGLTVVTAAV +AITDHDGMRIALDGVASKALRLHDVETQNLEGNALEQAVANAIFPQEDLRGSVAYKRYIT +GVLVADLYADCQQAGEEAV +>test.0417.00002.0004i_00072 2871 xdhA_2 | Putative xanthine dehydrogenase molybdenum-binding subunit XdhA | 1.17.1.4 | similar to AA sequence:UniProtKB:Q46799 | COG:COG1529 +MIIHFTLNGAPQELTVNPGENVQKLLFNMGMHSVRNSDDGFGFAGSDAIIFNGNIVNASL +LIAAQLEKADIRTAESLGKWNELSLVQQAMVDVGVVQSGYNDPAAALIITDLLDRIDAPT +REEIDDALSGLFSRDAGWQQYYQVIELAVARKNNPQATIDIAPTFRDDLEVIGKHYPKTD +AAKMVQAKPCYVEDRVTADACVIKMLRSPHAHALITHLDVSKAEALPGVVHVITHLNCPD +IYYTPGGQSAPEPSPLDRRMFGKKMRHVGDRVAAVVAENEDIALEALKLIDVEYEVLKPV +MSIDEAMAEDAPVVHDEPVVYVAGAPDTLEDDNSHAAQRGEHMIINFPIGSRPRKNIAAS +IHGHIGDMDKGFADADVIIERTYNSTQAQQCPTETHICFTRMDGDRLVIHASTQVPWHLR 
+RQVARLVGMKQHKVHVIKERVGGGFGSKQDILLEEVCAWATCVTGRPVLFRYTREEEFIA +NTSRHVAKVTVKLGAKKDGRLTAVKMDFRANTGPYGNHSLTVPCNGPALSLPLYPCDNVD +FQVTTYYSNICPNGAYQGYGAPKGNFAITMALAELAEQLQIDQLEIIERNRVHEGQELKI +LGAIGEGKAPTSVPSAASCALEEILRQGREMIQWSSPKPQNGDWHIGRGVAIIMQKSGIP +DIDQANCMIKLESDGTFIVHSGGADIGTGLDTVVTKLAAEVLHCPPQDVHVISGDTDHAL +FDKGAYASSGTCFSGNAARLAAENLREKILFHGAQMLGEPVADVQLATPGVVRGKKGEVS +FGEIAHKGETGTGFGSLVGTGSYITPDFAFPYGANFAEVAVNTRTGEIRLDKFYALLDCG +TPVNPELALGQIYGATLRAIGHSMSEEIIYDAEGHPLTRDLRSYGAPKIGDIPRDFRAVL +VPSDDKVGPFGAKSISEIGVNGAAPAIATAIHDACGIWLREWHFTPEKILTALEKI +>test.0417.00002.0004i_00073 1401 xanQ | Xanthine permease XanQ | NA | similar to AA sequence:UniProtKB:P67444 | COG:COG2233 +MSDINHAGSDLIFELEDRPPFHQALVGAITHLLAIFVPMVTPALIVGAALQLSAETTAYL +VSMAMIASGIGTWLQVNRYGIVGSGLLSIQSVNFSFVTVMIALGSSMKSDGFHEELIMSS +LLGVSFVGAFLVVGSSFILPYLRRVITPTVSGIVVLMIGLSLIKVGIIDFGGGFAAKSSG +TFGNYEHLGVGLLVLIVVIGFNCCSSPLLRMGGIAIGLCVGYIASLCLGMVDFSSVRNLP +LITIPHPFKYGFSFSFHQFLVVGTIYLLSVLEAVGDITATAMVSRRPIQGEEYQSRLKGG +VLADGLVSVIASAVGSLPLTTFAQNNGVIQMTGVASRYVGRTIAVMLVILGLFPMIGGFF +TTIPSAVLGGAMTLMFSMIAIAGIRIIITNGLKRRETLIVATSLGLGLGVSYDPEIFKIL +PASIYVLVENPICAGGLTAILLNIILPGGYRQENVLPGITSAEEMD +>test.0417.00002.0004i_00074 1317 guaD | Guanine deaminase | 3.5.4.3 | similar to AA sequence:UniProtKB:P76641 | COG:COG0402 +MSGEHTLKAVRGSFIDVTRTVDNPEEIASALRFIEDGLLLIKQGKVEWFGEWEDGKHQIP +DTIRVRDYRGKLIVPGFVDTHIHYPQSEMVGAYGEQLLEWLNKHTFPTERRYEDLEYARE +MSAFFIKQLLRNGTTTALVFGTVHPQSVDALFEAASHINMRMIAGKVMMDRNAPDYLLDT +AESSYHQSKELIERWHKNGRLLYAITPRFAPTSSPEQMAMAQRLKEEYPDTWVHTHLCEN +KDEIAWVKLLYPDHDGYLDVYHQYGLTGKNCVFAHCVHLEEKEWDRLSETKSSIAFCPTS +NLYLGSGLFNLKKAWQKKVKVGMGTDIGAGTTFNMLQTLNEAYKVLQLQGYRLSAYEAFY +LATLGGAKSLGLDDLIGNFLPGKEADFVVMEPTATPLQQLRYDNSVSLVDKLFVMMTLGD +DRSIYRTYVDGRLVYERN +>test.0417.00002.0004i_00075 1368 ghxQ | Guanine/hypoxanthine permease GhxQ | NA | similar to AA sequence:UniProtKB:Q46817 | COG:COG2252 +MSGDILQTPDAPKPQGALDNYFKITARGSTVRQEVLAGLTTFLAMVYSVIVVPGMLGKAG 
+FPPAAVFVATCLVAGFGSLLMGLWANLPMAIGCAISLTAFTAFSLVLGQQISVPVALGAV +FLMGVIFTAISVTGVRTWILRNLPMGIAHGTGIGIGLFLLLIAANGVGMVIKNPIEGLPV +ALGAFTSFPVMMSLLGLAVIFGLEKCRVPGGILLVIIAISIIGLIFDPAVKYHGLVAMPS +LTGEDGKSLIFSLDIMGALQPTVLPSVLALVMTAVFDATGTIRAVAGQANLLDKDNQIIN +GGKALTSDSVSSIFSGLVGAAPAAVYIESAAGTAAGGKTGLTATVVGVLFLMILFLSPLS +FLIPGYATAPALMYVGLLMLSNVSKLDFNDFIDAMAGLVCAVFIVLTCNIVTGIMLGFVT +LVVGRVFAREWQKLNIGTVIITAALVAFYAGGWAI +>test.0417.00002.0004i_00076 489 hyfA | Hydrogenase-4 component A | 1.-.-.- | similar to AA sequence:UniProtKB:P23481 | COG:COG1142 +MKSLIIVNPADCIGCRTCEVACVVAHPSEQELNADIFLPRLKVQRLDSISAPVMCHQCEN +APCVGACPVGALTMGEQVVQANSARCIGCQSCVSACPFGMITIQSLPGDPRQQIVKCDLC +ELREEGPACVESCPTQALQLLTERELRRIRQQRIAASSENPL +>test.0417.00002.0004i_00077 1920 NA | Ferredoxin--NADP reductase | 1.18.1.2 | protein motif:HAMAP:MF_01685 | NA +MNKFIAAEAAECIGCHACEIACAVAHNQENWPLSHSDFRPRIHVVGKGQAANPVACHHCN +NAPCVTACPVNALTFQSDSVQLDEQKCIGCKRCAIACPFGVVEMVDTIAQKCDLCNQRSS +GTQACIDVCPTQALRLMDDKGLQQIKVARQRKTAAGKASSDAQPSRSAALLPVNSRKGAD +KISASERKTHFGEIYCGLDPQQATYESDRCVYCAEKANCNWHCPLHNAIPDYIRLVQEGK +IIEAAELCHQTSSLPEICGRVCPQDRLCEGACTLKDHSGAVSIGNLERYITDTALAMGWR +PDVSKVVPRSEKVAVIGAGPAGLGCADILARAGVQVDVFDRHPEIGGMLTFGIPPFKLDK +TVLSQRREIFTAMGIDFHLNCEIGRDISFNELTAEYDAVFLGVGTYGMMRADLPHEDAPG +VIQALPFLTAHTRQLMGLPESAEYPLTDVEGKRVVVLGGGDTTMDCLRTSIRLNAASVTC +AYRRDEVSMPGSRKEVVNAREEGVEFQFNVQPQYIACDEDGRLTAVGLIRTAMGEPGPDG +RRRPRPVAGSEFELPADVLIMAFGFQAHTMPWLQGSGIKLDKWGLIQTGDVGYLPTQTHL +KKVFAGGDAVHGADLVVTAMAAGRQAARDMLTLFDTKAS +>test.0417.00002.0004i_00078 1449 uacT | Uric acid transporter UacT | NA | similar to AA sequence:UniProtKB:Q46821 | COG:COG2233 +MSAIDSQLPSSSGQDRPTDEVDRILSPGKLIILGLQHVLVMYAGAVAVPLMIGDRLGLSK +EAIAMLISSDLFCCGIVTLLQCIGIGRFMGIRLPVIMSVTFAAVTPMIAIGMNPDIGLLG +IFGATIAAGFITTLLAPLIGRLMPLFPPLVTGVVITSIGLSIIQVGIDWAAGGKGNPQYG +NPVYLGISFAVLIFILLITRYAKGFMSNVAVLLGIVFGFLLSWMMNEVNLSGLHDASWFA +IVTPMSFGMPIFDPVSILTMTAVLIIVFIESMGMFLALGEIVGRKLSSQDIIRGLRVDGV +GTMIGGTFNSFPHTSFSQNVGLVSVTRVHSRWVCIASGIILILFGMVPKMAVLVASIPQF 
+VLGGAGLVMFGMVLATGIRILSRCNYTTNRYNLYIVAISLGVGMTPTLSHDFFSKLPAVL +QPLLHSGIMLATLSAVVLNVFFNGYQHHADLVKESVSDKDLKVRTVRMWLLMRKLKKNEH +GE +>test.0417.00002.0004i_00079 126 yqfG | putative protein YqfG | NA | similar to AA sequence:UniProtKB:C1P614 | NA +MNLLMRAIFSLLLLFTLSIPVISDCVAMAIESRFKYMMLLF +>test.0417.00002.0004i_00080 549 idi | Isopentenyl-diphosphate Delta-isomerase | 5.3.3.2 | similar to AA sequence:UniProtKB:Q46822 | COG:COG1443 +MQTEHVILLNAQGVPTGTLEKYAAHTADTLLHLAFSSWLFNAKGQLLVTRRALSKKAWPG +VWTNSVCGHPQPGESNEEAVIRRCRYELGVEITPPESIYPDFRYRATDPNGIVENEVCPV +FAARTTSALQINDDEVMDYQWCDLAAVLRGIDATPWAFSPWMVMQATNREARKRLSAFTQ +LK +>test.0417.00002.0004i_00081 1518 lysS | Lysine--tRNA ligase | 6.1.1.6 | similar to AA sequence:UniProtKB:P0A8N3 | COG:COG1190 +MSEQHAQGADAVVDLNNELKTRREKLANLREQGIAFPNDFRRDHTSDQLHAEFDGKENEE +LEALNIEVAVAGRMMTRRIMGKASFVTLQDVGGRIQLYVARDDLPEGVYNEQFKKWDLGD +ILGAKGKLFKTKTGELSIHCTELRLLTKALRPLPDKFHGLQDQEARYRQRYLDLISNDES +RNTFKVRSQILSGIRQFMVNRGFMEVETPMMQVIPGGAAARPFITHHNALDLDMYLRIAP +ELYLKRLVVGGFERVFEINRNFRNEGISVRHNPEFTMMELYMAYADYKDLIELTESLFRT +LAQDILGKTEVTYGDVTLDFGKPFEKLTMREAIKKYRPETDMADLDNFDSAKAIAESIGI +HVEKSWGLGRIVTEIFEEVAEAHLIQPTFITEYPAEVSPLARRNDVNPEITDRFEFFIGG +REIGNGFSELNDAEDQAQRFLDQVAAKDAGDDEAMFYDEDYVTALEHGLPPTAGLGIGID +RMVMLFTNSHTIRDVILFPAMRPVK +>test.0417.00002.0004i_00082 882 prfB | Peptide chain release factor RF2 | NA | similar to AA sequence:UniProtKB:P07012 | COG:COG1186 +MKQGLEDVSGLLELAVEADDEETFNEAVAELDALEEKLAQLEFRRMFSGEYDSADCYLDI +QAGSGGTEAQDWASMLERMYLRWAESRGFKTEIIEESEGEVAGIKSVTIKISGDYAYGWL +RTETGVHRLVRKSPFDSGGRRHTSFSSAFVYPEVDDDIDIEINPADLRIDVYRASGAGGQ +HVNRTESAVRITHIPTGIVTQCQNDRSQHKNKDQAMKQMKAKLYELEMQKKNAEKQAMED +NKSDIGWGSQIRSYVLDDSRIKDLRTGVETRNTQAVLDGSLDQFIEASLKAGL +>test.0417.00002.0004i_00083 1734 recJ | Single-stranded-DNA-specific exonuclease RecJ | 3.1.-.- | similar to AA sequence:UniProtKB:P21893 | COG:COG0608 +MKQQIQLRRREVDETADLPAELPPLLRRLYASRGVRSAQELERSVKGMLPWQQLSGVEKA +VEILYNAFREGTRIIVVGDFDADGATSTALSVLAMRSLGCSNIDYLVPNRFEDGYGLSPE 
+VVDQAHARGAQLIVTVDNGISSHAGVEHARSLGIPVIVTDHHLPGDTLPAAEAIINPNLR +DCNFPSKSLAGVGVAFYLMLALRTFLRDQGWFDERGIAIPNLAELLDLVALGTVADVVPL +DANNRILTWQGMSRIRAGKCRPGIKALLEVANRDPQKLAASDLGFALGPRLNAAGRLDDM +SVGVALLLCDNIGEARVLANELDALNQTRKEIEQGMQVEALTLCEKLERSRDTLPGGLAM +YHPEWHQGVVGILASRIKERFHRPVIAFAPAGDGTLKGSGRSIQGLHMRDALERLDTLYP +GMMLKFGGHAMAAGLSLEEEKFELFQQRFGELVTEWLDPSLLQGEVVSDGPLSAAEMTME +VAQLLRDAGPWGQMFPEPLFDGHFRLLQQRLVGERHLKVMVEPVGGGPLLDGIAFNVDTA +LWPDNGVREVQLAYKLDINEFRGNRSLQIIIDNIWPI +>test.0417.00002.0004i_00084 711 dsbC | Thiol:disulfide interchange protein DsbC | NA | similar to AA sequence:UniProtKB:P0AEG6 | COG:COG1651 +MKKGFMLFTLLAAFSGFVQADDAAIQQTLAKMGIKSSDIQPAPVAGMKTVLTNSGVLYIT +DDGKHIIQGPMYDVSGTAPVNVTNKMLLKQLNALEKEMIVYKAPQEKHVITVFTDITCGY +CHKLHEQMADYNALGITVRYLAFPRQGLDSDAEKEMKAIWCAKDKNKAFDDVMAGKSVAP +ASCDVDIADHYALGVQLGVSGTPAVVLSNGTLVPGYQPPKDMKEFLDEHQKMTSGK +>test.0417.00002.0004i_00085 897 xerD | Tyrosine recombinase XerD | NA | similar to AA sequence:UniProtKB:P0A8P8 | COG:COG4974 +MKQDLARIEQFLDALWLEKNLAENTLNAYRRDLSMMVEWLHHRGLTLATAQSDDLQALLA +ERLEGGYKATSSARLLSAVRRLFQYLYREKFREDDPSAHLASPKLPQRLPKDLSEAQVER +LLQAPLIDQPLELRDKAMLEVLYATGLRVSELVGLTMSDISLRQGVVRVIGKGNKERLVP +LGEEAVYWLETYLEHGRPWLLNGVSIDVLFPSQRAQQMTRQTFWHRIKHYAVLAGIDSEK +LSPHVLRHAFATHLLNHGADLRVVQMLLGHSDLSTTQIYTHVATERLRQLHQQHHPRA +>test.0417.00002.0004i_00086 522 fldB | Flavodoxin 2 | NA | similar to AA sequence:UniProtKB:P0ABY4 | COG:COG0716 +MNMGLFYGSSTCYTEMAAEKIRDIIGPELVTLHNLKDDSPKLMEQYDVLILGIPTWDFGE +IQEDWEAVWDQLDDLNLEGKIVALYGLGDQLGYGEWFLDALGMLHDKLSTKGVKFVGYWP +TEGYEFTSPKPVIADGQLFVGLALDETNQYDLSDERIQSWCEQILNEMAEHYA +>test.0417.00002.0004i_00087 408 ygfX | Inner membrane protein YgfX | NA | similar to AA sequence:UniProtKB:Q46824 | NA +MVLWQSDLRVSWRAQWLSLLIHGLVAAVILLMPWPLSYTPLWMVLLSLVVFDCVRSQRRI +NARQGEIRLLMDGRLRWQGQEWSIVKAPWMIKSGMMLRLRSDSGKRQHLWLAADSMDEAE +WRDLRRILLQQETQR +>test.0417.00002.0004i_00088 267 sdhE | FAD assembly factor SdhE | NA | similar to AA sequence:UniProtKB:P64559 | COG:COG2938 
+MDINNKARIHWACRRGMRELDISIMPFFEHEYDSLSDDEKRIFIRLLECDDPDLFNWLMN +HGKPADAELEMMVRLIQTRNRERGPVAI +>test.0417.00002.0004i_00089 981 ygfZ | tRNA-modifying protein YgfZ | NA | similar to AA sequence:UniProtKB:P0ADE8 | COG:COG0354 +MAFTPFPPRQPTASARLPLTLMTLDDWALATITGADSEKYMQGQVTADVSQMTEDQHLLA +AHCDAKGKMWSNLRLFRDGDGFAWIERRSVREPQLTELKKYAVFSKVTIAPDDERVLLGV +AGFQARAALANLFSELPSKEKQVVKEGATTLLWFEHPAERFLIVTDEATANMLTDKLRGE +AELNNSQQWLALNIEAGFPVIDAANSGQFIPQATNLQALGGISFKKGCYTGQEMVARAKF +RGANKRALWLLKGSASRLPEAGEDLELKMGENWRRTGTVLAAVKLEDGQVVVQVVMNNDM +EPDSIFRVRDDANTLRIEPLPYSLEE +>test.0417.00002.0004i_00090 660 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67153 | NA +MVQKPLIKQGYSLAEEIANSVSHGIGLVFGIVGLVLLLVQAVDLNASATAITSYSLYGGS +MILLFLASTLYHAIPHQRAKMWLKKFDHCAIYLLIAGTYTPFLLVGLDSPLARGLMIVIW +SLALLGILFKLTIAHRFKILSLVTYLAMGWLSLVVIYEMAVKLAAGSVTLLAVGGVVYSL +GVIFYVCKRIPYNHAIWHGFVLGGSVCHFLAIYLYIGQA +>test.0417.00002.0004b_00091 312 NA | hypothetical protein | NA | similar to AA sequence:UniProtKB:P67603 | NA +MQPNDITFFQRFQDDILAGRKTITIRDESESHFKTGDVLRVGRFEDDGYFCTIEVTATST +VTLDTLTEKHAEQENMTLTELKKVIADIYPDQTQFYVIEFKCL +>test.0417.00002.0005b_00092 984 bglA | 6-phospho-beta-glucosidase BglA | 3.2.1.86 | similar to AA sequence:UniProtKB:Q46829 | COG:COG2723 +MVDFFVRFAEVVFERYKHKVKYWMTFNEINNQRNWRAPLFGYCCSGVVYTEHENPEETMY +QVLHHQFVASALAVKAAHRINPEMKVGCMLAMVPLYPYSCNPDDVMFAQESMRERYVFTD +VQLRGYYPSYVLNEWERRGFNIKMEDGDLDVLREGTCDYLGFSYYMTNAVKAEGGTGDAI +SGFEGSVPNPYVKASDWGWQIDPVGLRYALCELYERYQKPLFIVENGFGAYDKVEDDGSI +NDDYRIDYLRAHIEEMKKAVTYDGVDLMGYTPWGCIDCVSFTTGQYSKRYGFIYVNKHDD +GTGDMSRSRKKSFNWYKEVIASNGENL +>test.0417.00002.0005i_00093 2874 gcvP | Glycine dehydrogenase (decarboxylating) | 1.4.4.2 | similar to AA sequence:UniProtKB:P33195 | COG:COG0403 +MTQTLSQLENSGAFIERHIGPDAAQQQEMLNAVGAQSLNALTGQIVPKDIQLATPPQVGA +PATEYAALAELKAIASRNKRFTSYIGMGYTAVQLPPVILRNMLENPGWYTAYTPYQPEVS +QGRLEALLNFQQVTLDLTGLDMASASLLDEATAAAEAMAMAKRVSKLKNANRFFVASDVH +PQTLDVVRTRAETFGFEVIVDDAQKVLDHQDVFGVLLQQVGTTGEIHDYTALISELKSRK 
+IVVSVAADIMALVLLTAPGKQGADIVFGSAQRFGVPMGYGGPHAAFFAAKDEYKRSMPGR +IIGVSKDAAGNTALRMAMQTREQHIRREKANSNICTSQVLLANIASLYAVYHGPVGLKRI +ANRIHRLTDILAAGLQQKGLKLRHAHYFDTLCVEVADKAGVLARAEAAEINLRSDILNAV +GITLDETTTRENVMQLFSVLLGDNHGLDIDTLDKDVAHDSRSIQAAMLRDDEILTHPVFN +RYHSETEMMRYMHSLERKDLALNQAMIPLGSCTMKLNAAAEMIPITWPEFAELHPFCPPE +QAEGYQQMIAQLADWLVKLTGYDAVCMQPNSGAQGEYAGLLAIRHYHESRNEGHRDICLI +PASAHGTNPASAHMAGMQVVVVACDKNGNIDLTDLRAKAEQAGDNLSCIMVTYPSTHGVY +EETIREVCEVVHQFGGQVYLDGANMNAQVGITSPGFIGADVSHLNLHKTFCIPHGGGGPG +MGPIGVKAHLAPFVPGHSVVQIEGMLTRQGAVSAAPFGSASILPISWMYIRMMGAEGLKK +ASQVAILNANYIASRLQDAFPVLYTGRDGRVAHECILDIRPLKEETGISELDIAKRLIDY +GFHAPTMSFPVAGTLMVEPTESESKVELDRFIDAMLAIRAEIDQVKAGVWPLEDNPLVNA +PHIQSELVAEWAHPYSREVAVFPAGVADKYWPTVKRLDDVYGDRNLFCSCVPISEYQ +>test.0417.00002.0005i_00094 390 gcvH | Glycine cleavage system H protein | NA | similar to AA sequence:UniProtKB:P0A6T9 | COG:COG0509 +MSNIPAELKYSKEHEWLRKEADGTYTVGITEHAQELLGDMVFIDLPEVGATVSAGDDCAV +AESVKAASDIYAPVSGEIVAVNDALSDFPELVNSEPYAGGWIFKIKASDESELESLLDAT +AYEALLEDE +>test.0417.00002.0005b_00095 1164 gcvT | Aminomethyltransferase | 2.1.2.10 | similar to AA sequence:UniProtKB:P27248 | COG:COG0404 +MLGFVVIISPWKSCQPRLFNEDKMAQQTPLYEQHTLCGARMVDFHGWMMPLHYGSQIDEH +HAVRTDAGMFDVSHMTIVDLRGSRTREFLRYLLANDVAKLTKSGKALYSGMLNASGGVID +DLIVYYFTEDFFRLVVNSATREKDLSWITQHAEPFGIEITVRDDLSMIAVQGPNAQAKAA +TLFNDAQRQAVEGMKPFFGVQAGDLFIATTGYTGEAGYEIALPNEKAADFWRALVEAGVK +PCGLGARDTLRLEAGMNLYSQEMDETISPLAANMGWTIAWEPADRDFIGREALEAQREHG +TEKLVGLVMTEKGVLRNELPVRFTDAQGNQHEGIITSGTFSPTLGYSIALARVPEGIGET +AIVQIRNREMPVKVTKPVFVRNGKAVA diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test_runprokka_H299.prt b/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test_runprokka_H299.prt new file mode 100644 index 0000000000000000000000000000000000000000..9339433511af66743d6800d48442963fe04816ba --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Proteins/test_runprokka_H299.prt @@ -0,0 +1,86 @@ +>test_runprokka_H299.0001b_00001 543 NA | 
hypothetical protein | NA | NA | NA +MKTGSEAIRALAMQIPAFRQKLSDGWYQVRIAGRDAGETELSARLNEPLENGAVIHIVPR +LAGAKSGGVFQAVLGAAVMAVAIWMPGVGIMASNLLFSLGASMTLGGVAQMLAPKPKTPR +TQTTDNGKQNTYFSSLDNMVAQGNVLPVLYGEMRVGSRVVSQEISTADEGDGGQVVVIGR +>test_runprokka_H299.0001i_00002 600 NA | hypothetical protein | NA | NA | NA +MSPEDWLSAEMQREIVALVHSHPGGLPWLSEADRRLQVQSDLPWWLVCRGAIHKFRCVPH +LTGRRFEHGVTDCYTLFRDAYHLAGIEMPDFHRGDDWWRNGQNLYLDNLEATGLYQVPLS +AAQPGDVLLCCFGSSVPNHAAIYCGDSELLHHIPEQLSKRERYTDKWQRRTHSLWRHRAW +HASAFTGIYNDLAAASTFE +>test_runprokka_H299.0001i_00003 699 NA | hypothetical protein | NA | NA | NA +MQDIQQETLNECIRAEQSASVVLWEIDLTEVGGDRYFFCNEQNEKGESVTWQSRQYQAYP +IQGSGFEMNGKGSAARPTLTVSNLHGMITGMAEDLQSLVGGTVVRRKVYARFLDAVNFVN +GNSEADPEQEVISRWRIEQCSELSAVSASFVLSTPTETDGAVFPGRIMLANTCTWTYRGD +ECGYSGPAVADEYDQPTSDITKDKCSKCLSGCKFRNNVGNFGSFLSINKLSQ +>test_runprokka_H299.0001i_00004 297 NA | hypothetical protein | NA | NA | NA +MKTENKPSIKTVRFGDGYEQRSPNGLNHSLRVFTCDFKVEANERDSFEKFLARHEGYKSF +FWRPPGINRKIRVVCRTWSATEHITYTDFSCQFDEVVI +>test_runprokka_H299.0001b_00005 936 NA | hypothetical protein | NA | NA | NA +MQASIDNRQQGYDIQIAGYGVGDKNQQRQQELLRIEHGYNNQRLQLERDYADKSRGMSDH +VFQEKMQALNDALEREKEIVRQKNEQLDIQAGDWVSGASQGFNNWLDDTKDISEQIKSTT +TQMFDGMTDALGDFVTTGKANFRSFATSVISDLSRIALKASITGIFDSISNSSSGGILGT +IGSAISKFIPNAKGGVYESPSLSTYSNGIYDSPQFFAFAKGAGVFGEAGPEAIMPLTRTS +DGSLGVRAINSKSGNGGGDITYAPVYQITIQNDGQNGEIGPQAIKALMGMVDQRVQGNLL +NMRRDGGMLSG +>test_runprokka_H299.0002b_00006 543 NA | hypothetical protein | NA | NA | NA +MKTGAEAIRALATQLPAFRQKLSDGWYQVRIAGRDTGETELSARLNEPLANGAVIHIVPR +LAGAKSGGVFQAVLGAAVMAVAIWMPGVGIMASNLLFSLGASMTLGGVAQMLAPKPKTPS +TQTTDNGKQNTYFSSLDNMVAQGNVLPVLYGEMRVGSRVVSQEISTADEGDGGQVVVIGR +>test_runprokka_H299.0002i_00007 744 NA | hypothetical protein | NA | NA | NA +MTETESAILAHARRCAPAESCGFVVRTPEGERYFPCVNISGEPEAYFRMSPEDWLRAEMQ +GEIVALVHSHPGGLPWLSEADRRLQVQSDLPWWLVCRGTIHKFRCVPHLTGRRFEHGVTD +CYTLFRDAYHLAGIEMPDFHREDDWWRHGQNLYLDNLEATGLYQVPLSSAQPGDVLLCCF 
+GSSVPNHAAIYCGDGELLHHIPEQLSKRERYTDKWQRRTHSLWRHRAWRASAFTGIYNDL +VAASTFV +>test_runprokka_H299.0002i_00008 699 NA | hypothetical protein | NA | NA | NA +MQDIRQETLNECTRAEQSASVVLWEIDLTEVGGERYFFCNEQNEKGEPVTWQGRQYQPYP +IQGSGFELNGKGTSTRPTLTVSNLYGMVTGMAEDMQSLVGGTVVRRKVYARFLDAVNFVN +GNSDADPEQEVISRWRIEQCSELSAVSASFVLSTPTETDGAVFPGRIMLANTCTWTYRGD +ECGYHGPAVADEYDQPTSDITKDKCSKCLNGCKFRNNVGNFGGFLSINKLSQ +>test_runprokka_H299.0002i_00009 330 NA | hypothetical protein | NA | NA | NA +MKTFRWKVKPGMDVASAPSVRKVRFGDGYSQRAPAGLNANLKTYSVTLSVPRWEATVLES +FLEEHGGWKAFLWTPPYEWRQIKVTCAKWSSRVSMLRVEFSAEFEQVVN +>test_runprokka_H299.0002i_00010 2580 NA | hypothetical protein | NA | NA | NA +MAEPVGDLVVDLSLDAARFDEQMARVRRHFSGTESDAKKTAAVVEQSMSRQALAAQKAGI +SVGQYKAAMRMLPAQFTDVATQLAGGQSPWLILLQQGGQVKDSFGGMIPMFRGLAGAITL +PMVGATSLAVATGALAYAWYQGNSTLSDFNKTLVLSGNQAGLTADRMLVLSRAGQAAGLT +FNQTSESLTALVNAGVRGGEQFEAISQSVARFSSASGVEVDKVAEAFGKLTTDPTSGLTA +MARQFHNVTAEQIAYVAQLQRSGDEAGALQAANEAATKGFDDQTRRLKENMGTLETWADR +TARAFKSMWDSVLDIGRPDTAQGMLEKAEKAFDEADKKWQWYQSRSHRRGKTSAFLANLR +GAWEDRANAQLGLSAATLQADLEKAREMAAKDWAESEASRLKYTEEAQKAYERLQTPLEK +YTARQEELNKALKDGKILQADYNTLMAAAKKDYEATLKKPKQSGVKVSAGDRQEDSAHAA +LLTLQAELRTLEKHAGANEKISQQRRDLWKAESQFAVLEEAAQRRQLSAQEKSLLAHKDE +TLEYKRQLAALGDKVTYQERLNALAQQADKFAQQQRAKRAAIDAKSRGLTDRQAEREATE +QRLKERYGDNPLALNNVMSEQKKTWAAEDQLRGSWMAGLKSGWSEWEESATDSMSQVKSA +ATQTFDGIAQNMAAMLTGSEQNWRSFTRSVLSMMTEILLKQAMVGIVGSIGSAIGGAVGG +GASASGGTAIQAAAAKFHFATGGFTGTGGKYEPAGIVHRGEFVFTKEATSRIGVGNLYRL +MRGYATGGYVGTPGSMADSRSQASGTFEQNNHVVINNDGTNGQIGPQALKAVYDVARKAA +MDVVTGQMRDGGLFSGGGR +>test_runprokka_H299.0002i_00011 435 NA | hypothetical protein | NA | NA | NA +MFDGELSFALKLAREMGRPDWRAMLAGMSSTEYADWHRFYSTHYFHDVLLDMHFSGLTYT +VLSLFFSDPDMHPLDFSLLNRREADEEPEDDVLMQKAAGLAGGVRFGPDGNEVIPASPDV +ADMTEDDVMLMTVSEGIAGGVRYG +>test_runprokka_H299.0002i_00012 423 NA | hypothetical protein | NA | NA | NA +MFLKTESFEHNGVTVTLSELSALQRIEHLAWLKEQEKKAESSGNLQVSVEDLIRGGAFLV +AMSLWHNHPQKTKLPSMNEAVKQIEQEVLTTWPTEAIAQAENVVLRLSGMSEFVVNNAPE 
+QADDAGPAEPVSAGKCSTVS +>test_runprokka_H299.0002i_00013 741 NA | hypothetical protein | NA | NA | NA +MPVPNPTMPVKGAGTTLLVYKGSGDPYANPLSDVDWSRLAKVKDLTPGELTAESYDDSYL +DDEDADWAATGQGQKSAGDTSFTLAWMPGEQGQQALLAWFNEGDTRAYKIRFPNGTVDVF +RGWVSSIGKAVTAKEVITRTVKVTNVGRPSMAEDRSTVTAATGMTVTPASTSVVKGRSTT +LTVAFQPEGATDKSFRAVSADKTKATVSVSGMTITVKGVAAGKVNIPVVSGNGELAAVAE +INVTNS +>test_runprokka_H299.0002b_00014 156 NA | hypothetical protein | NA | NA | NA +MESRIYPVMSDIPALSDLITSMVASGYDYRRDDDAGLWSSADLTYVITYEM +>test_runprokka_H299.0003b_00015 708 NA | hypothetical protein | NA | NA | NA +MFYVLTTITMFFFYFIRKGKVVKLFFFHYISKNKVYETFIFGLYQLPHVLSSWVRLGYDR +LVLGELISMSYVGGYSVAVQISLVSSVIFQSLNRFWTPFFIKKLKENSKQKKIIVLGGFG +IICITILNILFGYAYFIFFLPTNYSSFSNALPILCMAYMFQGLYFLIVNYIYYHDGNKLI +SIPSVASIAIHIAVAPVLIKHMGYYGAAISLLISWIVLFLFTCVIIFYVRRGYRG +>test_runprokka_H299.0003b_00016 933 NA | hypothetical protein | NA | NA | NA +MGNIFIVESPFQLSNALLYHKKNDSVIVRLNGENKNDFQIEKMLSSFNGKVYIKKASKES +KFDLIRFVLFFAVPVLIANLNKKVIIGNYNSLWMRVMGYLFNPFHFAVLDDGLITIRTIK +RLDDNISRSGSIKKRFLLLLAPRFITQYKIYSNFIQIYNQEINKRKRTTRAIKAGRVCFI +GSPLFDKNVLTFDFYVKCLAAISDNLKRCGYSIEYYPHRSEKNISYLNVFFDDVIKSDDS +IEVYYSASNELPEIFVSFYSSALLNLRSDYPECKFISYKLDCNEINGKFRYEIMEAYNFL +AFSGIEVVTI diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test.0417.00002.fna b/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test.0417.00002.fna new file mode 100644 index 0000000000000000000000000000000000000000..1375f72fee07a61fed2a6a3100b9d5b67c88833f --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test.0417.00002.fna @@ -0,0 +1,2018 @@ +>test.0417.00002.0001 9603 +TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT +AAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGA +GGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCA +TTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATA +ATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTT 
+CCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGC +TAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAA +AGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAG +CGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAA +CGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACA +GGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGA +CCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAA +AGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAA +CGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAA +TGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTG +AGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCA +TTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGC +GCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGG +TTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTA +AACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTG +GTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGG +ATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTG +GTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCT +CATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATA +TTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCT +TCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACC +GCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGAT +TAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCA +GCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACG +CCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGC +AGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATC +TCGGCACCGGCAATCAGGTCAAAATTCCGTCCGAAGTGATGATCCCGGAAACCCGCGAAT +TTGAATTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGAATCGCGATTACGCCT +GCTTCTTCTCGGCGAACTCTGCCCAGAAACCGGCGTTGTACGATACCGCTGACGCCACCG +CCAACAGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATT +ACCTGAAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAAC +TGGAGCTGAATACCTGGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAAC 
+TTCAGGCTTCGCATCCACTGCGCGACGGGAAAGTTATCGTCGAGGACATAGAGGACAATC +CGGGCTTCTTCCGCGTCAGACTCTTTGCCGTGCCGCATTTCCAGATTGAAGGGATGGATA +TCAACCTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGATCGGGCGGTGGTGTGA +TGTATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTT +CAGCAGCAGGCCCGCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGC +CATCCGTGGGGGATCGCAAACGTGCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTG +AAAACGCAGGCAGTACGCCTGCGTTTTGCTGATGGCACGCTGATCGATTCAGACGTGAGT +GACGTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACGACAGCGCGATTGTTTTG +CTGGCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCAGACTGAA +AGACCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGT +GAAGATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAG +GATTACATCACCTGCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAG +GATGAGAGCTATATTCCGCCGTTACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGT +CTGGACACATTGCTGTTGCAGCTACGGGCGAAGTGCCAGCGTCTGATGGCGATGCGCCGG +GAAAGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCTCCCTGTTCTGGCTGCTT +AACGCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGCTGTCCAC +CCCGAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTT +GAGCATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCG +CCCCTGTTCTCCCTGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCG +CTGGATCTGGCGTCCCTGCCGGGCAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTG +CGGGAAGAGGCCGATTTTTATCTGTCCGTTCGTTCCTCACTGCCTGCGCATCAGGTACTG +CATCAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATGTCACGCTGCTTATCAAC +GTGGCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCTGCCGCTG +CGGCTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTG +GAGTCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTG +TTTGCGGTGCTGCGCACATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCG +ACACGTTTCTGACGGTGGTGGAACTGCGTCAGGGAACCACCGTGCGTCACGGTATCGAGC +TGTATCGCCACTGTCAGCGGCAGGTGGAACTGGTCCGCGAACGTCTGAAAGATGCCGGAT +TCAGTCGGGAGAACGTGGAGCACATAACTTACGCGCAGTGCGCCCTGCTGGACGAAACGG +TGCTCAGCCGTAGTGGCATGGACGACGGTCAGGCCATCTGGATGAAAAACCCACTCCAGT +CGCATTTCTTCAACACCCTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGC +TACAGGAACCCGCCCCCGCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGG 
+GATTTCGCGGGCGTTATCAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGC +TCAACGGGCAGGTCGCGCCATTTGGTGTGCTGCCGGAAACGGCGGTACTGAACGTGCCGT +TATCCACCCGTCAGCACCCTTTGCTGCATTCGCCATTTTTCTGGCTGGTAACACTGGCGC +TGCTACTGGCGGGCGTCTGGTGGGGGCTACACCACTGGCTGAACGTGCTGGTGGATGAAC +TGCTGCCGCAAAGCCTGCGTTAAAGGGAGTCGTGAGTGAGGAACACGCTGAAACAGGCCA +TCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTGTGGTCAGTGTTTATCAGTCCGTCTG +GCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTTCTGGCGGTTGCTGCGTTGTTGATTT +ATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGCGATGCCGGGTTGTCATCGCTGCCGC +CGGAAACCTACCGGCAGCCGGTAGTGCTGGTCTGCGGCGGTCTGTCGGCGCACCTGTTCA +CTGACAGCCCGGTCCGGCAGGTTTCAGAAGGGCTGTATCTGCATGTTCCTGATGAAGAAC +AGCTTGTGGCGCAGGTGGAGCGATTGCTGACCCTTCGCCCGGCGTGGGCATCGCAGCTTG +CCGTGGCGTATACCGTCATGCCCGGCATACACCGGGATGTGGCGGTTCTGGCCGGACGGC +TGCGACGGTTTGCCCACAGTATGGCGACGGTGCGTCGCCGGGCGGGCGTAAACGTCCCCT +GGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTGCCGGAAAGAGCGAGTTCACCGTGGT +TTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACATCCACAGAGACCACCATGCCCGCGC +AGTGGATTGCACAATCCGGCGTACAGGAGCGCAGTCAGCGACTCTGTTACCTGCTGAAAG +CTGAAAGCCTGATGCAGTGGCTGAATCTTAATGTGCTGACGGCACTGAACGGCCCGGAGG +CGAAATGCCCGCCACTGGCGATGGCCGTGGGGCTGGTCACCTCGTTGCCAGCGGTGGATA +ACAACCTGTGGCAAGTGTGGATCACCGCCAGAACCGGCCTGACGACGGATATCGCGGACA +CCGGCACAGACGCCACGCTGCCGTTTCCGGATGCTCTGTTACGGCAGTTGCCGCGTCAGT +CGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACCATGCTGGGCATTACCACCGCGGCGG +GTATCACCATGTTGTGCCTGTCAGCCACGGCAAATCGCCAGTTATTACGGCAGGTCGGTG +ACGATCTGCACCGGTTTTATGCCGTCCCGGTGGAGGAATTTATCACCAAAGCCCGTCACC +TGTCGGTGCTGAAAGACAATGCGACCATGCTCGATGGGTATTACCGGGAAGGAGAACCAC +TGCGCCTCGGTCTGGGGTTATACCCCGGCGAACGCATCCGCCAGCCGGTATTACGCGCCA +TTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAGGTGACGGCTTCGCTTCAGGTTCAGA +CCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTCGGACAGGCCCGCCTGAAAGACGGCT +CGACAAAAGTGCTGGTGGATGCGCTGGTGAACATCCGGGCAAAACCGGGCTGGCTGATCC +TCGTGGCCGGATATACCGACGCCACCGGCGATGAAAAAAGCAATCAGCAGTTATCGCTGC +GGCGTGCCGAAGCGGTGCGCAACTGGATGCTGCAGACCAGCGACATCCCGGCCACCTGTT +TTGCCGTACAGGGACTGGGCGAGAGCCAGCCTGCGGCGACCAACGACACGCCACAGGGCC +GGGCAGTCAACCGGCGTGTCGAAATCAGTCTTGTTCCGCGTTCTGACGCCTGTCAGGACG 
+TGAAATAAAACATACCGCCGGAAGAAGGCGGTGCTTCAATCACACTAACAAGGAGAGTAA +TTCTCATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAG +GTTCCGTGGACGTTCAGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATG +TGTACATCCCGACCGACAATAACACCGGCAAACTGACCGGTACCCGTACTCACAAGCCCT +TTACGTTTACCAAAGAAATCGATGCCTCCAGCCCGTATCTCTACAAAGCTGTGACCACCG +GACAGACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACGATGCCGGTCAGGAAG +TGGAGTACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCTTATGC +ACGACATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCT +ACGAGAAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATG +AGCGTCCTTCCGCCTGATAACTGCGGCAGACAGGAAACTGTCTGCCTTTTTGTTGTGTGC +TTTGTCCAGTGCCGCAGGCACCGGTACTGAGCAAAGCATACCCACAATCTGGTGAAACCT +GATGGGCCTGAGTGAGGTAACGGCTATGGGCGGTAGCGTGCCTGAACGCGGATCGCAGGA +ATACAGAACACGATAAGGAACCCTTCTATGACAGGAAATCACTCCGCCGCGCTGCTGCGT +CGCCTTAACCCATACTGTGCACGGGCGCTGGACGCTGCCGCCTCACTGTGTCAGACCCGC +GCCCATGCGGAAATAACCATTGAACACTGGCTGCTGAAACTGCTGGAGCAGGGAGAAGGC +GATATCACGGTGATTGCCCGCCGCTATGAATGGGATATCGACACGCTCTGGCAGTCTCTG +CTGGCACATCTGGACACCTTACCCCGCCCGGTCCGCGAACGTCCTCAACTTTCTGAACCG +CTGGCAGCGCTTATCCGACAGGCGTGGCTGATAGCGTCACTGGAAGGCGACGATCCACAA +ATCCGCAGCCAGCATCTGCTGATGGCGCTGACAGAAAAACCGATGCTGCCCGCCTGTAAT +GACCTGTGGGTATTGCTGAGTCTGAGCCGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTG +GATGCGCAGTCGGATGAATGTCCGGCACGTCAGCCACAGGTCACCGAACCGCTGACCTCT +GCACTGCCGGAGACGGCAACGGCGGACGCACCGGCAAAAACGCTGACGGAGAAACAGGAT +GACGCCCTGCTGGCGGTGCTTAACCGCTTTACCGAAGACGTGACGGAAAAAGCCCGCAGC +GGGCGAATCGACCCGGTATTCGGGCGCGACACGGAAATTCGCCAGATGGTCGATATCCTC +TCCCGTCGCCGCAAAAACAACCCGATTCTGGTGGGAGAACCGGGGGTGGGCAAAACCGCG +CTGGTGGAAGGGCTGGCGCTGCGTATCACCGAAGGCAACGTGCCGGACAGCCTGAAAACG +GTGCATATCCGCACACTGGACCTCGGTCTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAA +TTTGAACAGCGGCTGAAAAATGTCATCGATGCAGTGCAGAAATCACCGGAGCCGGTACTG +CTGTTTATTGATGAAGCCCATACCATTATCGGTGCGGGTAATCAGGCAGGCGGCGCGGAT +GCGGCGAACCTGCTGAAACCGGCACTGGCAAGGGGCGAACTGCGCACCATCGCGGCGACC +ACGTGGAGCGAATACAAACAGTATTTTGAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAG +ATGGTTAAGGTTGACGAGCCGGATGATGACACCGCCTGTCTGATGCTGCGGGGACTGAAG 
+GCTCGCTATGCACAGCACCACGGCGTGCATATGCTGGACAGCGCCATTCAGACCGCCGTG +CGCCTGTCGCGCCGCTATCTGACCGGACGCCAGCTGCCGGACAAGGCGGTTGATTTGCTG +GATACCGCCGGGGCAAGAGTCCGCATGAGCCTTGACACCCTGCCGGAACCGTTGACGCAG +CTTCATGCGCGACTGGCGGCACTGGATATTGAGCGGGAAGCGATTGAGCAGGACAGCGTA +TTTTATCCCGAAGCCAGCCCGGAGCGGCTGGCGGAACTGACCGATTTGCGTGATGAGCTA +CAGGCAGAAGCCGGGCATCTGGAAGCGCAGTATCAGCAAGAAAAGGCACTGGCGCAGCAG +ATTATGACGTTGCGTCAGGAAGGAACAGACAGCTCTGAACTGCAACAGCAACTGCGGACG +CATCAGGGCTTTGCACCGCTGCTGGCGCTGGATGTGGACGCCCGCGCCGTCGCCACGGTG +GTGGCGGACTGGACCGGCATCCCGCTCTCTTCCTTGCTCAAGGACGAGCAGAGCGACCTG +CTCAGTATGGAACAGAGTCTTGAAAACCGCGTTGTCGGGCAAAGCCCGGCGCTCTGCGCC +ATCGCACAGCGGCTGCGGGCGGCTAAGACCGGCCTCACGCCGGAGAACGGCCCGCAGGGG +GTATTCCTGCTGACCGGCCCCAGCGGCACCGGTAAAACCGAAACTGCGCTCACACTGGCC +GACACTCTGTTTGGCGGTGAAAAATCCCTTATCACCATTAATCTTTCGGAATATCAGGAA +CCGCATACCGTTTCCCAGTTGAAAGGTTCGCCTCCGGGCTATGTCGGCTACGGTCAGGGC +GGCGTGCTGACCGAAGCGGTACGCAAACGCCCTTACAGCGTGGTGCTGCTCGACGAAGTG +GAAAAGGCGCATCGCGACGTGATGAACCTGTTCTATCAGGTGTTCGACCGGGGCTTTATG +CGCGACGGCGAAGGGCGGGAAATCGACTTCCGTAACACCGTGATTCTGATGACCGCCAAT +CTGGGCAGCGACCACATCATGCAGCTGCTGGAGGAAAAACCGGACGCCACGGACGCAGAC +CTGCATGAACTGCTGTACCCCCTGCTGCGAGACCATTTTCAGCCTGCACTGATGGCGCGC +TTTCAGACGGTGATTTACCGCCCGCTGGGACAGGAGGCGATGCGCGCCATTGTGGAAATG +AAACTGGCGCAGGTGGCCCGCCGTCTTCACCAGCACTATGGGCTGGAAACGGAAATCAGT +AACAGCCTGTACGACGCCCTGACCGCCGCCTGCCTGCTGCCGGACACCGGTGCGCGTAAT +ATCGACAGCCTGCTGAACCAGCAAATCCTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAG +CAGGCCGTGCATCATAAGCCTGCCCGACTGCGGCTTGACTGGGATGATGAAGACGGGATT +GTGCTGGAATTTGATGAGAAATAATGGAGGCTCTTATGAACGTACAGTTCTTCGACCACG +CACACCACAAGCTCAAAATTCGCGGCCTGAAAAGCCCGGTGGACGTGCTGACGTTTACGG +GCCGGGAACAACTCAGCGCACCCTTCCGCTACGACATTGAATTTACCAGTACCGATAAAA +CCA +>test.0417.00002.0002 22446 +CGATCTGATAGCTAATTGTAAGAAGATAAAGGAAGGCAACGATAAAAACGAGGACACCAC +CTGGGCATGGGTAGCGATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTT +AATTAAAGGGATCTTCAAAGTGCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAG +GGATATTGTACGAGCGATTGATGCTTCCGTTTCCCTGTTTAATAAATTTATCGATTTGCC 
+AGCCGTGCAGGCGACAATGAAGTGGATGAAGATTTATAACCCGTATACGTATGCTGAGAA +GCAGGTCAGGGAACTGATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAAGCTGGATGA +GTTAATGGACGTCACTGGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCAT +TCGCCAGCCGATAGAGGTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACAC +CATGCTTGCAAAAGCGCTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCT +GCACCGGGAAGGGGACGATTATTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTC +TCGCCTGAAAGATGCTGAAGAGGTGGAATTGCTGGCTACCAAAAAGCCAGACTGGGCGGA +TATTGGGGGTAAAGAAAAATATCCACAACTGGAAAAAGCCAGTGCGGAACAGAAAAGATT +AATGGACCCGGAGAATAAGGAGGGCGGCTACCCGAATATTCCTGATGATAAAGTGCAGAC +TTTTCATCAGATGGCTCCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGA +CCCTGGCAGTAGCGATAATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAA +GAGTAAGTCTCAGTGGCGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGA +GTATGTAGTTTATACCGTGCCACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGC +CTCTCAGGTGCGTGAAGTCACAGGTAAGAATGGAGAGAACATTAAAGTCGTGCTGGAAGG +CGGATCACTTCAGATAGTGATAGATCCGACCGTTCTGAATTTGGACTATTTGGGGAAACG +TCAGTCTACAGGATGGGGGTATAGAGATTTTTCTGATGAAGTGGATATGTATATAGGTGT +GCCTCAGTTGCAAACAAATATTTATGTACCTAAATAAAAAGTATCAACAGACAATTAATT +GATAAATCAGGAGATAAAATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGA +ATAATGTCGCCGGAATATTATCGGCGCCGTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTG +TGCGAACGGCAAGTGGCGGAGTGGAGCAAGACCATTCCGCTGGATGTGCGCCGTCGTCCG +CTGTACGAGCAGATTGACGCCGTCTGGGGCGGGCGGGTGTTGCCCAATATCCGCAGCACT +TTAAAGTCGGTACAGTATGACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGCAA +TCCGGGGGCAATATTAGCAGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATG +TCACCCGCCGCGCAAAAACAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAAT +CTAATCAGACGTACCTCGGGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAG +GAAAGTCTGCACGGCCCGCTGGCCCTGCCGATGCAATTACCGTTGTATGAGCTGGATAGC +AGCGTATACCTGCGTGAGGATGACCCGGTAACGGTGGCTGGCCTGTATCTGCCGGATATC +CCAGATGCCAGCGCCCAACTGTTGTACCGGAGTGAACATATTCCCGAGGCTTGGCAGGGG +CGGGTACGAACGAAGTATGTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCGGG +GCGTGGGCAAAATGCAACTGGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTG +CCGCCGGAGGGATTTTTCCCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGC +GAAGCGCAGTATGTAACAGACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCT 
+CATAGCGGGGAGTGGTCGATTTTTGTAGAAGGTAGACAAGCGACGGAGACGCTGGAGCAG +GGAGAGCAGATGCCGGAATGGACGGACAGGAAAATGGAGGGGGAGTATAAAAGAGGTGAG +AAATTCCATGTGCTGTGGTCGCTGATGAACCGCCACGATGGCGGGTCGGTGTGGGTGGAA +GCGTAGCGGTAGCTGGATGTACACGTAAAAACCGGGGAATGGGTGATTTTATTCTGGTTT +ATACAGGAGAGATGAATAATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACA +GTATCAGACAGTGTTTATGCGGATACAGATCAAACATATGATATTTTTTGGGGAATGCTG +GTAAAGGATAAAAAGGATACTATATTTGTTCGCTGTGACAGTCCGTTATTGAAAATGAAA +ATTGTGAGAATGGCGGATGCAAATACAGAAAACATTGATAAGGCATACCAGATATTTAAT +CAGAAAACGAAAAAATCAATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGAGT +GGAAAGTATATTTTCAATATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTG +TCCGATGTGCTTAATGCAATAGATGAACAGTTTCGATAGTTTCGGATAAAATTGTTATTT +TATGCTTTCTTTTTTGATACGTTACGTCAGGTCGTTGTTTTTATAAATCAACAACCTCAT +TTATTAAATAACATAAATCAAAAGCAATGCCATTATGGCCAATGAATTTCAAGTGGATAT +TAAATCTGTTTATTATAAATTTTCCTATTTGTGTTGAAACACCTCTTAAGACTGAATGCT +GAATTACTATATCAAGAGTCACATCAATTCATTATTTCTGATATTAAATTTAATGTTTTA +TTATTTTTATAATATTTAATATTAAAACTGCAATTTCCGTAAAATTATAACATTATGGAG +GACTCAACCATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTT +ATATCTGTGTCATCTTCGATGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAG +ATAAACTGCCCTGTTAAAGGGCATGGTATTAATACCATCATCGAGGGGAGTTTTGATTGG +ATTTCTGATGGCAAACAGGTCGTCGTGAATGGCTGCAGGTGTGAATGTGGCTGTGTTGTT +ATATCCAGTATTGCTGATGCCTTGATTGGATGAATATTATGGGATGGAAACGGACGTATA +CAGAAGAAATAGACAGGCCACAGGATATTTACTTTCATAAGTGGTTATTTTCTTTATTTA +TTTTATGTATATTATTACTCGTTATTTATTATTTTTTCCATGAATTTGTTGTAGCTAATA +ACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTGTGGGTATTGATTCTTTCAGTAC +AGGTAATATTTTATTCCAGAGCTATTCAGGATTATTCAATTTGGCTGGAGAACAGACTTA +GTATCAACAGAGAGTGGGAGGCATGGGGATCAAGATATGTTTCTGTTATGAATAGTAGTC +TTCATCTTCCTGGAAAAGTCGATGTTTTATTCTTGTCTGGTGATGAATTAGAAACTCAGT +ATGGACTTGTCAATAAGTCAGATGATATCACATGGAAGCAACATGATTGGTATGCCTGCT +TTCAGACCCTTACTAATCATCTTGAACTTTATAAACTCCCATATCAACTTACACAAGAAT +TTATTATTCTTACTGATTTTGATGAAAGTATGTACTCTCAGATTGAAGAGGACTTTTTCA +GAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTTTTGTTGCATATTTCCCCTTCAA +TGTCCTTTGGAGAGCTTGATTTATGGTTAAAGGATTCCGAAGAGAAAATATATATTGTCA 
+TGGTGTTGCAGATGGAGGAGCAAACATCCTGTTCGGACGCTATGGCTTGCCTTATGTTTG +CAACTGATGATGTTACTGCTAAGTACAAACTCACTGAAAAGGCCAGAATTTATCGCCCAA +TGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAATATTTTTATTGACACACAAAAAA +TATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAGCGTCTGTTTTCTGTGAGTAGTA +ATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTGAAAATTGATAATATCCATCTTT +TAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTCTGGTTAACGGCAGCGCTGACTA +TTTCGGTGGTTGTTCACAAAAATTCAGATTACTTGATGATGTCCGAAAATAATGATGACT +GGATCATTACCACCATTCATCCTATGGAGCATTCATGAAGAGAATAAATAAAAAAAGTGT +TTTTATATCTAATGTACTTTTATTCTTGGTTATTGTGGCCTTCGTGGGGGGGATCATCTG +GCGTTTTGGTGATCATTTTGGACTGAAAGGGGATGAAAATAATTTTTTTGCGTGGTTGAT +ATGCATTATGACCCTCATTTTTGTACGGGCATCCTGGTATTTCTCTCGATTGTATCGCCT +ACGAAAGGAACAACATCACTCCGAAAAGGAAAGATTACGCCCGGAGAAAGAGGCTCGTAT +TGAATATGGCAAGGTCATAACCCTGAACATTGAGCTAGCTGAGTATTTATGTGCCCTATA +CGGCCCATTCTGGCGGCGTAAAGTCCGCCTGCTGCTGGTGACCGGCGAGCCTGAACAGGC +AGAGGCCATCGCGCCGGGGCTGACCGGGCAACACTGGCTGGAGGGCGACCACAAGGTGCT +GATATATGGCGGCAGGCCATCAGCGGAGCCTGATGTCGCGCTACTGACCGCCTTAAAAAA +ACTGCGCCGCAGCCGCCCGCTGGACGGCATCATCTGGCCGCTGACAGAAGAACAGAGCCG +CCAGACAGCGCAACTCGACAAAGGCTGGCGCGAACTGATAAACGGCGGTAAGCGACTCGG +TTTTCAGGCTCCACTCTATTTGTGGCAGGTCTGTGACAACGGTGATTATCAGACCGGACG +CCCCCTGCAAAGCGTCGGCTGCCTGCTGCCGGAACGCTGTACCCCGGAACAACTGGCTGC +AATGCTGGAAGCACAAACCCTGCCGCTGACGGAACAGGGCATGTCGCAACTGCTGGCAGA +TAACCGCCATGATTTCCTGCTGCGTCTGGCCCATACCCTTGCAGAGCGGGGTATCGCTCA +CTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGCGGCGCATTTTCTTCCCTGCGCCTGCG +TGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTGCCGGAGGCCGCACCTCATGCGTGGCT +GCCGTCACCGGTCTGGGCGGGCGTGACGGGTGATAACGCGCGCGGGCGTGCAGTGGGCTT +TCCGTGGCTACGCGCCGCGCTGATAACCAGCATCTGCATGCTGGCGATATGGGGGGCCGG +AATGACGACCTCGTTCTTCGCCAACCGCGCGCTTGTTCAGGAAACCGGTATCCAGACGGC +ACGTGCGCTTGATACCCGCCTGCCGCTGGCAGAACAACTGGTGGCGCTGCATACCCTGCA +GGGCGAACTGGAACGCCTGCAATATCGTATCCGCGAAGGTGCGCCGTGGTATCAGCGTTT +TGGCCTTGAACGTAACCAACAACTGCTCGCCGCCGCTTTTCCCGGCTATGCGCAGGCGGC +AAACCGGCTGGTGCGCGACGTGGCCGTTGACCATCTGCAACAGCAACTGAACGCCTTTGT +CGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCCACCGGTGAACAACGCTATAAGCAGCT 
+TAAGGCATTGCTGATGACTTCCCGCCCGGAAAAGGCCGACGCTGCCTTTTTCAGTACCAC +GCTGATGGCGGACGGTCTGCGCTACGAGAATATCCCGGAAGGTGTGCGGCAGAGCGTGTT +GCCGTCACTGCTGACCTTCTGGATGGCGAACCTGCCGGAACACCCGCAGTGGAAAACCGC +ACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAAATCCTGCTGCGCCAGATTGGTGTGCG +TAATGCTGAAAACACCCTCTACCAGAACGTGCTGCAACAGGTGTCCCGCAACTACGCCGA +TATGACGCTGGCGGACATGACCGGGGATACGCTCACCGAATCTCTTTTCAGTACGGAACA +GACAGTGCCGGGGATGTTCACCCGTCAGGCGTGGGAAGGACAGGTCAGGGAAGCCATCGA +GCAGGTAGTGACGGCGCGGCGCGAGGAAATCGACTGGGTACTCAGCGACCGCCAGCAGGA +TACCTCTGCGGATATCTCGCCGGATACGCTGCGTAACCGTCTCACCTCACGCTACTTTAC +CGACTTTGCCGGAAGCTGGCTGGCGTTTCTCAACAGCATTCGCTGGAAAAAGGAAGACTC +GCTCTCCGGCATTCTCGACCAGCTGACACTGATGGCCGATGCCCGTCAGTCGCCGCTGAT +TGCGCTGACCGATACCCTCGCGTGGCAGGCGGCGGCTGGCAGGGAAAACCGTGGCCTGTC +AGACTCGCTGGCGAAATCGGCACAGGAACTGTTTAACGGCAAGGAGAAAACGCCGCAGCA +ATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTGGATAAAACCTTCGCGCCGCTGCTGCG +GTTGCTGGGCGATAAAGCCGGAGGCGGAGACAGCCAGCTGAGTCTGCAGACCTACCTTAC +CCGCGTTACCCGCGTGCGCCTCAAACTGCAACAGGTGACCAACGCTCCCGACCCACAGGA +GATGACCCAACAACTGGCGCAGACAGTCTTGCAGGGCAAAACCGTTGACCTCACCGACAC +CCGCGACTACGGACGGTTAATCGCCGCCAGTCTGGGCGAGGAATGGAGTGGCTTCGGTCA +GGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGGCGGCAGGTGCTGACGCCTGCAGCGGA +CAGCCTGAACCGCCAGTGGCACCGGGCGATTGTCAGCCACTGGAATCAGGACTTCGCCGG +GCGCTATCCGTTCAAAGCCTCACAGAATGACGCTTCCCTCCCCCTGCTGGCGCAGTACCT +GCGCGATGACGGGCGCATCAACCAGTTTATTGCCGCCAACCTTTCCGGCGTTCTGAAACG +TGAAGGCCGCTACTGGGTGGCTGACGCCATGAACACGCAGGGGCTGACGGTCAATCCGGA +CTTTATCCGCGCCCTGAACCGCCTGCGCGACGTGGCCGATACCGCCTTTGCCAGCGGCGA +TGCCGGGATACATTTTGAACTGCGGGCAAAACCGGCCCGAGACGTGATGAAAACACATCT +GGTGATTGACGGGCAGGAACTGGAATATTTCAACCAGAAAGAACGCTGGCAGCGTTTTAA +CTGGCCGGATGAACAGTGGCAGCCCGGCGCATCGCTGAGCTGGACCAGTACGCAGGCGAT +GGAGCGCATACTGGCGGATTATCGGGGAAGCTGGAGCCTAATTCGTCTGCTGGAACAGGC +GCAGGTGACACCGGTGGACAGCAGCACCTTTAAAGTGGTGTGGAAAGCGCAGGACGGCCT +GCCACTGAATTACCTGCTGCGGGTTGAACAGGGAAAAGGGCCGCTGGCGCTGCTGGAACT +GAAAAACTTCCGCCTGCCGGGACAGGTATTTCTGACCGGCAGGAGTATGAAGGATGCGGA +AGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGCTGTTTTG 
+CCGACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACATGGCTGC +TGCCGGTGACGGCAGACACGCCGGTCGGGGAAGACCCCGGCTACCACGACGATTTCCTGC +GTATCCGCGACGAGATGAACAAACTTTCCGGCGCGGATACGGACCTCATCTGCCAGCTTG +CCGAATCCCTGCTGCTGACGCAGGCAAAAGACGTGCGCATCGCCACTTACTACATCTGGG +CGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACTGGCGCTGCTGACCGGAC +TGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAAATGGCGC +TGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAAGTGGCAA +AAGAGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTCGCCGCAT +GGCCCGAAGACCAGCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAATCACGTC +TGGCGCAGTCGGGTGGGATGAATGCGGTGGTGCCGCAAAACAGCAGCAGCGTTCCTGCAC +CGTCATCCCCGGTGGATGCGCCACAGGTACAGACCATCACCTCCGGGCGCGACCTGCTCG +ACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCAGGGCTGGCTTTCAGCAC +ACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGATGTGGACG +GCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGGCTGTATG +CCCAGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACCGGTGTCA +GCCATTTCTGGCTGGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCGGGCGCAC +CGTGGGACAGGTGGACAGCCGTTATCCGTCAGGACCTGACGTTACTGCTGGAGCGCCTGC +CGGGACTGGAAAATCTGGCATGGAACGACGGCACACCGTTCGCCGACGAGGTGACGCGCA +ACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATGGCTTGCGGGGAAAGCCG +CTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCACTGGCGA +TGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCGGGCATCA +CCACGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAACAGTACG +GTAAAAACGAGATGGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAGGGAATAA +CGCTGACGCAGTGGGAGCCAGAACTGCTGTTTGAAGTAAAAGCCCGGCAACTGAAACTGC +TGCGCCTGCGGGCACATCGCCACGCGGACAAGGCGGCGCTTGCCCGGAAAATGGACGCTC +TGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGTACTGTGTGATACGCAGC +ATAAGGACTGATTTCTTATTTGTATTTCAGATTAAAGGACTTTGATGGACGACCTGACCC +AACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGTAAAGAATTTGCGCAGG +CTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGCGCACGCGATCCCTATG +TGGAGCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTGCGCGAAAAGCTGGACG +ACGATCTGCCGGAACTGACTGAAGGGCTGGTCAGCCTGCTGTGGCCCCACTACCTGCGAA +CCATCCCGTCACTTTCCGTGGTTGAACTGTCGACAGATCACCGGCAAATGAAGCAGAGCG 
+AAACGCTGAGCGATTTTCAGGTATTGTCGCGCCCTGTTGGCGAGCGCAGAACCCGCTGTT +TCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTGCCGGACGTGTCATTGC +AATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCTTTGAATGCGGCCCGCTGGTCG +GCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTCAATGCCGACAGCCCGG +TAGCCTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAGTTCTGGCTGCGTCTGC +CGGGGCAGGATCGCCGGATGCTTGGCGCACACTTTTCCCCGATGGGCTTTGAGGATGATG +ACAGGCTCTGGCCAAAAGGTGAGTCAGCCTTCAGCGGTTACCAGTTGCTGCTGGAGTATT +TCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCTGAACGGGCTGGAGCAGGTTGCATGGC +CGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAGAACTGGCCTCACGACC +TGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTCATCAACCTGTTCCCGC +TCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTTCTGCTGCGCCCGATGC +GCATTCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATTATTTCTTCGCGCCATA +CCGGCAGTCAGGCATATGTCCCCTTTTCCAGCTTTCGTCACCGGGGCGGGATGCTGCGCC +ACGATGCGCCGGAACGCTATTACCACACGCGGGTAAAGCGCGGCCCTTCCGGCTTGCACG +ACACATGGCTGATTCTGGGCGGCGATGCGTTTGATTCCGACCGGATGCTGGAGGATGAAA +CCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGTAAAGCCTTACAGAGCA +CCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGGGTGCGCAACCTGTGCG +CCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCACTGGCGGGTGCTCAGCC +ACCTCGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATTCTGCGCGGCACGCTGG +CGCTGTACGACTGGACCGAAAGCGAGATGAACCGCCGTCGTCTGGAGGCGATTGTCGACG +TTCAGCACAGCCTGATACAGCGTTTTGAAAGAGGCTTTCTGCTGCGTGGCGTGGATATTC +AGGTGACGCTGGACAGTAACGGCTTTGCCGGAGAAGGTGATATCACGCTGTTTGGTGAAC +TGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTCACTCAACTGACCTTAA +TTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCACAGCCAGCGCGTACCGG +GCTGACCGACCGGCTGGCCCCGGATATTGCGCGGATCAATTTTTACCGTTTTTGCCAGTT +GCTGGAACAGAGCCAGCAGAAAGCGCCGCTGGGCAGTACCGACAACCCCGCCGCCGATGC +GGTGCGTTTTCGCCCCCATCCCGGAATGGGCTTTCCGGTCAGCGAGTTAAAGAACGTTGA +ACGTGACGTGGACAATCCCGACGCGCCACCCACGGTGCGCACCACCTTTCTCGGCCTGTA +CGGCGTGGATTCACCGCTGCCCACCGCCTATCTGGACTACATTACCCAGCGTCATGACGG +ACATGACGCAGTGATGGCGTTTCTCGATATTTTTAACCATCGCTTTATCACCCAGTATTA +CCGCATCTGGCGCAAATATAACTACCCGGCGTCGTTTGAAGCAGGTGCCGTGGATGACAT +TTCCCGTTGTCTGCTGGGGTTAATCGGGCTGGGTATTCCCGGCAGCGAGAACCATATCGC 
+CACGCCTGTATCCCGTTTTCTGGCCCTGCTCAGCGTGATGCGCCTGCCCACCCGCACGGC +TGAAGGCGTCACGGCACTGGTGGGGCTGCTTGCCCCGCTGACGAAAGCCACGGTGGTGCC +TCACGATCCGCAGCCTGTAATTCTCCCGGCCCCTGCGGGTCTGTCAAAAAATTCACGCAT +CAGCCTGAAAACGCGAACGCTGCTGGGGCGTACCGGTACCGACGTCAACAGCCAGTTGCT +GCTGAAACTGTATACCGAAGATGCCGCAGAAGCACGTGGCTGGCTGCCCGGCGGGCAACT +GCACAGCGATTTGCTGGTGCTGCTGCGCGTTTATCTGGGCTGGCGCTGTCAGGCCCGTCT +GCAACTGACGCTGCCCGTCAGCCTGTTGCCTGCTGCCCGGCTGGGAAAACAGCGTGTACA +GATTAGCCGTACCGGCATCCTTCTCGCCTCCTTTGCCGCGCCCGCGACCGGAACAGTGAC +GGTCAGTCTGGGGCGTTATCAGGGATTAATACCCGCTTTTTCCATTCGTAACAGGGAGAG +TATGACTCATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGA +CGGTTGTTCTGAGTGGCTGCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGG +CCTCAGCCGTTTTCTACAAACAAATCAAAATACTGCATCTCGATTTCTTCTCCCGCAGCG +CCCTGAATACGGATGCGGAAGATACGCCGCTTTCCACGATGGTGCATGTCTGGCAACTGA +AAACCCGCGAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGCAGGAAGAGAAGA +CGCTGGAGAAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGCAT +CCCTGAATGTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATC +ACCCTGATGAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCG +ACAAGCCGCGCTCGATTGAACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATA +AATAACCGATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGT +TACCGCTGGAACAGATCAGCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGC +AACGCATTATCAACTGCCGGGCAGGCACGCTGGCGCATTTGCCGGATTACGGTCTGCCGG +ATCTCAGTCTGATCCATCAGGGGATGGCTGCGGGTATTCATGGCCTGATGCGTCAGATTG +AAGAAACACTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGGAATTACTCCCCC +AGCCCCGTCCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTGGA +TACGCTTTGATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAAC +AGGAGCGGGCGTACTGATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGG +CGATCCCTGTACTTATAAGGAATCCGGTGAACTGCAGGCTGAAATGAGTAAACTGACTCA +CCCGGCCCGACCGGATGTGGACTGGCGTCAGGTGGAAAAACTCTGCCTCGCGCTGTTCCG +GCAAAATGGCGTGGAACTACAGACGCTGGTCTGTTACGTACTGGCGATAACCAGACGGCA +GGGGCTGGCAGGGATGGCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCTGGGC +TGACTTCTGGCCGGTACAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAA +AATGCAGCAGGCACTGAGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCG 
+TTGTGTACAGCATCTTTCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATAT +GACGAAACTGGATCTACTGGCCGGGCAGTTTCGCAATACCGCATTGCGTCTGGAACGGCT +GGCGCCTCAGGGAGCGGAAACCACTATCACTCCCCCTGAATTACCCCGCCGGGAAATGAA +TCAACCGAAAAAGTCAGAGGAAAGTCCACAGCCGGTTTTTGCAACCAGATCCGTTCAGCA +AAACGATAAGGATGCCAGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGACATG +GCCGATATTTATGGCCGGAATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGG +CTGGTCGCAGCTTAATCAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCC +ATTACCGCAGTCGCTGGAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCT +GCTGGCTCAGGACAGAACAATTGCGGCAAGTCAGATGCAACTGGAGCAGTTAAACAAATT +GCCTGCCCGCTGGCCACTGGAGCAGGGATATCGCCAGCTACGCCAGCTTGATGCCCTGTG +GCCGGATAATCCTCAGGTCAGGGCGCTGAACGCGCAGTGGCGCAAACAGCGGGAGCTGAG +CGCCCTGTCTGCTGAGGCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGCGCCT +GTCGGCGCAGCTGGATGCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACT +AAAAACGGCGGTGTACGGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCT +TCGGCAACTGGAAGAGCAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAAT +TGATACCCGGTTAAATCAGTTGTTGAATCGCTATGTCATTTTACTGGATACGAAGGTGGA +ACAAAGTCAGTAAACATCGGGGGATTTATGTACCAATAAGGGATATGTGACCTTGCCATT +TTTTAAAATGGAGTCTCTGTGTACAAAAAAAGAGAGGAACAGGCCATTCGATCTACTCGT +TGATTCACATCAGATAATGAGTGTATATTTCGGTAGATAGCTTGGGTTCGGGAACAGTGA +ATACCTTAAGTTTCAAAAGATTGGATTAACCTCTTGACTGTGGCCCCCGCAACCAATTTA +TTAGAATGCTGACAAACCGCAATGTGTTCTACAAATTGCGGTTTTTTTGTATTTAAAATC +TTTGTTCGCTGAACTCACAACACGTTTTTTATCTCCCTTCCTGCGAAGTAATCAATTATC +GACTGGGCAACGTGTATCCCGGTTTGCTGGTATGACTCAACGGTGGCGGCCGCGATATGC +GGCGTTGTAATGATATTTTTGGCATGTAGCAGTGGGCTAAATTGCGCCAACGGTTCAGAG +CTAAACACATCCAGCGCCGCAAACACATTTCGTTCTTCAATCACCTGAAGTAAAGCGCCC +TCATCCAGCAACTTTCCCCTTGCGGCATTGATGATTAGAGCACCATTGCGCATCATCGAC +AAATATTTATGACTAATGAAGTTCTCCAGCTCAGAAGAAAAAGGCAAAAGAACAATGATG +ACATGCGACTGCATAAAGATATCTTCAATTGATACAAACTGAACTCCAGCTTTGTCAGCA +ACCTGATAGTCGGGTTGTTTGTCAAAAGCTAAAAGCTCAACATCAAAACCGGATAACCTT +TTCGCCAGAGTTTTACCTATATTACCGTAGCCAACCAGGCCAATCCGTTTCCCTTGTAAT +TCACAGCCATGCGACTCACCCCAGTAGCCATTTTGCATCGCATGATAGCTGCCAGGGATA +TTTCTCATGCTCGCGAAGATAAGTCCAATGATAAATTCCGCAACCGCATTTGAATTAATC 
+CCAACCGCATTATTGACAACAATACCGGATTGCTGTGCCGCACGAAGATCAATATTGTCT +ATCCCCGTCCCGAATCTCGATATTATTCTCACACCAGGCAGCAATGATAGCGTGTCCGCC +TGATAACCATCTTTTCCGGCGATGACCGCGCAAATAGATTCTCGTAATGCAGTGGATTCT +GATTTAAGCAGATGCTCCACATTATTCTTAATAATAAGATTAAAATTATTCTCTCTTAGC +AACTTGCTGGCGGAAACACAGCGTGCTGAAAAGCTGGGGACGGTGACCAGAACATTTTTC +ATAGCGGACACTCACTTCAAAGAACGCCACCCCAAAAGATGGCGTGACCGGTTACTGTAT +TTATATTTTGAAATTATGAATTTGCTTTAATGCCGAGTGCACCTCCTGGATGATATAAGC +CGAAATCAGCACGAGTAAATTTTTTCAATTCAGAGAGTGCAAGCGCCACCGCATCACCAA +CAACCAGAACAACAGTCGACGAGCATGACGGTGCTAAACCTAAATTATCCGCCTCACTTT +TGACGGGGATTTCAACAGATAAATCACAACTTATCGCAAGCGATGAGTGATGACTGCGGG +TAAAAGAGATCAAATAATTACCCATTTTTTTCAGACTAGGCAGTGTCGCCAGGATTTCCG +CCGTCTCACCACTGTTTGAAATAAGAATAACAACATCGTCTTTCGCCACCATTCCAAGGT +CGCCGTGTACCGCTTCCGTACCGTGAACAAAAAACGAGGGAGTTCCGGTGCTGGCAAATG +TTGCGGCGAGTTTCCTGGCAATAATACCAGACTTACCAACACCAATAAAAACAACTTTCC +CCTGACAAGATTGTAATACTTTAATTAAATTTGCGACCTCCGAAAGAGGGGAATCAATAA +CTTCTTCAACTGCTTTATGTTCGTTACGCATAAAATGTTTAATGAGATGGATAAGATCCG +TGTTATTCATTTTTATTCTCCCTGATTAATATTTTTAATTACACTCACAAGACGCGTAAG +CCCCATATATAATTTTTCTCGACCGCAGGCCAGGTTCAGACGAAGGTAGCCCTCCCCCTC +CGTTCCATAGACATGCCCCGCCATAATGCCCACTTTGCCTTCATGAATTAATCGACTGTA +GAATTCATCAAAAGGATAACCAATAGCAGAACAATCTATCCAGGAAAAATAGCAACCATC +AGCTGGCCTTACGATCAATTCTGGAATATTTTCATTCAGATACTGCTGGGTGAATTGAAT +GTTAGAGGCTATATGTGCCTTTAATGACTTTAACCATCCCTCACATTCGTTGTAGGCAAT +AATAGTTGCAATTATATTCAGTACTGATGGGGAGTTTACAAAATCGCGATACCTCGATAT +CGTTCTGAACTTATGATTAAAATTATCGTCAGTTGAAATCATATACGATCCTGTTAGTGC +AGGAACATTAAATGTTTTCGATATCGAGTTAAATACTACTACTTTTTCTTTTTTTATTTT +AAGCGCGGATGTAAAGCTACGATTAAAAACAAAATCACTATGGATTTCATCTGAACATAA +CCAGACATTATGCCTTGTACAGCTTGCAGCGATTTTATGCAGTTCTTCTTCCGACCAGAC +TGTTCCTGTCGGGTTATGAGGATTACATAATAACATCATCTTTGCGCTTTTAATCTTAAG +ATCAAAATCTTGCCAGTTGATAGCGTAGCCCCCCTCATTTTTTATAATCAAAGAGGCTGT +CAGAATATTTCGCTCGCTATGTTTAATTACATCAAAAAATGCATTATAGACAGGTGTAAA +AACGAGAATATTATCACCATGCGATGTCAATAACTCTATTGCTTTTGCAATAGAGTACAT +CACACTGGGGCTATAGGTTATCCATTCAGGTTTAATATCTGTTTGATATTGTTGATAATA 
+CCAGTTTACTATCGCATTCAGATATTCACCATGTTGCCAACGACTGTACCCTAAAATCGG +GTGTTCCAGGCGTTTTTTTAATGCTCTGGTGATAGCGTCTGGTATCGGAAGATCCATATC +TGAAATAGAGAATGGTAGTACATCTTTTACACCAAATCTGTCCTCGCAAAAGTCCCATTG +GGTACAATATGTTCCTTTGCGGGAAACAGGAGTATTAAAAACATCCATCAGTATATCCCC +ATATAGTTATCCATATCCCGACGCAGGGCGATGACTTTAGTGCCGATAATGACTTGTAGG +GTATTTTGATCAAGTTTTACAACCGCAATCCCGCCAGCTCTTTTTATTGCAACTTCGTCA +ATCAATCTCATATCTGCGATTGTTAAACGTAAACGAGTTACGCAATTATCCAGTGACTTA +ATATTCTCTTTACCACCAAGTGCCTTAACCATCTGCTCCGCCGCTTGCAGCTCTGATTTA +TCAGGAGTTGGGATATCCGCTATAGCCGTATCTTCGTGAGCGTTCAGCGTAACAGGACTG +GACTCTTCACGGCCTACGGTCATCAGGTTAAATTTAAGGATGGTCCAACGGAACACAAAG +TAATAAATGAAGAAATAGGCCACTTCGACACACACCGCGATCGGCCAACCTGTTCTTGTG +CCACGCAATACGCCAAAGCTAATAAATTGAATCAGATCACCAGTAAATCCCATCTTCACC +CCCATATATGGCAGAACCATGTTAGCGAATCCATTCATAAAGGCATGGAAGACAAACAGC +AGTGGACTGACAAATAAGAACAGAAACTCAATCGGTTCGCTGACGCCGCCAATAATCACC +GTAAGCACCCCGGAAATAAGCAATGCTTTGATAGCCTTTCTGTTTTGAGCATGAGCAGTG +CGATACATCGCCAGCGCGGCACCAGCCAGACCATACTGAATCATCAGTTTGCCCTGCTCC +ATTTTCCCCGCCAAATCCAGCGGAATGACCGCATTCTCTTTGACGTATGCCATAAACATG +TTCAGGGTGCCGTAATATTCTTCGCCGCCAATCACAGCCGAACCGCCGATTGGCGTAAAG +CGGAAAACTGACGTCACCAGATGGTTTAAGCCAAAAGGAATCGTCACGCGTTCGGCAACT +GCATAGAAGAAATAACCAACAGGACCGGAAGTTGAAATCCAGTGGCCAATGAGCATGAAA +AGATTGAAAAACGGCGGCCAGATAAAAGGAATGATCAGACCAAATCCACTCATCACAATC +AGTGTAATGATAGGCACCAGACGTGGGCCGCTATAAAAACCTAACGATTCAGGAATGCGT +AAATTAACGATCTTTTTATACATGCTGGCGACTAATAACCCAGCAACAATTCCCCCCAAC +ACGCTGGTATTGTAGGACTGGATCCCCAGAATGATGGTTTGCCCATGTGTCGACATTTGG +TCAGCAACGACCAATAAGTCGTGCTGTTTAAGATAAAAGTTCGTTCCCAAATGCATCGCC +ATAAAACCAATTAAGCCAGAAAAAGCACCATAGGCTTTATCCTCTTTATCTTTTAATAAT +CCTAAGGGAATCGCTATCGCAAACAATACAGGTAAATTAACAAAGGCAAACAAACCAAGA +CTAACAATGAAATCAAGTATGGTTTTAATTATTGGAATAGCCAGAAATGGAATTAACTTT +GCCATATCATCACTGGCTAAACCACTTCCCAGCCCTAGCATCATGCCACATACACTTAGC +AGAGCAATGGGATACATAAATGCCTTCCCCAGGCTCTGAAAAAAACTCCAGGCTTTCTTT +TGTTTCATGTGGGTTATCTCATATAAATGTTATATATAATTAGTCCATTAATACTTTGGT +ACGAATAGAGAGATATAATTTTTCTTCTAAAATTAATTCATATTTAAAAGTGGCATACAG 
+ATACCGTTCAATTTCATGAATTGCGCGCTGTAACAGGATGTCCTTTTCAAGAAACTGTTC +ATAGATATCACCAATATCTTTCTGTTTTATTTTTTCATTGCATAACACGCGACTTGAAAA +ATATTTAAGGTGCATCATAAATCTGGAATAGTTAAATGAACTTCTGTCCACCTTTCTGTT +ATAAACAACTTCAATAAGCTCCGTGATTATTTGCGACAACTCAATAATCCGTACTGATTC +ATAATCAACTGAATTTTCATAATTATTTAAAATATGCAATGCTATAAAACCAATCTCATC +ATCAGGAAGTTGAACGCTGAATTGCTCATTAATGATAGTTAATGCATCGCGACTTATCGC +ATACTCTGCTTTGTACAACGCTTTGATTTCATCAAGGAAAACATTATTAATTTGTATACC +TGAAACGACTCGGGATATTGCATTCGAAATGTGATCCGCAAGAATCAATAGTAGCGATGG +ATTGAGATTTTTTTCGAGATTTTTCTCCGCATATTGCACTATTTTTTCGGCAACAAACAC +ATACTCAATATCTACATGTTCAATCAATTTATAAAGTTTGTTTTTTTGTTCATTTCTGAC +ATAAAAAATCCGGTTAGCCGGATGCTCAGGGACCGACATTCCATATTTTTTGTTGTAACC +GACGCCAGGCCCAGAAATGATAACCTCCTGTCCATTCATCGATGCCTGTACACAATTATT +GTTCATGACTTTTTCGATGATCATTCCATGGCTCCAAAAAAAAAGGCAAGGCACGTCAGA +AGTAATAACTACTTCAAACATTGCCTTGCCTGATTTAACAGTTACAAGATGATTAACTAA +TGCGTATACATTACACGGAATTGTGCTTAATTAAAGAGATGGTCGGCTTATTTTTCAAGC +CGACATTCAAATATCCGACATCAGTCACAAAACCAGCGTCTAATATTCAGGTAAATGTTA +TCTATTCAACGAAATATAAATTCATTGAATAAATAAAAACATTATCCCCTTCTCGCCAGC +GTCGCCCCATCGGCAAAATACGCTTTAATTCCCGCAAGAATAGACTCCGCAACTTCCTGC +TGGAAAGTCGCCGTTTTCAGTTTACGCTCTTCCTCAACGTTACTGATAAACGCCGTTTCG +ACCAGAATGGAGGGAATATCTGGTGCCTTTAGTACGGCAAACCCGGCCTGTTCAACTTGA +TTTTTATGCAGCTTGTTGATTTTACCGAGCTTATTCAGCACCGCTTTACCAAACTTAAGG +CTGTCGGCAATGGTCAGCGACTGCACCATATCGAACATGGTGTGGTCGACATAGCGGTCA +CCGCTTTTGCTTACGCCACCAATCAAGTCCGAGGCGTTCTGGGTTTGTGCCAGATATTTT +GCCGCAGTACTGGTTGCGCCTTTGGTTGAGAGCGCAAACACCGAGGAACCGCTCGGCTGG +CGACTGGTAAAGGCGTCGGCATGGATAGAAACAAACAAGTCAGCGCGCTGTTTCTGGGCT +TTTGCTACGCGCACTTGCAACGGAATGAAGATGTCTTCATTGCGCGTCATGTACACCTTC +ATATTGCCCTCTTTCTCGATCAGAGAGCGCAGACGGCGAGCTATTTGCAATACCACGTCT +TTTTCGCGCGTTTTGTATTTCCCCACCGCACCGGAGTCTTCGCCACCGTGGCCAGGGTCA +AGCATAATGACAATCGGACGATCCCGCCCAGCTTTACCCGGTTGTGGACCACTTTGTGCT +GGCGGCACCTGCTTTTCGAGGTCGCCTTTGTTGTAATCCTCCAGCAGCGCCAGCAGCGGG +TCCTGCATATCCTGTGCATTGGCCGGATAGAGGTCCATCACCAGACGCTCTTTAAACCCG +GCGACCGGCGCAAGGGCAAACAGCTGCGGTTTTACGTTTTGCTTTAATTCAAAAACCATA 
+CGTACGGTTTGCGGGTCAAATTGCCCGACGCGCGCCGACTTGATGAACGGGTCGTCAGCG +CGGATTTGCGCAGCCATCCCCTTGAGCACCGAGTTCAGGTTTACATCTTCGATATCCACC +ACCACGCGTTCAGGATTACTCAACGCGAACTGCTTATATTTCAGCTGACGATTTGATTCT +ACCGTCACGCGGGTGTAGCTGGACGCAGGCCAGACGCGCACCGCCACGACCTGGCTGACC +GCAGCCAGGCTGACCTGACTTACGCTCAATAGCCACATGGCACCCGCGCCTTGCAGTAAA +CGACGACGGCTGATTGCAGTGTTGGATCCTGACATGCCTCTCCCGAGCAAAAGAAATCTA +AGCTGTGTAACAAGTAAACGACCAATTTGACCGGAAACTTTAGCGAAAGACGCATAATCT +GTCATCTATAAAACGGTAAACATTCTTTTTATATTCACGGTATTACTGATAAAAAACTCG +CTCCCGCATAAAATTTACACTTGCACCCTGCGAAAAAACAGAATAAAAATACAATAATTT +CGAATAATCATGCAAAGAGGTGTACCGTGGTAAAGGAACGTAAAACCGAGCTGGTCGAGG +GATTCCGCCATTCGGTTCCCTATATCAATACCCACCGGGGAAAAACGTTTGTCATCATGC +TCGGCGGTGAAGCCATTGAGCATGAGAATTTCTCCAGTATCGTTAATGATATCGGGTTGT +TGCACAGCCTCGGCATCCGTCTGGTGGTGGTCTATGGCGCACGTCCGCAGATCGACGCAA +ATCTGGCTGCACATCACCACGAACCGCTGTATCACAAGAATATACGTGTGACCGACGCCA +AAACACTGGAACTGGTGAAGCAGGCAGCGGGAACATTGCAACTGGATATTACTGCTCGCC +TGTCGATGAGTCTCAATAACACACCGCTGCAGGGCGCGCATATCAACGTCGTCAGTGGTA +ATTTTATTATTGCCCAGCCGCTGGGCGTCGATGACGGCGTGGATTACTGTCATAGCGGGC +GTATCCGGCGGATTGATGAAGACGCGATCCATCGTCAACTGGACAGCGGTGCAATAGTGC +TAATGG +>test.0417.00002.0003 51012 +GGCCGGTCGCTGTTTCGGTCACTGGCGAGAGCTTTAATCTGACCTCGGAAGAGATTGCCA +CTCAACTGGCCATCAAACTGAAAGCTGAAAAAATGATTGGTTTTTGCTCTTCCCAGGGCG +TCACTAATGACGACGGTGATATTGTCTCCGAACTTTTCCCTAACGAAGCGCAAGCACGGG +TAGAAGCCCAGGAAGAGAAAGGCGATTACAACTCCGGTACGGTGCGCTTTTTGCGTGGCG +CAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGCTGTCATTTAATCAGTTATCAGGAAGATG +GCGCGCTGTTGCAAGAGTTGTTCTCACGCGACGGTATCGGTACGCAGATTGTGATGGAAA +GCGCCGAGCAGATTCGTCGCGCAACAATCAACGATATTGGCGGTATTCTGGAGTTGATTC +GCCCGCTGGAGCAACAAGGTATTCTGGTACGCCGTTCTCGCGAGCAGCTGGAGATGGAAA +TCGACAAATTCACCATTATTCAGCGCGATAACACGACTATTGCCTGCGCCGCGCTCTATC +CGTTCCCGGAAGAGAAGATTGGGGAAATGGCCTGTGTGGCAGTTCACCCGGATTACCGCA +GTTCATCACGGGGCGAGGTTCTGCTGGAACGCATTGCCGCTCAGGCGAAGCAGAGCGGCT +TAAGCAAATTGTTTGTGCTGACCACGCGCAGTATTCACTGGTTCCAGGAACGTGGATTTA +CCCCAGTGGATATTGATTTACTGCCCGAGAGCAAAAAGCAGTTGTACAACTACCAGCGTA 
+AATCCAAAGTTTTGATGGCGGATTTAGGGTAAGCGATGAAAATCGCCGGATGCGACATGC +GTAACACTCGTGCGTCGCATCAGGCAATTACGTTTATCCCCGTGAACTAAACAACGCCGC +CAGACCACTGCGCCGCTCAGTACGAGTGGCGATTGCCGCACTTAATATGCGCTCATCGGC +ATACAGCGACAGACGGCGACGCGCGCGGGTCACCGCGGTGTAAACCAGCTCTCGCGTTAC +TACCGGCGTGCGTTGACTCGGTAAAATCAACGCCGCATGGTCGAACTCCGATCCCTGCGA +TTTATGTACCGTCATCGCCCACGTCGTTTCGTGCTCTGGCAGGCGACTCGGTTGCACAGA +CTTAATATTGCCGTCCGGCATCGCAAACCAGACGCGCGTCCCCTGCCCGCGATCCAGCGC +AATACCAATATCGCCATTAAACAACCCAAGCGCGCTGTCATTACGGGCAATCATCACTGG +TCGGCCTTCGTACCAACGAGAGTGCGGATGACGATGAATTTTGCGCTTCTGTTGCATAAA +CTGCTCAATTCGCTCATTCAGTCCAGCCACGCCAAACGGCCCTTCCCGCAGGGCGCACAA +AAGCTGGTACTCATTGAACGCCTGAATGATTAAATCCGGCTCGGCACGCGCTTGCAGCAG +ATCCAGATAACGCCCGTAACCCGCAAGAGCTTCCTCAAGCATCGCAATATAATCTTCGCC +ACTCTGTAAAAGCCGTTTTTCGATATCAGTAAAATCCTGCTGAAAAACGGTTTTCACTGC +CGTTTTATCACCACGGTTAATCGCCGCAGCTAACTGACCAATGCCAGAATCGCTGCCGAA +ACGATAGCTTTTTTGCAGCAGGCAGAGGCTGTCGCGCAAAGATGCCGCTTCTGTGCCAGT +TCCTGCCGGAACGTGGCTTCCCGTCAGGCGGCTCAACTGCCCGGCACGCTCGGCGGTAAA +GCCCGCGTTGGCATAAGCGCAGATATCGCCCAGCACAGCCCCAGCCTCAACCGAGGCCAG +TTGATCACGATCGCCGAGAAAGATCACTCGCGCATGATCGGGCAAGGCGTCGATCAGTCT +CGACATCATAGGAAGATCGATCATTGACGCTTCATCTACCACCAGCACATCAAGATGCAG +CGGGTTACCGGCATGATGACGTAAACGCTGGCTACCCGGCTGCGCACCCAGCAATCGGTG +CAAAGTGCTGGCATCTTCCGGAATGCGTTTCTTTTGTTCATCGGTCAGCGGTAATTGTCG +CAAAGCCTTGCCGAGAGATTCGGTTAAGCGCGCGGCAGCTTTACCCGTTGGTGCAGCCAG +ACGGATACGGCAGCGTTCGCCGTCGGCCATTTGAATTAACGCTGCCAGTAACTTCGCTAC +GGTGGTCGTTTTACCGGTGCCAGGACCACCGGAAATCACCGAGATCCGCCGTGTCAGCGC +CACTGCCGCCGCAACTTTTTGCCAGTTAATTTCATCGCTTACTGGAAAAAGTTTGTCCAG +GGTTTGCGCCAGTAGAGCTTCATCAACCTCAATGGCATGATTCACTTCGTTGAAAAAGCG +TGCCACTGTGCGCTCGTTACACCACATGCGATTCAAATAAAGACGATCGCCACAGAGGAT +CATCGGCGTTGGTTCATCTCCCCGGCTGACCGCTTGTGAAGCCAGCAAGCATTCTTCCCA +ATTTTGTAGCTCACCGATTTCACTGACACAGGTCGCCAACAGCGGATGCGATGCCTCGTT +ATTTTCCAGTCGTGAAAGCGGCAAACAAACGTGTCCCTCTCCGGCATCATGACTTAATAG +TGCCGCCGCGAGGGTGACGGCAGGATGTTCATCTCCCGCCACGGTCAGGGCAAACTGCAC +GTCCAGCGGGCGTAGCTGTTTGTGCTCCACAGCTTCCAGTAATTGCTTTTGCAATTTCAT 
+TACGCCTCCTCCAGGGTCATACCGGCAAACATCTCATCCATCAGGTCAATCAACCCGGCG +TTGGGTCGGGTCGCGTAGATCCCTTGTTGCGGATGTTCTTTATCAACGCCACGCAGGAAC +AGATAAATAACGCCGCCAAAGTGGCGCTCATAGTCGTAATCAGCAATACGATGGCGCAGA +TAACGGTGCAGCGCCAGGGTATAAAGCTGATATTGCAGATCATAGCGGTGTGCCTGCATT +GCCGCTGCCATAGCCTGTTGGGTGTAAGCCGAACTGTCTTCACCCAACCAGTTGGATTTA +TAGTCGAGCAGGTAATAACGCCCTTCGTGGCGGAACACCAGATCGATAAAGCCTTTTAAC +ATGCCACGTACCTGCATGAACTCCAGCGGCGGGCAGCCAGCGGATAGCGGGTCAAACTGG +CGAATTAGTGCATCAAGCTGGCTGGCGATGAGCGGTTCGCTAATTGGCAGGTAAAACTCC +ATCTCCACCTGTTTATCGCGATCGGAAAGCTGATTCAGGCTAACACCCGTTTCATTGAGA +GGTGCCTGGAGGACAGCCGTGATCCACTCAGTCAACACCGGTTCCCACTGCGGTTCAAAG +CCACCGAGCTCCAGTTTTTCCTGTACCCAGTTCGGGTCAACCGGCTGGGTAAAATCGAGG +TCTTCAAACAAACTGTGCAAGAATGTCCCCGGTGACGCACCGCGCGGGAACTGATGCGGT +GTTAACGTCGGTTCTTCAACGACGCTGACCACGCCTGCGGCATCAACATCCAGCCGTGGC +ATCAGATCCTGAGCGATACCGTGACCACGCTGCTGCAAACCGGAGTAGCTGGTGACACGC +CAGTTATCGCCGGGCAATCGTTGTAGCGTCCTCGCATTCAGTTCTGCAGTTAATGCATCA +TTAACCTGCCAGGGCTGGTTATCACCAATTTGTGCCGTTTGCCAGGCAATATCATCATCG +CACAACGCTTCAATGCAGGTACGAAGCCCTGCCGCATCTTGCGGTTCTCCTTTTTGCAGC +AAACGCCCGAGCGCACTTTGGTGGACGTCGGTATCACCTTTTTTATCGCCACGACGGCGC +ACCAGCGGTGCAACGCCGAGACTGCAATGCCAAACCGAACGCGTCAGCGCCACGTAAAGT +AAACGCAGATCTTCCGCCAGACGTTCGGCCTCCGCGAGGTCGACGCTTTCTGGCGCAGCA +TTAAGATCCAGAACGGCCTCAAACGAGTGGCGATCGTGATAAAACGCCTGATCCTGGACG +CGGAAATTGGTAATAAATGGCAACCAGACCAGCGGATATTCCAGCCCTTTTGATTTGTGT +ATCGTGACAATCTGCACCAGATGTTTATCACTTTCGAGGCGCATTTGTTGGCTGGAGGCA +TTACTGTCTGGCTCGAGGATATGTTGCGATAACCAGCGTACCAGCGCATGTTCACTTTCC +AGCTGCGTTCCGGCTTCTTGTAGCAGTTCGCTGATATGCAAGATATCGGTAAGACGCCGC +TCACCGCCTGCCGTTGCCAGCAAGTTTTCTGCAATGTTACGCGCCGACATCAGCGCCCGC +AGCATCGGCATAACGCCACGTTTGCGCCAGATTTGCCGATAACCATCGAACTCTTCGACG +ACCGCATCCCACGCATGTTCGTCATTATTCAGCGTTTCAATATCCAGCGCATTCAGCCCC +ATCATTGACGTTGCCAGCGCACTGCGCAGGGTGTTCTCACGTTCGGGCGTCATCACCGCC +TGCAACAGCCAAAGCATCTCCTGTGCTTCCAGAGTTTCAAAAACACTGTCGCGGTTCGAA +AGGTAAACGGAAGGGATTTCCAGCAGCGTTAAGGCATCGCGCACCTGAGCGGCCTCCTGG +CGGCTGCGCACCAGCACACTGATGTCCGAAGCACGCACCGGACGCGCATCGTCGCCGTTC 
+ATCAGCAACGCTTCGCCGCGTTGCCCGGCTTGTAGCCAGTCGCGGATTTGCGCAGCACAT +ACCTGCGCCATGGTACTTTGATAGTCGCCAACGCCGCAGCTTTCGCCTTCCATCAGCCAC +ATTTTCATCGCAGGCTGCGTTTCACCTTTAAATACAAAACGTAACGCCTGATTTTTGCCG +GCAGATTTCACAGGAATAAACGGTATTTCACGAAACATGAACGCGTCATCAGTCTGGCTG +AAAAGTTTGTTAACGCTGTTCACCATTCCCGGTGCGGAACGCCAGTTGGTATCTAAGGTG +TAGTGAGCATGAACTTCGCTACGCGCCTTCATATAAGTGAAGATATCCGCACCCCGGAAT +GCATATATGGCCTGTTTCGGGTCGCCAATCAGCAACAATGCGGTTTCCGGCTGATGGTGC +CAGATACGGCGAAAAATTCGATACTGTTGGGGGTCGGTATCCTGAAATTCATCGATCATT +GCCACCGGGAATCGCGTACGGATCGCCGCTGCCAATACCTCGCCGCTTTCACTACGCAGC +GCGGAATCGAGCCGACTTAACATGTCATCAAAACCCAATTCGCCACGGCGGCGTTTTTCA +CGCGCTACTGTTTCGCGGATCTCAGCCAATGCGCGAGTGATCACCAGATCGCGGATCGAC +AATGGTTCTGCAAGCAGTTGTTCGATCGCCTCAAACAGTGGATGTCGCGGGGTTTCCCCC +CCGGCTTTCGTGCGATCTTCTAAGAAACGCTGAGAGAATTTTTCCAGCGACTCCGGCAAC +TGATAGCTGTTGGTCTCTTCTTCTGCCCAGGCGCTGATCTTCTCGATCCATTTAGCCTGA +TTGCTACGGTTAAACTTGCGTCGATCAATACCAGAAGATTCGATCAGCGCATCCAGTTCA +CCCACTGCGTCGCGCCACTGCTGTTTTACGGCATCAATACGCGCCACAATTTGCGCGTGG +CGGGAAGCCAGCGTTTCATCATCGGGGGGCGGTGCTTTGATAACCGGCGCTTCGCCTTGC +AGATAACGATTAATATCGCGCAGCAACGCCTGCGGCCCTTTCCAGGTTTCAAAGACGACC +TGGGCAATTTCACGCGGCAGCGGGTAGCAGTGGCGACGCCAGAAATCGGCGCAGGCCTGG +TAGCGTAGCAGAGACTCATCTTCAATCAGCTGCTGCTCAAACAGCATGCCGGATTCAAAG +GCATTCAGGTTGAGCATGCGCTGGCAAAAGCCGTGAATAGTAAAGACTGCCGCTTCATCC +ATCTGCCGCTCGGCTAACAACAACCACTGCGCGGCTTGCGCTTTATCGTCGATCTCTTCC +AGCAGGCGTTTGTACAGTGGATTGTCGGTGGTTTCACGCAGACAGGCGATGCGCAACTCG +TGGATATTGCTACGGATACGACCACGCAATTCTGCCGTAGCAGCCTCGGTAAAGGTCACC +ACCAGCAGTTCTTCAACGGTCAGCGGGCGGGGAAAGGCGGCAGAACCGCCTAGTCCAAGT +AACAGGCGCAAATAGAGCGCCGCAATCGTAAAGGTTTTGCCTGTGCCGGCAGAGGCTTCA +ATCAGGCGCTCGCCCTGTAAGGGCAAGCGCAAAGGATCTAGTGTCTCGGCGACATCACTC +ATTCTTTTCACTCATCAGGGGCATTGTTTGCTGCAACGCGCTGACGTTCTCCCACACTTT +CCAGCCTTCAGGATGCACATATTCGGCTTTCCCGTTCTGGCTGCCGGAAATCTGCGACAG +AATAGCCATACCTTGCGGCTCGACCACCGCCTGATGGAAGAAATCAGCAAGTTTTTGCGG +CGTCAGCAGTTTTATCTGGGCCACGATTTTATCACGCGAATCGAAGCGCATATTGCCGCG +ATCGAAATCTTTACTTAACTTCGATGCTTCTTCGCCGAGCGTTTGCGGTGCCTGCAGCAT 
+CTGAGTAATTACCGCCTGCTGGATTTGCGCAAACTCCTCTGGCTTCATCGCCCGCAATTT +TGCCTCTGCGGTTGGGAAAAACGCCTTGTAACGCTCCCACAAGAATGAAGGCTGTTTATC +ATTGCTTTGCAAAAGGAAGCCCATGCCCCACTGACGCCCCACGCTCATTGGAAACGCAAA +CACGGCATAGCCCAACTGTTCTTCGGTACGCAACTGATTGTAGAACCACGGCTGTACGAT +CTGCCCCAACAGAGAGCTATAGGCTGAGCTGGTGTATTCATCGTAGCCAGTCGGTACAAA +TATCGCTGCCAGTGCGGAGTCGGTGCTGTTACCAGCTTTTTCAAAGATGACGGATTGTTT +TTTATCGACCACGACATCTTTGTTACGACACCACTCTGAACCATCAGCGCCCAACTGTTT +TTGCACATGGCGTGCCAGCGTTGTTGCCTGGGCTTCAGTCATGTTGCCGATAACCATAAA +CTCTGGTCTAGCCCCTGATTTTAAGGCGTCGCGATAGGCCAGCACCTCTTTCAACGTAAT +GGAGGGCAAAATTTTGCGCCGTTCATCTCGCGAGAAGTACGGCACTTGCGAGAGCATCTG +CGCGGGCATAATCGCCTGCTCAAACGCTTTGCCCTTTTCTGCGGAATCCATCATCTGGTT +ATACCAGGACTTCGCCTGCTCAAGCTGATCTTCCGTAGCGGTATAGCTAAAGTAGCCCTC +CAGCAGAGCCTGGAACAGCTGCGGCAGGCGCTGAGTGTAACCATTGGCATTAACCATAAG +GCCGTTGTTAGCATTGGTGGAAAAACTTATGCCACCAACCGACGCCTGGTTGCTTAACTG +ATCAAGCGCCAGCCCTGCGAGATAATCATTGAGCGCAAACATCACCTGATTGCGGGCGCT +GTCCATGGCTTTCGGATTACGCAAAATCAGGCTGACATCAGCTTTGGGCTCACTGGCAAA +ATAACGGCTTGGCGCATACACCACGCGCAGATTCGACTCATCAACAATCAACTCTGGATG +GTCGTATTTCTTCTCTGACTTAATCAGCGAGAAATCGTCAGGAATATAGGGGTTAAGCTC +CGGTAAGGAGAGCGCAATATTGGCGGCTTTTTTCTGCCAGTCCGCGAAAGTTTGTGCGCT +AATTTTATCGACCTGATACGGCGCATCGACAAAGTAAGCCGTTTTGTTGTGCGGCTCTTT +CGGGCTGATATACCAGATACGCGCATTCTGCGGCGTCATCATCGCCAGACGTTCTTTTAC +TGCTTTAGCATCGTACCGATCGGCAATATTGACTGCATCCAGTGTATGCTCAACAGGAAC +GCGAATCATGGTATCAGCCAGCCATTCGACGTAATCCATATCACGGGTGATTGACGGATA +ACGGAAGTCGATATCCAGCACATTCGCCAGTTCATCGAAGTATTGTTTATCGATCCCTTT +TTCACGTAACAGATTGAGGTAGCTAAAAATGGCCGCCACAACCTGATCGCGATTCGCCAG +ACCTTTATCGGTTAAAGACGCAGAGATCGCTAATACGCCGCTGTTGCCGTTGACGATAGG +ATCGGAATTGGCGCTAATGCCCTCAACTAATCCCTGCTTTTGCAGCCAGTCAGAAAGTGT +ACCAGGGCTGCGATTACCAATCAGATAGGTAATCAATTCATCCGTTTTACTACGGAACTT +CGCTGAATTGTTATCGATGCGAAACTCAACGCGCAGAACTTTACGCGGCAACGCCGGGAC +GTAATGAATGATAATGCCCTTTTGCGCGTCGGTGACTACCGGCACGGTGATTTCCGGTTT +TTTGCTCTCTTTGTTCGGCACGCGACCAAAGGTGTCCGCCGCCATTTTCGCCAACTCCGG +CAACGGTTTATTGCTGTAAATAACCGCCTTCATCAGATTGGCGGAATAGTACTTCTCGTG 
+GAAATCTTTCAGCGCCTGCTGTACCGGATTACCTGGTTTGTCGCTTAAAGTTTCGAGGTT +ACCACCAGAAAACTTTGAACCGGGGTGTGCCGGGTTAATGGTTTCTGCGCTGACCTGTGC +CATGCGCATCCCGTCACGCGTACGCGCCATGGTTAATTCGGCATTCACTGCATTACGTTC +ACGTTCGGCGTATTTCTTGTCGAGCAAGGGTTCTGCAATAGCATCGGCCAGGCGGTCTAC +CGCACCGGGCAAGGCGTCGTTCTCAACTTCCAGATAGAAAGCCGTGCGATACGGTGCCGT +GCTGGCATTGTGACTGCCGCCGTGCATTTTGAGATATTCGGCCAGACTGTCAGCCTGCGG +ATACTTTTTCGACCCCATCAGACTCATATGTTCAAGGTAATGTGCCAGCCCCTGGTACGC +CTCAGGATCTTCCAGCGACCCAACGGGCACCACCAGCGCCGAGAGCGATTTAACTGCCTG +CGGATCAGAAACCAGTAAGACCACCATACCGTTATCCAGACGTATAGCCTGATACTGGCG +GTTATCTTTATCACTTTTACGGATGGTTTCCTGAATCGGCTGCCATCCCGTTTCTGCCTG +ACTTAAGGGTGCCCAGAGGGCAACAAACAACAATAATGCTTTGAACCAGATGCTGCGGGG +CATTCACGGACCTCATAATCAACTTTATTTTCTGGCCAGATTCAACACGTTAACGCAAAT +CATCTGCCAGAATTTAATCTTGTGCTGCACGAGTCAGCCTATGTCTATATAACCATCAGT +CCGTGACTGGTGCGCATCATAAAGTAAGCGGATAGATTGCGCAATTTTTATACAATACTC +ATGACTGATTAAAGCGAAACAGCGGTAACAGGAAACGTTGCGACTGTTCAACGATAGCCT +CCATTGTCTCTGGTGTTAATTGCCGCCAGAGCCGTTGATACCAGATATCATCACCTTCGC +CACGCACCATCATGTTGCCTTCGTAAGCCTGAAGGAATTTCGTACGGGCTTTTTGCAACG +TGGAATCGTCATCCAGCATGGCATCGTTTTGCGCGTCATAACAGGTTTTTAGCCACGCGC +CGCCACTTTCAGGTAACACCAGCAATGGCGCGGACATTCCTTCACGATACCCCTCAATCA +GTTGTGAGAGGTAATGCAAAGCCTGTTCGGCTGCAAGCGGCGGAAAACGCCACTCGCCGT +CTTTGCGTAGAAAAAGGCGACTTTCACCATTACCACCGCTGGCACAGTAGACAAGGTGTT +CCAGCCAAAGTTGCATTCCCTGCGCCACACTTAATAAAGAGGGACACCAGCGCAACAGGC +CATCCGGCTGCACCTGCGGCAACCAGCCAGTTATCTGCACACCGTTGCAGGCGAGATCAA +TCTCCATACTCTGCCCTGGCTGGCGACAGGCAATGACTCTGTCGGCAAGCTGCTGCATCT +CCTGACACTGCGTTTCCCAGAAAATTTCACCAAAGGCACCATACGGCAAATCACCTGCCG +CCCGGAATCGGCGGAACAAGCGTTCGGCATCATCCTGCTCAACCAGTACATTTAATAACT +GCTGGTTGATTTGATAACGACTAAGCCCTTCAAGAATAAAAGGTTCAGTGTCGGGAATTT +CGCTGTCTTCGGTACGGAAGTTCACCTGCAAACGCATCTGGAAAAACGCCCGCACCGGAT +GTGCCCAGAATCGTTGTAGCGTTTCCAGCGGCACGGTTTCCGGTAAGGTAAATGGCAGCG +GCTGAACAAATTCAGAATGTGCTTTACCAGCCTGGCTGGCCGCAGGTAGCCACTCGCGCG +CATAGCTTTGTAAGTTACCGGGCTGGTAGTTTTGCGGGTCAAACGGCATCCGGGTATGGT +GGCAAGTAAGATGCGCTTTTACCCTTGCCTCGCTTTCATCACAGTTAAGCGCTTCATCGC 
+CCGGTAGATAATGGCTTTGCCCGATGTAGTCGATCAGTTCCTGCACCAGTACCGACGGGA +AACGTTCACTGTTATCCTGAATGGAACGCCCAATATAGCTGATATAGAGTTTTTGCTGCG +CGGAAATTAACGCTTCCAGGAACAGATAGCGGTCGTCATCGCGACGGCTACGGTCGCCAC +GCTTCGGTTTCTGGCTCATCAGATCAAAGCCCAATGGCGCAAGCTGACGTGGATAAACGC +CGTCGTTCATTCCCAGCAGGCAAACCACTTTGAACGGAATTGAACGCATTGGCATCAGAG +TACAAATGTTAACCGGTCCGGCGAGAAAACGCTGGCTGATACGTTCTTGATCCAGGCGCA +GTGCCAGTTCATCACGCAATAGTGACAGCGGCACCGCGTCGCCATACTGCGCGCCTAAAC +CTTCGGAGATAATCGCCTGCCATTGTTGTTCGATCAGCGTCATCGCCGCTTCGGTTTCCG +CATCCGGCAGGAAAAAGGCGTTGAGCATATCGCGACAAACCGGCAACCACTCTTCCAGCG +GACGCTCCTGCGCCAGCCCGCGACGCCAGATATTTAGCTGCATTAGCAGTGAAGCCAGAT +GCCCCACCAGTTCTGCAATTAAGCCGCTCGATTCATCATAAGGTAGAACCGATTGCCACT +CGCCCTGCGCGCTCTCCATCGCGTAGCCCAGCAACATGCGCGTCAGGCCAAACCGCCAGG +TGTGTTGACCGGTAGCGGGAAGTTCCAGCTCGCGAACGTTGTCGTCATCTATCCCCCAAC +GAATGCCGGATTCGTTGACCCACTGACGTAAATAACGCAGCCCTTCTTCGGTGATGTCAA +ACCGCGCTGCCAGCACCGGCACATCCAGTAATGCCAGCACGTCTTCCGACACAAAGCGGC +TGTCTGGCAGCGATAACAGGCTGATAAACGCTTCAAGTACAGGATGCGACTGCCGCGCCC +GACGGTCGGAAATGGCGTAAGGCAGGTAACGATCCGCAGGTGCACTACCAAACACAGCCT +GAATAAACGGACTGTAGCTGTCGATATCAGCCACCATCACGATGATGTCGCGCGGAGTAA +GTGTCGGGTCTTCCTCCAGCATCGCCAGCAGGCGATCGTGTAAAACTTCAACTTCACGCT +GCGGGCTATGGCAAACGTGGAAGGTGATACTGCTATCCAGTGGATCAAGCGGGCGTTTGT +TATCGCTACGGGAAAACTCTTCGATGTTCACACCAGCAACGGCGCGGTTTTCCAGTTCCA +GAATGTCAGACTGAATATTATGCAGCAGGTTATCTGGCGTCACATCGACAAAAGCGTCCA +GCTCCTGGCTGCTCTCCAGGTCAGAAAGGAGATAAATGTAGTCGCGCCCAAGCTTGCCCC +ATGAAGCCAGCAGCGGGTTGCCGACATCCTGTTCACCATCGCTGTTAAAGAGCTGCCCGG +CATTTTCGCTGTCGCGAAATAGCGGTAATTCGCGATCTTCAAAACTGTGTCGGCGCTGGC +GAGTCAGTAGTTTCGCCAGATAAGCTGGATCTTTAATGTCGCCCCAGTAATAACGGCAGG +GGTTGGTAAACAGGAGATGGATTTCAATATGTTTACCCAGCGCCTGTAGCGCCTGGAGAT +AAACAGGCGGTAACGCGGAAATACCGCATATAAAGACGCGCGAAGGTAACCCCGGCGGGC +AGGTCGTCGCGGACTCCAGCGTTTCGATAAAGCGCTGATAGAGATTGGCGCGGTGCCAGC +GCGGTTGCCCAAGTTCGTCGGTATATTCCACCAACGCCTTCCACAACGGCGCTTGCCAGG +CCTGTGCTTCTCCCAACCCTTCTACCAGATGTCCTGTTTCCCACTGTGCCAGCCAGTCCG +GACGATAGACCAGATACTGGTCAAACAGGTCCGCCGCTTTTGAAGAAAGCTGGAACAGTT 
+TTCGCTTGTCACTATCGTCAGTCAGATAATGCCGCAACAGGGTAAAGTCTTCGCGCTCCA +ACAGTTGCGGCAGCAGAGTCATCAGTTTCCAGCTCATGCTCTGTTTGTTAAAGGCGCTCT +CTTTGGGGATCTCCGGTAACACCCGGACGAACATATCCCAGATAAAGCTCGCTGGCAGCG +GAAAATCAATGTTTGCCGCAATACCAAACTTTTGCGACAGGGTCATTTGCAGCCACTGTG +CCATACCGGTACTTTGCACCAGAATCATCTCTGGTTCGAAAGGATCGTCCAGCCGTTCGC +GTTCGACAATAAACTCCATCAACGCTTCCAGCACGTCCAGACGATTGGAATGGTAGACCC +TTAACATAGCGGCTCCTGACTACTGACGATTCGGGCAATGCAGGCGGGTCATCTCGCCTT +CTCTGCCCCCGGGTGAAACTAGCGTAACGCTGATGCTGACACATCCCGCCTGCGATGTCT +GCATTCGGTTGACCTGCCAGTTAGCAGGTGGCGAAATCGCGCGCAGTTGCGTTTGCTGCC +AGCCATGCCGCCAGAGCTGTTGGTACTGGTTTCTGCTGGCAAGACTGTTCATTAATGTTC +GCTGGAAACCCGATAACGCAGTGACAATCATCACCATCAACACCATCGCCAACATTACCT +CCGGCAGACTAAAGCCTTGTTGATTCCTCAGGGAAGCTGACATAACGCCCTCTCTTTCAG +CGGACAAAAATCGCTCCAGCCGCGTGGCGAAAAAACAATGTTTCCATCGATGACTTCGCC +TGTTCGCCACAACGAAACGCCTTCATAACCAGCAATCAATAAGGCTTCATTATCTGCCAG +TAAACGCAGACAAACCCGGGCACCGGTGGCAGCATACAGTAAGCACTGAACTGCGGGCTG +CGTCTGCCAGGAGTGCATTTTTCCCCACTCCAGCGCCGACTGAACGATGGCCTGGCGGCT +CAATGACTGACTTTCCATGCTCACGCGAGAAGCAAAACTGCGATCCTGCTGACTCATTCC +TTGCAATAGCAAGCTACCCAAAATCAGCAGCATCAGGACCAGAGCCAGTGACGAAACTCC +CTTTTCGCGGTTCACAGGTTGGCTCCTGTCACGCTATAGCTGGCATCCACCACGGTTTGC +GGATCAGCCTTGCTGGCAGCGTGTATATTAACCGTCAACACCGGCGAGAAGCCGCTGACA +TCCTGACGTACGACCTGAAAAGTGTCGATAATGATGGCATCCGGATTAGTGACTTTATCC +CAGCCCTTACCTTCACAGGATGTCGCACCGCGTAGCGTTTCCAGCACATGCTCCTTCAGA +CGAAATCCAATCTGGTCGGACTCTTTTACCGGTTCGCGATCCCAGATACCGTTACTGTTC +GCATCCCACTGCACAATGACACAGTCACCCTGTCCGACAATTTCCAGCCCTTCGCCCGTA +CAGCTGCCATGGCAATAACCCGCCCTCTGGAGATGCTTCGCGACGGTAAATACCCGCAGC +CAGATTTCATCTTCCAGCGCCAGTTTACGGGTGCTCGTTAAACTTTCACGCTGTAACGCA +GGCAGAAAGCGTGCAGCCCCCAGCAACAATACGCTACTGATCGCCATAGCAATCAACACT +TCCAGCAGAGAAAAACCTTGCTCTTTTACAGGCATCCTTCTGTTTCTCCTTGCTGACAAA +GCCGGAGTCTTCCCCACGGCGAAACCACTAGCCACCACTCGCCCGTTGAGTTTTTGAAGC +GAATATGCCCGGCCCATGCGGTATTGCGCAGGCCAAAGAAAGCAAGCGAAGGTGTCAGGT +CGCTCATTTCGACTTCGGGCCAGCGCGGCACAAAGACCAATGGTGAACTGCCATGACAGG +TATTCGCCCCAGCAACGGAACTGCCATGACAGGTATTCGCCCCAGCAACGGAACTCACAA 
+GGCACCATAACGTCCCCTCCCTGATAAGACTGATACTGTGGTCGCGGTTATGCCAGTTGG +CATCTTCACGTAAATAGAGCAAATAGTCCCGCGCCTGGCTGGCGGTTTGCCAAAGCCGTT +GCGACTGCTGCCAGTATTGCCAGCCATAGAGCCCACTTGCGCTTAGCATGACCAGAATAA +GCATCGCGACCAGCGTTTCAATCAGCGTATAACCACGTTGTGTTTTCATGCCGGCAGTAT +GGAGCGAGGAGAAAAAAAGACGAGGGCCAGTTTCTATTTCTTCGGCGCATCTTCCGGACT +ATTTACGCCGTTGCAGGACGTTGCAAAATTTCGGGAAGGTGTCTCGAAGAATTTAACGGA +GGGCAAAAAAAACCGACGCACACTGGCGTCGGCTCTGGCAGGATGTTTCGTAATTAGATA +GCCACCGGCGCTTTAATGCCCGGATGTGGATCGTATCCTTCAATCTCAAAGTCTTCGAAA +CGGTAGTCGAAGATGGATTCGGGTTTACGTTTGATAATCAACTTCGGCAGCGGACGCGGT +TCGCGGCTTAATTGCAGATGAGTTTGATCCATATGGTTGCTGTAGAGATGCGTGTCGCCA +CCGGTCCAGACAAAATCACCCACTTCCAGATCGCACTGCTGCGCCATCATATGCACCAGT +AACGCGTAGCTGGCAATGTTGAACGGCAGGCCGAGGAAGACGTCACAGGAGCGCTGATAA +AGCTGGCAAGAGAGTTTGCCGTCTGCCACATAGAACTGGAAGAATGCATGGCACGGTGCC +AGCGCCATTTTATCCAGTTCGCCTACGTTCCACGCTGAAACAATAATGCGGCGGGAATCC +GGGTCGTTTTTCAGCTGGTTCAGTACCGTAGTGATCTGGTCAATATGACGACCATCCGGC +GTTGGCCAGGCGCGCCACTGTTTACCATACACTGGCCCGAGGTCGCCGTTTTCATCGGCC +CATTCGTCCCAGATGGTGACATTGTTTTCGTGTAGATAAGCAATGTTAGTGTCGCCCTGC +AGGAACCACAGCAGTTCGTGGATGATGGAACGCAGGTGGCAACGTTTAGTTGTCACCAGC +GGGAATCCATCCTGCAGGTTAAAACGCATCTGATGACCAAAAATGGAAAGCGTTCCGGTT +CCGGTACGGTCGTTTTTCTGTGTGCCTTCGTCGAGCACTTTTTGCATCAGTTCTAAATAC +TGTTTCATGGTTCCTCAGGAAACGTGTTGCTGTGGGCTGCGACGATATGCCCAGACCATC +ATGATCACACCCGCGACAATCATCGGGATGGAAAGAATTTGCCCCATGCTGATGTACTGC +ACCCAGGCACCAGTAAACTGCGCGTCGGGCTGGCGGAAAAACTCAACAATGATGCGAAAC +GCGCCGTAACCAATCAGGAACAAGCCTGAGACAGCTCCCATTGGGCGCGGTTTACGAATA +TACAGGTTGAGGATAATAAACAGCACCACACCTTCCAGCAGCAGCTCGTAAAGCTGTGAT +GGGTGGCGCGGCAGCACACCGTAAGTGTCGAAAATGGATTGCCACTGCGGGTTGGTTTGC +AGCAGCAAAATATCTTCTGTACGGGAGCCAGGGAACAGCATGGCAAACGGGAAGTTCGGG +TCAACGCGGCCCCACAATTCACCGTTAATAAAGTTGCCCAGACGCCCGGCACCAAGACCA +AACGGAATGAGTGGGGCAATAAAATCAGAGACCTGGAAGAAGGAACGTTTAGTACGGCGG +GCGAAGATAATCATCACCACGATAACGCCAATCAGGCCGCCGTGGAAGGACATGCCGCCG +TCCCATACACGGAAAAGATACAGCGGATCGGCCATAAACTGCGGGAAATTGTAGAACAGA +ACATAACCAATACGTCCACCGAGGAAGACGCCGAGGAAGCCCGCATAGAGTAAGTTTTCA 
+ACTTCATTTTTGGTCCAGCCACTGCCCGGACGATTCGCCCGTCGTGTTGCCAGCCACATT +GCAAAAATGAAACCCACCAGATACATCAGGCCGTACCAGTGAAGCGCCACGGGTCCTATT +GAGAAAATGACCGGATCAAACTCCGGAAAATGCAGATAGCTACTGGTCATCTGTCACCAC +AAGTTCTTGTTATTTCGCTGAAAGAGAACAGCGATTGAAATGCGCGCCGCAGGTTTCAGG +CGCTCCAAAGGTGCGAATAATAGCACAAGGGGACCTGGCTGGTTGCCGGATACCGTTAAA +AGATATGTATATGATCCGCGCTATAACCCCCCGCGAATCAACCCGCCCATGCCGCGACGC +TCCATAAAGGCTGCAACCTGATGGCGAACTTCGGTCGCCAGTTGCGCTTCCAGACTACGC +TGCGCAAGATTTTCTGCTTCAGCAAAATCAATGCGCCGCAGCAGGTATTTTACGCGCGCT +ACAGAACGTCCGTTCATAGACAGATGGCGATACCCAAGCCCAATGAGGATTGCCACGCAC +ATCGGATCGCCCGCCATTTCACCGCACAAACGGAGATCGATTCCATGTATTTCCGCTTCC +CGGGCGATCATCGCCAGAGCTCGTAACATTGCAGGATGAAGACTGTCATAAATGTTCGCC +ACCCGGGTATTGTTGCGATCAACGGCCAGGATGTATTGAGTCAGATCGTTGGTGCCAACA +GAGATGAAATCGACCCGCTTTGCCAGATGCGGCAGCATAAATACCATTGACGGCACTTCC +AGCATGATGCCGATACGTGGTTTGGGAATTTCGTAACCGATCATCTCCTCGACTTCACGT +CCGGCACGTTCAATCAGGCGGCGTGCTTCGTCAACTTCATCGAGGCTTGTGACCATCGGC +AACAGAATATTCAGGTTGCCCGTAGCGGCATTAGCACGCAGCATCGCCCGCACCTGGATC +AAGAAGATCTCCGGCTGATCGAGCGTAATGCGAATCCCACGCCAACCCAGGCATGGATTC +TCTTCGCTGATCGGCATGTAAGGCAGCTGCTTATCTGCTCCGACATCCAGCGTACGCAAG +GTGACGGGTTTATCATTAAACATTTGCAGCATCCCCTGATACTGCGCCACCTGTTCTTCT +TCCGACGGAAAACCACTTTGCAGCATGAATGGGATTTCAGTGCGATAAAGTCCTATGCCA +TCAATACGGCTGCCCAGTTTTTCTTCATGTTCCGGGCTTAAACCGGCATTGAGCATGACT +TTAATGCGTTCGCCGCTTTTTAACTGGGCGGGTAAATTGACGTCATCTTCCGCCAGACGG +CTAAGCTCGATCTCTTCACTAATTAGCCGCTGATATTCTTGCAGCAGTACCGGTTCCGGA +TCGACCAGCAATTCACCGCGATAACCATCGACGATCAGCGTCCGACGATGCAGTACCGAA +GGCTGAATATCCGCGCCCATCACGGTAGGTATCCCCAGCGCACGTACCATGATCGCAGCA +TGGGAGTTGGCAGCGCCATCGCGCACGACAACACCGACTAAGCGATCCTGGGGCAGCTCA +GCAAGCGTTGTCGCTGACAGTTCATCTGCCACCAGAATGAAACGTTCCGGCCAGGCGTTC +GGCCCTTGATTAGCGTCATCAAGATGAAACAGCAATCGCTGACCCAGCGCACGTAAATCG +CCAGCCCGCTCTTTGAGATAGTTATCGCTTAGCGCGGCAAACTGTTCGGCAAATTTTTCA +ATGACCGTTTTTACCGCCCACTCTGCCACCGAGCCTTTATCAACCTCGGCAAACAATTCG +CGACGCAGCCGGGTATCCGAAAGCAGGTGTGAGTAAAGATCGAAAATAGCCGCCGTTTCT +TTTTGTGCACCGGCAGCAAAGCGTTTGCTATAGCGGCGAAACTCGTTAGCCGCCTCTTCC 
+AACGCCCCGGTCAGTCGTTCGCGTTCCAGAGCCGGATCCAGCGTTGATGCCTGATACACC +TGTTCCATTAAAGGTAACGTGGCATCCTGCCAGCCTTCGGCAATCGCCACACCAGGTGCT +GCCGGTAATGCACGGATTCGCGTCTGGCGATATTGCCCAAACAAGGCAGTCAACTGCGAC +TGAGAAAGAATAGCTGCCATCTGGGTGGCAAGCGTCACCAGGAAGGATTCTTCACTTTCG +TCATACTGGCGCAACTCTCGTTGCTGTACCACCAGTACACCAAGCAACTGGCGACGTTGA +ATAATTGGTACGCCTAAAAACGCGCGGAAACGTTCTTCTTTTACGGAGGGGATGTATTTG +AAGCTGGGGTGCTTTTGCGCATCTGCAAGGTTTATCGGTTCCGCCAGCCTGCCAACCAGG +CCGACGATCCCTTCATCAAACGCGAGCGTTACAGTGCGACCGCGTGGTTTTTTCAGTCCC +CGGGTCGCCATCAGGTAGTAACAACGTCGATCATGATCGGCCAGGTAGACCGAACAGACC +TCGGTATCCATCGCAAGACAGATGTCGGTAACCAGAATATTTAACGCCTCATTCAGGCGT +GGTGCGCTGGCTACCTTTTCGACTATTTCGCGCAGGCGAGTGAGCATAATTGGCGTGACT +TAACCTCTTTTACGTCGATAAGCAGATGCGTTTTGTGGTTTTGGCGTATTTTCCTGCAGT +GACATCACCACACTCGCGAACTCTTTCATTACCCTACGGTAGACATCACGTTTAAATGAC +ACCACCTGTCTGACTGGATACCAGTAACTTACCCATCGCCAGCCGTCAAACTCTGGTGTA +CTGCTGGTTTGCATATTGATTTCTGCATCGCCGCTCACCAGCTGCAAGAGAAACCATTTT +TGTTTTTGGCCGATACAAACCGGCTTCGTGTCCCAACGCACCAAACGTTTCGGTAATTTG +TAGCGCAACCAGTTACGCGTTGAAGCAAGGATTCGAACGTCTTTGCGGCTTAATCCTACT +TCTTCAAACAATTCACGGTACATCGCCTGCTCTGCGGATTCTCCGGGGTTGATTCCGCCT +TGCGGAAATTGCCAGGAGTGCTGACCAAATCGCCGGGCCCACATTACCTGCCCCTGGCGA +TTACAAATCACGATACCTACGTTTGGGCGGTAGCCATCGTCATCAATCACCGGACTACCT +CAAAATAAAGCTTTATATACGAATGATTGTTTCATACTCCAGGAAGACGGTAAACCACTC +TCTGCAGGGCATTACACACTAATAACAATTGAATAACTCACAGTTATGTGCAGAGTTATA +AACAGAGGAAGGGGTGGATAGCCGTTTTTATTCACCTTTTCTGTGGATAGAGTTGTGAAG +AACTACGGAATTACTGCGGGAAAACCCGGAGCATTCTGAATAAGACAGATATAGAGATTT +TAAAATATTCATTATCAGTCAATGCATTACATGTGATTTGAGTAATAAAAAAGAGTAATT +CGTGACCCAGGTCACACCTCTCATTTACGGGTTGGCGAAAGATCAACCAATGCCGTATTT +ATCCACAGAATGTGCCACTAAGTTAAGCACTGAACCACTAAAAACTGGAGTTTCGTCGCA +CGTCAAGGCTGTAAATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGT +GGATAACATGGTGTAAGATCCTGTTTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCA +GTGTTGCGCAACTCGATTACCGGAAACCTAAAAAGCAATATAAATCAGAGAATTGAACAA +CGCATGTGGAAAAAGTTACACTGCGAATATTCGGCACATAATTGCTGTTTGTTTTTTAAC +CAAGGTATCATGACATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAAC 
+AATTGTTAGCGCAAGCACAACAACTTTCTGGTTATACATTGGGAGAACTGGCGGCACTTG +CCGGGCTGGTTACGCCGGAGAATTTAAAACGCGATAAGGGCTGGATTGGCGTGTTACTGG +AGATCTGGCTAGGTGCCAGCGCAGGGAGTAAACCTGAGCAAGATTTTGCTGCTCTGGGCG +TGGAACTTAAAACTATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACATTCGTTT +GTGTTGCCCCGTTAACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACA +AGCTCAAACGCGTGCTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGC +GTCGCGTAGGATCACCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCG +AAGACTGGGAAGAATTAATGGATATGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTC +GGCACGGGGAATATTTACAGATACGACCGAAAGCAGCGAATGCGAAAGCGCTGACCGAAG +CTATTGGTGCCCGGGGCGAACGGATTCTGACGCTGCCGCGCGGATTTTATTTGAAGAAGA +ATTTCACCAGTGCGCTACTGGCCCGTCATTTTCTGATCCAGTAGCCATCGCTTTGACCTG +CCGCTTTCCGGGCATATAATTACCGCTTCATTTTTTTGGCAGGGCTTTTTAGATGTTATT +TGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTGCTGGAGAT +CGTTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTTCCCACAGC +ACAACGTGCTCATGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGTCTGGCGCT +GCTGGCATCCATCGCCTGGGTTACGCGCCTGACGAATCCGCTTTTTACAATATTCAGTCA +GGAAATTTCCGCCCGTGATTTGATTCTGCTTCTGGGTGGCTTGTTCCTTATCTGGAAAGC +CAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGGGCTGAAAACACGCGTTTC +ATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGCCTCGACTC +GGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCCGTGGTAAT +TGCCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAGCGCCATCC +TTCGGTAAAAATGCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTGATTCTGGA +AAGTTTCGACATCCACGTACCGAAAGGTTACATCTACTTCGCGATGTTCTTCTCTATTGC +GGTTGAAAGCCTCAACCTGATTCGCAACAAAAAGAATCCGCTCTGATACTCCGTACGCTC +TCCTGCGGGAGGGCGTACTCACTCCTGTTACCCTCACAGTTTAAGATTTTCCTGCTTTCA +AGATATATAACGTCGGTTTATAAACAGACTATTATCATAGGTGGGCCAAATGAGGATAAC +CGGATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGG +TGTTCCAGTGATTACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAA +CCTGAAATTGATGATGATACCGGGCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATG +CAAATTAACCGTGATGATGTTTCGCAAATTATTGAACGTTAACAAATAAGGTCAGCATCC +GGCTGGCCTTAAGATTTTTCTCTTTCCCTTTTCCCTTCCCTCTGCCATTTTTATATTCCT +TATGTCGTGATTATAAAAAGGAAACGGCTATGCAATATCACCGTATACCCCACAGTTCGC 
+TGGAAGTCAGCACGCTGGGGCTTGGCACGATGACGTTTGGTGAACAGAACAGCGAAGCCG +ACGCCCACGCACAACTCGACTATGCCGTCGCTCAGGGCATTAACCTTATCGACGTTGCCG +AAATGTACCCAGTACCTCCGCGCCCCGAAACTCAAGGGCTAACCGAAACCTACGTCGGCA +ACTGGCTGGCGAAACATGGCAGCCGCGAAAAGTTAATTATCGCCTCCAAAGTGAGCGGAC +CGTCGCGCAATAATGACAAAGGCATCCGCCCGGATCAGGCGCTGGATCGGAAGAATATCC +GCGAAGCGCTGCATGACAGCCTCAAGCGTCTGCAGACTGATTACCTCGATCTTTATCAGG +TGCACTGGCCGCAGCGCCCAACCAACTGCTTCGGCAAACTCGGTTATAGCTGGACAGATT +CTGCGCCTGCGGTTTCGCTGCTGGATACACTGGACGCACTGGCAGAGTACCAACGCGCGG +GAAAAATTCGTTATATCGGCGTGTCGAACGAAACTGCATTTGGCGTAATGCGCTACCTGC +ATCTGGCGGACAAACACGATCTGCCGCGTATTGTCACCATTCAGAACCCCTACAGTCTGT +TAAACCGCAGTTTTGAAGTAGGTCTGGCAGAAGTCAGCCAGTATGAAGGGGTCGAACTGC +TGGCCTATTCGTGCCTGGGTTTCGGCACGCTGACCGGGAAATATCTCAACGGTGCAAAAC +CCGCTGGCGCACGTAATACGCTCTTTAGTCGGTTCACCCGCTATAGCGGTGAGCAAACGC +AAAAAGCCGTCGCGGCGTATGTTGATATAGCCAGACGTCATGGCCTGGATCCTGCACAGA +TGGCGCTCGCTTTTGTACGCCGTCAACCGTTTGTTGCCAGCACTCTGCTGGGCGCAACCA +CGATGGAGCAGCTGAAAACTAACGTCGAAAGTTTGCATCTGGAGTTAAGCGAAGACGTGT +TGGCAGAAATTGAAGCGGTGCATCAGGTTTACACTTATCCGGCACCATAAGATTAACGCC +GGTTAAAACCGGCGTTAAATATTAATGACGGCGCTGCCAGATCCACAGCGCCGTTATTGC +CAGCGCAAACAGCGCACCGAAGCCAATGCCAATGGGCACGACCGGGATGCCTACCATTAC +CGCCAGCGAGTAAATGCCCAGCATCAACAACATGGCGCTGTTTTCGCCAAGGTTTTGTAC +TGCAATCGCATTCCCCGCCCCGACGCTTTTTTTGCCCCGCTCCTGTAGCAACGCATTGAG +CGGAACGACAAAAAAGCCCCCCAGCACGCCAATCAGCATCAACAAAGCATAGGCTGGCAG +CAGCTCGTGTTGCAGGGAGAAAATCAGTACCACCACGCCAATCAAAATCCCGGCTGGCAT +ACAGCGTGACACGGTTTCCAGCGTAACTAACTTCGCTGCCGCACCTGCACCAACCACGAT +ACCAATCGCTACCATCGCGTTGAGATAGGTCGGCGTAGCGTTATCGGTAATACCCAGCGC +CACCGGTACCCACAGCACCAACAGGAAACGCAGCGTGACACCCGCTCCCCAGAATAAACT +GGTGCCCACCAGCGAAAAACGCGTTTCACCATTGCGCCATAGCGAGGTGCAGGCATTCAG +GAAACTGCGGGTCATGCTGATGAGATTCCAGGACTGCCCCGGACGCGCCGCCGCCAGTTT +GGGAATGTAGATATTGGCAACGACCGCGCCACCGTAGGCCAGTGCGCATGCGACCAGGGC +AACCAGAATATGCCAGTCAGCCAGAACACCACCAGCTACGGAACCGAGCAAAATCGCCGC +TATGGTAGACGCTTCCATTAAACCGTTAGCTTTTACTAACTTACTACCCGTGGTTAATTC +GCCGAGAATACCGTATTTCGCCGGTGAATAGGCTGCAGCACCAACACCCACCAACGTATA 
+GCCGAGAAACGGATTGATACCAAAGCAGATACTGGCTGCGCCCAGTAGCTTCAGGCCGTT +GGCAAACATCATCACCCGGCCTTTGGCGAAGCTATCCGCCACCTGCCCGACAAACGGCGC +AAAAAGAATGTAAGCACCTACAAACACCATTTGCAGGATGGGCTGGCTCCACTCCGGATA +GAACTGCGCTTTCAGTAACGCCAGAGTGGCAAACAGTAGCGCATTATCGCCAAACGCAGA +GAGAAACTGCGCCACGATAACCGCTTTCATCCCCTTCGACCACAACGAAGTGTTAGTGTG +CACTGACTCACTCATCGTGTTGTTCCGCTTCGTCTACCCAGCTTTTCAAAGTGACAAAGT +CAGGTTTGCCGCTGCCAAGTAATGGCATCTGTTTCAGATAGCGAATATCGCGCGGTACAG +CAAGCTCCGGCACGCCGTGCTCGCGGGCATACTGTTGTAACTTATCGCGCGTCAGTTCGT +TATCTGTGGTGAAAAGCACCAGTGCCTCGCCTTTGCTGGCATCGCTCTTAATCGCAGTGG +CATGGACTTTATCTGGCGAAACACCAAGTGCCAGTTGTTCCACCATTTCCAGCGACACCA +TTTCGCCTGCAATTTTGGCAAAGCGTTTTGCGCGGCCCTGAATCTGCACAAAGCCCTGCT +CGTCAAAACGCACAATATCGCCAGTGTCATACCAGTCGCGCTCCATTTCGCCGCGAATAT +TCTCGGCGGTGGGCACTTCCAGTACACCAGGCTTCTCCACCCGCAGATAGCCGTTCATTA +TGTTCGGCCCTTTCAGTTGCAGGCGTCCGCCCTCTTCGATACCAGGAACCGACAACAGGC +GCGCATCCATTCCTGGTAGAATACGCCCTACCGTACCGGGTTTCGCCGCCATCGGTACGT +TGATAGAAACGACAGGCGCGCATTCGGTCACACCGTAGCCTTCAAGGATGCGCAGGCCAA +ATTTATCCTGCCAAAGCTGTTTAGTACTTTCTTGTAGTTTTTCTGCGCCTGCCACCACAT +AGCGTAGACGATAGAAGTCATACGGGTTGGCGAAACGCGCGTAGTGACCGAGGAAAGTGG +AGGTACCGAACAACACGGTGCAACTGCGGTCATACACCAACTCCGGCACAATACGGTAGT +GCAGCGGGCTTGGATAAAGGAACACTTCTGCACCTGTGAGCAGTGGCGTAAACAGGCCTA +CCGTCAGCCCAAAGGAGTGAAACAGCGGTAACGCCGACATAAAGCGATCGTTGGTGGTGA +AGTCGGCAATCGTTTTAATCTGCTCGACATTCGCCAGAATGCTTTTATGGCTATGGACGA +CGCCTTTCGGATGGCCTTCAGAACCGGAGGTAAAAAGGATCAGCGCCTCTTCTTCCGGCT +GCTGTTTAACCTGTGCCAGACGCGGCATCAGCAAATGAGCGAAGATCCATACTTTGTCGG +CAGTGGTGACATCTGCTTTTAAATCTTCCAGATAGACCCAGCGCACCTGAGTAAGTTGCT +CCGGCAGATGCCAGAGTTTGCCTTTATCGAGAAACTGACGGGAAGTGAAAATGGTTTTGA +TTTCAGCCGCCGTAATAGCACTGGTCAACCCTTTTACCCCGGCGGTGTAGTTCATCATTG +CGGGAATGCGGCGACGGGCGATGGCCCCAAAAATCACTGCAGCACTGATGCCTGCATTGG +GCAGCATTAAGCCGATGCGTTCGCCTTCAACACTGTATTTTTCAAGGATGCGTCCAACAA +ACAGCGTTTTCGTAAGCAATTTGCGATAGGAGTCCGGGGTAAAGTTAACGTCTTCGACAC +ATTTCTTCCCGGCTCCGAAGCGGTACATTGCGCTCAGTAAAGATTCGTACAGCGTTTCAC +GCGGGCGCACCGCCATACGCGCTTCCATCATTATTTGATGCAGCATTTCGCCAGCGATTT 
+TGCGACGGTCACGGGCACGCGGCGCATCCGGCATCTCCACCTGCGTTGGTGGCAAAATAT +GCAGAGTAATTTGCGGGAACAAGCGACGTTTAACCAGACCTTTCAGGCGGCTGAAGTGCG +TAAGTTCCGCCCCTTCAATACGCACAGGAATAACCGTTGCACCAGACTTCGCCGCGACAA +ATCCCGCGCCATCGTAGATTTTCATCAGCGAGCCAGTGGTGGTGATGCGTCCTTCAGGGA +AAATCACCACTGGTCGGCCCTGTTCCACCAGACGTACCAGATGTTTAATCGCCATAGGTT +GCGTCGGGTCGAGAGGAACAAAGTCGATAAATGATTTCAGCCAACGCATATACCACTGTT +GGCTTATTGAGGTGTAAACGGCAAATACCGGACGTACGGGTAAAAACAATGCCAGCAGTA +TGCCATCAATAAAAGAGACGTGATTAGGCGTAATTAGAACGCGCTCGCCCTTCAGTGCCT +TGGTGTCACCCGTAACGCGAACGCGATACAAAACACGGCACAAATTTCGAAAAAAGCTAA +AAAGCATTCCAACTCCCTTTGCTCTGATTCAGTAAAAGCGAATGGAGGGAGATTACACGA +GATAAAGAACGCGAGCGACAGTAAATTAGGTGCGAAAAAAAACCTGCGCATCCGCGCAGG +TTGGTGCAAGAGACTGGGTACGAAGAGCGTACCGAATAATCTCACCAATCAATACCTCTG +GGATCTTGATTGTGGTCTGCACAACGACTCTTCGCCAGCGAGAAAACGCAAAGGAATGAA +GGGAAATGCAACGAGGTGTGTAAATTGTCGGTTACTGTTACAGATTGATGACCGGCAAAA +AAAAACCTGCGCATCTGCGCAGGCTGGTGTAATTCATGTGCTCAACCCGAAGTTGACTTC +ACCTATCAATACCTCTGGGATCACCACTTTAGCAACCTGAAGCCAAACGCCACCAGCGGT +CAATCGCAACAGCGTTTCGCAAAGTGTAACCAAAGGTTTGCAATCTCTTTTTTTGTCTTA +CTTATTTGCGTTTGGCTCACATTCCCACAATGAAAACACGCCGCCCCTTGAACCAACGGG +CGTTTTCCGTAACACTGAAAGAATGTAAGCGTTTACCCACTAAGGTATTTTCATGGCGAC +CATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGCGTCATTAA +TAATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATGGAGTCTCT +TAGCTATCACCCGAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAAACGATCGG +TCTGGTCGTTGGTGATGTTTCCGATCCGTTTTTCGGCGCAATGGTGAAAGCGGTCGAACA +GGTGGCTTATCACACTGGTAATTTTTTATTGATTGGCAACGGTTACCACAACGAACAAAA +AGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGCTGCGCTGGTTGTCCATGC +CAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGTATGGTGCT +GATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGATCGTTACGG +TGCCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGTTATCTGTG +CTCTAACCACTCTATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGATGCCCTTGC +TGAAAGTGGTATTCCGGCCAATGACCGGCTGGTGACATTTGGCGAACCAGACGAAAGCGG +CGGCGAACAGGCAATGACCGAGCTTTTGGGACGAGGCAGAAATTTCACTGCGGTAGCCTG +TTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAATGATAATGGTATTGATGT 
+ACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTATGTGCGTCC +GCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCCGAACTGGC +TTTGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGTCCGACGCT +GGTACGTCGCCATTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCAACCAGCGA +CTAACCGCAGTTAAAGCAATTCCAGCGCCAGTAATTCTTCAATGGTCTGGCGACGGCGAA +TCAACCGCGCCTGACCATTATCAAACAGAACTTCTGGTAACAGCGGACGGCTGTTGTAGT +TGGATGACATTGATGCGCCATATGCCCCTGTATCATGCAGTACCAGATAATCACACGCCT +TCACTTCCGGCAAGGCGCGGGTTTCAACATTTCCCCCTTCCTGCTGGGTAAAGACATCGC +CCGATTCACATAACGGCCCGGCGACGACGGTTTCCACCGTTGGTGCGTGTTCCAGAGAAC +GACCATCAGCTGCCAGGGCACTGATATGGTGGTAACTACCGTACATTGCCGGGCGCATCA +GATCGTTGAACCCGGCATCAACCAGCACAAAGTGGCGGCTACCCATTTGTTTGACGCTCC +GCACTTGAGTAATTAATACGCCAGCCTGCGCTACCAGAAAGCGACCCGGTTCAATTTCCA +GTTTCACAGGATGGCCCAAATGGCGGGCGATTTGCTCACGCGCGGCATTCCACAGACCAT +AATAATGTTCGGTATCAACCGCCTCTTCACCCTGTTGATAAGGAATAGAAAGCCCACCGC +CCGCAGAAATAGCCTGTAAATCCTGACCGAATTCGAGGACCTGACGCACCATAGCACCAC +ATACCTGTTCCAGATGGGCATAATCGACGCCAGAACCAATGTGCATGTGAATGCCGACCA +GCTGTAGATGATGACGTTGTATCACGTCCAGTGCGGCGGGCAGATCGGTGTACCAGATAC +CGTGCTTGCTGTTTTCGCCACCGGTATTGGTTTTTTGGCTATGCCCGTGACCAAACCCCG +GATTAACACGCAGCCATACCCGATGCCCTGGCGAAACCTGACCCAGTTGGTCGAGCATAT +CAACAGAACCCGCATTCACCGGAATTTGCAATTCACTGACGCGTTCAAGCGTCGCCTGAT +CGATAACATCTGCCGTAAAAACAATATCATCGGGGTGCGTTTGCGGATTGTAACCCGCCG +CCAGTGCACGCTCTATTTCGCCTAACGAGACGGAATCCACTTTTACGCCCTGCTCACGCA +TTAAGCGCAAAATATGAATATTGGAACAGGCTTTCTGTGCAAAGCGCACCACATCAAACT +GTTTCAGCGCTGCAATCTGCCGACGAATAATTTGCGCATCGTAGACCCACACCGGGCAGC +CAAATTCTGCGGGCAAACGCAGCAGATTTTCGGCGGTGAGATCGGTATCAGTGCTGAACA +GTGAATGTGGCATAACAAACTCCAGATAAGTGCTTTTTTATGATTACGCCACATCATAAA +AAGAATAAAAAATATCGATTTATGTCGAGTCTATGCAAAAATGATATGGATTACCGGATT +GCGAGAGAGCGCTAATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAA +TGACCGCCGGAAGCCTGACTGAGGCGGCACACCTGCTACACACCTCACAGCCAACCGTCA +GCCGCGAACTGGCGCGCTTTGAGAAGGTGATCGGGCTGAAATTGTTTGAGCGCATACGTG +GACGATTACATCCTACCGTGCAAGGACTGCGTCTGTTTGAAGAAGTGCAACGATCCTGGT +ACGGACTGGATCGCATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGGGAGAAC 
+TGTCTATTGCCTGCCTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCT +TTCTGGCACGTTATCCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTG +AAGAGTGGCTCTCGGCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTG +CGGGAACAGAACGTACCGAATTACTCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCC +ATCCGCTGGCGGTAAAAAAGGTATTAACGCCGGATGATTTTCACGGTGAGAACTACATCA +GCCTTTCCCGTACTGACAGCTATCGCCAGTTGCTGGATCAATTGTTTACTGAGAATCAGG +TTAAACGACGCATGATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGGTACGGG +CGGGGGTAGGCGTTTCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTT +TAGTGGTGCGGCGGTTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGC +ACCGCCCGTCATCAGCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGA +AACTGGTCACTTCTCTTGACACTATTTTGTCGTCAGCTACGACAGCATAAAAGCGACAGC +ATCCTCGGCATGGATCGCCGCGGTATCAAACACAGGCAGAACACTGCGCTCTTCTGGCAC +CAGTAAACCAATTTCTGTGCAGCCAAAAATGACGCCCTGTGCGCCCTGTTCTGCAAGGCG +AGCAATCACTTGCGCATAATAAGCGCGTGACGCTTCGGTAAATTGCCCCAGACACAGTTC +TTCAAAAATAATCTGATTAATTTTCGCCCGTTCATCCGCTTCAGGAATAAGACAGTTGAT +GGAAAATTGTTCCGTCAGCCGCCCGCGATAAAAATCCTGTTCCATGGTGTAACGTGTACC +CAGCAGCGCCACACGAGTCATTCCTGCCCCGGTAATTGCACGTCCAGTGGCATCCGCTAT +GTGTAAGAAAGGCAGAGAGCAACGAGACTCAATGGCATCCGCCACTTTGTGCATCGTATT +GGTGCATAACACAATACCTTCTGCGCCCGCCCGCTGTAAGCCAAGCGCCGCCTCAGCCAG +AATATCCCCGGTTTTGTCCCACTCACCGCGACGCTGGCACTCTTCTATTTCATGAAAATC +GACGCTATGTAGCAGCACTTGCGCAGAGTGAAGCCCACCAAGCCGCTGTTTAATGCCTTC +ATTTATCAGACGATAGTAAGGAATAGTGGATTCCCAGCTCATTCCTCCCAGCAAACCAAT +TGTTTTCATTCCTCTCTCCTGATGTGTGTTACCGCAACAAGGCTGAATAAGGAACGAGAC +AAACGCCTCAACGGCCAGGTGCCCAATCTCTATTAACGAAAAAAGGGCCGGATGTACAGC +ACATCCGGCCCGTGAAATCAGACGCCGATATTTCTCAACTTTTCGCCTGCCATCAGTTTG +CGCTCGATATGTTCCAGCGTGACATTTTTGGTTTCCGGAATGAGCCAGAAAGTGATGCCC +ACAAACGCAATGTTCAGCGCAGTGTAGAGCCAGAACGTACCGGCAGCGCCAATGCTATCA +AGCAGTGTCAGGAAGGTCGCGCCGATAATCATATTCGACACCCAGTTTGTCGTCGTTGAG +CAGGTGATGCCAAAATCGCGGCATTTCAGCGGCTGAATTTCAGAGCACAAGATCCACACC +ACTGGCGCGGCGCTCATCGCATAACCGGCAATACACATCATCGTCATGCCAACAGAGAGC +CAGGACAAGCCACTGGAAGCCGTACCGTTATCAAACTGCATCAGGCAGTAACCCAGCACC +AGAGTGCCTAACGCCATCACGCTGAAACCAATTTTCAGAGCCGGCTTACGCCCTGCTTTA 
+TCTACCGTAAAGACCGCAATGAAGGTAGCGAACATAAAGGTCAGCCCCACGACCAGAGTC +GCAATCATCTGTTGTTCTGTGGTCGTAAAGCCCGCCATTTTGAAGATACGTGGCGCGTAG +TACATGATGATGTTCATACCGGTAAACTGCTGCATCGCCTGCAACAACATACCGAGAAAT +ACAGCACGACGGACGTTACGGTTGATCTTAAACAGTGCCCAACCGCCCTGTTTTAACTTC +AGGCTTTCACGAATTTCGTTGAGTTCTTCTCGCGCTTTTTCCGACGTATCGCGCAGCATA +CGCAACACTTCTTCCGCCTCAATATGACGCCCCTTTTCCGCCAGCCAGCGCGGGCTATTT +GGCAGGAAGACCACCAGAATAATCAGCAGGACTGCTGGTAAAGCAAGAACCCCCAACATT +GCGCGCCAGTTACCGCTATAACTGAACGCTGTATCGGATAAAAACGCCAGCACGATGCCG +AGTGTGACCATCAACTGGTACATGCTGATCATCTTACCGCGAACGTTTTCACTTGCCATT +TCAGAAAGATATAGAGGAGCGGTGTAAGACGCGATCCCAACAGCAATGCCCAACACCACA +CGAGCGGCGATTAACATCTCTACGCTGGTCGCAAAAGCGGACCCTATCGAACCGAGTACA +AACAGGATGGCCCCCGCCATCAGGCTGTATTTACGCCCCAGGCGGAACGACAGCCACCCA +TTAAACAGCGCACCAATTGCTGCGCCGAGCATCATGCTACTGACCACCCATTCCTGCAAA +CGGCTGGTCAGCACAAAGTGATCGGTAATGAACGGCAACGCTCCGGCGATTACGCCGATA +TCAAGACCAAATAACAATCCTGCGACCGCAGCAGCTACCGAAACAAACATATTCATACGC +CGCGTATCCCGCAGAGGACGTGGCGTTAAAGCAGATTCCGTATTGATAGTAACCATTTTT +TCCTGCCAGCAGAGAGTAAGACATAGTGAAAAAATACGTGAACAATTCACACAGGTGTCA +GGTCGGAAATAGCATAAATATGGATTAAATTGCTACGACATGTCGTTATGTGATGGATAT +TCCAATTTTCAAATTAAGTTGAATTATTGAGATTATTATTAACTACCTAATTTTAAAGCA +GATAAAATTCATAAAGTTCATTAATTGATAATTGATATGGATTATTTCATAACCATGATA +TGGATTATGATGATCTACAGGTATAAAAAACCCTGCCATGCGGCAGGGTCATAAAAGTAA +GAGGAATGAATTAACGCGCCAGCCAACCGCCATCCACAGCAATGGTATAACCATTTACAT +AATCTGAAGCGCTGGAGGCAAGAAACACTACCGGCCCCATCAGGTCACTCGGCAGTCCCC +AACGGCCAGCTGGAATGCGGTCGAGAATTTCCGCGCTACGTTGTTCATCTGCCCGCAGTT +GTTGAGTATTGTTGGTCGCCATGTAACCCGGAGCTATCGCATTAACATTAATGTTGTGTT +TAGCCCATTCGTTCGCCATCAATCGCGTCACACCCATCACGCCGCTTTTTGATGCGGTAT +AAGAAGGCACACGGATCCCGCCCTGGAAGGAGAGCATTGACGCGATATTGATAATCTTGC +CGCCATTGCCTTGCGCGATAAAGTGTTTCGCCGCTGCCTGAGACATGAAGAATACGCTCT +TGATATTCAGGTTCATGACATCGTCCCAGTCTGTTTCGCTGAACTCGAGAGCGTCTTCGC +GGCGAATCAATCCGGCGTTATTCACCAGGATATCAATATGACCAAACTCCGCTACCGCGC +GATCCAGCAGTCCAGGAATGCCATCAATCTTTCGCAGATCGGCGGTCAGGCTTAAAAAAC +GACGCCCCTGCGCCGTGACCTGCTTGATGGTTTCAGTCGGTTCAACGATGTTAATGCCAA 
+CAATGTCACAGCCCGCTTGCGCCAGCCCCAACGCCATCCCCTGGCCCAGCCCAGTATCAC +AACCAGTGACGACCGCAACTTTACCTTCGAGAGAAAATGCATTTAAAATCATAACAATAC +CTTATTCGTTTATGCCCACAACTAGCGCAAATCTTTAACGGCCACATGGTCCATATCATC +AAAAACCTGGTTTTCACCGACCATGCCCCAGATAAAGGTATAAGCTTTGGTTCCGACGCC +GGAATGGATCGACCAGCTCGGGGAGATCACCGCCTGCTCGTTATGCATCACAATGTGACG +CGTTTCTTGCGGTTGCCCCATCATGTGGAAAACGCAGGCGTCATCATCCATATTGAAATA +GAAATAAACTTCCATCCGGCGCTCGTGGGTGTGACACGGCATGGTGTTCCACAAGTTACC +TGGAGCCAGCTCCGTCAGCCCCATACTCAATTGGCAGGTTTCCAGCACATCCGGGACAAA +ATATTTGTTAATCGTGCGACGGTTACTGGTGAGGTTATCGCCTAACGTGACTGGAGATAC +TTCGTCCGGTGTGACTTTTTTGGTGGGATACGTCGTATGCGCGGGTGCGCAATTGTAATA +AAACTTCGCCGGAGTGGCGGTATCAATACTGGCAAAGACAACTTCTTTTGCACCTTTACC +AACATACAGGGCGTCGCGGTGACCGATTTCATAGCATTGACCATCGACAGTAATCGTACC +GGCACCGCCAATATTGATAACACCTAACTCGCGACGTTCAAGGAAATAGCTTACGCCGAG +TTGTTTACCAACTTCCCCGCCAACGGAAACCGTTTTAGTTACCGGCATAATGCCGCCAAC +AATAATACGGTCAATGTGGCTGTAAACCATGGTGTACTCATCGGCGACAAATACCTTTTC +AACCAAAAATTCATTGCGCAGCCCCTGGGTATCCAGCGTTTTTGCGTGCGCACTGTGGAT +GCTCTGTCTTACGTCCACATCAACCTCCGATAATCAGTGAAGCGTGAAAATAGAAAACAA +TAATAAAACACTGTTTCGTTTTCTCTATGAGGGGATGATATGCCCATGGGATAGGGTTTT +CAATTAAAAATAAAACAATGTTTCATTTTCAAGTTAAGGATTAAAAAAAGTGCAGTGTCG +ATCACGAATATGTCATGAGAATGGAAAAATCAGGGAGCCCTGAAAAGGTATGTCGACTCA +CCAGCCATCATTATTCAACAGATTAATGACGGCAGATATTTATCGGTAAGGAGGAAATGC +AGAGCTACTCGTCACGTTCAATGGTCAATGCCACACCCTGGCCCCCGCCGATACAAAGCG +TTGCCAGTCCTTTGCGGGCATTACGTTTCACCATTTCATGAACAAGAGAAACCAGGATTC +GGCAACCGGAAGCGCCTATCGGATGACCGAGTGCGATCGCACCACCATTGACATTGACCC +GACGCTCATCCCATTCAAGCATCTTGCCAACCGAAAGCGCCTGTGCAGCAAACGCTTCAT +TAGCCTCGATAAGATCGACATCAGCCAACTGCCAGCCAACACGCTCCAGGCAACGGCGGG +TCGCATACACCGGCGCAATTCCCATCAATGCCGGATCCACACCAACGCTGGCAAATGCGC +GGATGCGGGCCAGCACGGGTAAATTCAACGCTCGTGCTTTGGCTTCGCTCATCATCATTA +CTGCAGCTGCCCCATAGTTTATGGATGATGCATTACCCGCTGTCACAGAACCGAGACTAT +CAAATGAAGGATTTAAACGGGCTAAGGCTTCTGCGCTGGTGTCAGTGCGTGGCTGTTCAT +CGGTATCAACAACCAACGTCTGACCGTTACTTTGGGTTATTACCGGGACGATCTCATCTT +TAAATCGTCCGGCGTCAATCGCCGCTCGCGCTTTTTGTTGCGAGCTAAGTGCGTAAGCAT 
+CCTGCAACTGACGGCTGATGCCATATTCGCGAGCCAGATTTTCGGCGGTGACACCAATAT +GATAATCATTGAAGGCATCCCACAACCCATCATGCACAAGACTATCAACCAACTGGCTAT +TGCCAAGCTGTGCGCCGGTGCGGCTATCAGTCAGAACATGTGGTGCGCGGCTCATGTTTT +CCTGGCCACCGGCGATGACAATATCAGCCTCGCCACACTGTATCGCCTGAGTAGCCAGAT +GCAGTGCTTTAAGCCCGGAACCACAAACGTCATTAATAGTGATTGCAGAAACGCTATTAG +GAAGACCACCTTTAATAGCCGATTGCCTTGCCGGATTCTGCCCTGCCCCTGCAGTCAACA +CCTGACCAAGAATCACTTCATCCACCGCATATGCAGGAACGCCGGTACGTTCTATTAACG +CTTTGACGACCAGGCTGCCAAGTTCCACGGCGGAATGACCCGCTAACGCACCACGAAAGC +AGCCGATAGGTGTCCGTAACGCCCCGACAATCACAACGTCTTTCATCACAACCTCGCACC +AATTAACAGTGCAATAGTAAATGATTGTTAATTACAGTTATCTTAATTGTTTAAAAAAGG +TGATTTTTATCACAAAGGAAATACGCCTGAGTAGCAGTCAGAGACATAACTGGCACGTAA +GGTTTGCAACCACTAACCCACCAATAGAGAGGTAGATAGGGCGTTAATCTCCCATACTTA +ACCTGGTTTATGGTAAATTGCCCTCCATTTTGTTTAATTTGTAGATGATACGTTCAGATA +ATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCC +GTTGGTGCAGGCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTG +TTTATTACTGCTCTGGTCGCCTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAG +TTCATCCTCTCATCGAAAACATCAGCAGGTGAAGGGATAACGGGCGCGGTAACACACTAC +TATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACTTCATCGCCTTTTTTGTCGTC +GTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGCAAAGCATATG +GTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTC +ATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTG +ATTGCCTATTTCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTA +ACAACCCAGGTAGAGTTCAATCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTG +ATGGTTTTCGCTTTTAGCCATACGCCCATTATTTCTACGTTTGCCATAGACAGACGTGAA +AAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTATGAAAGTCGCTTATCTCATC +ATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCCACCTTCGTAT +ATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAAC +GCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCA +TTCCTGGGTACGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTA +CAGCAGGTTGGTGTAAAGAAAAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTA +TCGCTGATTACCTTCATTGTTTGTTGCATTAACCCGAACGCGATTTCGATGATTTACGCG +ATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGCCTACGCTGTCAACGTATCTC 
+ATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGATCGTGGGTATC +CTGTGCGTATCGGTAATGTTCTTTAGCTAATATCCGTTGTGGATGGTTCAAAATTGCTTC +AATTTTGAACCATCCCAGTTTTCATAATGTTCATTTGTTATTATTCCGCCCTATCACTTC +TCTCGTAATATTATATAATTATCAGCTAGTTAAACACACAAAGAGTTCTGAACATCTTAA +ATAAGACTATTTAAGATACATGACGATTGCATTGCGTAAACGCTTTTTATTTACAAAAAA +TGGGGAAGTATTACGGCGATTGCGAAAAGTCTGAAGCGCTTGAATTAAGATAATATAGAA +AATCAGATACAACAAAAATGGCAGGTAGATGATGTGAAGATAAATTGGAGCGGGCGAAGG +GAATCGAACCCTCGTATAGAGCTTGGGAAGCTCTCGTTCTACCATTGAACTACGCCCGCT +TCGAGATGCGTAAGGCATTATAAACCTTACGCTCTCCTTAGCAAGTACCACGCTGCTGAC +TGCTGATTAATTCACCATCAGCATTTTGGCTTGCTGCCCTGAGGCGGCAAGTAACGTAGC +GGATCAATTGCCGTTGCACGGTAACGAATCTGGAAATGCAGGCGAACAGATGCCGCATCA +GTGCTCCCCATGGTGGCGATTTTTTGCCCAGCTTTCACGCTTTGCCCATTATTTACCAGC +ATCGTGTCATTATGAGCGTAAGCCGTAATGTAATCTTCACTGTGTTTAATCATGATGAGA +TTACCGTAGCCACGCAGCTGGTTGCCCACATACACCACCTTTCCTGCACCCGCGGCGTAA +ATAGGTGTACCCCGTGGAGCTGAGATATCAATTCCTTTATTGCCGCCATCTGCTGTCGAA +TACGGCATGATAACTTTCCCTGTCGTTGGCCATAACCAACAACGTTGCCCTACTGGCGGC +CAGGAAGATTTCGGTACCGCTGATGACGGTGTAACCGATGCGGTTTTGGTCGTTGATTTG +GCGGTTGATTTACGTGTACTACTGCTACTTTTCGCCCCACCCAGTTTTAGTTTCTGACCT +ACTTCAATGGTGTAAGGGGGGGAAATGCCGTTCAGTCGCGCCAGTTCTTTTACGCTGGTT +CCCGTGGTGCGCGAAATACGATATAGCGTATCCCCCCGTTTCACGGTGTAAACGGAGCCG +GAATACGTTCCTGTATCGGATGATTTGCTACCCGAACAGCCCGCCAAAAGCAGTCCAACC +GATAACAACATCACGATACCCAGAGATTTTTTATTCAGGCGTCCCGCACTCAAAATCTTT +CCTCGCTTAAAAAACAAGACGCCATATCATAGCAGCCGGCTTCTGGATACCCAATCTCTT +GCTTCTGGAAAAGCGATGTAATAGAGAAAGAGGTTAATTTCATTTGGCAAAGGGAAGTAT +CATCAGCAAAATATTTGCTGTAGTGGTATCGAAGTTCCTGACTTTTACCCTATTTCCCAC +CTTGATGCGTAATAATCCTAATTTATCACATTGATTTTATCGCCACTCATATTGATACGT +ATCACTGTCCCTATTCAGAGTCCTGTTTCGTATCATATCTGTGTTTTTTTAACGTCATCA +CACTTCCTTCCTCCCCTCACGCATATAGTCGTTTCTGGCGTAATTCTTGCCTGCTAAGAC +TAAATCTTTGCCATAAGAACCAAATGTTCAAACCGAGGGGATTTCTATGGAAGCGCGGGA +AGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCTAAGGTCACCGGGCG +GGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCGAAATATGTACGTAG +CCCTATCGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCCAGGAGTTTGCCGGG 
+CGTCCTGGCGATTTTTACCTGGGAAGATGTGCCAGAAATCCCATTCGCCACGGCAGGGCA +TGCCTGGACACTTGACGAAAACAAGCGCGATACCGCCGATCGCGCACTGCTAACTCGCCA +TGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGTGGCCCGCGATGAACTCACGGCAGA +AAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTTATCACCTCGCCAGA +AGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAATTTACTGAAACAAAG +CACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGCCGACTACCAGGTACAGGG +GCACTATCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTGACATCGCTGGCATG +GATGGAGGATGACTCGCGAATTACCATCGTTTCCAGCACCCAGATCCCGCACATTGTTCG +CCGCGTGGTTGGTCAGGCGCTGGATATTCCCTGGTCATGCGTACGAGTCATCAAACCGTT +TATCGGTGGCGGTTTTGGTAATAAACAGGATGTACTGGAAGAGCCAATGGCGGCATTCCT +GACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGTGAAGAGTGTTTCCT +CGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGCGTGAACCGCGACGG +AACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCTTATGCATCTCACGG +GCACTCCATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTATCCTCGTTGTGCCTA +CGCTTACAGTTCAAAGACCTGCTATACCAACCTCCCCTCGGCTGGTGCGATGCGTGGTTA +TGGCGCGCCACAAGTCGTATTTGCCGTTGAGTCTATGCTTGATGATGCCGCGACAGCGTT +AGGTATTGATCCTGTTGAAATTCGTTTACGCAACGCCGCCCGCGAAGGAGATGCTAATCC +GCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTTGAAAAAGGCCGGAA +AATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAAGGCAATTTACGTCG +TGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCTGTCGGCGTAGAAAT +AGCAGGCGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTGCAAAGCGGCGCGAC +GGAAATCGGTCAGGGTGCCGACACCGTCTTCTCGCAAATGGTGGCAGAAACCGTGGGGGT +TCCGGTCAGCGACGTTCGCGTTATTTCAACACAAGATACCGATGTTACGCCGTTCGATCC +CGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGCGCCTGCGCTGCGCAGTGCGGCACT +GTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACATCAGTCAGCGATGAA +TCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAAGAACCGTTAATGTC +GTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGCGGGCAGCTCTCTGC +TGAAAGCTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGTACATTTGTTGATCT +GACGGTCGATATTGCACTGTGCAAAGTCACCATCAACCGCATCCTCAACGTTCATGATTC +GGGGCATATTCTAAATCCGCTGCTGGCAGAAGGTCAGGTACACGGCGGAATGGGAATGGG +CATTGGCTGGGCGCTATTTGAAGAGATGATCATCGATGCGAAAAGCGGCGTGGTCCGTAA +CCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCACAACTGGAAAGCGC 
+GTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCACTGGGTGAGCCACC +AATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCTACCGGTGTTGCAAT +CAATACACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCATCTGGCAGGATTGAT +TTGAGGATAACATCATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATG +CCATCACCCTGCTGGCTGACAATCCGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTAC +TGATACAGCTTCACCATCACAATGACCGCTATCGCCATATTGTTGATATCCACAATCTGG +CAGAGCTTCAGGGAATAACACAGGCGGAAGATGGCGCGCTGCGAATCGGCTCCGCGACAA +CATTTACTCAGCTCATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTATGTGCTG +CGGCTGCATCAATCGCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTT +GCAACGGTGCCACCAGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGG +AGCTCCACTCCCCACGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGG +GCAAAGTGTCTCTTGAGCATGACGAAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGA +AAGAACACGCGGGCAGCGCACATTTTAAATATGCCATGCGCGACGCAATGGATATTTCAA +CAATTGGCTGCGCCGCACATTGCCGACTGGATAACGGCAATTTCAGCGAATTACGCCTGG +CATTTGGTGTTGCCGCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTGCACAAA +ATGCGCCATTAAACCTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCG +CCCCGCGTTCTTCATGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGA +CCAAAAAAGTGATTAGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGAATCACAG +CGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTTCACGCCGCGCC +AGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTCAAACAAGGTTG +CTGCGTAGGCGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCGATAGACAGTTG +CTTATTCCTTGCGGCCTGGGCTGAAGGAAAAGAGATCCGCACGCTGGAAGGTGAAGCGAA +AGGCGGTAAACTTTCTCATGTCCAACTGGCTTATGCGAAATCTGGTGCAGTGCAATGCGG +GTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAATGCTGGCGAAACCACGCGAGAA +GCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGTCGCTGCACAGG +GTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAAAAGGATATCCG +GCCTGAATTCAGGCCGGATTCTCAGAGGTTATGTGTTTAACAACTCATATTTCTTAATCT +TGCGATAGAGCGTAGCAATGCCGATGCCCAGTTCATCAGCAACTTCCTTCTTGCTGTTAT +GACGTGAAAGCGCCTCGCGGATCATTTGCTTTTCCATCTCCTCCAGCGCCGTGCCGCCCG +CATCATCGAGTGACAGGTGCGCCTCACTGACCTCTGTTACATCACTTTGCTCCGTTGTGC +CATTATTCAGCAGATTTGGCGGCAATAGCGTGCTGTCGATAACTTCACCTGAAGGAACAA +CGTTAACCAGATATTCCATCAAATTGCTTAACTCGCGCAGGTTTCCGGGCCAACGATGCT 
+TACGCAATATTTCGACGACATCAGGAGCAATGCCAGGATAAACCGATCCCAGACGACGGG +TATGCAGATGTAAAAAGTAATGCACCAGTAATTCAATATCTTCCTGACGTTCACGCAGCG +GTGGAAGAGTTATCGGGATAACATTAAGTCGGTAGAAGAGATCTTCGCGGAATTTACCTT +CGGCAATGAACTGGGCCAAATTCTGATTAGTTGCAGAAATGATGCGGATGTCGACTTGTA +TTGGGCTACTGGCACCAATCGGCAGAATTTCACGCGCCTCAATAGCGCGCAGTAATTTAG +CCTGCAACATTAATGGCATATCACCAATTTCATCGAGAAACAGCGTGCCCGTATTCGCCG +CCTGAATCAACCCTGTTTTACCGTTGGCAGAAGCGCCAGTAAATGCGCCTTTAACATAAC +CGAACAGTTCGCTCTCCAGAAGCTGTTCCGGAATCGCAGCACAGTTGATAGCAATAAAGG +GTTTATTCCGTCTTCCGCTCAACTTATGGATTGCACGGGCGACGACTTCTTTACCCGTGC +CGCTTTCACCAACCACCATAACGCTGGATGGGCTGGGTGCAATACGGCTAATGAGTCGTT +TTAATTGCCGCATAACACGGCACTCGCCAACCAATTGTTCAATATGCGGTTCATCAGGTG +CATTTGCTACAGAAAAACTGGTATGCGATTGGTGAAACGCCATTAAAAATAGTTGTCGGC +CCTGGATGTTATGCAACTGACCAATGATTAATTCACTTTTATCATCCCACGAAACAATAT +GTTGCATATGACCATGGGTAAAATTACTCTCAAATGTTAATGGTCTGAAACGAACAGGTT +TTCCAATAATATTATTTTGTACAACACCGAGTGTTTTTAAAGCTGTCTGATTAACAAACT +GAACCCGATTATCAGCATCAACCACTAACACGCCCTGATCCATATTATCGATCATGGTCG +CGAATATTTTACTGATGTTATCTCCTGGTCCCTGATCCTCCAGAAGTTTAGAAACAAAAA +TGGTGGATATATGGCGAACGTAATCGGAAAATTCGCGTAAATTATCACTGATATGTTCTT +GTTGCTCGTGGGTAACGGCAATCAAACTTATCACCCCAACACAACGATCCTGTAAAATGA +CAGGCGTACCCAGAAATGCTTTTTCGCGGCAATTTTCTTTACTATCGCAACCTTCACAAA +GGGGATCGAAGCGAGACTGTGTCACAACTTTTTCAGTTTTCGTTTCCAGGACGTGGCGGA +GCAGGCGTGAGTTGCCGCTCAACTGGCGGCCAAGAAACTTCCCATACGCGCCCGTTCCGG +CGACGCGACACAAGTTTTCATCAACGATCTCAACCTCAAGCTGCAAAACGCTGGCAAGCA +TTCTGGCAAAACGCTGAATTGTCGGTTGAATTTGCATCAATACTGACTGCGTAGTCGCAA +GCTCCATAGCTTTACCTTCCAGACTTACTTAAAAGTCGATCATTGAAGACGTTGATGGTT +CACAGATCATGATGATATTAACTCAGGCGAAATTGGCTTTGATAAAAACATAAGATTTTT +ATCACTTTCTAATAAAATTATGGAAGAGATATCACATTTCTATATCAATATGAGAATTAC +AGCGGCAAGTTTATCAAACTGAAGAGAGATAGCCTGCCTCTTTATCTTATTTCTGATACT +TAGCAGCAAATAAATAACGTGATAAAAAAAGCCAAACGTTTTCGTATTTTACAAACAACC +GGAAACTGGCATCAATATGTGATCAACCCCACACATTATCCGTCAAATTAGCCTTTCGCA +GCCGCGTGGATAATTCTGGCACACTTATTGTTAGTCCCAGGTATAGCTGTGAAAACACCA +ATCACTTTGGCACGTCACAGTGAAATAAACCACTTTGCCTGTCATTCCACTATCGGGACT 
+TTATGATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGC +ATGAAAAAGATTTTTTGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGG +ACGTTGCCGCCGCGTTAAAAGCACTGCGTGCTGAAAACATCTCAACCAAAGTCTTTAATA +GTGGATTAGGTATTTCCGTCTTCCGCGACAACTCCACCCGTACCCGCTTCTCTTATGCTT +CCGCGCTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAGGTAAATCACAAATCG +CTCACGGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGCTATCG +GTATTCGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGG +CACTTGATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGC +AATGCGATATTGACCACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACT +TTGGTTCGCTGGAAAACCTGAAAGGCAAAAAAATCGCCATGACCTGGGCCTACTCCCCAA +GCTATGGCAAACCGCTCTCTGTACCACAAGGCATCATAGGTCTGATGACCCGCTTCGGTA +TGGATGTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGGATGTCGTTGAAGTTG +CTAAAAACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGAAGAAG +CCTTCAAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAG +AGCGTACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGT +GTCTGGCACAGAACGCGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGA +CCCGTGATGGCGAAGCCCTGTACATGCACTGCCTGCCAGCTGATATCAGCGGCGTATCCT +GCAAAGAAGGTGAAGTGACTGAAGGCGTATTCGAAAAATACCGTATCGCTACCTACAAAG +AAGCCAGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCCGTAAATACGCCAAAC +CAGGTGCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAACCCCTCG +GGCCGATCAGCTGGTCGGCCCTCTATTTCCAGAGGCCAAAAGGATAGGATATGTCCGTTT +TCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACATCACCGCTTT +TTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCTGGTTATCACC +CAACACCGCTTTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAGAAAATTCTCG +TCAAAGACGAATCAAAACGATTCGGTCTGAACGCCTTCAAAATGCTCGGCGGTGCGTACG +CCATCGCTCAATTATTGTGTGAAAAATATCATCTTGATATCGAAACGCTGTCATTTGAGC +ACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGACTACCACCGACGGCAACCACG +GGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATTTACATGCCGA +AAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAGTGCATCGTCA +CGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAGCAGCACGGCT +GGGAAGTGGTACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACCTGGATCATGC +AAGGCTACGCAACACTGGCGGATGAAGCCGTCGAGCAAATGCGTGAAATGGGCGTAACCC 
+CGACACACGTTCTGCTACAAGCCGGTGTCGGTGCAATGGCCGGTGGTGTGCTGGGTTATC +TGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTATTGTTGAACCTGACAAAGCTG +ACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGTGATATGGCCA +CCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAAATCCTACGTA +ACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGTATGCGCGTGC +TGGGTAATCCGTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGCGCTGTCGGTT +TGGGCGTTCTCGCAGCGGTTCATTATCACCCGCAACGTCAAAGCCTGATGGAAAAACTGG +CGCTGAACAAAGATGCCGTGGTGCTGGTTATCAGCACTGAAGGCGACACCGACGTGAAGC +ACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGCACCTTAATCACCCTATTGGA +ACTGCTCCCTGCAAAACGGGGAGTAAAAAATCTGGAGAAAAATAATGGCTAAGAATATTC +CATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGACATGACTCGCTTCCTAC +GCGATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGCGTAGTACATCGTATTA +AAGAAGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGACCCAATGGGCAACGTTC +TCGGTTATATCGGCCACGGCCCGCGTCTGGTGGCAATGGACGCTCATATCGACACCGTCG +GCATTGGCAACATCAAAAACTGGGACTTCGATCCGTATGAAGGCATGGAAACCGACGAGC +TGATCGGTGGTCGCGGTACTTCCGACCAGGAAGGCGGCATGGCATCTATGGTTTATGCCG +GTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTGCTGGTTACCGGTACTG +TGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATTGAACAATCCGGCATTC +GCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTATACCGTGGTCAACGCG +GTCGTATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCACGGTTCGGCACCAGAAC +GTGGTGATAACGCCATTTTCAAAATGGGTCCAATTCTTGGCGAATTACAGGAACTGTCTC +AACGTCTGGGCTATGACGAATTCCTCGGCAAAGGTACGCTGACTGTTTCCGAAATTTTCT +TCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAGCTGCGCAGTTTCTATTGACCGCCGTC +TCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGTGCCCTGCCTGCAGTAC +AAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCGTCCTGGACTGGCCTGG +TTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAAGATCACTTCACCGTTA +AAGCACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCTGTCGTTGATAAGTGGA +CCTTCTCAACTAACGGCGTATCCATCATGGGTCGCCACGGCATTCCGGTCATCGGTTTTG +GCCCTGGTAAAGAACCGGAAGCGCACGCGCCAAACGAAAAAACCTGGAAATCTCACCTGG +TAACCTGTGCCGCTATGTACGCTGCAATCCCATTAAGCTGGCTGGCAACCGAATAATTAC +TCTTCACTTATTCCCCTCCGGTTCGCCGGAGGGTTTTTGGAGTTTGCTATGCGCGTATTG +ATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGATTTGCTGATTGAA 
+AGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCTTGCGAAGAAATT +GATGCCTCTGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACGCATTTCAATATT +GATGTCGGCATCGCGCGCAGTTGTGATGATTTTTTTACCGGTACCCGCGCTGCTGCGTGT +GGCGGTACAACAACCATTATTGACCATATGGGATTTGGCCCAAATGGCTGCCGGTTACGC +CATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAAAGCAGTCATCGACTACAGCTTT +CACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCGATGATGGTTGAG +GAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTCAACGATGATGAA +GTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACCGTACACCCGGAA +AATGACGCAGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGGTTAACCGCGCCG +CGTTATCATGCCTTGAGTCGACCTCTGGAATGCGAAGCGGAAGCCATCGCCCGCATGATT +AACCTGGCACAAATTGCCGGTAACGCCCCGCTCTATATCGTGCACCTGTCTAACGGCTTA +GGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCAGCCAGTCTGGGTTGAAACCTGC +CCACAATATCTCCTGTTGGACGAACGCAGTTACGATACAGAAGATGGCATGAAGTTCATT +CTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGTGGCATCAGCGAT +GGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCTCAACGCCTGCAA +ATTTCTAAAGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTGGAGAACCGCATG +CAACTGCTGTTCTCCAGTGGCGTGATGACGGGACGTATCTCACCGGAGCGTTTTGTTGAG +TTAACCAGTGCAATGCCCGCCAGGCTGTTTGGCCTGTGGCCACAAAAAGGATTATTAGCG +CCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACGTCAGAGCCAACAAATTCAGCAT +CGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACCTGTCAGGGCGCG +ATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACCTTTACAGGCAAA +GCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTGCTCTAACCACTG +CCAGGGATCTATACACAATCAAGAATGATGAGTGAGGAAAAATGAGTAAGAAAATTGTTC +TCGCCCTGGGCGGGAATGCGCTGGGCGATGACCTGGCTGGGCAAATGAAAGCGGTAAAAA +TTACTTCTCAGGCAATTGTTGATTTAATTGCCCAGGGACATGAGGTCATCGTCACTCATG +GCAACGGGCCACAGGTGGGCATGATTAACCAGGCCTTTGAAGCTGCAGCAAAAACTGAAG +CGCACTCGCCAATGCTGCCGATGTCTGTCTGTGTTGCCTTAAGCCAGGGTTATATTGGTT +ACGATCTACAAAACGCCTTAAGAGAAGAACTGCTTTCTCGTGGCATTAATAAACCTGTAG +CAACGCTGGTTACCCAGGTCGAAGTCGATGCTAACGATCCGGCATTCCTCACCCCGACCA +AGCCGATCGGTTCGTTCTTTACCGAGCAAGAAGCAGAGCTACTGACAAAACAGGGTTACA +CTCTGAAAGAAGATGCGGGTCGCGGCTATCGCCGTGTCGTTGCTTCGCCAAAACCGGTTG +ATATCATTGAAAAAGAAACGGTTAAAGCTCTGGTAGATGCCGGACAGGTGGTGATCACCG 
+TTGGCGGTGGTGGTATCCCTGTTATTCGTGAAGGTAACCATCTGCGTGGTGCCAGCGCGG +TTATCGATAAAGACTGGGCCAGCGCCCGTTTAGCAGAAATGATTGATGCCGATATGCTGA +TCATTCTGACTGCGGTAGAAAAAGTGGCCATTAACTTCGGAAAAGAGAATGAACAGTGGC +TCGATCGCCTGTCGTTAAGTGATGCTGAACGCTTTATCGAAGAAGGTCATTTTGCGAAAG +GTTCTATGCTGCCTAAAGTGGAAGCTGCCGCCTCGTTTGCTCGCTCTCGCGCAGGTCGTG +AAGCACTGATTA +>test.0417.00002.0004 31459 +CCGTATTGAGCAAAGCGAAAGAGGGGATTGAAGGCAAAACCGGAACGGTGATTTGTCAGT +AATTTAAAGGCCGGATGGGTAATACCATCCGGCCATTTTCATTTAAGCCACTTCCAGCAC +TTCTTTTGTCGCTTTAACGCCCTGATGCATCAACATCATTAACGCCTCAAGTACGCCGCC +GCCAATCGCCCGGGCTTTATCAGAAACGCTGGTGAAATCAGCCGTTTCACCACGAGGATC +GATATCACCAATTTTAAAACCACCGACCACGGCCAGTCCGTCGTTCAACAAGCCACGCAC +CATCCCCGTCAACGGTGCTTTAATTTCATGCTCACCAATCCAGGCAATGACATCGCCCTC +TTTCACCAGATCGCCTAATTTCACGTTGGATCGCATAATGCCTGCAGCAGGAGCGCGGAT +CACTCGTCGGGTGGTATGCCCCATAATATTGCCGGGAACACCGGTATTCTCCTGCGCACA +ACCTGAGTAAATCACCTGACCGAGCCAGTGCCCGCGATTTGTTTCAATTACCGCATGACA +ATCCTTCCCTGCAGTAAAGCCCGGCCCAAGCGCGATTGTTACTGGTGCCATATCTGCCCG +CGTTCCCAAATTCTGTTTCGCCAGAATAGCGTCCACCACGCAAAGCGGTTTCAGTTCATC +AAGCAATGAACAGGTGGGATCTACCATCACAGGGATAAATCCGCGTTCGGTAAGTTTCAT +CGCTTCCGCAGAGCTGGTTGCCAGGCGGGCGGTGACGCCTTCGACCGTCATTTCGCCATC +GAACACGGCCTGGGCAAACGCCACGGTACAACGAATCACTGTCGGTTTTTCCACTTCCAA +CATGATCACTTTAAAACCCGCATGATACAGACGTAGCGCTACACCACTGGCGATATCCCC +CGCACCGCGAATCACCACCAGCTGGTGTCCGGAAGGATGAGAAGGCTTCATCATCAGCCC +ACCCGGCGCGTTATTTTTCACCTGTAATATTTCTGCCAGCACGCTGATGGCGATCTCTTG +CGGCGTTTCCGCACCTATATTGTAACCAACGGGCGCATGTAAACGGGCAATATGTTCTTC +AGCCACGCCTTTCTCACGCAATTGGCGCAGGAAAAGCTGAACCTTGCGGCGACTTGCCAG +CAACCCCAGCCATGCAATGGGTTGTTCAATGAGTTTGTCGAGGGCTTCACGATCCTGATT +ATTCGTGGCAATCAGGACAAAATTATCAGGGCGAATATCCAGTGCTTCCACTGCCGCACC +AAACGACTCAGCATGGAGAAGCGTGGTTGATGGTGGGAATAGTTCAGGATTGAGGCTTTC +GCGATAAATATCAGCAACGGCGATATCAAATCCTAATAGCGCCGCACTCTGGGCTATCGC +CCGGTTGACATGCCCCGCACCAATCAACACCAGACGTGGACGCATACCATGGACGCTGAT +AAATACTGACATTGCACCTCCACAATCTGACCCGACAGCATCCGCACCGTTACGAGCCAT +ACGTCCATGGAATAATCGCGGCTTACGTTCCTGCAATGCCTGAAGCGACTCTTCAATCAC 
+CTTCCGTTCAACCATTCCGCCACCAATTGTACCGACGATAGAACCATCGGCGCGCACTAA +CATTTGTGCAGAATGGCGGGGGGTTGAGCCTCGGCTATCAACAATTTGCGCCATCGCAAA +CGGACAATTTTGCTCTTCGAGTTTTGCAGCCTCTGTGAAAATATTCATACCAACCTCAAT +GGATATCCTTTCAGTAACCCGGAATACCCGGGCCGCTAATTCACAAATCTGCGCGCGATT +GCAGGATGTTCTTGTATATCGCCCAGCCAGATTGCCTCTACGTTGTGTTGTTGCAGCGGT +TGAAGGAGCTCGCTTTGCGCAATCGCATTCTCACATTGAGAAAAACGGTTAATGAACCAG +ACTCGCCGACAACCTTGTGGTACGTTTTTAAACGCCCCCTGAGGGTGGCGAACCAGCGCA +ACGAGATCGCTCAGTTGCAAGGGTGCAGCAGGTGTTAACCCAGTAATATCAGCAAACTGC +GACCAGCGATGGACATTTTCTGTGCTCACTTTCGCACCCAAAATATGTCCTCCCATCACA +GCAATCACGCAGCAACTGCTTTTAGGTATGCAAGGTTCGTGCTCATCAGGCGCTTTTAAC +GGCATTCCACGCGAGCCATCTGCCTCAATGAGAATTACGTCACACTCTGGTCGTTGTACC +AGTGCATCAATCGCTTCTGGCGTAAATCCCTGCACTTTTCCCTGGTTCGCTTTCCAGCAG +TGAAAACAAAATGAAATGGGGGATATAAAAGACGCATGAGGAAGCATGGCGGGATCACGA +CAGAAAACCACGGGCCAGTGAGATGTTGGCATAAACATATGTGTCGTCGTAGTGATTAAT +ACACGCCTGCCACTCGCCTGGAACAGTTCTGCCAGCCAAAAAAGCAAGCTGGTTTTCCCC +CCAGCACCAACAATAGAAATCACAGTGGGACGTTTCTGCGCGCCTAAATCAATGAATAAT +GCCGATGGGTCAATTATACTTTTCACGCGTCTTTATGGACCTCTCTGGGATAAATTACCC +TCAACGTAATCCATCAGGAAGTAACGCAATTATCAGGCGTTATTAGCTCCTGTAAATAAT +GGAATCACTATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATG +GGGCAATGGAAAATGATGTTACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAA +AATGCGTTGCAGTTTTGTAGCCGAATTATTTTAGTCACCGGCTATCGTGGTAATGAACTG +CACGAACGTTATGCGAACCAGAGCAATATCACTATTATCCACAACCCAGATTATGCGCAG +GGTTTACTGACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAACATTGTTTTCTC +ACCCACGGAGATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACGA +AATGATGGCGCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCA +AAACCATGCCTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTC +CTTATGGGAGAACATTATTCCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGAT +ACTCCGGACGACTTTATTACAGCGAAGAAAAGGTATACTGAAATTTAGAAAACGTAGTTA +AACGATTGCGTTCAAATATCTAATCCCTCCAGCACTCTTTATCATAATGATAAGGAATCA +CTGATTTTGAGAAAAGAGAAAAAGTGATAAATGGGCTGGCAATAATAATTTTCAGGAGTG +ATTTTAATTCTCATTTGGCACCTGTGAGTTCATTCACAAAAAGCCATTAAGTTTCGAGCC +GCCTCACATTTTTTTATATTTCCCGCCAAACCTGGCAAGAGTGGTGCGATTGTTGCTCTA 
+TCCCCCTAAACCACCGGATTTCTCAACACCGGTCACTCAATGATATCTGTATAAGCTAAG +GAGAGGGTTATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATA +TTTGATGAATACCAACAACAACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCA +CCCGTAAAAGGTAAAACTGTTAGCGTCTTCGGTGAAACCTGTGCCACTCCCGTCGGCCCT +GCCGCTGGCCCGCACACGCAACTTGCGCAAAACATCGTCACCTCCTGGCTGACTGGCGGA +CGCTTCATCGAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGGAAAAGCCCTGT +ATCGATGCCGAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAAA +GCCTGGGATGAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAG +CCTTCTGATTCCGGTAAATCGTTCATCTTTAATATGAGCGTCGGTTACAACCTCGAAGGT +ATTAAGCAACCGCCGATGCAGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCG +AAATTCGCTCAATACCGCGATGCACTTAATAAGCTACTCCAGAATGAGGCATTTTTAGCC +CGCCACGGATTGCAGGAAAAACGCGAAAGCTTGCAAGCCTTACCCGCTCGCATCCCCACC +AGCATGGTACAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGCATGAAATCGAA +GCCATTTGCCGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCCG +ACCTTACTGGGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATC +GGCTTAAAAGAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTG +GAACGCCTGATGGCACTGGCAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAAC +ACTCTCGGCACCATTAATAACAAAGGCGCACTGCCTGGTGAAGAGATGTATATGTCAGGC +CGTGCGCTGTTCCCGCTCTCCATCAACGTTGCAGCAGTTCTCTCTCGCGCCTTTGACGGC +AAACTGCCCATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCGATATTTTTGAT +ACTGGTATTCGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCGC +TTAAGTGCCTGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGAC +GTCGAACGACTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACAC +TGGAAGCCAGAAGAGCGTATTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTT +GCCCCCTGTGTTACTGCCTGCGCTATCAAGCAAGATATTCCGGAATACATCCGTCTGCTT +GGCGAACACCGCTATGCCGACGCGCTGGAACTCATCTATCAACGCAACGCCCTGCCCGCC +ATTACCGGTCATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCCTGGATTACGAC +AGTGCGCTGAATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATAT +AAGCAACGCTGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGT +GCAGGTCCGGCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACG +CTGTTTGAACGCGAAGCCAATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGT +ATTCCTGCAGAGTTAATTCAGCACGATATCGATTTTGTTGCCGATCACGGCGTGAAATTT 
+GAGTACGGTTGCTCACCCGATTTGACCGTTGAACAGTTAAAAAATCAGGGCTTCCACTAT +GTTCTGATTGCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGGGCGACAACCAA +AATGTCTGGAAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCTG +GGCAAACATGTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCG +TTACGCGTTCCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATG +CCAGCATGGCGCGAAGAGTATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTG +AATAATCCGGAACGTTTCGATGCTGATGGCACCTTAACCTTGCGCGTTATGTCGCTTGGC +GAACCTGATGAGAAAGGTCGTCGCCGTCCGGTTGAAACCAACGAAACAGTAACGCTGCAT +GTAGACAGCCTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCCTGAATGCAATG +GGCGTGCCGCTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCTG +ACTGACGTCTTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTC +GGAACCGCGCGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAG +AACGATAAATACTGGAATAACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATC +TCTGTCACTCTGGTGAACAGTGACGATCGTGATGCGTTTGTCGCGCAGGAAGCCGCTCGC +TGCCTTGAATGTAACTACGTTTGCAGCAAGTGTGTGGATGTCTGCCCGAACCGCGCCAAC +GTATCCATTGCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACCTCGACGCTTAC +TGTAACGAATGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGAC +AAAATCACCGTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTT +GTGGAAGATTGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGAC +AGCGAAGGTCAGTTCAACAACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGC +CATGTCCACCAGCATCATCATTATCTGCTGGGCCGCGTGGAGGTGTAATCATGTTGATTC +TGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGCGTTGATATCG +CCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGCTATCCCGATG +CCAGCTACAAAGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGCTCGCATAACC +ATTTTTACTCGGGGCTTTCCCGCGGAATTATGGCAAACATCGCCCCCTGCCCGGATTTCA +TCTCAACGCTGAAAAATCTCTGGTGGCGGCTCGATCGCGCCCTTGATGAAGAGTCGCTCT +ATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAGCGGATGTACATCGGTTATCG +ATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGCGACGCATTTT +TAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAACAGCGGCATCA +AAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATTGATGAGGCGA +AGAAAGCAGCAACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCACGCGCCGTTTA +CCGTACCGGATGCCGGTCTGGAGATGCTGTGTGAAGCCGTGAAAAGCACAGGTCGTGGTT 
+TGCATATTCACGCTGCGGAAGACCTTTACGACGTTTCCTACAGTCACCATTGGTACGGCA +AAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGACAGCAAAACGCTGGTCGCTC +ATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGATGCGTTCCTGG +TGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCACCTTAGCGACA +TCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAAGAGATGAAAT +TTGCCTTCTTTAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGTTTTGCCAAAG +CACTGGCTAACGGCAACGAACTGATGAGCCGCAACTTTGGCGCGAAATTTGGGCTTCTGG +AAGCCGGTTACAAAGCCGATTTAACCATTTGCGATTACAACTCGCCGACGCCGCTGCTGG +CAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTCAGGCAGCGTTCACAGCGTGA +TGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGCGATTCCATTT +ATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCGCTGGCATAAA +TAACAGCTCCCCTCTTCTTTCAGAGAAGAGGGGAAATTAAGGAAAGACGATGATTGAACA +ATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGCTACCAGGATGA +AGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGTACCGATAAAAA +GATTGCCATTTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGATAACGGTGCACT +ACGAATTGGCGCAATGTCTCGCTTGCAGCCACTGCGTGATGCGCGATTTATTCCTGCAGC +ACTGCGTGAAGCCCTCGGTTTTGTTTACTCACGCCATGTTCGTAATCAGTCGACCATTGG +TGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCTTCCCGTCCTGCTGGCACTGGA +TGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTACCTGGCCTGCCC +ATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACCTGTGCGACTCG +CAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTTGCAATAACAGA +CCACGACGGTATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTGCGTCTGCACGA +TGTCGAAACTCAAAATCTGGAAGGCAATGCACTTGAACAGGCTGTCGCCAACGCCATTTT +CCCGCAGGAAGATTTGCGGGGCAGCGTGGCCTATAAACGCTATATCACGGGAGTTCTGGT +AGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGAAGCCGTATGATCATCCACTTT +ACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAAAACGTGCAAAAGCTG +TTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGTTTTGGGTTTGCCGGT +TCTGACGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTGCTTATCGCCGCACAG +TTAGAGAAGGCAGATATTCGTACCGCAGAATCTCTGGGCAAATGGAATGAGTTAAGTCTG +GTTCAACAGGCCATGGTTGATGTTGGCGTGGTGCAGTCTGGTTATAACGATCCAGCTGCG +GCTCTGATTATCACCGATCTTCTCGATCGCATCGACGCACCTACCCGCGAAGAGATCGAC +GACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAATACTATCAGGTCATT 
+GAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGATATCGCTCCGACTTTC +CGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGATGCCGCGAAAATGGTG +CAGGCGAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCCTGCGTCATTAAAATG +TTACGTAGCCCACACGCTCACGCACTGATTACTCATCTGGATGTCAGCAAAGCTGAAGCC +TTACCGGGCGTCGTTCACGTTATTACTCACCTGAATTGCCCGGATATTTACTATACCCCG +GGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGACCGCCGAATGTTCGGCAAGAAAATG +CGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAAGACATTGCGCTCGAA +GCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTAATGTCGATTGACGAG +GCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTGTATGTTGCTGGTGCG +CCAGATACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGCGAGCATATGATCATC +AACTTCCCGATCGGTTCTCGCCCACGCAAAAATATCGCTGCCAGTATTCATGGTCATATT +GGCGATATGGACAAAGGCTTTGCCGATGCCGATGTGATCATTGAGCGAACCTATAACTCA +ACGCAGGCGCAGCAGTGCCCGACTGAAACACATATCTGCTTTACCCGTATGGACGGCGAT +CGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGCCGCCAGGTCGCGCGC +CTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGTGTAGGCGGCGGTTTT +GGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCAACCTGCGTGACCGGG +CGTCCGGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCTAACACCTCTCGTCAC +GTCGCGAAAGTCACCGTCAAACTGGGCGCGAAAAAAGATGGTCGCCTGACGGCAGTGAAG +ATGGATTTCCGCGCCAACACGGGTCCTTACGGTAACCACTCACTCACCGTACCGTGTAAC +GGACCGGCGCTGTCGCTGCCGTTATATCCATGCGATAACGTCGATTTTCAGGTCACCACC +TACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGCGCGCCGAAAGGTAAC +TTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAGATCGACCAACTGGAA +ATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATTCTCGGTGCGATTGGT +GAAGGTAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCACTGGAAGAGATCCTG +CGTCAGGGTCGCGAGATGATCCAATGGTCTTCACCAAAACCACAAAACGGTGACTGGCAC +ATCGGTCGTGGCGTCGCCATTATCATGCAGAAATCGGGTATCCCGGATATCGATCAGGCT +AACTGCATGATCAAACTGGAATCAGACGGTACCTTTATCGTTCATTCTGGCGGTGCGGAT +ATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAAGTGCTGCACTGCCCC +CCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTGTTTGATAAAGGCGCA +TATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTGGCAGCGGAAAATCTG +CGGGAGAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCAGTGGCAGATGTTCAA +CTAGCAACGCCGGGCGTCGTTCGCGGCAAGAAAGGCGAAGTTAGTTTCGGAGAGATAGCC 
+CATAAAGGCGAAACCGGCACCGGCTTTGGTTCACTGGTGGGAACTGGCAGTTATATCACG +CCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGCTGAAGTTGCCGTCAACACGCGTACG +GGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGTACACCGGTCAATCCA +GAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATCGGCCACAGTATGAGC +GAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGATTTACGCAGTTACGGC +GCACCGAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTGGTGCCGAGCGACGAT +AAAGTCGGCCCATTCGGGGCGAAATCGATCTCGGAAATCGGTGTAAATGGCGCCGCTCCG +GCGATTGCTACCGCAATTCACGATGCCTGCGGCATCTGGTTACGCGAATGGCATTTCACA +CCGGAGAAAATACTCACCGCGCTGGAAAAAATATAAGTAATAAATGGCCGCTTCGGCGGC +CTGTTTCTCTGTTTGAACGATGACTAAATAGTGACTGCGAAAATGAGATAAGCCGTTCTC +AAGGCGTCCTGCGCCCCAAATTCGTGGGAATTTATTTTACTAATTCAGATGATCAAATTT +ACTTTAAAAGGAGTGAAGGGATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTG +AACTGGAGGATCGCCCTCCCTTTCATCAGGCTCTCGTAGGTGCCATTACCCATCTGTTGG +CAATTTTCGTTCCGATGGTAACCCCCGCGTTAATCGTGGGTGCGGCCTTACAGCTTTCCG +CTGAAACAACTGCCTATCTTGTTTCTATGGCGATGATCGCCTCTGGTATTGGTACCTGGT +TACAAGTAAACCGCTACGGCATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATT +TTTCATTTGTTACGGTCATGATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACG +AAGAGTTAATCATGTCGTCGCTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCG +GCTCTTCTTTTATCCTGCCCTATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTG +TGGTGCTGATGATCGGCTTAAGCCTGATTAAAGTTGGCATTATTGATTTTGGCGGTGGTT +TTGCAGCTAAAAGCAGCGGTACGTTCGGCAATTACGAGCATCTCGGCGTTGGCTTATTGG +TTTTGATTGTGGTGATCGGCTTTAACTGCTGCAGCAGTCCGTTGCTACGCATGGGTGGGA +TCGCCATTGGGCTATGTGTCGGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCA +GCAGTGTGCGCAATTTGCCGTTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTT +TTAGCTTCCATCAGTTCCTGGTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTG +TCGGCGATATCACCGCCACGGCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATC +AGTCCCGACTGAAAGGCGGCGTGCTGGCAGATGGTCTGGTTTCTGTTATCGCCTCCGCTG +TCGGTTCATTACCATTAACCACGTTTGCGCAAAATAATGGGGTTATTCAGATGACTGGCG +TCGCTTCACGTTATGTCGGGCGAACCATCGCGGTAATGCTGGTTATCCTCGGCTTATTTC +CGATGATTGGCGGCTTCTTCACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGT +TGATGTTTTCCATGATTGCCATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGC +GCCGAGAAACACTTATTGTCGCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATC 
+CCGAAATTTTTAAAATATTGCCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTG +CTGGCGGGTTAACTGCGATTTTATTAAATATTATCCTCCCTGGTGGCTACCGACAGGAAA +ACGTTCTGCCTGGTATTACCTCAGCGGAAGAGATGGATTAACAGTAAAGGAGTCAATGAT +GTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACGGT +CGATAACCCGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTCAT +TAAACAGGGAAAAGTGGAATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCTGA +CACCATTCGCGTGCGCGACTATCGCGGCAAACTGATAGTACCGGGCTTTGTCGATACACA +TATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATGGTGAACAATTGCTGGAGTGGTT +GAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTACGCCCGCGAGAT +GTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTTGG +CACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATGCG +TATGATTGCCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACTGC +CGAAAGCAGCTATCACCAAAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGTCT +GTTGTATGCGATTACGCCACGCTTCGCCCCTACCTCATCTCCTGAACAGATGGCGATGGC +GCAACGCCTGAAAGAAGAATATCCGGATACATGGGTACATACCCATCTCTGTGAAAACAA +AGATGAAATTGCCTGGGTGAAATTGCTTTATCCTGACCATGATGGTTATCTTGATGTTTA +CCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAAGA +AAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCCAA +CCTTTACCTCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAAGT +GGGCATGGGAACAGATATCGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAACGA +AGCCTACAAGGTATTGCAATTACAAGGCTATCGCCTCTCGGCATATGAAGCGTTTTACCT +GGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACGATTTGATTGGCAACTTTTTACC +TGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCTACAGCAGCTGCG +CTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGATGA +CCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAATAATA +AAACTTTAACATCCTCGTGAGGACATCATTATGTCTGGAGACATCCTACAAACACCGGAC +GCACCAAAGCCACAGGGCGCGCTGGATAATTATTTTAAAATTACCGCTCGTGGCAGTACC +GTTCGTCAGGAAGTACTGGCTGGCTTAACGACCTTTCTGGCCATGGTTTATTCCGTTATC +GTCGTTCCGGGAATGCTGGGCAAAGCAGGTTTTCCTCCCGCAGCTGTGTTTGTTGCCACC +TGTCTGGTCGCGGGCTTCGGCTCGTTGCTGATGGGGTTATGGGCCAATTTGCCAATGGCG +ATTGGTTGCGCTATTTCCTTGACGGCGTTTACCGCATTCAGTCTGGTACTCGGGCAACAA +ATTAGCGTTCCTGTCGCACTGGGCGCAGTCTTTCTGATGGGCGTCATCTTCACCGCTATT 
+TCCGTAACCGGTGTGCGTACCTGGATCTTACGTAATTTGCCGATGGGGATCGCTCACGGT +ACAGGTATCGGTATCGGCCTGTTTCTGCTGCTGATTGCTGCTAACGGTGTGGGAATGGTT +ATCAAAAACCCGATTGAAGGCTTGCCAGTGGCGCTCGGTGCGTTTACCTCCTTCCCGGTG +ATGATGAGCTTACTGGGGCTGGCGGTCATCTTCGGTCTGGAAAAGTGCCGCGTACCCGGC +GGGATCTTGTTGGTGATTATTGCAATTTCGATCATCGGCTTAATCTTTGACCCAGCGGTG +AAGTACCACGGTCTGGTGGCAATGCCAAGCCTGACTGGCGAAGATGGTAAGTCTCTGATT +TTCAGCCTCGATATTATGGGCGCACTCCAGCCAACTGTACTTCCGAGTGTACTGGCATTG +GTGATGACCGCAGTGTTCGACGCCACTGGCACCATCCGTGCCGTCGCCGGTCAGGCGAAT +TTGTTGGATAAAGACAACCAGATCATCAACGGCGGCAAAGCCCTGACCAGTGACTCAGTA +AGTTCAATATTCTCCGGCCTGGTGGGCGCAGCGCCCGCGGCGGTTTATATCGAATCAGCG +GCAGGAACCGCCGCCGGGGGGAAAACCGGTTTAACCGCAACCGTGGTTGGTGTGTTGTTC +CTGATGATTCTGTTTTTATCACCGTTATCGTTTCTGATCCCCGGTTATGCCACAGCTCCC +GCACTGATGTACGTGGGTTTGCTGATGTTAAGCAACGTCTCGAAGCTGGATTTCAACGAT +TTTATTGACGCAATGGCTGGCCTGGTGTGTGCCGTGTTCATCGTTCTGACTTGTAATATC +GTTACCGGTATTATGCTGGGCTTTGTAACACTGGTGGTGGGTCGCGTCTTTGCGCGCGAA +TGGCAAAAGCTGAATATTGGTACGGTGATCATTACTGCCGCACTGGTCGCGTTTTACGCG +GGTGGTTGGGCAATCTAATAGATTCTCCGCGCCTTTCCGCGCGGAGATTTCTTTCAGAGA +GGATTCTCACTGCTGGCAGCAATACGCTGCTGGCGGATACGCCTGAGTTCTCTTTCAGTC +AGCAACTGCAGCGCCTGTGTCGGGCAAGATTCAACGCAGGCTGGCCCCTCTTCCCGCAGT +TCACAGAGATCGCATTTCACGATTTGTTGCCGGGGATCACCCGGCAATGACTGAATGGTG +ATCATCCCAAACGGGCACGCGCTAACGCAACTCTGACAGCCAATACAACGGGCAGAATTG +GCCTGCACCACCTGCTCGCCCATCGTCAGCGCCCCCACGGGGCAAGCGCCAACACAAGGG +GCGTTTTCACACTGATGGCACATCACCGGCGCACTGATGCTATCCAGCCGTTGTACCTTC +AGCCGGGGTAAAAAGATATCGGCATTCAACTCCTGTTCTGAAGGGTGAGCGACCACACAG +GCCACTTCACAAGTACGGCAGCCAATACAGTCAGCCGGATTAACGATAATTAACGATTTC +ATCACGATGCCTTCGTATCAAACAGAGTTAACATATCGCGCGCCGCCTGCCTTCCTGCGG +CCATTGCAGTGACAACCAGATCCGCGCCATGAACTGCATCACCACCAGCAAAGACTTTTT +TCAGATGCGTCTGGGTAGGTAAATACCCGACGTCGCCGGTTTGAATCAGGCCCCATTTAT +CGAGTTTAATTCCGCTGCCCTGCAACCACGGCATGGTATGTGCCTGGAAACCAAAGGCCA +TAATGAGAACATCGGCGGGCAATTCAAACTCTGAACCCGCAACCGGACGAGGACGACGGC +GACCATCCGGCCCCGGCTCACCCATAGCGGTACGAATCAGGCCCACCGCCGTTAAGCGTC +CATCTTCATCACAAGCGATATATTGCGGCTGAACATTGAACTGAAACTCAACACCTTCCT 
+CGCGGGCATTGACCACCTCTTTGCGCGAACCCGGCATACTGACTTCATCACGACGATACG +CACAGGTCACGCTGGCAGCATTAAGGCGGATGGAAGTCCGCAAACAATCCATTGTCGTAT +CGCCACCGCCCAATACCACGACTCGCTTCCCTTCCACATCCGTCAGCGGATACTCTGCAG +ACTCCGGCAATCCCATGAGCTGGCGGGTATGGGCGGTCAGGAACGGTAACGCCTGAATGA +CACCAGGCGCATCTTCATGCGGCAGATCTGCTCGCATCATCCCGTAAGTCCCCACGCCGA +GGAAAACAGCATCATATTCCGCCGTTAATTCGTTGAAAGAGATATCGCGGCCAATTTCAC +AGTTGAGATGGAAATCGATTCCCATTGCGGTGAATATCTCTCGCCGCTGGCTTAATACCG +TTTTATCGAGTTTGAAAGGAGGAATGCCAAAAGTCAGCATACCGCCAATTTCTGGATGGC +GATCAAAGACATCAACCTGAACTCCCGCGCGCGCCAGAATATCAGCACACCCTAATCCTG +CAGGTCCAGCGCCAATCACCGCCACTTTTTCGCTACGGGGAACAACTTTGCTGACATCGG +GACGCCAGCCCATCGCCAGCGCAGTATCGGTGATGTAGCGTTCCAGATTACCGATAGAGA +CTGCGCCAGAGTGATCTTTCAAAGTACATGCACCTTCACAAAGACGGTCCTGTGGACATA +CCCTGCCGCAGATTTCGGGTAAGGAACTGGTCTGGTGGCAAAGTTCTGCCGCTTCAATAA +TCTTTCCTTCCTGTACCAGACGGATGTAATCCGGAATAGCGTTATGCAGCGGACAATGCC +AGTTGCAGTTAGCTTTTTCGGCACAATAAACACAGCGGTCACTCTCATAAGTCGCTTGTT +GTGGATCCAGCCCGCAATAGATTTCGCCAAAGTGGGTTTTCCGTTCACTCGCTGAAATTT +TATCTGCGCCTTTACGCGAGTTAACGGGGAGCAACGCTGCACTGCGAGATGGCTGAGCGT +CTGATGACGCTTTTCCTGCTGCCGTTTTGCGCTGGCGGGCCACCTTTATCTGCTGCAACC +CTTTATCGTCCATCAGCCGTAACGCCTGTGTTGGGCAGACGTCAATACAGGCTTGCGTGC +CGGAACTGCGCTGGTTACAAAGGTCGCATTTCTGTGCAATCGTATCGACCATCTCAACGA +CGCCAAAGGGGCAAGCGATTGCGCATCTTTTACAACCAATACATTTTTGCTCGTCCAGTT +GTACGCTATCGGACTGGAAAGTCAGAGCATTAACCGGACAAGCCGTAACGCAAGGGGCAT +TGTTGCAGTGATGGCAGGCCACCGGATTCGCAGCCTGGCCTTTCCCTACAACGTGGATAC +GCGGTCGAAAGTCACTGTGACTCAGCGGCCAGTTTTCTTGATTATGTGCCACCGCACAGG +CAATTTCACAAGCATGGCAGCCTATACATTCCGCAGCTTCAGCAGCGATAAACTTATTCA +TTTGCATCCCTTTCATTTAATGAGTTATGTCTTCTCAAATTTCGCGATGCAATAAACGGG +CATATATTAGGTAGCATGACCGTTTTAATTATAATTTTGCAACTGAGTTCAAATTATTGC +CCCTCAATCTATGCCGCTTTCATTATTTCAACATTGCCGATCAAAAGAATGCTATCCAGA +TAAAAACGATTAAATGCGAGAGTGCGACATGCCAGAATGATTAATGAAATATCAATATGA +GAAAATTACAGATAATTCCATTGTCAGGTTCTCTTCTCATAATCGTGGTTTAACCACGAT +TATGTGATTGCCTCCGCAATTCCTGTCTCTAACTCCCCTTCCTCGCAAAAACTGGCACTC +CACGAGCATGTGTTTAGACAGTTTCATGAACATAAACGGTTGCTTTTTACTCTGGCGGGC 
+GAAAGGAGAAACACTGATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGA +CCGCCCAACTGATGAGGTTGACCGCATATTATCACCAGGAAAGCTGATCATACTCGGTCT +GCAACACGTCCTTGTCATGTACGCAGGTGCAGTCGCTGTTCCTCTTATGATTGGTGACCG +ACTCGGCCTATCAAAAGAAGCTATTGCGATGCTCATCAGCTCGGATCTCTTTTGCTGCGG +GATCGTCACATTATTGCAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGCCGGT +GATTATGTCGGTGACCTTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGA +TATCGGCCTGCTGGGGATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATT +AGCGCCACTTATCGGTCGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGAT +TACTTCTATCGGGCTTAGCATCATTCAGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGG +GAATCCGCAATATGGTAATCCCGTTTATTTAGGTATCTCCTTTGCCGTCTTAATTTTTAT +CTTGCTCATTACTCGCTATGCGAAAGGATTTATGTCCAACGTCGCCGTATTACTGGGGAT +TGTATTTGGCTTTTTACTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTACATGA +TGCTTCATGGTTTGCGATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGT +TTCCATTCTGACCATGACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTT +CCTGGCACTGGGTGAAATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTT +ACGCGTAGATGGGGTTGGGACAATGATTGGAGGCACGTTTAACAGCTTCCCACATACGTC +ATTTTCGCAGAACGTCGGGCTGGTCAGCGTGACGCGCGTCCACAGCCGCTGGGTGTGCAT +TGCTTCCGGTATCATTTTGATCCTGTTCGGCATGGTGCCCAAAATGGCGGTGCTGGTGGC +CTCGATTCCGCAATTTGTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTACTGGC +GACAGGGATTCGAATTCTGTCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATAT +TGTGGCGATCAGTCTCGGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAA +GTTACCGGCCGTACTGCAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGC +CGTTGTGCTGAACGTCTTCTTTAATGGCTACCAGCATCATGCTGACCTGGTGAAGGAATC +CGTCTCTGATAAAGATTTAAAAGTCAGGACAGTACGTATGTGGCTTCTGATGCGCAAGCT +GAAGAAAAATGAGCATGGAGAATAATATGAATCTTTTAATGCGCGCTATATTCAGTCTGC +TGTTGCTTTTTACTCTCTCTATTCCTGTCATTTCTGATTGTGTTGCAATGGCCATTGAAA +GTCGCTTCAAATATATGATGCTGCTTTTTTAAATGGTTTTTACCTGTCGACATCCGCTCA +AAACGGGCGGTTGTCGATAAACGCTCACTTGGTTAATCATTTCACTCTTCTATTATCTAT +AATGATGAGTGATCAGAATTACATGTGAGAAATTATGCAAACGGAACACGTCATTTTATT +GAATGCACAGGGAGTTCCCACGGGTACGCTGGAAAAGTATGCCGCACACACGGCAGACAC +CCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTTAATGCCAAAGGGCAATTATTAGTTAC +CCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGCGTGTGGACTAACTCGGTTTGTGGGCA 
+CCCACAACCGGGAGAAAGCAACGAAGAGGCGGTGATCCGCCGTTGCCGTTATGAGCTTGG +CGTAGAAATTACGCCTCCTGAATCTATCTATCCTGACTTTCGCTACCGCGCCACCGATCC +GAATGGCATTGTGGAAAATGAAGTGTGTCCGGTATTTGCCGCACGCACGACCAGTGCGTT +ACAGATCAACGATGATGAAGTGATGGATTATCAATGGTGTGATTTAGCAGCGGTTTTACG +CGGTATTGATGCTACGCCGTGGGCGTTCAGTCCGTGGATGGTGATGCAGGCGACAAATCG +CGAAGCCAGAAAACGATTATCTGCATTTACCCAGCTTAAATAAAAAACCCCGACGGTTGC +CGGGGTTGTGAGCATAACGTAATGCTTATTTTACCGGACGCATCGCCGGGAACAGAATAA +CGTCGCGGATGGTATGGCTGTTGGTGAACAGCATTACCATACGGTCGATACCAATTCCCA +GACCGGCTGTCGGTGGTAAGCCATGTTCCAGTGCGGTGACATAATCTTCGTCGTAGAACA +TCGCTTCGTCGTCACCTGCATCTTTCGCGGCAACCTGATCCAGGAAGCGCTGCGCCTGAT +CTTCCGCGTCATTCAGCTCGCTAAAGCCGTTACCGATTTCACGCCCACCAATGAAGAACT +CAAAGCGGTCTGTGATTTCCGGGTTAACGTCGTTACGACGCGCCAGAGGAGAAACTTCTG +CCGGATATTCAGTAATGAAGGTCGGCTGGATCAGATGTGCTTCTGCCACTTCTTCGAAGA +TCTCGGTAACGATACGGCCCAGACCCCAGCTCTTCTCAACGTGGATGCCGATAGATTCAG +CAATCGCTTTCGCAGAGTCGAAGTTGTCCAGATCTGCCATGTCGGTTTCCGGGCGATATT +TCTTGATCGCTTCACGCATGGTCAGTTTTTCGAACGGCTTACCGAAGTCCAGCGTTACGT +CGCCGTAGGTCACTTCCGTCTTACCGAGAATATCCTGTGCCAGAGTACGGAACAGCGATT +CGGTCAGCTCGATCAGATCTTTGTAATCTGCGTAAGCCATATAGAGTTCCATCATGGTGA +ACTCTGGGTTATGACGTACGGAAATACCTTCGTTACGGAAGTTACGGTTGATTTCGAATA +CACGCTCGAAGCCACCGACCACCAGACGCTTGAGGTACAGTTCCGGCGCGATACGCAGGT +ACATGTCGAGATCCAGCGCGTTATGGTGGGTGATGAACGGACGCGCAGCGGCACCGCCAG +GGATCACCTGCATCATCGGCGTTTCAACTTCCATAAAGCCGCGATTCACCATGAACTGGC +GAATACCAGAGAGGATCTGCGAGCGCACTTTAAAGGTGTTGCGGGATTCATCGTTAGAGA +TGAGATCCAGATAACGCTGACGATAGCGCGCTTCCTGATCCTGCAAGCCGTGGAATTTAT +CCGGCAGCGGACGCAGTGCTTTGGTCAGCAGACGCAGCTCGGTACAGTGGATAGACAGTT +CGCCGGTTTTGGTTTTGAACAGTTTACCTTTCGCGCCGAGGATATCGCCGAGGTCCCATT +TTTTGAACTGCTCGTTGTAAACGCCTTCCGGCAGATCGTCACGGGCAACGTACAACTGAA +TGCGACCGCCAACGTCCTGCAGGGTAACGAAAGACGCTTTACCCATAATACGACGGGTCA +TCATGCGGCCAGCAACGGCGACTTCGATGTTCAGCGCTTCCAGTTCTTCGTTCTCTTTAC +CGTCGAATTCTGCGTGCAATTGGTCAGAGGTATGATCGCGACGGAAATCGTTCGGGAAGG +CAATCCCCTGCTCACGCAGGTTCGCCAGCTTCTCACGACGCGTTTTCAGTTCATTGTTAA +GATCGACTACCGCGTCAGCGCCCTGTGCGTGTTGTTCAGACATGTTGGTTCCTCATAACC 
+CTGCTTTCAAACTTGCTTCGATAAATTGATCCAGGCTGCCGTCCAGCACGGCCTGCGTGT +TGCGGGTTTCTACCCCGGTACGCAGATCTTTAATGCGGGAGTCATCAAGGACATAAGAAC +GAATCTGGCTGCCCCAGCCGATGTCGGATTTGTTATCTTCCATCGCCTGTTTCTCGGCAT +TTTTCTTCTGCATCTCCAGTTCATAAAGCTTCGCTTTCATCTGCTTCATGGCCTGGTCTT +TGTTCTTGTGCTGGGAACGGTCGTTCTGGCATTGGGTCACGATCCCGGTTGGGATGTGAG +TAATACGCACCGCAGATTCGGTACGGTTAACGTGCTGACCGCCCGCGCCGGATGCGCGAT +AAACGTCGATGCGCAGATCCGCCGGATTGATTTCGATATCGATATCATCATCAACTTCCG +GGTAAACAAACGCGGAGCTGAACGACGTGTGGCGACGACCACCGGAGTCAAACGGGCTCT +TACGCACCAGGCGGTGAACGCCGGTTTCTGTACGCAGCCAGCCATAAGCGTAATCGCCGG +AGATTTTGATCGTCACGGATTTAATACCCGCCACTTCACCTTCCGACTCTTCGATGATTT +CAGTTTTGAAACCACGCGATTCAGCCCAGCGCAGATACATACGCTCAAGCATGCTCGCCC +AGTCCTGTGCTTCCGTACCGCCAGACCCCGCCTGAATATCGAGGTAGCAGTCGGCGCTGT +CATATTCGCCAGAGAACATACGGCGGAACTCAAGCTGCGCCAGTTTTTCTTCCAGGGCGT +CGAGTTCAGCAACGGCTTCGTTAAAGGTTTCTTCGTCGTCAGCTTCTACAGCCAGTTCCA +GCAGACCAGAAACATCTTCCAGCCCCTGTTTCATTTGGTCGAGGGTGTCGACAACGGCTT +CGAGGGAGGAACGCTCTTTACCCAGCGCCTGTGCGCGTTCGGGTTCGTTCCAGACATCCG +GCTGTTCCAGCTCGGCGTTTACTTCTTCCAGACGCTCTTTCTTGGCGTCATAGTCAAAGA +TACCCCCTAAGAACGTCGGAGCGTTCCGTGAGGTCCTGAATGCGATTATTTACCGGATTA +ATTTCAAACATGGTCTGATTTCTTTTATTGAGCTAGTCAAAATGCGGTGATTAGAGCGGG +ATTGTACCCAATCCACGCTCTTTTTTATAGAGAAGATGACGCTAAATTGGCCAGATATTG +TCGATGATAATTTGCAGGCTGCGGTTGCCGCGAAACTCGTTGATATCGAGCTTGTAAGCC +AGTTGCACTTCGCGCACGCCGTTATCCGGCCAGAGGGCGGTATCGACATTAAAAGCAATA +CCATCCAGCAGCGGACCGCCGCCGACCGGCTCGACCATGACTTTCAAATGACGCTCGCCC +ACCAGCCGCTGTTGCAGCAGACGGAAATGACCGTCAAACAACGGTTCCGGGAACATTTGT +CCCCACGGGCCAGCATCACGCAGCAGTTGCGCCACTTCCATGGTCATCTCTGCCGCACTT +AATGGGCCGTCTGATACCACTTCCCCTTGCAATAAAGAAGGATCTAACCACTCGGTAACC +AGTTCGCCAAAGCGTTGCTGAAAGAGTTCGAATTTCTCCTCTTCCAGCGACAAACCCGCC +GCCATCGCATGGCCGCCAAACTTGAGCATCATGCCGGGGTAAAGCGTGTCTAGCCGCTCC +AGCGCATCGCGCATATGCAGCCCCTGAATGGAGCGACCGGAACCTTTCAGCGTACCGTCG +CCCGCAGGCGCAAAGGCGATAACCGGACGGTGAAAACGCTCTTTGATACGCGATGCCAGA +ATGCCAACAACGCCCTGATGCCATTCAGGGTGATACATTGCCAGCCCACCTGGCAGCGTG +TCGCGGCTACGTTCCAGCTTCTCGCACAGAGTGAGCGCTTCAACCTGCATTCCCTGTTCG 
+ATCTCTTTACGTGTTTGGTTTAGTGCATCGAGTTCATTCGCCAGCACACGCGCTTCGCCA +ATGTTGTCACACAACAACAGCGCCACGCCAACGGACATATCGTCCAGTCGCCCGGCAGCA +TTGAGACGTGGCCCCAGCGCAAAACCTAAATCGCTGGCGGCGAGTTTTTGTGGATCGCGA +TTGGCCACTTCCAGCAGCGCTTTAATCCCCGGACGGCACTTTCCGGCACGGATGCGACTC +ATCCCCTGCCAGGTCAGAATGCGATTATTAGCGTCCAGCGGCACGACGTCCGCCACTGTC +CCCAACGCTACCAGATCCAGCAGTTCTGCCAGATTAGGAATTGCGATGCCGCGCTCATCA +AACCAGCCCTGATCGCGCAAAAAGGTGCGCAGCGCCAGCATCAGATAAAACGCCACACCC +ACGCCTGCCAGTGATTTCGACGGGAAATTACAGTCGCGCAAGTTAGGGTTAATGATCGCT +TCCGCTGCGGGTAATGTGTCGCCTGGCAAATGGTGATCGGTAACAATAACCGGAATGCCC +AACGAACGAGCGTGTTCAACCCCCGCATGGGAGGAAATACCGTTATCCACCGTGACAATT +AACTGCGCGCCACGGGCATGAGCCTGATCGACTACTTCCGGGCTTAAGCCGTAACCGTCT +TCGAAACGGTTTGGAACCAGGTAGTCGATATTGCTGCAACCAAGCGAGCGCATCGCCAGC +ACGCTTAGAGCCGTGCTGGTCGCACCGTCGGCGTCGAAATCACCGACCACAATAATCCGC +GTTCCTTCGCGAAAAGCGTTGTAAAGGATCTCAACGGCCTTTTCGACGCCGCTCAGTTGC +TGCCAGGGCAGCATGCCTTTAACACTGCGTTCCAGTTCCTGCGCGCTACGCACACCCCGG +CTGGCATATAAACGGCGCAGCAAGGGAGGCAATTCAGCGGGCAAGTCGGCCGTTTCATCG +ACTTCTCGGCGACGAAGTTGTATCTGTTGTTTCACGCGAATTATTTACCGCTGGTCATTT +TTTGGTGTTCGTCGAGGAATTCTTTCATGTCTTTCGGCGGCTGGTAACCCGGAACAAGTG +TGCCATTGCTCAGCACAACTGCCGGAGTACCGCTAACGCCAAGCTGGACGCCAAGTGCGT +AATGGTCGGCAATATCCACGTCGCAGCTGGCTGGTGCGACGCTTTTACCTGCCATCACAT +CATCAAACGCTTTGTTTTTATCTTTCGCACACCAGATAGCTTTCATTTCTTTCTCTGCAT +CGCTGTCCAGCCCCTGGCGCGGGAAAGCAAGATAACGCACGGTGATCCCCAGCGCGTTAT +AGTCTGCCATTTGCTCATGCAGTTTGTGGCAGTAACCACAGGTAATATCAGTAAACACGG +TGATGACGTGTTTTTCCTGCGGCGCTTTATAAACGATCATCTCTTTTTCAAGCGCATTCA +ACTGCTTTAACAGCATCTTATTGGTGACATTGACCGGAGCCGTGCCACTAACGTCATACA +TTGGCCCCTGAATGATATGTTTACCATCATCGGTGATGTACAACACACCGCTGTTAGTCA +GAACTGTCTTCATGCCAGCTACGGGCGCGGGCTGAATATCGCTGCTTTTGATGCCCATTT +TGGCTAACGTTTGTTGAATTGCCGCGTCATCAGCCTGAACAAAGCCTGAAAACGCTGCCA +ACAAGGTAAATAACATAAAACCTTTCTTCATAAATTTTCCTGTTCTTTTCAGACATCACG +CCCGCGGGTGATGCTGTTGATGAAGTTGTCGCAGACGCTCGGTAGCGACATGCGTATAAA +TTTGCGTGGTGGAGAGATCGCTGTGGCCCAGTAGCATCTGCACCACGCGTAAATCCGCAC +CATGATTTAATAAGTGAGTGGCAAAAGCGTGACGCAACACATGCGGTGACAGCTTTTCGC 
+TGTCGATACCCGCCAGCACGGCATAATGTTTAATGCGGTGCCAGAAGGTCTGTCGCGTCA +TCTGCTGCGCACGCTGGCTGGGAAACAACACGTCAATTGACACACCATTCAACAGCCACG +GACGCCCATGTTCCAGATAGGTTTCCAGCCAGTAAACCGCCTCTTCACCTAACGGCACCA +GGCGCTCTTTGTTGCCTTTACCAATGACCCGCACCACGCCCTGACGCAGGCTGATATCAC +TCATTGTCAGCCCGACCAGTTCAGAGACACGCAGTCCGGTAGCATACAACACTTCAAGCA +TGGCTTTATCGCGTAGCTCCAGTGGCTGATCAATTAATGGTGCCTGTAATAAACGTTCGA +CCTGCGCTTCGCTTAAATCTTTTGGCAAACGCTGGGGCAATTTCGGTGAAGCGAGATGCG +CACTGGGATCATCTTCACGAAACTTTTCGCGATAAAGATACTGGAACAATCGGCGCACTG +CACTCAGCAAACGCGCTGAGCTGGTGGCTTTATACCCGCCCTCCAGCCGTTCTGCCAGTA +ATGCCTGCAAATCGTCACTTTGCGCCGTCGCCAGCGTCAACCCGCGGTGATGCAACCACT +CCACCATCATTGACAGATCGCGACGGTAAGCGTTCAACGTATTTTCAGCCAGATTTTTTT +CCAGCCACAGAGCATCAAGAAACTGCTCGATGCGTGCCAGATCCTGTTTCACTTGCGCCC +CTTATGGTCACTCATTTGATCCATTATGCCTTATTGTGCCGTGACTAAAGCGATTCTGAT +ACACTAGCCGCAAAAGCCACAGCAGAATCGAGAAGCTTACGTTATGAATATGGGTCTTTT +TTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAAATCCGCGATATTATCGG +CCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCGAAATTAATGGAGCAGTA +CGATGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAAATCCAGGAAGACTGGGA +AGCCGTCTGGGATCAGCTCGACGACCTGAACCTCGAAGGTAAAATTGTTGCGCTGTATGG +GCTTGGCGATCAACTGGGATACGGCGAGTGGTTCCTCGATGCGCTCGGTATGCTGCATGA +CAAACTCTCGACCAAAGGCGTGAAGTTCGTCGGCTACTGGCCAACGGAAGGATATGAATT +TACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTGGGTCTGGCGCTGGATGA +AACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGGTGCGAGCAAATCCTCAA +CGAAATGGCAGAGCATTACGCCTGATGTCACTGACGGCTTAGCACATATGCTTTGCCGTC +ATCTTTATCTTTGCGTCTCTTGTTGTAACAATATCCGCCGTAAATCCCGCCATTCGGCTT +CGTCCATGCTGTCAGCTGCCAGCCATAAATGTTGCCGTTTTCCGCTGTCAGAACGTAAAC +GCAGCATCATGCCGCTCTTAATCATCCACGGCGCTTTGACGATGCTCCACTCCTGCCCTT +GCCAACGCAAACGCCCGTCCATCAACAAGCGAATTTCCCCCTGGCGAGCATTAATGCGCC +GCTGGCTGCGAACGCAATCAAACACCACCAGCGAAAGTAACACCATCCATAACGGGGTGT +AACTGAGCGGCCAGGGCATGAGTAAAATAACAGCGGCAACCAGCCCATGAATCAGCAAGG +AAAGCCACTGTGCGCGCCAGGAGACGCGCAAATCAGATTGCCACAGGACCACGTTCCCGG +TTCCGTGTCTGGATGAGTCGGACCATCATTTCCAGTTCTGCATCGGCTGGTTTACCGTGA +TTCATCAGCCAGTTAAACAGGTCCGGATCGTCACATTCCAGCAGACGAATAAAGATGCGT 
+TTTTCGTCATCGCTTAAGCTGTCGTACTCATGTTCGAAAAACGGCATGATTGAAATATCG +AGTTCGCGCATACCACGGCGGCATGCCCAATGAATGCGGGCTTTGTTGTTAATGTCCATC +TTCTTCCTGTCTCACGAAAATCCAGTACCCGGCTATTGTAACGTGTTTTTCGACTTCTTT +TACGGGAATATCAGTAAACACAATCGCGATCGCGAAATTAATTCACAACAATTCAAGGGC +TTCATTTTTTTGGAAGTCGCCTCGCAGAAGGCACAGATCGCGTAGTGAAAGCACTTGCAT +TGCCTCATAGCTCTTTTACCATTAGTTATTAATACGCCGTTAAGCAACTCAGGACTCTAT +TATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGAC +GCTGATGACGCTTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATA +TATGCAAGGCCAGGTGACAGCAGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGC +CGCCCATTGCGACGCCAAAGGTAAAATGTGGAGCAATTTACGTCTGTTCCGCGACGGCGA +TGGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCACAGCTGACTGAACTGAAAAA +ATATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCTGCTTGGTGT +TGCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGA +AAAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACG +TTTCCTGATCGTAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGA +AGCGGAACTGAACAATAGCCAACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGT +GATTGATGCCGCCAACAGCGGGCAGTTTATCCCCCAGGCGACCAACCTCCAGGCGCTGGG +CGGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGATGGTGGCGCGAGCAAAATT +CCGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCGACTGCCGGA +AGCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCT +GGCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATAT +GGAACCGGACAGCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACT +GCCATATTCGCTGGAAGAGTAAATCTCTGTATCGCATCAGGCATTTATCGCCTGATGCGA +CACTGGTGTGTCTTTTCAGGCCTACAAAGGCACGCCAATTACGCCTGCCCAATATACAAA +TAGATCGCCAGAAAGTGGCACACACTACCGCCGAGCACAAAGCCGTGCCAGATGGCATGA +TTGTATGGAATGCGCTTGCAGACGTAGAAAATCACCCCGAGCGAATAAACCACACCGCCT +ACCGCCAGTAAGGTAACGCTGCCCGCCGCGAGCTTAACTGCCATTTCATAAATTACCACC +AGCGACAGCCAGCCCATCGCCAGATAGGTCACCAGAGATAAAATTTTGAATCGGTGCGCG +ATGGTCAGTTTAAACAGAATACCCAGCAATGCCAGGCTCCAGATAACAATCATCAACCCG +CGCGCTAACGGAGAATCCAGCCCCACCAGCAAAAACGGCGTATAGGTTCCGGCAATCAAC +AGATAAATGGCACAGTGGTCAAATTTCTTCAGCCACATTTTTGCCCGTTGATGGGGAATG +GCGTGATAGAGCGTCGAAGCGAGGAACAGCAGGATCATACTGCCGCCATAGAGGCTGTAA 
+CTGGTTATCGCCGTGGCGCTGGCATTGAGATCCACCGCCTGAACCAGTAGCAACACCAGC +CCAACGATACCAAACACCAGCCCAATGCCGTGACTGACGCTGTTGGCAATTTCCTCTGCC +AGCGAATATCCCTGCTTAATGAGGGGCTTCTGAACCATAACTTACTCCGGAAAAACGTAC +ACGCACATGTATACCTCTCCAGCGTAACTGAGAATAGTTCCAGTGAACACCTGTTAGCTA +AAATAAATTCTGATTTGAGATTAATCTCCGAAAAATCATGAAATTAAATGCGAAATTTCA +ACTAACAGGCGTGAGTTCAATTTAAAGACATTTAAATTCAATCACATAAAACTGTGTCTG +GTCGGGATAGATGTCGGCAATGACCTTTTTCAGTTCAGTCAGGGTCATATTTTCCTGCTC +TGCATGTTTTTCCGTCAGCGTATCCAGCGTTACGGTTGAGGTTGCGGTGACTTCAATCGT +GCAAAAATAACCGTCATCTTCAAAACGTCCGACACGAAGCACATCACCCGTTTTGAAGTG +CGATTCAGACTCGTCGCGGATGGTGATGGTTTTACGCCCAGCCAGAATGTCATCCTGGAA +ACGTTGAAAAAAAGTGATGTCGTTTGGCTGCATGGTAATATTTCCTGTAAGAATTGACTC +ATCTGGAGCCTATGATAGTGAAAAAACTCACCTTACCGAAAGATTTCTTATGGGGCGGCG +CAGTTGCCGCTCATCAGGTCGAAGGCGGCTGGAACAAAGGCGGCAAAGGGCCGAGCATTT +GTGACGTTTTGACCGGTGGCGCACACGGCGTGCCGCGCGAAATCACCAAAGAAGTTGTGC +CTGGCAAATACTATCCAAACCATGAAGCCGTTGATTTTTATGGTCACTACAAGGAGGACA +TCAAGCTATTTGCCGAAATGGGCTTCAAATGTTTTCGTACTTCCATCGCCTGGACGCGCA +TTTTTCCAAAAGGCGATGAAGCTCAGCCAAACGAAGAAGGGCTGAAGTTCTACGATGATA +TGATCGATGAACTGCTGAAATACAACATCGAACCGGTGATCACCCTCTCCCACTTTGAAA +TGCCGCTGCATCTGGTGCA +>test.0417.00002.0005 6009 +GCAATATGGTAGCTGGACCAACCGTAAAGTGGTTGATTTCTTTGTCCGTTTCGCGGAAGT +GGTATTTGAACGCTATAAGCATAAAGTCAAATACTGGATGACTTTCAACGAAATTAACAA +CCAGCGTAACTGGCGTGCACCGCTGTTCGGTTACTGCTGCTCCGGCGTGGTGTATACCGA +GCATGAAAACCCGGAAGAGACGATGTATCAGGTGCTGCATCACCAGTTTGTCGCCAGCGC +CCTGGCGGTGAAAGCCGCGCATCGCATCAACCCGGAGATGAAAGTCGGTTGTATGCTGGC +GATGGTGCCGCTCTATCCTTACTCCTGTAACCCGGACGATGTGATGTTTGCCCAGGAGTC +GATGCGCGAACGTTACGTCTTTACCGATGTGCAGTTGCGTGGCTATTACCCGTCCTATGT +GTTGAACGAGTGGGAACGCCGCGGATTTAACATCAAAATGGAAGACGGCGATCTGGATGT +ACTGCGCGAAGGCACCTGCGATTATCTCGGCTTCAGCTATTACATGACCAACGCGGTGAA +GGCCGAAGGTGGCACCGGCGATGCGATTTCTGGTTTCGAAGGCAGCGTACCGAATCCGTA +TGTTAAAGCGTCTGACTGGGGCTGGCAGATTGATCCGGTTGGTCTGCGCTACGCACTTTG +CGAGCTGTATGAGCGTTACCAGAAGCCGCTGTTTATTGTCGAAAACGGTTTTGGCGCTTA +CGACAAAGTGGAAGATGATGGCAGCATCAATGACGATTACCGCATTGATTACCTGCGTGC 
+CCATATTGAAGAGATGAAAAAAGCGGTGACTTACGATGGCGTGGACCTGATGGGCTACAC +GCCGTGGGGCTGCATCGACTGTGTGTCGTTCACCACCGGGCAGTACAGCAAACGCTACGG +CTTTATCTATGTGAATAAACATGACGACGGTACTGGCGATATGTCGCGTTCACGTAAGAA +GAGCTTTAACTGGTACAAAGAGGTGATTGCCAGCAACGGCGAGAATCTGTAATTAGCCGA +TGTGCCTGATGTGCTCCGCTCATCAGGCCTGGCACTCTTTTAATATATTGAGCTCGCAAT +ATTTTATATTACGCCTCAGCCGAAACACACAAAGCGCACTTTATTAACAAGCGAAAAAGG +CGCCGAAGCGCCTTTATAAGATAGTCGAATCAGTAAATTACTGGTATTCGCTAATCGGTA +CGCAGGAGCAGAACAGGTTACGGTCGCCGTAAACATCATCCAGACGTTTCACGGTCGGCC +AGTATTTGTCTGCCACACCTGCCGGGAATACTGCAACTTCACGGCTGTACGGATGCGCCC +ACTCGGCGACCAGTTCGCTTTGAATGTGCGGCGCATTCACCAGCGGGTTATCTTCCAGCG +GCCAGACACCGGCTTTCACCTGATCAATTTCTGCGCGGATAGCCAGCATCGCATCGATAA +AGCGATCCAGTTCCACTTTGCTTTCAGATTCAGTCGGTTCAACCATCAGCGTACCCGCCA +CCGGGAACGACATGGTCGGCGCGTGGAAACCGTAGTCGATCAGGCGCTTGGCAATATCCA +GCTCGCTGATGCCGGTTTCTTCTTTCAGCGGGCGAATATCGAGAATACATTCGTGCGCCA +CGCGACCGTCGCGACCGGTATACAGCACCGGGAAGGCATCCTGCAGACGGCTGGCAATAT +AGTTGGCGTTAAGAATTGCCACCTGGCTTGCTTTTTTCAGCCCTTCTGCGCCCATCATGC +GGATGTACATCCAGCTGATTGGCAGGATAGAGGCACTACCGAACGGTGCCGCAGAAACCG +CGCCCTGACGGGTTAACATGCCTTCGATTTGCACCACGCTATGACCCGGTACAAACGGAG +CCAGATGCGCTTTCACACCGATCGGTCCCATACCCGGACCACCACCGCCATGCGGAATGC +AGAAAGTTTTATGCAGGTTAAGGTGGGAAACGTCCGCACCAATAAAGCCCGGCGAGGTGA +TGCCAACCTGAGCGTTCATGTTCGCGCCATCAAGGTAAACCTGACCGCCGAACTGATGCA +CGACTTCACACACTTCACGGATCGTTTCTTCATACACGCCGTGGGTAGAAGGATAGGTCA +CCATGATACAGGAGAGGTTATCGCCCGCCTGTTCCGCTTTCGCGCGCAGATCAGTCAGAT +CGATGTTGCCGTTTTTATCACACGCCACAACCACCACCTGCATTCCTGCCATATGCGCGG +AAGCCGGGTTAGTGCCGTGCGCAGAAGCCGGGATCAGGCAGATATCGCGATGCCCTTCGT +TGCGGCTTTCATGATAATGACGAATCGCCAGCAGGCCCGCGTATTCGCCCTGTGCGCCAG +AGTTCGGCTGCATACAAACGGCGTCGTAACCGGTCAGTTTCACCAGCCAGTCAGCCAGCT +GCGCGATCATCTGCTGATAACCTTCAGCCTGTTCTGGCGGGCAAAACGGGTGCAGTTCGG +CAAATTCCGGCCAGGTGATCGGGATCATCTCGGCGGCGGCGTTCAGTTTCATGGTGCAGG +AACCCAGCGGGATCATCGCCTGATTCAGCGCCAGATCTTTACGCTCCAGCGAGTGCATAT +AGCGCATCATTTCGGTTTCGCTGTGGTAGCGATTAAACACCGGATGGGTGAGGATTTCGT +CGTCGCGCAGCATCGCAGCCTGAATAGAGCGACTGTCGTGAGCCACGTCTTTGTCCAGTG 
+TGTCGATGTCCAGCCCGTGGTTATCGCCCAACAGCACGCTGAAAAGCTGCATCACGTTTT +CGCGCGTGGTTGTTTCATCAAGGGTGATCCCAACCGCGTTCAGAATATCGCTACGCAGGT +TGATTTCAGCCGCTTCGGCACGCGCCAGCACGCCCGCTTTGTCGGCCACTTCCACACACA +AAGTATCGAAATAGTGCGCATGGCGCAGCTTCAGACCTTTTTGTTGCAGGCCCGCCGCCA +GGATATCGGTCAGACGGTGGATGCGATTAGCGATACGTTTCAGGCCAACCGGACCGTGAT +AAACGGCATACAGGCTGGCAATGTTTGCCAGCAGTACCTGGGAAGTACAAATGTTGGAGT +TCGCTTTCTCACGACGAATATGTTGCTCGCGAGTCTGCATCGCCATGCGCAGAGCGGTGT +TGCCAGCTGCATCTTTCGATACACCGATAATACGGCCCGGCATTGAGCGTTTGTATTCGT +CTTTCGCCGCAAAGAATGCCGCGTGTGGGCCACCATAGCCCATCGGTACGCCAAAGCGTT +GCGCCGAACCAAAAACAATATCCGCGCCCTGTTTACCTGGCGCAGTTAACAGCACCAGCG +CCATAATATCGGCGGCAACGCTGACCACAATTTTGCGTGATTTCAGTTCGCTAATAAGCG +CGGTGTAGTCGTGAATTTCACCAGTAGTGCCGACCTGCTGTAACAGCACGCCGAAAACGT +CCTGATGGTCGAGCACTTTTTGCGCGTCATCGACAATCACTTCAAAACCAAAGGTTTCGG +CACGAGTACGGACCACATCCAGCGTTTGCGGATGAACGTCAGAAGCAACAAAGAAGCGGT +TGGCATTTTTCAGTTTGCTGACGCGTTTCGCCATCGCCATTGCTTCGGCGGCAGCGGTGG +CTTCGTCAAGAAGAGAAGCAGAGGCCATATCCAGCCCGGTTAAATCCAGCGTTACCTGCT +GGAAGTTGAGCAGTGCTTCAAGGCGGCCCTGGGAGACTTCAGGTTGATACGGAGTATACG +CGGTATACCAGCCCGGATTTTCCAGCATGTTACGCAGGATAACCGGCGGTAGCTGCACGG +CGGTGTAACCCATGCCGATGTAAGACGTGAAGCGTTTATTGCGACTGGCAATAGCCTTGA +GTTCTGCCAGTGCGGCGTATTCGGTCGCCGGTGCGCCAACCTGCGGCGGAGTCGCAAGCT +GAATATCTTTCGGCACAATCTGGCCGGTCAGCGCGTTTAACGATTGTGCGCCAACGGCAT +TCAGCATTTCTTGCTGTTGCGCGGCGTCCGGTCCGATATGGCGTTCAATAAAAGCGCCGC +TGTTTTCAAGCTGGCTTAACGTCTGTGTCATGAGCGATGGTTCCTGAAACGTGCAGTGAA +TTGTGAACCTCTCTCCTTGCGAAGAGAGTGAGGGTGAGGCGTAAATTTCCTCACCCTGAT +CCTCTCCCGCAGAAGAGGAATAAAGCCGTTACTCGTCTTCTAACAATGCTTCGTATGCGG +TTGCATCCAGCAGTGATTCCAGTTCGCTTTCATCGCTGGCTTTGATTTTGAAAATCCAGC +CGCCTGCATACGGTTCGCTGTTCACCAGTTCCGGGAAATCGCTCAGTGCATCGTTTACCG +CCACGATTTCACCGCTTACTGGCGCATAAATGTCTGACGCCGCTTTTACCGATTCGGCAA +CCGCGCAGTCATCGCCCGCGCTAACCGTTGCGCCCACTTCCGGTAGGTCAATAAACACCA +TATCGCCTAACAGCTCCTGAGCGTGTTCGGTGATGCCAACGGTGTAAGTGCCGTCGGCTT +CTTTACGCAACCATTCGTGTTCTTTGCTGTATTTCAGTTCTGCTGGTATGTTGCTCATCA +ATCAATCTCCAAAAAAGTAAATCACGCGACGGCTTTGCCGTTACGCACAAAAACAGGTTT 
+CGTCACTTTAACCGGCATTTCACGGTTGCGAATTTGCACAATCGCCGTTTCACCAATACC +TTCCGGCACGCGCGCCAGCGCAATGCTATAACCCAGCGTTGGGGAGAAAGTACCGCTGGT +GATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACG +CAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTG +CGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCA +GCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCAT +GCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTC +CACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGC +TTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGG +TTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTG +CGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCC +GAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAAC +AACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCC +AGAGGCATTCAACATCCCCGAGTAAAGGGCTTTGCCGCTTTTGGTGAGCTTCGCCACATC +GTTCGCCAGCAGATAACGTAGAAACTCCCGGGTGCGGCTGCCGCGAAGATCGACGATGGT +CATATGTGACACATCAAACATTCCGGCATCGGTACGTACCGCATGATGTTCGTCGATTTG +CGAACCGTAATGCAGCGGCATCATCCAGCCGTGGAAATCCACCATGCGAGCGCCGCAAAG +CGTGTGTTGTTCGTACAAAGGAGTCTGTTGTGCCATCTTGTCCTCATTGAATAAGCGGGG +CTGACAACTTTTCCATGGCGAAATTATCACCACGAAACCCAGCATCGGAGCCACTCCCGG +TCCCCAACGCAATCGTTCTCTTTTGCCTGAACTTACCACCGAAACAGACTGTTAACCATA +AGGTAAAATTGATCATCACATTAGCTTATGGTTAAAAAACGCCAAAATCGTAACAGAATA +AAAAACCAAAAAATGAACAAATCTCTATATAAAGATAAATAGATGAGAAAGTTAATTTGA +ATAAGACAACATTAAGAACTAAAAAAATGTCAAAAAACACTAAATCAAAAATTCGTGGCA +TTAGAAAAT diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test_runprokka_H299.fna b/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test_runprokka_H299.fna new file mode 100644 index 0000000000000000000000000000000000000000..d3a4a1981ef3c007d131cf5d3b708a7a239ec122 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/Replicons/test_runprokka_H299.fna @@ -0,0 +1,223 @@ +>test_runprokka_H299.0001 3480 +AGCAGCACGCTTTTTAATCCGTCCACCGGACCTTCAACCGGCCCTTCGCTGATGGCATCG 
+ATCACACTCAGCAGCTGCGTGGACTTCAGGTTGTCCTTCGCTTCGCGCGGGGTATGCCCC +TTACTGCTGCCTTTACCCATTCGTCATGCTCCATAAACGATAAAACCGCCCGGAGGCGGT +TTCACATAAAACATTTTGCATCAGCGACCAATCACCACAACCTGACCACCATCCCCTTCG +TCTGCCGTGCTGATCTCCTGAGAAACCACGCGTGACCCCACGCGCATTTCACCGTACAGA +ACCGGCAGAACATTGCCCTGGGCAACCATGTTATCCAGTGAAGAAAAATAGGTATTCTGT +TTGCCGTTATCCGTTGTCTGTGTGCGGGGGGTTTTGGGTTTAGGGGCCAGCATCTGTGCA +ACACCGCCAAGCGTCATACTGGCACCGAGAGAAAACAGCAGATTACTCGCCATAATTCCT +ACCCCCGGCATCCATATAGCAACCGCCATAACAGCCGCCCCCAGCACAGCCTGAAACACA +CCGCCACTTTTGGCTCCTGCCAGACGCGGCACGATATGGATCACGGCACCATTTTCCAGC +GGCTCATTAAGACGGGCAGACAATTCGGTTTCACCTGCATCACGCCCGGCAATGCGTACC +TGGTACCAGCCGTCGCTCAGTTTCTGACGAAATGCCGGGATCTGCATGGCCAGCGCCCGG +ATGGCTTCGGACCCCGTTTTCACTCGAAGGTCGATGCGGCGGCCAAATCGTTGTAAATCC +CCGTAAAGGCAGATGCGTGCCATGCCCGGTGACGCCAGAGGGAGTGTGTGCGTCGCTGCC +ATTTGTCGGTGTACCTCTCTCGTTTGCTCAGTTGTTCAGGAATATGGTGCAGCAGCTCGC +TGTCACCACAGTAAATGGCGGCATGATTCGGCACCGATGAACCAAAACAGCACAGCAGCA +CATCGCCCGGCTGCGCCGCTGACAACGGCACCTGATACAGCCCTGTGGCCTCCAGATTAT +CCAGATAGAGATTCTGACCGTTACGCCACCAGTCATCCCCGCGATGAAAATCCGGCATCT +CAATTCCCGCCAGATGGTAAGCGTCCCGGAACAGCGTGTAACAGTCCGTTACCCCGTGCT +CAAAGCGCCGCCCGGTGAGATGCGGCACACAGCGGAATTTATGAATCGCCCCCCGGCAGA +CCAGCCACCACGGCAAATCACTCTGTACCTGCAGCCGCCGGTCGGCCTCACTCAGCCAGG +GCAGACCACCGGGGTGGCTGTGGACCAGCGCCACAATCTCTCTCTGCATTTCTGCACTCA +GCCAGTCCTCCGGCGACATCCGGAAATACTCCTCCGGCTCACTGGAGATATTCACGCAGG +GAAAATATCTTTCCTCCTCCGGCGTTCTCACCACGAAGCCGCACGACTCCGCTGGCGCAC +ATCGCCGGGCGTGCGCCAGAATCGCTGATTCTGTCTCTGTCATGGGATTTACTGCGAAAG +TTTGTTAATGGAAAGGAAGCTGCCAAAGTTGCCGACATTATTGCGAAACTTACAGCCACT +CAGGCATTTGCTGCATTTATCCTTCGTGATATCGGACGTCGGCTGGTCATATTCATCCGC +GACCGCCGGACCGCTATAACCGCACTCATCGCCGCGATAGGTCCAGGTGCAGGTGTTGGC +CAGCATGATACGTCCCGGAAAAACAGCGCCATCCGTTTCAGTCGGCGTGGACAGTACAAA +AGAGGCACTGACCGCGCTCAGTTCGCTGCACTGCTCGATGCGCCAGCGGCTGATCACCTC +CTGCTCCGGATCGGCTTCGCTGTTTCCGTTGACGAAGTTCACCGCATCCAGAAAGCGGGC +GTAAACCTTACGCCGGACCACCGTTCCGCCGACCAGACTCTGCAGATCTTCCGCCATCCC +GGTGATCATGCCGTGCAGGTTAGAGACCGTCAGTGTCGGACGGGCAGCACTGCCCTTGCC 
+GTTCATCTCAAATCCACTCCCCTGAATGGGATAGGCCTGATACTGCCGACTCTGCCAGGT +GACAGACTCACCTTTTTCGTTCTGCTCATTACAGAAAAAGTAGCGATCCCCGCCTACCTC +GGTCAGGTCGATTTCCCAGAGCACCACGCTGGCCGACTGCTCCGCACGAATGCATTCATT +CAGCGTTTCCTGTTGTATGTCCTGCATCAGATCACCACTTCGTCAAACTGACACGAAAAA +TCGGTATAGGTGATATGTTCTGTCGCTGACCACGTTCGACACACCACTCTGATTTTTCTG +TTAATACCCGGCGGGCGCCAAAAAAAAGATTTATAGCCTTCATGCCGGGCTAAAAATTTT +TCAAATGAATCACGTTCATTCGCCTCAACTTTGAAATCACAGGTGAAAACGCGCAGAGAA +TGATTAAGTCCATTTGGACTTCGTTGCTCATAACCATCGCCAAATCTTACAGTTTTTATC +GATGGTTTATTTTCTGTTTTCATTCCATCCTCTGGTAACCAGTGAAATTCTTCCGTATTA +GCCACTTAACATTCCCCCATCACGTCGCATATTTAACAGATTGCCCTGCACCCGCTGATC +AACCATCCCCATAAGTGCTTTTATTGCCTGAGGGCCAATCTCTCCATTCTGGCCGTCATT +TTGAATAGTGATTTGGTATACAGGGGCATAGGTAATATCTCCGCCTCCATTACCACTTTT +ACTATTAATAGCTCTGACACCAAGAGAACCATCGGAAGTTCGTGTTAATGGCATAATGGC +TTCCGGTCCAGCCTCACCAAAAACACCAGCCCCTTTTGCAAAAGCAAAAAATTGCGGGGA +ATCATAAATACCGTTCGAATACGTGCTCAATGACGGAGACTCATAAACACCGCCCTTTGC +ATTCGGAATAAATTTACTAATAGCACTCCCGATAGTTCCTAAAATCCCCCCAGAAGAACT +GTTACTAATGCTGTCGAAAATCCCAGTAATTGAAGCCTTTAATGCTATTCGACTAAGATC +CGAAATCACGGAAGTAGCGAAAGAACGAAAATTTGCCTTGCCTGTCGTGACAAAATCACC +CAGCGCATCGGTCATCCCATCAAACATCTGAGTCGTGGTTGATTTTATCTGCTCACTGAT +ATCCTTAGTGTCATCCAGCCAGTTATTGAATCCCTGGGAGGCACCACTAACCCAGTCTCC +TGCCTGAATATCGAGCTGCTCGTTTTTCTGTCTGACAATTTCTTTTTCCCGTTCCAGAGC +ATCATTCAGAGCCTGCATTTTCTCTTGAAAAACATGATCTGACATTCCACGGGATTTATC +TGCATAGTCACGTTCAAGTTGCAGACGCTGATTGTTATATCCATGTTCAATCCGCAGTAA +TTCCTGCTGGCGTTGCTGATTTTTATCGCCAACCCCATAACCAGCAATCTGAATATCATA +CCCCTGCTGACGATTATCAATCGAAGCCTGCAATGAATCACGCCATGCTGTTATTTCGGC +>test_runprokka_H299.0002 7080 +AGCAGCACGCTTTTTAATCCATCCACCGGACCTTCAACCGGCCCTTCGCTGATGGCATCG +ATCACACTCAGCAGCTGCGTGGACTTCAGGTTGTCCTTCGCTTCGCGCGGGGTATGCCCC +TTACTGCTGCCTTTACCCATTCGTCATGCTCCATAAACGATAAAACCGCCCGGAGGCGGT +TTCACATAAAACGTTTTTCATCAGCGACCAATCACCACAACCTGACCACCATCACCTTCA +TCTGCTGTGCTGATCTCCTGAGATACCACACGTGATCCCACGCGCATTTCACCGTACAGA +ACGGGCAGAACATTGCCCTGGGCAACCATATTATCCAGTGAAGAAAAATAGGTGTTCTGT 
+TTGCCGTTATCCGTTGTCTGTGTGCTGGGGGTTTTGGGTTTAGGGGCCAGCATCTGTGCA +ACACCGCCAAGCGTCATACTGGCACCGAGAGAAAACAGCAGATTACTCGCCATAATTCCT +ACCCCCGGCATCCATATAGCAACCGCCATAACAGCCGCCCCCAGCACAGCCTGAAACACA +CCGCCACTTTTGGCTCCTGCCAGACGCGGCACGATATGGATCACAGCACCATTTGCCAGC +GGTTCATTAAGACGGGCTGATAATTCCGTTTCACCTGTATCACGCCCGGCAATCCGTACC +TGATACCAGCCGTCGCTCAGTTTCTGACGAAACGCCGGGAGCTGTGTGGCCAGCGCCCGG +ATGGCTTCAGCCCCCGTTTTCACACGAAGGTCGATGCGGCGACCAAATCGTTGTAAATCC +CCGTAAAGGCAGATGCGCGCCATGCCCGGTGACGCCAGAGGGAGTGTGTGCGTCGCTGCC +ATTTGTCGGTATACCTCTCTCGTTTGCTCAGTTGTTCAGGAATATGGTGCAGCAGCTCGC +CATCACCACAGTAAATGGCGGCATGATTCGGCACCGATGAACCAAAACAGCACAGCAGCA +CATCGCCCGGTTGTGCTGATGACAACGGCACCTGATACAACCCTGTGGCCTCCAGATTAT +CCAGATAGAGATTCTGACCGTGACGCCACCAGTCATCCTCGCGATGAAAATCCGGCATCT +CAATCCCCGCCAGATGATAAGCATCCCGGAACAGCGTGTAACAGTCCGTCACCCCGTGCT +CAAAGCGCCGCCCGGTGAGATGCGGCACACAGCGGAACTTATGAATCGTCCCCCGGCAGA +CCAGCCACCACGGCAAATCACTCTGCACCTGCAGCCGCCGGTCGGCCTCACTCAGCCAGG +GCAGACCACCGGGGTGGCTGTGGACCAGCGCCACAATCTCACCCTGCATCTCTGCCCGCA +GCCAGTCCTCCGGCGACATCCGGAAATACGCCTCCGGCTCACCGGAGATATTCACGCAGG +GGAAATATCTTTCCCCTTCCGGCGTTCTCACCACGAAGCCGCACGACTCCGCTGGCGCAC +ATCGCCGGGCGTGCGCCAGAATCGCTGATTCTGTCTCTGTCATGGGATTCACTGCGAAAG +TTTGTTAATGGAAAGGAAGCCGCCAAAGTTGCCGACGTTATTGCGAAACTTACAGCCATT +CAGGCATTTGCTGCATTTATCCTTCGTGATATCGGACGTCGGCTGATCATATTCATCCGC +GACAGCCGGACCGTGATAACCGCACTCATCACCGCGATAGGTCCAGGTGCAGGTATTAGC +CAGCATGATGCGCCCCGGAAAAACGGCACCATCCGTTTCCGTCGGCGTGGACAGTACAAA +GGAGGCACTGACCGCGCTCAGTTCGCTGCACTGCTCGATGCGCCAGCGGCTGATCACCTC +CTGCTCCGGATCGGCGTCGCTGTTTCCGTTGACGAAGTTCACCGCATCCAGAAAACGGGC +GTAAACCTTACGCCGGACCACCGTTCCGCCGACCAGACTCTGCATATCTTCCGCCATCCC +GGTGACCATACCGTACAGGTTAGAAACCGTCAGCGTGGGGCGTGTACTGGTGCCTTTGCC +ATTCAGTTCAAAACCGCTCCCCTGAATGGGATACGGCTGATACTGTCGCCCCTGCCAGGT +GACCGGCTCACCTTTTTCGTTCTGCTCATTACAGAAAAAATAACGTTCTCCACCGACCTC +TGTCAGGTCGATTTCCCAGAGCACCACGCTGGCCGACTGCTCCGCACGGGTGCATTCATT +CAGTGTTTCCTGCCGGATATCCTGCATCAGTTCACCACCTGTTCAAACTCTGCGCTGAAC +TCAACACGCAGCATACTGACCCGCGACGACCATTTTGCGCAGGTCACCTTTATCTGCCGC 
+CACTCATAAGGCGGCGTCCACAGAAAGGCTTTCCAGCCCCCGTGCTCTTCCAGAAACGAC +TCCAGTACCGTGGCCTCCCAACGGGGGACAGAAAGCGTCACGCTGTACGTTTTCAGGTTG +GCATTCAGCCCGGCAGGCGCTCGCTGGGAATAGCCATCACCAAAGCGCACCTTTCTTACA +GAAGGGGCCGAAGCCACATCCATACCGGGTTTCACTTTCCAGCGGAAGGTTTTCATCGTC +CACCTCCGGAGAACAGGCCACCATCGCGCATCTGCCCGGTCACAACATCCATTGCCGCCT +TACGGGCTACGTCATAAACAGCCTTCAGCGCCTGTGGCCCTATCTGCCCGTTCGTGCCGT +CGTTGTTAATCACCACATGGTTATTCTGCTCAAACGTCCCGGACGCCTGCGACCGGCTGT +CTGCCATGCTGCCCGGTGTACCGACATAACCGCCGGTGGCATAGCCGCGCATCAGCCGGT +AAAGATTCCCCACGCCAATCCGGCTGGTTGCCTCCTTCGTGAAGACAAACTCACCACGGT +GAACAATCCCCGCTGGCTCATATTTGCCGCCGGTTCCCGTAAATCCCCCAGTCGCAAAAT +GGAATTTCGCCGCAGCGGCCTGAATGGCTGTACCGCCTGACGCGGATGCGCCGCCACCAA +CAGCCCCGCCAATGGCGCTGCCGATACTCCCGACAATCCCCACCATTGCCTGCTTAAGCA +GAATTTCTGTCATCATGGACAGCACGGAACGGGTGAAGCTGCGCCAGTTCTGCTCACTGC +CGGTCAGCATCGCCGCCATATTCTGTGCAATACCATCAAAGGTCTGCGTGGCTGCACTTT +TTACCTGCGACATACTGTCCGTGGCGCTCTCTTCCCACTCACTCCAGCCGGACTTCAGGC +CTGCCATCCAGCTCCCGCGAAGCTGGTCTTCAGCCGCCCAGGTCTTTTTCTGCTCTGACA +TGACGTTATTCAGCGCCAGCGGATTATCGCCATACCGTTCCTTCAGGCGCTGTTCCGTGG +CTTCCCGTTCTGCCTGCCGGTCAGTCAGCCCCCGGCTTTTCGCATCAATGGCGGCCCGTT +TTGCCCGTTGCTGCTGTGCGAATTTATCCGCCTGCTGCGCCAGCGCGTTCAGGCGCTCCT +GATACGTAACCTTGTCGCCAAGTGCAGCCAGCTGGCGTTTGTACTCCAGCGTCTCATCTT +TATGCGCCAGCAGGGATTTCTCCTGTGCGGACAGCTGGCGACGTTGTGCCGCCTCCTCCA +GTACCGCGAACTGACTTTCTGCCTTCCACAAATCCCGGCGCTGCTGGCTGATTTTCTCAT +TCGCTCCGGCATGCTTCTCCAGCGTCCGGAGTTCTGCCTGAAGCGTCAGCAGGGCAGCAT +GAGCACTGTCTTCCTGACGATCGCCCGCAGACACCTTCACGCCGGACTGTTTCGGCTTTT +TCAGCGTCGCTTCATAATCCTTTTTCGCCGCCGCCATCAGCGTGTTGTAATCTGCCTGCA +GGATTTTCCCGTCTTTCAGTGCCTTGTTCAGTTCTTCCTGACGGGCGGTATATTTCTCCA +GCGGCGTCTGCAGGCGTTCGTAAGCCTTCTGCGCCTCTTCGGTATATTTCAGCCGTGATG +CCTCAGACTCGGCCCAGTCCTTTGCTGCCATCTCTCTGGCCTTTTCAAGATCGGCCTGCA +ACGTGGCGGCGGAAAGCCCAAGTTGCGCATTCGCTCTGTCCTCCCATGCTCCCCGGAGAT +TGGCAAGAAATGCTGAGGTTTTACCGCGCCGGTGGCTCCGGCTCTGATACCACTGCCATT +TTTTGTCCGCCTCATCAAAAGCCTTTTCTGCTTTCTCCAGCATTCCCTGGGCAGTGTCCG +GGCGACCAATATCCAGCACCGAATCCCACATGGATTTGAATGCCCGTGCTGTCCTGTCTG 
+CCCAGGTCTCCAGCGTGCCCATGTTCTCTTTCAGGCGTCGGGTCTGGTCATCAAACCCTT +TCGTTGCGGCCTCGTTCGCCGCCTGCAATGCCCCGGCTTCATCGCCGGAACGCTGCAACT +GAGCAACATACGCAATCTGTTCCGCCGTCACGTTATGGAACTGGCGTGCCATCGCCGTCA +ACCCCGACGTCGGGTCTGTGGTCAGCTTCCCGAAGGCTTCAGCGACCTTGTCCACCTCCA +CACCGGATGCAGAGGAGAAACGCGCCACACTCTGGCTGATCGCCTCAAACTGCTCACCAC +CACGCACACCGGCATTCACCAGCGCCGTCAGTGACTCGCTGGTCTGGTTAAACGTCAGCC +CTGCCGCCTGCCCGGCTCTGGACAGGACCAGCATACGATCTGCCGTCAGTCCCGCCTGAT +TGCCGGAAAGGACCAGCGTTTTGTTGAAATCGGACAGGGTTGAGTTACCCTGATACCAGG +CATACGCCAGCGCACCGGTCGCCACCGCCAGCGAGGTGGCCCCCACCATCGGCAGGGTGA +TCGCACCGGCAAGCCCCCTGAACATGGGGATCATCCCGCCGAAGGAGTCCTTCACCTGAC +CACCCTGTTGCAGCAGGATCAGCCACGGACTCTGCCCGCCTGCAAGCTGCGTGGCCACGT +CGGTGAACTGCGCAGGCAGCATACGCATGGCGGCTTTATACTGCCCGACGGAAATCCCCG +CTTTCTGTGCAGCCAGCGCCTGCCGGCTCATCGACTGTTCAACGACTGCCGCTGTTTTTT +TCGCATCACTTTCCGTACCGGAAAAATGACGCCTGACTCTGGCCATCTGCTCGTCAAATC +TGGCCGCATCCAGACTCAAATCAACGACCAGATCGCCTACCGGTTCAGCCATACCGGACT +CCTCCTGCGATCCCTTCTGATACTGTCATCAGCATTACGTCATCCTCCGTCATGTCCGCC +ACATCCGGGGAAGCGGGGATAACTTCATTCCCGTCCGGGCCAAAACGAACGCCTCCGGCA +AGCCCTGCCGCTTTCTGCATCAGCACATCATCTTCAGGCTCTTCGTCAGCCTCACGCCGG +TTCAGCAGACTGAAATCCAGCGGATGCATATCCGGATCGCTGAAAAACAGGCTGAGCACG +GTGTACGTCAGCCCGGAAAAGTGCATATCCAGCAGAACATCATGAAAATAATGGGTACTG +TAAAAGCGGTGCCAGTCGGCATACTCCGTGGATGACATCCCGGCAAGCATGGCGCGCCAG +TCGGGTCGCCCCATTTCACGCGCCAGTTTCAGGGCAAAACTCAGCTCACCGTCGAACACT +TTCCCGCAGAAACAGGCTCTGCAGGCCCGGCATCATCTGCCTGTTCAGGGGCATTATTCA +CAACAAACTCAGACATTCCGGACAGACGTAACACCACGTTTTCAGCCTGAGCAATTGCCT +CCGTGGGCCAGGTGGTAAGCACTTCCTGCTCAATCTGTTTAACGGCTTCATTCATGGACG +GCAGCTTTGTCTTCTGCGGATGGTTATGCCACAGAGACATCGCCACCAGAAACGCCCCGC +CTCTGATAAGATCCTCTACAGACACCTGCAGGTTGCCACTGGATTCAGCCTTTTTTTCCT +GCTCTTTCAACCAGGCAAGATGCTCAATACGCTGCAGGGCTGACAGTTCAGAAAGCGTGA +CGGTCACACCGTTATGTTCAAATGATTCGGTTTTCAGGAACATCGCTGACTCTCCGGATT +AGCTGTTGGTGACGTTGATTTCTGCAACCGCAGCAAGTTCACCATTACCGGATACGACCG +GAATGTTGACCTTGCCTGCAGCAACACCTTTCACGGTGATGGTCATACCACTGACCGACA +CGGTGGCTTTTGTTTTATCCGCAGACACCGCACGGAAGCTCTTGTCGGTTGCGCCTTCCG 
+GCTGGAATGCCACGGTCAGCGTGGTGCTCCGCCCTTTCACCACCGAAGTGCTGGCAGGCG +TCACGGTCATGCCGGTTGCCGCTGTGACCGTGCTGCGATCTTCTGCCATCGACGGACGTC +CCACGTTGGTGACTTTCACCGTGCGGGTGATCACTTCCTTCGCCGTCACCGCCTTACCGA +TACTGCTGACCCAGCCGCGGAACACATCGACCGTGCCGTTCGGGAAGCGGATTTTATAGG +CACGGGTATCCCCTTCATTAAACCACGCCAGCAGCGCCTGCTGCCCCTGCTCTCCGGGCA +TCCACGCCAGCGTGAAGCTGGTATCTCCGGCAGATTTCTGCCCCTGCCCGGTCGCAGCCC +AGTCCGCATCTTCATCATCGAGATAGCTGTCGTCATAGGACTCAGCGGTCAGTTCGCCGG +GCGTCAGGTCTTTAACTTTAGCCAGACGCGACCAGTCAACGTCTGAAAGCGGGTTCGCAT +AAGGGTCACCGCTCCCCTTATAAACCAACAGGGTGGTCCCGGCACCTTTCACCGGCATTG +TAGGATTTGGTACAGGCATAGCGTCCTCACATTTCATAGGTAATGACATACGTCAGATCG +GCTGAACTCCACAGGCCCGCATCATCGTCGCGCCGGTAGTCATAGCCACTGGCCACCATA +CTGGTGATCAAATCTGACAGCGCCGGGATATCGCTCATCACCGGATAAATCCGGGACTCC +ATCCACGAATCCAGCTCTGAATCCGGCACCTGAGCAGGCAGGAAAACTTCAATATGCAGC +TCTGCCTGCCAGGTATCGCTGTCCAGCTCTTCGCCCGTGTATTCAGCGCCGGTGAGATAA +ACGGCAATTGCCGGAAAATCTTCCTCATCAAAAACAGCGGGGCGACCATCAAAAAGCGTC +GCCCCGGTGTCATGCTTCTCCAGTGCATCCAGTACGGCTGCACGGAGTTCAGTATGTTTC +>test_runprokka_H299.0003 2583 +ATCATACAGTCATTTGTTAATATCTGTCTGACAAGGTACCAAGCAGAAAATAGGGTTAAG +ATATTTGTAGCCATAAATATCATATATACGTTAGCCTATTTTTTTGGGGTTTTATATTCC +TTATTTATAGATCACTGGGATAATGTTTGGAAAAATATTATTTTGTTTTATGTGCTTACA +ACAATAACAATGTTTTTCTTCTATTTTATACGAAAAGGGAAGGTTGTTAAGCTATTTTTC +TTTCATTATATCTCAAAAAATAAAGTTTACGAAACTTTTATTTTTGGCCTTTACCAGCTC +CCTCATGTTTTAAGCTCTTGGGTAAGGCTTGGATATGATAGACTGGTATTGGGGGAACTA +ATATCAATGAGCTATGTTGGCGGATATTCGGTTGCAGTTCAAATATCTCTTGTGTCTAGC +GTGATATTTCAATCATTAAATAGGTTTTGGACCCCTTTCTTTATTAAAAAATTAAAGGAG +AATAGTAAACAAAAAAAAATTATTGTTCTTGGAGGTTTTGGAATTATCTGCATAACAATA +CTTAATATACTATTTGGTTACGCATATTTTATTTTTTTCTTGCCCACAAATTATTCATCA +TTCTCCAATGCTCTTCCTATATTATGTATGGCATATATGTTTCAGGGGCTATATTTTTTG +ATTGTTAATTATATATATTATCATGATGGTAATAAATTGATATCAATTCCATCCGTTGCC +TCGATCGCTATACATATAGCTGTTGCCCCAGTTTTGATAAAACATATGGGATATTATGGA +GCTGCAATTTCCTTATTGATTAGTTGGATAGTTCTTTTTTTATTTACATGCGTCATTATA +TTTTATGTTAGAAGGGGGTATCGTGGGTAATATATTTATTGTTGAGTCTCCGTTTCAGCT 
+TTCAAATGCTTTACTTTATCATAAAAAAAATGATAGTGTTATTGTCAGGCTCAACGGAGA +AAATAAAAATGATTTTCAAATTGAAAAAATGTTATCGTCGTTTAATGGCAAGGTATATAT +AAAAAAAGCATCAAAAGAATCGAAATTCGATTTGATTAGATTTGTTTTATTTTTTGCCGT +CCCTGTATTGATTGCTAATTTAAATAAAAAAGTAATTATTGGGAATTATAATTCATTGTG +GATGAGAGTCATGGGATATTTGTTTAACCCATTTCATTTTGCCGTCCTTGATGATGGGTT +GATTACTATACGAACAATAAAAAGGTTGGATGATAATATATCGCGTTCTGGATCAATTAA +GAAACGGTTTTTATTACTGCTGGCACCAAGATTTATAACGCAATATAAGATATATTCCAA +CTTTATTCAGATATACAACCAAGAGATCAATAAGAGAAAAAGAACTACCCGAGCCATTAA +GGCAGGGCGAGTTTGTTTTATTGGCTCTCCATTATTTGACAAAAATGTTCTCACATTTGA +TTTCTATGTAAAGTGCTTGGCTGCGATAAGTGATAACCTTAAGCGTTGTGGATATAGCAT +TGAGTATTACCCTCATCGCTCAGAAAAAAACATCTCATATTTAAATGTTTTTTTTGACGA +TGTAATAAAATCAGATGATAGCATTGAAGTCTATTATTCAGCCAGTAATGAGTTGCCAGA +AATATTTGTATCATTTTATTCATCGGCCCTTTTAAATTTGAGAAGTGATTATCCAGAGTG +TAAATTTATATCTTATAAGTTAGATTGTAATGAAATCAATGGTAAGTTTAGGTATGAAAT +AATGGAGGCATATAACTTTTTGGCATTCTCTGGTATTGAGGTTGTAACTATATAGGAAAA +TAAGATAGAAAAGGGATATTGTTGGAGTCAATATAGAACAGAAATTATAGTCTAAACTAA +TTAATCACTATGAAGGTCTATGTAATTAAATGTTAACATATTCTGTCGTTAACTGGAAAG +CAAAATTATTATATTTCATTCTTTTTCTGAGTTTCCTTAATGCTGTTTTGAGGTTATCAG +AGGATGGATTGTCGATTTATCGATTATTTATCCCTTTGCAAATATTTTTAATTTATACAT +TAAGTGTCACCGAGTTCAAAAAGTTTATCGTAATTCTACTACTTTTATTATTGTTTGGTG +CTACTGGATGTATGATATCCACTTATTCTCTTAATGAGAATAATCTTGTATTTCTAATAC +ATTACTCTATACTTATACTCACTTTTTTCTCTTCTTCTGTGTTGATATCTATTACTGGTG +AAACTTGTTTTTACAAATTCACCGCGTTCTTTTTTGGTTTTTTAATTGTTACTGGTATTA +TGGATTTGTTTGGTGTTACATTTCCTAATATAGAACATATACCAGACGCTATACGAGGAA +TACATAGAATAGAGAATGATTATTCACTTGCGCTGGTTTCGTTTGTTTTTGTTGTGTTTT +CCATCTCTAGGAAAAAAATAACTGCTTCAATCCTTACTTTTTTTACGTCTGCGATTTGTT +TTTATAATGACTCTAAAGTTGCATTACTTTTTGTCGTTGCTGGTTATTTTTGTTTTATAT +TTAAAAATATAAGGTTTAGACAAAAGGAATTCAGGTGGATATTATTTCTTTTTGTCATAA +TGC diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test.0417.00002.gff b/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test.0417.00002.gff new file mode 100644 index 
0000000000000000000000000000000000000000..de76a5c3e7501d25b4720044a5b573fa3728f66f --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test.0417.00002.gff @@ -0,0 +1,101 @@ +##gff-version 3 +##sequence-region test.0417.00002.0001 1 9603 +##sequence-region test.0417.00002.0002 1 22446 +##sequence-region test.0417.00002.0003 1 51012 +##sequence-region test.0417.00002.0004 1 31459 +##sequence-region test.0417.00002.0005 1 6009 +test.0417.00002.0001 Prodigal:002006 CDS 287 787 . + 0 ID=test.0417.00002.0001b_00001;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0001b_00001;product=hypothetical protein +test.0417.00002.0001 Prodigal:002006 CDS 846 2384 . + 0 ID=test.0417.00002.0001i_00002;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0001i_00002;product=hypothetical protein +test.0417.00002.0001 Prodigal:002006 CDS 2404 3741 . + 0 ID=test.0417.00002.0001i_00003;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0001i_00003;product=hypothetical protein +test.0417.00002.0001 Prodigal:002006 CDS 3738 4403 . + 0 ID=test.0417.00002.0001i_00004;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0001i_00004;product=hypothetical protein +test.0417.00002.0001 Prodigal:002006 CDS 4416 6068 . + 0 ID=test.0417.00002.0001i_00005;Name=ompA;gene=ompA;inference=ab initio prediction:Prodigal:002006,protein motif:HAMAP:MF_00842;locus_tag=test.0417.00002.0001i_00005;product=Outer membrane protein A +test.0417.00002.0001 Prodigal:002006 CDS 6126 6617 . + 0 ID=test.0417.00002.0001i_00006;Name=hcpA;db_xref=COG:COG3157;gene=hcpA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=test.0417.00002.0001i_00006;product=Major exported protein +test.0417.00002.0001 Prodigal:002006 CDS 6808 9444 . 
+ 0 ID=test.0417.00002.0001b_00007;Name=clpV1;db_xref=COG:COG0542;gene=clpV1;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q9I742;locus_tag=test.0417.00002.0001b_00007;product=Protein ClpV1 +test.0417.00002.0002 Prodigal:002006 CDS 77 1237 . + 0 ID=test.0417.00002.0002b_00008;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002b_00008;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 1279 2346 . + 0 ID=test.0417.00002.0002i_00009;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00009;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 2419 2799 . + 0 ID=test.0417.00002.0002i_00010;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00010;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 3130 3393 . + 0 ID=test.0417.00002.0002i_00011;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00011;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 3399 4538 . + 0 ID=test.0417.00002.0002i_00012;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00012;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 4535 7888 . + 0 ID=test.0417.00002.0002i_00013;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00013;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 7854 9491 . + 0 ID=test.0417.00002.0002i_00014;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00014;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 9525 11285 . + 0 ID=test.0417.00002.0002i_00015;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00015;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 11249 12328 . 
+ 0 ID=test.0417.00002.0002i_00016;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00016;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 12309 12845 . + 0 ID=test.0417.00002.0002i_00017;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00017;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 12849 13277 . + 0 ID=test.0417.00002.0002i_00018;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00018;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 13277 14653 . + 0 ID=test.0417.00002.0002i_00019;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002i_00019;product=hypothetical protein +test.0417.00002.0002 Prodigal:002006 CDS 14955 15902 . - 0 ID=test.0417.00002.0002i_00020;eC_number=1.1.1.81;db_xref=COG:COG0111;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q9X1C1;locus_tag=test.0417.00002.0002i_00020;product=Hydroxypyruvate reductase +test.0417.00002.0002 Prodigal:002006 CDS 15974 16570 . - 0 ID=test.0417.00002.0002i_00021;eC_number=5.3.1.13;Name=kdsD;db_xref=COG:COG0517;gene=kdsD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q9HVW0;locus_tag=test.0417.00002.0002i_00021;product=Arabinose 5-phosphate isomerase KdsD +test.0417.00002.0002 Prodigal:002006 CDS 16573 17748 . - 0 ID=test.0417.00002.0002i_00022;Name=malY;db_xref=COG:COG1168;gene=malY;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P23256;locus_tag=test.0417.00002.0002i_00022;product=Protein MalY +test.0417.00002.0002 Prodigal:002006 CDS 17748 19328 . 
- 0 ID=test.0417.00002.0002i_00023;Name=malX;db_xref=COG:COG1263;gene=malX;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P19642;locus_tag=test.0417.00002.0002i_00023;product=PTS system maltose-specific EIICB component +test.0417.00002.0002 Prodigal:002006 CDS 19360 20184 . - 0 ID=test.0417.00002.0002i_00024;Name=licT;db_xref=COG:COG3711;gene=licT;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P39805;locus_tag=test.0417.00002.0002i_00024;product=Transcription antiterminator LicT +test.0417.00002.0002 Prodigal:002006 CDS 20442 21695 . - 0 ID=test.0417.00002.0002i_00025;eC_number=3.5.1.28;Name=amiC;db_xref=COG:COG0860;gene=amiC;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P63883;locus_tag=test.0417.00002.0002i_00025;product=N-acetylmuramoyl-L-alanine amidase AmiC +test.0417.00002.0002 Prodigal:002006 CDS 21855 22043 . - 0 ID=test.0417.00002.0002b_00026;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0002b_00026;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 93 812 . + 0 ID=test.0417.00002.0003b_00027;eC_number=2.3.1.1;Name=argA;db_xref=COG:COG0548;gene=argA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A6C5;locus_tag=test.0417.00002.0003b_00027;product=Amino-acid acetyltransferase +test.0417.00002.0003 Prodigal:002006 CDS 874 2700 . - 0 ID=test.0417.00002.0003i_00028;eC_number=3.1.11.5;Name=recD;db_xref=COG:COG0507;gene=recD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P04993;locus_tag=test.0417.00002.0003i_00028;product=RecBCD enzyme subunit RecD +test.0417.00002.0003 Prodigal:002006 CDS 2700 6242 . 
- 0 ID=test.0417.00002.0003i_00029;eC_number=3.1.11.5;Name=recB;db_xref=COG:COG1074;gene=recB;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P08394;locus_tag=test.0417.00002.0003i_00029;product=RecBCD enzyme subunit RecB +test.0417.00002.0003 Prodigal:002006 CDS 6235 9123 . - 0 ID=test.0417.00002.0003i_00030;eC_number=3.4.24.55;Name=ptrA;db_xref=COG:COG1025;gene=ptrA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P05458;locus_tag=test.0417.00002.0003i_00030;product=Protease 3 +test.0417.00002.0003 Prodigal:002006 CDS 9299 12667 . - 0 ID=test.0417.00002.0003i_00031;eC_number=3.1.11.5;Name=recC;db_xref=COG:COG1330;gene=recC;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P07648;locus_tag=test.0417.00002.0003i_00031;product=RecBCD enzyme subunit RecC +test.0417.00002.0003 Prodigal:002006 CDS 12680 13003 . - 0 ID=test.0417.00002.0003i_00032;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0003i_00032;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 12988 13395 . - 0 ID=test.0417.00002.0003i_00033;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0003i_00033;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 13392 13955 . - 0 ID=test.0417.00002.0003i_00034;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0003i_00034;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 13946 14449 . - 0 ID=test.0417.00002.0003i_00035;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0003i_00035;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 14634 15428 . 
- 0 ID=test.0417.00002.0003i_00036;eC_number=2.1.1.45;Name=thyA;db_xref=COG:COG0207;gene=thyA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P48464;locus_tag=test.0417.00002.0003i_00036;product=Thymidylate synthase +test.0417.00002.0003 Prodigal:002006 CDS 15435 16310 . - 0 ID=test.0417.00002.0003i_00037;eC_number=2.5.1.145;Name=lgt;db_xref=COG:COG0682;gene=lgt;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P60955;locus_tag=test.0417.00002.0003i_00037;product=Phosphatidylglycerol--prolipoprotein diacylglyceryl transferase +test.0417.00002.0003 Prodigal:002006 CDS 16461 18707 . - 0 ID=test.0417.00002.0003i_00038;eC_number=2.7.3.9;Name=ptsP;db_xref=COG:COG3605;gene=ptsP;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P37177;locus_tag=test.0417.00002.0003i_00038;product=Phosphoenolpyruvate-dependent phosphotransferase system +test.0417.00002.0003 Prodigal:002006 CDS 18720 19250 . - 0 ID=test.0417.00002.0003i_00039;eC_number=3.6.1.-;Name=rppH;db_xref=COG:COG0494;gene=rppH;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A776;locus_tag=test.0417.00002.0003i_00039;product=RNA pyrophosphohydrolase +test.0417.00002.0003 Prodigal:002006 CDS 19695 19856 . + 0 ID=test.0417.00002.0003i_00040;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0003i_00040;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 19935 20624 . + 0 ID=test.0417.00002.0003i_00041;Name=mutH;db_xref=COG:COG3066;gene=mutH;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P06722;locus_tag=test.0417.00002.0003i_00041;product=DNA mismatch repair protein MutH +test.0417.00002.0003 Prodigal:002006 CDS 20693 21406 . 
+ 0 ID=test.0417.00002.0003i_00042;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P67127;locus_tag=test.0417.00002.0003i_00042;note=UPF0053 inner membrane protein YgdQ;product=hypothetical protein +test.0417.00002.0003 Prodigal:002006 CDS 21544 21762 . + 0 ID=test.0417.00002.0003i_00043;Name=ygdR;gene=ygdR;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P65294;locus_tag=test.0417.00002.0003i_00043;product=putative lipoprotein YgdR +test.0417.00002.0003 Prodigal:002006 CDS 21870 22910 . + 0 ID=test.0417.00002.0003i_00044;Name=tas;db_xref=COG:COG0667;gene=tas;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A9T4;locus_tag=test.0417.00002.0003i_00044;product=Protein tas +test.0417.00002.0003 Prodigal:002006 CDS 22942 24135 . - 0 ID=test.0417.00002.0003i_00045;Name=lplT;gene=lplT;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P39196;locus_tag=test.0417.00002.0003i_00045;product=Lysophospholipid transporter LplT +test.0417.00002.0003 Prodigal:002006 CDS 24128 26287 . - 0 ID=test.0417.00002.0003i_00046;Name=aas;db_xref=COG:COG0204;gene=aas;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P31119;locus_tag=test.0417.00002.0003i_00046;product=Bifunctional protein Aas +test.0417.00002.0003 Prodigal:002006 CDS 26873 27904 . + 0 ID=test.0417.00002.0003i_00047;Name=galR;db_xref=COG:COG1609;gene=galR;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P03024;locus_tag=test.0417.00002.0003i_00047;product=HTH-type transcriptional regulator GalR +test.0417.00002.0003 Prodigal:002006 CDS 27911 29173 . - 0 ID=test.0417.00002.0003i_00048;eC_number=4.1.1.20;Name=lysA;gene=lysA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:E0IWI3;locus_tag=test.0417.00002.0003i_00048;product=Diaminopimelate decarboxylase +test.0417.00002.0003 Prodigal:002006 CDS 29295 30230 . 
+ 0 ID=test.0417.00002.0003i_00049;Name=occR;gene=occR;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A4T3;locus_tag=test.0417.00002.0003i_00049;product=Octopine catabolism/uptake operon regulatory protein OccR +test.0417.00002.0003 Prodigal:002006 CDS 30217 30909 . - 0 ID=test.0417.00002.0003i_00050;eC_number=5.1.1.13;Name=ygeA;gene=ygeA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:A0A140N890;locus_tag=test.0417.00002.0003i_00050;product=L-aspartate/glutamate-specific racemase +test.0417.00002.0003 Prodigal:002006 CDS 31038 32456 . - 0 ID=test.0417.00002.0003i_00051;Name=araE;gene=araE;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0AE24;locus_tag=test.0417.00002.0003i_00051;product=Arabinose-proton symporter +test.0417.00002.0003 Prodigal:002006 CDS 32771 33532 . - 0 ID=test.0417.00002.0003i_00052;eC_number=1.1.1.127;Name=kduD;gene=kduD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P37769;locus_tag=test.0417.00002.0003i_00052;product=2-dehydro-3-deoxy-D-gluconate 5-dehydrogenase +test.0417.00002.0003 Prodigal:002006 CDS 33562 34398 . - 0 ID=test.0417.00002.0003i_00053;eC_number=5.3.1.17;Name=kduI;db_xref=COG:COG3717;gene=kduI;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46938;locus_tag=test.0417.00002.0003i_00053;product=4-deoxy-L-threo-5-hexosulose-uronate ketol-isomerase +test.0417.00002.0003 Prodigal:002006 CDS 34685 35866 . - 0 ID=test.0417.00002.0003i_00054;eC_number=2.3.1.9;Name=thlA;db_xref=COG:COG0183;gene=thlA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P45359;locus_tag=test.0417.00002.0003i_00054;product=Acetyl-CoA acetyltransferase +test.0417.00002.0003 Prodigal:002006 CDS 36121 37350 . 
+ 0 ID=test.0417.00002.0003i_00055;Name=yqeG;db_xref=COG:COG0814;gene=yqeG;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P63340;locus_tag=test.0417.00002.0003i_00055;product=Inner membrane transport protein YqeG +test.0417.00002.0003 Aragorn:001002 tRNA 37666 37739 . - . ID=test.0417.00002.0003i_00056;inference=COORDINATES:profile:Aragorn:001002;locus_tag=test.0417.00002.0003i_00056;product=tRNA-Gly(ccc) +test.0417.00002.0003 Prodigal:002006 CDS 37818 38168 . - 0 ID=test.0417.00002.0003i_00057;Name=nlpD;gene=nlpD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P39700;locus_tag=test.0417.00002.0003i_00057;product=Murein hydrolase activator NlpD +test.0417.00002.0003 Prodigal:002006 CDS 38987 41284 . + 0 ID=test.0417.00002.0003i_00058;eC_number=1.17.1.4;Name=xdhA_1;db_xref=COG:COG1529;gene=xdhA_1;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46799;locus_tag=test.0417.00002.0003i_00058;product=Putative xanthine dehydrogenase molybdenum-binding subunit XdhA +test.0417.00002.0003 Prodigal:002006 CDS 41295 42173 . + 0 ID=test.0417.00002.0003i_00059;eC_number=1.17.1.5;Name=ndhF;gene=ndhF;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q0QLF4;locus_tag=test.0417.00002.0003i_00059;product=Nicotinate dehydrogenase FAD-subunit +test.0417.00002.0003 Prodigal:002006 CDS 42170 42649 . + 0 ID=test.0417.00002.0003i_00060;eC_number=1.17.1.5;Name=ndhS;gene=ndhS;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q0QLF3;locus_tag=test.0417.00002.0003i_00060;product=Nicotinate dehydrogenase small FeS subunit +test.0417.00002.0003 Prodigal:002006 CDS 42689 44467 . 
- 0 ID=test.0417.00002.0003i_00061;Name=norR;gene=norR;inference=ab initio prediction:Prodigal:002006,protein motif:HAMAP:MF_01314;locus_tag=test.0417.00002.0003i_00061;product=Anaerobic nitric oxide reductase transcription regulator NorR +test.0417.00002.0003 Prodigal:002006 CDS 44946 46133 . + 0 ID=test.0417.00002.0003i_00062;eC_number=2.1.3.-;Name=ygeW;db_xref=COG:COG0078;gene=ygeW;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46803;locus_tag=test.0417.00002.0003i_00062;product=Putative carbamoyltransferase YgeW +test.0417.00002.0003 Prodigal:002006 CDS 46191 47387 . + 0 ID=test.0417.00002.0003i_00063;eC_number=4.3.1.15;Name=ygeX;db_xref=COG:COG1171;gene=ygeX;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P66899;locus_tag=test.0417.00002.0003i_00063;product=Diaminopropionate ammonia-lyase +test.0417.00002.0003 Prodigal:002006 CDS 47445 48656 . + 0 ID=test.0417.00002.0003i_00064;eC_number=3.5.1.16;Name=argE;db_xref=COG:COG0624;gene=argE;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P23908;locus_tag=test.0417.00002.0003i_00064;product=Acetylornithine deacetylase +test.0417.00002.0003 Prodigal:002006 CDS 48709 50094 . + 0 ID=test.0417.00002.0003b_00065;eC_number=3.5.2.-;Name=hyuA;db_xref=COG:COG0044;gene=hyuA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46806;locus_tag=test.0417.00002.0003b_00065;product=D-phenylhydantoinase +test.0417.00002.0004 Prodigal:002006 CDS 103 1728 . - 0 ID=test.0417.00002.0004b_00066;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0004b_00066;product=hypothetical protein +test.0417.00002.0004 Prodigal:002006 CDS 1776 2255 . - 0 ID=test.0417.00002.0004i_00067;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0004i_00067;product=hypothetical protein +test.0417.00002.0004 Prodigal:002006 CDS 2650 3228 . 
+ 0 ID=test.0417.00002.0004i_00068;eC_number=2.7.7.76;Name=mocA;db_xref=COG:COG2068;gene=mocA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46810;locus_tag=test.0417.00002.0004i_00068;product=Molybdenum cofactor cytidylyltransferase +test.0417.00002.0004 Prodigal:002006 CDS 3550 6648 . + 0 ID=test.0417.00002.0004i_00069;Name=ygfK;db_xref=COG:COG0493;gene=ygfK;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46811;locus_tag=test.0417.00002.0004i_00069;product=Putative oxidoreductase YgfK +test.0417.00002.0004 Prodigal:002006 CDS 6651 7979 . + 0 ID=test.0417.00002.0004i_00070;eC_number=3.-.-.-;Name=ssnA;db_xref=COG:COG0402;gene=ssnA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46812;locus_tag=test.0417.00002.0004i_00070;product=Putative aminohydrolase SsnA +test.0417.00002.0004 Prodigal:002006 CDS 8030 8809 . + 0 ID=test.0417.00002.0004i_00071;inference=ab initio prediction:Prodigal:002006;locus_tag=test.0417.00002.0004i_00071;product=hypothetical protein +test.0417.00002.0004 Prodigal:002006 CDS 8806 11676 . + 0 ID=test.0417.00002.0004i_00072;eC_number=1.17.1.4;Name=xdhA_2;db_xref=COG:COG1529;gene=xdhA_2;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46799;locus_tag=test.0417.00002.0004i_00072;product=Putative xanthine dehydrogenase molybdenum-binding subunit XdhA +test.0417.00002.0004 Prodigal:002006 CDS 11841 13241 . + 0 ID=test.0417.00002.0004i_00073;Name=xanQ;db_xref=COG:COG2233;gene=xanQ;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P67444;locus_tag=test.0417.00002.0004i_00073;product=Xanthine permease XanQ +test.0417.00002.0004 Prodigal:002006 CDS 13259 14575 . 
+ 0 ID=test.0417.00002.0004i_00074;eC_number=3.5.4.3;Name=guaD;db_xref=COG:COG0402;gene=guaD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P76641;locus_tag=test.0417.00002.0004i_00074;product=Guanine deaminase +test.0417.00002.0004 Prodigal:002006 CDS 14611 15978 . + 0 ID=test.0417.00002.0004i_00075;Name=ghxQ;db_xref=COG:COG2252;gene=ghxQ;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46817;locus_tag=test.0417.00002.0004i_00075;product=Guanine/hypoxanthine permease GhxQ +test.0417.00002.0004 Prodigal:002006 CDS 16014 16502 . - 0 ID=test.0417.00002.0004i_00076;eC_number=1.-.-.-;Name=hyfA;db_xref=COG:COG1142;gene=hyfA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P23481;locus_tag=test.0417.00002.0004i_00076;product=Hydrogenase-4 component A +test.0417.00002.0004 Prodigal:002006 CDS 16502 18421 . - 0 ID=test.0417.00002.0004i_00077;eC_number=1.18.1.2;inference=ab initio prediction:Prodigal:002006,protein motif:HAMAP:MF_01685;locus_tag=test.0417.00002.0004i_00077;product=Ferredoxin--NADP reductase +test.0417.00002.0004 Prodigal:002006 CDS 18857 20305 . + 0 ID=test.0417.00002.0004i_00078;Name=uacT;db_xref=COG:COG2233;gene=uacT;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46821;locus_tag=test.0417.00002.0004i_00078;product=Uric acid transporter UacT +test.0417.00002.0004 Prodigal:002006 CDS 20307 20432 . + 0 ID=test.0417.00002.0004i_00079;Name=yqfG;gene=yqfG;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:C1P614;locus_tag=test.0417.00002.0004i_00079;product=putative protein YqfG +test.0417.00002.0004 Prodigal:002006 CDS 20555 21103 . 
+ 0 ID=test.0417.00002.0004i_00080;eC_number=5.3.3.2;Name=idi;db_xref=COG:COG1443;gene=idi;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46822;locus_tag=test.0417.00002.0004i_00080;product=Isopentenyl-diphosphate Delta-isomerase +test.0417.00002.0004 Prodigal:002006 CDS 21146 22663 . - 0 ID=test.0417.00002.0004i_00081;eC_number=6.1.1.6;Name=lysS;db_xref=COG:COG1190;gene=lysS;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A8N3;locus_tag=test.0417.00002.0004i_00081;product=Lysine--tRNA ligase +test.0417.00002.0004 Prodigal:002006 CDS 22673 23554 . - 0 ID=test.0417.00002.0004i_00082;Name=prfB;db_xref=COG:COG1186;gene=prfB;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P07012;locus_tag=test.0417.00002.0004i_00082;product=Peptide chain release factor RF2 +test.0417.00002.0004 Prodigal:002006 CDS 23862 25595 . - 0 ID=test.0417.00002.0004i_00083;eC_number=3.1.-.-;Name=recJ;db_xref=COG:COG0608;gene=recJ;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P21893;locus_tag=test.0417.00002.0004i_00083;product=Single-stranded-DNA-specific exonuclease RecJ +test.0417.00002.0004 Prodigal:002006 CDS 25601 26311 . - 0 ID=test.0417.00002.0004i_00084;Name=dsbC;db_xref=COG:COG1651;gene=dsbC;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0AEG6;locus_tag=test.0417.00002.0004i_00084;product=Thiol:disulfide interchange protein DsbC +test.0417.00002.0004 Prodigal:002006 CDS 26336 27232 . - 0 ID=test.0417.00002.0004i_00085;Name=xerD;db_xref=COG:COG4974;gene=xerD;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A8P8;locus_tag=test.0417.00002.0004i_00085;product=Tyrosine recombinase XerD +test.0417.00002.0004 Prodigal:002006 CDS 27344 27865 . 
+ 0 ID=test.0417.00002.0004i_00086;Name=fldB;db_xref=COG:COG0716;gene=fldB;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0ABY4;locus_tag=test.0417.00002.0004i_00086;product=Flavodoxin 2 +test.0417.00002.0004 Prodigal:002006 CDS 27905 28312 . - 0 ID=test.0417.00002.0004i_00087;Name=ygfX;gene=ygfX;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46824;locus_tag=test.0417.00002.0004i_00087;product=Inner membrane protein YgfX +test.0417.00002.0004 Prodigal:002006 CDS 28293 28559 . - 0 ID=test.0417.00002.0004i_00088;Name=sdhE;db_xref=COG:COG2938;gene=sdhE;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P64559;locus_tag=test.0417.00002.0004i_00088;product=FAD assembly factor SdhE +test.0417.00002.0004 Prodigal:002006 CDS 28802 29782 . + 0 ID=test.0417.00002.0004i_00089;Name=ygfZ;db_xref=COG:COG0354;gene=ygfZ;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0ADE8;locus_tag=test.0417.00002.0004i_00089;product=tRNA-modifying protein YgfZ +test.0417.00002.0004 Prodigal:002006 CDS 29859 30518 . - 0 ID=test.0417.00002.0004i_00090;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P67153;locus_tag=test.0417.00002.0004i_00090;note=UPF0073 inner membrane protein YqfA;product=hypothetical protein +test.0417.00002.0004 Prodigal:002006 CDS 30682 30993 . - 0 ID=test.0417.00002.0004b_00091;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P67603;locus_tag=test.0417.00002.0004b_00091;note=UPF0267 protein YqfB;product=hypothetical protein +test.0417.00002.0005 Prodigal:002006 CDS 29 1012 . + 0 ID=test.0417.00002.0005b_00092;eC_number=3.2.1.86;Name=bglA;db_xref=COG:COG2723;gene=bglA;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:Q46829;locus_tag=test.0417.00002.0005b_00092;product=6-phospho-beta-glucosidase BglA +test.0417.00002.0005 Prodigal:002006 CDS 1178 4051 . 
- 0 ID=test.0417.00002.0005i_00093;eC_number=1.4.4.2;Name=gcvP;db_xref=COG:COG0403;gene=gcvP;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P33195;locus_tag=test.0417.00002.0005i_00093;product=Glycine dehydrogenase (decarboxylating) +test.0417.00002.0005 Prodigal:002006 CDS 4169 4558 . - 0 ID=test.0417.00002.0005i_00094;Name=gcvH;db_xref=COG:COG0509;gene=gcvH;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P0A6T9;locus_tag=test.0417.00002.0005i_00094;product=Glycine cleavage system H protein +test.0417.00002.0005 Prodigal:002006 CDS 4582 5745 . - 0 ID=test.0417.00002.0005b_00095;eC_number=2.1.2.10;Name=gcvT;db_xref=COG:COG0404;gene=gcvT;inference=ab initio prediction:Prodigal:002006,similar to AA sequence:UniProtKB:P27248;locus_tag=test.0417.00002.0005b_00095;product=Aminomethyltransferase diff --git a/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test_runprokka_H299.gff b/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test_runprokka_H299.gff new file mode 100644 index 0000000000000000000000000000000000000000..aa8c22d7d40a1e32bb0ddcba3c61177a84c5faf7 --- /dev/null +++ b/test/data/annotate/exp_files/res_formatAll/prokka/gff3/test_runprokka_H299.gff @@ -0,0 +1,20 @@ +##gff-version 3 +##sequence-region test_runprokka_H299.0001 1 3480 +##sequence-region test_runprokka_H299.0002 1 7080 +##sequence-region test_runprokka_H299.0003 1 2583 +test_runprokka_H299.0001 Prodigal:002006 CDS 201 743 . - 0 ID=test_runprokka_H299.0001b_00001;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0001b_00001;product=hypothetical protein +test_runprokka_H299.0001 Prodigal:002006 CDS 740 1339 . - 0 ID=test_runprokka_H299.0001i_00002;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0001i_00002;product=hypothetical protein +test_runprokka_H299.0001 Prodigal:002006 CDS 1489 2187 . 
- 0 ID=test_runprokka_H299.0001i_00003;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0001i_00003;product=hypothetical protein +test_runprokka_H299.0001 Prodigal:002006 CDS 2187 2483 . - 0 ID=test_runprokka_H299.0001i_00004;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0001i_00004;product=hypothetical protein +test_runprokka_H299.0001 Prodigal:002006 CDS 2518 3453 . - 0 ID=test_runprokka_H299.0001b_00005;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0001b_00005;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 201 743 . - 0 ID=test_runprokka_H299.0002b_00006;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002b_00006;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 740 1483 . - 0 ID=test_runprokka_H299.0002i_00007;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00007;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 1489 2187 . - 0 ID=test_runprokka_H299.0002i_00008;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00008;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 2187 2516 . - 0 ID=test_runprokka_H299.0002i_00009;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00009;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 2513 5092 . - 0 ID=test_runprokka_H299.0002i_00010;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00010;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 5085 5519 . - 0 ID=test_runprokka_H299.0002i_00011;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00011;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 5501 5923 . 
- 0 ID=test_runprokka_H299.0002i_00012;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00012;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 5939 6679 . - 0 ID=test_runprokka_H299.0002i_00013;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002i_00013;product=hypothetical protein +test_runprokka_H299.0002 Prodigal:002006 CDS 6687 6842 . - 0 ID=test_runprokka_H299.0002b_00014;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0002b_00014;product=hypothetical protein +test_runprokka_H299.0003 Prodigal:002006 CDS 163 870 . + 0 ID=test_runprokka_H299.0003b_00015;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0003b_00015;product=hypothetical protein +test_runprokka_H299.0003 Prodigal:002006 CDS 863 1795 . + 0 ID=test_runprokka_H299.0003b_00016;inference=ab initio prediction:Prodigal:002006;locus_tag=test_runprokka_H299.0003b_00016;product=hypothetical protein diff --git a/test/data/annotate/exp_files/res_genome_short-long_header.fst b/test/data/annotate/exp_files/res_genome_short-long_header.fst index 4a61e3778bead6eea69d1b93760ecd2c1a6bbf0d..aaccf955b76f8a50a51a6f81d95ce1860ee107f0 100755 --- a/test/data/annotate/exp_files/res_genome_short-long_header.fst +++ b/test/data/annotate/exp_files/res_genome_short-long_header.fst @@ -1,6 +1,6 @@ ->Long_header_with_same_1_1 +>1_Long_header_with_same_1 AATTGCGCTAGCGCTAGGCGCTAGCGCGCTAGAGCCGCTAGGCGCCATTACGGCGCTATCCGCACGCGCATGCCACCGTTAG ->Long_header_with_same_2_2 +>2_Long_header_with_same_2 AACCGTTGGGGGGGGGGCCCCATTAGGCGCGGAATTTTCG ->Long_header_with_same_3_3 +>3_Long_header_with_same_3 ACGGCTCGCGGAGAGAGAGAGCTCGCGCA diff --git a/test/data/annotate/genomes/A_H738-and-B2_A3_5.fna b/test/data/annotate/genomes/A_H738-and-B2_A3_5.fna index 01bbdab82c8292cc6e762fd9f4d4bfce5168dd98..45fe156268d8705dd7f0cc87c3e8bac10ebaf169 100755 --- a/test/data/annotate/genomes/A_H738-and-B2_A3_5.fna +++ 
b/test/data/annotate/genomes/A_H738-and-B2_A3_5.fna @@ -51,7 +51,7 @@ TTCTGAATTGATGTGGGTGTGGTTGCCGGGGATGCTACTGATGGGAATGTTGTGGTGGCG CAGACGATAACCGGATGCGAAAACTCGCATCCGGCAATAGCGCAATTACTTACGACGCCA GGTGGTCCCTTGCGGGCCATCTTCCAGCACGATCCCCATCTCGTTAAGACGATCACGCGC CGCATCCGCCGCCGCCCAGTCTTTCGCTTTACGGGCATCCAGACGCTGTTGAATTAACGC -TTCAATCTCAGCCACTTCGCTGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG +TTCAATCTCAGCCACTTCGCTNNNNNNNNNGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG TTCTTGCTCCAGCAGGCCCAATACAGCGGAAAGTTTACGCAGGTGAGATGCCATTGCATT CGCCGCTGCCATATCTTCTGCTTTCAGACGGTTTACTTCACGCGCCATATCAAACAGTAC GGAATAGGCTTCCGGGGTGTTGAAATCGTCGTCCATCGCTTCAATAAAGCGCGCTTCAAA @@ -122,7 +122,7 @@ AACGGTGCCAGCATCAGCCAGTTTGAGCTGCATCTGCGGGCGATTACCGATCTGCCGTTA CCGCAACCAGTGGTGAATAATCCGTCGGTGATGATCAATCTGATTGGTAGCGATGTGAAT TATGACTGGCTGAAACTGCCGCTGGTGCATCTGCACTGGTACGACAAAGAAGTCCGTCCG GGGCGTAAAGTGGGGCATCTGAATTTGACCGACAGCGACACATCGCGTCTGACTGCGACG -CTGGAAGCCTTAATCCCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG +CTGGAAGCCTTAATCCNNNNNNNNNNNNNNNNNNNNNNNNNNCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG AGTAAGTTCGGTTAACTGGTGCTCTATTCTTGCCGGATGCGGCGTAAACGCCTTATCCGG CCTACCGATCCGGTACCCATTGTAGGCCTGATAAGATGCGTCAAGCATCGCATCAGGCAT TGTGCACCAATTGCCGGATGCGGCACCGGTTGTAGGCCTGATAAGACGCGTCAAGCGTCG diff --git a/test/data/annotate/genomes/A_H738-and-genome1.fna b/test/data/annotate/genomes/A_H738-and-genome1.fna index f3d384b5cb0c46941de12bbbc2e1d25843a95ea8..30aa864b63262727f699d23960eeb8905e77d5d8 100755 --- a/test/data/annotate/genomes/A_H738-and-genome1.fna +++ b/test/data/annotate/genomes/A_H738-and-genome1.fna @@ -51,7 +51,7 @@ TTCTGAATTGATGTGGGTGTGGTTGCCGGGGATGCTACTGATGGGAATGTTGTGGTGGCG CAGACGATAACCGGATGCGAAAACTCGCATCCGGCAATAGCGCAATTACTTACGACGCCA GGTGGTCCCTTGCGGGCCATCTTCCAGCACGATCCCCATCTCGTTAAGACGATCACGCGC CGCATCCGCCGCCGCCCAGTCTTTCGCTTTACGGGCATCCAGACGCTGTTGAATTAACGC -TTCAATCTCAGCCACTTCGCTGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG +TTCAATCTCAGCCACTTCGCTNNNNNNNNNGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG 
TTCTTGCTCCAGCAGGCCCAATACAGCGGAAAGTTTACGCAGGTGAGATGCCATTGCATT CGCCGCTGCCATATCTTCTGCTTTCAGACGGTTTACTTCACGCGCCATATCAAACAGTAC GGAATAGGCTTCCGGGGTGTTGAAATCGTCGTCCATCGCTTCAATAAAGCGCGCTTCAAA @@ -122,7 +122,7 @@ AACGGTGCCAGCATCAGCCAGTTTGAGCTGCATCTGCGGGCGATTACCGATCTGCCGTTA CCGCAACCAGTGGTGAATAATCCGTCGGTGATGATCAATCTGATTGGTAGCGATGTGAAT TATGACTGGCTGAAACTGCCGCTGGTGCATCTGCACTGGTACGACAAAGAAGTCCGTCCG GGGCGTAAAGTGGGGCATCTGAATTTGACCGACAGCGACACATCGCGTCTGACTGCGACG -CTGGAAGCCTTAATCCCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG +CTGGAAGCCTTAATCCNNNNNNNNNNNNNNNNNNNNNNNNNNCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG AGTAAGTTCGGTTAACTGGTGCTCTATTCTTGCCGGATGCGGCGTAAACGCCTTATCCGG CCTACCGATCCGGTACCCATTGTAGGCCTGATAAGATGCGTCAAGCATCGCATCAGGCAT TGTGCACCAATTGCCGGATGCGGCACCGGTTGTAGGCCTGATAAGACGCGTCAAGCGTCG diff --git a/test/data/annotate/genomes/A_H738.fasta b/test/data/annotate/genomes/A_H738.fasta index 279640c2a0dce53162a643f852636f5fbd2779f7..d4e777a5beede0b80cbed518ace578d27777050e 100755 --- a/test/data/annotate/genomes/A_H738.fasta +++ b/test/data/annotate/genomes/A_H738.fasta @@ -51,7 +51,7 @@ TTCTGAATTGATGTGGGTGTGGTTGCCGGGGATGCTACTGATGGGAATGTTGTGGTGGCG CAGACGATAACCGGATGCGAAAACTCGCATCCGGCAATAGCGCAATTACTTACGACGCCA GGTGGTCCCTTGCGGGCCATCTTCCAGCACGATCCCCATCTCGTTAAGACGATCACGCGC CGCATCCGCCGCCGCCCAGTCTTTCGCTTTACGGGCATCCAGACGCTGTTGAATTAACGC -TTCAATCTCAGCCACTTCGCTGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG +TTCAATCTCAGCCACTTCGCTNNNNNNNNNGTCGTCTGCCTGCGCGCCGCTTTGCAGGAACGCTTCCGG TTCTTGCTCCAGCAGGCCCAATACAGCGGAAAGTTTACGCAGGTGAGATGCCATTGCATT CGCCGCTGCCATATCTTCTGCTTTCAGACGGTTTACTTCACGCGCCATATCAAACAGTAC GGAATAGGCTTCCGGGGTGTTGAAATCGTCGTCCATCGCTTCAATAAAGCGCGCTTCAAA @@ -122,7 +122,7 @@ AACGGTGCCAGCATCAGCCAGTTTGAGCTGCATCTGCGGGCGATTACCGATCTGCCGTTA CCGCAACCAGTGGTGAATAATCCGTCGGTGATGATCAATCTGATTGGTAGCGATGTGAAT TATGACTGGCTGAAACTGCCGCTGGTGCATCTGCACTGGTACGACAAAGAAGTCCGTCCG GGGCGTAAAGTGGGGCATCTGAATTTGACCGACAGCGACACATCGCGTCTGACTGCGACG -CTGGAAGCCTTAATCCCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG 
+CTGGAAGCCTTAATCCNNNNNNNNNNNNNNNNNNNNNNNNNNCGCTGCTGCCGCCGGAATATGCCAGCGGCGTGATTTGGGCGCAG AGTAAGTTCGGTTAACTGGTGCTCTATTCTTGCCGGATGCGGCGTAAACGCCTTATCCGG CCTACCGATCCGGTACCCATTGTAGGCCTGATAAGATGCGTCAAGCATCGCATCAGGCAT TGTGCACCAATTGCCGGATGCGGCACCGGTTGTAGGCCTGATAAGACGCGTCAAGCGTCG diff --git a/test/data/annotate/genomes/complete_genome.fna b/test/data/annotate/genomes/complete_genome.fna new file mode 100644 index 0000000000000000000000000000000000000000..583e7b872877fbcb80e4a89ece5a0ce0371588ee --- /dev/null +++ b/test/data/annotate/genomes/complete_genome.fna @@ -0,0 +1,5 @@ +>complete +CCGCTTAGGCTAGCGCC +AGCTAGGAGCGCTCGAGAGACA +CAGCATTACNCCGATATTATAGAGGCCGCGCTTAGC +ACGCTAGGACGCG \ No newline at end of file diff --git a/test/data/annotate/test_files/list_genomes-func-test-default.txt b/test/data/annotate/test_files/list_genomes-func-test-default.txt index 0b6751d4ffbbbb196367df00254a07af68e0495e..ddd2dfb23d4a8ead62a49fb552101e7a03e377eb 100755 --- a/test/data/annotate/test_files/list_genomes-func-test-default.txt +++ b/test/data/annotate/test_files/list_genomes-func-test-default.txt @@ -1,3 +1,4 @@ B2_A3_5.fasta-changeName.fna::ESCO.1116 H299_H561.fasta genome6.fasta :: ESCO.1015 A_H738.fasta genome1.fasta toto.fst ::.1015 +complete_genome.fna \ No newline at end of file diff --git a/test/data/annotate/test_files/non-fasta.seq b/test/data/annotate/test_files/non-fasta.seq new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.ok.ffn b/test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.ok.ffn index 411b6c3092ce8c15a13cbce1b4f2814fd47952a3..512c2808013767ba0e436e66d01cf038c7b0881e 100644 --- a/test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.ok.ffn +++ b/test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.ok.ffn @@ -13,11 +13,11 @@ 
acgctagagagctcgcgctaagagatc CCGAATAGCGCGCTCAGAGAGAGAGGA CGATAGCTCTCGCA CCGCATAGC ->toto_00011 # 2419 # 3000 # 1 # a +>toto # 2419 # 3000 # 1 # a AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC ->toto_00011 # 3500 # 4000 # 1 # vfvfdv +>toto # 3500 # 4000 # 1 # vfvfdv CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA ->toto_00011 # 4632 # 5000 # -1 # fdf +>toto # 4632 # 5000 # -1 # fdf CCGAGATCGCGCGCGCTCTTCTCGAGA >other_header_00013 # 3399 # 4538 # 1 # fdfd AGCTCTCGAGAGGAGCGCTCGA diff --git a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.faa b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.faa index 83b9ead08b3d0068c58b6c06e4af5c82a0e8f19a..99568dd72b7890b01dcff2225e1e8f77e146841b 100755 --- a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.faa +++ b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.faa @@ -25,6 +25,8 @@ CGCTCGCGCA CCTATAGGAACCACCGGGG >zdsdf_00014 CAGGATAGCGCGCTCAGAG +>JGIKIPIJ_00016 +CCGAGGTGCGAGGTGTGTTGTGTGCG >JGIKIPIJ_03015 AGATCCGCGCGCTATAGAGC >JGIKIPIJ_03016 diff --git a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.ffn b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.ffn index da0303699ad58f2da76a3f28be2f82b9a91c452d..c68302f21a81747a5fcf87e64b0e7b84e91ceef6 100755 --- a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.ffn +++ b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.ffn @@ -19,15 +19,17 @@ AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA >JGIKIPIJ_00011 CCGAGATCGCGCGCGCTCTTCTCGAGA ->prokka_out_for_test -aagcgctctgcg -cgctcg >JGIKIPIJ_00013 AGCTCTCGAGAGGAGCGCTCGA CGCTCGCGCA CCTATAGGAACCACCGGGG >JGIKIPIJ_00014 CAGGATAGCGCGCTCAGAG +>JGIKIPIJ_00016 +AAGGGATATGGCCACACAGTT +>CRISPR_toto +CCGAGGTGTGCG +CCGGTGTGCGCG >PROKKA_02927 CCAGAGATCGCGCGC >PROKKA_02928 @@ -36,7 +38,5 @@ AGATATGGCGCGCTCTCTC 
AGATCCGCGCGCTATAGAGC >JGIKIPIJ_03016 AAGGATCTCTCGCGAGAGGA ->prokka_out_for_test -AAACCGGCTCGGGCA >JGIKIPIJ_03017 CCAGGATAGCGCGCGC diff --git a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.fna b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.fna new file mode 100644 index 0000000000000000000000000000000000000000..f207a5619240b74e2cfdc6aa6b3d986362af4d4c --- /dev/null +++ b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.fna @@ -0,0 +1,28 @@ +>JGIKIPgffgIJ +aacgcgcatccagcgctagagacgctctcgacgagc +cagatctgca +cacaacaggtcgcgctcg +cagagatgcccc +ccgcgttt +>toto +aaccggcctcgcgcatcgcatcagcagAAGCGCGGTTGTGTTNTNTNGGAGCGCGAGGTGTGTG +CCAGGTGTTGTGTNNNCGCCGAGGTGTGAGAGGGTGTGT +>other_header +acgctagagagctcgcgctaagagatcAGCGCGTGTGTGTNTNTTGTGTGCGAGAGCGCGAGTGTGGAGCGC +CCGAATAGCGCGCTCAGAGAGAGAGGA +CGATAGCTCTCGCA +CCGCATAGC +>my_contig +AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC +>bis +CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGACAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGACAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGACAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +>ter +CCGAGATCGCGCGCGCTCTTCTCGAGACAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA +GCCGAGGTGTGAGAGGGGCCGAGGTGTGAGAGGGGCCGAGGTGTGAGAGGG +GCCGAGGTGTGAGAGGG +>contname +AGCTCTCGAGAGGAGCGCTCGAGCCGAGGTGTGAGAGGGGCCGAGGTGTGAGAGGG +CGCTCGCGCA +CCTATAGGAACCACCGGGG diff --git a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.gff b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.gff index 51ad5ef01a8cc9cb608503d1fc87ad8de8a2442e..72133def73122882f7a9442633fb8e73d88e00ac 100755 --- a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.gff +++ b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.gff @@ -8,20 +8,21 @@ ##sequence-region contname 1 6009 JGIKIPgffgIJ Prodigal:2.6 CDS 287 787 . 
+ 0 ID=EPKOMDHM_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD -JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . - 0 ID=EPKOMDHM_00006;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00006;product=Major exported protein -toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00008;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00008;product=hypothetical protein -toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein -toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . - 0 ID=EPKOMDHM_00008;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00008;product=Major exported protein +toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein +toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein toto Prodigal:2.6 CDS 3500 4000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein -toto Prodigal:2.6 CDS 4632 5000 . 
- 0 ID=EPKOMDHM_00012;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00012;product=hypothetical protein -other_header Prodigal:2.6 repeat_region 296902 2968265 . - 0 ID=EPKOMDHM_00027;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P0A6C5;locus_tag=EPKOMDHM_00027 +toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein +other_header minced:0.2.0 CRISPR 296902 2968265 . . . note=CRISPR with 3 repeat units;rpt_family=CRISPR;rpt_type=direct other_header Prodigal:2.6 CDS 3399 4538 . + 0 ID=EPKOMDHM_00028;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=EPKOMDHM_00028;product=RecBCD enzyme subunit RecD my_contig Prodigal:2.6 CDS 4535 7888 . + 0 ID=EPKOMDHM_00029;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00029;product=RecBCD enzyme subunit RecB +my_contig Prodigal:2.6 CDS 888 45015 . - 0 ID=EPKOMDHM_00030;eC_number=56;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00030 contname Prodigal:2.6 tRNA 3039279 3039355 . + 0 ID=EPKOMDHM_00030;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=EPKOMDHM_00030 contname Prodigal:2.6 tRNA 3039389 3039465 . + 0 ID=EPKOMDHM_00031;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=EPKOMDHM_00031;product=RecBCD enzyme subunit RecC contname Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein contname Prodigal:2.6 CDS 9525 11285 . 
+ 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein -contname Prodigal:2.6 repeat_region 2994578 2994971 . + 0 ID=EPKOMDHM_00034;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00034;product=hypothetical protein +contname minced:0.1.6 repeat_region 2994578 2994971 7 . . rpt_family=CRISPR contname Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein ##FASTA >JGIKIPgffgIJ diff --git a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.tbl b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.tbl index 1d0e1027e1acd34f2ea8e6d83742262f4271a9b0..5ad8010d9e82d0aed9a3c26dc29455433492e9f5 100755 --- a/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.tbl +++ b/test/data/annotate/test_files/original_name.fna-prokkaRes/prokka_out_for_test.tbl @@ -38,9 +38,9 @@ locus_tag JGIKIPIJ_00011 product hypothetical protein >Feature other_header -2968265 296902 repeat_region +2968265 296902 CRISPR + note CRISPR with 3 repeat units rpt_family CRISPR - score 13 3399 4538 CDS inference ab initio prediction:Prodigal:2.6 locus_tag JGIKIPIJ_00013 @@ -51,6 +51,13 @@ locus_tag JGIKIPIJ_00014 product hypothetical protein db_xref 12345 +45015 888 CDS + inference ab initio prediction:Prodigal:2.6 + locus_tag JGIKIPIJ_00016 + product hypothetical protein + inference ab initio prediction:Prodigal:2.6 + inference similar to AA sequence:UniProtKB:P32 + db_xref 56 >Feature bis >Feature contname 3039279 3039355 tRNA diff --git a/test/data/annotate/test_files/prodigal.outtest.wrong-end.gff b/test/data/annotate/test_files/prodigal.outtest.wrong-end.gff new file mode 100644 index 0000000000000000000000000000000000000000..6fc1afe3b6959671a608d1f49b4d922020c48d74 --- /dev/null +++ b/test/data/annotate/test_files/prodigal.outtest.wrong-end.gff @@ -0,0 
+1,2084 @@ +##gff-version 3 +##sequence-region JGIKIPgffgIJ 1 9603 +##sequence-region toto 1 22446 +##sequence-region other_header 1 51012 +##sequence-region my_contig 1 31459 +##sequence-region bis 1 6009 +##sequence-region ter 1 6009 +##sequence-region contname 1 6009 +JGIKIPgffgIJ Prodigal:2.6 CDS 287 787 . + 0 ID=EPKOMDHM_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein +JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD +JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12002 . - 0 ID=EPKOMDHM_00006;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00006;product=Major exported protein +toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00008;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00008;product=hypothetical protein +toto Prodigal:2.6 CDS 1279 2347 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein +toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +toto Prodigal:2.6 CDS 3500 4000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein +toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00012;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00012;product=hypothetical protein +other_header Prodigal:2.6 CDS 3399 4538 . + 0 ID=EPKOMDHM_00028;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=EPKOMDHM_00028;product=RecBCD enzyme subunit RecD +my_contig Prodigal:2.6 CDS 4535 7888 . 
+ 0 ID=EPKOMDHM_00029;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00029;product=RecBCD enzyme subunit RecB +contname Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein +contname Prodigal:2.6 CDS 9525 11285 . + 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein +contname Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein +##FASTA +>JGIKIPgffgIJ +TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT +AAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGA +GGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCA +TTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATA +ATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTT +CCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGC +TAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAA +AGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAG +CGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAA +CGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACA +GGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGA +CCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAA +AGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAA +CGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAA +TGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTG +AGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCA +TTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGC +GCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGG +TTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTA +AACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTG 
+GTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGG +ATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTG +GTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCT +CATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATA +TTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCT +TCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACC +GCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGAT +TAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCA +GCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACG +CCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGC +AGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATC +TCGGCACCGGCAATCAGGTCAAAATTCCGTCCGAAGTGATGATCCCGGAAACCCGCGAAT +TTGAATTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGAATCGCGATTACGCCT +GCTTCTTCTCGGCGAACTCTGCCCAGAAACCGGCGTTGTACGATACCGCTGACGCCACCG +CCAACAGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATT +ACCTGAAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAAC +TGGAGCTGAATACCTGGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAAC +TTCAGGCTTCGCATCCACTGCGCGACGGGAAAGTTATCGTCGAGGACATAGAGGACAATC +CGGGCTTCTTCCGCGTCAGACTCTTTGCCGTGCCGCATTTCCAGATTGAAGGGATGGATA +TCAACCTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGATCGGGCGGTGGTGTGA +TGTATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTT +CAGCAGCAGGCCCGCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGC +CATCCGTGGGGGATCGCAAACGTGCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTG +AAAACGCAGGCAGTACGCCTGCGTTTTGCTGATGGCACGCTGATCGATTCAGACGTGAGT +GACGTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACGACAGCGCGATTGTTTTG +CTGGCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCAGACTGAA +AGACCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGT +GAAGATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAG +GATTACATCACCTGCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAG +GATGAGAGCTATATTCCGCCGTTACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGT +CTGGACACATTGCTGTTGCAGCTACGGGCGAAGTGCCAGCGTCTGATGGCGATGCGCCGG +GAAAGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCTCCCTGTTCTGGCTGCTT 
+AACGCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGCTGTCCAC +CCCGAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTT +GAGCATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCG +CCCCTGTTCTCCCTGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCG +CTGGATCTGGCGTCCCTGCCGGGCAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTG +CGGGAAGAGGCCGATTTTTATCTGTCCGTTCGTTCCTCACTGCCTGCGCATCAGGTACTG +CATCAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATGTCACGCTGCTTATCAAC +GTGGCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCTGCCGCTG +CGGCTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTG +GAGTCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTG +TTTGCGGTGCTGCGCACATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCG +ACACGTTTCTGACGGTGGTGGAACTGCGTCAGGGAACCACCGTGCGTCACGGTATCGAGC +TGTATCGCCACTGTCAGCGGCAGGTGGAACTGGTCCGCGAACGTCTGAAAGATGCCGGAT +TCAGTCGGGAGAACGTGGAGCACATAACTTACGCGCAGTGCGCCCTGCTGGACGAAACGG +TGCTCAGCCGTAGTGGCATGGACGACGGTCAGGCCATCTGGATGAAAAACCCACTCCAGT +CGCATTTCTTCAACACCCTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGC +TACAGGAACCCGCCCCCGCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGG +GATTTCGCGGGCGTTATCAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGC +TCAACGGGCAGGTCGCGCCATTTGGTGTGCTGCCGGAAACGGCGGTACTGAACGTGCCGT +TATCCACCCGTCAGCACCCTTTGCTGCATTCGCCATTTTTCTGGCTGGTAACACTGGCGC +TGCTACTGGCGGGCGTCTGGTGGGGGCTACACCACTGGCTGAACGTGCTGGTGGATGAAC +TGCTGCCGCAAAGCCTGCGTTAAAGGGAGTCGTGAGTGAGGAACACGCTGAAACAGGCCA +TCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTGTGGTCAGTGTTTATCAGTCCGTCTG +GCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTTCTGGCGGTTGCTGCGTTGTTGATTT +ATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGCGATGCCGGGTTGTCATCGCTGCCGC +CGGAAACCTACCGGCAGCCGGTAGTGCTGGTCTGCGGCGGTCTGTCGGCGCACCTGTTCA +CTGACAGCCCGGTCCGGCAGGTTTCAGAAGGGCTGTATCTGCATGTTCCTGATGAAGAAC +AGCTTGTGGCGCAGGTGGAGCGATTGCTGACCCTTCGCCCGGCGTGGGCATCGCAGCTTG +CCGTGGCGTATACCGTCATGCCCGGCATACACCGGGATGTGGCGGTTCTGGCCGGACGGC +TGCGACGGTTTGCCCACAGTATGGCGACGGTGCGTCGCCGGGCGGGCGTAAACGTCCCCT +GGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTGCCGGAAAGAGCGAGTTCACCGTGGT +TTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACATCCACAGAGACCACCATGCCCGCGC 
+AGTGGATTGCACAATCCGGCGTACAGGAGCGCAGTCAGCGACTCTGTTACCTGCTGAAAG +CTGAAAGCCTGATGCAGTGGCTGAATCTTAATGTGCTGACGGCACTGAACGGCCCGGAGG +CGAAATGCCCGCCACTGGCGATGGCCGTGGGGCTGGTCACCTCGTTGCCAGCGGTGGATA +ACAACCTGTGGCAAGTGTGGATCACCGCCAGAACCGGCCTGACGACGGATATCGCGGACA +CCGGCACAGACGCCACGCTGCCGTTTCCGGATGCTCTGTTACGGCAGTTGCCGCGTCAGT +CGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACCATGCTGGGCATTACCACCGCGGCGG +GTATCACCATGTTGTGCCTGTCAGCCACGGCAAATCGCCAGTTATTACGGCAGGTCGGTG +ACGATCTGCACCGGTTTTATGCCGTCCCGGTGGAGGAATTTATCACCAAAGCCCGTCACC +TGTCGGTGCTGAAAGACAATGCGACCATGCTCGATGGGTATTACCGGGAAGGAGAACCAC +TGCGCCTCGGTCTGGGGTTATACCCCGGCGAACGCATCCGCCAGCCGGTATTACGCGCCA +TTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAGGTGACGGCTTCGCTTCAGGTTCAGA +CCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTCGGACAGGCCCGCCTGAAAGACGGCT +CGACAAAAGTGCTGGTGGATGCGCTGGTGAACATCCGGGCAAAACCGGGCTGGCTGATCC +TCGTGGCCGGATATACCGACGCCACCGGCGATGAAAAAAGCAATCAGCAGTTATCGCTGC +GGCGTGCCGAAGCGGTGCGCAACTGGATGCTGCAGACCAGCGACATCCCGGCCACCTGTT +TTGCCGTACAGGGACTGGGCGAGAGCCAGCCTGCGGCGACCAACGACACGCCACAGGGCC +GGGCAGTCAACCGGCGTGTCGAAATCAGTCTTGTTCCGCGTTCTGACGCCTGTCAGGACG +TGAAATAAAACATACCGCCGGAAGAAGGCGGTGCTTCAATCACACTAACAAGGAGAGTAA +TTCTCATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAG +GTTCCGTGGACGTTCAGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATG +TGTACATCCCGACCGACAATAACACCGGCAAACTGACCGGTACCCGTACTCACAAGCCCT +TTACGTTTACCAAAGAAATCGATGCCTCCAGCCCGTATCTCTACAAAGCTGTGACCACCG +GACAGACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACGATGCCGGTCAGGAAG +TGGAGTACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCTTATGC +ACGACATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCT +ACGAGAAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATG +AGCGTCCTTCCGCCTGATAACTGCGGCAGACAGGAAACTGTCTGCCTTTTTGTTGTGTGC +TTTGTCCAGTGCCGCAGGCACCGGTACTGAGCAAAGCATACCCACAATCTGGTGAAACCT +GATGGGCCTGAGTGAGGTAACGGCTATGGGCGGTAGCGTGCCTGAACGCGGATCGCAGGA +ATACAGAACACGATAAGGAACCCTTCTATGACAGGAAATCACTCCGCCGCGCTGCTGCGT +CGCCTTAACCCATACTGTGCACGGGCGCTGGACGCTGCCGCCTCACTGTGTCAGACCCGC +GCCCATGCGGAAATAACCATTGAACACTGGCTGCTGAAACTGCTGGAGCAGGGAGAAGGC 
+GATATCACGGTGATTGCCCGCCGCTATGAATGGGATATCGACACGCTCTGGCAGTCTCTG +CTGGCACATCTGGACACCTTACCCCGCCCGGTCCGCGAACGTCCTCAACTTTCTGAACCG +CTGGCAGCGCTTATCCGACAGGCGTGGCTGATAGCGTCACTGGAAGGCGACGATCCACAA +ATCCGCAGCCAGCATCTGCTGATGGCGCTGACAGAAAAACCGATGCTGCCCGCCTGTAAT +GACCTGTGGGTATTGCTGAGTCTGAGCCGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTG +GATGCGCAGTCGGATGAATGTCCGGCACGTCAGCCACAGGTCACCGAACCGCTGACCTCT +GCACTGCCGGAGACGGCAACGGCGGACGCACCGGCAAAAACGCTGACGGAGAAACAGGAT +GACGCCCTGCTGGCGGTGCTTAACCGCTTTACCGAAGACGTGACGGAAAAAGCCCGCAGC +GGGCGAATCGACCCGGTATTCGGGCGCGACACGGAAATTCGCCAGATGGTCGATATCCTC +TCCCGTCGCCGCAAAAACAACCCGATTCTGGTGGGAGAACCGGGGGTGGGCAAAACCGCG +CTGGTGGAAGGGCTGGCGCTGCGTATCACCGAAGGCAACGTGCCGGACAGCCTGAAAACG +GTGCATATCCGCACACTGGACCTCGGTCTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAA +TTTGAACAGCGGCTGAAAAATGTCATCGATGCAGTGCAGAAATCACCGGAGCCGGTACTG +CTGTTTATTGATGAAGCCCATACCATTATCGGTGCGGGTAATCAGGCAGGCGGCGCGGAT +GCGGCGAACCTGCTGAAACCGGCACTGGCAAGGGGCGAACTGCGCACCATCGCGGCGACC +ACGTGGAGCGAATACAAACAGTATTTTGAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAG +ATGGTTAAGGTTGACGAGCCGGATGATGACACCGCCTGTCTGATGCTGCGGGGACTGAAG +GCTCGCTATGCACAGCACCACGGCGTGCATATGCTGGACAGCGCCATTCAGACCGCCGTG +CGCCTGTCGCGCCGCTATCTGACCGGACGCCAGCTGCCGGACAAGGCGGTTGATTTGCTG +GATACCGCCGGGGCAAGAGTCCGCATGAGCCTTGACACCCTGCCGGAACCGTTGACGCAG +CTTCATGCGCGACTGGCGGCACTGGATATTGAGCGGGAAGCGATTGAGCAGGACAGCGTA +TTTTATCCCGAAGCCAGCCCGGAGCGGCTGGCGGAACTGACCGATTTGCGTGATGAGCTA +CAGGCAGAAGCCGGGCATCTGGAAGCGCAGTATCAGCAAGAAAAGGCACTGGCGCAGCAG +ATTATGACGTTGCGTCAGGAAGGAACAGACAGCTCTGAACTGCAACAGCAACTGCGGACG +CATCAGGGCTTTGCACCGCTGCTGGCGCTGGATGTGGACGCCCGCGCCGTCGCCACGGTG +GTGGCGGACTGGACCGGCATCCCGCTCTCTTCCTTGCTCAAGGACGAGCAGAGCGACCTG +CTCAGTATGGAACAGAGTCTTGAAAACCGCGTTGTCGGGCAAAGCCCGGCGCTCTGCGCC +ATCGCACAGCGGCTGCGGGCGGCTAAGACCGGCCTCACGCCGGAGAACGGCCCGCAGGGG +GTATTCCTGCTGACCGGCCCCAGCGGCACCGGTAAAACCGAAACTGCGCTCACACTGGCC +GACACTCTGTTTGGCGGTGAAAAATCCCTTATCACCATTAATCTTTCGGAATATCAGGAA +CCGCATACCGTTTCCCAGTTGAAAGGTTCGCCTCCGGGCTATGTCGGCTACGGTCAGGGC +GGCGTGCTGACCGAAGCGGTACGCAAACGCCCTTACAGCGTGGTGCTGCTCGACGAAGTG 
+GAAAAGGCGCATCGCGACGTGATGAACCTGTTCTATCAGGTGTTCGACCGGGGCTTTATG +CGCGACGGCGAAGGGCGGGAAATCGACTTCCGTAACACCGTGATTCTGATGACCGCCAAT +CTGGGCAGCGACCACATCATGCAGCTGCTGGAGGAAAAACCGGACGCCACGGACGCAGAC +CTGCATGAACTGCTGTACCCCCTGCTGCGAGACCATTTTCAGCCTGCACTGATGGCGCGC +TTTCAGACGGTGATTTACCGCCCGCTGGGACAGGAGGCGATGCGCGCCATTGTGGAAATG +AAACTGGCGCAGGTGGCCCGCCGTCTTCACCAGCACTATGGGCTGGAAACGGAAATCAGT +AACAGCCTGTACGACGCCCTGACCGCCGCCTGCCTGCTGCCGGACACCGGTGCGCGTAAT +ATCGACAGCCTGCTGAACCAGCAAATCCTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAG +CAGGCCGTGCATCATAAGCCTGCCCGACTGCGGCTTGACTGGGATGATGAAGACGGGATT +GTGCTGGAATTTGATGAGAAATAATGGAGGCTCTTATGAACGTACAGTTCTTCGACCACG +CACACCACAAGCTCAAAATTCGCGGCCTGAAAAGCCCGGTGGACGTGCTGACGTTTACGG +GCCGGGAACAACTCAGCGCACCCTTCCGCTACGACATTGAATTTACCAGTACCGATAAAA +CCA +>toto +CGATCTGATAGCTAATTGTAAGAAGATAAAGGAAGGCAACGATAAAAACGAGGACACCAC +CTGGGCATGGGTAGCGATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTT +AATTAAAGGGATCTTCAAAGTGCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAG +GGATATTGTACGAGCGATTGATGCTTCCGTTTCCCTGTTTAATAAATTTATCGATTTGCC +AGCCGTGCAGGCGACAATGAAGTGGATGAAGATTTATAACCCGTATACGTATGCTGAGAA +GCAGGTCAGGGAACTGATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAAGCTGGATGA +GTTAATGGACGTCACTGGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCAT +TCGCCAGCCGATAGAGGTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACAC +CATGCTTGCAAAAGCGCTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCT +GCACCGGGAAGGGGACGATTATTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTC +TCGCCTGAAAGATGCTGAAGAGGTGGAATTGCTGGCTACCAAAAAGCCAGACTGGGCGGA +TATTGGGGGTAAAGAAAAATATCCACAACTGGAAAAAGCCAGTGCGGAACAGAAAAGATT +AATGGACCCGGAGAATAAGGAGGGCGGCTACCCGAATATTCCTGATGATAAAGTGCAGAC +TTTTCATCAGATGGCTCCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGA +CCCTGGCAGTAGCGATAATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAA +GAGTAAGTCTCAGTGGCGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGA +GTATGTAGTTTATACCGTGCCACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGC +CTCTCAGGTGCGTGAAGTCACAGGTAAGAATGGAGAGAACATTAAAGTCGTGCTGGAAGG +CGGATCACTTCAGATAGTGATAGATCCGACCGTTCTGAATTTGGACTATTTGGGGAAACG +TCAGTCTACAGGATGGGGGTATAGAGATTTTTCTGATGAAGTGGATATGTATATAGGTGT 
+GCCTCAGTTGCAAACAAATATTTATGTACCTAAATAAAAAGTATCAACAGACAATTAATT +GATAAATCAGGAGATAAAATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGA +ATAATGTCGCCGGAATATTATCGGCGCCGTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTG +TGCGAACGGCAAGTGGCGGAGTGGAGCAAGACCATTCCGCTGGATGTGCGCCGTCGTCCG +CTGTACGAGCAGATTGACGCCGTCTGGGGCGGGCGGGTGTTGCCCAATATCCGCAGCACT +TTAAAGTCGGTACAGTATGACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGCAA +TCCGGGGGCAATATTAGCAGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATG +TCACCCGCCGCGCAAAAACAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAAT +CTAATCAGACGTACCTCGGGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAG +GAAAGTCTGCACGGCCCGCTGGCCCTGCCGATGCAATTACCGTTGTATGAGCTGGATAGC +AGCGTATACCTGCGTGAGGATGACCCGGTAACGGTGGCTGGCCTGTATCTGCCGGATATC +CCAGATGCCAGCGCCCAACTGTTGTACCGGAGTGAACATATTCCCGAGGCTTGGCAGGGG +CGGGTACGAACGAAGTATGTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCGGG +GCGTGGGCAAAATGCAACTGGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTG +CCGCCGGAGGGATTTTTCCCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGC +GAAGCGCAGTATGTAACAGACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCT +CATAGCGGGGAGTGGTCGATTTTTGTAGAAGGTAGACAAGCGACGGAGACGCTGGAGCAG +GGAGAGCAGATGCCGGAATGGACGGACAGGAAAATGGAGGGGGAGTATAAAAGAGGTGAG +AAATTCCATGTGCTGTGGTCGCTGATGAACCGCCACGATGGCGGGTCGGTGTGGGTGGAA +GCGTAGCGGTAGCTGGATGTACACGTAAAAACCGGGGAATGGGTGATTTTATTCTGGTTT +ATACAGGAGAGATGAATAATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACA +GTATCAGACAGTGTTTATGCGGATACAGATCAAACATATGATATTTTTTGGGGAATGCTG +GTAAAGGATAAAAAGGATACTATATTTGTTCGCTGTGACAGTCCGTTATTGAAAATGAAA +ATTGTGAGAATGGCGGATGCAAATACAGAAAACATTGATAAGGCATACCAGATATTTAAT +CAGAAAACGAAAAAATCAATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGAGT +GGAAAGTATATTTTCAATATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTG +TCCGATGTGCTTAATGCAATAGATGAACAGTTTCGATAGTTTCGGATAAAATTGTTATTT +TATGCTTTCTTTTTTGATACGTTACGTCAGGTCGTTGTTTTTATAAATCAACAACCTCAT +TTATTAAATAACATAAATCAAAAGCAATGCCATTATGGCCAATGAATTTCAAGTGGATAT +TAAATCTGTTTATTATAAATTTTCCTATTTGTGTTGAAACACCTCTTAAGACTGAATGCT +GAATTACTATATCAAGAGTCACATCAATTCATTATTTCTGATATTAAATTTAATGTTTTA +TTATTTTTATAATATTTAATATTAAAACTGCAATTTCCGTAAAATTATAACATTATGGAG 
+GACTCAACCATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTT +ATATCTGTGTCATCTTCGATGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAG +ATAAACTGCCCTGTTAAAGGGCATGGTATTAATACCATCATCGAGGGGAGTTTTGATTGG +ATTTCTGATGGCAAACAGGTCGTCGTGAATGGCTGCAGGTGTGAATGTGGCTGTGTTGTT +ATATCCAGTATTGCTGATGCCTTGATTGGATGAATATTATGGGATGGAAACGGACGTATA +CAGAAGAAATAGACAGGCCACAGGATATTTACTTTCATAAGTGGTTATTTTCTTTATTTA +TTTTATGTATATTATTACTCGTTATTTATTATTTTTTCCATGAATTTGTTGTAGCTAATA +ACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTGTGGGTATTGATTCTTTCAGTAC +AGGTAATATTTTATTCCAGAGCTATTCAGGATTATTCAATTTGGCTGGAGAACAGACTTA +GTATCAACAGAGAGTGGGAGGCATGGGGATCAAGATATGTTTCTGTTATGAATAGTAGTC +TTCATCTTCCTGGAAAAGTCGATGTTTTATTCTTGTCTGGTGATGAATTAGAAACTCAGT +ATGGACTTGTCAATAAGTCAGATGATATCACATGGAAGCAACATGATTGGTATGCCTGCT +TTCAGACCCTTACTAATCATCTTGAACTTTATAAACTCCCATATCAACTTACACAAGAAT +TTATTATTCTTACTGATTTTGATGAAAGTATGTACTCTCAGATTGAAGAGGACTTTTTCA +GAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTTTTGTTGCATATTTCCCCTTCAA +TGTCCTTTGGAGAGCTTGATTTATGGTTAAAGGATTCCGAAGAGAAAATATATATTGTCA +TGGTGTTGCAGATGGAGGAGCAAACATCCTGTTCGGACGCTATGGCTTGCCTTATGTTTG +CAACTGATGATGTTACTGCTAAGTACAAACTCACTGAAAAGGCCAGAATTTATCGCCCAA +TGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAATATTTTTATTGACACACAAAAAA +TATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAGCGTCTGTTTTCTGTGAGTAGTA +ATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTGAAAATTGATAATATCCATCTTT +TAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTCTGGTTAACGGCAGCGCTGACTA +TTTCGGTGGTTGTTCACAAAAATTCAGATTACTTGATGATGTCCGAAAATAATGATGACT +GGATCATTACCACCATTCATCCTATGGAGCATTCATGAAGAGAATAAATAAAAAAAGTGT +TTTTATATCTAATGTACTTTTATTCTTGGTTATTGTGGCCTTCGTGGGGGGGATCATCTG +GCGTTTTGGTGATCATTTTGGACTGAAAGGGGATGAAAATAATTTTTTTGCGTGGTTGAT +ATGCATTATGACCCTCATTTTTGTACGGGCATCCTGGTATTTCTCTCGATTGTATCGCCT +ACGAAAGGAACAACATCACTCCGAAAAGGAAAGATTACGCCCGGAGAAAGAGGCTCGTAT +TGAATATGGCAAGGTCATAACCCTGAACATTGAGCTAGCTGAGTATTTATGTGCCCTATA +CGGCCCATTCTGGCGGCGTAAAGTCCGCCTGCTGCTGGTGACCGGCGAGCCTGAACAGGC +AGAGGCCATCGCGCCGGGGCTGACCGGGCAACACTGGCTGGAGGGCGACCACAAGGTGCT +GATATATGGCGGCAGGCCATCAGCGGAGCCTGATGTCGCGCTACTGACCGCCTTAAAAAA 
+ACTGCGCCGCAGCCGCCCGCTGGACGGCATCATCTGGCCGCTGACAGAAGAACAGAGCCG +CCAGACAGCGCAACTCGACAAAGGCTGGCGCGAACTGATAAACGGCGGTAAGCGACTCGG +TTTTCAGGCTCCACTCTATTTGTGGCAGGTCTGTGACAACGGTGATTATCAGACCGGACG +CCCCCTGCAAAGCGTCGGCTGCCTGCTGCCGGAACGCTGTACCCCGGAACAACTGGCTGC +AATGCTGGAAGCACAAACCCTGCCGCTGACGGAACAGGGCATGTCGCAACTGCTGGCAGA +TAACCGCCATGATTTCCTGCTGCGTCTGGCCCATACCCTTGCAGAGCGGGGTATCGCTCA +CTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGCGGCGCATTTTCTTCCCTGCGCCTGCG +TGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTGCCGGAGGCCGCACCTCATGCGTGGCT +GCCGTCACCGGTCTGGGCGGGCGTGACGGGTGATAACGCGCGCGGGCGTGCAGTGGGCTT +TCCGTGGCTACGCGCCGCGCTGATAACCAGCATCTGCATGCTGGCGATATGGGGGGCCGG +AATGACGACCTCGTTCTTCGCCAACCGCGCGCTTGTTCAGGAAACCGGTATCCAGACGGC +ACGTGCGCTTGATACCCGCCTGCCGCTGGCAGAACAACTGGTGGCGCTGCATACCCTGCA +GGGCGAACTGGAACGCCTGCAATATCGTATCCGCGAAGGTGCGCCGTGGTATCAGCGTTT +TGGCCTTGAACGTAACCAACAACTGCTCGCCGCCGCTTTTCCCGGCTATGCGCAGGCGGC +AAACCGGCTGGTGCGCGACGTGGCCGTTGACCATCTGCAACAGCAACTGAACGCCTTTGT +CGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCCACCGGTGAACAACGCTATAAGCAGCT +TAAGGCATTGCTGATGACTTCCCGCCCGGAAAAGGCCGACGCTGCCTTTTTCAGTACCAC +GCTGATGGCGGACGGTCTGCGCTACGAGAATATCCCGGAAGGTGTGCGGCAGAGCGTGTT +GCCGTCACTGCTGACCTTCTGGATGGCGAACCTGCCGGAACACCCGCAGTGGAAAACCGC +ACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAAATCCTGCTGCGCCAGATTGGTGTGCG +TAATGCTGAAAACACCCTCTACCAGAACGTGCTGCAACAGGTGTCCCGCAACTACGCCGA +TATGACGCTGGCGGACATGACCGGGGATACGCTCACCGAATCTCTTTTCAGTACGGAACA +GACAGTGCCGGGGATGTTCACCCGTCAGGCGTGGGAAGGACAGGTCAGGGAAGCCATCGA +GCAGGTAGTGACGGCGCGGCGCGAGGAAATCGACTGGGTACTCAGCGACCGCCAGCAGGA +TACCTCTGCGGATATCTCGCCGGATACGCTGCGTAACCGTCTCACCTCACGCTACTTTAC +CGACTTTGCCGGAAGCTGGCTGGCGTTTCTCAACAGCATTCGCTGGAAAAAGGAAGACTC +GCTCTCCGGCATTCTCGACCAGCTGACACTGATGGCCGATGCCCGTCAGTCGCCGCTGAT +TGCGCTGACCGATACCCTCGCGTGGCAGGCGGCGGCTGGCAGGGAAAACCGTGGCCTGTC +AGACTCGCTGGCGAAATCGGCACAGGAACTGTTTAACGGCAAGGAGAAAACGCCGCAGCA +ATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTGGATAAAACCTTCGCGCCGCTGCTGCG +GTTGCTGGGCGATAAAGCCGGAGGCGGAGACAGCCAGCTGAGTCTGCAGACCTACCTTAC +CCGCGTTACCCGCGTGCGCCTCAAACTGCAACAGGTGACCAACGCTCCCGACCCACAGGA 
+GATGACCCAACAACTGGCGCAGACAGTCTTGCAGGGCAAAACCGTTGACCTCACCGACAC +CCGCGACTACGGACGGTTAATCGCCGCCAGTCTGGGCGAGGAATGGAGTGGCTTCGGTCA +GGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGGCGGCAGGTGCTGACGCCTGCAGCGGA +CAGCCTGAACCGCCAGTGGCACCGGGCGATTGTCAGCCACTGGAATCAGGACTTCGCCGG +GCGCTATCCGTTCAAAGCCTCACAGAATGACGCTTCCCTCCCCCTGCTGGCGCAGTACCT +GCGCGATGACGGGCGCATCAACCAGTTTATTGCCGCCAACCTTTCCGGCGTTCTGAAACG +TGAAGGCCGCTACTGGGTGGCTGACGCCATGAACACGCAGGGGCTGACGGTCAATCCGGA +CTTTATCCGCGCCCTGAACCGCCTGCGCGACGTGGCCGATACCGCCTTTGCCAGCGGCGA +TGCCGGGATACATTTTGAACTGCGGGCAAAACCGGCCCGAGACGTGATGAAAACACATCT +GGTGATTGACGGGCAGGAACTGGAATATTTCAACCAGAAAGAACGCTGGCAGCGTTTTAA +CTGGCCGGATGAACAGTGGCAGCCCGGCGCATCGCTGAGCTGGACCAGTACGCAGGCGAT +GGAGCGCATACTGGCGGATTATCGGGGAAGCTGGAGCCTAATTCGTCTGCTGGAACAGGC +GCAGGTGACACCGGTGGACAGCAGCACCTTTAAAGTGGTGTGGAAAGCGCAGGACGGCCT +GCCACTGAATTACCTGCTGCGGGTTGAACAGGGAAAAGGGCCGCTGGCGCTGCTGGAACT +GAAAAACTTCCGCCTGCCGGGACAGGTATTTCTGACCGGCAGGAGTATGAAGGATGCGGA +AGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGCTGTTTTG +CCGACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACATGGCTGC +TGCCGGTGACGGCAGACACGCCGGTCGGGGAAGACCCCGGCTACCACGACGATTTCCTGC +GTATCCGCGACGAGATGAACAAACTTTCCGGCGCGGATACGGACCTCATCTGCCAGCTTG +CCGAATCCCTGCTGCTGACGCAGGCAAAAGACGTGCGCATCGCCACTTACTACATCTGGG +CGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACTGGCGCTGCTGACCGGAC +TGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAAATGGCGC +TGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAAGTGGCAA +AAGAGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTCGCCGCAT +GGCCCGAAGACCAGCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAATCACGTC +TGGCGCAGTCGGGTGGGATGAATGCGGTGGTGCCGCAAAACAGCAGCAGCGTTCCTGCAC +CGTCATCCCCGGTGGATGCGCCACAGGTACAGACCATCACCTCCGGGCGCGACCTGCTCG +ACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCAGGGCTGGCTTTCAGCAC +ACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGATGTGGACG +GCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGGCTGTATG +CCCAGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACCGGTGTCA +GCCATTTCTGGCTGGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCGGGCGCAC 
+CGTGGGACAGGTGGACAGCCGTTATCCGTCAGGACCTGACGTTACTGCTGGAGCGCCTGC +CGGGACTGGAAAATCTGGCATGGAACGACGGCACACCGTTCGCCGACGAGGTGACGCGCA +ACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATGGCTTGCGGGGAAAGCCG +CTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCACTGGCGA +TGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCGGGCATCA +CCACGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAACAGTACG +GTAAAAACGAGATGGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAGGGAATAA +CGCTGACGCAGTGGGAGCCAGAACTGCTGTTTGAAGTAAAAGCCCGGCAACTGAAACTGC +TGCGCCTGCGGGCACATCGCCACGCGGACAAGGCGGCGCTTGCCCGGAAAATGGACGCTC +TGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGTACTGTGTGATACGCAGC +ATAAGGACTGATTTCTTATTTGTATTTCAGATTAAAGGACTTTGATGGACGACCTGACCC +AACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGTAAAGAATTTGCGCAGG +CTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGCGCACGCGATCCCTATG +TGGAGCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTGCGCGAAAAGCTGGACG +ACGATCTGCCGGAACTGACTGAAGGGCTGGTCAGCCTGCTGTGGCCCCACTACCTGCGAA +CCATCCCGTCACTTTCCGTGGTTGAACTGTCGACAGATCACCGGCAAATGAAGCAGAGCG +AAACGCTGAGCGATTTTCAGGTATTGTCGCGCCCTGTTGGCGAGCGCAGAACCCGCTGTT +TCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTGCCGGACGTGTCATTGC +AATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCTTTGAATGCGGCCCGCTGGTCG +GCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTCAATGCCGACAGCCCGG +TAGCCTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAGTTCTGGCTGCGTCTGC +CGGGGCAGGATCGCCGGATGCTTGGCGCACACTTTTCCCCGATGGGCTTTGAGGATGATG +ACAGGCTCTGGCCAAAAGGTGAGTCAGCCTTCAGCGGTTACCAGTTGCTGCTGGAGTATT +TCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCTGAACGGGCTGGAGCAGGTTGCATGGC +CGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAGAACTGGCCTCACGACC +TGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTCATCAACCTGTTCCCGC +TCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTTCTGCTGCGCCCGATGC +GCATTCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATTATTTCTTCGCGCCATA +CCGGCAGTCAGGCATATGTCCCCTTTTCCAGCTTTCGTCACCGGGGCGGGATGCTGCGCC +ACGATGCGCCGGAACGCTATTACCACACGCGGGTAAAGCGCGGCCCTTCCGGCTTGCACG +ACACATGGCTGATTCTGGGCGGCGATGCGTTTGATTCCGACCGGATGCTGGAGGATGAAA +CCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGTAAAGCCTTACAGAGCA 
+CCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGGGTGCGCAACCTGTGCG +CCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCACTGGCGGGTGCTCAGCC +ACCTCGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATTCTGCGCGGCACGCTGG +CGCTGTACGACTGGACCGAAAGCGAGATGAACCGCCGTCGTCTGGAGGCGATTGTCGACG +TTCAGCACAGCCTGATACAGCGTTTTGAAAGAGGCTTTCTGCTGCGTGGCGTGGATATTC +AGGTGACGCTGGACAGTAACGGCTTTGCCGGAGAAGGTGATATCACGCTGTTTGGTGAAC +TGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTCACTCAACTGACCTTAA +TTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCACAGCCAGCGCGTACCGG +GCTGACCGACCGGCTGGCCCCGGATATTGCGCGGATCAATTTTTACCGTTTTTGCCAGTT +GCTGGAACAGAGCCAGCAGAAAGCGCCGCTGGGCAGTACCGACAACCCCGCCGCCGATGC +GGTGCGTTTTCGCCCCCATCCCGGAATGGGCTTTCCGGTCAGCGAGTTAAAGAACGTTGA +ACGTGACGTGGACAATCCCGACGCGCCACCCACGGTGCGCACCACCTTTCTCGGCCTGTA +CGGCGTGGATTCACCGCTGCCCACCGCCTATCTGGACTACATTACCCAGCGTCATGACGG +ACATGACGCAGTGATGGCGTTTCTCGATATTTTTAACCATCGCTTTATCACCCAGTATTA +CCGCATCTGGCGCAAATATAACTACCCGGCGTCGTTTGAAGCAGGTGCCGTGGATGACAT +TTCCCGTTGTCTGCTGGGGTTAATCGGGCTGGGTATTCCCGGCAGCGAGAACCATATCGC +CACGCCTGTATCCCGTTTTCTGGCCCTGCTCAGCGTGATGCGCCTGCCCACCCGCACGGC +TGAAGGCGTCACGGCACTGGTGGGGCTGCTTGCCCCGCTGACGAAAGCCACGGTGGTGCC +TCACGATCCGCAGCCTGTAATTCTCCCGGCCCCTGCGGGTCTGTCAAAAAATTCACGCAT +CAGCCTGAAAACGCGAACGCTGCTGGGGCGTACCGGTACCGACGTCAACAGCCAGTTGCT +GCTGAAACTGTATACCGAAGATGCCGCAGAAGCACGTGGCTGGCTGCCCGGCGGGCAACT +GCACAGCGATTTGCTGGTGCTGCTGCGCGTTTATCTGGGCTGGCGCTGTCAGGCCCGTCT +GCAACTGACGCTGCCCGTCAGCCTGTTGCCTGCTGCCCGGCTGGGAAAACAGCGTGTACA +GATTAGCCGTACCGGCATCCTTCTCGCCTCCTTTGCCGCGCCCGCGACCGGAACAGTGAC +GGTCAGTCTGGGGCGTTATCAGGGATTAATACCCGCTTTTTCCATTCGTAACAGGGAGAG +TATGACTCATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGA +CGGTTGTTCTGAGTGGCTGCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGG +CCTCAGCCGTTTTCTACAAACAAATCAAAATACTGCATCTCGATTTCTTCTCCCGCAGCG +CCCTGAATACGGATGCGGAAGATACGCCGCTTTCCACGATGGTGCATGTCTGGCAACTGA +AAACCCGCGAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGCAGGAAGAGAAGA +CGCTGGAGAAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGCAT +CCCTGAATGTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATC 
+ACCCTGATGAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCG +ACAAGCCGCGCTCGATTGAACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATA +AATAACCGATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGT +TACCGCTGGAACAGATCAGCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGC +AACGCATTATCAACTGCCGGGCAGGCACGCTGGCGCATTTGCCGGATTACGGTCTGCCGG +ATCTCAGTCTGATCCATCAGGGGATGGCTGCGGGTATTCATGGCCTGATGCGTCAGATTG +AAGAAACACTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGGAATTACTCCCCC +AGCCCCGTCCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTGGA +TACGCTTTGATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAAC +AGGAGCGGGCGTACTGATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGG +CGATCCCTGTACTTATAAGGAATCCGGTGAACTGCAGGCTGAAATGAGTAAACTGACTCA +CCCGGCCCGACCGGATGTGGACTGGCGTCAGGTGGAAAAACTCTGCCTCGCGCTGTTCCG +GCAAAATGGCGTGGAACTACAGACGCTGGTCTGTTACGTACTGGCGATAACCAGACGGCA +GGGGCTGGCAGGGATGGCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCTGGGC +TGACTTCTGGCCGGTACAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAA +AATGCAGCAGGCACTGAGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCG +TTGTGTACAGCATCTTTCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATAT +GACGAAACTGGATCTACTGGCCGGGCAGTTTCGCAATACCGCATTGCGTCTGGAACGGCT +GGCGCCTCAGGGAGCGGAAACCACTATCACTCCCCCTGAATTACCCCGCCGGGAAATGAA +TCAACCGAAAAAGTCAGAGGAAAGTCCACAGCCGGTTTTTGCAACCAGATCCGTTCAGCA +AAACGATAAGGATGCCAGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGACATG +GCCGATATTTATGGCCGGAATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGG +CTGGTCGCAGCTTAATCAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCC +ATTACCGCAGTCGCTGGAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCT +GCTGGCTCAGGACAGAACAATTGCGGCAAGTCAGATGCAACTGGAGCAGTTAAACAAATT +GCCTGCCCGCTGGCCACTGGAGCAGGGATATCGCCAGCTACGCCAGCTTGATGCCCTGTG +GCCGGATAATCCTCAGGTCAGGGCGCTGAACGCGCAGTGGCGCAAACAGCGGGAGCTGAG +CGCCCTGTCTGCTGAGGCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGCGCCT +GTCGGCGCAGCTGGATGCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACT +AAAAACGGCGGTGTACGGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCT +TCGGCAACTGGAAGAGCAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAAT +TGATACCCGGTTAAATCAGTTGTTGAATCGCTATGTCATTTTACTGGATACGAAGGTGGA 
+ACAAAGTCAGTAAACATCGGGGGATTTATGTACCAATAAGGGATATGTGACCTTGCCATT +TTTTAAAATGGAGTCTCTGTGTACAAAAAAAGAGAGGAACAGGCCATTCGATCTACTCGT +TGATTCACATCAGATAATGAGTGTATATTTCGGTAGATAGCTTGGGTTCGGGAACAGTGA +ATACCTTAAGTTTCAAAAGATTGGATTAACCTCTTGACTGTGGCCCCCGCAACCAATTTA +TTAGAATGCTGACAAACCGCAATGTGTTCTACAAATTGCGGTTTTTTTGTATTTAAAATC +TTTGTTCGCTGAACTCACAACACGTTTTTTATCTCCCTTCCTGCGAAGTAATCAATTATC +GACTGGGCAACGTGTATCCCGGTTTGCTGGTATGACTCAACGGTGGCGGCCGCGATATGC +GGCGTTGTAATGATATTTTTGGCATGTAGCAGTGGGCTAAATTGCGCCAACGGTTCAGAG +CTAAACACATCCAGCGCCGCAAACACATTTCGTTCTTCAATCACCTGAAGTAAAGCGCCC +TCATCCAGCAACTTTCCCCTTGCGGCATTGATGATTAGAGCACCATTGCGCATCATCGAC +AAATATTTATGACTAATGAAGTTCTCCAGCTCAGAAGAAAAAGGCAAAAGAACAATGATG +ACATGCGACTGCATAAAGATATCTTCAATTGATACAAACTGAACTCCAGCTTTGTCAGCA +ACCTGATAGTCGGGTTGTTTGTCAAAAGCTAAAAGCTCAACATCAAAACCGGATAACCTT +TTCGCCAGAGTTTTACCTATATTACCGTAGCCAACCAGGCCAATCCGTTTCCCTTGTAAT +TCACAGCCATGCGACTCACCCCAGTAGCCATTTTGCATCGCATGATAGCTGCCAGGGATA +TTTCTCATGCTCGCGAAGATAAGTCCAATGATAAATTCCGCAACCGCATTTGAATTAATC +CCAACCGCATTATTGACAACAATACCGGATTGCTGTGCCGCACGAAGATCAATATTGTCT +ATCCCCGTCCCGAATCTCGATATTATTCTCACACCAGGCAGCAATGATAGCGTGTCCGCC +TGATAACCATCTTTTCCGGCGATGACCGCGCAAATAGATTCTCGTAATGCAGTGGATTCT +GATTTAAGCAGATGCTCCACATTATTCTTAATAATAAGATTAAAATTATTCTCTCTTAGC +AACTTGCTGGCGGAAACACAGCGTGCTGAAAAGCTGGGGACGGTGACCAGAACATTTTTC +ATAGCGGACACTCACTTCAAAGAACGCCACCCCAAAAGATGGCGTGACCGGTTACTGTAT +TTATATTTTGAAATTATGAATTTGCTTTAATGCCGAGTGCACCTCCTGGATGATATAAGC +CGAAATCAGCACGAGTAAATTTTTTCAATTCAGAGAGTGCAAGCGCCACCGCATCACCAA +CAACCAGAACAACAGTCGACGAGCATGACGGTGCTAAACCTAAATTATCCGCCTCACTTT +TGACGGGGATTTCAACAGATAAATCACAACTTATCGCAAGCGATGAGTGATGACTGCGGG +TAAAAGAGATCAAATAATTACCCATTTTTTTCAGACTAGGCAGTGTCGCCAGGATTTCCG +CCGTCTCACCACTGTTTGAAATAAGAATAACAACATCGTCTTTCGCCACCATTCCAAGGT +CGCCGTGTACCGCTTCCGTACCGTGAACAAAAAACGAGGGAGTTCCGGTGCTGGCAAATG +TTGCGGCGAGTTTCCTGGCAATAATACCAGACTTACCAACACCAATAAAAACAACTTTCC +CCTGACAAGATTGTAATACTTTAATTAAATTTGCGACCTCCGAAAGAGGGGAATCAATAA +CTTCTTCAACTGCTTTATGTTCGTTACGCATAAAATGTTTAATGAGATGGATAAGATCCG 
+TGTTATTCATTTTTATTCTCCCTGATTAATATTTTTAATTACACTCACAAGACGCGTAAG +CCCCATATATAATTTTTCTCGACCGCAGGCCAGGTTCAGACGAAGGTAGCCCTCCCCCTC +CGTTCCATAGACATGCCCCGCCATAATGCCCACTTTGCCTTCATGAATTAATCGACTGTA +GAATTCATCAAAAGGATAACCAATAGCAGAACAATCTATCCAGGAAAAATAGCAACCATC +AGCTGGCCTTACGATCAATTCTGGAATATTTTCATTCAGATACTGCTGGGTGAATTGAAT +GTTAGAGGCTATATGTGCCTTTAATGACTTTAACCATCCCTCACATTCGTTGTAGGCAAT +AATAGTTGCAATTATATTCAGTACTGATGGGGAGTTTACAAAATCGCGATACCTCGATAT +CGTTCTGAACTTATGATTAAAATTATCGTCAGTTGAAATCATATACGATCCTGTTAGTGC +AGGAACATTAAATGTTTTCGATATCGAGTTAAATACTACTACTTTTTCTTTTTTTATTTT +AAGCGCGGATGTAAAGCTACGATTAAAAACAAAATCACTATGGATTTCATCTGAACATAA +CCAGACATTATGCCTTGTACAGCTTGCAGCGATTTTATGCAGTTCTTCTTCCGACCAGAC +TGTTCCTGTCGGGTTATGAGGATTACATAATAACATCATCTTTGCGCTTTTAATCTTAAG +ATCAAAATCTTGCCAGTTGATAGCGTAGCCCCCCTCATTTTTTATAATCAAAGAGGCTGT +CAGAATATTTCGCTCGCTATGTTTAATTACATCAAAAAATGCATTATAGACAGGTGTAAA +AACGAGAATATTATCACCATGCGATGTCAATAACTCTATTGCTTTTGCAATAGAGTACAT +CACACTGGGGCTATAGGTTATCCATTCAGGTTTAATATCTGTTTGATATTGTTGATAATA +CCAGTTTACTATCGCATTCAGATATTCACCATGTTGCCAACGACTGTACCCTAAAATCGG +GTGTTCCAGGCGTTTTTTTAATGCTCTGGTGATAGCGTCTGGTATCGGAAGATCCATATC +TGAAATAGAGAATGGTAGTACATCTTTTACACCAAATCTGTCCTCGCAAAAGTCCCATTG +GGTACAATATGTTCCTTTGCGGGAAACAGGAGTATTAAAAACATCCATCAGTATATCCCC +ATATAGTTATCCATATCCCGACGCAGGGCGATGACTTTAGTGCCGATAATGACTTGTAGG +GTATTTTGATCAAGTTTTACAACCGCAATCCCGCCAGCTCTTTTTATTGCAACTTCGTCA +ATCAATCTCATATCTGCGATTGTTAAACGTAAACGAGTTACGCAATTATCCAGTGACTTA +ATATTCTCTTTACCACCAAGTGCCTTAACCATCTGCTCCGCCGCTTGCAGCTCTGATTTA +TCAGGAGTTGGGATATCCGCTATAGCCGTATCTTCGTGAGCGTTCAGCGTAACAGGACTG +GACTCTTCACGGCCTACGGTCATCAGGTTAAATTTAAGGATGGTCCAACGGAACACAAAG +TAATAAATGAAGAAATAGGCCACTTCGACACACACCGCGATCGGCCAACCTGTTCTTGTG +CCACGCAATACGCCAAAGCTAATAAATTGAATCAGATCACCAGTAAATCCCATCTTCACC +CCCATATATGGCAGAACCATGTTAGCGAATCCATTCATAAAGGCATGGAAGACAAACAGC +AGTGGACTGACAAATAAGAACAGAAACTCAATCGGTTCGCTGACGCCGCCAATAATCACC +GTAAGCACCCCGGAAATAAGCAATGCTTTGATAGCCTTTCTGTTTTGAGCATGAGCAGTG +CGATACATCGCCAGCGCGGCACCAGCCAGACCATACTGAATCATCAGTTTGCCCTGCTCC 
+ATTTTCCCCGCCAAATCCAGCGGAATGACCGCATTCTCTTTGACGTATGCCATAAACATG +TTCAGGGTGCCGTAATATTCTTCGCCGCCAATCACAGCCGAACCGCCGATTGGCGTAAAG +CGGAAAACTGACGTCACCAGATGGTTTAAGCCAAAAGGAATCGTCACGCGTTCGGCAACT +GCATAGAAGAAATAACCAACAGGACCGGAAGTTGAAATCCAGTGGCCAATGAGCATGAAA +AGATTGAAAAACGGCGGCCAGATAAAAGGAATGATCAGACCAAATCCACTCATCACAATC +AGTGTAATGATAGGCACCAGACGTGGGCCGCTATAAAAACCTAACGATTCAGGAATGCGT +AAATTAACGATCTTTTTATACATGCTGGCGACTAATAACCCAGCAACAATTCCCCCCAAC +ACGCTGGTATTGTAGGACTGGATCCCCAGAATGATGGTTTGCCCATGTGTCGACATTTGG +TCAGCAACGACCAATAAGTCGTGCTGTTTAAGATAAAAGTTCGTTCCCAAATGCATCGCC +ATAAAACCAATTAAGCCAGAAAAAGCACCATAGGCTTTATCCTCTTTATCTTTTAATAAT +CCTAAGGGAATCGCTATCGCAAACAATACAGGTAAATTAACAAAGGCAAACAAACCAAGA +CTAACAATGAAATCAAGTATGGTTTTAATTATTGGAATAGCCAGAAATGGAATTAACTTT +GCCATATCATCACTGGCTAAACCACTTCCCAGCCCTAGCATCATGCCACATACACTTAGC +AGAGCAATGGGATACATAAATGCCTTCCCCAGGCTCTGAAAAAAACTCCAGGCTTTCTTT +TGTTTCATGTGGGTTATCTCATATAAATGTTATATATAATTAGTCCATTAATACTTTGGT +ACGAATAGAGAGATATAATTTTTCTTCTAAAATTAATTCATATTTAAAAGTGGCATACAG +ATACCGTTCAATTTCATGAATTGCGCGCTGTAACAGGATGTCCTTTTCAAGAAACTGTTC +ATAGATATCACCAATATCTTTCTGTTTTATTTTTTCATTGCATAACACGCGACTTGAAAA +ATATTTAAGGTGCATCATAAATCTGGAATAGTTAAATGAACTTCTGTCCACCTTTCTGTT +ATAAACAACTTCAATAAGCTCCGTGATTATTTGCGACAACTCAATAATCCGTACTGATTC +ATAATCAACTGAATTTTCATAATTATTTAAAATATGCAATGCTATAAAACCAATCTCATC +ATCAGGAAGTTGAACGCTGAATTGCTCATTAATGATAGTTAATGCATCGCGACTTATCGC +ATACTCTGCTTTGTACAACGCTTTGATTTCATCAAGGAAAACATTATTAATTTGTATACC +TGAAACGACTCGGGATATTGCATTCGAAATGTGATCCGCAAGAATCAATAGTAGCGATGG +ATTGAGATTTTTTTCGAGATTTTTCTCCGCATATTGCACTATTTTTTCGGCAACAAACAC +ATACTCAATATCTACATGTTCAATCAATTTATAAAGTTTGTTTTTTTGTTCATTTCTGAC +ATAAAAAATCCGGTTAGCCGGATGCTCAGGGACCGACATTCCATATTTTTTGTTGTAACC +GACGCCAGGCCCAGAAATGATAACCTCCTGTCCATTCATCGATGCCTGTACACAATTATT +GTTCATGACTTTTTCGATGATCATTCCATGGCTCCAAAAAAAAAGGCAAGGCACGTCAGA +AGTAATAACTACTTCAAACATTGCCTTGCCTGATTTAACAGTTACAAGATGATTAACTAA +TGCGTATACATTACACGGAATTGTGCTTAATTAAAGAGATGGTCGGCTTATTTTTCAAGC +CGACATTCAAATATCCGACATCAGTCACAAAACCAGCGTCTAATATTCAGGTAAATGTTA 
+TCTATTCAACGAAATATAAATTCATTGAATAAATAAAAACATTATCCCCTTCTCGCCAGC +GTCGCCCCATCGGCAAAATACGCTTTAATTCCCGCAAGAATAGACTCCGCAACTTCCTGC +TGGAAAGTCGCCGTTTTCAGTTTACGCTCTTCCTCAACGTTACTGATAAACGCCGTTTCG +ACCAGAATGGAGGGAATATCTGGTGCCTTTAGTACGGCAAACCCGGCCTGTTCAACTTGA +TTTTTATGCAGCTTGTTGATTTTACCGAGCTTATTCAGCACCGCTTTACCAAACTTAAGG +CTGTCGGCAATGGTCAGCGACTGCACCATATCGAACATGGTGTGGTCGACATAGCGGTCA +CCGCTTTTGCTTACGCCACCAATCAAGTCCGAGGCGTTCTGGGTTTGTGCCAGATATTTT +GCCGCAGTACTGGTTGCGCCTTTGGTTGAGAGCGCAAACACCGAGGAACCGCTCGGCTGG +CGACTGGTAAAGGCGTCGGCATGGATAGAAACAAACAAGTCAGCGCGCTGTTTCTGGGCT +TTTGCTACGCGCACTTGCAACGGAATGAAGATGTCTTCATTGCGCGTCATGTACACCTTC +ATATTGCCCTCTTTCTCGATCAGAGAGCGCAGACGGCGAGCTATTTGCAATACCACGTCT +TTTTCGCGCGTTTTGTATTTCCCCACCGCACCGGAGTCTTCGCCACCGTGGCCAGGGTCA +AGCATAATGACAATCGGACGATCCCGCCCAGCTTTACCCGGTTGTGGACCACTTTGTGCT +GGCGGCACCTGCTTTTCGAGGTCGCCTTTGTTGTAATCCTCCAGCAGCGCCAGCAGCGGG +TCCTGCATATCCTGTGCATTGGCCGGATAGAGGTCCATCACCAGACGCTCTTTAAACCCG +GCGACCGGCGCAAGGGCAAACAGCTGCGGTTTTACGTTTTGCTTTAATTCAAAAACCATA +CGTACGGTTTGCGGGTCAAATTGCCCGACGCGCGCCGACTTGATGAACGGGTCGTCAGCG +CGGATTTGCGCAGCCATCCCCTTGAGCACCGAGTTCAGGTTTACATCTTCGATATCCACC +ACCACGCGTTCAGGATTACTCAACGCGAACTGCTTATATTTCAGCTGACGATTTGATTCT +ACCGTCACGCGGGTGTAGCTGGACGCAGGCCAGACGCGCACCGCCACGACCTGGCTGACC +GCAGCCAGGCTGACCTGACTTACGCTCAATAGCCACATGGCACCCGCGCCTTGCAGTAAA +CGACGACGGCTGATTGCAGTGTTGGATCCTGACATGCCTCTCCCGAGCAAAAGAAATCTA +AGCTGTGTAACAAGTAAACGACCAATTTGACCGGAAACTTTAGCGAAAGACGCATAATCT +GTCATCTATAAAACGGTAAACATTCTTTTTATATTCACGGTATTACTGATAAAAAACTCG +CTCCCGCATAAAATTTACACTTGCACCCTGCGAAAAAACAGAATAAAAATACAATAATTT +CGAATAATCATGCAAAGAGGTGTACCGTGGTAAAGGAACGTAAAACCGAGCTGGTCGAGG +GATTCCGCCATTCGGTTCCCTATATCAATACCCACCGGGGAAAAACGTTTGTCATCATGC +TCGGCGGTGAAGCCATTGAGCATGAGAATTTCTCCAGTATCGTTAATGATATCGGGTTGT +TGCACAGCCTCGGCATCCGTCTGGTGGTGGTCTATGGCGCACGTCCGCAGATCGACGCAA +ATCTGGCTGCACATCACCACGAACCGCTGTATCACAAGAATATACGTGTGACCGACGCCA +AAACACTGGAACTGGTGAAGCAGGCAGCGGGAACATTGCAACTGGATATTACTGCTCGCC +TGTCGATGAGTCTCAATAACACACCGCTGCAGGGCGCGCATATCAACGTCGTCAGTGGTA 
+ATTTTATTATTGCCCAGCCGCTGGGCGTCGATGACGGCGTGGATTACTGTCATAGCGGGC +GTATCCGGCGGATTGATGAAGACGCGATCCATCGTCAACTGGACAGCGGTGCAATAGTGC +TAATGG +>other_header +GGCCGGTCGCTGTTTCGGTCACTGGCGAGAGCTTTAATCTGACCTCGGAAGAGATTGCCA +CTCAACTGGCCATCAAACTGAAAGCTGAAAAAATGATTGGTTTTTGCTCTTCCCAGGGCG +TCACTAATGACGACGGTGATATTGTCTCCGAACTTTTCCCTAACGAAGCGCAAGCACGGG +TAGAAGCCCAGGAAGAGAAAGGCGATTACAACTCCGGTACGGTGCGCTTTTTGCGTGGCG +CAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGCTGTCATTTAATCAGTTATCAGGAAGATG +GCGCGCTGTTGCAAGAGTTGTTCTCACGCGACGGTATCGGTACGCAGATTGTGATGGAAA +GCGCCGAGCAGATTCGTCGCGCAACAATCAACGATATTGGCGGTATTCTGGAGTTGATTC +GCCCGCTGGAGCAACAAGGTATTCTGGTACGCCGTTCTCGCGAGCAGCTGGAGATGGAAA +TCGACAAATTCACCATTATTCAGCGCGATAACACGACTATTGCCTGCGCCGCGCTCTATC +CGTTCCCGGAAGAGAAGATTGGGGAAATGGCCTGTGTGGCAGTTCACCCGGATTACCGCA +GTTCATCACGGGGCGAGGTTCTGCTGGAACGCATTGCCGCTCAGGCGAAGCAGAGCGGCT +TAAGCAAATTGTTTGTGCTGACCACGCGCAGTATTCACTGGTTCCAGGAACGTGGATTTA +CCCCAGTGGATATTGATTTACTGCCCGAGAGCAAAAAGCAGTTGTACAACTACCAGCGTA +AATCCAAAGTTTTGATGGCGGATTTAGGGTAAGCGATGAAAATCGCCGGATGCGACATGC +GTAACACTCGTGCGTCGCATCAGGCAATTACGTTTATCCCCGTGAACTAAACAACGCCGC +CAGACCACTGCGCCGCTCAGTACGAGTGGCGATTGCCGCACTTAATATGCGCTCATCGGC +ATACAGCGACAGACGGCGACGCGCGCGGGTCACCGCGGTGTAAACCAGCTCTCGCGTTAC +TACCGGCGTGCGTTGACTCGGTAAAATCAACGCCGCATGGTCGAACTCCGATCCCTGCGA +TTTATGTACCGTCATCGCCCACGTCGTTTCGTGCTCTGGCAGGCGACTCGGTTGCACAGA +CTTAATATTGCCGTCCGGCATCGCAAACCAGACGCGCGTCCCCTGCCCGCGATCCAGCGC +AATACCAATATCGCCATTAAACAACCCAAGCGCGCTGTCATTACGGGCAATCATCACTGG +TCGGCCTTCGTACCAACGAGAGTGCGGATGACGATGAATTTTGCGCTTCTGTTGCATAAA +CTGCTCAATTCGCTCATTCAGTCCAGCCACGCCAAACGGCCCTTCCCGCAGGGCGCACAA +AAGCTGGTACTCATTGAACGCCTGAATGATTAAATCCGGCTCGGCACGCGCTTGCAGCAG +ATCCAGATAACGCCCGTAACCCGCAAGAGCTTCCTCAAGCATCGCAATATAATCTTCGCC +ACTCTGTAAAAGCCGTTTTTCGATATCAGTAAAATCCTGCTGAAAAACGGTTTTCACTGC +CGTTTTATCACCACGGTTAATCGCCGCAGCTAACTGACCAATGCCAGAATCGCTGCCGAA +ACGATAGCTTTTTTGCAGCAGGCAGAGGCTGTCGCGCAAAGATGCCGCTTCTGTGCCAGT +TCCTGCCGGAACGTGGCTTCCCGTCAGGCGGCTCAACTGCCCGGCACGCTCGGCGGTAAA 
+GCCCGCGTTGGCATAAGCGCAGATATCGCCCAGCACAGCCCCAGCCTCAACCGAGGCCAG +TTGATCACGATCGCCGAGAAAGATCACTCGCGCATGATCGGGCAAGGCGTCGATCAGTCT +CGACATCATAGGAAGATCGATCATTGACGCTTCATCTACCACCAGCACATCAAGATGCAG +CGGGTTACCGGCATGATGACGTAAACGCTGGCTACCCGGCTGCGCACCCAGCAATCGGTG +CAAAGTGCTGGCATCTTCCGGAATGCGTTTCTTTTGTTCATCGGTCAGCGGTAATTGTCG +CAAAGCCTTGCCGAGAGATTCGGTTAAGCGCGCGGCAGCTTTACCCGTTGGTGCAGCCAG +ACGGATACGGCAGCGTTCGCCGTCGGCCATTTGAATTAACGCTGCCAGTAACTTCGCTAC +GGTGGTCGTTTTACCGGTGCCAGGACCACCGGAAATCACCGAGATCCGCCGTGTCAGCGC +CACTGCCGCCGCAACTTTTTGCCAGTTAATTTCATCGCTTACTGGAAAAAGTTTGTCCAG +GGTTTGCGCCAGTAGAGCTTCATCAACCTCAATGGCATGATTCACTTCGTTGAAAAAGCG +TGCCACTGTGCGCTCGTTACACCACATGCGATTCAAATAAAGACGATCGCCACAGAGGAT +CATCGGCGTTGGTTCATCTCCCCGGCTGACCGCTTGTGAAGCCAGCAAGCATTCTTCCCA +ATTTTGTAGCTCACCGATTTCACTGACACAGGTCGCCAACAGCGGATGCGATGCCTCGTT +ATTTTCCAGTCGTGAAAGCGGCAAACAAACGTGTCCCTCTCCGGCATCATGACTTAATAG +TGCCGCCGCGAGGGTGACGGCAGGATGTTCATCTCCCGCCACGGTCAGGGCAAACTGCAC +GTCCAGCGGGCGTAGCTGTTTGTGCTCCACAGCTTCCAGTAATTGCTTTTGCAATTTCAT +TACGCCTCCTCCAGGGTCATACCGGCAAACATCTCATCCATCAGGTCAATCAACCCGGCG +TTGGGTCGGGTCGCGTAGATCCCTTGTTGCGGATGTTCTTTATCAACGCCACGCAGGAAC +AGATAAATAACGCCGCCAAAGTGGCGCTCATAGTCGTAATCAGCAATACGATGGCGCAGA +TAACGGTGCAGCGCCAGGGTATAAAGCTGATATTGCAGATCATAGCGGTGTGCCTGCATT +GCCGCTGCCATAGCCTGTTGGGTGTAAGCCGAACTGTCTTCACCCAACCAGTTGGATTTA +TAGTCGAGCAGGTAATAACGCCCTTCGTGGCGGAACACCAGATCGATAAAGCCTTTTAAC +ATGCCACGTACCTGCATGAACTCCAGCGGCGGGCAGCCAGCGGATAGCGGGTCAAACTGG +CGAATTAGTGCATCAAGCTGGCTGGCGATGAGCGGTTCGCTAATTGGCAGGTAAAACTCC +ATCTCCACCTGTTTATCGCGATCGGAAAGCTGATTCAGGCTAACACCCGTTTCATTGAGA +GGTGCCTGGAGGACAGCCGTGATCCACTCAGTCAACACCGGTTCCCACTGCGGTTCAAAG +CCACCGAGCTCCAGTTTTTCCTGTACCCAGTTCGGGTCAACCGGCTGGGTAAAATCGAGG +TCTTCAAACAAACTGTGCAAGAATGTCCCCGGTGACGCACCGCGCGGGAACTGATGCGGT +GTTAACGTCGGTTCTTCAACGACGCTGACCACGCCTGCGGCATCAACATCCAGCCGTGGC +ATCAGATCCTGAGCGATACCGTGACCACGCTGCTGCAAACCGGAGTAGCTGGTGACACGC +CAGTTATCGCCGGGCAATCGTTGTAGCGTCCTCGCATTCAGTTCTGCAGTTAATGCATCA +TTAACCTGCCAGGGCTGGTTATCACCAATTTGTGCCGTTTGCCAGGCAATATCATCATCG 
+CACAACGCTTCAATGCAGGTACGAAGCCCTGCCGCATCTTGCGGTTCTCCTTTTTGCAGC +AAACGCCCGAGCGCACTTTGGTGGACGTCGGTATCACCTTTTTTATCGCCACGACGGCGC +ACCAGCGGTGCAACGCCGAGACTGCAATGCCAAACCGAACGCGTCAGCGCCACGTAAAGT +AAACGCAGATCTTCCGCCAGACGTTCGGCCTCCGCGAGGTCGACGCTTTCTGGCGCAGCA +TTAAGATCCAGAACGGCCTCAAACGAGTGGCGATCGTGATAAAACGCCTGATCCTGGACG +CGGAAATTGGTAATAAATGGCAACCAGACCAGCGGATATTCCAGCCCTTTTGATTTGTGT +ATCGTGACAATCTGCACCAGATGTTTATCACTTTCGAGGCGCATTTGTTGGCTGGAGGCA +TTACTGTCTGGCTCGAGGATATGTTGCGATAACCAGCGTACCAGCGCATGTTCACTTTCC +AGCTGCGTTCCGGCTTCTTGTAGCAGTTCGCTGATATGCAAGATATCGGTAAGACGCCGC +TCACCGCCTGCCGTTGCCAGCAAGTTTTCTGCAATGTTACGCGCCGACATCAGCGCCCGC +AGCATCGGCATAACGCCACGTTTGCGCCAGATTTGCCGATAACCATCGAACTCTTCGACG +ACCGCATCCCACGCATGTTCGTCATTATTCAGCGTTTCAATATCCAGCGCATTCAGCCCC +ATCATTGACGTTGCCAGCGCACTGCGCAGGGTGTTCTCACGTTCGGGCGTCATCACCGCC +TGCAACAGCCAAAGCATCTCCTGTGCTTCCAGAGTTTCAAAAACACTGTCGCGGTTCGAA +AGGTAAACGGAAGGGATTTCCAGCAGCGTTAAGGCATCGCGCACCTGAGCGGCCTCCTGG +CGGCTGCGCACCAGCACACTGATGTCCGAAGCACGCACCGGACGCGCATCGTCGCCGTTC +ATCAGCAACGCTTCGCCGCGTTGCCCGGCTTGTAGCCAGTCGCGGATTTGCGCAGCACAT +ACCTGCGCCATGGTACTTTGATAGTCGCCAACGCCGCAGCTTTCGCCTTCCATCAGCCAC +ATTTTCATCGCAGGCTGCGTTTCACCTTTAAATACAAAACGTAACGCCTGATTTTTGCCG +GCAGATTTCACAGGAATAAACGGTATTTCACGAAACATGAACGCGTCATCAGTCTGGCTG +AAAAGTTTGTTAACGCTGTTCACCATTCCCGGTGCGGAACGCCAGTTGGTATCTAAGGTG +TAGTGAGCATGAACTTCGCTACGCGCCTTCATATAAGTGAAGATATCCGCACCCCGGAAT +GCATATATGGCCTGTTTCGGGTCGCCAATCAGCAACAATGCGGTTTCCGGCTGATGGTGC +CAGATACGGCGAAAAATTCGATACTGTTGGGGGTCGGTATCCTGAAATTCATCGATCATT +GCCACCGGGAATCGCGTACGGATCGCCGCTGCCAATACCTCGCCGCTTTCACTACGCAGC +GCGGAATCGAGCCGACTTAACATGTCATCAAAACCCAATTCGCCACGGCGGCGTTTTTCA +CGCGCTACTGTTTCGCGGATCTCAGCCAATGCGCGAGTGATCACCAGATCGCGGATCGAC +AATGGTTCTGCAAGCAGTTGTTCGATCGCCTCAAACAGTGGATGTCGCGGGGTTTCCCCC +CCGGCTTTCGTGCGATCTTCTAAGAAACGCTGAGAGAATTTTTCCAGCGACTCCGGCAAC +TGATAGCTGTTGGTCTCTTCTTCTGCCCAGGCGCTGATCTTCTCGATCCATTTAGCCTGA +TTGCTACGGTTAAACTTGCGTCGATCAATACCAGAAGATTCGATCAGCGCATCCAGTTCA +CCCACTGCGTCGCGCCACTGCTGTTTTACGGCATCAATACGCGCCACAATTTGCGCGTGG 
+CGGGAAGCCAGCGTTTCATCATCGGGGGGCGGTGCTTTGATAACCGGCGCTTCGCCTTGC +AGATAACGATTAATATCGCGCAGCAACGCCTGCGGCCCTTTCCAGGTTTCAAAGACGACC +TGGGCAATTTCACGCGGCAGCGGGTAGCAGTGGCGACGCCAGAAATCGGCGCAGGCCTGG +TAGCGTAGCAGAGACTCATCTTCAATCAGCTGCTGCTCAAACAGCATGCCGGATTCAAAG +GCATTCAGGTTGAGCATGCGCTGGCAAAAGCCGTGAATAGTAAAGACTGCCGCTTCATCC +ATCTGCCGCTCGGCTAACAACAACCACTGCGCGGCTTGCGCTTTATCGTCGATCTCTTCC +AGCAGGCGTTTGTACAGTGGATTGTCGGTGGTTTCACGCAGACAGGCGATGCGCAACTCG +TGGATATTGCTACGGATACGACCACGCAATTCTGCCGTAGCAGCCTCGGTAAAGGTCACC +ACCAGCAGTTCTTCAACGGTCAGCGGGCGGGGAAAGGCGGCAGAACCGCCTAGTCCAAGT +AACAGGCGCAAATAGAGCGCCGCAATCGTAAAGGTTTTGCCTGTGCCGGCAGAGGCTTCA +ATCAGGCGCTCGCCCTGTAAGGGCAAGCGCAAAGGATCTAGTGTCTCGGCGACATCACTC +ATTCTTTTCACTCATCAGGGGCATTGTTTGCTGCAACGCGCTGACGTTCTCCCACACTTT +CCAGCCTTCAGGATGCACATATTCGGCTTTCCCGTTCTGGCTGCCGGAAATCTGCGACAG +AATAGCCATACCTTGCGGCTCGACCACCGCCTGATGGAAGAAATCAGCAAGTTTTTGCGG +CGTCAGCAGTTTTATCTGGGCCACGATTTTATCACGCGAATCGAAGCGCATATTGCCGCG +ATCGAAATCTTTACTTAACTTCGATGCTTCTTCGCCGAGCGTTTGCGGTGCCTGCAGCAT +CTGAGTAATTACCGCCTGCTGGATTTGCGCAAACTCCTCTGGCTTCATCGCCCGCAATTT +TGCCTCTGCGGTTGGGAAAAACGCCTTGTAACGCTCCCACAAGAATGAAGGCTGTTTATC +ATTGCTTTGCAAAAGGAAGCCCATGCCCCACTGACGCCCCACGCTCATTGGAAACGCAAA +CACGGCATAGCCCAACTGTTCTTCGGTACGCAACTGATTGTAGAACCACGGCTGTACGAT +CTGCCCCAACAGAGAGCTATAGGCTGAGCTGGTGTATTCATCGTAGCCAGTCGGTACAAA +TATCGCTGCCAGTGCGGAGTCGGTGCTGTTACCAGCTTTTTCAAAGATGACGGATTGTTT +TTTATCGACCACGACATCTTTGTTACGACACCACTCTGAACCATCAGCGCCCAACTGTTT +TTGCACATGGCGTGCCAGCGTTGTTGCCTGGGCTTCAGTCATGTTGCCGATAACCATAAA +CTCTGGTCTAGCCCCTGATTTTAAGGCGTCGCGATAGGCCAGCACCTCTTTCAACGTAAT +GGAGGGCAAAATTTTGCGCCGTTCATCTCGCGAGAAGTACGGCACTTGCGAGAGCATCTG +CGCGGGCATAATCGCCTGCTCAAACGCTTTGCCCTTTTCTGCGGAATCCATCATCTGGTT +ATACCAGGACTTCGCCTGCTCAAGCTGATCTTCCGTAGCGGTATAGCTAAAGTAGCCCTC +CAGCAGAGCCTGGAACAGCTGCGGCAGGCGCTGAGTGTAACCATTGGCATTAACCATAAG +GCCGTTGTTAGCATTGGTGGAAAAACTTATGCCACCAACCGACGCCTGGTTGCTTAACTG +ATCAAGCGCCAGCCCTGCGAGATAATCATTGAGCGCAAACATCACCTGATTGCGGGCGCT +GTCCATGGCTTTCGGATTACGCAAAATCAGGCTGACATCAGCTTTGGGCTCACTGGCAAA 
+ATAACGGCTTGGCGCATACACCACGCGCAGATTCGACTCATCAACAATCAACTCTGGATG +GTCGTATTTCTTCTCTGACTTAATCAGCGAGAAATCGTCAGGAATATAGGGGTTAAGCTC +CGGTAAGGAGAGCGCAATATTGGCGGCTTTTTTCTGCCAGTCCGCGAAAGTTTGTGCGCT +AATTTTATCGACCTGATACGGCGCATCGACAAAGTAAGCCGTTTTGTTGTGCGGCTCTTT +CGGGCTGATATACCAGATACGCGCATTCTGCGGCGTCATCATCGCCAGACGTTCTTTTAC +TGCTTTAGCATCGTACCGATCGGCAATATTGACTGCATCCAGTGTATGCTCAACAGGAAC +GCGAATCATGGTATCAGCCAGCCATTCGACGTAATCCATATCACGGGTGATTGACGGATA +ACGGAAGTCGATATCCAGCACATTCGCCAGTTCATCGAAGTATTGTTTATCGATCCCTTT +TTCACGTAACAGATTGAGGTAGCTAAAAATGGCCGCCACAACCTGATCGCGATTCGCCAG +ACCTTTATCGGTTAAAGACGCAGAGATCGCTAATACGCCGCTGTTGCCGTTGACGATAGG +ATCGGAATTGGCGCTAATGCCCTCAACTAATCCCTGCTTTTGCAGCCAGTCAGAAAGTGT +ACCAGGGCTGCGATTACCAATCAGATAGGTAATCAATTCATCCGTTTTACTACGGAACTT +CGCTGAATTGTTATCGATGCGAAACTCAACGCGCAGAACTTTACGCGGCAACGCCGGGAC +GTAATGAATGATAATGCCCTTTTGCGCGTCGGTGACTACCGGCACGGTGATTTCCGGTTT +TTTGCTCTCTTTGTTCGGCACGCGACCAAAGGTGTCCGCCGCCATTTTCGCCAACTCCGG +CAACGGTTTATTGCTGTAAATAACCGCCTTCATCAGATTGGCGGAATAGTACTTCTCGTG +GAAATCTTTCAGCGCCTGCTGTACCGGATTACCTGGTTTGTCGCTTAAAGTTTCGAGGTT +ACCACCAGAAAACTTTGAACCGGGGTGTGCCGGGTTAATGGTTTCTGCGCTGACCTGTGC +CATGCGCATCCCGTCACGCGTACGCGCCATGGTTAATTCGGCATTCACTGCATTACGTTC +ACGTTCGGCGTATTTCTTGTCGAGCAAGGGTTCTGCAATAGCATCGGCCAGGCGGTCTAC +CGCACCGGGCAAGGCGTCGTTCTCAACTTCCAGATAGAAAGCCGTGCGATACGGTGCCGT +GCTGGCATTGTGACTGCCGCCGTGCATTTTGAGATATTCGGCCAGACTGTCAGCCTGCGG +ATACTTTTTCGACCCCATCAGACTCATATGTTCAAGGTAATGTGCCAGCCCCTGGTACGC +CTCAGGATCTTCCAGCGACCCAACGGGCACCACCAGCGCCGAGAGCGATTTAACTGCCTG +CGGATCAGAAACCAGTAAGACCACCATACCGTTATCCAGACGTATAGCCTGATACTGGCG +GTTATCTTTATCACTTTTACGGATGGTTTCCTGAATCGGCTGCCATCCCGTTTCTGCCTG +ACTTAAGGGTGCCCAGAGGGCAACAAACAACAATAATGCTTTGAACCAGATGCTGCGGGG +CATTCACGGACCTCATAATCAACTTTATTTTCTGGCCAGATTCAACACGTTAACGCAAAT +CATCTGCCAGAATTTAATCTTGTGCTGCACGAGTCAGCCTATGTCTATATAACCATCAGT +CCGTGACTGGTGCGCATCATAAAGTAAGCGGATAGATTGCGCAATTTTTATACAATACTC +ATGACTGATTAAAGCGAAACAGCGGTAACAGGAAACGTTGCGACTGTTCAACGATAGCCT +CCATTGTCTCTGGTGTTAATTGCCGCCAGAGCCGTTGATACCAGATATCATCACCTTCGC 
+CACGCACCATCATGTTGCCTTCGTAAGCCTGAAGGAATTTCGTACGGGCTTTTTGCAACG +TGGAATCGTCATCCAGCATGGCATCGTTTTGCGCGTCATAACAGGTTTTTAGCCACGCGC +CGCCACTTTCAGGTAACACCAGCAATGGCGCGGACATTCCTTCACGATACCCCTCAATCA +GTTGTGAGAGGTAATGCAAAGCCTGTTCGGCTGCAAGCGGCGGAAAACGCCACTCGCCGT +CTTTGCGTAGAAAAAGGCGACTTTCACCATTACCACCGCTGGCACAGTAGACAAGGTGTT +CCAGCCAAAGTTGCATTCCCTGCGCCACACTTAATAAAGAGGGACACCAGCGCAACAGGC +CATCCGGCTGCACCTGCGGCAACCAGCCAGTTATCTGCACACCGTTGCAGGCGAGATCAA +TCTCCATACTCTGCCCTGGCTGGCGACAGGCAATGACTCTGTCGGCAAGCTGCTGCATCT +CCTGACACTGCGTTTCCCAGAAAATTTCACCAAAGGCACCATACGGCAAATCACCTGCCG +CCCGGAATCGGCGGAACAAGCGTTCGGCATCATCCTGCTCAACCAGTACATTTAATAACT +GCTGGTTGATTTGATAACGACTAAGCCCTTCAAGAATAAAAGGTTCAGTGTCGGGAATTT +CGCTGTCTTCGGTACGGAAGTTCACCTGCAAACGCATCTGGAAAAACGCCCGCACCGGAT +GTGCCCAGAATCGTTGTAGCGTTTCCAGCGGCACGGTTTCCGGTAAGGTAAATGGCAGCG +GCTGAACAAATTCAGAATGTGCTTTACCAGCCTGGCTGGCCGCAGGTAGCCACTCGCGCG +CATAGCTTTGTAAGTTACCGGGCTGGTAGTTTTGCGGGTCAAACGGCATCCGGGTATGGT +GGCAAGTAAGATGCGCTTTTACCCTTGCCTCGCTTTCATCACAGTTAAGCGCTTCATCGC +CCGGTAGATAATGGCTTTGCCCGATGTAGTCGATCAGTTCCTGCACCAGTACCGACGGGA +AACGTTCACTGTTATCCTGAATGGAACGCCCAATATAGCTGATATAGAGTTTTTGCTGCG +CGGAAATTAACGCTTCCAGGAACAGATAGCGGTCGTCATCGCGACGGCTACGGTCGCCAC +GCTTCGGTTTCTGGCTCATCAGATCAAAGCCCAATGGCGCAAGCTGACGTGGATAAACGC +CGTCGTTCATTCCCAGCAGGCAAACCACTTTGAACGGAATTGAACGCATTGGCATCAGAG +TACAAATGTTAACCGGTCCGGCGAGAAAACGCTGGCTGATACGTTCTTGATCCAGGCGCA +GTGCCAGTTCATCACGCAATAGTGACAGCGGCACCGCGTCGCCATACTGCGCGCCTAAAC +CTTCGGAGATAATCGCCTGCCATTGTTGTTCGATCAGCGTCATCGCCGCTTCGGTTTCCG +CATCCGGCAGGAAAAAGGCGTTGAGCATATCGCGACAAACCGGCAACCACTCTTCCAGCG +GACGCTCCTGCGCCAGCCCGCGACGCCAGATATTTAGCTGCATTAGCAGTGAAGCCAGAT +GCCCCACCAGTTCTGCAATTAAGCCGCTCGATTCATCATAAGGTAGAACCGATTGCCACT +CGCCCTGCGCGCTCTCCATCGCGTAGCCCAGCAACATGCGCGTCAGGCCAAACCGCCAGG +TGTGTTGACCGGTAGCGGGAAGTTCCAGCTCGCGAACGTTGTCGTCATCTATCCCCCAAC +GAATGCCGGATTCGTTGACCCACTGACGTAAATAACGCAGCCCTTCTTCGGTGATGTCAA +ACCGCGCTGCCAGCACCGGCACATCCAGTAATGCCAGCACGTCTTCCGACACAAAGCGGC +TGTCTGGCAGCGATAACAGGCTGATAAACGCTTCAAGTACAGGATGCGACTGCCGCGCCC 
+GACGGTCGGAAATGGCGTAAGGCAGGTAACGATCCGCAGGTGCACTACCAAACACAGCCT +GAATAAACGGACTGTAGCTGTCGATATCAGCCACCATCACGATGATGTCGCGCGGAGTAA +GTGTCGGGTCTTCCTCCAGCATCGCCAGCAGGCGATCGTGTAAAACTTCAACTTCACGCT +GCGGGCTATGGCAAACGTGGAAGGTGATACTGCTATCCAGTGGATCAAGCGGGCGTTTGT +TATCGCTACGGGAAAACTCTTCGATGTTCACACCAGCAACGGCGCGGTTTTCCAGTTCCA +GAATGTCAGACTGAATATTATGCAGCAGGTTATCTGGCGTCACATCGACAAAAGCGTCCA +GCTCCTGGCTGCTCTCCAGGTCAGAAAGGAGATAAATGTAGTCGCGCCCAAGCTTGCCCC +ATGAAGCCAGCAGCGGGTTGCCGACATCCTGTTCACCATCGCTGTTAAAGAGCTGCCCGG +CATTTTCGCTGTCGCGAAATAGCGGTAATTCGCGATCTTCAAAACTGTGTCGGCGCTGGC +GAGTCAGTAGTTTCGCCAGATAAGCTGGATCTTTAATGTCGCCCCAGTAATAACGGCAGG +GGTTGGTAAACAGGAGATGGATTTCAATATGTTTACCCAGCGCCTGTAGCGCCTGGAGAT +AAACAGGCGGTAACGCGGAAATACCGCATATAAAGACGCGCGAAGGTAACCCCGGCGGGC +AGGTCGTCGCGGACTCCAGCGTTTCGATAAAGCGCTGATAGAGATTGGCGCGGTGCCAGC +GCGGTTGCCCAAGTTCGTCGGTATATTCCACCAACGCCTTCCACAACGGCGCTTGCCAGG +CCTGTGCTTCTCCCAACCCTTCTACCAGATGTCCTGTTTCCCACTGTGCCAGCCAGTCCG +GACGATAGACCAGATACTGGTCAAACAGGTCCGCCGCTTTTGAAGAAAGCTGGAACAGTT +TTCGCTTGTCACTATCGTCAGTCAGATAATGCCGCAACAGGGTAAAGTCTTCGCGCTCCA +ACAGTTGCGGCAGCAGAGTCATCAGTTTCCAGCTCATGCTCTGTTTGTTAAAGGCGCTCT +CTTTGGGGATCTCCGGTAACACCCGGACGAACATATCCCAGATAAAGCTCGCTGGCAGCG +GAAAATCAATGTTTGCCGCAATACCAAACTTTTGCGACAGGGTCATTTGCAGCCACTGTG +CCATACCGGTACTTTGCACCAGAATCATCTCTGGTTCGAAAGGATCGTCCAGCCGTTCGC +GTTCGACAATAAACTCCATCAACGCTTCCAGCACGTCCAGACGATTGGAATGGTAGACCC +TTAACATAGCGGCTCCTGACTACTGACGATTCGGGCAATGCAGGCGGGTCATCTCGCCTT +CTCTGCCCCCGGGTGAAACTAGCGTAACGCTGATGCTGACACATCCCGCCTGCGATGTCT +GCATTCGGTTGACCTGCCAGTTAGCAGGTGGCGAAATCGCGCGCAGTTGCGTTTGCTGCC +AGCCATGCCGCCAGAGCTGTTGGTACTGGTTTCTGCTGGCAAGACTGTTCATTAATGTTC +GCTGGAAACCCGATAACGCAGTGACAATCATCACCATCAACACCATCGCCAACATTACCT +CCGGCAGACTAAAGCCTTGTTGATTCCTCAGGGAAGCTGACATAACGCCCTCTCTTTCAG +CGGACAAAAATCGCTCCAGCCGCGTGGCGAAAAAACAATGTTTCCATCGATGACTTCGCC +TGTTCGCCACAACGAAACGCCTTCATAACCAGCAATCAATAAGGCTTCATTATCTGCCAG +TAAACGCAGACAAACCCGGGCACCGGTGGCAGCATACAGTAAGCACTGAACTGCGGGCTG +CGTCTGCCAGGAGTGCATTTTTCCCCACTCCAGCGCCGACTGAACGATGGCCTGGCGGCT 
+CAATGACTGACTTTCCATGCTCACGCGAGAAGCAAAACTGCGATCCTGCTGACTCATTCC +TTGCAATAGCAAGCTACCCAAAATCAGCAGCATCAGGACCAGAGCCAGTGACGAAACTCC +CTTTTCGCGGTTCACAGGTTGGCTCCTGTCACGCTATAGCTGGCATCCACCACGGTTTGC +GGATCAGCCTTGCTGGCAGCGTGTATATTAACCGTCAACACCGGCGAGAAGCCGCTGACA +TCCTGACGTACGACCTGAAAAGTGTCGATAATGATGGCATCCGGATTAGTGACTTTATCC +CAGCCCTTACCTTCACAGGATGTCGCACCGCGTAGCGTTTCCAGCACATGCTCCTTCAGA +CGAAATCCAATCTGGTCGGACTCTTTTACCGGTTCGCGATCCCAGATACCGTTACTGTTC +GCATCCCACTGCACAATGACACAGTCACCCTGTCCGACAATTTCCAGCCCTTCGCCCGTA +CAGCTGCCATGGCAATAACCCGCCCTCTGGAGATGCTTCGCGACGGTAAATACCCGCAGC +CAGATTTCATCTTCCAGCGCCAGTTTACGGGTGCTCGTTAAACTTTCACGCTGTAACGCA +GGCAGAAAGCGTGCAGCCCCCAGCAACAATACGCTACTGATCGCCATAGCAATCAACACT +TCCAGCAGAGAAAAACCTTGCTCTTTTACAGGCATCCTTCTGTTTCTCCTTGCTGACAAA +GCCGGAGTCTTCCCCACGGCGAAACCACTAGCCACCACTCGCCCGTTGAGTTTTTGAAGC +GAATATGCCCGGCCCATGCGGTATTGCGCAGGCCAAAGAAAGCAAGCGAAGGTGTCAGGT +CGCTCATTTCGACTTCGGGCCAGCGCGGCACAAAGACCAATGGTGAACTGCCATGACAGG +TATTCGCCCCAGCAACGGAACTGCCATGACAGGTATTCGCCCCAGCAACGGAACTCACAA +GGCACCATAACGTCCCCTCCCTGATAAGACTGATACTGTGGTCGCGGTTATGCCAGTTGG +CATCTTCACGTAAATAGAGCAAATAGTCCCGCGCCTGGCTGGCGGTTTGCCAAAGCCGTT +GCGACTGCTGCCAGTATTGCCAGCCATAGAGCCCACTTGCGCTTAGCATGACCAGAATAA +GCATCGCGACCAGCGTTTCAATCAGCGTATAACCACGTTGTGTTTTCATGCCGGCAGTAT +GGAGCGAGGAGAAAAAAAGACGAGGGCCAGTTTCTATTTCTTCGGCGCATCTTCCGGACT +ATTTACGCCGTTGCAGGACGTTGCAAAATTTCGGGAAGGTGTCTCGAAGAATTTAACGGA +GGGCAAAAAAAACCGACGCACACTGGCGTCGGCTCTGGCAGGATGTTTCGTAATTAGATA +GCCACCGGCGCTTTAATGCCCGGATGTGGATCGTATCCTTCAATCTCAAAGTCTTCGAAA +CGGTAGTCGAAGATGGATTCGGGTTTACGTTTGATAATCAACTTCGGCAGCGGACGCGGT +TCGCGGCTTAATTGCAGATGAGTTTGATCCATATGGTTGCTGTAGAGATGCGTGTCGCCA +CCGGTCCAGACAAAATCACCCACTTCCAGATCGCACTGCTGCGCCATCATATGCACCAGT +AACGCGTAGCTGGCAATGTTGAACGGCAGGCCGAGGAAGACGTCACAGGAGCGCTGATAA +AGCTGGCAAGAGAGTTTGCCGTCTGCCACATAGAACTGGAAGAATGCATGGCACGGTGCC +AGCGCCATTTTATCCAGTTCGCCTACGTTCCACGCTGAAACAATAATGCGGCGGGAATCC +GGGTCGTTTTTCAGCTGGTTCAGTACCGTAGTGATCTGGTCAATATGACGACCATCCGGC +GTTGGCCAGGCGCGCCACTGTTTACCATACACTGGCCCGAGGTCGCCGTTTTCATCGGCC 
+CATTCGTCCCAGATGGTGACATTGTTTTCGTGTAGATAAGCAATGTTAGTGTCGCCCTGC +AGGAACCACAGCAGTTCGTGGATGATGGAACGCAGGTGGCAACGTTTAGTTGTCACCAGC +GGGAATCCATCCTGCAGGTTAAAACGCATCTGATGACCAAAAATGGAAAGCGTTCCGGTT +CCGGTACGGTCGTTTTTCTGTGTGCCTTCGTCGAGCACTTTTTGCATCAGTTCTAAATAC +TGTTTCATGGTTCCTCAGGAAACGTGTTGCTGTGGGCTGCGACGATATGCCCAGACCATC +ATGATCACACCCGCGACAATCATCGGGATGGAAAGAATTTGCCCCATGCTGATGTACTGC +ACCCAGGCACCAGTAAACTGCGCGTCGGGCTGGCGGAAAAACTCAACAATGATGCGAAAC +GCGCCGTAACCAATCAGGAACAAGCCTGAGACAGCTCCCATTGGGCGCGGTTTACGAATA +TACAGGTTGAGGATAATAAACAGCACCACACCTTCCAGCAGCAGCTCGTAAAGCTGTGAT +GGGTGGCGCGGCAGCACACCGTAAGTGTCGAAAATGGATTGCCACTGCGGGTTGGTTTGC +AGCAGCAAAATATCTTCTGTACGGGAGCCAGGGAACAGCATGGCAAACGGGAAGTTCGGG +TCAACGCGGCCCCACAATTCACCGTTAATAAAGTTGCCCAGACGCCCGGCACCAAGACCA +AACGGAATGAGTGGGGCAATAAAATCAGAGACCTGGAAGAAGGAACGTTTAGTACGGCGG +GCGAAGATAATCATCACCACGATAACGCCAATCAGGCCGCCGTGGAAGGACATGCCGCCG +TCCCATACACGGAAAAGATACAGCGGATCGGCCATAAACTGCGGGAAATTGTAGAACAGA +ACATAACCAATACGTCCACCGAGGAAGACGCCGAGGAAGCCCGCATAGAGTAAGTTTTCA +ACTTCATTTTTGGTCCAGCCACTGCCCGGACGATTCGCCCGTCGTGTTGCCAGCCACATT +GCAAAAATGAAACCCACCAGATACATCAGGCCGTACCAGTGAAGCGCCACGGGTCCTATT +GAGAAAATGACCGGATCAAACTCCGGAAAATGCAGATAGCTACTGGTCATCTGTCACCAC +AAGTTCTTGTTATTTCGCTGAAAGAGAACAGCGATTGAAATGCGCGCCGCAGGTTTCAGG +CGCTCCAAAGGTGCGAATAATAGCACAAGGGGACCTGGCTGGTTGCCGGATACCGTTAAA +AGATATGTATATGATCCGCGCTATAACCCCCCGCGAATCAACCCGCCCATGCCGCGACGC +TCCATAAAGGCTGCAACCTGATGGCGAACTTCGGTCGCCAGTTGCGCTTCCAGACTACGC +TGCGCAAGATTTTCTGCTTCAGCAAAATCAATGCGCCGCAGCAGGTATTTTACGCGCGCT +ACAGAACGTCCGTTCATAGACAGATGGCGATACCCAAGCCCAATGAGGATTGCCACGCAC +ATCGGATCGCCCGCCATTTCACCGCACAAACGGAGATCGATTCCATGTATTTCCGCTTCC +CGGGCGATCATCGCCAGAGCTCGTAACATTGCAGGATGAAGACTGTCATAAATGTTCGCC +ACCCGGGTATTGTTGCGATCAACGGCCAGGATGTATTGAGTCAGATCGTTGGTGCCAACA +GAGATGAAATCGACCCGCTTTGCCAGATGCGGCAGCATAAATACCATTGACGGCACTTCC +AGCATGATGCCGATACGTGGTTTGGGAATTTCGTAACCGATCATCTCCTCGACTTCACGT +CCGGCACGTTCAATCAGGCGGCGTGCTTCGTCAACTTCATCGAGGCTTGTGACCATCGGC +AACAGAATATTCAGGTTGCCCGTAGCGGCATTAGCACGCAGCATCGCCCGCACCTGGATC 
+AAGAAGATCTCCGGCTGATCGAGCGTAATGCGAATCCCACGCCAACCCAGGCATGGATTC +TCTTCGCTGATCGGCATGTAAGGCAGCTGCTTATCTGCTCCGACATCCAGCGTACGCAAG +GTGACGGGTTTATCATTAAACATTTGCAGCATCCCCTGATACTGCGCCACCTGTTCTTCT +TCCGACGGAAAACCACTTTGCAGCATGAATGGGATTTCAGTGCGATAAAGTCCTATGCCA +TCAATACGGCTGCCCAGTTTTTCTTCATGTTCCGGGCTTAAACCGGCATTGAGCATGACT +TTAATGCGTTCGCCGCTTTTTAACTGGGCGGGTAAATTGACGTCATCTTCCGCCAGACGG +CTAAGCTCGATCTCTTCACTAATTAGCCGCTGATATTCTTGCAGCAGTACCGGTTCCGGA +TCGACCAGCAATTCACCGCGATAACCATCGACGATCAGCGTCCGACGATGCAGTACCGAA +GGCTGAATATCCGCGCCCATCACGGTAGGTATCCCCAGCGCACGTACCATGATCGCAGCA +TGGGAGTTGGCAGCGCCATCGCGCACGACAACACCGACTAAGCGATCCTGGGGCAGCTCA +GCAAGCGTTGTCGCTGACAGTTCATCTGCCACCAGAATGAAACGTTCCGGCCAGGCGTTC +GGCCCTTGATTAGCGTCATCAAGATGAAACAGCAATCGCTGACCCAGCGCACGTAAATCG +CCAGCCCGCTCTTTGAGATAGTTATCGCTTAGCGCGGCAAACTGTTCGGCAAATTTTTCA +ATGACCGTTTTTACCGCCCACTCTGCCACCGAGCCTTTATCAACCTCGGCAAACAATTCG +CGACGCAGCCGGGTATCCGAAAGCAGGTGTGAGTAAAGATCGAAAATAGCCGCCGTTTCT +TTTTGTGCACCGGCAGCAAAGCGTTTGCTATAGCGGCGAAACTCGTTAGCCGCCTCTTCC +AACGCCCCGGTCAGTCGTTCGCGTTCCAGAGCCGGATCCAGCGTTGATGCCTGATACACC +TGTTCCATTAAAGGTAACGTGGCATCCTGCCAGCCTTCGGCAATCGCCACACCAGGTGCT +GCCGGTAATGCACGGATTCGCGTCTGGCGATATTGCCCAAACAAGGCAGTCAACTGCGAC +TGAGAAAGAATAGCTGCCATCTGGGTGGCAAGCGTCACCAGGAAGGATTCTTCACTTTCG +TCATACTGGCGCAACTCTCGTTGCTGTACCACCAGTACACCAAGCAACTGGCGACGTTGA +ATAATTGGTACGCCTAAAAACGCGCGGAAACGTTCTTCTTTTACGGAGGGGATGTATTTG +AAGCTGGGGTGCTTTTGCGCATCTGCAAGGTTTATCGGTTCCGCCAGCCTGCCAACCAGG +CCGACGATCCCTTCATCAAACGCGAGCGTTACAGTGCGACCGCGTGGTTTTTTCAGTCCC +CGGGTCGCCATCAGGTAGTAACAACGTCGATCATGATCGGCCAGGTAGACCGAACAGACC +TCGGTATCCATCGCAAGACAGATGTCGGTAACCAGAATATTTAACGCCTCATTCAGGCGT +GGTGCGCTGGCTACCTTTTCGACTATTTCGCGCAGGCGAGTGAGCATAATTGGCGTGACT +TAACCTCTTTTACGTCGATAAGCAGATGCGTTTTGTGGTTTTGGCGTATTTTCCTGCAGT +GACATCACCACACTCGCGAACTCTTTCATTACCCTACGGTAGACATCACGTTTAAATGAC +ACCACCTGTCTGACTGGATACCAGTAACTTACCCATCGCCAGCCGTCAAACTCTGGTGTA +CTGCTGGTTTGCATATTGATTTCTGCATCGCCGCTCACCAGCTGCAAGAGAAACCATTTT +TGTTTTTGGCCGATACAAACCGGCTTCGTGTCCCAACGCACCAAACGTTTCGGTAATTTG 
+TAGCGCAACCAGTTACGCGTTGAAGCAAGGATTCGAACGTCTTTGCGGCTTAATCCTACT +TCTTCAAACAATTCACGGTACATCGCCTGCTCTGCGGATTCTCCGGGGTTGATTCCGCCT +TGCGGAAATTGCCAGGAGTGCTGACCAAATCGCCGGGCCCACATTACCTGCCCCTGGCGA +TTACAAATCACGATACCTACGTTTGGGCGGTAGCCATCGTCATCAATCACCGGACTACCT +CAAAATAAAGCTTTATATACGAATGATTGTTTCATACTCCAGGAAGACGGTAAACCACTC +TCTGCAGGGCATTACACACTAATAACAATTGAATAACTCACAGTTATGTGCAGAGTTATA +AACAGAGGAAGGGGTGGATAGCCGTTTTTATTCACCTTTTCTGTGGATAGAGTTGTGAAG +AACTACGGAATTACTGCGGGAAAACCCGGAGCATTCTGAATAAGACAGATATAGAGATTT +TAAAATATTCATTATCAGTCAATGCATTACATGTGATTTGAGTAATAAAAAAGAGTAATT +CGTGACCCAGGTCACACCTCTCATTTACGGGTTGGCGAAAGATCAACCAATGCCGTATTT +ATCCACAGAATGTGCCACTAAGTTAAGCACTGAACCACTAAAAACTGGAGTTTCGTCGCA +CGTCAAGGCTGTAAATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGT +GGATAACATGGTGTAAGATCCTGTTTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCA +GTGTTGCGCAACTCGATTACCGGAAACCTAAAAAGCAATATAAATCAGAGAATTGAACAA +CGCATGTGGAAAAAGTTACACTGCGAATATTCGGCACATAATTGCTGTTTGTTTTTTAAC +CAAGGTATCATGACATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAAC +AATTGTTAGCGCAAGCACAACAACTTTCTGGTTATACATTGGGAGAACTGGCGGCACTTG +CCGGGCTGGTTACGCCGGAGAATTTAAAACGCGATAAGGGCTGGATTGGCGTGTTACTGG +AGATCTGGCTAGGTGCCAGCGCAGGGAGTAAACCTGAGCAAGATTTTGCTGCTCTGGGCG +TGGAACTTAAAACTATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACATTCGTTT +GTGTTGCCCCGTTAACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACA +AGCTCAAACGCGTGCTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGC +GTCGCGTAGGATCACCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCG +AAGACTGGGAAGAATTAATGGATATGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTC +GGCACGGGGAATATTTACAGATACGACCGAAAGCAGCGAATGCGAAAGCGCTGACCGAAG +CTATTGGTGCCCGGGGCGAACGGATTCTGACGCTGCCGCGCGGATTTTATTTGAAGAAGA +ATTTCACCAGTGCGCTACTGGCCCGTCATTTTCTGATCCAGTAGCCATCGCTTTGACCTG +CCGCTTTCCGGGCATATAATTACCGCTTCATTTTTTTGGCAGGGCTTTTTAGATGTTATT +TGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTGCTGGAGAT +CGTTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTTCCCACAGC +ACAACGTGCTCATGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGTCTGGCGCT +GCTGGCATCCATCGCCTGGGTTACGCGCCTGACGAATCCGCTTTTTACAATATTCAGTCA 
+GGAAATTTCCGCCCGTGATTTGATTCTGCTTCTGGGTGGCTTGTTCCTTATCTGGAAAGC +CAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGGGCTGAAAACACGCGTTTC +ATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGCCTCGACTC +GGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCCGTGGTAAT +TGCCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAGCGCCATCC +TTCGGTAAAAATGCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTGATTCTGGA +AAGTTTCGACATCCACGTACCGAAAGGTTACATCTACTTCGCGATGTTCTTCTCTATTGC +GGTTGAAAGCCTCAACCTGATTCGCAACAAAAAGAATCCGCTCTGATACTCCGTACGCTC +TCCTGCGGGAGGGCGTACTCACTCCTGTTACCCTCACAGTTTAAGATTTTCCTGCTTTCA +AGATATATAACGTCGGTTTATAAACAGACTATTATCATAGGTGGGCCAAATGAGGATAAC +CGGATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGG +TGTTCCAGTGATTACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAA +CCTGAAATTGATGATGATACCGGGCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATG +CAAATTAACCGTGATGATGTTTCGCAAATTATTGAACGTTAACAAATAAGGTCAGCATCC +GGCTGGCCTTAAGATTTTTCTCTTTCCCTTTTCCCTTCCCTCTGCCATTTTTATATTCCT +TATGTCGTGATTATAAAAAGGAAACGGCTATGCAATATCACCGTATACCCCACAGTTCGC +TGGAAGTCAGCACGCTGGGGCTTGGCACGATGACGTTTGGTGAACAGAACAGCGAAGCCG +ACGCCCACGCACAACTCGACTATGCCGTCGCTCAGGGCATTAACCTTATCGACGTTGCCG +AAATGTACCCAGTACCTCCGCGCCCCGAAACTCAAGGGCTAACCGAAACCTACGTCGGCA +ACTGGCTGGCGAAACATGGCAGCCGCGAAAAGTTAATTATCGCCTCCAAAGTGAGCGGAC +CGTCGCGCAATAATGACAAAGGCATCCGCCCGGATCAGGCGCTGGATCGGAAGAATATCC +GCGAAGCGCTGCATGACAGCCTCAAGCGTCTGCAGACTGATTACCTCGATCTTTATCAGG +TGCACTGGCCGCAGCGCCCAACCAACTGCTTCGGCAAACTCGGTTATAGCTGGACAGATT +CTGCGCCTGCGGTTTCGCTGCTGGATACACTGGACGCACTGGCAGAGTACCAACGCGCGG +GAAAAATTCGTTATATCGGCGTGTCGAACGAAACTGCATTTGGCGTAATGCGCTACCTGC +ATCTGGCGGACAAACACGATCTGCCGCGTATTGTCACCATTCAGAACCCCTACAGTCTGT +TAAACCGCAGTTTTGAAGTAGGTCTGGCAGAAGTCAGCCAGTATGAAGGGGTCGAACTGC +TGGCCTATTCGTGCCTGGGTTTCGGCACGCTGACCGGGAAATATCTCAACGGTGCAAAAC +CCGCTGGCGCACGTAATACGCTCTTTAGTCGGTTCACCCGCTATAGCGGTGAGCAAACGC +AAAAAGCCGTCGCGGCGTATGTTGATATAGCCAGACGTCATGGCCTGGATCCTGCACAGA +TGGCGCTCGCTTTTGTACGCCGTCAACCGTTTGTTGCCAGCACTCTGCTGGGCGCAACCA +CGATGGAGCAGCTGAAAACTAACGTCGAAAGTTTGCATCTGGAGTTAAGCGAAGACGTGT 
+TGGCAGAAATTGAAGCGGTGCATCAGGTTTACACTTATCCGGCACCATAAGATTAACGCC +GGTTAAAACCGGCGTTAAATATTAATGACGGCGCTGCCAGATCCACAGCGCCGTTATTGC +CAGCGCAAACAGCGCACCGAAGCCAATGCCAATGGGCACGACCGGGATGCCTACCATTAC +CGCCAGCGAGTAAATGCCCAGCATCAACAACATGGCGCTGTTTTCGCCAAGGTTTTGTAC +TGCAATCGCATTCCCCGCCCCGACGCTTTTTTTGCCCCGCTCCTGTAGCAACGCATTGAG +CGGAACGACAAAAAAGCCCCCCAGCACGCCAATCAGCATCAACAAAGCATAGGCTGGCAG +CAGCTCGTGTTGCAGGGAGAAAATCAGTACCACCACGCCAATCAAAATCCCGGCTGGCAT +ACAGCGTGACACGGTTTCCAGCGTAACTAACTTCGCTGCCGCACCTGCACCAACCACGAT +ACCAATCGCTACCATCGCGTTGAGATAGGTCGGCGTAGCGTTATCGGTAATACCCAGCGC +CACCGGTACCCACAGCACCAACAGGAAACGCAGCGTGACACCCGCTCCCCAGAATAAACT +GGTGCCCACCAGCGAAAAACGCGTTTCACCATTGCGCCATAGCGAGGTGCAGGCATTCAG +GAAACTGCGGGTCATGCTGATGAGATTCCAGGACTGCCCCGGACGCGCCGCCGCCAGTTT +GGGAATGTAGATATTGGCAACGACCGCGCCACCGTAGGCCAGTGCGCATGCGACCAGGGC +AACCAGAATATGCCAGTCAGCCAGAACACCACCAGCTACGGAACCGAGCAAAATCGCCGC +TATGGTAGACGCTTCCATTAAACCGTTAGCTTTTACTAACTTACTACCCGTGGTTAATTC +GCCGAGAATACCGTATTTCGCCGGTGAATAGGCTGCAGCACCAACACCCACCAACGTATA +GCCGAGAAACGGATTGATACCAAAGCAGATACTGGCTGCGCCCAGTAGCTTCAGGCCGTT +GGCAAACATCATCACCCGGCCTTTGGCGAAGCTATCCGCCACCTGCCCGACAAACGGCGC +AAAAAGAATGTAAGCACCTACAAACACCATTTGCAGGATGGGCTGGCTCCACTCCGGATA +GAACTGCGCTTTCAGTAACGCCAGAGTGGCAAACAGTAGCGCATTATCGCCAAACGCAGA +GAGAAACTGCGCCACGATAACCGCTTTCATCCCCTTCGACCACAACGAAGTGTTAGTGTG +CACTGACTCACTCATCGTGTTGTTCCGCTTCGTCTACCCAGCTTTTCAAAGTGACAAAGT +CAGGTTTGCCGCTGCCAAGTAATGGCATCTGTTTCAGATAGCGAATATCGCGCGGTACAG +CAAGCTCCGGCACGCCGTGCTCGCGGGCATACTGTTGTAACTTATCGCGCGTCAGTTCGT +TATCTGTGGTGAAAAGCACCAGTGCCTCGCCTTTGCTGGCATCGCTCTTAATCGCAGTGG +CATGGACTTTATCTGGCGAAACACCAAGTGCCAGTTGTTCCACCATTTCCAGCGACACCA +TTTCGCCTGCAATTTTGGCAAAGCGTTTTGCGCGGCCCTGAATCTGCACAAAGCCCTGCT +CGTCAAAACGCACAATATCGCCAGTGTCATACCAGTCGCGCTCCATTTCGCCGCGAATAT +TCTCGGCGGTGGGCACTTCCAGTACACCAGGCTTCTCCACCCGCAGATAGCCGTTCATTA +TGTTCGGCCCTTTCAGTTGCAGGCGTCCGCCCTCTTCGATACCAGGAACCGACAACAGGC +GCGCATCCATTCCTGGTAGAATACGCCCTACCGTACCGGGTTTCGCCGCCATCGGTACGT +TGATAGAAACGACAGGCGCGCATTCGGTCACACCGTAGCCTTCAAGGATGCGCAGGCCAA 
+ATTTATCCTGCCAAAGCTGTTTAGTACTTTCTTGTAGTTTTTCTGCGCCTGCCACCACAT +AGCGTAGACGATAGAAGTCATACGGGTTGGCGAAACGCGCGTAGTGACCGAGGAAAGTGG +AGGTACCGAACAACACGGTGCAACTGCGGTCATACACCAACTCCGGCACAATACGGTAGT +GCAGCGGGCTTGGATAAAGGAACACTTCTGCACCTGTGAGCAGTGGCGTAAACAGGCCTA +CCGTCAGCCCAAAGGAGTGAAACAGCGGTAACGCCGACATAAAGCGATCGTTGGTGGTGA +AGTCGGCAATCGTTTTAATCTGCTCGACATTCGCCAGAATGCTTTTATGGCTATGGACGA +CGCCTTTCGGATGGCCTTCAGAACCGGAGGTAAAAAGGATCAGCGCCTCTTCTTCCGGCT +GCTGTTTAACCTGTGCCAGACGCGGCATCAGCAAATGAGCGAAGATCCATACTTTGTCGG +CAGTGGTGACATCTGCTTTTAAATCTTCCAGATAGACCCAGCGCACCTGAGTAAGTTGCT +CCGGCAGATGCCAGAGTTTGCCTTTATCGAGAAACTGACGGGAAGTGAAAATGGTTTTGA +TTTCAGCCGCCGTAATAGCACTGGTCAACCCTTTTACCCCGGCGGTGTAGTTCATCATTG +CGGGAATGCGGCGACGGGCGATGGCCCCAAAAATCACTGCAGCACTGATGCCTGCATTGG +GCAGCATTAAGCCGATGCGTTCGCCTTCAACACTGTATTTTTCAAGGATGCGTCCAACAA +ACAGCGTTTTCGTAAGCAATTTGCGATAGGAGTCCGGGGTAAAGTTAACGTCTTCGACAC +ATTTCTTCCCGGCTCCGAAGCGGTACATTGCGCTCAGTAAAGATTCGTACAGCGTTTCAC +GCGGGCGCACCGCCATACGCGCTTCCATCATTATTTGATGCAGCATTTCGCCAGCGATTT +TGCGACGGTCACGGGCACGCGGCGCATCCGGCATCTCCACCTGCGTTGGTGGCAAAATAT +GCAGAGTAATTTGCGGGAACAAGCGACGTTTAACCAGACCTTTCAGGCGGCTGAAGTGCG +TAAGTTCCGCCCCTTCAATACGCACAGGAATAACCGTTGCACCAGACTTCGCCGCGACAA +ATCCCGCGCCATCGTAGATTTTCATCAGCGAGCCAGTGGTGGTGATGCGTCCTTCAGGGA +AAATCACCACTGGTCGGCCCTGTTCCACCAGACGTACCAGATGTTTAATCGCCATAGGTT +GCGTCGGGTCGAGAGGAACAAAGTCGATAAATGATTTCAGCCAACGCATATACCACTGTT +GGCTTATTGAGGTGTAAACGGCAAATACCGGACGTACGGGTAAAAACAATGCCAGCAGTA +TGCCATCAATAAAAGAGACGTGATTAGGCGTAATTAGAACGCGCTCGCCCTTCAGTGCCT +TGGTGTCACCCGTAACGCGAACGCGATACAAAACACGGCACAAATTTCGAAAAAAGCTAA +AAAGCATTCCAACTCCCTTTGCTCTGATTCAGTAAAAGCGAATGGAGGGAGATTACACGA +GATAAAGAACGCGAGCGACAGTAAATTAGGTGCGAAAAAAAACCTGCGCATCCGCGCAGG +TTGGTGCAAGAGACTGGGTACGAAGAGCGTACCGAATAATCTCACCAATCAATACCTCTG +GGATCTTGATTGTGGTCTGCACAACGACTCTTCGCCAGCGAGAAAACGCAAAGGAATGAA +GGGAAATGCAACGAGGTGTGTAAATTGTCGGTTACTGTTACAGATTGATGACCGGCAAAA +AAAAACCTGCGCATCTGCGCAGGCTGGTGTAATTCATGTGCTCAACCCGAAGTTGACTTC +ACCTATCAATACCTCTGGGATCACCACTTTAGCAACCTGAAGCCAAACGCCACCAGCGGT 
+CAATCGCAACAGCGTTTCGCAAAGTGTAACCAAAGGTTTGCAATCTCTTTTTTTGTCTTA +CTTATTTGCGTTTGGCTCACATTCCCACAATGAAAACACGCCGCCCCTTGAACCAACGGG +CGTTTTCCGTAACACTGAAAGAATGTAAGCGTTTACCCACTAAGGTATTTTCATGGCGAC +CATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGCGTCATTAA +TAATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATGGAGTCTCT +TAGCTATCACCCGAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAAACGATCGG +TCTGGTCGTTGGTGATGTTTCCGATCCGTTTTTCGGCGCAATGGTGAAAGCGGTCGAACA +GGTGGCTTATCACACTGGTAATTTTTTATTGATTGGCAACGGTTACCACAACGAACAAAA +AGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGCTGCGCTGGTTGTCCATGC +CAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGTATGGTGCT +GATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGATCGTTACGG +TGCCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGTTATCTGTG +CTCTAACCACTCTATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGATGCCCTTGC +TGAAAGTGGTATTCCGGCCAATGACCGGCTGGTGACATTTGGCGAACCAGACGAAAGCGG +CGGCGAACAGGCAATGACCGAGCTTTTGGGACGAGGCAGAAATTTCACTGCGGTAGCCTG +TTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAATGATAATGGTATTGATGT +ACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTATGTGCGTCC +GCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCCGAACTGGC +TTTGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGTCCGACGCT +GGTACGTCGCCATTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCAACCAGCGA +CTAACCGCAGTTAAAGCAATTCCAGCGCCAGTAATTCTTCAATGGTCTGGCGACGGCGAA +TCAACCGCGCCTGACCATTATCAAACAGAACTTCTGGTAACAGCGGACGGCTGTTGTAGT +TGGATGACATTGATGCGCCATATGCCCCTGTATCATGCAGTACCAGATAATCACACGCCT +TCACTTCCGGCAAGGCGCGGGTTTCAACATTTCCCCCTTCCTGCTGGGTAAAGACATCGC +CCGATTCACATAACGGCCCGGCGACGACGGTTTCCACCGTTGGTGCGTGTTCCAGAGAAC +GACCATCAGCTGCCAGGGCACTGATATGGTGGTAACTACCGTACATTGCCGGGCGCATCA +GATCGTTGAACCCGGCATCAACCAGCACAAAGTGGCGGCTACCCATTTGTTTGACGCTCC +GCACTTGAGTAATTAATACGCCAGCCTGCGCTACCAGAAAGCGACCCGGTTCAATTTCCA +GTTTCACAGGATGGCCCAAATGGCGGGCGATTTGCTCACGCGCGGCATTCCACAGACCAT +AATAATGTTCGGTATCAACCGCCTCTTCACCCTGTTGATAAGGAATAGAAAGCCCACCGC +CCGCAGAAATAGCCTGTAAATCCTGACCGAATTCGAGGACCTGACGCACCATAGCACCAC +ATACCTGTTCCAGATGGGCATAATCGACGCCAGAACCAATGTGCATGTGAATGCCGACCA 
+GCTGTAGATGATGACGTTGTATCACGTCCAGTGCGGCGGGCAGATCGGTGTACCAGATAC +CGTGCTTGCTGTTTTCGCCACCGGTATTGGTTTTTTGGCTATGCCCGTGACCAAACCCCG +GATTAACACGCAGCCATACCCGATGCCCTGGCGAAACCTGACCCAGTTGGTCGAGCATAT +CAACAGAACCCGCATTCACCGGAATTTGCAATTCACTGACGCGTTCAAGCGTCGCCTGAT +CGATAACATCTGCCGTAAAAACAATATCATCGGGGTGCGTTTGCGGATTGTAACCCGCCG +CCAGTGCACGCTCTATTTCGCCTAACGAGACGGAATCCACTTTTACGCCCTGCTCACGCA +TTAAGCGCAAAATATGAATATTGGAACAGGCTTTCTGTGCAAAGCGCACCACATCAAACT +GTTTCAGCGCTGCAATCTGCCGACGAATAATTTGCGCATCGTAGACCCACACCGGGCAGC +CAAATTCTGCGGGCAAACGCAGCAGATTTTCGGCGGTGAGATCGGTATCAGTGCTGAACA +GTGAATGTGGCATAACAAACTCCAGATAAGTGCTTTTTTATGATTACGCCACATCATAAA +AAGAATAAAAAATATCGATTTATGTCGAGTCTATGCAAAAATGATATGGATTACCGGATT +GCGAGAGAGCGCTAATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAA +TGACCGCCGGAAGCCTGACTGAGGCGGCACACCTGCTACACACCTCACAGCCAACCGTCA +GCCGCGAACTGGCGCGCTTTGAGAAGGTGATCGGGCTGAAATTGTTTGAGCGCATACGTG +GACGATTACATCCTACCGTGCAAGGACTGCGTCTGTTTGAAGAAGTGCAACGATCCTGGT +ACGGACTGGATCGCATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGGGAGAAC +TGTCTATTGCCTGCCTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCT +TTCTGGCACGTTATCCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTG +AAGAGTGGCTCTCGGCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTG +CGGGAACAGAACGTACCGAATTACTCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCC +ATCCGCTGGCGGTAAAAAAGGTATTAACGCCGGATGATTTTCACGGTGAGAACTACATCA +GCCTTTCCCGTACTGACAGCTATCGCCAGTTGCTGGATCAATTGTTTACTGAGAATCAGG +TTAAACGACGCATGATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGGTACGGG +CGGGGGTAGGCGTTTCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTT +TAGTGGTGCGGCGGTTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGC +ACCGCCCGTCATCAGCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGA +AACTGGTCACTTCTCTTGACACTATTTTGTCGTCAGCTACGACAGCATAAAAGCGACAGC +ATCCTCGGCATGGATCGCCGCGGTATCAAACACAGGCAGAACACTGCGCTCTTCTGGCAC +CAGTAAACCAATTTCTGTGCAGCCAAAAATGACGCCCTGTGCGCCCTGTTCTGCAAGGCG +AGCAATCACTTGCGCATAATAAGCGCGTGACGCTTCGGTAAATTGCCCCAGACACAGTTC +TTCAAAAATAATCTGATTAATTTTCGCCCGTTCATCCGCTTCAGGAATAAGACAGTTGAT +GGAAAATTGTTCCGTCAGCCGCCCGCGATAAAAATCCTGTTCCATGGTGTAACGTGTACC 
+CAGCAGCGCCACACGAGTCATTCCTGCCCCGGTAATTGCACGTCCAGTGGCATCCGCTAT +GTGTAAGAAAGGCAGAGAGCAACGAGACTCAATGGCATCCGCCACTTTGTGCATCGTATT +GGTGCATAACACAATACCTTCTGCGCCCGCCCGCTGTAAGCCAAGCGCCGCCTCAGCCAG +AATATCCCCGGTTTTGTCCCACTCACCGCGACGCTGGCACTCTTCTATTTCATGAAAATC +GACGCTATGTAGCAGCACTTGCGCAGAGTGAAGCCCACCAAGCCGCTGTTTAATGCCTTC +ATTTATCAGACGATAGTAAGGAATAGTGGATTCCCAGCTCATTCCTCCCAGCAAACCAAT +TGTTTTCATTCCTCTCTCCTGATGTGTGTTACCGCAACAAGGCTGAATAAGGAACGAGAC +AAACGCCTCAACGGCCAGGTGCCCAATCTCTATTAACGAAAAAAGGGCCGGATGTACAGC +ACATCCGGCCCGTGAAATCAGACGCCGATATTTCTCAACTTTTCGCCTGCCATCAGTTTG +CGCTCGATATGTTCCAGCGTGACATTTTTGGTTTCCGGAATGAGCCAGAAAGTGATGCCC +ACAAACGCAATGTTCAGCGCAGTGTAGAGCCAGAACGTACCGGCAGCGCCAATGCTATCA +AGCAGTGTCAGGAAGGTCGCGCCGATAATCATATTCGACACCCAGTTTGTCGTCGTTGAG +CAGGTGATGCCAAAATCGCGGCATTTCAGCGGCTGAATTTCAGAGCACAAGATCCACACC +ACTGGCGCGGCGCTCATCGCATAACCGGCAATACACATCATCGTCATGCCAACAGAGAGC +CAGGACAAGCCACTGGAAGCCGTACCGTTATCAAACTGCATCAGGCAGTAACCCAGCACC +AGAGTGCCTAACGCCATCACGCTGAAACCAATTTTCAGAGCCGGCTTACGCCCTGCTTTA +TCTACCGTAAAGACCGCAATGAAGGTAGCGAACATAAAGGTCAGCCCCACGACCAGAGTC +GCAATCATCTGTTGTTCTGTGGTCGTAAAGCCCGCCATTTTGAAGATACGTGGCGCGTAG +TACATGATGATGTTCATACCGGTAAACTGCTGCATCGCCTGCAACAACATACCGAGAAAT +ACAGCACGACGGACGTTACGGTTGATCTTAAACAGTGCCCAACCGCCCTGTTTTAACTTC +AGGCTTTCACGAATTTCGTTGAGTTCTTCTCGCGCTTTTTCCGACGTATCGCGCAGCATA +CGCAACACTTCTTCCGCCTCAATATGACGCCCCTTTTCCGCCAGCCAGCGCGGGCTATTT +GGCAGGAAGACCACCAGAATAATCAGCAGGACTGCTGGTAAAGCAAGAACCCCCAACATT +GCGCGCCAGTTACCGCTATAACTGAACGCTGTATCGGATAAAAACGCCAGCACGATGCCG +AGTGTGACCATCAACTGGTACATGCTGATCATCTTACCGCGAACGTTTTCACTTGCCATT +TCAGAAAGATATAGAGGAGCGGTGTAAGACGCGATCCCAACAGCAATGCCCAACACCACA +CGAGCGGCGATTAACATCTCTACGCTGGTCGCAAAAGCGGACCCTATCGAACCGAGTACA +AACAGGATGGCCCCCGCCATCAGGCTGTATTTACGCCCCAGGCGGAACGACAGCCACCCA +TTAAACAGCGCACCAATTGCTGCGCCGAGCATCATGCTACTGACCACCCATTCCTGCAAA +CGGCTGGTCAGCACAAAGTGATCGGTAATGAACGGCAACGCTCCGGCGATTACGCCGATA +TCAAGACCAAATAACAATCCTGCGACCGCAGCAGCTACCGAAACAAACATATTCATACGC +CGCGTATCCCGCAGAGGACGTGGCGTTAAAGCAGATTCCGTATTGATAGTAACCATTTTT 
+TCCTGCCAGCAGAGAGTAAGACATAGTGAAAAAATACGTGAACAATTCACACAGGTGTCA +GGTCGGAAATAGCATAAATATGGATTAAATTGCTACGACATGTCGTTATGTGATGGATAT +TCCAATTTTCAAATTAAGTTGAATTATTGAGATTATTATTAACTACCTAATTTTAAAGCA +GATAAAATTCATAAAGTTCATTAATTGATAATTGATATGGATTATTTCATAACCATGATA +TGGATTATGATGATCTACAGGTATAAAAAACCCTGCCATGCGGCAGGGTCATAAAAGTAA +GAGGAATGAATTAACGCGCCAGCCAACCGCCATCCACAGCAATGGTATAACCATTTACAT +AATCTGAAGCGCTGGAGGCAAGAAACACTACCGGCCCCATCAGGTCACTCGGCAGTCCCC +AACGGCCAGCTGGAATGCGGTCGAGAATTTCCGCGCTACGTTGTTCATCTGCCCGCAGTT +GTTGAGTATTGTTGGTCGCCATGTAACCCGGAGCTATCGCATTAACATTAATGTTGTGTT +TAGCCCATTCGTTCGCCATCAATCGCGTCACACCCATCACGCCGCTTTTTGATGCGGTAT +AAGAAGGCACACGGATCCCGCCCTGGAAGGAGAGCATTGACGCGATATTGATAATCTTGC +CGCCATTGCCTTGCGCGATAAAGTGTTTCGCCGCTGCCTGAGACATGAAGAATACGCTCT +TGATATTCAGGTTCATGACATCGTCCCAGTCTGTTTCGCTGAACTCGAGAGCGTCTTCGC +GGCGAATCAATCCGGCGTTATTCACCAGGATATCAATATGACCAAACTCCGCTACCGCGC +GATCCAGCAGTCCAGGAATGCCATCAATCTTTCGCAGATCGGCGGTCAGGCTTAAAAAAC +GACGCCCCTGCGCCGTGACCTGCTTGATGGTTTCAGTCGGTTCAACGATGTTAATGCCAA +CAATGTCACAGCCCGCTTGCGCCAGCCCCAACGCCATCCCCTGGCCCAGCCCAGTATCAC +AACCAGTGACGACCGCAACTTTACCTTCGAGAGAAAATGCATTTAAAATCATAACAATAC +CTTATTCGTTTATGCCCACAACTAGCGCAAATCTTTAACGGCCACATGGTCCATATCATC +AAAAACCTGGTTTTCACCGACCATGCCCCAGATAAAGGTATAAGCTTTGGTTCCGACGCC +GGAATGGATCGACCAGCTCGGGGAGATCACCGCCTGCTCGTTATGCATCACAATGTGACG +CGTTTCTTGCGGTTGCCCCATCATGTGGAAAACGCAGGCGTCATCATCCATATTGAAATA +GAAATAAACTTCCATCCGGCGCTCGTGGGTGTGACACGGCATGGTGTTCCACAAGTTACC +TGGAGCCAGCTCCGTCAGCCCCATACTCAATTGGCAGGTTTCCAGCACATCCGGGACAAA +ATATTTGTTAATCGTGCGACGGTTACTGGTGAGGTTATCGCCTAACGTGACTGGAGATAC +TTCGTCCGGTGTGACTTTTTTGGTGGGATACGTCGTATGCGCGGGTGCGCAATTGTAATA +AAACTTCGCCGGAGTGGCGGTATCAATACTGGCAAAGACAACTTCTTTTGCACCTTTACC +AACATACAGGGCGTCGCGGTGACCGATTTCATAGCATTGACCATCGACAGTAATCGTACC +GGCACCGCCAATATTGATAACACCTAACTCGCGACGTTCAAGGAAATAGCTTACGCCGAG +TTGTTTACCAACTTCCCCGCCAACGGAAACCGTTTTAGTTACCGGCATAATGCCGCCAAC +AATAATACGGTCAATGTGGCTGTAAACCATGGTGTACTCATCGGCGACAAATACCTTTTC +AACCAAAAATTCATTGCGCAGCCCCTGGGTATCCAGCGTTTTTGCGTGCGCACTGTGGAT 
+GCTCTGTCTTACGTCCACATCAACCTCCGATAATCAGTGAAGCGTGAAAATAGAAAACAA +TAATAAAACACTGTTTCGTTTTCTCTATGAGGGGATGATATGCCCATGGGATAGGGTTTT +CAATTAAAAATAAAACAATGTTTCATTTTCAAGTTAAGGATTAAAAAAAGTGCAGTGTCG +ATCACGAATATGTCATGAGAATGGAAAAATCAGGGAGCCCTGAAAAGGTATGTCGACTCA +CCAGCCATCATTATTCAACAGATTAATGACGGCAGATATTTATCGGTAAGGAGGAAATGC +AGAGCTACTCGTCACGTTCAATGGTCAATGCCACACCCTGGCCCCCGCCGATACAAAGCG +TTGCCAGTCCTTTGCGGGCATTACGTTTCACCATTTCATGAACAAGAGAAACCAGGATTC +GGCAACCGGAAGCGCCTATCGGATGACCGAGTGCGATCGCACCACCATTGACATTGACCC +GACGCTCATCCCATTCAAGCATCTTGCCAACCGAAAGCGCCTGTGCAGCAAACGCTTCAT +TAGCCTCGATAAGATCGACATCAGCCAACTGCCAGCCAACACGCTCCAGGCAACGGCGGG +TCGCATACACCGGCGCAATTCCCATCAATGCCGGATCCACACCAACGCTGGCAAATGCGC +GGATGCGGGCCAGCACGGGTAAATTCAACGCTCGTGCTTTGGCTTCGCTCATCATCATTA +CTGCAGCTGCCCCATAGTTTATGGATGATGCATTACCCGCTGTCACAGAACCGAGACTAT +CAAATGAAGGATTTAAACGGGCTAAGGCTTCTGCGCTGGTGTCAGTGCGTGGCTGTTCAT +CGGTATCAACAACCAACGTCTGACCGTTACTTTGGGTTATTACCGGGACGATCTCATCTT +TAAATCGTCCGGCGTCAATCGCCGCTCGCGCTTTTTGTTGCGAGCTAAGTGCGTAAGCAT +CCTGCAACTGACGGCTGATGCCATATTCGCGAGCCAGATTTTCGGCGGTGACACCAATAT +GATAATCATTGAAGGCATCCCACAACCCATCATGCACAAGACTATCAACCAACTGGCTAT +TGCCAAGCTGTGCGCCGGTGCGGCTATCAGTCAGAACATGTGGTGCGCGGCTCATGTTTT +CCTGGCCACCGGCGATGACAATATCAGCCTCGCCACACTGTATCGCCTGAGTAGCCAGAT +GCAGTGCTTTAAGCCCGGAACCACAAACGTCATTAATAGTGATTGCAGAAACGCTATTAG +GAAGACCACCTTTAATAGCCGATTGCCTTGCCGGATTCTGCCCTGCCCCTGCAGTCAACA +CCTGACCAAGAATCACTTCATCCACCGCATATGCAGGAACGCCGGTACGTTCTATTAACG +CTTTGACGACCAGGCTGCCAAGTTCCACGGCGGAATGACCCGCTAACGCACCACGAAAGC +AGCCGATAGGTGTCCGTAACGCCCCGACAATCACAACGTCTTTCATCACAACCTCGCACC +AATTAACAGTGCAATAGTAAATGATTGTTAATTACAGTTATCTTAATTGTTTAAAAAAGG +TGATTTTTATCACAAAGGAAATACGCCTGAGTAGCAGTCAGAGACATAACTGGCACGTAA +GGTTTGCAACCACTAACCCACCAATAGAGAGGTAGATAGGGCGTTAATCTCCCATACTTA +ACCTGGTTTATGGTAAATTGCCCTCCATTTTGTTTAATTTGTAGATGATACGTTCAGATA +ATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCC +GTTGGTGCAGGCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTG +TTTATTACTGCTCTGGTCGCCTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAG 
+TTCATCCTCTCATCGAAAACATCAGCAGGTGAAGGGATAACGGGCGCGGTAACACACTAC +TATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACTTCATCGCCTTTTTTGTCGTC +GTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGCAAAGCATATG +GTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTC +ATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTG +ATTGCCTATTTCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTA +ACAACCCAGGTAGAGTTCAATCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTG +ATGGTTTTCGCTTTTAGCCATACGCCCATTATTTCTACGTTTGCCATAGACAGACGTGAA +AAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTATGAAAGTCGCTTATCTCATC +ATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCCACCTTCGTAT +ATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAAC +GCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCA +TTCCTGGGTACGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTA +CAGCAGGTTGGTGTAAAGAAAAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTA +TCGCTGATTACCTTCATTGTTTGTTGCATTAACCCGAACGCGATTTCGATGATTTACGCG +ATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGCCTACGCTGTCAACGTATCTC +ATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGATCGTGGGTATC +CTGTGCGTATCGGTAATGTTCTTTAGCTAATATCCGTTGTGGATGGTTCAAAATTGCTTC +AATTTTGAACCATCCCAGTTTTCATAATGTTCATTTGTTATTATTCCGCCCTATCACTTC +TCTCGTAATATTATATAATTATCAGCTAGTTAAACACACAAAGAGTTCTGAACATCTTAA +ATAAGACTATTTAAGATACATGACGATTGCATTGCGTAAACGCTTTTTATTTACAAAAAA +TGGGGAAGTATTACGGCGATTGCGAAAAGTCTGAAGCGCTTGAATTAAGATAATATAGAA +AATCAGATACAACAAAAATGGCAGGTAGATGATGTGAAGATAAATTGGAGCGGGCGAAGG +GAATCGAACCCTCGTATAGAGCTTGGGAAGCTCTCGTTCTACCATTGAACTACGCCCGCT +TCGAGATGCGTAAGGCATTATAAACCTTACGCTCTCCTTAGCAAGTACCACGCTGCTGAC +TGCTGATTAATTCACCATCAGCATTTTGGCTTGCTGCCCTGAGGCGGCAAGTAACGTAGC +GGATCAATTGCCGTTGCACGGTAACGAATCTGGAAATGCAGGCGAACAGATGCCGCATCA +GTGCTCCCCATGGTGGCGATTTTTTGCCCAGCTTTCACGCTTTGCCCATTATTTACCAGC +ATCGTGTCATTATGAGCGTAAGCCGTAATGTAATCTTCACTGTGTTTAATCATGATGAGA +TTACCGTAGCCACGCAGCTGGTTGCCCACATACACCACCTTTCCTGCACCCGCGGCGTAA +ATAGGTGTACCCCGTGGAGCTGAGATATCAATTCCTTTATTGCCGCCATCTGCTGTCGAA +TACGGCATGATAACTTTCCCTGTCGTTGGCCATAACCAACAACGTTGCCCTACTGGCGGC 
+CAGGAAGATTTCGGTACCGCTGATGACGGTGTAACCGATGCGGTTTTGGTCGTTGATTTG +GCGGTTGATTTACGTGTACTACTGCTACTTTTCGCCCCACCCAGTTTTAGTTTCTGACCT +ACTTCAATGGTGTAAGGGGGGGAAATGCCGTTCAGTCGCGCCAGTTCTTTTACGCTGGTT +CCCGTGGTGCGCGAAATACGATATAGCGTATCCCCCCGTTTCACGGTGTAAACGGAGCCG +GAATACGTTCCTGTATCGGATGATTTGCTACCCGAACAGCCCGCCAAAAGCAGTCCAACC +GATAACAACATCACGATACCCAGAGATTTTTTATTCAGGCGTCCCGCACTCAAAATCTTT +CCTCGCTTAAAAAACAAGACGCCATATCATAGCAGCCGGCTTCTGGATACCCAATCTCTT +GCTTCTGGAAAAGCGATGTAATAGAGAAAGAGGTTAATTTCATTTGGCAAAGGGAAGTAT +CATCAGCAAAATATTTGCTGTAGTGGTATCGAAGTTCCTGACTTTTACCCTATTTCCCAC +CTTGATGCGTAATAATCCTAATTTATCACATTGATTTTATCGCCACTCATATTGATACGT +ATCACTGTCCCTATTCAGAGTCCTGTTTCGTATCATATCTGTGTTTTTTTAACGTCATCA +CACTTCCTTCCTCCCCTCACGCATATAGTCGTTTCTGGCGTAATTCTTGCCTGCTAAGAC +TAAATCTTTGCCATAAGAACCAAATGTTCAAACCGAGGGGATTTCTATGGAAGCGCGGGA +AGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCTAAGGTCACCGGGCG +GGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCGAAATATGTACGTAG +CCCTATCGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCCAGGAGTTTGCCGGG +CGTCCTGGCGATTTTTACCTGGGAAGATGTGCCAGAAATCCCATTCGCCACGGCAGGGCA +TGCCTGGACACTTGACGAAAACAAGCGCGATACCGCCGATCGCGCACTGCTAACTCGCCA +TGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGTGGCCCGCGATGAACTCACGGCAGA +AAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTTATCACCTCGCCAGA +AGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAATTTACTGAAACAAAG +CACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGCCGACTACCAGGTACAGGG +GCACTATCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTGACATCGCTGGCATG +GATGGAGGATGACTCGCGAATTACCATCGTTTCCAGCACCCAGATCCCGCACATTGTTCG +CCGCGTGGTTGGTCAGGCGCTGGATATTCCCTGGTCATGCGTACGAGTCATCAAACCGTT +TATCGGTGGCGGTTTTGGTAATAAACAGGATGTACTGGAAGAGCCAATGGCGGCATTCCT +GACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGTGAAGAGTGTTTCCT +CGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGCGTGAACCGCGACGG +AACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCTTATGCATCTCACGG +GCACTCCATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTATCCTCGTTGTGCCTA +CGCTTACAGTTCAAAGACCTGCTATACCAACCTCCCCTCGGCTGGTGCGATGCGTGGTTA +TGGCGCGCCACAAGTCGTATTTGCCGTTGAGTCTATGCTTGATGATGCCGCGACAGCGTT 
+AGGTATTGATCCTGTTGAAATTCGTTTACGCAACGCCGCCCGCGAAGGAGATGCTAATCC +GCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTTGAAAAAGGCCGGAA +AATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAAGGCAATTTACGTCG +TGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCTGTCGGCGTAGAAAT +AGCAGGCGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTGCAAAGCGGCGCGAC +GGAAATCGGTCAGGGTGCCGACACCGTCTTCTCGCAAATGGTGGCAGAAACCGTGGGGGT +TCCGGTCAGCGACGTTCGCGTTATTTCAACACAAGATACCGATGTTACGCCGTTCGATCC +CGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGCGCCTGCGCTGCGCAGTGCGGCACT +GTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACATCAGTCAGCGATGAA +TCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAAGAACCGTTAATGTC +GTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGCGGGCAGCTCTCTGC +TGAAAGCTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGTACATTTGTTGATCT +GACGGTCGATATTGCACTGTGCAAAGTCACCATCAACCGCATCCTCAACGTTCATGATTC +GGGGCATATTCTAAATCCGCTGCTGGCAGAAGGTCAGGTACACGGCGGAATGGGAATGGG +CATTGGCTGGGCGCTATTTGAAGAGATGATCATCGATGCGAAAAGCGGCGTGGTCCGTAA +CCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCACAACTGGAAAGCGC +GTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCACTGGGTGAGCCACC +AATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCTACCGGTGTTGCAAT +CAATACACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCATCTGGCAGGATTGAT +TTGAGGATAACATCATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATG +CCATCACCCTGCTGGCTGACAATCCGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTAC +TGATACAGCTTCACCATCACAATGACCGCTATCGCCATATTGTTGATATCCACAATCTGG +CAGAGCTTCAGGGAATAACACAGGCGGAAGATGGCGCGCTGCGAATCGGCTCCGCGACAA +CATTTACTCAGCTCATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTATGTGCTG +CGGCTGCATCAATCGCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTT +GCAACGGTGCCACCAGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGG +AGCTCCACTCCCCACGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGG +GCAAAGTGTCTCTTGAGCATGACGAAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGA +AAGAACACGCGGGCAGCGCACATTTTAAATATGCCATGCGCGACGCAATGGATATTTCAA +CAATTGGCTGCGCCGCACATTGCCGACTGGATAACGGCAATTTCAGCGAATTACGCCTGG +CATTTGGTGTTGCCGCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTGCACAAA +ATGCGCCATTAAACCTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCG 
+CCCCGCGTTCTTCATGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGA +CCAAAAAAGTGATTAGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGAATCACAG +CGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTTCACGCCGCGCC +AGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTCAAACAAGGTTG +CTGCGTAGGCGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCGATAGACAGTTG +CTTATTCCTTGCGGCCTGGGCTGAAGGAAAAGAGATCCGCACGCTGGAAGGTGAAGCGAA +AGGCGGTAAACTTTCTCATGTCCAACTGGCTTATGCGAAATCTGGTGCAGTGCAATGCGG +GTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAATGCTGGCGAAACCACGCGAGAA +GCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGTCGCTGCACAGG +GTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAAAAGGATATCCG +GCCTGAATTCAGGCCGGATTCTCAGAGGTTATGTGTTTAACAACTCATATTTCTTAATCT +TGCGATAGAGCGTAGCAATGCCGATGCCCAGTTCATCAGCAACTTCCTTCTTGCTGTTAT +GACGTGAAAGCGCCTCGCGGATCATTTGCTTTTCCATCTCCTCCAGCGCCGTGCCGCCCG +CATCATCGAGTGACAGGTGCGCCTCACTGACCTCTGTTACATCACTTTGCTCCGTTGTGC +CATTATTCAGCAGATTTGGCGGCAATAGCGTGCTGTCGATAACTTCACCTGAAGGAACAA +CGTTAACCAGATATTCCATCAAATTGCTTAACTCGCGCAGGTTTCCGGGCCAACGATGCT +TACGCAATATTTCGACGACATCAGGAGCAATGCCAGGATAAACCGATCCCAGACGACGGG +TATGCAGATGTAAAAAGTAATGCACCAGTAATTCAATATCTTCCTGACGTTCACGCAGCG +GTGGAAGAGTTATCGGGATAACATTAAGTCGGTAGAAGAGATCTTCGCGGAATTTACCTT +CGGCAATGAACTGGGCCAAATTCTGATTAGTTGCAGAAATGATGCGGATGTCGACTTGTA +TTGGGCTACTGGCACCAATCGGCAGAATTTCACGCGCCTCAATAGCGCGCAGTAATTTAG +CCTGCAACATTAATGGCATATCACCAATTTCATCGAGAAACAGCGTGCCCGTATTCGCCG +CCTGAATCAACCCTGTTTTACCGTTGGCAGAAGCGCCAGTAAATGCGCCTTTAACATAAC +CGAACAGTTCGCTCTCCAGAAGCTGTTCCGGAATCGCAGCACAGTTGATAGCAATAAAGG +GTTTATTCCGTCTTCCGCTCAACTTATGGATTGCACGGGCGACGACTTCTTTACCCGTGC +CGCTTTCACCAACCACCATAACGCTGGATGGGCTGGGTGCAATACGGCTAATGAGTCGTT +TTAATTGCCGCATAACACGGCACTCGCCAACCAATTGTTCAATATGCGGTTCATCAGGTG +CATTTGCTACAGAAAAACTGGTATGCGATTGGTGAAACGCCATTAAAAATAGTTGTCGGC +CCTGGATGTTATGCAACTGACCAATGATTAATTCACTTTTATCATCCCACGAAACAATAT +GTTGCATATGACCATGGGTAAAATTACTCTCAAATGTTAATGGTCTGAAACGAACAGGTT +TTCCAATAATATTATTTTGTACAACACCGAGTGTTTTTAAAGCTGTCTGATTAACAAACT +GAACCCGATTATCAGCATCAACCACTAACACGCCCTGATCCATATTATCGATCATGGTCG 
+CGAATATTTTACTGATGTTATCTCCTGGTCCCTGATCCTCCAGAAGTTTAGAAACAAAAA +TGGTGGATATATGGCGAACGTAATCGGAAAATTCGCGTAAATTATCACTGATATGTTCTT +GTTGCTCGTGGGTAACGGCAATCAAACTTATCACCCCAACACAACGATCCTGTAAAATGA +CAGGCGTACCCAGAAATGCTTTTTCGCGGCAATTTTCTTTACTATCGCAACCTTCACAAA +GGGGATCGAAGCGAGACTGTGTCACAACTTTTTCAGTTTTCGTTTCCAGGACGTGGCGGA +GCAGGCGTGAGTTGCCGCTCAACTGGCGGCCAAGAAACTTCCCATACGCGCCCGTTCCGG +CGACGCGACACAAGTTTTCATCAACGATCTCAACCTCAAGCTGCAAAACGCTGGCAAGCA +TTCTGGCAAAACGCTGAATTGTCGGTTGAATTTGCATCAATACTGACTGCGTAGTCGCAA +GCTCCATAGCTTTACCTTCCAGACTTACTTAAAAGTCGATCATTGAAGACGTTGATGGTT +CACAGATCATGATGATATTAACTCAGGCGAAATTGGCTTTGATAAAAACATAAGATTTTT +ATCACTTTCTAATAAAATTATGGAAGAGATATCACATTTCTATATCAATATGAGAATTAC +AGCGGCAAGTTTATCAAACTGAAGAGAGATAGCCTGCCTCTTTATCTTATTTCTGATACT +TAGCAGCAAATAAATAACGTGATAAAAAAAGCCAAACGTTTTCGTATTTTACAAACAACC +GGAAACTGGCATCAATATGTGATCAACCCCACACATTATCCGTCAAATTAGCCTTTCGCA +GCCGCGTGGATAATTCTGGCACACTTATTGTTAGTCCCAGGTATAGCTGTGAAAACACCA +ATCACTTTGGCACGTCACAGTGAAATAAACCACTTTGCCTGTCATTCCACTATCGGGACT +TTATGATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGC +ATGAAAAAGATTTTTTGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGG +ACGTTGCCGCCGCGTTAAAAGCACTGCGTGCTGAAAACATCTCAACCAAAGTCTTTAATA +GTGGATTAGGTATTTCCGTCTTCCGCGACAACTCCACCCGTACCCGCTTCTCTTATGCTT +CCGCGCTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAGGTAAATCACAAATCG +CTCACGGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGCTATCG +GTATTCGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGG +CACTTGATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGC +AATGCGATATTGACCACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACT +TTGGTTCGCTGGAAAACCTGAAAGGCAAAAAAATCGCCATGACCTGGGCCTACTCCCCAA +GCTATGGCAAACCGCTCTCTGTACCACAAGGCATCATAGGTCTGATGACCCGCTTCGGTA +TGGATGTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGGATGTCGTTGAAGTTG +CTAAAAACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGAAGAAG +CCTTCAAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAG +AGCGTACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGT +GTCTGGCACAGAACGCGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGA 
+CCCGTGATGGCGAAGCCCTGTACATGCACTGCCTGCCAGCTGATATCAGCGGCGTATCCT +GCAAAGAAGGTGAAGTGACTGAAGGCGTATTCGAAAAATACCGTATCGCTACCTACAAAG +AAGCCAGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCCGTAAATACGCCAAAC +CAGGTGCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAACCCCTCG +GGCCGATCAGCTGGTCGGCCCTCTATTTCCAGAGGCCAAAAGGATAGGATATGTCCGTTT +TCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACATCACCGCTTT +TTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCTGGTTATCACC +CAACACCGCTTTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAGAAAATTCTCG +TCAAAGACGAATCAAAACGATTCGGTCTGAACGCCTTCAAAATGCTCGGCGGTGCGTACG +CCATCGCTCAATTATTGTGTGAAAAATATCATCTTGATATCGAAACGCTGTCATTTGAGC +ACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGACTACCACCGACGGCAACCACG +GGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATTTACATGCCGA +AAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAGTGCATCGTCA +CGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAGCAGCACGGCT +GGGAAGTGGTACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACCTGGATCATGC +AAGGCTACGCAACACTGGCGGATGAAGCCGTCGAGCAAATGCGTGAAATGGGCGTAACCC +CGACACACGTTCTGCTACAAGCCGGTGTCGGTGCAATGGCCGGTGGTGTGCTGGGTTATC +TGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTATTGTTGAACCTGACAAAGCTG +ACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGTGATATGGCCA +CCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAAATCCTACGTA +ACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGTATGCGCGTGC +TGGGTAATCCGTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGCGCTGTCGGTT +TGGGCGTTCTCGCAGCGGTTCATTATCACCCGCAACGTCAAAGCCTGATGGAAAAACTGG +CGCTGAACAAAGATGCCGTGGTGCTGGTTATCAGCACTGAAGGCGACACCGACGTGAAGC +ACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGCACCTTAATCACCCTATTGGA +ACTGCTCCCTGCAAAACGGGGAGTAAAAAATCTGGAGAAAAATAATGGCTAAGAATATTC +CATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGACATGACTCGCTTCCTAC +GCGATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGCGTAGTACATCGTATTA +AAGAAGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGACCCAATGGGCAACGTTC +TCGGTTATATCGGCCACGGCCCGCGTCTGGTGGCAATGGACGCTCATATCGACACCGTCG +GCATTGGCAACATCAAAAACTGGGACTTCGATCCGTATGAAGGCATGGAAACCGACGAGC +TGATCGGTGGTCGCGGTACTTCCGACCAGGAAGGCGGCATGGCATCTATGGTTTATGCCG 
+GTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTGCTGGTTACCGGTACTG +TGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATTGAACAATCCGGCATTC +GCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTATACCGTGGTCAACGCG +GTCGTATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCACGGTTCGGCACCAGAAC +GTGGTGATAACGCCATTTTCAAAATGGGTCCAATTCTTGGCGAATTACAGGAACTGTCTC +AACGTCTGGGCTATGACGAATTCCTCGGCAAAGGTACGCTGACTGTTTCCGAAATTTTCT +TCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAGCTGCGCAGTTTCTATTGACCGCCGTC +TCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGTGCCCTGCCTGCAGTAC +AAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCGTCCTGGACTGGCCTGG +TTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAAGATCACTTCACCGTTA +AAGCACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCTGTCGTTGATAAGTGGA +CCTTCTCAACTAACGGCGTATCCATCATGGGTCGCCACGGCATTCCGGTCATCGGTTTTG +GCCCTGGTAAAGAACCGGAAGCGCACGCGCCAAACGAAAAAACCTGGAAATCTCACCTGG +TAACCTGTGCCGCTATGTACGCTGCAATCCCATTAAGCTGGCTGGCAACCGAATAATTAC +TCTTCACTTATTCCCCTCCGGTTCGCCGGAGGGTTTTTGGAGTTTGCTATGCGCGTATTG +ATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGATTTGCTGATTGAA +AGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCTTGCGAAGAAATT +GATGCCTCTGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACGCATTTCAATATT +GATGTCGGCATCGCGCGCAGTTGTGATGATTTTTTTACCGGTACCCGCGCTGCTGCGTGT +GGCGGTACAACAACCATTATTGACCATATGGGATTTGGCCCAAATGGCTGCCGGTTACGC +CATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAAAGCAGTCATCGACTACAGCTTT +CACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCGATGATGGTTGAG +GAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTCAACGATGATGAA +GTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACCGTACACCCGGAA +AATGACGCAGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGGTTAACCGCGCCG +CGTTATCATGCCTTGAGTCGACCTCTGGAATGCGAAGCGGAAGCCATCGCCCGCATGATT +AACCTGGCACAAATTGCCGGTAACGCCCCGCTCTATATCGTGCACCTGTCTAACGGCTTA +GGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCAGCCAGTCTGGGTTGAAACCTGC +CCACAATATCTCCTGTTGGACGAACGCAGTTACGATACAGAAGATGGCATGAAGTTCATT +CTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGTGGCATCAGCGAT +GGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCTCAACGCCTGCAA +ATTTCTAAAGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTGGAGAACCGCATG 
+CAACTGCTGTTCTCCAGTGGCGTGATGACGGGACGTATCTCACCGGAGCGTTTTGTTGAG +TTAACCAGTGCAATGCCCGCCAGGCTGTTTGGCCTGTGGCCACAAAAAGGATTATTAGCG +CCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACGTCAGAGCCAACAAATTCAGCAT +CGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACCTGTCAGGGCGCG +ATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACCTTTACAGGCAAA +GCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTGCTCTAACCACTG +CCAGGGATCTATACACAATCAAGAATGATGAGTGAGGAAAAATGAGTAAGAAAATTGTTC +TCGCCCTGGGCGGGAATGCGCTGGGCGATGACCTGGCTGGGCAAATGAAAGCGGTAAAAA +TTACTTCTCAGGCAATTGTTGATTTAATTGCCCAGGGACATGAGGTCATCGTCACTCATG +GCAACGGGCCACAGGTGGGCATGATTAACCAGGCCTTTGAAGCTGCAGCAAAAACTGAAG +CGCACTCGCCAATGCTGCCGATGTCTGTCTGTGTTGCCTTAAGCCAGGGTTATATTGGTT +ACGATCTACAAAACGCCTTAAGAGAAGAACTGCTTTCTCGTGGCATTAATAAACCTGTAG +CAACGCTGGTTACCCAGGTCGAAGTCGATGCTAACGATCCGGCATTCCTCACCCCGACCA +AGCCGATCGGTTCGTTCTTTACCGAGCAAGAAGCAGAGCTACTGACAAAACAGGGTTACA +CTCTGAAAGAAGATGCGGGTCGCGGCTATCGCCGTGTCGTTGCTTCGCCAAAACCGGTTG +ATATCATTGAAAAAGAAACGGTTAAAGCTCTGGTAGATGCCGGACAGGTGGTGATCACCG +TTGGCGGTGGTGGTATCCCTGTTATTCGTGAAGGTAACCATCTGCGTGGTGCCAGCGCGG +TTATCGATAAAGACTGGGCCAGCGCCCGTTTAGCAGAAATGATTGATGCCGATATGCTGA +TCATTCTGACTGCGGTAGAAAAAGTGGCCATTAACTTCGGAAAAGAGAATGAACAGTGGC +TCGATCGCCTGTCGTTAAGTGATGCTGAACGCTTTATCGAAGAAGGTCATTTTGCGAAAG +GTTCTATGCTGCCTAAAGTGGAAGCTGCCGCCTCGTTTGCTCGCTCTCGCGCAGGTCGTG +AAGCACTGATTA +>my_contig +CCGTATTGAGCAAAGCGAAAGAGGGGATTGAAGGCAAAACCGGAACGGTGATTTGTCAGT +AATTTAAAGGCCGGATGGGTAATACCATCCGGCCATTTTCATTTAAGCCACTTCCAGCAC +TTCTTTTGTCGCTTTAACGCCCTGATGCATCAACATCATTAACGCCTCAAGTACGCCGCC +GCCAATCGCCCGGGCTTTATCAGAAACGCTGGTGAAATCAGCCGTTTCACCACGAGGATC +GATATCACCAATTTTAAAACCACCGACCACGGCCAGTCCGTCGTTCAACAAGCCACGCAC +CATCCCCGTCAACGGTGCTTTAATTTCATGCTCACCAATCCAGGCAATGACATCGCCCTC +TTTCACCAGATCGCCTAATTTCACGTTGGATCGCATAATGCCTGCAGCAGGAGCGCGGAT +CACTCGTCGGGTGGTATGCCCCATAATATTGCCGGGAACACCGGTATTCTCCTGCGCACA +ACCTGAGTAAATCACCTGACCGAGCCAGTGCCCGCGATTTGTTTCAATTACCGCATGACA +ATCCTTCCCTGCAGTAAAGCCCGGCCCAAGCGCGATTGTTACTGGTGCCATATCTGCCCG 
+CGTTCCCAAATTCTGTTTCGCCAGAATAGCGTCCACCACGCAAAGCGGTTTCAGTTCATC +AAGCAATGAACAGGTGGGATCTACCATCACAGGGATAAATCCGCGTTCGGTAAGTTTCAT +CGCTTCCGCAGAGCTGGTTGCCAGGCGGGCGGTGACGCCTTCGACCGTCATTTCGCCATC +GAACACGGCCTGGGCAAACGCCACGGTACAACGAATCACTGTCGGTTTTTCCACTTCCAA +CATGATCACTTTAAAACCCGCATGATACAGACGTAGCGCTACACCACTGGCGATATCCCC +CGCACCGCGAATCACCACCAGCTGGTGTCCGGAAGGATGAGAAGGCTTCATCATCAGCCC +ACCCGGCGCGTTATTTTTCACCTGTAATATTTCTGCCAGCACGCTGATGGCGATCTCTTG +CGGCGTTTCCGCACCTATATTGTAACCAACGGGCGCATGTAAACGGGCAATATGTTCTTC +AGCCACGCCTTTCTCACGCAATTGGCGCAGGAAAAGCTGAACCTTGCGGCGACTTGCCAG +CAACCCCAGCCATGCAATGGGTTGTTCAATGAGTTTGTCGAGGGCTTCACGATCCTGATT +ATTCGTGGCAATCAGGACAAAATTATCAGGGCGAATATCCAGTGCTTCCACTGCCGCACC +AAACGACTCAGCATGGAGAAGCGTGGTTGATGGTGGGAATAGTTCAGGATTGAGGCTTTC +GCGATAAATATCAGCAACGGCGATATCAAATCCTAATAGCGCCGCACTCTGGGCTATCGC +CCGGTTGACATGCCCCGCACCAATCAACACCAGACGTGGACGCATACCATGGACGCTGAT +AAATACTGACATTGCACCTCCACAATCTGACCCGACAGCATCCGCACCGTTACGAGCCAT +ACGTCCATGGAATAATCGCGGCTTACGTTCCTGCAATGCCTGAAGCGACTCTTCAATCAC +CTTCCGTTCAACCATTCCGCCACCAATTGTACCGACGATAGAACCATCGGCGCGCACTAA +CATTTGTGCAGAATGGCGGGGGGTTGAGCCTCGGCTATCAACAATTTGCGCCATCGCAAA +CGGACAATTTTGCTCTTCGAGTTTTGCAGCCTCTGTGAAAATATTCATACCAACCTCAAT +GGATATCCTTTCAGTAACCCGGAATACCCGGGCCGCTAATTCACAAATCTGCGCGCGATT +GCAGGATGTTCTTGTATATCGCCCAGCCAGATTGCCTCTACGTTGTGTTGTTGCAGCGGT +TGAAGGAGCTCGCTTTGCGCAATCGCATTCTCACATTGAGAAAAACGGTTAATGAACCAG +ACTCGCCGACAACCTTGTGGTACGTTTTTAAACGCCCCCTGAGGGTGGCGAACCAGCGCA +ACGAGATCGCTCAGTTGCAAGGGTGCAGCAGGTGTTAACCCAGTAATATCAGCAAACTGC +GACCAGCGATGGACATTTTCTGTGCTCACTTTCGCACCCAAAATATGTCCTCCCATCACA +GCAATCACGCAGCAACTGCTTTTAGGTATGCAAGGTTCGTGCTCATCAGGCGCTTTTAAC +GGCATTCCACGCGAGCCATCTGCCTCAATGAGAATTACGTCACACTCTGGTCGTTGTACC +AGTGCATCAATCGCTTCTGGCGTAAATCCCTGCACTTTTCCCTGGTTCGCTTTCCAGCAG +TGAAAACAAAATGAAATGGGGGATATAAAAGACGCATGAGGAAGCATGGCGGGATCACGA +CAGAAAACCACGGGCCAGTGAGATGTTGGCATAAACATATGTGTCGTCGTAGTGATTAAT +ACACGCCTGCCACTCGCCTGGAACAGTTCTGCCAGCCAAAAAAGCAAGCTGGTTTTCCCC +CCAGCACCAACAATAGAAATCACAGTGGGACGTTTCTGCGCGCCTAAATCAATGAATAAT 
+GCCGATGGGTCAATTATACTTTTCACGCGTCTTTATGGACCTCTCTGGGATAAATTACCC +TCAACGTAATCCATCAGGAAGTAACGCAATTATCAGGCGTTATTAGCTCCTGTAAATAAT +GGAATCACTATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATG +GGGCAATGGAAAATGATGTTACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAA +AATGCGTTGCAGTTTTGTAGCCGAATTATTTTAGTCACCGGCTATCGTGGTAATGAACTG +CACGAACGTTATGCGAACCAGAGCAATATCACTATTATCCACAACCCAGATTATGCGCAG +GGTTTACTGACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAACATTGTTTTCTC +ACCCACGGAGATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACGA +AATGATGGCGCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCA +AAACCATGCCTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTC +CTTATGGGAGAACATTATTCCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGAT +ACTCCGGACGACTTTATTACAGCGAAGAAAAGGTATACTGAAATTTAGAAAACGTAGTTA +AACGATTGCGTTCAAATATCTAATCCCTCCAGCACTCTTTATCATAATGATAAGGAATCA +CTGATTTTGAGAAAAGAGAAAAAGTGATAAATGGGCTGGCAATAATAATTTTCAGGAGTG +ATTTTAATTCTCATTTGGCACCTGTGAGTTCATTCACAAAAAGCCATTAAGTTTCGAGCC +GCCTCACATTTTTTTATATTTCCCGCCAAACCTGGCAAGAGTGGTGCGATTGTTGCTCTA +TCCCCCTAAACCACCGGATTTCTCAACACCGGTCACTCAATGATATCTGTATAAGCTAAG +GAGAGGGTTATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATA +TTTGATGAATACCAACAACAACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCA +CCCGTAAAAGGTAAAACTGTTAGCGTCTTCGGTGAAACCTGTGCCACTCCCGTCGGCCCT +GCCGCTGGCCCGCACACGCAACTTGCGCAAAACATCGTCACCTCCTGGCTGACTGGCGGA +CGCTTCATCGAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGGAAAAGCCCTGT +ATCGATGCCGAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAAA +GCCTGGGATGAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAG +CCTTCTGATTCCGGTAAATCGTTCATCTTTAATATGAGCGTCGGTTACAACCTCGAAGGT +ATTAAGCAACCGCCGATGCAGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCG +AAATTCGCTCAATACCGCGATGCACTTAATAAGCTACTCCAGAATGAGGCATTTTTAGCC +CGCCACGGATTGCAGGAAAAACGCGAAAGCTTGCAAGCCTTACCCGCTCGCATCCCCACC +AGCATGGTACAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGCATGAAATCGAA +GCCATTTGCCGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCCG +ACCTTACTGGGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATC +GGCTTAAAAGAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTG 
+GAACGCCTGATGGCACTGGCAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAAC +ACTCTCGGCACCATTAATAACAAAGGCGCACTGCCTGGTGAAGAGATGTATATGTCAGGC +CGTGCGCTGTTCCCGCTCTCCATCAACGTTGCAGCAGTTCTCTCTCGCGCCTTTGACGGC +AAACTGCCCATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCGATATTTTTGAT +ACTGGTATTCGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCGC +TTAAGTGCCTGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGAC +GTCGAACGACTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACAC +TGGAAGCCAGAAGAGCGTATTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTT +GCCCCCTGTGTTACTGCCTGCGCTATCAAGCAAGATATTCCGGAATACATCCGTCTGCTT +GGCGAACACCGCTATGCCGACGCGCTGGAACTCATCTATCAACGCAACGCCCTGCCCGCC +ATTACCGGTCATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCCTGGATTACGAC +AGTGCGCTGAATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATAT +AAGCAACGCTGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGT +GCAGGTCCGGCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACG +CTGTTTGAACGCGAAGCCAATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGT +ATTCCTGCAGAGTTAATTCAGCACGATATCGATTTTGTTGCCGATCACGGCGTGAAATTT +GAGTACGGTTGCTCACCCGATTTGACCGTTGAACAGTTAAAAAATCAGGGCTTCCACTAT +GTTCTGATTGCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGGGCGACAACCAA +AATGTCTGGAAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCTG +GGCAAACATGTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCG +TTACGCGTTCCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATG +CCAGCATGGCGCGAAGAGTATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTG +AATAATCCGGAACGTTTCGATGCTGATGGCACCTTAACCTTGCGCGTTATGTCGCTTGGC +GAACCTGATGAGAAAGGTCGTCGCCGTCCGGTTGAAACCAACGAAACAGTAACGCTGCAT +GTAGACAGCCTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCCTGAATGCAATG +GGCGTGCCGCTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCTG +ACTGACGTCTTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTC +GGAACCGCGCGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAG +AACGATAAATACTGGAATAACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATC +TCTGTCACTCTGGTGAACAGTGACGATCGTGATGCGTTTGTCGCGCAGGAAGCCGCTCGC +TGCCTTGAATGTAACTACGTTTGCAGCAAGTGTGTGGATGTCTGCCCGAACCGCGCCAAC +GTATCCATTGCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACCTCGACGCTTAC 
+TGTAACGAATGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGAC +AAAATCACCGTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTT +GTGGAAGATTGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGAC +AGCGAAGGTCAGTTCAACAACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGC +CATGTCCACCAGCATCATCATTATCTGCTGGGCCGCGTGGAGGTGTAATCATGTTGATTC +TGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGCGTTGATATCG +CCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGCTATCCCGATG +CCAGCTACAAAGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGCTCGCATAACC +ATTTTTACTCGGGGCTTTCCCGCGGAATTATGGCAAACATCGCCCCCTGCCCGGATTTCA +TCTCAACGCTGAAAAATCTCTGGTGGCGGCTCGATCGCGCCCTTGATGAAGAGTCGCTCT +ATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAGCGGATGTACATCGGTTATCG +ATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGCGACGCATTTT +TAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAACAGCGGCATCA +AAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATTGATGAGGCGA +AGAAAGCAGCAACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCACGCGCCGTTTA +CCGTACCGGATGCCGGTCTGGAGATGCTGTGTGAAGCCGTGAAAAGCACAGGTCGTGGTT +TGCATATTCACGCTGCGGAAGACCTTTACGACGTTTCCTACAGTCACCATTGGTACGGCA +AAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGACAGCAAAACGCTGGTCGCTC +ATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGATGCGTTCCTGG +TGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCACCTTAGCGACA +TCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAAGAGATGAAAT +TTGCCTTCTTTAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGTTTTGCCAAAG +CACTGGCTAACGGCAACGAACTGATGAGCCGCAACTTTGGCGCGAAATTTGGGCTTCTGG +AAGCCGGTTACAAAGCCGATTTAACCATTTGCGATTACAACTCGCCGACGCCGCTGCTGG +CAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTCAGGCAGCGTTCACAGCGTGA +TGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGCGATTCCATTT +ATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCGCTGGCATAAA +TAACAGCTCCCCTCTTCTTTCAGAGAAGAGGGGAAATTAAGGAAAGACGATGATTGAACA +ATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGCTACCAGGATGA +AGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGTACCGATAAAAA +GATTGCCATTTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGATAACGGTGCACT +ACGAATTGGCGCAATGTCTCGCTTGCAGCCACTGCGTGATGCGCGATTTATTCCTGCAGC 
+ACTGCGTGAAGCCCTCGGTTTTGTTTACTCACGCCATGTTCGTAATCAGTCGACCATTGG +TGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCTTCCCGTCCTGCTGGCACTGGA +TGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTACCTGGCCTGCCC +ATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACCTGTGCGACTCG +CAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTTGCAATAACAGA +CCACGACGGTATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTGCGTCTGCACGA +TGTCGAAACTCAAAATCTGGAAGGCAATGCACTTGAACAGGCTGTCGCCAACGCCATTTT +CCCGCAGGAAGATTTGCGGGGCAGCGTGGCCTATAAACGCTATATCACGGGAGTTCTGGT +AGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGAAGCCGTATGATCATCCACTTT +ACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAAAACGTGCAAAAGCTG +TTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGTTTTGGGTTTGCCGGT +TCTGACGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTGCTTATCGCCGCACAG +TTAGAGAAGGCAGATATTCGTACCGCAGAATCTCTGGGCAAATGGAATGAGTTAAGTCTG +GTTCAACAGGCCATGGTTGATGTTGGCGTGGTGCAGTCTGGTTATAACGATCCAGCTGCG +GCTCTGATTATCACCGATCTTCTCGATCGCATCGACGCACCTACCCGCGAAGAGATCGAC +GACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAATACTATCAGGTCATT +GAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGATATCGCTCCGACTTTC +CGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGATGCCGCGAAAATGGTG +CAGGCGAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCCTGCGTCATTAAAATG +TTACGTAGCCCACACGCTCACGCACTGATTACTCATCTGGATGTCAGCAAAGCTGAAGCC +TTACCGGGCGTCGTTCACGTTATTACTCACCTGAATTGCCCGGATATTTACTATACCCCG +GGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGACCGCCGAATGTTCGGCAAGAAAATG +CGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAAGACATTGCGCTCGAA +GCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTAATGTCGATTGACGAG +GCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTGTATGTTGCTGGTGCG +CCAGATACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGCGAGCATATGATCATC +AACTTCCCGATCGGTTCTCGCCCACGCAAAAATATCGCTGCCAGTATTCATGGTCATATT +GGCGATATGGACAAAGGCTTTGCCGATGCCGATGTGATCATTGAGCGAACCTATAACTCA +ACGCAGGCGCAGCAGTGCCCGACTGAAACACATATCTGCTTTACCCGTATGGACGGCGAT +CGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGCCGCCAGGTCGCGCGC +CTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGTGTAGGCGGCGGTTTT +GGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCAACCTGCGTGACCGGG 
+CGTCCGGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCTAACACCTCTCGTCAC +GTCGCGAAAGTCACCGTCAAACTGGGCGCGAAAAAAGATGGTCGCCTGACGGCAGTGAAG +ATGGATTTCCGCGCCAACACGGGTCCTTACGGTAACCACTCACTCACCGTACCGTGTAAC +GGACCGGCGCTGTCGCTGCCGTTATATCCATGCGATAACGTCGATTTTCAGGTCACCACC +TACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGCGCGCCGAAAGGTAAC +TTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAGATCGACCAACTGGAA +ATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATTCTCGGTGCGATTGGT +GAAGGTAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCACTGGAAGAGATCCTG +CGTCAGGGTCGCGAGATGATCCAATGGTCTTCACCAAAACCACAAAACGGTGACTGGCAC +ATCGGTCGTGGCGTCGCCATTATCATGCAGAAATCGGGTATCCCGGATATCGATCAGGCT +AACTGCATGATCAAACTGGAATCAGACGGTACCTTTATCGTTCATTCTGGCGGTGCGGAT +ATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAAGTGCTGCACTGCCCC +CCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTGTTTGATAAAGGCGCA +TATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTGGCAGCGGAAAATCTG +CGGGAGAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCAGTGGCAGATGTTCAA +CTAGCAACGCCGGGCGTCGTTCGCGGCAAGAAAGGCGAAGTTAGTTTCGGAGAGATAGCC +CATAAAGGCGAAACCGGCACCGGCTTTGGTTCACTGGTGGGAACTGGCAGTTATATCACG +CCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGCTGAAGTTGCCGTCAACACGCGTACG +GGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGTACACCGGTCAATCCA +GAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATCGGCCACAGTATGAGC +GAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGATTTACGCAGTTACGGC +GCACCGAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTGGTGCCGAGCGACGAT +AAAGTCGGCCCATTCGGGGCGAAATCGATCTCGGAAATCGGTGTAAATGGCGCCGCTCCG +GCGATTGCTACCGCAATTCACGATGCCTGCGGCATCTGGTTACGCGAATGGCATTTCACA +CCGGAGAAAATACTCACCGCGCTGGAAAAAATATAAGTAATAAATGGCCGCTTCGGCGGC +CTGTTTCTCTGTTTGAACGATGACTAAATAGTGACTGCGAAAATGAGATAAGCCGTTCTC +AAGGCGTCCTGCGCCCCAAATTCGTGGGAATTTATTTTACTAATTCAGATGATCAAATTT +ACTTTAAAAGGAGTGAAGGGATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTG +AACTGGAGGATCGCCCTCCCTTTCATCAGGCTCTCGTAGGTGCCATTACCCATCTGTTGG +CAATTTTCGTTCCGATGGTAACCCCCGCGTTAATCGTGGGTGCGGCCTTACAGCTTTCCG +CTGAAACAACTGCCTATCTTGTTTCTATGGCGATGATCGCCTCTGGTATTGGTACCTGGT +TACAAGTAAACCGCTACGGCATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATT 
+TTTCATTTGTTACGGTCATGATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACG +AAGAGTTAATCATGTCGTCGCTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCG +GCTCTTCTTTTATCCTGCCCTATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTG +TGGTGCTGATGATCGGCTTAAGCCTGATTAAAGTTGGCATTATTGATTTTGGCGGTGGTT +TTGCAGCTAAAAGCAGCGGTACGTTCGGCAATTACGAGCATCTCGGCGTTGGCTTATTGG +TTTTGATTGTGGTGATCGGCTTTAACTGCTGCAGCAGTCCGTTGCTACGCATGGGTGGGA +TCGCCATTGGGCTATGTGTCGGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCA +GCAGTGTGCGCAATTTGCCGTTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTT +TTAGCTTCCATCAGTTCCTGGTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTG +TCGGCGATATCACCGCCACGGCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATC +AGTCCCGACTGAAAGGCGGCGTGCTGGCAGATGGTCTGGTTTCTGTTATCGCCTCCGCTG +TCGGTTCATTACCATTAACCACGTTTGCGCAAAATAATGGGGTTATTCAGATGACTGGCG +TCGCTTCACGTTATGTCGGGCGAACCATCGCGGTAATGCTGGTTATCCTCGGCTTATTTC +CGATGATTGGCGGCTTCTTCACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGT +TGATGTTTTCCATGATTGCCATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGC +GCCGAGAAACACTTATTGTCGCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATC +CCGAAATTTTTAAAATATTGCCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTG +CTGGCGGGTTAACTGCGATTTTATTAAATATTATCCTCCCTGGTGGCTACCGACAGGAAA +ACGTTCTGCCTGGTATTACCTCAGCGGAAGAGATGGATTAACAGTAAAGGAGTCAATGAT +GTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACGGT +CGATAACCCGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTCAT +TAAACAGGGAAAAGTGGAATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCTGA +CACCATTCGCGTGCGCGACTATCGCGGCAAACTGATAGTACCGGGCTTTGTCGATACACA +TATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATGGTGAACAATTGCTGGAGTGGTT +GAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTACGCCCGCGAGAT +GTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTTGG +CACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATGCG +TATGATTGCCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACTGC +CGAAAGCAGCTATCACCAAAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGTCT +GTTGTATGCGATTACGCCACGCTTCGCCCCTACCTCATCTCCTGAACAGATGGCGATGGC +GCAACGCCTGAAAGAAGAATATCCGGATACATGGGTACATACCCATCTCTGTGAAAACAA +AGATGAAATTGCCTGGGTGAAATTGCTTTATCCTGACCATGATGGTTATCTTGATGTTTA 
+CCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAAGA +AAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCCAA +CCTTTACCTCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAAGT +GGGCATGGGAACAGATATCGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAACGA +AGCCTACAAGGTATTGCAATTACAAGGCTATCGCCTCTCGGCATATGAAGCGTTTTACCT +GGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACGATTTGATTGGCAACTTTTTACC +TGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCTACAGCAGCTGCG +CTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGATGA +CCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAATAATA +AAACTTTAACATCCTCGTGAGGACATCATTATGTCTGGAGACATCCTACAAACACCGGAC +GCACCAAAGCCACAGGGCGCGCTGGATAATTATTTTAAAATTACCGCTCGTGGCAGTACC +GTTCGTCAGGAAGTACTGGCTGGCTTAACGACCTTTCTGGCCATGGTTTATTCCGTTATC +GTCGTTCCGGGAATGCTGGGCAAAGCAGGTTTTCCTCCCGCAGCTGTGTTTGTTGCCACC +TGTCTGGTCGCGGGCTTCGGCTCGTTGCTGATGGGGTTATGGGCCAATTTGCCAATGGCG +ATTGGTTGCGCTATTTCCTTGACGGCGTTTACCGCATTCAGTCTGGTACTCGGGCAACAA +ATTAGCGTTCCTGTCGCACTGGGCGCAGTCTTTCTGATGGGCGTCATCTTCACCGCTATT +TCCGTAACCGGTGTGCGTACCTGGATCTTACGTAATTTGCCGATGGGGATCGCTCACGGT +ACAGGTATCGGTATCGGCCTGTTTCTGCTGCTGATTGCTGCTAACGGTGTGGGAATGGTT +ATCAAAAACCCGATTGAAGGCTTGCCAGTGGCGCTCGGTGCGTTTACCTCCTTCCCGGTG +ATGATGAGCTTACTGGGGCTGGCGGTCATCTTCGGTCTGGAAAAGTGCCGCGTACCCGGC +GGGATCTTGTTGGTGATTATTGCAATTTCGATCATCGGCTTAATCTTTGACCCAGCGGTG +AAGTACCACGGTCTGGTGGCAATGCCAAGCCTGACTGGCGAAGATGGTAAGTCTCTGATT +TTCAGCCTCGATATTATGGGCGCACTCCAGCCAACTGTACTTCCGAGTGTACTGGCATTG +GTGATGACCGCAGTGTTCGACGCCACTGGCACCATCCGTGCCGTCGCCGGTCAGGCGAAT +TTGTTGGATAAAGACAACCAGATCATCAACGGCGGCAAAGCCCTGACCAGTGACTCAGTA +AGTTCAATATTCTCCGGCCTGGTGGGCGCAGCGCCCGCGGCGGTTTATATCGAATCAGCG +GCAGGAACCGCCGCCGGGGGGAAAACCGGTTTAACCGCAACCGTGGTTGGTGTGTTGTTC +CTGATGATTCTGTTTTTATCACCGTTATCGTTTCTGATCCCCGGTTATGCCACAGCTCCC +GCACTGATGTACGTGGGTTTGCTGATGTTAAGCAACGTCTCGAAGCTGGATTTCAACGAT +TTTATTGACGCAATGGCTGGCCTGGTGTGTGCCGTGTTCATCGTTCTGACTTGTAATATC +GTTACCGGTATTATGCTGGGCTTTGTAACACTGGTGGTGGGTCGCGTCTTTGCGCGCGAA +TGGCAAAAGCTGAATATTGGTACGGTGATCATTACTGCCGCACTGGTCGCGTTTTACGCG 
+GGTGGTTGGGCAATCTAATAGATTCTCCGCGCCTTTCCGCGCGGAGATTTCTTTCAGAGA +GGATTCTCACTGCTGGCAGCAATACGCTGCTGGCGGATACGCCTGAGTTCTCTTTCAGTC +AGCAACTGCAGCGCCTGTGTCGGGCAAGATTCAACGCAGGCTGGCCCCTCTTCCCGCAGT +TCACAGAGATCGCATTTCACGATTTGTTGCCGGGGATCACCCGGCAATGACTGAATGGTG +ATCATCCCAAACGGGCACGCGCTAACGCAACTCTGACAGCCAATACAACGGGCAGAATTG +GCCTGCACCACCTGCTCGCCCATCGTCAGCGCCCCCACGGGGCAAGCGCCAACACAAGGG +GCGTTTTCACACTGATGGCACATCACCGGCGCACTGATGCTATCCAGCCGTTGTACCTTC +AGCCGGGGTAAAAAGATATCGGCATTCAACTCCTGTTCTGAAGGGTGAGCGACCACACAG +GCCACTTCACAAGTACGGCAGCCAATACAGTCAGCCGGATTAACGATAATTAACGATTTC +ATCACGATGCCTTCGTATCAAACAGAGTTAACATATCGCGCGCCGCCTGCCTTCCTGCGG +CCATTGCAGTGACAACCAGATCCGCGCCATGAACTGCATCACCACCAGCAAAGACTTTTT +TCAGATGCGTCTGGGTAGGTAAATACCCGACGTCGCCGGTTTGAATCAGGCCCCATTTAT +CGAGTTTAATTCCGCTGCCCTGCAACCACGGCATGGTATGTGCCTGGAAACCAAAGGCCA +TAATGAGAACATCGGCGGGCAATTCAAACTCTGAACCCGCAACCGGACGAGGACGACGGC +GACCATCCGGCCCCGGCTCACCCATAGCGGTACGAATCAGGCCCACCGCCGTTAAGCGTC +CATCTTCATCACAAGCGATATATTGCGGCTGAACATTGAACTGAAACTCAACACCTTCCT +CGCGGGCATTGACCACCTCTTTGCGCGAACCCGGCATACTGACTTCATCACGACGATACG +CACAGGTCACGCTGGCAGCATTAAGGCGGATGGAAGTCCGCAAACAATCCATTGTCGTAT +CGCCACCGCCCAATACCACGACTCGCTTCCCTTCCACATCCGTCAGCGGATACTCTGCAG +ACTCCGGCAATCCCATGAGCTGGCGGGTATGGGCGGTCAGGAACGGTAACGCCTGAATGA +CACCAGGCGCATCTTCATGCGGCAGATCTGCTCGCATCATCCCGTAAGTCCCCACGCCGA +GGAAAACAGCATCATATTCCGCCGTTAATTCGTTGAAAGAGATATCGCGGCCAATTTCAC +AGTTGAGATGGAAATCGATTCCCATTGCGGTGAATATCTCTCGCCGCTGGCTTAATACCG +TTTTATCGAGTTTGAAAGGAGGAATGCCAAAAGTCAGCATACCGCCAATTTCTGGATGGC +GATCAAAGACATCAACCTGAACTCCCGCGCGCGCCAGAATATCAGCACACCCTAATCCTG +CAGGTCCAGCGCCAATCACCGCCACTTTTTCGCTACGGGGAACAACTTTGCTGACATCGG +GACGCCAGCCCATCGCCAGCGCAGTATCGGTGATGTAGCGTTCCAGATTACCGATAGAGA +CTGCGCCAGAGTGATCTTTCAAAGTACATGCACCTTCACAAAGACGGTCCTGTGGACATA +CCCTGCCGCAGATTTCGGGTAAGGAACTGGTCTGGTGGCAAAGTTCTGCCGCTTCAATAA +TCTTTCCTTCCTGTACCAGACGGATGTAATCCGGAATAGCGTTATGCAGCGGACAATGCC +AGTTGCAGTTAGCTTTTTCGGCACAATAAACACAGCGGTCACTCTCATAAGTCGCTTGTT +GTGGATCCAGCCCGCAATAGATTTCGCCAAAGTGGGTTTTCCGTTCACTCGCTGAAATTT 
+TATCTGCGCCTTTACGCGAGTTAACGGGGAGCAACGCTGCACTGCGAGATGGCTGAGCGT +CTGATGACGCTTTTCCTGCTGCCGTTTTGCGCTGGCGGGCCACCTTTATCTGCTGCAACC +CTTTATCGTCCATCAGCCGTAACGCCTGTGTTGGGCAGACGTCAATACAGGCTTGCGTGC +CGGAACTGCGCTGGTTACAAAGGTCGCATTTCTGTGCAATCGTATCGACCATCTCAACGA +CGCCAAAGGGGCAAGCGATTGCGCATCTTTTACAACCAATACATTTTTGCTCGTCCAGTT +GTACGCTATCGGACTGGAAAGTCAGAGCATTAACCGGACAAGCCGTAACGCAAGGGGCAT +TGTTGCAGTGATGGCAGGCCACCGGATTCGCAGCCTGGCCTTTCCCTACAACGTGGATAC +GCGGTCGAAAGTCACTGTGACTCAGCGGCCAGTTTTCTTGATTATGTGCCACCGCACAGG +CAATTTCACAAGCATGGCAGCCTATACATTCCGCAGCTTCAGCAGCGATAAACTTATTCA +TTTGCATCCCTTTCATTTAATGAGTTATGTCTTCTCAAATTTCGCGATGCAATAAACGGG +CATATATTAGGTAGCATGACCGTTTTAATTATAATTTTGCAACTGAGTTCAAATTATTGC +CCCTCAATCTATGCCGCTTTCATTATTTCAACATTGCCGATCAAAAGAATGCTATCCAGA +TAAAAACGATTAAATGCGAGAGTGCGACATGCCAGAATGATTAATGAAATATCAATATGA +GAAAATTACAGATAATTCCATTGTCAGGTTCTCTTCTCATAATCGTGGTTTAACCACGAT +TATGTGATTGCCTCCGCAATTCCTGTCTCTAACTCCCCTTCCTCGCAAAAACTGGCACTC +CACGAGCATGTGTTTAGACAGTTTCATGAACATAAACGGTTGCTTTTTACTCTGGCGGGC +GAAAGGAGAAACACTGATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGA +CCGCCCAACTGATGAGGTTGACCGCATATTATCACCAGGAAAGCTGATCATACTCGGTCT +GCAACACGTCCTTGTCATGTACGCAGGTGCAGTCGCTGTTCCTCTTATGATTGGTGACCG +ACTCGGCCTATCAAAAGAAGCTATTGCGATGCTCATCAGCTCGGATCTCTTTTGCTGCGG +GATCGTCACATTATTGCAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGCCGGT +GATTATGTCGGTGACCTTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGA +TATCGGCCTGCTGGGGATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATT +AGCGCCACTTATCGGTCGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGAT +TACTTCTATCGGGCTTAGCATCATTCAGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGG +GAATCCGCAATATGGTAATCCCGTTTATTTAGGTATCTCCTTTGCCGTCTTAATTTTTAT +CTTGCTCATTACTCGCTATGCGAAAGGATTTATGTCCAACGTCGCCGTATTACTGGGGAT +TGTATTTGGCTTTTTACTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTACATGA +TGCTTCATGGTTTGCGATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGT +TTCCATTCTGACCATGACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTT +CCTGGCACTGGGTGAAATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTT +ACGCGTAGATGGGGTTGGGACAATGATTGGAGGCACGTTTAACAGCTTCCCACATACGTC 
+ATTTTCGCAGAACGTCGGGCTGGTCAGCGTGACGCGCGTCCACAGCCGCTGGGTGTGCAT +TGCTTCCGGTATCATTTTGATCCTGTTCGGCATGGTGCCCAAAATGGCGGTGCTGGTGGC +CTCGATTCCGCAATTTGTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTACTGGC +GACAGGGATTCGAATTCTGTCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATAT +TGTGGCGATCAGTCTCGGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAA +GTTACCGGCCGTACTGCAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGC +CGTTGTGCTGAACGTCTTCTTTAATGGCTACCAGCATCATGCTGACCTGGTGAAGGAATC +CGTCTCTGATAAAGATTTAAAAGTCAGGACAGTACGTATGTGGCTTCTGATGCGCAAGCT +GAAGAAAAATGAGCATGGAGAATAATATGAATCTTTTAATGCGCGCTATATTCAGTCTGC +TGTTGCTTTTTACTCTCTCTATTCCTGTCATTTCTGATTGTGTTGCAATGGCCATTGAAA +GTCGCTTCAAATATATGATGCTGCTTTTTTAAATGGTTTTTACCTGTCGACATCCGCTCA +AAACGGGCGGTTGTCGATAAACGCTCACTTGGTTAATCATTTCACTCTTCTATTATCTAT +AATGATGAGTGATCAGAATTACATGTGAGAAATTATGCAAACGGAACACGTCATTTTATT +GAATGCACAGGGAGTTCCCACGGGTACGCTGGAAAAGTATGCCGCACACACGGCAGACAC +CCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTTAATGCCAAAGGGCAATTATTAGTTAC +CCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGCGTGTGGACTAACTCGGTTTGTGGGCA +CCCACAACCGGGAGAAAGCAACGAAGAGGCGGTGATCCGCCGTTGCCGTTATGAGCTTGG +CGTAGAAATTACGCCTCCTGAATCTATCTATCCTGACTTTCGCTACCGCGCCACCGATCC +GAATGGCATTGTGGAAAATGAAGTGTGTCCGGTATTTGCCGCACGCACGACCAGTGCGTT +ACAGATCAACGATGATGAAGTGATGGATTATCAATGGTGTGATTTAGCAGCGGTTTTACG +CGGTATTGATGCTACGCCGTGGGCGTTCAGTCCGTGGATGGTGATGCAGGCGACAAATCG +CGAAGCCAGAAAACGATTATCTGCATTTACCCAGCTTAAATAAAAAACCCCGACGGTTGC +CGGGGTTGTGAGCATAACGTAATGCTTATTTTACCGGACGCATCGCCGGGAACAGAATAA +CGTCGCGGATGGTATGGCTGTTGGTGAACAGCATTACCATACGGTCGATACCAATTCCCA +GACCGGCTGTCGGTGGTAAGCCATGTTCCAGTGCGGTGACATAATCTTCGTCGTAGAACA +TCGCTTCGTCGTCACCTGCATCTTTCGCGGCAACCTGATCCAGGAAGCGCTGCGCCTGAT +CTTCCGCGTCATTCAGCTCGCTAAAGCCGTTACCGATTTCACGCCCACCAATGAAGAACT +CAAAGCGGTCTGTGATTTCCGGGTTAACGTCGTTACGACGCGCCAGAGGAGAAACTTCTG +CCGGATATTCAGTAATGAAGGTCGGCTGGATCAGATGTGCTTCTGCCACTTCTTCGAAGA +TCTCGGTAACGATACGGCCCAGACCCCAGCTCTTCTCAACGTGGATGCCGATAGATTCAG +CAATCGCTTTCGCAGAGTCGAAGTTGTCCAGATCTGCCATGTCGGTTTCCGGGCGATATT +TCTTGATCGCTTCACGCATGGTCAGTTTTTCGAACGGCTTACCGAAGTCCAGCGTTACGT 
+CGCCGTAGGTCACTTCCGTCTTACCGAGAATATCCTGTGCCAGAGTACGGAACAGCGATT +CGGTCAGCTCGATCAGATCTTTGTAATCTGCGTAAGCCATATAGAGTTCCATCATGGTGA +ACTCTGGGTTATGACGTACGGAAATACCTTCGTTACGGAAGTTACGGTTGATTTCGAATA +CACGCTCGAAGCCACCGACCACCAGACGCTTGAGGTACAGTTCCGGCGCGATACGCAGGT +ACATGTCGAGATCCAGCGCGTTATGGTGGGTGATGAACGGACGCGCAGCGGCACCGCCAG +GGATCACCTGCATCATCGGCGTTTCAACTTCCATAAAGCCGCGATTCACCATGAACTGGC +GAATACCAGAGAGGATCTGCGAGCGCACTTTAAAGGTGTTGCGGGATTCATCGTTAGAGA +TGAGATCCAGATAACGCTGACGATAGCGCGCTTCCTGATCCTGCAAGCCGTGGAATTTAT +CCGGCAGCGGACGCAGTGCTTTGGTCAGCAGACGCAGCTCGGTACAGTGGATAGACAGTT +CGCCGGTTTTGGTTTTGAACAGTTTACCTTTCGCGCCGAGGATATCGCCGAGGTCCCATT +TTTTGAACTGCTCGTTGTAAACGCCTTCCGGCAGATCGTCACGGGCAACGTACAACTGAA +TGCGACCGCCAACGTCCTGCAGGGTAACGAAAGACGCTTTACCCATAATACGACGGGTCA +TCATGCGGCCAGCAACGGCGACTTCGATGTTCAGCGCTTCCAGTTCTTCGTTCTCTTTAC +CGTCGAATTCTGCGTGCAATTGGTCAGAGGTATGATCGCGACGGAAATCGTTCGGGAAGG +CAATCCCCTGCTCACGCAGGTTCGCCAGCTTCTCACGACGCGTTTTCAGTTCATTGTTAA +GATCGACTACCGCGTCAGCGCCCTGTGCGTGTTGTTCAGACATGTTGGTTCCTCATAACC +CTGCTTTCAAACTTGCTTCGATAAATTGATCCAGGCTGCCGTCCAGCACGGCCTGCGTGT +TGCGGGTTTCTACCCCGGTACGCAGATCTTTAATGCGGGAGTCATCAAGGACATAAGAAC +GAATCTGGCTGCCCCAGCCGATGTCGGATTTGTTATCTTCCATCGCCTGTTTCTCGGCAT +TTTTCTTCTGCATCTCCAGTTCATAAAGCTTCGCTTTCATCTGCTTCATGGCCTGGTCTT +TGTTCTTGTGCTGGGAACGGTCGTTCTGGCATTGGGTCACGATCCCGGTTGGGATGTGAG +TAATACGCACCGCAGATTCGGTACGGTTAACGTGCTGACCGCCCGCGCCGGATGCGCGAT +AAACGTCGATGCGCAGATCCGCCGGATTGATTTCGATATCGATATCATCATCAACTTCCG +GGTAAACAAACGCGGAGCTGAACGACGTGTGGCGACGACCACCGGAGTCAAACGGGCTCT +TACGCACCAGGCGGTGAACGCCGGTTTCTGTACGCAGCCAGCCATAAGCGTAATCGCCGG +AGATTTTGATCGTCACGGATTTAATACCCGCCACTTCACCTTCCGACTCTTCGATGATTT +CAGTTTTGAAACCACGCGATTCAGCCCAGCGCAGATACATACGCTCAAGCATGCTCGCCC +AGTCCTGTGCTTCCGTACCGCCAGACCCCGCCTGAATATCGAGGTAGCAGTCGGCGCTGT +CATATTCGCCAGAGAACATACGGCGGAACTCAAGCTGCGCCAGTTTTTCTTCCAGGGCGT +CGAGTTCAGCAACGGCTTCGTTAAAGGTTTCTTCGTCGTCAGCTTCTACAGCCAGTTCCA +GCAGACCAGAAACATCTTCCAGCCCCTGTTTCATTTGGTCGAGGGTGTCGACAACGGCTT +CGAGGGAGGAACGCTCTTTACCCAGCGCCTGTGCGCGTTCGGGTTCGTTCCAGACATCCG 
+GCTGTTCCAGCTCGGCGTTTACTTCTTCCAGACGCTCTTTCTTGGCGTCATAGTCAAAGA +TACCCCCTAAGAACGTCGGAGCGTTCCGTGAGGTCCTGAATGCGATTATTTACCGGATTA +ATTTCAAACATGGTCTGATTTCTTTTATTGAGCTAGTCAAAATGCGGTGATTAGAGCGGG +ATTGTACCCAATCCACGCTCTTTTTTATAGAGAAGATGACGCTAAATTGGCCAGATATTG +TCGATGATAATTTGCAGGCTGCGGTTGCCGCGAAACTCGTTGATATCGAGCTTGTAAGCC +AGTTGCACTTCGCGCACGCCGTTATCCGGCCAGAGGGCGGTATCGACATTAAAAGCAATA +CCATCCAGCAGCGGACCGCCGCCGACCGGCTCGACCATGACTTTCAAATGACGCTCGCCC +ACCAGCCGCTGTTGCAGCAGACGGAAATGACCGTCAAACAACGGTTCCGGGAACATTTGT +CCCCACGGGCCAGCATCACGCAGCAGTTGCGCCACTTCCATGGTCATCTCTGCCGCACTT +AATGGGCCGTCTGATACCACTTCCCCTTGCAATAAAGAAGGATCTAACCACTCGGTAACC +AGTTCGCCAAAGCGTTGCTGAAAGAGTTCGAATTTCTCCTCTTCCAGCGACAAACCCGCC +GCCATCGCATGGCCGCCAAACTTGAGCATCATGCCGGGGTAAAGCGTGTCTAGCCGCTCC +AGCGCATCGCGCATATGCAGCCCCTGAATGGAGCGACCGGAACCTTTCAGCGTACCGTCG +CCCGCAGGCGCAAAGGCGATAACCGGACGGTGAAAACGCTCTTTGATACGCGATGCCAGA +ATGCCAACAACGCCCTGATGCCATTCAGGGTGATACATTGCCAGCCCACCTGGCAGCGTG +TCGCGGCTACGTTCCAGCTTCTCGCACAGAGTGAGCGCTTCAACCTGCATTCCCTGTTCG +ATCTCTTTACGTGTTTGGTTTAGTGCATCGAGTTCATTCGCCAGCACACGCGCTTCGCCA +ATGTTGTCACACAACAACAGCGCCACGCCAACGGACATATCGTCCAGTCGCCCGGCAGCA +TTGAGACGTGGCCCCAGCGCAAAACCTAAATCGCTGGCGGCGAGTTTTTGTGGATCGCGA +TTGGCCACTTCCAGCAGCGCTTTAATCCCCGGACGGCACTTTCCGGCACGGATGCGACTC +ATCCCCTGCCAGGTCAGAATGCGATTATTAGCGTCCAGCGGCACGACGTCCGCCACTGTC +CCCAACGCTACCAGATCCAGCAGTTCTGCCAGATTAGGAATTGCGATGCCGCGCTCATCA +AACCAGCCCTGATCGCGCAAAAAGGTGCGCAGCGCCAGCATCAGATAAAACGCCACACCC +ACGCCTGCCAGTGATTTCGACGGGAAATTACAGTCGCGCAAGTTAGGGTTAATGATCGCT +TCCGCTGCGGGTAATGTGTCGCCTGGCAAATGGTGATCGGTAACAATAACCGGAATGCCC +AACGAACGAGCGTGTTCAACCCCCGCATGGGAGGAAATACCGTTATCCACCGTGACAATT +AACTGCGCGCCACGGGCATGAGCCTGATCGACTACTTCCGGGCTTAAGCCGTAACCGTCT +TCGAAACGGTTTGGAACCAGGTAGTCGATATTGCTGCAACCAAGCGAGCGCATCGCCAGC +ACGCTTAGAGCCGTGCTGGTCGCACCGTCGGCGTCGAAATCACCGACCACAATAATCCGC +GTTCCTTCGCGAAAAGCGTTGTAAAGGATCTCAACGGCCTTTTCGACGCCGCTCAGTTGC +TGCCAGGGCAGCATGCCTTTAACACTGCGTTCCAGTTCCTGCGCGCTACGCACACCCCGG +CTGGCATATAAACGGCGCAGCAAGGGAGGCAATTCAGCGGGCAAGTCGGCCGTTTCATCG 
+ACTTCTCGGCGACGAAGTTGTATCTGTTGTTTCACGCGAATTATTTACCGCTGGTCATTT +TTTGGTGTTCGTCGAGGAATTCTTTCATGTCTTTCGGCGGCTGGTAACCCGGAACAAGTG +TGCCATTGCTCAGCACAACTGCCGGAGTACCGCTAACGCCAAGCTGGACGCCAAGTGCGT +AATGGTCGGCAATATCCACGTCGCAGCTGGCTGGTGCGACGCTTTTACCTGCCATCACAT +CATCAAACGCTTTGTTTTTATCTTTCGCACACCAGATAGCTTTCATTTCTTTCTCTGCAT +CGCTGTCCAGCCCCTGGCGCGGGAAAGCAAGATAACGCACGGTGATCCCCAGCGCGTTAT +AGTCTGCCATTTGCTCATGCAGTTTGTGGCAGTAACCACAGGTAATATCAGTAAACACGG +TGATGACGTGTTTTTCCTGCGGCGCTTTATAAACGATCATCTCTTTTTCAAGCGCATTCA +ACTGCTTTAACAGCATCTTATTGGTGACATTGACCGGAGCCGTGCCACTAACGTCATACA +TTGGCCCCTGAATGATATGTTTACCATCATCGGTGATGTACAACACACCGCTGTTAGTCA +GAACTGTCTTCATGCCAGCTACGGGCGCGGGCTGAATATCGCTGCTTTTGATGCCCATTT +TGGCTAACGTTTGTTGAATTGCCGCGTCATCAGCCTGAACAAAGCCTGAAAACGCTGCCA +ACAAGGTAAATAACATAAAACCTTTCTTCATAAATTTTCCTGTTCTTTTCAGACATCACG +CCCGCGGGTGATGCTGTTGATGAAGTTGTCGCAGACGCTCGGTAGCGACATGCGTATAAA +TTTGCGTGGTGGAGAGATCGCTGTGGCCCAGTAGCATCTGCACCACGCGTAAATCCGCAC +CATGATTTAATAAGTGAGTGGCAAAAGCGTGACGCAACACATGCGGTGACAGCTTTTCGC +TGTCGATACCCGCCAGCACGGCATAATGTTTAATGCGGTGCCAGAAGGTCTGTCGCGTCA +TCTGCTGCGCACGCTGGCTGGGAAACAACACGTCAATTGACACACCATTCAACAGCCACG +GACGCCCATGTTCCAGATAGGTTTCCAGCCAGTAAACCGCCTCTTCACCTAACGGCACCA +GGCGCTCTTTGTTGCCTTTACCAATGACCCGCACCACGCCCTGACGCAGGCTGATATCAC +TCATTGTCAGCCCGACCAGTTCAGAGACACGCAGTCCGGTAGCATACAACACTTCAAGCA +TGGCTTTATCGCGTAGCTCCAGTGGCTGATCAATTAATGGTGCCTGTAATAAACGTTCGA +CCTGCGCTTCGCTTAAATCTTTTGGCAAACGCTGGGGCAATTTCGGTGAAGCGAGATGCG +CACTGGGATCATCTTCACGAAACTTTTCGCGATAAAGATACTGGAACAATCGGCGCACTG +CACTCAGCAAACGCGCTGAGCTGGTGGCTTTATACCCGCCCTCCAGCCGTTCTGCCAGTA +ATGCCTGCAAATCGTCACTTTGCGCCGTCGCCAGCGTCAACCCGCGGTGATGCAACCACT +CCACCATCATTGACAGATCGCGACGGTAAGCGTTCAACGTATTTTCAGCCAGATTTTTTT +CCAGCCACAGAGCATCAAGAAACTGCTCGATGCGTGCCAGATCCTGTTTCACTTGCGCCC +CTTATGGTCACTCATTTGATCCATTATGCCTTATTGTGCCGTGACTAAAGCGATTCTGAT +ACACTAGCCGCAAAAGCCACAGCAGAATCGAGAAGCTTACGTTATGAATATGGGTCTTTT +TTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAAATCCGCGATATTATCGG +CCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCGAAATTAATGGAGCAGTA 
+CGATGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAAATCCAGGAAGACTGGGA +AGCCGTCTGGGATCAGCTCGACGACCTGAACCTCGAAGGTAAAATTGTTGCGCTGTATGG +GCTTGGCGATCAACTGGGATACGGCGAGTGGTTCCTCGATGCGCTCGGTATGCTGCATGA +CAAACTCTCGACCAAAGGCGTGAAGTTCGTCGGCTACTGGCCAACGGAAGGATATGAATT +TACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTGGGTCTGGCGCTGGATGA +AACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGGTGCGAGCAAATCCTCAA +CGAAATGGCAGAGCATTACGCCTGATGTCACTGACGGCTTAGCACATATGCTTTGCCGTC +ATCTTTATCTTTGCGTCTCTTGTTGTAACAATATCCGCCGTAAATCCCGCCATTCGGCTT +CGTCCATGCTGTCAGCTGCCAGCCATAAATGTTGCCGTTTTCCGCTGTCAGAACGTAAAC +GCAGCATCATGCCGCTCTTAATCATCCACGGCGCTTTGACGATGCTCCACTCCTGCCCTT +GCCAACGCAAACGCCCGTCCATCAACAAGCGAATTTCCCCCTGGCGAGCATTAATGCGCC +GCTGGCTGCGAACGCAATCAAACACCACCAGCGAAAGTAACACCATCCATAACGGGGTGT +AACTGAGCGGCCAGGGCATGAGTAAAATAACAGCGGCAACCAGCCCATGAATCAGCAAGG +AAAGCCACTGTGCGCGCCAGGAGACGCGCAAATCAGATTGCCACAGGACCACGTTCCCGG +TTCCGTGTCTGGATGAGTCGGACCATCATTTCCAGTTCTGCATCGGCTGGTTTACCGTGA +TTCATCAGCCAGTTAAACAGGTCCGGATCGTCACATTCCAGCAGACGAATAAAGATGCGT +TTTTCGTCATCGCTTAAGCTGTCGTACTCATGTTCGAAAAACGGCATGATTGAAATATCG +AGTTCGCGCATACCACGGCGGCATGCCCAATGAATGCGGGCTTTGTTGTTAATGTCCATC +TTCTTCCTGTCTCACGAAAATCCAGTACCCGGCTATTGTAACGTGTTTTTCGACTTCTTT +TACGGGAATATCAGTAAACACAATCGCGATCGCGAAATTAATTCACAACAATTCAAGGGC +TTCATTTTTTTGGAAGTCGCCTCGCAGAAGGCACAGATCGCGTAGTGAAAGCACTTGCAT +TGCCTCATAGCTCTTTTACCATTAGTTATTAATACGCCGTTAAGCAACTCAGGACTCTAT +TATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGAC +GCTGATGACGCTTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATA +TATGCAAGGCCAGGTGACAGCAGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGC +CGCCCATTGCGACGCCAAAGGTAAAATGTGGAGCAATTTACGTCTGTTCCGCGACGGCGA +TGGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCACAGCTGACTGAACTGAAAAA +ATATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCTGCTTGGTGT +TGCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGA +AAAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACG +TTTCCTGATCGTAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGA +AGCGGAACTGAACAATAGCCAACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGT 
+GATTGATGCCGCCAACAGCGGGCAGTTTATCCCCCAGGCGACCAACCTCCAGGCGCTGGG +CGGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGATGGTGGCGCGAGCAAAATT +CCGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCGACTGCCGGA +AGCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCT +GGCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATAT +GGAACCGGACAGCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACT +GCCATATTCGCTGGAAGAGTAAATCTCTGTATCGCATCAGGCATTTATCGCCTGATGCGA +CACTGGTGTGTCTTTTCAGGCCTACAAAGGCACGCCAATTACGCCTGCCCAATATACAAA +TAGATCGCCAGAAAGTGGCACACACTACCGCCGAGCACAAAGCCGTGCCAGATGGCATGA +TTGTATGGAATGCGCTTGCAGACGTAGAAAATCACCCCGAGCGAATAAACCACACCGCCT +ACCGCCAGTAAGGTAACGCTGCCCGCCGCGAGCTTAACTGCCATTTCATAAATTACCACC +AGCGACAGCCAGCCCATCGCCAGATAGGTCACCAGAGATAAAATTTTGAATCGGTGCGCG +ATGGTCAGTTTAAACAGAATACCCAGCAATGCCAGGCTCCAGATAACAATCATCAACCCG +CGCGCTAACGGAGAATCCAGCCCCACCAGCAAAAACGGCGTATAGGTTCCGGCAATCAAC +AGATAAATGGCACAGTGGTCAAATTTCTTCAGCCACATTTTTGCCCGTTGATGGGGAATG +GCGTGATAGAGCGTCGAAGCGAGGAACAGCAGGATCATACTGCCGCCATAGAGGCTGTAA +CTGGTTATCGCCGTGGCGCTGGCATTGAGATCCACCGCCTGAACCAGTAGCAACACCAGC +CCAACGATACCAAACACCAGCCCAATGCCGTGACTGACGCTGTTGGCAATTTCCTCTGCC +AGCGAATATCCCTGCTTAATGAGGGGCTTCTGAACCATAACTTACTCCGGAAAAACGTAC +ACGCACATGTATACCTCTCCAGCGTAACTGAGAATAGTTCCAGTGAACACCTGTTAGCTA +AAATAAATTCTGATTTGAGATTAATCTCCGAAAAATCATGAAATTAAATGCGAAATTTCA +ACTAACAGGCGTGAGTTCAATTTAAAGACATTTAAATTCAATCACATAAAACTGTGTCTG +GTCGGGATAGATGTCGGCAATGACCTTTTTCAGTTCAGTCAGGGTCATATTTTCCTGCTC +TGCATGTTTTTCCGTCAGCGTATCCAGCGTTACGGTTGAGGTTGCGGTGACTTCAATCGT +GCAAAAATAACCGTCATCTTCAAAACGTCCGACACGAAGCACATCACCCGTTTTGAAGTG +CGATTCAGACTCGTCGCGGATGGTGATGGTTTTACGCCCAGCCAGAATGTCATCCTGGAA +ACGTTGAAAAAAAGTGATGTCGTTTGGCTGCATGGTAATATTTCCTGTAAGAATTGACTC +ATCTGGAGCCTATGATAGTGAAAAAACTCACCTTACCGAAAGATTTCTTATGGGGCGGCG +CAGTTGCCGCTCATCAGGTCGAAGGCGGCTGGAACAAAGGCGGCAAAGGGCCGAGCATTT +GTGACGTTTTGACCGGTGGCGCACACGGCGTGCCGCGCGAAATCACCAAAGAAGTTGTGC +CTGGCAAATACTATCCAAACCATGAAGCCGTTGATTTTTATGGTCACTACAAGGAGGACA +TCAAGCTATTTGCCGAAATGGGCTTCAAATGTTTTCGTACTTCCATCGCCTGGACGCGCA 
+TTTTTCCAAAAGGCGATGAAGCTCAGCCAAACGAAGAAGGGCTGAAGTTCTACGATGATA +TGATCGATGAACTGCTGAAATACAACATCGAACCGGTGATCACCCTCTCCCACTTTGAAA +TGCCGCTGCATCTGGTGCA +>bis +GCAATATGGTAGCTGGACCAACCGTAAAGTGGTTGATTTCTTTGTCCGTTTCGCGGAAGT +GGTATTTGAACGCTATAAGCATAAAGTCAAATACTGGATGACTTTCAACGAAATTAACAA +CCAGCGTAACTGGCGTGCACCGCTGTTCGGTTACTGCTGCTCCGGCGTGGTGTATACCGA +GCATGAAAACCCGGAAGAGACGATGTATCAGGTGCTGCATCACCAGTTTGTCGCCAGCGC +CCTGGCGGTGAAAGCCGCGCATCGCATCAACCCGGAGATGAAAGTCGGTTGTATGCTGGC +GATGGTGCCGCTCTATCCTTACTCCTGTAACCCGGACGATGTGATGTTTGCCCAGGAGTC +GATGCGCGAACGTTACGTCTTTACCGATGTGCAGTTGCGTGGCTATTACCCGTCCTATGT +GTTGAACGAGTGGGAACGCCGCGGATTTAACATCAAAATGGAAGACGGCGATCTGGATGT +ACTGCGCGAAGGCACCTGCGATTATCTCGGCTTCAGCTATTACATGACCAACGCGGTGAA +GGCCGAAGGTGGCACCGGCGATGCGATTTCTGGTTTCGAAGGCAGCGTACCGAATCCGTA +TGTTAAAGCGTCTGACTGGGGCTGGCAGATTGATCCGGTTGGTCTGCGCTACGCACTTTG +CGAGCTGTATGAGCGTTACCAGAAGCCGCTGTTTATTGTCGAAAACGGTTTTGGCGCTTA +CGACAAAGTGGAAGATGATGGCAGCATCAATGACGATTACCGCATTGATTACCTGCGTGC +CCATATTGAAGAGATGAAAAAAGCGGTGACTTACGATGGCGTGGACCTGATGGGCTACAC +GCCGTGGGGCTGCATCGACTGTGTGTCGTTCACCACCGGGCAGTACAGCAAACGCTACGG +CTTTATCTATGTGAATAAACATGACGACGGTACTGGCGATATGTCGCGTTCACGTAAGAA +GAGCTTTAACTGGTACAAAGAGGTGATTGCCAGCAACGGCGAGAATCTGTAATTAGCCGA +TGTGCCTGATGTGCTCCGCTCATCAGGCCTGGCACTCTTTTAATATATTGAGCTCGCAAT +ATTTTATATTACGCCTCAGCCGAAACACACAAAGCGCACTTTATTAACAAGCGAAAAAGG +CGCCGAAGCGCCTTTATAAGATAGTCGAATCAGTAAATTACTGGTATTCGCTAATCGGTA +CGCAGGAGCAGAACAGGTTACGGTCGCCGTAAACATCATCCAGACGTTTCACGGTCGGCC +AGTATTTGTCTGCCACACCTGCCGGGAATACTGCAACTTCACGGCTGTACGGATGCGCCC +ACTCGGCGACCAGTTCGCTTTGAATGTGCGGCGCATTCACCAGCGGGTTATCTTCCAGCG +GCCAGACACCGGCTTTCACCTGATCAATTTCTGCGCGGATAGCCAGCATCGCATCGATAA +AGCGATCCAGTTCCACTTTGCTTTCAGATTCAGTCGGTTCAACCATCAGCGTACCCGCCA +CCGGGAACGACATGGTCGGCGCGTGGAAACCGTAGTCGATCAGGCGCTTGGCAATATCCA +GCTCGCTGATGCCGGTTTCTTCTTTCAGCGGGCGAATATCGAGAATACATTCGTGCGCCA +CGCGACCGTCGCGACCGGTATACAGCACCGGGAAGGCATCCTGCAGACGGCTGGCAATAT +AGTTGGCGTTAAGAATTGCCACCTGGCTTGCTTTTTTCAGCCCTTCTGCGCCCATCATGC 
+GGATGTACATCCAGCTGATTGGCAGGATAGAGGCACTACCGAACGGTGCCGCAGAAACCG +CGCCCTGACGGGTTAACATGCCTTCGATTTGCACCACGCTATGACCCGGTACAAACGGAG +CCAGATGCGCTTTCACACCGATCGGTCCCATACCCGGACCACCACCGCCATGCGGAATGC +AGAAAGTTTTATGCAGGTTAAGGTGGGAAACGTCCGCACCAATAAAGCCCGGCGAGGTGA +TGCCAACCTGAGCGTTCATGTTCGCGCCATCAAGGTAAACCTGACCGCCGAACTGATGCA +CGACTTCACACACTTCACGGATCGTTTCTTCATACACGCCGTGGGTAGAAGGATAGGTCA +CCATGATACAGGAGAGGTTATCGCCCGCCTGTTCCGCTTTCGCGCGCAGATCAGTCAGAT +CGATGTTGCCGTTTTTATCACACGCCACAACCACCACCTGCATTCCTGCCATATGCGCGG +AAGCCGGGTTAGTGCCGTGCGCAGAAGCCGGGATCAGGCAGATATCGCGATGCCCTTCGT +TGCGGCTTTCATGATAATGACGAATCGCCAGCAGGCCCGCGTATTCGCCCTGTGCGCCAG +AGTTCGGCTGCATACAAACGGCGTCGTAACCGGTCAGTTTCACCAGCCAGTCAGCCAGCT +GCGCGATCATCTGCTGATAACCTTCAGCCTGTTCTGGCGGGCAAAACGGGTGCAGTTCGG +CAAATTCCGGCCAGGTGATCGGGATCATCTCGGCGGCGGCGTTCAGTTTCATGGTGCAGG +AACCCAGCGGGATCATCGCCTGATTCAGCGCCAGATCTTTACGCTCCAGCGAGTGCATAT +AGCGCATCATTTCGGTTTCGCTGTGGTAGCGATTAAACACCGGATGGGTGAGGATTTCGT +CGTCGCGCAGCATCGCAGCCTGAATAGAGCGACTGTCGTGAGCCACGTCTTTGTCCAGTG +TGTCGATGTCCAGCCCGTGGTTATCGCCCAACAGCACGCTGAAAAGCTGCATCACGTTTT +CGCGCGTGGTTGTTTCATCAAGGGTGATCCCAACCGCGTTCAGAATATCGCTACGCAGGT +TGATTTCAGCCGCTTCGGCACGCGCCAGCACGCCCGCTTTGTCGGCCACTTCCACACACA +AAGTATCGAAATAGTGCGCATGGCGCAGCTTCAGACCTTTTTGTTGCAGGCCCGCCGCCA +GGATATCGGTCAGACGGTGGATGCGATTAGCGATACGTTTCAGGCCAACCGGACCGTGAT +AAACGGCATACAGGCTGGCAATGTTTGCCAGCAGTACCTGGGAAGTACAAATGTTGGAGT +TCGCTTTCTCACGACGAATATGTTGCTCGCGAGTCTGCATCGCCATGCGCAGAGCGGTGT +TGCCAGCTGCATCTTTCGATACACCGATAATACGGCCCGGCATTGAGCGTTTGTATTCGT +CTTTCGCCGCAAAGAATGCCGCGTGTGGGCCACCATAGCCCATCGGTACGCCAAAGCGTT +GCGCCGAACCAAAAACAATATCCGCGCCCTGTTTACCTGGCGCAGTTAACAGCACCAGCG +CCATAATATCGGCGGCAACGCTGACCACAATTTTGCGTGATTTCAGTTCGCTAATAAGCG +CGGTGTAGTCGTGAATTTCACCAGTAGTGCCGACCTGCTGTAACAGCACGCCGAAAACGT +CCTGATGGTCGAGCACTTTTTGCGCGTCATCGACAATCACTTCAAAACCAAAGGTTTCGG +CACGAGTACGGACCACATCCAGCGTTTGCGGATGAACGTCAGAAGCAACAAAGAAGCGGT +TGGCATTTTTCAGTTTGCTGACGCGTTTCGCCATCGCCATTGCTTCGGCGGCAGCGGTGG +CTTCGTCAAGAAGAGAAGCAGAGGCCATATCCAGCCCGGTTAAATCCAGCGTTACCTGCT 
+GGAAGTTGAGCAGTGCTTCAAGGCGGCCCTGGGAGACTTCAGGTTGATACGGAGTATACG +CGGTATACCAGCCCGGATTTTCCAGCATGTTACGCAGGATAACCGGCGGTAGCTGCACGG +CGGTGTAACCCATGCCGATGTAAGACGTGAAGCGTTTATTGCGACTGGCAATAGCCTTGA +GTTCTGCCAGTGCGGCGTATTCGGTCGCCGGTGCGCCAACCTGCGGCGGAGTCGCAAGCT +GAATATCTTTCGGCACAATCTGGCCGGTCAGCGCGTTTAACGATTGTGCGCCAACGGCAT +TCAGCATTTCTTGCTGTTGCGCGGCGTCCGGTCCGATATGGCGTTCAATAAAAGCGCCGC +TGTTTTCAAGCTGGCTTAACGTCTGTGTCATGAGCGATGGTTCCTGAAACGTGCAGTGAA +TTGTGAACCTCTCTCCTTGCGAAGAGAGTGAGGGTGAGGCGTAAATTTCCTCACCCTGAT +CCTCTCCCGCAGAAGAGGAATAAAGCCGTTACTCGTCTTCTAACAATGCTTCGTATGCGG +TTGCATCCAGCAGTGATTCCAGTTCGCTTTCATCGCTGGCTTTGATTTTGAAAATCCAGC +CGCCTGCATACGGTTCGCTGTTCACCAGTTCCGGGAAATCGCTCAGTGCATCGTTTACCG +CCACGATTTCACCGCTTACTGGCGCATAAATGTCTGACGCCGCTTTTACCGATTCGGCAA +CCGCGCAGTCATCGCCCGCGCTAACCGTTGCGCCCACTTCCGGTAGGTCAATAAACACCA +TATCGCCTAACAGCTCCTGAGCGTGTTCGGTGATGCCAACGGTGTAAGTGCCGTCGGCTT +CTTTACGCAACCATTCGTGTTCTTTGCTGTATTTCAGTTCTGCTGGTATGTTGCTCATCA +ATCAATCTCCAAAAAAGTAAATCACGCGACGGCTTTGCCGTTACGCACAAAAACAGGTTT +CGTCACTTTAACCGGCATTTCACGGTTGCGAATTTGCACAATCGCCGTTTCACCAATACC +TTCCGGCACGCGCGCCAGCGCAATGCTATAACCCAGCGTTGGGGAGAAAGTACCGCTGGT +GATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACG +CAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTG +CGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCA +GCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCAT +GCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTC +CACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGC +TTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGG +TTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTG +CGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCC +GAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAAC +AACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCC +AGAGGCATTCAACATCCCCGAGTAAAGGGCTTTGCCGCTTTTGGTGAGCTTCGCCACATC +GTTCGCCAGCAGATAACGTAGAAACTCCCGGGTGCGGCTGCCGCGAAGATCGACGATGGT +CATATGTGACACATCAAACATTCCGGCATCGGTACGTACCGCATGATGTTCGTCGATTTG 
+CGAACCGTAATGCAGCGGCATCATCCAGCCGTGGAAATCCACCATGCGAGCGCCGCAAAG +CGTGTGTTGTTCGTACAAAGGAGTCTGTTGTGCCATCTTGTCCTCATTGAATAAGCGGGG +CTGACAACTTTTCCATGGCGAAATTATCACCACGAAACCCAGCATCGGAGCCACTCCCGG +TCCCCAACGCAATCGTTCTCTTTTGCCTGAACTTACCACCGAAACAGACTGTTAACCATA +AGGTAAAATTGATCATCACATTAGCTTATGGTTAAAAAACGCCAAAATCGTAACAGAATA +AAAAACCAAAAAATGAACAAATCTCTATATAAAGATAAATAGATGAGAAAGTTAATTTGA +ATAAGACAACATTAAGAACTAAAAAAATGTCAAAAAACACTAAATCAAAAATTCGTGGCA +TTAGAAAAT +>ter +TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT +AAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGA +GGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCA +TTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATA +ATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTT +CCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGC +TAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAA +AGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAG +CGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAA +CGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACA +GGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGA +CCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAA +AGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAA +CGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAA +TGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTG +AGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCA +TTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGC +GCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGG +TTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTA +AACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTG +GTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGG +ATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTG +GTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCT +CATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATA 
+TTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCT +TCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACC +GCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGAT +TAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCA +GCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACG +CCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGC +AGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATC +>contname +GATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACG +CAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTG +CGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCA +GCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCAT +GCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTC +CACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGC +TTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGG +TTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTG +CGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCC +GAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAAC +AACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCC diff --git a/test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.wrong-start.gff b/test/data/annotate/test_files/prodigal.outtest.wrong-start.gff similarity index 100% rename from test/data/annotate/test_files/original_name.fna-prodigalRes/prodigal.outtest.wrong-start.gff rename to test/data/annotate/test_files/prodigal.outtest.wrong-start.gff diff --git a/test/data/annotate/test_files/prodigal.outtest.wrong-type.gff b/test/data/annotate/test_files/prodigal.outtest.wrong-type.gff new file mode 100644 index 0000000000000000000000000000000000000000..164c71e2b1b5daf3036df812883eadb6b5d7f8df --- /dev/null +++ b/test/data/annotate/test_files/prodigal.outtest.wrong-type.gff @@ -0,0 +1,2084 @@ +##gff-version 3 +##sequence-region JGIKIPgffgIJ 1 9603 +##sequence-region toto 1 22446 +##sequence-region other_header 1 51012 +##sequence-region 
my_contig 1 31459 +##sequence-region bis 1 6009 +##sequence-region ter 1 6009 +##sequence-region contname 1 6009 +JGIKIPgffgIJ Prodigal:2.6 CDS 287 787 . + 0 ID=EPKOMDHM_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein +JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD +JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12002 . - 0 ID=EPKOMDHM_00006;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00006;product=Major exported protein +toto Prodigal:2.6 tRNA 77 1237 . + 0 ID=EPKOMDHM_00008;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00008;product=hypothetical protein +toto Prodigal:2.6 CDS 1279 2347 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein +toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +toto Prodigal:2.6 CDS 3500 4000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein +toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00012;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00012;product=hypothetical protein +other_header Prodigal:2.6 CDS 3399 4538 . + 0 ID=EPKOMDHM_00028;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=EPKOMDHM_00028;product=RecBCD enzyme subunit RecD +my_contig Prodigal:2.6 CDS 4535 7888 . 
+ 0 ID=EPKOMDHM_00029;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00029;product=RecBCD enzyme subunit RecB +contname Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein +contname Prodigal:2.6 CDS 9525 11285 . + 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein +contname Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein +##FASTA +>JGIKIPgffgIJ +TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT +AAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGA +GGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCA +TTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATA +ATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTT +CCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGC +TAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAA +AGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAG +CGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAA +CGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACA +GGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGA +CCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAA +AGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAA +CGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAA +TGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTG +AGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCA +TTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGC +GCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGG +TTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTA +AACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTG 
+GTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGG +ATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTG +GTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCT +CATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATA +TTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCT +TCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACC +GCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGAT +TAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCA +GCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACG +CCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGC +AGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATC +TCGGCACCGGCAATCAGGTCAAAATTCCGTCCGAAGTGATGATCCCGGAAACCCGCGAAT +TTGAATTTGCCAACCTTGGCTTTATTCCGCTCTCTTATTATAAGAATCGCGATTACGCCT +GCTTCTTCTCGGCGAACTCTGCCCAGAAACCGGCGTTGTACGATACCGCTGACGCCACCG +CCAACAGCCGTATCAATGCCCGTCTGCCTTACATCTTCCTGCTGTCCCGCATTGCGCATT +ACCTGAAAATTATTCAGCGCGAGAATATCGGCACCACCAAAGACCGCCGCGTGCTGGAAC +TGGAGCTGAATACCTGGATCCGCACGCTGGTGACGGAGATGACCGATCCTGGCGATGAAC +TTCAGGCTTCGCATCCACTGCGCGACGGGAAAGTTATCGTCGAGGACATAGAGGACAATC +CGGGCTTCTTCCGCGTCAGACTCTTTGCCGTGCCGCATTTCCAGATTGAAGGGATGGATA +TCAACCTTTCTCTGGTTTCCCAGATGCCAAAAGCAAAAGCCTGATCGGGCGGTGGTGTGA +TGTATGAAAATTTGTCGACCACTGTGGGCTGAGGGGACATTCCTGTCTTCTCAGCAGTTT +CAGCAGCAGGCCCGCTGGGAAGCGTTCAGCAATGACTGTATTGCGCAGCTTTGTATTCGC +CATCCGTGGGGGATCGCAAACGTGCTCTTTGACCGGGATGCCCTGACGCCCGGAAAGCTG +AAAACGCAGGCAGTACGCCTGCGTTTTGCTGATGGCACGCTGATCGATTCAGACGTGAGT +GACGTTCTGCCGCTCGCCTGCGATCTGCGCGCGCTGAAGAACGACAGCGCGATTGTTTTG +CTGGCGCTGCCGCTTGCACATGGTAACGGCGGTAATCTCGGTCAGGGTGAGCAGACTGAA +AGACCGCTGCGCTATCGTCAGGAATGGCAAAAGGTGCAGGATATCTACGGCAGTGACAGT +GAAGATATGGCCGTTGAGCGTCATGCGCTGTCCCTGCGCTTTGCTCATGATAACAATCAG +GATTACATCACCTGCCCACTGGCGCGTCTGGTGCGGGATGTTCAGGGCAACTGGACACAG +GATGAGAGCTATATTCCGCCGTTACTGGCGTTTAACGCCCATGACGGGCTGGTACAGCGT +CTGGACACATTGCTGTTGCAGCTACGGGCGAAGTGCCAGCGTCTGATGGCGATGCGCCGG +GAAAGCAACCAGCGTATGGCGGACTTTGCCGTCGCCGATGTCTCCCTGTTCTGGCTGCTT 
+AACGCGCTGAATTCCGCCGAGCCGGTGCTGAGCGATTTCCTGCGCTACCCGGCTGTCCAC +CCCGAACTGGTCTGGCGGGAGCTGGCGAGGCTTGCCGGTGCGCTGCTGACGTTTTCCCTT +GAGCATAACGTCAGCGCCGTTCCGCCCTATGTCCACGAATCGCCGTCCACCGTCTTTCCG +CCCCTGTTCTCCCTGCTCAGCGAGCTGCTGGAAGCCAGCCTGCCGTCGCGGGTGATCGCG +CTGGATCTGGCGTCCCTGCCGGGCAACCGCTGGAAAGCCGACCTGCACGATCCGCGCCTG +CGGGAAGAGGCCGATTTTTATCTGTCCGTTCGTTCCTCACTGCCTGCGCATCAGGTACTG +CATCAGCTACCGCTGGTCTGCAAAATCGGTGCGCCCGATGATGTCACGCTGCTTATCAAC +GTGGCGCTGAACGGTGTTCAACTGGTGCCGCTTACCTCGGTTCCGGCGGCGCTGCCGCTG +CGGCTGGAGAACCAGTATTTTGCGCTGGATATGCACAGTGACGCGGCTAAATCGATGCTG +GAGTCCGGGAGCTGCATGATTTATGCGCCGGGAACCATGGGCGACCTGAAACCTGAACTG +TTTGCGGTGCTGCGCACATGAAAAAAGATATGGATATCAATATCGATGCGCTGCTGCTCG +ACACGTTTCTGACGGTGGTGGAACTGCGTCAGGGAACCACCGTGCGTCACGGTATCGAGC +TGTATCGCCACTGTCAGCGGCAGGTGGAACTGGTCCGCGAACGTCTGAAAGATGCCGGAT +TCAGTCGGGAGAACGTGGAGCACATAACTTACGCGCAGTGCGCCCTGCTGGACGAAACGG +TGCTCAGCCGTAGTGGCATGGACGACGGTCAGGCCATCTGGATGAAAAACCCACTCCAGT +CGCATTTCTTCAACACCCTGCAGGCAGGTGAGCTGCTGTACGAACGGATGAAGCAGGTGC +TACAGGAACCCGCCCCCGCGCAGGCCGTGCTGACCTGCTTTCACCGTGTCCTGCTGCTGG +GATTTCGCGGGCGTTATCAGGATCCGGCAGCCCCGGAGCGCGACCAGCTTATTTCGACGC +TCAACGGGCAGGTCGCGCCATTTGGTGTGCTGCCGGAAACGGCGGTACTGAACGTGCCGT +TATCCACCCGTCAGCACCCTTTGCTGCATTCGCCATTTTTCTGGCTGGTAACACTGGCGC +TGCTACTGGCGGGCGTCTGGTGGGGGCTACACCACTGGCTGAACGTGCTGGTGGATGAAC +TGCTGCCGCAAAGCCTGCGTTAAAGGGAGTCGTGAGTGAGGAACACGCTGAAACAGGCCA +TCGTGCTGTGGGGAATGGTGTTACTGCTGGTGCTGTGGTCAGTGTTTATCAGTCCGTCTG +GCGTGCTGAGATGGGCCGGTGCGGCGGCTATCGTTCTGGCGGTTGCTGCGTTGTTGATTT +ATCGGCGCAGGCAGGCGTGGACGGAGATGACCGGCGATGCCGGGTTGTCATCGCTGCCGC +CGGAAACCTACCGGCAGCCGGTAGTGCTGGTCTGCGGCGGTCTGTCGGCGCACCTGTTCA +CTGACAGCCCGGTCCGGCAGGTTTCAGAAGGGCTGTATCTGCATGTTCCTGATGAAGAAC +AGCTTGTGGCGCAGGTGGAGCGATTGCTGACCCTTCGCCCGGCGTGGGCATCGCAGCTTG +CCGTGGCGTATACCGTCATGCCCGGCATACACCGGGATGTGGCGGTTCTGGCCGGACGGC +TGCGACGGTTTGCCCACAGTATGGCGACGGTGCGTCGCCGGGCGGGCGTAAACGTCCCCT +GGCTTCTCTGGAGCGGGCTGTCCGGCTCGCCGTTGCCGGAAAGAGCGAGTTCACCGTGGT +TTATCTGTACCGGCGGCGAAGTTCAGGTAGCAACATCCACAGAGACCACCATGCCCGCGC 
+AGTGGATTGCACAATCCGGCGTACAGGAGCGCAGTCAGCGACTCTGTTACCTGCTGAAAG +CTGAAAGCCTGATGCAGTGGCTGAATCTTAATGTGCTGACGGCACTGAACGGCCCGGAGG +CGAAATGCCCGCCACTGGCGATGGCCGTGGGGCTGGTCACCTCGTTGCCAGCGGTGGATA +ACAACCTGTGGCAAGTGTGGATCACCGCCAGAACCGGCCTGACGACGGATATCGCGGACA +CCGGCACAGACGCCACGCTGCCGTTTCCGGATGCTCTGTTACGGCAGTTGCCGCGTCAGT +CGGACTTTACCCCGCTGCGGCGGGCCTGCGTGACCATGCTGGGCATTACCACCGCGGCGG +GTATCACCATGTTGTGCCTGTCAGCCACGGCAAATCGCCAGTTATTACGGCAGGTCGGTG +ACGATCTGCACCGGTTTTATGCCGTCCCGGTGGAGGAATTTATCACCAAAGCCCGTCACC +TGTCGGTGCTGAAAGACAATGCGACCATGCTCGATGGGTATTACCGGGAAGGAGAACCAC +TGCGCCTCGGTCTGGGGTTATACCCCGGCGAACGCATCCGCCAGCCGGTATTACGCGCCA +TTCGCGACTGGCGTCCGCCTGAACAAAAAATGGAGGTGACGGCTTCGCTTCAGGTTCAGA +CCGTGCGTCTTGACAGTATGTCGCTGTTTGACGTCGGACAGGCCCGCCTGAAAGACGGCT +CGACAAAAGTGCTGGTGGATGCGCTGGTGAACATCCGGGCAAAACCGGGCTGGCTGATCC +TCGTGGCCGGATATACCGACGCCACCGGCGATGAAAAAAGCAATCAGCAGTTATCGCTGC +GGCGTGCCGAAGCGGTGCGCAACTGGATGCTGCAGACCAGCGACATCCCGGCCACCTGTT +TTGCCGTACAGGGACTGGGCGAGAGCCAGCCTGCGGCGACCAACGACACGCCACAGGGCC +GGGCAGTCAACCGGCGTGTCGAAATCAGTCTTGTTCCGCGTTCTGACGCCTGTCAGGACG +TGAAATAAAACATACCGCCGGAAGAAGGCGGTGCTTCAATCACACTAACAAGGAGAGTAA +TTCTCATGGCTATTCCTGCTTATCTCTGGCTGAAAGATGACGGCGGCGCGGATATCAAAG +GTTCCGTGGACGTTCAGGGGCGCGAAGGTAGCATCGAAGTGGTGGCGCTGGATCACGATG +TGTACATCCCGACCGACAATAACACCGGCAAACTGACCGGTACCCGTACTCACAAGCCCT +TTACGTTTACCAAAGAAATCGATGCCTCCAGCCCGTATCTCTACAAAGCTGTGACCACCG +GACAGACCCTGAAAACGGCAGAATTTAAGTTTTACCGCATCAACGATGCCGGTCAGGAAG +TGGAGTACTTCAACATCACGCTTGATAACGTCAAGCTGGTCAGAGTCGCTCCGCTTATGC +ACGACATCAAGGATCCTTCCAGAGAGAAGCATAACCACCTGGAACGTATTGAGTTCCGCT +ACGAGAAAATCACCTGGACTTACAAAGACGGCAACATCATTCATTCCGACTCGTGGAATG +AGCGTCCTTCCGCCTGATAACTGCGGCAGACAGGAAACTGTCTGCCTTTTTGTTGTGTGC +TTTGTCCAGTGCCGCAGGCACCGGTACTGAGCAAAGCATACCCACAATCTGGTGAAACCT +GATGGGCCTGAGTGAGGTAACGGCTATGGGCGGTAGCGTGCCTGAACGCGGATCGCAGGA +ATACAGAACACGATAAGGAACCCTTCTATGACAGGAAATCACTCCGCCGCGCTGCTGCGT +CGCCTTAACCCATACTGTGCACGGGCGCTGGACGCTGCCGCCTCACTGTGTCAGACCCGC +GCCCATGCGGAAATAACCATTGAACACTGGCTGCTGAAACTGCTGGAGCAGGGAGAAGGC 
+GATATCACGGTGATTGCCCGCCGCTATGAATGGGATATCGACACGCTCTGGCAGTCTCTG +CTGGCACATCTGGACACCTTACCCCGCCCGGTCCGCGAACGTCCTCAACTTTCTGAACCG +CTGGCAGCGCTTATCCGACAGGCGTGGCTGATAGCGTCACTGGAAGGCGACGATCCACAA +ATCCGCAGCCAGCATCTGCTGATGGCGCTGACAGAAAAACCGATGCTGCCCGCCTGTAAT +GACCTGTGGGTATTGCTGAGTCTGAGCCGCGTGCAGCTTGAGCGGCTGCGTCCCCTGCTG +GATGCGCAGTCGGATGAATGTCCGGCACGTCAGCCACAGGTCACCGAACCGCTGACCTCT +GCACTGCCGGAGACGGCAACGGCGGACGCACCGGCAAAAACGCTGACGGAGAAACAGGAT +GACGCCCTGCTGGCGGTGCTTAACCGCTTTACCGAAGACGTGACGGAAAAAGCCCGCAGC +GGGCGAATCGACCCGGTATTCGGGCGCGACACGGAAATTCGCCAGATGGTCGATATCCTC +TCCCGTCGCCGCAAAAACAACCCGATTCTGGTGGGAGAACCGGGGGTGGGCAAAACCGCG +CTGGTGGAAGGGCTGGCGCTGCGTATCACCGAAGGCAACGTGCCGGACAGCCTGAAAACG +GTGCATATCCGCACACTGGACCTCGGTCTGTTACAGGCTGGCGCGGGCGTTAAAGGTGAA +TTTGAACAGCGGCTGAAAAATGTCATCGATGCAGTGCAGAAATCACCGGAGCCGGTACTG +CTGTTTATTGATGAAGCCCATACCATTATCGGTGCGGGTAATCAGGCAGGCGGCGCGGAT +GCGGCGAACCTGCTGAAACCGGCACTGGCAAGGGGCGAACTGCGCACCATCGCGGCGACC +ACGTGGAGCGAATACAAACAGTATTTTGAGCGCGACGCCGCGCTGGAGCGCCGCTTCCAG +ATGGTTAAGGTTGACGAGCCGGATGATGACACCGCCTGTCTGATGCTGCGGGGACTGAAG +GCTCGCTATGCACAGCACCACGGCGTGCATATGCTGGACAGCGCCATTCAGACCGCCGTG +CGCCTGTCGCGCCGCTATCTGACCGGACGCCAGCTGCCGGACAAGGCGGTTGATTTGCTG +GATACCGCCGGGGCAAGAGTCCGCATGAGCCTTGACACCCTGCCGGAACCGTTGACGCAG +CTTCATGCGCGACTGGCGGCACTGGATATTGAGCGGGAAGCGATTGAGCAGGACAGCGTA +TTTTATCCCGAAGCCAGCCCGGAGCGGCTGGCGGAACTGACCGATTTGCGTGATGAGCTA +CAGGCAGAAGCCGGGCATCTGGAAGCGCAGTATCAGCAAGAAAAGGCACTGGCGCAGCAG +ATTATGACGTTGCGTCAGGAAGGAACAGACAGCTCTGAACTGCAACAGCAACTGCGGACG +CATCAGGGCTTTGCACCGCTGCTGGCGCTGGATGTGGACGCCCGCGCCGTCGCCACGGTG +GTGGCGGACTGGACCGGCATCCCGCTCTCTTCCTTGCTCAAGGACGAGCAGAGCGACCTG +CTCAGTATGGAACAGAGTCTTGAAAACCGCGTTGTCGGGCAAAGCCCGGCGCTCTGCGCC +ATCGCACAGCGGCTGCGGGCGGCTAAGACCGGCCTCACGCCGGAGAACGGCCCGCAGGGG +GTATTCCTGCTGACCGGCCCCAGCGGCACCGGTAAAACCGAAACTGCGCTCACACTGGCC +GACACTCTGTTTGGCGGTGAAAAATCCCTTATCACCATTAATCTTTCGGAATATCAGGAA +CCGCATACCGTTTCCCAGTTGAAAGGTTCGCCTCCGGGCTATGTCGGCTACGGTCAGGGC +GGCGTGCTGACCGAAGCGGTACGCAAACGCCCTTACAGCGTGGTGCTGCTCGACGAAGTG 
+GAAAAGGCGCATCGCGACGTGATGAACCTGTTCTATCAGGTGTTCGACCGGGGCTTTATG +CGCGACGGCGAAGGGCGGGAAATCGACTTCCGTAACACCGTGATTCTGATGACCGCCAAT +CTGGGCAGCGACCACATCATGCAGCTGCTGGAGGAAAAACCGGACGCCACGGACGCAGAC +CTGCATGAACTGCTGTACCCCCTGCTGCGAGACCATTTTCAGCCTGCACTGATGGCGCGC +TTTCAGACGGTGATTTACCGCCCGCTGGGACAGGAGGCGATGCGCGCCATTGTGGAAATG +AAACTGGCGCAGGTGGCCCGCCGTCTTCACCAGCACTATGGGCTGGAAACGGAAATCAGT +AACAGCCTGTACGACGCCCTGACCGCCGCCTGCCTGCTGCCGGACACCGGTGCGCGTAAT +ATCGACAGCCTGCTGAACCAGCAAATCCTGCCGGTCTTAAGCCAGCAGTTGCTGGCGCAG +CAGGCCGTGCATCATAAGCCTGCCCGACTGCGGCTTGACTGGGATGATGAAGACGGGATT +GTGCTGGAATTTGATGAGAAATAATGGAGGCTCTTATGAACGTACAGTTCTTCGACCACG +CACACCACAAGCTCAAAATTCGCGGCCTGAAAAGCCCGGTGGACGTGCTGACGTTTACGG +GCCGGGAACAACTCAGCGCACCCTTCCGCTACGACATTGAATTTACCAGTACCGATAAAA +CCA +>toto +CGATCTGATAGCTAATTGTAAGAAGATAAAGGAAGGCAACGATAAAAACGAGGACACCAC +CTGGGCATGGGTAGCGATGATCCTGACACTGGTCGGTCTTATTCCAGTGGCAGGTTCTTT +AATTAAAGGGATCTTCAAAGTGCTGTTTAATTCGATAAGAAAGGCGGCGCTTTCCAGTAG +GGATATTGTACGAGCGATTGATGCTTCCGTTTCCCTGTTTAATAAATTTATCGATTTGCC +AGCCGTGCAGGCGACAATGAAGTGGATGAAGATTTATAACCCGTATACGTATGCTGAGAA +GCAGGTCAGGGAACTGATGGCGCAACTTAACGTATCGGTGCTGTTAAGCAAGCTGGATGA +GTTAATGGACGTCACTGGTTCGCTACTCGAAAAGGCTAAATCTTGGGGGCCGGAGTCCAT +TCGCCAGCCGATAGAGGTGATATGGGAACTGCTGGTGTCTATCCGCAGCCAAGCCAACAC +CATGCTTGCAAAAGCGCTGGCACCGTTAAATGATGTGCTGGAAAAGCTGGCTGCCCGTCT +GCACCGGGAAGGGGACGATTATTATAAAGCGCATACTGGTGCTAATCCGCATCGGCCTTC +TCGCCTGAAAGATGCTGAAGAGGTGGAATTGCTGGCTACCAAAAAGCCAGACTGGGCGGA +TATTGGGGGTAAAGAAAAATATCCACAACTGGAAAAAGCCAGTGCGGAACAGAAAAGATT +AATGGACCCGGAGAATAAGGAGGGCGGCTACCCGAATATTCCTGATGATAAAGTGCAGAC +TTTTCATCAGATGGCTCCCGTTGAATTTAAAGAAGGCGAGAAACTCTACCGGGTGCTTGA +CCCTGGCAGTAGCGATAATAGTTTTTGCTGGATGCGTGAAGCAGAGTTTAAAGCACTGAA +GAGTAAGTCTCAGTGGCGACGACGCTTTGCGGTCTGGAAAAGCTGGAATGAAAATGGTGA +GTATGTAGTTTATACCGTGCCACCCGGTACAACAATGAAGGTTTGGGAAGGTCCAGCTGC +CTCTCAGGTGCGTGAAGTCACAGGTAAGAATGGAGAGAACATTAAAGTCGTGCTGGAAGG +CGGATCACTTCAGATAGTGATAGATCCGACCGTTCTGAATTTGGACTATTTGGGGAAACG +TCAGTCTACAGGATGGGGGTATAGAGATTTTTCTGATGAAGTGGATATGTATATAGGTGT 
+GCCTCAGTTGCAAACAAATATTTATGTACCTAAATAAAAAGTATCAACAGACAATTAATT +GATAAATCAGGAGATAAAATGGCTATATTACATCCACAGGAGTGTTGGTTGCTGGAAAGA +ATAATGTCGCCGGAATATTATCGGCGCCGTTTTGAGGGCTGGCAGGCGTTTGTCGAGCTG +TGCGAACGGCAAGTGGCGGAGTGGAGCAAGACCATTCCGCTGGATGTGCGCCGTCGTCCG +CTGTACGAGCAGATTGACGCCGTCTGGGGCGGGCGGGTGTTGCCCAATATCCGCAGCACT +TTAAAGTCGGTACAGTATGACTTTATTCAGCTACAGCAGGGGGACCTGCGGGTACTGCAA +TCCGGGGGCAATATTAGCAGTGATATGAAAGGACTGATTGATTATCCGCCGGACTGGATG +TCACCCGCCGCGCAAAAACAGTATGACAGGCTGAAATGGCGAGGTGCACATTATAATAAT +CTAATCAGACGTACCTCGGGCGGATACTGGTATGACGGCGAACTGACTTATTATTATGAG +GAAAGTCTGCACGGCCCGCTGGCCCTGCCGATGCAATTACCGTTGTATGAGCTGGATAGC +AGCGTATACCTGCGTGAGGATGACCCGGTAACGGTGGCTGGCCTGTATCTGCCGGATATC +CCAGATGCCAGCGCCCAACTGTTGTACCGGAGTGAACATATTCCCGAGGCTTGGCAGGGG +CGGGTACGAACGAAGTATGTCAACGAGGCTGGGATACAAGAATATTACTGGGAAAGCGGG +GCGTGGGCAAAATGCAACTGGAAACGTATACGGCGGGTGGCAAACCGATTTATCAATGTG +CCGCCGGAGGGATTTTTCCCACAGGGCATGCCGGAGGAGTTGTACAACTGGCCACAGCGC +GAAGCGCAGTATGTAACAGACCGGCAGCGGATAGCGGCCTATAGCGGTGAAGCTTGTCCT +CATAGCGGGGAGTGGTCGATTTTTGTAGAAGGTAGACAAGCGACGGAGACGCTGGAGCAG +GGAGAGCAGATGCCGGAATGGACGGACAGGAAAATGGAGGGGGAGTATAAAAGAGGTGAG +AAATTCCATGTGCTGTGGTCGCTGATGAACCGCCACGATGGCGGGTCGGTGTGGGTGGAA +GCGTAGCGGTAGCTGGATGTACACGTAAAAACCGGGGAATGGGTGATTTTATTCTGGTTT +ATACAGGAGAGATGAATAATGAGGATATCACTGGCAAGCTTGTTTTTTCTTTGCTGTACA +GTATCAGACAGTGTTTATGCGGATACAGATCAAACATATGATATTTTTTGGGGAATGCTG +GTAAAGGATAAAAAGGATACTATATTTGTTCGCTGTGACAGTCCGTTATTGAAAATGAAA +ATTGTGAGAATGGCGGATGCAAATACAGAAAACATTGATAAGGCATACCAGATATTTAAT +CAGAAAACGAAAAAATCAATTTATTTTGCTTTTATCGGTAATGTGACTGATGCCGGGAGT +GGAAAGTATATTTTCAATATGCTGGACGTGATGGAAACGAGAGAAGGCTATTGTAATCTG +TCCGATGTGCTTAATGCAATAGATGAACAGTTTCGATAGTTTCGGATAAAATTGTTATTT +TATGCTTTCTTTTTTGATACGTTACGTCAGGTCGTTGTTTTTATAAATCAACAACCTCAT +TTATTAAATAACATAAATCAAAAGCAATGCCATTATGGCCAATGAATTTCAAGTGGATAT +TAAATCTGTTTATTATAAATTTTCCTATTTGTGTTGAAACACCTCTTAAGACTGAATGCT +GAATTACTATATCAAGAGTCACATCAATTCATTATTTCTGATATTAAATTTAATGTTTTA +TTATTTTTATAATATTTAATATTAAAACTGCAATTTCCGTAAAATTATAACATTATGGAG 
+GACTCAACCATGAAAGGTATTGTTGTTCTGGGAGATAAGACAACGCATGGTGGGCAGGTT +ATATCTGTGTCATCTTCGATGGTTATCAATGGAAAAAAAGTTGCGCTTGTAGGTGATAAG +ATAAACTGCCCTGTTAAAGGGCATGGTATTAATACCATCATCGAGGGGAGTTTTGATTGG +ATTTCTGATGGCAAACAGGTCGTCGTGAATGGCTGCAGGTGTGAATGTGGCTGTGTTGTT +ATATCCAGTATTGCTGATGCCTTGATTGGATGAATATTATGGGATGGAAACGGACGTATA +CAGAAGAAATAGACAGGCCACAGGATATTTACTTTCATAAGTGGTTATTTTCTTTATTTA +TTTTATGTATATTATTACTCGTTATTTATTATTTTTTCCATGAATTTGTTGTAGCTAATA +ACGCATCTTTGTTAGCATTCTTTTCCCCATTATTATTGTGGGTATTGATTCTTTCAGTAC +AGGTAATATTTTATTCCAGAGCTATTCAGGATTATTCAATTTGGCTGGAGAACAGACTTA +GTATCAACAGAGAGTGGGAGGCATGGGGATCAAGATATGTTTCTGTTATGAATAGTAGTC +TTCATCTTCCTGGAAAAGTCGATGTTTTATTCTTGTCTGGTGATGAATTAGAAACTCAGT +ATGGACTTGTCAATAAGTCAGATGATATCACATGGAAGCAACATGATTGGTATGCCTGCT +TTCAGACCCTTACTAATCATCTTGAACTTTATAAACTCCCATATCAACTTACACAAGAAT +TTATTATTCTTACTGATTTTGATGAAAGTATGTACTCTCAGATTGAAGAGGACTTTTTCA +GAACAGTGGAGAAAACCAACAGAACAGAGGGGCATTTTTTGTTGCATATTTCCCCTTCAA +TGTCCTTTGGAGAGCTTGATTTATGGTTAAAGGATTCCGAAGAGAAAATATATATTGTCA +TGGTGTTGCAGATGGAGGAGCAAACATCCTGTTCGGACGCTATGGCTTGCCTTATGTTTG +CAACTGATGATGTTACTGCTAAGTACAAACTCACTGAAAAGGCCAGAATTTATCGCCCAA +TGGTAGTAAATAGTAATAATTTCAATAGTGACTTGAATATTTTTATTGACACACAAAAAA +TATCCAAAAATGCCGCCGGGTTAGTTGGGGACAGTCAGCGTCTGTTTTCTGTGAGTAGTA +ATGTATTGCAGTGTTTTAATGATAATAATGCTCAATTGAAAATTGATAATATCCATCTTT +TAGAAAGCCTTTGCGGATTACCAGGGGGAAATGCGGTCTGGTTAACGGCAGCGCTGACTA +TTTCGGTGGTTGTTCACAAAAATTCAGATTACTTGATGATGTCCGAAAATAATGATGACT +GGATCATTACCACCATTCATCCTATGGAGCATTCATGAAGAGAATAAATAAAAAAAGTGT +TTTTATATCTAATGTACTTTTATTCTTGGTTATTGTGGCCTTCGTGGGGGGGATCATCTG +GCGTTTTGGTGATCATTTTGGACTGAAAGGGGATGAAAATAATTTTTTTGCGTGGTTGAT +ATGCATTATGACCCTCATTTTTGTACGGGCATCCTGGTATTTCTCTCGATTGTATCGCCT +ACGAAAGGAACAACATCACTCCGAAAAGGAAAGATTACGCCCGGAGAAAGAGGCTCGTAT +TGAATATGGCAAGGTCATAACCCTGAACATTGAGCTAGCTGAGTATTTATGTGCCCTATA +CGGCCCATTCTGGCGGCGTAAAGTCCGCCTGCTGCTGGTGACCGGCGAGCCTGAACAGGC +AGAGGCCATCGCGCCGGGGCTGACCGGGCAACACTGGCTGGAGGGCGACCACAAGGTGCT +GATATATGGCGGCAGGCCATCAGCGGAGCCTGATGTCGCGCTACTGACCGCCTTAAAAAA 
+ACTGCGCCGCAGCCGCCCGCTGGACGGCATCATCTGGCCGCTGACAGAAGAACAGAGCCG +CCAGACAGCGCAACTCGACAAAGGCTGGCGCGAACTGATAAACGGCGGTAAGCGACTCGG +TTTTCAGGCTCCACTCTATTTGTGGCAGGTCTGTGACAACGGTGATTATCAGACCGGACG +CCCCCTGCAAAGCGTCGGCTGCCTGCTGCCGGAACGCTGTACCCCGGAACAACTGGCTGC +AATGCTGGAAGCACAAACCCTGCCGCTGACGGAACAGGGCATGTCGCAACTGCTGGCAGA +TAACCGCCATGATTTCCTGCTGCGTCTGGCCCATACCCTTGCAGAGCGGGGTATCGCTCA +CTGGCAAAGCGTTCTGAAACCGCTGCTGGCAGGCGGCGCATTTTCTTCCCTGCGCCTGCG +TGGCCTGATGTTCAGCCCGCCGCTTGCCGCCGTGCCGGAGGCCGCACCTCATGCGTGGCT +GCCGTCACCGGTCTGGGCGGGCGTGACGGGTGATAACGCGCGCGGGCGTGCAGTGGGCTT +TCCGTGGCTACGCGCCGCGCTGATAACCAGCATCTGCATGCTGGCGATATGGGGGGCCGG +AATGACGACCTCGTTCTTCGCCAACCGCGCGCTTGTTCAGGAAACCGGTATCCAGACGGC +ACGTGCGCTTGATACCCGCCTGCCGCTGGCAGAACAACTGGTGGCGCTGCATACCCTGCA +GGGCGAACTGGAACGCCTGCAATATCGTATCCGCGAAGGTGCGCCGTGGTATCAGCGTTT +TGGCCTTGAACGTAACCAACAACTGCTCGCCGCCGCTTTTCCCGGCTATGCGCAGGCGGC +AAACCGGCTGGTGCGCGACGTGGCCGTTGACCATCTGCAACAGCAACTGAACGCCTTTGT +CGCCCTGCCGCCCAACAGTCCTCAGCGTACCGCCACCGGTGAACAACGCTATAAGCAGCT +TAAGGCATTGCTGATGACTTCCCGCCCGGAAAAGGCCGACGCTGCCTTTTTCAGTACCAC +GCTGATGGCGGACGGTCTGCGCTACGAGAATATCCCGGAAGGTGTGCGGCAGAGCGTGTT +GCCGTCACTGCTGACCTTCTGGATGGCGAACCTGCCGGAACACCCGCAGTGGAAAACCGC +ACCGCCGCCGGAACTGACCGGCGCGGTGCGTAAAATCCTGCTGCGCCAGATTGGTGTGCG +TAATGCTGAAAACACCCTCTACCAGAACGTGCTGCAACAGGTGTCCCGCAACTACGCCGA +TATGACGCTGGCGGACATGACCGGGGATACGCTCACCGAATCTCTTTTCAGTACGGAACA +GACAGTGCCGGGGATGTTCACCCGTCAGGCGTGGGAAGGACAGGTCAGGGAAGCCATCGA +GCAGGTAGTGACGGCGCGGCGCGAGGAAATCGACTGGGTACTCAGCGACCGCCAGCAGGA +TACCTCTGCGGATATCTCGCCGGATACGCTGCGTAACCGTCTCACCTCACGCTACTTTAC +CGACTTTGCCGGAAGCTGGCTGGCGTTTCTCAACAGCATTCGCTGGAAAAAGGAAGACTC +GCTCTCCGGCATTCTCGACCAGCTGACACTGATGGCCGATGCCCGTCAGTCGCCGCTGAT +TGCGCTGACCGATACCCTCGCGTGGCAGGCGGCGGCTGGCAGGGAAAACCGTGGCCTGTC +AGACTCGCTGGCGAAATCGGCACAGGAACTGTTTAACGGCAAGGAGAAAACGCCGCAGCA +ATCCCGTGAAGGCAACGAGCCTGTCGGGCCGCTGGATAAAACCTTCGCGCCGCTGCTGCG +GTTGCTGGGCGATAAAGCCGGAGGCGGAGACAGCCAGCTGAGTCTGCAGACCTACCTTAC +CCGCGTTACCCGCGTGCGCCTCAAACTGCAACAGGTGACCAACGCTCCCGACCCACAGGA 
+GATGACCCAACAACTGGCGCAGACAGTCTTGCAGGGCAAAACCGTTGACCTCACCGACAC +CCGCGACTACGGACGGTTAATCGCCGCCAGTCTGGGCGAGGAATGGAGTGGCTTCGGTCA +GGCGCTGTTCGTCCGCCCGGTGGAACAGTCGTGGCGGCAGGTGCTGACGCCTGCAGCGGA +CAGCCTGAACCGCCAGTGGCACCGGGCGATTGTCAGCCACTGGAATCAGGACTTCGCCGG +GCGCTATCCGTTCAAAGCCTCACAGAATGACGCTTCCCTCCCCCTGCTGGCGCAGTACCT +GCGCGATGACGGGCGCATCAACCAGTTTATTGCCGCCAACCTTTCCGGCGTTCTGAAACG +TGAAGGCCGCTACTGGGTGGCTGACGCCATGAACACGCAGGGGCTGACGGTCAATCCGGA +CTTTATCCGCGCCCTGAACCGCCTGCGCGACGTGGCCGATACCGCCTTTGCCAGCGGCGA +TGCCGGGATACATTTTGAACTGCGGGCAAAACCGGCCCGAGACGTGATGAAAACACATCT +GGTGATTGACGGGCAGGAACTGGAATATTTCAACCAGAAAGAACGCTGGCAGCGTTTTAA +CTGGCCGGATGAACAGTGGCAGCCCGGCGCATCGCTGAGCTGGACCAGTACGCAGGCGAT +GGAGCGCATACTGGCGGATTATCGGGGAAGCTGGAGCCTAATTCGTCTGCTGGAACAGGC +GCAGGTGACACCGGTGGACAGCAGCACCTTTAAAGTGGTGTGGAAAGCGCAGGACGGCCT +GCCACTGAATTACCTGCTGCGGGTTGAACAGGGAAAAGGGCCGCTGGCGCTGCTGGAACT +GAAAAACTTCCGCCTGCCGGGACAGGTATTTCTGACCGGCAGGAGTATGAAGGATGCGGA +AGAATACGGGGAAGACGCCGATGAGTGAGCTGTTGCAAAAGCTGACCCGTAGCTGTTTTG +CCGACCGGGATGCACTGGATGTGGCGCGAACACAGGCGGCACTGTGGCAGACATGGCTGC +TGCCGGTGACGGCAGACACGCCGGTCGGGGAAGACCCCGGCTACCACGACGATTTCCTGC +GTATCCGCGACGAGATGAACAAACTTTCCGGCGCGGATACGGACCTCATCTGCCAGCTTG +CCGAATCCCTGCTGCTGACGCAGGCAAAAGACGTGCGCATCGCCACTTACTACATCTGGG +CGCGACTGCACCGCGACGGTGAGCGCGGACTGGCGGAAGGACTGGCGCTGCTGACCGGAC +TGGTGGAACGCTTCGGTACGCAACTGCTGCCCTCGCGTCCGGCCAGCCGGAAAATGGCGC +TGGAGTGGCTGGCAGGGGAAAAGATGCTCGACAGCCTTGCCCGCTACCCGGAAGTGGCAA +AAGAGGATTTTGCGAACATTGTTGCTGCTCTTAATCAACTGACGGTTTCCTTCGCCGCAT +GGCCCGAAGACCAGCATTCCCCCTCCCTGATGCCGCTGATTAACGCGCTGGAATCACGTC +TGGCGCAGTCGGGTGGGATGAATGCGGTGGTGCCGCAAAACAGCAGCAGCGTTCCTGCAC +CGTCATCCCCGGTGGATGCGCCACAGGTACAGACCATCACCTCCGGGCGCGACCTGCTCG +ACCAGGCGAAAGTGCTGGCCCGTTATCTGAACGAACAGCCGCAGGGCTGGCTTTCAGCAC +ACCGGCTGATGAAAACCCTGCGCTGGGACACGGTGCATGAACTGCCGCCGGATGTGGACG +GCAAAACCCGGCTGGCCCCGCCGCGCACAGAATCGCGCAACCAGCTTAAGCGGCTGTATG +CCCAGCAGAACTGGACGGAACTGCTGGAGCAGGCCGACCTGATGTTCAGCACCGGTGTCA +GCCATTTCTGGCTGGACATTCAGTGGTATCTGCATCAGGCGCTGGCCAAGGCGGGCGCAC 
+CGTGGGACAGGTGGACAGCCGTTATCCGTCAGGACCTGACGTTACTGCTGGAGCGCCTGC +CGGGACTGGAAAATCTGGCATGGAACGACGGCACACCGTTCGCCGACGAGGTGACGCGCA +ACTGGATAGCGCAGCAGGTCATGATGCGGGAAGACGGCGCATGGCTTGCGGGGAAAGCCG +CTGTACCGACAGACGACGCCACAAATGACGTACTGGCGCTGGAGCCGGAAGCACTGGCGA +TGGCAGACAGTCAGGGCGTGGAAGCGGCGCTGGGCTGGATACAGACCCGTCCGGGCATCA +CCACGGCACGACAGCGCCTGTTATTGCGGCTGCTGATGGCACGGGTGGCGGAACAGTACG +GTAAAAACGAGATGGCGCTCCTGCTGCTGGAAGAACTGGATACCGCCGCACAGGGAATAA +CGCTGACGCAGTGGGAGCCAGAACTGCTGTTTGAAGTAAAAGCCCGGCAACTGAAACTGC +TGCGCCTGCGGGCACATCGCCACGCGGACAAGGCGGCGCTTGCCCGGAAAATGGACGCTC +TGCTGGGTTCGCTGGTGGCAATCGATCCGGCGCGGACAGCGGTACTGTGTGATACGCAGC +ATAAGGACTGATTTCTTATTTGTATTTCAGATTAAAGGACTTTGATGGACGACCTGACCC +AACGCTACTTTGAGGCCGAAATGCGCTACCTGCGTGAAGCGGGTAAAGAATTTGCGCAGG +CTTACCCCGACCGCGCTGCGATGCTTAATCTTGATAAACCCGGCGCACGCGATCCCTATG +TGGAGCGCCTGTTCGAAGGCTTCGCCTTTTTAATGGGCCGCCTGCGCGAAAAGCTGGACG +ACGATCTGCCGGAACTGACTGAAGGGCTGGTCAGCCTGCTGTGGCCCCACTACCTGCGAA +CCATCCCGTCACTTTCCGTGGTTGAACTGTCGACAGATCACCGGCAAATGAAGCAGAGCG +AAACGCTGAGCGATTTTCAGGTATTGTCGCGCCCTGTTGGCGAGCGCAGAACCCGCTGTT +TCTACAGCGCCACGCGGGATATCACGCTGCATCCGCTGGCGTTGCCGGACGTGTCATTGC +AATATGAACCGGACGGACGTTCGGTTATCCGTCTGCGCTTTGAATGCGGCCCGCTGGTCG +GCGACTGGTCGCAGATCGATTTATCCCGCCTGCCGCTCTATCTCAATGCCGACAGCCCGG +TAGCCTGTGCGTTGCACCGGGCTTTAACGCTTGGCACGCAGCAGTTCTGGCTGCGTCTGC +CGGGGCAGGATCGCCGGATGCTTGGCGCACACTTTTCCCCGATGGGCTTTGAGGATGATG +ACAGGCTCTGGCCAAAAGGTGAGTCAGCCTTCAGCGGTTACCAGTTGCTGCTGGAGTATT +TCACCTTCCGCGAGAAGTTTATGTTCGTGGCGCTGAACGGGCTGGAGCAGGTTGCATGGC +CGGAGGGGATAACCGGCTTTGAGATTGACGTGGTGCTGAACGAGAACTGGCCTCACGACC +TGCCATTTGACAGCGATAATATCCGTCTGCACTGCGTGCCGGTCATCAACCTGTTCCCGC +TCGAAGCCGATCCGTTACACCTTTCGCCACTGGAAAACGAATTTCTGCTGCGCCCGATGC +GCATTCAGGACGGGCATACCGAGATTTATTCCGTCGACAACATTATTTCTTCGCGCCATA +CCGGCAGTCAGGCATATGTCCCCTTTTCCAGCTTTCGTCACCGGGGCGGGATGCTGCGCC +ACGATGCGCCGGAACGCTATTACCACACGCGGGTAAAGCGCGGCCCTTCCGGCTTGCACG +ACACATGGCTGATTCTGGGCGGCGATGCGTTTGATTCCGACCGGATGCTGGAGGATGAAA +CCCTGTCCTTAAGTCTGACCGGCACCAACGGGCAGCTTCCCCGTAAAGCCTTACAGAGCA 
+CCCTGCTCGATACGCCAGTTCATGCCTCACAGAACGTCCTGCGGGTGCGCAACCTGTGCG +CCCCGACGCAGCCCTGCTATCCCCCGGCGCGTGACCGCTTCCACTGGCGGGTGCTCAGCC +ACCTCGGTTCTAACTTTTTATCGATGATGGATAACGCCGAAATTCTGCGCGGCACGCTGG +CGCTGTACGACTGGACCGAAAGCGAGATGAACCGCCGTCGTCTGGAGGCGATTGTCGACG +TTCAGCACAGCCTGATACAGCGTTTTGAAAGAGGCTTTCTGCTGCGTGGCGTGGATATTC +AGGTGACGCTGGACAGTAACGGCTTTGCCGGAGAAGGTGATATCACGCTGTTTGGTGAAC +TGCTGCACCGCTTCTTCGCACTGTATGCCGATATCCACTTATTCACTCAACTGACCTTAA +TTCTGCAACCCACAGGAAAGTGCCTGCAATGGACAGAGCATCACAGCCAGCGCGTACCGG +GCTGACCGACCGGCTGGCCCCGGATATTGCGCGGATCAATTTTTACCGTTTTTGCCAGTT +GCTGGAACAGAGCCAGCAGAAAGCGCCGCTGGGCAGTACCGACAACCCCGCCGCCGATGC +GGTGCGTTTTCGCCCCCATCCCGGAATGGGCTTTCCGGTCAGCGAGTTAAAGAACGTTGA +ACGTGACGTGGACAATCCCGACGCGCCACCCACGGTGCGCACCACCTTTCTCGGCCTGTA +CGGCGTGGATTCACCGCTGCCCACCGCCTATCTGGACTACATTACCCAGCGTCATGACGG +ACATGACGCAGTGATGGCGTTTCTCGATATTTTTAACCATCGCTTTATCACCCAGTATTA +CCGCATCTGGCGCAAATATAACTACCCGGCGTCGTTTGAAGCAGGTGCCGTGGATGACAT +TTCCCGTTGTCTGCTGGGGTTAATCGGGCTGGGTATTCCCGGCAGCGAGAACCATATCGC +CACGCCTGTATCCCGTTTTCTGGCCCTGCTCAGCGTGATGCGCCTGCCCACCCGCACGGC +TGAAGGCGTCACGGCACTGGTGGGGCTGCTTGCCCCGCTGACGAAAGCCACGGTGGTGCC +TCACGATCCGCAGCCTGTAATTCTCCCGGCCCCTGCGGGTCTGTCAAAAAATTCACGCAT +CAGCCTGAAAACGCGAACGCTGCTGGGGCGTACCGGTACCGACGTCAACAGCCAGTTGCT +GCTGAAACTGTATACCGAAGATGCCGCAGAAGCACGTGGCTGGCTGCCCGGCGGGCAACT +GCACAGCGATTTGCTGGTGCTGCTGCGCGTTTATCTGGGCTGGCGCTGTCAGGCCCGTCT +GCAACTGACGCTGCCCGTCAGCCTGTTGCCTGCTGCCCGGCTGGGAAAACAGCGTGTACA +GATTAGCCGTACCGGCATCCTTCTCGCCTCCTTTGCCGCGCCCGCGACCGGAACAGTGAC +GGTCAGTCTGGGGCGTTATCAGGGATTAATACCCGCTTTTTCCATTCGTAACAGGGAGAG +TATGACTCATGTTTCCTATTCGTTTTAAACGTCCGGCGTTGCTCTGTATGGCGATGCTGA +CGGTTGTTCTGAGTGGCTGCGGGCTGATTCAGAAAGTGGTGGATGAATCGAAAAGCGTGG +CCTCAGCCGTTTTCTACAAACAAATCAAAATACTGCATCTCGATTTCTTCTCCCGCAGCG +CCCTGAATACGGATGCGGAAGATACGCCGCTTTCCACGATGGTGCATGTCTGGCAACTGA +AAACCCGCGAAGATTTTGACAAGGCGGATTACGACACCCTGTTTATGCAGGAAGAGAAGA +CGCTGGAGAAGGACGTACTGGCAAAACACACCGTCTGGGTAAAACCGGAAGGCACGGCAT +CCCTGAATGTGCCGCTGGATAAAGAGACGCAGTTTGTCGCCATTATTGGGCAGTTTTATC 
+ACCCTGATGAAAAAAGCGACAGCTGGCGTCTGGTGATCAAAAGGGACGAACTGGAGGCCG +ACAAGCCGCGCTCGATTGAACTGATGAGAAGCGACCTGCGACTGCTGCCTCTCAAGGATA +AATAACCGATGTCGACACCTTCCTTATATGAAATGCTGACGTTCAGTTTCAGCGGCGAGT +TACCGCTGGAACAGATCAGCGAGCGGGATCAGCTTATCCTTTCCGTGATGGACAATATGC +AACGCATTATCAACTGCCGGGCAGGCACGCTGGCGCATTTGCCGGATTACGGTCTGCCGG +ATCTCAGTCTGATCCATCAGGGGATGGCTGCGGGTATTCATGGCCTGATGCGTCAGATTG +AAGAAACACTGCTGCGTTATGAACCACGCCTGAGTCAGATACAGGTGGAATTACTCCCCC +AGCCCCGTCCGGGGCATCTTAATTACCTGATCCACGCGCAGCTTCCCGATACCGGCTGGA +TACGCTTTGATGGCGTATTTTCTCCGGAAGGACGAATTGTTCTGCGTCATCTCAAACAAC +AGGAGCGGGCGTACTGATGGCAAGTAACGCGAATTTTATCAGCCAGTTCGTCATGGGCGG +CGATCCCTGTACTTATAAGGAATCCGGTGAACTGCAGGCTGAAATGAGTAAACTGACTCA +CCCGGCCCGACCGGATGTGGACTGGCGTCAGGTGGAAAAACTCTGCCTCGCGCTGTTCCG +GCAAAATGGCGTGGAACTACAGACGCTGGTCTGTTACGTACTGGCGATAACCAGACGGCA +GGGGCTGGCAGGGATGGCAGACGGACTCGGTTCACTGGATATACTGCTCCAGCGCTGGGC +TGACTTCTGGCCGGTACAGGTACATTCCAGAATATCACTGCTCAGCTGGGTCACAGAAAA +AATGCAGCAGGCACTGAGAACGCTGGATATTCAGTATCAGGATCTGCCGCAGATTTACCG +TTGTGTACAGCATCTTTCCGCCATCGAAACCACGCTGCAACAGTGTGAACTGTGGCATAT +GACGAAACTGGATCTACTGGCCGGGCAGTTTCGCAATACCGCATTGCGTCTGGAACGGCT +GGCGCCTCAGGGAGCGGAAACCACTATCACTCCCCCTGAATTACCCCGCCGGGAAATGAA +TCAACCGAAAAAGTCAGAGGAAAGTCCACAGCCGGTTTTTGCAACCAGATCCGTTCAGCA +AAACGATAAGGATGCCAGTCCACCCGTTCCATCCCCTGAAATCTCCCGGCAGCGGACATG +GCCGATATTTATGGCCGGAATGGTTGTGATGGCCGGTCTCGGCGGAACAGGATTATGGGG +CTGGTCGCAGCTTAATCAGCCGGACGCGCTAATCCAGCGAATACAACTGTCTGTCATGCC +ATTACCGCAGTCGCTGGAGAGCGGCGAACTGGCAAAGCTGGATGTAAAGGATAAGGCGCT +GCTGGCTCAGGACAGAACAATTGCGGCAAGTCAGATGCAACTGGAGCAGTTAAACAAATT +GCCTGCCCGCTGGCCACTGGAGCAGGGATATCGCCAGCTACGCCAGCTTGATGCCCTGTG +GCCGGATAATCCTCAGGTCAGGGCGCTGAACGCGCAGTGGCGCAAACAGCGGGAGCTGAG +CGCCCTGTCTGCTGAGGCACTGAATGGCTATGCTCAGGCGCAGAGCCAGCTACAGCGCCT +GTCGGCGCAGCTGGATGCACTGGATGAACGTAAGGGGAGATATCTGACCGGTTCGGAACT +AAAAACGGCGGTGTACGGCATCCGGCAGTCGTTAAAGGAGCCGCCGCTGGAAGAACTGCT +TCGGCAACTGGAAGAGCAAAAACAGACCGGAGAGGTTTCGCCAACGCTGTTGACGCAAAT +TGATACCCGGTTAAATCAGTTGTTGAATCGCTATGTCATTTTACTGGATACGAAGGTGGA 
+ACAAAGTCAGTAAACATCGGGGGATTTATGTACCAATAAGGGATATGTGACCTTGCCATT +TTTTAAAATGGAGTCTCTGTGTACAAAAAAAGAGAGGAACAGGCCATTCGATCTACTCGT +TGATTCACATCAGATAATGAGTGTATATTTCGGTAGATAGCTTGGGTTCGGGAACAGTGA +ATACCTTAAGTTTCAAAAGATTGGATTAACCTCTTGACTGTGGCCCCCGCAACCAATTTA +TTAGAATGCTGACAAACCGCAATGTGTTCTACAAATTGCGGTTTTTTTGTATTTAAAATC +TTTGTTCGCTGAACTCACAACACGTTTTTTATCTCCCTTCCTGCGAAGTAATCAATTATC +GACTGGGCAACGTGTATCCCGGTTTGCTGGTATGACTCAACGGTGGCGGCCGCGATATGC +GGCGTTGTAATGATATTTTTGGCATGTAGCAGTGGGCTAAATTGCGCCAACGGTTCAGAG +CTAAACACATCCAGCGCCGCAAACACATTTCGTTCTTCAATCACCTGAAGTAAAGCGCCC +TCATCCAGCAACTTTCCCCTTGCGGCATTGATGATTAGAGCACCATTGCGCATCATCGAC +AAATATTTATGACTAATGAAGTTCTCCAGCTCAGAAGAAAAAGGCAAAAGAACAATGATG +ACATGCGACTGCATAAAGATATCTTCAATTGATACAAACTGAACTCCAGCTTTGTCAGCA +ACCTGATAGTCGGGTTGTTTGTCAAAAGCTAAAAGCTCAACATCAAAACCGGATAACCTT +TTCGCCAGAGTTTTACCTATATTACCGTAGCCAACCAGGCCAATCCGTTTCCCTTGTAAT +TCACAGCCATGCGACTCACCCCAGTAGCCATTTTGCATCGCATGATAGCTGCCAGGGATA +TTTCTCATGCTCGCGAAGATAAGTCCAATGATAAATTCCGCAACCGCATTTGAATTAATC +CCAACCGCATTATTGACAACAATACCGGATTGCTGTGCCGCACGAAGATCAATATTGTCT +ATCCCCGTCCCGAATCTCGATATTATTCTCACACCAGGCAGCAATGATAGCGTGTCCGCC +TGATAACCATCTTTTCCGGCGATGACCGCGCAAATAGATTCTCGTAATGCAGTGGATTCT +GATTTAAGCAGATGCTCCACATTATTCTTAATAATAAGATTAAAATTATTCTCTCTTAGC +AACTTGCTGGCGGAAACACAGCGTGCTGAAAAGCTGGGGACGGTGACCAGAACATTTTTC +ATAGCGGACACTCACTTCAAAGAACGCCACCCCAAAAGATGGCGTGACCGGTTACTGTAT +TTATATTTTGAAATTATGAATTTGCTTTAATGCCGAGTGCACCTCCTGGATGATATAAGC +CGAAATCAGCACGAGTAAATTTTTTCAATTCAGAGAGTGCAAGCGCCACCGCATCACCAA +CAACCAGAACAACAGTCGACGAGCATGACGGTGCTAAACCTAAATTATCCGCCTCACTTT +TGACGGGGATTTCAACAGATAAATCACAACTTATCGCAAGCGATGAGTGATGACTGCGGG +TAAAAGAGATCAAATAATTACCCATTTTTTTCAGACTAGGCAGTGTCGCCAGGATTTCCG +CCGTCTCACCACTGTTTGAAATAAGAATAACAACATCGTCTTTCGCCACCATTCCAAGGT +CGCCGTGTACCGCTTCCGTACCGTGAACAAAAAACGAGGGAGTTCCGGTGCTGGCAAATG +TTGCGGCGAGTTTCCTGGCAATAATACCAGACTTACCAACACCAATAAAAACAACTTTCC +CCTGACAAGATTGTAATACTTTAATTAAATTTGCGACCTCCGAAAGAGGGGAATCAATAA +CTTCTTCAACTGCTTTATGTTCGTTACGCATAAAATGTTTAATGAGATGGATAAGATCCG 
+TGTTATTCATTTTTATTCTCCCTGATTAATATTTTTAATTACACTCACAAGACGCGTAAG +CCCCATATATAATTTTTCTCGACCGCAGGCCAGGTTCAGACGAAGGTAGCCCTCCCCCTC +CGTTCCATAGACATGCCCCGCCATAATGCCCACTTTGCCTTCATGAATTAATCGACTGTA +GAATTCATCAAAAGGATAACCAATAGCAGAACAATCTATCCAGGAAAAATAGCAACCATC +AGCTGGCCTTACGATCAATTCTGGAATATTTTCATTCAGATACTGCTGGGTGAATTGAAT +GTTAGAGGCTATATGTGCCTTTAATGACTTTAACCATCCCTCACATTCGTTGTAGGCAAT +AATAGTTGCAATTATATTCAGTACTGATGGGGAGTTTACAAAATCGCGATACCTCGATAT +CGTTCTGAACTTATGATTAAAATTATCGTCAGTTGAAATCATATACGATCCTGTTAGTGC +AGGAACATTAAATGTTTTCGATATCGAGTTAAATACTACTACTTTTTCTTTTTTTATTTT +AAGCGCGGATGTAAAGCTACGATTAAAAACAAAATCACTATGGATTTCATCTGAACATAA +CCAGACATTATGCCTTGTACAGCTTGCAGCGATTTTATGCAGTTCTTCTTCCGACCAGAC +TGTTCCTGTCGGGTTATGAGGATTACATAATAACATCATCTTTGCGCTTTTAATCTTAAG +ATCAAAATCTTGCCAGTTGATAGCGTAGCCCCCCTCATTTTTTATAATCAAAGAGGCTGT +CAGAATATTTCGCTCGCTATGTTTAATTACATCAAAAAATGCATTATAGACAGGTGTAAA +AACGAGAATATTATCACCATGCGATGTCAATAACTCTATTGCTTTTGCAATAGAGTACAT +CACACTGGGGCTATAGGTTATCCATTCAGGTTTAATATCTGTTTGATATTGTTGATAATA +CCAGTTTACTATCGCATTCAGATATTCACCATGTTGCCAACGACTGTACCCTAAAATCGG +GTGTTCCAGGCGTTTTTTTAATGCTCTGGTGATAGCGTCTGGTATCGGAAGATCCATATC +TGAAATAGAGAATGGTAGTACATCTTTTACACCAAATCTGTCCTCGCAAAAGTCCCATTG +GGTACAATATGTTCCTTTGCGGGAAACAGGAGTATTAAAAACATCCATCAGTATATCCCC +ATATAGTTATCCATATCCCGACGCAGGGCGATGACTTTAGTGCCGATAATGACTTGTAGG +GTATTTTGATCAAGTTTTACAACCGCAATCCCGCCAGCTCTTTTTATTGCAACTTCGTCA +ATCAATCTCATATCTGCGATTGTTAAACGTAAACGAGTTACGCAATTATCCAGTGACTTA +ATATTCTCTTTACCACCAAGTGCCTTAACCATCTGCTCCGCCGCTTGCAGCTCTGATTTA +TCAGGAGTTGGGATATCCGCTATAGCCGTATCTTCGTGAGCGTTCAGCGTAACAGGACTG +GACTCTTCACGGCCTACGGTCATCAGGTTAAATTTAAGGATGGTCCAACGGAACACAAAG +TAATAAATGAAGAAATAGGCCACTTCGACACACACCGCGATCGGCCAACCTGTTCTTGTG +CCACGCAATACGCCAAAGCTAATAAATTGAATCAGATCACCAGTAAATCCCATCTTCACC +CCCATATATGGCAGAACCATGTTAGCGAATCCATTCATAAAGGCATGGAAGACAAACAGC +AGTGGACTGACAAATAAGAACAGAAACTCAATCGGTTCGCTGACGCCGCCAATAATCACC +GTAAGCACCCCGGAAATAAGCAATGCTTTGATAGCCTTTCTGTTTTGAGCATGAGCAGTG +CGATACATCGCCAGCGCGGCACCAGCCAGACCATACTGAATCATCAGTTTGCCCTGCTCC 
+ATTTTCCCCGCCAAATCCAGCGGAATGACCGCATTCTCTTTGACGTATGCCATAAACATG +TTCAGGGTGCCGTAATATTCTTCGCCGCCAATCACAGCCGAACCGCCGATTGGCGTAAAG +CGGAAAACTGACGTCACCAGATGGTTTAAGCCAAAAGGAATCGTCACGCGTTCGGCAACT +GCATAGAAGAAATAACCAACAGGACCGGAAGTTGAAATCCAGTGGCCAATGAGCATGAAA +AGATTGAAAAACGGCGGCCAGATAAAAGGAATGATCAGACCAAATCCACTCATCACAATC +AGTGTAATGATAGGCACCAGACGTGGGCCGCTATAAAAACCTAACGATTCAGGAATGCGT +AAATTAACGATCTTTTTATACATGCTGGCGACTAATAACCCAGCAACAATTCCCCCCAAC +ACGCTGGTATTGTAGGACTGGATCCCCAGAATGATGGTTTGCCCATGTGTCGACATTTGG +TCAGCAACGACCAATAAGTCGTGCTGTTTAAGATAAAAGTTCGTTCCCAAATGCATCGCC +ATAAAACCAATTAAGCCAGAAAAAGCACCATAGGCTTTATCCTCTTTATCTTTTAATAAT +CCTAAGGGAATCGCTATCGCAAACAATACAGGTAAATTAACAAAGGCAAACAAACCAAGA +CTAACAATGAAATCAAGTATGGTTTTAATTATTGGAATAGCCAGAAATGGAATTAACTTT +GCCATATCATCACTGGCTAAACCACTTCCCAGCCCTAGCATCATGCCACATACACTTAGC +AGAGCAATGGGATACATAAATGCCTTCCCCAGGCTCTGAAAAAAACTCCAGGCTTTCTTT +TGTTTCATGTGGGTTATCTCATATAAATGTTATATATAATTAGTCCATTAATACTTTGGT +ACGAATAGAGAGATATAATTTTTCTTCTAAAATTAATTCATATTTAAAAGTGGCATACAG +ATACCGTTCAATTTCATGAATTGCGCGCTGTAACAGGATGTCCTTTTCAAGAAACTGTTC +ATAGATATCACCAATATCTTTCTGTTTTATTTTTTCATTGCATAACACGCGACTTGAAAA +ATATTTAAGGTGCATCATAAATCTGGAATAGTTAAATGAACTTCTGTCCACCTTTCTGTT +ATAAACAACTTCAATAAGCTCCGTGATTATTTGCGACAACTCAATAATCCGTACTGATTC +ATAATCAACTGAATTTTCATAATTATTTAAAATATGCAATGCTATAAAACCAATCTCATC +ATCAGGAAGTTGAACGCTGAATTGCTCATTAATGATAGTTAATGCATCGCGACTTATCGC +ATACTCTGCTTTGTACAACGCTTTGATTTCATCAAGGAAAACATTATTAATTTGTATACC +TGAAACGACTCGGGATATTGCATTCGAAATGTGATCCGCAAGAATCAATAGTAGCGATGG +ATTGAGATTTTTTTCGAGATTTTTCTCCGCATATTGCACTATTTTTTCGGCAACAAACAC +ATACTCAATATCTACATGTTCAATCAATTTATAAAGTTTGTTTTTTTGTTCATTTCTGAC +ATAAAAAATCCGGTTAGCCGGATGCTCAGGGACCGACATTCCATATTTTTTGTTGTAACC +GACGCCAGGCCCAGAAATGATAACCTCCTGTCCATTCATCGATGCCTGTACACAATTATT +GTTCATGACTTTTTCGATGATCATTCCATGGCTCCAAAAAAAAAGGCAAGGCACGTCAGA +AGTAATAACTACTTCAAACATTGCCTTGCCTGATTTAACAGTTACAAGATGATTAACTAA +TGCGTATACATTACACGGAATTGTGCTTAATTAAAGAGATGGTCGGCTTATTTTTCAAGC +CGACATTCAAATATCCGACATCAGTCACAAAACCAGCGTCTAATATTCAGGTAAATGTTA 
+TCTATTCAACGAAATATAAATTCATTGAATAAATAAAAACATTATCCCCTTCTCGCCAGC +GTCGCCCCATCGGCAAAATACGCTTTAATTCCCGCAAGAATAGACTCCGCAACTTCCTGC +TGGAAAGTCGCCGTTTTCAGTTTACGCTCTTCCTCAACGTTACTGATAAACGCCGTTTCG +ACCAGAATGGAGGGAATATCTGGTGCCTTTAGTACGGCAAACCCGGCCTGTTCAACTTGA +TTTTTATGCAGCTTGTTGATTTTACCGAGCTTATTCAGCACCGCTTTACCAAACTTAAGG +CTGTCGGCAATGGTCAGCGACTGCACCATATCGAACATGGTGTGGTCGACATAGCGGTCA +CCGCTTTTGCTTACGCCACCAATCAAGTCCGAGGCGTTCTGGGTTTGTGCCAGATATTTT +GCCGCAGTACTGGTTGCGCCTTTGGTTGAGAGCGCAAACACCGAGGAACCGCTCGGCTGG +CGACTGGTAAAGGCGTCGGCATGGATAGAAACAAACAAGTCAGCGCGCTGTTTCTGGGCT +TTTGCTACGCGCACTTGCAACGGAATGAAGATGTCTTCATTGCGCGTCATGTACACCTTC +ATATTGCCCTCTTTCTCGATCAGAGAGCGCAGACGGCGAGCTATTTGCAATACCACGTCT +TTTTCGCGCGTTTTGTATTTCCCCACCGCACCGGAGTCTTCGCCACCGTGGCCAGGGTCA +AGCATAATGACAATCGGACGATCCCGCCCAGCTTTACCCGGTTGTGGACCACTTTGTGCT +GGCGGCACCTGCTTTTCGAGGTCGCCTTTGTTGTAATCCTCCAGCAGCGCCAGCAGCGGG +TCCTGCATATCCTGTGCATTGGCCGGATAGAGGTCCATCACCAGACGCTCTTTAAACCCG +GCGACCGGCGCAAGGGCAAACAGCTGCGGTTTTACGTTTTGCTTTAATTCAAAAACCATA +CGTACGGTTTGCGGGTCAAATTGCCCGACGCGCGCCGACTTGATGAACGGGTCGTCAGCG +CGGATTTGCGCAGCCATCCCCTTGAGCACCGAGTTCAGGTTTACATCTTCGATATCCACC +ACCACGCGTTCAGGATTACTCAACGCGAACTGCTTATATTTCAGCTGACGATTTGATTCT +ACCGTCACGCGGGTGTAGCTGGACGCAGGCCAGACGCGCACCGCCACGACCTGGCTGACC +GCAGCCAGGCTGACCTGACTTACGCTCAATAGCCACATGGCACCCGCGCCTTGCAGTAAA +CGACGACGGCTGATTGCAGTGTTGGATCCTGACATGCCTCTCCCGAGCAAAAGAAATCTA +AGCTGTGTAACAAGTAAACGACCAATTTGACCGGAAACTTTAGCGAAAGACGCATAATCT +GTCATCTATAAAACGGTAAACATTCTTTTTATATTCACGGTATTACTGATAAAAAACTCG +CTCCCGCATAAAATTTACACTTGCACCCTGCGAAAAAACAGAATAAAAATACAATAATTT +CGAATAATCATGCAAAGAGGTGTACCGTGGTAAAGGAACGTAAAACCGAGCTGGTCGAGG +GATTCCGCCATTCGGTTCCCTATATCAATACCCACCGGGGAAAAACGTTTGTCATCATGC +TCGGCGGTGAAGCCATTGAGCATGAGAATTTCTCCAGTATCGTTAATGATATCGGGTTGT +TGCACAGCCTCGGCATCCGTCTGGTGGTGGTCTATGGCGCACGTCCGCAGATCGACGCAA +ATCTGGCTGCACATCACCACGAACCGCTGTATCACAAGAATATACGTGTGACCGACGCCA +AAACACTGGAACTGGTGAAGCAGGCAGCGGGAACATTGCAACTGGATATTACTGCTCGCC +TGTCGATGAGTCTCAATAACACACCGCTGCAGGGCGCGCATATCAACGTCGTCAGTGGTA 
+ATTTTATTATTGCCCAGCCGCTGGGCGTCGATGACGGCGTGGATTACTGTCATAGCGGGC +GTATCCGGCGGATTGATGAAGACGCGATCCATCGTCAACTGGACAGCGGTGCAATAGTGC +TAATGG +>other_header +GGCCGGTCGCTGTTTCGGTCACTGGCGAGAGCTTTAATCTGACCTCGGAAGAGATTGCCA +CTCAACTGGCCATCAAACTGAAAGCTGAAAAAATGATTGGTTTTTGCTCTTCCCAGGGCG +TCACTAATGACGACGGTGATATTGTCTCCGAACTTTTCCCTAACGAAGCGCAAGCACGGG +TAGAAGCCCAGGAAGAGAAAGGCGATTACAACTCCGGTACGGTGCGCTTTTTGCGTGGCG +CAGTGAAAGCCTGCCGCAGCGGCGTGCGTCGCTGTCATTTAATCAGTTATCAGGAAGATG +GCGCGCTGTTGCAAGAGTTGTTCTCACGCGACGGTATCGGTACGCAGATTGTGATGGAAA +GCGCCGAGCAGATTCGTCGCGCAACAATCAACGATATTGGCGGTATTCTGGAGTTGATTC +GCCCGCTGGAGCAACAAGGTATTCTGGTACGCCGTTCTCGCGAGCAGCTGGAGATGGAAA +TCGACAAATTCACCATTATTCAGCGCGATAACACGACTATTGCCTGCGCCGCGCTCTATC +CGTTCCCGGAAGAGAAGATTGGGGAAATGGCCTGTGTGGCAGTTCACCCGGATTACCGCA +GTTCATCACGGGGCGAGGTTCTGCTGGAACGCATTGCCGCTCAGGCGAAGCAGAGCGGCT +TAAGCAAATTGTTTGTGCTGACCACGCGCAGTATTCACTGGTTCCAGGAACGTGGATTTA +CCCCAGTGGATATTGATTTACTGCCCGAGAGCAAAAAGCAGTTGTACAACTACCAGCGTA +AATCCAAAGTTTTGATGGCGGATTTAGGGTAAGCGATGAAAATCGCCGGATGCGACATGC +GTAACACTCGTGCGTCGCATCAGGCAATTACGTTTATCCCCGTGAACTAAACAACGCCGC +CAGACCACTGCGCCGCTCAGTACGAGTGGCGATTGCCGCACTTAATATGCGCTCATCGGC +ATACAGCGACAGACGGCGACGCGCGCGGGTCACCGCGGTGTAAACCAGCTCTCGCGTTAC +TACCGGCGTGCGTTGACTCGGTAAAATCAACGCCGCATGGTCGAACTCCGATCCCTGCGA +TTTATGTACCGTCATCGCCCACGTCGTTTCGTGCTCTGGCAGGCGACTCGGTTGCACAGA +CTTAATATTGCCGTCCGGCATCGCAAACCAGACGCGCGTCCCCTGCCCGCGATCCAGCGC +AATACCAATATCGCCATTAAACAACCCAAGCGCGCTGTCATTACGGGCAATCATCACTGG +TCGGCCTTCGTACCAACGAGAGTGCGGATGACGATGAATTTTGCGCTTCTGTTGCATAAA +CTGCTCAATTCGCTCATTCAGTCCAGCCACGCCAAACGGCCCTTCCCGCAGGGCGCACAA +AAGCTGGTACTCATTGAACGCCTGAATGATTAAATCCGGCTCGGCACGCGCTTGCAGCAG +ATCCAGATAACGCCCGTAACCCGCAAGAGCTTCCTCAAGCATCGCAATATAATCTTCGCC +ACTCTGTAAAAGCCGTTTTTCGATATCAGTAAAATCCTGCTGAAAAACGGTTTTCACTGC +CGTTTTATCACCACGGTTAATCGCCGCAGCTAACTGACCAATGCCAGAATCGCTGCCGAA +ACGATAGCTTTTTTGCAGCAGGCAGAGGCTGTCGCGCAAAGATGCCGCTTCTGTGCCAGT +TCCTGCCGGAACGTGGCTTCCCGTCAGGCGGCTCAACTGCCCGGCACGCTCGGCGGTAAA 
+GCCCGCGTTGGCATAAGCGCAGATATCGCCCAGCACAGCCCCAGCCTCAACCGAGGCCAG +TTGATCACGATCGCCGAGAAAGATCACTCGCGCATGATCGGGCAAGGCGTCGATCAGTCT +CGACATCATAGGAAGATCGATCATTGACGCTTCATCTACCACCAGCACATCAAGATGCAG +CGGGTTACCGGCATGATGACGTAAACGCTGGCTACCCGGCTGCGCACCCAGCAATCGGTG +CAAAGTGCTGGCATCTTCCGGAATGCGTTTCTTTTGTTCATCGGTCAGCGGTAATTGTCG +CAAAGCCTTGCCGAGAGATTCGGTTAAGCGCGCGGCAGCTTTACCCGTTGGTGCAGCCAG +ACGGATACGGCAGCGTTCGCCGTCGGCCATTTGAATTAACGCTGCCAGTAACTTCGCTAC +GGTGGTCGTTTTACCGGTGCCAGGACCACCGGAAATCACCGAGATCCGCCGTGTCAGCGC +CACTGCCGCCGCAACTTTTTGCCAGTTAATTTCATCGCTTACTGGAAAAAGTTTGTCCAG +GGTTTGCGCCAGTAGAGCTTCATCAACCTCAATGGCATGATTCACTTCGTTGAAAAAGCG +TGCCACTGTGCGCTCGTTACACCACATGCGATTCAAATAAAGACGATCGCCACAGAGGAT +CATCGGCGTTGGTTCATCTCCCCGGCTGACCGCTTGTGAAGCCAGCAAGCATTCTTCCCA +ATTTTGTAGCTCACCGATTTCACTGACACAGGTCGCCAACAGCGGATGCGATGCCTCGTT +ATTTTCCAGTCGTGAAAGCGGCAAACAAACGTGTCCCTCTCCGGCATCATGACTTAATAG +TGCCGCCGCGAGGGTGACGGCAGGATGTTCATCTCCCGCCACGGTCAGGGCAAACTGCAC +GTCCAGCGGGCGTAGCTGTTTGTGCTCCACAGCTTCCAGTAATTGCTTTTGCAATTTCAT +TACGCCTCCTCCAGGGTCATACCGGCAAACATCTCATCCATCAGGTCAATCAACCCGGCG +TTGGGTCGGGTCGCGTAGATCCCTTGTTGCGGATGTTCTTTATCAACGCCACGCAGGAAC +AGATAAATAACGCCGCCAAAGTGGCGCTCATAGTCGTAATCAGCAATACGATGGCGCAGA +TAACGGTGCAGCGCCAGGGTATAAAGCTGATATTGCAGATCATAGCGGTGTGCCTGCATT +GCCGCTGCCATAGCCTGTTGGGTGTAAGCCGAACTGTCTTCACCCAACCAGTTGGATTTA +TAGTCGAGCAGGTAATAACGCCCTTCGTGGCGGAACACCAGATCGATAAAGCCTTTTAAC +ATGCCACGTACCTGCATGAACTCCAGCGGCGGGCAGCCAGCGGATAGCGGGTCAAACTGG +CGAATTAGTGCATCAAGCTGGCTGGCGATGAGCGGTTCGCTAATTGGCAGGTAAAACTCC +ATCTCCACCTGTTTATCGCGATCGGAAAGCTGATTCAGGCTAACACCCGTTTCATTGAGA +GGTGCCTGGAGGACAGCCGTGATCCACTCAGTCAACACCGGTTCCCACTGCGGTTCAAAG +CCACCGAGCTCCAGTTTTTCCTGTACCCAGTTCGGGTCAACCGGCTGGGTAAAATCGAGG +TCTTCAAACAAACTGTGCAAGAATGTCCCCGGTGACGCACCGCGCGGGAACTGATGCGGT +GTTAACGTCGGTTCTTCAACGACGCTGACCACGCCTGCGGCATCAACATCCAGCCGTGGC +ATCAGATCCTGAGCGATACCGTGACCACGCTGCTGCAAACCGGAGTAGCTGGTGACACGC +CAGTTATCGCCGGGCAATCGTTGTAGCGTCCTCGCATTCAGTTCTGCAGTTAATGCATCA +TTAACCTGCCAGGGCTGGTTATCACCAATTTGTGCCGTTTGCCAGGCAATATCATCATCG 
+CACAACGCTTCAATGCAGGTACGAAGCCCTGCCGCATCTTGCGGTTCTCCTTTTTGCAGC +AAACGCCCGAGCGCACTTTGGTGGACGTCGGTATCACCTTTTTTATCGCCACGACGGCGC +ACCAGCGGTGCAACGCCGAGACTGCAATGCCAAACCGAACGCGTCAGCGCCACGTAAAGT +AAACGCAGATCTTCCGCCAGACGTTCGGCCTCCGCGAGGTCGACGCTTTCTGGCGCAGCA +TTAAGATCCAGAACGGCCTCAAACGAGTGGCGATCGTGATAAAACGCCTGATCCTGGACG +CGGAAATTGGTAATAAATGGCAACCAGACCAGCGGATATTCCAGCCCTTTTGATTTGTGT +ATCGTGACAATCTGCACCAGATGTTTATCACTTTCGAGGCGCATTTGTTGGCTGGAGGCA +TTACTGTCTGGCTCGAGGATATGTTGCGATAACCAGCGTACCAGCGCATGTTCACTTTCC +AGCTGCGTTCCGGCTTCTTGTAGCAGTTCGCTGATATGCAAGATATCGGTAAGACGCCGC +TCACCGCCTGCCGTTGCCAGCAAGTTTTCTGCAATGTTACGCGCCGACATCAGCGCCCGC +AGCATCGGCATAACGCCACGTTTGCGCCAGATTTGCCGATAACCATCGAACTCTTCGACG +ACCGCATCCCACGCATGTTCGTCATTATTCAGCGTTTCAATATCCAGCGCATTCAGCCCC +ATCATTGACGTTGCCAGCGCACTGCGCAGGGTGTTCTCACGTTCGGGCGTCATCACCGCC +TGCAACAGCCAAAGCATCTCCTGTGCTTCCAGAGTTTCAAAAACACTGTCGCGGTTCGAA +AGGTAAACGGAAGGGATTTCCAGCAGCGTTAAGGCATCGCGCACCTGAGCGGCCTCCTGG +CGGCTGCGCACCAGCACACTGATGTCCGAAGCACGCACCGGACGCGCATCGTCGCCGTTC +ATCAGCAACGCTTCGCCGCGTTGCCCGGCTTGTAGCCAGTCGCGGATTTGCGCAGCACAT +ACCTGCGCCATGGTACTTTGATAGTCGCCAACGCCGCAGCTTTCGCCTTCCATCAGCCAC +ATTTTCATCGCAGGCTGCGTTTCACCTTTAAATACAAAACGTAACGCCTGATTTTTGCCG +GCAGATTTCACAGGAATAAACGGTATTTCACGAAACATGAACGCGTCATCAGTCTGGCTG +AAAAGTTTGTTAACGCTGTTCACCATTCCCGGTGCGGAACGCCAGTTGGTATCTAAGGTG +TAGTGAGCATGAACTTCGCTACGCGCCTTCATATAAGTGAAGATATCCGCACCCCGGAAT +GCATATATGGCCTGTTTCGGGTCGCCAATCAGCAACAATGCGGTTTCCGGCTGATGGTGC +CAGATACGGCGAAAAATTCGATACTGTTGGGGGTCGGTATCCTGAAATTCATCGATCATT +GCCACCGGGAATCGCGTACGGATCGCCGCTGCCAATACCTCGCCGCTTTCACTACGCAGC +GCGGAATCGAGCCGACTTAACATGTCATCAAAACCCAATTCGCCACGGCGGCGTTTTTCA +CGCGCTACTGTTTCGCGGATCTCAGCCAATGCGCGAGTGATCACCAGATCGCGGATCGAC +AATGGTTCTGCAAGCAGTTGTTCGATCGCCTCAAACAGTGGATGTCGCGGGGTTTCCCCC +CCGGCTTTCGTGCGATCTTCTAAGAAACGCTGAGAGAATTTTTCCAGCGACTCCGGCAAC +TGATAGCTGTTGGTCTCTTCTTCTGCCCAGGCGCTGATCTTCTCGATCCATTTAGCCTGA +TTGCTACGGTTAAACTTGCGTCGATCAATACCAGAAGATTCGATCAGCGCATCCAGTTCA +CCCACTGCGTCGCGCCACTGCTGTTTTACGGCATCAATACGCGCCACAATTTGCGCGTGG 
+CGGGAAGCCAGCGTTTCATCATCGGGGGGCGGTGCTTTGATAACCGGCGCTTCGCCTTGC +AGATAACGATTAATATCGCGCAGCAACGCCTGCGGCCCTTTCCAGGTTTCAAAGACGACC +TGGGCAATTTCACGCGGCAGCGGGTAGCAGTGGCGACGCCAGAAATCGGCGCAGGCCTGG +TAGCGTAGCAGAGACTCATCTTCAATCAGCTGCTGCTCAAACAGCATGCCGGATTCAAAG +GCATTCAGGTTGAGCATGCGCTGGCAAAAGCCGTGAATAGTAAAGACTGCCGCTTCATCC +ATCTGCCGCTCGGCTAACAACAACCACTGCGCGGCTTGCGCTTTATCGTCGATCTCTTCC +AGCAGGCGTTTGTACAGTGGATTGTCGGTGGTTTCACGCAGACAGGCGATGCGCAACTCG +TGGATATTGCTACGGATACGACCACGCAATTCTGCCGTAGCAGCCTCGGTAAAGGTCACC +ACCAGCAGTTCTTCAACGGTCAGCGGGCGGGGAAAGGCGGCAGAACCGCCTAGTCCAAGT +AACAGGCGCAAATAGAGCGCCGCAATCGTAAAGGTTTTGCCTGTGCCGGCAGAGGCTTCA +ATCAGGCGCTCGCCCTGTAAGGGCAAGCGCAAAGGATCTAGTGTCTCGGCGACATCACTC +ATTCTTTTCACTCATCAGGGGCATTGTTTGCTGCAACGCGCTGACGTTCTCCCACACTTT +CCAGCCTTCAGGATGCACATATTCGGCTTTCCCGTTCTGGCTGCCGGAAATCTGCGACAG +AATAGCCATACCTTGCGGCTCGACCACCGCCTGATGGAAGAAATCAGCAAGTTTTTGCGG +CGTCAGCAGTTTTATCTGGGCCACGATTTTATCACGCGAATCGAAGCGCATATTGCCGCG +ATCGAAATCTTTACTTAACTTCGATGCTTCTTCGCCGAGCGTTTGCGGTGCCTGCAGCAT +CTGAGTAATTACCGCCTGCTGGATTTGCGCAAACTCCTCTGGCTTCATCGCCCGCAATTT +TGCCTCTGCGGTTGGGAAAAACGCCTTGTAACGCTCCCACAAGAATGAAGGCTGTTTATC +ATTGCTTTGCAAAAGGAAGCCCATGCCCCACTGACGCCCCACGCTCATTGGAAACGCAAA +CACGGCATAGCCCAACTGTTCTTCGGTACGCAACTGATTGTAGAACCACGGCTGTACGAT +CTGCCCCAACAGAGAGCTATAGGCTGAGCTGGTGTATTCATCGTAGCCAGTCGGTACAAA +TATCGCTGCCAGTGCGGAGTCGGTGCTGTTACCAGCTTTTTCAAAGATGACGGATTGTTT +TTTATCGACCACGACATCTTTGTTACGACACCACTCTGAACCATCAGCGCCCAACTGTTT +TTGCACATGGCGTGCCAGCGTTGTTGCCTGGGCTTCAGTCATGTTGCCGATAACCATAAA +CTCTGGTCTAGCCCCTGATTTTAAGGCGTCGCGATAGGCCAGCACCTCTTTCAACGTAAT +GGAGGGCAAAATTTTGCGCCGTTCATCTCGCGAGAAGTACGGCACTTGCGAGAGCATCTG +CGCGGGCATAATCGCCTGCTCAAACGCTTTGCCCTTTTCTGCGGAATCCATCATCTGGTT +ATACCAGGACTTCGCCTGCTCAAGCTGATCTTCCGTAGCGGTATAGCTAAAGTAGCCCTC +CAGCAGAGCCTGGAACAGCTGCGGCAGGCGCTGAGTGTAACCATTGGCATTAACCATAAG +GCCGTTGTTAGCATTGGTGGAAAAACTTATGCCACCAACCGACGCCTGGTTGCTTAACTG +ATCAAGCGCCAGCCCTGCGAGATAATCATTGAGCGCAAACATCACCTGATTGCGGGCGCT +GTCCATGGCTTTCGGATTACGCAAAATCAGGCTGACATCAGCTTTGGGCTCACTGGCAAA 
+ATAACGGCTTGGCGCATACACCACGCGCAGATTCGACTCATCAACAATCAACTCTGGATG +GTCGTATTTCTTCTCTGACTTAATCAGCGAGAAATCGTCAGGAATATAGGGGTTAAGCTC +CGGTAAGGAGAGCGCAATATTGGCGGCTTTTTTCTGCCAGTCCGCGAAAGTTTGTGCGCT +AATTTTATCGACCTGATACGGCGCATCGACAAAGTAAGCCGTTTTGTTGTGCGGCTCTTT +CGGGCTGATATACCAGATACGCGCATTCTGCGGCGTCATCATCGCCAGACGTTCTTTTAC +TGCTTTAGCATCGTACCGATCGGCAATATTGACTGCATCCAGTGTATGCTCAACAGGAAC +GCGAATCATGGTATCAGCCAGCCATTCGACGTAATCCATATCACGGGTGATTGACGGATA +ACGGAAGTCGATATCCAGCACATTCGCCAGTTCATCGAAGTATTGTTTATCGATCCCTTT +TTCACGTAACAGATTGAGGTAGCTAAAAATGGCCGCCACAACCTGATCGCGATTCGCCAG +ACCTTTATCGGTTAAAGACGCAGAGATCGCTAATACGCCGCTGTTGCCGTTGACGATAGG +ATCGGAATTGGCGCTAATGCCCTCAACTAATCCCTGCTTTTGCAGCCAGTCAGAAAGTGT +ACCAGGGCTGCGATTACCAATCAGATAGGTAATCAATTCATCCGTTTTACTACGGAACTT +CGCTGAATTGTTATCGATGCGAAACTCAACGCGCAGAACTTTACGCGGCAACGCCGGGAC +GTAATGAATGATAATGCCCTTTTGCGCGTCGGTGACTACCGGCACGGTGATTTCCGGTTT +TTTGCTCTCTTTGTTCGGCACGCGACCAAAGGTGTCCGCCGCCATTTTCGCCAACTCCGG +CAACGGTTTATTGCTGTAAATAACCGCCTTCATCAGATTGGCGGAATAGTACTTCTCGTG +GAAATCTTTCAGCGCCTGCTGTACCGGATTACCTGGTTTGTCGCTTAAAGTTTCGAGGTT +ACCACCAGAAAACTTTGAACCGGGGTGTGCCGGGTTAATGGTTTCTGCGCTGACCTGTGC +CATGCGCATCCCGTCACGCGTACGCGCCATGGTTAATTCGGCATTCACTGCATTACGTTC +ACGTTCGGCGTATTTCTTGTCGAGCAAGGGTTCTGCAATAGCATCGGCCAGGCGGTCTAC +CGCACCGGGCAAGGCGTCGTTCTCAACTTCCAGATAGAAAGCCGTGCGATACGGTGCCGT +GCTGGCATTGTGACTGCCGCCGTGCATTTTGAGATATTCGGCCAGACTGTCAGCCTGCGG +ATACTTTTTCGACCCCATCAGACTCATATGTTCAAGGTAATGTGCCAGCCCCTGGTACGC +CTCAGGATCTTCCAGCGACCCAACGGGCACCACCAGCGCCGAGAGCGATTTAACTGCCTG +CGGATCAGAAACCAGTAAGACCACCATACCGTTATCCAGACGTATAGCCTGATACTGGCG +GTTATCTTTATCACTTTTACGGATGGTTTCCTGAATCGGCTGCCATCCCGTTTCTGCCTG +ACTTAAGGGTGCCCAGAGGGCAACAAACAACAATAATGCTTTGAACCAGATGCTGCGGGG +CATTCACGGACCTCATAATCAACTTTATTTTCTGGCCAGATTCAACACGTTAACGCAAAT +CATCTGCCAGAATTTAATCTTGTGCTGCACGAGTCAGCCTATGTCTATATAACCATCAGT +CCGTGACTGGTGCGCATCATAAAGTAAGCGGATAGATTGCGCAATTTTTATACAATACTC +ATGACTGATTAAAGCGAAACAGCGGTAACAGGAAACGTTGCGACTGTTCAACGATAGCCT +CCATTGTCTCTGGTGTTAATTGCCGCCAGAGCCGTTGATACCAGATATCATCACCTTCGC 
+CACGCACCATCATGTTGCCTTCGTAAGCCTGAAGGAATTTCGTACGGGCTTTTTGCAACG +TGGAATCGTCATCCAGCATGGCATCGTTTTGCGCGTCATAACAGGTTTTTAGCCACGCGC +CGCCACTTTCAGGTAACACCAGCAATGGCGCGGACATTCCTTCACGATACCCCTCAATCA +GTTGTGAGAGGTAATGCAAAGCCTGTTCGGCTGCAAGCGGCGGAAAACGCCACTCGCCGT +CTTTGCGTAGAAAAAGGCGACTTTCACCATTACCACCGCTGGCACAGTAGACAAGGTGTT +CCAGCCAAAGTTGCATTCCCTGCGCCACACTTAATAAAGAGGGACACCAGCGCAACAGGC +CATCCGGCTGCACCTGCGGCAACCAGCCAGTTATCTGCACACCGTTGCAGGCGAGATCAA +TCTCCATACTCTGCCCTGGCTGGCGACAGGCAATGACTCTGTCGGCAAGCTGCTGCATCT +CCTGACACTGCGTTTCCCAGAAAATTTCACCAAAGGCACCATACGGCAAATCACCTGCCG +CCCGGAATCGGCGGAACAAGCGTTCGGCATCATCCTGCTCAACCAGTACATTTAATAACT +GCTGGTTGATTTGATAACGACTAAGCCCTTCAAGAATAAAAGGTTCAGTGTCGGGAATTT +CGCTGTCTTCGGTACGGAAGTTCACCTGCAAACGCATCTGGAAAAACGCCCGCACCGGAT +GTGCCCAGAATCGTTGTAGCGTTTCCAGCGGCACGGTTTCCGGTAAGGTAAATGGCAGCG +GCTGAACAAATTCAGAATGTGCTTTACCAGCCTGGCTGGCCGCAGGTAGCCACTCGCGCG +CATAGCTTTGTAAGTTACCGGGCTGGTAGTTTTGCGGGTCAAACGGCATCCGGGTATGGT +GGCAAGTAAGATGCGCTTTTACCCTTGCCTCGCTTTCATCACAGTTAAGCGCTTCATCGC +CCGGTAGATAATGGCTTTGCCCGATGTAGTCGATCAGTTCCTGCACCAGTACCGACGGGA +AACGTTCACTGTTATCCTGAATGGAACGCCCAATATAGCTGATATAGAGTTTTTGCTGCG +CGGAAATTAACGCTTCCAGGAACAGATAGCGGTCGTCATCGCGACGGCTACGGTCGCCAC +GCTTCGGTTTCTGGCTCATCAGATCAAAGCCCAATGGCGCAAGCTGACGTGGATAAACGC +CGTCGTTCATTCCCAGCAGGCAAACCACTTTGAACGGAATTGAACGCATTGGCATCAGAG +TACAAATGTTAACCGGTCCGGCGAGAAAACGCTGGCTGATACGTTCTTGATCCAGGCGCA +GTGCCAGTTCATCACGCAATAGTGACAGCGGCACCGCGTCGCCATACTGCGCGCCTAAAC +CTTCGGAGATAATCGCCTGCCATTGTTGTTCGATCAGCGTCATCGCCGCTTCGGTTTCCG +CATCCGGCAGGAAAAAGGCGTTGAGCATATCGCGACAAACCGGCAACCACTCTTCCAGCG +GACGCTCCTGCGCCAGCCCGCGACGCCAGATATTTAGCTGCATTAGCAGTGAAGCCAGAT +GCCCCACCAGTTCTGCAATTAAGCCGCTCGATTCATCATAAGGTAGAACCGATTGCCACT +CGCCCTGCGCGCTCTCCATCGCGTAGCCCAGCAACATGCGCGTCAGGCCAAACCGCCAGG +TGTGTTGACCGGTAGCGGGAAGTTCCAGCTCGCGAACGTTGTCGTCATCTATCCCCCAAC +GAATGCCGGATTCGTTGACCCACTGACGTAAATAACGCAGCCCTTCTTCGGTGATGTCAA +ACCGCGCTGCCAGCACCGGCACATCCAGTAATGCCAGCACGTCTTCCGACACAAAGCGGC +TGTCTGGCAGCGATAACAGGCTGATAAACGCTTCAAGTACAGGATGCGACTGCCGCGCCC 
+GACGGTCGGAAATGGCGTAAGGCAGGTAACGATCCGCAGGTGCACTACCAAACACAGCCT +GAATAAACGGACTGTAGCTGTCGATATCAGCCACCATCACGATGATGTCGCGCGGAGTAA +GTGTCGGGTCTTCCTCCAGCATCGCCAGCAGGCGATCGTGTAAAACTTCAACTTCACGCT +GCGGGCTATGGCAAACGTGGAAGGTGATACTGCTATCCAGTGGATCAAGCGGGCGTTTGT +TATCGCTACGGGAAAACTCTTCGATGTTCACACCAGCAACGGCGCGGTTTTCCAGTTCCA +GAATGTCAGACTGAATATTATGCAGCAGGTTATCTGGCGTCACATCGACAAAAGCGTCCA +GCTCCTGGCTGCTCTCCAGGTCAGAAAGGAGATAAATGTAGTCGCGCCCAAGCTTGCCCC +ATGAAGCCAGCAGCGGGTTGCCGACATCCTGTTCACCATCGCTGTTAAAGAGCTGCCCGG +CATTTTCGCTGTCGCGAAATAGCGGTAATTCGCGATCTTCAAAACTGTGTCGGCGCTGGC +GAGTCAGTAGTTTCGCCAGATAAGCTGGATCTTTAATGTCGCCCCAGTAATAACGGCAGG +GGTTGGTAAACAGGAGATGGATTTCAATATGTTTACCCAGCGCCTGTAGCGCCTGGAGAT +AAACAGGCGGTAACGCGGAAATACCGCATATAAAGACGCGCGAAGGTAACCCCGGCGGGC +AGGTCGTCGCGGACTCCAGCGTTTCGATAAAGCGCTGATAGAGATTGGCGCGGTGCCAGC +GCGGTTGCCCAAGTTCGTCGGTATATTCCACCAACGCCTTCCACAACGGCGCTTGCCAGG +CCTGTGCTTCTCCCAACCCTTCTACCAGATGTCCTGTTTCCCACTGTGCCAGCCAGTCCG +GACGATAGACCAGATACTGGTCAAACAGGTCCGCCGCTTTTGAAGAAAGCTGGAACAGTT +TTCGCTTGTCACTATCGTCAGTCAGATAATGCCGCAACAGGGTAAAGTCTTCGCGCTCCA +ACAGTTGCGGCAGCAGAGTCATCAGTTTCCAGCTCATGCTCTGTTTGTTAAAGGCGCTCT +CTTTGGGGATCTCCGGTAACACCCGGACGAACATATCCCAGATAAAGCTCGCTGGCAGCG +GAAAATCAATGTTTGCCGCAATACCAAACTTTTGCGACAGGGTCATTTGCAGCCACTGTG +CCATACCGGTACTTTGCACCAGAATCATCTCTGGTTCGAAAGGATCGTCCAGCCGTTCGC +GTTCGACAATAAACTCCATCAACGCTTCCAGCACGTCCAGACGATTGGAATGGTAGACCC +TTAACATAGCGGCTCCTGACTACTGACGATTCGGGCAATGCAGGCGGGTCATCTCGCCTT +CTCTGCCCCCGGGTGAAACTAGCGTAACGCTGATGCTGACACATCCCGCCTGCGATGTCT +GCATTCGGTTGACCTGCCAGTTAGCAGGTGGCGAAATCGCGCGCAGTTGCGTTTGCTGCC +AGCCATGCCGCCAGAGCTGTTGGTACTGGTTTCTGCTGGCAAGACTGTTCATTAATGTTC +GCTGGAAACCCGATAACGCAGTGACAATCATCACCATCAACACCATCGCCAACATTACCT +CCGGCAGACTAAAGCCTTGTTGATTCCTCAGGGAAGCTGACATAACGCCCTCTCTTTCAG +CGGACAAAAATCGCTCCAGCCGCGTGGCGAAAAAACAATGTTTCCATCGATGACTTCGCC +TGTTCGCCACAACGAAACGCCTTCATAACCAGCAATCAATAAGGCTTCATTATCTGCCAG +TAAACGCAGACAAACCCGGGCACCGGTGGCAGCATACAGTAAGCACTGAACTGCGGGCTG +CGTCTGCCAGGAGTGCATTTTTCCCCACTCCAGCGCCGACTGAACGATGGCCTGGCGGCT 
+CAATGACTGACTTTCCATGCTCACGCGAGAAGCAAAACTGCGATCCTGCTGACTCATTCC +TTGCAATAGCAAGCTACCCAAAATCAGCAGCATCAGGACCAGAGCCAGTGACGAAACTCC +CTTTTCGCGGTTCACAGGTTGGCTCCTGTCACGCTATAGCTGGCATCCACCACGGTTTGC +GGATCAGCCTTGCTGGCAGCGTGTATATTAACCGTCAACACCGGCGAGAAGCCGCTGACA +TCCTGACGTACGACCTGAAAAGTGTCGATAATGATGGCATCCGGATTAGTGACTTTATCC +CAGCCCTTACCTTCACAGGATGTCGCACCGCGTAGCGTTTCCAGCACATGCTCCTTCAGA +CGAAATCCAATCTGGTCGGACTCTTTTACCGGTTCGCGATCCCAGATACCGTTACTGTTC +GCATCCCACTGCACAATGACACAGTCACCCTGTCCGACAATTTCCAGCCCTTCGCCCGTA +CAGCTGCCATGGCAATAACCCGCCCTCTGGAGATGCTTCGCGACGGTAAATACCCGCAGC +CAGATTTCATCTTCCAGCGCCAGTTTACGGGTGCTCGTTAAACTTTCACGCTGTAACGCA +GGCAGAAAGCGTGCAGCCCCCAGCAACAATACGCTACTGATCGCCATAGCAATCAACACT +TCCAGCAGAGAAAAACCTTGCTCTTTTACAGGCATCCTTCTGTTTCTCCTTGCTGACAAA +GCCGGAGTCTTCCCCACGGCGAAACCACTAGCCACCACTCGCCCGTTGAGTTTTTGAAGC +GAATATGCCCGGCCCATGCGGTATTGCGCAGGCCAAAGAAAGCAAGCGAAGGTGTCAGGT +CGCTCATTTCGACTTCGGGCCAGCGCGGCACAAAGACCAATGGTGAACTGCCATGACAGG +TATTCGCCCCAGCAACGGAACTGCCATGACAGGTATTCGCCCCAGCAACGGAACTCACAA +GGCACCATAACGTCCCCTCCCTGATAAGACTGATACTGTGGTCGCGGTTATGCCAGTTGG +CATCTTCACGTAAATAGAGCAAATAGTCCCGCGCCTGGCTGGCGGTTTGCCAAAGCCGTT +GCGACTGCTGCCAGTATTGCCAGCCATAGAGCCCACTTGCGCTTAGCATGACCAGAATAA +GCATCGCGACCAGCGTTTCAATCAGCGTATAACCACGTTGTGTTTTCATGCCGGCAGTAT +GGAGCGAGGAGAAAAAAAGACGAGGGCCAGTTTCTATTTCTTCGGCGCATCTTCCGGACT +ATTTACGCCGTTGCAGGACGTTGCAAAATTTCGGGAAGGTGTCTCGAAGAATTTAACGGA +GGGCAAAAAAAACCGACGCACACTGGCGTCGGCTCTGGCAGGATGTTTCGTAATTAGATA +GCCACCGGCGCTTTAATGCCCGGATGTGGATCGTATCCTTCAATCTCAAAGTCTTCGAAA +CGGTAGTCGAAGATGGATTCGGGTTTACGTTTGATAATCAACTTCGGCAGCGGACGCGGT +TCGCGGCTTAATTGCAGATGAGTTTGATCCATATGGTTGCTGTAGAGATGCGTGTCGCCA +CCGGTCCAGACAAAATCACCCACTTCCAGATCGCACTGCTGCGCCATCATATGCACCAGT +AACGCGTAGCTGGCAATGTTGAACGGCAGGCCGAGGAAGACGTCACAGGAGCGCTGATAA +AGCTGGCAAGAGAGTTTGCCGTCTGCCACATAGAACTGGAAGAATGCATGGCACGGTGCC +AGCGCCATTTTATCCAGTTCGCCTACGTTCCACGCTGAAACAATAATGCGGCGGGAATCC +GGGTCGTTTTTCAGCTGGTTCAGTACCGTAGTGATCTGGTCAATATGACGACCATCCGGC +GTTGGCCAGGCGCGCCACTGTTTACCATACACTGGCCCGAGGTCGCCGTTTTCATCGGCC 
+CATTCGTCCCAGATGGTGACATTGTTTTCGTGTAGATAAGCAATGTTAGTGTCGCCCTGC +AGGAACCACAGCAGTTCGTGGATGATGGAACGCAGGTGGCAACGTTTAGTTGTCACCAGC +GGGAATCCATCCTGCAGGTTAAAACGCATCTGATGACCAAAAATGGAAAGCGTTCCGGTT +CCGGTACGGTCGTTTTTCTGTGTGCCTTCGTCGAGCACTTTTTGCATCAGTTCTAAATAC +TGTTTCATGGTTCCTCAGGAAACGTGTTGCTGTGGGCTGCGACGATATGCCCAGACCATC +ATGATCACACCCGCGACAATCATCGGGATGGAAAGAATTTGCCCCATGCTGATGTACTGC +ACCCAGGCACCAGTAAACTGCGCGTCGGGCTGGCGGAAAAACTCAACAATGATGCGAAAC +GCGCCGTAACCAATCAGGAACAAGCCTGAGACAGCTCCCATTGGGCGCGGTTTACGAATA +TACAGGTTGAGGATAATAAACAGCACCACACCTTCCAGCAGCAGCTCGTAAAGCTGTGAT +GGGTGGCGCGGCAGCACACCGTAAGTGTCGAAAATGGATTGCCACTGCGGGTTGGTTTGC +AGCAGCAAAATATCTTCTGTACGGGAGCCAGGGAACAGCATGGCAAACGGGAAGTTCGGG +TCAACGCGGCCCCACAATTCACCGTTAATAAAGTTGCCCAGACGCCCGGCACCAAGACCA +AACGGAATGAGTGGGGCAATAAAATCAGAGACCTGGAAGAAGGAACGTTTAGTACGGCGG +GCGAAGATAATCATCACCACGATAACGCCAATCAGGCCGCCGTGGAAGGACATGCCGCCG +TCCCATACACGGAAAAGATACAGCGGATCGGCCATAAACTGCGGGAAATTGTAGAACAGA +ACATAACCAATACGTCCACCGAGGAAGACGCCGAGGAAGCCCGCATAGAGTAAGTTTTCA +ACTTCATTTTTGGTCCAGCCACTGCCCGGACGATTCGCCCGTCGTGTTGCCAGCCACATT +GCAAAAATGAAACCCACCAGATACATCAGGCCGTACCAGTGAAGCGCCACGGGTCCTATT +GAGAAAATGACCGGATCAAACTCCGGAAAATGCAGATAGCTACTGGTCATCTGTCACCAC +AAGTTCTTGTTATTTCGCTGAAAGAGAACAGCGATTGAAATGCGCGCCGCAGGTTTCAGG +CGCTCCAAAGGTGCGAATAATAGCACAAGGGGACCTGGCTGGTTGCCGGATACCGTTAAA +AGATATGTATATGATCCGCGCTATAACCCCCCGCGAATCAACCCGCCCATGCCGCGACGC +TCCATAAAGGCTGCAACCTGATGGCGAACTTCGGTCGCCAGTTGCGCTTCCAGACTACGC +TGCGCAAGATTTTCTGCTTCAGCAAAATCAATGCGCCGCAGCAGGTATTTTACGCGCGCT +ACAGAACGTCCGTTCATAGACAGATGGCGATACCCAAGCCCAATGAGGATTGCCACGCAC +ATCGGATCGCCCGCCATTTCACCGCACAAACGGAGATCGATTCCATGTATTTCCGCTTCC +CGGGCGATCATCGCCAGAGCTCGTAACATTGCAGGATGAAGACTGTCATAAATGTTCGCC +ACCCGGGTATTGTTGCGATCAACGGCCAGGATGTATTGAGTCAGATCGTTGGTGCCAACA +GAGATGAAATCGACCCGCTTTGCCAGATGCGGCAGCATAAATACCATTGACGGCACTTCC +AGCATGATGCCGATACGTGGTTTGGGAATTTCGTAACCGATCATCTCCTCGACTTCACGT +CCGGCACGTTCAATCAGGCGGCGTGCTTCGTCAACTTCATCGAGGCTTGTGACCATCGGC +AACAGAATATTCAGGTTGCCCGTAGCGGCATTAGCACGCAGCATCGCCCGCACCTGGATC 
+AAGAAGATCTCCGGCTGATCGAGCGTAATGCGAATCCCACGCCAACCCAGGCATGGATTC +TCTTCGCTGATCGGCATGTAAGGCAGCTGCTTATCTGCTCCGACATCCAGCGTACGCAAG +GTGACGGGTTTATCATTAAACATTTGCAGCATCCCCTGATACTGCGCCACCTGTTCTTCT +TCCGACGGAAAACCACTTTGCAGCATGAATGGGATTTCAGTGCGATAAAGTCCTATGCCA +TCAATACGGCTGCCCAGTTTTTCTTCATGTTCCGGGCTTAAACCGGCATTGAGCATGACT +TTAATGCGTTCGCCGCTTTTTAACTGGGCGGGTAAATTGACGTCATCTTCCGCCAGACGG +CTAAGCTCGATCTCTTCACTAATTAGCCGCTGATATTCTTGCAGCAGTACCGGTTCCGGA +TCGACCAGCAATTCACCGCGATAACCATCGACGATCAGCGTCCGACGATGCAGTACCGAA +GGCTGAATATCCGCGCCCATCACGGTAGGTATCCCCAGCGCACGTACCATGATCGCAGCA +TGGGAGTTGGCAGCGCCATCGCGCACGACAACACCGACTAAGCGATCCTGGGGCAGCTCA +GCAAGCGTTGTCGCTGACAGTTCATCTGCCACCAGAATGAAACGTTCCGGCCAGGCGTTC +GGCCCTTGATTAGCGTCATCAAGATGAAACAGCAATCGCTGACCCAGCGCACGTAAATCG +CCAGCCCGCTCTTTGAGATAGTTATCGCTTAGCGCGGCAAACTGTTCGGCAAATTTTTCA +ATGACCGTTTTTACCGCCCACTCTGCCACCGAGCCTTTATCAACCTCGGCAAACAATTCG +CGACGCAGCCGGGTATCCGAAAGCAGGTGTGAGTAAAGATCGAAAATAGCCGCCGTTTCT +TTTTGTGCACCGGCAGCAAAGCGTTTGCTATAGCGGCGAAACTCGTTAGCCGCCTCTTCC +AACGCCCCGGTCAGTCGTTCGCGTTCCAGAGCCGGATCCAGCGTTGATGCCTGATACACC +TGTTCCATTAAAGGTAACGTGGCATCCTGCCAGCCTTCGGCAATCGCCACACCAGGTGCT +GCCGGTAATGCACGGATTCGCGTCTGGCGATATTGCCCAAACAAGGCAGTCAACTGCGAC +TGAGAAAGAATAGCTGCCATCTGGGTGGCAAGCGTCACCAGGAAGGATTCTTCACTTTCG +TCATACTGGCGCAACTCTCGTTGCTGTACCACCAGTACACCAAGCAACTGGCGACGTTGA +ATAATTGGTACGCCTAAAAACGCGCGGAAACGTTCTTCTTTTACGGAGGGGATGTATTTG +AAGCTGGGGTGCTTTTGCGCATCTGCAAGGTTTATCGGTTCCGCCAGCCTGCCAACCAGG +CCGACGATCCCTTCATCAAACGCGAGCGTTACAGTGCGACCGCGTGGTTTTTTCAGTCCC +CGGGTCGCCATCAGGTAGTAACAACGTCGATCATGATCGGCCAGGTAGACCGAACAGACC +TCGGTATCCATCGCAAGACAGATGTCGGTAACCAGAATATTTAACGCCTCATTCAGGCGT +GGTGCGCTGGCTACCTTTTCGACTATTTCGCGCAGGCGAGTGAGCATAATTGGCGTGACT +TAACCTCTTTTACGTCGATAAGCAGATGCGTTTTGTGGTTTTGGCGTATTTTCCTGCAGT +GACATCACCACACTCGCGAACTCTTTCATTACCCTACGGTAGACATCACGTTTAAATGAC +ACCACCTGTCTGACTGGATACCAGTAACTTACCCATCGCCAGCCGTCAAACTCTGGTGTA +CTGCTGGTTTGCATATTGATTTCTGCATCGCCGCTCACCAGCTGCAAGAGAAACCATTTT +TGTTTTTGGCCGATACAAACCGGCTTCGTGTCCCAACGCACCAAACGTTTCGGTAATTTG 
+TAGCGCAACCAGTTACGCGTTGAAGCAAGGATTCGAACGTCTTTGCGGCTTAATCCTACT +TCTTCAAACAATTCACGGTACATCGCCTGCTCTGCGGATTCTCCGGGGTTGATTCCGCCT +TGCGGAAATTGCCAGGAGTGCTGACCAAATCGCCGGGCCCACATTACCTGCCCCTGGCGA +TTACAAATCACGATACCTACGTTTGGGCGGTAGCCATCGTCATCAATCACCGGACTACCT +CAAAATAAAGCTTTATATACGAATGATTGTTTCATACTCCAGGAAGACGGTAAACCACTC +TCTGCAGGGCATTACACACTAATAACAATTGAATAACTCACAGTTATGTGCAGAGTTATA +AACAGAGGAAGGGGTGGATAGCCGTTTTTATTCACCTTTTCTGTGGATAGAGTTGTGAAG +AACTACGGAATTACTGCGGGAAAACCCGGAGCATTCTGAATAAGACAGATATAGAGATTT +TAAAATATTCATTATCAGTCAATGCATTACATGTGATTTGAGTAATAAAAAAGAGTAATT +CGTGACCCAGGTCACACCTCTCATTTACGGGTTGGCGAAAGATCAACCAATGCCGTATTT +ATCCACAGAATGTGCCACTAAGTTAAGCACTGAACCACTAAAAACTGGAGTTTCGTCGCA +CGTCAAGGCTGTAAATGGAAACAGTAGTGGAGGTTTTTCACAGTTATCCCAGCTTTCTGT +GGATAACATGGTGTAAGATCCTGTTTATTTTCAGTGACCAGATTTGGAAAACCCGTTGCA +GTGTTGCGCAACTCGATTACCGGAAACCTAAAAAGCAATATAAATCAGAGAATTGAACAA +CGCATGTGGAAAAAGTTACACTGCGAATATTCGGCACATAATTGCTGTTTGTTTTTTAAC +CAAGGTATCATGACATGTCCCAACCTCGCCCACTGCTCTCTCCTCCCGAAACTGAAGAAC +AATTGTTAGCGCAAGCACAACAACTTTCTGGTTATACATTGGGAGAACTGGCGGCACTTG +CCGGGCTGGTTACGCCGGAGAATTTAAAACGCGATAAGGGCTGGATTGGCGTGTTACTGG +AGATCTGGCTAGGTGCCAGCGCAGGGAGTAAACCTGAGCAAGATTTTGCTGCTCTGGGCG +TGGAACTTAAAACTATCCCTGTGGATAGTCTTGGTCGTCCGCTGGAAACAACATTCGTTT +GTGTTGCCCCGTTAACGGGCAATAGCGGGGTGACCTGGGAAACCAGCCACGTGCGCCACA +AGCTCAAACGCGTGCTGTGGATACCGGTTGAAGGCGAGCGCAGCATCCCGCTGGCAAAGC +GTCGCGTAGGATCACCGTTGCTGTGGAGCCCGAATGAAGAGGAAGACCGGCAGTTACGCG +AAGACTGGGAAGAATTAATGGATATGATTGTTCTCGGTCAGGTTGAGCGGATCACCGCTC +GGCACGGGGAATATTTACAGATACGACCGAAAGCAGCGAATGCGAAAGCGCTGACCGAAG +CTATTGGTGCCCGGGGCGAACGGATTCTGACGCTGCCGCGCGGATTTTATTTGAAGAAGA +ATTTCACCAGTGCGCTACTGGCCCGTCATTTTCTGATCCAGTAGCCATCGCTTTGACCTG +CCGCTTTCCGGGCATATAATTACCGCTTCATTTTTTTGGCAGGGCTTTTTAGATGTTATT +TGCATGGATAACCGATCCTAACGCCTGGCTTGCGCTCGGTACACTGACGCTGCTGGAGAT +CGTTCTTGGGATCGACAATATTATTTTCCTTTCTCTGGTGGTGGCAAAGCTTCCCACAGC +ACAACGTGCTCATGCGCGCCGTCTGGGGTTGGCGGGAGCCATGGTTATGCGTCTGGCGCT +GCTGGCATCCATCGCCTGGGTTACGCGCCTGACGAATCCGCTTTTTACAATATTCAGTCA 
+GGAAATTTCCGCCCGTGATTTGATTCTGCTTCTGGGTGGCTTGTTCCTTATCTGGAAAGC +CAGCAAGGAAATCCACGAATCCATCGAAGGTGAAGAAGAAGGGCTGAAAACACGCGTTTC +ATCATTCCTCGGCGCTATCGTGCAGATTATGCTGCTGGATATTATCTTCAGCCTCGACTC +GGTGATTACCGCTGTGGGTCTGTCAGATCACCTGTTTATTATGATGGCAGCCGTGGTAAT +TGCCGTAGGCGTGATGATGTTCGCTGCGCGTTCGATTGGTGATTTTGTCGAGCGCCATCC +TTCGGTAAAAATGCTGGCGCTCTCTTTCCTGATTCTGGTGGGCTTTACCCTGATTCTGGA +AAGTTTCGACATCCACGTACCGAAAGGTTACATCTACTTCGCGATGTTCTTCTCTATTGC +GGTTGAAAGCCTCAACCTGATTCGCAACAAAAAGAATCCGCTCTGATACTCCGTACGCTC +TCCTGCGGGAGGGCGTACTCACTCCTGTTACCCTCACAGTTTAAGATTTTCCTGCTTTCA +AGATATATAACGTCGGTTTATAAACAGACTATTATCATAGGTGGGCCAAATGAGGATAAC +CGGATGAAAAAATGGGCAGTAATAATTTCTGCAGTCGGACTGGCGTTTGCTGTTTCCGGG +TGTTCCAGTGATTACGTCATGGCGACCAAAGATGGCCGTATGATTTTGACCGATGGAAAA +CCTGAAATTGATGATGATACCGGGCTGGTGAGTTATCACGATCAGCAAGGTAACGCGATG +CAAATTAACCGTGATGATGTTTCGCAAATTATTGAACGTTAACAAATAAGGTCAGCATCC +GGCTGGCCTTAAGATTTTTCTCTTTCCCTTTTCCCTTCCCTCTGCCATTTTTATATTCCT +TATGTCGTGATTATAAAAAGGAAACGGCTATGCAATATCACCGTATACCCCACAGTTCGC +TGGAAGTCAGCACGCTGGGGCTTGGCACGATGACGTTTGGTGAACAGAACAGCGAAGCCG +ACGCCCACGCACAACTCGACTATGCCGTCGCTCAGGGCATTAACCTTATCGACGTTGCCG +AAATGTACCCAGTACCTCCGCGCCCCGAAACTCAAGGGCTAACCGAAACCTACGTCGGCA +ACTGGCTGGCGAAACATGGCAGCCGCGAAAAGTTAATTATCGCCTCCAAAGTGAGCGGAC +CGTCGCGCAATAATGACAAAGGCATCCGCCCGGATCAGGCGCTGGATCGGAAGAATATCC +GCGAAGCGCTGCATGACAGCCTCAAGCGTCTGCAGACTGATTACCTCGATCTTTATCAGG +TGCACTGGCCGCAGCGCCCAACCAACTGCTTCGGCAAACTCGGTTATAGCTGGACAGATT +CTGCGCCTGCGGTTTCGCTGCTGGATACACTGGACGCACTGGCAGAGTACCAACGCGCGG +GAAAAATTCGTTATATCGGCGTGTCGAACGAAACTGCATTTGGCGTAATGCGCTACCTGC +ATCTGGCGGACAAACACGATCTGCCGCGTATTGTCACCATTCAGAACCCCTACAGTCTGT +TAAACCGCAGTTTTGAAGTAGGTCTGGCAGAAGTCAGCCAGTATGAAGGGGTCGAACTGC +TGGCCTATTCGTGCCTGGGTTTCGGCACGCTGACCGGGAAATATCTCAACGGTGCAAAAC +CCGCTGGCGCACGTAATACGCTCTTTAGTCGGTTCACCCGCTATAGCGGTGAGCAAACGC +AAAAAGCCGTCGCGGCGTATGTTGATATAGCCAGACGTCATGGCCTGGATCCTGCACAGA +TGGCGCTCGCTTTTGTACGCCGTCAACCGTTTGTTGCCAGCACTCTGCTGGGCGCAACCA +CGATGGAGCAGCTGAAAACTAACGTCGAAAGTTTGCATCTGGAGTTAAGCGAAGACGTGT 
+TGGCAGAAATTGAAGCGGTGCATCAGGTTTACACTTATCCGGCACCATAAGATTAACGCC +GGTTAAAACCGGCGTTAAATATTAATGACGGCGCTGCCAGATCCACAGCGCCGTTATTGC +CAGCGCAAACAGCGCACCGAAGCCAATGCCAATGGGCACGACCGGGATGCCTACCATTAC +CGCCAGCGAGTAAATGCCCAGCATCAACAACATGGCGCTGTTTTCGCCAAGGTTTTGTAC +TGCAATCGCATTCCCCGCCCCGACGCTTTTTTTGCCCCGCTCCTGTAGCAACGCATTGAG +CGGAACGACAAAAAAGCCCCCCAGCACGCCAATCAGCATCAACAAAGCATAGGCTGGCAG +CAGCTCGTGTTGCAGGGAGAAAATCAGTACCACCACGCCAATCAAAATCCCGGCTGGCAT +ACAGCGTGACACGGTTTCCAGCGTAACTAACTTCGCTGCCGCACCTGCACCAACCACGAT +ACCAATCGCTACCATCGCGTTGAGATAGGTCGGCGTAGCGTTATCGGTAATACCCAGCGC +CACCGGTACCCACAGCACCAACAGGAAACGCAGCGTGACACCCGCTCCCCAGAATAAACT +GGTGCCCACCAGCGAAAAACGCGTTTCACCATTGCGCCATAGCGAGGTGCAGGCATTCAG +GAAACTGCGGGTCATGCTGATGAGATTCCAGGACTGCCCCGGACGCGCCGCCGCCAGTTT +GGGAATGTAGATATTGGCAACGACCGCGCCACCGTAGGCCAGTGCGCATGCGACCAGGGC +AACCAGAATATGCCAGTCAGCCAGAACACCACCAGCTACGGAACCGAGCAAAATCGCCGC +TATGGTAGACGCTTCCATTAAACCGTTAGCTTTTACTAACTTACTACCCGTGGTTAATTC +GCCGAGAATACCGTATTTCGCCGGTGAATAGGCTGCAGCACCAACACCCACCAACGTATA +GCCGAGAAACGGATTGATACCAAAGCAGATACTGGCTGCGCCCAGTAGCTTCAGGCCGTT +GGCAAACATCATCACCCGGCCTTTGGCGAAGCTATCCGCCACCTGCCCGACAAACGGCGC +AAAAAGAATGTAAGCACCTACAAACACCATTTGCAGGATGGGCTGGCTCCACTCCGGATA +GAACTGCGCTTTCAGTAACGCCAGAGTGGCAAACAGTAGCGCATTATCGCCAAACGCAGA +GAGAAACTGCGCCACGATAACCGCTTTCATCCCCTTCGACCACAACGAAGTGTTAGTGTG +CACTGACTCACTCATCGTGTTGTTCCGCTTCGTCTACCCAGCTTTTCAAAGTGACAAAGT +CAGGTTTGCCGCTGCCAAGTAATGGCATCTGTTTCAGATAGCGAATATCGCGCGGTACAG +CAAGCTCCGGCACGCCGTGCTCGCGGGCATACTGTTGTAACTTATCGCGCGTCAGTTCGT +TATCTGTGGTGAAAAGCACCAGTGCCTCGCCTTTGCTGGCATCGCTCTTAATCGCAGTGG +CATGGACTTTATCTGGCGAAACACCAAGTGCCAGTTGTTCCACCATTTCCAGCGACACCA +TTTCGCCTGCAATTTTGGCAAAGCGTTTTGCGCGGCCCTGAATCTGCACAAAGCCCTGCT +CGTCAAAACGCACAATATCGCCAGTGTCATACCAGTCGCGCTCCATTTCGCCGCGAATAT +TCTCGGCGGTGGGCACTTCCAGTACACCAGGCTTCTCCACCCGCAGATAGCCGTTCATTA +TGTTCGGCCCTTTCAGTTGCAGGCGTCCGCCCTCTTCGATACCAGGAACCGACAACAGGC +GCGCATCCATTCCTGGTAGAATACGCCCTACCGTACCGGGTTTCGCCGCCATCGGTACGT +TGATAGAAACGACAGGCGCGCATTCGGTCACACCGTAGCCTTCAAGGATGCGCAGGCCAA 
+ATTTATCCTGCCAAAGCTGTTTAGTACTTTCTTGTAGTTTTTCTGCGCCTGCCACCACAT +AGCGTAGACGATAGAAGTCATACGGGTTGGCGAAACGCGCGTAGTGACCGAGGAAAGTGG +AGGTACCGAACAACACGGTGCAACTGCGGTCATACACCAACTCCGGCACAATACGGTAGT +GCAGCGGGCTTGGATAAAGGAACACTTCTGCACCTGTGAGCAGTGGCGTAAACAGGCCTA +CCGTCAGCCCAAAGGAGTGAAACAGCGGTAACGCCGACATAAAGCGATCGTTGGTGGTGA +AGTCGGCAATCGTTTTAATCTGCTCGACATTCGCCAGAATGCTTTTATGGCTATGGACGA +CGCCTTTCGGATGGCCTTCAGAACCGGAGGTAAAAAGGATCAGCGCCTCTTCTTCCGGCT +GCTGTTTAACCTGTGCCAGACGCGGCATCAGCAAATGAGCGAAGATCCATACTTTGTCGG +CAGTGGTGACATCTGCTTTTAAATCTTCCAGATAGACCCAGCGCACCTGAGTAAGTTGCT +CCGGCAGATGCCAGAGTTTGCCTTTATCGAGAAACTGACGGGAAGTGAAAATGGTTTTGA +TTTCAGCCGCCGTAATAGCACTGGTCAACCCTTTTACCCCGGCGGTGTAGTTCATCATTG +CGGGAATGCGGCGACGGGCGATGGCCCCAAAAATCACTGCAGCACTGATGCCTGCATTGG +GCAGCATTAAGCCGATGCGTTCGCCTTCAACACTGTATTTTTCAAGGATGCGTCCAACAA +ACAGCGTTTTCGTAAGCAATTTGCGATAGGAGTCCGGGGTAAAGTTAACGTCTTCGACAC +ATTTCTTCCCGGCTCCGAAGCGGTACATTGCGCTCAGTAAAGATTCGTACAGCGTTTCAC +GCGGGCGCACCGCCATACGCGCTTCCATCATTATTTGATGCAGCATTTCGCCAGCGATTT +TGCGACGGTCACGGGCACGCGGCGCATCCGGCATCTCCACCTGCGTTGGTGGCAAAATAT +GCAGAGTAATTTGCGGGAACAAGCGACGTTTAACCAGACCTTTCAGGCGGCTGAAGTGCG +TAAGTTCCGCCCCTTCAATACGCACAGGAATAACCGTTGCACCAGACTTCGCCGCGACAA +ATCCCGCGCCATCGTAGATTTTCATCAGCGAGCCAGTGGTGGTGATGCGTCCTTCAGGGA +AAATCACCACTGGTCGGCCCTGTTCCACCAGACGTACCAGATGTTTAATCGCCATAGGTT +GCGTCGGGTCGAGAGGAACAAAGTCGATAAATGATTTCAGCCAACGCATATACCACTGTT +GGCTTATTGAGGTGTAAACGGCAAATACCGGACGTACGGGTAAAAACAATGCCAGCAGTA +TGCCATCAATAAAAGAGACGTGATTAGGCGTAATTAGAACGCGCTCGCCCTTCAGTGCCT +TGGTGTCACCCGTAACGCGAACGCGATACAAAACACGGCACAAATTTCGAAAAAAGCTAA +AAAGCATTCCAACTCCCTTTGCTCTGATTCAGTAAAAGCGAATGGAGGGAGATTACACGA +GATAAAGAACGCGAGCGACAGTAAATTAGGTGCGAAAAAAAACCTGCGCATCCGCGCAGG +TTGGTGCAAGAGACTGGGTACGAAGAGCGTACCGAATAATCTCACCAATCAATACCTCTG +GGATCTTGATTGTGGTCTGCACAACGACTCTTCGCCAGCGAGAAAACGCAAAGGAATGAA +GGGAAATGCAACGAGGTGTGTAAATTGTCGGTTACTGTTACAGATTGATGACCGGCAAAA +AAAAACCTGCGCATCTGCGCAGGCTGGTGTAATTCATGTGCTCAACCCGAAGTTGACTTC +ACCTATCAATACCTCTGGGATCACCACTTTAGCAACCTGAAGCCAAACGCCACCAGCGGT 
+CAATCGCAACAGCGTTTCGCAAAGTGTAACCAAAGGTTTGCAATCTCTTTTTTTGTCTTA +CTTATTTGCGTTTGGCTCACATTCCCACAATGAAAACACGCCGCCCCTTGAACCAACGGG +CGTTTTCCGTAACACTGAAAGAATGTAAGCGTTTACCCACTAAGGTATTTTCATGGCGAC +CATAAAGGATGTAGCCCGACTGGCAGGCGTTTCAGTCGCCACCGTTTCCCGCGTCATTAA +TAATTCACCCAAAGCCAGCGAAGCTTCCCGGCTTGCTGTGCATAGTGCAATGGAGTCTCT +TAGCTATCACCCGAACGCCAACGCCCGTGCTCTGGCGCAGCAGACCACTGAAACGATCGG +TCTGGTCGTTGGTGATGTTTCCGATCCGTTTTTCGGCGCAATGGTGAAAGCGGTCGAACA +GGTGGCTTATCACACTGGTAATTTTTTATTGATTGGCAACGGTTACCACAACGAACAAAA +AGAGCGTCAGGCCATTGAGCAACTGATCCGCCATCGCTGTGCTGCGCTGGTTGTCCATGC +CAAAATGATCCCGGATGCCGATTTAGCCTCATTAATGAAACAAATGCCCGGTATGGTGCT +GATCAACCGTATCCTGCCTGGCTTTGAAAACCGTTGTATTGCTCTGGACGATCGTTACGG +TGCCTGGCTGGCAACGCGTCATTTAATTCAGCAAGGTCATACCCGCATTGGTTATCTGTG +CTCTAACCACTCTATTTCTGACGCCGAAGATCGTCTGCAAGGGTATTACGATGCCCTTGC +TGAAAGTGGTATTCCGGCCAATGACCGGCTGGTGACATTTGGCGAACCAGACGAAAGCGG +CGGCGAACAGGCAATGACCGAGCTTTTGGGACGAGGCAGAAATTTCACTGCGGTAGCCTG +TTATAACGATTCAATGGCGGCGGGCGCGATGGGCGTGCTCAATGATAATGGTATTGATGT +ACCGGGTGAGATTTCGTTAATTGGCTTTGATGATGTGCTGGTGTCACGCTATGTGCGTCC +GCGCCTGACCACCGTGCGTTACCCAATCGTGACGATGGCGACGCAGGCTGCCGAACTGGC +TTTGGCGCTGGCGGATAATCGCCCTCTCCCGGAAATCACTAATGTCTTTAGTCCGACGCT +GGTACGTCGCCATTCAGTGTCAACTCCGTCGCTGGAGGCAAGTCATCATGCAACCAGCGA +CTAACCGCAGTTAAAGCAATTCCAGCGCCAGTAATTCTTCAATGGTCTGGCGACGGCGAA +TCAACCGCGCCTGACCATTATCAAACAGAACTTCTGGTAACAGCGGACGGCTGTTGTAGT +TGGATGACATTGATGCGCCATATGCCCCTGTATCATGCAGTACCAGATAATCACACGCCT +TCACTTCCGGCAAGGCGCGGGTTTCAACATTTCCCCCTTCCTGCTGGGTAAAGACATCGC +CCGATTCACATAACGGCCCGGCGACGACGGTTTCCACCGTTGGTGCGTGTTCCAGAGAAC +GACCATCAGCTGCCAGGGCACTGATATGGTGGTAACTACCGTACATTGCCGGGCGCATCA +GATCGTTGAACCCGGCATCAACCAGCACAAAGTGGCGGCTACCCATTTGTTTGACGCTCC +GCACTTGAGTAATTAATACGCCAGCCTGCGCTACCAGAAAGCGACCCGGTTCAATTTCCA +GTTTCACAGGATGGCCCAAATGGCGGGCGATTTGCTCACGCGCGGCATTCCACAGACCAT +AATAATGTTCGGTATCAACCGCCTCTTCACCCTGTTGATAAGGAATAGAAAGCCCACCGC +CCGCAGAAATAGCCTGTAAATCCTGACCGAATTCGAGGACCTGACGCACCATAGCACCAC +ATACCTGTTCCAGATGGGCATAATCGACGCCAGAACCAATGTGCATGTGAATGCCGACCA 
+GCTGTAGATGATGACGTTGTATCACGTCCAGTGCGGCGGGCAGATCGGTGTACCAGATAC +CGTGCTTGCTGTTTTCGCCACCGGTATTGGTTTTTTGGCTATGCCCGTGACCAAACCCCG +GATTAACACGCAGCCATACCCGATGCCCTGGCGAAACCTGACCCAGTTGGTCGAGCATAT +CAACAGAACCCGCATTCACCGGAATTTGCAATTCACTGACGCGTTCAAGCGTCGCCTGAT +CGATAACATCTGCCGTAAAAACAATATCATCGGGGTGCGTTTGCGGATTGTAACCCGCCG +CCAGTGCACGCTCTATTTCGCCTAACGAGACGGAATCCACTTTTACGCCCTGCTCACGCA +TTAAGCGCAAAATATGAATATTGGAACAGGCTTTCTGTGCAAAGCGCACCACATCAAACT +GTTTCAGCGCTGCAATCTGCCGACGAATAATTTGCGCATCGTAGACCCACACCGGGCAGC +CAAATTCTGCGGGCAAACGCAGCAGATTTTCGGCGGTGAGATCGGTATCAGTGCTGAACA +GTGAATGTGGCATAACAAACTCCAGATAAGTGCTTTTTTATGATTACGCCACATCATAAA +AAGAATAAAAAATATCGATTTATGTCGAGTCTATGCAAAAATGATATGGATTACCGGATT +GCGAGAGAGCGCTAATGGCCGCCGTTAACTTACGTCATATTGAAATTTTTCATGCGGTAA +TGACCGCCGGAAGCCTGACTGAGGCGGCACACCTGCTACACACCTCACAGCCAACCGTCA +GCCGCGAACTGGCGCGCTTTGAGAAGGTGATCGGGCTGAAATTGTTTGAGCGCATACGTG +GACGATTACATCCTACCGTGCAAGGACTGCGTCTGTTTGAAGAAGTGCAACGATCCTGGT +ACGGACTGGATCGCATTGTCAGTGCCGCAGAAAGTCTGCGCGAGTTTCGCCAGGGAGAAC +TGTCTATTGCCTGCCTGCCGGTCTTTTCGCAATCTTTTTTACCGCAGCTCCTGCAACCCT +TTCTGGCACGTTATCCCGATGTCAGCTTAAATATCGTGCCCCAGGAATCACCGCTACTTG +AAGAGTGGCTCTCGGCCCAGCGTCATGATTTAGGACTCACTGAAACGCTCCATACGCCTG +CGGGAACAGAACGTACCGAATTACTCTCTTTAGATGAAGTGTGTGTGTTACCTCCGGGCC +ATCCGCTGGCGGTAAAAAAGGTATTAACGCCGGATGATTTTCACGGTGAGAACTACATCA +GCCTTTCCCGTACTGACAGCTATCGCCAGTTGCTGGATCAATTGTTTACTGAGAATCAGG +TTAAACGACGCATGATCGTAGAAACCCACAGCGCCGCGTCAGTCTGCGCAATGGTACGGG +CGGGGGTAGGCGTTTCGGTGGTTAACCCGCTCACCGCACTGGATTATGCGGCAAGCGGTT +TAGTGGTGCGGCGGTTCAGCATTGCGGTTCCATTCACCGTCAGCCTGATCCGCCCCCTGC +ACCGCCCGTCATCAGCGCTGGTGCAGGCGTTTAGTGAGCATTTACAAGCGGGATTACCGA +AACTGGTCACTTCTCTTGACACTATTTTGTCGTCAGCTACGACAGCATAAAAGCGACAGC +ATCCTCGGCATGGATCGCCGCGGTATCAAACACAGGCAGAACACTGCGCTCTTCTGGCAC +CAGTAAACCAATTTCTGTGCAGCCAAAAATGACGCCCTGTGCGCCCTGTTCTGCAAGGCG +AGCAATCACTTGCGCATAATAAGCGCGTGACGCTTCGGTAAATTGCCCCAGACACAGTTC +TTCAAAAATAATCTGATTAATTTTCGCCCGTTCATCCGCTTCAGGAATAAGACAGTTGAT +GGAAAATTGTTCCGTCAGCCGCCCGCGATAAAAATCCTGTTCCATGGTGTAACGTGTACC 
+CAGCAGCGCCACACGAGTCATTCCTGCCCCGGTAATTGCACGTCCAGTGGCATCCGCTAT +GTGTAAGAAAGGCAGAGAGCAACGAGACTCAATGGCATCCGCCACTTTGTGCATCGTATT +GGTGCATAACACAATACCTTCTGCGCCCGCCCGCTGTAAGCCAAGCGCCGCCTCAGCCAG +AATATCCCCGGTTTTGTCCCACTCACCGCGACGCTGGCACTCTTCTATTTCATGAAAATC +GACGCTATGTAGCAGCACTTGCGCAGAGTGAAGCCCACCAAGCCGCTGTTTAATGCCTTC +ATTTATCAGACGATAGTAAGGAATAGTGGATTCCCAGCTCATTCCTCCCAGCAAACCAAT +TGTTTTCATTCCTCTCTCCTGATGTGTGTTACCGCAACAAGGCTGAATAAGGAACGAGAC +AAACGCCTCAACGGCCAGGTGCCCAATCTCTATTAACGAAAAAAGGGCCGGATGTACAGC +ACATCCGGCCCGTGAAATCAGACGCCGATATTTCTCAACTTTTCGCCTGCCATCAGTTTG +CGCTCGATATGTTCCAGCGTGACATTTTTGGTTTCCGGAATGAGCCAGAAAGTGATGCCC +ACAAACGCAATGTTCAGCGCAGTGTAGAGCCAGAACGTACCGGCAGCGCCAATGCTATCA +AGCAGTGTCAGGAAGGTCGCGCCGATAATCATATTCGACACCCAGTTTGTCGTCGTTGAG +CAGGTGATGCCAAAATCGCGGCATTTCAGCGGCTGAATTTCAGAGCACAAGATCCACACC +ACTGGCGCGGCGCTCATCGCATAACCGGCAATACACATCATCGTCATGCCAACAGAGAGC +CAGGACAAGCCACTGGAAGCCGTACCGTTATCAAACTGCATCAGGCAGTAACCCAGCACC +AGAGTGCCTAACGCCATCACGCTGAAACCAATTTTCAGAGCCGGCTTACGCCCTGCTTTA +TCTACCGTAAAGACCGCAATGAAGGTAGCGAACATAAAGGTCAGCCCCACGACCAGAGTC +GCAATCATCTGTTGTTCTGTGGTCGTAAAGCCCGCCATTTTGAAGATACGTGGCGCGTAG +TACATGATGATGTTCATACCGGTAAACTGCTGCATCGCCTGCAACAACATACCGAGAAAT +ACAGCACGACGGACGTTACGGTTGATCTTAAACAGTGCCCAACCGCCCTGTTTTAACTTC +AGGCTTTCACGAATTTCGTTGAGTTCTTCTCGCGCTTTTTCCGACGTATCGCGCAGCATA +CGCAACACTTCTTCCGCCTCAATATGACGCCCCTTTTCCGCCAGCCAGCGCGGGCTATTT +GGCAGGAAGACCACCAGAATAATCAGCAGGACTGCTGGTAAAGCAAGAACCCCCAACATT +GCGCGCCAGTTACCGCTATAACTGAACGCTGTATCGGATAAAAACGCCAGCACGATGCCG +AGTGTGACCATCAACTGGTACATGCTGATCATCTTACCGCGAACGTTTTCACTTGCCATT +TCAGAAAGATATAGAGGAGCGGTGTAAGACGCGATCCCAACAGCAATGCCCAACACCACA +CGAGCGGCGATTAACATCTCTACGCTGGTCGCAAAAGCGGACCCTATCGAACCGAGTACA +AACAGGATGGCCCCCGCCATCAGGCTGTATTTACGCCCCAGGCGGAACGACAGCCACCCA +TTAAACAGCGCACCAATTGCTGCGCCGAGCATCATGCTACTGACCACCCATTCCTGCAAA +CGGCTGGTCAGCACAAAGTGATCGGTAATGAACGGCAACGCTCCGGCGATTACGCCGATA +TCAAGACCAAATAACAATCCTGCGACCGCAGCAGCTACCGAAACAAACATATTCATACGC +CGCGTATCCCGCAGAGGACGTGGCGTTAAAGCAGATTCCGTATTGATAGTAACCATTTTT 
+TCCTGCCAGCAGAGAGTAAGACATAGTGAAAAAATACGTGAACAATTCACACAGGTGTCA +GGTCGGAAATAGCATAAATATGGATTAAATTGCTACGACATGTCGTTATGTGATGGATAT +TCCAATTTTCAAATTAAGTTGAATTATTGAGATTATTATTAACTACCTAATTTTAAAGCA +GATAAAATTCATAAAGTTCATTAATTGATAATTGATATGGATTATTTCATAACCATGATA +TGGATTATGATGATCTACAGGTATAAAAAACCCTGCCATGCGGCAGGGTCATAAAAGTAA +GAGGAATGAATTAACGCGCCAGCCAACCGCCATCCACAGCAATGGTATAACCATTTACAT +AATCTGAAGCGCTGGAGGCAAGAAACACTACCGGCCCCATCAGGTCACTCGGCAGTCCCC +AACGGCCAGCTGGAATGCGGTCGAGAATTTCCGCGCTACGTTGTTCATCTGCCCGCAGTT +GTTGAGTATTGTTGGTCGCCATGTAACCCGGAGCTATCGCATTAACATTAATGTTGTGTT +TAGCCCATTCGTTCGCCATCAATCGCGTCACACCCATCACGCCGCTTTTTGATGCGGTAT +AAGAAGGCACACGGATCCCGCCCTGGAAGGAGAGCATTGACGCGATATTGATAATCTTGC +CGCCATTGCCTTGCGCGATAAAGTGTTTCGCCGCTGCCTGAGACATGAAGAATACGCTCT +TGATATTCAGGTTCATGACATCGTCCCAGTCTGTTTCGCTGAACTCGAGAGCGTCTTCGC +GGCGAATCAATCCGGCGTTATTCACCAGGATATCAATATGACCAAACTCCGCTACCGCGC +GATCCAGCAGTCCAGGAATGCCATCAATCTTTCGCAGATCGGCGGTCAGGCTTAAAAAAC +GACGCCCCTGCGCCGTGACCTGCTTGATGGTTTCAGTCGGTTCAACGATGTTAATGCCAA +CAATGTCACAGCCCGCTTGCGCCAGCCCCAACGCCATCCCCTGGCCCAGCCCAGTATCAC +AACCAGTGACGACCGCAACTTTACCTTCGAGAGAAAATGCATTTAAAATCATAACAATAC +CTTATTCGTTTATGCCCACAACTAGCGCAAATCTTTAACGGCCACATGGTCCATATCATC +AAAAACCTGGTTTTCACCGACCATGCCCCAGATAAAGGTATAAGCTTTGGTTCCGACGCC +GGAATGGATCGACCAGCTCGGGGAGATCACCGCCTGCTCGTTATGCATCACAATGTGACG +CGTTTCTTGCGGTTGCCCCATCATGTGGAAAACGCAGGCGTCATCATCCATATTGAAATA +GAAATAAACTTCCATCCGGCGCTCGTGGGTGTGACACGGCATGGTGTTCCACAAGTTACC +TGGAGCCAGCTCCGTCAGCCCCATACTCAATTGGCAGGTTTCCAGCACATCCGGGACAAA +ATATTTGTTAATCGTGCGACGGTTACTGGTGAGGTTATCGCCTAACGTGACTGGAGATAC +TTCGTCCGGTGTGACTTTTTTGGTGGGATACGTCGTATGCGCGGGTGCGCAATTGTAATA +AAACTTCGCCGGAGTGGCGGTATCAATACTGGCAAAGACAACTTCTTTTGCACCTTTACC +AACATACAGGGCGTCGCGGTGACCGATTTCATAGCATTGACCATCGACAGTAATCGTACC +GGCACCGCCAATATTGATAACACCTAACTCGCGACGTTCAAGGAAATAGCTTACGCCGAG +TTGTTTACCAACTTCCCCGCCAACGGAAACCGTTTTAGTTACCGGCATAATGCCGCCAAC +AATAATACGGTCAATGTGGCTGTAAACCATGGTGTACTCATCGGCGACAAATACCTTTTC +AACCAAAAATTCATTGCGCAGCCCCTGGGTATCCAGCGTTTTTGCGTGCGCACTGTGGAT 
+GCTCTGTCTTACGTCCACATCAACCTCCGATAATCAGTGAAGCGTGAAAATAGAAAACAA +TAATAAAACACTGTTTCGTTTTCTCTATGAGGGGATGATATGCCCATGGGATAGGGTTTT +CAATTAAAAATAAAACAATGTTTCATTTTCAAGTTAAGGATTAAAAAAAGTGCAGTGTCG +ATCACGAATATGTCATGAGAATGGAAAAATCAGGGAGCCCTGAAAAGGTATGTCGACTCA +CCAGCCATCATTATTCAACAGATTAATGACGGCAGATATTTATCGGTAAGGAGGAAATGC +AGAGCTACTCGTCACGTTCAATGGTCAATGCCACACCCTGGCCCCCGCCGATACAAAGCG +TTGCCAGTCCTTTGCGGGCATTACGTTTCACCATTTCATGAACAAGAGAAACCAGGATTC +GGCAACCGGAAGCGCCTATCGGATGACCGAGTGCGATCGCACCACCATTGACATTGACCC +GACGCTCATCCCATTCAAGCATCTTGCCAACCGAAAGCGCCTGTGCAGCAAACGCTTCAT +TAGCCTCGATAAGATCGACATCAGCCAACTGCCAGCCAACACGCTCCAGGCAACGGCGGG +TCGCATACACCGGCGCAATTCCCATCAATGCCGGATCCACACCAACGCTGGCAAATGCGC +GGATGCGGGCCAGCACGGGTAAATTCAACGCTCGTGCTTTGGCTTCGCTCATCATCATTA +CTGCAGCTGCCCCATAGTTTATGGATGATGCATTACCCGCTGTCACAGAACCGAGACTAT +CAAATGAAGGATTTAAACGGGCTAAGGCTTCTGCGCTGGTGTCAGTGCGTGGCTGTTCAT +CGGTATCAACAACCAACGTCTGACCGTTACTTTGGGTTATTACCGGGACGATCTCATCTT +TAAATCGTCCGGCGTCAATCGCCGCTCGCGCTTTTTGTTGCGAGCTAAGTGCGTAAGCAT +CCTGCAACTGACGGCTGATGCCATATTCGCGAGCCAGATTTTCGGCGGTGACACCAATAT +GATAATCATTGAAGGCATCCCACAACCCATCATGCACAAGACTATCAACCAACTGGCTAT +TGCCAAGCTGTGCGCCGGTGCGGCTATCAGTCAGAACATGTGGTGCGCGGCTCATGTTTT +CCTGGCCACCGGCGATGACAATATCAGCCTCGCCACACTGTATCGCCTGAGTAGCCAGAT +GCAGTGCTTTAAGCCCGGAACCACAAACGTCATTAATAGTGATTGCAGAAACGCTATTAG +GAAGACCACCTTTAATAGCCGATTGCCTTGCCGGATTCTGCCCTGCCCCTGCAGTCAACA +CCTGACCAAGAATCACTTCATCCACCGCATATGCAGGAACGCCGGTACGTTCTATTAACG +CTTTGACGACCAGGCTGCCAAGTTCCACGGCGGAATGACCCGCTAACGCACCACGAAAGC +AGCCGATAGGTGTCCGTAACGCCCCGACAATCACAACGTCTTTCATCACAACCTCGCACC +AATTAACAGTGCAATAGTAAATGATTGTTAATTACAGTTATCTTAATTGTTTAAAAAAGG +TGATTTTTATCACAAAGGAAATACGCCTGAGTAGCAGTCAGAGACATAACTGGCACGTAA +GGTTTGCAACCACTAACCCACCAATAGAGAGGTAGATAGGGCGTTAATCTCCCATACTTA +ACCTGGTTTATGGTAAATTGCCCTCCATTTTGTTTAATTTGTAGATGATACGTTCAGATA +ATGTCTAATATTTGGTCAAAAGAAGAAACTCTGTGGAGTTTCGCGCTCTACGGCACAGCC +GTTGGTGCAGGCACGCTCTTCCTTCCTATTCAGTTAGGTTCGGCGGGGGCTGTGGTCCTG +TTTATTACTGCTCTGGTCGCCTGGCCTTTAACATATTGGCCACATAAAGCCTTATGCCAG 
+TTCATCCTCTCATCGAAAACATCAGCAGGTGAAGGGATAACGGGCGCGGTAACACACTAC +TATGGCAAGAAGATTGGTAATCTGATTACCACGCTGTACTTCATCGCCTTTTTTGTCGTC +GTGTTGATATATGCAGTGGCAATTACCAACTCACTTACAGAACAGCTGGCAAAGCATATG +GTTATTGATCTTCGCATCCGTATGTTGGTGAGTCTGGGGGTTGTATTAATCCTGAATCTC +ATTTTTCTGATGGGACGCCATGCCACTATTCGGGTAATGGGATTTTTGGTATTCCCATTG +ATTGCCTATTTCTTATTTCTTTCTATTTACCTGGTCGGTAGTTGGCAACCTGATCTATTA +ACAACCCAGGTAGAGTTCAATCAGAATACCCTTCACCAGATATGGATATCGATTCCCGTG +ATGGTTTTCGCTTTTAGCCATACGCCCATTATTTCTACGTTTGCCATAGACAGACGTGAA +AAATATGGCGAACACGCTATGGATAAATGCAAAAAAATTATGAAAGTCGCTTATCTCATC +ATCTGCATAAGTGTATTGTTCTTTGTCTTTAGCTGCCTGCTTTCTATTCCACCTTCGTAT +ATTGAAGCGGCTAAAGAAGAAGGGGTTACCATTTTATCGGCGCTTTCTATGCTGCCGAAC +GCCCCAGCATGGTTGTCAATTTCCGGGATTATTGTCGCAGTAGTTGCGATGTCGAAATCA +TTCCTGGGTACGTACTTTGGCGTTATTGAAGGTGCCACAGAGGTCGTCAAAACAACATTA +CAGCAGGTTGGTGTAAAGAAAAGTCGTGCATTTAACCGCGCACTATCAATTATGTTGGTA +TCGCTGATTACCTTCATTGTTTGTTGCATTAACCCGAACGCGATTTCGATGATTTACGCG +ATCAGCGGCCCGCTCATTGCCATGATACTTTTCATCATGCCTACGCTGTCAACGTATCTC +ATCCCGGCGCTTAAACCCTGGCGTTCCATCGGAAATCTGATTACCCTGATCGTGGGTATC +CTGTGCGTATCGGTAATGTTCTTTAGCTAATATCCGTTGTGGATGGTTCAAAATTGCTTC +AATTTTGAACCATCCCAGTTTTCATAATGTTCATTTGTTATTATTCCGCCCTATCACTTC +TCTCGTAATATTATATAATTATCAGCTAGTTAAACACACAAAGAGTTCTGAACATCTTAA +ATAAGACTATTTAAGATACATGACGATTGCATTGCGTAAACGCTTTTTATTTACAAAAAA +TGGGGAAGTATTACGGCGATTGCGAAAAGTCTGAAGCGCTTGAATTAAGATAATATAGAA +AATCAGATACAACAAAAATGGCAGGTAGATGATGTGAAGATAAATTGGAGCGGGCGAAGG +GAATCGAACCCTCGTATAGAGCTTGGGAAGCTCTCGTTCTACCATTGAACTACGCCCGCT +TCGAGATGCGTAAGGCATTATAAACCTTACGCTCTCCTTAGCAAGTACCACGCTGCTGAC +TGCTGATTAATTCACCATCAGCATTTTGGCTTGCTGCCCTGAGGCGGCAAGTAACGTAGC +GGATCAATTGCCGTTGCACGGTAACGAATCTGGAAATGCAGGCGAACAGATGCCGCATCA +GTGCTCCCCATGGTGGCGATTTTTTGCCCAGCTTTCACGCTTTGCCCATTATTTACCAGC +ATCGTGTCATTATGAGCGTAAGCCGTAATGTAATCTTCACTGTGTTTAATCATGATGAGA +TTACCGTAGCCACGCAGCTGGTTGCCCACATACACCACCTTTCCTGCACCCGCGGCGTAA +ATAGGTGTACCCCGTGGAGCTGAGATATCAATTCCTTTATTGCCGCCATCTGCTGTCGAA +TACGGCATGATAACTTTCCCTGTCGTTGGCCATAACCAACAACGTTGCCCTACTGGCGGC 
+CAGGAAGATTTCGGTACCGCTGATGACGGTGTAACCGATGCGGTTTTGGTCGTTGATTTG +GCGGTTGATTTACGTGTACTACTGCTACTTTTCGCCCCACCCAGTTTTAGTTTCTGACCT +ACTTCAATGGTGTAAGGGGGGGAAATGCCGTTCAGTCGCGCCAGTTCTTTTACGCTGGTT +CCCGTGGTGCGCGAAATACGATATAGCGTATCCCCCCGTTTCACGGTGTAAACGGAGCCG +GAATACGTTCCTGTATCGGATGATTTGCTACCCGAACAGCCCGCCAAAAGCAGTCCAACC +GATAACAACATCACGATACCCAGAGATTTTTTATTCAGGCGTCCCGCACTCAAAATCTTT +CCTCGCTTAAAAAACAAGACGCCATATCATAGCAGCCGGCTTCTGGATACCCAATCTCTT +GCTTCTGGAAAAGCGATGTAATAGAGAAAGAGGTTAATTTCATTTGGCAAAGGGAAGTAT +CATCAGCAAAATATTTGCTGTAGTGGTATCGAAGTTCCTGACTTTTACCCTATTTCCCAC +CTTGATGCGTAATAATCCTAATTTATCACATTGATTTTATCGCCACTCATATTGATACGT +ATCACTGTCCCTATTCAGAGTCCTGTTTCGTATCATATCTGTGTTTTTTTAACGTCATCA +CACTTCCTTCCTCCCCTCACGCATATAGTCGTTTCTGGCGTAATTCTTGCCTGCTAAGAC +TAAATCTTTGCCATAAGAACCAAATGTTCAAACCGAGGGGATTTCTATGGAAGCGCGGGA +AGCAACCGCTACGGGTGAATCATGCATGCGCGTCGATGCCATTGCTAAGGTCACCGGGCG +GGCACGATATACTGACGATTATGTTATGGCGGGCATGTGTTACGCGAAATATGTACGTAG +CCCTATCGCACATGGTTATGCTGTAAGTATTAATGATGAACAAGCCAGGAGTTTGCCGGG +CGTCCTGGCGATTTTTACCTGGGAAGATGTGCCAGAAATCCCATTCGCCACGGCAGGGCA +TGCCTGGACACTTGACGAAAACAAGCGCGATACCGCCGATCGCGCACTGCTAACTCGCCA +TGTTCGTCATCATGGCGACGCCGTTGCCATCGTCGTGGCCCGCGATGAACTCACGGCAGA +AAAAGCGGCGCAATTGGTCAGCATTGAGTGGCAAGAATTACCCGTTATCACCTCGCCAGA +AGCGGCGCTGGCAGAAGACGCTGCACCAATCCATAACGGTGGCAATTTACTGAAACAAAG +CACGATGTCGACGGGTAATGTCCAACAAACAATCGATGCCGCCGACTACCAGGTACAGGG +GCACTATCAGACTCCCGTTATTCAACATTGTCATATGGAAAGCGTGACATCGCTGGCATG +GATGGAGGATGACTCGCGAATTACCATCGTTTCCAGCACCCAGATCCCGCACATTGTTCG +CCGCGTGGTTGGTCAGGCGCTGGATATTCCCTGGTCATGCGTACGAGTCATCAAACCGTT +TATCGGTGGCGGTTTTGGTAATAAACAGGATGTACTGGAAGAGCCAATGGCGGCATTCCT +GACCAGCAAACTTGGCGGCATTCCGGTGAAAGTTTCCCTTAGCCGTGAAGAGTGTTTCCT +CGCAACCCGTACCCGCCACGCTTTTACTATTGACGGGCAAATGGGCGTGAACCGCGACGG +AACATTGAAAGGTTATAGTCTGGATGTTCTGTCTAACACCGGCGCTTATGCATCTCACGG +GCACTCCATTGCTTCTGCTGGGGGGAATAAAGTCGCTTACCTTTATCCTCGTTGTGCCTA +CGCTTACAGTTCAAAGACCTGCTATACCAACCTCCCCTCGGCTGGTGCGATGCGTGGTTA +TGGCGCGCCACAAGTCGTATTTGCCGTTGAGTCTATGCTTGATGATGCCGCGACAGCGTT 
+AGGTATTGATCCTGTTGAAATTCGTTTACGCAACGCCGCCCGCGAAGGAGATGCTAATCC +GCTCACGGGAAAACGTATTTACAGCGCAGGGTTGCCGGAGTGTCTTGAAAAAGGCCGGAA +AATCTTTGAATGGGAAAAACGCCGTGCAGAGTGCCAGAACCAGCAAGGCAATTTACGTCG +TGGCGTTGGCGTCGCCTGTTTTAGCTACACCTCTAACACCTGGCCTGTCGGCGTAGAAAT +AGCAGGCGCGCGCCTGTTGATGAATCAGGATGGAACCATCAACGTGCAAAGCGGCGCGAC +GGAAATCGGTCAGGGTGCCGACACCGTCTTCTCGCAAATGGTGGCAGAAACCGTGGGGGT +TCCGGTCAGCGACGTTCGCGTTATTTCAACACAAGATACCGATGTTACGCCGTTCGATCC +CGGCGCATTTGCCTCACGCCAGAGCTATGTTGCCGCGCCTGCGCTGCGCAGTGCGGCACT +GTTATTAAAAGAGAAAATCATCGCTCACGCCGCAGTCATGCTACATCAGTCAGCGATGAA +TCTGACCCTGATAAAAGGCCATATCGTGCTGATTGAACGACCGGAAGAACCGTTAATGTC +GTTAAAAGATTTGGCGATGGACGCTTTCTACCACCCTGAACGCGGCGGGCAGCTCTCTGC +TGAAAGCTCCATCAAAACCACCACTAACCCACCGGCGTTCGGCTGTACATTTGTTGATCT +GACGGTCGATATTGCACTGTGCAAAGTCACCATCAACCGCATCCTCAACGTTCATGATTC +GGGGCATATTCTAAATCCGCTGCTGGCAGAAGGTCAGGTACACGGCGGAATGGGAATGGG +CATTGGCTGGGCGCTATTTGAAGAGATGATCATCGATGCGAAAAGCGGCGTGGTCCGTAA +CCCCAATCTGCTGGATTACAAAATGCCGACCATGCCGGATCTGCCACAACTGGAAAGCGC +GTTCGTCGAAATCAATGAGCCGCAATCCGCATACGGACATAAGTCACTGGGTGAGCCACC +AATAATTCCTGTTGCCGCTGCTATTCGTAACGCGGTGAAGATGGCTACCGGTGTTGCAAT +CAATACACTGCCGCTGACGCCAAAACGGTTATATGAAGAGTTCCATCTGGCAGGATTGAT +TTGAGGATAACATCATGTTTGATTTTGCTTCTTACCATCGCGCAGCAACCCTTGCCGATG +CCATCACCCTGCTGGCTGACAATCCGCAGGCCAAATTGCTTGCCGGTGGCACTGACGTAC +TGATACAGCTTCACCATCACAATGACCGCTATCGCCATATTGTTGATATCCACAATCTGG +CAGAGCTTCAGGGAATAACACAGGCGGAAGATGGCGCGCTGCGAATCGGCTCCGCGACAA +CATTTACTCAGCTCATTGAAGATCCCGTAATCCAACGCAATCTCCCGGCGTTATGTGCTG +CGGCTGCATCAATCGCCGGGCCGCAGATCCGTAATGTCGCCACCTACGGCGGAAATATTT +GCAACGGTGCCACCAGCGCAGATTCTGCCACGCCAACGCTAATTTATGACGCGAAACTGG +AGCTCCACTCCCCACGCGGTGTTCGTTTCGTCCCGATTAATGGCTTTCACACCGGGCCGG +GCAAAGTGTCTCTTGAGCATGACGAAATCCTTGTCGCCTTTCATTTTCCGCCACAGCCGA +AAGAACACGCGGGCAGCGCACATTTTAAATATGCCATGCGCGACGCAATGGATATTTCAA +CAATTGGCTGCGCCGCACATTGCCGACTGGATAACGGCAATTTCAGCGAATTACGCCTGG +CATTTGGTGTTGCCGCGCCAACGCCGATTCGCTGCCAACATGCCGAACAGACTGCACAAA +ATGCGCCATTAAACCTGCAAACGCTGGAAGCCATCAGCGAATCAGTCCTGCAAGATGTCG 
+CCCCGCGTTCTTCATGGCGGGCCAGTAAAGAGTTTCGTCTGCATCTCATCCAGACGATGA +CCAAAAAAGTGATTAGCGAAGCCGTCGCCGCGGCGGGGGGAAAATTGCAATGAATCACAG +CGAAACAATTACCATCGAATGCACCATTAACGGGATGCCTTTTCAGCTTCACGCCGCGCC +AGGAATGCCGCTTTCGGAACTACTCCGAGAACAAGGGCTTCTTAGTGTCAAACAAGGTTG +CTGCGTAGGCGAATGCGGTGCCTGTACGGTGCTGGTCGACGGCACTGCGATAGACAGTTG +CTTATTCCTTGCGGCCTGGGCTGAAGGAAAAGAGATCCGCACGCTGGAAGGTGAAGCGAA +AGGCGGTAAACTTTCTCATGTCCAACTGGCTTATGCGAAATCTGGTGCAGTGCAATGCGG +GTTTTGTACGCCGGGCCTGATTATGGCTACCACGGCAATGCTGGCGAAACCACGCGAGAA +GCCATTAACCATTACGGAAATTCGTCGTGGACTGGCGGGAAATCTTTGTCGCTGCACAGG +GTATCAGATGATTGTAAATACAGTTCTGGATTGCGAGAAAACGAAGTAAAAGGATATCCG +GCCTGAATTCAGGCCGGATTCTCAGAGGTTATGTGTTTAACAACTCATATTTCTTAATCT +TGCGATAGAGCGTAGCAATGCCGATGCCCAGTTCATCAGCAACTTCCTTCTTGCTGTTAT +GACGTGAAAGCGCCTCGCGGATCATTTGCTTTTCCATCTCCTCCAGCGCCGTGCCGCCCG +CATCATCGAGTGACAGGTGCGCCTCACTGACCTCTGTTACATCACTTTGCTCCGTTGTGC +CATTATTCAGCAGATTTGGCGGCAATAGCGTGCTGTCGATAACTTCACCTGAAGGAACAA +CGTTAACCAGATATTCCATCAAATTGCTTAACTCGCGCAGGTTTCCGGGCCAACGATGCT +TACGCAATATTTCGACGACATCAGGAGCAATGCCAGGATAAACCGATCCCAGACGACGGG +TATGCAGATGTAAAAAGTAATGCACCAGTAATTCAATATCTTCCTGACGTTCACGCAGCG +GTGGAAGAGTTATCGGGATAACATTAAGTCGGTAGAAGAGATCTTCGCGGAATTTACCTT +CGGCAATGAACTGGGCCAAATTCTGATTAGTTGCAGAAATGATGCGGATGTCGACTTGTA +TTGGGCTACTGGCACCAATCGGCAGAATTTCACGCGCCTCAATAGCGCGCAGTAATTTAG +CCTGCAACATTAATGGCATATCACCAATTTCATCGAGAAACAGCGTGCCCGTATTCGCCG +CCTGAATCAACCCTGTTTTACCGTTGGCAGAAGCGCCAGTAAATGCGCCTTTAACATAAC +CGAACAGTTCGCTCTCCAGAAGCTGTTCCGGAATCGCAGCACAGTTGATAGCAATAAAGG +GTTTATTCCGTCTTCCGCTCAACTTATGGATTGCACGGGCGACGACTTCTTTACCCGTGC +CGCTTTCACCAACCACCATAACGCTGGATGGGCTGGGTGCAATACGGCTAATGAGTCGTT +TTAATTGCCGCATAACACGGCACTCGCCAACCAATTGTTCAATATGCGGTTCATCAGGTG +CATTTGCTACAGAAAAACTGGTATGCGATTGGTGAAACGCCATTAAAAATAGTTGTCGGC +CCTGGATGTTATGCAACTGACCAATGATTAATTCACTTTTATCATCCCACGAAACAATAT +GTTGCATATGACCATGGGTAAAATTACTCTCAAATGTTAATGGTCTGAAACGAACAGGTT +TTCCAATAATATTATTTTGTACAACACCGAGTGTTTTTAAAGCTGTCTGATTAACAAACT +GAACCCGATTATCAGCATCAACCACTAACACGCCCTGATCCATATTATCGATCATGGTCG 
+CGAATATTTTACTGATGTTATCTCCTGGTCCCTGATCCTCCAGAAGTTTAGAAACAAAAA +TGGTGGATATATGGCGAACGTAATCGGAAAATTCGCGTAAATTATCACTGATATGTTCTT +GTTGCTCGTGGGTAACGGCAATCAAACTTATCACCCCAACACAACGATCCTGTAAAATGA +CAGGCGTACCCAGAAATGCTTTTTCGCGGCAATTTTCTTTACTATCGCAACCTTCACAAA +GGGGATCGAAGCGAGACTGTGTCACAACTTTTTCAGTTTTCGTTTCCAGGACGTGGCGGA +GCAGGCGTGAGTTGCCGCTCAACTGGCGGCCAAGAAACTTCCCATACGCGCCCGTTCCGG +CGACGCGACACAAGTTTTCATCAACGATCTCAACCTCAAGCTGCAAAACGCTGGCAAGCA +TTCTGGCAAAACGCTGAATTGTCGGTTGAATTTGCATCAATACTGACTGCGTAGTCGCAA +GCTCCATAGCTTTACCTTCCAGACTTACTTAAAAGTCGATCATTGAAGACGTTGATGGTT +CACAGATCATGATGATATTAACTCAGGCGAAATTGGCTTTGATAAAAACATAAGATTTTT +ATCACTTTCTAATAAAATTATGGAAGAGATATCACATTTCTATATCAATATGAGAATTAC +AGCGGCAAGTTTATCAAACTGAAGAGAGATAGCCTGCCTCTTTATCTTATTTCTGATACT +TAGCAGCAAATAAATAACGTGATAAAAAAAGCCAAACGTTTTCGTATTTTACAAACAACC +GGAAACTGGCATCAATATGTGATCAACCCCACACATTATCCGTCAAATTAGCCTTTCGCA +GCCGCGTGGATAATTCTGGCACACTTATTGTTAGTCCCAGGTATAGCTGTGAAAACACCA +ATCACTTTGGCACGTCACAGTGAAATAAACCACTTTGCCTGTCATTCCACTATCGGGACT +TTATGATGAAAACTGTTAATGAGCTGATTAAGGATATCAATTCGCTGACCTCTCACCTGC +ATGAAAAAGATTTTTTGTTAACGTGGGAACAGACGCCAGACGAACTGAAACAAGTACTGG +ACGTTGCCGCCGCGTTAAAAGCACTGCGTGCTGAAAACATCTCAACCAAAGTCTTTAATA +GTGGATTAGGTATTTCCGTCTTCCGCGACAACTCCACCCGTACCCGCTTCTCTTATGCTT +CCGCGCTTAACCTGCTCGGCCTTGCACAACAAGATCTTGACGAAGGTAAATCACAAATCG +CTCACGGCGAAACCGTGCGTGAAACCGCCAATATGATCTCCTTCTGCGCTGACGCTATCG +GTATTCGCGACGATATGTATCTGGGCGCAGGCAACGCCTATATGCGTGAAGTTGGCGCGG +CACTTGATGACGGCTACAAGCAGGGTGTGCTGCCGCAGCGTCCGGCTTTAGTGAACCTGC +AATGCGATATTGACCACCCGACTCAGTCTATGGCTGACCTGGCATGGTTGCGTGAACACT +TTGGTTCGCTGGAAAACCTGAAAGGCAAAAAAATCGCCATGACCTGGGCCTACTCCCCAA +GCTATGGCAAACCGCTCTCTGTACCACAAGGCATCATAGGTCTGATGACCCGCTTCGGTA +TGGATGTCACCCTGGCCCATCCGGAAGGCTACGACCTGATCCCGGATGTCGTTGAAGTTG +CTAAAAACAATGCTAAAGCCTCCGGTGGTAGCTTCCGTCAGGTCACCAGCATGGAAGAAG +CCTTCAAAGACGCAGACATCGTTTATCCGAAGTCATGGGCACCTTACAAAGTGATGGAAG +AGCGTACTGAATTGCTGCGTGCGAACGATCACGAAGGCTTAAAAGCACTGGAAAAACAGT +GTCTGGCACAGAACGCGCAACACAAAGACTGGCATTGTACTGAAGAGATGATGGAACTGA 
+CCCGTGATGGCGAAGCCCTGTACATGCACTGCCTGCCAGCTGATATCAGCGGCGTATCCT +GCAAAGAAGGTGAAGTGACTGAAGGCGTATTCGAAAAATACCGTATCGCTACCTACAAAG +AAGCCAGCTGGAAGCCTTATATCATCGCCGCGATGATCCTGTCCCGTAAATACGCCAAAC +CAGGTGCACTGCTCGAGCAACTGCTGAAAGAAGCGCAAGAACGCGTGAAATAACCCCTCG +GGCCGATCAGCTGGTCGGCCCTCTATTTCCAGAGGCCAAAAGGATAGGATATGTCCGTTT +TCTCATTGAAGATTGATATCGCCGATAACAAATTTTTCAACGGCGAAACATCACCGCTTT +TTTCGCAAAGCCAGGCAAAACTGGCACGCCAGTTCCACCAGAAAATTGCTGGTTATCACC +CAACACCGCTTTGTGCGCTGGACGATCTCGCAAACCTGTTTGGTGTAAAGAAAATTCTCG +TCAAAGACGAATCAAAACGATTCGGTCTGAACGCCTTCAAAATGCTCGGCGGTGCGTACG +CCATCGCTCAATTATTGTGTGAAAAATATCATCTTGATATCGAAACGCTGTCATTTGAGC +ACCTGAAAAATGCCATCGGCGAAAAAATGACTTTCGCGACTACCACCGACGGCAACCACG +GGCGCGGTGTGGCATGGGCAGCACAGCAACTCGGACAGAATGCGGTGATTTACATGCCGA +AAGGTTCTGCTCAGGAACGCGTTGACGCCATTCTAAACCTCGGTGCCGAGTGCATCGTCA +CGGATATGAACTATGACGATACCGTTCGCCTGACCATGCAACACGCGCAGCAGCACGGCT +GGGAAGTGGTACAGGACACGGCATGGGAAGGCTACACCAAAATCCCAACCTGGATCATGC +AAGGCTACGCAACACTGGCGGATGAAGCCGTCGAGCAAATGCGTGAAATGGGCGTAACCC +CGACACACGTTCTGCTACAAGCCGGTGTCGGTGCAATGGCCGGTGGTGTGCTGGGTTATC +TGGTCGACGTCTATAGCCCGCAAAATCTGCACAGCATTATTGTTGAACCTGACAAAGCTG +ACTGTATTTATCGCTCCGGCGTCAAAGGCGACATCGTCAACGTTGGCGGTGATATGGCCA +CCATCATGGCGGGCCTGGCCTGCGGCGAACCTAACCCGCTGGGCTGGGAAATCCTACGTA +ACTGCGCCACCCAATTCATCTCCTGCCAGGACAGCGTTGCCGCATTAGGTATGCGCGTGC +TGGGTAATCCGTATGGCAACGACCCGCGCATCATCTCCGGTGAATCCGGCGCTGTCGGTT +TGGGCGTTCTCGCAGCGGTTCATTATCACCCGCAACGTCAAAGCCTGATGGAAAAACTGG +CGCTGAACAAAGATGCCGTGGTGCTGGTTATCAGCACTGAAGGCGACACCGACGTGAAGC +ACTACCGCGAAGTTGTCTGGGAAGGCAAACACGCTGTAGCACCTTAATCACCCTATTGGA +ACTGCTCCCTGCAAAACGGGGAGTAAAAAATCTGGAGAAAAATAATGGCTAAGAATATTC +CATTCAAACTGATTCTTGAAAAAGCAAAAGATTACCAGGCAGACATGACTCGCTTCCTAC +GCGATATGGTTGCTATTCCCAGTGAAAGCTGCGACGAGAAACGCGTAGTACATCGTATTA +AAGAAGAGATGGAAAAAGTCGGCTTCGATAAAGTTGAAATCGACCCAATGGGCAACGTTC +TCGGTTATATCGGCCACGGCCCGCGTCTGGTGGCAATGGACGCTCATATCGACACCGTCG +GCATTGGCAACATCAAAAACTGGGACTTCGATCCGTATGAAGGCATGGAAACCGACGAGC +TGATCGGTGGTCGCGGTACTTCCGACCAGGAAGGCGGCATGGCATCTATGGTTTATGCCG 
+GTAAAATCATTAAAGACCTCGGTCTGGAAGATGAATATACCCTGCTGGTTACCGGTACTG +TGCAGGAAGAAGACTGCGACGGTCTGTGCTGGCAATACATTATTGAACAATCCGGCATTC +GCCCGGAATTTGTGGTCAGTACCGAACCAACCGACTGCCAGGTATACCGTGGTCAACGCG +GTCGTATGGAAATTCGCATTGATGTTCAGGGTGTTAGCTGCCACGGTTCGGCACCAGAAC +GTGGTGATAACGCCATTTTCAAAATGGGTCCAATTCTTGGCGAATTACAGGAACTGTCTC +AACGTCTGGGCTATGACGAATTCCTCGGCAAAGGTACGCTGACTGTTTCCGAAATTTTCT +TCACCTCCCCAAGTCGTTGCGCTGTCGCAGATAGCTGCGCAGTTTCTATTGACCGCCGTC +TCACCTGGGGCGAAACATGGGAAGGCGCGCTGGACGAGATCCGTGCCCTGCCTGCAGTAC +AAAAAGCGAATGCTGTCGTTTCTATGTACAACTACGACCGTCCGTCCTGGACTGGCCTGG +TTTATCCAACCGAATGCTACTTCCCGACCTGGAAAGTGGAAGAAGATCACTTCACCGTTA +AAGCACTGGTGAATGCTTATGAAGGGCTGTTTGGTAAAGCGCCTGTCGTTGATAAGTGGA +CCTTCTCAACTAACGGCGTATCCATCATGGGTCGCCACGGCATTCCGGTCATCGGTTTTG +GCCCTGGTAAAGAACCGGAAGCGCACGCGCCAAACGAAAAAACCTGGAAATCTCACCTGG +TAACCTGTGCCGCTATGTACGCTGCAATCCCATTAAGCTGGCTGGCAACCGAATAATTAC +TCTTCACTTATTCCCCTCCGGTTCGCCGGAGGGTTTTTGGAGTTTGCTATGCGCGTATTG +ATAAAAAACGGCATTGTTGTTAATGCAGATGGACAGGCGAAGCAGGATTTGCTGATTGAA +AGCGGGATTGTTCGCCAGTTGGGTACCGATATTTCGCCGCAACTCCCTTGCGAAGAAATT +GATGCCTCTGGCTGTTACGTTTTCCCTGGCGGCGTGGATGTCCATACGCATTTCAATATT +GATGTCGGCATCGCGCGCAGTTGTGATGATTTTTTTACCGGTACCCGCGCTGCTGCGTGT +GGCGGTACAACAACCATTATTGACCATATGGGATTTGGCCCAAATGGCTGCCGGTTACGC +CATCAACTGGAAGTTTATCGCGGTTATGCCGCCCACAAAGCAGTCATCGACTACAGCTTT +CACGGTGTCATTCAACATATTAATCACGCTATCCTCGACGAAATTCCGATGATGGTTGAG +GAAGGACTGAGCAGCTTTAAACTCTATTTAACCTATCAATATAAACTCAACGATGATGAA +GTGTTGCAGGCATTACGCCGCTTGCATGAGTCCGGCGCGCTGACCACCGTACACCCGGAA +AATGACGCAGCTATCGCCAGCAAGCGGGCGGAGTTTATCGCCGCAGGGTTAACCGCGCCG +CGTTATCATGCCTTGAGTCGACCTCTGGAATGCGAAGCGGAAGCCATCGCCCGCATGATT +AACCTGGCACAAATTGCCGGTAACGCCCCGCTCTATATCGTGCACCTGTCTAACGGCTTA +GGTCTAGATTATCTGCGTCTTGCCCGTGCGAATCACCAGCCAGTCTGGGTTGAAACCTGC +CCACAATATCTCCTGTTGGACGAACGCAGTTACGATACAGAAGATGGCATGAAGTTCATT +CTTAGCCCACCGCTGCGTAACGTACGCGAGCAGGACAAACTGTGGTGTGGCATCAGCGAT +GGTGCGATTGACGTGGTGGCAACCGATCACTGCACCTTCTCGATGGCTCAACGCCTGCAA +ATTTCTAAAGGCGATTTCAGCCGCTGCCCAAATGGCTTACCCGGTGTGGAGAACCGCATG 
+CAACTGCTGTTCTCCAGTGGCGTGATGACGGGACGTATCTCACCGGAGCGTTTTGTTGAG +TTAACCAGTGCAATGCCCGCCAGGCTGTTTGGCCTGTGGCCACAAAAAGGATTATTAGCG +CCCGGTTCCGATGGCGACGTGGTGATTATAGACCCACGTCAGAGCCAACAAATTCAGCAT +CGCCATCTCCACGACAACGCTGACTACTCGCCATGGGAGGGTTTTACCTGTCAGGGCGCG +ATTGTCAGAACCTTATCTCGTGGTGAAACGATTTTCTGCGACAGCACCTTTACAGGCAAA +GCCGGGCGAGGTCGTTTCCTGCGACGCAAACCGTTTGTCCCTCCCGTGCTCTAACCACTG +CCAGGGATCTATACACAATCAAGAATGATGAGTGAGGAAAAATGAGTAAGAAAATTGTTC +TCGCCCTGGGCGGGAATGCGCTGGGCGATGACCTGGCTGGGCAAATGAAAGCGGTAAAAA +TTACTTCTCAGGCAATTGTTGATTTAATTGCCCAGGGACATGAGGTCATCGTCACTCATG +GCAACGGGCCACAGGTGGGCATGATTAACCAGGCCTTTGAAGCTGCAGCAAAAACTGAAG +CGCACTCGCCAATGCTGCCGATGTCTGTCTGTGTTGCCTTAAGCCAGGGTTATATTGGTT +ACGATCTACAAAACGCCTTAAGAGAAGAACTGCTTTCTCGTGGCATTAATAAACCTGTAG +CAACGCTGGTTACCCAGGTCGAAGTCGATGCTAACGATCCGGCATTCCTCACCCCGACCA +AGCCGATCGGTTCGTTCTTTACCGAGCAAGAAGCAGAGCTACTGACAAAACAGGGTTACA +CTCTGAAAGAAGATGCGGGTCGCGGCTATCGCCGTGTCGTTGCTTCGCCAAAACCGGTTG +ATATCATTGAAAAAGAAACGGTTAAAGCTCTGGTAGATGCCGGACAGGTGGTGATCACCG +TTGGCGGTGGTGGTATCCCTGTTATTCGTGAAGGTAACCATCTGCGTGGTGCCAGCGCGG +TTATCGATAAAGACTGGGCCAGCGCCCGTTTAGCAGAAATGATTGATGCCGATATGCTGA +TCATTCTGACTGCGGTAGAAAAAGTGGCCATTAACTTCGGAAAAGAGAATGAACAGTGGC +TCGATCGCCTGTCGTTAAGTGATGCTGAACGCTTTATCGAAGAAGGTCATTTTGCGAAAG +GTTCTATGCTGCCTAAAGTGGAAGCTGCCGCCTCGTTTGCTCGCTCTCGCGCAGGTCGTG +AAGCACTGATTA +>my_contig +CCGTATTGAGCAAAGCGAAAGAGGGGATTGAAGGCAAAACCGGAACGGTGATTTGTCAGT +AATTTAAAGGCCGGATGGGTAATACCATCCGGCCATTTTCATTTAAGCCACTTCCAGCAC +TTCTTTTGTCGCTTTAACGCCCTGATGCATCAACATCATTAACGCCTCAAGTACGCCGCC +GCCAATCGCCCGGGCTTTATCAGAAACGCTGGTGAAATCAGCCGTTTCACCACGAGGATC +GATATCACCAATTTTAAAACCACCGACCACGGCCAGTCCGTCGTTCAACAAGCCACGCAC +CATCCCCGTCAACGGTGCTTTAATTTCATGCTCACCAATCCAGGCAATGACATCGCCCTC +TTTCACCAGATCGCCTAATTTCACGTTGGATCGCATAATGCCTGCAGCAGGAGCGCGGAT +CACTCGTCGGGTGGTATGCCCCATAATATTGCCGGGAACACCGGTATTCTCCTGCGCACA +ACCTGAGTAAATCACCTGACCGAGCCAGTGCCCGCGATTTGTTTCAATTACCGCATGACA +ATCCTTCCCTGCAGTAAAGCCCGGCCCAAGCGCGATTGTTACTGGTGCCATATCTGCCCG 
+CGTTCCCAAATTCTGTTTCGCCAGAATAGCGTCCACCACGCAAAGCGGTTTCAGTTCATC +AAGCAATGAACAGGTGGGATCTACCATCACAGGGATAAATCCGCGTTCGGTAAGTTTCAT +CGCTTCCGCAGAGCTGGTTGCCAGGCGGGCGGTGACGCCTTCGACCGTCATTTCGCCATC +GAACACGGCCTGGGCAAACGCCACGGTACAACGAATCACTGTCGGTTTTTCCACTTCCAA +CATGATCACTTTAAAACCCGCATGATACAGACGTAGCGCTACACCACTGGCGATATCCCC +CGCACCGCGAATCACCACCAGCTGGTGTCCGGAAGGATGAGAAGGCTTCATCATCAGCCC +ACCCGGCGCGTTATTTTTCACCTGTAATATTTCTGCCAGCACGCTGATGGCGATCTCTTG +CGGCGTTTCCGCACCTATATTGTAACCAACGGGCGCATGTAAACGGGCAATATGTTCTTC +AGCCACGCCTTTCTCACGCAATTGGCGCAGGAAAAGCTGAACCTTGCGGCGACTTGCCAG +CAACCCCAGCCATGCAATGGGTTGTTCAATGAGTTTGTCGAGGGCTTCACGATCCTGATT +ATTCGTGGCAATCAGGACAAAATTATCAGGGCGAATATCCAGTGCTTCCACTGCCGCACC +AAACGACTCAGCATGGAGAAGCGTGGTTGATGGTGGGAATAGTTCAGGATTGAGGCTTTC +GCGATAAATATCAGCAACGGCGATATCAAATCCTAATAGCGCCGCACTCTGGGCTATCGC +CCGGTTGACATGCCCCGCACCAATCAACACCAGACGTGGACGCATACCATGGACGCTGAT +AAATACTGACATTGCACCTCCACAATCTGACCCGACAGCATCCGCACCGTTACGAGCCAT +ACGTCCATGGAATAATCGCGGCTTACGTTCCTGCAATGCCTGAAGCGACTCTTCAATCAC +CTTCCGTTCAACCATTCCGCCACCAATTGTACCGACGATAGAACCATCGGCGCGCACTAA +CATTTGTGCAGAATGGCGGGGGGTTGAGCCTCGGCTATCAACAATTTGCGCCATCGCAAA +CGGACAATTTTGCTCTTCGAGTTTTGCAGCCTCTGTGAAAATATTCATACCAACCTCAAT +GGATATCCTTTCAGTAACCCGGAATACCCGGGCCGCTAATTCACAAATCTGCGCGCGATT +GCAGGATGTTCTTGTATATCGCCCAGCCAGATTGCCTCTACGTTGTGTTGTTGCAGCGGT +TGAAGGAGCTCGCTTTGCGCAATCGCATTCTCACATTGAGAAAAACGGTTAATGAACCAG +ACTCGCCGACAACCTTGTGGTACGTTTTTAAACGCCCCCTGAGGGTGGCGAACCAGCGCA +ACGAGATCGCTCAGTTGCAAGGGTGCAGCAGGTGTTAACCCAGTAATATCAGCAAACTGC +GACCAGCGATGGACATTTTCTGTGCTCACTTTCGCACCCAAAATATGTCCTCCCATCACA +GCAATCACGCAGCAACTGCTTTTAGGTATGCAAGGTTCGTGCTCATCAGGCGCTTTTAAC +GGCATTCCACGCGAGCCATCTGCCTCAATGAGAATTACGTCACACTCTGGTCGTTGTACC +AGTGCATCAATCGCTTCTGGCGTAAATCCCTGCACTTTTCCCTGGTTCGCTTTCCAGCAG +TGAAAACAAAATGAAATGGGGGATATAAAAGACGCATGAGGAAGCATGGCGGGATCACGA +CAGAAAACCACGGGCCAGTGAGATGTTGGCATAAACATATGTGTCGTCGTAGTGATTAAT +ACACGCCTGCCACTCGCCTGGAACAGTTCTGCCAGCCAAAAAAGCAAGCTGGTTTTCCCC +CCAGCACCAACAATAGAAATCACAGTGGGACGTTTCTGCGCGCCTAAATCAATGAATAAT 
+GCCGATGGGTCAATTATACTTTTCACGCGTCTTTATGGACCTCTCTGGGATAAATTACCC +TCAACGTAATCCATCAGGAAGTAACGCAATTATCAGGCGTTATTAGCTCCTGTAAATAAT +GGAATCACTATGTCAGCCATCGACTGTATAATTACCGCCGCAGGATTATCATCAAGAATG +GGGCAATGGAAAATGATGTTACCCTGGCAACAGGGAACAATTCTTGATACAAGTATCAAA +AATGCGTTGCAGTTTTGTAGCCGAATTATTTTAGTCACCGGCTATCGTGGTAATGAACTG +CACGAACGTTATGCGAACCAGAGCAATATCACTATTATCCACAACCCAGATTATGCGCAG +GGTTTACTGACATCAGTAAAGGCCGCAGTACCCGCGGTACAAACAGAACATTGTTTTCTC +ACCCACGGAGATATGCCAACCCTCACCATCGATATTTTTAGAAAAATCTGGTCGTTACGA +AATGATGGCGCAATACTGCCACTCCATAATGGCATCCCCGGCCATCCGATTTTAGTGTCA +AAACCATGCCTGATGCAGGCAATCCAGCGACCCAATGTCACCAATATGCGTCAGGCACTC +CTTATGGGAGAACATTATTCCGTCGAAATAGAAAATGCAGAAATAATTTTAGATATTGAT +ACTCCGGACGACTTTATTACAGCGAAGAAAAGGTATACTGAAATTTAGAAAACGTAGTTA +AACGATTGCGTTCAAATATCTAATCCCTCCAGCACTCTTTATCATAATGATAAGGAATCA +CTGATTTTGAGAAAAGAGAAAAAGTGATAAATGGGCTGGCAATAATAATTTTCAGGAGTG +ATTTTAATTCTCATTTGGCACCTGTGAGTTCATTCACAAAAAGCCATTAAGTTTCGAGCC +GCCTCACATTTTTTTATATTTCCCGCCAAACCTGGCAAGAGTGGTGCGATTGTTGCTCTA +TCCCCCTAAACCACCGGATTTCTCAACACCGGTCACTCAATGATATCTGTATAAGCTAAG +GAGAGGGTTATGGGGGATATTATGCGTCCCATTCCGTTTGAGGAACTTTTGACGCGCATA +TTTGATGAATACCAACAACAACGCTCAATCTTTGGTATTCCCGAGCAACAGTTTTACTCA +CCCGTAAAAGGTAAAACTGTTAGCGTCTTCGGTGAAACCTGTGCCACTCCCGTCGGCCCT +GCCGCTGGCCCGCACACGCAACTTGCGCAAAACATCGTCACCTCCTGGCTGACTGGCGGA +CGCTTCATCGAACTAAAAACCGTCCAAATTCTTGACCGCCTGGAGCTGGAAAAGCCCTGT +ATCGATGCCGAAGACGAGTGCTTTAACACCGAATGGTCTACCGAATTTACCCTGCTTAAA +GCCTGGGATGAATACCTCAAAGCCTGGTTTGCCCTGCACCTTCTCGAAGCGATGTTCCAG +CCTTCTGATTCCGGTAAATCGTTCATCTTTAATATGAGCGTCGGTTACAACCTCGAAGGT +ATTAAGCAACCGCCGATGCAGCAGTTCATCGACAATATGATGGACGCATCTGACCATCCG +AAATTCGCTCAATACCGCGATGCACTTAATAAGCTACTCCAGAATGAGGCATTTTTAGCC +CGCCACGGATTGCAGGAAAAACGCGAAAGCTTGCAAGCCTTACCCGCTCGCATCCCCACC +AGCATGGTACAAGGGGTTACCCTCTCCACCATGCACGGCTGTCCTCCGCATGAAATCGAA +GCCATTTGCCGCTACATGCTGGAAGAAAAAGGGCTCAACACCTTTGTGAAACTCAACCCG +ACCTTACTGGGGTACGCGCGTGTTCGTGAGATCCTCGATGTCTGCGGTTTCGGTTACATC +GGCTTAAAAGAAGAGTCATTTGATCACGACCTCAAGCTGACGCAAGCGCTGGAAATGCTG 
+GAACGCCTGATGGCACTGGCAAAAGAAAAATCACTCGGCTTTGGCGTAAAACTGACTAAC +ACTCTCGGCACCATTAATAACAAAGGCGCACTGCCTGGTGAAGAGATGTATATGTCAGGC +CGTGCGCTGTTCCCGCTCTCCATCAACGTTGCAGCAGTTCTCTCTCGCGCCTTTGACGGC +AAACTGCCCATTTCTTATTCCGGTGGTGCCAGTCAGCTGACTATCCGCGATATTTTTGAT +ACTGGTATTCGCCCTATTACTATGGCAACCGACCTGCTGAAACCTGGCGGCTATCTGCGC +TTAAGTGCCTGCATGCGCGAGCTGGAAGGCTCCGACGCCTGGGGACTTGACCATGTTGAC +GTCGAACGACTGAACAGACTGGCAGCAGACGCGTTAACCATGGAATACACCCAGAAACAC +TGGAAGCCAGAAGAGCGTATTGAAGTGGCTGAAGACCTGCCGCTGACCGATTGCTACGTT +GCCCCCTGTGTTACTGCCTGCGCTATCAAGCAAGATATTCCGGAATACATCCGTCTGCTT +GGCGAACACCGCTATGCCGACGCGCTGGAACTCATCTATCAACGCAACGCCCTGCCCGCC +ATTACCGGTCATATTTGCGATCACCAGTGCCAATACAACTGTACCCGCCTGGATTACGAC +AGTGCGCTGAATATCCGCGAACTGAAAAAAGTCGCGCTGGAAAAAGGTTGGGAGGAATAT +AAGCAACGCTGGCACAAACCAGCCGGTTCTGGTTCACGCCATCCGGTTGCCGTGATTGGT +GCAGGTCCGGCGGGTCTGGCCGCAGGTTACTTCCTTGCCAGAGCGGGCCATCCGGTTACG +CTGTTTGAACGCGAAGCCAATGCGGGCGGCGTGGTGAAAAATATCATTCCTCAGTTCCGT +ATTCCTGCAGAGTTAATTCAGCACGATATCGATTTTGTTGCCGATCACGGCGTGAAATTT +GAGTACGGTTGCTCACCCGATTTGACCGTTGAACAGTTAAAAAATCAGGGCTTCCACTAT +GTTCTGATTGCCACCGGCACTGATAAAAATAGCGGTGTGAAACTGGCGGGCGACAACCAA +AATGTCTGGAAATCACTCCCCTTCCTGCGTGAATACAACAAGGGCACAGCGCTCAAGCTG +GGCAAACATGTGGTCGTTGTCGGGGCGGGTAACACGGCAATGGACTGCGCTCGTGCGGCG +TTACGCGTTCCAGGCGTAGAAAAAGCAACGGTCGTTTACCGTCGTTCACTGCAAGAGATG +CCAGCATGGCGCGAAGAGTATGAAGAAGCGTTGCACGACGGCGTGGAGTTCCGTTTCCTG +AATAATCCGGAACGTTTCGATGCTGATGGCACCTTAACCTTGCGCGTTATGTCGCTTGGC +GAACCTGATGAGAAAGGTCGTCGCCGTCCGGTTGAAACCAACGAAACAGTAACGCTGCAT +GTAGACAGCCTGATCACCGCCATTGGTGAACAGCAGGATACTGAAGCCCTGAATGCAATG +GGCGTGCCGCTGGACAAAAACGGCTGGCCAGACGTCGACCATAATGGCGAAACGCGTCTG +ACTGACGTCTTTATGATCGGCGACGTACAGCGCGGACCATCCTCCATTGTCGCTGCTGTC +GGAACCGCGCGTCGGGCGACCGATGCCATCCTGAGTCGGGAAAATATCCGTTCCCACCAG +AACGATAAATACTGGAATAACGTCAATCCGGCGGAAATCTATCAACGTAAAGGCGATATC +TCTGTCACTCTGGTGAACAGTGACGATCGTGATGCGTTTGTCGCGCAGGAAGCCGCTCGC +TGCCTTGAATGTAACTACGTTTGCAGCAAGTGTGTGGATGTCTGCCCGAACCGCGCCAAC +GTATCCATTGCGGTCCCAGGCTTCCAGAACCGTTTCCAGACGCTGCACCTCGACGCTTAC 
+TGTAACGAATGTGGCAACTGCGCCCAATTCTGCCCGTGGAACGGTAAACCGTACAAAGAC +AAAATCACCGTCTTCAGCCTGTCGCAAGACTTTGATAACAGCAGCAACCCAGGCTTCCTT +GTGGAAGATTGCCGGGTACGCGTACGTCTGAATAACCAAAGCTGGGTGTTAAACATCGAC +AGCGAAGGTCAGTTCAACAACGTACCACCGGAGCTGAACGATATGTGCCGCATCATTAGC +CATGTCCACCAGCATCATCATTATCTGCTGGGCCGCGTGGAGGTGTAATCATGTTGATTC +TGAAGAATGTCACCGCAGTGCAGTTACACCCGGCGAAAGTGCAGGAAGGCGTTGATATCG +CCATCGAAAATGATGTGATTGTCGCTATCGACGATGCCCTGACGCAACGCTATCCCGATG +CCAGCTACAAAGAGATGCATGGTCGGATTGTGATGCCGGGAATTGTCTGCTCGCATAACC +ATTTTTACTCGGGGCTTTCCCGCGGAATTATGGCAAACATCGCCCCCTGCCCGGATTTCA +TCTCAACGCTGAAAAATCTCTGGTGGCGGCTCGATCGCGCCCTTGATGAAGAGTCGCTCT +ATTACAGCGGACTGATTTGTTCCCTGGAAGCAATTAAGAGCGGATGTACATCGGTTATCG +ATCACCATGCCTCTCCAGCCTATATCGGCGGGTCGCTCTCCACATTGCGCGACGCATTTT +TAAAAGTTGGCCTGCGCGCGATGACCTGTTTTGAAACTACTGACCGTAACAGCGGCATCA +AAGAGTTGCAGGAAGGTGTAGAAGAAAACATCCGCTTCGCCCGTCAGATTGATGAGGCGA +AGAAAGCAGCAACCGAGCCGTATCTGGTGGAAGCACATATCGGCGCTCACGCGCCGTTTA +CCGTACCGGATGCCGGTCTGGAGATGCTGTGTGAAGCCGTGAAAAGCACAGGTCGTGGTT +TGCATATTCACGCTGCGGAAGACCTTTACGACGTTTCCTACAGTCACCATTGGTACGGCA +AAGACCTGCTGGCACGACTGGCGCAATTCGATCTCATCGACAGCAAAACGCTGGTCGCTC +ATGGGCTGTACTTGTCGAAAGATGACATCGCCCTACTCAATCAGCGCGATGCGTTCCTGG +TGCATAACGCCCGTTCAAACATGAACAACCATGTCGGCTACAACCATCACCTTAGCGACA +TCCGCAATCTGGCGTTGGGAACGGACGGCATTGGTTCGGACATGTTTGAAGAGATGAAAT +TTGCCTTCTTTAAACATCGCGATGCGGGTGGCCCGCTGTGGCCTGACAGTTTTGCCAAAG +CACTGGCTAACGGCAACGAACTGATGAGCCGCAACTTTGGCGCGAAATTTGGGCTTCTGG +AAGCCGGTTACAAAGCCGATTTAACCATTTGCGATTACAACTCGCCGACGCCGCTGCTGG +CAGACAATATCGCCGGGCATATCGCTTTCGGTATGGGCTCAGGCAGCGTTCACAGCGTGA +TGGTCAATGGTGTGATGGTCTATGAAGACCGTCAGTTTAACTTCGATTGCGATTCCATTT +ATGCGCAAGCCAGAAAAGCCGCTGCCAGTATGTGGCGTCGGATGGATGCGCTGGCATAAA +TAACAGCTCCCCTCTTCTTTCAGAGAAGAGGGGAAATTAAGGAAAGACGATGATTGAACA +ATTTTTCAGACCCGACTCAGTCGAACAGGCGCTGGAACTGAAGCGCCGCTACCAGGATGA +AGCCGTCTGGTTCGCCGGGGGCAGCAAACTCAACGCTACACCAACCCGTACCGATAAAAA +GATTGCCATTTCCTTGCAGGATCTGGAGCTGGACTGGATTGACTGGGATAACGGTGCACT +ACGAATTGGCGCAATGTCTCGCTTGCAGCCACTGCGTGATGCGCGATTTATTCCTGCAGC 
+ACTGCGTGAAGCCCTCGGTTTTGTTTACTCACGCCATGTTCGTAATCAGTCGACCATTGG +TGGTGAAATCGCCGCCCGGCAAGAAGAGTCAGTGCTGCTTCCCGTCCTGCTGGCACTGGA +TGCTGAACTGGTTTTTGGCAACGGCGAAACGCTGTCAATCGAGGACTACCTGGCCTGCCC +ATGCGATCGCCTGTTAACCGAAATTATCATTAAAGATCCGTATCGCACCTGTGCGACTCG +CAAAATTAGCCGTTCTCAGGCAGGTTTAACCGTCGTGACGGCAGCCGTTGCAATAACAGA +CCACGACGGTATGCGAATTGCGCTGGATGGCGTCGCCAGTAAAGCACTGCGTCTGCACGA +TGTCGAAACTCAAAATCTGGAAGGCAATGCACTTGAACAGGCTGTCGCCAACGCCATTTT +CCCGCAGGAAGATTTGCGGGGCAGCGTGGCCTATAAACGCTATATCACGGGAGTTCTGGT +AGCCGATCTGTATGCCGACTGCCAACAGGCTGGGGAGGAAGCCGTATGATCATCCACTTT +ACTTTAAATGGCGCGCCTCAGGAGCTAACCGTTAATCCAGGCGAAAACGTGCAAAAGCTG +TTGTTTAACATGGGAATGCACTCTGTACGCAACAGTGATGATGGTTTTGGGTTTGCCGGT +TCTGACGCAATTATCTTTAACGGTAATATCGTTAACGCGTCCTTGCTTATCGCCGCACAG +TTAGAGAAGGCAGATATTCGTACCGCAGAATCTCTGGGCAAATGGAATGAGTTAAGTCTG +GTTCAACAGGCCATGGTTGATGTTGGCGTGGTGCAGTCTGGTTATAACGATCCAGCTGCG +GCTCTGATTATCACCGATCTTCTCGATCGCATCGACGCACCTACCCGCGAAGAGATCGAC +GACGCACTCTCAGGTCTGTTTAGCCGCGATGCTGGCTGGCAGCAATACTATCAGGTCATT +GAACTGGCGGTTGCACGTAAAAATAATCCGCAGGCCACCATTGATATCGCTCCGACTTTC +CGTGACGACCTTGAAGTCATTGGCAAGCATTATCCTAAAACTGATGCCGCGAAAATGGTG +CAGGCGAAACCCTGCTATGTTGAAGATCGAGTAACGGCTGACGCCTGCGTCATTAAAATG +TTACGTAGCCCACACGCTCACGCACTGATTACTCATCTGGATGTCAGCAAAGCTGAAGCC +TTACCGGGCGTCGTTCACGTTATTACTCACCTGAATTGCCCGGATATTTACTATACCCCG +GGTGGTCAGAGCGCACCGGAACCGTCACCGCTTGACCGCCGAATGTTCGGCAAGAAAATG +CGTCACGTCGGCGATCGCGTTGCTGCGGTAGTAGCCGAAAATGAAGACATTGCGCTCGAA +GCACTGAAGCTCATCGACGTTGAATATGAAGTGCTTAAGCCGGTAATGTCGATTGACGAG +GCAATGGCGGAAGATGCGCCTGTCGTGCACGATGAACCGGTGGTGTATGTTGCTGGTGCG +CCAGATACTCTGGAAGATGATAACAGCCATGCAGCCCAGCGCGGCGAGCATATGATCATC +AACTTCCCGATCGGTTCTCGCCCACGCAAAAATATCGCTGCCAGTATTCATGGTCATATT +GGCGATATGGACAAAGGCTTTGCCGATGCCGATGTGATCATTGAGCGAACCTATAACTCA +ACGCAGGCGCAGCAGTGCCCGACTGAAACACATATCTGCTTTACCCGTATGGACGGCGAT +CGTCTGGTGATCCACGCCTCCACCCAGGTACCATGGCACTTACGCCGCCAGGTCGCGCGC +CTCGTGGGCATGAAACAACATAAAGTTCATGTCATTAAAGAACGTGTAGGCGGCGGTTTT +GGTTCCAAACAGGACATCCTGCTGGAAGAAGTGTGCGCCTGGGCAACCTGCGTGACCGGG 
+CGTCCGGTACTGTTCCGCTACACCCGTGAAGAAGAGTTTATTGCTAACACCTCTCGTCAC +GTCGCGAAAGTCACCGTCAAACTGGGCGCGAAAAAAGATGGTCGCCTGACGGCAGTGAAG +ATGGATTTCCGCGCCAACACGGGTCCTTACGGTAACCACTCACTCACCGTACCGTGTAAC +GGACCGGCGCTGTCGCTGCCGTTATATCCATGCGATAACGTCGATTTTCAGGTCACCACC +TACTACAGCAACATTTGCCCAAATGGTGCTTATCAGGGTTATGGCGCGCCGAAAGGTAAC +TTCGCTATCACCATGGCGTTAGCGGAACTGGCGGAACAATTGCAGATCGACCAACTGGAA +ATTATTGAACGTAATCGTGTACACGAAGGGCAAGAGCTGAAAATTCTCGGTGCGATTGGT +GAAGGTAAAGCGCCGACATCCGTTCCTTCCGCCGCCAGCTGCGCACTGGAAGAGATCCTG +CGTCAGGGTCGCGAGATGATCCAATGGTCTTCACCAAAACCACAAAACGGTGACTGGCAC +ATCGGTCGTGGCGTCGCCATTATCATGCAGAAATCGGGTATCCCGGATATCGATCAGGCT +AACTGCATGATCAAACTGGAATCAGACGGTACCTTTATCGTTCATTCTGGCGGTGCGGAT +ATTGGTACTGGTTTGGATACTGTGGTGACGAAACTGGCAGCAGAAGTGCTGCACTGCCCC +CCGCAGGACGTGCATGTTATCTCCGGTGATACCGATCATGCGTTGTTTGATAAAGGCGCA +TATGCCTCGTCCGGTACTTGCTTCTCGGGTAACGCTGCGCGTTTGGCAGCGGAAAATCTG +CGGGAGAAAATCCTGTTCCACGGCGCGCAAATGTTGGGTGAGCCAGTGGCAGATGTTCAA +CTAGCAACGCCGGGCGTCGTTCGCGGCAAGAAAGGCGAAGTTAGTTTCGGAGAGATAGCC +CATAAAGGCGAAACCGGCACCGGCTTTGGTTCACTGGTGGGAACTGGCAGTTATATCACG +CCTGATTTCGCCTTCCCGTATGGCGCAAACTTCGCTGAAGTTGCCGTCAACACGCGTACG +GGTGAAATCCGCCTGGATAAATTCTACGCCTTGCTGGACTGCGGTACACCGGTCAATCCA +GAGTTAGCGCTGGGACAAATCTACGGTGCCACCCTGCGTGCTATCGGCCACAGTATGAGC +GAAGAGATCATTTATGACGCCGAAGGTCACCCGTTAACGCGTGATTTACGCAGTTACGGC +GCACCGAAAATTGGTGACATTCCGCGTGATTTCCGCGCTGTGCTGGTGCCGAGCGACGAT +AAAGTCGGCCCATTCGGGGCGAAATCGATCTCGGAAATCGGTGTAAATGGCGCCGCTCCG +GCGATTGCTACCGCAATTCACGATGCCTGCGGCATCTGGTTACGCGAATGGCATTTCACA +CCGGAGAAAATACTCACCGCGCTGGAAAAAATATAAGTAATAAATGGCCGCTTCGGCGGC +CTGTTTCTCTGTTTGAACGATGACTAAATAGTGACTGCGAAAATGAGATAAGCCGTTCTC +AAGGCGTCCTGCGCCCCAAATTCGTGGGAATTTATTTTACTAATTCAGATGATCAAATTT +ACTTTAAAAGGAGTGAAGGGATGTCTGATATAAACCATGCAGGTTCTGACCTTATATTTG +AACTGGAGGATCGCCCTCCCTTTCATCAGGCTCTCGTAGGTGCCATTACCCATCTGTTGG +CAATTTTCGTTCCGATGGTAACCCCCGCGTTAATCGTGGGTGCGGCCTTACAGCTTTCCG +CTGAAACAACTGCCTATCTTGTTTCTATGGCGATGATCGCCTCTGGTATTGGTACCTGGT +TACAAGTAAACCGCTACGGCATCGTCGGTTCTGGTTTACTTTCAATTCAGTCAGTCAATT 
+TTTCATTTGTTACGGTCATGATTGCGCTGGGTAGCAGCATGAAAAGCGACGGTTTTCACG +AAGAGTTAATCATGTCGTCGCTCCTCGGCGTCTCCTTCGTTGGCGCATTTCTGGTTGTCG +GCTCTTCTTTTATCCTGCCCTATTTACGTCGGGTTATTACGCCTACCGTCAGCGGCATTG +TGGTGCTGATGATCGGCTTAAGCCTGATTAAAGTTGGCATTATTGATTTTGGCGGTGGTT +TTGCAGCTAAAAGCAGCGGTACGTTCGGCAATTACGAGCATCTCGGCGTTGGCTTATTGG +TTTTGATTGTGGTGATCGGCTTTAACTGCTGCAGCAGTCCGTTGCTACGCATGGGTGGGA +TCGCCATTGGGCTATGTGTCGGCTATATCGCATCGTTATGCCTGGGCATGGTGGATTTCA +GCAGTGTGCGCAATTTGCCGTTAATCACCATCCCGCATCCGTTCAAATACGGCTTTAGTT +TTAGCTTCCATCAGTTCCTGGTGGTTGGCACGATTTATCTGCTTAGCGTGCTGGAAGCTG +TCGGCGATATCACCGCCACGGCAATGGTTTCCCGCCGTCCCATTCAGGGGGAAGAGTATC +AGTCCCGACTGAAAGGCGGCGTGCTGGCAGATGGTCTGGTTTCTGTTATCGCCTCCGCTG +TCGGTTCATTACCATTAACCACGTTTGCGCAAAATAATGGGGTTATTCAGATGACTGGCG +TCGCTTCACGTTATGTCGGGCGAACCATCGCGGTAATGCTGGTTATCCTCGGCTTATTTC +CGATGATTGGCGGCTTCTTCACGACCATTCCCTCAGCAGTTCTGGGAGGCGCAATGACGT +TGATGTTTTCCATGATTGCCATCGCAGGGATTCGCATCATCATCACCAACGGTTTAAAGC +GCCGAGAAACACTTATTGTCGCCACGTCTTTAGGTTTAGGGCTTGGCGTCTCCTACGATC +CCGAAATTTTTAAAATATTGCCAGCCTCTATTTATGTATTAGTTGAAAACCCTATTTGTG +CTGGCGGGTTAACTGCGATTTTATTAAATATTATCCTCCCTGGTGGCTACCGACAGGAAA +ACGTTCTGCCTGGTATTACCTCAGCGGAAGAGATGGATTAACAGTAAAGGAGTCAATGAT +GTCAGGAGAACACACGTTAAAAGCGGTACGAGGCAGTTTTATTGATGTCACCCGTACGGT +CGATAACCCGGAAGAAATTGCCTCTGCGCTGCGGTTTATTGAGGATGGTTTATTACTCAT +TAAACAGGGAAAAGTGGAATGGTTTGGCGAATGGGAAGACGGAAAGCATCAAATTCCTGA +CACCATTCGCGTGCGCGACTATCGCGGCAAACTGATAGTACCGGGCTTTGTCGATACACA +TATCCATTATCCGCAAAGTGAAATGGTGGGGGCCTATGGTGAACAATTGCTGGAGTGGTT +GAATAAACACACCTTCCCTACTGAACGTCGTTATGAGGATTTAGAGTACGCCCGCGAGAT +GTCGGCGTTCTTCATCAAGCAGCTTTTACGTAACGGAACCACCACGGCGCTGGTGTTTGG +CACTGTTCATCCACAATCCGTTGATGCGCTGTTTGAAGCCGCCAGTCATATCAATATGCG +TATGATTGCCGGTAAAGTGATGATGGACCGAAACGCACCGGATTATCTGCTCGACACTGC +CGAAAGCAGCTATCACCAAAGCAAAGAACTGATTGAACGCTGGCACAAAAATGGTCGTCT +GTTGTATGCGATTACGCCACGCTTCGCCCCTACCTCATCTCCTGAACAGATGGCGATGGC +GCAACGCCTGAAAGAAGAATATCCGGATACATGGGTACATACCCATCTCTGTGAAAACAA +AGATGAAATTGCCTGGGTGAAATTGCTTTATCCTGACCATGATGGTTATCTTGATGTTTA 
+CCATCAGTACGGCCTGACCGGTAAAAATTGTGTCTTTGCTCACTGCGTCCATCTCGAAGA +AAAAGAGTGGGATCGTCTCAGCGAAACCAAATCCAGCATTGCTTTCTGTCCGACCTCCAA +CCTTTACCTCGGCAGCGGCTTATTCAACTTGAAAAAAGCATGGCAGAAGAAAGTCAAAGT +GGGCATGGGAACAGATATCGGTGCCGGAACAACTTTTAACATGCTGCAAACGCTGAACGA +AGCCTACAAGGTATTGCAATTACAAGGCTATCGCCTCTCGGCATATGAAGCGTTTTACCT +GGCCACGCTCGGCGGAGCGAAATCTCTGGGCCTTGACGATTTGATTGGCAACTTTTTACC +TGGCAAAGAGGCTGATTTCGTGGTGATGGAACCCACTGCCACTCCGCTACAGCAGCTGCG +CTATGACAACTCTGTTTCTTTAGTCGACAAATTGTTCGTGATGATGACGTTGGGCGATGA +CCGTTCGATCTACCGCACCTACGTTGATGGTCGTCTGGTGTACGAACGCAACTAATAATA +AAACTTTAACATCCTCGTGAGGACATCATTATGTCTGGAGACATCCTACAAACACCGGAC +GCACCAAAGCCACAGGGCGCGCTGGATAATTATTTTAAAATTACCGCTCGTGGCAGTACC +GTTCGTCAGGAAGTACTGGCTGGCTTAACGACCTTTCTGGCCATGGTTTATTCCGTTATC +GTCGTTCCGGGAATGCTGGGCAAAGCAGGTTTTCCTCCCGCAGCTGTGTTTGTTGCCACC +TGTCTGGTCGCGGGCTTCGGCTCGTTGCTGATGGGGTTATGGGCCAATTTGCCAATGGCG +ATTGGTTGCGCTATTTCCTTGACGGCGTTTACCGCATTCAGTCTGGTACTCGGGCAACAA +ATTAGCGTTCCTGTCGCACTGGGCGCAGTCTTTCTGATGGGCGTCATCTTCACCGCTATT +TCCGTAACCGGTGTGCGTACCTGGATCTTACGTAATTTGCCGATGGGGATCGCTCACGGT +ACAGGTATCGGTATCGGCCTGTTTCTGCTGCTGATTGCTGCTAACGGTGTGGGAATGGTT +ATCAAAAACCCGATTGAAGGCTTGCCAGTGGCGCTCGGTGCGTTTACCTCCTTCCCGGTG +ATGATGAGCTTACTGGGGCTGGCGGTCATCTTCGGTCTGGAAAAGTGCCGCGTACCCGGC +GGGATCTTGTTGGTGATTATTGCAATTTCGATCATCGGCTTAATCTTTGACCCAGCGGTG +AAGTACCACGGTCTGGTGGCAATGCCAAGCCTGACTGGCGAAGATGGTAAGTCTCTGATT +TTCAGCCTCGATATTATGGGCGCACTCCAGCCAACTGTACTTCCGAGTGTACTGGCATTG +GTGATGACCGCAGTGTTCGACGCCACTGGCACCATCCGTGCCGTCGCCGGTCAGGCGAAT +TTGTTGGATAAAGACAACCAGATCATCAACGGCGGCAAAGCCCTGACCAGTGACTCAGTA +AGTTCAATATTCTCCGGCCTGGTGGGCGCAGCGCCCGCGGCGGTTTATATCGAATCAGCG +GCAGGAACCGCCGCCGGGGGGAAAACCGGTTTAACCGCAACCGTGGTTGGTGTGTTGTTC +CTGATGATTCTGTTTTTATCACCGTTATCGTTTCTGATCCCCGGTTATGCCACAGCTCCC +GCACTGATGTACGTGGGTTTGCTGATGTTAAGCAACGTCTCGAAGCTGGATTTCAACGAT +TTTATTGACGCAATGGCTGGCCTGGTGTGTGCCGTGTTCATCGTTCTGACTTGTAATATC +GTTACCGGTATTATGCTGGGCTTTGTAACACTGGTGGTGGGTCGCGTCTTTGCGCGCGAA +TGGCAAAAGCTGAATATTGGTACGGTGATCATTACTGCCGCACTGGTCGCGTTTTACGCG 
+GGTGGTTGGGCAATCTAATAGATTCTCCGCGCCTTTCCGCGCGGAGATTTCTTTCAGAGA +GGATTCTCACTGCTGGCAGCAATACGCTGCTGGCGGATACGCCTGAGTTCTCTTTCAGTC +AGCAACTGCAGCGCCTGTGTCGGGCAAGATTCAACGCAGGCTGGCCCCTCTTCCCGCAGT +TCACAGAGATCGCATTTCACGATTTGTTGCCGGGGATCACCCGGCAATGACTGAATGGTG +ATCATCCCAAACGGGCACGCGCTAACGCAACTCTGACAGCCAATACAACGGGCAGAATTG +GCCTGCACCACCTGCTCGCCCATCGTCAGCGCCCCCACGGGGCAAGCGCCAACACAAGGG +GCGTTTTCACACTGATGGCACATCACCGGCGCACTGATGCTATCCAGCCGTTGTACCTTC +AGCCGGGGTAAAAAGATATCGGCATTCAACTCCTGTTCTGAAGGGTGAGCGACCACACAG +GCCACTTCACAAGTACGGCAGCCAATACAGTCAGCCGGATTAACGATAATTAACGATTTC +ATCACGATGCCTTCGTATCAAACAGAGTTAACATATCGCGCGCCGCCTGCCTTCCTGCGG +CCATTGCAGTGACAACCAGATCCGCGCCATGAACTGCATCACCACCAGCAAAGACTTTTT +TCAGATGCGTCTGGGTAGGTAAATACCCGACGTCGCCGGTTTGAATCAGGCCCCATTTAT +CGAGTTTAATTCCGCTGCCCTGCAACCACGGCATGGTATGTGCCTGGAAACCAAAGGCCA +TAATGAGAACATCGGCGGGCAATTCAAACTCTGAACCCGCAACCGGACGAGGACGACGGC +GACCATCCGGCCCCGGCTCACCCATAGCGGTACGAATCAGGCCCACCGCCGTTAAGCGTC +CATCTTCATCACAAGCGATATATTGCGGCTGAACATTGAACTGAAACTCAACACCTTCCT +CGCGGGCATTGACCACCTCTTTGCGCGAACCCGGCATACTGACTTCATCACGACGATACG +CACAGGTCACGCTGGCAGCATTAAGGCGGATGGAAGTCCGCAAACAATCCATTGTCGTAT +CGCCACCGCCCAATACCACGACTCGCTTCCCTTCCACATCCGTCAGCGGATACTCTGCAG +ACTCCGGCAATCCCATGAGCTGGCGGGTATGGGCGGTCAGGAACGGTAACGCCTGAATGA +CACCAGGCGCATCTTCATGCGGCAGATCTGCTCGCATCATCCCGTAAGTCCCCACGCCGA +GGAAAACAGCATCATATTCCGCCGTTAATTCGTTGAAAGAGATATCGCGGCCAATTTCAC +AGTTGAGATGGAAATCGATTCCCATTGCGGTGAATATCTCTCGCCGCTGGCTTAATACCG +TTTTATCGAGTTTGAAAGGAGGAATGCCAAAAGTCAGCATACCGCCAATTTCTGGATGGC +GATCAAAGACATCAACCTGAACTCCCGCGCGCGCCAGAATATCAGCACACCCTAATCCTG +CAGGTCCAGCGCCAATCACCGCCACTTTTTCGCTACGGGGAACAACTTTGCTGACATCGG +GACGCCAGCCCATCGCCAGCGCAGTATCGGTGATGTAGCGTTCCAGATTACCGATAGAGA +CTGCGCCAGAGTGATCTTTCAAAGTACATGCACCTTCACAAAGACGGTCCTGTGGACATA +CCCTGCCGCAGATTTCGGGTAAGGAACTGGTCTGGTGGCAAAGTTCTGCCGCTTCAATAA +TCTTTCCTTCCTGTACCAGACGGATGTAATCCGGAATAGCGTTATGCAGCGGACAATGCC +AGTTGCAGTTAGCTTTTTCGGCACAATAAACACAGCGGTCACTCTCATAAGTCGCTTGTT +GTGGATCCAGCCCGCAATAGATTTCGCCAAAGTGGGTTTTCCGTTCACTCGCTGAAATTT 
+TATCTGCGCCTTTACGCGAGTTAACGGGGAGCAACGCTGCACTGCGAGATGGCTGAGCGT +CTGATGACGCTTTTCCTGCTGCCGTTTTGCGCTGGCGGGCCACCTTTATCTGCTGCAACC +CTTTATCGTCCATCAGCCGTAACGCCTGTGTTGGGCAGACGTCAATACAGGCTTGCGTGC +CGGAACTGCGCTGGTTACAAAGGTCGCATTTCTGTGCAATCGTATCGACCATCTCAACGA +CGCCAAAGGGGCAAGCGATTGCGCATCTTTTACAACCAATACATTTTTGCTCGTCCAGTT +GTACGCTATCGGACTGGAAAGTCAGAGCATTAACCGGACAAGCCGTAACGCAAGGGGCAT +TGTTGCAGTGATGGCAGGCCACCGGATTCGCAGCCTGGCCTTTCCCTACAACGTGGATAC +GCGGTCGAAAGTCACTGTGACTCAGCGGCCAGTTTTCTTGATTATGTGCCACCGCACAGG +CAATTTCACAAGCATGGCAGCCTATACATTCCGCAGCTTCAGCAGCGATAAACTTATTCA +TTTGCATCCCTTTCATTTAATGAGTTATGTCTTCTCAAATTTCGCGATGCAATAAACGGG +CATATATTAGGTAGCATGACCGTTTTAATTATAATTTTGCAACTGAGTTCAAATTATTGC +CCCTCAATCTATGCCGCTTTCATTATTTCAACATTGCCGATCAAAAGAATGCTATCCAGA +TAAAAACGATTAAATGCGAGAGTGCGACATGCCAGAATGATTAATGAAATATCAATATGA +GAAAATTACAGATAATTCCATTGTCAGGTTCTCTTCTCATAATCGTGGTTTAACCACGAT +TATGTGATTGCCTCCGCAATTCCTGTCTCTAACTCCCCTTCCTCGCAAAAACTGGCACTC +CACGAGCATGTGTTTAGACAGTTTCATGAACATAAACGGTTGCTTTTTACTCTGGCGGGC +GAAAGGAGAAACACTGATGAGCGCCATAGATTCCCAACTTCCCTCATCTTCTGGGCAAGA +CCGCCCAACTGATGAGGTTGACCGCATATTATCACCAGGAAAGCTGATCATACTCGGTCT +GCAACACGTCCTTGTCATGTACGCAGGTGCAGTCGCTGTTCCTCTTATGATTGGTGACCG +ACTCGGCCTATCAAAAGAAGCTATTGCGATGCTCATCAGCTCGGATCTCTTTTGCTGCGG +GATCGTCACATTATTGCAATGTATCGGTATCGGCCGCTTTATGGGGATCCGCCTGCCGGT +GATTATGTCGGTGACCTTCGCCGCTGTAACACCAATGATAGCCATTGGTATGAACCCGGA +TATCGGCCTGCTGGGGATATTCGGTGCCACTATCGCCGCGGGTTTTATCACCACATTATT +AGCGCCACTTATCGGTCGCTTGATGCCTTTATTCCCGCCACTGGTTACCGGTGTGGTGAT +TACTTCTATCGGGCTTAGCATCATTCAGGTGGGTATTGACTGGGCCGCCGGAGGTAAAGG +GAATCCGCAATATGGTAATCCCGTTTATTTAGGTATCTCCTTTGCCGTCTTAATTTTTAT +CTTGCTCATTACTCGCTATGCGAAAGGATTTATGTCCAACGTCGCCGTATTACTGGGGAT +TGTATTTGGCTTTTTACTTTCGTGGATGATGAATGAAGTCAATTTATCCGGGCTACATGA +TGCTTCATGGTTTGCGATTGTCACGCCGATGTCATTTGGTATGCCGATTTTCGATCCCGT +TTCCATTCTGACCATGACTGCCGTGTTAATCATCGTGTTTATCGAGTCGATGGGGATGTT +CCTGGCACTGGGTGAAATAGTCGGTCGCAAACTCTCTTCCCAGGACATTATTCGTGGGTT +ACGCGTAGATGGGGTTGGGACAATGATTGGAGGCACGTTTAACAGCTTCCCACATACGTC 
+ATTTTCGCAGAACGTCGGGCTGGTCAGCGTGACGCGCGTCCACAGCCGCTGGGTGTGCAT +TGCTTCCGGTATCATTTTGATCCTGTTCGGCATGGTGCCCAAAATGGCGGTGCTGGTGGC +CTCGATTCCGCAATTTGTGCTGGGCGGCGCGGGGCTGGTGATGTTCGGCATGGTACTGGC +GACAGGGATTCGAATTCTGTCGCGCTGTAACTACACCACTAACCGTTACAACCTCTATAT +TGTGGCGATCAGTCTCGGTGTTGGCATGACGCCAACGCTCTCTCACGATTTCTTTTCTAA +GTTACCGGCCGTACTGCAACCGTTGCTGCATAGCGGCATTATGCTCGCAACCCTTAGCGC +CGTTGTGCTGAACGTCTTCTTTAATGGCTACCAGCATCATGCTGACCTGGTGAAGGAATC +CGTCTCTGATAAAGATTTAAAAGTCAGGACAGTACGTATGTGGCTTCTGATGCGCAAGCT +GAAGAAAAATGAGCATGGAGAATAATATGAATCTTTTAATGCGCGCTATATTCAGTCTGC +TGTTGCTTTTTACTCTCTCTATTCCTGTCATTTCTGATTGTGTTGCAATGGCCATTGAAA +GTCGCTTCAAATATATGATGCTGCTTTTTTAAATGGTTTTTACCTGTCGACATCCGCTCA +AAACGGGCGGTTGTCGATAAACGCTCACTTGGTTAATCATTTCACTCTTCTATTATCTAT +AATGATGAGTGATCAGAATTACATGTGAGAAATTATGCAAACGGAACACGTCATTTTATT +GAATGCACAGGGAGTTCCCACGGGTACGCTGGAAAAGTATGCCGCACACACGGCAGACAC +CCTCTTACATCTCGCGTTTTCCAGTTGGCTGTTTAATGCCAAAGGGCAATTATTAGTTAC +CCGCCGCGCCCTTAGCAAAAAAGCATGGCCTGGCGTGTGGACTAACTCGGTTTGTGGGCA +CCCACAACCGGGAGAAAGCAACGAAGAGGCGGTGATCCGCCGTTGCCGTTATGAGCTTGG +CGTAGAAATTACGCCTCCTGAATCTATCTATCCTGACTTTCGCTACCGCGCCACCGATCC +GAATGGCATTGTGGAAAATGAAGTGTGTCCGGTATTTGCCGCACGCACGACCAGTGCGTT +ACAGATCAACGATGATGAAGTGATGGATTATCAATGGTGTGATTTAGCAGCGGTTTTACG +CGGTATTGATGCTACGCCGTGGGCGTTCAGTCCGTGGATGGTGATGCAGGCGACAAATCG +CGAAGCCAGAAAACGATTATCTGCATTTACCCAGCTTAAATAAAAAACCCCGACGGTTGC +CGGGGTTGTGAGCATAACGTAATGCTTATTTTACCGGACGCATCGCCGGGAACAGAATAA +CGTCGCGGATGGTATGGCTGTTGGTGAACAGCATTACCATACGGTCGATACCAATTCCCA +GACCGGCTGTCGGTGGTAAGCCATGTTCCAGTGCGGTGACATAATCTTCGTCGTAGAACA +TCGCTTCGTCGTCACCTGCATCTTTCGCGGCAACCTGATCCAGGAAGCGCTGCGCCTGAT +CTTCCGCGTCATTCAGCTCGCTAAAGCCGTTACCGATTTCACGCCCACCAATGAAGAACT +CAAAGCGGTCTGTGATTTCCGGGTTAACGTCGTTACGACGCGCCAGAGGAGAAACTTCTG +CCGGATATTCAGTAATGAAGGTCGGCTGGATCAGATGTGCTTCTGCCACTTCTTCGAAGA +TCTCGGTAACGATACGGCCCAGACCCCAGCTCTTCTCAACGTGGATGCCGATAGATTCAG +CAATCGCTTTCGCAGAGTCGAAGTTGTCCAGATCTGCCATGTCGGTTTCCGGGCGATATT +TCTTGATCGCTTCACGCATGGTCAGTTTTTCGAACGGCTTACCGAAGTCCAGCGTTACGT 
+CGCCGTAGGTCACTTCCGTCTTACCGAGAATATCCTGTGCCAGAGTACGGAACAGCGATT +CGGTCAGCTCGATCAGATCTTTGTAATCTGCGTAAGCCATATAGAGTTCCATCATGGTGA +ACTCTGGGTTATGACGTACGGAAATACCTTCGTTACGGAAGTTACGGTTGATTTCGAATA +CACGCTCGAAGCCACCGACCACCAGACGCTTGAGGTACAGTTCCGGCGCGATACGCAGGT +ACATGTCGAGATCCAGCGCGTTATGGTGGGTGATGAACGGACGCGCAGCGGCACCGCCAG +GGATCACCTGCATCATCGGCGTTTCAACTTCCATAAAGCCGCGATTCACCATGAACTGGC +GAATACCAGAGAGGATCTGCGAGCGCACTTTAAAGGTGTTGCGGGATTCATCGTTAGAGA +TGAGATCCAGATAACGCTGACGATAGCGCGCTTCCTGATCCTGCAAGCCGTGGAATTTAT +CCGGCAGCGGACGCAGTGCTTTGGTCAGCAGACGCAGCTCGGTACAGTGGATAGACAGTT +CGCCGGTTTTGGTTTTGAACAGTTTACCTTTCGCGCCGAGGATATCGCCGAGGTCCCATT +TTTTGAACTGCTCGTTGTAAACGCCTTCCGGCAGATCGTCACGGGCAACGTACAACTGAA +TGCGACCGCCAACGTCCTGCAGGGTAACGAAAGACGCTTTACCCATAATACGACGGGTCA +TCATGCGGCCAGCAACGGCGACTTCGATGTTCAGCGCTTCCAGTTCTTCGTTCTCTTTAC +CGTCGAATTCTGCGTGCAATTGGTCAGAGGTATGATCGCGACGGAAATCGTTCGGGAAGG +CAATCCCCTGCTCACGCAGGTTCGCCAGCTTCTCACGACGCGTTTTCAGTTCATTGTTAA +GATCGACTACCGCGTCAGCGCCCTGTGCGTGTTGTTCAGACATGTTGGTTCCTCATAACC +CTGCTTTCAAACTTGCTTCGATAAATTGATCCAGGCTGCCGTCCAGCACGGCCTGCGTGT +TGCGGGTTTCTACCCCGGTACGCAGATCTTTAATGCGGGAGTCATCAAGGACATAAGAAC +GAATCTGGCTGCCCCAGCCGATGTCGGATTTGTTATCTTCCATCGCCTGTTTCTCGGCAT +TTTTCTTCTGCATCTCCAGTTCATAAAGCTTCGCTTTCATCTGCTTCATGGCCTGGTCTT +TGTTCTTGTGCTGGGAACGGTCGTTCTGGCATTGGGTCACGATCCCGGTTGGGATGTGAG +TAATACGCACCGCAGATTCGGTACGGTTAACGTGCTGACCGCCCGCGCCGGATGCGCGAT +AAACGTCGATGCGCAGATCCGCCGGATTGATTTCGATATCGATATCATCATCAACTTCCG +GGTAAACAAACGCGGAGCTGAACGACGTGTGGCGACGACCACCGGAGTCAAACGGGCTCT +TACGCACCAGGCGGTGAACGCCGGTTTCTGTACGCAGCCAGCCATAAGCGTAATCGCCGG +AGATTTTGATCGTCACGGATTTAATACCCGCCACTTCACCTTCCGACTCTTCGATGATTT +CAGTTTTGAAACCACGCGATTCAGCCCAGCGCAGATACATACGCTCAAGCATGCTCGCCC +AGTCCTGTGCTTCCGTACCGCCAGACCCCGCCTGAATATCGAGGTAGCAGTCGGCGCTGT +CATATTCGCCAGAGAACATACGGCGGAACTCAAGCTGCGCCAGTTTTTCTTCCAGGGCGT +CGAGTTCAGCAACGGCTTCGTTAAAGGTTTCTTCGTCGTCAGCTTCTACAGCCAGTTCCA +GCAGACCAGAAACATCTTCCAGCCCCTGTTTCATTTGGTCGAGGGTGTCGACAACGGCTT +CGAGGGAGGAACGCTCTTTACCCAGCGCCTGTGCGCGTTCGGGTTCGTTCCAGACATCCG 
+GCTGTTCCAGCTCGGCGTTTACTTCTTCCAGACGCTCTTTCTTGGCGTCATAGTCAAAGA +TACCCCCTAAGAACGTCGGAGCGTTCCGTGAGGTCCTGAATGCGATTATTTACCGGATTA +ATTTCAAACATGGTCTGATTTCTTTTATTGAGCTAGTCAAAATGCGGTGATTAGAGCGGG +ATTGTACCCAATCCACGCTCTTTTTTATAGAGAAGATGACGCTAAATTGGCCAGATATTG +TCGATGATAATTTGCAGGCTGCGGTTGCCGCGAAACTCGTTGATATCGAGCTTGTAAGCC +AGTTGCACTTCGCGCACGCCGTTATCCGGCCAGAGGGCGGTATCGACATTAAAAGCAATA +CCATCCAGCAGCGGACCGCCGCCGACCGGCTCGACCATGACTTTCAAATGACGCTCGCCC +ACCAGCCGCTGTTGCAGCAGACGGAAATGACCGTCAAACAACGGTTCCGGGAACATTTGT +CCCCACGGGCCAGCATCACGCAGCAGTTGCGCCACTTCCATGGTCATCTCTGCCGCACTT +AATGGGCCGTCTGATACCACTTCCCCTTGCAATAAAGAAGGATCTAACCACTCGGTAACC +AGTTCGCCAAAGCGTTGCTGAAAGAGTTCGAATTTCTCCTCTTCCAGCGACAAACCCGCC +GCCATCGCATGGCCGCCAAACTTGAGCATCATGCCGGGGTAAAGCGTGTCTAGCCGCTCC +AGCGCATCGCGCATATGCAGCCCCTGAATGGAGCGACCGGAACCTTTCAGCGTACCGTCG +CCCGCAGGCGCAAAGGCGATAACCGGACGGTGAAAACGCTCTTTGATACGCGATGCCAGA +ATGCCAACAACGCCCTGATGCCATTCAGGGTGATACATTGCCAGCCCACCTGGCAGCGTG +TCGCGGCTACGTTCCAGCTTCTCGCACAGAGTGAGCGCTTCAACCTGCATTCCCTGTTCG +ATCTCTTTACGTGTTTGGTTTAGTGCATCGAGTTCATTCGCCAGCACACGCGCTTCGCCA +ATGTTGTCACACAACAACAGCGCCACGCCAACGGACATATCGTCCAGTCGCCCGGCAGCA +TTGAGACGTGGCCCCAGCGCAAAACCTAAATCGCTGGCGGCGAGTTTTTGTGGATCGCGA +TTGGCCACTTCCAGCAGCGCTTTAATCCCCGGACGGCACTTTCCGGCACGGATGCGACTC +ATCCCCTGCCAGGTCAGAATGCGATTATTAGCGTCCAGCGGCACGACGTCCGCCACTGTC +CCCAACGCTACCAGATCCAGCAGTTCTGCCAGATTAGGAATTGCGATGCCGCGCTCATCA +AACCAGCCCTGATCGCGCAAAAAGGTGCGCAGCGCCAGCATCAGATAAAACGCCACACCC +ACGCCTGCCAGTGATTTCGACGGGAAATTACAGTCGCGCAAGTTAGGGTTAATGATCGCT +TCCGCTGCGGGTAATGTGTCGCCTGGCAAATGGTGATCGGTAACAATAACCGGAATGCCC +AACGAACGAGCGTGTTCAACCCCCGCATGGGAGGAAATACCGTTATCCACCGTGACAATT +AACTGCGCGCCACGGGCATGAGCCTGATCGACTACTTCCGGGCTTAAGCCGTAACCGTCT +TCGAAACGGTTTGGAACCAGGTAGTCGATATTGCTGCAACCAAGCGAGCGCATCGCCAGC +ACGCTTAGAGCCGTGCTGGTCGCACCGTCGGCGTCGAAATCACCGACCACAATAATCCGC +GTTCCTTCGCGAAAAGCGTTGTAAAGGATCTCAACGGCCTTTTCGACGCCGCTCAGTTGC +TGCCAGGGCAGCATGCCTTTAACACTGCGTTCCAGTTCCTGCGCGCTACGCACACCCCGG +CTGGCATATAAACGGCGCAGCAAGGGAGGCAATTCAGCGGGCAAGTCGGCCGTTTCATCG 
+ACTTCTCGGCGACGAAGTTGTATCTGTTGTTTCACGCGAATTATTTACCGCTGGTCATTT +TTTGGTGTTCGTCGAGGAATTCTTTCATGTCTTTCGGCGGCTGGTAACCCGGAACAAGTG +TGCCATTGCTCAGCACAACTGCCGGAGTACCGCTAACGCCAAGCTGGACGCCAAGTGCGT +AATGGTCGGCAATATCCACGTCGCAGCTGGCTGGTGCGACGCTTTTACCTGCCATCACAT +CATCAAACGCTTTGTTTTTATCTTTCGCACACCAGATAGCTTTCATTTCTTTCTCTGCAT +CGCTGTCCAGCCCCTGGCGCGGGAAAGCAAGATAACGCACGGTGATCCCCAGCGCGTTAT +AGTCTGCCATTTGCTCATGCAGTTTGTGGCAGTAACCACAGGTAATATCAGTAAACACGG +TGATGACGTGTTTTTCCTGCGGCGCTTTATAAACGATCATCTCTTTTTCAAGCGCATTCA +ACTGCTTTAACAGCATCTTATTGGTGACATTGACCGGAGCCGTGCCACTAACGTCATACA +TTGGCCCCTGAATGATATGTTTACCATCATCGGTGATGTACAACACACCGCTGTTAGTCA +GAACTGTCTTCATGCCAGCTACGGGCGCGGGCTGAATATCGCTGCTTTTGATGCCCATTT +TGGCTAACGTTTGTTGAATTGCCGCGTCATCAGCCTGAACAAAGCCTGAAAACGCTGCCA +ACAAGGTAAATAACATAAAACCTTTCTTCATAAATTTTCCTGTTCTTTTCAGACATCACG +CCCGCGGGTGATGCTGTTGATGAAGTTGTCGCAGACGCTCGGTAGCGACATGCGTATAAA +TTTGCGTGGTGGAGAGATCGCTGTGGCCCAGTAGCATCTGCACCACGCGTAAATCCGCAC +CATGATTTAATAAGTGAGTGGCAAAAGCGTGACGCAACACATGCGGTGACAGCTTTTCGC +TGTCGATACCCGCCAGCACGGCATAATGTTTAATGCGGTGCCAGAAGGTCTGTCGCGTCA +TCTGCTGCGCACGCTGGCTGGGAAACAACACGTCAATTGACACACCATTCAACAGCCACG +GACGCCCATGTTCCAGATAGGTTTCCAGCCAGTAAACCGCCTCTTCACCTAACGGCACCA +GGCGCTCTTTGTTGCCTTTACCAATGACCCGCACCACGCCCTGACGCAGGCTGATATCAC +TCATTGTCAGCCCGACCAGTTCAGAGACACGCAGTCCGGTAGCATACAACACTTCAAGCA +TGGCTTTATCGCGTAGCTCCAGTGGCTGATCAATTAATGGTGCCTGTAATAAACGTTCGA +CCTGCGCTTCGCTTAAATCTTTTGGCAAACGCTGGGGCAATTTCGGTGAAGCGAGATGCG +CACTGGGATCATCTTCACGAAACTTTTCGCGATAAAGATACTGGAACAATCGGCGCACTG +CACTCAGCAAACGCGCTGAGCTGGTGGCTTTATACCCGCCCTCCAGCCGTTCTGCCAGTA +ATGCCTGCAAATCGTCACTTTGCGCCGTCGCCAGCGTCAACCCGCGGTGATGCAACCACT +CCACCATCATTGACAGATCGCGACGGTAAGCGTTCAACGTATTTTCAGCCAGATTTTTTT +CCAGCCACAGAGCATCAAGAAACTGCTCGATGCGTGCCAGATCCTGTTTCACTTGCGCCC +CTTATGGTCACTCATTTGATCCATTATGCCTTATTGTGCCGTGACTAAAGCGATTCTGAT +ACACTAGCCGCAAAAGCCACAGCAGAATCGAGAAGCTTACGTTATGAATATGGGTCTTTT +TTACGGTTCCAGCACCTGTTACACCGAAATGGCGGCAGAAAAAATCCGCGATATTATCGG +CCCAGAACTGGTGACCTTACATAACCTCAAGGACGACTCCCCGAAATTAATGGAGCAGTA 
+CGATGTGCTCATTCTGGGTATCCCGACCTGGGATTTTGGCGAAATCCAGGAAGACTGGGA +AGCCGTCTGGGATCAGCTCGACGACCTGAACCTCGAAGGTAAAATTGTTGCGCTGTATGG +GCTTGGCGATCAACTGGGATACGGCGAGTGGTTCCTCGATGCGCTCGGTATGCTGCATGA +CAAACTCTCGACCAAAGGCGTGAAGTTCGTCGGCTACTGGCCAACGGAAGGATATGAATT +TACCAGCCCGAAACCGGTGATTGCTGACGGGCAACTGTTCGTGGGTCTGGCGCTGGATGA +AACTAACCAGTATGACCTTAGCGACGAGCGTATTCAGAGCTGGTGCGAGCAAATCCTCAA +CGAAATGGCAGAGCATTACGCCTGATGTCACTGACGGCTTAGCACATATGCTTTGCCGTC +ATCTTTATCTTTGCGTCTCTTGTTGTAACAATATCCGCCGTAAATCCCGCCATTCGGCTT +CGTCCATGCTGTCAGCTGCCAGCCATAAATGTTGCCGTTTTCCGCTGTCAGAACGTAAAC +GCAGCATCATGCCGCTCTTAATCATCCACGGCGCTTTGACGATGCTCCACTCCTGCCCTT +GCCAACGCAAACGCCCGTCCATCAACAAGCGAATTTCCCCCTGGCGAGCATTAATGCGCC +GCTGGCTGCGAACGCAATCAAACACCACCAGCGAAAGTAACACCATCCATAACGGGGTGT +AACTGAGCGGCCAGGGCATGAGTAAAATAACAGCGGCAACCAGCCCATGAATCAGCAAGG +AAAGCCACTGTGCGCGCCAGGAGACGCGCAAATCAGATTGCCACAGGACCACGTTCCCGG +TTCCGTGTCTGGATGAGTCGGACCATCATTTCCAGTTCTGCATCGGCTGGTTTACCGTGA +TTCATCAGCCAGTTAAACAGGTCCGGATCGTCACATTCCAGCAGACGAATAAAGATGCGT +TTTTCGTCATCGCTTAAGCTGTCGTACTCATGTTCGAAAAACGGCATGATTGAAATATCG +AGTTCGCGCATACCACGGCGGCATGCCCAATGAATGCGGGCTTTGTTGTTAATGTCCATC +TTCTTCCTGTCTCACGAAAATCCAGTACCCGGCTATTGTAACGTGTTTTTCGACTTCTTT +TACGGGAATATCAGTAAACACAATCGCGATCGCGAAATTAATTCACAACAATTCAAGGGC +TTCATTTTTTTGGAAGTCGCCTCGCAGAAGGCACAGATCGCGTAGTGAAAGCACTTGCAT +TGCCTCATAGCTCTTTTACCATTAGTTATTAATACGCCGTTAAGCAACTCAGGACTCTAT +TATGGCTTTTACACCTTTTCCTCCCCGTCAGCCTACGGCTTCTGCCCGTTTGCCACTGAC +GCTGATGACGCTTGATGACTGGGCGCTTGCCACTATTACTGGCGCGGACAGCGAAAAATA +TATGCAAGGCCAGGTGACAGCAGATGTCAGCCAGATGACAGAAGATCAGCACCTGCTCGC +CGCCCATTGCGACGCCAAAGGTAAAATGTGGAGCAATTTACGTCTGTTCCGCGACGGCGA +TGGCTTTGCATGGATTGAACGGCGCAGCGTGCGTGAACCACAGCTGACTGAACTGAAAAA +ATATGCGGTGTTCTCTAAAGTGACAATCGCGCCAGACGACGAGCGTGTGCTGCTTGGTGT +TGCCGGTTTTCAGGCGCGCGCCGCGCTGGCAAATCTCTTTAGTGAACTGCCTTCGAAAGA +AAAACAGGTAGTTAAAGAAGGCGCGACTACTCTGCTTTGGTTTGAACATCCGGCAGAACG +TTTCCTGATCGTAACCGATGAAGCTACTGCCAATATGCTGACCGATAAACTGCGCGGTGA +AGCGGAACTGAACAATAGCCAACAGTGGCTGGCATTAAACATTGAAGCGGGTTTCCCGGT 
+GATTGATGCCGCCAACAGCGGGCAGTTTATCCCCCAGGCGACCAACCTCCAGGCGCTGGG +CGGTATCAGCTTTAAGAAAGGCTGCTATACCGGACAAGAGATGGTGGCGCGAGCAAAATT +CCGTGGTGCCAACAAACGCGCGCTCTGGTTGCTGAAGGGTAGCGCCAGCCGACTGCCGGA +AGCTGGTGAAGACTTAGAGCTGAAAATGGGCGAGAACTGGCGTCGTACCGGTACGGTGCT +GGCTGCGGTCAAACTGGAAGATGGTCAGGTTGTGGTGCAGGTTGTCATGAATAACGATAT +GGAACCGGACAGCATCTTCCGCGTGCGTGACGATGCGAATACATTGCGTATCGAGCCACT +GCCATATTCGCTGGAAGAGTAAATCTCTGTATCGCATCAGGCATTTATCGCCTGATGCGA +CACTGGTGTGTCTTTTCAGGCCTACAAAGGCACGCCAATTACGCCTGCCCAATATACAAA +TAGATCGCCAGAAAGTGGCACACACTACCGCCGAGCACAAAGCCGTGCCAGATGGCATGA +TTGTATGGAATGCGCTTGCAGACGTAGAAAATCACCCCGAGCGAATAAACCACACCGCCT +ACCGCCAGTAAGGTAACGCTGCCCGCCGCGAGCTTAACTGCCATTTCATAAATTACCACC +AGCGACAGCCAGCCCATCGCCAGATAGGTCACCAGAGATAAAATTTTGAATCGGTGCGCG +ATGGTCAGTTTAAACAGAATACCCAGCAATGCCAGGCTCCAGATAACAATCATCAACCCG +CGCGCTAACGGAGAATCCAGCCCCACCAGCAAAAACGGCGTATAGGTTCCGGCAATCAAC +AGATAAATGGCACAGTGGTCAAATTTCTTCAGCCACATTTTTGCCCGTTGATGGGGAATG +GCGTGATAGAGCGTCGAAGCGAGGAACAGCAGGATCATACTGCCGCCATAGAGGCTGTAA +CTGGTTATCGCCGTGGCGCTGGCATTGAGATCCACCGCCTGAACCAGTAGCAACACCAGC +CCAACGATACCAAACACCAGCCCAATGCCGTGACTGACGCTGTTGGCAATTTCCTCTGCC +AGCGAATATCCCTGCTTAATGAGGGGCTTCTGAACCATAACTTACTCCGGAAAAACGTAC +ACGCACATGTATACCTCTCCAGCGTAACTGAGAATAGTTCCAGTGAACACCTGTTAGCTA +AAATAAATTCTGATTTGAGATTAATCTCCGAAAAATCATGAAATTAAATGCGAAATTTCA +ACTAACAGGCGTGAGTTCAATTTAAAGACATTTAAATTCAATCACATAAAACTGTGTCTG +GTCGGGATAGATGTCGGCAATGACCTTTTTCAGTTCAGTCAGGGTCATATTTTCCTGCTC +TGCATGTTTTTCCGTCAGCGTATCCAGCGTTACGGTTGAGGTTGCGGTGACTTCAATCGT +GCAAAAATAACCGTCATCTTCAAAACGTCCGACACGAAGCACATCACCCGTTTTGAAGTG +CGATTCAGACTCGTCGCGGATGGTGATGGTTTTACGCCCAGCCAGAATGTCATCCTGGAA +ACGTTGAAAAAAAGTGATGTCGTTTGGCTGCATGGTAATATTTCCTGTAAGAATTGACTC +ATCTGGAGCCTATGATAGTGAAAAAACTCACCTTACCGAAAGATTTCTTATGGGGCGGCG +CAGTTGCCGCTCATCAGGTCGAAGGCGGCTGGAACAAAGGCGGCAAAGGGCCGAGCATTT +GTGACGTTTTGACCGGTGGCGCACACGGCGTGCCGCGCGAAATCACCAAAGAAGTTGTGC +CTGGCAAATACTATCCAAACCATGAAGCCGTTGATTTTTATGGTCACTACAAGGAGGACA +TCAAGCTATTTGCCGAAATGGGCTTCAAATGTTTTCGTACTTCCATCGCCTGGACGCGCA 
+TTTTTCCAAAAGGCGATGAAGCTCAGCCAAACGAAGAAGGGCTGAAGTTCTACGATGATA +TGATCGATGAACTGCTGAAATACAACATCGAACCGGTGATCACCCTCTCCCACTTTGAAA +TGCCGCTGCATCTGGTGCA +>bis +GCAATATGGTAGCTGGACCAACCGTAAAGTGGTTGATTTCTTTGTCCGTTTCGCGGAAGT +GGTATTTGAACGCTATAAGCATAAAGTCAAATACTGGATGACTTTCAACGAAATTAACAA +CCAGCGTAACTGGCGTGCACCGCTGTTCGGTTACTGCTGCTCCGGCGTGGTGTATACCGA +GCATGAAAACCCGGAAGAGACGATGTATCAGGTGCTGCATCACCAGTTTGTCGCCAGCGC +CCTGGCGGTGAAAGCCGCGCATCGCATCAACCCGGAGATGAAAGTCGGTTGTATGCTGGC +GATGGTGCCGCTCTATCCTTACTCCTGTAACCCGGACGATGTGATGTTTGCCCAGGAGTC +GATGCGCGAACGTTACGTCTTTACCGATGTGCAGTTGCGTGGCTATTACCCGTCCTATGT +GTTGAACGAGTGGGAACGCCGCGGATTTAACATCAAAATGGAAGACGGCGATCTGGATGT +ACTGCGCGAAGGCACCTGCGATTATCTCGGCTTCAGCTATTACATGACCAACGCGGTGAA +GGCCGAAGGTGGCACCGGCGATGCGATTTCTGGTTTCGAAGGCAGCGTACCGAATCCGTA +TGTTAAAGCGTCTGACTGGGGCTGGCAGATTGATCCGGTTGGTCTGCGCTACGCACTTTG +CGAGCTGTATGAGCGTTACCAGAAGCCGCTGTTTATTGTCGAAAACGGTTTTGGCGCTTA +CGACAAAGTGGAAGATGATGGCAGCATCAATGACGATTACCGCATTGATTACCTGCGTGC +CCATATTGAAGAGATGAAAAAAGCGGTGACTTACGATGGCGTGGACCTGATGGGCTACAC +GCCGTGGGGCTGCATCGACTGTGTGTCGTTCACCACCGGGCAGTACAGCAAACGCTACGG +CTTTATCTATGTGAATAAACATGACGACGGTACTGGCGATATGTCGCGTTCACGTAAGAA +GAGCTTTAACTGGTACAAAGAGGTGATTGCCAGCAACGGCGAGAATCTGTAATTAGCCGA +TGTGCCTGATGTGCTCCGCTCATCAGGCCTGGCACTCTTTTAATATATTGAGCTCGCAAT +ATTTTATATTACGCCTCAGCCGAAACACACAAAGCGCACTTTATTAACAAGCGAAAAAGG +CGCCGAAGCGCCTTTATAAGATAGTCGAATCAGTAAATTACTGGTATTCGCTAATCGGTA +CGCAGGAGCAGAACAGGTTACGGTCGCCGTAAACATCATCCAGACGTTTCACGGTCGGCC +AGTATTTGTCTGCCACACCTGCCGGGAATACTGCAACTTCACGGCTGTACGGATGCGCCC +ACTCGGCGACCAGTTCGCTTTGAATGTGCGGCGCATTCACCAGCGGGTTATCTTCCAGCG +GCCAGACACCGGCTTTCACCTGATCAATTTCTGCGCGGATAGCCAGCATCGCATCGATAA +AGCGATCCAGTTCCACTTTGCTTTCAGATTCAGTCGGTTCAACCATCAGCGTACCCGCCA +CCGGGAACGACATGGTCGGCGCGTGGAAACCGTAGTCGATCAGGCGCTTGGCAATATCCA +GCTCGCTGATGCCGGTTTCTTCTTTCAGCGGGCGAATATCGAGAATACATTCGTGCGCCA +CGCGACCGTCGCGACCGGTATACAGCACCGGGAAGGCATCCTGCAGACGGCTGGCAATAT +AGTTGGCGTTAAGAATTGCCACCTGGCTTGCTTTTTTCAGCCCTTCTGCGCCCATCATGC 
+GGATGTACATCCAGCTGATTGGCAGGATAGAGGCACTACCGAACGGTGCCGCAGAAACCG +CGCCCTGACGGGTTAACATGCCTTCGATTTGCACCACGCTATGACCCGGTACAAACGGAG +CCAGATGCGCTTTCACACCGATCGGTCCCATACCCGGACCACCACCGCCATGCGGAATGC +AGAAAGTTTTATGCAGGTTAAGGTGGGAAACGTCCGCACCAATAAAGCCCGGCGAGGTGA +TGCCAACCTGAGCGTTCATGTTCGCGCCATCAAGGTAAACCTGACCGCCGAACTGATGCA +CGACTTCACACACTTCACGGATCGTTTCTTCATACACGCCGTGGGTAGAAGGATAGGTCA +CCATGATACAGGAGAGGTTATCGCCCGCCTGTTCCGCTTTCGCGCGCAGATCAGTCAGAT +CGATGTTGCCGTTTTTATCACACGCCACAACCACCACCTGCATTCCTGCCATATGCGCGG +AAGCCGGGTTAGTGCCGTGCGCAGAAGCCGGGATCAGGCAGATATCGCGATGCCCTTCGT +TGCGGCTTTCATGATAATGACGAATCGCCAGCAGGCCCGCGTATTCGCCCTGTGCGCCAG +AGTTCGGCTGCATACAAACGGCGTCGTAACCGGTCAGTTTCACCAGCCAGTCAGCCAGCT +GCGCGATCATCTGCTGATAACCTTCAGCCTGTTCTGGCGGGCAAAACGGGTGCAGTTCGG +CAAATTCCGGCCAGGTGATCGGGATCATCTCGGCGGCGGCGTTCAGTTTCATGGTGCAGG +AACCCAGCGGGATCATCGCCTGATTCAGCGCCAGATCTTTACGCTCCAGCGAGTGCATAT +AGCGCATCATTTCGGTTTCGCTGTGGTAGCGATTAAACACCGGATGGGTGAGGATTTCGT +CGTCGCGCAGCATCGCAGCCTGAATAGAGCGACTGTCGTGAGCCACGTCTTTGTCCAGTG +TGTCGATGTCCAGCCCGTGGTTATCGCCCAACAGCACGCTGAAAAGCTGCATCACGTTTT +CGCGCGTGGTTGTTTCATCAAGGGTGATCCCAACCGCGTTCAGAATATCGCTACGCAGGT +TGATTTCAGCCGCTTCGGCACGCGCCAGCACGCCCGCTTTGTCGGCCACTTCCACACACA +AAGTATCGAAATAGTGCGCATGGCGCAGCTTCAGACCTTTTTGTTGCAGGCCCGCCGCCA +GGATATCGGTCAGACGGTGGATGCGATTAGCGATACGTTTCAGGCCAACCGGACCGTGAT +AAACGGCATACAGGCTGGCAATGTTTGCCAGCAGTACCTGGGAAGTACAAATGTTGGAGT +TCGCTTTCTCACGACGAATATGTTGCTCGCGAGTCTGCATCGCCATGCGCAGAGCGGTGT +TGCCAGCTGCATCTTTCGATACACCGATAATACGGCCCGGCATTGAGCGTTTGTATTCGT +CTTTCGCCGCAAAGAATGCCGCGTGTGGGCCACCATAGCCCATCGGTACGCCAAAGCGTT +GCGCCGAACCAAAAACAATATCCGCGCCCTGTTTACCTGGCGCAGTTAACAGCACCAGCG +CCATAATATCGGCGGCAACGCTGACCACAATTTTGCGTGATTTCAGTTCGCTAATAAGCG +CGGTGTAGTCGTGAATTTCACCAGTAGTGCCGACCTGCTGTAACAGCACGCCGAAAACGT +CCTGATGGTCGAGCACTTTTTGCGCGTCATCGACAATCACTTCAAAACCAAAGGTTTCGG +CACGAGTACGGACCACATCCAGCGTTTGCGGATGAACGTCAGAAGCAACAAAGAAGCGGT +TGGCATTTTTCAGTTTGCTGACGCGTTTCGCCATCGCCATTGCTTCGGCGGCAGCGGTGG +CTTCGTCAAGAAGAGAAGCAGAGGCCATATCCAGCCCGGTTAAATCCAGCGTTACCTGCT 
+GGAAGTTGAGCAGTGCTTCAAGGCGGCCCTGGGAGACTTCAGGTTGATACGGAGTATACG +CGGTATACCAGCCCGGATTTTCCAGCATGTTACGCAGGATAACCGGCGGTAGCTGCACGG +CGGTGTAACCCATGCCGATGTAAGACGTGAAGCGTTTATTGCGACTGGCAATAGCCTTGA +GTTCTGCCAGTGCGGCGTATTCGGTCGCCGGTGCGCCAACCTGCGGCGGAGTCGCAAGCT +GAATATCTTTCGGCACAATCTGGCCGGTCAGCGCGTTTAACGATTGTGCGCCAACGGCAT +TCAGCATTTCTTGCTGTTGCGCGGCGTCCGGTCCGATATGGCGTTCAATAAAAGCGCCGC +TGTTTTCAAGCTGGCTTAACGTCTGTGTCATGAGCGATGGTTCCTGAAACGTGCAGTGAA +TTGTGAACCTCTCTCCTTGCGAAGAGAGTGAGGGTGAGGCGTAAATTTCCTCACCCTGAT +CCTCTCCCGCAGAAGAGGAATAAAGCCGTTACTCGTCTTCTAACAATGCTTCGTATGCGG +TTGCATCCAGCAGTGATTCCAGTTCGCTTTCATCGCTGGCTTTGATTTTGAAAATCCAGC +CGCCTGCATACGGTTCGCTGTTCACCAGTTCCGGGAAATCGCTCAGTGCATCGTTTACCG +CCACGATTTCACCGCTTACTGGCGCATAAATGTCTGACGCCGCTTTTACCGATTCGGCAA +CCGCGCAGTCATCGCCCGCGCTAACCGTTGCGCCCACTTCCGGTAGGTCAATAAACACCA +TATCGCCTAACAGCTCCTGAGCGTGTTCGGTGATGCCAACGGTGTAAGTGCCGTCGGCTT +CTTTACGCAACCATTCGTGTTCTTTGCTGTATTTCAGTTCTGCTGGTATGTTGCTCATCA +ATCAATCTCCAAAAAAGTAAATCACGCGACGGCTTTGCCGTTACGCACAAAAACAGGTTT +CGTCACTTTAACCGGCATTTCACGGTTGCGAATTTGCACAATCGCCGTTTCACCAATACC +TTCCGGCACGCGCGCCAGCGCAATGCTATAACCCAGCGTTGGGGAGAAAGTACCGCTGGT +GATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACG +CAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTG +CGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCA +GCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCAT +GCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTC +CACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGC +TTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGG +TTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTG +CGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCC +GAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAAC +AACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCC +AGAGGCATTCAACATCCCCGAGTAAAGGGCTTTGCCGCTTTTGGTGAGCTTCGCCACATC +GTTCGCCAGCAGATAACGTAGAAACTCCCGGGTGCGGCTGCCGCGAAGATCGACGATGGT +CATATGTGACACATCAAACATTCCGGCATCGGTACGTACCGCATGATGTTCGTCGATTTG 
+CGAACCGTAATGCAGCGGCATCATCCAGCCGTGGAAATCCACCATGCGAGCGCCGCAAAG +CGTGTGTTGTTCGTACAAAGGAGTCTGTTGTGCCATCTTGTCCTCATTGAATAAGCGGGG +CTGACAACTTTTCCATGGCGAAATTATCACCACGAAACCCAGCATCGGAGCCACTCCCGG +TCCCCAACGCAATCGTTCTCTTTTGCCTGAACTTACCACCGAAACAGACTGTTAACCATA +AGGTAAAATTGATCATCACATTAGCTTATGGTTAAAAAACGCCAAAATCGTAACAGAATA +AAAAACCAAAAAATGAACAAATCTCTATATAAAGATAAATAGATGAGAAAGTTAATTTGA +ATAAGACAACATTAAGAACTAAAAAAATGTCAAAAAACACTAAATCAAAAATTCGTGGCA +TTAGAAAAT +>ter +TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT +AAGTTTCATGCCAAATTCTCTCACCAGATAATGCCGCCCTCTTCCGAAAAATAATCAAGA +GGCCAAACAATATCTAAAATGATACAACTGTATCTATTCCCCTGAAAAATACATTATTCA +TTTGTATATTTTCCTCATCATTGCTTTTTATTTAAATCATCCGATAATCCCCTGAATATA +ATTATGTCAATAACCATCAGAAAAAGTGGATGATGAGGAAAAGGATATGGCCGACAGTTT +CCAGAATGAAGTTCCCGCCGCTCGTGTAAATATCAAGCTTGATCTGCATACAGGCAATGC +TAAAAAGAAAGTTGAACTCCCCCTCAAGCTTCTTGCCGTAGGCGATTACAGTAACGGAAA +AGAGCAACGTCCGCTGTCCGAACGGGACAAGGTTGATATCAATAAAAACAACTTCAACAG +CGTCATGGCTGAGTTTTCGCCTGCGGTTAATTTAACAGTAGAAGATACGCTAAACGGAAA +CGGTAATGAACAAAATATCGCGCTTGAATTTAAAAGCCTGAAGGATTTTGAACCCGAACA +GGTAGCAAAAAATATTCCGCAACTTCGTGTATTACTCGCTATGCGCAATTTACTACGTGA +CCTGAAATCCAATCTGCTGGATAACGCAACGTTTCGCCGTGAACTGGAAAATATCCTGAA +AGACCCGACGCTCAGTTCAGAACTGCGTGATGAACTGGCGAAAATTGCGCCGCAGGAGAA +CGTTTAACCCGAACGCGTATTCAGGTTAAACCGGAGAAGAAAGGATCACTGAAAAGGAAA +TGCTGATGTCTGTACAACAAGAACATGCCACCTCTGAAACTGCAACACTCACCACCACTG +AGTCCGGCGGCGTTTATCAGTCCCTGTTCGATAAAATTAATTTAACCCCGGTGTCTTCCA +TTCAGGAAATCGATTTATGGCAAAACAGCGAAACGCTGGCCGATGCCTCACCCGATGAGC +GCGTGACGGCGGCGATTCACGTTCTGCTTTCCTGTCTGGCGAAATCAGGCGAGGACGTGG +TTAAGCTCGACAAGAGCCTGCTGGATTTTCATATCGACGATCTGGATCAGAAAATCAGTA +AACAGCTTGATGCGGTCATGCACCACCCTGAATTCCAGAAAGTCGAGTCGCTGTGGCGTG +GTACATGGTTCGTCGTACAGCGCACTGATTTTCGCAAAAATGTCAGAATTGAACTGCTGG +ATATCAGTAAAGAACATCTGCGGCAGGACTTTGATGATTCTCCGGAAATCATTCAAAGTG +GTTTATATCGCCATACATACATTCAGGAGTACGATACGCCGGGTGGCGAACCTGTTGCCT +CATTAATTTCCAGCTATGAATTTGATAACAGCCCGCAGGATATTGCCCTGCTGCGTAATA 
+TTTCCAGAGTGTCTGCCGCTTCCCATATGCCTTTTATCGGTTCTGTCGGACCGAAATTCT +TCCTTAAAAATTCGATGGAAGAAGTCGCCGCGATTAAAGATATCGGCAACTACTTTGACC +GCGCAGAATATATTAAATGGAAGTCGTTCCGCGATACGGATGACAGCCGCTATGTGGGAT +TAGTGATGCCGCGCGTGCTGGGCCGTCTGCCCTATGGGCCGGACACGGTGCCGGTACGCA +GCTTTAACTATGTGGAAGAAGTCAAAGGCCCGGATCACGAAAAATACCTGTGGACAAACG +CCTCGTTCGCCTTTGCCGCCAATATGGTGAAGAGCTTTGTTAATAATGGCTGGTGCGTGC +AGATCCGTGGCCCACAGGCGGGCGGCGCAGTGGCCGATCTGCCGATCCATCTTTACGATC +>contname +GATAATGCCTTCATGCTGGTTGCCCTGCGCATCAGTAAAACGTACCGGCAGTTCATTACG +CAGCACGCCTTTTTCGGTCATCACCAGACCAACCAGTTTTTCTGTGCCATGTTCACGCTG +CGCTTCCAGAGCTTCACGACCGATAAAGTCACGATCTGCCGGTTCCCAGGCGATAGTCCA +GCCCATATTGGCGGCTAAAGGAGAAATAGTTTCGTCCATCTCCTGGCTATACAAATTCAT +GCCCGCTTCCAGACGCAGCGTGTCACGCGCGCCCAGGCCACATGGCTTAACGCCAGCTTC +CACCAGCGCGCGCCAGAAATCGGCCGCTTTTTCATTGGGCAGCGCAATTTCGTAGCCCGC +TTCACCGGTGTAACCGGTGGTGGCAATAAACAGATCGCCCGCCTGCACGCCAAAGAACGG +TTTCATCCCTTCCACCGCCTGACGCTGGGCGTCATTAAACAGTGTGGCAGCTTTTGCCTG +CGCATTCGGCCCTTGTACGGCGATCATGGAAAGGTCATCACGAACAGTAATTTCGATGCC +GAAAGGTTCAGCGTGTTGGGTAATCCAGGAGAGGTCTTTTTCGCGGGTGGCGGAGTTAAC +AACGAGGCGGAAGAAATCTTCAGTAAAGTAGTAGACGATGAGATCATCTATCACACCGCC diff --git a/test/data/annotate/test_files/prokka_out_for_test-noSeqFor1gene.ffn b/test/data/annotate/test_files/prokka_out_for_test-noSeqFor1gene.ffn index 275382c98ae85e0b7f1e0ccc871d6e721faf8ffb..8a2be24b8213be261964444ccf5541ff27cc6008 100755 --- a/test/data/annotate/test_files/prokka_out_for_test-noSeqFor1gene.ffn +++ b/test/data/annotate/test_files/prokka_out_for_test-noSeqFor1gene.ffn @@ -2,36 +2,39 @@ aacgcgcatccagcgctagagacgctctcgacgagc cagatctgca cacaacaggtcgcgctcg ->JGIKIPIJ_00009 -acgctagagagctcgcgctaagagatc +>JGIKIPIJ_00005 +cagagatgcccc +ccgcgttt +>JGIKIPIJ_00008 +aaccggcctcgcgcatcgcatcagcag >JGIKIPIJ_00010 CCGAATAGCGCGCTCAGAGAGAGAGGA CGATAGCTCTCGCA CCGCATAGC ->JGIKIPIJ_00011 +>toto_00011 AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC >JGIKIPIJ_00011 CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA >JGIKIPIJ_00011 CCGAGATCGCGCGCGCTCTTCTCGAGA ->prokka_out_for_test 
-aagcgctctgcg -cgctcg >JGIKIPIJ_00013 AGCTCTCGAGAGGAGCGCTCGA CGCTCGCGCA CCTATAGGAACCACCGGGG >JGIKIPIJ_00014 CAGGATAGCGCGCTCAGAG +>JGIKIPIJ_00016 +CAGGATAGCGCGCTCAGAG +>CRISPR_toto +CCGAGGTGTGCG +CCGGTGTGCGCG >PROKKA_02927 CCAGAGATCGCGCGC >PROKKA_02928 AGATATGGCGCGCTCTCTC ->JGIKIPIJ_03015 +>prokka_03015 AGATCCGCGCGCTATAGAGC >JGIKIPIJ_03016 AAGGATCTCTCGCGAGAGGA ->prokka_out_for_test -AAACCGGCTCGGGCA >JGIKIPIJ_03017 -CCAGGATAGCGCGCGC +CCAGGATAGCGCGCGC \ No newline at end of file diff --git a/test/data/annotate/test_files/prokka_out_for_test-supGene.ffn b/test/data/annotate/test_files/prokka_out_for_test-supGene.ffn index a217e80cf47ea804c52ea5262db9797e9b21e7da..1bc1222a0d719788f7ddbcb8a25a045714180937 100755 --- a/test/data/annotate/test_files/prokka_out_for_test-supGene.ffn +++ b/test/data/annotate/test_files/prokka_out_for_test-supGene.ffn @@ -19,16 +19,19 @@ AAGCTCGCTAGACNNCTCGATACNNCTCGGATAGC CAGATAGCNNCGCTAGAGGAGAGCTCTCGGAGA >JGIKIPIJ_00011 CCGAGATCGCGCGCGCTCTTCTCGAGA ->prokka_out_for_test -aagcgctctgcg -cgctcg ->sup_gene_00012 >JGIKIPIJ_00013 AGCTCTCGAGAGGAGCGCTCGA CGCTCGCGCA CCTATAGGAACCACCGGGG >JGIKIPIJ_00014 CAGGATAGCGCGCTCAGAG +>JGIKIPIJ_03050 +CAGGATAGCGCGCTCAGAG +>JGIKIPIJ_00016 +AAGGGATATGGCCACACAGTT +>CRISPR_toto +CCGAGGTGTGCG +CCGGTGTGCGCG >PROKKA_02927 CCAGAGATCGCGCGC >PROKKA_02928 @@ -37,7 +40,5 @@ AGATATGGCGCGCTCTCTC AGATCCGCGCGCTATAGAGC >JGIKIPIJ_03016 AAGGATCTCTCGCGAGAGGA ->prokka_out_for_test -AAACCGGCTCGGGCA >JGIKIPIJ_03017 -CCAGGATAGCGCGCGC +CCAGGATAGCGCGCGC \ No newline at end of file diff --git a/test/data/annotate/test_files/prokka_out_gff-error.gff b/test/data/annotate/test_files/prokka_out_gff-error.gff index d2b3ec030afb0a26b0df70b8c4543ccf699de5ba..79162bd6b09e57fc550a185a3d5e8e57e75359ff 100755 --- a/test/data/annotate/test_files/prokka_out_gff-error.gff +++ b/test/data/annotate/test_files/prokka_out_gff-error.gff @@ -4,23 +4,26 @@ ##sequence-region other_header 1 51012 ##sequence-region my_contig 1 31459 ##sequence-region bis 1 6009 
+##sequence-region ter 1 6009 +##sequence-region contname 1 6009 JGIKIPgffgIJ Prodigal:2.6 CDS 287 787 . + 0 ID=EPKOMDHM_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein -JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD -JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . - 0 ID=EPKOMDHM_00006;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=toto;product=Major exported protein -toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00008;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00008;product=hypothetical protein -toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein -toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=toto;product=putative lipoprotein YiaD +JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . - 0 ID=EPKOMDHM_00008;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00008;product=Major exported protein +toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein +toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +toto Prodigal:2.6 CDS 2419 3000 . 
+ 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein toto Prodigal:2.6 CDS 3500 4000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein -toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00012;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00012;product=hypothetical protein -other_header Prodigal:2.6 repeat_region 296902 2968265 . - 0 ID=EPKOMDHM_00027;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P0A6C5;locus_tag=EPKOMDHM_00027 +toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein +other_header minced:0.2.0 CRISPR 296902 2968265 . . . note=CRISPR with 3 repeat units;rpt_family=CRISPR;rpt_type=direct other_header Prodigal:2.6 CDS 3399 4538 . + 0 ID=EPKOMDHM_00028;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=EPKOMDHM_00028;product=RecBCD enzyme subunit RecD my_contig Prodigal:2.6 CDS 4535 7888 . + 0 ID=EPKOMDHM_00029;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00029;product=RecBCD enzyme subunit RecB -test.0417.00002.0007 Prodigal:2.6 tRNA 3039279 3039355 . + 0 ID=EPKOMDHM_00030;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=EPKOMDHM_00030 -test.0417.00002.0007 Prodigal:2.6 tRNA 3039389 3039465 . + 0 ID=EPKOMDHM_00031;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=EPKOMDHM_00031;product=RecBCD enzyme subunit RecC -test.0417.00002.0007 Prodigal:2.6 CDS 7854 9491 . 
+ 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 CDS 9525 11285 . + 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 repeat_region 2994578 2994971 . + 0 ID=EPKOMDHM_00034;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00034;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein +my_contig Prodigal:2.6 CDS 888 45015 . - 0 ID=EPKOMDHM_00030;eC_number=56;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00030 +contname Prodigal:2.6 tRNA 3039279 3039355 . + 0 ID=EPKOMDHM_00030;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=EPKOMDHM_00030 +contname Prodigal:2.6 tRNA 3039389 3039465 . + 0 ID=EPKOMDHM_00031;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=EPKOMDHM_00031;product=RecBCD enzyme subunit RecC +contname Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein +contname Prodigal:2.6 CDS 9525 11285 . + 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein +contname minced:0.1.6 repeat_region 2994578 2994971 7 . . rpt_family=CRISPR +contname Prodigal:2.6 CDS 11249 12328 . 
+ 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein ##FASTA >JGIKIPgffgIJ TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT diff --git a/test/data/annotate/test_files/prokka_out_gff-wrong-start.gff b/test/data/annotate/test_files/prokka_out_gff-wrong-start.gff index d568df1a1dda6513a1212ede56ce5d4b6ff6e114..86f7d4ca65f9d7d679d6500ae025b2808cdc78ff 100755 --- a/test/data/annotate/test_files/prokka_out_gff-wrong-start.gff +++ b/test/data/annotate/test_files/prokka_out_gff-wrong-start.gff @@ -4,23 +4,26 @@ ##sequence-region other_header 1 51012 ##sequence-region my_contig 1 31459 ##sequence-region bis 1 6009 +##sequence-region ter 1 6009 +##sequence-region contname 1 6009 JGIKIPgffgIJ Prodigal:2.6 CDS 287 787 . + 0 ID=EPKOMDHM_00001;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00001;product=hypothetical protein JGIKIPgffgIJ Prodigal:2.6 CDS 4416 6068 . + 0 ID=EPKOMDHM_00005;Name=yiaD;gene=yiaD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P37665;locus_tag=EPKOMDHM_00005;product=putative lipoprotein YiaD -JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . - 0 ID=EPKOMDHM_00006;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00006;product=Major exported protein -toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00008;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00008;product=hypothetical protein -toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein -toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +JGIKIPgffgIJ Prodigal:2.6 CDS 9000 12000 . 
- 0 ID=EPKOMDHM_00008;Name=vgrG1;gene=vgrG1;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:Q9HI36;locus_tag=EPKOMDHM_00008;product=Major exported protein +toto Prodigal:2.6 CDS 77 1237 . + 0 ID=EPKOMDHM_00009;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00009;product=hypothetical protein +toto Prodigal:2.6 CDS 1279 2346 . + 0 ID=EPKOMDHM_00010;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00010;product=hypothetical protein +toto Prodigal:2.6 CDS 2419 3000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein toto Prodigal:2.6 CDS 3000 4000 . + 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein -toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00012;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00012;product=hypothetical protein -other_header Prodigal:2.6 repeat_region 296902 2968265 . - 0 ID=EPKOMDHM_00027;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P0A6C5;locus_tag=EPKOMDHM_00027 +toto Prodigal:2.6 CDS 4632 5000 . - 0 ID=EPKOMDHM_00011;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00011;product=hypothetical protein +other_header minced:0.2.0 CRISPR 296902 2968265 . . . note=CRISPR with 3 repeat units;rpt_family=CRISPR;rpt_type=direct other_header Prodigal:2.6 CDS 3399 4538 . + 0 ID=EPKOMDHM_00028;eC_number=3.1.11.5;Name=recD;gene=recD;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P04993;locus_tag=EPKOMDHM_00028;product=RecBCD enzyme subunit RecD my_contig Prodigal:2.6 CDS 4535 7888 . + 0 ID=EPKOMDHM_00029;eC_number=3.1.11.5;Name=recB;gene=recB;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00029;product=RecBCD enzyme subunit RecB -test.0417.00002.0007 Prodigal:2.6 tRNA 3039279 3039355 . 
+ 0 ID=EPKOMDHM_00030;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=EPKOMDHM_00030 -test.0417.00002.0007 Prodigal:2.6 tRNA 3039389 3039465 . + 0 ID=EPKOMDHM_00031;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=EPKOMDHM_00031;product=RecBCD enzyme subunit RecC -test.0417.00002.0007 Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 CDS 9525 11285 . + 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 repeat_region 2994578 2994971 . + 0 ID=EPKOMDHM_00034;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00034;product=hypothetical protein -test.0417.00002.0007 Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein +my_contig Prodigal:2.6 CDS 888 45015 . - 0 ID=EPKOMDHM_00030;eC_number=56;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P08394;locus_tag=EPKOMDHM_00030 +contname Prodigal:2.6 tRNA 3039279 3039355 . + 0 ID=EPKOMDHM_00030;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P05458;locus_tag=EPKOMDHM_00030 +contname Prodigal:2.6 tRNA 3039389 3039465 . + 0 ID=EPKOMDHM_00031;eC_number=3.1.11.5;Name=recC;gene=recC;inference=ab initio prediction:Prodigal:2.6,similar to AA sequence:UniProtKB:P07648;locus_tag=EPKOMDHM_00031;product=RecBCD enzyme subunit RecC +contname Prodigal:2.6 CDS 7854 9491 . + 0 ID=EPKOMDHM_00032;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00032;product=hypothetical protein +contname Prodigal:2.6 CDS 9525 11285 . 
+ 0 ID=EPKOMDHM_00033;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00033;product=hypothetical protein +contname minced:0.1.6 repeat_region 2994578 2994971 7 . . rpt_family=CRISPR +contname Prodigal:2.6 CDS 11249 12328 . + 0 ID=EPKOMDHM_00035;inference=ab initio prediction:Prodigal:2.6;locus_tag=EPKOMDHM_00035;product=hypothetical protein ##FASTA >JGIKIPgffgIJ TCTCATACTACCCAATTTCTTAAAAGTGCAAATTTGTGAAGCTTATCCTGTTATTATTTT diff --git a/test/data/annotate/test_files/prokka_out_tbl_changed-contnames.tbl b/test/data/annotate/test_files/prokka_out_tbl_changed-contnames.tbl index e8755cbc4def7135ea81ec1c63d1ca267e5ce8b6..5ad593be5e3dcbff03a7b4aa203305f7b8db6d97 100644 --- a/test/data/annotate/test_files/prokka_out_tbl_changed-contnames.tbl +++ b/test/data/annotate/test_files/prokka_out_tbl_changed-contnames.tbl @@ -51,6 +51,13 @@ locus_tag JGIKIPIJ_00014 product hypothetical protein db_xref 12345 +45015 888 CDS + inference ab initio prediction:Prodigal:2.6 + locus_tag JGIKIPIJ_00016 + product hypothetical protein + inference ab initio prediction:Prodigal:2.6 + inference similar to AA sequence:UniProtKB:P32 + db_xref 56 >Feature toto_5 >Feature toto_7 3039279 3039355 tRNA diff --git a/test/data/annotate/test_files/test_create_prt_prodigal-more-proteins.lst b/test/data/annotate/test_files/test_create_prt_prodigal-more-proteins.lst index 8aba8af3134bd15725644d5435bfe920d2f38af9..61019c735c8c64b1f538b3b7d4abe4718bd0c2c7 100644 --- a/test/data/annotate/test_files/test_create_prt_prodigal-more-proteins.lst +++ b/test/data/annotate/test_files/test_create_prt_prodigal-more-proteins.lst @@ -11,4 +11,4 @@ 7854 9491 D CDS test.0417.00002.0007b_00011 NA | NA | NA | ffff | NA 9525 11285 D CDS test.0417.00002.0007i_00012 NA | NA | NA | sdfdfd | NA 11249 12328 D CDS test.0417.00002.0007b_00013 NA | NA | NA | b | NA -25691 21589 D CDS test.0417.00002.0007b_00015 NA | NA | NA | ffff | NA +25691 21589 D CDS test.0417.00002.0007b_00016 NA | NA | NA | ffff | NA diff --git 
a/test/data/prepare/exp_files/exp_lstinfo_run_only-mash.lst b/test/data/prepare/exp_files/exp_lstinfo_run_only-mash.lst new file mode 100644 index 0000000000000000000000000000000000000000..9015579eab1bb2a3be840ad65b2ef0064b6ff15b --- /dev/null +++ b/test/data/prepare/exp_files/exp_lstinfo_run_only-mash.lst @@ -0,0 +1,2 @@ +to_annotate gsize nb_conts L90 +test/data/prepare/genomes/genomes_comparison/ACOC.1019.fna 3050 1 1 diff --git a/test/data/prepare/test_files/test_lstinfo_onlymash.lst b/test/data/prepare/test_files/test_lstinfo_onlymash.lst new file mode 100644 index 0000000000000000000000000000000000000000..3265e38399a7d1b5804e4943c11f3f021cf6e657 --- /dev/null +++ b/test/data/prepare/test_files/test_lstinfo_onlymash.lst @@ -0,0 +1,6 @@ +to_annotate gsize nb_conts L90 +test/data/prepare/genomes/genomes_comparison/ACOC.1019.fna 3050 1 1 +test/data/prepare/genomes/genomes_comparison/ACOR002.0519.fna 3012665 78 17 +test/data/prepare/genomes/genomes_comparison/ACOR001.0519-almost-same.fna 3012665 261 17 +test/data/prepare/genomes/genomes_comparison/ACOR001.0519.fna 3012665 269 17 +test/data/prepare/genomes/genomes_comparison/ACOR001.0519-bis.fna 3012665 269 17 diff --git a/test/test_functional/test_align.py b/test/test_functional/test_align.py index 284604197f0ff55279f6f1a59b1275a1f582d3f3..cd9eb9bbe40bc7b8b425b474e623b86aa8bf5d5e 100755 --- a/test/test_functional/test_align.py +++ b/test/test_functional/test_align.py @@ -34,7 +34,8 @@ def setup_teardown_module(): - remove all log files - remove directory with generated results """ - os.mkdir(GENEPATH) + if not os.path.isdir(GENEPATH): + os.mkdir(GENEPATH) print("setup") yield @@ -42,166 +43,166 @@ def setup_teardown_module(): print("teardown") -def test_main(): - """ - Test that when giving a database, a persistent genome and a list of genomes, it extracts - expected proteins by family, aligns each family, back-translates them, concatenates all - families into one file and groups them by genome. 
- """ - corepers = os.path.join(TESTPATH, "test_pers0.99FX.lst") - list_genomes = os.path.join("test", "data", "pangenome", "test_files", "list_to_pan.txt") - dname = "TEST4" - dbpath = os.path.join("test", "data", "pangenome", "test_files", "example_db") - outdir = GENEPATH - threads = 1 - force = False - cmd = "cmd" - al.main(cmd, corepers, list_genomes, dname, dbpath, outdir, threads, force) - # Check creation of the 3 subdirectories - aldir = os.path.join(outdir, "Align-" + dname) - listdir = os.path.join(outdir, "List-" + dname) - treedir = os.path.join(outdir, "Phylo-" + dname) - assert os.path.isdir(aldir) - assert os.path.isdir(listdir) - assert os.path.isdir(treedir) - # Check content of listdir - genomes = ["GEN2.1017.00001", "GEN4.1111.00001", "GENO.1017.00001", "GENO.1216.00002"] - for gen in genomes: - assert os.path.isfile(os.path.join(listdir, f"{dname}-getEntry_gen_{gen}.txt")) - assert os.path.isfile(os.path.join(listdir, f"{dname}-getEntry_prt_{gen}.txt")) - # Check content of aldir - fams = [1, 4, 6, 8, 10, 11, 13, 14] - for fam in fams: - assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.gen')) - assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.prt')) - assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.miss.lst')) - assert os.path.isfile(os.path.join(aldir, f'{dname}-mafft-align.{fam}.aln')) - assert os.path.isfile(os.path.join(aldir, f'{dname}-mafft-prt2nuc.{fam}.aln')) - out_concat = os.path.join(aldir, dname + "-complete.cat.aln") - exp_concat = os.path.join(EXPPATH, "exp_pers4genome-complete.cat.aln") - assert tutil.compare_order_content(out_concat, exp_concat) - # Check content of treedir - out_grp = os.path.join(treedir, dname + ".grp.aln") - exp_grp = os.path.join(EXPPATH, "exp_pers4genomes.grp.aln") - assert tutil.compare_order_content(out_grp, exp_grp) - # Check presence of log files, and log.err is empty - base_log = os.path.join(outdir, "PanACoTA-align_" + dname + ".log") - assert 
os.path.isfile(base_log) - assert os.path.isfile(base_log + ".details") - assert os.path.isfile(base_log + ".err") - with open(base_log + ".err", "r") as bf: - assert bf.readlines() == [] - # Check logs - with open(base_log + ".details", "r") as lc: - log_content = lc.readlines() - assert ("Reading PersGenome and constructing lists of missing genomes in " - "each family") in " ".join(log_content) - assert "Extracting proteins and genes from all genomes" in " ".join(log_content) - for gen in genomes: - assert "Extracting proteins and genes from {}".format(gen) in " ".join(log_content) - assert ("Starting alignment of all families: protein alignment, back-translation to " - "nucleotides, and add missing genomes in the family") in " ".join(log_content) - for fam in fams: - assert "Checking extractions for family {}".format(fam) in " ".join(log_content) - assert "Aligning family {}".format(fam) in " ".join(log_content) - assert "Back-translating family {}".format(fam) in " ".join(log_content) - assert "Concatenating all alignment files" in " ".join(log_content) - assert "Grouping alignments per genome" in " ".join(log_content) - assert "END" in " ".join(log_content) +# def test_main(): +# """ +# Test that when giving a database, a persistent genome and a list of genomes, it extracts +# expected proteins by family, aligns each family, back-translates them, concatenates all +# families into one file and groups them by genome. 
+# """ +# corepers = os.path.join(TESTPATH, "test_pers0.99FX.lst") +# list_genomes = os.path.join("test", "data", "pangenome", "test_files", "list_to_pan.txt") +# dname = "TEST4" +# dbpath = os.path.join("test", "data", "pangenome", "test_files", "example_db") +# outdir = GENEPATH +# threads = 1 +# force = False +# cmd = "cmd" +# al.main(cmd, corepers, list_genomes, dname, dbpath, outdir, threads, force) +# # Check creation of the 3 subdirectories +# aldir = os.path.join(outdir, "Align-" + dname) +# listdir = os.path.join(outdir, "List-" + dname) +# treedir = os.path.join(outdir, "Phylo-" + dname) +# assert os.path.isdir(aldir) +# assert os.path.isdir(listdir) +# assert os.path.isdir(treedir) +# # Check content of listdir +# genomes = ["GEN2.1017.00001", "GEN4.1111.00001", "GENO.1017.00001", "GENO.1216.00002"] +# for gen in genomes: +# assert os.path.isfile(os.path.join(listdir, f"{dname}-getEntry_gen_{gen}.txt")) +# assert os.path.isfile(os.path.join(listdir, f"{dname}-getEntry_prt_{gen}.txt")) +# # Check content of aldir +# fams = [1, 4, 6, 8, 10, 11, 13, 14] +# for fam in fams: +# assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.gen')) +# assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.prt')) +# assert os.path.isfile(os.path.join(aldir, f'{dname}-current.{fam}.miss.lst')) +# assert os.path.isfile(os.path.join(aldir, f'{dname}-mafft-align.{fam}.aln')) +# assert os.path.isfile(os.path.join(aldir, f'{dname}-mafft-prt2nuc.{fam}.aln')) +# out_concat = os.path.join(aldir, dname + "-complete.cat.aln") +# exp_concat = os.path.join(EXPPATH, "exp_pers4genome-complete.cat.aln") +# assert tutil.compare_order_content(out_concat, exp_concat) +# # Check content of treedir +# out_grp = os.path.join(treedir, dname + ".grp.aln") +# exp_grp = os.path.join(EXPPATH, "exp_pers4genomes.grp.aln") +# assert tutil.compare_order_content(out_grp, exp_grp) +# # Check presence of log files, and log.err is empty +# base_log = os.path.join(outdir, 
"PanACoTA-align_" + dname + ".log") +# assert os.path.isfile(base_log) +# assert os.path.isfile(base_log + ".details") +# assert os.path.isfile(base_log + ".err") +# with open(base_log + ".err", "r") as bf: +# assert bf.readlines() == [] +# # Check logs +# with open(base_log + ".details", "r") as lc: +# log_content = lc.readlines() +# assert ("Reading PersGenome and constructing lists of missing genomes in " +# "each family") in " ".join(log_content) +# assert "Extracting proteins and genes from all genomes" in " ".join(log_content) +# for gen in genomes: +# assert "Extracting proteins and genes from {}".format(gen) in " ".join(log_content) +# assert ("Starting alignment of all families: protein alignment, back-translation to " +# "nucleotides, and add missing genomes in the family") in " ".join(log_content) +# for fam in fams: +# assert "Checking extractions for family {}".format(fam) in " ".join(log_content) +# assert "Aligning family {}".format(fam) in " ".join(log_content) +# assert "Back-translating family {}".format(fam) in " ".join(log_content) +# assert "Concatenating all alignment files" in " ".join(log_content) +# assert "Grouping alignments per genome" in " ".join(log_content) +# assert "END" in " ".join(log_content) -def test_main_exist_ok(): - """ - Test main all files exist and are ok, no force -> end without error, with warnings on re-use - """ - corepers = os.path.join(TESTPATH, "test_pers0.99FX.lst") - list_genomes = os.path.join("test", "data", "pangenome", "test_files", "list_to_pan.txt") - dname = "TEST4exists" - dbpath = os.path.join("test", "data", "pangenome", "test_files", "example_db") - outdir = os.path.join(GENEPATH, "test_main_exist_ok") - threads = 1 - force = False - cmd = "cmd test_main_exist_ok" - # Create output directories and files - aldir = os.path.join(outdir, "Align-" + dname) - listdir = os.path.join(outdir, "List-" + dname) - treedir = os.path.join(outdir, "Phylo-" + dname) - os.makedirs(aldir) - os.makedirs(listdir) - 
os.makedirs(treedir) - # Create content of listdir - ex_listdir = os.path.join(EXPPATH, "exp_listdir-pers") - genomes = ["GEN2.1017.00001", "GEN4.1111.00001", "GENO.1017.00001", "GENO.1216.00002"] - for gen in genomes: - outgen = os.path.join(listdir, f"{dname}-getEntry_gen_{gen}.txt") - refgen = os.path.join(ex_listdir, f"getEntry_gen_{gen}") - shutil.copyfile(refgen, outgen) - outprt = os.path.join(listdir, f"{dname}-getEntry_prt_{gen}.txt") - refprt = os.path.join(ex_listdir, f"getEntry_prt_{gen}") - shutil.copyfile(refprt, outprt) - # Create content of aldir - ex_aldir = os.path.join(EXPPATH, "exp_aldir-pers") - fams = [1, 4, 6, 8, 10, 11, 13, 14] - for fam in fams: - outgen = os.path.join(aldir, f'{dname}-current.{fam}.gen') - refgen = os.path.join(ex_aldir, f"current.{fam}.gen") - shutil.copyfile(refgen, outgen) - outprt = os.path.join(aldir, f'{dname}-current.{fam}.prt') - refprt = os.path.join(ex_aldir, f"current.{fam}.prt") - shutil.copyfile(refprt, outprt) - outmiss = os.path.join(aldir, f'{dname}-current.{fam}.miss.lst') - refmiss = os.path.join(ex_aldir, f"current.{fam}.miss.lst") - shutil.copyfile(refmiss, outmiss) - outaln = os.path.join(aldir, f'{dname}-mafft-align.{fam}.aln') - refaln = os.path.join(ex_aldir, f"mafft-align.{fam}.aln") - shutil.copyfile(refaln, outaln) - outbtr = os.path.join(aldir, f'{dname}-mafft-prt2nuc.{fam}.aln') - refbtr = os.path.join(ex_aldir, f"mafft-prt2nuc.{fam}.aln") - shutil.copyfile(refbtr, outbtr) - outcat = os.path.join(aldir, dname + "-complete.cat.aln") - refcat = os.path.join(EXPPATH, "exp_pers4genome-complete.cat.aln") - shutil.copyfile(refcat, outcat) - # Create content of treedir - outgrp = os.path.join(treedir, dname + ".grp.aln") - refgrp = os.path.join(EXPPATH, "exp_pers4genomes.grp.aln") - shutil.copyfile(refgrp, outgrp) - # Run align module - al.main(cmd, corepers, list_genomes, dname, dbpath, outdir, threads, force) - # Check logs - logfile = os.path.join(outdir, "PanACoTA-align_TEST4exists.log.details") - 
with open(logfile, "r") as lc: - log_content = lc.readlines() - assert ("Reading PersGenome and constructing lists of missing genomes in " - "each family") in " ".join(log_content) - for gen in genomes: - assert (f"For genome {gen}, test/data/align/generated_by_func_tests/test_main_exist_ok/" - f"List-TEST4exists/TEST4exists-getEntry_prt_{gen}.txt and test/data/align/" - "generated_by_func_tests/test_main_exist_ok/List-TEST4exists/" - f"TEST4exists-getEntry_gen_{gen}.txt already exist. The program " - "will use them to extract proteins and genes. If you prefer to rewrite " - "them, use option -F ") in " ".join(log_content) - assert ("Starting alignment of all families: protein alignment, back-translation to " - "nucleotides, and add missing genomes in the family") in " ".join(log_content) - for fam in fams: - assert "Checking extractions for family {}".format(fam) in " ".join(log_content) - assert ("Alignment already done for family {}. The program will use it for next " - "steps").format(fam) in " ".join(log_content) - assert ("All extraction files already existing (see detailed log for more " - "information)") in " ".join(log_content) - assert ("All prt and gene files for all families already exist. The program will use them " - "for the next step. If you want to re-extract a given family, remove its prt and " - "gen extraction files. If you want to re-extract all families, use option -F " - "(or --force).") in " ".join(log_content) - assert ("Alignments already concatenated in " - "test/data/align/generated_by_func_tests/test_main_exist_ok/Align-TEST4exists/" - "TEST4exists-complete.cat.aln. Program will " - "use it for next steps. If you want to redo it, remove it before " - "running.") in " ".join(log_content) - assert ("Alignments already grouped by genome in " - "test/data/align/generated_by_func_tests/test_main_exist_ok/Phylo-TEST4exists/" - "TEST4exists.grp.aln. 
Program will " - "end.") in " ".join(log_content) - assert "END" in " ".join(log_content) +# def test_main_exist_ok(): +# """ +# Test main all files exist and are ok, no force -> end without error, with warnings on re-use +# """ +# corepers = os.path.join(TESTPATH, "test_pers0.99FX.lst") +# list_genomes = os.path.join("test", "data", "pangenome", "test_files", "list_to_pan.txt") +# dname = "TEST4exists" +# dbpath = os.path.join("test", "data", "pangenome", "test_files", "example_db") +# outdir = os.path.join(GENEPATH, "test_main_exist_ok") +# threads = 1 +# force = False +# cmd = "cmd test_main_exist_ok" +# # Create output directories and files +# aldir = os.path.join(outdir, "Align-" + dname) +# listdir = os.path.join(outdir, "List-" + dname) +# treedir = os.path.join(outdir, "Phylo-" + dname) +# os.makedirs(aldir) +# os.makedirs(listdir) +# os.makedirs(treedir) +# # Create content of listdir +# ex_listdir = os.path.join(EXPPATH, "exp_listdir-pers") +# genomes = ["GEN2.1017.00001", "GEN4.1111.00001", "GENO.1017.00001", "GENO.1216.00002"] +# for gen in genomes: +# outgen = os.path.join(listdir, f"{dname}-getEntry_gen_{gen}.txt") +# refgen = os.path.join(ex_listdir, f"getEntry_gen_{gen}") +# shutil.copyfile(refgen, outgen) +# outprt = os.path.join(listdir, f"{dname}-getEntry_prt_{gen}.txt") +# refprt = os.path.join(ex_listdir, f"getEntry_prt_{gen}") +# shutil.copyfile(refprt, outprt) +# # Create content of aldir +# ex_aldir = os.path.join(EXPPATH, "exp_aldir-pers") +# fams = [1, 4, 6, 8, 10, 11, 13, 14] +# for fam in fams: +# outgen = os.path.join(aldir, f'{dname}-current.{fam}.gen') +# refgen = os.path.join(ex_aldir, f"current.{fam}.gen") +# shutil.copyfile(refgen, outgen) +# outprt = os.path.join(aldir, f'{dname}-current.{fam}.prt') +# refprt = os.path.join(ex_aldir, f"current.{fam}.prt") +# shutil.copyfile(refprt, outprt) +# outmiss = os.path.join(aldir, f'{dname}-current.{fam}.miss.lst') +# refmiss = os.path.join(ex_aldir, f"current.{fam}.miss.lst") +# 
shutil.copyfile(refmiss, outmiss) +# outaln = os.path.join(aldir, f'{dname}-mafft-align.{fam}.aln') +# refaln = os.path.join(ex_aldir, f"mafft-align.{fam}.aln") +# shutil.copyfile(refaln, outaln) +# outbtr = os.path.join(aldir, f'{dname}-mafft-prt2nuc.{fam}.aln') +# refbtr = os.path.join(ex_aldir, f"mafft-prt2nuc.{fam}.aln") +# shutil.copyfile(refbtr, outbtr) +# outcat = os.path.join(aldir, dname + "-complete.cat.aln") +# refcat = os.path.join(EXPPATH, "exp_pers4genome-complete.cat.aln") +# shutil.copyfile(refcat, outcat) +# # Create content of treedir +# outgrp = os.path.join(treedir, dname + ".grp.aln") +# refgrp = os.path.join(EXPPATH, "exp_pers4genomes.grp.aln") +# shutil.copyfile(refgrp, outgrp) +# # Run align module +# al.main(cmd, corepers, list_genomes, dname, dbpath, outdir, threads, force) +# # Check logs +# logfile = os.path.join(outdir, "PanACoTA-align_TEST4exists.log.details") +# with open(logfile, "r") as lc: +# log_content = lc.readlines() +# assert ("Reading PersGenome and constructing lists of missing genomes in " +# "each family") in " ".join(log_content) +# for gen in genomes: +# assert (f"For genome {gen}, test/data/align/generated_by_func_tests/test_main_exist_ok/" +# f"List-TEST4exists/TEST4exists-getEntry_prt_{gen}.txt and test/data/align/" +# "generated_by_func_tests/test_main_exist_ok/List-TEST4exists/" +# f"TEST4exists-getEntry_gen_{gen}.txt already exist. The program " +# "will use them to extract proteins and genes. If you prefer to rewrite " +# "them, use option -F ") in " ".join(log_content) +# assert ("Starting alignment of all families: protein alignment, back-translation to " +# "nucleotides, and add missing genomes in the family") in " ".join(log_content) +# for fam in fams: +# assert "Checking extractions for family {}".format(fam) in " ".join(log_content) +# assert ("Alignment already done for family {}. 
The program will use it for next " +# "steps").format(fam) in " ".join(log_content) +# assert ("All extraction files already existing (see detailed log for more " +# "information)") in " ".join(log_content) +# assert ("All prt and gene files for all families already exist. The program will use them " +# "for the next step. If you want to re-extract a given family, remove its prt and " +# "gen extraction files. If you want to re-extract all families, use option -F " +# "(or --force).") in " ".join(log_content) +# assert ("Alignments already concatenated in " +# "test/data/align/generated_by_func_tests/test_main_exist_ok/Align-TEST4exists/" +# "TEST4exists-complete.cat.aln. Program will " +# "use it for next steps. If you want to redo it, remove it before " +# "running.") in " ".join(log_content) +# assert ("Alignments already grouped by genome in " +# "test/data/align/generated_by_func_tests/test_main_exist_ok/Phylo-TEST4exists/" +# "TEST4exists.grp.aln. Program will " +# "end.") in " ".join(log_content) +# assert "END" in " ".join(log_content) def test_main_exist_emptygrp(capsys): diff --git a/test/test_functional/test_annote.py b/test/test_functional/test_annote.py index c404864b4ab774d1473f3bafa4aea8a9df5b81a0..e4c3ca1c21d6124c2010968289cc6f30d02ca45c 100755 --- a/test/test_functional/test_annote.py +++ b/test/test_functional/test_annote.py @@ -123,11 +123,11 @@ def test_main_given_tmp_verbose3(capsys): list_file = os.path.join(TEST_DIR, "list_genomes-func-test-default.txt") tmpdir = os.path.join(GENEPATH, "tmp_funcGivenTmp") name = "ESCO" - l90 = 1 + l90 = 10 date = "0417" verbose = 3 annot.main("cmd", list_file, GEN_PATH, GENEPATH, name, date, l90, - cutn=0, tmp_dir=tmpdir, verbose=verbose) + cutn=3, tmp_dir=tmpdir, verbose=verbose) out, err = capsys.readouterr() # Check that warnings are written to stderr assert "WARNING" in err @@ -135,11 +135,22 @@ def test_main_given_tmp_verbose3(capsys): "concatenating ['A_H738.fasta', 'genome1.fasta', 'toto.fst']") in err 
# Check that tmp files exist in the right folder # -> 2 fna files created (concatenations) + # -> + 4 files created (split 3N) assert os.path.isfile(os.path.join(tmpdir, "A_H738.fasta-all.fna")) assert os.path.isfile(os.path.join(tmpdir, "H299_H561.fasta-all.fna")) + assert len(glob.glob(os.path.join(tmpdir, '*.fna'))) == 6 + assert len(glob.glob(os.path.join(tmpdir, '*split3N.fna'))) == 4 + # Check that split contigs were renamed with unique ID at the beginning of the header + res_file = os.path.join(tmpdir, "A_H738.fasta-all.fna_prokka-split3N.fna") + exp_file = os.path.join(EXP_DIR, "exp_A_H738.fasta-all.fna_prokka-split3N.fna") + assert tutil.compare_order_content(exp_file, res_file) + # Check that even for complete genome, contig was renamed with ID + res_file = os.path.join(tmpdir, "complete_genome.fna_prokka-split3N.fna") + exp_file = os.path.join(EXP_DIR, "exp_complete_genome.fna_prokka-split3N.fna") + assert tutil.compare_order_content(exp_file, res_file) # Test that prokka folder is in the right directory # Only 1 genome annotated by prokka (the 2 others do not have appropriate L90/nbcont) - assert os.path.isdir(os.path.join(tmpdir, "A_H738.fasta-all.fna-prokkaRes")) + assert os.path.isdir(os.path.join(tmpdir, "A_H738.fasta-all.fna_prokka-split3N.fna-prokkaRes")) assert not os.path.isdir(os.path.join(tmpdir, "H299_H561.fasta-all.fna-prokkaRes")) @@ -150,7 +161,7 @@ def test_main_all_discard_nbcont(capsys): """ list_file = os.path.join(TEST_DIR, "list_genomes-func-test-default.txt") name = "ESCO" - nbcont = 1 + nbcont = 0 cutn = 0 date = "0417" annot.main("cmd", list_file, GEN_PATH, GENEPATH, name, date, nbcont=nbcont, cutn=cutn) @@ -200,6 +211,7 @@ def test_main_existresdirforce(capsys): """ Test that, when the pipeline is run on an existing result directory, but force option is on, it removes the result folders and runs again.
+ Result folders contain expected files, the ones put before are removed """ list_file = os.path.join(TEST_DIR, "list_genomes-func-test-default.txt") # Create output directory with a prt file in Proteins folder @@ -209,28 +221,47 @@ def test_main_existresdirforce(capsys): assert os.path.isfile(os.path.join(protdir, "toto.prt")) name = "ESCO" date = "0417" - l90 = 1 + l90 = 5 + cutn = 3 annot.main("cmd", list_file, GEN_PATH, GENEPATH, name, date, force=True, l90=l90, - prodigal_only=True) + prodigal_only=True, cutn = cutn, small=True) out, err = capsys.readouterr() + # Check that tmp files exist in the right folder + # -> 2 fna files created (concatenations) + # -> + 4 files created (split 3N) + assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", "A_H738.fasta-all.fna")) + assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", "H299_H561.fasta-all.fna")) + assert len(glob.glob(os.path.join(GENEPATH, "tmp_files", '*.fna'))) == 6 + assert len(glob.glob(os.path.join(GENEPATH, "tmp_files", '*split3N.fna'))) == 4 + # Check that split contigs were renamed with unique ID at the beginning of the header + res_file = os.path.join(GENEPATH, "tmp_files", "A_H738.fasta-all.fna_prodigal-split3N.fna") + exp_file = os.path.join(EXP_DIR, "exp_A_H738.fasta-all.fna_prokka-split3N.fna") + assert tutil.compare_order_content(exp_file, res_file) + # Check that even for complete genome, contig was renamed with ID + res_file = os.path.join(GENEPATH, "tmp_files", "complete_genome.fna_prodigal-split3N.fna") + exp_file = os.path.join(EXP_DIR, "exp_complete_genome.fna_prokka-split3N.fna") + assert tutil.compare_order_content(exp_file, res_file) # Check that tmp files exist in the right folder (result/tmp_files) assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", - "B2_A3_5.fasta-changeName.fna_prodigal-split5N.fna")) + "B2_A3_5.fasta-changeName.fna_prodigal-split3N.fna")) assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", - "H299_H561.fasta-all.fna_prodigal-split5N.fna")) +
"H299_H561.fasta-all.fna_prodigal-split3N.fna")) assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", "H299_H561.fasta-all.fna")) assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", - "A_H738.fasta-all.fna_prodigal-split5N.fna")) + "A_H738.fasta-all.fna_prodigal-split3N.fna")) assert os.path.isfile(os.path.join(GENEPATH, "tmp_files", "A_H738.fasta-all.fna")) # Test all result folders are empty (in particular Proteins) as no genome is annotated assert os.path.isdir(protdir) - assert len(os.listdir(protdir)) == 1 + assert len(os.listdir(protdir)) == 4 assert not os.path.isfile(os.path.join(protdir, "toto.prt")) - assert os.path.isfile(os.path.join(protdir, "ESCO.1015.00001.prt")) + assert os.path.isfile(os.path.join(protdir, "ESCO.0417.00001.prt")) + assert os.path.isfile(os.path.join(protdir, "ESCO.1015.00002.prt")) + assert os.path.isfile(os.path.join(protdir, "ESCO.1015.00003.prt")) + assert os.path.isfile(os.path.join(protdir, "ESCO.1116.00004.prt")) def test_run_exist_resdir(caplog): @@ -318,7 +349,8 @@ def test_main_onexistingprodigaldir(capsys): "PanACoTA-annotate_list_genomes-func-test-exist_dir.log.details") with open(logfile, "r") as lc: log_content = lc.readlines() - assert ("Prodigal results folder already exists") in " ".join(log_content) + assert ("Prodigal results folder test/data/annotate/exp_files/H299_H561.fasta-prodigalRes " + "already exists") in " ".join(log_content) assert ("Prodigal did not run again. Formatting step will use already generated results of " "Prodigal in test/data/annotate/exp_files/H299_H561.fasta-prodigalRes. 
" "If you want to re-run Prodigal, first remove this result folder, or use '-F' or " @@ -402,7 +434,7 @@ def test_main_existing_prodigaldir_errorannot(capsys): shutil.copyfile(ori_genome1, used_genome1) # Copy prokka results to genepath/genomes/gname-prokkaRes shutil.copytree(ori_prok_g1, used_prok_g1) - # Same think for 2nd genome + # Same thing for 2nd genome ori_genome2 = os.path.join(GEN_PATH, "H299_H561.fasta") ori_prok_g2 = os.path.join(EXP_DIR, "H299_H561.fasta-prodigalRes") used_genome2 = os.path.join(genome_path_used, "H299_H561.fasta") @@ -435,7 +467,8 @@ def test_main_existing_prodigaldir_errorannot(capsys): log_content = lc.readlines() assert ("Error: No genome was correctly annotated, " "no need to format them") in ' '.join(log_content) - assert ("Prodigal results folder already exists.") in ' '.join(log_content) + assert ("Prodigal results folder test/data/annotate/generated_by_func-tests/genomes/" + "H299_H561.fasta-prodigalRes already exists.") in ' '.join(log_content) assert ("ESCO.1116.00002 B2_A3_5.fasta-changeName.fna: " "no or several .faa file(s)") in ' '.join(log_content) assert ("ESCO.1015.00001 H299_H561.fasta: " @@ -462,13 +495,22 @@ def test_main_existing_prokkadir_errorformat(): shutil.copyfile(ori_genome1, used_genome1) # Copy prokka results to genepath/genomes/gname-prokkaRes shutil.copytree(ori_prok_g1, used_prok_g1) - # Same think for 2nd genome + # and add .fna file to prokka-dir + used_fna1 = os.path.join(used_prok_g1, "B2_A3_5.fasta-changeName.fna") + shutil.copyfile(ori_genome1, used_fna1) + + # Same thing for 2nd genome ori_genome2 = os.path.join(GEN_PATH, "H299_H561.fasta") ori_prok_g2 = os.path.join(EXP_DIR, "H299_H561.fasta-prokkaRes") used_genome2 = os.path.join(genome_path_used, "H299_H561.fasta") used_prok_g2 = used_genome2 + "-prokkaRes" + # Copy original fasta file to tmp resdir shutil.copyfile(ori_genome2, used_genome2) + # Copy folder with prokka result files to genepath result path shutil.copytree(ori_prok_g2, 
used_prok_g2) + # and add .fna file to prokka-dir + used_fna = os.path.join(used_prok_g2, "H299_H561.fasta") + shutil.copyfile(ori_genome2, used_fna) # Run annotation name = "ESCO" @@ -540,8 +582,8 @@ def test_main_novalid_genome_frominfo(capsys): prodigal_only=True, small=True) out, err = capsys.readouterr() # Check logs - assert ("no genome listed in test/data/annotate/test_files/lstinfo-no-genome.lst " - "were found.") in err + assert ("No genome listed in test/data/annotate/test_files/lstinfo-no-genome.lst " + "was found.") in err # Check output folders not created protdir = os.path.join(GENEPATH, "Proteins") diff --git a/test/test_functional/test_corepers.py b/test/test_functional/test_corepers.py index d4e778ca64528dbc547c81b125893bdca3ee0ae0..9d07b7999f5b76afe15585021d3f08d875b11567 100755 --- a/test/test_functional/test_corepers.py +++ b/test/test_functional/test_corepers.py @@ -34,7 +34,8 @@ def setup_teardown_module(): - remove all log files - remove directory with generated results """ - os.mkdir(GENEPATH) + if not os.path.isdir(GENEPATH): + os.mkdir(GENEPATH) shutil.copyfile(OPAN, UPAN) print("setup") diff --git a/test/test_functional/test_prepare-parser.py b/test/test_functional/test_prepare-parser.py new file mode 100644 index 0000000000000000000000000000000000000000..b05717101897e61ef17b9d980e29b6751b417bf3 --- /dev/null +++ b/test/test_functional/test_prepare-parser.py @@ -0,0 +1,400 @@ +#!/usr/bin/env python3 +# coding: utf-8 + +""" +Functional tests for the parser of prepare subcommand +""" +import argparse +import pytest + +from PanACoTA.subcommands import prepare + + +def test_parser_noarg(capsys): + """ + Test that when the script is called without any argument, an error message appears, + indicating the required arguments.
+ """ + parser = argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "".split()) + _, err = capsys.readouterr() + assert "error: " in err + assert ("As you did not put the '--norefseq' nor the '-M' option, it means that you want " + "to download refseq genomes. But you did not provide any information, so PanACoTA " + "cannot guess which species you want to download. Specify NCBI_taxid and/or " + "NCBI_species to download, or add one of the 2 options (--norefseq or -M) " + "if you want to skip the 'download step'.") in err + + +def test_cutn_noint(capsys): + """ + Test that when user is giving a number of 'N' from which to cut which is: + - not a number + - not an int + - <0 + it gives error message + """ + parser = argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + # Not a number + with pytest.raises(SystemExit): + prepare.parse(parser, "--cutn ten".split()) + _, err = capsys.readouterr() + assert "error: argument --cutn: invalid int value: 'ten'" in err + # Not an int + with pytest.raises(SystemExit): + prepare.parse(parser, "--cutn 1.5".split()) + _, err = capsys.readouterr() + assert "error: argument --cutn: invalid int value: '1.5'" in err + # Negative number + with pytest.raises(SystemExit): + prepare.parse(parser, "--cutn -5".split()) + _, err = capsys.readouterr() + assert "error: argument --cutn must be a positive integer: invalid int value: '-5'" in err + + +def test_l90_noint(capsys): + """ + Test that when user is giving a number for max L90 which is not valid: + - not a number + - not an int + it gives error message + """ + parser = argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + # Not a number + with pytest.raises(SystemExit): + prepare.parse(parser, "--l90 ten".split()) + _, err = capsys.readouterr() + assert "error: argument --l90: 
invalid int value: 'ten'" in err + # Not an int + with pytest.raises(SystemExit): + prepare.parse(parser, "--l90 1.5".split()) + _, err = capsys.readouterr() + assert "error: argument --l90: invalid int value: '1.5'" in err + + +def test_parser_negative_cont(capsys): + """ + Test that when the script is called with a limit of contig number <0, + it returns an error message + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "--nbcont -5".split()) + _, err = capsys.readouterr() + assert "The maximum number of contigs allowed must be a positive number." in err + + +def test_parser_high_cont(capsys): + """ + Test that when the script is called with a limit of contig number above 9999, + it returns an error message + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "--nbcont 10005".split()) + _, err = capsys.readouterr() + assert "We do not support genomes with more than 9999 contigs."
in err + + +def test_parser_wrong_cont(capsys): + """ + Test that when the script is called with a non integer limit of contig number, + it returns an error message + """ + parser = argparse.ArgumentParser(description="prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "--nbcont 10.5".split()) + _, err = capsys.readouterr() + assert "argument --nbcont: invalid int value: 10.5" in err + + +def test_parser_wrong_level(capsys): + """ + Test that when the script is called with an unknown assembly level, + it returns an error message + """ + parser = argparse.ArgumentParser(description="prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-t 1234 -o toto -l toto".split()) + _, err = capsys.readouterr() + assert ("Please choose between available assembly levels: 'all', 'complete', " + "'chromosome', 'scaffold', 'contig'. If several levels, provide a " + "comma-separated list. Invalid value: 'toto'") in err + + +def test_parser_wrong_level_notcomma(capsys): + """ + Test that when the script is called with assembly levels not separated by a comma, + it returns an error message + """ + parser = argparse.ArgumentParser(description="prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-t 1234 -o outdir -l complete.scaffold".split()) + _, err = capsys.readouterr() + assert ("Please choose between available assembly levels: 'all', 'complete', " + "'chromosome', 'scaffold', 'contig'. If several levels, provide a " + "comma-separated list.
Invalid value: 'complete.scaffold'") in err + + +def test_max_mash_dist(capsys): + """ + Test that when user is giving a number for max_dist which is not valid: + - not a number + - > 1 + - <0 + it gives error message + """ + parser = argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + # Not a number + with pytest.raises(SystemExit): + prepare.parse(parser, "--max_dist ten".split()) + _, err = capsys.readouterr() + assert "error: mash distance: invalid float value: 'ten'" in err + # > 1 + with pytest.raises(SystemExit): + prepare.parse(parser, "--max_dist 1.5".split()) + _, err = capsys.readouterr() + assert "error: mash distance must be between 0 and 1: invalid value: '1.5'" in err + # < 0 + with pytest.raises(SystemExit): + prepare.parse(parser, "--max_dist -0.5".split()) + _, err = capsys.readouterr() + assert "error: mash distance must be between 0 and 1: invalid value: '-0.5'" in err + + +def test_min_mash_dist(capsys): + """ + Test that when user is giving a number for max_dist which is not valid: + - not a number + - > 1 + - <0 + it gives error message + """ + parser = argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + # Not a number + with pytest.raises(SystemExit): + prepare.parse(parser, "--min_dist ten".split()) + _, err = capsys.readouterr() + assert "error: mash distance: invalid float value: 'ten'" in err + # > 1 + with pytest.raises(SystemExit): + prepare.parse(parser, "--min_dist 1.5".split()) + _, err = capsys.readouterr() + assert "error: mash distance must be between 0 and 1: invalid value: '1.5'" in err + # < 0 + with pytest.raises(SystemExit): + prepare.parse(parser, "--min_dist -0.5".split()) + _, err = capsys.readouterr() + assert "error: mash distance must be between 0 and 1: invalid value: '-0.5'" in err + + +def test_min_sup_max(capsys): + ''' + Test that we get an error message if min_dist > max_dist + ''' + parser = 
argparse.ArgumentParser(description="Prepare genomes", add_help=False) + prepare.build_parser(parser) + # Not a number + with pytest.raises(SystemExit): + prepare.parse(parser, "--min_dist 0.9 --max_dist=0.8 --norefseq -o toto".split()) + _, err = capsys.readouterr() + assert "min_dist (0.9) cannot be higher than max_dist (0.8)" in err + + +def test_parser_wrong_thread(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-p 10.5".split()) + _, err = capsys.readouterr() + assert "argument --threads threads: invalid int value: 10.5" in err + # Negative number of threads + with pytest.raises(SystemExit): + prepare.parse(parser, "-p -1".split()) + _, err = capsys.readouterr() + assert ("Please provide a positive number of threads (or 0 for all threads): " + "Invalid value: -1") in err + + +def test_parser_more_threads(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. + """ + import multiprocessing + nb_cpu = multiprocessing.cpu_count() + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-p 30000".split()) + _, err = capsys.readouterr() + assert (f"You have {nb_cpu} threads on your computer, you cannot ask for more: " + "invalid value: 30000") in err + + +def test_parser_all_threads(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. 
+ """ + import multiprocessing + nb_cpu = multiprocessing.cpu_count() + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + options = prepare.parse(parser, "-p 0 --norefseq -o toto".split()) + assert options.parallel == nb_cpu + assert options.no_refseq == True + assert options.only_mash == False + + +def test_parse_missing_arg(capsys): + """ + running prepare without NCBI info nor mash_only nor norefseq -> error asking one of those + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-p 1".split()) + _, err = capsys.readouterr() + assert ("As you did not put the '--norefseq' nor the '-M' option, it means that " + "you want to download refseq genomes. But you did not provide any " + "information, so PanACoTA cannot guess which species you want to download. " + "Specify NCBI_taxid and/or NCBI_species to download, or add one of " + "the 2 options (--norefseq or -M) if you want to skip the 'download step'.") in err + + +def test_norefseq_nooutdir(capsys): + """ + Try running without refseq, but not giving an output directory + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "--norefseq".split()) + _, err = capsys.readouterr() + assert ("You must provide an output directory, where your results will be saved.") in err + + +def test_onlymash_noinfo(capsys): + """ + Try running without refseq, but not giving an output directory + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-M".split()) + _, err = capsys.readouterr() + assert ("If you want to run only Mash filtering steps, please give the info file with " + "the required information (see '--info' option") in err + + 
+def test_onlymash_nooutdir(capsys): + """ + Try running without refseq, but not giving an output directory + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-M --info toto ".split()) + _, err = capsys.readouterr() + assert ("If you want to run only Mash filtering steps, please give the output " + "directory where you want to save your results (see '-o' option)") in err + + +def test_verbose_quiet(capsys): + """ + Try running without refseq, but not giving an output directory + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + with pytest.raises(SystemExit): + prepare.parse(parser, "-q -vv -M --info toto -o outdir".split()) + _, err = capsys.readouterr() + assert ("Choose between a verbose output (-v) or a quiet output (-q). " + "You cannot have both.") in err + + +def test_parser_nospecies(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + options = prepare.parse(parser, "-t 1234 -o outdir".split()) + assert not options.no_refseq + assert not options.only_mash + assert options.NCBI_species_taxid == "1234" + assert options.NCBI_species == "" + out, err = capsys.readouterr() + assert ("WARNING: you did not provide a species name ('-s species' option'). " + "All files will be downloaded in a folder called with the NCBI species " + "taxid 1234 instead of the species name.") in out + + +def test_parser_default_cutn(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. 
+ """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + options = prepare.parse(parser, "-t 1234 -o outdir -s species".split()) + assert not options.no_refseq + assert not options.only_mash + assert options.NCBI_species_taxid == "1234" + assert options.NCBI_species == "species" + out, err = capsys.readouterr() + assert ("!! Your genomes will be split when sequence contains at " + "least 5'N' in a row. If you want to change this threshold, use " + "'--cutn n' option (n=0 if you do not want to cut)") in out + + +def test_parser_default_l90_nb_cont(capsys): + """ + Test that when the user does not give an int for the threads value, it returns an + error message. + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + options = prepare.parse(parser, "-t 1234 -o outdir -s species --cutn 1".split()) + assert not options.no_refseq + assert not options.only_mash + assert options.NCBI_species_taxid == "1234" + assert options.NCBI_species == "species" + out, err = capsys.readouterr() + assert ("!! Your genomes will be filtered, and only the ones with 'L90' <= 100 " + "and 'number of contigs' < 999 will be kept. If you want to change those " + "thresholds, use '--l90' and '--nbcont' options.") in out + + +def test_parser_info_notonlymash(capsys): + """ + Giving an info file, but not asking for only_mash -> useless info file + """ + parser = argparse.ArgumentParser(description="Prepare", add_help=False) + prepare.build_parser(parser) + options = prepare.parse(parser, "-t 1234 -o outdir -s species --cutn 1 --info toto".split()) + assert not options.no_refseq + assert not options.only_mash + assert options.NCBI_species_taxid == "1234" + assert options.NCBI_species == "species" + out, err = capsys.readouterr() + assert ("!! You gave an info file (--info option), but did not ask to run only Mash " + "step (-M option). 
Your info file will be ignored (and renamed with '.back' " + "at the end), and another one will be created with the new calculated values.") in out diff --git a/test/test_functional/test_prepare.py b/test/test_functional/test_prepare.py new file mode 100644 index 0000000000000000000000000000000000000000..4a84da725e45cc45dea21e0b0ddbaeccc2dd5f06 --- /dev/null +++ b/test/test_functional/test_prepare.py @@ -0,0 +1,571 @@ +#!/usr/bin/env python3 +# coding: utf-8 + +""" +Functional tests for genomeAPCAT annotate +""" + +from PanACoTA.subcommands import prepare +import test.test_unit.utilities_for_tests as tutil + +import pytest +import os +import subprocess +import shutil +import time +import argparse +import logging +import glob + + +# LOGFILE_BASE = "test_main_from_parse" +# Define variables used by several tests +DBDIR = os.path.join("test", "data", "prepare") +GEN_PATH = os.path.join(DBDIR, "genomes") +TEST_DIR = os.path.join(DBDIR, 'test_files') +GENEPATH = os.path.join(DBDIR, "generated_by_func-tests") + + +@pytest.fixture(autouse=True) +def setup_teardown_module(): + """ + Remove log files at the end of this test module + + Before each test: + - init logger + - create directory to put generated files + + After: + - remove all log files + - remove directory with generated results + """ + if not os.path.isdir(GENEPATH): + print("setup") + os.mkdir(GENEPATH) + print("setup") + + yield + shutil.rmtree(GENEPATH, ignore_errors=True) + print("teardown") + + +def test_main_from_parse(): + """ + Run + """ + args = argparse.Namespace() + args.argv = ["prepare", "test_func_prepare"] + args.NCBI_species = "Acetobacter orleanensis" + args.NCBI_species_taxid = "104099" + args.outdir = GENEPATH + args.tmp_dir = "" + args.parallel = 1 + args.no_refseq = False + args.db_dir = "" + args.only_mash = False + args.from_info = "" + args.l90 = 100 + args.nbcont = 999 + args.cutn = 0 + args.min_dist = 1e-4 + args.max_dist = 0.06 + args.verbose = 0 + args.quiet = False + args.levels = "" 
+ + prepare.main_from_parse(args) + + # Check output files + summary = os.path.join(GENEPATH, "assembly_summary-Acetobacter_orleanensis.txt") + assert os.path.isfile(summary) + # Check that the NCBI_genome_download output directory exists + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + # And that it contains folders + assert os.path.isdir(ngd_outdir) + assert len(os.listdir(ngd_outdir)) >= 4 + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty as we do not split + tmp_folder = os.listdir(os.path.join(GENEPATH, "tmp_files")) + assert len(tmp_folder) == 0 + # Check Database_init folder created, with at list 4 ".fna" genomes + fna_files = glob.glob(os.path.join(GENEPATH, "Database_init", "*.fna")) + assert len(fna_files) >= 4 + + +def test_main_not_only_mash_infoexists(): + """ + We run without option only_mash, but still provide a lstinfo file + -> will change its name to .back to save it when the new file will be created + """ + NCBI_species = "" + NCBI_taxid = "104099" + levels = "" + outdir = GENEPATH + tmp_dir = os.path.join(outdir, "temporary_directory") + threads = 1 + no_refseq = False + db_dir = "" + only_mash = False + info_file = os.path.join(outdir, "LSTINFO-existing.lst") + open(info_file, "w").close() #create empty info file, to check it is renamed + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + + # Check output files + summary = os.path.join(GENEPATH, "assembly_summary-104099.txt") + assert os.path.isfile(summary) + # Check that the NCBI_genome_download output directory exists + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + # And that it contains folders + assert 
os.path.isdir(ngd_outdir) + assert len(os.listdir(ngd_outdir)) >= 4 + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty as we do not split + tmp_files = glob.glob(os.path.join(tmp_dir, "*.fna_prepare-split5N.fna")) + assert len(tmp_files) >= 4 + # Check Database_init folder created, with at list 4 ".fna" genomes + fna_files = glob.glob(os.path.join(GENEPATH, "Database_init", "*.fna")) + assert len(fna_files) >= 4 + # Check that LSTINFO file existing was renamed and still empty + # And new LSTINFO file created + assert os.path.isfile(info_file + ".back") + assert os.stat(info_file + ".back").st_size == 0 + + +def test_main_wrong_taxid(capsys): + """ + We run without option only_mash, but still provide a lstinfo file + -> will change its name to .back to save it when the new file will be created + """ + NCBI_species = "" + NCBI_taxid = "123" + levels = "" + outdir = "" + tmp_dir = os.path.join("123", "temporary_directory") + threads = 1 + no_refseq = False + info_file = "" + db_dir = "" + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + res_outdir = "123" + with pytest.raises(SystemExit): + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + _, err = capsys.readouterr() + assert ("Could not download genomes. Check that you gave valid NCBI taxid and/or " + "NCBI species name. 
If you gave both, check that given taxID and name really " + "correspond to the same species.") in err + # Check output files + summary = os.path.join(res_outdir, "assembly_summary-104099.txt") + assert not os.path.isfile(summary) + ngd_outdir = os.path.join(res_outdir, "refseq", "bacteria") + assert not os.path.isdir(ngd_outdir) + # # Check logfiles are here + log_files = glob.glob(os.path.join(res_outdir, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty asnothing is downloaded + assert len(os.listdir(tmp_dir)) == 0 + # Check Database_init folder created, with at list 4 ".fna" genomes + assert not os.path.isdir(os.path.join(res_outdir, "Database_init")) + + # Remove output directory + shutil.rmtree(res_outdir, ignore_errors=True) + + +def test_main_norefseq_wrongdbpath(capsys): + """ + We run with option no_refseq, but given db_dir does not exist. + -> error message + """ + NCBI_species = "" + NCBI_taxid = "123" + levels = "" + outdir = GENEPATH + tmp_dir = os.path.join(outdir, "temporary_directory") + threads = 1 + no_refseq = True + db_dir = "dbdir" + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 15 + quiet = False + info_file = "" + with pytest.raises(SystemExit): + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + _, err = capsys.readouterr() + assert ("You asked to skip refseq downloads") in err + assert ("Database folder dbdir supposed to contain fasta sequences does not exist. 
Please " + "give a valid folder, or leave the default directory (no '-d' option)") in err + # Check output files + summary = os.path.join(GENEPATH, "assembly_summary-104099.txt") + assert not os.path.isfile(summary) + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + assert not os.path.isdir(ngd_outdir) + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 4 #.log.debug as we put verbose = 15 + # Check tmp files folder created, but empty asnothing is downloaded + assert len(os.listdir(tmp_dir)) == 0 + # Check Database_init folder created, with at list 4 ".fna" genomes + assert not os.path.isdir(os.path.join(GENEPATH, "Database_init")) + + +def test_main_norefseq_nodefault_dbdir_nor_refseq(capsys): + """ + We run with option no_refseq, but given db_dir does not exist. + -> error message + """ + NCBI_species = "" + NCBI_taxid = "123" + levels = "" + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = True + db_dir = "" + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + info_file = "" + with pytest.raises(SystemExit): + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + _, err = capsys.readouterr() + assert ("You asked to skip refseq downloads") in err + assert ("Database folder test/data/prepare/generated_by_func-tests/Database_init supposed " + "to contain fasta sequences does not exist. We will check if the download folder " + "(with compressed sequences) exists.") in err + assert ("Folder test/data/prepare/generated_by_func-tests/refseq/bacteria " + "does not exist. You do not have any genome to analyse. 
Possible reasons:\n" + "- if you want to rerun analysis in the same folder as " + "sequences were downloaded (my_outdir/Database_init or " + "my_outdir/refseq), make sure you have '-o my_outdir' option\n" + "- if you want to rerun analysis and save them in a new " + "output folder called 'new_outdir', make sure you have '-o new_outdir' option, " + "and you specified where the uncompressed sequences to use are " + "('-d sequence_database_path'") in err + # # Check output files + summary = os.path.join(GENEPATH, "assembly_summary-104099.txt") + assert not os.path.isfile(summary) + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + assert not os.path.isdir(ngd_outdir) + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty asnothing is downloaded + assert len(os.listdir(os.path.join(GENEPATH, "tmp_files"))) == 0 + # Check Database_init folder created, with at list 4 ".fna" genomes + assert not os.path.isdir(os.path.join(GENEPATH, "Database_init")) + + +def test_main_norefseq_nodefault_dbdir_but_refseq(capsys): + """ + We run with option no_refseq, but given db_dir does not exist. 
+ -> error message + """ + NCBI_species = "" + NCBI_taxid = "123" + levels = "" + # Copy refseq/bacteria and content into outdirectory + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = True + orig_dbdir = os.path.join(GEN_PATH, "refseq") + refseq_db_dir = os.path.join(GENEPATH, "refseq") + shutil.copytree(orig_dbdir, refseq_db_dir) + db_dir = "" + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 0 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + info_file = "" + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to skip refseq downloads") in err + assert ("Database folder test/data/prepare/generated_by_func-tests/" + "Database_init supposed " + "to contain fasta sequences does not exist. We will check if the download folder " + "(with compressed sequences) exists.") in err + assert ("Uncompressing genome files") in out + assert ("Total number of genomes for 123: 3") in out + assert ("Computing pairwise distances between all genomes") in out + assert ("Final number of genomes in dataset: 1") in out + # Check output files + # Check that the NCBI_genome_download output directory exists + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + # And that it contains folders + assert os.path.isdir(ngd_outdir) + assert len(os.listdir(ngd_outdir)) == 3 + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty as we do not split + tmp_folder = os.listdir(os.path.join(GENEPATH, "tmp_files")) + assert len(tmp_folder) == 0 + # Check Database_init folder created, with the 3 ".fna" genomes + fna_files = glob.glob(os.path.join(GENEPATH, "Database_init", "*.fna")) + assert len(fna_files) == 3 + + +def test_main_norefseq_defaultdbdir(capsys): + """ + We run 
with option no_refseq, but given db_dir does not exist. + -> error message + """ + NCBI_species = "" + NCBI_taxid = "123" + levels = "" + # Copy refseq/bacteria and content into outdirectory + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = True + orig_dbdir = os.path.join(GEN_PATH, "genomes_comparison") + refseq_db_dir = os.path.join(GENEPATH, "Database_init") + shutil.copytree(orig_dbdir, refseq_db_dir) + db_dir = "" + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 0 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + info_file = "" + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to skip refseq downloads") in err + assert ("Total number of genomes for 123: 5") in out + assert ("Computing pairwise distances between all genomes") in out + assert ("Final number of genomes in dataset: 1") in out + # Check output files + # Check that the NCBI_genome_download output directory exists + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + assert not os.path.isdir(ngd_outdir) + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty as we do not split + tmp_folder = os.listdir(os.path.join(GENEPATH, "tmp_files")) + assert len(tmp_folder) == 0 + # Check Database_init folder created, with the 3 ".fna" genomes + fna_files = glob.glob(os.path.join(GENEPATH, "Database_init", "*.fna")) + assert len(fna_files) == 5 + + +def test_main_norefseq_givendbdir(capsys): + """ + We run with option no_refseq, but given db_dir does not exist. 
+ -> error message + """ + NCBI_species = "" + NCBI_taxid = "" + levels = "" + # Copy refseq/bacteria and content into outdirectory + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = True + orig_dbdir = os.path.join(GEN_PATH, "genomes_comparison") + refseq_db_dir = os.path.join(GENEPATH, "genomes_comparison") + shutil.copytree(orig_dbdir, refseq_db_dir) + db_dir = refseq_db_dir + only_mash = False + l90 = 100 + nbcont = 999 + cutn = 2 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 2 + quiet = False + info_file = "" + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to skip refseq downloads") in err + assert ("Total number of genomes for NA: 5") in out + assert ("Computing pairwise distances between all genomes") in out + assert ("Final number of genomes in dataset: 1") in out + # Check output files + # Check that the NCBI_genome_download output directory exists + ngd_outdir = os.path.join(GENEPATH, "refseq", "bacteria") + assert not os.path.isdir(ngd_outdir) + # Check logfiles are here + log_files = glob.glob(os.path.join(GENEPATH, "*log*")) + assert len(log_files) == 3 + # Check tmp files folder created, but empty as we do not split + tmp_files = glob.glob(os.path.join(GENEPATH, "tmp_files", "*.fna_prepare-split2N.fna")) + assert len(tmp_files) == 5 + + +def test_only_mash(capsys): + """ + Running only mash step (giving genomes and corresponding LSTINFO file) + """ + NCBI_species = "" + NCBI_taxid = "" + levels = "" + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = False + db_dir = "" + only_mash = True + info_file = os.path.join(TEST_DIR, "test_lstinfo_onlymash.lst") + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 1 + quiet = False + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, 
no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to run only mash steps") in err + assert ("You want to run only mash steps. Getting information from " + "test/data/prepare/test_files/test_lstinfo_onlymash.lst") in out + assert ("Found 5 genomes in total") in out + assert ("Computing pairwise distances between all genomes") in out + assert ("Sorting all 5 genomes by quality") in out + assert ("Final number of genomes in dataset: 1") in out + + # Check output files + assert len(os.listdir(os.path.join(outdir, "tmp_files"))) == 0 + # Check logfiles are here + log_files = glob.glob(os.path.join(outdir, "*log*")) + assert len(log_files) == 3 + # Check content of output lstinfo file + out_lst = os.path.join(outdir, "LSTINFO-NA-filtered-0.0001_0.06.txt") + exp_lst = os.path.join(DBDIR, "exp_files", "exp_lstinfo_run_only-mash.lst") + assert tutil.compare_order_content(out_lst, exp_lst) + + +def test_only_mash_empty_lstinfo(capsys): + """ + Running only mash step giving an empty lstinfo file -> error, no genome found + """ + NCBI_species = "" + NCBI_taxid = "" + levels = "" + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = False + db_dir = "" + only_mash = True + # Create empty lstinfo file + info_file = os.path.join(GENEPATH, "LSTINFO-empty.lst") + open(info_file, "w").close() + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 1 + quiet = False + with pytest.raises(SystemExit): + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to run only mash steps") in err + assert ("You want to run only mash steps. 
Getting information from " + "test/data/prepare/generated_by_func-tests/LSTINFO-empty.lst") in out + assert ("No genome listed in test/data/prepare/generated_by_func-tests/LSTINFO-empty.lst " + "was found.") in err + + # Check output files + assert len(os.listdir(os.path.join(outdir, "tmp_files"))) == 0 + # Check logfiles are here + log_files = glob.glob(os.path.join(outdir, "*log*")) + assert len(log_files) == 3 + # Check lstinfo file is still here and still empty + assert os.stat(info_file).st_size == 0 + + +def test_only_mash_no_lstinfo(capsys): + """ + Running only mash step giving an info file which does not exist -> error missing infofile + """ + NCBI_species = "" + NCBI_taxid = "" + levels = "" + outdir = GENEPATH + tmp_dir = "" + threads = 1 + no_refseq = False + db_dir = "" + only_mash = True + # Create empty lstinfo file + info_file = "info_file.lst" + l90 = 100 + nbcont = 999 + cutn = 5 + min_dist = 1e-4 + max_dist = 0.06 + verbose = 1 + quiet = False + with pytest.raises(SystemExit): + prepare.main("cmd", NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_refseq, + db_dir, only_mash, info_file, l90, nbcont, cutn, min_dist, max_dist, + verbose, quiet) + out, err = capsys.readouterr() + assert ("You asked to run only mash steps") in err + assert ("Your info file info_file.lst does not exist. 
Please provide the " + "right name/path, or remove the '--mash-only option to rerun " + "quality control.") in err + + # Check output files + assert len(os.listdir(os.path.join(outdir, "tmp_files"))) == 0 + # Check logfiles are here + log_files = glob.glob(os.path.join(outdir, "*log*")) + assert len(log_files) == 3 + # Check that outdir contains only 4 elements: 3 logs + tmp_files repo + files = os.listdir(outdir) + files = [f for f in files if "fuse" not in f] + assert len(files) == 4 diff --git a/test/test_unit/test_annotate/test_annotation_functions-prodigal.py b/test/test_unit/test_annotate/test_annotation_functions-prodigal.py index 027e4c46eabee71815216bc287a558f1ab3b7ca0..5efd57fc152e0081b685cce3124bfaaca1c79ec9 100644 --- a/test/test_unit/test_annotate/test_annotation_functions-prodigal.py +++ b/test/test_unit/test_annotate/test_annotation_functions-prodigal.py @@ -12,7 +12,7 @@ import shutil import test.test_unit.utilities_for_tests as tutil import PanACoTA.utils as utils -import PanACoTA.annotate_module.annotation_functions as afunc +from PanACoTA.annotate_module import annotation_functions as afunc # Define variables used by several tests @@ -39,14 +39,19 @@ def setup_teardown_module(): - remove all log files - remove directory with generated results """ - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield for f in LOGFILES: if os.path.exists(f): os.remove(f) - shutil.rmtree(GENEPATH) + shutil.rmtree(GENEPATH, ignore_errors=True) print("teardown") @@ -89,494 +94,438 @@ def test_check_prodigal_nofaa(): assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) msg = "prodigal_out_for_test-missfaa original_name.fna: no or several .faa file(s)" q = logger[0] - assert q.qsize() == 2 + assert q.qsize() == 1 assert q.get().message == msg - assert q.get().message == "no faa" - - -# def test_check_prodigal_sevfaa(): -# """ -# 
Check that check_prodigal returns false when there is more than 1 faa file, -# and an error message -# """ -# logger = my_logger("test_check_prodigal_sevfaa") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "out_test_nofaa") -# name = "prodigal_out_for_test-missfaa" -# os.makedirs(out_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + "2.faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = "prodigal_out_for_test-missfaa original_name.fna: several .faa files" -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_noffn(): -# """ -# Check that check_prodigal returns false when a ffn file is missing, and an error message -# """ -# logger = my_logger("test_check_prodigal_noffn") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "out_test_noffn") -# name = "prodigal_out_for_test-missffn" -# os.makedirs(out_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# 
os.path.join(out_dir, name + ".gff")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = "prodigal_out_for_test-missffn original_name.fna: no .ffn file" -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_sevffn(): -# """ -# Check that check_prodigal returns false when there is more than 1 ffn file, -# and an error message -# """ -# logger = my_logger("test_check_prodigal_sevffn") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "out_test_noffn") -# name = "prodigal_out_for_test-missffn" -# os.makedirs(out_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + "2.ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = "prodigal_out_for_test-missffn original_name.fna: several .ffn files" -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_nogff(): -# """ -# Check that check_prodigal returns false when a ffn file is missing, and an error message -# """ -# logger = my_logger("test_check_prodigal_nogff") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = 
"prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "out_test_noffn") -# name = "prodigal_out_for_test-missgff" -# os.makedirs(out_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = "prodigal_out_for_test-missgff original_name.fna: no .gff file" -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_sevgff(): -# """ -# Check that check_prodigal returns false when there is more than 1 ffn file, -# and an error message -# """ -# logger = my_logger("test_check_prodigal_sevgff") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "out_test_noffn") -# name = "prodigal_out_for_test-sevgff" -# os.makedirs(out_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + "2.gff")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = 
"prodigal_out_for_test-sevgff original_name.fna: several .gff files" -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_wrong_cont(): -# """ -# Check that check_prodigal returns an error message when the number of contigs in tbl -# file is not as expected -# """ -# logger = my_logger("test_check_prodigal_wrong_cont") -# outdir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# name = "prodigal_out_for_test" -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 10 -# assert not afunc.check_prodigal(outdir, logf, name, gpath, nbcont, logger[1]) -# msg = ("prodigal_out_for_test original_name.fna: no matching number of contigs; " -# "nbcontig=10; in tbl =7") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_wrong_tbl_cds(): -# """ -# Check that check_prodigal returns an error message when the number of CDS in tbl -# file is different from the number of headers in faa file -# """ -# logger = my_logger("test_check_prodigal_wrong_tbl_cds") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "res_checkprodigalWrongTbl") -# os.makedirs(out_dir) -# name = "prodigal_out_for_test-wrongCDS" -# tblfile = os.path.join(TEST_DIR, name + ".tbl") -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) - -# shutil.copyfile(tblfile, os.path.join(out_dir, name + ".tbl")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) 
-# msg1 = ("prodigal_out_for_test-wrongCDS original_name.fna: " -# "no matching number of proteins between tbl and faa; " -# "faa=13; in tbl =12") -# msg2 = ("prodigal_out_for_test-wrongCDS original_name.fna: " -# "no matching number of genes between tbl and ffn; " -# "ffn=17; in tbl =14genes 2CRISPR") -# q = logger[0] -# assert q.qsize() == 2 -# assert q.get().message == msg1 -# assert q.get().message == msg2 - - -# def test_check_prodigal_wrong_tbl_crispr(): -# """ -# Check that check_prodigal returns an error message when the number of headers in ffn -# file is different from the number of CDS + CRISPR in tbl file (1CRISPR in tbl, 2 in ffn) -# """ -# logger = my_logger("test_check_prodigal_wrong_tbl_crispr") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "res_checkprodigalWrongCRISPR") -# os.makedirs(out_dir) -# name = "prodigal_out_for_test-wrongtblCRISP" -# tblfile = os.path.join(TEST_DIR, name + ".tbl") -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(out_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) -# shutil.copyfile(tblfile, os.path.join(out_dir, name + ".tbl")) -# logf = "prodigal.log" -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert not afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) -# msg = ("prodigal_out_for_test-wrongtblCRISP original_name.fna: " -# "no matching number of genes between tbl and ffn; " -# "ffn=17; in tbl =15genes 1CRISPR") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_check_prodigal_tbl_crispr_newversion(): -# """ -# Check that check_prodigal does not return an error message when the number of headers in ffn -# file is equal to the 
number of CDS in tbl file (1CRISPR in tbl, 0 in ffn), but -# does not contain the CRISPRs found in tbl -# As the new version of prodigal (1.12) does not put crisprs in .ffn -# """ -# logger = my_logger("test_check_prodigal_tbl_crispr_newversion") -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# out_dir = os.path.join(GENEPATH, "res_checkprodigalWrongCRISPRnewversion") -# os.makedirs(out_dir) -# name = "prodigal_out_for_test-wrongtblCRISPnewversion" -# ffnfile = os.path.join(TEST_DIR, name + ".ffn") -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), -# os.path.join(out_dir, name + ".tbl")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(out_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(out_dir, name + ".gff")) -# shutil.copyfile(ffnfile, os.path.join(out_dir, name + ".ffn")) -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert afunc.check_prodigal(out_dir, logf, name, gpath, nbcont, logger[1]) - - -# def test_check_prodigal_ok(): -# """ -# Check that everything is ok with prodigal results (tbl, faa and ffn files exist, -# and number of CDS, CRISPR and genes correspond between them) -# """ -# logger = my_logger("test_check_prodigal_ok") -# outdir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# name = "prodigal_out_for_test" -# logf = os.path.join(GENEPATH, "prodigal.log") -# gpath = "path/to/nogenome/original_name.fna" -# nbcont = 7 -# assert afunc.check_prodigal(outdir, logf, name, gpath, nbcont, logger[1]) - - -# def test_run_prodigal_out_exists_ok(): -# """ -# Test that when the output directory already exists, and files inside are OK, -# run_prodigal returns True, with a warning message indicating that prodigal did not rerun. 
-# """ -# logger = my_logger("test_run_prodigal_out_exists_ok") -# utils.init_logger(LOGFILE_BASE, 0, 'prodigal_out_exists_ok') -# gpath = "path/to/nogenome/original_name.fna" -# cores_prodigal = 1 -# name = "prodigal_out_for_test" -# force = False -# nbcont = 7 -# arguments = (gpath, TEST_DIR, cores_prodigal, name, force, nbcont, None, logger[0]) -# assert afunc.run_prodigal(arguments) - -# q = logger[0] -# assert q.qsize() == 4 -# # start annotating : -# assert q.get().message.startswith("Start annotating") -# # # warning prodigal results folder exists: -# assert q.get().message.startswith("prodigal results folder test/data/annotate/test_files/" -# "original_name.fna-prodigalRes already exists.") -# # Results in result folder are ok -# assert q.get().message.startswith("prodigal did not run again, formatting step used already " -# "generated results of prodigal in " -# "test/data/annotate/test_files/original_name.fna-prodigalRes.") -# # End annotation: -# assert q.get().message.startswith("End annotating") - - -# def test_run_prodigal_out_exists_error(): -# """ -# Test that when the output directory already exists, and 1 file is missing, -# run_prodigal returns False, and writes the warning message saying that prodigal did not -# rerun, + the warning message for the missing file(s). 
-# """ -# logger = my_logger("test_run_prodigal_out_exists_error") -# utils.init_logger(LOGFILE_BASE, 0, 'prodigal_out_error') -# ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") -# ori_name = "prodigal_out_for_test" -# new_prok_dir = os.path.join(GENEPATH, "original_name-error-prodigalRes") -# name = "prodigal_out_for_test-wrongCDS" -# os.makedirs(new_prok_dir) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), -# os.path.join(new_prok_dir, name + ".ffn")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), -# os.path.join(new_prok_dir, name + ".faa")) -# shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), -# os.path.join(new_prok_dir, name + ".gff")) -# gpath = "path/to/nogenome/original_name-error" -# cores_prodigal = 1 -# force = False -# nbcont = 7 -# arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, None, logger[0]) -# assert not afunc.run_prodigal(arguments) -# q = logger[0] -# # assert q.qsize() == 4 -# # start annotating : -# assert q.get().message.startswith("Start annotating") -# # warning prodigal results folder exists: -# assert q.get().message == ("prodigal results folder test/data/annotate/generated_by_unit-tests/" -# "original_name-error-prodigalRes already exists.") -# # error, no tbl file -# msg = "prodigal_out_for_test-wrongCDS original_name-error: no .tbl file" -# assert q.get().message == msg -# # warning, files in outdir are not as expected -# assert q.get().message.startswith("Problems in the files contained in your already existing " -# "output dir ") - - -# def test_run_prodigal_out_exists_force(): -# """ -# Test that when the output directory already exists with wrong files, but force is on, -# prodigal is rerun and outputs the right files -# """ -# logger = my_logger("test_run_prodigal_out_exists_force") -# utils.init_logger(LOGFILE_BASE, 0, 'force') -# gpath = os.path.join(GEN_PATH, "H299_H561.fasta") -# out_prokdir = os.path.join(GENEPATH, 
"H299_H561.fasta-prodigalRes") -# name = "test_runprodigal_H299" -# # Put empty tbl, faa, ffn files in prodigal output dir, to check that they are overridden -# os.makedirs(out_prokdir) -# open(os.path.join(out_prokdir, name + ".tbl"), "w").close() -# open(os.path.join(out_prokdir, name + ".faa"), "w").close() -# open(os.path.join(out_prokdir, name + ".ffn"), "w").close() -# cores_prodigal = 2 -# force = True -# nbcont = 3 -# arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, None, logger[0]) -# assert afunc.run_prodigal(arguments) -# # As we used 'force', tbl, faa and ffn files, which were empty, must have been replaced -# # by the prodigal output -# exp_dir = os.path.join(EXP_DIR, "H299_H561.fasta-short-contig.fna-prodigalRes", -# "test_runprodigal_H299") -# out_tbl = os.path.join(out_prokdir, name + ".tbl") -# out_faa = os.path.join(out_prokdir, name + ".faa") -# out_ffn = os.path.join(out_prokdir, name + ".ffn") -# assert os.path.isfile(out_tbl) -# # For tbl file, check that, at least, the 3 contigs were considered, -# # and that the number of CDS is as expected. -# # Before, we checked that the output -# # was exactly as expected. But it changes with the different versions of prodigal, so -# # we cannot compare the whole file. 
-# with open(out_tbl, "r") as outt: -# lines = [line.strip() for line in outt.readlines()] -# assert ">Feature H561_S27" in lines -# assert ">Feature H561_S28" in lines -# assert ">Feature H561_S29" in lines -# CDS = 0 -# for line in lines: -# if "CDS" in line: -# CDS += 1 -# assert CDS == 16 -# # Check that faa and ffn files are as expected -# assert os.path.isfile(out_faa) -# tutil.compare_order_content(exp_dir + ".faa", out_faa) -# assert os.path.isfile(out_ffn) -# tutil.compare_order_content(exp_dir + ".ffn", out_ffn) -# q = logger[0] -# # assert q.qsize() == 3 -# assert q.get() .message.startswith("Start annotating test_runprodigal_H299 from test/data/" -# "annotate/genomes/H299_H561.fasta with prodigal") -# assert q.get() .message == ("prodigal results folder already exists, but removed because " -# "--force option used") -# assert q.get().message == ("prodigal command: prodigal " -# "--outdir test/data/annotate/generated_by_unit-tests/" -# "H299_H561.fasta-prodigalRes --cpus 2 --prefix test_runprodigal_H299 " -# "test/data/annotate/genomes/H299_H561.fasta") -# assert q.get() .message.startswith("End annotating test_runprodigal_H299 " -# "from test/data/annotate/genomes/H299_H561.fasta") - - -# def test_run_prodigal_out_doesnt_exist(): -# """ -# Test that when the output directory does not exist, it creates it, and runs prodigal -# with all expected outfiles -# """ -# logger = my_logger("test_run_prodigal_out_doesnt_exist") -# utils.init_logger(LOGFILE_BASE, 0, 'test_run_prodigal_out_doesnt_exist') -# gpath = os.path.join(GEN_PATH, "H299_H561.fasta") -# out_dir = os.path.join(GENEPATH, "H299_H561.fasta-prodigalRes") -# cores_prodigal = 2 -# name = "test_runprodigal_H299" -# force = False -# nbcont = 3 -# arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, None, logger[0]) -# assert afunc.run_prodigal(arguments) -# # Check content of tbl, ffn and faa files -# exp_dir = os.path.join(EXP_DIR, "H299_H561.fasta-short-contig.fna-prodigalRes", -# 
"test_runprodigal_H299") -# out_tbl = os.path.join(out_dir, name + ".tbl") -# out_faa = os.path.join(out_dir, name + ".faa") -# out_ffn = os.path.join(out_dir, name + ".ffn") -# out_gff = os.path.join(out_dir, name + ".gff") -# assert os.path.isfile(out_tbl) -# # For tbl file, check that, at least, the 3 contigs were considered, -# # and that the number of CDS is as expected. -# # Before, we checked that the output -# # was exactly as expected. But it changes with the different versions of prodigal, so -# # we cannot compare the whole file. -# with open(out_tbl, "r") as outt: -# lines = [line.strip() for line in outt.readlines()] -# assert ">Feature H561_S27" in lines -# assert ">Feature H561_S28" in lines -# assert ">Feature H561_S29" in lines -# CDS = 0 -# for line in lines: -# if "CDS" in line: -# CDS += 1 -# assert CDS == 16 -# assert os.path.isfile(out_faa) -# with open(exp_dir + ".faa", "r") as expf, open(out_faa, "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# # Check that faa and ffn files are as expected -# assert os.path.isfile(out_faa) -# tutil.compare_order_content(exp_dir + ".faa", out_faa) -# assert os.path.isfile(out_ffn) -# tutil.compare_order_content(exp_dir + ".ffn", out_ffn) -# q = logger[0] -# assert q.qsize() == 3 -# assert q.get().message.startswith("Start annotating") -# assert q.get().message == ("prodigal command: prodigal " -# "--outdir test/data/annotate/generated_by_unit-tests/" -# "H299_H561.fasta-prodigalRes --cpus 2 --prefix test_runprodigal_H299 " -# "test/data/annotate/genomes/H299_H561.fasta") -# assert q.get().message.startswith("End annotating") - - -# def test_run_prodigal_out_problem_running(): -# """ -# Check that when a problem occurs while trying to run prodigal, run_prodigal returns False, -# and the error message indicating to read in the log why it couldn't run -# """ -# logger = my_logger("test_run_prodigal_out_problem_running") -# utils.init_logger(LOGFILE_BASE, 0, 
'test_run_prodigal_out_problem_running') -# gpath = os.path.join(GEN_PATH, "H299 H561.fasta") -# cores_prodigal = 2 -# name = "test_runprodigal_H299-error" -# force = False -# nbcont = 3 -# logf = os.path.join(GENEPATH, "H299 H561.fasta-prodigal.log") -# arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, None, logger[0]) -# assert not afunc.run_prodigal(arguments) -# q = logger[0] -# assert q.qsize() == 3 -# assert q.get().message.startswith("Start annotating") -# assert q.get().message == ("prodigal command: prodigal " -# "--outdir test/data/annotate/generated_by_unit-tests/" -# "H299 H561.fasta-prodigalRes --cpus 2 " -# "--prefix test_runprodigal_H299-error " -# "test/data/annotate/genomes/H299 H561.fasta") -# assert q.get().message == ("Error while trying to run prodigal on test_runprodigal_H299-error " -# "from test/data/annotate/genomes/H299 H561.fasta") + + +def test_check_prodigal_sevfaa(): + """ + Check that check_prodigal returns false when there is more than 1 faa file, + and an error message + """ + logger = my_logger("test_check_prodigal_sevfaa") + ori_prod_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_nofaa") + name = "prodigal_out_for_test-missfaa" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prod_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prod_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prod_dir, ori_name + ".faa"), + os.path.join(out_dir, name + "2.faa")) + shutil.copyfile(os.path.join(ori_prod_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + logf = os.path.join(GENEPATH, "prodigal.log") + gpath = "path/to/nogenome/original_name.fna" + nbcont = 7 + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "prodigal_out_for_test-missfaa original_name.fna: no or several .faa file(s)" + 
q = logger[0] + assert q.qsize() == 1 + assert q.get().message == msg + + +def test_check_prodigal_noffn(): + """ + Check that check_prodigal returns false when a ffn file is missing, and an error message + """ + logger = my_logger("test_check_prodigal_noffn") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test-missffn" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + logf = os.path.join(GENEPATH, "prodigal.log") + gpath = "path/to/nogenome/original_name.fna" + nbcont = 7 + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "prodigal_out_for_test-missffn original_name.fna: no or several .ffn file" + q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_sevffn(): + """ + Check that check_prodigal returns false when there is more than 1 ffn file, + and an error message + """ + logger = my_logger("test_check_prodigal_sevffn") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test-sevffn" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + "2.ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + logf = os.path.join(GENEPATH, "prodigal.log") + gpath = "path/to/nogenome/original_name.fna" + nbcont = 7 + assert not 
afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "prodigal_out_for_test-sevffn original_name.fna: no or several .ffn file" + q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_nogff(): + """ + Check that check_prodigal returns false when a ffn file is missing, and an error message + """ + logger = my_logger("test_check_prodigal_nogff") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test-missgff" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + logf = os.path.join(GENEPATH, "prodigal.log") + gpath = "path/to/nogenome/original_name.fna" + nbcont = 7 + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "prodigal_out_for_test-missgff original_name.fna: no or several .gff file" + q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_sevgff(): + """ + Check that check_prodigal returns false when there is more than 1 ffn file, + and an error message + """ + logger = my_logger("test_check_prodigal_sevgff") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test-sevgff" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + "2.gff")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, 
name + ".gff")) + logf = os.path.join(GENEPATH, "prodigal.log") + gpath = "path/to/nogenome/original_name.fna" + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "prodigal_out_for_test-sevgff original_name.fna: no or several .gff file" + q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_emptyfaa(): + """ + Check that check_prodigal returns false when there are all expected files, but faa + file is empty + """ + logger = my_logger("test_check_prodigal_ok") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test" + logf = os.path.join(GENEPATH, "prodigal.log") + os.makedirs(out_dir) + open(os.path.join(out_dir, name + ".faa"), "w").close() + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + gpath = "path/to/nogenome/original_name.fna" + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "Genome prodigal_out_for_test (from original_name.fna): At least one of your Prodigal result file is empty." 
+ q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_emptyffn(): + """ + Check that check_prodigal returns false when there are all expected files, but ffn + file is empty + """ + logger = my_logger("test_check_prodigal_ok") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test" + logf = os.path.join(GENEPATH, "prodigal.log") + os.makedirs(out_dir) + open(os.path.join(out_dir, name + ".ffn"), "w").close() + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + gpath = "path/to/nogenome/original_name.fna" + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "Genome prodigal_out_for_test (from original_name.fna): At least one of your Prodigal result file is empty." 
+ q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_emptygff(): + """ + Check that check_prodigal returns false when there are all expected files, but gff + file is empty + """ + logger = my_logger("test_check_prodigal_ok") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test" + logf = os.path.join(GENEPATH, "prodigal.log") + os.makedirs(out_dir) + open(os.path.join(out_dir, name + ".gff"), "w").close() + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + gpath = "path/to/nogenome/original_name.fna" + assert not afunc.check_prodigal(gpath, name, out_dir, logger[1]) + msg = "Genome prodigal_out_for_test (from original_name.fna): At least one of your Prodigal result file is empty." 
+ q = logger[0] + assert q.qsize() == 1 + assert msg in q.get().message + + +def test_check_prodigal_ok(): + """ + Check that everything is ok with prodigal results (tbl, faa and ffn files exist, + and number of CDS, CRISPR and genes correspond between them) + """ + logger = my_logger("test_check_prodigal_ok") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + out_dir = os.path.join(GENEPATH, "out_test_noffn") + name = "prodigal_out_for_test" + logf = os.path.join(GENEPATH, "prodigal.log") + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + gpath = "path/to/nogenome/original_name.fna" + assert afunc.check_prodigal(gpath, name, out_dir, logger[1]) + + +def test_run_prodigal_out_exists_ok(): + """ + Test that when the output directory already exists, and files inside are OK, + run_prodigal returns True, with a warning message indicating that prodigal did not rerun. 
+ """ + logger = my_logger("test_run_prodigal_out_exists_ok") + utils.init_logger(LOGFILE_BASE, 0, 'prodigal_out_exists_ok') + gpath = "path/to/nogenome/original_name.fna" + cores_prodigal = 1 + name = "prodigal.outtest.ok" + force = False + nbcont = 7 + arguments = (gpath, TEST_DIR, cores_prodigal, name, force, nbcont, None, logger[0]) + assert afunc.run_prodigal(arguments) + + q = logger[0] + assert q.qsize() == 4 + # start annotating : + assert q.get().message.startswith("Start annotating prodigal.outtest.ok (from " + "path/to/nogenome/original_name.fna sequence) with Prodigal") + # # warning prodigal results folder exists: + assert q.get().message.startswith("Prodigal results folder test/data/annotate/test_files/" + "original_name.fna-prodigalRes already exists.") + # Results in result folder are ok + assert q.get().message.startswith("Prodigal did not run again. Formatting step will use " + "already generated results of Prodigal in " + "test/data/annotate/test_files/" + "original_name.fna-prodigalRes.") + # End annotation: + assert q.get().message.startswith("End annotating") + + +def test_run_prodigal_out_exists_error(): + """ + Test that when the output directory already exists, and 1 file is missing, + run_prodigal returns False, and writes the warning message saying that prodigal did not + rerun, + the warning message for the missing file(s). 
+ """ + logger = my_logger("test_run_prodigal_out_exists_error") + utils.init_logger(LOGFILE_BASE, 0, 'prodigal_out_error') + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prodigalRes") + ori_name = "prodigal.outtest.ok" + new_prok_dir = os.path.join(GENEPATH, "original_name-error-prodigalRes") + name = "prodigal_out_for_test-wrongCDS" + os.makedirs(new_prok_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(new_prok_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(new_prok_dir, name + ".faa")) + open(os.path.join(new_prok_dir, name + ".gff"), "w").close() + gpath = "path/to/nogenome/original_name-error" + cores_prodigal = 1 + force = False + nbcont = 7 + arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, None, logger[0]) + assert not afunc.run_prodigal(arguments) + q = logger[0] + assert q.qsize() == 4 + # start annotating : + assert q.get().message.startswith("Start annotating") + # warning prodigal results folder exists: + assert q.get().message == ("Prodigal results folder test/data/annotate/" + "generated_by_unit-tests/" + "original_name-error-prodigalRes already exists.") + # error, empty gff + msg = ("Genome prodigal_out_for_test-wrongCDS (from original_name-error): " + "At least one of your Prodigal result file is empty.") + assert q.get().message == msg + # warning, files in outdir are not as expected + assert q.get().message.startswith("Problems in the files contained in your already existing " + "output dir (test/data/annotate/generated_by_unit-tests/" + "original_name-error-prodigalRes") + + +def test_run_prodigal_out_exists_force(): + """ + Test that when the output directory already exists with wrong files, but force is on, + prodigal is rerun and outputs the right files + """ + logger = my_logger("test_run_prodigal_out_exists_force") + utils.init_logger(LOGFILE_BASE, 0, 'force') + gpath = os.path.join(GEN_PATH, "H299_H561.fasta") + 
out_prokdir = os.path.join(GENEPATH, "H299_H561.fasta-prodigalRes") + name = "test_runprodigal_H299" + # Put empty tbl, faa, ffn files in prodigal output dir, to check that they are overridden + os.makedirs(out_prokdir) + open(os.path.join(out_prokdir, name + ".gff"), "w").close() + open(os.path.join(out_prokdir, name + ".faa"), "w").close() + open(os.path.join(out_prokdir, name + ".ffn"), "w").close() + cores_prodigal = 2 + force = True + nbcont = 3 + arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, True, logger[0]) + assert afunc.run_prodigal(arguments) + # As we used 'force', tbl, faa and ffn files, which were empty, must have been replaced + # by the prodigal output + exp_dir = os.path.join(EXP_DIR, "H299_H561.fasta-prodigalRes", + "ESCO.1015.00001") + out_gff = os.path.join(out_prokdir, name + ".gff") + out_faa = os.path.join(out_prokdir, name + ".faa") + out_ffn = os.path.join(out_prokdir, name + ".ffn") + # Check that faa and ffn files are as expected + assert os.path.isfile(out_faa) + tutil.compare_order_content(exp_dir + ".faa", out_faa) + assert os.path.isfile(out_ffn) + tutil.compare_order_content(exp_dir + ".ffn", out_ffn) + q = logger[0] + # assert q.qsize() == 3 + assert q.get() .message.startswith("Start annotating test_runprodigal_H299 (from test/data/" + "annotate/genomes/H299_H561.fasta sequence) " + "with Prodigal") + assert q.get() .message.startswith("Prodigal results folder already exists, but is " + "removed because --force option was used") + assert q.get().message.startswith("Prodigal command: prodigal -i test/data/annotate/genomes/" + "H299_H561.fasta -d test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.ffn -a test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.faa -f gff -o test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.gff -q -p meta") + assert q.get() 
.message.startswith("End annotating test_runprodigal_H299 " + "(from test/data/annotate/genomes/H299_H561.fasta)") + + +def test_run_prodigal_out_doesnt_exist(): + """ + Test that when the output directory does not exist, it creates it, and runs prodigal + with all expected outfiles + """ + logger = my_logger("test_run_prodigal_out_doesnt_exist") + utils.init_logger(LOGFILE_BASE, 0, 'test_run_prodigal_out_doesnt_exist') + gpath = os.path.join(GEN_PATH, "H299_H561.fasta") + out_dir = os.path.join(GENEPATH, "H299_H561.fasta-prodigalRes") + cores_prodigal = 2 + name = "test_runprodigal_H299" + force = False + nbcont = 3 + arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, True, logger[0]) + assert afunc.run_prodigal(arguments) + # Check content of tbl, ffn and faa files + exp_dir = os.path.join(EXP_DIR, "H299_H561.fasta-prodigalRes", + "ESCO.1015.00001") + out_faa = os.path.join(out_dir, name + ".faa") + out_ffn = os.path.join(out_dir, name + ".ffn") + out_gff = os.path.join(out_dir, name + ".gff") + # Check that faa and ffn files are as expected + assert os.path.isfile(out_faa) + tutil.compare_order_content(exp_dir + ".faa", out_faa) + assert os.path.isfile(out_ffn) + tutil.compare_order_content(exp_dir + ".ffn", out_ffn) + assert os.path.isfile(out_ffn) + tutil.compare_order_content(exp_dir + ".gff", out_gff) + q = logger[0] + assert q.qsize() == 3 + assert q.get().message.startswith("Start annotating") + assert q.get().message == ("Prodigal command: prodigal -i test/data/annotate/genomes/" + "H299_H561.fasta -d test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.ffn -a test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.faa -f gff -o test/data/annotate/" + "generated_by_unit-tests/H299_H561.fasta-prodigalRes/" + "test_runprodigal_H299.gff -q -p meta") + assert q.get().message.startswith("End annotating") + + +def 
test_run_prodigal_out_problem_running(): + """ + Check that when a problem occurs while trying to run prodigal, run_prodigal returns False, + and the error message indicating to read in the log why it couldn't run + """ + logger = my_logger("test_run_prodigal_out_problem_running") + utils.init_logger(LOGFILE_BASE, 0, 'test_run_prodigal_out_problem_running') + gpath = os.path.join(GEN_PATH, "H299_H561bis.fasta") + cores_prodigal = 2 + name = "test_runprodigal_H299-error" + force = False + nbcont = 3 + logf = os.path.join(GENEPATH, "H299_H561bis.fasta-prodigal.log") + arguments = (gpath, GENEPATH, cores_prodigal, name, force, nbcont, False, logger[0]) + assert not afunc.run_prodigal(arguments) + q = logger[0] + assert q.qsize() == 3 + assert q.get().message.startswith("Start annotating") + assert q.get().message.startswith("Prodigal command: prodigal -i test/data/annotate/genomes/" + "H299_H561bis.fasta -d test/data/annotate/" + "generated_by_unit-tests/H299_H561bis.fasta-prodigalRes/" + "test_runprodigal_H299-error.ffn -a test/data/annotate/" + "generated_by_unit-tests/H299_H561bis.fasta-prodigalRes/" + "test_runprodigal_H299-error.faa -f gff -o test/data/annotate/" + "generated_by_unit-tests/H299_H561bis.fasta-prodigalRes/" + "test_runprodigal_H299-error.gff -q") + assert q.get().message.startswith("Error while trying to run prodigal. See test/data/" + "annotate/generated_by_unit-tests/" + "H299_H561bis.fasta-prodigal.log.err. 
" + "If it mentions that your genome sequences " + "are too small, add '--small' option to your " + "PanACoTA command.") + diff --git a/test/test_unit/test_annotate/test_annotation_functions-prokka.py b/test/test_unit/test_annotate/test_annotation_functions-prokka.py index 6abac82d74a1792088e6cf577d5e378b5a334e73..e1aa2635855231743e7c20614ea170dd9e8dce45 100644 --- a/test/test_unit/test_annotate/test_annotation_functions-prokka.py +++ b/test/test_unit/test_annotate/test_annotation_functions-prokka.py @@ -9,10 +9,11 @@ import pytest import os import logging import shutil +import multiprocessing import test.test_unit.utilities_for_tests as tutil import PanACoTA.utils as utils -import PanACoTA.annotate_module.annotation_functions as afunc +from PanACoTA.annotate_module import annotation_functions as afunc # Define variables used by several tests @@ -39,14 +40,19 @@ def setup_teardown_module(): - remove all log files - remove directory with generated results """ - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield for f in LOGFILES: if os.path.exists(f): os.remove(f) - shutil.rmtree(GENEPATH) + shutil.rmtree(GENEPATH, ignore_errors=True) print("teardown") @@ -55,7 +61,6 @@ def my_logger(name): """ logger given to function called by a subprocess """ - import multiprocessing m = multiprocessing.Manager() q = m.Queue() qh = logging.handlers.QueueHandler(q) @@ -72,10 +77,10 @@ def test_check_prokka_no_outdir(): Test that prokka returns the right error message when output directory does not exist """ logger = my_logger("test_check_prokka_no_outdir") - outdir = "toto" + outdir = "outdir" name = "prokka_out_for_test" logf = "prokka.log" - gpath = "path/to/nogenome/original_name.fna" + gpath = os.path.join(GENEPATH, "toto.fna") nbcont = 7 assert not afunc.check_prokka(outdir, logf, name, gpath, nbcont, logger[1]) q = logger[0] @@ -84,6 +89,67 @@ 
def test_check_prokka_no_outdir(): assert q.get().message == msg +def test_check_prokka_nofna(): + """ + Check that check_prokka returns false when a tbl file is missing, and an error message + """ + logger = my_logger("test_check_prokka_nofna") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prokkaRes") + ori_name = "prokka_out_for_test" + out_dir = os.path.join(GENEPATH, "out_test_nofna") + name = "prokka_out_for_test-missfna" + gpath = "path/to/nogenome/original_name-error.fna" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), + os.path.join(out_dir, name + ".tbl")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + logf = os.path.join(GENEPATH, "prokka.log") + nbcont = 7 + assert not afunc.check_prokka(out_dir, logf, name, gpath, nbcont, logger[1]) + msg = "prokka_out_for_test-missfna original_name-error.fna: no .fna file" + q = logger[0] + assert q.qsize() == 1 + assert q.get().message == msg + + +def test_check_prokka_sevfna(): + """ + Check that check_prokka returns false when there is more than 1 tbl file, + and an error message + """ + logger = my_logger("test_check_prokka_sevfna") + ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prokkaRes") + ori_name = "prokka_out_for_test" + out_dir = os.path.join(GENEPATH, "out_test_sevfna") + name = "prokka_out_for_test-sevfna" + gpath = "path/to/nogenome/original_name-error.fna" + os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), + os.path.join(out_dir, name + ".tbl")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), + os.path.join(out_dir, name + ".faa")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), + os.path.join(out_dir, 
name + ".ffn")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + "2.fna")) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), + os.path.join(out_dir, name + ".gff")) + logf = os.path.join(GENEPATH, "prokka.log") + nbcont = 7 + assert not afunc.check_prokka(out_dir, logf, name, gpath, nbcont, logger[1]) + msg = "prokka_out_for_test-sevfna original_name-error.fna: several .fna files" + q = logger[0] + assert q.qsize() == 1 + assert q.get().message == msg + + def test_check_prokka_notbl(): """ Check that check_prokka returns false when a tbl file is missing, and an error message @@ -95,6 +161,8 @@ def test_check_prokka_notbl(): name = "prokka_out_for_test-misstbl" gpath = "path/to/nogenome/original_name-error.fna" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), os.path.join(out_dir, name + ".faa")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), @@ -122,6 +190,8 @@ def test_check_prokka_sevtbl(): name = "prokka_out_for_test-misstbl" gpath = "path/to/nogenome/original_name-error.fna" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), os.path.join(out_dir, name + ".faa")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), @@ -151,6 +221,8 @@ def test_check_prokka_nofaa(): out_dir = os.path.join(GENEPATH, "out_test_nofaa") name = "prokka_out_for_test-missfaa" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) 
shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), @@ -178,6 +250,8 @@ def test_check_prokka_sevfaa(): out_dir = os.path.join(GENEPATH, "out_test_nofaa") name = "prokka_out_for_test-missfaa" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), @@ -208,6 +282,8 @@ def test_check_prokka_noffn(): out_dir = os.path.join(GENEPATH, "out_test_noffn") name = "prokka_out_for_test-missffn" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -235,6 +311,8 @@ def test_check_prokka_sevffn(): out_dir = os.path.join(GENEPATH, "out_test_noffn") name = "prokka_out_for_test-missffn" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -265,6 +343,8 @@ def test_check_prokka_nogff(): out_dir = os.path.join(GENEPATH, "out_test_noffn") name = "prokka_out_for_test-missgff" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -292,6 +372,8 @@ def test_check_prokka_sevgff(): out_dir = os.path.join(GENEPATH, "out_test_noffn") name = "prokka_out_for_test-sevgff" os.makedirs(out_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + 
".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), os.path.join(out_dir, name + ".tbl")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -343,6 +425,8 @@ def test_check_prokka_wrong_tbl_cds(): os.makedirs(out_dir) name = "prokka_out_for_test-wrongCDS" tblfile = os.path.join(TEST_DIR, name + ".tbl") + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(out_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), os.path.join(out_dir, name + ".ffn")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -357,72 +441,10 @@ def test_check_prokka_wrong_tbl_cds(): assert not afunc.check_prokka(out_dir, logf, name, gpath, nbcont, logger[1]) msg1 = ("prokka_out_for_test-wrongCDS original_name.fna: " "no matching number of proteins between tbl and faa; " - "faa=13; in tbl =12") - msg2 = ("prokka_out_for_test-wrongCDS original_name.fna: " - "no matching number of genes between tbl and ffn; " - "ffn=17; in tbl =14genes 2CRISPR") - q = logger[0] - assert q.qsize() == 2 - assert q.get().message == msg1 - assert q.get().message == msg2 - - -def test_check_prokka_wrong_tbl_crispr(): - """ - Check that check_prokka returns an error message when the number of headers in ffn - file is different from the number of CDS + CRISPR in tbl file (1CRISPR in tbl, 2 in ffn) - """ - logger = my_logger("test_check_prokka_wrong_tbl_crispr") - ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prokkaRes") - ori_name = "prokka_out_for_test" - out_dir = os.path.join(GENEPATH, "res_checkProkkaWrongCRISPR") - os.makedirs(out_dir) - name = "prokka_out_for_test-wrongtblCRISP" - tblfile = os.path.join(TEST_DIR, name + ".tbl") - shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), - os.path.join(out_dir, name + ".ffn")) - shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), - os.path.join(out_dir, name + ".faa")) - 
shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), - os.path.join(out_dir, name + ".gff")) - shutil.copyfile(tblfile, os.path.join(out_dir, name + ".tbl")) - logf = "prokka.log" - gpath = "path/to/nogenome/original_name.fna" - nbcont = 7 - assert not afunc.check_prokka(out_dir, logf, name, gpath, nbcont, logger[1]) - msg = ("prokka_out_for_test-wrongtblCRISP original_name.fna: " - "no matching number of genes between tbl and ffn; " - "ffn=17; in tbl =15genes 1CRISPR") + "faa=14; in tbl =12") q = logger[0] assert q.qsize() == 1 - assert q.get().message == msg - - -def test_check_prokka_tbl_crispr_newversion(): - """ - Check that check_prokka does not return an error message when the number of headers in ffn - file is equal to the number of CDS in tbl file (1CRISPR in tbl, 0 in ffn), but - does not contain the CRISPRs found in tbl - As the new version of prokka (1.12) does not put crisprs in .ffn - """ - logger = my_logger("test_check_prokka_tbl_crispr_newversion") - ori_prok_dir = os.path.join(TEST_DIR, "original_name.fna-prokkaRes") - ori_name = "prokka_out_for_test" - out_dir = os.path.join(GENEPATH, "res_checkProkkaWrongCRISPRnewversion") - os.makedirs(out_dir) - name = "prokka_out_for_test-wrongtblCRISPnewversion" - ffnfile = os.path.join(TEST_DIR, name + ".ffn") - shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".tbl"), - os.path.join(out_dir, name + ".tbl")) - shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), - os.path.join(out_dir, name + ".faa")) - shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".gff"), - os.path.join(out_dir, name + ".gff")) - shutil.copyfile(ffnfile, os.path.join(out_dir, name + ".ffn")) - logf = os.path.join(GENEPATH, "prokka.log") - gpath = "path/to/nogenome/original_name.fna" - nbcont = 6 - assert afunc.check_prokka(out_dir, logf, name, gpath, nbcont, logger[1]) + assert q.get().message == msg1 def test_check_prokka_ok(): @@ -437,6 +459,8 @@ def test_check_prokka_ok(): gpath = 
"path/to/nogenome/original_name.fna" nbcont = 6 assert afunc.check_prokka(outdir, logf, name, gpath, nbcont, logger[1]) + q = logger[0] + assert q.qsize() == 0 def test_run_prokka_out_exists_ok(): @@ -458,8 +482,9 @@ def test_run_prokka_out_exists_ok(): assert q.qsize() == 4 # start annotating : assert q.get().message.startswith("Start annotating") - # # warning prokka results folder exists: - assert q.get().message.startswith("Prokka results folder test/data/annotate/test_files/" + # warning prokka results folder exists: + assert q.get().message.startswith("Prokka results folder test/data/annotate/" + "test_files/" "original_name.fna-prokkaRes already exists.") # Results in result folder are ok assert q.get().message.startswith("Prokka did not run again, formatting step used already " @@ -482,6 +507,8 @@ def test_run_prokka_out_exists_error(): new_prok_dir = os.path.join(GENEPATH, "original_name-error-prokkaRes") name = "prokka_out_for_test-wrongCDS" os.makedirs(new_prok_dir) + shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".fna"), + os.path.join(new_prok_dir, name + ".fna")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".ffn"), os.path.join(new_prok_dir, name + ".ffn")) shutil.copyfile(os.path.join(ori_prok_dir, ori_name + ".faa"), @@ -495,18 +522,18 @@ def test_run_prokka_out_exists_error(): arguments = (gpath, GENEPATH, cores_prokka, name, force, nbcont, None, logger[0]) assert not afunc.run_prokka(arguments) q = logger[0] - # assert q.qsize() == 4 + assert q.qsize() == 4 # start annotating : assert q.get().message.startswith("Start annotating") # warning prokka results folder exists: assert q.get().message == ("Prokka results folder test/data/annotate/generated_by_unit-tests/" "original_name-error-prokkaRes already exists.") # error, no tbl file - msg = "prokka_out_for_test-wrongCDS original_name-error: no .tbl file" - assert q.get().message == msg + assert q.get().message == "prokka_out_for_test-wrongCDS original_name-error: no .tbl file" # 
warning, files in outdir are not as expected assert q.get().message.startswith("Problems in the files contained in your already existing " - "output dir ") + "output dir (test/data/annotate/generated_by_unit-tests/" + "original_name-error-prokkaRes)") def test_run_prokka_out_exists_force(): @@ -544,9 +571,13 @@ def test_run_prokka_out_exists_force(): # we cannot compare the whole file. with open(out_tbl, "r") as outt: lines = [line.strip() for line in outt.readlines()] - assert ">Feature H561_S27" in lines - assert ">Feature H561_S28" in lines - assert ">Feature H561_S29" in lines + # Check that there are 3 contigs + feature = 0 + for line in lines: + if 'Feature' in line: + feature += 1 + assert feature == 3 + # Check that there are 16 CDS CDS = 0 for line in lines: if "CDS" in line: @@ -554,11 +585,11 @@ def test_run_prokka_out_exists_force(): assert CDS == 16 # Check that faa and ffn files are as expected assert os.path.isfile(out_faa) - tutil.compare_order_content(exp_dir + ".faa", out_faa) + assert tutil.compare_order_content(exp_dir + ".faa", out_faa) assert os.path.isfile(out_ffn) - tutil.compare_order_content(exp_dir + ".ffn", out_ffn) + assert tutil.compare_order_content(exp_dir + ".ffn", out_ffn) q = logger[0] - # assert q.qsize() == 3 + assert q.qsize() == 4 assert q.get() .message.startswith("Start annotating test_runprokka_H299 from test/data/" "annotate/genomes/H299_H561.fasta with Prokka") assert q.get() .message == ("Prokka results folder already exists, but removed because " @@ -566,12 +597,12 @@ def test_run_prokka_out_exists_force(): assert q.get().message == ("Prokka command: prokka " "--outdir test/data/annotate/generated_by_unit-tests/" "H299_H561.fasta-prokkaRes --cpus 2 --prefix test_runprokka_H299 " - "test/data/annotate/genomes/H299_H561.fasta") + "--centre prokka test/data/annotate/genomes/H299_H561.fasta") assert q.get() .message.startswith("End annotating test_runprokka_H299 " "from test/data/annotate/genomes/H299_H561.fasta") -def 
test_run_prokka_out_doesnt_exist(): +def test_run_prokka_out_doesnt_exist_ok(): """ Test that when the output directory does not exist, it creates it, and runs prokka with all expected outfiles @@ -601,30 +632,30 @@ def test_run_prokka_out_doesnt_exist(): # we cannot compare the whole file. with open(out_tbl, "r") as outt: lines = [line.strip() for line in outt.readlines()] - assert ">Feature H561_S27" in lines - assert ">Feature H561_S28" in lines - assert ">Feature H561_S29" in lines + # Check that there are 3 contigs + feature = 0 + for line in lines: + if 'Feature' in line: + feature += 1 + assert feature == 3 + # Check that there are 16 CDS CDS = 0 for line in lines: if "CDS" in line: CDS += 1 assert CDS == 16 - assert os.path.isfile(out_faa) - with open(exp_dir + ".faa", "r") as expf, open(out_faa, "r") as outf: - for line_exp, line_out in zip(expf, outf): - assert line_exp == line_out # Check that faa and ffn files are as expected assert os.path.isfile(out_faa) - tutil.compare_order_content(exp_dir + ".faa", out_faa) + assert tutil.compare_order_content(exp_dir + ".faa", out_faa) assert os.path.isfile(out_ffn) - tutil.compare_order_content(exp_dir + ".ffn", out_ffn) + assert tutil.compare_order_content(exp_dir + ".ffn", out_ffn) q = logger[0] assert q.qsize() == 3 assert q.get().message.startswith("Start annotating") assert q.get().message == ("Prokka command: prokka " "--outdir test/data/annotate/generated_by_unit-tests/" "H299_H561.fasta-prokkaRes --cpus 2 --prefix test_runprokka_H299 " - "test/data/annotate/genomes/H299_H561.fasta") + "--centre prokka test/data/annotate/genomes/H299_H561.fasta") assert q.get().message.startswith("End annotating") @@ -635,12 +666,12 @@ def test_run_prokka_out_problem_running(): """ logger = my_logger("test_run_prokka_out_problem_running") utils.init_logger(LOGFILE_BASE, 0, 'test_run_prokka_out_problem_running') - gpath = os.path.join(GEN_PATH, "H299 H561.fasta") + gpath = os.path.join(GEN_PATH, "H299_H561bis.fasta") 
cores_prokka = 2 name = "test_runprokka_H299-error" force = False nbcont = 3 - logf = os.path.join(GENEPATH, "H299 H561.fasta-prokka.log") + logf = os.path.join(GENEPATH, "H299_H561.fasta-prokka.log") arguments = (gpath, GENEPATH, cores_prokka, name, force, nbcont, None, logger[0]) assert not afunc.run_prokka(arguments) q = logger[0] @@ -648,8 +679,8 @@ def test_run_prokka_out_problem_running(): assert q.get().message.startswith("Start annotating") assert q.get().message == ("Prokka command: prokka " "--outdir test/data/annotate/generated_by_unit-tests/" - "H299 H561.fasta-prokkaRes --cpus 2 " + "H299_H561bis.fasta-prokkaRes --cpus 2 " "--prefix test_runprokka_H299-error " - "test/data/annotate/genomes/H299 H561.fasta") + "--centre prokka test/data/annotate/genomes/H299_H561bis.fasta") assert q.get().message == ("Error while trying to run prokka on test_runprokka_H299-error " - "from test/data/annotate/genomes/H299 H561.fasta") + "from test/data/annotate/genomes/H299_H561bis.fasta") diff --git a/test/test_unit/test_annotate/test_annotation_general.py b/test/test_unit/test_annotate/test_annotation_general.py index 16042264cd46eeb5d4527622d7ee6b4eb8c5a299..9fc5612945b0dd56f44c8ac0e0a5593e81294dfb 100644 --- a/test/test_unit/test_annotate/test_annotation_general.py +++ b/test/test_unit/test_annotate/test_annotation_general.py @@ -37,15 +37,20 @@ def setup_teardown_module(): - remove all log files - remove directory with generated results """ - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield - + for f in LOGFILES: if os.path.exists(f): os.remove(f) - shutil.rmtree(GENEPATH) + shutil.rmtree(GENEPATH, ignore_errors=True) print("teardown") @@ -81,11 +86,10 @@ def test_count_tbl(): nbcont, nbCDS, nbGene, nbCRISPR """ tblfile = os.path.join(TEST_DIR, "original_name.fna-prokkaRes", "prokka_out_for_test.tbl") - ncont, ncds, ngene, ncris = 
afunc.count_tbl(tblfile) + ncont, ncds, ngene = afunc.count_tbl(tblfile) assert ncont == 6 - assert ncds == 13 - assert ngene == 15 - assert ncris == 2 + assert ncds == 14 + assert ngene == 16 def test_run_all_1by1(): @@ -127,6 +131,8 @@ def test_run_all_1by1(): message_end_annot2 = ("End annotating test_runall_1by1_2 from test/data/annotate/genomes/" "A_H738.fasta.") qget = q.get().message + # Check logs. Given that it is executed in parallel, we cannot know in which order messages + # will appear assert qget == message_start_annot1 or message_start_annot2 if qget == message_start_annot1: # Ending annotation of first genome (same genome as started because running 1by1) @@ -214,7 +220,8 @@ def test_run_all_parallel_less_threads(): Genomes H299 and A_H738 should run well, but genomes genome* have problems (no CDS found), so check_prokka should return false. """ - utils.init_logger(LOGFILE_BASE, 0, 'test_run_all_parallel_less_threads') + logger = my_logger("test_run_all_parallel_more_threads") + utils.init_logger(LOGFILE_BASE, 0, 'test_run_all_parallel_more_threads') # genomes = {genome: [name, gpath, size, nbcont, l90]} gnames = ["H299_H561.fasta", "A_H738.fasta", "genome1.fasta", "genome2.fasta", "genome3.fasta"] gpaths = [os.path.join(GEN_PATH, name) for name in gnames] @@ -232,3 +239,14 @@ def test_run_all_parallel_less_threads(): assert not final[gnames[2]] assert not final[gnames[3]] assert not final[gnames[4]] + q = logger[0] + # Check size of logs + # -> starting log -> 1 log + # -> for each genome ok (2 first ones): start annotate, prokka cmd, end annotate -> 6 logs + # -> for each genome not ok (3 others): + # start annotate, prokka cmd, problem, end annotate -> 12 logs + assert q.qsize() == 19 + # Check at least 1st log + assert q.get().message == "Annotating all genomes with prokka" + + diff --git a/test/test_unit/test_annotate/test_format_func.py b/test/test_unit/test_annotate/test_format_func.py index 
2f6258d1de7b3f6eb025ad0e67276a3988d50027..7f652f5e1d577480146825039d6729d95b20444c 100755 --- a/test/test_unit/test_annotate/test_format_func.py +++ b/test/test_unit/test_annotate/test_format_func.py @@ -35,16 +35,19 @@ def setup_teardown_module(): - remove directory with generated results """ # utils.init_logger(LOGFILE_BASE, 0, 'test_fastme', verbose=1) - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield - # for f in LOGFILES: - # if os.path.exists(f): - # os.remove(f) shutil.rmtree(GENEPATH) print("teardown") + # Define variables and functions used by several tests def my_logger(): """ @@ -66,13 +69,12 @@ def my_logger(): def test_write_gene(): """ Test that lstinfo line is written as expected when writing info for - a gene (CDS). Also check that crispr number is not changed + a gene (CDS). """ gtype = "CDS" locus_num = "5621221" gene_name = "abc" product = "new product" - crispr_num = 1 cont_loc = "i" genome = "ESCO.0216.00005" cont_num = 15 @@ -84,11 +86,10 @@ def test_write_gene(): end = str(656) lstfile = os.path.join(GENEPATH, "toto.lst") lstopenfile = open(lstfile, "w") - crispres, lst_line = ffunc.write_gene(gtype, locus_num, gene_name, product, crispr_num, - cont_loc, genome, cont_num, ecnum, inf2, db_xref, strand, - start, end, lstopenfile) + lst_line = ffunc.write_gene(gtype, locus_num, gene_name, product, + cont_loc, genome, cont_num, ecnum, inf2, db_xref, strand, + start, end, lstopenfile) lstopenfile.close() - assert crispres == crispr_num assert lst_line == ("154\t656\tC\tCDS\tESCO.0216.00005.0015i_5621221\tabc\t| new product " "| 454.12.5 | more information... dfd _ with _ pipe_characters... 
| " "mydb_pipe") @@ -96,39 +97,6 @@ def test_write_gene(): assert tutil.compare_order_content(exp_file, lstfile) -def test_write_crispr(): - """ - Test that lstinfo line is written as expected when writing info for CRISPR, - and that crispr num increased by 1 - """ - gtype = "repeat_region" - locus_num = "465" - gene_name = "NA" - product = "NA" - crispr_num = 1 - cont_loc = "b" - genome = "ESCO.0216.00005" - cont_num = 15 - ecnum = "NA" - inf2 = "more information... dfd | with | pipe|characters..." - db_xref = "mydb|pipe" - strand = "D" - start = str(154) - end = str(656) - lstfile = os.path.join(GENEPATH, "toto.lst") - lstopenfile = open(lstfile, "w") - crispres, lstline = ffunc.write_gene(gtype, locus_num, gene_name, product, crispr_num, - cont_loc, genome, cont_num, ecnum, inf2, db_xref, strand, - start, end, lstopenfile) - lstopenfile.close() - exp_file = os.path.join(EXP_ANNOTE, "res_test_write_geneCRISPR.lst") - assert crispres == 2 - assert lstline == ("154\t656\tD\tCRISPR\tESCO.0216.00005.0015b_CRISPR1\tcrispr\t| " - "crispr-array | NA | more information... dfd _ with _ pipe_characters... | " - "mydb_pipe") - assert tutil.compare_order_content(exp_file, lstfile) - - def test_contig_name(): """ test that when we give a genome name and a contig number, it returns the expected fasta header @@ -173,1036 +141,326 @@ def test_write_header_gene_no_name(): outfile.close() -def test_write_header_crispr(): +def test_handle_genome_badprok(): """ - From a given line of lstinfo file, giving info for a CRISPR check that the header - line of the protein and gene files are generated as expected. 
+ Test that when we try to format a genome which was annotated by prokka, but original genome + is empty -> cannot format genome -> returns False associated with genome name """ - outfile = StringIO() - lstline = ("296902\t2968265\tC\tCRISPR\ttest.0417.00002.0003b_CRISPR1\tcrispr\t| " - "crispr-array | NA | NA") - ffunc.write_header(lstline, outfile) - res = outfile.getvalue() - exp = ">test.0417.00002.0003b_CRISPR1 2671364 crispr | crispr-array | NA | NA\n" - assert res == exp - outfile.close() - - -# def test_handle_genome_nores(): -# """ -# Test that when we try to format a genome which is not in results, -# it returns a tuple with "no_res" and the genome name. -# """ -# results = {"abcd.fasta": True} -# prodigal_only = False -# args = ("toto.fasta", "name", "genome/path", "prokka/path", "lst/dir", "prot/dir", -# "gene/dir", "rep/dir", "gff/dir", prodigal_only, my_logger()[0]) -# res = ffunc.handle_genome(args) -# assert res == ("no_res", "toto.fasta") - - -# def test_handle_genome_badprok(): -# """ -# Test that when we try to format a genome which is in results, but with False, -# it returns a tuple with "bad_prokka" and the genome name. -# """ -# results = {"abcd.fasta": True, "toto.fasta": False} -# args = ("toto.fasta", "name", "genome/path", "prokka/path", "lst/dir", "prot/dir", -# "gene/dir", "rep/dir", "gff/dir", False, my_logger()[0]) -# res = ffunc.handle_genome(args) -# assert res == ("bad_prokka", "toto.fasta") - - -# def test_handle_genome_formatok(): -# """ -# Test that when we try to format a genome which is in results, with True, -# it returns a tuple with "True" and the genome name. 
-# """ -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-split5N.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# results = {"B2_A3_5.fasta-split5N.fna-short-contig.fna": True, "toto.fasta": False} -# args = ("B2_A3_5.fasta-split5N.fna-short-contig.fna", name, gpath, prok_path, -# lst_dir, prot_dir, -# gene_dir, rep_dir, gff_dir, results, my_logger()[0]) -# res = ffunc.handle_genome(args) -# assert res == (True, "B2_A3_5.fasta-split5N.fna-short-contig.fna") -# os.remove(os.path.join(lst_dir, name + ".prt")) -# os.remove(os.path.join(lst_dir, name + ".fna")) -# os.remove(os.path.join(lst_dir, name + ".gen")) -# os.remove(os.path.join(lst_dir, name + ".lst")) -# os.remove(os.path.join(lst_dir, name + ".gff")) - - -# def test_handle_genome_formaterror(): -# """ -# Test that when we try to format a genome which is in results, but with False, -# it returns a tuple with "bad_prokka" and the genome name. 
-# """ -# logger = my_logger() -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-problems.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# tbl_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# tblout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# shutil.copyfile(tbl_init, tblout) -# gff_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# gffout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# shutil.copyfile(gff_init, gffout) -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# results = {"B2_A3_5.fasta-problems.fna-short-contig.fna": True, "toto.fasta": False} -# args = ("B2_A3_5.fasta-problems.fna-short-contig.fna", name, gpath, -# prok_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir, results, logger[0]) -# res = ffunc.handle_genome(args) -# assert res == (False, "B2_A3_5.fasta-problems.fna-short-contig.fna") -# msg = ("Unknown header format >EPKOMDHM_i00002 hypothetical protein in " -# "test/data/annotate/exp_files/B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes/" -# "test.0417.00002.ffn.\n" -# "Gen file will not be created.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg -# # remove tblout which was copied for this test -# assert not os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# os.remove(tblout) -# os.remove(gffout) - - -# def 
test_tbl_to_lst_new_name(): -# """ -# Check that generated lstinfo file is as expected, when the genome name has changed between -# the one given to prokka, and the name given now. -# The test tblfile contains the following aspects: -# - gene in D strand (start < end) -# - gene in C strand (start > end) -# - CDS features (some with all info = ECnumber, gene name, product etc. ; -# some with missing info) -# - tRNA type -# - repeat_region type (*2) -# - contigs with more than 2 genes -# - contig with only 2 genes (both 'b' loc) -# - contig with 1 gene ('b' loc) -# - contig without gene (should be skipped) -# """ -# tblfile = os.path.join("test", "data", "annotate", "test_files", "original_name.fna-prokkaRes", -# "prokka_out_for_test.tbl") -# lstfile = os.path.join("test", "data", "annotate", "test_tbl2lstNewName.lst") -# exp_lst = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst-newName.lst") -# name = "test.0417.00010" -# assert not ffunc.tbl2lst(tblfile, lstfile, name) -# with open(exp_lst, "r") as expf, open(lstfile, "r") as lstf: -# for line_exp, line_out in zip(expf, lstf): -# assert line_exp == line_out -# os.remove(lstfile) - - - - - - - -# def test_create_prt_wrong_header_sep(): -# """ -# Test that, when creating prt file from faa and lst, if a header of faa file is -# not in the right format (protein name and number are not separated by '_'), -# it writes an error, erases prt file, and returns False. -# """ -# logger = my_logger() -# faaseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-wrongHeaderSep.faa") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_prt-wrongHeadSep.prt") -# assert not ffunc.create_prt(faaseq, lstfile, prtseq, logger[1]) -# assert not os.path.isfile(prtseq) -# msg = ("Unknown header format >JGIKIPIJ00008 in test/data/annotate/test_files/" -# "prokka_out_for_test-wrongHeaderSep.faa. 
Error: invalid literal for int() " -# "with base 10: '>JGIKIPIJ00008'\nPrt file not created from " -# "test/data/annotate/test_files/prokka_out_for_test-wrongHeaderSep.faa.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_prt_wrong_header_int(): -# """ -# Test that, when creating prt file from faa and lst, if a header of faa file is -# not in the right format (protein name and number are separated by '_', but protein num -# contains a letter), it writes an error, erases prt file, and returns False. -# """ -# logger = my_logger() -# faaseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-wrongHeaderInt.faa") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_prt-wrongHeadInt.prt") -# assert not ffunc.create_prt(faaseq, lstfile, prtseq, logger[1]) -# assert not os.path.isfile(prtseq) -# msg = ("Unknown header format >JGIKIPIJ_d0008 in test/data/annotate/test_files/" -# "prokka_out_for_test-wrongHeaderInt.faa. Error: invalid literal for int() " -# "with base 10: 'd0008'\nPrt file not created from " -# "test/data/annotate/test_files/prokka_out_for_test-wrongHeaderInt.faa.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_prt_miss_lst(): -# """ -# Test that, when creating prt file from faa and lst, if a protein of faa file is not present in -# the lst file, it writes an error, removes the prt file, and returns False. 
-# """ -# logger = my_logger() -# faaseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-supHeader.faa") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_prt-missLst.prt") -# assert not ffunc.create_prt(faaseq, lstfile, prtseq, logger[1]) -# assert not os.path.isfile(prtseq) -# msg = ("Missing info for protein >sup-prot_00012 in " -# "test/data/annotate/exp_files/res_tbl2lst.lst. If it is " -# "actually present in the lst file, check that proteins are ordered by " -# "increasing number in both lst and faa files.\n" -# "Prt file not created from test/data/annotate/test_files/" -# "prokka_out_for_test-supHeader.faa.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_prt_wrong_order(): -# """ -# Test that, when creating prt file from faa and lst, if a protein of faa file is not in -# increasing protein number, so that it does not correspond to the protein in the lstinfo file, -# it writes an error, removes the prt file, and returns False. -# """ -# logger = my_logger() -# faaseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-wrongOrder.faa") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_prt-wrongOrder.prt") -# assert not ffunc.create_prt(faaseq, lstfile, prtseq, logger[1]) -# assert not os.path.isfile(prtseq) -# msg = ("Missing info for protein >appears_after_13_00011 in " -# "test/data/annotate/exp_files/res_tbl2lst.lst. 
If it is " -# "actually present in the lst file, check that proteins are ordered by " -# "increasing number in both lst and faa files.\n" -# "Prt file not created from test/data/annotate/test_files/" -# "prokka_out_for_test-wrongOrder.faa.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_prt_ok(): -# """ -# Test that when everything is ok in both faa and lst files, the prt file is -# created as expected. -# """ -# logger = my_logger() -# faaseq = os.path.join("test", "data", "annotate", "test_files", "original_name.fna-prokkaRes", -# "prokka_out_for_test.faa") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_prt.prt") -# assert ffunc.create_prt(faaseq, lstfile, prtseq, logger[1]) -# exp_file = os.path.join("test", "data", "annotate", "exp_files", "res_create_prt.faa") -# with open(exp_file, "r") as expf, open(prtseq, "r") as prtf: -# for line_exp, line_out in zip(expf, prtf): -# assert line_exp == line_out -# os.remove(prtseq) - - -# def test_create_gen_sup_crispr(): -# """ -# Test that when there is a CRISPR in the ffn file, but not in lstinfo, -# it generates an error, because the CRISPR ID does not correspond to the gene ID in lstinfo. -# It should return False, write an error message, and remove the .gen file. -# Moreover, the CRISPR ID is not in the same format as a gene ID, so the error should -# be on the format. 
-# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-supCRISPR.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_supCRISPR.gen") -# assert not ffunc.create_gen(ffnseq, lstfile, genseq, logger[1]) -# assert not os.path.isfile(genseq) -# msg = ("Unknown header format >prokka_out_for_test in test/data/annotate/test_files/" -# "prokka_out_for_test-supCRISPR.ffn.\nGen file will not be created.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_sup_gene(): -# """ -# Test that, when creating gen file from ffn and lst, if a gene of ffn file is not present in -# the lst file, it writes an error, removes the gen file, and returns False. -# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-supGene.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# prtseq = os.path.join("test", "data", "annotate", "test_create_gen-supgene.prt") -# assert not ffunc.create_gen(ffnseq, lstfile, prtseq, logger[1]) -# assert not os.path.isfile(prtseq) -# msg = ("Missing info for gene >sup_gene_00012 in test/data/annotate/exp_files/" -# "res_tbl2lst.lst. If it is actually present " -# "in the lst file, check that genes are ordered by increasing " -# "number in both lst and ffn files.\nGen file not created" -# " from test/data/annotate/test_files/prokka_out_for_test-supGene.ffn.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_miss_crispr(): -# """ -# Test for situation where there are 2 CRISPRs in the lstinfo file, the first one -# is not in the ffn file, while the second one is in the ffn file. 
-# It should return an error message about CRISPR number not corresponding, as -# the first CRISPR found in ffn (CRISPR 1) corresponds to CRISPR2 in lstinfo file. -# Gene file should be removed, and the function should return False -# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-missCRISPR.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_missCRISPR.gen") -# assert not ffunc.create_gen(ffnseq, lstfile, genseq, logger[1]) -# assert not os.path.isfile(genseq) -# msg = ("Problem with CRISPR numbers in test/data/annotate/exp_files/res_tbl2lst.lst. " -# "CRISPR >prokka_out_for_test in ffn is CRISPR num 1, whereas it is annotated " -# "as CRISPR num 2 in lst file.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_no_crispr_ffn(): -# """ -# Test that when the there is a CRISPR in the lst file, but not in the ffn file, -# everything goes well, as in some versions of prokka (1.12)n CRISPRs are not in ffn while -# they are specified in lst. Function should return True, and gene file created. 
-# """ -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-noCRISPRffn.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_noCRISPRffn.gen") -# assert ffunc.create_gen(ffnseq, lstfile, genseq, my_logger()[1]) -# assert os.path.isfile(genseq) -# exp_file = os.path.join("test", "data", "annotate", "exp_files", -# "res_create_gen_noCRISPRffn.gen") -# with open(exp_file, "r") as expf, open(genseq, "r") as prtf: -# for line_exp, line_out in zip(expf, prtf): -# assert line_exp == line_out -# os.remove(genseq) - - -# def test_create_gen_wrong_header_sep(): -# """ -# Test that, when creating gen file from ffn and lst, if a header of ffn file is -# not in the right format (gene name and number are not separated by '_'), -# it writes an error, erases gen file, and returns False. -# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-wrongFormat.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_wrongHeadSep.gen") -# assert not ffunc.create_gen(ffnseq, lstfile, genseq, logger[1]) -# assert not os.path.isfile(genseq) -# msg = ("Unknown header format >JGIKIPIJ-00005 in test/data/annotate/test_files/" -# "prokka_out_for_test-wrongFormat.ffn.\n" -# "Gen file will not be created.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_wrong_header_int(): -# """ -# Test that, when creating gen file from ffn and lst, if a header of ffn file is -# not in the right format (gene name and number are separated by '_', but gene num -# contains a letter), it writes an error, erases gen file, and returns False. 
-# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", -# "prokka_out_for_test-wrongInt.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_wrongHeadInt.gen") -# assert not ffunc.create_gen(ffnseq, lstfile, genseq, logger[1]) -# assert not os.path.isfile(genseq) -# msg = ("Unknown header format >JGIKIPIJ_a00005 in test/data/annotate/test_files/" -# "prokka_out_for_test-wrongInt.ffn.\n" -# "Gen file will not be created.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_wrong_lst_int(): -# """ -# Test that, when creating gen file from ffn and lst, if a gene name in lst file is -# not in the right format (gene name and number are separated by '_', but gene num -# contains a letter), it writes an error, erases gen file, and returns False. -# Because the gene name in ffn won't be found in lst (a it contains an error in lst). -# """ -# logger = my_logger() -# ffnseq = os.path.join("test", "data", "annotate", "test_files", "original_name.fna-prokkaRes", -# "prokka_out_for_test.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst-wrongGeneName.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen_wrongLstHeadInt.gen") -# assert not ffunc.create_gen(ffnseq, lstfile, genseq, logger[1]) -# assert not os.path.isfile(genseq) -# msg = ("Missing info for gene >JGIKIPIJ_00009 in test/data/annotate/exp_files/" -# "res_tbl2lst-wrongGeneName.lst. 
If it is actually present " -# "in the lst file, check that genes are ordered by increasing " -# "number in both lst and ffn files.\nGen file not created " -# "from test/data/annotate/test_files/original_name.fna-prokkaRes/" -# "prokka_out_for_test.ffn.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg - - -# def test_create_gen_ok(): -# """ -# Test that when everything is ok in both ffn and lst files, the gen file is -# created as expected. -# """ -# faaseq = os.path.join("test", "data", "annotate", "test_files", "original_name.fna-prokkaRes", -# "prokka_out_for_test.ffn") -# lstfile = os.path.join("test", "data", "annotate", "exp_files", "res_tbl2lst.lst") -# genseq = os.path.join("test", "data", "annotate", "test_create_gen.gen") -# assert ffunc.create_gen(faaseq, lstfile, genseq, my_logger()[1]) -# exp_file = os.path.join("test", "data", "annotate", "exp_files", "res_create_gen.gen") -# with open(exp_file, "r") as expf, open(genseq, "r") as prtf: -# for line_exp, line_out in zip(expf, prtf): -# assert line_exp == line_out -# os.remove(genseq) - - -# def test_handle_line_gff(): -# """ -# Check that given a line in lstinfo with no information (gene name, ecnumber, product, -# inference), it returns the good gff line -# """ -# line_lst = ("201\t743\tC\tCDS\tESCO.1015.00001.b0001_00001\tNA\t" -# "| NA | NA | NA") -# line_gff = ("H561_S27_L001__1\tProdigal:2.6\tCDS\t201\t743\t.\t-\t0\t" -# "ID=ONKACNIE_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ONKACNIE_00001;product=hypothetical protein") -# outgff = "test_handle_line_gff.gff" -# gfff = open(outgff, "w") -# ffunc.handle_line_gff(line_lst, line_gff, gfff) -# gfff.close() -# with open(outgff, "r") as gf: -# lines = gf.readlines() -# assert len(lines) == 1 -# exp_line = ("ESCO.1015.00001.0001\tProdigal:2.6\tCDS\t201\t743\t.\t-\t.\t" -# "ID=ESCO.1015.00001.b0001_00001;locus_tag=ESCO.1015.00001.b0001_00001\n") -# assert lines[0] == exp_line -# os.remove(outgff) - - -# 
def test_handle_line_gff_ecnum(): -# """ -# Check that given a line in lstinfo with only ec_number information, -# it returns the good gff line -# """ -# line_lst = ("201\t743\tC\tCDS\tESCO.1015.00001.b0001_00001\tNA\t" -# "| NA | 123.995.4546 | NA") -# line_gff = ("H561_S27_L001__1\tProdigal:2.6\tCDS\t201\t743\t.\t-\t0\t" -# "ID=ONKACNIE_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ONKACNIE_00001;product=hypothetical protein") -# outgff = "test_handle_line_gff-ecnum.gff" -# gfff = open(outgff, "w") -# ffunc.handle_line_gff(line_lst, line_gff, gfff) -# gfff.close() -# with open(outgff, "r") as gf: -# lines = gf.readlines() -# assert len(lines) == 1 -# exp_line = ("ESCO.1015.00001.0001\tProdigal:2.6\tCDS\t201\t743\t.\t-\t.\t" -# "ID=ESCO.1015.00001.b0001_00001;eC_number=123.995.4546;" -# "locus_tag=ESCO.1015.00001.b0001_00001\n") -# assert lines[0] == exp_line -# os.remove(outgff) - - -# def test_handle_line_gff_gene(): -# """ -# Check that given a line in lstinfo with only gene name information, -# it returns the good gff line -# """ -# line_lst = ("201\t743\tC\tCDS\tESCO.1015.00001.b0001_00001\tge4a\t" -# "| NA | NA | NA") -# line_gff = ("H561_S27_L001__1\tProdigal:2.6\tCDS\t201\t743\t.\t-\t0\t" -# "ID=ONKACNIE_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ONKACNIE_00001;product=hypothetical protein") -# outgff = "test_handle_line_gff-gene.gff" -# gfff = open(outgff, "w") -# ffunc.handle_line_gff(line_lst, line_gff, gfff) -# gfff.close() -# with open(outgff, "r") as gf: -# lines = gf.readlines() -# assert len(lines) == 1 -# exp_line = ("ESCO.1015.00001.0001\tProdigal:2.6\tCDS\t201\t743\t.\t-\t.\t" -# "ID=ESCO.1015.00001.b0001_00001;Name=ge4a;gene=ge4a;" -# "locus_tag=ESCO.1015.00001.b0001_00001\n") -# assert lines[0] == exp_line -# os.remove(outgff) - - -# def test_handle_line_gff_inf(): -# """ -# Check that given a line in lstinfo with only inference information, -# it returns the good gff line -# """ -# line_lst = 
("201\t743\tC\tCDS\tESCO.1015.00001.b0001_00001\tNA\t" -# "| NA | NA | ab initio prediction:Prodigal:2.6") -# line_gff = ("H561_S27_L001__1\tProdigal:2.6\tCDS\t201\t743\t.\t-\t0\t" -# "ID=ONKACNIE_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ONKACNIE_00001;product=hypothetical protein") -# outgff = "test_handle_line_gff-inf.gff" -# gfff = open(outgff, "w") -# ffunc.handle_line_gff(line_lst, line_gff, gfff) -# gfff.close() -# with open(outgff, "r") as gf: -# lines = gf.readlines() -# assert len(lines) == 1 -# exp_line = ("ESCO.1015.00001.0001\tProdigal:2.6\tCDS\t201\t743\t.\t-\t.\t" -# "ID=ESCO.1015.00001.b0001_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ESCO.1015.00001.b0001_00001\n") -# assert lines[0] == exp_line -# os.remove(outgff) - - -# def test_handle_line_gff_prod(): -# """ -# Check that given a line in lstinfo with only product information, -# it returns the good gff line -# """ -# line_lst = ("201\t743\tC\tCDS\tESCO.1015.00001.b0001_00001\tNA\t" -# "| hypothetical protein | NA | NA") -# line_gff = ("H561_S27_L001__1\tProdigal:2.6\tCDS\t201\t743\t.\t-\t0\t" -# "ID=ONKACNIE_00001;inference=ab initio " -# "prediction:Prodigal:2.6;locus_tag=ONKACNIE_00001;product=hypothetical protein") -# outgff = "test_handle_line_gff-prod.gff" -# gfff = open(outgff, "w") -# ffunc.handle_line_gff(line_lst, line_gff, gfff) -# gfff.close() -# with open(outgff, "r") as gf: -# lines = gf.readlines() -# assert len(lines) == 1 -# exp_line = ("ESCO.1015.00001.0001\tProdigal:2.6\tCDS\t201\t743\t.\t-\t.\t" -# "ID=ESCO.1015.00001.b0001_00001;locus_tag=ESCO.1015.00001.b0001_00001;" -# "product=hypothetical protein\n") -# assert lines[0] == exp_line -# os.remove(outgff) - - -# def test_generate_gff(): -# """ -# Test creating gff file. 
-# """ -# prokgff = os.path.join("test", "data", "annotate", "test_files", "prokka_out_gff.gff") -# gffout = os.path.join("test", "data", "annotate", "test_creategff.gff") -# lstgenome = os.path.join("test", "data", "annotate", "test_files", "lstinfo_for_gff.lst") -# assert ffunc.generate_gff(prokgff, gffout, lstgenome, my_logger()[1]) -# exp_gff = os.path.join("test", "data", "annotate", "exp_files", "res_create_gff.gff") -# with open(gffout, "r") as gffo, open(exp_gff, "r") as expf: -# for line_exp, line_out in zip(expf, gffo): -# assert line_exp == line_out -# os.remove(gffout) - - -# def test_generate_gff_error(): -# """ -# Test creating gff file. -# """ -# logger = my_logger() -# prokgff = os.path.join("test", "data", "annotate", "test_files", "prokka_out_gff-error.gff") -# lstgenome = os.path.join("test", "data", "annotate", "test_files", "lstinfo_for_gff.lst") -# gffout = os.path.join("test", "data", "annotate", "test_creategff.gff") -# assert not ffunc.generate_gff(prokgff, gffout, lstgenome, logger[1]) -# os.remove(gffout) -# q = logger[0] -# assert q.qsize() == 1 -# logfound = q.get() -# msg = ("Problem with your gff file. '##FASTA' is not a gff entry line, whereas it should " -# "correspond to '863\t1795\tD\tCDS\tESCO.1015.00001.b0003_00016\tNA\t" -# "| hypothetical protein | NA | NA'") -# assert msg in logfound.message -# assert logfound.levelname == "ERROR" - - - - -# def test_format1genome(): -# """ -# Test that formatting a genome (making .prt, .gen, .fna, .lst) works, with a genome -# which did not change name between prokka run and format step. 
-# """ -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-split5N.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# assert ffunc.format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, -# gene_dir, rep_dir, gff_dir, my_logger()[1]) -# # Check that all files were created -# assert os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# # Check the contents of the files -# explst = os.path.join(prok_path, "res_format-B2.lst") -# expprt = os.path.join(prok_path, "res_format-B2.prt") -# expgen = os.path.join(prok_path, "res_format-B2.gen") -# expgff = os.path.join(prok_path, "res_format-B2.gff") -# with open(explst, "r") as lstf, open(os.path.join(lst_dir, name + ".lst"), "r") as lsto: -# for line_exp, line_out in zip(lstf, lsto): -# assert line_exp == line_out -# with open(expprt, "r") as expf, open(os.path.join(lst_dir, name + ".prt"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(expgen, "r") as expf, open(os.path.join(lst_dir, name + ".gen"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(gpath, "r") as expf, open(os.path.join(lst_dir, name + ".fna"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(expgff, "r") as expf, open(os.path.join(lst_dir, name + ".gff"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# os.remove(os.path.join(lst_dir, name + ".lst")) -# 
os.remove(os.path.join(lst_dir, name + ".prt")) -# os.remove(os.path.join(lst_dir, name + ".fna")) -# os.remove(os.path.join(lst_dir, name + ".gen")) -# os.remove(os.path.join(lst_dir, name + ".gff")) - - -# def test_format1genome_change_head(): -# """ -# Test that formatting a genome (making .prt, .gen, .fna, .lst) works, with a genome -# which changed its name between prokka and format step. -# """ -# ginit = os.path.join("test", "data", "annotate", "genomes", "B2_A3_5.fasta-changeName.fna") -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-changeName.fna-short-contig.fna") -# shutil.copyfile(ginit, gpath) -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# assert ffunc.format_one_genome(gpath, name, prok_path, lst_dir, -# prot_dir, gene_dir, rep_dir, gff_dir, my_logger()[1]) -# # Check that all files were created -# assert os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# # Check the contents of the files -# explst = os.path.join(prok_path, "res_format-B2.lst") -# expprt = os.path.join(prok_path, "res_format-B2.prt") -# expgen = os.path.join(prok_path, "res_format-B2.gen") -# expgff = os.path.join(prok_path, "res_format-B2.gff") -# expreplicons = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-split5N.fna-short-contig.fna") -# with open(explst, "r") as lstf, open(os.path.join(lst_dir, name + ".lst"), "r") as lsto: -# for line_exp, line_out in zip(lstf, lsto): -# assert line_exp == line_out -# with open(expprt, "r") as expf, open(os.path.join(lst_dir, name + ".prt"), "r") 
as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(expgen, "r") as expf, open(os.path.join(lst_dir, name + ".gen"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(expgff, "r") as expf, open(os.path.join(lst_dir, name + ".gff"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# with open(expreplicons, "r") as expf, open(os.path.join(lst_dir, name + ".fna"), "r") as outf: -# for line_exp, line_out in zip(expf, outf): -# assert line_exp == line_out -# os.remove(os.path.join(lst_dir, name + ".lst")) -# os.remove(os.path.join(lst_dir, name + ".prt")) -# os.remove(os.path.join(lst_dir, name + ".fna")) -# os.remove(os.path.join(lst_dir, name + ".gen")) -# os.remove(os.path.join(lst_dir, name + ".gff")) -# os.remove(gpath) - - -# def test_format1genome_problemgen(): -# """ -# Test that formatting a genome (making .prt, .gen, .fna, .lst) returns an error message -# and does not create any output file if there is a problem while converting the -# .ffn to .gen -# """ -# logger = my_logger() -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-problems.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# tbl_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# tblout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# shutil.copyfile(tbl_init, tblout) -# gff_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# gffout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# shutil.copyfile(gff_init, gffout) -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# 
gff_dir = lst_dir -# assert not ffunc.format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, -# gene_dir, rep_dir, gff_dir, logger[1]) -# # Check that all files were not created -# assert not os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# msg = ("Unknown header format >EPKOMDHM_i00002 hypothetical protein in " -# "test/data/annotate/exp_files/B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes/" -# "test.0417.00002.ffn.\n" -# "Gen file will not be created.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg -# # remove tblout which was copied for this test -# os.remove(tblout) -# os.remove(gffout) - - -# def test_format1genome_problemprt(): -# """ -# Test that formatting a genome (making .prt, .gen, .fna, .lst) works, with a genome -# which did not change name between prokka run and format step. 
-# """ -# logger = my_logger() -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-problems.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# # copy tbl without errors to error prokka dir -# tbl_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# tblout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# shutil.copyfile(tbl_init, tblout) -# # copy gff without errors to error prokka dir -# gff_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# gffout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# shutil.copyfile(gff_init, gffout) -# # copy ffn without error to error prokka dir -# ffn_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".ffn") -# ffn_ok = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".ffn") -# ffn_error = ffn_ok + "-error" -# # change name of ffn file with error to keep it for later (used for tests) -# shutil.copyfile(ffn_ok, ffn_error) -# # copy ffn without error to prokka res (erasing ffn with error) -# shutil.copyfile(ffn_init, ffn_ok) -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# assert not ffunc.format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, -# gene_dir, rep_dir, gff_dir, logger[1]) -# # Check that all files were not created -# assert not os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert not 
os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# msg = ("Unknown header format >EPKOMDHM00003 hypothetical protein in " -# "test/data/annotate/exp_files/B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes/" -# "test.0417.00002.faa. " -# "Error: invalid literal for int() with base 10: '>EPKOMDHM00003'\n" -# "Prt file not created from test/data/annotate/exp_files/" -# "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes/test.0417.00002.faa.") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg -# # remove files which were copied for this test (tblout). And rename ffn with errors -# # to its original name. -# os.rename(ffn_error, ffn_ok) -# os.remove(tblout) -# os.remove(gffout) - - -# def test_format1genome_problemgff(): -# """ -# Test that formatting a genome (making .prt, .gen, .fna, .lst) returns an error message -# and does not create any output file if there is a problem while converting the -# .ffn to .gen -# """ -# logger = my_logger() -# gpath = os.path.join("test", "data", "annotate", "genomes", -# "B2_A3_5.fasta-problems.fna-short-contig.fna") -# name = "test.0417.00002" -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# tbl_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# tblout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# shutil.copyfile(tbl_init, tblout) -# gff_init = os.path.join("test", "data", "annotate", "test_files", "prokka_out_gff-error.gff") -# gffout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# shutil.copyfile(gff_init, gffout) -# lst_dir = os.path.join("test", "data", "annotate") -# prot_dir = lst_dir -# gene_dir = lst_dir -# rep_dir = lst_dir -# gff_dir = lst_dir -# assert not ffunc.format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, -# gene_dir, rep_dir, gff_dir, logger[1]) -# # Check that all files were 
not created -# assert not os.path.isfile(os.path.join(lst_dir, name + ".lst")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".fna")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".prt")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gen")) -# assert not os.path.isfile(os.path.join(lst_dir, name + ".gff")) -# msg = ("Problem with your gff file. '##FASTA' is not a gff entry line, whereas it should " -# "correspond to '11249\t12328\tD\tCDS\ttest.0417.00002.i0002_00016\tNA\t" -# "| hypothetical protein | NA | NA'") -# q = logger[0] -# assert q.qsize() == 1 -# assert q.get().message == msg -# # remove tblout which was copied for this test -# os.remove(tblout) -# os.remove(gffout) - - -# def test_format_all(): -# """ -# Test that when giving a list of genomes, for which prokka ran without problem, -# they are formatted, with all expected files created. -# """ -# # genomes = {genome: [name, gpath, size, nbcont, l90]} -# initnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] -# initpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in initnames] -# gnames = ["H299_H561.fasta-short-contig.fna", "B2_A3_5.fasta-changeName.fna-short-contig.fna"] -# onames = ["test_runprokka_H299", "test.0417.00002"] -# gpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in gnames] -# for f1, f2 in zip(initpaths, gpaths): -# shutil.copyfile(f1, f2) -# genomes = {gnames[0]: [onames[0], gpaths[0], 12656, 3, 1], -# gnames[1]: [onames[1], gpaths[1], 456464645, 5, 1] -# } -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# res_path = os.path.join("test", "data", "annotate") -# results = {gname: True for gname in gnames} -# skipped, skipped_format = ffunc.format_genomes(genomes, results, res_path, -# prok_path, threads=4) -# assert skipped == [] -# assert skipped_format == [] -# lstfiles = [os.path.join(res_path, "LSTINFO", name + ".lst") for name in onames] -# prtfiles = 
[os.path.join(res_path, "Proteins", name + ".prt") for name in onames] -# genfiles = [os.path.join(res_path, "Genes", name + ".gen") for name in onames] -# repfiles = [os.path.join(res_path, "Replicons", name + ".fna") for name in onames] -# gfffiles = [os.path.join(res_path, "gff3", name + ".gff") for name in onames] -# for f in lstfiles + prtfiles + genfiles + repfiles + gfffiles: -# assert os.path.isfile(f) -# shutil.rmtree(os.path.join(res_path, "LSTINFO")) -# shutil.rmtree(os.path.join(res_path, "Proteins")) -# shutil.rmtree(os.path.join(res_path, "Genes")) -# shutil.rmtree(os.path.join(res_path, "Replicons")) -# shutil.rmtree(os.path.join(res_path, "gff3")) -# for f in gpaths: -# os.remove(f) - - -# def test_format_all_result_false(): -# """ -# Test that when giving a list of 2 genomes, 1 for which prokka ran without problem, -# 1 for which prokka had problems (given with False in results), -# the correct genome is formatted, with all -# expected files created, and the genome with problems is not formatted. 
-# """ -# # genomes = {genome: [name, gpath, size, nbcont, l90]} -# initnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] -# initpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in initnames] -# gnames = ["H299_H561.fasta-short-contig.fna", "B2_A3_5.fasta-changeName.fna-short-contig.fna"] -# onames = ["test_runprokka_H299", "test.0417.00002"] -# gpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in gnames] -# for f1, f2 in zip(initpaths, gpaths): -# shutil.copyfile(f1, f2) -# genomes = {gnames[0]: [onames[0], gpaths[0], 12656, 3, 1], -# gnames[1]: [onames[1], gpaths[1], 456464645, 5, 1] -# } -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# res_path = os.path.join("test", "data", "annotate") -# results = {gnames[0]: True, gnames[1]: False} -# skipped, skipped_format = ffunc.format_genomes(genomes, results, res_path, prok_path) -# assert skipped == ["B2_A3_5.fasta-changeName.fna-short-contig.fna"] -# assert skipped_format == [] -# lstfiles = os.path.join(res_path, "LSTINFO") -# prtfiles = os.path.join(res_path, "Proteins") -# genfiles = os.path.join(res_path, "Genes") -# repfiles = os.path.join(res_path, "Replicons") -# gfffiles = os.path.join(res_path, "gff3") -# assert os.path.isfile(os.path.join(lstfiles, onames[0] + ".lst")) -# assert not os.path.isfile(os.path.join(lstfiles, onames[1] + ".lst")) -# assert os.path.isfile(os.path.join(prtfiles, onames[0] + ".prt")) -# assert not os.path.isfile(os.path.join(prtfiles, onames[1] + ".prt")) -# assert os.path.isfile(os.path.join(genfiles, onames[0] + ".gen")) -# assert not os.path.isfile(os.path.join(genfiles, onames[1] + ".gen")) -# assert os.path.isfile(os.path.join(repfiles, onames[0] + ".fna")) -# assert not os.path.isfile(os.path.join(repfiles, onames[1] + ".fna")) -# assert os.path.isfile(os.path.join(gfffiles, onames[0] + ".gff")) -# assert not os.path.isfile(os.path.join(gfffiles, onames[1] + ".gff")) -# 
shutil.rmtree(os.path.join(res_path, "LSTINFO")) -# shutil.rmtree(os.path.join(res_path, "Proteins")) -# shutil.rmtree(os.path.join(res_path, "Genes")) -# shutil.rmtree(os.path.join(res_path, "Replicons")) -# shutil.rmtree(os.path.join(res_path, "gff3")) -# for f in gpaths: -# os.remove(f) - - -# def test_format_all_not_result(): -# """ -# Test that when giving a list of 2 genomes, but only 1 is in the results list (and prokka ran -# without problems for it), the correct genome is formatted, with all -# expected files created, and the other genome is not formatted, and does not appear in -# skipped list (as it was removed from the study before annotation step, probably by QC). -# """ -# # genomes = {genome: [name, gpath, size, nbcont, l90]} -# initnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] -# initpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in initnames] -# gnames = ["H299_H561.fasta-short-contig.fna", "B2_A3_5.fasta-changeName.fna-short-contig.fna"] -# onames = ["test_runprokka_H299", "test.0417.00002"] -# gpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in gnames] -# for f1, f2 in zip(initpaths, gpaths): -# shutil.copyfile(f1, f2) -# genomes = {gnames[0]: [onames[0], gpaths[0], 12656, 3, 1], -# gnames[1]: [onames[1], gpaths[1], 456464645, 5, 1] -# } -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# res_path = os.path.join("test", "data", "annotate") -# results = {gnames[0]: True} -# skipped, skipped_format = ffunc.format_genomes(genomes, results, res_path, prok_path) -# assert skipped == [] -# assert skipped_format == [] -# lstfiles = os.path.join(res_path, "LSTINFO") -# prtfiles = os.path.join(res_path, "Proteins") -# genfiles = os.path.join(res_path, "Genes") -# repfiles = os.path.join(res_path, "Replicons") -# gfffiles = os.path.join(res_path, "gff3") -# assert os.path.isfile(os.path.join(lstfiles, onames[0] + ".lst")) -# assert not 
os.path.isfile(os.path.join(lstfiles, onames[1] + ".lst")) -# assert os.path.isfile(os.path.join(prtfiles, onames[0] + ".prt")) -# assert not os.path.isfile(os.path.join(prtfiles, onames[1] + ".prt")) -# assert os.path.isfile(os.path.join(genfiles, onames[0] + ".gen")) -# assert not os.path.isfile(os.path.join(genfiles, onames[1] + ".gen")) -# assert os.path.isfile(os.path.join(repfiles, onames[0] + ".fna")) -# assert not os.path.isfile(os.path.join(repfiles, onames[1] + ".fna")) -# assert os.path.isfile(os.path.join(gfffiles, onames[0] + ".gff")) -# assert not os.path.isfile(os.path.join(gfffiles, onames[1] + ".gff")) -# shutil.rmtree(os.path.join(res_path, "LSTINFO")) -# shutil.rmtree(os.path.join(res_path, "Proteins")) -# shutil.rmtree(os.path.join(res_path, "Genes")) -# shutil.rmtree(os.path.join(res_path, "Replicons")) -# shutil.rmtree(os.path.join(res_path, "gff3")) -# for f in gpaths: -# os.remove(f) - -# # probleme avec .fna de onames[0] qui n'est pas créé... - - -# def test_format_all_error(): -# """ -# Test that when giving a list of 2 genomes, prokka ran without problem for both. -# But a problem appears while formatting the 2nd one. So, the 2nd one is not formatted, -# and appears in skipped_format. The first one is formated, and check that all -# output files are created. 
-# """ -# # genomes = {genome: [name, gpath, size, nbcont, l90]} -# name = "test.0417.00002" -# initnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] -# initpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in initnames] -# gnames = ["H299_H561.fasta-short-contig.fna", "B2_A3_5.fasta-problems.fna-short-contig.fna"] -# onames = ["test_runprokka_H299", "test.0417.00002"] -# gpaths = [os.path.join("test", "data", "annotate", "genomes", name) for name in gnames] -# for f1, f2 in zip(initpaths, gpaths): -# shutil.copyfile(f1, f2) -# genomes = {gnames[0]: [onames[0], gpaths[0], 12656, 3, 1], -# gnames[1]: [onames[1], gpaths[1], 456464645, 5, 1] -# } -# prok_path = os.path.join("test", "data", "annotate", "exp_files") -# res_path = os.path.join("test", "data", "annotate") -# tbl_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# tblout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".tbl") -# shutil.copyfile(tbl_init, tblout) -# gff_init = os.path.join(prok_path, "B2_A3_5.fasta-split5N.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# gffout = os.path.join(prok_path, "B2_A3_5.fasta-problems.fna-short-contig.fna-prokkaRes", -# name + ".gff") -# shutil.copyfile(gff_init, gffout) -# results = {gnames[0]: True, gnames[1]: True} -# skipped, skipped_format = ffunc.format_genomes(genomes, results, res_path, prok_path) -# assert skipped == [] -# assert skipped_format == ["B2_A3_5.fasta-problems.fna-short-contig.fna"] -# lstfiles = os.path.join(res_path, "LSTINFO") -# prtfiles = os.path.join(res_path, "Proteins") -# genfiles = os.path.join(res_path, "Genes") -# repfiles = os.path.join(res_path, "Replicons") -# gfffiles = os.path.join(res_path, "gff3") -# assert os.path.isfile(os.path.join(lstfiles, onames[0] + ".lst")) -# assert not os.path.isfile(os.path.join(lstfiles, onames[1] + ".lst")) -# assert os.path.isfile(os.path.join(prtfiles, 
onames[0] + ".prt")) -# assert not os.path.isfile(os.path.join(prtfiles, onames[1] + ".prt")) -# assert os.path.isfile(os.path.join(genfiles, onames[0] + ".gen")) -# assert not os.path.isfile(os.path.join(genfiles, onames[1] + ".gen")) -# assert os.path.isfile(os.path.join(repfiles, onames[0] + ".fna")) -# assert not os.path.isfile(os.path.join(repfiles, onames[1] + ".fna")) -# assert os.path.isfile(os.path.join(gfffiles, onames[0] + ".gff")) -# assert not os.path.isfile(os.path.join(gfffiles, onames[1] + ".gff")) -# shutil.rmtree(os.path.join(res_path, "LSTINFO")) -# shutil.rmtree(os.path.join(res_path, "Proteins")) -# shutil.rmtree(os.path.join(res_path, "Genes")) -# shutil.rmtree(os.path.join(res_path, "Replicons")) -# shutil.rmtree(os.path.join(res_path, "gff3")) -# os.remove(tblout) -# os.remove(gffout) -# for f in gpaths: -# os.remove(f) + # Create prokka output dir and pur expected files (empty, we want to generate an error) + gpath = os.path.join(GENEPATH, "toto.fasta") + open(gpath, "w").close() + prok_path = gpath + "-prokkaRes" + os.makedirs(prok_path) + fna_res = os.path.join(prok_path, " toto.fna") + tbl_res = os.path.join(prok_path, " toto.tbl") + gff_res = os.path.join(prok_path, "toto.gff") + ffn_res = os.path.join(prok_path, "toto.ffn") + faa_res = os.path.join(prok_path, "toto.faa") + for file in [fna_res, tbl_res, gff_res, ffn_res, faa_res]: + open(file, "w").close() + # Create output directory for .fna file + rep_dir = os.path.join(GENEPATH, "Replicons") + os.makedirs(rep_dir) + # Get args for function + args = ("toto.fasta", "name", gpath, GENEPATH, "lst/dir", "prot/dir", + "gene/dir", rep_dir, "gff/dir", False, my_logger()[0]) + ok_format, genome = ffunc.handle_genome(args) + assert ok_format == False + assert genome == "toto.fasta" + + +def test_handle_genome_badprodigal(): + """ + Test that when we try to format a genome which was annotated by prokka, but original genome + is empty -> cannot format genome -> returns False associated with 
genome name + """ + # Create prokka output dir and pur expected files (empty, we want to generate an error) + gpath = os.path.join(GENEPATH, "wrong.fasta") + open(gpath, "w").close() + prodi_path = gpath + "-prodigalRes" + os.makedirs(prodi_path) + gff_res = os.path.join(prodi_path, "toto.gff") + ffn_res = os.path.join(prodi_path, "toto.ffn") + faa_res = os.path.join(prodi_path, "toto.faa") + for file in [gff_res, ffn_res, faa_res]: + open(file, "w").close() + # Create output directory for .fna file + rep_dir = os.path.join(GENEPATH, "Replicons") + os.makedirs(rep_dir) + # Get args for function + args = ("wrong.fasta", "name", gpath, GENEPATH, "lst/dir", "prot/dir", + "gene/dir", rep_dir, "gff/dir", True, my_logger()[0]) + ok_format, genome = ffunc.handle_genome(args) + assert ok_format == False + assert genome == "wrong.fasta" + + +def test_handle_genome_formatok(caplog): + """ + Test that when we try to format a genome which was annotated by prokka without any problem + It returns True associated with the genome name + """ + caplog.set_level(logging.DEBUG) + name = "test.0417.00002" + # path to original genome, given to prodigal for annotation + gpath = os.path.join(ANNOTEDIR, "test_files", "original_name.fna") + prok_path = os.path.join(ANNOTEDIR, "test_files") + # Create result directories + prot_dir = os.path.join(GENEPATH, "Proteins") + lst_dir = os.path.join(GENEPATH, "LSTINFO") + rep_dir = os.path.join(GENEPATH, "Replicons") + gene_dir = os.path.join(GENEPATH, "Genes") + gff_dir = os.path.join(GENEPATH, "gff") + os.makedirs(prot_dir) + os.makedirs(lst_dir) + os.makedirs(rep_dir) + os.makedirs(gene_dir) + os.makedirs(gff_dir) + # Get args for function + args = ("original_name", name, gpath, prok_path, lst_dir, prot_dir, + gene_dir, rep_dir, gff_dir, False, my_logger()[0]) + ok_format, genome = ffunc.handle_genome(args) + assert ok_format == True + assert genome == "original_name" + # Check generated files + exp_rep = os.path.join(EXP_ANNOTE, 
"res_created_rep-prokka.fna") + res_rep_file = os.path.join(rep_dir, "test.0417.00002.fna") + assert tutil.compare_order_content(exp_rep, res_rep_file) + # Proteins + exp_prt = os.path.join(EXP_ANNOTE, "res_create_prt_prokka.faa") + res_prt_file = os.path.join(prot_dir, "test.0417.00002.prt") + assert tutil.compare_order_content(exp_prt, res_prt_file) + # Genes + exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_prokka.gen") + res_gen_file = os.path.join(gene_dir, "test.0417.00002.gen") + assert tutil.compare_order_content(exp_gen, res_gen_file) + # LSTINFO + exp_lst = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") + res_lst_file = os.path.join(lst_dir, "test.0417.00002.lst") + assert tutil.compare_order_content(exp_lst, res_lst_file) + # gff + exp_gff = os.path.join(EXP_ANNOTE, "res_create_gff-prokka.gff") + res_gff_file = os.path.join(gff_dir, "test.0417.00002.gff") + assert tutil.compare_order_content(exp_gff, res_gff_file) + + +def test_handle_genome_formatok_prodigal(caplog): + """ + Test that when we try to format a genome which was annotated by prodigal without any problem + It returns True associated with the genome name + """ + caplog.set_level(logging.DEBUG) + name_orig = "prodigal.outtest.ok" + name = "test.0417.00002" + # path to original genome, given to prodigal for annotation + gpath = os.path.join(ANNOTEDIR, "test_files", "original_name.fna") + prodi_path = os.path.join(ANNOTEDIR, "test_files") + # Create result directories + prot_dir = os.path.join(GENEPATH, "Proteins") + lst_dir = os.path.join(GENEPATH, "LSTINFO") + rep_dir = os.path.join(GENEPATH, "Replicons") + gene_dir = os.path.join(GENEPATH, "Genes") + gff_dir = os.path.join(GENEPATH, "gff") + os.makedirs(prot_dir) + os.makedirs(lst_dir) + os.makedirs(rep_dir) + os.makedirs(gene_dir) + os.makedirs(gff_dir) + # Get args for function + args = (name_orig, name, gpath, prodi_path, lst_dir, prot_dir, + gene_dir, rep_dir, gff_dir, True, my_logger()[0]) + ok_format, genome = 
ffunc.handle_genome(args) + assert ok_format == True + assert genome == name_orig + # Check generated files + exp_rep = os.path.join(EXP_ANNOTE, "res_created_rep-prokka.fna") + res_rep_file = os.path.join(rep_dir, "test.0417.00002.fna") + assert tutil.compare_order_content(exp_rep, res_rep_file) + # Proteins + exp_prt = os.path.join(EXP_ANNOTE, "res_create_prt_prodigal.faa") + res_prt_file = os.path.join(prot_dir, "test.0417.00002.prt") + assert tutil.compare_order_content(exp_prt, res_prt_file) + # Genes + exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_lst_prodigal.gen") + res_gen_file = os.path.join(gene_dir, "test.0417.00002.gen") + assert tutil.compare_order_content(exp_gen, res_gen_file) + # LSTINFO + exp_lst = os.path.join(EXP_ANNOTE, "res_create_gene_lst_prodigal.lst") + res_lst_file = os.path.join(lst_dir, "test.0417.00002.lst") + assert tutil.compare_order_content(exp_lst, res_lst_file) + # gff + exp_gff = os.path.join(EXP_ANNOTE, "res_create_gff_prodigal.gff") + res_gff_file = os.path.join(gff_dir, "test.0417.00002.gff") + assert tutil.compare_order_content(exp_gff, res_gff_file) + + +def test_format_all_prokka(caplog): + """ + Test that when giving a list of genomes, for which prokka ran without problem, + they are formatted, with all expected files created. 
+ """ + caplog.set_level(logging.DEBUG) + # genomes = {genome: [name, gpath, to_annot, size, nbcont, l90]} + # Get genome names we want to format (with their path) + gnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] + gpaths = [os.path.join(ANNOTEDIR, "genomes", name) for name in gnames] + onames = ["test_runprokka_H299", "test.0417.00002"] + genomes = {gnames[0]: [onames[0], gpaths[0], gpaths[0], 12656, 3, 1], + gnames[1]: [onames[1], gpaths[1], gpaths[1], 456464645, 5, 1] + } + res_path = GENEPATH + annotated_path = os.path.join(ANNOTEDIR, "exp_files") + # Format both genomes + skipped_format = ffunc.format_genomes(genomes, res_path, annotated_path, False, threads=2) + assert skipped_format == [] + # Get all names of expected output files + exp_dir = os.path.join(EXP_ANNOTE, "res_formatAll", "prokka") + exp_folders = ["LSTINFO", "Proteins", "Genes", "Replicons", "gff3"] + exp_extensions = [".lst", ".prt", ".gen", ".fna", ".gff"] + # Check that output files are created, and contain what is expected + for fol, ext in zip(exp_folders, exp_extensions): + exp_files = [os.path.join(exp_dir, fol, name + ext) for name in onames] + res_files = [os.path.join(res_path, fol, name + ext) for name in onames] + for res, exp in zip(res_files, exp_files): + assert os.path.isfile(res) + assert tutil.compare_order_content(res, exp) + # Check log + assert "Formatting all genomes" in caplog.text + + +def test_format_all_prodigal(caplog): + """ + Test that when giving a list of genomes, for which prokka ran without problem, + they are formatted, with all expected files created. 
+ """ + caplog.set_level(logging.DEBUG) + # genomes = {genome: [name, gpath, to_annot, size, nbcont, l90]} + # Get genome names we want to format (with their path) + gnames = ["H299_H561.fasta", "B2_A3_5.fasta-changeName.fna"] + gpaths = [os.path.join(ANNOTEDIR, "genomes", name) for name in gnames] + onames = ["test_runprokka_H299", "test.0417.00002"] + genomes = {gnames[0]: [onames[0], gpaths[0], gpaths[0], 12656, 3, 1], + gnames[1]: [onames[1], gpaths[1], gpaths[1], 456464645, 5, 1] + } + res_path = GENEPATH + annotated_path = os.path.join(ANNOTEDIR, "exp_files") + # Format both genomes + skipped_format = ffunc.format_genomes(genomes, res_path, annotated_path, True, threads=2) + assert skipped_format == [] + # Get all names of expected output files + exp_dir = os.path.join(EXP_ANNOTE, "res_formatAll", "prodigal") + exp_folders = ["LSTINFO", "Proteins", "Genes", "Replicons", "gff3"] + exp_extensions = [".lst", ".prt", ".gen", ".fna", ".gff"] + # Check that output files are created, and contain what is expected + for fol, ext in zip(exp_folders, exp_extensions): + exp_files = [os.path.join(exp_dir, fol, name + ext) for name in onames] + res_files = [os.path.join(res_path, fol, name + ext) for name in onames] + for res, exp in zip(res_files, exp_files): + assert os.path.isfile(res) + assert tutil.compare_order_content(res, exp) + # Check log + assert "Formatting all genomes" in caplog.text + + +def test_format_allpb_prokka(caplog): + """ + Test that when giving a list of genomes, 1 that is correctly formatted, and 1 has a pb, + it returns the last one in skipped_format + """ + caplog.set_level(logging.DEBUG) + # Create empty original sequence files + genomes = ["wrong.fasta", "error.fasta"] + gpaths = [os.path.join(GENEPATH, name) for name in genomes] + for file in gpaths: + open(file, "w").close() + # Add prokka (empty) result files to prokkaRes directory + prok_paths = [gpath + "-prokkaRes" for gpath in gpaths] + for prok_path in prok_paths: + 
os.makedirs(prok_path) + tbl_res = os.path.join(prok_path, "toto.tbl") + gff_res = os.path.join(prok_path, "toto.gff") + ffn_res = os.path.join(prok_path, "toto.ffn") + faa_res = os.path.join(prok_path, "toto.faa") + fna_res = os.path.join(prok_path, "toto.fna") + for file in [fna_res, tbl_res, gff_res, ffn_res, faa_res]: + open(file, "w").close() + # Create output directory for .fna files + rep_dir = os.path.join(GENEPATH, "Replicons") + os.makedirs(rep_dir) + # genomes = {genome: [name, gpath, to_annot, size, nbcont, l90]} + genomes = {genomes[0]: ["test_wrong-fasta", gpaths[0], gpaths[0], 12656, 3, 1], + genomes[1]: ["test_error-fasta", gpaths[1], gpaths[1], 456464645, 5, 1] + } + res_path = GENEPATH + annotated_path = GENEPATH + # Try to format both genomes + skipped_format = ffunc.format_genomes(genomes, res_path, annotated_path, False, threads=1) + assert skipped_format == ["wrong.fasta", "error.fasta"] + # Get all names of expected output files + exp_folders = ["LSTINFO", "Proteins", "Genes", "Replicons", "gff3"] + for res_folder in [os.path.join(res_path, folder) for folder in exp_folders]: + assert len(os.listdir(res_folder)) == 0 + # Check log + assert "Formatting all genomes" in caplog.text + assert ("Your genome test/data/annotate/generated_by_unit-tests/" + "wrong.fasta-prokkaRes/toto.fna does not " + "contain any sequence, or is not in fasta format.") in caplog.text + assert ("Your genome test/data/annotate/generated_by_unit-tests/" + "error.fasta-prokkaRes/toto.fna does not " + "contain any sequence, or is not in fasta format.") in caplog.text + assert "Problems while generating Replicon file for test_wrong-fasta" in caplog.text + assert "Problems while generating Replicon file for test_error-fasta" in caplog.text + + +def test_format_1pb_prodigal(caplog): + """ + Test that when giving a list of genomes, 1 that is correctly formatted, and 1 has a pb, + it returns the last one in skipped_format + """ + caplog.set_level(logging.DEBUG) + # GENOME 2: 
Create empty original genome file + genome1 = "wrong.fasta" + gpath1 = os.path.join(GENEPATH, "wrong.fasta") + open(gpath1, "w").close() + # Add prodigal (empty) result files to prodigalRes directory + prodi_path = gpath1 + "-prodigalRes" + os.makedirs(prodi_path) + gff_res = os.path.join(prodi_path, "toto.gff") + ffn_res = os.path.join(prodi_path, "toto.ffn") + faa_res = os.path.join(prodi_path, "toto.faa") + for file in [gff_res, ffn_res, faa_res]: + open(file, "w").close() + # Create output directory for .fna file + rep_dir = os.path.join(GENEPATH, "Replicons") + os.makedirs(rep_dir) + # GENOME 2 + genome2 = "H299_H561.fasta" + gpath2 = os.path.join(ANNOTEDIR, "genomes", genome2) + # Copy results of prodigal for this genome to output dir (GENEPATH) + orig_res_files = os.path.join(EXP_ANNOTE, genome2 + '-prodigalRes') + used_res_path = os.path.join(GENEPATH, genome2 + "-prodigalRes") + shutil.copytree(orig_res_files, used_res_path) + # genomes = {genome: [name, gpath, to_annot, size, nbcont, l90]} + genomes = {genome1: ["test_genome1", gpath1, gpath1, 12656, 3, 1], + genome2: ["test_runprokka_H299", gpath2, gpath2, 456464645, 5, 1] + } + res_path = GENEPATH + annotated_path = GENEPATH + # Format both genomes + skipped_format = ffunc.format_genomes(genomes, res_path, annotated_path, True, threads=2) + assert skipped_format == ["wrong.fasta"] + # Get all names of expected output files + exp_dir = os.path.join(EXP_ANNOTE, "res_formatAll", "prodigal") + exp_folders = ["LSTINFO", "Proteins", "Genes", "Replicons", "gff3"] + exp_extensions = [".lst", ".prt", ".gen", ".fna", ".gff"] + # Check that output files are created, and contain what is expected + for fol, ext in zip(exp_folders, exp_extensions): + exp_file = os.path.join(exp_dir, fol, "test_runprokka_H299" + ext) + res_file = os.path.join(res_path, fol, "test_runprokka_H299" + ext) + assert os.path.isfile(res_file) + assert tutil.compare_order_content(res_file, exp_file) + # Check log + assert "Formatting all 
genomes" in caplog.text + assert ("Your genome test/data/annotate/generated_by_unit-tests/wrong.fasta does not " + "contain any sequence, or is not in fasta format.") in caplog.text + assert "Problems while generating Replicon file for test_genome1" in caplog.text diff --git a/test/test_unit/test_annotate/test_format_prodigal.py b/test/test_unit/test_annotate/test_format_prodigal.py index 00d2b2171385b28c00d4fb19e97601b1984135ee..9644df5e6ffd5acfe5d23e46fc1148161740820e 100644 --- a/test/test_unit/test_annotate/test_format_prodigal.py +++ b/test/test_unit/test_annotate/test_format_prodigal.py @@ -11,9 +11,9 @@ import shutil from io import StringIO import pytest -import PanACoTA.annotate_module.format_prodigal as prodigalfunc -import PanACoTA.utils as utils import test.test_unit.utilities_for_tests as tutil +import PanACoTA.utils as utils +from PanACoTA.annotate_module import format_prodigal as prodigalfunc ANNOTEDIR = os.path.join("test", "data", "annotate") GENOMES_DIR = os.path.join(ANNOTEDIR, "genomes") @@ -129,15 +129,14 @@ def test_create_gff(caplog): "ter": "test.0417.00002.0006", "contname": "test.0417.00002.0007" } - sizes = {"test.0417.00002.0001": 14000, - "test.0417.00002.0002": 5000, - "test.0417.00002.0003": 4600, - "test.0417.00002.0004": 8000, - "test.0417.00002.0005": 1, - "test.0417.00002.0006": 10, - "test.0417.00002.0007": 15000, + sizes = {"test.0417.00002.0001": 84, + "test.0417.00002.0002": 103, + "test.0417.00002.0003": 122, + "test.0417.00002.0004": 35, + "test.0417.00002.0005": 198, + "test.0417.00002.0006": 128, + "test.0417.00002.0007": 85, } - name = "test.0417.00002" res_gff_file = os.path.join(GENEPATH, "prodigal_res.gff") exp_lst = os.path.join(EXP_ANNOTE, "res_create_gene_lst_prodigal.lst") gpath = "original_genome_name" @@ -155,8 +154,7 @@ def test_create_gff_wrong_start(caplog): """ caplog.set_level(logging.DEBUG) logger = logging.getLogger("test_prodigal") - gfffile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", - 
"prodigal.outtest.wrong-start.gff") + gfffile = os.path.join(TEST_ANNOTE, "prodigal.outtest.wrong-start.gff") contigs = {"JGIKIPgffgIJ": "test.0417.00002.0001", "toto": "test.0417.00002.0002", "other_header": "test.0417.00002.0003", @@ -185,6 +183,80 @@ def test_create_gff_wrong_start(caplog): "(78 in gff, 77 in ffn") in caplog.text +def test_create_gff_wrong_end(caplog): + """ + Check that when trying to generate gff, if problem, exits with expected message + Here, the start position in the gff file generated by prodigal is not the same as + the start position in the lstinfo file (which was taken from the ffn + file generated by prodigal) + """ + caplog.set_level(logging.DEBUG) + logger = logging.getLogger("test_prodigal") + gfffile = os.path.join(TEST_ANNOTE, "prodigal.outtest.wrong-end.gff") + contigs = {"JGIKIPgffgIJ": "test.0417.00002.0001", + "toto": "test.0417.00002.0002", + "other_header": "test.0417.00002.0003", + "my_contig": "test.0417.00002.0004", + "bis": "test.0417.00002.0005", + "ter": "test.0417.00002.0006", + "contname": "test.0417.00002.0007" + } + sizes = {"test.0417.00002.0001": 14000, + "test.0417.00002.0002": 5000, + "test.0417.00002.0003": 4600, + "test.0417.00002.0004": 8000, + "test.0417.00002.0005": 1, + "test.0417.00002.0006": 10, + "test.0417.00002.0007": 15000, + } + res_gff_file = os.path.join(GENEPATH, "prodigal_res.gff") + exp_lst = os.path.join(EXP_ANNOTE, "res_create_gene_lst_prodigal.lst") + gpath = "original_genome_name" + assert not prodigalfunc.create_gff(gpath, gfffile, res_gff_file, exp_lst, contigs, sizes) + assert ("Files prodigal.outtest.wrong-end.ffn and " + "prodigal.outtest.wrong-end.gff " + "(in prodigal tmp_files: original_genome_name-prodigalRes) " + "do not have the same end value for gene EPKOMDHM_00009 " + "(2347 in gff, 2346 in ffn") in caplog.text + + +def test_create_gff_wrong_type(caplog): + """ + Check that when trying to generate gff, if problem, exits with expected message + Here, the start position in the 
gff file generated by prodigal is not the same as + the start position in the lstinfo file (which was taken from the ffn + file generated by prodigal) + """ + caplog.set_level(logging.DEBUG) + logger = logging.getLogger("test_prodigal") + gfffile = os.path.join(TEST_ANNOTE, "prodigal.outtest.wrong-type.gff") + contigs = {"JGIKIPgffgIJ": "test.0417.00002.0001", + "toto": "test.0417.00002.0002", + "other_header": "test.0417.00002.0003", + "my_contig": "test.0417.00002.0004", + "bis": "test.0417.00002.0005", + "ter": "test.0417.00002.0006", + "contname": "test.0417.00002.0007" + } + sizes = {"test.0417.00002.0001": 14000, + "test.0417.00002.0002": 5000, + "test.0417.00002.0003": 4600, + "test.0417.00002.0004": 8000, + "test.0417.00002.0005": 1, + "test.0417.00002.0006": 10, + "test.0417.00002.0007": 15000, + } + res_gff_file = os.path.join(GENEPATH, "prodigal_res.gff") + exp_lst = os.path.join(EXP_ANNOTE, "res_create_gene_lst_prodigal.lst") + gpath = "original_genome_name" + assert not prodigalfunc.create_gff(gpath, gfffile, res_gff_file, exp_lst, contigs, sizes) + assert ("Files prodigal.outtest.wrong-type.ffn and " + "prodigal.outtest.wrong-type.gff " + "(in prodigal tmp_files: original_genome_name-prodigalRes) " + "do not have the same type value for gene EPKOMDHM_00008 " + "(tRNA in gff, CDS in ffn") in caplog.text + + def test_create_prt(caplog): """ Check that prt file is generated as expected @@ -201,7 +273,7 @@ def test_create_prt(caplog): def test_create_prt_wrong_lst(caplog): """ - Check that prt file is generated as expected + Check that prt file is not generated if there is a problem in the lst file """ caplog.set_level(logging.DEBUG) protfile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", @@ -215,7 +287,7 @@ def test_create_prt_wrong_lst(caplog): def test_create_prt_short_lst(caplog): """ - Check that prt file is generated as expected + Check that prt file is not generated when there are more proteins in faa than in lst """ 
caplog.set_level(logging.DEBUG) protfile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", @@ -230,7 +302,7 @@ def test_create_prt_short_lst(caplog): def test_create_prt_end_not_int_lst(caplog): """ - Check that prt file is generated as expected + Check that prt file is not generated when an end value of a protein in lst file is not an int """ caplog.set_level(logging.DEBUG) protfile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", @@ -244,7 +316,8 @@ def test_create_prt_end_not_int_lst(caplog): def test_create_prt_not_divisible3_lst(caplog): """ - Check that prt file is generated as expected + Check that prt file is not generated when there is a gene which length is not + divisible by 3 """ caplog.set_level(logging.DEBUG) protfile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", @@ -258,7 +331,7 @@ def test_create_prt_not_divisible3_lst(caplog): def test_create_prt_not_moreprots_lst(caplog): """ - Check that prt file is generated as expected + Check that prt file is not generated when there are more proteins in lst than in faa """ caplog.set_level(logging.DEBUG) protfile = os.path.join(TEST_ANNOTE, "original_name.fna-prodigalRes", @@ -266,7 +339,7 @@ def test_create_prt_not_moreprots_lst(caplog): res_prt_file = os.path.join(GENEPATH, "prodigal_res.gff") exp_lst = os.path.join(TEST_ANNOTE, "test_create_prt_prodigal-more-proteins.lst") assert not prodigalfunc.create_prt(protfile, res_prt_file, exp_lst) - assert ("Protein test.0417.00002.0007b_00015 is in .lst file but its sequence is not " + assert ("Protein test.0417.00002.0007b_00016 is in .lst file but its sequence is not " "in the protein file generated by prodigal.") in caplog.text @@ -279,12 +352,12 @@ def test_format_1genome(caplog): name = "prodigal.outtest.ok" gpath = os.path.join(TEST_ANNOTE, "original_name.fna") # path to original genome, given to prodigal for annotation prod_path = TEST_ANNOTE + # Generate result folders prot_dir = os.path.join(GENEPATH, "Proteins") 
lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") gene_dir = os.path.join(GENEPATH, "Genes") gff_dir = os.path.join(GENEPATH, "gff") - os.makedirs(prot_dir) os.makedirs(lst_dir) os.makedirs(rep_dir) @@ -293,6 +366,11 @@ def test_format_1genome(caplog): assert prodigalfunc.format_one_genome(gpath, name, prod_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir) + assert os.path.isfile(os.path.join(prot_dir, "prodigal.outtest.ok.prt")) + assert os.path.isfile(os.path.join(lst_dir, "prodigal.outtest.ok.lst")) + assert os.path.isfile(os.path.join(rep_dir, "prodigal.outtest.ok.fna")) + assert os.path.isfile(os.path.join(gene_dir, "prodigal.outtest.ok.gen")) + assert os.path.isfile(os.path.join(gff_dir, "prodigal.outtest.ok.gff")) def test_format_1genome_emptygpath(caplog): @@ -305,7 +383,16 @@ def test_format_1genome_emptygpath(caplog): # Create empty file, that we give to prodigal for formatting step gpath = os.path.join(GENEPATH, "original_name-empty.fna") open(gpath, "w").close() - prod_path = TEST_ANNOTE + prod_path = GENEPATH + # Create prodigal result files (empty, then won't be read) + prodigal_dir = gpath + "-prodigalRes" + os.makedirs(prodigal_dir) + prodigal_faa = os.path.join(gpath + "-prodigalRes", "notread.faa") + prodigal_ffn = os.path.join(gpath + "-prodigalRes", "notread.ffn") + prodigal_gff = os.path.join(gpath + "-prodigalRes", "notread.gff") + for file in [prodigal_faa, prodigal_gff, prodigal_ffn]: + open(file, "w").close() + # Generate result folders prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") @@ -333,12 +420,15 @@ def test_format_1genome_emptygpath(caplog): assert len(os.listdir(lst_dir) ) == 0 assert len(os.listdir(gff_dir) ) == 0 assert len(os.listdir(gen_dir) ) == 0 + assert ("Your genome test/data/annotate/generated_by_unit-tests/original_name-empty.fna " + "does not contain any sequence, or is not in fasta format.") 
in caplog.text assert ("Problems while generating Replicon file for prodigal.outtest.ok") in caplog.text def test_format_1genome_wrongffn(caplog): """ - Test on formatting prodigal results, when the file given to prodigal was empty + Test on formatting prodigal results, when the ffn file generated by prodigal does + not have the same contig name as in original fna file -> error message, -> no file generated """ @@ -346,16 +436,19 @@ def test_format_1genome_wrongffn(caplog): name = "prodigal.outtest.ok" # path to original genome, given to prodigal for annotation orig_gpath = os.path.join(TEST_ANNOTE, "original_name.fna") - # In generated_by_tests folder, create the original genome given to prodigal - # (copy from test_file) + orig_prodpath = orig_gpath + "-prodigalRes" used_gpath = os.path.join(GENEPATH, "original_name.fna") used_respath = used_gpath + "-prodigalRes" - os.makedirs(used_respath) + # Add original genome, and prodigal results to result folder shutil.copyfile(orig_gpath, used_gpath) + shutil.copytree(orig_prodpath, used_respath) + # In GENEPATH folder, create the original genome given to prodigal + # (copy from test_file) # Create gen_file with a header not existing with open(os.path.join(used_respath, "prodigal.outtest.ok.ffn"), "w") as ori: ori.write(">wrongheader # 1 # 2 # 1 # toto") prod_path = GENEPATH + # Generate result folders prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") @@ -365,16 +458,18 @@ def test_format_1genome_wrongffn(caplog): os.makedirs(gene_dir) os.makedirs(lst_dir) os.makedirs(gff_dir) + os.makedirs(prot_dir) # Add empty res gff file, to check that it is removed at the end res_gff_file = os.path.join(gff_dir, "prodigal.outtest.ok.gff") open(res_gff_file, "w").close() assert len(os.listdir(gff_dir) ) == 1 - + # Run formatting assert not prodigalfunc.format_one_genome(used_gpath, name, prod_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir) # 
Check that all files were removed assert len(os.listdir(rep_dir) ) == 0 assert len(os.listdir(gene_dir) ) == 0 + assert len(os.listdir(prot_dir) ) == 0 assert len(os.listdir(lst_dir) ) == 0 assert len(os.listdir(gff_dir) ) == 0 assert ("'wrongheader' found in test/data/annotate/generated_by_unit-tests/" @@ -383,9 +478,10 @@ def test_format_1genome_wrongffn(caplog): assert ("Problems while generating .gen and .lst files for prodigal.outtest.ok") in caplog.text -def test_format_1genome_wronglst(caplog): +def test_format_1genome_wronggff(caplog): """ - Test on formatting prodigal results, when the file given to prodigal was empty + Test on formatting prodigal results, when the gff file generated by prodigal + does not have same info as ffn file generated by prodigal (= lst file generated by panacota) -> error message, -> no file generated """ @@ -395,16 +491,14 @@ def test_format_1genome_wronglst(caplog): # path to original genome, given to prodigal for annotation orig_gpath = os.path.join(TEST_ANNOTE, "original_name.fna") + orig_prodpath = orig_gpath + "-prodigalRes" # In generated_by_tests folder, create the original genome given to prodigal # (copy from test_file) used_gpath = os.path.join(GENEPATH, "original_name.fna") used_respath = used_gpath + "-prodigalRes" - os.makedirs(used_respath) + # Add original genome, and prodigal results to result folder shutil.copyfile(orig_gpath, used_gpath) - # Copy ffn file generated by prodigal: - orig_ffn = os.path.join(orig_gpath + "-prodigalRes", "prodigal.outtest.ok.ffn") - used_ffn = os.path.join(used_respath, "prodigal.outtest.ok.ffn") - shutil.copyfile(orig_ffn, used_ffn) + shutil.copytree(orig_prodpath, used_respath) # Copy gff file, but modify to get wrong start position orig_gff = os.path.join(orig_gpath + "-prodigalRes", "prodigal.outtest.ok.gff") used_gff = os.path.join(used_respath, "prodigal.outtest.ok.gff") @@ -420,6 +514,7 @@ def test_format_1genome_wronglst(caplog): phase, attributes])) break prod_path = GENEPATH 
+ # Generate result folders prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") @@ -427,17 +522,17 @@ def test_format_1genome_wronglst(caplog): gff_dir = os.path.join(GENEPATH, "gff3") os.makedirs(rep_dir) os.makedirs(gene_dir) + os.makedirs(prot_dir) os.makedirs(lst_dir) os.makedirs(gff_dir) - # Copy generated lstfile, but modify first line to have a difference between gff and lst starts - assert not prodigalfunc.format_one_genome(used_gpath, name, prod_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir) - # # # Check that replicon file was removed + # Check that replicon and gff files were removed assert len(os.listdir(rep_dir) ) == 0 assert len(os.listdir(gene_dir) ) == 0 assert len(os.listdir(lst_dir) ) == 0 assert len(os.listdir(gff_dir) ) == 0 + assert len(os.listdir(prot_dir) ) == 0 assert ("Files prodigal.outtest.ok.ffn and prodigal.outtest.ok.gff (in prodigal tmp_files: " "test/data/annotate/generated_by_unit-tests/original_name.fna-prodigalRes) do " "not have the same start value for gene EPKOMDHM_00001 " @@ -449,7 +544,9 @@ def test_format_1genome_wronglst(caplog): def test_format_1genome_wrongprt(caplog): """ - Test on formatting prodigal results, when the file given to prodigal was empty + Test on formatting prodigal results, when the faa file generated by prodigal does + not have as many proteins as the ffn file generated by prodigal (=lst file generated + by panacota) -> error message, -> no file generated """ @@ -459,21 +556,14 @@ def test_format_1genome_wrongprt(caplog): # path to original genome, given to prodigal for annotation orig_gpath = os.path.join(TEST_ANNOTE, "original_name.fna") + orig_prodpath = orig_gpath + "-prodigalRes" # In generated_by_tests folder, create the original genome given to prodigal # (copy from test_file) used_gpath = os.path.join(GENEPATH, "original_name.fna") used_respath = used_gpath + "-prodigalRes" - os.makedirs(used_respath) + # 
Add original genome, and prodigal results to result folder shutil.copyfile(orig_gpath, used_gpath) - # Copy ffn file generated by prodigal: - orig_ffn = os.path.join(orig_gpath + "-prodigalRes", "prodigal.outtest.ok.ffn") - used_ffn = os.path.join(used_respath, "prodigal.outtest.ok.ffn") - shutil.copyfile(orig_ffn, used_ffn) - # Copy gff file generated by prodigal: - orig_gff = os.path.join(orig_gpath + "-prodigalRes", "prodigal.outtest.ok.gff") - used_gff = os.path.join(used_respath, "prodigal.outtest.ok.gff") - shutil.copyfile(orig_gff, used_gff) - # Copy prt file, but removing first protein + shutil.copytree(orig_prodpath, used_respath) orig_faa = os.path.join(orig_gpath + "-prodigalRes", "prodigal.outtest.ok.faa") used_faa = os.path.join(used_respath, "prodigal.outtest.ok.faa") with open(orig_faa, "r") as faa, open(used_faa, "w") as faar: @@ -481,24 +571,28 @@ def test_format_1genome_wrongprt(caplog): faa.readline() for line in faa: faar.write(line) - + # Generate result folders prod_path = GENEPATH prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") gene_dir = os.path.join(GENEPATH, "Genes") gff_dir = os.path.join(GENEPATH, "gff3") - gff_dir = os.path.join(GENEPATH, "Proteins") os.makedirs(rep_dir) os.makedirs(gene_dir) os.makedirs(lst_dir) os.makedirs(gff_dir) + os.makedirs(prot_dir) # Copy generated lstfile, but modify first line to have a difference between gff and lst starts assert not prodigalfunc.format_one_genome(used_gpath, name, prod_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir) - # # # Check that replicon file was removed - # # assert len(os.listdir(rep_dir) ) == 0 + # Check that replicon file was removed + assert len(os.listdir(rep_dir) ) == 0 + assert len(os.listdir(gene_dir) ) == 0 + assert len(os.listdir(lst_dir) ) == 0 + assert len(os.listdir(gff_dir) ) == 0 + assert len(os.listdir(prot_dir) ) == 0 assert ("Protein prodigal.outtest.ok.0007b_00013 is in 
.lst file but its sequence is not in " "the protein file generated by prodigal.") in caplog.text assert ("Problems while generating .prt file (Proteins folder) for " diff --git a/test/test_unit/test_annotate/test_format_prokka.py b/test/test_unit/test_annotate/test_format_prokka.py index d9f85df90e004bb92ac070877dce3ed33dfe2874..c88b8f50a06e4d9aa08dc8d8152c1440fea70d2b 100644 --- a/test/test_unit/test_annotate/test_format_prokka.py +++ b/test/test_unit/test_annotate/test_format_prokka.py @@ -11,7 +11,7 @@ import shutil from io import StringIO import pytest -import PanACoTA.annotate_module.format_prokka as prokkafunc +from PanACoTA.annotate_module import format_prokka as prokkafunc import PanACoTA.utils as utils import test.test_unit.utilities_for_tests as tutil @@ -23,6 +23,7 @@ GENEPATH = os.path.join(ANNOTEDIR, "generated_by_unit-tests") LOGFILE_BASE = os.path.join(GENEPATH, "logfile") LOGFILES = [LOGFILE_BASE + ext for ext in [".log", ".log.debug", ".log.details", ".log.err"]] + @pytest.fixture(autouse=True) def setup_teardown_module(): """ @@ -54,7 +55,13 @@ def test_tbl_to_lst_not_changed_names(caplog): - CDS features (some with all info = ECnumber, gene name, product etc. 
; some with missing info) - tRNA type - - repeat_region type (*2) + - repeat_region type (*2) -> should be ignored in .lst + * 1 in prokka1 version (start end repeat_region + rpt_family CRISPR + score 7) + * 1 in prokka2 version (start end CRISPR + note CRISPR with x repeat units + rpt_family CRISPR) - contigs with more than 2 genes - contig with only 2 genes (both 'b' loc) - contig with 1 gene ('b' loc) @@ -278,62 +285,64 @@ def test_create_gff_error_gff(caplog): res_lst = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") gpath = "original_genome_name" assert not prokkafunc.generate_gff(gpath, gfffile, res_gff_file, res_lst, sizes, contigs) - assert ("Problem in prokka_out_gff-error.gff: ID=EPKOMDHM_00006 whereas " + assert ("Problem in prokka_out_gff-error.gff: ID=EPKOMDHM_00005 whereas " "locus_tag=toto") in caplog.text -def test_create_gen(caplog): +def test_create_gff_wrong_format(caplog): """ - Check create gen file. + Check generated gff file. The prokka output gff file has a problem (locus_tag != ID) + -> returns False with error message """ caplog.set_level(logging.DEBUG) logger = logging.getLogger("test_prodigal") - ffnfile = os.path.join(TEST_ANNOTE, "original_name.fna-prokkaRes", - "prokka_out_for_test.ffn") - lstfile = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") - res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") - assert prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_prokka.gen") - assert tutil.compare_order_content(exp_gen, res_gen_file) + gfffile = os.path.join(GENEPATH, "prokka_out_wrong_format.gff") + with open(gfffile, "w") as gfff: + gfff.write("##gff-version3\n") + gfff.write("##sequence-region bis 1 600\n") + gfff.write("JGIKIPgffgIJ Prodigal:2.6 CDS 287 787\n") + contigs = {"JGIKIPgffgIJ": "test.0417.00002.0001", + "toto": "test.0417.00002.0002", + "other_header": "test.0417.00002.0003", + "my_contig": "test.0417.00002.0004", + "bis": "test.0417.00002.0005", + 
"ter": "test.0417.00002.0006", + "contname": "test.0417.00002.0007", + } + sizes = {"test.0417.00002.0001": 84, + "test.0417.00002.0002": 103, + "test.0417.00002.0003": 122, + "test.0417.00002.0004": 35, + "test.0417.00002.0005": 198, + "test.0417.00002.0006": 128, + "test.0417.00002.0007": 85 + } + res_gff_file = os.path.join(GENEPATH, "prodigal_res.gff") + res_lst = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") + gpath = "original_genome_name" + assert not prokkafunc.generate_gff(gpath, gfffile, res_gff_file, res_lst, sizes, contigs) + assert ("Wrong format for test/data/annotate/generated_by_unit-tests/" + "prokka_out_wrong_format.gff") in caplog.text -def test_create_gen_wrong_crispr(caplog): +def test_create_gen(caplog): """ - Check create gen file, but CRISPR number in lst is not the same as - expected from ffn -> error and returns False + Check create gen file. """ caplog.set_level(logging.DEBUG) logger = logging.getLogger("test_prodigal") ffnfile = os.path.join(TEST_ANNOTE, "original_name.fna-prokkaRes", "prokka_out_for_test.ffn") - lstfile = os.path.join(TEST_ANNOTE, "test_create_gene_prokka-wrongCRISPRnum.lst") - res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") - assert not prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - assert ("Problem with CRISPR numbers in test/data/annotate/test_files/" - "test_create_gene_prokka-wrongCRISPRnum.lst. 
CRISPR >prokka_out_for_test " - "in ffn is CRISPR num 1, whereas it is annotated as CRISPR num 2 " - "in lst file.") in caplog.text - - -def test_create_gen_wrong_format(caplog): - """ - Check create gen file, but 1 header has a wrong format - -> error message and returns False - """ - caplog.set_level(logging.DEBUG) - logger = logging.getLogger("test_prodigal") - ffnfile = os.path.join(TEST_ANNOTE, "prokka_out_for_test-wrongFormat.ffn") lstfile = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") - assert not prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - assert ("Unknown header format >JGIKIPIJ-00005 in test/data/annotate/test_files/" - "prokka_out_for_test-wrongFormat.ffn.\nGen file will not be created.") in caplog.text + assert prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) + exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_prokka.gen") + assert tutil.compare_order_content(exp_gen, res_gen_file) -def test_create_gen_unknown_gene(caplog): +def test_create_gen_supgen(caplog): """ - Check create gen file, but 1 gene is present in ffn, but not in lst - -> error message and returns False + Check create gen file. But there is a gene in ffn that is not in lst -> error """ caplog.set_level(logging.DEBUG) logger = logging.getLogger("test_prodigal") @@ -341,11 +350,7 @@ def test_create_gen_unknown_gene(caplog): lstfile = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") assert not prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - assert ("Missing info for gene >sup_gene_00012 (from test/data/annotate/test_files/" - "prokka_out_for_test-supGene.ffn) in test/data/annotate/exp_files/" - "res_create_lst-prokka.lst. 
If it is actually present in the lst file, " - "check that genes are ordered by increasing number in both " - "lst and ffn files.") in caplog.text + assert ("Missing info for gene >JGIKIPIJ_03050 (from test/data/annotate/test_files/prokka_out_for_test-supGene.ffn) in test/data/annotate/exp_files/res_create_lst-prokka.lst. If it is actually present in the lst file, check that genes are ordered by increasing number in both lst and ffn files.") in caplog.text def test_create_gen_missingSeq(caplog): @@ -359,28 +364,10 @@ def test_create_gen_missingSeq(caplog): lstfile = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") assert prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_prokka-missingSeq.gen") + exp_gen = os.path.join(EXP_ANNOTE, "res_create_gene_prokka-missGene.gen") assert tutil.compare_order_content(exp_gen, res_gen_file) -def test_create_gen_missingLst(caplog): - """ - Check create gen file, but there is 1 gene in ffn which does not exist in lst - Error message and returns false - """ - caplog.set_level(logging.DEBUG) - logger = logging.getLogger("test_prodigal") - ffnfile = os.path.join(TEST_ANNOTE, "prokka_out_for_test-noLstFor1gene.ffn") - lstfile = os.path.join(EXP_ANNOTE, "res_create_lst-prokka.lst") - res_gen_file = os.path.join(GENEPATH, "prodigal_res.gen") - assert not prokkafunc.create_gen(ffnfile, lstfile, res_gen_file) - assert ("Missing info for gene >JGIKIPIJ_003018 (from test/data/annotate/test_files/" - "prokka_out_for_test-noLstFor1gene.ffn) in test/data/annotate/exp_files/" - "res_create_lst-prokka.lst. 
If it is actually present in the lst file, " - "check that genes are ordered by increasing number in both lst " - "and ffn files.") in caplog.text - - def test_create_prt(caplog): """ Check that prt file is generated as expected @@ -450,20 +437,20 @@ def test_format_1genome(caplog): name = "test.0417.00002" # path to original genome, given to prodigal for annotation gpath = os.path.join(TEST_ANNOTE, "original_name.fna") - prod_path = TEST_ANNOTE + prok_path = TEST_ANNOTE + # Create result directories prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") rep_dir = os.path.join(GENEPATH, "Replicons") gene_dir = os.path.join(GENEPATH, "Genes") gff_dir = os.path.join(GENEPATH, "gff") - os.makedirs(prot_dir) os.makedirs(lst_dir) os.makedirs(rep_dir) os.makedirs(gene_dir) os.makedirs(gff_dir) - assert prokkafunc.format_one_genome(gpath, name, prod_path, lst_dir, prot_dir, gene_dir, + assert prokkafunc.format_one_genome(gpath, name, prok_path, lst_dir, prot_dir, gene_dir, rep_dir, gff_dir) # Check output files content @@ -502,6 +489,8 @@ def test_format_1genome_emptygpath(caplog): # Create prokka result files (empty files, will not be read) gpath_prokres = gpath + "-prokkaRes" os.makedirs(gpath_prokres) + fna_prokres = os.path.join(gpath_prokres, "prokka_out_for_test.fna") + open(fna_prokres, "w").close() tbl_prokres = os.path.join(gpath_prokres, "prokka_out_for_test.tbl") open(tbl_prokres, "w").close() gff_prokres = os.path.join(gpath_prokres, "prokka_out_for_test.gff") @@ -510,7 +499,7 @@ def test_format_1genome_emptygpath(caplog): open(ffn_prokres, "w").close() faa_prokres = os.path.join(gpath_prokres, "prokka_out_for_test.faa") open(faa_prokres, "w").close() - + # Create result directories prok_path = GENEPATH prot_dir = os.path.join(GENEPATH, "Proteins") lst_dir = os.path.join(GENEPATH, "LSTINFO") @@ -542,6 +531,7 @@ def test_format_1genome_emptygpath(caplog): assert len(os.listdir(lst_dir) ) == 0 assert len(os.listdir(gff_dir) ) 
== 0 assert len(os.listdir(gen_dir) ) == 0 + # Check log assert ("Problems while generating Replicon file for prokka_out_for_test") in caplog.text @@ -566,6 +556,9 @@ def test_format_1genome_pb_tbl(caplog): ori.write(">wrongheader # 1 # 2 # 1 # toto") # Add empty prokka res gff ffn and faa files (they won't be read, as it will stop # at tbl2lst) + orig_fna = os.path.join(TEST_ANNOTE, "original_name.fna-prokkaRes", "prokka_out_for_test.fna") + fna_prokres = os.path.join(used_respath, "prokka_out_for_test.fna") + shutil.copyfile(orig_fna, fna_prokres) res_gff_file = os.path.join(used_respath, "prokka_out_for_test.gff") open(res_gff_file, "w").close() res_ffn_file = os.path.join(used_respath, "prokka_out_for_test.ffn") @@ -629,6 +622,9 @@ def test_format_1genome_pb_gff(caplog): "prokka_out_for_test.tbl") used_tbl = os.path.join(used_respath, "prokka_out_for_test.tbl") shutil.copyfile(orig_tbl, used_tbl) + orig_fna = os.path.join(orig_gpath + "-prokkaRes", "prokka_out_for_test.fna") + fna_prokres = os.path.join(used_respath, "prokka_out_for_test.fna") + shutil.copyfile(orig_fna, fna_prokres) # Create gff_file with a wrong format with open(os.path.join(used_respath, "prokka_out_for_test.gff"), "w") as ori: @@ -675,7 +671,6 @@ def test_format_1genome_pb_gff(caplog): assert ("Problems while generating .gff file for test.0417.00002") in caplog.text - def test_format_1genome_pb_ffn(caplog): """ Test on formatting prokka results, when prokka output ffn file does not have @@ -700,9 +695,12 @@ def test_format_1genome_pb_ffn(caplog): "prokka_out_for_test.gff") used_gff = os.path.join(used_respath, "prokka_out_for_test.gff") shutil.copyfile(orig_gff, used_gff) + orig_fna = os.path.join(orig_gpath + "-prokkaRes", "prokka_out_for_test.fna") + fna_prokres = os.path.join(used_respath, "prokka_out_for_test.fna") + shutil.copyfile(orig_fna, fna_prokres) # Create ffn_file with a wrong format - orig_ffn = os.path.join(TEST_ANNOTE, "prokka_out_for_test-wrongFormat.ffn") + orig_ffn = 
os.path.join(TEST_ANNOTE, "prokka_out_for_test-supGene.ffn") used_ffn = os.path.join(used_respath, "prokka_out_for_test.ffn") shutil.copyfile(orig_ffn, used_ffn) # Add empty prokka res faa file @@ -740,9 +738,12 @@ def test_format_1genome_pb_ffn(caplog): assert len(os.listdir(lst_dir) ) == 0 assert len(os.listdir(gff_dir) ) == 0 assert len(os.listdir(gen_dir) ) == 0 - assert("Unknown header format >JGIKIPIJ-00005 in test/data/annotate/generated_by_unit-tests/" - "original_name.fna-prokkaRes/prokka_out_for_test.ffn.\n" - "Gen file will not be created.") in caplog.text + assert("Missing info for gene >JGIKIPIJ_03050 (from test/data/annotate/" + "generated_by_unit-tests/original_name.fna-prokkaRes/prokka_out_for_test.ffn) " + "in test/data/annotate/generated_by_unit-tests/LSTINFO/test.0417.00002.lst. " + "If it is actually present in the lst file, " + "check that genes are ordered by increasing number in both lst and " + "ffn files.") in caplog.text assert ("Problems while generating .gen file for test.0417.00002") in caplog.text @@ -762,6 +763,9 @@ def test_format_1genome_pb_faa(caplog): os.makedirs(used_respath) shutil.copyfile(orig_gpath, used_gpath) # Copy tbl and gff files, which is as expected (tbl2lst and generate_gff must succeed) + orig_fna = os.path.join(orig_gpath + "-prokkaRes", "prokka_out_for_test.fna") + fna_prokres = os.path.join(used_respath, "prokka_out_for_test.fna") + shutil.copyfile(orig_fna, fna_prokres) orig_tbl = os.path.join(orig_gpath + "-prokkaRes", "prokka_out_for_test.tbl") used_tbl = os.path.join(used_respath, "prokka_out_for_test.tbl") diff --git a/test/test_unit/test_annotate/test_genome_func.py b/test/test_unit/test_annotate/test_genome_func.py index 779c7d011264b482fc7d05abf111765f2e6502cf..b17924218c33dc9c60616fc9ea55411ac11eec08 100755 --- a/test/test_unit/test_annotate/test_genome_func.py +++ b/test/test_unit/test_annotate/test_genome_func.py @@ -40,14 +40,16 @@ def setup_teardown_module(): - remove directory with generated results 
""" # utils.init_logger(LOGFILE_BASE, 0, 'test_postalign', verbose=1) - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield - shutil.rmtree(GENEPATH) - # for f in LOGFILES: - # if os.path.exists(f): - # os.remove(f) + shutil.rmtree(GENEPATH, ignore_errors=True) print("teardown") @@ -125,7 +127,7 @@ def test_split_contig_nocut(): """ pat = None whole_seq = "AACTGCTTTTTAAGCGCGCTCCTGCGNNNNNGGTTGTGTGGGCCCAGAGCGAGNCG" - cur_contig_name = ">my_contig_name_for_my_sequence" + cur_contig_name = ">my_contig name for my_sequence" contig_sizes = {"contig_1": 10} resfile = os.path.join(GENEPATH, "test_split_contig_nocut.fna") gresf = open(resfile, "w") @@ -149,7 +151,7 @@ def test_split_contig_cut(): """ pat = "NNN+" whole_seq = "AACTGCTTTTTAAGCGCGCTCCTGCGNNNNNGGTTGTGTGGGCCCAGAGCGAGNCG" - cur_contig_name = ">my_contig_name_for_my_sequence" + cur_contig_name = ">my_contig_name for_my_sequence" contig_sizes = {">contig_1": 10} resfile = os.path.join(GENEPATH, "test_split_contig_nocut.fna") gresf = open(resfile, "w") @@ -195,7 +197,7 @@ def test_format_contig_cut(): cut = True pat = 'NNNNN+' cur_seq = "AACTGCTTTTTAAGCGCGCTCCTGCGNNNNNGGTTGTGTGGGCCCAGAGCGAGNCG" - cur_contig_name = ">my_contig_name_for_my_sequence" + cur_contig_name = ">my_contig_name for_my_sequence" contig_sizes = {} resfile = os.path.join(GENEPATH, "test_format_cont_cut5N.fna") gresf = open(resfile, "w") @@ -208,38 +210,36 @@ def test_format_contig_cut(): exp_file = os.path.join(EXP_DIR, "exp_split_contig_cut3N.fna") assert os.path.exists(resfile) assert tutil.compare_order_content(resfile, exp_file) - assert contig_sizes == {">my_contig_name_for_my_sequence_2\n": 26, - ">my_contig_name_for_my_sequence_3\n": 25} + assert contig_sizes == {">2_my_contig_name for_my_sequence\n": 26, + ">3_my_contig_name for_my_sequence\n": 25} def test_format_contig_nocut(): """ - For a given contig, if 
we want to annotate it with prokka, and do not cut at each stretch of + For a given contig, if we want to annotate it with prokka, and do not cut at each stretch of 5 'N'check that it writes this contig as given """ cut = False pat = None cur_seq = "AACTGCTTTTTAAGCGCGCTCCTGCGNNNNNGGTTGTGTGGGCCCAGAGCGAGNCG" - cur_contig_name = ">my_contig_name_for_my_sequence" + cur_contig_name = ">my_contig_name_for_my_sequence\n" contig_sizes = {} resfile = os.path.join(GENEPATH, "test_format_cont_nocut_prokka.fna") - gresf = open(resfile, "w") + gresf = None num = 2 assert gfunc.format_contig(cut, pat, cur_seq, cur_contig_name, contig_sizes, gresf, - num, logger=None) == 3 - gresf.close() + num, logger=None) == 2 exp_file = os.path.join(EXP_DIR, "exp_split_contig_nocut.fna") - assert os.path.exists(resfile) - assert tutil.compare_order_content(resfile, exp_file) - assert contig_sizes == {">my_contig_name_for_my_sequence_2\n": 56} + assert not os.path.exists(resfile) + assert contig_sizes == {">my_contig_name_for_my_sequence\n": 56} -def test_format_contig_nocut_prodigal_notSameName(): +def test_format_contig_nocut_notDuplicateName(): """ - For a given contig, if we want to annotate it with prodigal, and do not cut, - then we keep the same file (no need to split at 20 characters) + For a given contig, if we want to annotate it with prodigal, and do not cut, + then we keep the same file (no need to split at 20 characters) However, we must check that contig names are all different. Add 2 contigs, to be sure the 'num' parameter is not increased. """ @@ -262,7 +262,7 @@ def test_format_contig_nocut_prodigal_notSameName(): ">mycontig": 155} -def test_format_contig_nocut_prodigal_SameName(caplog): +def test_format_contig_nocut_DuplicateName(caplog): """ For a given contig, if we want to annotate it with prodigal, and do not cut, then we keep the same file. However, we must check that contig names are all different. 
Try to add a contig which name is already used, check that it prints the expected error, @@ -400,7 +400,7 @@ def test_analyse1genome_nocut_prodigal(): def test_analyse1genome_cut_prodigal(): ''' Analyse the given genome, cutting at stretches of 5N, in order to annotate it - Create new genome file in outdir, calculate genome size, nb contigs and L90, and add it + Create new genome file in outdir, calculate genome size, nb contigs and L90, and add it to the genomes dict, as well as the path to the genome file. ''' gs = ["genome1.fasta", "genome2.fasta", "genome3.fasta"] @@ -429,8 +429,8 @@ def test_analyse1genome_cut_prodigal(): def test_analyse1genome_cut_prokka(): ''' Analyse the given genome, cutting at stretches of 5N, in order to annotate it with prokka - Create new genome file in outdir, with shortened contig names, calculate genome size, - nb contigs and L90, and add it + Create new genome file in outdir, with shortened contig names, calculate genome size, + nb contigs and L90, and add it to the genomes dict, as well as the path to the genome file. ''' gs = ["genome1.fasta", "genome2.fasta", "genome3.fasta"] @@ -460,7 +460,7 @@ def test_analyse1genome_cut_same_names(): """ Analyse a genome. Its contig names all have the same first 20 characters. There is no stretch of at least 5N, so contigs are not split. - New contig names should be uniq, and not all ending with _0! + New contig names should be uniq, and not all starting with '1_'! """ genome = "genome_long_header.fst" genomes = {genome: ["SAEN.1015.0117"]} @@ -485,7 +485,7 @@ def test_analyse1genome_same_names_nocut(caplog): genomes = {genome: ["SAEN.1015.0117"]} cut = False pat = None - assert not gfunc.analyse_genome(genome, GEN_PATH, GENEPATH, cut, pat, genomes, + assert not gfunc.analyse_genome(genome, GEN_PATH, GENEPATH, cut, pat, genomes, "prodigal", logger) assert ("myheader contig name is used for several contigs. Please put different names for " "each contig. 
This genome will be ignored") in caplog.text @@ -501,7 +501,7 @@ def test_analyse1genome_same_last_name_nocut(caplog): genomes = {genome: ["SAEN.1015.0117"]} cut = False pat = None - assert not gfunc.analyse_genome(genome, GEN_PATH, GENEPATH, cut, pat, genomes, + assert not gfunc.analyse_genome(genome, GEN_PATH, GENEPATH, cut, pat, genomes, "prodigal", logger) assert ("myheader contig name is used for several contigs. Please put different names for " "each contig. This genome will be ignored") in caplog.text @@ -509,7 +509,7 @@ def test_analyse1genome_same_last_name_nocut(caplog): def test_analyse1genome_nofile(caplog): ''' - Test that when we ask to analyse a genome whose sequence file does not exist, it returns false + Test that when we ask to analyse a genome whose sequence file does not exist, it returns false with corresponding error message. ''' caplog.set_level(logging.DEBUG) @@ -527,7 +527,7 @@ def test_analyse1genome_nofile(caplog): def test_analyse1genome_empty(caplog): ''' - Test that when we ask to analyse a genome whose sequence file does not exist, it returns false + Test that when we ask to analyse a genome whose sequence file does not exist, it returns false with corresponding error message. 
''' caplog.set_level(logging.DEBUG) @@ -592,7 +592,7 @@ def test_analyse_all_genomes_cut(caplog): gs[1]: ["SAEN.1114", gpaths[1], opaths[1], 51, 6, 5], gs[2]: ["ESCO.0416", gpaths[2], opaths[2], 70, 4, 1]} assert exp_genomes == genomes - assert ("Cutting genomes at each time there are at least 3 'N' in a row, " + assert ("Cutting genomes at each time there are at least 3 'N' in a row, " "and then, calculating genome size, number of contigs and L90.") in caplog.text @@ -654,7 +654,7 @@ def test_analyse_all_genomes_cut_empty(caplog): gs[1]: ["SAEN.1114", gpaths[1], opaths[1], 51, 6, 5], gs[3]: ["ESCO.0123", gpaths[3], opaths[3], 70, 4, 1]} assert exp_genomes == genomes - assert ("Cutting genomes at each time there are at least 3 'N' in a row, " + assert ("Cutting genomes at each time there are at least 3 'N' in a row, " "and then, calculating genome size, number of contigs and L90.") in caplog.text assert ("Your file test/data/annotate/genomes/empty.fasta " "does not contain any gene. Please check that you really gave a " @@ -679,7 +679,7 @@ def test_analyse_all_genomes_noseq(caplog): # Run analysis with pytest.raises(SystemExit): gfunc.analyse_all_genomes(genomes, "toto", GENEPATH, nbn, "prokka", logger, quiet=True) - assert ("No genome was found in the database folder toto. See logfile " + assert ("No genome was found in the database folder toto. 
See logfile " "for more information.") in caplog.text diff --git a/test/test_unit/test_prepare/test_download.py b/test/test_unit/test_prepare/test_download.py index 4e7a86758ebc0ef684c87522fffb78e08185e455..58525032cd163b545e7341e5e238c706fdf9faee 100755 --- a/test/test_unit/test_prepare/test_download.py +++ b/test/test_unit/test_prepare/test_download.py @@ -14,6 +14,33 @@ import PanACoTA.prepare_module.download_genomes_func as downg DATA_TEST_DIR = os.path.join("test", "data", "prepare") +GENEPATH = os.path.join(DATA_TEST_DIR, "generated_by_unit-tests") + + +@pytest.fixture(autouse=True) +def setup_teardown_module(): + """ + Remove log files at the end of this test module + + Before each test: + - init logger + - create directory to put generated files + + After: + - remove all log files + - remove directory with generated results + """ + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) + print("setup") + + yield + shutil.rmtree(GENEPATH, ignore_errors=True) + print("teardown") def test_to_database(): @@ -38,7 +65,6 @@ def test_to_database(): assert os.path.isfile(os.path.join(db_dir, "ACOR002.0519.fna")) assert os.path.isfile(os.path.join(db_dir, "ACOR003.0519.fna")) - # Remove database created shutil.rmtree(db_dir) @@ -49,11 +75,12 @@ def test_to_database_nofolder_refseq(caplog): """ caplog.set_level(logging.DEBUG) with pytest.raises(SystemExit): - downg.to_database(DATA_TEST_DIR) + downg.to_database(GENEPATH) assert "ERROR" in caplog.text assert ("The folder containing genomes downloaded from NCBI refseq " - "(test/data/prepare/refseq/bacteria) does not exist.") in caplog.text + "(test/data/prepare/generated_by_unit-tests/refseq/bacteria) " + "does not exist.") in caplog.text assert ("Check that you really downloaded sequences (fna.gz) and that they are " "in this folder") in caplog.text @@ -63,52 +90,45 @@ def test_to_database_nofolder_per_genome(caplog): Test behavior 
when the folder refseq/bacteria exists, but there are no folders inside -> should exit with error message """ - empty_dir = os.path.join(DATA_TEST_DIR, "refseq", "bacteria") + empty_dir = os.path.join(GENEPATH, "refseq", "bacteria") os.makedirs(empty_dir) caplog.set_level(logging.DEBUG) with pytest.raises(SystemExit): - downg.to_database(DATA_TEST_DIR) + downg.to_database(GENEPATH) # Check error message is as expected assert "ERROR" in caplog.text assert ("The folder supposed to contain genomes downloaded from NCBI refseq " - "(test/data/prepare/refseq/bacteria) exists but is empty") in caplog.text + "(test/data/prepare/generated_by_unit-tests/refseq/bacteria) " + "exists but is empty") in caplog.text assert ("Check that you really downloaded sequences (fna.gz)") in caplog.text - # Remove files/folders specific to test - shutil.rmtree(os.path.join(DATA_TEST_DIR, "refseq")) - def test_to_database_1empty_genome_folder(caplog): """ Test behavior when the folder refseq/bacteria exists, there are subfolders inside, but 1 of them is empty: warning message informing that this genome will be ignored """ - out_dir = os.path.join(DATA_TEST_DIR, "genomes") - gz_genomes_folder = os.path.join(out_dir, "refseq", "bacteria") + caplog.set_level(logging.DEBUG) + out_dir = os.path.join(GENEPATH, "genomes") + refseq_dir = os.path.join(DATA_TEST_DIR, "genomes") + # Copy content of refseq in genomes test data to output folder that will be used + shutil.copytree(refseq_dir, out_dir) # Empty 1 directory: move its file to 'out_dir' - to_move_filename = "ACOR002.0519.fna.gz" # File that must be moved - to_empty_dir = "ACOR002" # Directory containing file to move - to_move_file = os.path.join(gz_genomes_folder, to_empty_dir, to_move_filename) - shutil.move(to_move_file, os.path.join(out_dir, to_move_filename)) - + to_remove = os.path.join(out_dir, "refseq", "bacteria", "ACOR003", "ACOR003.0519.fna.gz") + os.remove(to_remove) # Run to_database nb_gen, db_dir = downg.to_database(out_dir) 
assert nb_gen == 2 assert db_dir == os.path.join(out_dir, "Database_init") # Check that a warning message was raised, indicating that genome is ignored - caplog.set_level(logging.DEBUG) assert "WARNING" in caplog.text - assert ("Problem with genome in ACOR002: no compressed fasta file downloaded. " + assert ("Problem with genome in ACOR003: no compressed fasta file downloaded. " "This genome will be ignored.") in caplog.text - assert not os.path.isfile(os.path.join(db_dir, "ACOR002.0519.fna")) + assert not os.path.isfile(os.path.join(db_dir, "ACOR003.0519.fna")) assert os.path.isfile(os.path.join(db_dir, "ACOR001.0519.fna")) - assert os.path.isfile(os.path.join(db_dir, "ACOR003.0519.fna")) - - # Remove files/folders specific to test - shutil.move(os.path.join(out_dir, to_move_filename), to_move_file) - shutil.rmtree(db_dir) + assert os.path.isfile(os.path.join(db_dir, "ACOR002.0519.fna")) def test_to_database_several_genomes(caplog): @@ -117,13 +137,15 @@ def test_to_database_several_genomes(caplog): but 1 of them contains more than 1 genome: warning message informing that this genome will be ignored """ - out_dir = os.path.join(DATA_TEST_DIR, "genomes") - gz_genomes_folder = os.path.join(out_dir, "refseq", "bacteria") + out_dir = os.path.join(GENEPATH, "genomes") + refseq_dir = os.path.join(DATA_TEST_DIR, "genomes") + # Copy content of refseq in genomes test data to output folder that will be used + shutil.copytree(refseq_dir, out_dir) # Create a new gz file in one of the genome directories to_create_filename = "ACOR002.0519.bis.fna.gz" # Name of file that must be created to_fill_dir = "ACOR002" # Directory containing file to create - to_create_path = os.path.join(gz_genomes_folder, to_fill_dir, to_create_filename) + to_create_path = os.path.join(out_dir, "refseq", "bacteria", to_fill_dir, to_create_filename) # Create empty gz file open(to_create_path, "w").close() @@ -141,29 +163,27 @@ def test_to_database_several_genomes(caplog): assert 
os.path.isfile(os.path.join(db_dir, "ACOR001.0519.fna")) assert os.path.isfile(os.path.join(db_dir, "ACOR003.0519.fna")) - # Remove test files/folders - os.remove(to_create_path) - shutil.rmtree(db_dir) - def test_to_database_1genome_wrong_format(caplog): """ Test behavior when the folder refseq/bacteria exists, there is 1 genome per subfolder, but 1 genome cannot be unzipped """ - out_dir = os.path.join(DATA_TEST_DIR, "genomes") - gz_genomes_folder = os.path.join(out_dir, "refseq", "bacteria") + # out_dir = os.path.join(DATA_TEST_DIR, "genomes") + # gz_genomes_folder = os.path.join(out_dir, "refseq", "bacteria") + + out_dir = os.path.join(GENEPATH, "genomes") + refseq_dir = os.path.join(DATA_TEST_DIR, "genomes") + # Copy content of refseq in genomes test data to output folder that will be used + shutil.copytree(refseq_dir, out_dir) # Name of directory directly containing the original gz file to_corrupt_dir = "ACOR001" - # Name of original gz file that must be moved to be saved - to_empty_filename = "ACOR001.0519.fna.gz" - # Complete path to this original gz file - to_empty_path = os.path.join(gz_genomes_folder, to_corrupt_dir, to_empty_filename) # - # copy real gz genome file to outdir to save it, and create a fake one in place of it - shutil.copy(to_empty_path, os.path.join(out_dir, to_empty_filename)) + to_corrupt_filename = "ACOR001.0519.fna.gz" + to_corrupt_path = os.path.join(out_dir, "refseq", "bacteria", to_corrupt_dir, + to_corrupt_filename) # Create fake gz file (txt file) - false_gz = open(to_empty_path, "w") + false_gz = open(to_corrupt_path, "w") false_gz.write("This is not a gz file") false_gz.close() @@ -176,22 +196,18 @@ def test_to_database_1genome_wrong_format(caplog): caplog.set_level(logging.DEBUG) assert "ERROR" in caplog.text assert ("Error while trying to uncompress " - "test/data/prepare/genomes/Database_init/ACOR001.0519.fna.gz. " + "test/data/prepare/generated_by_unit-tests/genomes/Database_init/ACOR001.0519.fna.gz. 
" "This genome will be ignored") in caplog.text # Check that there are only 2 files in the database, and that they correspond # to uncompressed gz files list_db = os.listdir(db_dir) assert len(list_db) == 2 - assert not os.path.isfile(os.path.join(db_dir, to_empty_filename)) + assert not os.path.isfile(os.path.join(db_dir, to_corrupt_filename)) assert os.path.isfile(os.path.join(db_dir, "ACOR002.0519.fna")) assert os.path.isfile(os.path.join(db_dir, "ACOR003.0519.fna")) - # Remove test files/Folders - shutil.move(os.path.join(out_dir, to_empty_filename), to_empty_path) - shutil.rmtree(db_dir) - -def test_download(): +def test_download_specify_level(): """ Test that, given a taxid, and a species name, it downloads genomes in .gz, and uncompress them in the @@ -202,14 +218,16 @@ def test_download(): species_linked = "Acetobacter_orleanensis" NCBI_species = "Acetobacter orleanensis" NCBI_taxid = "104099" - outdir = os.path.join(DATA_TEST_DIR, "test_download_refseq") + outdir = os.path.join(GENEPATH, "test_download_refseq") threads = 1 + levels = "" - db_dir, nb_gen = downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, - outdir, threads) + db_dir, nb_gen = downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, levels, + outdir, threads) # Check path to uncompressed files is as expected assert db_dir == os.path.join(outdir, "Database_init") - # Check number of genomes downloaded. We cannot know the exact value, as it is updated everyday. But in nov. 2019, there are 4 genomes. So, there must be at least those 4 genomes + # Check number of genomes downloaded. We cannot know the exact value, as it is updated + # everyday. But in nov. 2019, there are 4 genomes. 
So, there must be at least those 4 genomes assert nb_gen >= 4 # And that db_dir exists and contains nb_gen files assert os.path.isdir(db_dir) @@ -218,15 +236,35 @@ def test_download(): # Check that assembly summary file wwas donwloaded as expected sum_file = os.path.join(outdir, "assembly_summary-Acetobacter_orleanensis.txt" ) assert os.path.isfile(sum_file) + # Check number of genomes in summary file, and how many with scaffold or complete + # assembly level -> will check that when asking only for those levels, we get the same number + other = 0 + scaf = 0 + comp = 0 + with open(sum_file, "r") as sf: + sf.readline() # skip header + for line in sf: + if "complete" in line.split("\t")[13].lower(): + comp += 1 + elif "scaffold" in line.split("\t")[13].lower(): + scaf += 1 + else: + other += 1 + assert other + scaf + comp == nb_gen # Check that the NCBI_genome_download output directory exists ngd_outdir = os.path.join(outdir, "refseq", "bacteria") # And that it contains folders assert os.path.isdir(ngd_outdir) - assert len(os.listdir(ngd_outdir)) >= 3 + assert len(os.listdir(ngd_outdir)) >= 4 - # Remove test ouput dir - shutil.rmtree(outdir) + # Re-run, but only asking for complete and scaffold + outdir2 = os.path.join(GENEPATH, "test_download_refseq_only-scaf") + levels2 = "scaffold,complete" + db_dir2, nb_gen2 = downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, + levels2, outdir2, threads) + assert scaf + comp == nb_gen2 + assert db_dir2 == os.path.join(outdir2, "Database_init") def test_download_noSpeName(): @@ -239,10 +277,11 @@ def test_download_noSpeName(): species_linked = "toto" NCBI_species = None NCBI_taxid = "104099" - outdir = os.path.join(DATA_TEST_DIR, "test_download_refseq_noSpe") + outdir = os.path.join(GENEPATH, "test_download_refseq_noSpe") threads = 1 + levels = "" - db_dir, nb_gen = downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, + db_dir, nb_gen = downg.download_from_refseq(species_linked, NCBI_species, 
NCBI_taxid, levels, outdir, threads) # Check path to uncompressed files is as expected @@ -261,9 +300,7 @@ def test_download_noSpeName(): ngd_outdir = os.path.join(outdir, "refseq", "bacteria") # And that it contains folders assert os.path.isdir(ngd_outdir) - assert len(os.listdir(ngd_outdir)) >= 3 - # Remove test ouput dir - shutil.rmtree(outdir) + assert len(os.listdir(ngd_outdir)) >= 4 def test_download_wrongTaxID(caplog): @@ -275,10 +312,11 @@ def test_download_wrongTaxID(caplog): species_linked = "Acetobacter_orleanensis" NCBI_species = None NCBI_taxid = "10409" - outdir = os.path.join(DATA_TEST_DIR, "test_download_refseq_wrongTaxID") + outdir = os.path.join(GENEPATH, "test_download_refseq_wrongTaxID") threads = 1 + levels = "" with pytest.raises(SystemExit): - downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, + downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, levels, outdir, threads) # Check path to uncompressed files does not exist @@ -309,10 +347,11 @@ def test_download_diffSpeTaxID(caplog): species_linked = "Acetobacter_orleanensis" NCBI_species = "Acetobacter fabarum" NCBI_taxid = "104099" - outdir = os.path.join(DATA_TEST_DIR, "test_download_refseq_wrongTaxID") + outdir = os.path.join(GENEPATH, "test_download_refseq_wrongTaxID") threads = 1 + levels = "" with pytest.raises(SystemExit): - downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, + downg.download_from_refseq(species_linked, NCBI_species, NCBI_taxid, levels, outdir, threads) # Check path to uncompressed files does not exist diff --git a/test/test_unit/test_utils-argparse.py b/test/test_unit/test_utils-argparse.py new file mode 100644 index 0000000000000000000000000000000000000000..fb2a35cc3b940a22f2ddd0e41261ba6d41189c65 --- /dev/null +++ b/test/test_unit/test_utils-argparse.py @@ -0,0 +1,135 @@ +#!/usr/bin/env python3 +# coding: utf-8 + +""" +Unit tests for the functions of utils-argparse.py dealing with checking arguments given to argparse 
+""" + +import logging +import os +import pytest +import shutil +import argparse +import multiprocessing + +import PanACoTA.utils_argparse as autils + + +def test_gen_name(): + """ + Test that, when giving a gene name, if it does not have 4 characters (letters or num), + it returns an error message + """ + assert autils.gen_name("TOTO") == "TOTO" + assert autils.gen_name("1234") == "1234" + assert autils.gen_name("T1O2") == "T1O2" + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.gen_name("a long name") + assert ("The genome name must contain 4 characters. For example, this name " + "can correspond to the 2 first letters of genus, and 2 first letters of " + "species, e.g. ESCO for Escherichia Coli") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.gen_name("-gdd") + assert ("The genome name must contain 4 characters. For example, this name can correspond " + "to the 2 first letters of genus, and 2 first letters of species, e.g. " + "ESCO for Escherichia Coli") in str(err.value) + + +def test_date_name(capsys): + """ + Test that when a date is given, it returns expected message + """ + assert autils.date_name("0920") == "0920" + assert autils.date_name("se20") == "se20" + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.date_name("september 2020") + assert ("The date must contain 4 characters. 
Usually, it contains 4 digits, " + "corresponding to the month (2 digits) and year (2 digits)") in str(err.value) + + +def test_get_date(): + """ + test that it returns current date + """ + import time + t = time.strftime("%m%y") + assert autils.get_date() == t + + +def test_cont_num(): + """ + Test that given value of contig number is valid + """ + assert autils.cont_num(10) == 10 + with pytest.raises(argparse.ArgumentTypeError) as raised_err: + autils.cont_num("-2") + assert ("The maximum number of contigs allowed must be a " + "positive number") in str(raised_err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.cont_num("10000") + assert ("We do not support genomes with more than 9999 contigs") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.cont_num("a") + assert ("argument --nbcont: invalid int value: a") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + autils.cont_num("1.1") + assert ("argument --nbcont: invalid int value: 1.") in str(err.value) + + +def test_thread_num(): + """ + Test that given number of threads is as expected + """ + assert autils.thread_num("1") == 1 + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.thread_num("1.1") + assert ("argument --threads threads: invalid int value: 1.1") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.thread_num("a") + assert ("argument --threads threads: invalid int value: a") in str(err.value) + nb_cpu = multiprocessing.cpu_count() + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.thread_num(str(nb_cpu*2)) + assert (f"You have {nb_cpu} threads on your computer, you cannot ask for more: invalid value: " + f"{nb_cpu*2}") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.thread_num("-1") + assert ("Please provide a positive number of threads (or 0 for all threads): " + "Invalid value: -1") in str(err.value) + 
assert autils.thread_num(0) == nb_cpu + + +def test_positive_int(): + """ + Test checking that given argument is a positive integer + """ + assert autils.positive_int("1") == 1 + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.positive_int("1.1") + assert ("argument --cutn: invalid int value: '1.1'") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.positive_int("-1") + assert ("error: argument --cutn must be a positive integer: " + "invalid int value: '-1'") in str(err.value) + + +def test_mash_dist(): + """ + Test checking that given value is ok for a mash distance + """ + assert autils.mash_dist("0.05") == 0.05 + assert autils.mash_dist("1e-4") == 0.0001 + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.mash_dist("1.1.1") + assert ("error: mash distance: invalid float value: '1.1.1'") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.mash_dist("one") + assert ("error: mash distance: invalid float value: 'one'") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.mash_dist("1.000001") + assert ("error: mash distance must be between 0 and 1: " + "invalid value: '1.000001'") in str(err.value) + with pytest.raises(argparse.ArgumentTypeError) as err: + a = autils.mash_dist("-1e-4") + assert ("error: mash distance must be between 0 and 1: " + "invalid value: '-0.0001'") in str(err.value) diff --git a/test/test_unit/test_utils-logging.py b/test/test_unit/test_utils-logging.py index 0f093f93fcb4b9557267740cb1c17f41823141c9..8c59c708d49372ab32d7316040cf6c8d553b1422 100755 --- a/test/test_unit/test_utils-logging.py +++ b/test/test_unit/test_utils-logging.py @@ -20,11 +20,16 @@ def setup_teardown_module(): """ # Init logger to level detail (15) # utils.init_logger(LOGFILE_BASE, logging.DEBUG, 'test_utils', verbose=1) - os.mkdir(GENEPATH) + if os.path.isdir(GENEPATH): + content = os.listdir(GENEPATH) + for f in content: + 
assert f.startswith(".fuse") + else: + os.mkdir(GENEPATH) print("setup") yield - shutil.rmtree(GENEPATH) + shutil.rmtree(GENEPATH, ignore_errors=True) print("teardown") @@ -288,7 +293,9 @@ def test_logger_info_verbose1(capsys): assert "info warning" in err assert "info error" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") @@ -322,7 +329,9 @@ def test_logger_info_verbose2(capsys): assert "info warning" in err assert "info error" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") @@ -354,7 +363,9 @@ def test_logger_warning(capsys): assert "info info" in out assert "info error" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") @@ -387,7 +398,9 @@ def test_logger_warning_verbose1(capsys): assert "info error" in err assert "info warning" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") @@ -421,7 +434,9 
@@ def test_logger_warning_verbose2(capsys): assert "info error" in err assert "info warning" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") @@ -454,7 +469,9 @@ def test_logger_critical(capsys): assert "info info" in out assert "info error" in err assert "info critical" in err - assert len(os.listdir(GENEPATH)) == 2 + files = os.listdir(GENEPATH) + files = [f for f in files if "fuse" not in f] + assert len(files) == 2 with open(logfile + ".log", "r") as logf: assert logf.readline().endswith(" :: INFO :: info info\n") assert logf.readline().endswith(" :: WARNING :: info warning\n") diff --git a/test/test_unit/test_utils.py b/test/test_unit/test_utils.py index a1a7970765f62efa48d05532ba63b7b9efc513d4..cd653d4ed87a32ff1d392d4e8e872f3938454942 100755 --- a/test/test_unit/test_utils.py +++ b/test/test_unit/test_utils.py @@ -17,6 +17,7 @@ matplotlib.use('AGG') # Define variables used by several tests DATA_DIR = os.path.join("test", "data", "annotate") +TEST_DIR = os.path.join(DATA_DIR, "test_files") BASELINE_DIR = os.path.abspath(os.path.join(DATA_DIR, "exp_files", "baseline")) GENEPATH = os.path.join(DATA_DIR, "generated_by_unit-tests") LOGFILE_BASE = "test_prokka" @@ -659,8 +660,8 @@ def test_read_genomes_info_no_genomes(caplog): utils.read_genomes_info(lstinfo_file, name) assert ("Reading given information on your genomes in " "test/data/annotate/test_files/lstinfo-no-genome.lst") in caplog.text - assert ("no genome listed in test/data/annotate/test_files/lstinfo-no-genome.lst " - "were found.") in caplog.text + assert ("No genome listed in test/data/annotate/test_files/lstinfo-no-genome.lst " + "was found.") in caplog.text def test_read_genomes_info_ok(caplog): @@ -918,6 
+919,52 @@ def test_rename_contigs(): assert utilities.compare_order_content(outfile, exp_file) +def test_rename_contigs_empty_fasta(caplog): + """ + From an empty fasta file, ask to rename contigs. Should return empty tuple of dict, and error + message. + """ + logger = logging.getLogger("default") + gpath = os.path.join(GENEPATH, "empty.fasta") + # Create empty fasta file + open(gpath, "w").close() + gembase_name = "ESCO.0216.00005" + outfile = os.path.join(GENEPATH, "H299_H561.fasta-short-contig.fna") + exp_file = os.path.join(DATA_DIR, "exp_files", "res_H299_H561-ESCO00005.fna") + contigs, sizes = utils.get_genome_contigs_and_rename(gembase_name, gpath, outfile, logger) + assert contigs == {} + assert sizes == {} + # Check that outfile is empty + with open(outfile, "r") as of: + assert len(of.readlines()) == 0 + # Check error message + assert ("Your genome test/data/annotate/generated_by_unit-tests/empty.fasta does " + "not contain any sequence, or is not in fasta format") in caplog.text + + +def test_rename_contigs_non_fasta(caplog): + """ + From an file which is not empty, but not in fasta format (no headers starting with '>'), + check that contigs, sizes and outfile are empty, and error message is ok + """ + logger = logging.getLogger("default") + gpath = os.path.join(TEST_DIR, "non-fasta.seq") + # Create empty fasta file + open(gpath, "w").close() + gembase_name = "ESCO.0216.00005" + outfile = os.path.join(GENEPATH, "H299_H561.fasta-short-contig.fna") + exp_file = os.path.join(DATA_DIR, "exp_files", "res_H299_H561-ESCO00005.fna") + contigs, sizes = utils.get_genome_contigs_and_rename(gembase_name, gpath, outfile, logger) + assert contigs == {} + assert sizes == {} + # Check that outfile is empty + with open(outfile, "r") as of: + assert len(of.readlines()) == 0 + # Check error message + assert ("Your genome test/data/annotate/test_files/non-fasta.seq does " + "not contain any sequence, or is not in fasta format") in caplog.text + + def 
test_rename_contigs_duplicate(caplog): """ From a given sequence, there are 2 contigs named "contig2". Stops and returns false