# HG changeset patch # User tduigou # Date 1754467378 0 # Node ID 4bde3e90ee9857ada445115f0ee897657befc237 planemo upload for repository https://github.com/Edinburgh-Genome-Foundry/Plateo commit 98d5e65b8008dbca117b2e0655cfdd54655fac48-dirty diff -r 000000000000 -r 4bde3e90ee98 CreateAssemblyPicklists_script.py --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/CreateAssemblyPicklists_script.py Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,588 @@ +#!/usr/bin/env python +# coding: utf-8 +# Code copied from CUBA backend tools.py and create_assembly_picklists/CreateAssemblyPicklistsView.py +# Code modified for running in a script in Galaxy. +############################################################################## +############################################################################## +# App code +## EGF Galaxy Create assembly picklists -- script + +############################################################################## +# IMPORTS +import argparse +import os +from io import StringIO, BytesIO +import re +from base64 import b64encode, b64decode +from copy import deepcopy +import sys + +from collections import OrderedDict +from fuzzywuzzy import process +import matplotlib.pyplot as plt +from matplotlib.backends.backend_pdf import PdfPages +import pandas + +from Bio import SeqIO +from Bio.SeqRecord import SeqRecord +from Bio.Seq import Seq + +import bandwagon as bw +import crazydoc +from dnachisel.biotools import sequence_to_biopython_record +import dnacauldron +import flametree +from plateo import AssemblyPlan +from plateo.parsers import plate_from_content_spreadsheet +from plateo.containers import Plate4ti0960 +from plateo.exporters import AssemblyPicklistGenerator, picklist_to_assembly_mix_report +from plateo.exporters import ( + picklist_to_labcyte_echo_picklist_file, + picklist_to_tecan_evo_picklist_file, + plate_to_platemap_spreadsheet, + PlateTextPlotter, +) +from plateo.tools import human_volume +from snapgene_reader import snapgene_file_to_seqrecord + + +############################################################################## +# FUNCTIONS + +def fix_and_rename_paths(paths): + fixed_paths = [] + for path in paths: + new_path = path.replace("__sq__", "'") + if new_path != path: + os.rename(path, new_path) + fixed_paths.append(new_path) + return fixed_paths + + +def did_you_mean(name, other_names, limit=5, min_score=50): # test + results = process.extract(name, list(other_names), limit=limit) + return [e for (e, score) in results if score >= min_score] + + +def fix_ice_genbank(genbank_txt): + lines = genbank_txt.splitlines() + lines[0] += max(0, 80 - len(lines[0])) * " " + return "\n".join(lines) + + +def write_record(record, target, fmt="genbank"): + """Write a record as genbank, fasta, etc. via Biopython, with fixes""" + record = deepcopy(record) + if fmt == "genbank": + if isinstance(record, (list, tuple)): + for r in record: + r.name = r.name[:20] + else: + record.name = record.name[:20] + if hasattr(target, "open"): + target = target.open("w") + SeqIO.write(record, target, fmt) + + +def autoname_genbank_file(record): + return record.id.replace(".", "_") + ".gb" + + +def string_to_records(string): + """Convert a string of a fasta, genbank... into a simple ATGC string. + + Can also be used to detect a format. + """ + matches = re.match("([ATGC][ATGC]*)", string) + # print("============", len(matches.groups()[0]), len(string)) + # print (matches.groups()[0] == string) + if (matches is not None) and (matches.groups()[0] == string): + return [SeqRecord(Seq(string))], "ATGC" + + for fmt in ("fasta", "genbank"): + if fmt == "genbank": + string = fix_ice_genbank(string) + try: + stringio = StringIO(string) + records = list(SeqIO.parse(stringio, fmt)) + if len(records) > 0: + return (records, fmt) + except: + pass + try: + record = snapgene_file_to_seqrecord(filecontent=StringIO(string)) + return [record] + except: + pass + raise ValueError("Invalid sequence format") + + +def file_to_filelike_object(file_, type="byte"): + content = file_.content.split("base64,")[1] + filelike = BytesIO if (type == "byte") else StringIO + return filelike(b64decode(content)) + + +def spreadsheet_file_to_dataframe(filedict, header="infer"): + filelike = file_to_filelike_object(filedict) + if filedict.name.endswith(".csv"): + return pandas.read_csv(filelike, header=header) + else: + return pandas.read_excel(filelike, header=header) + + +def records_from_zip_file(zip_file, use_file_names_as_ids=False): + zip_name = zip_file.name + zip_file = flametree.file_tree(file_to_filelike_object(zip_file)) + records = [] + for f in zip_file._all_files: + ext = f._extension.lower() + if ext in ["gb", "gbk", "fa", "dna"]: + try: + new_records, fmt = string_to_records(f.read()) + if not isinstance(new_records, list): + new_records = [new_records] + except: + content_stream = BytesIO(f.read("rb")) + try: + record = snapgene_file_to_seqrecord(fileobject=content_stream) + new_records, fmt = [record], "snapgene" + except: + try: + parser = crazydoc.CrazydocParser( + ["highlight_color", "bold", "underline"] + ) + new_records = parser.parse_doc_file(content_stream) + fmt = "doc" + except: + raise ValueError("Format not recognized for file " + f._path) + + single_record = len(new_records) == 1 + for i, record in enumerate(new_records): + name = record.id + if name in [ + None, + "", + "", + ".", + " ", + "", + ]: + number = "" if single_record else ("%04d" % i) + name = f._name_no_extension.replace(" ", "_") + number + record.id = name + record.name = name + record.file_name = f._name_no_extension + record.zip_file_name = zip_name + if use_file_names_as_ids and single_record: + basename = os.path.basename(record.file_name) + basename_no_extension = os.path.splitext(basename)[0] + record.id = basename_no_extension + records += new_records + return records + + +def records_from_data_file(data_file): + content = b64decode(data_file.content.split("base64,")[1]) + try: + records, fmt = string_to_records(content.decode("utf-8")) + except: + try: + record = snapgene_file_to_seqrecord(fileobject=BytesIO(content)) + records, fmt = [record], "snapgene" + except: + try: + parser = crazydoc.CrazydocParser( + ["highlight_color", "bold", "underline"] + ) + records = parser.parse_doc_file(BytesIO(content)) + fmt = "doc" + except: + try: + df = spreadsheet_file_to_dataframe(data_file, header=None) + records = [ + sequence_to_biopython_record(sequence=seq, id=name, name=name) + for name, seq in df.values + ] + fmt = "spreadsheet" + except: + raise ValueError("Format not recognized for file " + data_file.name) + if not isinstance(records, list): + records = [records] + return records, fmt + + +def record_to_formated_string(record, fmt="genbank", remove_descr=False): + if remove_descr: + record = deepcopy(record) + if isinstance(record, (list, tuple)): + for r in record: + r.description = "" + else: + record.description = "" + fileobject = StringIO() + write_record(record, fileobject, fmt) + return fileobject.getvalue().encode("utf-8") + + +def records_from_data_files(data_files, use_file_names_as_ids=False): + records = [] + for file_ in data_files: + circular = ("circular" not in file_) or file_.circular + if file_.name.lower().endswith("zip"): + records += records_from_zip_file( + file_, use_file_names_as_ids=use_file_names_as_ids + ) + continue + recs, fmt = records_from_data_file(file_) + single_record = len(recs) == 1 + for i, record in enumerate(recs): + record.circular = circular + record.linear = not circular + name_no_extension = "".join(file_.name.split(".")[:-1]) + name = name_no_extension + ("" if single_record else ("%04d" % i)) + name = name.replace(" ", "_") + UNKNOWN_IDS = [ + "None", + "", + "", + ".", + "EXPORTED", + "", + "Exported", + ] + # Sorry for this parts, it took a lot of "whatever works". + # keep your part names under 20c and pointless, and everything + # will be good + if str(record.id).strip() in UNKNOWN_IDS: + record.id = name + if str(record.name).strip() in UNKNOWN_IDS: + record.name = name + record.file_name = name_no_extension + if use_file_names_as_ids and single_record: + basename = os.path.basename(record.source_file) + basename_no_extension = os.path.splitext(basename)[0] + record.id = basename_no_extension + records += recs + return records + + +def data_to_html_data(data, datatype, filename=None): + """Data types: zip, genbank, fasta, pdf""" + datatype = { + "zip": "application/zip", + "genbank": "application/genbank", + "fasta": "application/fasta", + "pdf": "application/pdf", + "xlsx": "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet", + }.get(datatype, datatype) + datatype = "data:%s;" % datatype + data64 = "base64,%s" % b64encode(data).decode("utf-8") + headers = "" + if filename is not None: + headers += "headers=filename%3D" + filename + ";" + return datatype + headers + data64 + + +def zip_data_to_html_data(data): + return data_to_html_data(data, "application/zip") + + +LADDERS = {"100_to_4k": bw.ladders.LADDER_100_to_4k} + + +def matplotlib_figure_to_svg_base64_data(fig, **kwargs): + """Return a string of the form 'data:image/svg+xml;base64,XXX' where XXX + is the base64-encoded svg version of the figure.""" + output = BytesIO() + fig.savefig(output, format="svg", **kwargs) + svg_txt = output.getvalue().decode("utf-8") + svg_txt = "\n".join(svg_txt.split("\n")[4:]) + svg_txt = "".join(svg_txt.split("\n")) + + content = b64encode(svg_txt.encode("utf-8")) + result = (b"data:image/svg+xml;base64," + content).decode("utf-8") + + return result + + +def matplotlib_figure_to_bitmap_base64_data(fig, fmt="png", **kwargs): + """Return a string of the form 'data:image/png;base64,XXX' where XXX + is the base64-encoded svg version of the figure.""" + output = BytesIO() + fig.savefig(output, format=fmt, **kwargs) + bitmap = output.getvalue() + content = b64encode(bitmap) + result = (b"data:image/%s;base64,%s" % (fmt.encode("utf-8"), content)).decode( + "utf-8" + ) + return result + + +def figures_to_pdf_report_data(figures, filename="report.pdf"): + pdf_io = BytesIO() + with PdfPages(pdf_io) as pdf: + for fig in figures: + pdf.savefig(fig, bbox_inches="tight") + return { + "data": ( + "data:application/pdf;base64," + + b64encode(pdf_io.getvalue()).decode("utf-8") + ), + "name": filename, + "mimetype": "application/pdf", + } + + +def csv_to_list(csv_string, sep=","): + return [ + element.strip() + for line in csv_string.split("\n") + for element in line.split(sep) + if len(element.strip()) + ] + + +def set_record_topology(record, topology): + """Set the Biopython record's topology, possibly passing if already set. + + This actually sets the ``record.annotations['topology']``.The ``topology`` + parameter can be "circular", "linear", "default_to_circular" (will default + to circular if ``annotations['topology']`` is not already set) or + "default_to_linear". + """ + valid_topologies = [ + "circular", + "linear", + "default_to_circular", + "default_to_linear", + ] + if topology not in valid_topologies: + raise ValueError( + "topology (%s) should be one of %s." + % (topology, ", ".join(valid_topologies)) + ) + annotations = record.annotations + default_prefix = "default_to_" + if topology.startswith(default_prefix): + if "topology" not in annotations: + annotations["topology"] = topology[len(default_prefix) :] + else: + annotations["topology"] = topology + + +############################################################################## +def main(): + + parser = argparse.ArgumentParser(description="Generate picklist for DNA assembly.") + parser.add_argument("--parts_files", help="Directory with parts data or file with part sizes") + parser.add_argument("--picklist", type=str, help="Path to the assembly plan CSV or Excel file") + parser.add_argument("--source_plate", help="Source plate file (CSV or Excel)") + parser.add_argument("--backbone_name", help="Name of the backbone") + parser.add_argument("--result_zip", help="Name of the output zip file") + parser.add_argument("--part_backbone_ratio", type=float, help="Part to backbone molar ratio") + parser.add_argument("--quantity_unit", choices=["fmol", "nM", "ng"], help="Quantity unit") + parser.add_argument("--part_quantity", type=float, help="Quantity of each part") + parser.add_argument("--buffer_volume", type=float, help="Buffer volume in µL") + parser.add_argument("--total_volume", type=float, help="Total reaction volume in µL") + parser.add_argument("--dispenser", choices=["labcyte_echo", "tecan_evo"], help="Dispenser machine") + + args = parser.parse_args() + + # Parameters: + picklist = args.picklist # assembly plan + # directory or can be a csv/Excel with part sizes + if isinstance(args.parts_files, str): + args.parts_files = args.parts_files.split(",") + parts_dir = fix_and_rename_paths(args.parts_files) + source_plate_path = args.source_plate + backbone_name = args.backbone_name + part_backbone_ratio = args.part_backbone_ratio + result_zip_file = args.result_zip # output file name "picklist.zip" + ############################################################################## + # Defaults: + destination_plate = None + destination_type = "new" # this parameter is not actually used + destination_size = 96 # this parameter is not actually used + fill_by = "column" # this parameter is not actually used + quantity_unit = args.quantity_unit + part_quantity = args.part_quantity # 1.3 + buffer_volume = args.buffer_volume # 0.3 # (µL) + total_volume = args.total_volume # 1 # (µL) + dispenser_machine = args.dispenser + dispenser_min_volume = 0.5 # (nL), this parameter is not actually used + dispenser_max_volume = 5 # (µL), this parameter is not actually used + dispenser_resolution = 2.5 # (nL), this parameter is not actually used + dispenser_dead_volume = 8 # (µL), this parameter is not actually used + use_file_names_as_ids = True + + # CODE + if picklist.endswith(".csv"): + csv = picklist.read().decode() + rows = [line.split(",") for line in csv.split("\n") if len(line)] + else: + dataframe = pandas.read_excel(picklist) + rows = [row for i, row in dataframe.iterrows()] + + assembly_plan = AssemblyPlan( + OrderedDict( + [ + ( + row[0], + [ + str(e).strip() + for e in row[1:] + if str(e).strip() not in ["-", "nan", ""] + ], + ) + for row in rows + if row[0] not in ["nan", "Construct name", "constructs", "construct"] + ] + ) + ) + for assembly, parts in assembly_plan.assemblies.items(): + assembly_plan.assemblies[assembly] = [part.replace(" ", "_") for part in parts] + + # Reading part infos + if not isinstance(parts_dir, list): + if parts_dir.endswith((".csv", ".xls", ".xlsx")): # part sizes specified in table + if parts_dir.endswith(".csv"): + dataframe = pandas.read_csv(parts_dir) + else: + dataframe = pandas.read_excel(parts_dir) + parts_data = {row.part: {"size": row["size"]} for i, row in dataframe.iterrows()} + else: # input records + records = dnacauldron.biotools.load_records_from_files( + files=parts_dir, use_file_names_as_ids=use_file_names_as_ids + ) + parts_data = {rec.id.replace(" ", "_").lower(): {"record": rec} for rec in records} + #parts_data = process_parts_with_mapping(records, args.file_name_mapping) + assembly_plan.parts_data = parts_data + parts_without_data = assembly_plan.parts_without_data() + if len(parts_without_data): + print("success: False") + print("message: Some parts have no provided record or data.") + print("missing_parts: ", parts_without_data) + sys.exit() + # Reading protocol + if quantity_unit == "fmol": + part_mol = part_quantity * 1e-15 + part_g = None + if quantity_unit == "nM": + part_mol = part_quantity * total_volume * 1e-15 + part_g = None + if quantity_unit == "ng": + part_mol = None + part_g = part_quantity * 1e-9 + # Backbone:part molar ratio calculation is not performed in this case. + # This ensures no change regardless of form input: + part_backbone_ratio = 1 + print("Generating picklist") + picklist_generator = AssemblyPicklistGenerator( + part_mol=part_mol, + part_g=part_g, + complement_to=total_volume * 1e-6, # convert uL to L + buffer_volume=buffer_volume * 1e-6, + volume_rounding=2.5e-9, # not using parameter from form + minimal_dispense_volume=5e-9, # Echo machine's minimum dispense - + ) + backbone_name_list = backbone_name.split(",") + source_plate = plate_from_content_spreadsheet(source_plate_path) + + for well in source_plate.iter_wells(): + if well.is_empty: + continue + quantities = well.content.quantities + part, quantity = list(quantities.items())[0] + quantities.pop(part) + quantities[part.replace(" ", "_")] = quantity + + if part in backbone_name_list: + # This section multiplies the backbone concentration with the + # part:backbone molar ratio. This tricks the calculator into making + # a picklist with the desired ratio. + # For example, a part:backbone = 2:1 will multiply the + # backbone concentration by 2, therefore half as much of it will be + # added to the well. + quantities[part.replace(" ", "_")] = quantity * part_backbone_ratio + else: + quantities[part.replace(" ", "_")] = quantity + + source_plate.name = "Source" + if destination_plate: + dest_filelike = file_to_filelike_object(destination_plate) + destination_plate = plate_from_content_spreadsheet(destination_plate) + else: + destination_plate = Plate4ti0960("Mixplate") + destination_wells = ( + well for well in destination_plate.iter_wells(direction="column") if well.is_empty + ) + picklist, picklist_data = picklist_generator.make_picklist( + assembly_plan, + source_wells=source_plate.iter_wells(), + destination_wells=destination_wells, + ) + if picklist is None: + print("success: False") + print("message: Some parts in the assembly plan have no corresponding well.") + print("picklist_data: ", picklist_data) + print("missing_parts:", picklist_data.get("missing_parts", None)) + sys.exit() + + future_plates = picklist.simulate(inplace=False) + + + def text(w): + txt = human_volume(w.content.volume) + if "construct" in w.data: + txt = "\n".join([w.data["construct"], txt]) + return txt + + + plotter = PlateTextPlotter(text) + ax, _ = plotter.plot_plate(future_plates[destination_plate], figsize=(20, 8)) + + ziproot = flametree.file_tree(result_zip_file, replace=True) + + # MIXPLATE MAP PLOT + ax.figure.savefig( + ziproot._file("final_mixplate.pdf").open("wb"), + format="pdf", + bbox_inches="tight", + ) + plt.close(ax.figure) + plate_to_platemap_spreadsheet( + future_plates[destination_plate], + lambda w: w.data.get("construct", ""), + filepath=ziproot._file("final_mixplate.xls").open("wb"), + ) + + # ASSEMBLY REPORT + print("Writing report...") + picklist_to_assembly_mix_report( + picklist, + ziproot._file("assembly_mix_picklist_report.pdf").open("wb"), + data=picklist_data, + ) + assembly_plan.write_report(ziproot._file("assembly_plan_summary.pdf").open("wb")) + + # MACHINE PICKLIST + + if dispenser_machine == "labcyte_echo": + picklist_to_labcyte_echo_picklist_file( + picklist, ziproot._file("ECHO_picklist.csv").open("w") + ) + else: + picklist_to_tecan_evo_picklist_file( + picklist, ziproot._file("EVO_picklist.gwl").open("w") + ) + # We'll not write the input source plate. + # raw = file_to_filelike_object(source_plate_path).read() + # f = ziproot.copy(source_plate_path) + # f.write(raw, mode="wb") + ziproot._close() + print("success: True") + + +if __name__ == "__main__": + main() diff -r 000000000000 -r 4bde3e90ee98 create_assembly_picklists.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/create_assembly_picklists.xml Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,206 @@ + + Provide a source plate map and an assembly plan, get a robotic picklist spreadsheet for Tecan EVO or Labcyte Echo + + 0 + 0.1.0 + + + fuzzywuzzy + bandwagon + biopython + crazydoc + dnacauldron + dnachisel + flametree + plateo + snapgene-reader + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + `_ + + ]]> + + + @unpublished{create_assembly_picklists + author = {Ramiz Khaled}, + title = {{create_assembly_picklists}}, + url = {https://github.com/Edinburgh-Genome-Foundry/CUBA/blob/master/backend/app/views/create_assembly_picklists/CreateAssemblyPicklistsView.py}, + } + + + diff -r 000000000000 -r 4bde3e90ee98 output.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/output.html Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,291 @@ + + + + + + + Test Results (powered by Planemo) + + + + + + + + + + +
+
+
+
+ + + + + + + \ No newline at end of file diff -r 000000000000 -r 4bde3e90ee98 output.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/output.json Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,559 @@ +{ + "summary": { + "num_errors": 0, + "num_failures": 0, + "num_skips": 0, + "num_tests": 1 + }, + "tests": [ + { + "data": { + "inputs": { + "backbone_name": "HC_Amp_ccdB", + "buffer_volume": "0.3", + "dispenser": "labcyte_echo", + "genbank_files": { + "id": "22956832477b7615", + "src": "hdca" + }, + "part_backbone_ratio": "1", + "part_quantity": "1.3", + "picklist": { + "id": "4a52c33acfdf00c5", + "src": "hda" + }, + "quantity_unit": "fmol", + "source_plate": { + "id": "96bb517ec4711730", + "src": "hda" + }, + "total_volume": "1.0" + }, + "job": { + "command_line": "mkdir renamed_parts && touch 'picklist.zip' && touch 'source_plate.xlsx' && cp '/tmp/tmpi_f681b6/files/6/5/a/dataset_65ad9574-cb7e-4ed9-ad0c-017016d8e92f.dat' 'renamed_parts/HC_Amp_ccdB.gb' && cp '/tmp/tmpi_f681b6/files/1/f/a/dataset_1faa2257-725e-44e8-b913-740b6a05f8b2.dat' 'renamed_parts/conn a-c.gb' && cp '/tmp/tmpi_f681b6/files/f/f/a/dataset_ffa5bc2e-4322-4782-b1d2-c7dc9ba04350.dat' 'renamed_parts/conn b-e.gb' && cp '/tmp/tmpi_f681b6/files/9/9/1/dataset_9919b791-4b3f-47c6-a20a-a5c2d697fabc.dat' 'renamed_parts/conn b-l.gb' && cp '/tmp/tmpi_f681b6/files/f/0/b/dataset_f0b15343-39ee-40cb-8765-a4a84b7e0ea4.dat' 'renamed_parts/conn d-e.gb' && cp '/tmp/tmpi_f681b6/files/5/3/0/dataset_53023c35-65f6-4008-b84d-72fb7ecc4cba.dat' 'renamed_parts/conn d-f.gb' && cp '/tmp/tmpi_f681b6/files/4/3/4/dataset_4345db76-3776-4c15-a608-cbfcbf1755ce.dat' 'renamed_parts/conn h-ha.gb' && cp '/tmp/tmpi_f681b6/files/2/f/9/dataset_2f98e110-7de4-422d-938e-177083ccfe5e.dat' 'renamed_parts/conn h-j.gb' && cp '/tmp/tmpi_f681b6/files/7/2/d/dataset_72d9fac0-2dc0-4147-92fb-e2bf5f75ed19.dat' 'renamed_parts/conn h-k.gb' && cp '/tmp/tmpi_f681b6/files/d/9/b/dataset_d9be0a23-55cb-4592-b3d9-eafb7a36220a.dat' 'renamed_parts/conn j-k.gb' && cp '/tmp/tmpi_f681b6/files/6/d/6/dataset_6d658022-b983-478e-8bc2-5e48f4e9c43b.dat' 'renamed_parts/conn l-n.gb' && cp '/tmp/tmpi_f681b6/files/5/7/8/dataset_5782320b-be5f-42fe-84af-f18bf7fa7ff2.dat' 'renamed_parts/conn l-r.gb' && cp '/tmp/tmpi_f681b6/files/b/7/6/dataset_b76e327a-3d5f-46b9-8d8d-b6b1c674db62.dat' 'renamed_parts/conn l-w.gb' && cp '/tmp/tmpi_f681b6/files/e/5/8/dataset_e58ab596-bdd8-4979-b1b4-99de2bf5b786.dat' 'renamed_parts/conn l-y.gb' && cp '/tmp/tmpi_f681b6/files/0/2/2/dataset_0224af58-bad1-42aa-becf-782d052b9730.dat' 'renamed_parts/conn q-r.gb' && cp '/tmp/tmpi_f681b6/files/e/d/c/dataset_edc15a94-7091-49ef-a34a-8eb3cd7ca528.dat' 'renamed_parts/conn r-w.gb' && cp '/tmp/tmpi_f681b6/files/8/e/3/dataset_8e3e7394-9770-4b0d-ac91-8327bd03f38c.dat' 'renamed_parts/conn t-v.gb' && cp '/tmp/tmpi_f681b6/files/d/d/2/dataset_dd245a49-5f5a-4d4e-b031-9cfff85b2ca8.dat' 'renamed_parts/conn w-x.gb' && cp '/tmp/tmpi_f681b6/files/a/f/e/dataset_afe91b71-315b-42e5-8caa-baf20351c00e.dat' 'renamed_parts/conn w-y.gb' && cp '/tmp/tmpi_f681b6/files/5/6/9/dataset_569452b3-a597-4dae-8353-5698bb45e241.dat' 'renamed_parts/conn w-z.gb' && cp '/tmp/tmpi_f681b6/files/c/1/d/dataset_c1d1c48c-5a8d-4e02-bb7d-46709b68de02.dat' 'renamed_parts/conn y-z.gb' && cp '/tmp/tmpi_f681b6/files/1/7/2/dataset_1722a1aa-e93a-4dea-a12d-adf2cff1d731.dat' 'renamed_parts/p10_tet-aptazyme.gb' && cp '/tmp/tmpi_f681b6/files/b/7/5/dataset_b75067eb-fc50-4b79-8bc5-73d73d9781ef.dat' 'renamed_parts/p11_sv40polya.gb' && cp '/tmp/tmpi_f681b6/files/e/a/0/dataset_ea0ef964-5b83-461c-8f1e-37f12a58dd38.dat' 'renamed_parts/p14_cmvp.gb' && cp '/tmp/tmpi_f681b6/files/3/8/1/dataset_381711b9-d963-4d77-bd66-b878668cde1c.dat' 'renamed_parts/p14_sv40p.gb' && cp '/tmp/tmpi_f681b6/files/e/3/f/dataset_e3f44043-cf5b-4bd2-b979-ed700373c731.dat' 'renamed_parts/p15_puror.gb' && cp '/tmp/tmpi_f681b6/files/1/d/6/dataset_1d69d1c7-6187-4bbe-aa06-c6c0ea9f1950.dat' 'renamed_parts/p16_bghpolya.gb' && cp '/tmp/tmpi_f681b6/files/7/a/5/dataset_7a5296ca-c574-4acf-b3e3-091fb9c2990e.dat' 'renamed_parts/p18_cmvp.gb' && cp '/tmp/tmpi_f681b6/files/4/4/9/dataset_449256af-869e-4132-9b78-4b176ea4926b.dat' 'renamed_parts/p18_ef1ap.gb' && cp '/tmp/tmpi_f681b6/files/b/9/b/dataset_b9b9cbf1-2afe-44ee-a71a-afebbf0187dc.dat' 'renamed_parts/p19_mneogreen.gb' && cp '/tmp/tmpi_f681b6/files/3/a/6/dataset_3a6792a7-38c1-42dd-8305-dd93c32d7752.dat' 'renamed_parts/p19_mruby2.gb' && cp '/tmp/tmpi_f681b6/files/3/5/1/dataset_35150438-cb43-4514-ba03-53e8fc4f2d62.dat' 'renamed_parts/p19_mtagbfp2.gb' && cp '/tmp/tmpi_f681b6/files/0/a/2/dataset_0a225817-00b7-45f7-961a-c767931ae92a.dat' 'renamed_parts/p19_tet-on-3g.gb' && cp '/tmp/tmpi_f681b6/files/1/3/f/dataset_13f22279-3a7a-481e-90a1-582485b0b90b.dat' 'renamed_parts/p1_5__sq__-itr-pb.gb' && cp '/tmp/tmpi_f681b6/files/0/4/c/dataset_04c05bd3-d589-4b86-8dcf-2a510f7df24f.dat' 'renamed_parts/p1_5__sq__ha-haavs1.gb' && cp '/tmp/tmpi_f681b6/files/6/8/7/dataset_68796f1c-a5e8-4865-b648-a6f1cfe8e10e.dat' 'renamed_parts/p20_ct-minute-nes.gb' && cp '/tmp/tmpi_f681b6/files/a/1/d/dataset_a1d6d6e9-0b10-47c3-b209-f003b1af9ec7.dat' 'renamed_parts/p20_ct-nes.gb' && cp '/tmp/tmpi_f681b6/files/d/7/0/dataset_d7061143-d1cd-4a08-a0c7-b1ccc9e4368b.dat' 'renamed_parts/p20_linker3.gb' && cp '/tmp/tmpi_f681b6/files/2/6/a/dataset_26a8e2e7-3757-47f5-a3b3-d957b7989b06.dat' 'renamed_parts/p20_p2a.gb' && cp '/tmp/tmpi_f681b6/files/6/7/3/dataset_673db7f6-df1b-46e4-923d-7a4b284fe47d.dat' 'renamed_parts/p21_dmra.gb' && cp '/tmp/tmpi_f681b6/files/5/1/9/dataset_519edf0f-9bc9-44c8-9bc4-9b1e6424d39c.dat' 'renamed_parts/p21_mkate2.gb' && cp '/tmp/tmpi_f681b6/files/f/d/5/dataset_fd517323-7c60-4f3e-a05d-266834a5393c.dat' 'renamed_parts/p21_mneogreen.gb' && cp '/tmp/tmpi_f681b6/files/0/6/c/dataset_06c5513c-abd2-4bfd-8519-668f761bd209.dat' 'renamed_parts/p21_mruby2.gb' && cp '/tmp/tmpi_f681b6/files/e/6/1/dataset_e61642a5-7006-4448-9cbe-e2d1572f1e80.dat' 'renamed_parts/p21_mtagbfp2.gb' && cp '/tmp/tmpi_f681b6/files/1/a/3/dataset_1a39752e-bc76-4f46-af81-a49926ff7224.dat' 'renamed_parts/p21_puror.gb' && cp '/tmp/tmpi_f681b6/files/f/d/3/dataset_fd351f42-4e3e-42ef-9725-4519573160c1.dat' 'renamed_parts/p22_pgkpolya.gb' && cp '/tmp/tmpi_f681b6/files/d/8/3/dataset_d8375e27-175d-49bd-b07a-2bdfd106f91a.dat' 'renamed_parts/p23_insulatorfb.gb' && cp '/tmp/tmpi_f681b6/files/7/c/4/dataset_7c405a03-cda8-4a5b-a966-a7da9ae36c90.dat' 'renamed_parts/p24_3__sq__ha_haavs1.gb' && cp '/tmp/tmpi_f681b6/files/6/e/7/dataset_6e7c3d1a-4b60-445a-a096-6ffa32d1b8cf.dat' 'renamed_parts/p24_3__sq__pb.gb' && cp '/tmp/tmpi_f681b6/files/8/4/8/dataset_848133c3-608d-4627-bbdd-ed937d1b009b.dat' 'renamed_parts/p25_sv40-ori.gb' && cp '/tmp/tmpi_f681b6/files/9/6/2/dataset_962361d5-701f-4da5-a707-427069091566.dat' 'renamed_parts/p2_insulatorfb.gb' && cp '/tmp/tmpi_f681b6/files/7/c/6/dataset_7c6f7c5d-19e3-4bee-9983-7ff75d39a153.dat' 'renamed_parts/p3_cagp.gb' && cp '/tmp/tmpi_f681b6/files/1/0/4/dataset_1042cf17-45cf-442e-b581-96bc3a5697ef.dat' 'renamed_parts/p3_cmvp_tet.gb' && cp '/tmp/tmpi_f681b6/files/c/1/1/dataset_c1115334-9b18-450e-ae1b-05e6706ee51b.dat' 'renamed_parts/p3_ef1ap.gb' && cp '/tmp/tmpi_f681b6/files/c/5/7/dataset_c570d71e-f33b-409d-a2d0-14f18b0d10ae.dat' 'renamed_parts/p3_tre3gp.gb' && cp '/tmp/tmpi_f681b6/files/4/8/d/dataset_48dd67ab-6056-4031-a5d1-427d923f56eb.dat' 'renamed_parts/p4_kt-l7ae -weiss.gb' && cp '/tmp/tmpi_f681b6/files/9/0/2/dataset_902c955b-e1b8-4afd-92d3-457a80da0742.dat' 'renamed_parts/p4_lac-o.gb' && cp '/tmp/tmpi_f681b6/files/4/f/3/dataset_4f383ead-bfd0-4985-bf88-8d2ae49772cc.dat' 'renamed_parts/p5_attb-bxb1.gb' && cp '/tmp/tmpi_f681b6/files/6/9/6/dataset_6965cbd4-0f66-43ad-a070-bed75261ba22.dat' 'renamed_parts/p5_attp-bxb1.gb' && cp '/tmp/tmpi_f681b6/files/a/1/e/dataset_a1e9dbf9-630b-4bb0-9aa7-b2e6fd221e1e.dat' 'renamed_parts/p5_k1-k1.gb' && cp '/tmp/tmpi_f681b6/files/5/0/2/dataset_50264e85-1143-4c12-9480-92a65c32e337.dat' 'renamed_parts/p5_kt-weiss.gb' && cp '/tmp/tmpi_f681b6/files/d/6/c/dataset_d6c9799f-e997-4941-8fe1-542759627558.dat' 'renamed_parts/p6_atg_boxc.gb' && cp '/tmp/tmpi_f681b6/files/6/f/8/dataset_6f86fba6-a5c1-44b4-b120-5016be553d5f.dat' 'renamed_parts/p6_kozak-atg.gb' && cp '/tmp/tmpi_f681b6/files/5/b/f/dataset_5bfaae1d-572d-4b11-ab85-f631cad39c43.dat' 'renamed_parts/p6_nt-igkl sequence.gb' && cp '/tmp/tmpi_f681b6/files/2/4/a/dataset_24ac6f21-53b5-43df-b49a-45639e939b5a.dat' 'renamed_parts/p6_nt-mls.gb' && cp '/tmp/tmpi_f681b6/files/8/1/8/dataset_8189baf0-93d3-4154-88f6-36203604b72f.dat' 'renamed_parts/p6_nt-myristoylation signal.gb' && cp '/tmp/tmpi_f681b6/files/7/1/b/dataset_71b1daec-ec14-4573-b1df-3e58bc4f0281.dat' 'renamed_parts/p6_nt-palm sequence.gb' && cp '/tmp/tmpi_f681b6/files/8/c/2/dataset_8c2bc0ea-6597-4734-9b07-1d8725b16872.dat' 'renamed_parts/p6_nt-sv40_nls.gb' && cp '/tmp/tmpi_f681b6/files/5/d/c/dataset_5dcc9d84-fcfa-4e4d-8c36-e07d9d6b4242.dat' 'renamed_parts/p7_bxb1.gb' && cp '/tmp/tmpi_f681b6/files/1/c/b/dataset_1cb6cb47-5783-4105-9401-4de98f7c6bc4.dat' 'renamed_parts/p7_l7ae-weiss.gb' && cp '/tmp/tmpi_f681b6/files/0/6/2/dataset_0623f4b7-0f93-459b-b0d7-8f4447eaa364.dat' 'renamed_parts/p7_l7ae.gb' && cp '/tmp/tmpi_f681b6/files/3/8/0/dataset_380607e0-8ad8-42a9-9e23-8d6072f908b6.dat' 'renamed_parts/p7_laci.gb' && cp '/tmp/tmpi_f681b6/files/b/7/a/dataset_b7a0879c-cef5-4258-8aca-7ef791bf490e.dat' 'renamed_parts/p7_mcherry.gb' && cp '/tmp/tmpi_f681b6/files/1/8/6/dataset_1862996f-08df-43f9-b5a6-4f3a575fe15e.dat' 'renamed_parts/p7_mkate2.gb' && cp '/tmp/tmpi_f681b6/files/2/6/e/dataset_26e3c60c-a237-4788-bedf-0548f92609f8.dat' 'renamed_parts/p7_mneogreen.gb' && cp '/tmp/tmpi_f681b6/files/0/9/7/dataset_09796d17-4be1-4d23-adae-afe292ccaade.dat' 'renamed_parts/p7_mruby2.gb' && cp '/tmp/tmpi_f681b6/files/9/d/1/dataset_9d1be7f1-28b6-48f7-ae0a-cbd2539d46c9.dat' 'renamed_parts/p7_mtagbfp2.gb' && cp '/tmp/tmpi_f681b6/files/d/6/c/dataset_d6cc98fa-6c64-4142-b743-bf285efb60b2.dat' 'renamed_parts/p8_linker1.gb' && cp '/tmp/tmpi_f681b6/files/b/f/d/dataset_bfdb38df-269b-45ea-8d6a-2694c36e17e6.dat' 'renamed_parts/p8_linker2.gb' && cp '/tmp/tmpi_f681b6/files/c/8/9/dataset_c89959ed-0b3f-4f53-b9d9-586f22a1af09.dat' 'renamed_parts/p8_p2a.gb' && cp '/tmp/tmpi_f681b6/files/d/f/e/dataset_dfea1759-69a9-4153-9464-1dca6276ceab.dat' 'renamed_parts/p8a_ct-kdel.gb' && cp '/tmp/tmpi_f681b6/files/b/3/7/dataset_b37d1c2e-0398-4e9e-b9b4-278d94fc4c0f.dat' 'renamed_parts/p8b_ires2.gb' && cp '/tmp/tmpi_f681b6/files/4/1/b/dataset_41ba1b68-ae25-48b4-a111-d7b89adf08d1.dat' 'renamed_parts/p9_a-tubulin.gb' && cp '/tmp/tmpi_f681b6/files/b/f/3/dataset_bf38856e-5049-4935-8e4a-72c2d8a951b7.dat' 'renamed_parts/p9_bsdr.gb' && cp '/tmp/tmpi_f681b6/files/2/b/0/dataset_2b022cd4-7278-4f6c-9080-4c6ff76217af.dat' 'renamed_parts/p9_dmrc.gb' && cp '/tmp/tmpi_f681b6/files/9/b/6/dataset_9b6085ca-d78d-42ef-90f1-efe5818c89eb.dat' 'renamed_parts/p9_firefly luciferase.gb' && cp '/tmp/tmpi_f681b6/files/e/8/d/dataset_e8d37f0f-fa56-4630-8829-1428ed44aff8.dat' 'renamed_parts/p9_mneogreen.gb' && cp '/tmp/tmpi_f681b6/files/5/5/f/dataset_55f63be7-f651-4029-8fb0-10853d6485a5.dat' 'renamed_parts/p9_mruby2.gb' && cp '/tmp/tmpi_f681b6/files/a/d/e/dataset_adea274e-bd6b-49de-84e6-967c9eddabb0.dat' 'renamed_parts/p9_mtagbfp2.gb' && cp '/tmp/tmpi_f681b6/files/5/b/4/dataset_5b424011-b574-4059-afe3-5a241314eff1.dat' 'renamed_parts/p9_neor.gb' && cp '/tmp/tmpi_f681b6/files/9/e/e/dataset_9eeff8cb-fa3a-4c17-b006-2ba69cb7c047.dat' 'renamed_parts/p9_puror.gb' && cp '/tmp/tmpi_f681b6/files/3/0/0/dataset_300aad29-8d06-4ab2-9142-91a91c247985.dat' 'source_plate.xlsx' && python '/home/rkhaled/galaxytools/tools/create_assembly_picklists/CreateAssemblyPicklists_script.py' --parts_files 'renamed_parts/HC_Amp_ccdB.gb,renamed_parts/conn a-c.gb,renamed_parts/conn b-e.gb,renamed_parts/conn b-l.gb,renamed_parts/conn d-e.gb,renamed_parts/conn d-f.gb,renamed_parts/conn h-ha.gb,renamed_parts/conn h-j.gb,renamed_parts/conn h-k.gb,renamed_parts/conn j-k.gb,renamed_parts/conn l-n.gb,renamed_parts/conn l-r.gb,renamed_parts/conn l-w.gb,renamed_parts/conn l-y.gb,renamed_parts/conn q-r.gb,renamed_parts/conn r-w.gb,renamed_parts/conn t-v.gb,renamed_parts/conn w-x.gb,renamed_parts/conn w-y.gb,renamed_parts/conn w-z.gb,renamed_parts/conn y-z.gb,renamed_parts/p10_tet-aptazyme.gb,renamed_parts/p11_sv40polya.gb,renamed_parts/p14_cmvp.gb,renamed_parts/p14_sv40p.gb,renamed_parts/p15_puror.gb,renamed_parts/p16_bghpolya.gb,renamed_parts/p18_cmvp.gb,renamed_parts/p18_ef1ap.gb,renamed_parts/p19_mneogreen.gb,renamed_parts/p19_mruby2.gb,renamed_parts/p19_mtagbfp2.gb,renamed_parts/p19_tet-on-3g.gb,renamed_parts/p1_5__sq__-itr-pb.gb,renamed_parts/p1_5__sq__ha-haavs1.gb,renamed_parts/p20_ct-minute-nes.gb,renamed_parts/p20_ct-nes.gb,renamed_parts/p20_linker3.gb,renamed_parts/p20_p2a.gb,renamed_parts/p21_dmra.gb,renamed_parts/p21_mkate2.gb,renamed_parts/p21_mneogreen.gb,renamed_parts/p21_mruby2.gb,renamed_parts/p21_mtagbfp2.gb,renamed_parts/p21_puror.gb,renamed_parts/p22_pgkpolya.gb,renamed_parts/p23_insulatorfb.gb,renamed_parts/p24_3__sq__ha_haavs1.gb,renamed_parts/p24_3__sq__pb.gb,renamed_parts/p25_sv40-ori.gb,renamed_parts/p2_insulatorfb.gb,renamed_parts/p3_cagp.gb,renamed_parts/p3_cmvp_tet.gb,renamed_parts/p3_ef1ap.gb,renamed_parts/p3_tre3gp.gb,renamed_parts/p4_kt-l7ae -weiss.gb,renamed_parts/p4_lac-o.gb,renamed_parts/p5_attb-bxb1.gb,renamed_parts/p5_attp-bxb1.gb,renamed_parts/p5_k1-k1.gb,renamed_parts/p5_kt-weiss.gb,renamed_parts/p6_atg_boxc.gb,renamed_parts/p6_kozak-atg.gb,renamed_parts/p6_nt-igkl sequence.gb,renamed_parts/p6_nt-mls.gb,renamed_parts/p6_nt-myristoylation signal.gb,renamed_parts/p6_nt-palm sequence.gb,renamed_parts/p6_nt-sv40_nls.gb,renamed_parts/p7_bxb1.gb,renamed_parts/p7_l7ae-weiss.gb,renamed_parts/p7_l7ae.gb,renamed_parts/p7_laci.gb,renamed_parts/p7_mcherry.gb,renamed_parts/p7_mkate2.gb,renamed_parts/p7_mneogreen.gb,renamed_parts/p7_mruby2.gb,renamed_parts/p7_mtagbfp2.gb,renamed_parts/p8_linker1.gb,renamed_parts/p8_linker2.gb,renamed_parts/p8_p2a.gb,renamed_parts/p8a_ct-kdel.gb,renamed_parts/p8b_ires2.gb,renamed_parts/p9_a-tubulin.gb,renamed_parts/p9_bsdr.gb,renamed_parts/p9_dmrc.gb,renamed_parts/p9_firefly luciferase.gb,renamed_parts/p9_mneogreen.gb,renamed_parts/p9_mruby2.gb,renamed_parts/p9_mtagbfp2.gb,renamed_parts/p9_neor.gb,renamed_parts/p9_puror.gb' --picklist '/tmp/tmpi_f681b6/files/9/9/7/dataset_997a41d8-270e-4c30-b18d-9977d95beda7.dat' --source_plate 'source_plate.xlsx' --backbone_name 'HC_Amp_ccdB' --part_backbone_ratio '1.0' --quantity_unit 'fmol' --part_quantity '1.3' --buffer_volume '0.3' --total_volume '1.0' --dispenser 'labcyte_echo' --result_zip 'picklist.zip' && cp 'picklist.zip' '/tmp/tmpi_f681b6/job_working_directory/000/94/outputs/dataset_bfec1bb4-30fa-42e4-ab22-8d435fad7ba2.dat'", + "command_version": "", + "copied_from_job_id": null, + "create_time": "2025-08-06T07:38:06.620229", + "dependencies": [], + "exit_code": 0, + "external_id": "17345", + "galaxy_version": "25.0", + "handler": null, + "history_id": "22956832477b7615", + "id": "9dd0ea47016230b4", + "inputs": { + "genbank_files1": { + "id": "22956832477b7615", + "src": "hda", + "uuid": "65ad9574-cb7e-4ed9-ad0c-017016d8e92f" + }, + "genbank_files10": { + "id": "1d32f3448e626e7f", + "src": "hda", + "uuid": "d9be0a23-55cb-4592-b3d9-eafb7a36220a" + }, + "genbank_files11": { + "id": "373d193f79dd8d7d", + "src": "hda", + "uuid": "6d658022-b983-478e-8bc2-5e48f4e9c43b" + }, + "genbank_files12": { + "id": "eb75b2de0fb16a3c", + "src": "hda", + "uuid": "5782320b-be5f-42fe-84af-f18bf7fa7ff2" + }, + "genbank_files13": { + "id": "85ab0526df6ef8db", + "src": "hda", + "uuid": "b76e327a-3d5f-46b9-8d8d-b6b1c674db62" + }, + "genbank_files14": { + "id": "cce9321c6ea3102e", + "src": "hda", + "uuid": "e58ab596-bdd8-4979-b1b4-99de2bf5b786" + }, + "genbank_files15": { + "id": "3ea9418692598539", + "src": "hda", + "uuid": "0224af58-bad1-42aa-becf-782d052b9730" + }, + "genbank_files16": { + "id": "2cbac7715efa3597", + "src": "hda", + "uuid": "edc15a94-7091-49ef-a34a-8eb3cd7ca528" + }, + "genbank_files17": { + "id": "3049bac1d45e974b", + "src": "hda", + "uuid": "8e3e7394-9770-4b0d-ac91-8327bd03f38c" + }, + "genbank_files18": { + "id": "45eab7b60225d246", + "src": "hda", + "uuid": "dd245a49-5f5a-4d4e-b031-9cfff85b2ca8" + }, + "genbank_files19": { + "id": "ef0c6e7e7bcb0c5e", + "src": "hda", + "uuid": "afe91b71-315b-42e5-8caa-baf20351c00e" + }, + "genbank_files2": { + "id": "c9e3c7b3dcd8d1f2", + "src": "hda", + "uuid": "1faa2257-725e-44e8-b913-740b6a05f8b2" + }, + "genbank_files20": { + "id": "129e875a270d5718", + "src": "hda", + "uuid": "569452b3-a597-4dae-8353-5698bb45e241" + }, + "genbank_files21": { + "id": "df7adf6389815b6f", + "src": "hda", + "uuid": "c1d1c48c-5a8d-4e02-bb7d-46709b68de02" + }, + "genbank_files22": { + "id": "5172734b6aff2f70", + "src": "hda", + "uuid": "1722a1aa-e93a-4dea-a12d-adf2cff1d731" + }, + "genbank_files23": { + "id": "035a795ab5a563c2", + "src": "hda", + "uuid": "b75067eb-fc50-4b79-8bc5-73d73d9781ef" + }, + "genbank_files24": { + "id": "d58f046df9fad923", + "src": "hda", + "uuid": "ea0ef964-5b83-461c-8f1e-37f12a58dd38" + }, + "genbank_files25": { + "id": "5910d88c6d113067", + "src": "hda", + "uuid": "381711b9-d963-4d77-bd66-b878668cde1c" + }, + "genbank_files26": { + "id": "8942cb5a8dbebb47", + "src": "hda", + "uuid": "e3f44043-cf5b-4bd2-b979-ed700373c731" + }, + "genbank_files27": { + "id": "ad8b2b5561141cbf", + "src": "hda", + "uuid": "1d69d1c7-6187-4bbe-aa06-c6c0ea9f1950" + }, + "genbank_files28": { + "id": "1c8fd2442e00a371", + "src": "hda", + "uuid": "7a5296ca-c574-4acf-b3e3-091fb9c2990e" + }, + "genbank_files29": { + "id": "9ffc43bac51ce8d8", + "src": "hda", + "uuid": "449256af-869e-4132-9b78-4b176ea4926b" + }, + "genbank_files3": { + "id": "4a47d23da8498ffe", + "src": "hda", + "uuid": "ffa5bc2e-4322-4782-b1d2-c7dc9ba04350" + }, + "genbank_files30": { + "id": "246bad70b00d28d5", + "src": "hda", + "uuid": "b9b9cbf1-2afe-44ee-a71a-afebbf0187dc" + }, + "genbank_files31": { + "id": "d4a3726e81ef4745", + "src": "hda", + "uuid": "3a6792a7-38c1-42dd-8305-dd93c32d7752" + }, + "genbank_files32": { + "id": "b886375aed9e1f6f", + "src": "hda", + "uuid": "35150438-cb43-4514-ba03-53e8fc4f2d62" + }, + "genbank_files33": { + "id": "379b551b2d42a3c8", + "src": "hda", + "uuid": "0a225817-00b7-45f7-961a-c767931ae92a" + }, + "genbank_files34": { + "id": "2659057ec51db8fa", + "src": "hda", + "uuid": "13f22279-3a7a-481e-90a1-582485b0b90b" + }, + "genbank_files35": { + "id": "0a584ced6f6a7572", + "src": "hda", + "uuid": "04c05bd3-d589-4b86-8dcf-2a510f7df24f" + }, + "genbank_files36": { + "id": "8f98981c884780d7", + "src": "hda", + "uuid": "68796f1c-a5e8-4865-b648-a6f1cfe8e10e" + }, + "genbank_files37": { + "id": "37425fa6ccad77d1", + "src": "hda", + "uuid": "a1d6d6e9-0b10-47c3-b209-f003b1af9ec7" + }, + "genbank_files38": { + "id": "6f16b98a74bc8e00", + "src": "hda", + "uuid": "d7061143-d1cd-4a08-a0c7-b1ccc9e4368b" + }, + "genbank_files39": { + "id": "c688dcee3b6937db", + "src": "hda", + "uuid": "26a8e2e7-3757-47f5-a3b3-d957b7989b06" + }, + "genbank_files4": { + "id": "5c77c8404c25bb2d", + "src": "hda", + "uuid": "9919b791-4b3f-47c6-a20a-a5c2d697fabc" + }, + "genbank_files40": { + "id": "8437e75f835ccb82", + "src": "hda", + "uuid": "673db7f6-df1b-46e4-923d-7a4b284fe47d" + }, + "genbank_files41": { + "id": "efb13fa079504263", + "src": "hda", + "uuid": "519edf0f-9bc9-44c8-9bc4-9b1e6424d39c" + }, + "genbank_files42": { + "id": "7e4c20be7b251653", + "src": "hda", + "uuid": "fd517323-7c60-4f3e-a05d-266834a5393c" + }, + "genbank_files43": { + "id": "1305f27defee0803", + "src": "hda", + "uuid": "06c5513c-abd2-4bfd-8519-668f761bd209" + }, + "genbank_files44": { + "id": "000b996b18656356", + "src": "hda", + "uuid": "e61642a5-7006-4448-9cbe-e2d1572f1e80" + }, + "genbank_files45": { + "id": "ba2fb4b2edb60418", + "src": "hda", + "uuid": "1a39752e-bc76-4f46-af81-a49926ff7224" + }, + "genbank_files46": { + "id": "1e767f185385202b", + "src": "hda", + "uuid": "fd351f42-4e3e-42ef-9725-4519573160c1" + }, + "genbank_files47": { + "id": "f7acfab5ba93c5b5", + "src": "hda", + "uuid": "d8375e27-175d-49bd-b07a-2bdfd106f91a" + }, + "genbank_files48": { + "id": "4915ed4ffacdd1c2", + "src": "hda", + "uuid": "7c405a03-cda8-4a5b-a966-a7da9ae36c90" + }, + "genbank_files49": { + "id": "36d78695b12c4628", + "src": "hda", + "uuid": "6e7c3d1a-4b60-445a-a096-6ffa32d1b8cf" + }, + "genbank_files5": { + "id": "9c375d59650da59b", + "src": "hda", + "uuid": "f0b15343-39ee-40cb-8765-a4a84b7e0ea4" + }, + "genbank_files50": { + "id": "6b747ad6c9cee45c", + "src": "hda", + "uuid": "848133c3-608d-4627-bbdd-ed937d1b009b" + }, + "genbank_files51": { + "id": "383eaae012fdf9c2", + "src": "hda", + "uuid": "962361d5-701f-4da5-a707-427069091566" + }, + "genbank_files52": { + "id": "244652812bc3a160", + "src": "hda", + "uuid": "7c6f7c5d-19e3-4bee-9983-7ff75d39a153" + }, + "genbank_files53": { + "id": "e1f1ba4c1200e127", + "src": "hda", + "uuid": "1042cf17-45cf-442e-b581-96bc3a5697ef" + }, + "genbank_files54": { + "id": "49c89262a579f642", + "src": "hda", + "uuid": "c1115334-9b18-450e-ae1b-05e6706ee51b" + }, + "genbank_files55": { + "id": "f31913ae37b613d3", + "src": "hda", + "uuid": "c570d71e-f33b-409d-a2d0-14f18b0d10ae" + }, + "genbank_files56": { + "id": "e1303d6b58429931", + "src": "hda", + "uuid": "48dd67ab-6056-4031-a5d1-427d923f56eb" + }, + "genbank_files57": { + "id": "aa7ac43781a79b2a", + "src": "hda", + "uuid": "902c955b-e1b8-4afd-92d3-457a80da0742" + }, + "genbank_files58": { + "id": "3a1b1b5978c4e950", + "src": "hda", + "uuid": "4f383ead-bfd0-4985-bf88-8d2ae49772cc" + }, + "genbank_files59": { + "id": "0c4962b2ae5d171f", + "src": "hda", + "uuid": "6965cbd4-0f66-43ad-a070-bed75261ba22" + }, + "genbank_files6": { + "id": "90821679061f5d56", + "src": "hda", + "uuid": "53023c35-65f6-4008-b84d-72fb7ecc4cba" + }, + "genbank_files60": { + "id": "c3699454511b65cd", + "src": "hda", + "uuid": "a1e9dbf9-630b-4bb0-9aa7-b2e6fd221e1e" + }, + "genbank_files61": { + "id": "7a4e651dae1f637e", + "src": "hda", + "uuid": "50264e85-1143-4c12-9480-92a65c32e337" + }, + "genbank_files62": { + "id": "63a114c57a09ece2", + "src": "hda", + "uuid": "d6c9799f-e997-4941-8fe1-542759627558" + }, + "genbank_files63": { + "id": "841706915b868401", + "src": "hda", + "uuid": "6f86fba6-a5c1-44b4-b120-5016be553d5f" + }, + "genbank_files64": { + "id": "e99bfa41665be298", + "src": "hda", + "uuid": "5bfaae1d-572d-4b11-ab85-f631cad39c43" + }, + "genbank_files65": { + "id": "9c3c4a4fff67573c", + "src": "hda", + "uuid": "24ac6f21-53b5-43df-b49a-45639e939b5a" + }, + "genbank_files66": { + "id": "ff0e587c81161b2c", + "src": "hda", + "uuid": "8189baf0-93d3-4154-88f6-36203604b72f" + }, + "genbank_files67": { + "id": "fe70f0b27d923f25", + "src": "hda", + "uuid": "71b1daec-ec14-4573-b1df-3e58bc4f0281" + }, + "genbank_files68": { + "id": "4faf474a2c8f3c64", + "src": "hda", + "uuid": "8c2bc0ea-6597-4734-9b07-1d8725b16872" + }, + "genbank_files69": { + "id": "2b00b014be500121", + "src": "hda", + "uuid": "5dcc9d84-fcfa-4e4d-8c36-e07d9d6b4242" + }, + "genbank_files7": { + "id": "6d1080b1996a1abf", + "src": "hda", + "uuid": "4345db76-3776-4c15-a608-cbfcbf1755ce" + }, + "genbank_files70": { + "id": "dabb0e22039e1e30", + "src": "hda", + "uuid": "1cb6cb47-5783-4105-9401-4de98f7c6bc4" + }, + "genbank_files71": { + "id": "b3b3ff8447bc5856", + "src": "hda", + "uuid": "0623f4b7-0f93-459b-b0d7-8f4447eaa364" + }, + "genbank_files72": { + "id": "5dea811d5323ae83", + "src": "hda", + "uuid": "380607e0-8ad8-42a9-9e23-8d6072f908b6" + }, + "genbank_files73": { + "id": "a7d43d2a9ea42d32", + "src": "hda", + "uuid": "b7a0879c-cef5-4258-8aca-7ef791bf490e" + }, + "genbank_files74": { + "id": "bb42b49cda58bf10", + "src": "hda", + "uuid": "1862996f-08df-43f9-b5a6-4f3a575fe15e" + }, + "genbank_files75": { + "id": "da38245ea35cc47d", + "src": "hda", + "uuid": "26e3c60c-a237-4788-bedf-0548f92609f8" + }, + "genbank_files76": { + "id": "6b74d372e476dd97", + "src": "hda", + "uuid": "09796d17-4be1-4d23-adae-afe292ccaade" + }, + "genbank_files77": { + "id": "20ed3b370dde2253", + "src": "hda", + "uuid": "9d1be7f1-28b6-48f7-ae0a-cbd2539d46c9" + }, + "genbank_files78": { + "id": "f61cc883a97b71d4", + "src": "hda", + "uuid": "d6cc98fa-6c64-4142-b743-bf285efb60b2" + }, + "genbank_files79": { + "id": "e604810e2ac4bd19", + "src": "hda", + "uuid": "bfdb38df-269b-45ea-8d6a-2694c36e17e6" + }, + "genbank_files8": { + "id": "84b4c081a2c5daff", + "src": "hda", + "uuid": "2f98e110-7de4-422d-938e-177083ccfe5e" + }, + "genbank_files80": { + "id": "3555e3ab6f4baab2", + "src": "hda", + "uuid": "c89959ed-0b3f-4f53-b9d9-586f22a1af09" + }, + "genbank_files81": { + "id": "837f19907e6e019d", + "src": "hda", + "uuid": "dfea1759-69a9-4153-9464-1dca6276ceab" + }, + "genbank_files82": { + "id": "f4384539d1a180e7", + "src": "hda", + "uuid": "b37d1c2e-0398-4e9e-b9b4-278d94fc4c0f" + }, + "genbank_files83": { + "id": "c278cedeebcc4b72", + "src": "hda", + "uuid": "41ba1b68-ae25-48b4-a111-d7b89adf08d1" + }, + "genbank_files84": { + "id": "609c0533b2b6aace", + "src": "hda", + "uuid": "bf38856e-5049-4935-8e4a-72c2d8a951b7" + }, + "genbank_files85": { + "id": "278bf972c860f4d3", + "src": "hda", + "uuid": "2b022cd4-7278-4f6c-9080-4c6ff76217af" + }, + "genbank_files86": { + "id": "90f32e860d099bb6", + "src": "hda", + "uuid": "9b6085ca-d78d-42ef-90f1-efe5818c89eb" + }, + "genbank_files87": { + "id": "6410822008faeb8e", + "src": "hda", + "uuid": "e8d37f0f-fa56-4630-8829-1428ed44aff8" + }, + "genbank_files88": { + "id": "61cacbd5a45b2941", + "src": "hda", + "uuid": "55f63be7-f651-4029-8fb0-10853d6485a5" + }, + "genbank_files89": { + "id": "4f0f19657ee38b4d", + "src": "hda", + "uuid": "adea274e-bd6b-49de-84e6-967c9eddabb0" + }, + "genbank_files9": { + "id": "3378e63b77969eee", + "src": "hda", + "uuid": "72d9fac0-2dc0-4147-92fb-e2bf5f75ed19" + }, + "genbank_files90": { + "id": "2eb1540106f06799", + "src": "hda", + "uuid": "5b424011-b574-4059-afe3-5a241314eff1" + }, + "genbank_files91": { + "id": "c492414f61190e0e", + "src": "hda", + "uuid": "9eeff8cb-fa3a-4c17-b006-2ba69cb7c047" + }, + "picklist": { + "id": "4a52c33acfdf00c5", + "src": "hda", + "uuid": "997a41d8-270e-4c30-b18d-9977d95beda7" + }, + "source_plate": { + "id": "96bb517ec4711730", + "src": "hda", + "uuid": "300aad29-8d06-4ab2-9142-91a91c247985" + } + }, + "job_messages": [], + "job_metrics": [], + "job_runner_name": null, + "job_stderr": "", + "job_stdout": "", + "model_class": "Job", + "output_collections": {}, + "outputs": { + "output_zip": { + "id": "9dd0ea47016230b4", + "src": "hda", + "uuid": "bfec1bb4-30fa-42e4-ab22-8d435fad7ba2" + } + }, + "params": { + "__input_ext": "\"input\"", + "backbone_name": "\"HC_Amp_ccdB\"", + "buffer_volume": "\"0.3\"", + "chromInfo": "\"/tmp/tmpi_f681b6/galaxy-dev/tool-data/shared/ucsc/chrom/?.len\"", + "dbkey": "\"?\"", + "dispenser": "\"labcyte_echo\"", + "genbank_files": "{\"values\": [{\"id\": 1, \"src\": \"hdca\"}]}", + "part_backbone_ratio": "\"1.0\"", + "part_quantity": "\"1.3\"", + "quantity_unit": "\"fmol\"", + "total_volume": "\"1.0\"" + }, + "state": "ok", + "stderr": "", + "stdout": "Generating picklist\nDEBUG : source_plate.xlsx\nWriting report...\nsuccess: True\n", + "tool_id": "create_assembly_picklists", + "tool_stderr": "", + "tool_stdout": "Generating picklist\nDEBUG : source_plate.xlsx\nWriting report...\nsuccess: True\n", + "update_time": "2025-08-06T07:38:19.249975", + "user_email": "planemo@galaxyproject.org", + "user_id": "22956832477b7615" + }, + "status": "success", + "test_index": 0, + "time_seconds": 263.1747727394104, + "tool_id": "create_assembly_picklists", + "tool_version": "0.1.0+galaxy0" + }, + "has_data": true, + "id": "create_assembly_picklists-0" + } + ], + "version": "0.1" +} \ No newline at end of file diff -r 000000000000 -r 4bde3e90ee98 picklist/ECHO_picklist.csv --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/picklist/ECHO_picklist.csv Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,104 @@ +Source Well,Destination Well,Transfer Volume +E2,A1,40.0 +D3,A1,27.5 +C1,A1,32.5 +L1,A1,15.0 +P3,A1,22.5 +B4,A1,32.5 +D2,A1,22.5 +E2,B1,40.0 +C3,B1,27.5 +B1,B1,30.0 +N4,B1,20.0 +E5,B1,27.5 +G5,B1,40.0 +H1,B1,22.5 +H2,B1,27.5 +K1,B1,20.0 +O1,B1,20.0 +C2,B1,22.5 +E2,C1,40.0 +C3,C1,27.5 +B1,C1,30.0 +M4,C1,20.0 +P4,C1,32.5 +G5,C1,40.0 +H1,C1,22.5 +H2,C1,27.5 +M1,C1,20.0 +C4,C1,35.0 +E2,D1,40.0 +D3,D1,27.5 +B1,D1,30.0 +N4,D1,20.0 +O4,D1,20.0 +M5,D1,35.0 +H1,D1,22.5 +H2,D1,27.5 +M1,D1,20.0 +C4,D1,35.0 +E2,E1,40.0 +D3,E1,27.5 +B1,E1,30.0 +M4,E1,20.0 +P4,E1,32.5 +L5,E1,45.0 +H1,E1,22.5 +H2,E1,27.5 +L1,E1,15.0 +A2,E1,22.5 +B4,E1,32.5 +D2,E1,22.5 +E2,F1,40.0 +D3,F1,27.5 +B1,F1,30.0 +N4,F1,20.0 +O4,F1,20.0 +M5,F1,35.0 +O5,F1,15.0 +G6,F1,40.0 +G2,F1,37.5 +H2,F1,27.5 +J1,F1,22.5 +I2,F1,10.0 +K2,F1,40.0 +L2,F1,37.5 +N1,F1,20.0 +N2,F1,35.0 +O2,F1,20.0 +P1,F1,32.5 +O3,F1,15.0 +B2,F1,17.5 +D2,F1,22.5 +E2,G1,40.0 +D3,G1,27.5 +B1,G1,30.0 +N4,G1,20.0 +O4,G1,20.0 +M5,G1,35.0 +O5,G1,15.0 +G6,G1,40.0 +G2,G1,37.5 +H2,G1,27.5 +K1,G1,20.0 +N2,G1,35.0 +P2,G1,30.0 +P1,G1,32.5 +O3,G1,15.0 +B2,G1,17.5 +D2,G1,22.5 +O24,A1,500.0 +O24,A1,7.5 +O24,B1,402.5 +O24,C1,405.0 +O24,D1,422.5 +O24,E1,362.5 +O24,F1,135.0 +O24,G1,235.0 +P24,A1,300.0 +P24,B1,300.0 +P24,C1,300.0 +P24,D1,300.0 +P24,E1,300.0 +P24,F1,300.0 +P24,G1,300.0 diff -r 000000000000 -r 4bde3e90ee98 picklist/assembly_mix_picklist_report.pdf Binary file picklist/assembly_mix_picklist_report.pdf has changed diff -r 000000000000 -r 4bde3e90ee98 picklist/assembly_plan_summary.pdf Binary file picklist/assembly_plan_summary.pdf has changed diff -r 000000000000 -r 4bde3e90ee98 picklist/final_mixplate.pdf Binary file picklist/final_mixplate.pdf has changed diff -r 000000000000 -r 4bde3e90ee98 picklist/final_mixplate.xls Binary file picklist/final_mixplate.xls has changed diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/HC_Amp_ccdB.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/HC_Amp_ccdB.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,109 @@ +LOCUS Exported 2721 bp ds-DNA circular SYN 14-SEP-2017 +DEFINITION synthetic circular DNA. +ACCESSION . +VERSION . +KEYWORDS HC_Amp_ccdB(1-25).gb +SOURCE synthetic DNA construct + ORGANISM synthetic DNA construct +REFERENCE 1 (bases 1 to 2721) + AUTHORS Trial User + TITLE Direct Submission + JOURNAL Exported Sep 14, 2017 from SnapGene Viewer 4.0.2 + http://www.snapgene.com +FEATURES Location/Qualifiers + source 1..2721 + /organism="synthetic DNA construct" + /mol_type="other DNA" + misc_feature complement(73..78) + /label=BsmBI + misc_feature 129..462 + /label=*ccdB promoter* + exon 463..768 + /label=ccdB + /note="ccdB" + terminator 809..880 + /note="rrnB T1 terminator + transcription terminator T1 from the E. coli rrnB gene" + terminator 896..923 + /note="T7Te terminator + phage T7 early transcription terminator" + misc_feature 930..942 + /label=BioBrick suffix + /note="universal suffix for all parts" + misc_feature 943..948 + /label=BsmBI + terminator 1027..1056 + /note="T3Te terminator + phage T3 early transcription terminator" + rep_origin 1078..1665 + /direction=RIGHT + /label=ori + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1677..1704 + /note="T7Te terminator + phage T7 early transcription terminator" + CDS complement(1728..2588) + /codon_start=1 + /gene="bla" + /product="beta-lactamase" + /note="AmpR + confers resistance to ampicillin, carbenicillin, and + related antibiotics" + /translation="MSIQHFRVALIPFFAAFCLPVFAHPETLVKVKDAEDQLGARVGYI + ELDLNSGKILESLRPEERFPMMSTFKVLLCGAVLSRIDAGQEQLGRRIHYSQNDLVEYS + PVTEKHLTDGMTVRELCSAAITMSDNTAANLLLATIGGPKELTAFLHNMGDHVTRLDRW + EPELNEAIPNDERDTTMPVAMATTLRKLLTGELLTLASRQQLIDWMEADKVAGSLLRSA + LPAGWFIADKSGAGERGSRGIIAALGPDGKPSRIVVIYTTGSQATMDERNRQIAEIGAS + LIKHW" + promoter complement(2589..2691) + /note="cat promoter + promoter of the E. coli cat gene" +ORIGIN + 1 ctttctgcta tggaggtcag gtatgattta aatggtcagt attgagcgat atctagagaa + 61 ttcgtcatag gagagacgca atacgcaaac cgcctctccc cgcgcgttgg ccgattcatt + 121 aatgcaggga tccggcttac taaaagccag ataacagtat gcgtatttgc gcgctgattt + 181 ttgcggtata agaatatata ctgatatgta tacccgaagt atgtcaaaaa gaggtatgct + 241 atgaagcagc gtattacagt gacagttgac agcgacagct atcagttgct caaggcatat + 301 atgatgtcaa tatctccggt ctggtaagca caaccatgca gaatgaagcc cgtcgtctgc + 361 gtgccgaacg ctggaaagcg gaaaatcagg aagggatggc tgaggtcgcc cggtttattg + 421 aaatgaacgg ctcttttgct gacgagaaca ggggctggtg aaatgcagtt taaggtttac + 481 acctataaaa gagagagccg ttatcgtctg tttgtggatg tacagagtga tattattgac + 541 acgcccgggc gacggatggt gatccccctg gccagtgcac gtctgctgtc agataaagtc + 601 ccccgtgaac tttacccggt ggtgcatatc ggggatgaaa gctggcgcat gatgaccacc + 661 gatatggcca gtgtgccggt ctccgttatc ggggaagaag tggctgatct cagccaccgc + 721 gaaaatgaca tcaaaaacgc cattaacctg atgttctggg gaatataagc tgatagtgct + 781 agtgtagatc gctactagag ccaggcatca aataaaacga aaggctcagt cgaaagactg + 841 ggcctttcgt tttatctgtt gtttgtcggt gaacgctctc tactagagtc acactggctc + 901 accttcgggt gggcctttct gcgtttatat actagtagcg gccgtctcaa cgataacgaa + 961 ttcaagcttg atatcattca ggacgagcct cagactccag cgtaactgga ctgcaatcaa + 1021 ctcactggct caccttcacg ggtgggcctt tcttcggtag aaaatcaaag gatcttcttg + 1081 agatcctttt tttctgcgcg taatctgctg cttgcaaaca aaaaaaccac cgctaccagc + 1141 ggtggtttgt ttgccggatc aagagctacc aactcttttt ccgaggtaac tggcttcagc + 1201 agagcgcaga taccaaatac tgttcttcta gtgtagccgt agttaggcca ccacttcaag + 1261 aactctgtag caccgcctac atacctcgct ctgctaatcc tgttaccagt ggctgctgcc + 1321 agtggcgata agtcgtgtct taccgggttg gactcaagac gatagttacc ggataaggcg + 1381 cagcggtcgg gctgaacggg gggttcgtgc acacagccca gcttggagcg aacgacctac + 1441 accgaactga gatacctaca gcgtgagcta tgagaaagcg ccacgcttcc cgaagggaga + 1501 aaggcggaca ggtatccggt aagcggcagg gtcggaacag gagagcgcac gagggagctt + 1561 ccagggggaa acgcctggta tctttatagt cctgtcgggt ttcgccacct ctgacttgag + 1621 catcgatttt tgtgatgctc gtcagggggg cggagcctat ggaaaaacgc cagcaacgca + 1681 gaaaggccca cccgaaggtg agccaggtga ttacatttgg gccctcatta ccaatgctta + 1741 atcagtgagg cacctatctc agcgatctgt ctatttcgtt catccatagt tgcctgactc + 1801 cccgtcgtgt agataactac gatgcgggag ggcttaccat ctggccccag tgctgcaatg + 1861 ataccgcgag aaccacgctc accggctcca gatttatcag caataaacca gccagccggg + 1921 agggccgagc gcagaagtga tcctgcaact ttatccgcct ccatccagtc tattaattgt + 1981 tgccgggaag ctagagtaag tagttcgcca gttaatagtt tgcgcaacgt tgttgccatt + 2041 gctacaggca tcgtggtgtc acgctcgtcg tttggtatgg cttcattcag ctccggttcc + 2101 caacgatcaa ggcgagttac atgatccccc atgttgtgca aaaaagcggt tagctccttc + 2161 ggtcctccga tcgttgccag aagtaagttg gccgcagtgt tatcactcat ggttatggca + 2221 gcactgcata attctcttac tgtcatgcca tccgtgagat gcttttctgt gactggtgag + 2281 tactcaacca agtcattctg agaatagtgt atgcggcgac cgagttgctc ttgcccggcg + 2341 tcaatacggg ataataccgc gccacatagc agaactttaa aagtgctcat cattggaaaa + 2401 cgttcttcgg ggcgtaaact ctcaaggatc ttaccgctgt tgagatccag ttcgatgtaa + 2461 cccactcgtg cacccaactg atcttcagca tcttttactt tcaccagcgt ttctgggtga + 2521 gcaaaaacag gaaggcaaaa tgccgcaaaa aagggaataa gggcgacacg gaaatgttga + 2581 atactcattt tagcttcctt agctcctgaa aatctcgata actcaaaaaa tacgcccggt + 2641 agtgatctta tttcattatg gtgaaagttg gaacctctta cgtgccgatc aagtcaaaag + 2701 cctccggtcg gaggcttttg a +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn a-c.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn a-c.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn A-C" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gtccagatag acaggaagaa tcgacagaac atccgacgaa tagaggacca + 1201 cgggcagcag aagaccatgt ctaaagtgcg agactgaata caagacctac gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn b-e.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn b-e.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1853 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1193) + /note="conn B-E" + source complement(1154..1193) + /note="From Exported" + /source="Exported" + misc_feature complement(1199..1204) + /note="BsmBI" + terminator 1271..1302 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1303..1405 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1198..1853 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc ggatctctca atctccttct aagtctcttt caccgtagtt agtccatcga + 1201 gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat acctgacctc + 1261 catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc acgtaagagg + 1321 ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg agttatcgag + 1381 attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag + 1441 gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa + 1501 tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg cgccagagtt + 1561 gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcaggct + 1621 aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga + 1681 tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg tattagaaga + 1741 atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca + 1801 ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn b-l.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn b-l.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1853 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1193) + /note="conn B-L" + source complement(1154..1193) + /note="From Exported" + /source="Exported" + misc_feature complement(1199..1204) + /note="BsmBI" + terminator 1271..1302 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1303..1405 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1198..1853 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg acgtaaatgg gaggcaggta agtggagatt ccaagcgacc agtccatcga + 1201 gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat acctgacctc + 1261 catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc acgtaagagg + 1321 ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg agttatcgag + 1381 attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag + 1441 gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa + 1501 tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg cgccagagtt + 1561 gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcaggct + 1621 aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga + 1681 tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg tattagaaga + 1741 atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca + 1801 ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn d-e.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn d-e.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1855 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1195) + /note="conn D-E" + source complement(1154..1195) + /note="From Exported" + /source="Exported" + misc_feature complement(1201..1206) + /note="BsmBI" + terminator 1273..1304 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1305..1407 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1200..1855 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc ggatagatcg atctgaatta attctgacgg ttcactaaag gctaagtccc + 1201 gagacgaaga cgaattctct agatatcgct caatactgac catttaaatc atacctgacc + 1261 tccatagcag aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga + 1321 ggttccaact ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg + 1381 agattttcag gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg + 1441 aggccgcgat taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat + 1501 aatgtcgggc aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag + 1561 ttgtttctga aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg + 1621 ctaaactggc tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct + 1681 gatgatgcat ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa + 1741 gaatatcctg attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg + 1801 cattcgattc ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn d-f.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn d-f.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1855 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1195) + /note="conn D-F" + source complement(1154..1195) + /note="From Exported" + /source="Exported" + misc_feature complement(1201..1206) + /note="BsmBI" + terminator 1273..1304 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1305..1407 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1200..1855 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc tggtagatcg atctgaatta attctgacgg ttcactaaag gctaagtccc + 1201 gagacgaaga cgaattctct agatatcgct caatactgac catttaaatc atacctgacc + 1261 tccatagcag aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga + 1321 ggttccaact ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg + 1381 agattttcag gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg + 1441 aggccgcgat taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat + 1501 aatgtcgggc aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag + 1561 ttgtttctga aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg + 1621 ctaaactggc tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct + 1681 gatgatgcat ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa + 1741 gaatatcctg attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg + 1801 cattcgattc ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn h-ha.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn h-ha.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,80 @@ +LOCUS . 1861 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1201) + /note="conn H-Ha" + source complement(1154..1201) + /note="From Exported" + /source="Exported" + CDS complement(1199..1201) + /codon_start=1 + /note="STOP" + /translation="" + misc_feature complement(1207..1212) + /note="BsmBI" + terminator 1279..1310 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1311..1413 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1206..1861 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg gatcgaggat atcacctgta gggatgttct agagtccgga agctgttatt + 1201 agcctcgaga cgaagacgaa ttctctagat atcgctcaat actgaccatt taaatcatac + 1261 ctgacctcca tagcagaaag tcaaaagcct ccgaccggag gcttttgact tgatcggcac + 1321 gtaagaggtt ccaactttca ccataatgaa ataagatcac taccgggcgt attttttgag + 1381 ttatcgagat tttcaggagc taaggaagct aaaatgagcc atattcaacg ggaaacgtct + 1441 tgctcgaggc cgcgattaaa ttccaacatg gatgctgatt tatatgggta taaatgggct + 1501 cgcgataatg tcgggcaatc aggtgcgaca atctatcgat tgtatgggaa gcccgatgcg + 1561 ccagagttgt ttctgaaaca tggcaaaggt agcgttgcca atgatgttac agatgagatg + 1621 gtcaggctaa actggctgac ggaatttatg cctcttccga ccatcaagca ttttatccgt + 1681 actcctgatg atgcatggtt actcaccact gcgatcccag ggaaaacagc attccaggta + 1741 ttagaagaat atcctgattc aggtgaaaat attgttgatg cgctggcagt gttcctgcgc + 1801 cggttgcatt cgattcctgt ttgtaattgt ccttttaacg gcgatcgcgt atttcgtctc + 1861 g +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn h-j.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn h-j.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,80 @@ +LOCUS . 1861 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1201) + /note="conn H-J" + source complement(1154..1201) + /note="From Exported" + /source="Exported" + CDS complement(1199..1201) + /codon_start=1 + /note="STOP" + /translation="" + misc_feature complement(1207..1212) + /note="BsmBI" + terminator 1279..1310 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1311..1413 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1206..1861 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gcacgaggat atcacctgta gggatgttct agagtccgga agctgttatt + 1201 agcctcgaga cgaagacgaa ttctctagat atcgctcaat actgaccatt taaatcatac + 1261 ctgacctcca tagcagaaag tcaaaagcct ccgaccggag gcttttgact tgatcggcac + 1321 gtaagaggtt ccaactttca ccataatgaa ataagatcac taccgggcgt attttttgag + 1381 ttatcgagat tttcaggagc taaggaagct aaaatgagcc atattcaacg ggaaacgtct + 1441 tgctcgaggc cgcgattaaa ttccaacatg gatgctgatt tatatgggta taaatgggct + 1501 cgcgataatg tcgggcaatc aggtgcgaca atctatcgat tgtatgggaa gcccgatgcg + 1561 ccagagttgt ttctgaaaca tggcaaaggt agcgttgcca atgatgttac agatgagatg + 1621 gtcaggctaa actggctgac ggaatttatg cctcttccga ccatcaagca ttttatccgt + 1681 actcctgatg atgcatggtt actcaccact gcgatcccag ggaaaacagc attccaggta + 1741 ttagaagaat atcctgattc aggtgaaaat attgttgatg cgctggcagt gttcctgcgc + 1801 cggttgcatt cgattcctgt ttgtaattgt ccttttaacg gcgatcgcgt atttcgtctc + 1861 g +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn h-k.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn h-k.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,80 @@ +LOCUS . 1861 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1201) + /note="conn H-K" + source complement(1154..1201) + /note="From Exported" + /source="Exported" + CDS complement(1199..1201) + /codon_start=1 + /note="STOP" + /translation="" + misc_feature complement(1207..1212) + /note="BsmBI" + terminator 1279..1310 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1311..1413 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1206..1861 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt acccgaggat atcacctgta gggatgttct agagtccgga agctgttatt + 1201 agcctcgaga cgaagacgaa ttctctagat atcgctcaat actgaccatt taaatcatac + 1261 ctgacctcca tagcagaaag tcaaaagcct ccgaccggag gcttttgact tgatcggcac + 1321 gtaagaggtt ccaactttca ccataatgaa ataagatcac taccgggcgt attttttgag + 1381 ttatcgagat tttcaggagc taaggaagct aaaatgagcc atattcaacg ggaaacgtct + 1441 tgctcgaggc cgcgattaaa ttccaacatg gatgctgatt tatatgggta taaatgggct + 1501 cgcgataatg tcgggcaatc aggtgcgaca atctatcgat tgtatgggaa gcccgatgcg + 1561 ccagagttgt ttctgaaaca tggcaaaggt agcgttgcca atgatgttac agatgagatg + 1621 gtcaggctaa actggctgac ggaatttatg cctcttccga ccatcaagca ttttatccgt + 1681 actcctgatg atgcatggtt actcaccact gcgatcccag ggaaaacagc attccaggta + 1741 ttagaagaat atcctgattc aggtgaaaat attgttgatg cgctggcagt gttcctgcgc + 1801 cggttgcatt cgattcctgt ttgtaattgt ccttttaacg gcgatcgcgt atttcgtctc + 1861 g +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn j-k.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn j-k.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1855 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1195) + /note="conn J-K" + source complement(1154..1195) + /note="From Exported" + /source="Exported" + misc_feature complement(1201..1206) + /note="BsmBI" + terminator 1273..1304 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1305..1407 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1200..1855 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt accgttcctt cctgtattgt ctccttccgt gtttcagtta gcctcagcac + 1201 gagacgaaga cgaattctct agatatcgct caatactgac catttaaatc atacctgacc + 1261 tccatagcag aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga + 1321 ggttccaact ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg + 1381 agattttcag gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg + 1441 aggccgcgat taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat + 1501 aatgtcgggc aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag + 1561 ttgtttctga aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg + 1621 ctaaactggc tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct + 1681 gatgatgcat ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa + 1741 gaatatcctg attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg + 1801 cattcgattc ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn l-n.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn l-n.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn L-N" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg tagcctcctc ctatcctcat cacttcaacc ggatctactc tacaaccttc + 1201 cctatccact tcctccacat gctctccacc aacatcctca tcatagacgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn l-r.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn l-r.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn L-R" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga ccgcctcctc ctatcctcat cacttcaacc ggatctactc tacaaccttc + 1201 cctatccact tcctccacat gctctccacc aacatcctca tcatagacgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn l-w.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn l-w.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn L-W" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt tcgcctcctc ctatcctcat cacttcaacc ggatctactc tacaaccttc + 1201 cctatccact tcctccacat gctctccacc aacatcctca tcatagacgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn l-y.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn l-y.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn L-Y" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agtcctcctc ctatcctcat cacttcaacc ggatctactc tacaaccttc + 1201 cctatccact tcctccacat gctctccacc aacatcctca tcatagacgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn q-r.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn q-r.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn Q-R" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga ccggcttgtt ctgggctagg tgttgaggtt cgattaccac taacgtctga + 1201 gggaaagttg ttgactggac ttgcatgttg atggtggatt atgtcgagcc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn r-w.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn r-w.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1853 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1193) + /note="R-W" + source complement(1154..1193) + /note="From Exported" + /source="Exported" + misc_feature complement(1199..1204) + /note="BsmBI" + terminator 1271..1302 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1303..1405 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1198..1853 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt tcggagctgg tagggacttc ggagggcttt gtagttgggt aggaccgcga + 1201 gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat acctgacctc + 1261 catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc acgtaagagg + 1321 ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg agttatcgag + 1381 attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag + 1441 gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa + 1501 tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg cgccagagtt + 1561 gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcaggct + 1621 aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga + 1681 tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg tattagaaga + 1741 atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca + 1801 ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn t-v.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn t-v.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,79 @@ +LOCUS . 1853 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1193) + /note="conn T-V" + source complement(1154..1193) + /note="From Exported" + /source="Exported" + CDS complement(1189..1191) + /codon_start=1 + /note="STOP" + /translation="" + misc_feature complement(1199..1204) + /note="BsmBI" + terminator 1271..1302 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1303..1405 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1198..1853 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc aacgggagta tgaagaggcg accaggagga gtgaattatt agccgctcga + 1201 gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat acctgacctc + 1261 catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc acgtaagagg + 1321 ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg agttatcgag + 1381 attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag + 1441 gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa + 1501 tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg cgccagagtt + 1561 gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcaggct + 1621 aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga + 1681 tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg tattagaaga + 1741 atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca + 1801 ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn w-x.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn w-x.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn W-X" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc gtgcagatag acaggaagaa tcgacagaac atccgacgaa tagaggacca + 1201 cgggcagcag aagaccatgt ctaaagtgcg agactgaata caagattcgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn w-y.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn w-y.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn W-Y" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agtgggatgt gtgagtttgt tgagtgaatg gtaattgtgg gagtggtgtg + 1201 ggatttgagg tgtgctggtg tggttgtgac gaggatcaat atgtgttcgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn w-z.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn w-z.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn W-Z" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt cgtgggatgt gtgagtttgt tgagtgaatg gtaattgtgg gagtggtgtg + 1201 ggatttgagg tgtgctggtg tggttgtgac gaggatcaat atgtgttcgc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/conn y-z.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/conn y-z.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1905 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /note="From Exported" + /source="Exported" + misc_feature complement(1154..1245) + /note="conn Y-Z" + source complement(1154..1245) + /note="From Exported" + /source="Exported" + misc_feature complement(1251..1256) + /note="BsmBI" + terminator 1323..1354 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1355..1457 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1250..1905 + /note="From Exported" + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt cgtgggatgt gtgagtttgt tgagtgaatg gtaattgtgg gagtggtgtg + 1201 ggatttgagg tgtgctggtg tggttgtgac gaggatcaat atgtgcagtc gagacgaaga + 1261 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1321 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1381 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1441 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1501 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1561 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1621 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1681 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1741 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1801 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1861 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p10_tet-aptazyme.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p10_tet-aptazyme.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1984 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1185..1312 + /note="Tet-Aptazyme" + source 1154..1324 + /source="Exported" + misc_feature complement(1330..1335) + /note="BsmBI" + terminator 1402..1433 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1434..1536 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1329..1984 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt gctagacaat acaggaagga accaaacaaa caaaggcgaa agccggcgcg + 1201 tcctggattc cacgtacaaa aacataccag atttcgatct ggagaggtga agaatacgac + 1261 caccttgtac ggtacatcca gctgatgagt cccaaatagg acgaaacgcg ctcaaacaaa + 1321 caaaggtacg agacgaagac gaattctcta gatatcgctc aatactgacc atttaaatca + 1381 tacctgacct ccatagcaga aagtcaaaag cctccgaccg gaggcttttg acttgatcgg + 1441 cacgtaagag gttccaactt tcaccataat gaaataagat cactaccggg cgtatttttt + 1501 gagttatcga gattttcagg agctaaggaa gctaaaatga gccatattca acgggaaacg + 1561 tcttgctcga ggccgcgatt aaattccaac atggatgctg atttatatgg gtataaatgg + 1621 gctcgcgata atgtcgggca atcaggtgcg acaatctatc gattgtatgg gaagcccgat + 1681 gcgccagagt tgtttctgaa acatggcaaa ggtagcgttg ccaatgatgt tacagatgag + 1741 atggtcaggc taaactggct gacggaattt atgcctcttc cgaccatcaa gcattttatc + 1801 cgtactcctg atgatgcatg gttactcacc actgcgatcc cagggaaaac agcattccag + 1861 gtattagaag aatatcctga ttcaggtgaa aatattgttg atgcgctggc agtgttcctg + 1921 cgccggttgc attcgattcc tgtttgtaat tgtcctttta acggcgatcg cgtatttcgt + 1981 ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p11_sv40polya.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p11_sv40polya.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1944 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + misc_feature 1814..1944 + /note="SV40 polyA" + source 1814..1944 + /source="Exported" +ORIGIN + 1 cgtccgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg gtaacttgtt tattgcagct tataatggtt acaaataaag caatagcatc + 1861 acaaatttca caaataaagc atttttttca ctgcattcta gttgtggttt gtccaaactc + 1921 atcaatgtat cttatcatgt ctgt +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p14_cmvp.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p14_cmvp.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,86 @@ +LOCUS . 2356 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1144..1149 + /note="BsmBI" + source 5..1150 + /source="Exported" + source complement(1155..1697) + /source="Exported" + promoter complement(1191..1393) + /note="CMV promoter" + /note="human cytomegalovirus (CMV) immediate early + promoter" + enhancer complement(1394..1696) + /note="CMV enhancer" + /note="human cytomegalovirus immediate early enhancer" + misc_feature complement(1703..1708) + /note="BsmBI" + terminator 1774..1805 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1806..1908 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1702..2356 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tttcgtctcg ttgccagatc tcctcggtac cggatccagt cgacgaatta gctctgctta + 1201 tatagacctc ccaccgtaca cgcctaccgc ccatttgcgt caatggggcg gagttgttac + 1261 gacattttgg aaagtcccgt tgattttggt gccaaaacaa actcccattg acgtcaatgg + 1321 ggtggagact tggaaatccc cgtgagtcaa accgctatcc acgcccattg atgtactgcc + 1381 aaaaccgcat caccatggta atagcgatga ctaatacgta gatgtactgc caagtaggaa + 1441 agtcccataa ggtcatgtac tgggcataat gccaggcggg ccatttaccg tcattgacgt + 1501 caataggggg cgtacttggc atatgataca cttgatgtac tgccaagtgg gcagtttacc + 1561 gtaaatactc cacccattga cgtcaatgga aagtccctat tggcgttact atgggaacat + 1621 acgtcattat tgacgtcaat gggcgggggt cgttgggcgg tcagccaggc gggccattta + 1681 ccgtaagtta tgtaacggta gcgagacgtg acgaattctc tagatatcgc tcaatactga + 1741 ccatttaaat catacctgac ctccatagca gaaagtcaaa agcctccgac cggaggcttt + 1801 tgacttgatc ggcacgtaag aggttccaac tttcaccata atgaaataag atcactaccg + 1861 ggcgtatttt ttgagttatc gagattttca ggagctaagg aagctaaaat gagccatatt + 1921 caacgggaaa cgtcttgctc gaggccgcga ttaaattcca acatggatgc tgatttatat + 1981 gggtataaat gggctcgcga taatgtcggg caatcaggtg cgacaatcta tcgattgtat + 2041 gggaagcccg atgcgccaga gttgtttctg aaacatggca aaggtagcgt tgccaatgat + 2101 gttacagatg agatggtcag gctaaactgg ctgacggaat ttatgcctct tccgaccatc + 2161 aagcatttta tccgtactcc tgatgatgca tggttactca ccactgcgat cccagggaaa + 2221 acagcattcc aggtattaga agaatatcct gattcaggtg aaaatattgt tgatgcgctg + 2281 gcagtgttcc tgcgccggtt gcattcgatt cctgtttgta attgtccttt taacggcgat + 2341 cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p14_sv40p.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p14_sv40p.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 2193 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1144..1149 + /note="BsmBI" + source 5..1150 + /source="Exported" + source complement(1155..1534) + /source="Exported" + promoter complement(1205..1534) + /note="SV40 promoter" + /note="SV40 enhancer and early promoter" + rep_origin complement(1219..1354) + /note="SV40 ori" + /note="SV40 origin of replication" + misc_feature complement(1540..1545) + /note="BsmBI" + terminator 1611..1642 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1643..1745 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1539..2193 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tttcgtctcg ttgccctgtc tcttgatcag atccgaaaat ggatatacaa gctcccggga + 1201 gctttttgca aaagcctagg cctccaaaaa agcctcctca ctacttctgg aatagctcag + 1261 aggcagaggc ggcctcggcc tctgcataaa taaaaaaaat tagtcagcca tggggcggag + 1321 aatgggcgga actgggcgga gttaggggcg ggatgggcgg agttaggggc gggactatgg + 1381 ttgctgacta attgagatgc atgctttgca tacttctgcc tgctggggag cctggggact + 1441 ttccacacct ggttgctgac taattgagat gcatgctttg catacttctg cctgctgggg + 1501 agcctgggga ctttccacac cctaactgac acacgtagcg agacgtgacg aattctctag + 1561 atatcgctca atactgacca tttaaatcat acctgacctc catagcagaa agtcaaaagc + 1621 ctccgaccgg aggcttttga cttgatcggc acgtaagagg ttccaacttt caccataatg + 1681 aaataagatc actaccgggc gtattttttg agttatcgag attttcagga gctaaggaag + 1741 ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag gccgcgatta aattccaaca + 1801 tggatgctga tttatatggg tataaatggg ctcgcgataa tgtcgggcaa tcaggtgcga + 1861 caatctatcg attgtatggg aagcccgatg cgccagagtt gtttctgaaa catggcaaag + 1921 gtagcgttgc caatgatgtt acagatgaga tggtcaggct aaactggctg acggaattta + 1981 tgcctcttcc gaccatcaag cattttatcc gtactcctga tgatgcatgg ttactcacca + 2041 ctgcgatccc agggaaaaca gcattccagg tattagaaga atatcctgat tcaggtgaaa + 2101 atattgttga tgcgctggca gtgttcctgc gccggttgca ttcgattcct gtttgtaatt + 2161 gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p15_puror.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p15_puror.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,96 @@ +LOCUS . 2424 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1761 + /codon_start=1 + /gene="pac from Streptomyces" + /note="PuroR" + /note="confers resistance to puromycin" + /product="puromycin N-acetyltransferase" + /translation="TEYKPTVRLATRDDVPRAVRTLAAAFADYPATRHTVDPDRHIERV + TELQELFLTRVGLDIGKVWVADDGAAVAVWTTPESVEAGAVFAEIGPRMAELSGSRLAA + QQQMEGLLAPHRPKEPAWFLATVGVSPDHQGKGLGSAVVLPGVEAAERAGVPAFLETSA + PRNLPFYERLGFTVTADVECPKDRATWCMTRKPGA" + source 1154..1764 + /source="Exported" + misc_feature complement(1770..1775) + /note="BsmBI" + terminator 1842..1873 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1874..1976 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1769..2424 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg caaccgccac catgaccgag tacaagccca cggtgcgcct cgccacccgc + 1201 gacgacgtcc ccagggccgt acgcaccctc gccgccgcgt tcgccgacta ccccgccacg + 1261 cgccacaccg tcgatccgga ccgccacatc gagcgggtca ccgagctgca agaactcttc + 1321 ctcacgcgcg tcgggctcga catcggcaag gtgtgggtcg cggacgacgg cgccgcggtg + 1381 gcggtctgga ccacgccgga gagcgtcgaa gcgggggcgg tgttcgccga gatcggcccg + 1441 cgcatggccg agttgagcgg ttcccggctg gccgcgcagc aacagatgga aggcctcctg + 1501 gcgccgcacc ggcccaagga gcccgcgtgg ttcctggcca ccgtcggcgt gtcgcccgac + 1561 caccagggca agggtctggg cagcgccgtc gtgctccccg gagtggaggc ggccgagcgc + 1621 gccggggtgc ccgccttcct ggaaacctcc gcgccccgca acctcccctt ctacgagcgg + 1681 ctcggcttca ccgtcaccgc cgacgtcgag tgcccgaagg accgcgcgac ctggtgcatg + 1741 acccgcaagc ccggtgccta ataaccctcg agacgaagac gaattctcta gatatcgctc + 1801 aatactgacc atttaaatca tacctgacct ccatagcaga aagtcaaaag cctccgaccg + 1861 gaggcttttg acttgatcgg cacgtaagag gttccaactt tcaccataat gaaataagat + 1921 cactaccggg cgtatttttt gagttatcga gattttcagg agctaaggaa gctaaaatga + 1981 gccatattca acgggaaacg tcttgctcga ggccgcgatt aaattccaac atggatgctg + 2041 atttatatgg gtataaatgg gctcgcgata atgtcgggca atcaggtgcg acaatctatc + 2101 gattgtatgg gaagcccgat gcgccagagt tgtttctgaa acatggcaaa ggtagcgttg + 2161 ccaatgatgt tacagatgag atggtcaggc taaactggct gacggaattt atgcctcttc + 2221 cgaccatcaa gcattttatc cgtactcctg atgatgcatg gttactcacc actgcgatcc + 2281 cagggaaaac agcattccag gtattagaag aatatcctga ttcaggtgaa aatattgttg + 2341 atgcgctggc agtgttcctg cgccggttgc attcgattcc tgtttgtaat tgtcctttta + 2401 acggcgatcg cgtatttcgt ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p16_bghpolya.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p16_bghpolya.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,77 @@ +LOCUS . 2070 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + polyA_signal 1186..1410 + /note="bGH poly(A) signal" + /note="bovine growth hormone polyadenylation signal" + source 1154..1410 + /source="Exported" + misc_feature complement(1416..1421) + /note="BsmBI" + terminator 1488..1519 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1520..1622 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1415..2070 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cctctctggg gttcgaaatg accgaccaag cgacgctgtg ccttctagtt + 1201 gccagccatc tgttgtttgc ccctcccccg tgccttcctt gaccctggaa ggtgccactc + 1261 ccactgtcct ttcctaataa aatgaggaaa ttgcatcgca ttgtctgagt aggtgtcatt + 1321 ctattctggg gggtggggtg gggcaggaca gcaaggggga ggattgggaa gacaatagca + 1381 ggcatgctgg ggatgcggtg ggctctatgg gctccgagac gaagacgaat tctctagata + 1441 tcgctcaata ctgaccattt aaatcatacc tgacctccat agcagaaagt caaaagcctc + 1501 cgaccggagg cttttgactt gatcggcacg taagaggttc caactttcac cataatgaaa + 1561 taagatcact accgggcgta ttttttgagt tatcgagatt ttcaggagct aaggaagcta + 1621 aaatgagcca tattcaacgg gaaacgtctt gctcgaggcc gcgattaaat tccaacatgg + 1681 atgctgattt atatgggtat aaatgggctc gcgataatgt cgggcaatca ggtgcgacaa + 1741 tctatcgatt gtatgggaag cccgatgcgc cagagttgtt tctgaaacat ggcaaaggta + 1801 gcgttgccaa tgatgttaca gatgagatgg tcaggctaaa ctggctgacg gaatttatgc + 1861 ctcttccgac catcaagcat tttatccgta ctcctgatga tgcatggtta ctcaccactg + 1921 cgatcccagg gaaaacagca ttccaggtat tagaagaata tcctgattca ggtgaaaata + 1981 ttgttgatgc gctggcagtg ttcctgcgcc ggttgcattc gattcctgtt tgtaattgtc + 2041 cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p18_cmvp.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p18_cmvp.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,86 @@ +LOCUS . 2356 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + enhancer 1155..1457 + /note="CMV enhancer" + /note="human cytomegalovirus immediate early enhancer" + promoter 1458..1660 + /note="CMV promoter" + /note="human cytomegalovirus (CMV) immediate early + promoter" + source 1154..1696 + /source="Exported" + misc_feature complement(1702..1707) + /note="BsmBI" + terminator 1774..1805 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1806..1908 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1701..2356 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc ggtcgttaca taacttacgg taaatggccc gcctggctga ccgcccaacg + 1201 acccccgccc attgacgtca ataatgacgt atgttcccat agtaacgcca atagggactt + 1261 tccattgacg tcaatgggtg gagtatttac ggtaaactgc ccacttggca gtacatcaag + 1321 tgtatcatat gccaagtacg ccccctattg acgtcaatga cggtaaatgg cccgcctggc + 1381 attatgccca gtacatgacc ttatgggact ttcctacttg gcagtacatc tacgtattag + 1441 tcatcgctat taccatggtg atgcggtttt ggcagtacat caatgggcgt ggatagcggt + 1501 ttgactcacg gggatttcca agtctccacc ccattgacgt caatgggagt ttgttttggc + 1561 accaaaatca acgggacttt ccaaaatgtc gtaacaactc cgccccattg acgcaaatgg + 1621 gcggtaggcg tgtacggtgg gaggtctata taagcagagc taattcgtcg actggatccg + 1681 gtaccgagga gatctggtgc cgagacgaag acgaattctc tagatatcgc tcaatactga + 1741 ccatttaaat catacctgac ctccatagca gaaagtcaaa agcctccgac cggaggcttt + 1801 tgacttgatc ggcacgtaag aggttccaac tttcaccata atgaaataag atcactaccg + 1861 ggcgtatttt ttgagttatc gagattttca ggagctaagg aagctaaaat gagccatatt + 1921 caacgggaaa cgtcttgctc gaggccgcga ttaaattcca acatggatgc tgatttatat + 1981 gggtataaat gggctcgcga taatgtcggg caatcaggtg cgacaatcta tcgattgtat + 2041 gggaagcccg atgcgccaga gttgtttctg aaacatggca aaggtagcgt tgccaatgat + 2101 gttacagatg agatggtcag gctaaactgg ctgacggaat ttatgcctct tccgaccatc + 2161 aagcatttta tccgtactcc tgatgatgca tggttactca ccactgcgat cccagggaaa + 2221 acagcattcc aggtattaga agaatatcct gattcaggtg aaaatattgt tgatgcgctg + 2281 gcagtgttcc tgcgccggtt gcattcgatt cctgtttgta attgtccttt taacggcgat + 2341 cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p18_ef1ap.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p18_ef1ap.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,98 @@ +LOCUS . 3037 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + promoter 5..1183 + /note="EF-1-alpha promoter" + /note="strong constitutive promoter for human elongation + factor EF-1-alpha" + intron 236..1174 + /note="EF-1-alpha intron A" + /note="intron upstream of the start codon of human + EF-1-alpha" + source 5..1228 + /source="Exported" + misc_feature complement(1234..1239) + /note="BsmBI" + terminator 1306..1337 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1338..1440 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1233..1888 + /source="Exported" + terminator 2280..2307 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(2319..2906) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 2928..2957 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 3031..3036 + /note="BsmBI" + source 1893..3037 + /source="Exported" +ORIGIN + 1 cggtggctcc ggtgcccgtc agtgggcaga gcgcacatcg cccacagtcc ccgagaagtt + 61 ggggggaggg gtcggcaatt gaaccggtgc ctagagaagg tggcgcgggg taaactggga + 121 aagtgatgtc gtgtactggc tccgcctttt tcccgagggt gggggagaac cgtatataag + 181 tgcagtagtc gccgtgaacg ttctttttcg caacgggttt gccgccagaa cacaggtaag + 241 tgccgtgtgt ggttcccgcg ggcctggcct ctttacgggt tatggccctt gcgtgccttg + 301 aattacttcc acctggctgc agtacgtgat tcttgatccc gagcttcggg ttggaagtgg + 361 gtgggagagt tcgaggcctt gcgcttaagg agccccttcg cctcgtgctt gagttgaggc + 421 ctggcctggg cgctggggcc gccgcgtgcg aatctggtgg caccttcgcg cctgtctcgc + 481 tgctttcgat aagtctctag ccatttaaaa tttttgatga cctgctgcga cgcttttttt + 541 ctggcaagat agtcttgtaa atgcgggcca agatctgcac actggtattt cggtttttgg + 601 ggccgcgggc ggcgacgggg cccgtgcgtc ccagcgcaca tgttcggcga ggcggggcct + 661 gcgagcgcgg ccaccgagaa tcggacgggg gtagtctcaa gctggccggc ctgctctggt + 721 gcctggcctc gcgccgccgt gtatcgcccc gccctgggcg gcaaggctgg cccggtcggc + 781 accagttgcg tgagcggaaa gatggccgct tcccggccct gctgcaggga gctcaaaatg + 841 gaggacgcgg cgctcgggag agcgggcggg tgagtcaccc acacaaagga aaagggcctt + 901 tccgtcctca gccgtcgctt catgtgactc cacggagtac cgggcgccgt ccaggcacct + 961 cgattagttc tcgagctttt ggagtacgtc gtctttaggt tggggggagg ggttttatgc + 1021 gatggagttt ccccacactg agtgggtgga gactgaagtt aggccagctt ggcacttgat + 1081 gtaattctcc ttggaatttg ccctttttga gtttggatct tggttcattc tcaagcctca + 1141 gacagtggtt caaagttttt ttcttccatt tcaggtgtcg tgacgctagc gctaccggac + 1201 tcagatctcg agctcaagct tcgaattcgt gccgagacga agacgaattc tctagatatc + 1261 gctcaatact gaccatttaa atcatacctg acctccatag cagaaagtca aaagcctccg + 1321 accggaggct tttgacttga tcggcacgta agaggttcca actttcacca taatgaaata + 1381 agatcactac cgggcgtatt ttttgagtta tcgagatttt caggagctaa ggaagctaaa + 1441 atgagccata ttcaacggga aacgtcttgc tcgaggccgc gattaaattc caacatggat + 1501 gctgatttat atgggtataa atgggctcgc gataatgtcg ggcaatcagg tgcgacaatc + 1561 tatcgattgt atgggaagcc cgatgcgcca gagttgtttc tgaaacatgg caaaggtagc + 1621 gttgccaatg atgttacaga tgagatggtc aggctaaact ggctgacgga atttatgcct + 1681 cttccgacca tcaagcattt tatccgtact cctgatgatg catggttact caccactgcg + 1741 atcccaggga aaacagcatt ccaggtatta gaagaatatc ctgattcagg tgaaaatatt + 1801 gttgatgcgc tggcagtgtt cctgcgccgg ttgcattcga ttcctgtttg taattgtcct + 1861 tttaacggcg atcgcgtatt tcgtctcgct caggcgcaat cacgaatgaa taacggtttg + 1921 gttggtgcga gtgattttga tgacgagcgt aatggctggc ctgttgaaca agtctggaaa + 1981 gaaatgcata agcttttgcc attctcaccg gattcagtcg tcactcatgg tgatttctca + 2041 cttgataacc ttatttttga cgaggggaaa ttaataggtt gtattgatgt tggacgagtc + 2101 ggaatcgcag accgatacca ggatcttgcc atcctatgga actgcctcgg tgagttttct + 2161 ccttcattac agaaacggct ttttcaaaaa tatggtattg ataatcctga tatgaataaa + 2221 ttgcagtttc acttgatgct cgatgagttt ttctaatgag ggcccaaatg taatcacctg + 2281 gctcaccttc gggtgggcct ttctgcgttg ctggcgtttt tccataggct ccgcccccct + 2341 gacgagcatc acaaaaatcg atgctcaagt cagaggtggc gaaacccgac aggactataa + 2401 agataccagg cgtttccccc tggaagctcc ctcgtgcgct ctcctgttcc gaccctgccg + 2461 cttaccggat acctgtccgc ctttctccct tcgggaagcg tggcgctttc tcatagctca + 2521 cgctgtaggt atctcagttc ggtgtaggtc gttcgctcca agctgggctg tgtgcacgaa + 2581 ccccccgttc agcccgaccg ctgcgcctta tccggtaact atcgtcttga gtccaacccg + 2641 gtaagacacg acttatcgcc actggcagca gccactggta acaggattag cagagcgagg + 2701 tatgtaggcg gtgctacaga gttcttgaag tggtggccta actacggcta cactagaaga + 2761 acagtatttg gtatctgcgc tctgctgaag ccagttacct cggaaaaaga gttggtagct + 2821 cttgatccgg caaacaaacc accgctggta gcggtggttt ttttgtttgc aagcagcaga + 2881 ttacgcgcag aaaaaaagga tctcaagaag atcctttgat tttctaccga agaaaggccc + 2941 acccgtgaag gtgagccagt gagttgattg cagtccagtt acgctggagt ctgaggctcg + 3001 tcctgaatga tatcaagctt gaattcgtta cgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p19_mneogreen.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p19_mneogreen.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,98 @@ +LOCUS . 2529 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1164 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1869 + /codon_start=1 + /note="mNeonGreen" + /product="bright monomeric yellow-green fluorescent protein + derived from LanYFP (Shaner et al., 2013)" + /translation="VSKGEEDNMASLPATHELHIFGSINGVDFDMVGQGTGNPNDGYEE + LNLKSTKGDLQFSPWILVPHIGYGFHQYLPYPDGMSPFQAAMVDGSGYQVHRTMQFEDG + ASLTVNYRYTYEGSHIKGEAQVKGTGFPADGPVMTNSLTAADWCRSKKTYPNDKTIIST + FKWSYTTGNGKRYRSTARTTYTFAKPMAANYLKNQPMYVFRKTELKHSKTELNFKEWQK + AFTDVMGMDELYK" + source 1154..1869 + /source="Exported" + misc_feature complement(1875..1880) + /note="BsmBI" + terminator 1947..1978 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1979..2081 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1874..2529 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg tgcccgccac catggtgagc aagggcgagg aggataacat ggcctctctc + 1201 ccagcgacac atgagttaca catctttggc tccatcaacg gtgtggactt tgacatggtg + 1261 ggtcagggca ccggcaatcc aaatgatggt tatgaggagt taaacctgaa gtccaccaag + 1321 ggtgacctcc agttctcccc ctggattctg gtccctcata tcgggtatgg cttccatcag + 1381 tacctgccct accctgacgg gatgtcgcct ttccaggccg ccatggtaga tggctccgga + 1441 taccaagtcc atcgcacaat gcagtttgaa gatggtgcct cccttactgt taactaccgc + 1501 tacacctacg agggaagcca catcaaagga gaggcccagg tgaaggggac tggtttccct + 1561 gctgacggtc ctgtgatgac caactcgctg accgctgcgg actggtgcag gtcgaagaag + 1621 acttacccca acgacaaaac catcatcagt acctttaagt ggagttacac cactggaaat + 1681 ggcaagcgct accggagcac tgcgcggacc acctacacct ttgccaagcc aatggcggct + 1741 aactatctga agaaccagcc gatgtacgtg ttccgtaaga cggagctcaa gcactccaag + 1801 accgagctca acttcaagga gtggcaaaag gcctttaccg atgtgatggg catggacgag + 1861 ctgtacaaga gcgcgagacg aagacgaatt ctctagatat cgctcaatac tgaccattta + 1921 aatcatacct gacctccata gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg + 1981 atcggcacgt aagaggttcc aactttcacc ataatgaaat aagatcacta ccgggcgtat + 2041 tttttgagtt atcgagattt tcaggagcta aggaagctaa aatgagccat attcaacggg + 2101 aaacgtcttg ctcgaggccg cgattaaatt ccaacatgga tgctgattta tatgggtata + 2161 aatgggctcg cgataatgtc gggcaatcag gtgcgacaat ctatcgattg tatgggaagc + 2221 ccgatgcgcc agagttgttt ctgaaacatg gcaaaggtag cgttgccaat gatgttacag + 2281 atgagatggt caggctaaac tggctgacgg aatttatgcc tcttccgacc atcaagcatt + 2341 ttatccgtac tcctgatgat gcatggttac tcaccactgc gatcccaggg aaaacagcat + 2401 tccaggtatt agaagaatat cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt + 2461 tcctgcgccg gttgcattcg attcctgttt gtaattgtcc ttttaacggc gatcgcgtat + 2521 ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p19_mruby2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p19_mruby2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,99 @@ +LOCUS . 2532 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1164 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1872 + /codon_start=1 + /note="mRuby2" + /product="monomeric red fluorescent protein derived from + mRuby, with improved photophysical properties (Lam et al., + 2012)" + /translation="VSKGEELIKENMRMKVVMEGSVNGHQFKCTGEGEGNPYMGTQTMR + IKVIEGGPLPFAFDILATSFMYGSRTFIKYPKGIPDFFKQSFPEGFTWERVTRYEDGGV + VTVMQDTSLEDGCLVYHVQVRGVNFPSNGPVMQKKTKGWEPNTEMMYPADGGLRGYTHM + ALKVDGGGHLSCSFVTTYRSKKTVGNIKMPGIHAVDHRLERLEESDNEMFVVQREHAVA + KFAGLGGGMDELYK" + source 1154..1872 + /source="Exported" + misc_feature complement(1878..1883) + /note="BsmBI" + terminator 1950..1981 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1982..2084 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1877..2532 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg tgcccgccac catggtgtct aagggcgaag agctgatcaa ggaaaatatg + 1201 cgtatgaagg tggtcatgga aggttcggtc aacggccacc aattcaaatg cacaggtgaa + 1261 ggagaaggca atccgtacat gggaactcaa accatgagga tcaaagtcat cgagggagga + 1321 cccctgccat ttgcctttga cattcttgcc acgtcgttca tgtatggcag ccgtactttt + 1381 atcaagtacc cgaaaggcat tcctgatttc tttaaacagt cctttcctga gggttttact + 1441 tgggaaagag ttacgagata cgaagatggt ggagtcgtca ccgtcatgca ggacaccagc + 1501 cttgaggatg gctgtctcgt ttaccacgtc caagtcagag gggtaaactt tccctccaat + 1561 ggtcccgtga tgcagaagaa gaccaagggt tgggagccta atacagagat gatgtatcca + 1621 gcagatggtg gtctgagggg atacactcat atggcactga aagttgatgg tggtggccat + 1681 ctgtcttgct ctttcgtaac aacttacagg tcaaaaaaga ccgtcgggaa catcaagatg + 1741 cccggtatcc atgccgttga tcaccgcctg gaaaggttag aggaaagtga caatgaaatg + 1801 ttcgtagtac aacgcgaaca cgcagttgcc aagttcgccg ggcttggtgg tgggatggac + 1861 gagctgtaca agagcgcgag acgaagacga attctctaga tatcgctcaa tactgaccat + 1921 ttaaatcata cctgacctcc atagcagaaa gtcaaaagcc tccgaccgga ggcttttgac + 1981 ttgatcggca cgtaagaggt tccaactttc accataatga aataagatca ctaccgggcg + 2041 tattttttga gttatcgaga ttttcaggag ctaaggaagc taaaatgagc catattcaac + 2101 gggaaacgtc ttgctcgagg ccgcgattaa attccaacat ggatgctgat ttatatgggt + 2161 ataaatgggc tcgcgataat gtcgggcaat caggtgcgac aatctatcga ttgtatggga + 2221 agcccgatgc gccagagttg tttctgaaac atggcaaagg tagcgttgcc aatgatgtta + 2281 cagatgagat ggtcaggcta aactggctga cggaatttat gcctcttccg accatcaagc + 2341 attttatccg tactcctgat gatgcatggt tactcaccac tgcgatccca gggaaaacag + 2401 cattccaggt attagaagaa tatcctgatt caggtgaaaa tattgttgat gcgctggcag + 2461 tgttcctgcg ccggttgcat tcgattcctg tttgtaattg tccttttaac ggcgatcgcg + 2521 tatttcgtct cg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p19_mtagbfp2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p19_mtagbfp2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,99 @@ +LOCUS . 2532 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1164 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1872 + /codon_start=1 + /note="mTagBFP2" + /note="mammalian codon-optimized" + /product="enhanced monomeric blue fluorescent protein + (Subach et al., 2011)" + /translation="VSKGEELIKENMHMKLYMEGTVDNHHFKCTSEGEGKPYEGTQTMR + IKVVEGGPLPFAFDILATSFLYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGV + LTATQDTSLQDGCLIYNVKIRGVNFTSNGPVMQKKTLGWEAFTETLYPADGGLEGRNDM + ALKLVGGSHLIANAKTTYRSKKPAKNLKMPGVYYVDYRLERIKEANNETYVEQHEVAVA + RYCDLPSKLGHKLN" + source 1154..1872 + /source="Exported" + misc_feature complement(1878..1883) + /note="BsmBI" + terminator 1950..1981 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1982..2084 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1877..2532 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg tgcccgccac catggtgtct aagggcgaag agctgattaa ggagaacatg + 1201 cacatgaagc tgtacatgga gggcaccgtg gacaaccatc acttcaagtg cacatccgag + 1261 ggcgaaggca agccctacga gggcacccag accatgagaa tcaaggtggt cgagggcggc + 1321 cctctcccct tcgccttcga catcctggct actagcttcc tctacggcag caagaccttc + 1381 atcaaccaca cccagggcat ccccgacttc ttcaagcagt ccttccctga gggcttcaca + 1441 tgggagagag tcaccacata cgaagacggg ggcgtgctga ccgctaccca ggacaccagc + 1501 ctccaggacg gctgcctcat ctacaacgtc aagatcagag gggtgaactt cacatccaac + 1561 ggccctgtga tgcagaagaa aacactcggc tgggaggcct tcaccgaaac gctgtacccc + 1621 gctgacggcg gcctggaagg cagaaacgac atggccctga agctcgtggg cgggagccat + 1681 ctgatcgcaa acgccaagac cacatataga tccaagaaac ccgctaagaa cctcaagatg + 1741 cctggcgtct actatgtgga ctacagactg gaaagaatca aggaggccaa caacgaaacc + 1801 tacgtcgagc agcacgaggt ggcagtggcc agatactgcg acctccctag caaactgggg + 1861 cacaagctta atagcgcgag acgaagacga attctctaga tatcgctcaa tactgaccat + 1921 ttaaatcata cctgacctcc atagcagaaa gtcaaaagcc tccgaccgga ggcttttgac + 1981 ttgatcggca cgtaagaggt tccaactttc accataatga aataagatca ctaccgggcg + 2041 tattttttga gttatcgaga ttttcaggag ctaaggaagc taaaatgagc catattcaac + 2101 gggaaacgtc ttgctcgagg ccgcgattaa attccaacat ggatgctgat ttatatgggt + 2161 ataaatgggc tcgcgataat gtcgggcaat caggtgcgac aatctatcga ttgtatggga + 2221 agcccgatgc gccagagttg tttctgaaac atggcaaagg tagcgttgcc aatgatgtta + 2281 cagatgagat ggtcaggcta aactggctga cggaatttat gcctcttccg accatcaagc + 2341 attttatccg tactcctgat gatgcatggt tactcaccac tgcgatccca gggaaaacag + 2401 cattccaggt attagaagaa tatcctgatt caggtgaaaa tattgttgat gcgctggcag + 2461 tgttcctgcg ccggttgcat tcgattcctg tttgtaattg tccttttaac ggcgatcgcg + 2521 tatttcgtct cg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p19_tet-on-3g.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p19_tet-on-3g.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,95 @@ +LOCUS . 2574 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="Kozak" + CDS 1162..1908 + /codon_start=1 + /note="Tet-On(R) 3G" + /product="modified rtTA protein that binds tightly to + promoters containing the tet operator in the presence of + doxycycline" + /translation="MSRLDKSKVINSALELLNGVGIEGLTTRKLAQKLGVEQPTLYWHV + KNKRALLDALPIEMLDRHHTHSCPLEGESWQDFLRNNAKSYRCALLSHRDGAKVHLGTR + PTEKQYETLENQLAFLCQQGFSLENALYALSAVGHFTLGCVLEEQEHQVAKEERETPTT + DSMPPLLKQAIELFDRQGAEPAFLFGLELIICGLEKQLKCESGGPTDALDDFDLDMLPA + DALDDFDLDMLPADALDDFDLDMLPGS" + source 1154..1914 + /source="Exported" + misc_feature complement(1920..1925) + /note="BsmBI" + terminator 1992..2023 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 2024..2126 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1919..2574 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg tgcccgccac catgtctaga ctggacaaga gcaaagtcat aaactctgct + 1201 ctggaattac tcaatggagt cggtatcgaa ggcctgacga caaggaaact cgctcaaaag + 1261 ctgggagttg agcagcctac cctgtactgg cacgtgaaga acaagcgggc cctgctcgat + 1321 gccctgccaa tcgagatgct ggacaggcat catacccact cctgccccct ggaaggcgag + 1381 tcatggcaag actttctgcg gaacaacgcc aagtcatacc gctgtgctct cctctcacat + 1441 cgcgacgggg ctaaagtgca tctcggcacc cgcccaacag agaaacagta cgaaaccctg + 1501 gaaaatcagc tcgcgttcct gtgtcagcaa ggcttctccc tggagaacgc actgtacgct + 1561 ctgtccgccg tgggccactt tacactgggc tgcgtattgg aggaacagga gcatcaagta + 1621 gcaaaagagg aaagagagac acctaccacc gattctatgc ccccacttct gaaacaagca + 1681 attgagctgt tcgaccggca gggagccgaa cctgccttcc ttttcggcct ggaactaatc + 1741 atatgtggcc tggagaaaca gctaaagtgc gaaagcggcg ggccgaccga cgcccttgac + 1801 gattttgact tagacatgct cccagccgat gcccttgacg actttgacct tgatatgctg + 1861 cctgctgacg ctcttgacga ttttgacctt gacatgctcc ccgggtcact aagtagcgcg + 1921 agacgaagac gaattctcta gatatcgctc aatactgacc atttaaatca tacctgacct + 1981 ccatagcaga aagtcaaaag cctccgaccg gaggcttttg acttgatcgg cacgtaagag + 2041 gttccaactt tcaccataat gaaataagat cactaccggg cgtatttttt gagttatcga + 2101 gattttcagg agctaaggaa gctaaaatga gccatattca acgggaaacg tcttgctcga + 2161 ggccgcgatt aaattccaac atggatgctg atttatatgg gtataaatgg gctcgcgata + 2221 atgtcgggca atcaggtgcg acaatctatc gattgtatgg gaagcccgat gcgccagagt + 2281 tgtttctgaa acatggcaaa ggtagcgttg ccaatgatgt tacagatgag atggtcaggc + 2341 taaactggct gacggaattt atgcctcttc cgaccatcaa gcattttatc cgtactcctg + 2401 atgatgcatg gttactcacc actgcgatcc cagggaaaac agcattccag gtattagaag + 2461 aatatcctga ttcaggtgaa aatattgttg atgcgctggc agtgttcctg cgccggttgc + 2521 attcgattcc tgtttgtaat tgtcctttta acggcgatcg cgtatttcgt ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p1_5'-itr-pb.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p1_5'-itr-pb.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,78 @@ +LOCUS . 2163 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature complement(1174..1483) + /note="5'-ITR-PB" + source 1154..1503 + /source="Exported" + misc_feature complement(1509..1514) + /note="BsmBI" + terminator 1581..1612 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1613..1715 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1508..2163 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt aggactatcc taacgtccac ttcttaaccc tagaaagata gtctgcgtaa + 1201 aattgacgca tgcattcttg aaatattgct ctctctttct aaatagcgcg aatccgtcgc + 1261 tgtgcattta ggacatctca gtcgccgctt ggagctcccg tgaggcgtgc ttgtcaatgc + 1321 ggtaagtgtc actgattttg aactataacg accgcgtgag tcaaaatgac gcatgattat + 1381 cttttacgtg acttttaaga tttaactcat acgataatta tattgttatt tcatgttcta + 1441 cttacgtgat aacttattat atatatattt tcttgttata gatcaggtgg atgaaagcgt + 1501 gtaatggcga gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat + 1561 acctgacctc catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc + 1621 acgtaagagg ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg + 1681 agttatcgag attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt + 1741 cttgctcgag gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg + 1801 ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg + 1861 cgccagagtt gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga + 1921 tggtcaggct aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc + 1981 gtactcctga tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg + 2041 tattagaaga atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc + 2101 gccggttgca ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc + 2161 tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p1_5'ha-haavs1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p1_5'ha-haavs1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,87 @@ +LOCUS . 2723 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..2063 + /note="AVVS1-5'HA" + source 1154..2063 + /source="Exported" + misc_feature complement(2069..2074) + /note="BsmBI" + terminator 2141..2172 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 2173..2275 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 2068..2723 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt agggcacctc tccatcctct tgctttcttt gcctggacac cccgttctcc + 1201 tgtggattcg ggtcacctct cactcctttc atttgggcag ctcccctacc ccccttacct + 1261 ctctagtctg tgctagctct tccagccccc tgtcatggca tcttccaggg gtccgagagc + 1321 tcagctagtc ttcttcctcc aacccgggcc cctatgtcca cttcaggaca gcatgtttgc + 1381 tgcctccagg gatcctgtgt ccccgagctg ggaccacctt atattcccag ggccggttaa + 1441 tgtggctctg gttctgggta cttttatctg tcccctccac cccacagtgg ggccactagg + 1501 gacaggattg gtgacagaaa agccccatcc ttaggcctcc tccttcctag tctcctgata + 1561 ttgggtctaa cccccacctc ctgttaggca gattccttat ctggtgacac acccccattt + 1621 cctggagcca tctctctcct tgccagaacc tctaaggttt gcttacgatg gagccagaga + 1681 ggatcctggg agggagagct tggcaggggg tgggagggaa gggggggatg cgtgacctgc + 1741 ccggttctca gtggccaccc tgcgctaccc tctcccagaa cctgagctgc tctgacgcgg + 1801 ctgtctggtg cgtttcactg atcctggtgc tgcagcttcc ttacacttcc caagaggaga + 1861 agcagtttgg aaaaacaaaa tcagaataag ttggtcctga gttctaactt tggctcttca + 1921 cctttctagt ccccaattta tattgttcct ccgtgcgtca gttttacctg tgagataagg + 1981 ccagtagcca gccccgtcct ggcagggctg tggtgaggag gggggtgtcc gtgtggaaaa + 2041 ctccctttgt gagaatggtg cgtatggcga gacgaagacg aattctctag atatcgctca + 2101 atactgacca tttaaatcat acctgacctc catagcagaa agtcaaaagc ctccgaccgg + 2161 aggcttttga cttgatcggc acgtaagagg ttccaacttt caccataatg aaataagatc + 2221 actaccgggc gtattttttg agttatcgag attttcagga gctaaggaag ctaaaatgag + 2281 ccatattcaa cgggaaacgt cttgctcgag gccgcgatta aattccaaca tggatgctga + 2341 tttatatggg tataaatggg ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg + 2401 attgtatggg aagcccgatg cgccagagtt gtttctgaaa catggcaaag gtagcgttgc + 2461 caatgatgtt acagatgaga tggtcaggct aaactggctg acggaattta tgcctcttcc + 2521 gaccatcaag cattttatcc gtactcctga tgatgcatgg ttactcacca ctgcgatccc + 2581 agggaaaaca gcattccagg tattagaaga atatcctgat tcaggtgaaa atattgttga + 2641 tgcgctggca gtgttcctgc gccggttgca ttcgattcct gtttgtaatt gtccttttaa + 2701 cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p20_ct-minute-nes.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p20_ct-minute-nes.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1848 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1156..1188 + /codon_start=1 + /note="minute NES" + /translation="MTKKFGTLTI" + source 1154..1188 + /source="Exported" + misc_feature complement(1194..1199) + /note="BsmBI" + terminator 1266..1297 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1298..1400 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1193..1848 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gcggaatgac caagaagttc ggcaccctga ccatctaatg gacgagacga + 1201 agacgaattc tctagatatc gctcaatact gaccatttaa atcatacctg acctccatag + 1261 cagaaagtca aaagcctccg accggaggct tttgacttga tcggcacgta agaggttcca + 1321 actttcacca taatgaaata agatcactac cgggcgtatt ttttgagtta tcgagatttt + 1381 caggagctaa ggaagctaaa atgagccata ttcaacggga aacgtcttgc tcgaggccgc + 1441 gattaaattc caacatggat gctgatttat atgggtataa atgggctcgc gataatgtcg + 1501 ggcaatcagg tgcgacaatc tatcgattgt atgggaagcc cgatgcgcca gagttgtttc + 1561 tgaaacatgg caaaggtagc gttgccaatg atgttacaga tgagatggtc aggctaaact + 1621 ggctgacgga atttatgcct cttccgacca tcaagcattt tatccgtact cctgatgatg + 1681 catggttact caccactgcg atcccaggga aaacagcatt ccaggtatta gaagaatatc + 1741 ctgattcagg tgaaaatatt gttgatgcgc tggcagtgtt cctgcgccgg ttgcattcga + 1801 ttcctgtttg taattgtcct tttaacggcg atcgcgtatt tcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p20_ct-nes.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p20_ct-nes.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1857 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1156..1197 + /codon_start=1 + /note="NES" + /translation="ALALKLAGLDIGG" + source 1154..1197 + /source="Exported" + misc_feature complement(1203..1208) + /note="BsmBI" + terminator 1275..1306 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1307..1409 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1202..1857 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gcggagccct ggccctgaag ctggccggac tggacatcgg aggctaatgg + 1201 acgagacgaa gacgaattct ctagatatcg ctcaatactg accatttaaa tcatacctga + 1261 cctccatagc agaaagtcaa aagcctccga ccggaggctt ttgacttgat cggcacgtaa + 1321 gaggttccaa ctttcaccat aatgaaataa gatcactacc gggcgtattt tttgagttat + 1381 cgagattttc aggagctaag gaagctaaaa tgagccatat tcaacgggaa acgtcttgct + 1441 cgaggccgcg attaaattcc aacatggatg ctgatttata tgggtataaa tgggctcgcg + 1501 ataatgtcgg gcaatcaggt gcgacaatct atcgattgta tgggaagccc gatgcgccag + 1561 agttgtttct gaaacatggc aaaggtagcg ttgccaatga tgttacagat gagatggtca + 1621 ggctaaactg gctgacggaa tttatgcctc ttccgaccat caagcatttt atccgtactc + 1681 ctgatgatgc atggttactc accactgcga tcccagggaa aacagcattc caggtattag + 1741 aagaatatcc tgattcaggt gaaaatattg ttgatgcgct ggcagtgttc ctgcgccggt + 1801 tgcattcgat tcctgtttgt aattgtcctt ttaacggcga tcgcgtattt cgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p20_linker3.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p20_linker3.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1850 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1156..1188 + /codon_start=1 + /note="Linker 3" + /translation="GGGSGGGGSAS" + source 1154..1190 + /source="Exported" + misc_feature complement(1196..1201) + /note="BsmBI" + terminator 1268..1299 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1300..1402 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1195..1850 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gcggaggcgg aggaagcggc ggaggaggct cagccagcgc tggacgagac + 1201 gaagacgaat tctctagata tcgctcaata ctgaccattt aaatcatacc tgacctccat + 1261 agcagaaagt caaaagcctc cgaccggagg cttttgactt gatcggcacg taagaggttc + 1321 caactttcac cataatgaaa taagatcact accgggcgta ttttttgagt tatcgagatt + 1381 ttcaggagct aaggaagcta aaatgagcca tattcaacgg gaaacgtctt gctcgaggcc + 1441 gcgattaaat tccaacatgg atgctgattt atatgggtat aaatgggctc gcgataatgt + 1501 cgggcaatca ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc cagagttgtt + 1561 tctgaaacat ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg tcaggctaaa + 1621 ctggctgacg gaatttatgc ctcttccgac catcaagcat tttatccgta ctcctgatga + 1681 tgcatggtta ctcaccactg cgatcccagg gaaaacagca ttccaggtat tagaagaata + 1741 tcctgattca ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc ggttgcattc + 1801 gattcctgtt tgtaattgtc cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p20_p2a.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p20_p2a.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,80 @@ +LOCUS . 1874 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1156..1212 + /codon_start=1 + /note="P2A-Porcine teschovirus-1" + /note="Eukaryotic ribosomes fail to insert a peptide bond + between the Gly and Pro residues, yielding separate + polypeptides." + /product="2A peptide from porcine teschovirus-1 + polyprotein" + /translation="ATNFSLLKQAGDVEENPGP" + source 1154..1214 + /source="Exported" + misc_feature complement(1220..1225) + /note="BsmBI" + terminator 1292..1323 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1324..1426 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1219..1874 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga gcggcgctac taacttcagc ctgctgaagc aggctggcga cgtggaggag + 1201 aaccctggac cttctggacg agacgaagac gaattctcta gatatcgctc aatactgacc + 1261 atttaaatca tacctgacct ccatagcaga aagtcaaaag cctccgaccg gaggcttttg + 1321 acttgatcgg cacgtaagag gttccaactt tcaccataat gaaataagat cactaccggg + 1381 cgtatttttt gagttatcga gattttcagg agctaaggaa gctaaaatga gccatattca + 1441 acgggaaacg tcttgctcga ggccgcgatt aaattccaac atggatgctg atttatatgg + 1501 gtataaatgg gctcgcgata atgtcgggca atcaggtgcg acaatctatc gattgtatgg + 1561 gaagcccgat gcgccagagt tgtttctgaa acatggcaaa ggtagcgttg ccaatgatgt + 1621 tacagatgag atggtcaggc taaactggct gacggaattt atgcctcttc cgaccatcaa + 1681 gcattttatc cgtactcctg atgatgcatg gttactcacc actgcgatcc cagggaaaac + 1741 agcattccag gtattagaag aatatcctga ttcaggtgaa aatattgttg atgcgctggc + 1801 agtgttcctg cgccggttgc attcgattcc tgtttgtaat tgtcctttta acggcgatcg + 1861 cgtatttcgt ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_dmra.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_dmra.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 2140 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2134 + /codon_start=1 + /note="FKBP (DmrA)" + /product="human FK506-binding protein FKBP12" + /translation="GVQVETISPGDGRTFPKRGQTCVVHYTGMLEDGKKFDSSRDRNKP + FKFMLGKQEVIRGWEEGVAQMSVGQRAKLTISPDYAYGATGHPGIIPPHATLVFDVELL + KLE" + source 1814..2140 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggaggagtgc aggtggaaac catctcccca ggcgacgggc gcaccttccc + 1861 caagcgcggc cagacctgcg tggtgcacta caccgggatg cttgaagatg gaaagaaatt + 1921 tgattcctcc cgggacagaa acaagccctt taagtttatg ctaggcaagc aggaggtgat + 1981 ccgaggctgg gaagaagggg ttgcccagat gagtgtgggt cagagagcca aactgactat + 2041 atctccagat tatgcctatg gtgccactgg gcacccaggc atcatcccac cacatgccac + 2101 tctcgtcttc gatgtggagc ttctaaaact ggaataataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_mkate2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_mkate2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,90 @@ +LOCUS . 2509 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2506 + /codon_start=1 + /gene="mKate2" + /note="mKate2" + /translation="VSELIKENMHMKLYMEGTVNNHHFKCTSEGEGKPYEGTQTMRIKA + VEGGPLPFAFDILATSFMYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGVLTA + TQDTSLQDGCLIYNVKIRGVNFPSNGPVMQKKTLGWEASTETLYPADGGLEGRADMALK + LVGGGHLICNLKTTYRSKKPAKNLKMPGVYYVDRRLERIKEADKETYVEQHEVAVARYC + DLPSKLGHR" + source 1814..2509 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggagtgagcg agctgattaa ggagaacatg cacatgaagc tgtacatgga + 1861 gggcaccgtg aacaaccacc acttcaagtg cacatccgag ggcgaaggca agccctacga + 1921 gggcacccag accatgagaa tcaaggcggt cgagggcggc cctctcccct tcgccttcga + 1981 catcctggct accagcttca tgtacggcag caaaaccttc atcaaccaca cccagggcat + 2041 ccccgacttc tttaagcagt ccttccccga gggcttcaca tgggagagag tcaccacata + 2101 cgaagacggg ggcgtgctga ccgctaccca ggacaccagc ctccaggacg gctgcctcat + 2161 ctacaacgtc aagatcagag gggtgaactt cccatccaac ggccctgtga tgcagaagaa + 2221 aacactcggc tgggaggcct ccaccgaaac cctgtacccc gctgacggcg gcctggaagg + 2281 cagagccgac atggccctga agctcgtggg cgggggccac ctgatctgca acttgaagac + 2341 cacatacaga tccaagaaac ccgctaagaa cctcaagatg cccggcgtct actatgtgga + 2401 cagaagactg gaaagaatca aggaggccga caaagaaacc tacgtcgagc agcacgaggt + 2461 ggctgtggcc agatactgcg acctccctag caaactgggg cacagataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_mneogreen.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_mneogreen.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,92 @@ +LOCUS . 2521 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2518 + /codon_start=1 + /note="mNeonGreen" + /product="bright monomeric yellow-green fluorescent protein + derived from LanYFP (Shaner et al., 2013)" + /translation="VSKGEEDNMASLPATHELHIFGSINGVDFDMVGQGTGNPNDGYEE + LNLKSTKGDLQFSPWILVPHIGYGFHQYLPYPDGMSPFQAAMVDGSGYQVHRTMQFEDG + ASLTVNYRYTYEGSHIKGEAQVKGTGFPADGPVMTNSLTAADWCRSKKTYPNDKTIIST + FKWSYTTGNGKRYRSTARTTYTFAKPMAANYLKNQPMYVFRKTELKHSKTELNFKEWQK + AFTDVMGMDELYK" + source 1814..2521 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggagtgagca agggcgagga ggataacatg gcctctctcc cagcgacaca + 1861 tgagttacac atctttggct ccatcaacgg tgtggacttt gacatggtgg gtcagggcac + 1921 cggcaatcca aatgatggtt atgaggagtt aaacctgaag tccaccaagg gtgacctcca + 1981 gttctccccc tggattctgg tccctcatat cgggtatggc ttccatcagt acctgcccta + 2041 ccctgacggg atgtcgcctt tccaggccgc catggtagat ggctccggat accaagtcca + 2101 tcgcacaatg cagtttgaag atggtgcctc ccttactgtt aactaccgct acacctacga + 2161 gggaagccac atcaaaggag aggcccaggt gaaggggact ggtttccctg ctgacggtcc + 2221 tgtgatgacc aactcgctga ccgctgcgga ctggtgcagg tcgaagaaga cttaccccaa + 2281 cgacaaaacc atcatcagta cctttaagtg gagttacacc actggaaatg gcaagcgcta + 2341 ccggagcact gcgcggacca cctacacctt tgccaagcca atggcggcta actatctgaa + 2401 gaaccagccg atgtacgtgt tccgtaagac ggagctcaag cactccaaga ccgagctcaa + 2461 cttcaaggag tggcaaaagg cctttaccga tgtgatgggc atggacgagc tgtacaagta + 2521 a +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_mruby2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_mruby2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2524 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2521 + /codon_start=1 + /note="mRuby2" + /product="monomeric red fluorescent protein derived from + mRuby, with improved photophysical properties (Lam et al., + 2012)" + /translation="VSKGEELIKENMRMKVVMEGSVNGHQFKCTGEGEGNPYMGTQTMR + IKVIEGGPLPFAFDILATSFMYGSRTFIKYPKGIPDFFKQSFPEGFTWERVTRYEDGGV + VTVMQDTSLEDGCLVYHVQVRGVNFPSNGPVMQKKTKGWEPNTEMMYPADGGLRGYTHM + ALKVDGGGHLSCSFVTTYRSKKTVGNIKMPGIHAVDHRLERLEESDNEMFVVQREHAVA + KFAGLGGGMDELYK" + source 1814..2524 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggagtgtcta agggcgaaga gctgatcaag gaaaatatgc gtatgaaggt + 1861 ggtcatggaa ggttcggtca acggccacca attcaaatgc acaggtgaag gagaaggcaa + 1921 tccgtacatg ggaactcaaa ccatgaggat caaagtcatc gagggaggac ccctgccatt + 1981 tgcctttgac attcttgcca cgtcgttcat gtatggcagc cgtactttta tcaagtaccc + 2041 gaaaggcatt cctgatttct ttaaacagtc ctttcctgag ggttttactt gggaaagagt + 2101 tacgagatac gaagatggtg gagtcgtcac cgtcatgcag gacaccagcc ttgaggatgg + 2161 ctgtctcgtt taccacgtcc aagtcagagg ggtaaacttt ccctccaatg gtcccgtgat + 2221 gcagaagaag accaagggtt gggagcctaa tacagagatg atgtatccag cagatggtgg + 2281 tctgagggga tacactcata tggcactgaa agttgatggt ggtggccatc tgtcttgctc + 2341 tttcgtaaca acttacaggt caaaaaagac cgtcgggaac atcaagatgc ccggtatcca + 2401 tgccgttgat caccgcctgg aaaggttaga ggaaagtgac aatgaaatgt tcgtagtaca + 2461 acgcgaacac gcagttgcca agttcgccgg gcttggtggt gggatggacg agctgtacaa + 2521 gtaa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_mtagbfp2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_mtagbfp2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2524 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2521 + /codon_start=1 + /note="mTagBFP2" + /note="mammalian codon-optimized" + /product="enhanced monomeric blue fluorescent protein + (Subach et al., 2011)" + /translation="VSKGEELIKENMHMKLYMEGTVDNHHFKCTSEGEGKPYEGTQTMR + IKVVEGGPLPFAFDILATSFLYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGV + LTATQDTSLQDGCLIYNVKIRGVNFTSNGPVMQKKTLGWEAFTETLYPADGGLEGRNDM + ALKLVGGSHLIANAKTTYRSKKPAKNLKMPGVYYVDYRLERIKEANNETYVEQHEVAVA + RYCDLPSKLGHKLN" + source 1814..2524 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggagtgtcta agggcgaaga gctgattaag gagaacatgc acatgaagct + 1861 gtacatggag ggcaccgtgg acaaccatca cttcaagtgc acatccgagg gcgaaggcaa + 1921 gccctacgag ggcacccaga ccatgagaat caaggtggtc gagggcggcc ctctcccctt + 1981 cgccttcgac atcctggcta ctagcttcct ctacggcagc aagaccttca tcaaccacac + 2041 ccagggcatc cccgacttct tcaagcagtc cttccctgag ggcttcacat gggagagagt + 2101 caccacatac gaagacgggg gcgtgctgac cgctacccag gacaccagcc tccaggacgg + 2161 ctgcctcatc tacaacgtca agatcagagg ggtgaacttc acatccaacg gccctgtgat + 2221 gcagaagaaa acactcggct gggaggcctt caccgaaacg ctgtaccccg ctgacggcgg + 2281 cctggaaggc agaaacgaca tggccctgaa gctcgtgggc gggagccatc tgatcgcaaa + 2341 cgccaagacc acatatagat ccaagaaacc cgctaagaac ctcaagatgc ctggcgtcta + 2401 ctatgtggac tacagactgg aaagaatcaa ggaggccaac aacgaaacct acgtcgagca + 2461 gcacgaggtg gcagtggcca gatactgcga cctccctagc aaactggggc acaagcttaa + 2521 ttaa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p21_puror.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p21_puror.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,90 @@ +LOCUS . 2413 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..2410 + /codon_start=1 + /gene="pac from Streptomyces" + /note="PuroR" + /note="confers resistance to puromycin" + /product="puromycin N-acetyltransferase" + /translation="TEYKPTVRLATRDDVPRAVRTLAAAFADYPATRHTVDPDRHIERV + TELQELFLTRVGLDIGKVWVADDGAAVAVWTTPESVEAGAVFAEIGPRMAELSGSRLAA + QQQMEGLLAPHRPKEPAWFLATVGVSPDHQGKGLGSAVVLPGVEAAERAGVPAFLETSA + PRNLPFYERLGFTVTADVECPKDRATWCMTRKPGA" + source 1814..2413 + /source="Exported" +ORIGIN + 1 gttgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgt ggaaccgagt acaagcccac ggtgcgcctc gccacccgcg acgacgtccc + 1861 cagggccgta cgcaccctcg ccgccgcgtt cgccgactac cccgccacgc gccacaccgt + 1921 cgatccggac cgccacatcg agcgggtcac cgagctgcaa gaactcttcc tcacgcgcgt + 1981 cgggctcgac atcggcaagg tgtgggtcgc ggacgacggc gccgcggtgg cggtctggac + 2041 cacgccggag agcgtcgaag cgggggcggt gttcgccgag atcggcccgc gcatggccga + 2101 gttgagcggt tcccggctgg ccgcgcagca acagatggaa ggcctcctgg cgccgcaccg + 2161 gcccaaggag cccgcgtggt tcctggccac cgtcggcgtg tcgcccgacc accagggcaa + 2221 gggtctgggc agcgccgtcg tgctccccgg agtggaggcg gccgagcgcg ccggggtgcc + 2281 cgccttcctg gaaacctccg cgccccgcaa cctccccttc tacgagcggc tcggcttcac + 2341 cgtcaccgcc gacgtcgagt gcccgaagga ccgcgcgacc tggtgcatga cccgcaagcc + 2401 cggtgcctaa taa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p22_pgkpolya.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p22_pgkpolya.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 2042 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + polyA_signal 1837..2042 + /note="PGK-polyA" + source 1814..2042 + /source="Exported" +ORIGIN + 1 cgaacgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg ttgccttgag catctgactt ctggctaaat tgatgatcta ttaaacaata + 1861 aagatgtcca catggaagtt ttttcctgtc atactttgtt aagaagggtg agaacagagt + 1921 acctacattt tgaatggaag gattggagct acgggggtgg gggtggggtg ggattagata + 1981 aatgcctgct ctttactgaa ggctctttac tattgcttta tgataatgtt tcatagttgg + 2041 at +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p23_insulatorfb.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p23_insulatorfb.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1954 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + misc_feature 1814..1954 + /note="Insulator FB-pos23" + source 1814..1954 + /source="Exported" +ORIGIN + 1 cacgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgc gaaggccgcg aattctgaaa gaccccacct gtaggtttgg caagcccagg + 1861 gatgtacgtc cctaacccgc tagggggcag caactagtcc caggcctgca ctgccgcctg + 1921 ccggcagggg tccagtcgct agcgcatgcc tgca +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p24_3'ha_haavs1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p24_3'ha_haavs1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 2446 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + misc_feature 1814..2446 + /note="3'-HA_hAAVS1" + source 1814..2446 + /source="Exported" +ORIGIN + 1 actgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgc acgccgcctc tactcccttt ctctttctcc atccttcttt ccttaaagag + 1861 tccccagtgc tatctgggac atattcctcc gcccagagca gggtcccgct tccctaaggc + 1921 cctgctctgg gcttctgggt ttgagtcctt ggcaagccca ggagaggcgc tcaggcttcc + 1981 ctgtccccct tcctcgtcca ccatctcatg cccctggctc tcctgcccct tccctacagg + 2041 ggttcctggc tctgctcttc agactgagcc ccgttcccct gcatccccgt tcccctgcat + 2101 cccccttccc ctgcatcccc cagaggcccc aggccaccta cttggcctgg accccacgag + 2161 aggccacccc agccctgtct accaggctgc cttttgggtg gattctcctc caactgtggg + 2221 gtgactgctt ggcaaactca ctcttcgggg tatcccagga ggcctggagc attggggtgg + 2281 gctggggttc agagaggagg gattcccttc tcaggttacg tggccaagaa gcaggggagc + 2341 tgggtttggg tcaggtctgg gtgtggggtg accagcttat gctgtttgcc caggacagcc + 2401 tagttttagc actgaaaccc tcagtctaat ggttacaaat aaagca +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p24_3'pb.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p24_3'pb.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 2060 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + misc_feature complement(1834..2039) + /note="Piggy 3'" + source 1814..2060 + /source="Exported" +ORIGIN + 1 actgcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgc acgtgcatcc acgatctagt cactttgtta ctttatagaa gaaattttga + 1861 gtttttgttt ttttttaata aataaataaa cataaataaa ttgtttgttg aatttattat + 1921 tagtatgtaa gtgtaaatat aataaaactt aatatctatt caaattaata aataaacgtc + 1981 aattttacgc atgattatct ttaacgtacg tcacaatatg attatctttc tagggttaac + 2041 tactcaccct cgagcataac +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p25_sv40-ori.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p25_sv40-ori.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1949 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + rep_origin 1814..1949 + /note="SV40-ORI" + /note="SV40 origin of replication" + source 1814..1949 + /source="Exported" +ORIGIN + 1 acgacgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcga ctgatcccgc ccctaactcc gcccagttcc gcccattctc cgccccatgg + 1861 ctgactaatt ttttttattt atgcagaggc cgaggccgcc tctgcctctg agctattcca + 1921 gaagtagtga ggaggctttt ttggaggcc +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p2_insulatorfb.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p2_insulatorfb.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1954 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1294 + /note="Insulator FB" + source 1154..1294 + /source="Exported" + misc_feature complement(1300..1305) + /note="BsmBI" + terminator 1372..1403 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1404..1506 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1299..1954 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga tggggccgcg aattctgaaa gaccccacct gtaggtttgg caagcccagg + 1201 gatgtacgtc cctaacccgc tagggggcag caactagtcc caggcctgca ctgccgcctg + 1261 ccggcagggg tccagtcgct agcgcatgcc tgcagactcg agacgaagac gaattctcta + 1321 gatatcgctc aatactgacc atttaaatca tacctgacct ccatagcaga aagtcaaaag + 1381 cctccgaccg gaggcttttg acttgatcgg cacgtaagag gttccaactt tcaccataat + 1441 gaaataagat cactaccggg cgtatttttt gagttatcga gattttcagg agctaaggaa + 1501 gctaaaatga gccatattca acgggaaacg tcttgctcga ggccgcgatt aaattccaac + 1561 atggatgctg atttatatgg gtataaatgg gctcgcgata atgtcgggca atcaggtgcg + 1621 acaatctatc gattgtatgg gaagcccgat gcgccagagt tgtttctgaa acatggcaaa + 1681 ggtagcgttg ccaatgatgt tacagatgag atggtcaggc taaactggct gacggaattt + 1741 atgcctcttc cgaccatcaa gcattttatc cgtactcctg atgatgcatg gttactcacc + 1801 actgcgatcc cagggaaaac agcattccag gtattagaag aatatcctga ttcaggtgaa + 1861 aatattgttg atgcgctggc agtgttcctg cgccggttgc attcgattcc tgtttgtaat + 1921 tgtcctttta acggcgatcg cgtatttcgt ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p3_cagp.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p3_cagp.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,86 @@ +LOCUS . 2503 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + enhancer 1172..1551 + /note="CMV enhancer" + /note="human cytomegalovirus immediate early enhancer" + promoter 1553..1828 + /note="chicken beta-actin promoter" + source 1154..1843 + /source="Exported" + misc_feature complement(1849..1854) + /note="BsmBI" + terminator 1921..1952 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1953..2055 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1848..2503 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg actggatctg atatcatcgt cgacattgat tattgactag ttattaatag + 1201 taatcaatta cggggtcatt agttcatagc ccatatatgg agttccgcgt tacataactt + 1261 acggtaaatg gcccgcctgg ctgaccgccc aacgaccccc gcccattgac gtcaataatg + 1321 acgtatgttc ccatagtaac gccaataggg actttccatt gacgtcaatg ggtggactat + 1381 ttacggtaaa ctgcccactt ggcagtacat caagtgtatc atatgccaag tacgccccct + 1441 attgacgtca atgacggtaa atggcccgcc tggcattatg cccagtacat gaccttatgg + 1501 gactttccta cttggcagta catctacgta ttagtcatcg ctattaccat ggtcgaggtg + 1561 agccccacgt tctgcttcac tctccccatc tcccccccct ccccaccccc aattttgtat + 1621 ttatttattt tttaattatt ttgtgcagcg atgggggcgg gggggggggg ggcgcgcgcc + 1681 aggcggggcg gggcggggcg aggggcgggg cggggcgagg cggagaggtg cggcggcagc + 1741 caatcagagc ggcgcgctcc gaaagtttcc ttttatggcg aggcggcggc ggcggcggcc + 1801 ctataaaaag cgaagcgcgc ggcgggcggg agtcgctgcg ttgggaccga gacgaagacg + 1861 aattctctag atatcgctca atactgacca tttaaatcat acctgacctc catagcagaa + 1921 agtcaaaagc ctccgaccgg aggcttttga cttgatcggc acgtaagagg ttccaacttt + 1981 caccataatg aaataagatc actaccgggc gtattttttg agttatcgag attttcagga + 2041 gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt cttgctcgag gccgcgatta + 2101 aattccaaca tggatgctga tttatatggg tataaatggg ctcgcgataa tgtcgggcaa + 2161 tcaggtgcga caatctatcg attgtatggg aagcccgatg cgccagagtt gtttctgaaa + 2221 catggcaaag gtagcgttgc caatgatgtt acagatgaga tggtcaggct aaactggctg + 2281 acggaattta tgcctcttcc gaccatcaag cattttatcc gtactcctga tgatgcatgg + 2341 ttactcacca ctgcgatccc agggaaaaca gcattccagg tattagaaga atatcctgat + 2401 tcaggtgaaa atattgttga tgcgctggca gtgttcctgc gccggttgca ttcgattcct + 2461 gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p3_cmvp_tet.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p3_cmvp_tet.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,98 @@ +LOCUS . 2440 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + enhancer 1154..1533 + /note="CMV enhancer" + /note="human cytomegalovirus immediate early enhancer" + promoter 1534..1737 + /note="CMV promoter" + /note="human cytomegalovirus (CMV) immediate early + promoter" + TATA_signal 1723..1729 + protein_bind 1739..1757 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1760..1778 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + source 1154..1780 + /source="Exported" + misc_feature complement(1786..1791) + /note="BsmBI" + terminator 1858..1889 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1890..1992 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1785..2440 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg actgacattg attattgact agttattaat agtaatcaat tacggggtca + 1201 ttagttcata gcccatatat ggagttccgc gttacataac ttacggtaaa tggcccgcct + 1261 ggctgaccgc ccaacgaccc ccgcccattg acgtcaataa tgacgtatgt tcccatagta + 1321 acgccaatag ggactttcca ttgacgtcaa tgggtggagt atttacggta aactgcccac + 1381 ttggcagtac atcaagtgta tcatatgcca agtacgcccc ctattgacgt caatgacggt + 1441 aaatggcccg cctggcatta tgcccagtac atgaccttat gggactttcc tacttggcag + 1501 tacatctacg tattagtcat cgctattacc atggtgatgc ggttttggca gtacatcaat + 1561 gggcgtggat agcggtttga ctcacgggga tttccaagtc tccaccccat tgacgtcaat + 1621 gggagtttgt tttggaacca aaatcaacgg gactttccaa aatgtcgtaa caactccgcc + 1681 ccattgacgc aaatgggcgg taggcgtgta cggtgggagg tctatataag cagagctctc + 1741 cctatcagtg atagagatct ccctatcagt gatagagatt ggaccgagac gaagacgaat + 1801 tctctagata tcgctcaata ctgaccattt aaatcatacc tgacctccat agcagaaagt + 1861 caaaagcctc cgaccggagg cttttgactt gatcggcacg taagaggttc caactttcac + 1921 cataatgaaa taagatcact accgggcgta ttttttgagt tatcgagatt ttcaggagct + 1981 aaggaagcta aaatgagcca tattcaacgg gaaacgtctt gctcgaggcc gcgattaaat + 2041 tccaacatgg atgctgattt atatgggtat aaatgggctc gcgataatgt cgggcaatca + 2101 ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc cagagttgtt tctgaaacat + 2161 ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg tcaggctaaa ctggctgacg + 2221 gaatttatgc ctcttccgac catcaagcat tttatccgta ctcctgatga tgcatggtta + 2281 ctcaccactg cgatcccagg gaaaacagca ttccaggtat tagaagaata tcctgattca + 2341 ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc ggttgcattc gattcctgtt + 2401 tgtaattgtc cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p3_ef1ap.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p3_ef1ap.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,98 @@ +LOCUS . 3037 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + promoter 5..1183 + /note="EF-1-alpha promoter" + /note="strong constitutive promoter for human elongation + factor EF-1-alpha" + intron 236..1174 + /note="EF-1-alpha intron A" + /note="intron upstream of the start codon of human + EF-1-alpha" + source 5..1228 + /source="Exported" + misc_feature complement(1234..1239) + /note="BsmBI" + terminator 1306..1337 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1338..1440 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1233..1888 + /source="Exported" + terminator 2280..2307 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(2319..2906) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 2928..2957 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 3031..3036 + /note="BsmBI" + source 1893..3037 + /source="Exported" +ORIGIN + 1 gactggctcc ggtgcccgtc agtgggcaga gcgcacatcg cccacagtcc ccgagaagtt + 61 ggggggaggg gtcggcaatt gaaccggtgc ctagagaagg tggcgcgggg taaactggga + 121 aagtgatgtc gtgtactggc tccgcctttt tcccgagggt gggggagaac cgtatataag + 181 tgcagtagtc gccgtgaacg ttctttttcg caacgggttt gccgccagaa cacaggtaag + 241 tgccgtgtgt ggttcccgcg ggcctggcct ctttacgggt tatggccctt gcgtgccttg + 301 aattacttcc acctggctgc agtacgtgat tcttgatccc gagcttcggg ttggaagtgg + 361 gtgggagagt tcgaggcctt gcgcttaagg agccccttcg cctcgtgctt gagttgaggc + 421 ctggcctggg cgctggggcc gccgcgtgcg aatctggtgg caccttcgcg cctgtctcgc + 481 tgctttcgat aagtctctag ccatttaaaa tttttgatga cctgctgcga cgcttttttt + 541 ctggcaagat agtcttgtaa atgcgggcca agatctgcac actggtattt cggtttttgg + 601 ggccgcgggc ggcgacgggg cccgtgcgtc ccagcgcaca tgttcggcga ggcggggcct + 661 gcgagcgcgg ccaccgagaa tcggacgggg gtagtctcaa gctggccggc ctgctctggt + 721 gcctggcctc gcgccgccgt gtatcgcccc gccctgggcg gcaaggctgg cccggtcggc + 781 accagttgcg tgagcggaaa gatggccgct tcccggccct gctgcaggga gctcaaaatg + 841 gaggacgcgg cgctcgggag agcgggcggg tgagtcaccc acacaaagga aaagggcctt + 901 tccgtcctca gccgtcgctt catgtgactc cacggagtac cgggcgccgt ccaggcacct + 961 cgattagttc tcgagctttt ggagtacgtc gtctttaggt tggggggagg ggttttatgc + 1021 gatggagttt ccccacactg agtgggtgga gactgaagtt aggccagctt ggcacttgat + 1081 gtaattctcc ttggaatttg ccctttttga gtttggatct tggttcattc tcaagcctca + 1141 gacagtggtt caaagttttt ttcttccatt tcaggtgtcg tgacgctagc gctaccggac + 1201 tcagatctcg agctcaagct tcgaattcgg accgagacga agacgaattc tctagatatc + 1261 gctcaatact gaccatttaa atcatacctg acctccatag cagaaagtca aaagcctccg + 1321 accggaggct tttgacttga tcggcacgta agaggttcca actttcacca taatgaaata + 1381 agatcactac cgggcgtatt ttttgagtta tcgagatttt caggagctaa ggaagctaaa + 1441 atgagccata ttcaacggga aacgtcttgc tcgaggccgc gattaaattc caacatggat + 1501 gctgatttat atgggtataa atgggctcgc gataatgtcg ggcaatcagg tgcgacaatc + 1561 tatcgattgt atgggaagcc cgatgcgcca gagttgtttc tgaaacatgg caaaggtagc + 1621 gttgccaatg atgttacaga tgagatggtc aggctaaact ggctgacgga atttatgcct + 1681 cttccgacca tcaagcattt tatccgtact cctgatgatg catggttact caccactgcg + 1741 atcccaggga aaacagcatt ccaggtatta gaagaatatc ctgattcagg tgaaaatatt + 1801 gttgatgcgc tggcagtgtt cctgcgccgg ttgcattcga ttcctgtttg taattgtcct + 1861 tttaacggcg atcgcgtatt tcgtctcgct caggcgcaat cacgaatgaa taacggtttg + 1921 gttggtgcga gtgattttga tgacgagcgt aatggctggc ctgttgaaca agtctggaaa + 1981 gaaatgcata agcttttgcc attctcaccg gattcagtcg tcactcatgg tgatttctca + 2041 cttgataacc ttatttttga cgaggggaaa ttaataggtt gtattgatgt tggacgagtc + 2101 ggaatcgcag accgatacca ggatcttgcc atcctatgga actgcctcgg tgagttttct + 2161 ccttcattac agaaacggct ttttcaaaaa tatggtattg ataatcctga tatgaataaa + 2221 ttgcagtttc acttgatgct cgatgagttt ttctaatgag ggcccaaatg taatcacctg + 2281 gctcaccttc gggtgggcct ttctgcgttg ctggcgtttt tccataggct ccgcccccct + 2341 gacgagcatc acaaaaatcg atgctcaagt cagaggtggc gaaacccgac aggactataa + 2401 agataccagg cgtttccccc tggaagctcc ctcgtgcgct ctcctgttcc gaccctgccg + 2461 cttaccggat acctgtccgc ctttctccct tcgggaagcg tggcgctttc tcatagctca + 2521 cgctgtaggt atctcagttc ggtgtaggtc gttcgctcca agctgggctg tgtgcacgaa + 2581 ccccccgttc agcccgaccg ctgcgcctta tccggtaact atcgtcttga gtccaacccg + 2641 gtaagacacg acttatcgcc actggcagca gccactggta acaggattag cagagcgagg + 2701 tatgtaggcg gtgctacaga gttcttgaag tggtggccta actacggcta cactagaaga + 2761 acagtatttg gtatctgcgc tctgctgaag ccagttacct cggaaaaaga gttggtagct + 2821 cttgatccgg caaacaaacc accgctggta gcggtggttt ttttgtttgc aagcagcaga + 2881 ttacgcgcag aaaaaaagga tctcaagaag atcctttgat tttctaccga agaaaggccc + 2941 acccgtgaag gtgagccagt gagttgattg cagtccagtt acgctggagt ctgaggctcg + 3001 tcctgaatga tatcaagctt gaattcgtta cgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p3_tre3gp.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p3_tre3gp.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,115 @@ +LOCUS . 2209 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + promoter 1171..1549 + /note="TRE3G promoter" + /note="3rd-generation Tet-responsive promoter that can be + activated by binding of Tet-On(R) 3G" + protein_bind 1179..1197 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1215..1233 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1251..1269 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1287..1305 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1323..1341 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1359..1377 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + protein_bind 1395..1413 + /bound_moiety="tetracycline repressor TetR" + /gene="tetO" + /note="tet operator" + /note="bacterial operator O2 for the tetR and tetA genes" + source 1154..1549 + /source="Exported" + misc_feature complement(1555..1560) + /note="BsmBI" + terminator 1627..1658 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1659..1761 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1554..2209 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg actttatacg aagttatctc gagtttactc cctatcagtg atagagaacg + 1201 tatgaagagt ttactcccta tcagtgatag agaacgtatg cagactttac tccctatcag + 1261 tgatagagaa cgtataagga gtttactccc tatcagtgat agagaacgta tgaccagttt + 1321 actccctatc agtgatagag aacgtatcta cagtttactc cctatcagtg atagagaacg + 1381 tatatccagt ttactcccta tcagtgatag agaacgtata agctttaggc gtgtacggtg + 1441 ggcgcctata aaagcagagc tcgtttagtg aaccgtcaga tcgcctggag caattccaca + 1501 acacttttgt cttataccaa ctttccgtac cacttcctac cctcgtaaag gaccgagacg + 1561 aagacgaatt ctctagatat cgctcaatac tgaccattta aatcatacct gacctccata + 1621 gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg atcggcacgt aagaggttcc + 1681 aactttcacc ataatgaaat aagatcacta ccgggcgtat tttttgagtt atcgagattt + 1741 tcaggagcta aggaagctaa aatgagccat attcaacggg aaacgtcttg ctcgaggccg + 1801 cgattaaatt ccaacatgga tgctgattta tatgggtata aatgggctcg cgataatgtc + 1861 gggcaatcag gtgcgacaat ctatcgattg tatgggaagc ccgatgcgcc agagttgttt + 1921 ctgaaacatg gcaaaggtag cgttgccaat gatgttacag atgagatggt caggctaaac + 1981 tggctgacgg aatttatgcc tcttccgacc atcaagcatt ttatccgtac tcctgatgat + 2041 gcatggttac tcaccactgc gatcccaggg aaaacagcat tccaggtatt agaagaatat + 2101 cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt tcctgcgccg gttgcattcg + 2161 attcctgttt gtaattgtcc ttttaacggc gatcgcgtat ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p4_kt-l7ae -weiss.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p4_kt-l7ae -weiss.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,72 @@ +LOCUS . 1845 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1156..1182 + /note="Kt - L7Ae" + source 1154..1185 + /source="Exported" + misc_feature complement(1191..1196) + /note="BsmBI" + terminator 1263..1294 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1295..1397 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1190..1845 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg gacaaggatc cgtgatcgga aacgtgagat ccagttccgc gagacgaaga + 1201 cgaattctct agatatcgct caatactgac catttaaatc atacctgacc tccatagcag + 1261 aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga ggttccaact + 1321 ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg agattttcag + 1381 gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg aggccgcgat + 1441 taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat aatgtcgggc + 1501 aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag ttgtttctga + 1561 aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg ctaaactggc + 1621 tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct gatgatgcat + 1681 ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa gaatatcctg + 1741 attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg cattcgattc + 1801 ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p4_lac-o.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p4_lac-o.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,87 @@ +LOCUS . 1909 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + protein_bind 1160..1176 + /bound_moiety="lac repressor encoded by lacI" + /note="lac operator" + /note="The lac repressor binds to the lac operator to + inhibit transcription in E. coli. This inhibition can be + relieved by adding lactose or + isopropyl-beta-D-thiogalactopyranoside (IPTG)." + protein_bind 1229..1248 + /bound_moiety="lac repressor encoded by lacI" + /note="lac operator (symmetric)" + /note="The lac repressor binds to the lac operator to + inhibit transcription in E. coli. This inhibition can be + relieved by adding lactose or + isopropyl-beta-D-thiogalactopyranoside (IPTG). The + symmetric lac operator was optimized for tight binding of + lac repressor." + source 1154..1249 + /source="Exported" + misc_feature complement(1255..1260) + /note="BsmBI" + terminator 1327..1358 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1359..1461 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1254..1909 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgg gacagtcaat tgtgagcgga taacaattcc acagtcgacc ctaggttgtg + 1201 tcgcgagtgt tggatcccag ctgacaccaa ttgtgagcgc tcacaattct ccgcgagacg + 1261 aagacgaatt ctctagatat cgctcaatac tgaccattta aatcatacct gacctccata + 1321 gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg atcggcacgt aagaggttcc + 1381 aactttcacc ataatgaaat aagatcacta ccgggcgtat tttttgagtt atcgagattt + 1441 tcaggagcta aggaagctaa aatgagccat attcaacggg aaacgtcttg ctcgaggccg + 1501 cgattaaatt ccaacatgga tgctgattta tatgggtata aatgggctcg cgataatgtc + 1561 gggcaatcag gtgcgacaat ctatcgattg tatgggaagc ccgatgcgcc agagttgttt + 1621 ctgaaacatg gcaaaggtag cgttgccaat gatgttacag atgagatggt caggctaaac + 1681 tggctgacgg aatttatgcc tcttccgacc atcaagcatt ttatccgtac tcctgatgat + 1741 gcatggttac tcaccactgc gatcccaggg aaaacagcat tccaggtatt agaagaatat + 1801 cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt tcctgcgccg gttgcattcg + 1861 attcctgttt gtaattgtcc ttttaacggc gatcgcgtat ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p5_attb-bxb1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p5_attb-bxb1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1855 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1156..1193 + /note="attB - BxB1" + misc_feature 1157..1170 + /note="B" + misc_feature complement(1179..1193) + /note="B'" + source 1154..1195 + /source="Exported" + misc_feature complement(1201..1206) + /note="BsmBI" + terminator 1273..1304 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1305..1407 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1200..1855 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt ccgaaggctt gtcgacgacg gcggtctccg tcgtcaggat catcgccagc + 1201 gagacgaaga cgaattctct agatatcgct caatactgac catttaaatc atacctgacc + 1261 tccatagcag aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg gcacgtaaga + 1321 ggttccaact ttcaccataa tgaaataaga tcactaccgg gcgtattttt tgagttatcg + 1381 agattttcag gagctaagga agctaaaatg agccatattc aacgggaaac gtcttgctcg + 1441 aggccgcgat taaattccaa catggatgct gatttatatg ggtataaatg ggctcgcgat + 1501 aatgtcgggc aatcaggtgc gacaatctat cgattgtatg ggaagcccga tgcgccagag + 1561 ttgtttctga aacatggcaa aggtagcgtt gccaatgatg ttacagatga gatggtcagg + 1621 ctaaactggc tgacggaatt tatgcctctt ccgaccatca agcattttat ccgtactcct + 1681 gatgatgcat ggttactcac cactgcgatc ccagggaaaa cagcattcca ggtattagaa + 1741 gaatatcctg attcaggtga aaatattgtt gatgcgctgg cagtgttcct gcgccggttg + 1801 cattcgattc ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p5_attp-bxb1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p5_attp-bxb1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,77 @@ +LOCUS . 1869 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1156..1207 + /note="attP - BxB1" + misc_feature 1158..1176 + /note="P" + misc_feature complement(1186..1205) + /note="P'" + source 1154..1209 + /source="Exported" + misc_feature complement(1215..1220) + /note="BsmBI" + terminator 1287..1318 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1319..1421 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1214..1869 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt ccgctgtggt ttgtctggtc aaccaccgcg gtctcagtgg tgtacggtac + 1201 aaacccatgc cagcgagacg aagacgaatt ctctagatat cgctcaatac tgaccattta + 1261 aatcatacct gacctccata gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg + 1321 atcggcacgt aagaggttcc aactttcacc ataatgaaat aagatcacta ccgggcgtat + 1381 tttttgagtt atcgagattt tcaggagcta aggaagctaa aatgagccat attcaacggg + 1441 aaacgtcttg ctcgaggccg cgattaaatt ccaacatgga tgctgattta tatgggtata + 1501 aatgggctcg cgataatgtc gggcaatcag gtgcgacaat ctatcgattg tatgggaagc + 1561 ccgatgcgcc agagttgttt ctgaaacatg gcaaaggtag cgttgccaat gatgttacag + 1621 atgagatggt caggctaaac tggctgacgg aatttatgcc tcttccgacc atcaagcatt + 1681 ttatccgtac tcctgatgat gcatggttac tcaccactgc gatcccaggg aaaacagcat + 1741 tccaggtatt agaagaatat cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt + 1801 tcctgcgccg gttgcattcg attcctgttt gtaattgtcc ttttaacggc gatcgcgtat + 1861 ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p5_k1-k1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p5_k1-k1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1884 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1162..1183 + /note="K1" + misc_feature 1191..1212 + /note="K1" + source 1154..1224 + /source="Exported" + misc_feature complement(1230..1235) + /note="BsmBI" + terminator 1302..1333 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1334..1436 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1229..1884 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt ccgcaaacaa agggtgtgaa cggtgatcac ccgagagcaa gggtgtgaac + 1201 ggtgatcacc cgcaaacaaa ttcgccagcg agacgaagac gaattctcta gatatcgctc + 1261 aatactgacc atttaaatca tacctgacct ccatagcaga aagtcaaaag cctccgaccg + 1321 gaggcttttg acttgatcgg cacgtaagag gttccaactt tcaccataat gaaataagat + 1381 cactaccggg cgtatttttt gagttatcga gattttcagg agctaaggaa gctaaaatga + 1441 gccatattca acgggaaacg tcttgctcga ggccgcgatt aaattccaac atggatgctg + 1501 atttatatgg gtataaatgg gctcgcgata atgtcgggca atcaggtgcg acaatctatc + 1561 gattgtatgg gaagcccgat gcgccagagt tgtttctgaa acatggcaaa ggtagcgttg + 1621 ccaatgatgt tacagatgag atggtcaggc taaactggct gacggaattt atgcctcttc + 1681 cgaccatcaa gcattttatc cgtactcctg atgatgcatg gttactcacc actgcgatcc + 1741 cagggaaaac agcattccag gtattagaag aatatcctga ttcaggtgaa aatattgttg + 1801 atgcgctggc agtgttcctg cgccggttgc attcgattcc tgtttgtaat tgtcctttta + 1861 acggcgatcg cgtatttcgt ctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p5_kt-weiss.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p5_kt-weiss.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1896 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1162..1188 + /note="Kt" + misc_feature 1198..1224 + /note="Kt" + source 1154..1236 + /source="Exported" + misc_feature complement(1242..1247) + /note="BsmBI" + terminator 1314..1345 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1346..1448 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1241..1896 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgt ccgcaaacaa aggatccgtg atcggaaacg tgagatccaa agcaaaagga + 1201 tccgtgatcg gaaacgtgag atcccaaaca aattcgccag cgagacgaag acgaattctc + 1261 tagatatcgc tcaatactga ccatttaaat catacctgac ctccatagca gaaagtcaaa + 1321 agcctccgac cggaggcttt tgacttgatc ggcacgtaag aggttccaac tttcaccata + 1381 atgaaataag atcactaccg ggcgtatttt ttgagttatc gagattttca ggagctaagg + 1441 aagctaaaat gagccatatt caacgggaaa cgtcttgctc gaggccgcga ttaaattcca + 1501 acatggatgc tgatttatat gggtataaat gggctcgcga taatgtcggg caatcaggtg + 1561 cgacaatcta tcgattgtat gggaagcccg atgcgccaga gttgtttctg aaacatggca + 1621 aaggtagcgt tgccaatgat gttacagatg agatggtcag gctaaactgg ctgacggaat + 1681 ttatgcctct tccgaccatc aagcatttta tccgtactcc tgatgatgca tggttactca + 1741 ccactgcgat cccagggaaa acagcattcc aggtattaga agaatatcct gattcaggtg + 1801 aaaatattgt tgatgcgctg gcagtgttcc tgcgccggtt gcattcgatt cctgtttgta + 1861 attgtccttt taacggcgat cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_atg_boxc.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_atg_boxc.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,79 @@ +LOCUS . 1886 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1186..1195 + /note="Kozak" + CDS 1192..1194 + /codon_start=1 + /note="ATG" + /translation="M" + misc_feature 1198..1221 + /note="BoxC/D" + source 1154..1226 + /source="Exported" + misc_feature complement(1232..1237) + /note="BsmBI" + terminator 1304..1335 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1336..1438 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1231..1886 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagaaccgtc agatccgcta gcgattacgt caattgccac catgggaggg + 1201 cgtgatgcga aagctgaccc tagcggcagc cgagacgaag acgaattctc tagatatcgc + 1261 tcaatactga ccatttaaat catacctgac ctccatagca gaaagtcaaa agcctccgac + 1321 cggaggcttt tgacttgatc ggcacgtaag aggttccaac tttcaccata atgaaataag + 1381 atcactaccg ggcgtatttt ttgagttatc gagattttca ggagctaagg aagctaaaat + 1441 gagccatatt caacgggaaa cgtcttgctc gaggccgcga ttaaattcca acatggatgc + 1501 tgatttatat gggtataaat gggctcgcga taatgtcggg caatcaggtg cgacaatcta + 1561 tcgattgtat gggaagcccg atgcgccaga gttgtttctg aaacatggca aaggtagcgt + 1621 tgccaatgat gttacagatg agatggtcag gctaaactgg ctgacggaat ttatgcctct + 1681 tccgaccatc aagcatttta tccgtactcc tgatgatgca tggttactca ccactgcgat + 1741 cccagggaaa acagcattcc aggtattaga agaatatcct gattcaggtg aaaatattgt + 1801 tgatgcgctg gcagtgttcc tgcgccggtt gcattcgatt cctgtttgta attgtccttt + 1861 taacggcgat cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_kozak-atg.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_kozak-atg.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,76 @@ +LOCUS . 1856 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1184..1195 + /note="Kozak" + CDS 1192..1194 + /codon_start=1 + /note="ATG" + /translation="M" + source 1154..1196 + /source="Exported" + misc_feature complement(1202..1207) + /note="BsmBI" + terminator 1274..1305 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1306..1408 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1201..1856 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagaaccgtc agatccgcta gagattacgc caaccgccac catgggcagc + 1201 cgagacgaag acgaattctc tagatatcgc tcaatactga ccatttaaat catacctgac + 1261 ctccatagca gaaagtcaaa agcctccgac cggaggcttt tgacttgatc ggcacgtaag + 1321 aggttccaac tttcaccata atgaaataag atcactaccg ggcgtatttt ttgagttatc + 1381 gagattttca ggagctaagg aagctaaaat gagccatatt caacgggaaa cgtcttgctc + 1441 gaggccgcga ttaaattcca acatggatgc tgatttatat gggtataaat gggctcgcga + 1501 taatgtcggg caatcaggtg cgacaatcta tcgattgtat gggaagcccg atgcgccaga + 1561 gttgtttctg aaacatggca aaggtagcgt tgccaatgat gttacagatg agatggtcag + 1621 gctaaactgg ctgacggaat ttatgcctct tccgaccatc aagcatttta tccgtactcc + 1681 tgatgatgca tggttactca ccactgcgat cccagggaaa acagcattcc aggtattaga + 1741 agaatatcct gattcaggtg aaaatattgt tgatgcgctg gcagtgttcc tgcgccggtt + 1801 gcattcgatt cctgtttgta attgtccttt taacggcgat cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_nt-igkl sequence.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_nt-igkl sequence.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,83 @@ +LOCUS . 1886 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1165 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1224 + /codon_start=1 + /note="Ig-kappa leader" + /product="leader sequence from mouse immunoglobulin kappa + light chain" + /translation="ETDTLLLWVLLLWVPGSTGD" + source 1154..1226 + /source="Exported" + misc_feature complement(1232..1237) + /note="BsmBI" + terminator 1304..1335 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1336..1438 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1231..1886 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagccgccac catggaaaca gacacactgc tgctatgggt actgctgctc + 1201 tgggttccag gttccactgg tgacagcagc cgagacgaag acgaattctc tagatatcgc + 1261 tcaatactga ccatttaaat catacctgac ctccatagca gaaagtcaaa agcctccgac + 1321 cggaggcttt tgacttgatc ggcacgtaag aggttccaac tttcaccata atgaaataag + 1381 atcactaccg ggcgtatttt ttgagttatc gagattttca ggagctaagg aagctaaaat + 1441 gagccatatt caacgggaaa cgtcttgctc gaggccgcga ttaaattcca acatggatgc + 1501 tgatttatat gggtataaat gggctcgcga taatgtcggg caatcaggtg cgacaatcta + 1561 tcgattgtat gggaagcccg atgcgccaga gttgtttctg aaacatggca aaggtagcgt + 1621 tgccaatgat gttacagatg agatggtcag gctaaactgg ctgacggaat ttatgcctct + 1681 tccgaccatc aagcatttta tccgtactcc tgatgatgca tggttactca ccactgcgat + 1741 cccagggaaa acagcattcc aggtattaga agaatatcct gattcaggtg aaaatattgt + 1801 tgatgcgctg gcagtgttcc tgcgccggtt gcattcgatt cctgtttgta attgtccttt + 1861 taacggcgat cgcgtatttc gtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_nt-mls.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_nt-mls.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,81 @@ +LOCUS . 1910 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1248 + /codon_start=1 + /note="MLS" + /translation="SVLTPLLLRGLTGSARRLPVPRAKIHSL" + source 1154..1250 + /source="Exported" + misc_feature complement(1256..1261) + /note="BsmBI" + terminator 1328..1359 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1360..1462 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1255..1910 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagccgccac catgagcgtg ctgacccccc tgctgctgcg cggcctgacc + 1201 ggcagcgccc gccgcctgcc cgtgccccgc gccaagatcc acagcctggg cagccgagac + 1261 gaagacgaat tctctagata tcgctcaata ctgaccattt aaatcatacc tgacctccat + 1321 agcagaaagt caaaagcctc cgaccggagg cttttgactt gatcggcacg taagaggttc + 1381 caactttcac cataatgaaa taagatcact accgggcgta ttttttgagt tatcgagatt + 1441 ttcaggagct aaggaagcta aaatgagcca tattcaacgg gaaacgtctt gctcgaggcc + 1501 gcgattaaat tccaacatgg atgctgattt atatgggtat aaatgggctc gcgataatgt + 1561 cgggcaatca ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc cagagttgtt + 1621 tctgaaacat ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg tcaggctaaa + 1681 ctggctgacg gaatttatgc ctcttccgac catcaagcat tttatccgta ctcctgatga + 1741 tgcatggtta ctcaccactg cgatcccagg gaaaacagca ttccaggtat tagaagaata + 1801 tcctgattca ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc ggttgcattc + 1861 gattcctgtt tgtaattgtc cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_nt-myristoylation signal.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_nt-myristoylation signal.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,81 @@ +LOCUS . 1865 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="KozaK" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1203 + /codon_start=1 + /note="myristoylation signal" + /translation="GSSKSKPKDPSQR" + source 1154..1205 + /source="Exported" + misc_feature complement(1211..1216) + /note="BsmBI" + terminator 1283..1314 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1315..1417 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1210..1865 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagccgccac catggggagt agcaagagca agcctaagga ccccagccag + 1201 cgcggcagcc gagacgaaga cgaattctct agatatcgct caatactgac catttaaatc + 1261 atacctgacc tccatagcag aaagtcaaaa gcctccgacc ggaggctttt gacttgatcg + 1321 gcacgtaaga ggttccaact ttcaccataa tgaaataaga tcactaccgg gcgtattttt + 1381 tgagttatcg agattttcag gagctaagga agctaaaatg agccatattc aacgggaaac + 1441 gtcttgctcg aggccgcgat taaattccaa catggatgct gatttatatg ggtataaatg + 1501 ggctcgcgat aatgtcgggc aatcaggtgc gacaatctat cgattgtatg ggaagcccga + 1561 tgcgccagag ttgtttctga aacatggcaa aggtagcgtt gccaatgatg ttacagatga + 1621 gatggtcagg ctaaactggc tgacggaatt tatgcctctt ccgaccatca agcattttat + 1681 ccgtactcct gatgatgcat ggttactcac cactgcgatc ccagggaaaa cagcattcca + 1741 ggtattagaa gaatatcctg attcaggtga aaatattgtt gatgcgctgg cagtgttcct + 1801 gcgccggttg cattcgattc ctgtttgtaa ttgtcctttt aacggcgatc gcgtatttcg + 1861 tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_nt-palm sequence.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_nt-palm sequence.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,81 @@ +LOCUS . 1883 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="Kozak" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1221 + /codon_start=1 + /note="Palmitoylation sequence" + /translation="LCCMRRTKQVEKNDDDQKI" + source 1154..1223 + /source="Exported" + misc_feature complement(1229..1234) + /note="BsmBI" + terminator 1301..1332 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1333..1435 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1228..1883 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagccgccac catgctgtgc tgcatgcgcc gcaccaagca ggtggagaag + 1201 aacgacgacg accagaagat cggcagccga gacgaagacg aattctctag atatcgctca + 1261 atactgacca tttaaatcat acctgacctc catagcagaa agtcaaaagc ctccgaccgg + 1321 aggcttttga cttgatcggc acgtaagagg ttccaacttt caccataatg aaataagatc + 1381 actaccgggc gtattttttg agttatcgag attttcagga gctaaggaag ctaaaatgag + 1441 ccatattcaa cgggaaacgt cttgctcgag gccgcgatta aattccaaca tggatgctga + 1501 tttatatggg tataaatggg ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg + 1561 attgtatggg aagcccgatg cgccagagtt gtttctgaaa catggcaaag gtagcgttgc + 1621 caatgatgtt acagatgaga tggtcaggct aaactggctg acggaattta tgcctcttcc + 1681 gaccatcaag cattttatcc gtactcctga tgatgcatgg ttactcacca ctgcgatccc + 1741 agggaaaaca gcattccagg tattagaaga atatcctgat tcaggtgaaa atattgttga + 1801 tgcgctggca gtgttcctgc gccggttgca ttcgattcct gtttgtaatt gtccttttaa + 1861 cggcgatcgc gtatttcgtc tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p6_nt-sv40_nls.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p6_nt-sv40_nls.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 1847 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1154..1161 + /note="Kozak" + CDS 1162..1164 + /codon_start=1 + /note="ATG" + /translation="M" + CDS 1165..1185 + /codon_start=1 + /note="SV40 NLS" + /product="nuclear localization signal of SV40 large T + antigen" + /translation="PKKKRKV" + source 1154..1187 + /source="Exported" + misc_feature complement(1193..1198) + /note="BsmBI" + terminator 1265..1296 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1297..1399 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1192..1847 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc cagccgccac catgcctaag aagaaacgga aagtgggcag ccgagacgaa + 1201 gacgaattct ctagatatcg ctcaatactg accatttaaa tcatacctga cctccatagc + 1261 agaaagtcaa aagcctccga ccggaggctt ttgacttgat cggcacgtaa gaggttccaa + 1321 ctttcaccat aatgaaataa gatcactacc gggcgtattt tttgagttat cgagattttc + 1381 aggagctaag gaagctaaaa tgagccatat tcaacgggaa acgtcttgct cgaggccgcg + 1441 attaaattcc aacatggatg ctgatttata tgggtataaa tgggctcgcg ataatgtcgg + 1501 gcaatcaggt gcgacaatct atcgattgta tgggaagccc gatgcgccag agttgtttct + 1561 gaaacatggc aaaggtagcg ttgccaatga tgttacagat gagatggtca ggctaaactg + 1621 gctgacggaa tttatgcctc ttccgaccat caagcatttt atccgtactc ctgatgatgc + 1681 atggttactc accactgcga tcccagggaa aacagcattc caggtattag aagaatatcc + 1741 tgattcaggt gaaaatattg ttgatgcgct ggcagtgttc ctgcgccggt tgcattcgat + 1801 tcctgtttgt aattgtcctt ttaacggcga tcgcgtattt cgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_bxb1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_bxb1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,107 @@ +LOCUS . 3312 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + CDS 5..1501 + /codon_start=1 + /note="BxB1 intergase - human codon optimised" + /translation="RALVVIRLSRVTDATTSPERQLESCQQLCAQRGWDVVGVAEDLDV + SGAVDPFDRKRRPNLARWLAFEEQPFDVIVAYRVDRLTRSIRHLQQLVHWAEDHKKLVV + SATEAHFDTTTPFAAVVIALMGTVAQMELEAIKERNRSAAHFNIRAGKYRGSLPPWGYL + PTRVDGEWRLVPDPVQRERILEVYHRVVDNHEPLHLVAHDLNRRGVLSPKDYFAQLQGR + EPQGREWSATALKRSMISEAMLGYATLNGKTVRDDDGAPLVRAEPILTREQLEALRAEL + VKTSRAKPAVSTPSLLLRVLFCAVCGEPAYKFAGGGRKHPRYRCRSMGFPKHCGNGTVA + MAEWDAFCEEQVLDLLGDAERLEKVWVAGSDSAVELAEVNAELVDLTSLIGSPAYRAGS + PQREALDARIAALAARQEELEGLEARPSGWEWRETGQRFGDWWREQDTAAKNTWLRSMN + VRLTFDVRGGLTRTIDFGDLQEYEQHLRLGSVVERLHTGMS" + source 5..1503 + /source="Exported" + misc_feature complement(1509..1514) + /note="BsmBI" + terminator 1581..1612 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1613..1715 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1508..2163 + /source="Exported" + terminator 2555..2582 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(2594..3181) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 3203..3232 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 3306..3311 + /note="BsmBI" + source 2168..3312 + /source="Exported" +ORIGIN + 1 cagcagagca ctggtggtca tccgactgag tagggtcaca gacgcaacaa caagccccga + 61 acggcagctc gaaagctgtc agcagctgtg tgcccagcga ggatgggacg tggtcggagt + 121 ggcagaggat ctggacgtga gcggcgctgt cgatccattc gacagaaagc ggaggcccaa + 181 cctggcaagg tggctggctt tcgaggaaca gccctttgat gtgatcgtcg cctacagagt + 241 ggacaggctg acacgctcta ttcgacatct gcagcagctg gtgcattggg ccgaggacca + 301 caagaaactg gtggtcagtg caactgaagc ccacttcgat accacaactc cttttgccgc + 361 tgtggtcatc gcactgatgg gcaccgtggc ccagatggag ctggaagcta tcaaggagcg + 421 aaaccggagt gcagcccatt tcaatattcg ggccgggaaa tacagaggat cactgccccc + 481 ttggggctat ctgcctaccc gggtggatgg ggagtggaga ctggtgccag accccgtcca + 541 gagagagagg attctggaag tgtaccacag ggtggtcgat aaccacgaac cactgcatct + 601 ggtcgcccac gacctgaata ggcgcggcgt gctgagccca aaagattatt ttgctcagct + 661 gcagggaagg gagccacagg gacgagaatg gtccgctacc gccctgaagc ggagcatgat + 721 cagtgaggct atgctgggct acgcaactct gaatgggaaa accgtccggg acgatgacgg + 781 agcaccactg gtgagggctg agcctattct gacacgcgag cagctggaag ctctgcgggc + 841 agaactggtg aaaacctcca gagccaaacc tgccgtgagc accccaagcc tgctgctgag + 901 ggtgctgttc tgcgccgtct gtggggagcc agcatacaag tttgccggcg ggggaagaaa + 961 acatccccgc tatcgatgcc ggtctatggg attccctaag cactgtggaa acggcactgt + 1021 ggctatggcc gagtgggacg ccttttgtga ggaacaggtg ctggatctgc tgggcgacgc + 1081 cgagaggctg gaaaaagtgt gggtcgctgg cagcgactcc gctgtggagc tggcagaagt + 1141 caatgccgag ctggtggatc tgacctccct gatcggatct cctgcatata gggcaggctc + 1201 accacagcga gaagctctgg acgcacgaat tgctgcactg gcagctcgac aggaggaact + 1261 ggaggggctg gaagcacgac ctagcggatg ggagtggcga gaaacaggcc agcggtttgg + 1321 ggattggtgg agagagcagg acacagcagc caagaacact tggctgagaa gtatgaatgt + 1381 caggctgact ttcgatgtgc gcggcgggct gacccgaaca atcgattttg gcgacctgca + 1441 ggagtatgaa cagcacctga gactggggag cgtggtcgaa agactgcaca ctgggatgtc + 1501 atcaggccga gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat + 1561 acctgacctc catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc + 1621 acgtaagagg ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg + 1681 agttatcgag attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt + 1741 cttgctcgag gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg + 1801 ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg + 1861 cgccagagtt gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga + 1921 tggtcaggct aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc + 1981 gtactcctga tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg + 2041 tattagaaga atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc + 2101 gccggttgca ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc + 2161 tcgctcaggc gcaatcacga atgaataacg gtttggttgg tgcgagtgat tttgatgacg + 2221 agcgtaatgg ctggcctgtt gaacaagtct ggaaagaaat gcataagctt ttgccattct + 2281 caccggattc agtcgtcact catggtgatt tctcacttga taaccttatt tttgacgagg + 2341 ggaaattaat aggttgtatt gatgttggac gagtcggaat cgcagaccga taccaggatc + 2401 ttgccatcct atggaactgc ctcggtgagt tttctccttc attacagaaa cggctttttc + 2461 aaaaatatgg tattgataat cctgatatga ataaattgca gtttcacttg atgctcgatg + 2521 agtttttcta atgagggccc aaatgtaatc acctggctca ccttcgggtg ggcctttctg + 2581 cgttgctggc gtttttccat aggctccgcc cccctgacga gcatcacaaa aatcgatgct + 2641 caagtcagag gtggcgaaac ccgacaggac tataaagata ccaggcgttt ccccctggaa + 2701 gctccctcgt gcgctctcct gttccgaccc tgccgcttac cggatacctg tccgcctttc + 2761 tcccttcggg aagcgtggcg ctttctcata gctcacgctg taggtatctc agttcggtgt + 2821 aggtcgttcg ctccaagctg ggctgtgtgc acgaaccccc cgttcagccc gaccgctgcg + 2881 ccttatccgg taactatcgt cttgagtcca acccggtaag acacgactta tcgccactgg + 2941 cagcagccac tggtaacagg attagcagag cgaggtatgt aggcggtgct acagagttct + 3001 tgaagtggtg gcctaactac ggctacacta gaagaacagt atttggtatc tgcgctctgc + 3061 tgaagccagt tacctcggaa aaagagttgg tagctcttga tccggcaaac aaaccaccgc + 3121 tggtagcggt ggtttttttg tttgcaagca gcagattacg cgcagaaaaa aaggatctca + 3181 agaagatcct ttgattttct accgaagaaa ggcccacccg tgaaggtgag ccagtgagtt + 3241 gattgcagtc cagttacgct ggagtctgag gctcgtcctg aatgatatca agcttgaatt + 3301 cgttacgtct cg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_l7ae-weiss.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_l7ae-weiss.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 2169 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1507 + /codon_start=1 + /note="L7Ae (Weiss)" + /translation="YVRFEVPEDMQNEALSLLEKVRESGKVKKGTNETTKAVERGLAKL + VYIAEDVDPPEIVAHLPLLCEEKNVPYIYVKSKNDLGRAVGIEVPCASAAIINEGELRK + ELGSLVEKIKGLQK" + source 1154..1509 + /source="Exported" + misc_feature complement(1515..1520) + /note="BsmBI" + terminator 1587..1618 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1619..1721 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1514..2169 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agctacgtga gatttgaggt tcctgaggac atgcagaacg aagctctgag + 1201 tctgctggag aaggttaggg agagcggtaa ggtaaagaaa ggtaccaacg aaacgacaaa + 1261 ggctgtggag aggggactgg caaagctcgt ttacatcgca gaggatgttg acccgcctga + 1321 gatcgttgct catctgcccc tcctctgcga ggagaagaat gtgccgtaca tttacgttaa + 1381 aagcaagaac gaccttggaa gggctgtggg cattgaggtg ccatgcgctt cggcagcgat + 1441 aatcaacgag ggagagctga gaaaggagct tggaagcctt gtggagaaga ttaaaggcct + 1501 tcagaagtca ggccgagacg aagacgaatt ctctagatat cgctcaatac tgaccattta + 1561 aatcatacct gacctccata gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg + 1621 atcggcacgt aagaggttcc aactttcacc ataatgaaat aagatcacta ccgggcgtat + 1681 tttttgagtt atcgagattt tcaggagcta aggaagctaa aatgagccat attcaacggg + 1741 aaacgtcttg ctcgaggccg cgattaaatt ccaacatgga tgctgattta tatgggtata + 1801 aatgggctcg cgataatgtc gggcaatcag gtgcgacaat ctatcgattg tatgggaagc + 1861 ccgatgcgcc agagttgttt ctgaaacatg gcaaaggtag cgttgccaat gatgttacag + 1921 atgagatggt caggctaaac tggctgacgg aatttatgcc tcttccgacc atcaagcatt + 1981 ttatccgtac tcctgatgat gcatggttac tcaccactgc gatcccaggg aaaacagcat + 2041 tccaggtatt agaagaatat cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt + 2101 tcctgcgccg gttgcattcg attcctgttt gtaattgtcc ttttaacggc gatcgcgtat + 2161 ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_l7ae.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_l7ae.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,87 @@ +LOCUS . 2409 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1747 + /codon_start=1 + /note="L7Ae" + /translation="SPILGYWKIKGLVQPTRLLLEYLEEKYEEHLYERDEGDKWRNKKF + ELGLEFPNLPYYIDGDVKLTQSMAIIRYIADKHNMYVRFEVPEDMQNEALSLLEKVRES + GKVKKGTNETTKAVERGLAKLVYIAEDVDPPEIVAHLPLLCEEKNVPYIYVKSKNDLGR + AVGIEVPCASAAIINEGELRKELGSLVEKIKGLQK" + source 1154..1749 + /source="Exported" + misc_feature complement(1755..1760) + /note="BsmBI" + terminator 1827..1858 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1859..1961 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1754..2409 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcagcccca tcctgggcta ctggaagatc aagggcctgg tgcagcccac + 1201 ccgcctgctg ctggagtacc tggaggagaa gtacgaggag cacctgtacg agcgcgacga + 1261 gggcgacaag tggcgcaaca agaagttcga gctgggcctg gagttcccca acctgcccta + 1321 ctacatcgac ggcgacgtga agctgaccca gagcatggcc atcatccgct acatcgccga + 1381 caagcacaac atgtacgtgc gcttcgaggt gcccgaggac atgcagaacg aggccctgag + 1441 cctgctggag aaggtgcgcg agagcggcaa ggtgaagaag ggcaccaacg aaaccaccaa + 1501 ggccgtggag cgcggcctgg ccaagctggt gtacatcgcc gaggacgtgg acccccccga + 1561 gatcgtggcc cacctgcccc tgctgtgcga ggagaagaac gtgccctaca tctacgtgaa + 1621 gagcaagaac gacctgggcc gcgccgtggg catcgaggtg ccctgcgcca gcgccgccat + 1681 catcaacgag ggcgagctgc gcaaggagct gggcagcctg gtggagaaga tcaagggcct + 1741 gcagaagtca ggccgagacg aagacgaatt ctctagatat cgctcaatac tgaccattta + 1801 aatcatacct gacctccata gcagaaagtc aaaagcctcc gaccggaggc ttttgacttg + 1861 atcggcacgt aagaggttcc aactttcacc ataatgaaat aagatcacta ccgggcgtat + 1921 tttttgagtt atcgagattt tcaggagcta aggaagctaa aatgagccat attcaacggg + 1981 aaacgtcttg ctcgaggccg cgattaaatt ccaacatgga tgctgattta tatgggtata + 2041 aatgggctcg cgataatgtc gggcaatcag gtgcgacaat ctatcgattg tatgggaagc + 2101 ccgatgcgcc agagttgttt ctgaaacatg gcaaaggtag cgttgccaat gatgttacag + 2161 atgagatggt caggctaaac tggctgacgg aatttatgcc tcttccgacc atcaagcatt + 2221 ttatccgtac tcctgatgat gcatggttac tcaccactgc gatcccaggg aaaacagcat + 2281 tccaggtatt agaagaatat cctgattcag gtgaaaatat tgttgatgcg ctggcagtgt + 2341 tcctgcgccg gttgcattcg attcctgttt gtaattgtcc ttttaacggc gatcgcgtat + 2401 ttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_laci.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_laci.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,98 @@ +LOCUS . 2892 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..2230 + /codon_start=1 + /note="LacI- human codon optimized" + /translation="KPVTLYDVAEYAGVSYQTVSRVVNQASHVSAKTREKVEAAMAELN + YIPNRVAQQLAGKQSLLIGVATSSLALHAPSQIVAAIKSRADQLGASVVVSMVERSGVE + ACKAAVHNLLAQRVSGLIINYPLDDQDAIAVEAACTNVPALFLDVSDQTPINSIIFSHE + DGTRLGVEHLVALGHQQIALLAGPLSSVSARLRLAGWHKYLTRNQIQPIAEREGDWSAM + SGFQQTMQMLNEGIVPTAMLVANDQMALGAMRAITESGLRVGADISVVGYDDTEDSSCY + IPPLTTIKQDFRLLGQTSVDRLLQLSQGQAVKGNQLLPVSLVKRKTTLAPNTQTASPRA + LADSLMQLARQVSRLESGQ" + source 1154..2232 + /source="Exported" + misc_feature complement(2238..2243) + /note="BsmBI" + terminator 2310..2341 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 2342..2444 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 2237..2892 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcaagcccg tgaccctgta cgacgtggcc gagtacgccg gcgtgagcta + 1201 ccagaccgtg agccgcgtgg tgaaccaggc cagccacgtg agcgccaaga cccgcgagaa + 1261 ggtggaggcc gccatggccg agctgaatta catcccaaat cgcgtggccc agcagctggc + 1321 cggcaagcag agcctgctga tcggagtggc aacaagcagc ctggccctgc acgcacctag + 1381 ccagatcgtg gcagccatca agagccgcgc cgaccagctg ggagccagcg tggttgtgag + 1441 catggtggag cgcagcggag tggaggcctg caaggccgcc gtgcacaacc tgctggcaca + 1501 gcgcgtgagc ggactgatca tcaactaccc tctggacgac caggacgcca tcgcagtgga + 1561 agcagcctgc acaaacgtgc ccgcactgtt tctggatgtg agcgatcaga cccccatcaa + 1621 cagcatcatc ttcagccacg aagatggcac ccgcctggga gtggagcacc tggtggccct + 1681 gggccaccag cagatcgcac tgctggccgg cccactgagc agcgtgagcg cacgcctgcg + 1741 cctggcaggc tggcacaagt acctgacccg caaccagatc cagcctatcg ccgaacgcga + 1801 aggcgattgg agcgccatga gcggatttca gcagaccatg cagatgctga acgagggaat + 1861 cgtgcctacc gccatgctgg tggccaacga ccagatggcc ctgggagcca tgcgcgccat + 1921 caccgagagc ggcctgcgcg tgggagcaga catcagcgtg gtgggatacg acgacaccga + 1981 agacagcagc tgctacatcc ctcctctgac aaccatcaag caggacttcc gcctgctggg + 2041 ccagaccagc gtggaccgcc tgctgcagct gagccaggga caggccgtga agggaaacca + 2101 gctgctgcct gtgagcctgg tgaagcgcaa gaccaccctg gcacccaaca cccagaccgc + 2161 cagcccccgc gccctggccg acagcctgat gcagctggcc cgccaggtga gccgcctgga + 2221 aagcggacag tcaggccgag acgaagacga attctctaga tatcgctcaa tactgaccat + 2281 ttaaatcata cctgacctcc atagcagaaa gtcaaaagcc tccgaccgga ggcttttgac + 2341 ttgatcggca cgtaagaggt tccaactttc accataatga aataagatca ctaccgggcg + 2401 tattttttga gttatcgaga ttttcaggag ctaaggaagc taaaatgagc catattcaac + 2461 gggaaacgtc ttgctcgagg ccgcgattaa attccaacat ggatgctgat ttatatgggt + 2521 ataaatgggc tcgcgataat gtcgggcaat caggtgcgac aatctatcga ttgtatggga + 2581 agcccgatgc gccagagttg tttctgaaac atggcaaagg tagcgttgcc aatgatgtta + 2641 cagatgagat ggtcaggcta aactggctga cggaatttat gcctcttccg accatcaagc + 2701 attttatccg tactcctgat gatgcatggt tactcaccac tgcgatccca gggaaaacag + 2761 cattccaggt attagaagaa tatcctgatt caggtgaaaa tattgttgat gcgctggcag + 2821 tgttcctgcg ccggttgcat tcgattcctg tttgtaattg tccttttaac ggcgatcgcg + 2881 tatttcgtct cg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_mcherry.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_mcherry.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,89 @@ +LOCUS . 2520 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1858 + /codon_start=1 + /note="mCherry- codon optimized" + /translation="VSKGEEDNMAIIKEFMRFKVHMEGSVNGHEFEIEGEGEGRPYEGT + QTAKLKVTKGGPLPFAWDILSPQFMYGSKAYVKHPADIPDYLKLSFPEGFKWERVMNFE + DGGVVTVTQDSSLQDGEFIYKVKLRGTNFPSDGPVMQKKTMGWEASSERMYPEDGALKG + EIKQRLKLKDGGHYDAEVKTTYKAKKPVQLPGAYNVNIKLDITSHNEDYTIVEQYERAE + GRHSTGGMDELYK" + source 1154..1860 + /source="Exported" + misc_feature complement(1866..1871) + /note="BsmBI" + terminator 1938..1969 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1970..2072 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1865..2520 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcgtgagca agggcgagga ggacaacatg gccatcatca aggagttcat + 1201 gcgcttcaag gtgcacatgg agggcagcgt gaacggccac gagttcgaga tcgagggcga + 1261 gggcgagggc cgcccctacg agggcaccca gaccgccaag ctgaaggtga ccaagggcgg + 1321 ccccctgccc ttcgcctggg acatcctgag cccccagttc atgtacggca gcaaggccta + 1381 cgtgaagcac cccgccgaca tccccgacta cctgaagctg agcttccccg agggcttcaa + 1441 gtgggagcgc gtgatgaact tcgaggacgg cggcgtggtg accgtgaccc aggacagcag + 1501 cctgcaggac ggcgagttca tctacaaggt gaagctgcgc ggcaccaact tccccagcga + 1561 cggccccgtg atgcagaaga agaccatggg ctgggaggcc agcagcgagc gcatgtaccc + 1621 cgaggacggc gccctgaagg gcgagatcaa gcagcgcctg aagctgaagg acggcggcca + 1681 ctacgacgcc gaggtgaaga ccacctacaa ggccaagaag cccgtgcagc tgcccggcgc + 1741 ctacaacgtg aacatcaagc tggacatcac cagccacaac gaggactaca ccatcgtgga + 1801 gcagtacgag cgcgccgagg gccgccacag caccggcggc atggacgagc tgtacaagtc + 1861 aggccgagac gaagacgaat tctctagata tcgctcaata ctgaccattt aaatcatacc + 1921 tgacctccat agcagaaagt caaaagcctc cgaccggagg cttttgactt gatcggcacg + 1981 taagaggttc caactttcac cataatgaaa taagatcact accgggcgta ttttttgagt + 2041 tatcgagatt ttcaggagct aaggaagcta aaatgagcca tattcaacgg gaaacgtctt + 2101 gctcgaggcc gcgattaaat tccaacatgg atgctgattt atatgggtat aaatgggctc + 2161 gcgataatgt cgggcaatca ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc + 2221 cagagttgtt tctgaaacat ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg + 2281 tcaggctaaa ctggctgacg gaatttatgc ctcttccgac catcaagcat tttatccgta + 2341 ctcctgatga tgcatggtta ctcaccactg cgatcccagg gaaaacagca ttccaggtat + 2401 tagaagaata tcctgattca ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc + 2461 ggttgcattc gattcctgtt tgtaattgtc cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_mkate2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_mkate2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,90 @@ +LOCUS . 2508 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1846 + /codon_start=1 + /gene="mKate2" + /note="mKate2" + /translation="VSELIKENMHMKLYMEGTVNNHHFKCTSEGEGKPYEGTQTMRIKA + VEGGPLPFAFDILATSFMYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGVLTA + TQDTSLQDGCLIYNVKIRGVNFPSNGPVMQKKTLGWEASTETLYPADGGLEGRADMALK + LVGGGHLICNLKTTYRSKKPAKNLKMPGVYYVDRRLERIKEADKETYVEQHEVAVARYC + DLPSKLGHR" + source 1154..1848 + /source="Exported" + misc_feature complement(1854..1859) + /note="BsmBI" + terminator 1926..1957 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1958..2060 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1853..2508 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcgtgagcg agctgattaa ggagaacatg cacatgaagc tgtacatgga + 1201 gggcaccgtg aacaaccacc acttcaagtg cacatccgag ggcgaaggca agccctacga + 1261 gggcacccag accatgagaa tcaaggcggt cgagggcggc cctctcccct tcgccttcga + 1321 catcctggct accagcttca tgtacggcag caaaaccttc atcaaccaca cccagggcat + 1381 ccccgacttc tttaagcagt ccttccccga gggcttcaca tgggagagag tcaccacata + 1441 cgaagacggg ggcgtgctga ccgctaccca ggacaccagc ctccaggacg gctgcctcat + 1501 ctacaacgtc aagatcagag gggtgaactt cccatccaac ggccctgtga tgcagaagaa + 1561 aacactcggc tgggaggcct ccaccgaaac cctgtacccc gctgacggcg gcctggaagg + 1621 cagagccgac atggccctga agctcgtggg cgggggccac ctgatctgca acttgaagac + 1681 cacatacaga tccaagaaac ccgctaagaa cctcaagatg cccggcgtct actatgtgga + 1741 cagaagactg gaaagaatca aggaggccga caaagaaacc tacgtcgagc agcacgaggt + 1801 ggctgtggcc agatactgcg acctccctag caaactgggg cacagatcag gccgagacga + 1861 agacgaattc tctagatatc gctcaatact gaccatttaa atcatacctg acctccatag + 1921 cagaaagtca aaagcctccg accggaggct tttgacttga tcggcacgta agaggttcca + 1981 actttcacca taatgaaata agatcactac cgggcgtatt ttttgagtta tcgagatttt + 2041 caggagctaa ggaagctaaa atgagccata ttcaacggga aacgtcttgc tcgaggccgc + 2101 gattaaattc caacatggat gctgatttat atgggtataa atgggctcgc gataatgtcg + 2161 ggcaatcagg tgcgacaatc tatcgattgt atgggaagcc cgatgcgcca gagttgtttc + 2221 tgaaacatgg caaaggtagc gttgccaatg atgttacaga tgagatggtc aggctaaact + 2281 ggctgacgga atttatgcct cttccgacca tcaagcattt tatccgtact cctgatgatg + 2341 catggttact caccactgcg atcccaggga aaacagcatt ccaggtatta gaagaatatc + 2401 ctgattcagg tgaaaatatt gttgatgcgc tggcagtgtt cctgcgccgg ttgcattcga + 2461 ttcctgtttg taattgtcct tttaacggcg atcgcgtatt tcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_mneogreen.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_mneogreen.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,91 @@ +LOCUS . 2520 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1858 + /codon_start=1 + /note="mNeonGreen" + /product="bright monomeric yellow-green fluorescent protein + derived from LanYFP (Shaner et al., 2013)" + /translation="VSKGEEDNMASLPATHELHIFGSINGVDFDMVGQGTGNPNDGYEE + LNLKSTKGDLQFSPWILVPHIGYGFHQYLPYPDGMSPFQAAMVDGSGYQVHRTMQFEDG + ASLTVNYRYTYEGSHIKGEAQVKGTGFPADGPVMTNSLTAADWCRSKKTYPNDKTIIST + FKWSYTTGNGKRYRSTARTTYTFAKPMAANYLKNQPMYVFRKTELKHSKTELNFKEWQK + AFTDVMGMDELYK" + source 1154..1860 + /source="Exported" + misc_feature complement(1866..1871) + /note="BsmBI" + terminator 1938..1969 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1970..2072 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1865..2520 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcgtgagca agggcgagga ggataacatg gcctctctcc cagcgacaca + 1201 tgagttacac atctttggct ccatcaacgg tgtggacttt gacatggtgg gtcagggcac + 1261 cggcaatcca aatgatggtt atgaggagtt aaacctgaag tccaccaagg gtgacctcca + 1321 gttctccccc tggattctgg tccctcatat cgggtatggc ttccatcagt acctgcccta + 1381 ccctgacggg atgtcgcctt tccaggccgc catggtagat ggctccggat accaagtcca + 1441 tcgcacaatg cagtttgaag atggtgcctc ccttactgtt aactaccgct acacctacga + 1501 gggaagccac atcaaaggag aggcccaggt gaaggggact ggtttccctg ctgacggtcc + 1561 tgtgatgacc aactcgctga ccgctgcgga ctggtgcagg tcgaagaaga cttaccccaa + 1621 cgacaaaacc atcatcagta cctttaagtg gagttacacc actggaaatg gcaagcgcta + 1681 ccggagcact gcgcggacca cctacacctt tgccaagcca atggcggcta actatctgaa + 1741 gaaccagccg atgtacgtgt tccgtaagac ggagctcaag cactccaaga ccgagctcaa + 1801 cttcaaggag tggcaaaagg cctttaccga tgtgatgggc atggacgagc tgtacaagtc + 1861 aggccgagac gaagacgaat tctctagata tcgctcaata ctgaccattt aaatcatacc + 1921 tgacctccat agcagaaagt caaaagcctc cgaccggagg cttttgactt gatcggcacg + 1981 taagaggttc caactttcac cataatgaaa taagatcact accgggcgta ttttttgagt + 2041 tatcgagatt ttcaggagct aaggaagcta aaatgagcca tattcaacgg gaaacgtctt + 2101 gctcgaggcc gcgattaaat tccaacatgg atgctgattt atatgggtat aaatgggctc + 2161 gcgataatgt cgggcaatca ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc + 2221 cagagttgtt tctgaaacat ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg + 2281 tcaggctaaa ctggctgacg gaatttatgc ctcttccgac catcaagcat tttatccgta + 2341 ctcctgatga tgcatggtta ctcaccactg cgatcccagg gaaaacagca ttccaggtat + 2401 tagaagaata tcctgattca ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc + 2461 ggttgcattc gattcctgtt tgtaattgtc cttttaacgg cgatcgcgta tttcgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_mruby2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_mruby2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2523 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1861 + /codon_start=1 + /note="mRuby2" + /product="monomeric red fluorescent protein derived from + mRuby, with improved photophysical properties (Lam et al., + 2012)" + /translation="VSKGEELIKENMRMKVVMEGSVNGHQFKCTGEGEGNPYMGTQTMR + IKVIEGGPLPFAFDILATSFMYGSRTFIKYPKGIPDFFKQSFPEGFTWERVTRYEDGGV + VTVMQDTSLEDGCLVYHVQVRGVNFPSNGPVMQKKTKGWEPNTEMMYPADGGLRGYTHM + ALKVDGGGHLSCSFVTTYRSKKTVGNIKMPGIHAVDHRLERLEESDNEMFVVQREHAVA + KFAGLGGGMDELYK" + source 1154..1863 + /source="Exported" + misc_feature complement(1869..1874) + /note="BsmBI" + terminator 1941..1972 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1973..2075 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1868..2523 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcgtgtcta agggcgaaga gctgatcaag gaaaatatgc gtatgaaggt + 1201 ggtcatggaa ggttcggtca acggccacca attcaaatgc acaggtgaag gagaaggcaa + 1261 tccgtacatg ggaactcaaa ccatgaggat caaagtcatc gagggaggac ccctgccatt + 1321 tgcctttgac attcttgcca cgtcgttcat gtatggcagc cgtactttta tcaagtaccc + 1381 gaaaggcatt cctgatttct ttaaacagtc ctttcctgag ggttttactt gggaaagagt + 1441 tacgagatac gaagatggtg gagtcgtcac cgtcatgcag gacaccagcc ttgaggatgg + 1501 ctgtctcgtt taccacgtcc aagtcagagg ggtaaacttt ccctccaatg gtcccgtgat + 1561 gcagaagaag accaagggtt gggagcctaa tacagagatg atgtatccag cagatggtgg + 1621 tctgagggga tacactcata tggcactgaa agttgatggt ggtggccatc tgtcttgctc + 1681 tttcgtaaca acttacaggt caaaaaagac cgtcgggaac atcaagatgc ccggtatcca + 1741 tgccgttgat caccgcctgg aaaggttaga ggaaagtgac aatgaaatgt tcgtagtaca + 1801 acgcgaacac gcagttgcca agttcgccgg gcttggtggt gggatggacg agctgtacaa + 1861 gtcaggccga gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat + 1921 acctgacctc catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc + 1981 acgtaagagg ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg + 2041 agttatcgag attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt + 2101 cttgctcgag gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg + 2161 ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg + 2221 cgccagagtt gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga + 2281 tggtcaggct aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc + 2341 gtactcctga tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg + 2401 tattagaaga atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc + 2461 gccggttgca ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc + 2521 tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p7_mtagbfp2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p7_mtagbfp2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2523 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + CDS 1154..1861 + /codon_start=1 + /note="mTagBFP2" + /note="mammalian codon-optimized" + /product="enhanced monomeric blue fluorescent protein + (Subach et al., 2011)" + /translation="VSKGEELIKENMHMKLYMEGTVDNHHFKCTSEGEGKPYEGTQTMR + IKVVEGGPLPFAFDILATSFLYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGV + LTATQDTSLQDGCLIYNVKIRGVNFTSNGPVMQKKTLGWEAFTETLYPADGGLEGRNDM + ALKLVGGSHLIANAKTTYRSKKPAKNLKMPGVYYVDYRLERIKEANNETYVEQHEVAVA + RYCDLPSKLGHKLN" + source 1154..1863 + /source="Exported" + misc_feature complement(1869..1874) + /note="BsmBI" + terminator 1941..1972 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1973..2075 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1868..2523 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcgc agcgtgtcta agggcgaaga gctgattaag gagaacatgc acatgaagct + 1201 gtacatggag ggcaccgtgg acaaccatca cttcaagtgc acatccgagg gcgaaggcaa + 1261 gccctacgag ggcacccaga ccatgagaat caaggtggtc gagggcggcc ctctcccctt + 1321 cgccttcgac atcctggcta ctagcttcct ctacggcagc aagaccttca tcaaccacac + 1381 ccagggcatc cccgacttct tcaagcagtc cttccctgag ggcttcacat gggagagagt + 1441 caccacatac gaagacgggg gcgtgctgac cgctacccag gacaccagcc tccaggacgg + 1501 ctgcctcatc tacaacgtca agatcagagg ggtgaacttc acatccaacg gccctgtgat + 1561 gcagaagaaa acactcggct gggaggcctt caccgaaacg ctgtaccccg ctgacggcgg + 1621 cctggaaggc agaaacgaca tggccctgaa gctcgtgggc gggagccatc tgatcgcaaa + 1681 cgccaagacc acatatagat ccaagaaacc cgctaagaac ctcaagatgc ctggcgtcta + 1741 ctatgtggac tacagactgg aaagaatcaa ggaggccaac aacgaaacct acgtcgagca + 1801 gcacgaggtg gcagtggcca gatactgcga cctccctagc aaactggggc acaagcttaa + 1861 ttcaggccga gacgaagacg aattctctag atatcgctca atactgacca tttaaatcat + 1921 acctgacctc catagcagaa agtcaaaagc ctccgaccgg aggcttttga cttgatcggc + 1981 acgtaagagg ttccaacttt caccataatg aaataagatc actaccgggc gtattttttg + 2041 agttatcgag attttcagga gctaaggaag ctaaaatgag ccatattcaa cgggaaacgt + 2101 cttgctcgag gccgcgatta aattccaaca tggatgctga tttatatggg tataaatggg + 2161 ctcgcgataa tgtcgggcaa tcaggtgcga caatctatcg attgtatggg aagcccgatg + 2221 cgccagagtt gtttctgaaa catggcaaag gtagcgttgc caatgatgtt acagatgaga + 2281 tggtcaggct aaactggctg acggaattta tgcctcttcc gaccatcaag cattttatcc + 2341 gtactcctga tgatgcatgg ttactcacca ctgcgatccc agggaaaaca gcattccagg + 2401 tattagaaga atatcctgat tcaggtgaaa atattgttga tgcgctggca gtgttcctgc + 2461 gccggttgca ttcgattcct gtttgtaatt gtccttttaa cggcgatcgc gtatttcgtc + 2521 tcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p8_linker1.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p8_linker1.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1864 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..1864 + /codon_start=1 + /note="Linker 1" + /translation="SGLRSGSGGGSASGGSG" + source 1814..1864 + /source="Exported" +ORIGIN + 1 gcgtcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcga ggctctggac tcagatctgg cagcggagga ggcagcgcat ctggcggaag + 1861 cgga +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p8_linker2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p8_linker2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,74 @@ +LOCUS . 1849 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..1849 + /codon_start=1 + /note="Linker 2" + /translation="GSAGSAAGSGEF" + source 1814..1849 + /source="Exported" +ORIGIN + 1 gcgtcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcga ggcggcagcg ccggcagcgc cgccggcagc ggcgagttc +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p8_p2a.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p8_p2a.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,80 @@ +LOCUS . 1870 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..1870 + /codon_start=1 + /note="P2A-Porcine teschovirus-1" + /note="Eukaryotic ribosomes fail to insert a peptide bond + between the Gly and Pro residues, yielding separate + polypeptides." + /product="2A peptide from porcine teschovirus-1 + polyprotein" + /translation="ATNFSLLKQAGDVEENPGP" + source 1814..1870 + /source="Exported" +ORIGIN + 1 gcgtcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcga ggcgctacta acttcagcct gctgaagcag gctggcgacg tggaggagaa + 1861 ccctggacct +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p8a_ct-kdel.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p8a_ct-kdel.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,75 @@ +LOCUS . 1863 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1814..1828 + /codon_start=1 + /note="KDEL" + /translation="KDEL" + source 1814..1863 + /source="Exported" +ORIGIN + 1 atcccgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcga ggcaaggacg agctgtaagc ggccgcgact ctagatcata atcagccata + 1861 cca +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p8b_ires2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p8b_ires2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,84 @@ +LOCUS . 2427 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + terminator 392..419 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + rep_origin complement(431..1018) + /direction=LEFT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 1040..1069 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + misc_feature 1143..1148 + /note="BsmBI" + source 5..1149 + /source="Exported" + misc_feature 1182..1767 + /note="IRES2" + /note="internal ribosome entry site (IRES) of the + encephalomyocarditis virus (EMCV)" + source 1154..1767 + /source="Exported" + misc_feature complement(1773..1778) + /note="BsmBI" + terminator 1845..1876 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + promoter 1877..1979 + /note="cat promoter" + /note="promoter of the E. coli cat gene" + source 1772..2427 + /source="Exported" +ORIGIN + 1 ctcaggcgca atcacgaatg aataacggtt tggttggtgc gagtgatttt gatgacgagc + 61 gtaatggctg gcctgttgaa caagtctgga aagaaatgca taagcttttg ccattctcac + 121 cggattcagt cgtcactcat ggtgatttct cacttgataa ccttattttt gacgagggga + 181 aattaatagg ttgtattgat gttggacgag tcggaatcgc agaccgatac caggatcttg + 241 ccatcctatg gaactgcctc ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa + 301 aatatggtat tgataatcct gatatgaata aattgcagtt tcacttgatg ctcgatgagt + 361 ttttctaatg agggcccaaa tgtaatcacc tggctcacct tcgggtgggc ctttctgcgt + 421 tgctggcgtt tttccatagg ctccgccccc ctgacgagca tcacaaaaat cgatgctcaa + 481 gtcagaggtg gcgaaacccg acaggactat aaagatacca ggcgtttccc cctggaagct + 541 ccctcgtgcg ctctcctgtt ccgaccctgc cgcttaccgg atacctgtcc gcctttctcc + 601 cttcgggaag cgtggcgctt tctcatagct cacgctgtag gtatctcagt tcggtgtagg + 661 tcgttcgctc caagctgggc tgtgtgcacg aaccccccgt tcagcccgac cgctgcgcct + 721 tatccggtaa ctatcgtctt gagtccaacc cggtaagaca cgacttatcg ccactggcag + 781 cagccactgg taacaggatt agcagagcga ggtatgtagg cggtgctaca gagttcttga + 841 agtggtggcc taactacggc tacactagaa gaacagtatt tggtatctgc gctctgctga + 901 agccagttac ctcggaaaaa gagttggtag ctcttgatcc ggcaaacaaa ccaccgctgg + 961 tagcggtggt ttttttgttt gcaagcagca gattacgcgc agaaaaaaag gatctcaaga + 1021 agatcctttg attttctacc gaagaaaggc ccacccgtga aggtgagcca gtgagttgat + 1081 tgcagtccag ttacgctgga gtctgaggct cgtcctgaat gatatcaagc ttgaattcgt + 1141 tacgtctcga tcccgctcga taagcttgat atcgaattcc gcccctctcc ctcccccccc + 1201 cctaacgtta ctggccgaag ccgcttggaa taaggccggt gtgcgtttgt ctatatgtta + 1261 ttttccacca tattgccgtc ttttggcaat gtgagggccc ggaaacctgg ccctgtcttc + 1321 ttgacgagca ttcctagggg tctttcccct ctcgccaaag gaatgcaagg tctgttgaat + 1381 gtcgtgaagg aagcagttcc tctggaagct tcttgaagac aaacaacgtc tgtagcgacc + 1441 ctttgcaggc agcggaaccc cccacctggc gacaggtgcc tctgcggcca aaagccacgt + 1501 gtataagata cacctgcaaa ggcggcacaa ccccagtgcc acgttgtgag ttggatagtt + 1561 gtggaaagag tcaaatggct ctcctcaagc gtattcaaca aggggctgaa ggatgcccag + 1621 aaggtacccc attgtatggg atctgatctg gggcctcggt gcacatgctt tacatgtgtt + 1681 tagtcgaggt taaaaaacgt ctaggccccc cgaaccacgg ggacgtggtt ttcctttgaa + 1741 aaacacgatg ataatatggc cacaaccgcg tcgagacgaa gacgaattct ctagatatcg + 1801 ctcaatactg accatttaaa tcatacctga cctccatagc agaaagtcaa aagcctccga + 1861 ccggaggctt ttgacttgat cggcacgtaa gaggttccaa ctttcaccat aatgaaataa + 1921 gatcactacc gggcgtattt tttgagttat cgagattttc aggagctaag gaagctaaaa + 1981 tgagccatat tcaacgggaa acgtcttgct cgaggccgcg attaaattcc aacatggatg + 2041 ctgatttata tgggtataaa tgggctcgcg ataatgtcgg gcaatcaggt gcgacaatct + 2101 atcgattgta tgggaagccc gatgcgccag agttgtttct gaaacatggc aaaggtagcg + 2161 ttgccaatga tgttacagat gagatggtca ggctaaactg gctgacggaa tttatgcctc + 2221 ttccgaccat caagcatttt atccgtactc ctgatgatgc atggttactc accactgcga + 2281 tcccagggaa aacagcattc caggtattag aagaatatcc tgattcaggt gaaaatattg + 2341 ttgatgcgct ggcagtgttc ctgcgccggt tgcattcgat tcctgtttgt aattgtcctt + 2401 ttaacggcga tcgcgtattt cgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_a-tubulin.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_a-tubulin.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,103 @@ +LOCUS . 3175 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + CDS 7..1359 + /codon_start=1 + /note="a-Tubulin" + /translation="VRECISIHVGQAGVQIGNACWELYCLEHGIQPDGQMPSDKTIGGG + DDSFNTFFSETGAGKHVPRAVFVDLEPTVIDEVRTGTYRQLFHPEQLITGKEDAANNYA + RGHYTIGKEIIDLVLDRIRKLADQCTGLQGFLVFHSFGGGTGSGFTSLLMERLSVDYGK + KSKLEFSIYPAPQVSTAVVEPYNSILTTHTTLEHSDCAFMVDNEAIYDICRRNLDIERP + TYTNLNRLISQIVSSITASLRFDGALNVDLTEFQTNLVPYPRIHFPLATYAPVISAEKA + YHEQLSVAEITNACFEPANQMVKCDPRHGKYMACCLLYRGDVVPKDVNAAIATIKTKRS + IQFVDWCPTGFKVGINYQPPTVVPGGDLAKVQRAVCMLSNTTAIAEAWARLDHKFDLMY + AKRAFVHWYVGEGMEEGEFSEAREDMAALEKDYEEVGVDSVEGEGEEEGEEY" + source 5..1366 + /source="Exported" + misc_feature complement(1372..1377) + /note="BsmBI" + terminator 1452..1481 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 1503..2090 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 2102..2129 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 1371..2516 + /source="Exported" + promoter complement(2969..3071) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 3072..3103 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 3169..3174 + /note="BsmBI" + source 2521..3175 + /source="Exported" +ORIGIN + 1 gcgtccgtgc gtgagtgcat ctccatccac gttggccagg ctggtgtcca gattggcaat + 61 gcctgctggg agctctactg cctggaacac ggcatccagc ccgatggcca gatgccaagt + 121 gacaagacca ttgggggagg agatgactcc ttcaacacct tcttcagtga aacgggcgct + 181 ggcaagcacg tgccccgggc tgtgtttgta gacttggaac ccacagtcat tgatgaagtt + 241 cgcactggca cctaccgcca gctcttccac cctgagcagc tcatcacagg caaggaagat + 301 gctgccaata actatgcccg agggcactac accattggca aggagatcat tgaccttgtg + 361 ttggaccgaa ttcgcaagct ggctgaccag tgcaccggtc ttcagggctt cttggttttc + 421 cacagctttg gtgggggaac tggttctggg ttcacctccc tgctcatgga acgcctctca + 481 gttgattatg gcaagaagtc caagctggag ttctccattt acccagcacc ccaggtttcc + 541 acagctgtag ttgagcccta caactccatc ctcaccaccc acaccaccct ggagcactct + 601 gattgtgcct tcatggtaga caatgaggcc atctatgaca tctgtcgtag aaacctcgat + 661 atcgagcgcc caacctacac taaccttaac cgccttatta gccagattgt gtcctccatc + 721 actgcttccc tgagatttga tggagccctg aatgttgacc tgacagaatt ccagaccaac + 781 ctggtgccct acccccgcat ccacttccct ctggccacat atgcccctgt catctctgct + 841 gagaaagcct accatgaaca gctttctgta gcagagatca ccaatgcttg ctttgagcca + 901 gccaaccaga tggtgaaatg tgaccctcgc catggtaaat acatggcttg ctgcctgttg + 961 taccgtggtg acgtggttcc caaagatgtc aatgctgcca ttgccaccat caaaaccaag + 1021 cgcagcatcc agtttgtgga ttggtgcccc actggcttca aggttggcat caactaccag + 1081 cctcccactg tggtgcctgg tggcgacctg gccaaggtac agagagctgt gtgcatgctg + 1141 agcaacacca cagccattgc tgaggcctgg gctcgcctgg accacaagtt tgacctgatg + 1201 tatgccaagc gtgcctttgt tcactggtac gtgggtgagg ggatggagga aggcgagttt + 1261 tcagaggccc gtgaagatat ggctgccctt gagaaggatt atgaggaggt tggtgtggat + 1321 tctgttgaag gagagggtga ggaagaagga gaggaatact aataactgct cgagacgaaa + 1381 acgaattcaa gcttgatatc attcaggacg agcctcagac tccagcgtaa ctggactgca + 1441 atcaactcac tggctcacct tcacgggtgg gcctttcttc ggtagaaaat caaaggatct + 1501 tcttgagatc ctttttttct gcgcgtaatc tgctgcttgc aaacaaaaaa accaccgcta + 1561 ccagcggtgg tttgtttgcc ggatcaagag ctaccaactc tttttccgag gtaactggct + 1621 tcagcagagc gcagatacca aatactgttc ttctagtgta gccgtagtta ggccaccact + 1681 tcaagaactc tgtagcaccg cctacatacc tcgctctgct aatcctgtta ccagtggctg + 1741 ctgccagtgg cgataagtcg tgtcttaccg ggttggactc aagacgatag ttaccggata + 1801 aggcgcagcg gtcgggctga acggggggtt cgtgcacaca gcccagcttg gagcgaacga + 1861 cctacaccga actgagatac ctacagcgtg agctatgaga aagcgccacg cttcccgaag + 1921 ggagaaaggc ggacaggtat ccggtaagcg gcagggtcgg aacaggagag cgcacgaggg + 1981 agcttccagg gggaaacgcc tggtatcttt atagtcctgt cgggtttcgc cacctctgac + 2041 ttgagcatcg atttttgtga tgctcgtcag gggggcggag cctatggaaa aacgccagca + 2101 acgcagaaag gcccacccga aggtgagcca ggtgattaca tttgggccct cattagaaaa + 2161 actcatcgag catcaagtga aactgcaatt tattcatatc aggattatca ataccatatt + 2221 tttgaaaaag ccgtttctgt aatgaaggag aaaactcacc gaggcagttc cataggatgg + 2281 caagatcctg gtatcggtct gcgattccga ctcgtccaac atcaatacaa cctattaatt + 2341 tcccctcgtc aaaaataagg ttatcaagtg agaaatcacc atgagtgacg actgaatccg + 2401 gtgagaatgg caaaagctta tgcatttctt tccagacttg ttcaacaggc cagccattac + 2461 gctcgtcatc aaaatcactc gcaccaacca aaccgttatt cattcgtgat tgcgcctgag + 2521 cgagacgaaa tacgcgatcg ccgttaaaag gacaattaca aacaggaatc gaatgcaacc + 2581 ggcgcaggaa cactgccagc gcatcaacaa tattttcacc tgaatcagga tattcttcta + 2641 atacctggaa tgctgttttc cctgggatcg cagtggtgag taaccatgca tcatcaggag + 2701 tacggataaa atgcttgatg gtcggaagag gcataaattc cgtcagccag tttagcctga + 2761 ccatctcatc tgtaacatca ttggcaacgc tacctttgcc atgtttcaga aacaactctg + 2821 gcgcatcggg cttcccatac aatcgataga ttgtcgcacc tgattgcccg acattatcgc + 2881 gagcccattt atacccatat aaatcagcat ccatgttgga atttaatcgc ggcctcgagc + 2941 aagacgtttc ccgttgaata tggctcattt tagcttcctt agctcctgaa aatctcgata + 3001 actcaaaaaa tacgcccggt agtgatctta tttcattatg gtgaaagttg gaacctctta + 3061 cgtgccgatc aagtcaaaag cctccggtcg gaggcttttg actttctgct atggaggtca + 3121 ggtatgattt aaatggtcag tattgagcga tatctagaga attcgtcacg tctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_bsdr.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_bsdr.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,82 @@ +LOCUS . 2214 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2208 + /codon_start=1 + /note="BSDR- Human codon opt" + /translation="AKPLSQEESTLIERATATINSIPISEDYSVASAALSSDGRIFTGV + NVYHFTGGPCAELVVLGTAAAAAAGNLTCIVAIGNENRGILSPCGRCRQVLLDLHPGIK + AIVKDSDGQPTAVGIRELLPSGYVWEG" + source 1814..2214 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccgccaa gcctctgagc caggaggaga gcaccctgat cgagcgcgcc + 1861 accgccacca tcaacagcat ccctatcagc gaagactaca gcgtggccag cgccgctctg + 1921 agcagcgacg gccgcatctt cacaggagtg aacgtgtacc acttcaccgg aggaccttgc + 1981 gccgaactgg tggtgctggg caccgctgcc gctgctgccg ctggaaacct gacctgcatc + 2041 gtggccatcg gcaacgagaa ccgcggaatc ctgagccctt gcggccgctg ccgccaggtg + 2101 ctgctggacc tgcaccccgg catcaaggcc atcgtgaagg acagcgacgg ccagcccacc + 2161 gccgtgggca tccgcgagct gctgcccagc ggctacgtgt gggaaggcta ataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_dmrc.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_dmrc.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,83 @@ +LOCUS . 2101 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2094 + /codon_start=1 + /note="FRB* (DmrC)" + /note="binds synthetic ligands such as AP21967" + /product="T2098L mutant of FKBP-rapamycin binding domain of + human FRAP" + /translation="ILWHEMWHEGLEEASRLYFGERNVKGMFEVLEPLHAMMERGPQTL + KETSFNQAYGRDLMEAQEWCRKYMKSGNVKDLLQAWDLYYHVFRRISK" + source 1814..2101 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccatcct ctggcatgag atgtggcatg aaggcctgga agaggcatct + 1861 cgtttgtact ttggggaaag gaacgtgaaa ggcatgtttg aggtgctgga gcccttgcat + 1921 gctatgatgg aacggggccc ccagactctg aaggaaacat cctttaatca ggcctatggt + 1981 cgagatttaa tggaggccca agagtggtgc aggaagtaca tgaaatcagg gaatgtcaag + 2041 gacctcctcc aagcctggga cctctattat catgtgttcc gacgaatctc aaagtaataa + 2101 c +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_firefly luciferase.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_firefly luciferase.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,120 @@ +LOCUS . 3549 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + CDS 7..1653 + /codon_start=1 + /note="Firefly luciferase" + /translation="EDAKNIKKGPAPRYPLEDGTAGEQLHKAMKRYAQVPGTIAFTDAH + IEVNITYAEYFEMSVRLAEAMKRYGLNTNHRIVVCSENSLQFFMPVLGALFIGVAVAPA + NDIYNERELLNSMNISQPTVVFVSKKGLQKILNVQKKLPIIQKIIIMDSKTDYQGFQSM + YTFVTSHLPPGFNEYDFKPESFDRDKTIALIMNSSGSTGLPKGVALPHRTACVRFSHAR + DPIFGNQIKPDTAILSVVPFHHGFGMFTTLGYLICGFRVVLMYRFEEELFLRSLQDYKI + QTALLVPTLFSFFAKSTLIDKYDLSNLHEIASGGAPLSKEVGEAVAKRFHLPGIRQGYG + LTETTSAILITPEGDDKPGAVGKVVPFFEAKVVDLDTGKTLGVNQRGELCVRGPMIMSG + YVNNPEATNALIDKDGWLHSGDIAYWDEDEHFFIVDRLKSLIKYKGYQVAPAELESILL + QHPNIRDAGVAGLPDDDAGELPAAVVVLEHGKTMTEKEIVDYVASQVTTAKKLRGGVVF + VDEVPKGLTGKLDARKIREILIKAKKGGKIAV" + CDS 1654..1668 + /codon_start=1 + /note="Linker" + /translation="SGGGS" + CDS 1669..1734 + /codon_start=1 + /note="3XFLAG" + /translation="DYKDHDGDYKDHDIDYKDDDDK" + source 5..1740 + /source="Exported" + misc_feature complement(1746..1751) + /note="BsmBI" + terminator 1826..1855 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 1877..2464 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 2476..2503 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 1745..2890 + /source="Exported" + promoter complement(3343..3445) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 3446..3477 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 3543..3548 + /note="BsmBI" + source 2895..3549 + /source="Exported" +ORIGIN + 1 gcgtccgagg acgccaagaa catcaagaag ggaccagccc ccagataccc cctggaggac + 61 ggcacagccg gcgagcagct gcacaaggcc atgaagcggt acgcccaggt gccaggcacc + 121 atcgccttca ccgacgccca catcgaggtg aacatcacct acgccgagta cttcgagatg + 181 agcgtgcggc tggccgaggc catgaagcgg tacggcctga acaccaacca ccgcatcgtg + 241 gtttgcagcg aaaacagcct gcagttcttt atgccagttc tgggagcact gttcatcgga + 301 gttgcagtgg ccccagcaaa cgacatctac aacgaacgcg agctgctgaa ctccatgaac + 361 atcagccagc caaccgttgt gttcgtgagc aagaaaggcc tgcagaagat tctgaatgtg + 421 cagaagaagc tgccaatcat tcagaagatc attatcatgg acagcaagac cgattaccag + 481 ggcttccaga gcatgtacac cttcgtgacc agccacctgc ccccaggctt caacgagtac + 541 gacttcaagc ccgagagctt cgaccgggac aagaccatcg ccctgatcat gaacagcagc + 601 ggcagcaccg gcctgcccaa gggcgtggcc ctgccccacc ggaccgcctg cgtgcggttc + 661 agccacgcca gggaccccat cttcggcaac cagatcaagc cagacaccgc tatcctgagc + 721 gttgtgccat tccaccacgg cttcggcatg ttcaccaccc tgggctacct gatctgcggc + 781 ttccgggtgg tgctgatgta caggttcgag gaggagctgt tcctgcggag cctgcaggac + 841 tacaagatcc agaccgccct gctggtgccc accctgttca gcttcttcgc caagagcacc + 901 ctgatcgaca agtacgacct gagcaacctg cacgagatcg cctctggcgg agccccactg + 961 agcaaggagg tgggcgaggc cgtggccaag cggttccacc tgccaggcat ccggcagggc + 1021 tacgggctga ccgaaaccac tagcgccatc ctgatcaccc ccgagggcga cgacaagccc + 1081 ggagccgtgg gcaaggtggt tccattcttt gaggccaaag ttgtggacct ggataccggg + 1141 aagaccctgg gcgtgaacca gagaggcgag ctgtgcgtga gaggccccat gatcatgagc + 1201 ggctacgtga acaaccccga ggccaccaac gccctgatcg acaaggatgg ctggctgcac + 1261 agcggcgaca tcgcctactg ggatgaggac gagcacttct ttatcgtgga tcggctgaag + 1321 agcctgatca aatacaaggg ctaccaggtg gccccagccg agctggagag catcctgctg + 1381 cagcacccca acatccggga cgccggagtg gccggactgc ccgacgacga cgccggagag + 1441 ctgccagccg ccgtggtggt gctggagcac ggcaagacca tgaccgagaa ggagatcgtg + 1501 gactacgtgg ccagccaggt gaccaccgcc aaaaagctga gaggaggcgt ggtcttcgtg + 1561 gatgaagtgc ccaagggcct gaccgggaag ctggacgcca gaaagatccg ggagatcctg + 1621 atcaaggcca agaagggcgg caagatcgca gtgagcggag gcgggagcga ctacaaagac + 1681 catgacggtg attataaaga tcatgacatc gattacaagg atgacgatga caagtaataa + 1741 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 1801 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 1861 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 1921 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 1981 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 2041 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 2101 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 2161 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 2221 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 2281 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 2341 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 2401 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 2461 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 2521 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 2581 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 2641 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 2701 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 2761 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 2821 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 2881 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 2941 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 3001 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 3061 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 3121 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 3181 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 3241 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 3301 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 3361 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 3421 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 3481 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 3541 cacgtctcg +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_mneogreen.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_mneogreen.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,92 @@ +LOCUS . 2526 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2520 + /codon_start=1 + /note="mNeonGreen" + /product="bright monomeric yellow-green fluorescent protein + derived from LanYFP (Shaner et al., 2013)" + /translation="VSKGEEDNMASLPATHELHIFGSINGVDFDMVGQGTGNPNDGYEE + LNLKSTKGDLQFSPWILVPHIGYGFHQYLPYPDGMSPFQAAMVDGSGYQVHRTMQFEDG + ASLTVNYRYTYEGSHIKGEAQVKGTGFPADGPVMTNSLTAADWCRSKKTYPNDKTIIST + FKWSYTTGNGKRYRSTARTTYTFAKPMAANYLKNQPMYVFRKTELKHSKTELNFKEWQK + AFTDVMGMDELYK" + source 1814..2526 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccgtgag caagggcgag gaggataaca tggcctctct cccagcgaca + 1861 catgagttac acatctttgg ctccatcaac ggtgtggact ttgacatggt gggtcagggc + 1921 accggcaatc caaatgatgg ttatgaggag ttaaacctga agtccaccaa gggtgacctc + 1981 cagttctccc cctggattct ggtccctcat atcgggtatg gcttccatca gtacctgccc + 2041 taccctgacg ggatgtcgcc tttccaggcc gccatggtag atggctccgg ataccaagtc + 2101 catcgcacaa tgcagtttga agatggtgcc tcccttactg ttaactaccg ctacacctac + 2161 gagggaagcc acatcaaagg agaggcccag gtgaagggga ctggtttccc tgctgacggt + 2221 cctgtgatga ccaactcgct gaccgctgcg gactggtgca ggtcgaagaa gacttacccc + 2281 aacgacaaaa ccatcatcag tacctttaag tggagttaca ccactggaaa tggcaagcgc + 2341 taccggagca ctgcgcggac cacctacacc tttgccaagc caatggcggc taactatctg + 2401 aagaaccagc cgatgtacgt gttccgtaag acggagctca agcactccaa gaccgagctc + 2461 aacttcaagg agtggcaaaa ggcctttacc gatgtgatgg gcatggacga gctgtacaag + 2521 taataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_mruby2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_mruby2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2529 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2523 + /codon_start=1 + /note="mRuby2" + /product="monomeric red fluorescent protein derived from + mRuby, with improved photophysical properties (Lam et al., + 2012)" + /translation="VSKGEELIKENMRMKVVMEGSVNGHQFKCTGEGEGNPYMGTQTMR + IKVIEGGPLPFAFDILATSFMYGSRTFIKYPKGIPDFFKQSFPEGFTWERVTRYEDGGV + VTVMQDTSLEDGCLVYHVQVRGVNFPSNGPVMQKKTKGWEPNTEMMYPADGGLRGYTHM + ALKVDGGGHLSCSFVTTYRSKKTVGNIKMPGIHAVDHRLERLEESDNEMFVVQREHAVA + KFAGLGGGMDELYK" + source 1814..2529 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccgtgtc taagggcgaa gagctgatca aggaaaatat gcgtatgaag + 1861 gtggtcatgg aaggttcggt caacggccac caattcaaat gcacaggtga aggagaaggc + 1921 aatccgtaca tgggaactca aaccatgagg atcaaagtca tcgagggagg acccctgcca + 1981 tttgcctttg acattcttgc cacgtcgttc atgtatggca gccgtacttt tatcaagtac + 2041 ccgaaaggca ttcctgattt ctttaaacag tcctttcctg agggttttac ttgggaaaga + 2101 gttacgagat acgaagatgg tggagtcgtc accgtcatgc aggacaccag ccttgaggat + 2161 ggctgtctcg tttaccacgt ccaagtcaga ggggtaaact ttccctccaa tggtcccgtg + 2221 atgcagaaga agaccaaggg ttgggagcct aatacagaga tgatgtatcc agcagatggt + 2281 ggtctgaggg gatacactca tatggcactg aaagttgatg gtggtggcca tctgtcttgc + 2341 tctttcgtaa caacttacag gtcaaaaaag accgtcggga acatcaagat gcccggtatc + 2401 catgccgttg atcaccgcct ggaaaggtta gaggaaagtg acaatgaaat gttcgtagta + 2461 caacgcgaac acgcagttgc caagttcgcc gggcttggtg gtgggatgga cgagctgtac + 2521 aagtaataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_mtagbfp2.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_mtagbfp2.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,93 @@ +LOCUS . 2526 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2523 + /codon_start=1 + /note="mTagBFP2" + /note="mammalian codon-optimized" + /product="enhanced monomeric blue fluorescent protein + (Subach et al., 2011)" + /translation="VSKGEELIKENMHMKLYMEGTVDNHHFKCTSEGEGKPYEGTQTMR + IKVVEGGPLPFAFDILATSFLYGSKTFINHTQGIPDFFKQSFPEGFTWERVTTYEDGGV + LTATQDTSLQDGCLIYNVKIRGVNFTSNGPVMQKKTLGWEAFTETLYPADGGLEGRNDM + ALKLVGGSHLIANAKTTYRSKKPAKNLKMPGVYYVDYRLERIKEANNETYVEQHEVAVA + RYCDLPSKLGHKLN" + source 1814..2526 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccgtgtc taagggcgaa gagctgatta aggagaacat gcacatgaag + 1861 ctgtacatgg agggcaccgt ggacaaccat cacttcaagt gcacatccga gggcgaaggc + 1921 aagccctacg agggcaccca gaccatgaga atcaaggtgg tcgagggcgg ccctctcccc + 1981 ttcgccttcg acatcctggc tactagcttc ctctacggca gcaagacctt catcaaccac + 2041 acccagggca tccccgactt cttcaagcag tccttccctg agggcttcac atgggagaga + 2101 gtcaccacat acgaagacgg gggcgtgctg accgctaccc aggacaccag cctccaggac + 2161 ggctgcctca tctacaacgt caagatcaga ggggtgaact tcacatccaa cggccctgtg + 2221 atgcagaaga aaacactcgg ctgggaggcc ttcaccgaaa cgctgtaccc cgctgacggc + 2281 ggcctggaag gcagaaacga catggccctg aagctcgtgg gcgggagcca tctgatcgca + 2341 aacgccaaga ccacatatag atccaagaaa cccgctaaga acctcaagat gcctggcgtc + 2401 tactatgtgg actacagact ggaaagaatc aaggaggcca acaacgaaac ctacgtcgag + 2461 cagcacgagg tggcagtggc cagatactgc gacctcccta gcaaactggg gcacaagctt + 2521 aattaa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_neor.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_neor.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,94 @@ +LOCUS . 2628 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2628 + /codon_start=1 + /note="KanR/NeoR" + /note="confers resistance to kanamycin in bacteria or G418 + (Geneticin(R)) in eukaryotes" + /product="aminoglycoside phosphotransferase" + /translation="SHIQRETSCSRPRLNSNMDADLYGYKWARDNVGQSGATIYRLYGK + PDAPELFLKHGKGSVANDVTDEMVRLNWLTEFMPLPTIKHFIRTPDDAWLLTTAIPGKT + AFQVLEEYPDSGENIVDALAVFLRRLHSIPVCNCPFNSDRVFRLAQAQSRMNNGLVDAS + DFDDERNGWPVEQVWKEMHKLLPFSPDSVVTHGDFSLDNLIFDEGKLIGCIDVGRVGIA + DRYQDLAILWNCLGEFSPSLQKRLFQKYGIDNPDMNKLQFHLMLDEFF" + source 1814..2628 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccagcca tattcaacgg gaaacgtctt gctcgaggcc gcgattaaat + 1861 tccaacatgg atgctgattt atatgggtat aaatgggctc gcgataatgt cgggcaatca + 1921 ggtgcgacaa tctatcgatt gtatgggaag cccgatgcgc cagagttgtt tctgaaacat + 1981 ggcaaaggta gcgttgccaa tgatgttaca gatgagatgg tcagactaaa ctggctgacg + 2041 gaatttatgc ctcttccgac catcaagcat tttatccgta ctcctgatga tgcatggtta + 2101 ctcaccactg cgatccccgg gaaaacagca ttccaggtat tagaagaata tcctgattca + 2161 ggtgaaaata ttgttgatgc gctggcagtg ttcctgcgcc ggttgcattc gattcctgtt + 2221 tgtaattgtc cttttaacag cgatcgcgta tttcgtctgg ctcaggcgca atcacgaatg + 2281 aataacggtt tggttgatgc gagtgatttt gatgacgagc gtaatggctg gcctgttgaa + 2341 caagtctgga aagaaatgca taagcttttg ccattctcac cggattcagt cgtcactcat + 2401 ggtgatttct cacttgataa ccttattttt gacgagggga aattaatagg ttgtattgat + 2461 gttggacgag tcggaatcgc agaccgatac caggatcttg ccatcctatg gaactgcctc + 2521 ggtgagtttt ctccttcatt acagaaacgg ctttttcaaa aatatggtat tgataatcct + 2581 gatatgaata aattgcagtt tcatttgatg ctcgatgagt ttttctaa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/emma_parts/p9_puror.gb --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/emma_parts/p9_puror.gb Wed Aug 06 08:02:58 2025 +0000 @@ -0,0 +1,90 @@ +LOCUS . 2415 bp DNA UNK 01-JAN-1980 +DEFINITION . +ACCESSION +VERSION +KEYWORDS . +SOURCE . + ORGANISM . + . +FEATURES Location/Qualifiers + misc_feature complement(6..11) + /note="BsmBI" + terminator 86..115 + /note="T3Te terminator" + /note="phage T3 early transcription terminator" + rep_origin 137..724 + /direction=RIGHT + /note="ori" + /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of + replication" + terminator 736..763 + /note="T7Te terminator" + /note="phage T7 early transcription terminator" + source 5..1150 + /source="Exported" + promoter complement(1603..1705) + /note="cat promoter" + /note="promoter of the E. coli cat gene" + terminator 1706..1737 + /note="tonB terminator" + /note="bidirectional E. coli tonB-P14 transcription + terminator" + misc_feature 1803..1808 + /note="BsmBI" + source 1155..1809 + /source="Exported" + CDS 1816..2412 + /codon_start=1 + /gene="pac from Streptomyces" + /note="PuroR" + /note="confers resistance to puromycin" + /product="puromycin N-acetyltransferase" + /translation="TEYKPTVRLATRDDVPRAVRTLAAAFADYPATRHTVDPDRHIERV + TELQELFLTRVGLDIGKVWVADDGAAVAVWTTPESVEAGAVFAEIGPRMAELSGSRLAA + QQQMEGLLAPHRPKEPAWFLATVGVSPDHQGKGLGSAVVLPGVEAAERAGVPAFLETSA + PRNLPFYERLGFTVTADVECPKDRATWCMTRKPGA" + source 1814..2415 + /source="Exported" +ORIGIN + 1 tgctcgagac gaaaacgaat tcaagcttga tatcattcag gacgagcctc agactccagc + 61 gtaactggac tgcaatcaac tcactggctc accttcacgg gtgggccttt cttcggtaga + 121 aaatcaaagg atcttcttga gatccttttt ttctgcgcgt aatctgctgc ttgcaaacaa + 181 aaaaaccacc gctaccagcg gtggtttgtt tgccggatca agagctacca actctttttc + 241 cgaggtaact ggcttcagca gagcgcagat accaaatact gttcttctag tgtagccgta + 301 gttaggccac cacttcaaga actctgtagc accgcctaca tacctcgctc tgctaatcct + 361 gttaccagtg gctgctgcca gtggcgataa gtcgtgtctt accgggttgg actcaagacg + 421 atagttaccg gataaggcgc agcggtcggg ctgaacgggg ggttcgtgca cacagcccag + 481 cttggagcga acgacctaca ccgaactgag atacctacag cgtgagctat gagaaagcgc + 541 cacgcttccc gaagggagaa aggcggacag gtatccggta agcggcaggg tcggaacagg + 601 agagcgcacg agggagcttc cagggggaaa cgcctggtat ctttatagtc ctgtcgggtt + 661 tcgccacctc tgacttgagc atcgattttt gtgatgctcg tcaggggggc ggagcctatg + 721 gaaaaacgcc agcaacgcag aaaggcccac ccgaaggtga gccaggtgat tacatttggg + 781 ccctcattag aaaaactcat cgagcatcaa gtgaaactgc aatttattca tatcaggatt + 841 atcaatacca tatttttgaa aaagccgttt ctgtaatgaa ggagaaaact caccgaggca + 901 gttccatagg atggcaagat cctggtatcg gtctgcgatt ccgactcgtc caacatcaat + 961 acaacctatt aatttcccct cgtcaaaaat aaggttatca agtgagaaat caccatgagt + 1021 gacgactgaa tccggtgaga atggcaaaag cttatgcatt tctttccaga cttgttcaac + 1081 aggccagcca ttacgctcgt catcaaaatc actcgcacca accaaaccgt tattcattcg + 1141 tgattgcgcc tgagcgagac gaaatacgcg atcgccgtta aaaggacaat tacaaacagg + 1201 aatcgaatgc aaccggcgca ggaacactgc cagcgcatca acaatatttt cacctgaatc + 1261 aggatattct tctaatacct ggaatgctgt tttccctggg atcgcagtgg tgagtaacca + 1321 tgcatcatca ggagtacgga taaaatgctt gatggtcgga agaggcataa attccgtcag + 1381 ccagtttagc ctgaccatct catctgtaac atcattggca acgctacctt tgccatgttt + 1441 cagaaacaac tctggcgcat cgggcttccc atacaatcga tagattgtcg cacctgattg + 1501 cccgacatta tcgcgagccc atttataccc atataaatca gcatccatgt tggaatttaa + 1561 tcgcggcctc gagcaagacg tttcccgttg aatatggctc attttagctt ccttagctcc + 1621 tgaaaatctc gataactcaa aaaatacgcc cggtagtgat cttatttcat tatggtgaaa + 1681 gttggaacct cttacgtgcc gatcaagtca aaagcctccg gtcggaggct tttgactttc + 1741 tgctatggag gtcaggtatg atttaaatgg tcagtattga gcgatatcta gagaattcgt + 1801 cacgtctcgg cgtccaccga gtacaagccc acggtgcgcc tcgccacccg cgacgacgtc + 1861 cccagggccg tacgcaccct cgccgccgcg ttcgccgact accccgccac gcgccacacc + 1921 gtcgatccgg accgccacat cgagcgggtc accgagctgc aagaactctt cctcacgcgc + 1981 gtcgggctcg acatcggcaa ggtgtgggtc gcggacgacg gcgccgcggt ggcggtctgg + 2041 accacgccgg agagcgtcga agcgggggcg gtgttcgccg agatcggccc gcgcatggcc + 2101 gagttgagcg gttcccggct ggccgcgcag caacagatgg aaggcctcct ggcgccgcac + 2161 cggcccaagg agcccgcgtg gttcctggcc accgtcggcg tgtcgcccga ccaccagggc + 2221 aagggtctgg gcagcgccgt cgtgctcccc ggagtggagg cggccgagcg cgccggggtg + 2281 cccgccttcc tggaaacctc cgcgccccgc aacctcccct tctacgagcg gctcggcttc + 2341 accgtcaccg ccgacgtcga gtgcccgaag gaccgcgcga cctggtgcat gacccgcaag + 2401 cccggtgcct aataa +// diff -r 000000000000 -r 4bde3e90ee98 test-data/example_echo_plate.xlsx Binary file test-data/example_echo_plate.xlsx has changed diff -r 000000000000 -r 4bde3e90ee98 test-data/example_picklist.xls Binary file test-data/example_picklist.xls has changed