# HG changeset patch # User bgruening # Date 1426613974 14400 # Node ID 257453ff1f3d3e65d16b71365ee058cd97ec50ee # Parent b876c71cc0b18d00768e00fc7ab7baa523df6a88 Uploaded diff -r b876c71cc0b1 -r 257453ff1f3d P61920.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/P61920.fasta Tue Mar 17 13:39:34 2015 -0400 @@ -0,0 +1,4 @@ +>sp|P61920|HBG1_PANTR Hemoglobin subunit gamma-1 OS=Pan troglodytes GN=HBG1 PE=1 SV=2 +MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK +VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG +KEFTPEVQASWQKMVTAVASALSSRYH diff -r b876c71cc0b1 -r 257453ff1f3d P61921.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/P61921.fasta Tue Mar 17 13:39:34 2015 -0400 @@ -0,0 +1,4 @@ +>sp|P61921|HBG2_PANTR Hemoglobin subunit gamma-2 OS=Pan troglodytes GN=HBG2 PE=1 SV=2 +MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK +VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG +KEFTPEVQASWQKMVTGVASALSSRYH diff -r b876c71cc0b1 -r 257453ff1f3d Q6LDH1.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/Q6LDH1.fasta Tue Mar 17 13:39:34 2015 -0400 @@ -0,0 +1,4 @@ +>sp|Q6LDH1|HBE_PANTR Hemoglobin subunit epsilon OS=Pan troglodytes GN=HBE1 PE=2 SV=3 +MVHFTAEEKAAVTSLWSKMNVEEAGGEALGRLLVVYPWTQRFFDSFGNLSSPSAILGNPK +VKAHGKKVLTSFGDAIKNMDNLKPAFAKLSELHCDKLHVDPENFKLLGNVMVIILATHFG +KEFTPEVQAAWQKLVSAVAIALAHKYH diff -r b876c71cc0b1 -r 257453ff1f3d WP_037658548.fasta --- a/WP_037658548.fasta Tue Mar 17 13:33:43 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,9 +0,0 @@ ->gi|739806613|ref|WP_037658548.1| beta-ACP synthase [Streptomyces aurantiacus] -MSGRRVVVTGMEVLAPGGVGTDNFWSLLSEGRTATRGITFFDPAQFRSRVAAEIDFDPYAHGLTPQEVRR -MDRAAQFAVVAARGAVADSGLDTDTLDPYRIGVTIGSAVGATMSLDEDYRVVSDAGRLDLVDHTYADPFF -YNYFVPSSFATEVARLVGAQGPSSVVSAGCTSGLDSVGYAVELIREGTADVMVAGATDAPISPITMACFD -AIKATTPRHDDPEHASRPFDDTRNGFVLGEGTAVFVLEELESARRRGARIYAEIAGYATRSNAYHMTGLR -PDGAEMAEAITVALDEARMNPTAIDYINAHGSGTKQNDRHETAAFKRSLGEHAYRTPVSSIKSMVGHSLG -AIGSIEIAASILAIQHDVVPPTANLHTPDPQCDLDYVPLNAREQIVDAVLTVGSGFGGFQSAMVLAQPER -NAA - diff -r b876c71cc0b1 -r 257453ff1f3d WP_037658557.fasta --- a/WP_037658557.fasta Tue Mar 17 13:33:43 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,7 +0,0 @@ ->gi|739806622|ref|WP_037658557.1| cytochrome P450 [Streptomyces aurantiacus] -MQRTCPFSVPPVYTKFREESPITQVVLPDGGKAWLVTKYDDVRAVMANPKLSSDRRAPDFPVVVPGQNAA -LAKHAPFMIILDGAEHAAARRPVISEFSVRRVAAMKPRIQEIVDGFIDDMLKMPKPVDLNQVFSLPVPSL -VVSEILGMPYEGHEYFMELAEILLRRTTDEQGRIAVSVELRKYMDKLVEEKIENPGDDLLSRQIELQRQQ -GGIDRPQLASLCLLVLLAGHETTANMINLGVFSMLTKPELLAEIKADPSKTPKAVDELLRFYTIPDFGAH -RLALDDVEIGGVLIRKGEAVIASTFAANRDPAVFDDPEELDFGRDARHHVAFGYGPHQCLGQNLGRLELQ -VVFDTLFRRLPELRLAVPEEELSFKSDALVYGLYELPVTW diff -r b876c71cc0b1 -r 257453ff1f3d find_genes_located_nearby.ga --- a/find_genes_located_nearby.ga Tue Mar 17 13:33:43 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,578 +0,0 @@ -{ - "a_galaxy_workflow": "true", - "annotation": "Input are two protein genes in FASTA format. They will be blasted with tblastn against the NCBI NR database. Both results are compared and hits are returned that are close to each other.", - "format-version": "0.1", - "name": "Finding 2 genes close to each other", - "steps": { - "0": { - "annotation": "", - "id": 0, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Protein in FASTA format" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 248, - "top": 311 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Protein in FASTA format\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "1": { - "annotation": "", - "id": 1, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Protein in FASTA format" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 250, - "top": 386 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Protein in FASTA format\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "2": { - "annotation": "", - "id": 2, - "input_connections": { - "query": { - "id": 0, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ tblastn", - "outputs": [ - { - "name": "output1", - "type": "tabular" - } - ], - "position": { - "left": 380.6166687011719, - "top": 224.61666870117188 - }, - "post_job_actions": { - "HideDatasetActionoutput1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", - "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_opts_selector\\\": \\\"basic\\\", \\\"__current_case__\\\": 0}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"db\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": \\\"\\\", \\\"__current_case__\\\": 0, \\\"database\\\": \\\"nt_28-09-14\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"cols\\\", \\\"std_cols\\\": [\\\"sseqid\\\", \\\"sstart\\\", \\\"send\\\", \\\"bitscore\\\"], \\\"ids_cols\\\": null, \\\"tax_cols\\\": null, \\\"__current_case__\\\": 2, \\\"misc_cols\\\": null, \\\"ext_cols\\\": null}\", \"query\": \"null\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "3": { - "annotation": "", - "id": 3, - "input_connections": { - "query": { - "id": 1, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ tblastn", - "outputs": [ - { - "name": "output1", - "type": "tabular" - } - ], - "position": { - "left": 393.6166687011719, - "top": 444.6166687011719 - }, - "post_job_actions": { - "HideDatasetActionoutput1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", - "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_opts_selector\\\": \\\"basic\\\", \\\"__current_case__\\\": 0}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"db\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": \\\"\\\", \\\"__current_case__\\\": 0, \\\"database\\\": \\\"nt_28-09-14\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"cols\\\", \\\"std_cols\\\": [\\\"sseqid\\\", \\\"sstart\\\", \\\"send\\\", \\\"bitscore\\\"], \\\"ids_cols\\\": null, \\\"tax_cols\\\": null, \\\"__current_case__\\\": 2, \\\"misc_cols\\\": null, \\\"ext_cols\\\": null}\", \"query\": \"null\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "4": { - "annotation": "", - "id": 4, - "input_connections": { - "input": { - "id": 2, - "output_name": "output1" - } - }, - "inputs": [], - "name": "Filter", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 656.5, - "top": 190.5 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "Filter1", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c4>150\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "5": { - "annotation": "", - "id": 5, - "input_connections": { - "input": { - "id": 3, - "output_name": "output1" - } - }, - "inputs": [], - "name": "Filter", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 609.5, - "top": 349.5 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Filter1", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c4>150\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "6": { - "annotation": "", - "id": 6, - "input_connections": { - "input": { - "id": 4, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 715, - "top": 224 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "7": { - "annotation": "", - "id": 7, - "input_connections": { - "input": { - "id": 5, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 661.5, - "top": 381.5 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "8": { - "annotation": "", - "id": 8, - "input_connections": { - "input": { - "id": 6, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 767, - "top": 260 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "9": { - "annotation": "", - "id": 9, - "input_connections": { - "input": { - "id": 7, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 714.5, - "top": 416.5 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "10": { - "annotation": "", - "id": 10, - "input_connections": { - "input": { - "id": 8, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 957, - "top": 271 - }, - "post_job_actions": { - "ChangeDatatypeActionout_file1": { - "action_arguments": { - "newtype": "interval" - }, - "action_type": "ChangeDatatypeAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c1,c6,c5\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "11": { - "annotation": "", - "id": 11, - "input_connections": { - "input": { - "id": 9, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 768.5, - "top": 452.5 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c5-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "12": { - "annotation": "", - "id": 12, - "input_connections": { - "input": { - "id": 11, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 819.5, - "top": 489.5 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c6+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "13": { - "annotation": "", - "id": 13, - "input_connections": { - "input": { - "id": 12, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 953.5, - "top": 392.5 - }, - "post_job_actions": { - "ChangeDatatypeActionout_file1": { - "action_arguments": { - "newtype": "interval" - }, - "action_type": "ChangeDatatypeAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"columnList\": \"\\\"c1,c7,c8\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "14": { - "annotation": "", - "id": 14, - "input_connections": { - "input1": { - "id": 10, - "output_name": "out_file1" - }, - "input2": { - "id": 13, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Intersect", - "outputs": [ - { - "name": "output", - "type": "input" - } - ], - "position": { - "left": 1160.9166870117188, - "top": 325.91668701171875 - }, - "post_job_actions": { - "HideDatasetActionoutput": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", - "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", - "tool_version": "1.0.0", - "type": "tool", - "user_outputs": [] - }, - "15": { - "annotation": "", - "id": 15, - "input_connections": { - "input": { - "id": 14, - "output_name": "output" - } - }, - "inputs": [], - "name": "Sort", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 1154.9166870117188, - "top": 458.91668701171875 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "sort1", - "tool_state": "{\"__page__\": 0, \"style\": \"\\\"alpha\\\"\", \"column\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"order\": \"\\\"DESC\\\"\", \"input\": \"null\", \"column_set\": \"[{\\\"other_order\\\": \\\"DESC\\\", \\\"__index__\\\": 0, \\\"other_column\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"2\\\"}, \\\"other_style\\\": \\\"num\\\"}]\"}", - "tool_version": "1.0.3", - "type": "tool", - "user_outputs": [] - }, - "16": { - "annotation": "", - "id": 16, - "input_connections": { - "input1": { - "id": 15, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Group", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 1352.5, - "top": 399 - }, - "post_job_actions": { - "RenameDatasetActionout_file1": { - "action_arguments": { - "newname": "Counting hits per genome" - }, - "action_type": "RenameDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Grouping1", - "tool_state": "{\"operations\": \"[{\\\"opcol\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"__index__\\\": 0, \\\"optype\\\": \\\"length\\\", \\\"opround\\\": \\\"no\\\"}]\", \"__page__\": 0, \"input1\": \"null\", \"ignorelines\": \"null\", \"groupcol\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"ignorecase\": \"\\\"False\\\"\"}", - "tool_version": "2.1.0", - "type": "tool", - "user_outputs": [] - } - }, - "uuid": "12fe8ac4-30db-4db4-b8f9-7c44e0cc0788" -} diff -r b876c71cc0b1 -r 257453ff1f3d find_genes_located_nearby.png Binary file find_genes_located_nearby.png has changed diff -r b876c71cc0b1 -r 257453ff1f3d find_three_genes_located_nearby.ga --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/find_three_genes_located_nearby.ga Tue Mar 17 13:39:34 2015 -0400 @@ -0,0 +1,957 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "Input are two protein genes in FASTA format. They will be blasted with tblastn against the NCBI NR database. Both results are compared and hits are returned that are close to each other.", + "format-version": "0.1", + "name": "Finding 3 genes close to each other", + "steps": { + "0": { + "annotation": "", + "id": 0, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Nucleotide Reference Database" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 289, + "top": 247 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Nucleotide Reference Database\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "1": { + "annotation": "", + "id": 1, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Protein in FASTA format" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 248.38333129882812, + "top": 474.3833312988281 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Protein in FASTA format\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "2": { + "annotation": "", + "id": 2, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Protein in FASTA format" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 250.38333129882812, + "top": 545.3833312988281 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Protein in FASTA format\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "3": { + "annotation": "", + "id": 3, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Protein in FASTA format" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 259.1166687011719, + "top": 754.61669921875 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Protein in FASTA format\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "4": { + "annotation": "", + "id": 4, + "input_connections": { + "input_file": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ makeblastdb", + "outputs": [ + { + "name": "outfile", + "type": "data" + } + ], + "position": { + "left": 526.5, + "top": 196 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_makeblastdb/0.1.01", + "tool_state": "{\"__page__\": 0, \"mask_data_file\": \"null\", \"input_file\": \"null\", \"dbtype\": \"\\\"nucl\\\"\", \"__rerun_remap_job_id__\": null, \"hash_index\": \"\\\"True\\\"\", \"tax\": \"{\\\"taxselect\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"title\": \"\\\"\\\"\", \"parse_seqids\": \"\\\"True\\\"\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "5": { + "annotation": "", + "id": 5, + "input_connections": { + "db_opts|histdb": { + "id": 4, + "output_name": "outfile" + }, + "query": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ tblastn", + "outputs": [ + { + "name": "output1", + "type": "tabular" + } + ], + "position": { + "left": 429.5, + "top": 381 + }, + "post_job_actions": { + "HideDatasetActionoutput1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", + "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "6": { + "annotation": "", + "id": 6, + "input_connections": { + "db_opts|histdb": { + "id": 4, + "output_name": "outfile" + }, + "query": { + "id": 2, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ tblastn", + "outputs": [ + { + "name": "output1", + "type": "tabular" + } + ], + "position": { + "left": 421.5, + "top": 618 + }, + "post_job_actions": { + "HideDatasetActionoutput1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", + "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "7": { + "annotation": "", + "id": 7, + "input_connections": { + "db_opts|histdb": { + "id": 4, + "output_name": "outfile" + }, + "query": { + "id": 3, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ tblastn", + "outputs": [ + { + "name": "output1", + "type": "tabular" + } + ], + "position": { + "left": 426.6166687011719, + "top": 827.61669921875 + }, + "post_job_actions": { + "HideDatasetActionoutput1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", + "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "8": { + "annotation": "", + "id": 8, + "input_connections": { + "input": { + "id": 5, + "output_name": "output1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 710.3833312988281, + "top": 415.3833312988281 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "9": { + "annotation": "", + "id": 9, + "input_connections": { + "input": { + "id": 6, + "output_name": "output1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 683.3833312988281, + "top": 702.38330078125 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "10": { + "annotation": "", + "id": 10, + "input_connections": { + "input": { + "id": 7, + "output_name": "output1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 722.1166687011719, + "top": 887.61669921875 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "11": { + "annotation": "", + "id": 11, + "input_connections": { + "input": { + "id": 8, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 768.3833312988281, + "top": 386.3833312988281 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "12": { + "annotation": "", + "id": 12, + "input_connections": { + "input": { + "id": 9, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 747.8833312988281, + "top": 673.88330078125 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "13": { + "annotation": "", + "id": 13, + "input_connections": { + "input": { + "id": 10, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 769.1166687011719, + "top": 879.61669921875 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "14": { + "annotation": "", + "id": 14, + "input_connections": { + "input": { + "id": 11, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 847.38330078125, + "top": 383.3833312988281 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "15": { + "annotation": "", + "id": 15, + "input_connections": { + "input": { + "id": 12, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 801.8833312988281, + "top": 668.88330078125 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "16": { + "annotation": "", + "id": 16, + "input_connections": { + "input": { + "id": 13, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 813.1166687011719, + "top": 871.61669921875 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "17": { + "annotation": "", + "id": 17, + "input_connections": { + "input": { + "id": 14, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 920.38330078125, + "top": 387.3833312988281 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "interval" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + }, + "RenameDatasetActionout_file1": { + "action_arguments": { + "newname": "" + }, + "action_type": "RenameDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c1,c5,c4\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "18": { + "annotation": "", + "id": 18, + "input_connections": { + "input": { + "id": 15, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 854.88330078125, + "top": 661.88330078125 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c4-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "19": { + "annotation": "", + "id": 19, + "input_connections": { + "input": { + "id": 16, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 857.11669921875, + "top": 863.61669921875 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c4-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "20": { + "annotation": "", + "id": 20, + "input_connections": { + "input": { + "id": 18, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 911.88330078125, + "top": 658.88330078125 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c5+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "21": { + "annotation": "", + "id": 21, + "input_connections": { + "input": { + "id": 19, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 907.11669921875, + "top": 854.61669921875 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c5+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "22": { + "annotation": "", + "id": 22, + "input_connections": { + "input": { + "id": 20, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 963.88330078125, + "top": 657.88330078125 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "interval" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"\\\"c1,c6,c7\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "23": { + "annotation": "", + "id": 23, + "input_connections": { + "input": { + "id": 21, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 968.11669921875, + "top": 852.61669921875 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "interval" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + }, + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"\\\"c1,c6,c7\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "24": { + "annotation": "", + "id": 24, + "input_connections": { + "input1": { + "id": 17, + "output_name": "out_file1" + }, + "input2": { + "id": 22, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Intersect", + "outputs": [ + { + "name": "output", + "type": "input" + } + ], + "position": { + "left": 1099.11669921875, + "top": 501.6166687011719 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", + "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "25": { + "annotation": "", + "id": 25, + "input_connections": { + "input1": { + "id": 24, + "output_name": "output" + }, + "input2": { + "id": 23, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Intersect", + "outputs": [ + { + "name": "output", + "type": "input" + } + ], + "position": { + "left": 1137.11669921875, + "top": 755.61669921875 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", + "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "26": { + "annotation": "", + "id": 26, + "input_connections": { + "input": { + "id": 25, + "output_name": "output" + } + }, + "inputs": [], + "name": "Sort", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 1216.11669921875, + "top": 648.1166687011719 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "sort1", + "tool_state": "{\"__page__\": 0, \"style\": \"\\\"alpha\\\"\", \"column\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"order\": \"\\\"DESC\\\"\", \"input\": \"null\", \"column_set\": \"[{\\\"other_order\\\": \\\"DESC\\\", \\\"__index__\\\": 0, \\\"other_column\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"2\\\"}, \\\"other_style\\\": \\\"num\\\"}]\"}", + "tool_version": "1.0.3", + "type": "tool", + "user_outputs": [] + }, + "27": { + "annotation": "", + "id": 27, + "input_connections": { + "input1": { + "id": 26, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Group", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 1396.88330078125, + "top": 648.3833312988281 + }, + "post_job_actions": { + "RenameDatasetActionout_file1": { + "action_arguments": { + "newname": "Counting hits per genome" + }, + "action_type": "RenameDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Grouping1", + "tool_state": "{\"operations\": \"[{\\\"opcol\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"__index__\\\": 0, \\\"optype\\\": \\\"length\\\", \\\"opround\\\": \\\"no\\\"}]\", \"__page__\": 0, \"input1\": \"null\", \"ignorelines\": \"null\", \"groupcol\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"ignorecase\": \"\\\"False\\\"\"}", + "tool_version": "2.1.0", + "type": "tool", + "user_outputs": [] + } + }, + "uuid": "ea8b8757-5fcb-4451-b305-31db0e5349fd" +} \ No newline at end of file diff -r b876c71cc0b1 -r 257453ff1f3d find_three_genes_located_nearby.png Binary file find_three_genes_located_nearby.png has changed diff -r b876c71cc0b1 -r 257453ff1f3d readme.rst --- a/readme.rst Tue Mar 17 13:33:43 2015 -0400 +++ b/readme.rst Tue Mar 17 13:39:34 2015 -0400 @@ -1,52 +1,61 @@ Galaxy workflow for the identification of candidate genes clusters ------------------------------------------------------------------ -This approach screens two proteins against all nucleotide sequence from the -NCBI nt database within hours on our cluster, leading to all organisms with an inter- -esting gene structure for further investigation. As usual in Galaxy workflows every +This approach screens three proteins against a given genome sequence, leading to a genome position +were all three genes are located nearby. As usual in Galaxy workflows every parameter, including the proximity distance, can be changed and additional steps can be easily added. For example additional filtering to refine the initial BLAST hits, or inclusion of a third query sequence. -.. image:: https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_genes_located_nearby/find_genes_located_nearby.png +.. image:: https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby/find_three_genes_located_nearby.png Sample Data =========== -As an example, we will use two protein sequences from *Streptomyces aurantiacus* -that are part of a gene cluster, responsible for metabolite producion. +As an example, we will use three protein sequences from *Pan troglodytes* (Chimpanzee) +which are part of the β-globin cluster. -You can upload both sequences directly into Galaxy using the "Upload File" tool +You can upload all sequences directly into Galaxy using the "Upload tool" with either of these URLs - Galaxy should recognise this is FASTA files. -* `WP_037658548.fasta `_ -* `WP_037658557.fasta `_ +Query sequences: -In addition you can find both sequences at the NCBI server: - * http://www.ncbi.nlm.nih.gov/protein/739806622 (cytochrome P450) - :: - - >gi|739806622|ref|WP_037658557.1| cytochrome P450 [Streptomyces aurantiacus] - MQRTCPFSVPPVYTKFREESPITQVVLPDGGKAWLVTKYDDVRAVMANPKLSSDRRAPDFPVVVPGQNAA - LAKHAPFMIILDGAEHAAARRPVISEFSVRRVAAMKPRIQEIVDGFIDDMLKMPKPVDLNQVFSLPVPSL - VVSEILGMPYEGHEYFMELAEILLRRTTDEQGRIAVSVELRKYMDKLVEEKIENPGDDLLSRQIELQRQQ - GGIDRPQLASLCLLVLLAGHETTANMINLGVFSMLTKPELLAEIKADPSKTPKAVDELLRFYTIPDFGAH - RLALDDVEIGGVLIRKGEAVIASTFAANRDPAVFDDPEELDFGRDARHHVAFGYGPHQCLGQNLGRLELQ - VVFDTLFRRLPELRLAVPEEELSFKSDALVYGLYELPVTW +* `P61920.fasta `_ +* `P61921.fasta `_ +* `Q6LDH1.fasta `_ + +Genome sequence: + +* http://hgdownload.cse.ucsc.edu/goldenPath/rn6/bigZips/rn6.fa.gz - * http://www.ncbi.nlm.nih.gov/protein/739806613 (beta-ACP synthase) +In addition you can find the query sequences at the UniProt server: + * http://www.uniprot.org/uniprot/P61920 (Hemoglobin subunit gamma-1) + :: + + >sp|P61920|HBG1_PANTR Hemoglobin subunit gamma-1 OS=Pan troglodytes GN=HBG1 PE=1 SV=2 + MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK + VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG + KEFTPEVQASWQKMVTAVASALSSRYH + + + * http://www.uniprot.org/uniprot/P61921 (Hemoglobin subunit gamma-2) :: - - >gi|739806613|ref|WP_037658548.1| beta-ACP synthase [Streptomyces aurantiacus] - MSGRRVVVTGMEVLAPGGVGTDNFWSLLSEGRTATRGITFFDPAQFRSRVAAEIDFDPYAHGLTPQEVRR - MDRAAQFAVVAARGAVADSGLDTDTLDPYRIGVTIGSAVGATMSLDEDYRVVSDAGRLDLVDHTYADPFF - YNYFVPSSFATEVARLVGAQGPSSVVSAGCTSGLDSVGYAVELIREGTADVMVAGATDAPISPITMACFD - AIKATTPRHDDPEHASRPFDDTRNGFVLGEGTAVFVLEELESARRRGARIYAEIAGYATRSNAYHMTGLR - PDGAEMAEAITVALDEARMNPTAIDYINAHGSGTKQNDRHETAAFKRSLGEHAYRTPVSSIKSMVGHSLG - AIGSIEIAASILAIQHDVVPPTANLHTPDPQCDLDYVPLNAREQIVDAVLTVGSGFGGFQSAMVLAQPER - NAA + + >sp|P61921|HBG2_PANTR Hemoglobin subunit gamma-2 OS=Pan troglodytes GN=HBG2 PE=1 SV=2 + MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK + VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG + KEFTPEVQASWQKMVTGVASALSSRYH + + + * http://www.uniprot.org/uniprot/Q6LDH1 (Hemoglobin subunit epsilon) + :: + + >sp|Q6LDH1|HBE_PANTR Hemoglobin subunit epsilon OS=Pan troglodytes GN=HBE1 PE=2 SV=3 + MVHFTAEEKAAVTSLWSKMNVEEAGGEALGRLLVVYPWTQRFFDSFGNLSSPSAILGNPK + VKAHGKKVLTSFGDAIKNMDNLKPAFAKLSELHCDKLHVDPENFKLLGNVMVIILATHFG + KEFTPEVQAAWQKLVSAVAIALAHKYH Citation @@ -68,11 +77,11 @@ This workflow is available on the main Galaxy Tool Shed: -http://toolshed.g2.bx.psu.edu/view/bgruening/find_genes_located_nearby_workflow +http://toolshed.g2.bx.psu.edu/view/bgruening/find_three_genes_located_nearby_workflow Development is being done on github: -https://github.com/bgruening/galaxytools/tree/master/workflows/ncbi_blast_plus/find_genes_located_nearby +https://github.com/bgruening/galaxytools/tree/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby Dependencies