Mercurial > repos > bgruening > find_three_genes_located_nearby_workflow
changeset 2:b876c71cc0b1 draft
Uploaded
author | bgruening |
---|---|
date | Tue, 17 Mar 2015 13:33:43 -0400 |
parents | 3dd8f7b4703b |
children | 257453ff1f3d |
files | P61920.fasta P61921.fasta Q6LDH1.fasta WP_037658548.fasta WP_037658557.fasta find_genes_located_nearby.ga find_genes_located_nearby.png find_three_genes_located_nearby.ga find_three_genes_located_nearby.png readme.rst |
diffstat | 10 files changed, 626 insertions(+), 1008 deletions(-) [+] |
line wrap: on
line diff
--- a/P61920.fasta Tue Mar 17 13:27:23 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,4 +0,0 @@ ->sp|P61920|HBG1_PANTR Hemoglobin subunit gamma-1 OS=Pan troglodytes GN=HBG1 PE=1 SV=2 -MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK -VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG -KEFTPEVQASWQKMVTAVASALSSRYH
--- a/P61921.fasta Tue Mar 17 13:27:23 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,4 +0,0 @@ ->sp|P61921|HBG2_PANTR Hemoglobin subunit gamma-2 OS=Pan troglodytes GN=HBG2 PE=1 SV=2 -MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK -VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG -KEFTPEVQASWQKMVTGVASALSSRYH
--- a/Q6LDH1.fasta Tue Mar 17 13:27:23 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,4 +0,0 @@ ->sp|Q6LDH1|HBE_PANTR Hemoglobin subunit epsilon OS=Pan troglodytes GN=HBE1 PE=2 SV=3 -MVHFTAEEKAAVTSLWSKMNVEEAGGEALGRLLVVYPWTQRFFDSFGNLSSPSAILGNPK -VKAHGKKVLTSFGDAIKNMDNLKPAFAKLSELHCDKLHVDPENFKLLGNVMVIILATHFG -KEFTPEVQAAWQKLVSAVAIALAHKYH
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/WP_037658548.fasta Tue Mar 17 13:33:43 2015 -0400 @@ -0,0 +1,9 @@ +>gi|739806613|ref|WP_037658548.1| beta-ACP synthase [Streptomyces aurantiacus] +MSGRRVVVTGMEVLAPGGVGTDNFWSLLSEGRTATRGITFFDPAQFRSRVAAEIDFDPYAHGLTPQEVRR +MDRAAQFAVVAARGAVADSGLDTDTLDPYRIGVTIGSAVGATMSLDEDYRVVSDAGRLDLVDHTYADPFF +YNYFVPSSFATEVARLVGAQGPSSVVSAGCTSGLDSVGYAVELIREGTADVMVAGATDAPISPITMACFD +AIKATTPRHDDPEHASRPFDDTRNGFVLGEGTAVFVLEELESARRRGARIYAEIAGYATRSNAYHMTGLR +PDGAEMAEAITVALDEARMNPTAIDYINAHGSGTKQNDRHETAAFKRSLGEHAYRTPVSSIKSMVGHSLG +AIGSIEIAASILAIQHDVVPPTANLHTPDPQCDLDYVPLNAREQIVDAVLTVGSGFGGFQSAMVLAQPER +NAA +
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/WP_037658557.fasta Tue Mar 17 13:33:43 2015 -0400 @@ -0,0 +1,7 @@ +>gi|739806622|ref|WP_037658557.1| cytochrome P450 [Streptomyces aurantiacus] +MQRTCPFSVPPVYTKFREESPITQVVLPDGGKAWLVTKYDDVRAVMANPKLSSDRRAPDFPVVVPGQNAA +LAKHAPFMIILDGAEHAAARRPVISEFSVRRVAAMKPRIQEIVDGFIDDMLKMPKPVDLNQVFSLPVPSL +VVSEILGMPYEGHEYFMELAEILLRRTTDEQGRIAVSVELRKYMDKLVEEKIENPGDDLLSRQIELQRQQ +GGIDRPQLASLCLLVLLAGHETTANMINLGVFSMLTKPELLAEIKADPSKTPKAVDELLRFYTIPDFGAH +RLALDDVEIGGVLIRKGEAVIASTFAANRDPAVFDDPEELDFGRDARHHVAFGYGPHQCLGQNLGRLELQ +VVFDTLFRRLPELRLAVPEEELSFKSDALVYGLYELPVTW
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/find_genes_located_nearby.ga Tue Mar 17 13:33:43 2015 -0400 @@ -0,0 +1,578 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "Input are two protein genes in FASTA format. They will be blasted with tblastn against the NCBI NR database. Both results are compared and hits are returned that are close to each other.", + "format-version": "0.1", + "name": "Finding 2 genes close to each other", + "steps": { + "0": { + "annotation": "", + "id": 0, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Protein in FASTA format" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 248, + "top": 311 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Protein in FASTA format\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "1": { + "annotation": "", + "id": 1, + "input_connections": {}, + "inputs": [ + { + "description": "", + "name": "Protein in FASTA format" + } + ], + "name": "Input dataset", + "outputs": [], + "position": { + "left": 250, + "top": 386 + }, + "tool_errors": null, + "tool_id": null, + "tool_state": "{\"name\": \"Protein in FASTA format\"}", + "tool_version": null, + "type": "data_input", + "user_outputs": [] + }, + "2": { + "annotation": "", + "id": 2, + "input_connections": { + "query": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ tblastn", + "outputs": [ + { + "name": "output1", + "type": "tabular" + } + ], + "position": { + "left": 380.6166687011719, + "top": 224.61666870117188 + }, + "post_job_actions": { + "HideDatasetActionoutput1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", + "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_opts_selector\\\": \\\"basic\\\", \\\"__current_case__\\\": 0}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"db\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": \\\"\\\", \\\"__current_case__\\\": 0, \\\"database\\\": \\\"nt_28-09-14\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"cols\\\", \\\"std_cols\\\": [\\\"sseqid\\\", \\\"sstart\\\", \\\"send\\\", \\\"bitscore\\\"], \\\"ids_cols\\\": null, \\\"tax_cols\\\": null, \\\"__current_case__\\\": 2, \\\"misc_cols\\\": null, \\\"ext_cols\\\": null}\", \"query\": \"null\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "3": { + "annotation": "", + "id": 3, + "input_connections": { + "query": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "name": "NCBI BLAST+ tblastn", + "outputs": [ + { + "name": "output1", + "type": "tabular" + } + ], + "position": { + "left": 393.6166687011719, + "top": 444.6166687011719 + }, + "post_job_actions": { + "HideDatasetActionoutput1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", + "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_opts_selector\\\": \\\"basic\\\", \\\"__current_case__\\\": 0}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"db\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": \\\"\\\", \\\"__current_case__\\\": 0, \\\"database\\\": \\\"nt_28-09-14\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"cols\\\", \\\"std_cols\\\": [\\\"sseqid\\\", \\\"sstart\\\", \\\"send\\\", \\\"bitscore\\\"], \\\"ids_cols\\\": null, \\\"tax_cols\\\": null, \\\"__current_case__\\\": 2, \\\"misc_cols\\\": null, \\\"ext_cols\\\": null}\", \"query\": \"null\"}", + "tool_version": "0.1.01", + "type": "tool", + "user_outputs": [] + }, + "4": { + "annotation": "", + "id": 4, + "input_connections": { + "input": { + "id": 2, + "output_name": "output1" + } + }, + "inputs": [], + "name": "Filter", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 656.5, + "top": 190.5 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "Filter1", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c4>150\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "5": { + "annotation": "", + "id": 5, + "input_connections": { + "input": { + "id": 3, + "output_name": "output1" + } + }, + "inputs": [], + "name": "Filter", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 609.5, + "top": 349.5 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Filter1", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"header_lines\": \"\\\"0\\\"\", \"cond\": \"\\\"c4>150\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "6": { + "annotation": "", + "id": 6, + "input_connections": { + "input": { + "id": 4, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 715, + "top": 224 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "7": { + "annotation": "", + "id": 7, + "input_connections": { + "input": { + "id": 5, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 661.5, + "top": 381.5 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "8": { + "annotation": "", + "id": 8, + "input_connections": { + "input": { + "id": 6, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 767, + "top": 260 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "9": { + "annotation": "", + "id": 9, + "input_connections": { + "input": { + "id": 7, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 714.5, + "top": 416.5 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "10": { + "annotation": "", + "id": 10, + "input_connections": { + "input": { + "id": 8, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 957, + "top": 271 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "interval" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c1,c6,c5\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "11": { + "annotation": "", + "id": 11, + "input_connections": { + "input": { + "id": 9, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 768.5, + "top": 452.5 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c5-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "12": { + "annotation": "", + "id": 12, + "input_connections": { + "input": { + "id": 11, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 819.5, + "top": 489.5 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", + "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c6+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", + "tool_version": "1.1.0", + "type": "tool", + "user_outputs": [] + }, + "13": { + "annotation": "", + "id": 13, + "input_connections": { + "input": { + "id": 12, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 953.5, + "top": 392.5 + }, + "post_job_actions": { + "ChangeDatatypeActionout_file1": { + "action_arguments": { + "newtype": "interval" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"\\\"c1,c7,c8\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", + "tool_version": "1.0.2", + "type": "tool", + "user_outputs": [] + }, + "14": { + "annotation": "", + "id": 14, + "input_connections": { + "input1": { + "id": 10, + "output_name": "out_file1" + }, + "input2": { + "id": 13, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Intersect", + "outputs": [ + { + "name": "output", + "type": "input" + } + ], + "position": { + "left": 1160.9166870117188, + "top": 325.91668701171875 + }, + "post_job_actions": { + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_errors": null, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", + "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", + "tool_version": "1.0.0", + "type": "tool", + "user_outputs": [] + }, + "15": { + "annotation": "", + "id": 15, + "input_connections": { + "input": { + "id": 14, + "output_name": "output" + } + }, + "inputs": [], + "name": "Sort", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 1154.9166870117188, + "top": 458.91668701171875 + }, + "post_job_actions": {}, + "tool_errors": null, + "tool_id": "sort1", + "tool_state": "{\"__page__\": 0, \"style\": \"\\\"alpha\\\"\", \"column\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"order\": \"\\\"DESC\\\"\", \"input\": \"null\", \"column_set\": \"[{\\\"other_order\\\": \\\"DESC\\\", \\\"__index__\\\": 0, \\\"other_column\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"2\\\"}, \\\"other_style\\\": \\\"num\\\"}]\"}", + "tool_version": "1.0.3", + "type": "tool", + "user_outputs": [] + }, + "16": { + "annotation": "", + "id": 16, + "input_connections": { + "input1": { + "id": 15, + "output_name": "out_file1" + } + }, + "inputs": [], + "name": "Group", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 1352.5, + "top": 399 + }, + "post_job_actions": { + "RenameDatasetActionout_file1": { + "action_arguments": { + "newname": "Counting hits per genome" + }, + "action_type": "RenameDatasetAction", + "output_name": "out_file1" + } + }, + "tool_errors": null, + "tool_id": "Grouping1", + "tool_state": "{\"operations\": \"[{\\\"opcol\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"__index__\\\": 0, \\\"optype\\\": \\\"length\\\", \\\"opround\\\": \\\"no\\\"}]\", \"__page__\": 0, \"input1\": \"null\", \"ignorelines\": \"null\", \"groupcol\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"ignorecase\": \"\\\"False\\\"\"}", + "tool_version": "2.1.0", + "type": "tool", + "user_outputs": [] + } + }, + "uuid": "12fe8ac4-30db-4db4-b8f9-7c44e0cc0788" +}
--- a/find_three_genes_located_nearby.ga Tue Mar 17 13:27:23 2015 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,957 +0,0 @@ -{ - "a_galaxy_workflow": "true", - "annotation": "Input are two protein genes in FASTA format. They will be blasted with tblastn against the NCBI NR database. Both results are compared and hits are returned that are close to each other.", - "format-version": "0.1", - "name": "Finding 3 genes close to each other", - "steps": { - "0": { - "annotation": "", - "id": 0, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Nucleotide Reference Database" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 289, - "top": 247 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Nucleotide Reference Database\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "1": { - "annotation": "", - "id": 1, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Protein in FASTA format" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 248.38333129882812, - "top": 474.3833312988281 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Protein in FASTA format\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "2": { - "annotation": "", - "id": 2, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Protein in FASTA format" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 250.38333129882812, - "top": 545.3833312988281 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Protein in FASTA format\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "3": { - "annotation": "", - "id": 3, - "input_connections": {}, - "inputs": [ - { - "description": "", - "name": "Protein in FASTA format" - } - ], - "name": "Input dataset", - "outputs": [], - "position": { - "left": 259.1166687011719, - "top": 754.61669921875 - }, - "tool_errors": null, - "tool_id": null, - "tool_state": "{\"name\": \"Protein in FASTA format\"}", - "tool_version": null, - "type": "data_input", - "user_outputs": [] - }, - "4": { - "annotation": "", - "id": 4, - "input_connections": { - "input_file": { - "id": 0, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ makeblastdb", - "outputs": [ - { - "name": "outfile", - "type": "data" - } - ], - "position": { - "left": 526.5, - "top": 196 - }, - "post_job_actions": { - "HideDatasetActionoutfile": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "outfile" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_makeblastdb/0.1.01", - "tool_state": "{\"__page__\": 0, \"mask_data_file\": \"null\", \"input_file\": \"null\", \"dbtype\": \"\\\"nucl\\\"\", \"__rerun_remap_job_id__\": null, \"hash_index\": \"\\\"True\\\"\", \"tax\": \"{\\\"taxselect\\\": \\\"\\\", \\\"__current_case__\\\": 0}\", \"title\": \"\\\"\\\"\", \"parse_seqids\": \"\\\"True\\\"\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "5": { - "annotation": "", - "id": 5, - "input_connections": { - "db_opts|histdb": { - "id": 4, - "output_name": "outfile" - }, - "query": { - "id": 1, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ tblastn", - "outputs": [ - { - "name": "output1", - "type": "tabular" - } - ], - "position": { - "left": 429.5, - "top": 381 - }, - "post_job_actions": { - "HideDatasetActionoutput1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", - "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "6": { - "annotation": "", - "id": 6, - "input_connections": { - "db_opts|histdb": { - "id": 4, - "output_name": "outfile" - }, - "query": { - "id": 2, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ tblastn", - "outputs": [ - { - "name": "output1", - "type": "tabular" - } - ], - "position": { - "left": 421.5, - "top": 618 - }, - "post_job_actions": { - "HideDatasetActionoutput1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", - "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "7": { - "annotation": "", - "id": 7, - "input_connections": { - "db_opts|histdb": { - "id": 4, - "output_name": "outfile" - }, - "query": { - "id": 3, - "output_name": "output" - } - }, - "inputs": [], - "name": "NCBI BLAST+ tblastn", - "outputs": [ - { - "name": "output1", - "type": "tabular" - } - ], - "position": { - "left": 426.6166687011719, - "top": 827.61669921875 - }, - "post_job_actions": { - "HideDatasetActionoutput1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "output1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_tblastn_wrapper/0.1.01", - "tool_state": "{\"__page__\": 0, \"evalue_cutoff\": \"\\\"0.001\\\"\", \"adv_opts\": \"{\\\"adv_optional_id_files_opts\\\": {\\\"adv_optional_id_files_opts_selector\\\": \\\"none\\\", \\\"__current_case__\\\": 0}, \\\"matrix\\\": \\\"BLOSUM62\\\", \\\"adv_opts_selector\\\": \\\"advanced\\\", \\\"filter_query\\\": \\\"True\\\", \\\"word_size\\\": \\\"0\\\", \\\"__current_case__\\\": 1, \\\"parse_deflines\\\": \\\"False\\\", \\\"db_gencode\\\": \\\"1\\\", \\\"max_hits\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"db_opts\": \"{\\\"db_opts_selector\\\": \\\"histdb\\\", \\\"subject\\\": \\\"\\\", \\\"histdb\\\": null, \\\"__current_case__\\\": 1, \\\"database\\\": \\\"\\\"}\", \"output\": \"{\\\"out_format\\\": \\\"ext\\\", \\\"__current_case__\\\": 1}\", \"query\": \"null\"}", - "tool_version": "0.1.01", - "type": "tool", - "user_outputs": [] - }, - "8": { - "annotation": "", - "id": 8, - "input_connections": { - "input": { - "id": 5, - "output_name": "output1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 710.3833312988281, - "top": 415.3833312988281 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "9": { - "annotation": "", - "id": 9, - "input_connections": { - "input": { - "id": 6, - "output_name": "output1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 683.3833312988281, - "top": 702.38330078125 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "10": { - "annotation": "", - "id": 10, - "input_connections": { - "input": { - "id": 7, - "output_name": "output1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 722.1166687011719, - "top": 887.61669921875 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"columnList\": \"\\\"c2,c9,c10\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "11": { - "annotation": "", - "id": 11, - "input_connections": { - "input": { - "id": 8, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 768.3833312988281, - "top": 386.3833312988281 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "12": { - "annotation": "", - "id": 12, - "input_connections": { - "input": { - "id": 9, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 747.8833312988281, - "top": 673.88330078125 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "13": { - "annotation": "", - "id": 13, - "input_connections": { - "input": { - "id": 10, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 769.1166687011719, - "top": 879.61669921875 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "14": { - "annotation": "", - "id": 14, - "input_connections": { - "input": { - "id": 11, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 847.38330078125, - "top": 383.3833312988281 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"min(c3,c2)\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\", \"round\": \"\\\"yes\\\"\"}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "15": { - "annotation": "", - "id": 15, - "input_connections": { - "input": { - "id": 12, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 801.8833312988281, - "top": 668.88330078125 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "16": { - "annotation": "", - "id": 16, - "input_connections": { - "input": { - "id": 13, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 813.1166687011719, - "top": 871.61669921875 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c3,c2)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "17": { - "annotation": "", - "id": 17, - "input_connections": { - "input": { - "id": 14, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 920.38330078125, - "top": 387.3833312988281 - }, - "post_job_actions": { - "ChangeDatatypeActionout_file1": { - "action_arguments": { - "newtype": "interval" - }, - "action_type": "ChangeDatatypeAction", - "output_name": "out_file1" - }, - "RenameDatasetActionout_file1": { - "action_arguments": { - "newname": "" - }, - "action_type": "RenameDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"delimiter\": \"\\\"T\\\"\", \"columnList\": \"\\\"c1,c5,c4\\\"\", \"input\": \"null\", \"chromInfo\": \"\\\"/usr/local/galaxy/galaxy-dist/tool-data/shared/ucsc/chrom/?.len\\\"\"}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "18": { - "annotation": "", - "id": 18, - "input_connections": { - "input": { - "id": 15, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 854.88330078125, - "top": 661.88330078125 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c4-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "19": { - "annotation": "", - "id": 19, - "input_connections": { - "input": { - "id": 16, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 857.11669921875, - "top": 863.61669921875 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"max(c4-10000,1)\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "20": { - "annotation": "", - "id": 20, - "input_connections": { - "input": { - "id": 18, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 911.88330078125, - "top": 658.88330078125 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c5+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "21": { - "annotation": "", - "id": 21, - "input_connections": { - "input": { - "id": 19, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Compute", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 907.11669921875, - "top": 854.61669921875 - }, - "post_job_actions": { - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.1.0", - "tool_state": "{\"input\": \"null\", \"__rerun_remap_job_id__\": null, \"cond\": \"\\\"c5+10000\\\"\", \"round\": \"\\\"yes\\\"\", \"__page__\": 0}", - "tool_version": "1.1.0", - "type": "tool", - "user_outputs": [] - }, - "22": { - "annotation": "", - "id": 22, - "input_connections": { - "input": { - "id": 20, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 963.88330078125, - "top": 657.88330078125 - }, - "post_job_actions": { - "ChangeDatatypeActionout_file1": { - "action_arguments": { - "newtype": "interval" - }, - "action_type": "ChangeDatatypeAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"columnList\": \"\\\"c1,c6,c7\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "23": { - "annotation": "", - "id": 23, - "input_connections": { - "input": { - "id": 21, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Cut", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 968.11669921875, - "top": 852.61669921875 - }, - "post_job_actions": { - "ChangeDatatypeActionout_file1": { - "action_arguments": { - "newtype": "interval" - }, - "action_type": "ChangeDatatypeAction", - "output_name": "out_file1" - }, - "HideDatasetActionout_file1": { - "action_arguments": {}, - "action_type": "HideDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Cut1", - "tool_state": "{\"columnList\": \"\\\"c1,c6,c7\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", - "tool_version": "1.0.2", - "type": "tool", - "user_outputs": [] - }, - "24": { - "annotation": "", - "id": 24, - "input_connections": { - "input1": { - "id": 17, - "output_name": "out_file1" - }, - "input2": { - "id": 22, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Intersect", - "outputs": [ - { - "name": "output", - "type": "input" - } - ], - "position": { - "left": 1099.11669921875, - "top": 501.6166687011719 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", - "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", - "tool_version": "1.0.0", - "type": "tool", - "user_outputs": [] - }, - "25": { - "annotation": "", - "id": 25, - "input_connections": { - "input1": { - "id": 24, - "output_name": "output" - }, - "input2": { - "id": 23, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Intersect", - "outputs": [ - { - "name": "output", - "type": "input" - } - ], - "position": { - "left": 1137.11669921875, - "top": 755.61669921875 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/intersect/gops_intersect_1/1.0.0", - "tool_state": "{\"input2\": \"null\", \"__page__\": 0, \"input1\": \"null\", \"min\": \"\\\"1\\\"\", \"__rerun_remap_job_id__\": null, \"returntype\": \"\\\"\\\"\"}", - "tool_version": "1.0.0", - "type": "tool", - "user_outputs": [] - }, - "26": { - "annotation": "", - "id": 26, - "input_connections": { - "input": { - "id": 25, - "output_name": "output" - } - }, - "inputs": [], - "name": "Sort", - "outputs": [ - { - "name": "out_file1", - "type": "input" - } - ], - "position": { - "left": 1216.11669921875, - "top": 648.1166687011719 - }, - "post_job_actions": {}, - "tool_errors": null, - "tool_id": "sort1", - "tool_state": "{\"__page__\": 0, \"style\": \"\\\"alpha\\\"\", \"column\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"order\": \"\\\"DESC\\\"\", \"input\": \"null\", \"column_set\": \"[{\\\"other_order\\\": \\\"DESC\\\", \\\"__index__\\\": 0, \\\"other_column\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"2\\\"}, \\\"other_style\\\": \\\"num\\\"}]\"}", - "tool_version": "1.0.3", - "type": "tool", - "user_outputs": [] - }, - "27": { - "annotation": "", - "id": 27, - "input_connections": { - "input1": { - "id": 26, - "output_name": "out_file1" - } - }, - "inputs": [], - "name": "Group", - "outputs": [ - { - "name": "out_file1", - "type": "tabular" - } - ], - "position": { - "left": 1396.88330078125, - "top": 648.3833312988281 - }, - "post_job_actions": { - "RenameDatasetActionout_file1": { - "action_arguments": { - "newname": "Counting hits per genome" - }, - "action_type": "RenameDatasetAction", - "output_name": "out_file1" - } - }, - "tool_errors": null, - "tool_id": "Grouping1", - "tool_state": "{\"operations\": \"[{\\\"opcol\\\": {\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}, \\\"__index__\\\": 0, \\\"optype\\\": \\\"length\\\", \\\"opround\\\": \\\"no\\\"}]\", \"__page__\": 0, \"input1\": \"null\", \"ignorelines\": \"null\", \"groupcol\": \"{\\\"__class__\\\": \\\"UnvalidatedValue\\\", \\\"value\\\": \\\"1\\\"}\", \"__rerun_remap_job_id__\": null, \"ignorecase\": \"\\\"False\\\"\"}", - "tool_version": "2.1.0", - "type": "tool", - "user_outputs": [] - } - }, - "uuid": "ea8b8757-5fcb-4451-b305-31db0e5349fd" -} \ No newline at end of file
--- a/readme.rst Tue Mar 17 13:27:23 2015 -0400 +++ b/readme.rst Tue Mar 17 13:33:43 2015 -0400 @@ -1,59 +1,52 @@ Galaxy workflow for the identification of candidate genes clusters ------------------------------------------------------------------ -This approach screens three proteins against a given genome sequence, leading to a genome position -were all three genes are located nearby. As usual in Galaxy workflows every +This approach screens two proteins against all nucleotide sequence from the +NCBI nt database within hours on our cluster, leading to all organisms with an inter- +esting gene structure for further investigation. As usual in Galaxy workflows every parameter, including the proximity distance, can be changed and additional steps can be easily added. For example additional filtering to refine the initial BLAST hits, or inclusion of a third query sequence. -.. image:: https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby/find_three_genes_located_nearby.png +.. image:: https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_genes_located_nearby/find_genes_located_nearby.png Sample Data =========== -As an example, we will use three protein sequences from *Pan troglodytes* (Chimpanzee) -which are part of the β-globin cluster. +As an example, we will use two protein sequences from *Streptomyces aurantiacus* +that are part of a gene cluster, responsible for metabolite producion. -You can upload all sequences directly into Galaxy using the "Upload tool" +You can upload both sequences directly into Galaxy using the "Upload File" tool with either of these URLs - Galaxy should recognise this is FASTA files. -Query sequences. -* `P61920.fasta <https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby/P61920.fasta>`_ -* `P61921.fasta <https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby/P61921.fasta>`_ -* `Q6LDH1.fasta <https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby/Q6LDH1.fasta>`_ +* `WP_037658548.fasta <https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_genes_located_nearby/WP_037658548.fasta>`_ +* `WP_037658557.fasta <https://raw.githubusercontent.com/bgruening/galaxytools/master/workflows/ncbi_blast_plus/find_genes_located_nearby/WP_037658557.fasta>`_ -Genome sequence: -* http://hgdownload.cse.ucsc.edu/goldenPath/rn6/bigZips/rn6.fa.gz +In addition you can find both sequences at the NCBI server: + * http://www.ncbi.nlm.nih.gov/protein/739806622 (cytochrome P450) + :: + + >gi|739806622|ref|WP_037658557.1| cytochrome P450 [Streptomyces aurantiacus] + MQRTCPFSVPPVYTKFREESPITQVVLPDGGKAWLVTKYDDVRAVMANPKLSSDRRAPDFPVVVPGQNAA + LAKHAPFMIILDGAEHAAARRPVISEFSVRRVAAMKPRIQEIVDGFIDDMLKMPKPVDLNQVFSLPVPSL + VVSEILGMPYEGHEYFMELAEILLRRTTDEQGRIAVSVELRKYMDKLVEEKIENPGDDLLSRQIELQRQQ + GGIDRPQLASLCLLVLLAGHETTANMINLGVFSMLTKPELLAEIKADPSKTPKAVDELLRFYTIPDFGAH + RLALDDVEIGGVLIRKGEAVIASTFAANRDPAVFDDPEELDFGRDARHHVAFGYGPHQCLGQNLGRLELQ + VVFDTLFRRLPELRLAVPEEELSFKSDALVYGLYELPVTW -In addition you can find the query sequences at the UniProt server: - * http://www.uniprot.org/uniprot/P61920 (Hemoglobin subunit gamma-1) - :: - - >sp|P61920|HBG1_PANTR Hemoglobin subunit gamma-1 OS=Pan troglodytes GN=HBG1 PE=1 SV=2 - MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK - VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG - KEFTPEVQASWQKMVTAVASALSSRYH - - - * http://www.uniprot.org/uniprot/P61921 (Hemoglobin subunit gamma-2) + * http://www.ncbi.nlm.nih.gov/protein/739806613 (beta-ACP synthase) :: - - >sp|P61921|HBG2_PANTR Hemoglobin subunit gamma-2 OS=Pan troglodytes GN=HBG2 PE=1 SV=2 - MGHFTEEDKATITSLWGKVNVEDAGGETLGRLLVVYPWTQRFFDSFGNLSSASAIMGNPK - VKAHGKKVLTSLGDAIKHLDDLKGTFAQLSELHCDKLHVDPENFKLLGNVLVTVLAIHFG - KEFTPEVQASWQKMVTGVASALSSRYH - - - * http://www.uniprot.org/uniprot/Q6LDH1 (Hemoglobin subunit epsilon) - :: - - >sp|Q6LDH1|HBE_PANTR Hemoglobin subunit epsilon OS=Pan troglodytes GN=HBE1 PE=2 SV=3 - MVHFTAEEKAAVTSLWSKMNVEEAGGEALGRLLVVYPWTQRFFDSFGNLSSPSAILGNPK - VKAHGKKVLTSFGDAIKNMDNLKPAFAKLSELHCDKLHVDPENFKLLGNVMVIILATHFG - KEFTPEVQAAWQKLVSAVAIALAHKYH + + >gi|739806613|ref|WP_037658548.1| beta-ACP synthase [Streptomyces aurantiacus] + MSGRRVVVTGMEVLAPGGVGTDNFWSLLSEGRTATRGITFFDPAQFRSRVAAEIDFDPYAHGLTPQEVRR + MDRAAQFAVVAARGAVADSGLDTDTLDPYRIGVTIGSAVGATMSLDEDYRVVSDAGRLDLVDHTYADPFF + YNYFVPSSFATEVARLVGAQGPSSVVSAGCTSGLDSVGYAVELIREGTADVMVAGATDAPISPITMACFD + AIKATTPRHDDPEHASRPFDDTRNGFVLGEGTAVFVLEELESARRRGARIYAEIAGYATRSNAYHMTGLR + PDGAEMAEAITVALDEARMNPTAIDYINAHGSGTKQNDRHETAAFKRSLGEHAYRTPVSSIKSMVGHSLG + AIGSIEIAASILAIQHDVVPPTANLHTPDPQCDLDYVPLNAREQIVDAVLTVGSGFGGFQSAMVLAQPER + NAA Citation @@ -75,11 +68,11 @@ This workflow is available on the main Galaxy Tool Shed: -http://toolshed.g2.bx.psu.edu/view/bgruening/find_three_genes_located_nearby_workflow +http://toolshed.g2.bx.psu.edu/view/bgruening/find_genes_located_nearby_workflow Development is being done on github: -https://github.com/bgruening/galaxytools/tree/master/workflows/ncbi_blast_plus/find_three_genes_located_nearby +https://github.com/bgruening/galaxytools/tree/master/workflows/ncbi_blast_plus/find_genes_located_nearby Dependencies