Mercurial > repos > peterjc > seq_composition
changeset 13:12b964a0185e draft
planemo upload for repository https://github.com/peterjc/pico_galaxy/tree/master/tools/seq_composition commit d67596914a7bbe183851437eaafe8c7305877e5a-dirty
author | peterjc |
---|---|
date | Fri, 22 Feb 2019 10:22:20 -0500 |
parents | 9c962cfc5b7e |
children | 5a0b3c87021a |
files | tools/seq_composition/seq_composition.py tools/seq_composition/tool_dependencies.xml |
diffstat | 2 files changed, 55 insertions(+), 22 deletions(-) [+] |
line wrap: on
line diff
--- a/tools/seq_composition/seq_composition.py Fri Nov 09 11:05:30 2018 -0500 +++ b/tools/seq_composition/seq_composition.py Fri Feb 22 10:22:20 2019 -0500 @@ -33,19 +33,49 @@ # TODO - GenBank / EMBL input? Needs the datatype defined... # TODO - Handle all the FASTQ datatype subclasses in the XML cheetah code? parser = OptionParser(usage=usage) -parser.add_option('-f', '--fasta', dest='fasta', action="append", default=[], - help='Input sequence filename in FASTA format') -parser.add_option('-q', '--fastq', '--fastqsanger', '--fastqillumina', '--fastqsolexa', - dest='fastq', action="append", default=[], - help='Input sequence filename in FASTQ format') -parser.add_option('-s', '--sff', dest='sff', action="append", default=[], - help='Input sequence filename in SFF format') -parser.add_option('-o', '--output', dest='output', - default=None, help='Output filename (tabular)', - metavar="FILE") -parser.add_option("-v", "--version", dest="version", - default=False, action="store_true", - help="Show version and quit") +parser.add_option( + "-f", + "--fasta", + dest="fasta", + action="append", + default=[], + help="Input sequence filename in FASTA format", +) +parser.add_option( + "-q", + "--fastq", + "--fastqsanger", + "--fastqillumina", + "--fastqsolexa", + dest="fastq", + action="append", + default=[], + help="Input sequence filename in FASTQ format", +) +parser.add_option( + "-s", + "--sff", + dest="sff", + action="append", + default=[], + help="Input sequence filename in SFF format", +) +parser.add_option( + "-o", + "--output", + dest="output", + default=None, + help="Output filename (tabular)", + metavar="FILE", +) +parser.add_option( + "-v", + "--version", + dest="version", + default=False, + action="store_true", + help="Show version and quit", +) options, args = parser.parse_args() if options.version: @@ -62,10 +92,11 @@ seq_count = 0 counts = dict() -for format, filenames in [("fasta", options.fasta), - ("fastq", options.fastq), - ("sff-trim", options.sff), - ]: +for format, filenames in [ + ("fasta", options.fasta), + ("fastq", options.fastq), + ("sff-trim", options.sff), +]: for filename in filenames: file_count += 1 for record in SeqIO.parse(filename, format): @@ -77,8 +108,10 @@ counts[letter] = 1 total = sum(counts.values()) -sys.stderr.write("Counted %i sequence letters from %i records from %i files\n" % - (total, seq_count, file_count)) +sys.stderr.write( + "Counted %i sequence letters from %i records from %i files\n" + % (total, seq_count, file_count) +) scale = 100.0 / total with open(options.output, "w") as handle:
--- a/tools/seq_composition/tool_dependencies.xml Fri Nov 09 11:05:30 2018 -0500 +++ b/tools/seq_composition/tool_dependencies.xml Fri Feb 22 10:22:20 2019 -0500 @@ -1,6 +1,6 @@ -<?xml version="1.0"?> +<?xml version="1.0" ?> <tool_dependency> <package name="biopython" version="1.67"> - <repository changeset_revision="fc45a61abc2f" name="package_biopython_1_67" owner="biopython" toolshed="https://testtoolshed.g2.bx.psu.edu" /> + <repository changeset_revision="fc45a61abc2f" name="package_biopython_1_67" owner="biopython" toolshed="https://testtoolshed.g2.bx.psu.edu"/> </package> -</tool_dependency> +</tool_dependency> \ No newline at end of file