annotate preprocessing-wrapper.sh @ 0:d4690e65afcd draft

Uploaded
author bcclaywell
date Thu, 26 Feb 2015 18:16:36 -0500
parents
children 221a97bf686d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d4690e65afcd Uploaded
bcclaywell
parents:
diff changeset
#!/bin/bash
#
# Preprocessing wrapper: deduplicates the input sequences, aligns the
# deduplicated sequences with cmalign against the reference package's
# profile, merges that alignment with the reference alignment, and writes
# the merged result as FASTA.
#
# Usage: preprocessing-wrapper.sh CONFIG
#
# CONFIG is a shell fragment that is sourced and is expected to define:
#   SPLIT_MAP       passed to deduplicate_sequences.py --split-map
#   DEDUP_INFO      passed to --deduplicated-sequences-file
#   INPUT_SEQS      sequences handed to deduplicate_sequences.py
#   DEDUP_SEQS      deduplicated sequences (written by the dedup step,
#                   then read by cmalign)
#   REFPKG          reference package queried with `taxit rp`
#   ALIGNED_SCORES  path given to cmalign --sfile
#   ALIGNED_SEQS    final output path given to seqmagick
# Optional environment:
#   GALAXY_SLOTS    value for cmalign --cpu (defaults to 4)

die() {
  printf '%s\n' "$*" >&2
  exit 1
}

[[ $# -ge 1 ]] || die "usage: ${0##*/} CONFIG"
[[ -r "$1" ]] || die "cannot read config file: $1"

# shellcheck disable=SC1090 -- the config path is only known at run time
source "$1"

# Strict mode is enabled only after sourcing so that the config fragment is
# evaluated exactly as before; from here on any failing step aborts the run
# instead of letting later steps consume missing or partial files.
set -eo pipefail

# Fail early, with a clear message, if the config left anything out.
: "${SPLIT_MAP:?SPLIT_MAP must be set by the config file}"
: "${DEDUP_INFO:?DEDUP_INFO must be set by the config file}"
: "${INPUT_SEQS:?INPUT_SEQS must be set by the config file}"
: "${DEDUP_SEQS:?DEDUP_SEQS must be set by the config file}"
: "${REFPKG:?REFPKG must be set by the config file}"
: "${ALIGNED_SCORES:?ALIGNED_SCORES must be set by the config file}"
: "${ALIGNED_SEQS:?ALIGNED_SEQS must be set by the config file}"

deduplicate_sequences.py \
  --split-map "${SPLIT_MAP}" \
  --deduplicated-sequences-file "${DEDUP_INFO}" \
  "${INPUT_SEQS}" \
  "${DEDUP_SEQS}"

# adapted from yapp/bin/refpkg_align
ref_sto=$(taxit rp "${REFPKG}" aln_sto)
profile=$(taxit rp "${REFPKG}" profile)

# Keep the intermediate Stockholm alignment in a private temporary directory
# (rather than a name from `mktemp -u`, which creates nothing and can be
# raced), and remove it on every exit path.
tmpdir=$(mktemp -d) || die "mktemp failed"
trap 'rm -rf -- "${tmpdir}"' EXIT
sto="${tmpdir}/aligned.sto"

# Only the '#'-prefixed lines of cmalign's stdout are passed through.
# grep exits 1 when nothing matches; that is not an error here, so only
# other grep failures (status >= 2) are allowed to fail the pipeline.
cmalign --cpu "${GALAXY_SLOTS:-4}" -o "${sto}" --sfile "${ALIGNED_SCORES}" \
  --noprob --dnaout "${profile}" "${DEDUP_SEQS}" \
  | { grep -E '^#' || [[ $? -eq 1 ]]; }

# Merge the reference alignment with the new alignment and convert the
# aligned-FASTA stream read from stdin ('-') into the final output file.
esl-alimerge --dna --outformat afa "${ref_sto}" "${sto}" \
  | seqmagick convert --output-format fasta --dash-gap - "${ALIGNED_SEQS}"