Mercurial > repos > bcclaywell > microbiome_pplacer_suite
diff usearch-wrapper.sh @ 0:d4690e65afcd draft
Uploaded
| author | bcclaywell |
|---|---|
| date | Thu, 26 Feb 2015 18:16:36 -0500 |
| parents | |
| children |
line wrap: on
line diff
#!/bin/bash
#
# usearch-wrapper.sh CONFIG
#
# Exports the species-level rows of the classification database to
# usearch_meta.csv (written to the current directory) and then runs
# `romp usearch_clusters` on the input sequences, that metadata file and the
# RDP reference sequences.
#
# Arguments:
#   $1 - shell file that is sourced after util.sh.
#
# Variables read (none of them is assigned in this script; presumably they are
# defined by the sourced CONFIG -- confirm against the caller):
#   CLASS_DB        SQLite database opened by sqlite3
#   INPUT_SEQS      1st positional argument handed to romp
#   USEARCH_HITS    5th positional argument handed to romp
#   USEARCH_GROUPS  6th positional argument handed to romp
#
# Exit status:
#   2 on a usage error, 1 when a prerequisite is missing or the sqlite3 export
#   fails, otherwise the exit status of romp.

# Print "<script name>: <message>" on stderr and abort with status 1.
usearch_wrapper_die() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
  exit 1
}

if [[ $# -lt 1 ]]; then
  printf 'Usage: %s CONFIG\n' "${0##*/}" >&2
  exit 2
fi

# util.sh is expected next to this script. The path is quoted so that an
# install directory containing whitespace still resolves.
util_sh="$(dirname -- "$0")/util.sh"
[[ -r "${util_sh}" ]] || usearch_wrapper_die "cannot read ${util_sh}"
source "${util_sh}"
source "$1"

# Fail early with a clear message: an empty value here would otherwise shift
# romp's positional arguments or make sqlite3 open an unintended database.
: "${CLASS_DB:?CLASS_DB is unset or empty after sourcing $1}"
: "${INPUT_SEQS:?INPUT_SEQS is unset or empty after sourcing $1}"
: "${USEARCH_HITS:?USEARCH_HITS is unset or empty after sourcing $1}"
: "${USEARCH_GROUPS:?USEARCH_GROUPS is unset or empty after sourcing $1}"

# RDP reference set: the FASTA file and its matching seq_info CSV live in the
# same directory.
rdp_dir="/shared/silo_researcher/Matsen_F/MatsenGrp/micro_refset/rdp/10_31/tax_filter/filtered"
RDP_SEQS="${rdp_dir}/rdp_10_31.filter.fasta"
RDP_SEQINFO="${rdp_dir}/rdp_10_31.filter.seq_info.csv"
readonly RDP_SEQS RDP_SEQINFO

# One CSV row (with a header line) per multiclass_concat row whose want_rank
# is 'species', joined with taxa and placement_names. The delimiter is quoted
# so the SQL is passed to sqlite3 literally. Abort on failure so romp never
# runs against a partial usearch_meta.csv.
sqlite3 -csv -header "${CLASS_DB}" <<'EOF' > usearch_meta.csv \
  || usearch_wrapper_die "sqlite3 export from ${CLASS_DB} failed"
SELECT pn.name, CAST(pn.mass AS INT) count, tax_id, tax_name, taxa.rank
  FROM multiclass_concat
       JOIN taxa USING (tax_id)
       JOIN placement_names pn USING (placement_id, name)
 WHERE want_rank = 'species';
EOF

# romp is the last command, so its exit status becomes the script's.
# The column names given to --query-group / --query-duplication match columns
# produced by the query above (tax_id, count).
romp -v usearch_clusters \
  --usearch-quietly \
  --query-group tax_id \
  --query-duplication count \
  --database-name seqname \
  --database-group tax_id \
  "${INPUT_SEQS}" \
  usearch_meta.csv \
  "${RDP_SEQS}" \
  "${RDP_SEQINFO}" \
  "${USEARCH_HITS}" \
  "${USEARCH_GROUPS}"
