Mercurial > repos > stevecassidy > textgrid
comparison query_textgrids.py @ 1:be28ced5c4e0 draft
planemo upload commit f36456464c692ed9d39a9cf654d09fe793113cce-dirty
| author | stevecassidy |
|---|---|
| date | Tue, 30 Aug 2016 20:54:17 -0400 |
| parents | e9c8e6204679 |
| children | |
comparison
equal
deleted
inserted
replaced
| 0:e9c8e6204679 | 1:be28ced5c4e0 |
|---|---|
| 1 from __future__ import print_function | 1 from __future__ import print_function |
| 2 import json | 2 import json |
| 3 import argparse | 3 import argparse |
| 4 import pyalveo | |
| 5 import sys | 4 import sys |
| 6 import os | 5 import os |
| 7 import tgt | 6 import tgt |
| 8 | 7 |
| 9 API_URL = 'https://app.alveo.edu.au' # TODO: export constants to a separate module | |
| 10 | 8 |
| 11 def parser(): | 9 def parser(): |
| 12 parser = argparse.ArgumentParser(description="Find matching segments in a TextGrid") | 10 parser = argparse.ArgumentParser(description="Find matching segments in a TextGrid") |
| 13 parser.add_argument('--textgrid', required=True, action="store", type=str, help="TextGrid files (comma separated)") | 11 parser.add_argument('--textgrid', required=True, action="store", type=str, help="TextGrid files (comma separated)") |
| 14 parser.add_argument('--identifier', required=True, action="store", type=str, help="Dataset identifiers (comma separated)") | 12 parser.add_argument('--identifier', required=True, action="store", type=str, help="Dataset identifiers (comma separated)") |
| 23 tgfiles = args.textgrid.split(',') | 21 tgfiles = args.textgrid.split(',') |
| 24 identifiers = args.identifier.split(',') | 22 identifiers = args.identifier.split(',') |
| 25 assert len(tgfiles) == len(identifiers), "number of textgrids must match number of identifiers" | 23 assert len(tgfiles) == len(identifiers), "number of textgrids must match number of identifiers" |
| 26 | 24 |
| 27 pairs = zip(tgfiles, identifiers) | 25 pairs = zip(tgfiles, identifiers) |
| 28 | 26 |
| 29 rows = [] | 27 rows = [] |
| 30 for tgfile, identifier in pairs: | 28 for tgfile, identifier in pairs: |
| 31 tg = tgt.read_textgrid(tgfile) | 29 tg = tgt.read_textgrid(tgfile) |
| 32 tier = tg.get_tier_by_name(args.tier) | 30 tier = tg.get_tier_by_name(args.tier) |
| 33 matches = tier.get_annotations_with_text(args.regex, regex=True) | 31 matches = tier.get_annotations_with_text(args.regex, regex=True) |
