view xenaGetDataset.py @ 40:fd24e220f240

more edit on description
author jingchunzhu <jingchunzhu@gmail.com>
date Mon, 27 Jul 2015 00:59:02 -0700
parents 8bb037f88ed2
children 02b0824c7d60
line wrap: on
line source

#!/usr/bin/env python

import argparse
import contextlib
import re
import shutil
import urllib2


def _download(url, path):
    """Stream the resource at *url* into the local file *path*.

    The response is copied in chunks rather than read into memory at once,
    and the connection is closed even if writing the file fails.  Errors
    raised by ``urllib2.urlopen`` or by file I/O propagate to the caller.
    """
    # Open the URL before the output file so that a failed request does not
    # create or truncate the destination.
    with contextlib.closing(urllib2.urlopen(url)) as response:
        # Binary mode: store the bytes exactly as received, with no newline
        # translation on platforms that distinguish text and binary files.
        with open(path, "wb") as out:
            shutil.copyfileobj(response, out)


def main():
    """Download a dataset and its ``.json`` metadata from a data hub.

    Command-line arguments (all positional):
        dataHub       hub URL; every "/proj/" in it is replaced by
                      "/download/" to form the download base URL
        datasetId     slash-separated dataset id; its first component is
                      dropped and the remainder appended to the base URL
        metadatafile  local path that receives ``<dataset URL>.json``
        datafile      local path that receives the dataset itself

    The resolved dataset URL is printed to stdout before downloading.
    """
    parser = argparse.ArgumentParser(
        description="Download a dataset and its .json metadata from a data hub."
    )
    parser.add_argument("dataHub", type=str)
    parser.add_argument("datasetId", type=str)
    parser.add_argument("metadatafile", type=str)
    parser.add_argument("datafile", type=str)
    args = parser.parse_args()

    datasetUrlHost = args.dataHub.replace("/proj/", "/download/")
    # NOTE(review): the first component of datasetId is discarded --
    # presumably it names the hub/cohort already present in dataHub; confirm.
    datasetIdTokens = args.datasetId.split("/")
    datasetUrl = datasetUrlHost + "/" + "/".join(datasetIdTokens[1:])
    # Parenthesised single-argument form prints identically under Python 2.
    print(datasetUrl)

    # Metadata first, then data -- same order as before.
    _download(datasetUrl + ".json", args.metadatafile)
    _download(datasetUrl, args.datafile)


# Run the download only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == "__main__":
    main()