# HG changeset patch # User rijst # Date 1355311957 18000 # Node ID f7c80c646b96c7f319e582a9e35fc4db0d216f25 # Parent 493433860c0840a9434cd27a6d4cabcd3e5674b8 Uploaded diff -r 493433860c08 -r f7c80c646b96 snpsplit.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/snpsplit.xml Wed Dec 12 06:32:37 2012 -0500 @@ -0,0 +1,33 @@ + + splits multicharacter entries into separate lines + snpsplit.py $input $output + + + + + + + + +Input: tab delimited, format Position Ref Mut +Position is 1-based genomic coordinate +Ref is the reference sequence +Mut is the mutant sequence + +Ref en Mut sequences consisting of more than one character will be split up into separate lines. Example: +Input: +123 CGT ATG +Output: +123 C A +124 G T +125 T G + +Bases that are the same in both columns, will be skipped. Example: +Input: +123 CGT AGG +Output: +123 C A +125 T G + + +