# HG changeset patch # User artbio # Date 1562680312 14400 # Node ID 122dbfdf082608361dbc49a42bf5ac7419423b9f planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/concat_multi_datasets commit 75811bd85c9d175d9bc7b2c4fd723adc3a361f0f diff -r 000000000000 -r 122dbfdf0826 catWrapper.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/catWrapper.xml Tue Jul 09 09:51:52 2019 -0400 @@ -0,0 +1,675 @@ + + tail-to-head by specifying how + > '$out_file1' && + #else: + $concat_command '$file' >> '$out_file1' && + #end if + #else: + $concat_command '$file' >> '$out_file1' && + #end if + printf "Done\n" && + #end for + sleep 1 + #else: + #for $file in $global_condition.inputs + printf "${file.element_identifier}..." && + #if $file.ext[-2:] == "gz" and $headers != 0: + printf "# ${file.element_identifier}\n" | gzip -c >> '$out_file1' && + gzip -dc "$file" | $concat_command |gzip -c >> '$out_file1' && + #else: + printf "# ${file.element_identifier}\n" >> '$out_file1' && + $concat_command "$file" >> '$out_file1' && + #end if + printf "Done\n" && + #end for + sleep 1 + #end if + #else if $global_condition.input_type == "simple_collections": + mkdir concatenated && + #if $dataset_names == "No": + #for $x, $y in zip($global_condition.input_1, $global_condition.input_2): + printf "${x.element_identifier} and ${y.element_identifier}..." && + #if $x.ext[-2:] == "gz" and $headers != 0: + gzip -dc '$x' | $concat_command | gzip -c > concatenated/'${x.element_identifier}.listed.${x.ext}.listed' && + gzip -dc '$y' | $concat_command | gzip -c >> concatenated/'${x.element_identifier}.listed.${x.ext}.listed' && + #else: + $concat_command '$x' '$y' > concatenated/'${x.element_identifier}.listed.${x.ext}.listed' && + #end if + printf "Done\n" && + #end for + sleep 1 + #else: + #for $x, $y in zip($global_condition.input_1, $global_condition.input_2) + printf "${x.element_identifier} and ${y.element_identifier}..." && + #if $x.ext[-2:] == "gz" and $headers != 0: + printf "# ${x.element_identifier}\n" | gzip -c > concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + gzip -dc '$x' | $concat_command | gzip -c >> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + printf "# ${y.element_identifier}\n" | gzip -c >> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + gzip -dc '$y' | $concat_command | gzip -c >> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + #else: + printf "# ${x.element_identifier}\n" > concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + $concat_command '$x'>> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + printf "# ${y.element_identifier}\n" >> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + $concat_command '$y' >> concatenated/'${x.element_identifier}_${y.element_identifier}.listed.${x.ext}.listed' && + #end if + printf "Done\n" && + #end for + sleep 1 + #end if + #else if $global_condition.input_type == "paired_collection": + #if $global_condition.paired_cat_type == "by_strand": + mkdir concatenated && + #if $dataset_names == "No": + #for $file in $global_condition.inputs + printf "${file.element_identifier}- forward and reverse..." && + #if $file['forward'].ext[-2:] == "gz" and $headers != 0: + gzip -dc $file['forward'] | $concat_command | gzip -c >> concatenated/forward.listed.${file['forward'].ext}.listed && + gzip -dc $file['reverse'] | $concat_command | gzip -c >> concatenated/reverse.listed.${file['reverse'].ext}.listed && + #else: + $concat_command $file['forward'] >> concatenated/forward.listed.${file['forward'].ext}.listed && + $concat_command $file['reverse'] >> concatenated/reverse.listed.${file['reverse'].ext}.listed && + #end if + printf "Done\n" && + #end for + sleep 1 + #else: + #for $file in $global_condition.inputs.keys(): + printf "$file - forward and reverse..." && + #if $global_condition.inputs[$file]['forward'].ext[-2:] == "gz" and $headers != 0: + printf "# ${file}_forward\n" | gzip -c >> concatenated/forward.listed.${global_condition.inputs[$file]['forward'].ext}.listed && + gzip -dc $global_condition.inputs[$file]['forward'] | $concat_command | gzip -c >> concatenated/forward.listed.${global_condition.inputs[$file]['forward'].ext}.listed && + printf "# ${file}_reverse\n" | gzip -c >> concatenated/reverse.listed.${global_condition.inputs[$file]['reverse'].ext}.listed && + gzip -dc $global_condition.inputs[$file]['reverse'] | $concat_command | gzip -c >> concatenated/reverse.listed.${global_condition.inputs[$file]['reverse'].ext}.listed && + #else: + printf "# ${file}_forward\n" >> concatenated/forward.listed.${global_condition.inputs[$file]['forward'].ext}.listed && + $concat_command $global_condition.inputs[$file]['forward'] >> concatenated/forward.listed.${global_condition.inputs[$file]['forward'].ext}.listed && + printf "# ${file}_reverse\n" >> concatenated/reverse.listed.${global_condition.inputs[$file]['reverse'].ext}.listed && + $concat_command $global_condition.inputs[$file]['reverse'] >> concatenated/reverse.listed.${global_condition.inputs[$file]['reverse'].ext}.listed && + #end if + printf "Done\n" && + #end for + sleep 1 + #end if + #else if $global_condition.paired_cat_type == "by_pair": + mkdir concatenated && + #if $dataset_names == "No": + #for $file in $global_condition.inputs.keys(): + printf "$file - forward and reverse..." && + #if $global_condition.inputs[$file]['forward'].ext[-2:] == "gz" and $headers != 0: + gzip -dc $global_condition.inputs[$file]['forward'] | $concat_command | gzip -c + > concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + gzip -dc $global_condition.inputs[$file]['reverse'] | $concat_command | gzip -c + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + #else: + $concat_command $global_condition.inputs[$file]['forward'] + > concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + $concat_command $global_condition.inputs[$file]['reverse'] + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + #end if + printf "Done\n" && + #end for + sleep 1 + #else: + #for $file in $global_condition.inputs.keys(): + printf "$file - forward and reverse..." && + #if $global_condition.inputs[$file]['reverse'].ext[-2:] == "gz" and $headers != 0: + printf "# ${file}_forward\n" | gzip -c > concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + gzip -dc $global_condition.inputs[$file]['forward'] | $concat_command | gzip -c + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + printf "# ${file}_reverse\n" | gzip -c >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + gzip -dc $global_condition.inputs[$file]['reverse'] | $concat_command | gzip -c + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + #else: + printf "# ${file}_forward\n" > concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + $concat_command $global_condition.inputs[$file]['forward'] + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + printf "# ${file}_reverse\n" >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + $concat_command $global_condition.inputs[$file]['reverse'] + >> concatenated/'${file}.listed.${global_condition.inputs[$file]['reverse'].ext}.listed' && + #end if + printf "Done\n" && + #end for + sleep 1 + #end if + #else if $global_condition.paired_cat_type == "all": + mkdir concatenated && + #set $base_name=$global_condition.inputs.element_identifier + #set $extention=$global_condition.inputs[$global_condition.inputs.keys()[0]]['forward'].ext + #if $dataset_names == "No": + #for $file in $global_condition.inputs.keys(): + printf "$file - forward and reverse..." && + #if $global_condition.inputs[$file]['forward'].ext[-2:] == "gz" and $headers != 0: + gzip -dc $global_condition.inputs[$file]['forward'] | $concat_command | gzip -c >> c'$paired_out_file' && + gzip -dc $global_condition.inputs[$file]['reverse'] | $concat_command | gzip -c >> '$paired_out_file' && + #else: + $concat_command + $global_condition.inputs[$file]['forward'] + >> '$paired_out_file' && + $concat_command + $global_condition.inputs[$file]['reverse'] + >> '$paired_out_file' && + #end if + printf "Done\n" && + #end for + sleep 1 + #else: + #for $file in $global_condition.inputs.keys(): + printf "$file - forward and reverse..." && + #if $global_condition.inputs[$file]['forward'].ext[-2:] == "gz" and $headers != 0: + printf "# ${file}_forward\n" | gzip -c > '$paired_out_file' && + gzip -dc $global_condition.inputs[$file]['forward'] | $concat_command | gzip -c >> '$paired_out_file' && + printf "# ${file}_reverse\n" | gzip -c >> '$paired_out_file' && + gzip -dc $global_condition.inputs[$file]['reverse'] | $concat_command | gzip -c >> '$paired_out_file' && + #else: + printf "# ${file}_forward\n" > '$paired_out_file' && + $concat_command + $global_condition.inputs[$file]['forward'] + >> '$paired_out_file' && + printf "# ${file}_reverse\n" >> '$paired_out_file' && + $concat_command + $global_condition.inputs[$file]['reverse'] + >> '$paired_out_file' && + #end if + printf "Done\n" && + #end for + sleep 1 + #end if + #end if + #else if $global_condition.input_type == "nested_collection": + mkdir concatenated && + #if $dataset_names == "No": + #for $sub_list in $global_condition.inputs: + #set $file_base_name=$sub_list.element_identifier + #for $sub_list_element in $sub_list: + printf "${file_base_name} - ${sub_list_element.element_identifier}..." && + #if $sub_list_element.ext[-2:] == "gz" and $headers != 0: + gzip -dc ${sub_list_element} | $concat_command | gzip -c >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + #else: + $concat_command ${sub_list_element} >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + #end if + printf "Done\n" && + #end for + #end for + sleep 1 + #else: + #for $sub_list in $global_condition.inputs: + #set $file_base_name=$sub_list.element_identifier + #for $sub_list_element in $sub_list: + printf "${file_base_name} - ${sub_list_element.element_identifier}..." && + #if $sub_list_element.ext[-2:] == "gz" and $headers != 0: + printf "# ${sub_list_element.element_identifier}\n" | gzip -c >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + gzip -dc ${sub_list_element} | $concat_command | gzip -c >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + #else: + printf "# ${sub_list_element.element_identifier}\n" >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + $concat_command ${sub_list_element} >> concatenated/'${file_base_name}.listed.${sub_list_element.ext}.listed' && + #end if + printf "Done\n" && + #end for + #end for + sleep 1 + #end if + #end if + ]]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + global_condition['input_type'] == 'singles' + + + global_condition['input_type'] == 'paired_collection' and global_condition['paired_cat_type'] == 'all' + + + + global_condition['input_type'] == 'paired_collection' and global_condition['paired_cat_type'] == 'by_strand' + + + + (global_condition['input_type'] == 'paired_collection' and global_condition['paired_cat_type'] == 'by_pair') or (global_condition['input_type'] == 'simple_collections') or (global_condition['input_type'] == 'nested_collection') + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +.. class:: warningmark + +**WARNINGS:** + +- This tool does not check if the datasets being concatenated are in the same format. +- When concatenating 2 collections make sure the first collection is the one with the most items. +- This tool can't handle nested collection deeper than list:list. + +----- + +**What it does** + +Concatenates datasets and paired collections with multiple options: + + - When the input is a paired collection: + + - concatenation by strand : forward and reverse datasets are concatenated separately and a list with a single forward - reverse dataset pair is returned + + - concatenation by pair : forward - reverse dataset pairs are concatenated and a simple dataset collection is returned + + - whole collection concatenation : all datasets in the collection are concatenated and a single dataset is returned + + - When the inputs are 2 collections: datasets are concatenated in a pairwise combination and a single dataset collection is returned + + - When nested collection concatenation: datasets in each sub-collection are concatenated and a simple dataset collection is returned + + - Skipping lines before concatenation to avoid headers + + - Add the name of the concatenated files as separator + +----- + +**Single datasets concatenation example** + +Concatenating Dataset:: + + chrX 151087187 151087355 A 0 - + chrX 151572400 151572481 B 0 + + +with Dataset1:: + + chr1 151242630 151242955 X 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + +and with Dataset2:: + + chr2 100000030 200000955 P 0 + + chr2 100000015 200000999 Q 0 + + +will result in the following:: + + chrX 151087187 151087355 A 0 - + chrX 151572400 151572481 B 0 + + chr1 151242630 151242955 X 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + chr2 100000030 200000955 P 0 + + chr2 100000015 200000999 Q 0 + + +----- + +**2 Collections concatenation** + +1rst collection:: + + a + b + c + d + +2nd collection:: + + 1 + 2 + 3 + 4 + +Concatenation result:: + + A single collection containing: + + a concatenated with 1 + b concatenated with 2 + c concatenated with 3 + d concatenated with 4 + +----- + +**Paired collection concatenation example** + +1rst pair:: + + forward - reverse + +2nd pair:: + + forward - reverse + +- Concatenation by strand:: + + concatenates: + + 1rst forward + 2nd forward + 1rst reverse + 2nd reverse + + outputs: + + 1 pair + +- Concatenation by pair:: + + concatenates: + + 1rst forward + 1rst reverse + 2nd forward + 2nd reverse + + outputs: + + 2 datasets + +- Concatenate all:: + + concatenates: + + 1rst forward + 1rst reverse + 2nd forward + 2nd reverse + + outputs: + + 1 dataset + +----- + +**Nested collection concatenation example** + +Nested collection: + + - Experiment + + - Sample_1 + + - Sample_1_file_1 + - Sample_1_file_2 + + - Sample_2 + + - Sample_2_file_1 + - Sample_2_file_2 + - Sample_2_file_3 + +Concatenation result:: + + A single collection containing: + + - Sample_1: (Sample_1_file_1 + Sample_1_file_2) + - Sample_2: (Sample_2_file_1 + Sample_2_file_2 + Sample_2_file_3) + +----- + +**When selecting "Include dataset names" when concatenating files**: + +1rst file name="first_tabular":: + + chrX 151087187 151087355 A 0 - + chrX 151572400 151572481 B 0 + + +2nd file name="second_tabular":: + + chr1 151242630 151242955 X 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + +output:: + + # first_tabular + chrX 151087187 151087355 A 0 - + chrX 151572400 151572481 B 0 + + # second_tabular + chr1 151242630 151242955 X 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + +----- + +**Skiping lines** + +1rst file:: + + chrX 151087187 151087355 A 0 - + chrX 151572400 151572481 B 0 + + +2nd file:: + + chr1 151242630 151242955 X 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + +skipping 1 line + +output:: + + chrX 151572400 151572481 B 0 + + chr1 151271715 151271999 Y 0 + + chr1 151278832 151279227 Z 0 - + +----- + +Adapted from galaxy's catWrapper.xml to allow multiple input files. + + + diff -r 000000000000 -r 122dbfdf0826 test-data/1.bed --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/1.bed Tue Jul 09 09:51:52 2019 -0400 @@ -0,0 +1,65 @@ +chr1 147962192 147962580 CCDS989.1_cds_0_0_chr1_147962193_r 0 - +chr1 147984545 147984630 CCDS990.1_cds_0_0_chr1_147984546_f 0 + +chr1 148078400 148078582 CCDS993.1_cds_0_0_chr1_148078401_r 0 - +chr1 148185136 148185276 CCDS996.1_cds_0_0_chr1_148185137_f 0 + +chr10 55251623 55253124 CCDS7248.1_cds_0_0_chr10_55251624_r 0 - +chr11 116124407 116124501 CCDS8374.1_cds_0_0_chr11_116124408_r 0 - +chr11 116206508 116206563 CCDS8377.1_cds_0_0_chr11_116206509_f 0 + +chr11 116211733 116212337 CCDS8378.1_cds_0_0_chr11_116211734_r 0 - +chr11 1812377 1812407 CCDS7726.1_cds_0_0_chr11_1812378_f 0 + +chr12 38440094 38440321 CCDS8736.1_cds_0_0_chr12_38440095_r 0 - +chr13 112381694 112381953 CCDS9526.1_cds_0_0_chr13_112381695_f 0 + +chr14 98710240 98712285 CCDS9949.1_cds_0_0_chr14_98710241_r 0 - +chr15 41486872 41487060 CCDS10096.1_cds_0_0_chr15_41486873_r 0 - +chr15 41673708 41673857 CCDS10097.1_cds_0_0_chr15_41673709_f 0 + +chr15 41679161 41679250 CCDS10098.1_cds_0_0_chr15_41679162_r 0 - +chr15 41826029 41826196 CCDS10101.1_cds_0_0_chr15_41826030_f 0 + +chr16 142908 143003 CCDS10397.1_cds_0_0_chr16_142909_f 0 + +chr16 179963 180135 CCDS10401.1_cds_0_0_chr16_179964_r 0 - +chr16 244413 244681 CCDS10402.1_cds_0_0_chr16_244414_f 0 + +chr16 259268 259383 CCDS10403.1_cds_0_0_chr16_259269_r 0 - +chr18 23786114 23786321 CCDS11891.1_cds_0_0_chr18_23786115_r 0 - +chr18 59406881 59407046 CCDS11985.1_cds_0_0_chr18_59406882_f 0 + +chr18 59455932 59456337 CCDS11986.1_cds_0_0_chr18_59455933_r 0 - +chr18 59600586 59600754 CCDS11988.1_cds_0_0_chr18_59600587_f 0 + +chr19 59068595 59069564 CCDS12866.1_cds_0_0_chr19_59068596_f 0 + +chr19 59236026 59236146 CCDS12872.1_cds_0_0_chr19_59236027_r 0 - +chr19 59297998 59298008 CCDS12877.1_cds_0_0_chr19_59297999_f 0 + +chr19 59302168 59302288 CCDS12878.1_cds_0_0_chr19_59302169_r 0 - +chr2 118288583 118288668 CCDS2120.1_cds_0_0_chr2_118288584_f 0 + +chr2 118394148 118394202 CCDS2121.1_cds_0_0_chr2_118394149_r 0 - +chr2 220190202 220190242 CCDS2441.1_cds_0_0_chr2_220190203_f 0 + +chr2 220229609 220230869 CCDS2443.1_cds_0_0_chr2_220229610_r 0 - +chr20 33330413 33330423 CCDS13249.1_cds_0_0_chr20_33330414_r 0 - +chr20 33513606 33513792 CCDS13255.1_cds_0_0_chr20_33513607_f 0 + +chr20 33579500 33579527 CCDS13256.1_cds_0_0_chr20_33579501_r 0 - +chr20 33593260 33593348 CCDS13257.1_cds_0_0_chr20_33593261_f 0 + +chr21 32707032 32707192 CCDS13614.1_cds_0_0_chr21_32707033_f 0 + +chr21 32869641 32870022 CCDS13615.1_cds_0_0_chr21_32869642_r 0 - +chr21 33321040 33322012 CCDS13620.1_cds_0_0_chr21_33321041_f 0 + +chr21 33744994 33745040 CCDS13625.1_cds_0_0_chr21_33744995_r 0 - +chr22 30120223 30120265 CCDS13897.1_cds_0_0_chr22_30120224_f 0 + +chr22 30160419 30160661 CCDS13898.1_cds_0_0_chr22_30160420_r 0 - +chr22 30665273 30665360 CCDS13901.1_cds_0_0_chr22_30665274_f 0 + +chr22 30939054 30939266 CCDS13903.1_cds_0_0_chr22_30939055_r 0 - +chr5 131424298 131424460 CCDS4149.1_cds_0_0_chr5_131424299_f 0 + +chr5 131556601 131556672 CCDS4151.1_cds_0_0_chr5_131556602_r 0 - +chr5 131621326 131621419 CCDS4152.1_cds_0_0_chr5_131621327_f 0 + +chr5 131847541 131847666 CCDS4155.1_cds_0_0_chr5_131847542_r 0 - +chr6 108299600 108299744 CCDS5061.1_cds_0_0_chr6_108299601_r 0 - +chr6 108594662 108594687 CCDS5063.1_cds_0_0_chr6_108594663_f 0 + +chr6 108640045 108640151 CCDS5064.1_cds_0_0_chr6_108640046_r 0 - +chr6 108722976 108723115 CCDS5067.1_cds_0_0_chr6_108722977_f 0 + +chr7 113660517 113660685 CCDS5760.1_cds_0_0_chr7_113660518_f 0 + +chr7 116512159 116512389 CCDS5771.1_cds_0_0_chr7_116512160_r 0 - +chr7 116714099 116714152 CCDS5773.1_cds_0_0_chr7_116714100_f 0 + +chr7 116945541 116945787 CCDS5774.1_cds_0_0_chr7_116945542_r 0 - +chr8 118881131 118881317 CCDS6324.1_cds_0_0_chr8_118881132_r 0 - +chr9 128764156 128764189 CCDS6914.1_cds_0_0_chr9_128764157_f 0 + +chr9 128787519 128789136 CCDS6915.1_cds_0_0_chr9_128787520_r 0 - +chr9 128882427 128882523 CCDS6917.1_cds_0_0_chr9_128882428_f 0 + +chr9 128937229 128937445 CCDS6919.1_cds_0_0_chr9_128937230_r 0 - +chrX 122745047 122745924 CCDS14606.1_cds_0_0_chrX_122745048_f 0 + +chrX 152648964 152649196 CCDS14733.1_cds_0_0_chrX_152648965_r 0 - +chrX 152691446 152691471 CCDS14735.1_cds_0_0_chrX_152691447_f 0 + +chrX 152694029 152694263 CCDS14736.1_cds_0_0_chrX_152694030_r 0 - diff -r 000000000000 -r 122dbfdf0826 test-data/1.fastq.gz Binary file test-data/1.fastq.gz has changed diff -r 000000000000 -r 122dbfdf0826 test-data/1_f.fastq --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/1_f.fastq Tue Jul 09 09:51:52 2019 -0400 @@ -0,0 +1,12 @@ +@NS500801:189:HWGFJBGX5:1:11101:18757:1118 1:N:0:GCCAAT +CACCGTTACATCACACCAACCAAGATTACATCACACCACTCAGGATGACAGACAGTAATCCTGTTTGTTATATANG ++ +AAAAAEEEEEEEEEEEEAEEEEEEEEEAEEEEEEEEEEEEEEEEEEEEAEEEEEEEEEEEEEEE