Mercurial > repos > devteam > t_test_two_samples
diff t_test_two_samples.pl @ 0:3d24b35de20a draft
Uploaded
author | devteam |
---|---|
date | Wed, 21 Aug 2013 10:58:59 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/t_test_two_samples.pl Wed Aug 21 10:58:59 2013 -0400 @@ -0,0 +1,109 @@ +# A program to implement the non-pooled t-test for two samples where the alternative hypothesis is two-sided or one-sided. +# The first input file is a TABULAR format file representing the first sample and consisting of one column only. +# The second input file is a TABULAR format file representing the first sample nd consisting of one column only. +# The third input is the sidedness of the t-test: either two-sided or, one-sided with m1 less than m2 or, +# one-sided with m1 greater than m2. +# The fourth input is the equality status of the standard deviations of both populations +# The output file is a TXT file representing the result of the two sample t-test. + +use strict; +use warnings; + +#variable to handle the motif information +my $motif; +my $motifName = ""; +my $motifNumber = 0; +my $totalMotifsNumber = 0; +my @motifNamesArray = (); + +# check to make sure having correct files +my $usage = "usage: non_pooled_t_test_two_samples_galaxy.pl [TABULAR.in] [TABULAR.in] [testSidedness] [standardDeviationEquality] [TXT.out] \n"; +die $usage unless @ARGV == 5; + +#get the input arguments +my $firstSampleInputFile = $ARGV[0]; +my $secondSampleInputFile = $ARGV[1]; +my $testSidedness = $ARGV[2]; +my $standardDeviationEquality = $ARGV[3]; +my $outputFile = $ARGV[4]; + +#open the input files +open (INPUT1, "<", $firstSampleInputFile) || die("Could not open file $firstSampleInputFile \n"); +open (INPUT2, "<", $secondSampleInputFile) || die("Could not open file $secondSampleInputFile \n"); +open (OUTPUT, ">", $outputFile) || die("Could not open file $outputFile \n"); + + +#variables to store the name of the R script file +my $r_script; + +# R script to implement the two-sample test on the motif frequencies in upstream flanking region +#construct an R script file and save it in the same directory where the perl file is located +$r_script = "non_pooled_t_test_two_samples.r"; + +open(Rcmd,">", $r_script) or die "Cannot open $r_script \n\n"; +print Rcmd " + sampleTable1 <- read.table(\"$firstSampleInputFile\", header=FALSE); + sample1 <- sampleTable1[, 1]; + + sampleTable2 <- read.table(\"$secondSampleInputFile\", header=FALSE); + sample2 <- sampleTable2[, 1]; + + testSideStatus <- \"$testSidedness\"; + STEqualityStatus <- \"$standardDeviationEquality\"; + + #open the output a text file + sink(file = \"$outputFile\"); + + #check if the t-test is two-sided + if (testSideStatus == \"two-sided\"){ + + #check if the standard deviations are equal in both populations + if (STEqualityStatus == \"equal\"){ + #two-sample t-test where standard deviations are assumed to be unequal, the test is two-sided + testResult <- t.test(sample1, sample2, var.equal = TRUE); + } else{ + #two-sample t-test where standard deviations are assumed to be unequal, the test is two-sided + testResult <- t.test(sample1, sample2, var.equal = FALSE); + } + } else{ #the t-test is one sided + + #check if the t-test is two-sided with m1 < m2 + if (testSideStatus == \"one-sided:_m1_less_than_m2\"){ + + #check if the standard deviations are equal in both populations + if (STEqualityStatus == \"equal\"){ + #two-sample t-test where standard deviations are assumed to be unequal, the test is one-sided: Halt: m1 < m2 + testResult <- t.test(sample1, sample2, var.equal = TRUE, alternative = \"less\"); + } else{ + #two-sample t-test where standard deviations are assumed to be unequal, the test is one-sided: Halt: m1 < m2 + testResult <- t.test(sample1, sample2, var.equal = FALSE, alternative = \"less\"); + } + } else{ #the t-test is one-sided with m1 > m2 + #check if the standard deviations are equal in both populations + if (STEqualityStatus == \"equal\"){ + #two-sample t-test where standard deviations are assumed to be unequal, the test is one-sided: Halt: m1 < m2 + testResult <- t.test(sample1, sample2, var.equal = TRUE, alternative = \"greater\"); + } else{ + #two-sample t-test where standard deviations are assumed to be unequal, the test is one-sided: Halt: m1 < m2 + testResult <- t.test(sample1, sample2, var.equal = FALSE, alternative = \"greater\"); + } + } + } + + #save the output of the t-test into the output text file + testResult; + + #close the output text file + sink(); + + #eof" . "\n"; + +close Rcmd; + +system("R --no-restore --no-save --no-readline < $r_script > $r_script.out"); + +#close the input and output files +close(OUTPUT); +close(INPUT2); +close(INPUT1); +