gclib/scripts/fisher_exact_test.pl

#!/usr/bin/perl
use strict;
use Getopt::Std;
use FindBin;use lib $FindBin::Bin;
use Fisher qw(fishers_exact log_factorial);


my $usage = q/Usage:
 fisher_exact_test.pl [-T] a1 b1 a2 b2
 Computes Fisher's exact test p-values for 2x2 matrix:
   
   a1   b1
          
   a2   b2
 
 -T option will make the input values to be taken in terms of totals:
 
   t1 t2 n1 n2
   
  ..where n1 is a subset of t1 and n2 a subset of t2, i.e. 
    t1=a1+b1 and t2=a2+b2
 
/;
# Clear only the "other-write" permission bit for anything this process creates.
umask 0002;
# Accepted switches: -T (flag) and -o (takes a value).
# NOTE(review): the -o value is not read anywhere in this file -- confirm
# whether it is still needed.
getopts('To:') || die($usage."\n");
die($usage." Error: exactly 4 values are needed (totals first)!\n") unless @ARGV==4;
# True when -T was given: the four values are then read as t1 t2 n1 n2.
my $totals=$Getopt::Std::opt_T;
# Cache of ln(n!) indexed by n, seeded with ln(0!) = ln(1!) = 0.
# LnFactorial() extends it on demand.
my @fncache=(0,0);

# -- needed by Audic-Claverie: calc_audic()
# Iteration cap for the continued fraction in __betacf().
my $MAXIT = 500;
# Convergence threshold tested in __betacf().
# NOTE(review): 3.0E-30 is far below double-precision epsilon (~2.2E-16), so
# the test can only succeed when the step factor is exactly 1 -- confirm
# this value is intended.
my $EPS   = 3.0E-30;
# Smallest magnitude allowed for the continued-fraction terms in __betacf()
# (guards the divisions there).
my $FPMIN = 1.0E-30;
# Series coefficients consumed by __gammln().
my @COF = ( 76.18009172947146, -86.50532032941677,
            24.01409824083091, -1.231739572450155,
            0.1208650973866179E-2,-0.5395239384953E-5 );


# Main program. Reads the four command-line values, builds the 2x2 table
#
#     a  b
#     c  d
#
# and prints:
#   - with -T only: the Audic & Claverie probability and its direction,
#   - the cumulative probability computed by ProbCTable(),
#   - the values returned by Fisher.pm's fishers_exact() without and with
#     its fifth argument (labelled one-tailed / two-tailed).
{
 # Every value is a count. Reject anything that is not a non-negative
 # integer up front: otherwise text is silently evaluated as 0 and negative
 # numbers are handed to the factorial routines, and a meaningless
 # probability gets printed without any diagnostic.
 foreach my $value (@ARGV) {
   die($usage." Error: '$value' is not a non-negative integer!\n")
     unless $value =~ /\A\d+\z/;
 }
 my ($a, $b , $c, $d)=@ARGV;
 if ($totals) {
   # -T: the input is "t1 t2 n1 n2"; derive the table cells from it.
   my ($t1, $t2, $n1,$n2)=@ARGV;
   die("Error: totals should be larger than parts!\n") 
    unless $n1<$t1 && $n2<$t2;
   ($a, $b , $c, $d)=($n1, $t1-$n1, $n2, $t2-$n2);
   print STDERR " a b c d = $a $b $c $d\n";
   #my $ap=audic($t1, $t2, $n1, $n2);
   # Signed form: p-value plus -1/0/+1 direction.
   my ($ap, $apdir)=calc_audic($n1, $n2, $t1, $t2, 1);
   print ">>>>   Audic & Claverie  : $ap ($apdir)\n";
   }
 my $FisherProb = ProbCTable($a, $b , $c, $d);
 print "-----> Fisher Probability: $FisherProb\n";
 my $fet1=fishers_exact($a,$b,$c,$d);
 my $fet2=fishers_exact($a,$b,$c,$d, 1); 
 print "Fisher.pm :   one-tailed:  $fet1\n";
 print "Fisher.pm :   two-tailed:  $fet2\n";
 exit;
 #--- rest is optional:
 # NOTE: everything below is intentionally unreachable (parked after the
 # exit above). If it is ever re-enabled, guard the divisions by $a_b, $c_d,
 # $sd and $zp, and note that ltqnorm() dies when $FisherProb is not
 # strictly between 0 and 1.
 my $a_b = $a + $b;
 my $c_d = $c + $d;
 my $a_c = $a + $c;
 my $b_d = $b + $d;
 my $total = $a + $b + $c + $d;
 my $p1 = $a/$a_b;
 my $p2 = $c/$c_d;
 my $deltap = abs($p1 - $p2);
 my $p  = $a_c / $total;
 my $sd = sqrt($p * (1-$p) * (1/$a_b + 1/$c_d));
 my $z  = abs($p1 - $p2) / $sd;
 my $zp = abs(ltqnorm($FisherProb));
 my $z95 = abs(ltqnorm(0.95));

 my $z_ratio = $z / $zp;
 my $deltap95 = $deltap * ($z95 / $zp);
 my $ratio95 = $z95 / $zp;
 print "Deltap:$deltap\tProjectedDeltap95:$deltap95\tRatio:$ratio95\n\n";

 print "$a\t$b\t$a_b\n$c\t$d\t$c_d\n".
   "$a_c\t$b_d\t$total\nFisherProb: $FisherProb <----\n" .
   "z:$z\nzp:$zp\nratio:$z_ratio\n$p1\t$p2\t$p\n\n";

  my $p_this_table = ProbOneTable($a , $b , $c , $d);
  print "This one table p:$p_this_table\n";

  my $mid_p = $FisherProb - $p_this_table/2;
  print "Mid-p:$mid_p\n\n";
}

#================ SUBROUTINES ============

# Natural logarithm of n!, memoized in the file-level @fncache.
#
#   $n  - the count whose factorial is wanted.
#
# Returns ln(n!) for $n >= 0, or undef for a negative $n.
sub LnFactorial {
    my $n = shift;

    # The sign check must come BEFORE the cache lookup: a negative subscript
    # indexes a Perl array from its end, so $fncache[-1] is "defined" and
    # would be returned as if it were the answer.
    # (Explicit undef kept so callers see the same value as before.)
    return undef if $n < 0;

    return $fncache[$n] if defined $fncache[$n];

    # Extend the cache from its current end up to $n:
    # ln(i!) = ln((i-1)!) + ln(i).
    for my $i (scalar(@fncache) .. $n) {
      $fncache[$i] = $fncache[$i-1] + log($i);
    }

    return $fncache[$n];
}
# Plain (non-logarithmic) factorial of the first argument.
# Any argument below 2 yields 1, because the multiplication range is empty.
sub factorial {
 my ($n) = @_;
 my $product = 1;
 for my $k (2 .. $n) {
   $product *= $k;
 }
 return $product;
}

# Audic & Claverie probability, evaluated in log space.
#
#   ($n1, $n2) - the two values whose ratio $n2/$n1 enters the formula
#   ($x, $y)   - the two counts
#
# Computes
#   (n2/n1)**y * (x+y)! / ( x! * y! * (1 + n2/n1)**(x+y+1) )
# as exp() of the sum of logarithms, using log_factorial() from Fisher.pm.
sub audic { 
 my ($n1, $n2, $x, $y)=@_;
 my $nratio = $n2/$n1;
 my $ln_v = $y*log($nratio);
 $ln_v += log_factorial($x+$y);
 $ln_v -= log_factorial($x);
 $ln_v -= log_factorial($y);
 $ln_v -= ($x+$y+1)*log(1+$nratio);
 return exp($ln_v);
}

sub calc_audic {
=pod

=head2 calc_audic $x, $y, $Nx, $Ny, <$signedValue>

Significance of the difference in tag count (expression) between two
libraries, after Audic and Claverie (1997). This is a plain function:
the first argument must be C<$x>, so it is not meant to be invoked as
an object method.

B<Arguments>

I<$x,$y>

  The number of tags in the x- and y-axis
  libraries, respectively.

I<$Nx,$Ny>

  The total number of tags in the x- and y-axis
  libraries, respectively.

I<$signedValue> (optional)

  Numeric flag; a value >= 1 means TRUE, anything else
  (including omission) means FALSE. When TRUE the function
  returns the p-value followed by a direction indicator:
  -1 if x/Nx is greater than y/Ny, +1 if it is smaller,
  0 if both ratios are equal.

B<Returns>

  The p-value for the observation: the smaller of the two
  incomplete-beta values computed for (x,y) and (y,x).
  A lower number is more significant.

  If $signedValue is TRUE, the list (p-value, direction).

B<Usage>

  my $p = calc_audic( 3, 10, 50000, 60000 );

  # or:
  my ( $p, $sign ) = calc_audic( 3, 10, 50000, 60000, 1 );
  if( $p <= 0.05 ) {
    if( $sign == +1 ) { print "Significantly upregulated.\n"; }
    if( $sign == -1 ) { print "Significantly downregulated.\n"; }
    if( $sign == 0 ) { die( "Same expression should never be significant!" ); }
  }

=cut
    my ( $x, $y, $M, $N, $bSign ) = @_;
    die( " calc_audic no arguments provided." ) unless defined( $x );
    $bSign ||= 0;

    # Share of the first library in the combined total ($M cf n1, $N cf n2).
    my $p = $M / ( $M+$N );

    my $tail_xy = __betai( $x+1, $y+1, $p );
    my $tail_yx = __betai( $y+1, $x+1, 1.0-$p );

    # The smaller tail is reported as-is (not doubled).
    my $pvalue = ( $tail_xy < $tail_yx ) ? $tail_xy : $tail_yx;

    # Unsigned form: just the p-value.
    return $pvalue unless $bSign >= 1;

    # Signed form: compare the per-library ratios to get the direction.
    my $ratio_x = $x / $M;
    my $ratio_y = $y / $N;
    my $sign = 0;
    if    ( $ratio_x > $ratio_y ) { $sign = -1; }
    elsif ( $ratio_x < $ratio_y ) { $sign = +1; }

    return ( $pvalue, $sign );

}

###################################
# Audic and Claverie C->Perl Port #
###################################

# Logarithm of the gamma function of the argument, evaluated with the
# six-term series whose coefficients live in the file-level @COF.
sub __gammln {

    my ( $xx ) = @_;

    my $shifted = $xx + 5.5;
    my $tmp = $shifted - ( $xx + 0.5 ) * log( $shifted );

    # Accumulate COF[j] / (xx + j + 1) for j = 0..5.
    my $ser = 1.000000000190015;
    my $y = $xx;
    foreach my $coef ( @COF[0 .. 5] ) {
        $ser += $coef / ++$y;
    }

    return -$tmp + log( 2.5066282746310005 * $ser / $xx );

}

# Incomplete beta function I_x(a, b).
#
#   $a, $b - shape parameters
#   $x     - evaluation point; dies unless 0 <= x <= 1
#
# The continued fraction (__betacf) is evaluated either directly or on the
# mirrored arguments (b, a, 1-x), depending on where x lies relative to
# (a+1)/(a+b+2).
sub __betai {
    my ( $a, $b, $x ) = @_;

    die( "Bad x in routine betai." ) if $x < 0.0 || $x > 1.0;

    # Prefactor in front of the continued fraction; zero at both endpoints.
    my $bt = 0.0;
    unless( $x == 0.0 || $x == 1.0 ) {
        my $ln_bt = __gammln( $a+$b ) - __gammln( $a ) - __gammln( $b )
                    + $a*log( $x ) + $b*log( 1.0-$x );
        $bt = exp( $ln_bt );
    }

    my $switch_point = ( $a+1.0 )/( $a+$b+2.0 );

    return ( $x < $switch_point )
        ? $bt * __betacf( $a, $b, $x ) / $a
        : 1.0 - $bt * __betacf( $b, $a, 1.0-$x ) / $b;

}

# Absolute value: negates the argument when it is below zero, otherwise
# hands it back unchanged.
sub __fabs {
    my ( $value ) = @_;
    return -$value if $value < 0;
    return $value;
}

# Continued-fraction evaluation used by __betai().
#
#   $a, $b - shape parameters
#   $x     - evaluation point
#
# Runs at most $MAXIT iterations; each iteration applies two successive
# update steps to the running product $h. Terms whose magnitude drops below
# $FPMIN are replaced by $FPMIN before they are used as divisors. The loop
# ends early once the second step's factor differs from 1 by less than $EPS.
# If the iteration cap is hit, a warning goes to STDERR and the current
# value of $h is returned anyway.
sub __betacf {

    my $a = shift;
    my $b = shift;
    my $x = shift;

    my $qab = $a + $b;
    my $qap = $a + 1.0;
    my $qam = $a - 1.0;
    my $c = 1.0;
    my $d = 1.0 - $qab * $x / $qap;

    # Keep the divisor away from zero.
    if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }

    $d = 1.0 / $d; # inverse d
    my $h = $d;
    # $m is declared outside the loop so it can be inspected afterwards.
    my $m;
    for( $m = 1; $m <= $MAXIT; $m++ ) {
        my $m2 = 2 * $m;
        # First step of this iteration.
        my $aa = $m * ( $b-$m ) * $x / ( ( $qam + $m2 ) * ( $a + $m2 ) );

        $d = 1.0 + $aa*$d;
        if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }

        $c = 1.0 + $aa/$c;
        if( __fabs( $c ) < $FPMIN ) { $c = $FPMIN; }

        $d = 1.0 / $d;  # inverse d

        $h *= $d*$c;

        # Second step of this iteration.
        $aa = -($a+$m)*($qab+$m)*$x/(($a+$m2)*($qap+$m2));

        $d = 1.0 + $aa * $d;
        if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }

        $c = 1.0 + $aa / $c;
        if( __fabs( $c ) < $FPMIN ) { $c = $FPMIN; }

        $d = 1.0 / $d; # inverse d;

        my $del = $d*$c;
        $h *= $del;
        # Converged: the last factor no longer changes the product.
        if( __fabs( $del-1.0 ) < $EPS ) { last; }
    }

    # $m only exceeds $MAXIT when the loop ran out without hitting "last".
    if( $m > $MAXIT ) {
       # die( "a or b too big, or MAXIT too small in __betacf" );
       print STDERR "a($a) or b($b) too big, or MAXIT($MAXIT) too small in __betacf!\n";
    }
    return $h;
}


# Probability of one specific 2x2 table (a b / c d) under the
# hypergeometric distribution:
#
#   (a+b)! (c+d)! (a+c)! (b+d)!  /  ( a! b! c! d! n! ),   n = a+b+c+d
#
# The factorials are combined as logarithms (LnFactorial) and only the
# final difference is exponentiated.
sub ProbOneTable {
  my ($a, $b, $c, $d) = @_;
  my $n = $a + $b + $c + $d;

  # Row and column totals go into the numerator ...
  my $ln_num = 0;
  foreach my $margin ($a+$b, $c+$d, $a+$c, $b+$d) {
    $ln_num += LnFactorial($margin);
  }

  # ... the four cells and the grand total into the denominator.
  my $ln_den = 0;
  foreach my $count ($a, $b, $c, $d, $n) {
    $ln_den += LnFactorial($count);
  }

  return exp($ln_num - $ln_den);
}

# Cumulative probability of the observed 2x2 table (a b / c d) and of every
# table that is more extreme in the same direction, with all row and column
# totals held fixed. Each table's probability comes from ProbOneTable().
#
# Direction:
#   a*d >= b*c : shift counts towards the a/d diagonal, one unit at a time,
#                until b or c reaches zero;
#   otherwise  : shift counts towards the b/c diagonal until a or d
#                reaches zero.
#
# The direction is decided once, from the observed table. The arguments are
# no longer modified while stepping, so the decision cannot be affected by
# the stepping itself.
sub ProbCTable {
  my ($a, $b, $c, $d) = @_;

  # Start with the observed table.
  my $p = ProbOneTable($a, $b, $c, $d);

  if ( ($a * $d) >= ($b * $c) ) {
    my $steps = ($c < $b) ? $c : $b;
    for my $k (1 .. $steps) {
      $p += ProbOneTable($a + $k, $b - $k, $c - $k, $d + $k);
    }
  }
  else {
    my $steps = ($a < $d) ? $a : $d;
    for my $k (1 .. $steps) {
      $p += ProbOneTable($a - $k, $b + $k, $c + $k, $d - $k);
    }
  }

  return $p;
}

# Lower tail quantile for standard normal distribution function.
#
# This function returns an approximation of the inverse cumulative
# standard normal distribution function.  I.e., given P, it returns
# an approximation to the X satisfying P = Pr{Z <= X} where Z is a
# random variable from the standard normal distribution.
#
# The algorithm uses a minimax approximation by rational functions
# and the result has a relative error whose absolute value is less
# than 1.15e-9.
#
# Author:      Peter J. Acklam
# Time-stamp:  2000-07-19 18:26:14
# E-mail:      pjacklam@online.no
# WWW URL:     http://home.online.no/~pjacklam
sub ltqnorm  {
  my ($p) = @_;
  die "input argument must be in (0,1)\n" unless 0 < $p && $p < 1;

  # Coefficients of the rational approximations, highest power first.
  # The denominators carry their trailing constant term 1 explicitly.
  my @central_num = (-3.969683028665376e+01,  2.209460984245205e+02,
                     -2.759285104469687e+02,  1.383577518672690e+02,
                     -3.066479806614716e+01,  2.506628277459239e+00);
  my @central_den = (-5.447609879822406e+01,  1.615858368580409e+02,
                     -1.556989798598866e+02,  6.680131188771972e+01,
                     -1.328068155288572e+01,  1);
  my @tail_num    = (-7.784894002430293e-03, -3.223964580411365e-01,
                     -2.400758277161838e+00, -2.549732539343734e+00,
                      4.374664141464968e+00,  2.938163982698783e+00);
  my @tail_den    = ( 7.784695709041462e-03,  3.224671290700398e-01,
                      2.445134137142996e+00,  3.754408661907416e+00,
                      1);

  # Horner evaluation: ((k0*x + k1)*x + k2)*x + ...
  my $horner = sub {
    my ($x, @coef) = @_;
    my $acc = shift @coef;
    foreach my $k (@coef) {
      $acc = $acc * $x + $k;
    }
    return $acc;
  };

  # Break-points between the tail regions and the central region.
  my $plow  = 0.02425;
  my $phigh = 1 - $plow;

  # Lower tail.
  if ( $p < $plow ) {
    my $q = sqrt(-2*log($p));
    return $horner->($q, @tail_num) / $horner->($q, @tail_den);
  }

  # Upper tail: same approximation on 1-p, with the sign flipped.
  if ( $phigh < $p ) {
    my $q = sqrt(-2*log(1-$p));
    return -$horner->($q, @tail_num) / $horner->($q, @tail_den);
  }

  # Central region.
  my $q = $p - 0.5;
  my $r = $q*$q;
  return $horner->($r, @central_num) * $q / $horner->($r, @central_den);
}
Revision:	24
Committed:	Tue Jul 26 21:46:39 2011 UTC (13 years, 1 month ago) by gpertea
File size:	11212 byte(s)
Log Message:
Line	File contents
1	#!/usr/bin/perl
2	use strict;
3	use Getopt::Std;
4	use FindBin;use lib $FindBin::Bin;
5	use Fisher qw(fishers_exact log_factorial);
6
7
8	my $usage = q/Usage:
9	fisher_exact_test.pl [-T] a1 b1 a2 b2
10	Computes Fisher's exact test p-values for 2x2 matrix:
11
12	a1 b1
13
14	a2 b2
15
16	-T option will make the input values to be taken in terms of totals:
17
18	t1 t2 n1 n2
19
20	..where n1 is a subset of t1 and n2 a subset of t2, i.e.
21	t1=a1+b1 and t2=a2+b2
22
23	/;
24	umask 0002;
25	getopts('To:') || die($usage."\n");
26	die($usage." Error: exactly 4 values are needed (totals first)!\n") unless @ARGV==4;
27	my $totals=$Getopt::Std::opt_T;
28	my @fncache=(0,0);
29
30	# -- needed by Audic-Calverie: calc_audic()
31	my $MAXIT = 500;
32	my $EPS = 3.0E-30;
33	my $FPMIN = 1.0E-30;
34	my @COF = ( 76.18009172947146, -86.50532032941677,
35	24.01409824083091, -1.231739572450155,
36	0.1208650973866179E-2,-0.5395239384953E-5 );
37
38
39
40	{
41	my ($a, $b , $c, $d)=@ARGV;
42	if ($totals) {
43	my ($t1, $t2, $n1,$n2)=@ARGV;
44	die("Error: totals should be larger than parts!\n")
45	unless $n1<$t1 && $n2<$t2;
46	($a, $b , $c, $d)=($n1, $t1-$n1, $n2, $t2-$n2);
47	print STDERR " a b c d = $a $b $c $d\n";
48	#my $ap=audic($t1, $t2, $n1, $n2);
49	my ($ap, $apdir)=calc_audic($n1, $n2, $t1, $t2, 1);
50	print ">>>> Audic & Claverie : $ap ($apdir)\n";
51	}
52	my $FisherProb = ProbCTable($a, $b , $c, $d);
53	print "-----> Fisher Probability: $FisherProb\n";
54	my $fet1=fishers_exact($a,$b,$c,$d);
55	my $fet2=fishers_exact($a,$b,$c,$d, 1);
56	print "Fisher.pm : one-tailed: $fet1\n";
57	print "Fisher.pm : two-tailed: $fet2\n";
58	exit;
59	#--- rest is optional:
60	my $a_b = $a + $b;
61	my $c_d = $c + $d;
62	my $a_c = $a + $c;
63	my $b_d = $b + $d;
64	my $total = $a + $b + $c + $d;
65	my $p1 = $a/$a_b;
66	my $p2 = $c/$c_d;
67	my $deltap = abs($p1 - $p2);
68	my $p = $a_c / $total;
69	my $sd = sqrt($p * (1-$p) * (1/$a_b + 1/$c_d));
70	my $z = abs($p1 - $p2) / $sd;
71	my $zp = abs(ltqnorm($FisherProb));
72	my $z95 = abs(ltqnorm(0.95));
73
74	my $z_ratio = $z / $zp;
75	my $deltap95 = $deltap * ($z95 / $zp);
76	my $ratio95 = $z95 / $zp;
77	print "Deltap:$deltap\tProjectedDeltap95:$deltap95\tRatio:$ratio95\n\n";
78
79	print "$a\t$b\t$a_b\n$c\t$d\t$c_d\n".
80	"$a_c\t$b_d\t$total\nFisherProb: $FisherProb <----\n" .
81	"z:$z\nzp:$zp\nratio:$z_ratio\n$p1\t$p2\t$p\n\n";
82
83	my $p_this_table = ProbOneTable($a , $b , $c , $d);
84	print "This one table p:$p_this_table\n";
85
86	my $mid_p = $FisherProb - $p_this_table/2;
87	print "Mid-p:$mid_p\n\n";
88	}
89
90	#================ SUBROUTINES ============
91
92	sub LnFactorial {
93	my $n = shift;
94	return $fncache[$n] if defined $fncache[$n];
95	return undef if $n < 0;
96	for (my $i = scalar(@fncache); $i <= $n; $i++) {
97	$fncache[$i] = $fncache[$i-1] + log($i);
98	}
99
100	return $fncache[$n];
101	}
102	sub factorial {
103	my $r=1;
104	$r *= $_ foreach 2..$_[0];
105	return $r;
106	}
107
108	#compute Audic & Claverie probability
109	sub audic {
110	my ($n1, $n2, $x, $y)=@_;
111	my $v=$y*log($n2/$n1)+log_factorial($x+$y)-log_factorial($x)-log_factorial($y)-
112	($x+$y+1)*log(1+$n2/$n1);
113	return exp($v);
114	#my $nratio=$n2/$n1;
115	#my $v=($nratio ** $y)*factorial($x+$y)/(factorial($x)*factorial($y)*((1+$nratio)**($x+$y+1)));
116
117	}
118
119	sub calc_audic {
120	=pod
121
122	=head2 calc_audic $x, $y, $Nx, $Ny, <$signedValue>
123
124	Determines the statistical significance of the difference
125	in tag count (expression) between two libraries. This
126	function uses the method described by Audic and
127	Claverie (1997). This method can be called on an
128	instantiated object, as well as statically.
129
130	B<Arguments>
131
132	I<$x,$y>
133
134	The number of tags in the x- and y-axis
135	libraries, respectively.
136
137	I<$Nx,$Ny>
138
139	The total number of tags in the x- and y-axis
140	libraries, respectively.
141
142	I<$signedValue> (optional)
143
144	A boolean value (>=1 is FALSE). If this flag is
145	set to TRUE, downregulated comparisons will return
146	both a p-value and either +1, -1, or 0 to indicate
147	up/down/same-regulation (i.e. -1 if the expression
148	ratio of tags in the x-axis library(s) is greater
149	than that of the y-axis library(s)). This flag
150	is FALSE by default.
151
152	B<Returns>
153
154	The p-value for the observation. A lower number is
155	more significant. Typically, observations with
156	p <= 0.05 are considered statistically significant.
157
158	If $signedValue is set to TRUE, the function also
159	returns a 0, -1 or +1 to indicate same/down/up-regulation.
160
161	B<Usage>
162
163	# the function is static, so it can be accessed directly
164	my $p = calc_audic( 3, 10, 50000, 60000 );
165
166	# or:
167	my ( $p, $sign ) = calc_audic( 3, 10, 50000, 60000, 1 );
168	if( $p <= 0.05 ) {
169	if( $sign == +1 ) { print "Significantly upregulated.\n"; }
170	if( $sign == -1 ) { print "Significantly downregulated.\n"; }
171	if( $sign == 0 ) { die( "Same expression should never be significant!" ); }
172	}
173
174	=cut
175	my $x = shift;
176	if( !defined( $x ) ) { die( " calc_audic no arguments provided." ); }
177	my $y = shift;
178	my $M = shift; # cf n1
179	my $N = shift; # cf n2
180	my $bSign = shift || 0;
181
182	my $p = $M / ( $M+$N );
183
184	my $thisproba = __betai( $x+1, $y+1, $p );
185	my $thisproba2 = __betai( $y+1, $x+1, 1.0-$p );
186
187	if( $bSign >= 1 ) {
188	my $ratio1 = $x / $M;
189	my $ratio2 = $y / $N;
190	my $sign = 0;
191	if( $ratio1 > $ratio2 ) { $sign = -1; }
192	if( $ratio1 < $ratio2 ) { $sign = +1; }
193	#return ( ( $thisproba < $thisproba2 ? ( 2*$thisproba ) : ( 2*$thisproba2 ) ), $sign );
194	return ( ($thisproba < $thisproba2) ? $thisproba : $thisproba2, $sign );
195	}
196
197	# return ( $thisproba < $thisproba2 ? ( 2*$thisproba ) : ( 2*$thisproba2 ) );
198	return ( $thisproba < $thisproba2) ? $thisproba : $thisproba2 ;
199
200	}
201
202	###################################
203	# Audic and Claverie C->Perl Port #
204	###################################
205
206	sub __gammln {
207
208	my $xx = shift;
209
210	my $x = $xx;
211	my $y = $xx;
212
213	my $tmp = $x + 5.5;
214	$tmp -= ( $x + 0.5 ) * log( $tmp );
215	my $ser = 1.000000000190015;
216	for( my $j = 0; $j <= 5; $j++ ) { $ser += $COF[$j] / ++$y; }
217
218	return -$tmp + log( 2.5066282746310005 * $ser / $x );
219
220	}
221
222	sub __betai {
223	my $a = shift;
224	my $b = shift;
225	my $x = shift;
226
227	if( $x < 0.0 || $x > 1.0 ) {
228	die( "Bad x in routine betai." );
229	}
230
231	my $bt;
232
233	if( $x == 0.0 || $x == 1.0 ) {
234	$bt = 0.0;
235	} else {
236	$bt = exp( __gammln( $a+$b ) - __gammln( $a ) - __gammln( $b ) + $a*log( $x ) + $b*log( 1.0-$x ) );
237	}
238
239	if( $x < ( $a+1.0 )/( $a+$b+2.0 ) ) {
240	return $bt * __betacf( $a, $b, $x ) / $a;
241	}
242
243	return 1.0 - $bt * __betacf( $b, $a, 1.0-$x ) / $b;
244
245	}
246
247	sub __fabs {
248	my $x = shift;
249	return ( $x < 0 ? -$x : $x );
250	}
251
252	sub __betacf {
253
254	my $a = shift;
255	my $b = shift;
256	my $x = shift;
257
258	my $qab = $a + $b;
259	my $qap = $a + 1.0;
260	my $qam = $a - 1.0;
261	my $c = 1.0;
262	my $d = 1.0 - $qab * $x / $qap;
263
264	if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }
265
266	$d = 1.0 / $d; # inverse d
267	my $h = $d;
268	my $m;
269	for( $m = 1; $m <= $MAXIT; $m++ ) {
270	my $m2 = 2 * $m;
271	my $aa = $m * ( $b-$m ) * $x / ( ( $qam + $m2 ) * ( $a + $m2 ) );
272
273	$d = 1.0 + $aa*$d;
274	if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }
275
276	$c = 1.0 + $aa/$c;
277	if( __fabs( $c ) < $FPMIN ) { $c = $FPMIN; }
278
279	$d = 1.0 / $d; # inverse d
280
281	$h *= $d*$c;
282
283	$aa = -($a+$m)*($qab+$m)*$x/(($a+$m2)*($qap+$m2));
284
285	$d = 1.0 + $aa * $d;
286	if( __fabs( $d ) < $FPMIN ) { $d = $FPMIN; }
287
288	$c = 1.0 + $aa / $c;
289	if( __fabs( $c ) < $FPMIN ) { $c = $FPMIN; }
290
291	$d = 1.0 / $d; # inverse d;
292
293	my $del = $d*$c;
294	$h *= $del;
295	if( __fabs( $del-1.0 ) < $EPS ) { last; }
296	}
297
298	if( $m > $MAXIT ) {
299	# die( "a or b too big, or MAXIT too small in __betacf" );
300	print STDERR "a($a) or b($b) too big, or MAXIT($MAXIT) too small in __betacf!\n";
301	}
302	return $h;
303	}
304
305
306
307	# Compute the probability of getting this exact table
308	# using the hypergeometric distribution
309	sub ProbOneTable {
310	my ($a , $b , $c, $d) = @_;
311	my $n = $a + $b + $c + $d;
312	my $LnNumerator = LnFactorial($a+$b)+
313	LnFactorial($c+$d)+
314	LnFactorial($a+$c)+
315	LnFactorial($b+$d);
316
317	my $LnDenominator = LnFactorial($a) +
318	LnFactorial($b) +
319	LnFactorial($c) +
320	LnFactorial($d) +
321	LnFactorial($n);
322
323	my $LnP = $LnNumerator - $LnDenominator;
324	return exp($LnP);
325	}
326
327	# Compute the cumulative probability by adding up individual
328	# probabilities
329	sub ProbCTable {
330	my ($a, $b, $c, $d) = @_;
331
332	my $min;
333
334	my $n = $a + $b + $c + $d;
335
336	my $p = 0;
337	$p += ProbOneTable($a, $b, $c, $d);
338	if( ($a * $d) >= ($b * $c) ) {
339	$min = ($c < $b) ? $c : $b;
340	for(my $i = 0; $i < $min; $i++) {
341	$p += ProbOneTable(++$a, --$b, --$c, ++$d);
342	}
343	}
344
345	if ( ($a * $d) < ($b * $c) ) {
346	$min = ($a < $d) ? $a : $d;
347	for(my $i = 0; $i < $min; $i++) {
348	$p += ProbOneTable(--$a, ++$b, ++$c, --$d);
349	}
350	}
351	return $p;
352	}
353
354	# Lower tail quantile for standard normal distribution function.
355	#
356	# This function returns an approximation of the inverse cumulative
357	# standard normal distribution function. I.e., given P, it returns
358	# an approximation to the X satisfying P = Pr{Z <= X} where Z is a
359	# random variable from the standard normal distribution.
360	#
361	# The algorithm uses a minimax approximation by rational functions
362	# and the result has a relative error whose absolute value is less
363	# than 1.15e-9.
364	#
365	# Author: Peter J. Acklam
366	# Time-stamp: 2000-07-19 18:26:14
367	# E-mail: pjacklam@online.no
368	# WWW URL: http://home.online.no/~pjacklam
369	sub ltqnorm {
370	my $p = shift;
371	die "input argument must be in (0,1)\n" unless 0 < $p && $p < 1;
372
373	# Coefficients in rational approximations.
374	my @a = (-3.969683028665376e+01, 2.209460984245205e+02,
375	-2.759285104469687e+02, 1.383577518672690e+02,
376	-3.066479806614716e+01, 2.506628277459239e+00);
377	my @b = (-5.447609879822406e+01, 1.615858368580409e+02,
378	-1.556989798598866e+02, 6.680131188771972e+01,
379	-1.328068155288572e+01 );
380	my @c = (-7.784894002430293e-03, -3.223964580411365e-01,
381	-2.400758277161838e+00, -2.549732539343734e+00,
382	4.374664141464968e+00, 2.938163982698783e+00);
383	my @d = ( 7.784695709041462e-03, 3.224671290700398e-01,
384	2.445134137142996e+00, 3.754408661907416e+00);
385
386	# Define break-points.
387	my $plow = 0.02425;
388	my $phigh = 1 - $plow;
389
390	# Rational approximation for lower region:
391	if ( $p < $plow ) {
392	my $q = sqrt(-2*log($p));
393	return ((((($c[0]*$q+$c[1])*$q+$c[2])*$q+$c[3])*$q+$c[4])*$q+$c[5]) /
394	(((($d[0]*$q+$d[1])*$q+$d[2])*$q+$d[3])*$q+1);
395	}
396
397	# Rational approximation for upper region:
398	if ( $phigh < $p ) {
399	my $q = sqrt(-2*log(1-$p));
400	return -((((($c[0]*$q+$c[1])*$q+$c[2])*$q+$c[3])*$q+$c[4])*$q+$c[5]) /
401	(((($d[0]*$q+$d[1])*$q+$d[2])*$q+$d[3])*$q+1);
402	}
403
404	# Rational approximation for central region:
405	my $q = $p - 0.5;
406	my $r = $q*$q;
407	return ((((($a[0]*$r+$a[1])*$r+$a[2])*$r+$a[3])*$r+$a[4])*$r+$a[5])*$q /
408	((((($b[0]*$r+$b[1])*$r+$b[2])*$r+$b[3])*$r+$b[4])*$r+1);
409	}