## Copyright (C) 1995, 1996, 1997 Kurt Hornik
##
## This file is part of Octave.
##
## Octave is free software; you can redistribute it and/or modify it
## under the terms of the GNU General Public License as published by
## the Free Software Foundation; either version 2, or (at your option)
## any later version.
##
## Octave is distributed in the hope that it will be useful, but
## WITHOUT ANY WARRANTY; without even the implied warranty of
## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
## General Public License for more details.
##
## You should have received a copy of the GNU General Public License
## along with Octave; see the file COPYING. If not, write to the Free
## Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
## 02110-1301, USA.

## -*- texinfo -*-
## @deftypefn {Function File} {[@var{pval}, @var{z}] =} u_test (@var{x}, @var{y}, @var{alt})
## For two samples @var{x} and @var{y}, perform a Mann-Whitney U-test of
## the null hypothesis PROB (@var{x} > @var{y}) == 1/2 == PROB (@var{x}
## < @var{y}). Under the null, the test statistic @var{z} approximately
## follows a standard normal distribution. Note that this test is
## equivalent to the Wilcoxon rank-sum test.
##
## With the optional argument string @var{alt}, the alternative of
## interest can be selected. If @var{alt} is @code{"!="} or
## @code{"<>"}, the null is tested against the two-sided alternative
## PROB (@var{x} > @var{y}) != 1/2. If @var{alt} is @code{">"}, the
## one-sided alternative PROB (@var{x} > @var{y}) > 1/2 is considered.
## Similarly for @code{"<"}, the one-sided alternative PROB (@var{x} >
## @var{y}) < 1/2 is considered. The default is the two-sided case.
##
## The p-value of the test is returned in @var{pval}.
##
## If no output argument is given, the p-value of the test is displayed.
## @end deftypefn

## This implementation is still incomplete---for small sample sizes,
## the normal approximation is rather bad ...

## Author: KH <Kurt.Hornik@wu-wien.ac.at>
## Description: Mann-Whitney U-test

function [pval, z] = u_test (x, y, alt)

  ## Mann-Whitney U-test (Wilcoxon rank-sum test) for two samples, using
  ## the normal approximation of the rank-sum statistic.
  ##
  ## Inputs:
  ##   x, y  sample vectors (row or column; both are flattened to rows).
  ##   alt   optional string selecting the alternative hypothesis:
  ##         "!=" or "<>" (two-sided, default), ">" or "<" (one-sided).
  ## Outputs:
  ##   pval  p-value of the test for the selected alternative.
  ##   z     standardized rank sum of x.
  ## When called without output arguments the p-value is printed.

  if ((nargin < 2) || (nargin > 3))
    print_usage ();
  endif

  if (! (isvector (x) && isvector (y)))
    error ("u_test: both x and y must be vectors");
  endif

  n_x = length (x);
  n_y = length (y);

  ## Rank the pooled sample; the first n_x entries of r belong to x.
  r = ranks ([(reshape (x, 1, n_x)), (reshape (y, 1, n_y))]);

  ## Center the rank sum of x by n_x * (N + 1) / 2 and scale it by
  ## sqrt (n_x * n_y * (N + 1) / 12), where N = n_x + n_y.  z is
  ## positive when the x values tend to occupy the higher ranks.
  z = (sum (r(1 : n_x)) - n_x * (n_x + n_y + 1) / 2) ...
      / sqrt (n_x * n_y * (n_x + n_y + 1) / 12);

  cdf = stdnormal_cdf (z);

  ## The two-sided alternative is the default.
  if (nargin == 2)
    alt = "!=";
  endif

  if (! ischar (alt))
    error("u_test: alt must be a string");
  endif
  if (strcmp (alt, "!=") || strcmp (alt, "<>"))
    pval = 2 * min (cdf, 1 - cdf);
  elseif (strcmp (alt, ">"))
    ## Alternative PROB (x > y) > 1/2: evidence is a large positive z,
    ## so the p-value is the upper tail.
    pval = 1 - cdf;
  elseif (strcmp (alt, "<"))
    ## Alternative PROB (x > y) < 1/2: evidence is a large negative z,
    ## so the p-value is the lower tail.
    pval = cdf;
  else
    error ("u_test: option %s not recognized", alt);
  endif

  if (nargout == 0)
    printf (" pval: %g\n", pval);
  endif

endfunction