Mercurial > hg > octave-nkf
annotate scripts/statistics/models/logistic_regression.m @ 17338:1c89599167a6
maint: End m-files with 1 blank line.
Simplifies automated grammarchecking script.
* scripts/@ftp/ascii.m, scripts/@ftp/binary.m, scripts/@ftp/cd.m,
scripts/@ftp/close.m, scripts/@ftp/delete.m, scripts/@ftp/dir.m,
scripts/@ftp/display.m, scripts/@ftp/ftp.m, scripts/@ftp/loadobj.m,
scripts/@ftp/mget.m, scripts/@ftp/mkdir.m, scripts/@ftp/mput.m,
scripts/@ftp/rename.m, scripts/@ftp/rmdir.m, scripts/@ftp/saveobj.m,
scripts/audio/lin2mu.m, scripts/audio/loadaudio.m, scripts/audio/mu2lin.m,
scripts/audio/record.m, scripts/audio/saveaudio.m, scripts/audio/setaudio.m,
scripts/deprecated/__error_text__.m, scripts/deprecated/cut.m,
scripts/deprecated/error_text.m, scripts/deprecated/isstr.m,
scripts/deprecated/polyderiv.m, scripts/deprecated/studentize.m,
scripts/deprecated/sylvester_matrix.m, scripts/general/bicubic.m,
scripts/general/celldisp.m, scripts/general/colon.m,
scripts/general/cplxpair.m, scripts/general/del2.m, scripts/general/display.m,
scripts/general/isdir.m, scripts/general/isequaln.m, scripts/general/loadobj.m,
scripts/general/private/__isequal__.m, scripts/general/private/__splinen__.m,
scripts/general/profexplore.m, scripts/general/quadgk.m,
scripts/general/randi.m, scripts/general/repmat.m, scripts/general/saveobj.m,
scripts/geometry/delaunay.m, scripts/help/__unimplemented__.m,
scripts/help/doc_cache_create.m, scripts/help/get_first_help_sentence.m,
scripts/help/help.m, scripts/help/print_usage.m,
scripts/help/private/__additional_help_message__.m,
scripts/help/private/__strip_html_tags__.m, scripts/help/type.m,
scripts/image/imfinfo.m, scripts/image/imformats.m, scripts/image/imread.m,
scripts/image/imwrite.m, scripts/image/private/__imfinfo__.m,
scripts/image/private/__imread__.m, scripts/image/private/__imwrite__.m,
scripts/image/private/imageIO.m, scripts/image/private/imwrite_filename.m,
scripts/image/private/ind2x.m, scripts/io/beep.m, scripts/io/strread.m,
scripts/io/textread.m, scripts/io/textscan.m, scripts/linear-algebra/krylov.m,
scripts/linear-algebra/subspace.m, scripts/miscellaneous/bug_report.m,
scripts/miscellaneous/bunzip2.m, scripts/miscellaneous/cast.m,
scripts/miscellaneous/copyfile.m, scripts/miscellaneous/debug.m,
scripts/miscellaneous/dir.m, scripts/miscellaneous/dump_prefs.m,
scripts/miscellaneous/error_ids.m, scripts/miscellaneous/fileattrib.m,
scripts/miscellaneous/gunzip.m, scripts/miscellaneous/isdeployed.m,
scripts/miscellaneous/ismac.m, scripts/miscellaneous/mex.m,
scripts/miscellaneous/mexext.m, scripts/miscellaneous/mkoctfile.m,
scripts/miscellaneous/movefile.m, scripts/miscellaneous/namelengthmax.m,
scripts/miscellaneous/news.m, scripts/miscellaneous/pack.m,
scripts/miscellaneous/perl.m,
scripts/miscellaneous/private/display_info_file.m,
scripts/miscellaneous/python.m, scripts/miscellaneous/rmappdata.m,
scripts/miscellaneous/run.m, scripts/miscellaneous/tar.m,
scripts/miscellaneous/tempname.m, scripts/miscellaneous/untar.m,
scripts/miscellaneous/unzip.m, scripts/miscellaneous/what.m,
scripts/miscellaneous/zip.m, scripts/optimization/fminunc.m,
scripts/optimization/fsolve.m, scripts/optimization/fzero.m,
scripts/optimization/glpk.m, scripts/optimization/optimget.m,
scripts/optimization/optimset.m, scripts/optimization/qp.m,
scripts/optimization/sqp.m, scripts/path/pathdef.m, scripts/pkg/pkg.m,
scripts/pkg/private/build.m, scripts/pkg/private/describe.m,
scripts/pkg/private/dirempty.m, scripts/pkg/private/get_forge_download.m,
scripts/pkg/private/get_forge_pkg.m,
scripts/pkg/private/get_unsatisfied_deps.m, scripts/pkg/private/install.m,
scripts/pkg/private/is_architecture_dependent.m,
scripts/pkg/private/list_forge_packages.m, scripts/pkg/private/rebuild.m,
scripts/pkg/private/shell.m, scripts/pkg/private/uninstall.m,
scripts/plot/axes.m, scripts/plot/box.m, scripts/plot/closereq.m,
scripts/plot/diffuse.m, scripts/plot/ezpolar.m, scripts/plot/findfigs.m,
scripts/plot/gco.m, scripts/plot/guidata.m, scripts/plot/guihandles.m,
scripts/plot/hdl2struct.m, scripts/plot/linkprop.m, scripts/plot/peaks.m,
scripts/plot/print.m, scripts/plot/private/__add_datasource__.m,
scripts/plot/private/__axis_label__.m, scripts/plot/private/__clabel__.m,
scripts/plot/private/__color_str_rgb__.m, scripts/plot/private/__contour__.m,
scripts/plot/private/__default_plot_options__.m,
scripts/plot/private/__errcomm__.m, scripts/plot/private/__file_filter__.m,
scripts/plot/private/__fltk_file_filter__.m,
scripts/plot/private/__getlegenddata__.m,
scripts/plot/private/__gnuplot_open_stream__.m,
scripts/plot/private/__gnuplot_print__.m,
scripts/plot/private/__go_draw_axes__.m,
scripts/plot/private/__interp_cube__.m, scripts/plot/private/__is_function__.m,
scripts/plot/private/__line__.m, scripts/plot/private/__marching_cube__.m,
scripts/plot/private/__next_line_style__.m, scripts/plot/private/__patch__.m,
scripts/plot/private/__pie__.m, scripts/plot/private/__pltopt__.m,
scripts/plot/private/__quiver__.m, scripts/plot/private/__scatter__.m,
scripts/plot/private/__stem__.m, scripts/plot/private/__uigetdir_fltk__.m,
scripts/plot/private/__uigetfile_fltk__.m,
scripts/plot/private/__uiobject_split_args__.m,
scripts/plot/private/__uiputfile_fltk__.m, scripts/plot/refresh.m,
scripts/plot/saveas.m, scripts/plot/shg.m, scripts/plot/specular.m,
scripts/plot/sphere.m, scripts/plot/struct2hdl.m, scripts/plot/subplot.m,
scripts/plot/uicontextmenu.m, scripts/plot/uicontrol.m, scripts/plot/uipanel.m,
scripts/plot/uipushtool.m, scripts/plot/uiresume.m,
scripts/plot/uitoggletool.m, scripts/plot/uitoolbar.m, scripts/plot/uiwait.m,
scripts/plot/waitforbuttonpress.m, scripts/polynomial/pchip.m,
scripts/polynomial/polyeig.m, scripts/polynomial/ppval.m,
scripts/prefs/addpref.m, scripts/prefs/getpref.m, scripts/prefs/ispref.m,
scripts/prefs/private/loadprefs.m, scripts/prefs/private/prefsfile.m,
scripts/prefs/private/saveprefs.m, scripts/prefs/setpref.m,
scripts/set/private/validargs.m, scripts/set/unique.m,
scripts/signal/arch_fit.m, scripts/signal/arch_rnd.m,
scripts/signal/arch_test.m, scripts/signal/arma_rnd.m,
scripts/signal/durbinlevinson.m, scripts/signal/fractdiff.m,
scripts/signal/freqz.m, scripts/signal/freqz_plot.m, scripts/signal/hurst.m,
scripts/signal/periodogram.m, scripts/signal/private/rectangle_lw.m,
scripts/signal/private/rectangle_sw.m, scripts/signal/private/triangle_sw.m,
scripts/signal/spectral_adf.m, scripts/signal/spectral_xdf.m,
scripts/signal/stft.m, scripts/signal/synthesis.m, scripts/signal/yulewalker.m,
scripts/sparse/colperm.m, scripts/sparse/eigs.m, scripts/sparse/etreeplot.m,
scripts/sparse/gmres.m, scripts/sparse/private/__sprand_impl__.m,
scripts/sparse/spdiags.m, scripts/sparse/sprandn.m, scripts/specfun/bessel.m,
scripts/specfun/betaln.m, scripts/specfun/expint.m,
scripts/special-matrix/gallery.m, scripts/startup/__finish__.m,
scripts/statistics/base/qqplot.m, scripts/statistics/distributions/tcdf.m,
scripts/statistics/distributions/wienrnd.m,
scripts/statistics/models/logistic_regression.m,
scripts/statistics/models/private/logistic_regression_derivatives.m,
scripts/statistics/models/private/logistic_regression_likelihood.m,
scripts/statistics/tests/anova.m, scripts/statistics/tests/bartlett_test.m,
scripts/statistics/tests/chisquare_test_homogeneity.m,
scripts/statistics/tests/chisquare_test_independence.m,
scripts/statistics/tests/cor_test.m,
scripts/statistics/tests/f_test_regression.m,
scripts/statistics/tests/hotelling_test.m,
scripts/statistics/tests/hotelling_test_2.m,
scripts/statistics/tests/kolmogorov_smirnov_test_2.m,
scripts/statistics/tests/kruskal_wallis_test.m,
scripts/statistics/tests/manova.m, scripts/statistics/tests/mcnemar_test.m,
scripts/statistics/tests/prop_test_2.m, scripts/statistics/tests/run_test.m,
scripts/statistics/tests/sign_test.m, scripts/statistics/tests/t_test.m,
scripts/statistics/tests/t_test_2.m,
scripts/statistics/tests/t_test_regression.m,
scripts/statistics/tests/u_test.m, scripts/statistics/tests/var_test.m,
scripts/statistics/tests/welch_test.m,
scripts/statistics/tests/wilcoxon_test.m, scripts/statistics/tests/z_test.m,
scripts/statistics/tests/z_test_2.m, scripts/strings/strcat.m,
scripts/strings/strjoin.m, scripts/strings/strsplit.m,
scripts/testfun/__have_feature__.m, scripts/testfun/__printf_assert__.m,
scripts/testfun/__prog_output_assert__.m, scripts/testfun/__run_test_suite__.m,
scripts/time/clock.m, scripts/time/datenum.m, scripts/ui/errordlg.m,
scripts/ui/private/message_dialog.m: End m-files with 1 blank line.
author | Rik <rik@octave.org> |
---|---|
date | Wed, 28 Aug 2013 08:33:02 -0700 |
parents | 72c96de7a403 |
children | d63878346099 |
rev | line source |
---|---|
14138
72c96de7a403
maint: update copyright notices for 2012
John W. Eaton <jwe@octave.org>
parents:
12530
diff
changeset
|
1 ## Copyright (C) 1995-2012 Kurt Hornik |
3426 | 2 ## |
3922 | 3 ## This file is part of Octave. |
4 ## | |
5 ## Octave is free software; you can redistribute it and/or modify it | |
6 ## under the terms of the GNU General Public License as published by | |
7016 | 7 ## the Free Software Foundation; either version 3 of the License, or (at |
8 ## your option) any later version. | |
3426 | 9 ## |
3922 | 10 ## Octave is distributed in the hope that it will be useful, but |
3191 | 11 ## WITHOUT ANY WARRANTY; without even the implied warranty of |
12 ## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
3426 | 13 ## General Public License for more details. |
14 ## | |
3191 | 15 ## You should have received a copy of the GNU General Public License |
7016 | 16 ## along with Octave; see the file COPYING. If not, see |
17 ## <http://www.gnu.org/licenses/>. | |
3191 | 18 |
3454 | 19 ## -*- texinfo -*- |
6754 | 20 ## @deftypefn {Function File} {[@var{theta}, @var{beta}, @var{dev}, @var{dl}, @var{d2l}, @var{p}] =} logistic_regression (@var{y}, @var{x}, @var{print}, @var{theta}, @var{beta}) |
3454 | 21 ## Perform ordinal logistic regression. |
3191 | 22 ## |
3454 | 23 ## Suppose @var{y} takes values in @var{k} ordered categories, and let |
24 ## @code{gamma_i (@var{x})} be the cumulative probability that @var{y} | |
25 ## falls in one of the first @var{i} categories given the covariate | |
26 ## @var{x}. Then | |
27 ## | |
28 ## @example | |
29 ## [theta, beta] = logistic_regression (y, x) | |
30 ## @end example | |
31 ## | |
32 ## @noindent | |
3191 | 33 ## fits the model |
3454 | 34 ## |
35 ## @example | |
9051
1bf0ce0930be
Grammar check TexInfo in all .m files
Rik <rdrider0-list@yahoo.com>
parents:
7031
diff
changeset
|
36 ## logit (gamma_i (x)) = theta_i - beta' * x, i = 1 @dots{} k-1 |
3454 | 37 ## @end example |
3191 | 38 ## |
3454 | 39 ## The number of ordinal categories, @var{k}, is taken to be the number |
40 ## of distinct values of @code{round (@var{y})}. If @var{k} equals 2, | |
41 ## @var{y} is binary and the model is ordinary logistic regression. The | |
42 ## matrix @var{x} is assumed to have full column rank. | |
43 ## | |
44 ## Given @var{y} only, @code{theta = logistic_regression (y)} | |
3191 | 45 ## fits the model with baseline logit odds only. |
46 ## | |
47 ## The full form is | |
3454 | 48 ## |
49 ## @example | |
9051
1bf0ce0930be
Grammar check TexInfo in all .m files
Rik <rdrider0-list@yahoo.com>
parents:
7031
diff
changeset
|
50 ## @group |
3454 | 51 ## [theta, beta, dev, dl, d2l, gamma] |
52 ## = logistic_regression (y, x, print, theta, beta) | |
9051
1bf0ce0930be
Grammar check TexInfo in all .m files
Rik <rdrider0-list@yahoo.com>
parents:
7031
diff
changeset
|
53 ## @end group |
3454 | 54 ## @end example |
55 ## | |
56 ## @noindent | |
57 ## in which all output arguments and all input arguments except @var{y} | |
58 ## are optional. | |
3191 | 59 ## |
6754 | 60 ## Setting @var{print} to 1 requests summary information about the fitted |
3454 | 61 ## model to be displayed. Setting @var{print} to 2 requests information |
62 ## about convergence at each iteration. Other values request no | |
63 ## information to be displayed. The input arguments @var{theta} and | |
64 ## @var{beta} give initial estimates for @var{theta} and @var{beta}. | |
65 ## | |
66 ## The returned value @var{dev} holds minus twice the log-likelihood. | |
3191 | 67 ## |
3454 | 68 ## The returned values @var{dl} and @var{d2l} are the vector of first |
69 ## and the matrix of second derivatives of the log-likelihood with | |
70 ## respect to @var{theta} and @var{beta}. | |
3191 | 71 ## |
3454 | 72 ## @var{p} holds estimates for the conditional distribution of @var{y} |
73 ## given @var{x}. | |
74 ## @end deftypefn | |
3191 | 75 |
3426 | 76 ## Original for MATLAB written by Gordon K Smyth <gks@maths.uq.oz.au>, |
3191 | 77 ## U of Queensland, Australia, on Nov 19, 1990. Last revision Aug 3, |
78 ## 1992. | |
79 | |
3456 | 80 ## Author: Gordon K Smyth <gks@maths.uq.oz.au>, |
5428 | 81 ## Adapted-By: KH <Kurt.Hornik@wu-wien.ac.at> |
3456 | 82 ## Description: Ordinal logistic regression |
3191 | 83 |
84 ## Uses the auxiliary functions logistic_regression_derivatives and | |
85 ## logistic_regression_likelihood. | |
86 | |
12530
d70c99028ba3
Make helper functions for logistic_regression private.
Rik <octave@nomad.inbox5.com>
parents:
11523
diff
changeset
|
87 function [theta, beta, dev, dl, d2l, p] = logistic_regression (y, x, print, theta, beta) |
3426 | 88 |
3191 | 89 ## check input |
3426 | 90 y = round (vec (y)); |
91 [my, ny] = size (y); | |
3191 | 92 if (nargin < 2) |
3426 | 93 x = zeros (my, 0); |
3191 | 94 endif; |
3238 | 95 [mx, nx] = size (x); |
3191 | 96 if (mx != my) |
11472
1740012184f9
Use uppercase for variable names in error() strings to match Info documentation. Only m-files done.
Rik <octave@nomad.inbox5.com>
parents:
10635
diff
changeset
|
97 error ("logistic_regression: X and Y must have the same number of observations"); |
3191 | 98 endif |
3426 | 99 |
3191 | 100 ## initial calculations |
101 x = -x; | |
102 tol = 1e-6; incr = 10; decr = 2; | |
103 ymin = min (y); ymax = max (y); yrange = ymax - ymin; | |
104 z = (y * ones (1, yrange)) == ((y * 0 + 1) * (ymin : (ymax - 1))); | |
105 z1 = (y * ones (1, yrange)) == ((y * 0 + 1) * ((ymin + 1) : ymax)); | |
3426 | 106 z = z(:, any (z)); |
107 z1 = z1 (:, any(z1)); | |
3238 | 108 [mz, nz] = size (z); |
3426 | 109 |
3191 | 110 ## starting values |
111 if (nargin < 3) | |
3426 | 112 print = 0; |
3191 | 113 endif; |
3426 | 114 if (nargin < 4) |
115 beta = zeros (nx, 1); | |
3191 | 116 endif; |
3426 | 117 if (nargin < 5) |
118 g = cumsum (sum (z))' ./ my; | |
119 theta = log (g ./ (1 - g)); | |
3191 | 120 endif; |
121 tb = [theta; beta]; | |
122 | |
123 ## likelihood and derivatives at starting values | |
124 [g, g1, p, dev] = logistic_regression_likelihood (y, x, tb, z, z1); | |
125 [dl, d2l] = logistic_regression_derivatives (x, z, z1, g, g1, p); | |
126 epsilon = std (vec (d2l)) / 1000; | |
3426 | 127 |
3191 | 128 ## maximize likelihood using Levenberg modified Newton's method |
129 iter = 0; | |
130 while (abs (dl' * (d2l \ dl) / length (dl)) > tol) | |
131 iter = iter + 1; | |
132 tbold = tb; | |
133 devold = dev; | |
134 tb = tbold - d2l \ dl; | |
135 [g, g1, p, dev] = logistic_regression_likelihood (y, x, tb, z, z1); | |
136 if ((dev - devold) / (dl' * (tb - tbold)) < 0) | |
137 epsilon = epsilon / decr; | |
138 else | |
139 while ((dev - devold) / (dl' * (tb - tbold)) > 0) | |
3426 | 140 epsilon = epsilon * incr; |
3191 | 141 if (epsilon > 1e+15) |
10635
d1978e7364ad
Print name of function in error() string messages.
Rik <octave@nomad.inbox5.com>
parents:
9245
diff
changeset
|
142 error ("logistic_regression: epsilon too large"); |
3191 | 143 endif |
3426 | 144 tb = tbold - (d2l - epsilon * eye (size (d2l))) \ dl; |
145 [g, g1, p, dev] = logistic_regression_likelihood (y, x, tb, z, z1); | |
3191 | 146 disp ("epsilon"); disp (epsilon); |
147 endwhile | |
148 endif | |
149 [dl, d2l] = logistic_regression_derivatives (x, z, z1, g, g1, p); | |
150 if (print == 2) | |
151 disp ("Iteration"); disp (iter); | |
152 disp ("Deviance"); disp (dev); | |
153 disp ("First derivative"); disp (dl'); | |
154 disp ("Eigenvalues of second derivative"); disp (eig (d2l)'); | |
155 endif | |
156 endwhile | |
157 | |
158 ## tidy up output | |
159 | |
160 theta = tb (1 : nz, 1); | |
161 beta = tb ((nz + 1) : (nz + nx), 1); | |
162 | |
163 if (print >= 1) | |
164 printf ("\n"); | |
165 printf ("Logistic Regression Results:\n"); | |
3426 | 166 printf ("\n"); |
3456 | 167 printf ("Number of Iterations: %d\n", iter); |
168 printf ("Deviance: %f\n", dev); | |
3191 | 169 printf ("Parameter Estimates:\n"); |
170 printf (" Theta S.E.\n"); | |
3426 | 171 se = sqrt (diag (inv (-d2l))); |
3191 | 172 for i = 1 : nz |
173 printf (" %8.4f %8.4f\n", tb (i), se (i)); | |
174 endfor | |
175 if (nx > 0) | |
176 printf (" Beta S.E.\n"); | |
177 for i = (nz + 1) : (nz + nx) | |
3426 | 178 printf (" %8.4f %8.4f\n", tb (i), se (i)); |
3191 | 179 endfor |
180 endif | |
181 endif | |
182 | |
183 if (nargout == 6) | |
184 if (nx > 0) | |
185 e = ((x * beta) * ones (1, nz)) + ((y * 0 + 1) * theta'); | |
186 else | |
187 e = (y * 0 + 1) * theta'; | |
188 endif | |
3238 | 189 gamma = diff ([(y * 0), (exp (e) ./ (1 + exp (e))), (y * 0 + 1)]')'; |
3191 | 190 endif |
3426 | 191 |
3191 | 192 endfunction |
17338
1c89599167a6
maint: End m-files with 1 blank line.
Rik <rik@octave.org>
parents:
14138
diff
changeset
|
193 |