Mercurial > hg > octave-nkf
annotate liboctave/floatLU.cc @ 10514:40c58502a78b
improve conversion & copy ctors of sparse matrix
author | Jaroslav Hajek <highegg@gmail.com> |
---|---|
date | Tue, 13 Apr 2010 12:45:24 +0200 |
parents | 12884915a8e4 |
children | 141b3fb5cef7 |
rev | line source |
---|---|
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
1 /* |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
2 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
3 Copyright (C) 1994, 1995, 1996, 1997, 1999, 2002, 2003, 2004, 2005, |
8920 | 4 2007, 2008 John W. Eaton |
9708 | 5 Copyright (C) 2009 VZLU Prague, a.s. |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
6 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
7 This file is part of Octave. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
8 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
9 Octave is free software; you can redistribute it and/or modify it |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
10 under the terms of the GNU General Public License as published by the |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
11 Free Software Foundation; either version 3 of the License, or (at your |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
12 option) any later version. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
13 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
14 Octave is distributed in the hope that it will be useful, but WITHOUT |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
15 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
16 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
17 for more details. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
18 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
19 You should have received a copy of the GNU General Public License |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
20 along with Octave; see the file COPYING. If not, see |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
21 <http://www.gnu.org/licenses/>. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
22 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
23 */ |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
24 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
25 #ifdef HAVE_CONFIG_H |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
26 #include <config.h> |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
27 #endif |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
28 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
29 #include "floatLU.h" |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
30 #include "f77-fcn.h" |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
31 #include "lo-error.h" |
9708 | 32 #include "oct-locbuf.h" |
33 #include "fColVector.h" | |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
34 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
35 // Instantiate the base LU class for the types we need. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
36 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
37 #include <base-lu.h> |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
38 #include <base-lu.cc> |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
39 |
8367
445d27d79f4e
support permutation matrix objects
Jaroslav Hajek <highegg@gmail.com>
parents:
7810
diff
changeset
|
40 template class base_lu <FloatMatrix>; |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
41 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
42 // Define the constructor for this particular derivation. |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
43 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
44 extern "C" |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
45 { |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
46 F77_RET_T |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
47 F77_FUNC (sgetrf, SGETRF) (const octave_idx_type&, const octave_idx_type&, float*, |
10314
07ebe522dac2
untabify liboctave C++ sources
John W. Eaton <jwe@octave.org>
parents:
10158
diff
changeset
|
48 const octave_idx_type&, octave_idx_type*, octave_idx_type&); |
9708 | 49 |
50 #ifdef HAVE_QRUPDATE_LUU | |
51 F77_RET_T | |
52 F77_FUNC (slu1up, SLU1UP) (const octave_idx_type&, const octave_idx_type&, | |
53 float *, const octave_idx_type&, | |
54 float *, const octave_idx_type&, | |
55 float *, float *); | |
56 | |
57 F77_RET_T | |
58 F77_FUNC (slup1up, SLUP1UP) (const octave_idx_type&, const octave_idx_type&, | |
59 float *, const octave_idx_type&, | |
60 float *, const octave_idx_type&, | |
61 octave_idx_type *, const float *, | |
62 const float *, float *); | |
63 #endif | |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
64 } |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
65 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
66 FloatLU::FloatLU (const FloatMatrix& a) |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
67 { |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
68 octave_idx_type a_nr = a.rows (); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
69 octave_idx_type a_nc = a.cols (); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
70 octave_idx_type mn = (a_nr < a_nc ? a_nr : a_nc); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
71 |
10350
12884915a8e4
merge MArray classes & improve Array interface
Jaroslav Hajek <highegg@gmail.com>
parents:
10314
diff
changeset
|
72 ipvt.resize (mn, 1); |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
73 octave_idx_type *pipvt = ipvt.fortran_vec (); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
74 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
75 a_fact = a; |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
76 float *tmp_data = a_fact.fortran_vec (); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
77 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
78 octave_idx_type info = 0; |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
79 |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
80 F77_XFCN (sgetrf, SGETRF, (a_nr, a_nc, tmp_data, a_nr, pipvt, info)); |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
81 |
9694
50db3c5175b5
allow unpacked form of LU
Jaroslav Hajek <highegg@gmail.com>
parents:
8920
diff
changeset
|
82 for (octave_idx_type i = 0; i < mn; i++) |
50db3c5175b5
allow unpacked form of LU
Jaroslav Hajek <highegg@gmail.com>
parents:
8920
diff
changeset
|
83 pipvt[i] -= 1; |
7789
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
84 } |
82be108cc558
First attempt at single precision tyeps
David Bateman <dbateman@free.fr>
parents:
diff
changeset
|
85 |
9708 | 86 #ifdef HAVE_QRUPDATE_LUU |
87 | |
88 void FloatLU::update (const FloatColumnVector& u, const FloatColumnVector& v) | |
89 { | |
90 if (packed ()) | |
91 unpack (); | |
92 | |
93 FloatMatrix& l = l_fact; | |
94 FloatMatrix& r = a_fact; | |
95 | |
96 octave_idx_type m = l.rows (); | |
97 octave_idx_type n = r.columns (); | |
98 octave_idx_type k = l.columns (); | |
99 | |
100 if (u.length () == m && v.length () == n) | |
101 { | |
102 FloatColumnVector utmp = u, vtmp = v; | |
103 F77_XFCN (slu1up, SLU1UP, (m, n, l.fortran_vec (), m, r.fortran_vec (), k, | |
104 utmp.fortran_vec (), vtmp.fortran_vec ())); | |
105 } | |
106 else | |
107 (*current_liboctave_error_handler) ("luupdate: dimensions mismatch"); | |
108 } | |
109 | |
110 void FloatLU::update (const FloatMatrix& u, const FloatMatrix& v) | |
111 { | |
112 if (packed ()) | |
113 unpack (); | |
114 | |
115 FloatMatrix& l = l_fact; | |
116 FloatMatrix& r = a_fact; | |
117 | |
118 octave_idx_type m = l.rows (); | |
119 octave_idx_type n = r.columns (); | |
120 octave_idx_type k = l.columns (); | |
121 | |
122 if (u.rows () == m && v.rows () == n && u.cols () == v.cols ()) | |
123 { | |
124 for (volatile octave_idx_type i = 0; i < u.cols (); i++) | |
125 { | |
126 FloatColumnVector utmp = u.column (i), vtmp = v.column (i); | |
127 F77_XFCN (slu1up, SLU1UP, (m, n, l.fortran_vec (), m, r.fortran_vec (), k, | |
128 utmp.fortran_vec (), vtmp.fortran_vec ())); | |
129 } | |
130 } | |
131 else | |
132 (*current_liboctave_error_handler) ("luupdate: dimensions mismatch"); | |
133 } | |
134 | |
135 void FloatLU::update_piv (const FloatColumnVector& u, const FloatColumnVector& v) | |
136 { | |
137 if (packed ()) | |
138 unpack (); | |
139 | |
140 FloatMatrix& l = l_fact; | |
141 FloatMatrix& r = a_fact; | |
142 | |
143 octave_idx_type m = l.rows (); | |
144 octave_idx_type n = r.columns (); | |
145 octave_idx_type k = l.columns (); | |
146 | |
147 if (u.length () == m && v.length () == n) | |
148 { | |
149 FloatColumnVector utmp = u, vtmp = v; | |
150 OCTAVE_LOCAL_BUFFER (float, w, m); | |
151 for (octave_idx_type i = 0; i < m; i++) ipvt(i) += 1; // increment | |
152 F77_XFCN (slup1up, SLUP1UP, (m, n, l.fortran_vec (), m, r.fortran_vec (), k, | |
153 ipvt.fortran_vec (), utmp.data (), vtmp.data (), w)); | |
154 for (octave_idx_type i = 0; i < m; i++) ipvt(i) -= 1; // decrement | |
155 } | |
156 else | |
157 (*current_liboctave_error_handler) ("luupdate: dimensions mismatch"); | |
158 } | |
159 | |
160 void FloatLU::update_piv (const FloatMatrix& u, const FloatMatrix& v) | |
161 { | |
162 if (packed ()) | |
163 unpack (); | |
164 | |
165 FloatMatrix& l = l_fact; | |
166 FloatMatrix& r = a_fact; | |
167 | |
168 octave_idx_type m = l.rows (); | |
169 octave_idx_type n = r.columns (); | |
170 octave_idx_type k = l.columns (); | |
171 | |
172 if (u.rows () == m && v.rows () == n && u.cols () == v.cols ()) | |
173 { | |
174 OCTAVE_LOCAL_BUFFER (float, w, m); | |
175 for (octave_idx_type i = 0; i < m; i++) ipvt(i) += 1; // increment | |
176 for (volatile octave_idx_type i = 0; i < u.cols (); i++) | |
177 { | |
178 FloatColumnVector utmp = u.column (i), vtmp = v.column (i); | |
179 F77_XFCN (slup1up, SLUP1UP, (m, n, l.fortran_vec (), m, r.fortran_vec (), k, | |
180 ipvt.fortran_vec (), utmp.data (), vtmp.data (), w)); | |
181 } | |
182 for (octave_idx_type i = 0; i < m; i++) ipvt(i) -= 1; // decrement | |
183 } | |
184 else | |
185 (*current_liboctave_error_handler) ("luupdate: dimensions mismatch"); | |
186 } | |
187 | |
188 #else | |
189 | |
190 void FloatLU::update (const FloatColumnVector&, const FloatColumnVector&) | |
191 { | |
192 (*current_liboctave_error_handler) ("luupdate: not available in this version"); | |
193 } | |
194 | |
195 void FloatLU::update (const FloatMatrix&, const FloatMatrix&) | |
196 { | |
197 (*current_liboctave_error_handler) ("luupdate: not available in this version"); | |
198 } | |
199 | |
200 void FloatLU::update_piv (const FloatColumnVector&, const FloatColumnVector&) | |
201 { | |
202 (*current_liboctave_error_handler) ("luupdate: not available in this version"); | |
203 } | |
204 | |
205 void FloatLU::update_piv (const FloatMatrix&, const FloatMatrix&) | |
206 { | |
207 (*current_liboctave_error_handler) ("luupdate: not available in this version"); | |
208 } | |
209 | |
210 #endif |