diff options
Diffstat (limited to 'packages/base/src/Internal')
-rw-r--r-- | packages/base/src/Internal/C/lapack-aux.c | 1686 | ||||
-rw-r--r-- | packages/base/src/Internal/C/lapack-aux.h | 82 | ||||
-rw-r--r-- | packages/base/src/Internal/C/vector-aux.c | 1134 |
3 files changed, 2902 insertions, 0 deletions
diff --git a/packages/base/src/Internal/C/lapack-aux.c b/packages/base/src/Internal/C/lapack-aux.c new file mode 100644 index 0000000..1402050 --- /dev/null +++ b/packages/base/src/Internal/C/lapack-aux.c | |||
@@ -0,0 +1,1686 @@ | |||
1 | #include <stdio.h> | ||
2 | #include <stdlib.h> | ||
3 | #include <string.h> | ||
4 | #include <math.h> | ||
5 | #include <time.h> | ||
6 | #include "lapack-aux.h" | ||
7 | |||
8 | #define MACRO(B) do {B} while (0) | ||
9 | #define ERROR(CODE) MACRO(return CODE;) | ||
10 | #define REQUIRES(COND, CODE) MACRO(if(!(COND)) {ERROR(CODE);}) | ||
11 | |||
12 | #define MIN(A,B) ((A)<(B)?(A):(B)) | ||
13 | #define MAX(A,B) ((A)>(B)?(A):(B)) | ||
14 | |||
15 | // #define DBGL | ||
16 | |||
17 | #ifdef DBGL | ||
18 | #define DEBUGMSG(M) printf("\nLAPACK "M"\n"); | ||
19 | #else | ||
20 | #define DEBUGMSG(M) | ||
21 | #endif | ||
22 | |||
23 | #define OK return 0; | ||
24 | |||
25 | // #ifdef DBGL | ||
26 | // #define DEBUGMSG(M) printf("LAPACK Wrapper "M"\n: "); size_t t0 = time(NULL); | ||
27 | // #define OK MACRO(printf("%ld s\n",time(0)-t0); return 0;); | ||
28 | // #else | ||
29 | // #define DEBUGMSG(M) | ||
30 | // #define OK return 0; | ||
31 | // #endif | ||
32 | |||
33 | #define TRACEMAT(M) {int q; printf(" %d x %d: ",M##r,M##c); \ | ||
34 | for(q=0;q<M##r*M##c;q++) printf("%.1f ",M##p[q]); printf("\n");} | ||
35 | |||
36 | #define CHECK(RES,CODE) MACRO(if(RES) return CODE;) | ||
37 | |||
38 | #define BAD_SIZE 2000 | ||
39 | #define BAD_CODE 2001 | ||
40 | #define MEM 2002 | ||
41 | #define BAD_FILE 2003 | ||
42 | #define SINGULAR 2004 | ||
43 | #define NOCONVER 2005 | ||
44 | #define NODEFPOS 2006 | ||
45 | #define NOSPRTD 2007 | ||
46 | |||
47 | //--------------------------------------- | ||
48 | void asm_finit() { | ||
49 | #ifdef i386 | ||
50 | |||
51 | // asm("finit"); | ||
52 | |||
53 | static unsigned char buf[108]; | ||
54 | asm("FSAVE %0":"=m" (buf)); | ||
55 | |||
56 | #if FPUDEBUG | ||
57 | if(buf[8]!=255 || buf[9]!=255) { // print warning in red | ||
58 | printf("%c[;31mWarning: FPU TAG = %x %x\%c[0m\n",0x1B,buf[8],buf[9],0x1B); | ||
59 | } | ||
60 | #endif | ||
61 | |||
62 | #if NANDEBUG | ||
63 | asm("FRSTOR %0":"=m" (buf)); | ||
64 | #endif | ||
65 | |||
66 | #endif | ||
67 | } | ||
68 | |||
69 | //--------------------------------------- | ||
70 | |||
71 | #if NANDEBUG | ||
72 | |||
73 | #define CHECKNANR(M,msg) \ | ||
74 | { int k; \ | ||
75 | for(k=0; k<(M##r * M##c); k++) { \ | ||
76 | if(M##p[k] != M##p[k]) { \ | ||
77 | printf(msg); \ | ||
78 | TRACEMAT(M) \ | ||
79 | /*exit(1);*/ \ | ||
80 | } \ | ||
81 | } \ | ||
82 | } | ||
83 | |||
84 | #define CHECKNANC(M,msg) \ | ||
85 | { int k; \ | ||
86 | for(k=0; k<(M##r * M##c); k++) { \ | ||
87 | if( M##p[k].r != M##p[k].r \ | ||
88 | || M##p[k].i != M##p[k].i) { \ | ||
89 | printf(msg); \ | ||
90 | /*exit(1);*/ \ | ||
91 | } \ | ||
92 | } \ | ||
93 | } | ||
94 | |||
95 | #else | ||
96 | #define CHECKNANC(M,msg) | ||
97 | #define CHECKNANR(M,msg) | ||
98 | #endif | ||
99 | |||
100 | //--------------------------------------- | ||
101 | |||
102 | //////////////////// real svd //////////////////////////////////// | ||
103 | |||
104 | /* Subroutine */ int dgesvd_(char *jobu, char *jobvt, integer *m, integer *n, | ||
105 | doublereal *a, integer *lda, doublereal *s, doublereal *u, integer * | ||
106 | ldu, doublereal *vt, integer *ldvt, doublereal *work, integer *lwork, | ||
107 | integer *info); | ||
108 | |||
109 | int svd_l_R(KDMAT(a),DMAT(u), DVEC(s),DMAT(v)) { | ||
110 | integer m = ar; | ||
111 | integer n = ac; | ||
112 | integer q = MIN(m,n); | ||
113 | REQUIRES(sn==q,BAD_SIZE); | ||
114 | REQUIRES(up==NULL || (ur==m && (uc==m || uc==q)),BAD_SIZE); | ||
115 | char* jobu = "A"; | ||
116 | if (up==NULL) { | ||
117 | jobu = "N"; | ||
118 | } else { | ||
119 | if (uc==q) { | ||
120 | jobu = "S"; | ||
121 | } | ||
122 | } | ||
123 | REQUIRES(vp==NULL || (vc==n && (vr==n || vr==q)),BAD_SIZE); | ||
124 | char* jobvt = "A"; | ||
125 | integer ldvt = n; | ||
126 | if (vp==NULL) { | ||
127 | jobvt = "N"; | ||
128 | } else { | ||
129 | if (vr==q) { | ||
130 | jobvt = "S"; | ||
131 | ldvt = q; | ||
132 | } | ||
133 | } | ||
134 | DEBUGMSG("svd_l_R"); | ||
135 | double *B = (double*)malloc(m*n*sizeof(double)); | ||
136 | CHECK(!B,MEM); | ||
137 | memcpy(B,ap,m*n*sizeof(double)); | ||
138 | integer lwork = -1; | ||
139 | integer res; | ||
140 | // ask for optimal lwork | ||
141 | double ans; | ||
142 | dgesvd_ (jobu,jobvt, | ||
143 | &m,&n,B,&m, | ||
144 | sp, | ||
145 | up,&m, | ||
146 | vp,&ldvt, | ||
147 | &ans, &lwork, | ||
148 | &res); | ||
149 | lwork = ceil(ans); | ||
150 | double * work = (double*)malloc(lwork*sizeof(double)); | ||
151 | CHECK(!work,MEM); | ||
152 | dgesvd_ (jobu,jobvt, | ||
153 | &m,&n,B,&m, | ||
154 | sp, | ||
155 | up,&m, | ||
156 | vp,&ldvt, | ||
157 | work, &lwork, | ||
158 | &res); | ||
159 | CHECK(res,res); | ||
160 | free(work); | ||
161 | free(B); | ||
162 | OK | ||
163 | } | ||
164 | |||
165 | // (alternative version) | ||
166 | |||
167 | /* Subroutine */ int dgesdd_(char *jobz, integer *m, integer *n, doublereal * | ||
168 | a, integer *lda, doublereal *s, doublereal *u, integer *ldu, | ||
169 | doublereal *vt, integer *ldvt, doublereal *work, integer *lwork, | ||
170 | integer *iwork, integer *info); | ||
171 | |||
172 | int svd_l_Rdd(KDMAT(a),DMAT(u), DVEC(s),DMAT(v)) { | ||
173 | integer m = ar; | ||
174 | integer n = ac; | ||
175 | integer q = MIN(m,n); | ||
176 | REQUIRES(sn==q,BAD_SIZE); | ||
177 | REQUIRES((up == NULL && vp == NULL) | ||
178 | || (ur==m && vc==n | ||
179 | && ((uc == q && vr == q) | ||
180 | || (uc == m && vc==n))),BAD_SIZE); | ||
181 | char* jobz = "A"; | ||
182 | integer ldvt = n; | ||
183 | if (up==NULL) { | ||
184 | jobz = "N"; | ||
185 | } else { | ||
186 | if (uc==q && vr == q) { | ||
187 | jobz = "S"; | ||
188 | ldvt = q; | ||
189 | } | ||
190 | } | ||
191 | DEBUGMSG("svd_l_Rdd"); | ||
192 | double *B = (double*)malloc(m*n*sizeof(double)); | ||
193 | CHECK(!B,MEM); | ||
194 | memcpy(B,ap,m*n*sizeof(double)); | ||
195 | integer* iwk = (integer*) malloc(8*q*sizeof(integer)); | ||
196 | CHECK(!iwk,MEM); | ||
197 | integer lwk = -1; | ||
198 | integer res; | ||
199 | // ask for optimal lwk | ||
200 | double ans; | ||
201 | dgesdd_ (jobz,&m,&n,B,&m,sp,up,&m,vp,&ldvt,&ans,&lwk,iwk,&res); | ||
202 | lwk = ans; | ||
203 | double * workv = (double*)malloc(lwk*sizeof(double)); | ||
204 | CHECK(!workv,MEM); | ||
205 | dgesdd_ (jobz,&m,&n,B,&m,sp,up,&m,vp,&ldvt,workv,&lwk,iwk,&res); | ||
206 | CHECK(res,res); | ||
207 | free(iwk); | ||
208 | free(workv); | ||
209 | free(B); | ||
210 | OK | ||
211 | } | ||
212 | |||
213 | //////////////////// complex svd //////////////////////////////////// | ||
214 | |||
215 | // not in clapack.h | ||
216 | |||
217 | int zgesvd_(char *jobu, char *jobvt, integer *m, integer *n, | ||
218 | doublecomplex *a, integer *lda, doublereal *s, doublecomplex *u, | ||
219 | integer *ldu, doublecomplex *vt, integer *ldvt, doublecomplex *work, | ||
220 | integer *lwork, doublereal *rwork, integer *info); | ||
221 | |||
222 | int svd_l_C(KCMAT(a),CMAT(u), DVEC(s),CMAT(v)) { | ||
223 | integer m = ar; | ||
224 | integer n = ac; | ||
225 | integer q = MIN(m,n); | ||
226 | REQUIRES(sn==q,BAD_SIZE); | ||
227 | REQUIRES(up==NULL || (ur==m && (uc==m || uc==q)),BAD_SIZE); | ||
228 | char* jobu = "A"; | ||
229 | if (up==NULL) { | ||
230 | jobu = "N"; | ||
231 | } else { | ||
232 | if (uc==q) { | ||
233 | jobu = "S"; | ||
234 | } | ||
235 | } | ||
236 | REQUIRES(vp==NULL || (vc==n && (vr==n || vr==q)),BAD_SIZE); | ||
237 | char* jobvt = "A"; | ||
238 | integer ldvt = n; | ||
239 | if (vp==NULL) { | ||
240 | jobvt = "N"; | ||
241 | } else { | ||
242 | if (vr==q) { | ||
243 | jobvt = "S"; | ||
244 | ldvt = q; | ||
245 | } | ||
246 | }DEBUGMSG("svd_l_C"); | ||
247 | doublecomplex *B = (doublecomplex*)malloc(m*n*sizeof(doublecomplex)); | ||
248 | CHECK(!B,MEM); | ||
249 | memcpy(B,ap,m*n*sizeof(doublecomplex)); | ||
250 | |||
251 | double *rwork = (double*) malloc(5*q*sizeof(double)); | ||
252 | CHECK(!rwork,MEM); | ||
253 | integer lwork = -1; | ||
254 | integer res; | ||
255 | // ask for optimal lwork | ||
256 | doublecomplex ans; | ||
257 | zgesvd_ (jobu,jobvt, | ||
258 | &m,&n,B,&m, | ||
259 | sp, | ||
260 | up,&m, | ||
261 | vp,&ldvt, | ||
262 | &ans, &lwork, | ||
263 | rwork, | ||
264 | &res); | ||
265 | lwork = ceil(ans.r); | ||
266 | doublecomplex * work = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
267 | CHECK(!work,MEM); | ||
268 | zgesvd_ (jobu,jobvt, | ||
269 | &m,&n,B,&m, | ||
270 | sp, | ||
271 | up,&m, | ||
272 | vp,&ldvt, | ||
273 | work, &lwork, | ||
274 | rwork, | ||
275 | &res); | ||
276 | CHECK(res,res); | ||
277 | free(work); | ||
278 | free(rwork); | ||
279 | free(B); | ||
280 | OK | ||
281 | } | ||
282 | |||
283 | int zgesdd_ (char *jobz, integer *m, integer *n, | ||
284 | doublecomplex *a, integer *lda, doublereal *s, doublecomplex *u, | ||
285 | integer *ldu, doublecomplex *vt, integer *ldvt, doublecomplex *work, | ||
286 | integer *lwork, doublereal *rwork, integer* iwork, integer *info); | ||
287 | |||
288 | int svd_l_Cdd(KCMAT(a),CMAT(u), DVEC(s),CMAT(v)) { | ||
289 | //printf("entro\n"); | ||
290 | integer m = ar; | ||
291 | integer n = ac; | ||
292 | integer q = MIN(m,n); | ||
293 | REQUIRES(sn==q,BAD_SIZE); | ||
294 | REQUIRES((up == NULL && vp == NULL) | ||
295 | || (ur==m && vc==n | ||
296 | && ((uc == q && vr == q) | ||
297 | || (uc == m && vc==n))),BAD_SIZE); | ||
298 | char* jobz = "A"; | ||
299 | integer ldvt = n; | ||
300 | if (up==NULL) { | ||
301 | jobz = "N"; | ||
302 | } else { | ||
303 | if (uc==q && vr == q) { | ||
304 | jobz = "S"; | ||
305 | ldvt = q; | ||
306 | } | ||
307 | } | ||
308 | DEBUGMSG("svd_l_Cdd"); | ||
309 | doublecomplex *B = (doublecomplex*)malloc(m*n*sizeof(doublecomplex)); | ||
310 | CHECK(!B,MEM); | ||
311 | memcpy(B,ap,m*n*sizeof(doublecomplex)); | ||
312 | integer* iwk = (integer*) malloc(8*q*sizeof(integer)); | ||
313 | CHECK(!iwk,MEM); | ||
314 | int lrwk; | ||
315 | if (0 && *jobz == 'N') { | ||
316 | lrwk = 5*q; // does not work, crash at free below | ||
317 | } else { | ||
318 | lrwk = 5*q*q + 7*q; | ||
319 | } | ||
320 | double *rwk = (double*)malloc(lrwk*sizeof(double));; | ||
321 | CHECK(!rwk,MEM); | ||
322 | //printf("%s %ld %d\n",jobz,q,lrwk); | ||
323 | integer lwk = -1; | ||
324 | integer res; | ||
325 | // ask for optimal lwk | ||
326 | doublecomplex ans; | ||
327 | zgesdd_ (jobz,&m,&n,B,&m,sp,up,&m,vp,&ldvt,&ans,&lwk,rwk,iwk,&res); | ||
328 | lwk = ans.r; | ||
329 | //printf("lwk = %ld\n",lwk); | ||
330 | doublecomplex * workv = (doublecomplex*)malloc(lwk*sizeof(doublecomplex)); | ||
331 | CHECK(!workv,MEM); | ||
332 | zgesdd_ (jobz,&m,&n,B,&m,sp,up,&m,vp,&ldvt,workv,&lwk,rwk,iwk,&res); | ||
333 | //printf("res = %ld\n",res); | ||
334 | CHECK(res,res); | ||
335 | free(workv); // printf("freed workv\n"); | ||
336 | free(rwk); // printf("freed rwk\n"); | ||
337 | free(iwk); // printf("freed iwk\n"); | ||
338 | free(B); // printf("freed B, salgo\n"); | ||
339 | OK | ||
340 | } | ||
341 | |||
342 | //////////////////// general complex eigensystem //////////// | ||
343 | |||
344 | /* Subroutine */ int zgeev_(char *jobvl, char *jobvr, integer *n, | ||
345 | doublecomplex *a, integer *lda, doublecomplex *w, doublecomplex *vl, | ||
346 | integer *ldvl, doublecomplex *vr, integer *ldvr, doublecomplex *work, | ||
347 | integer *lwork, doublereal *rwork, integer *info); | ||
348 | |||
349 | int eig_l_C(KCMAT(a), CMAT(u), CVEC(s),CMAT(v)) { | ||
350 | integer n = ar; | ||
351 | REQUIRES(ac==n && sn==n, BAD_SIZE); | ||
352 | REQUIRES(up==NULL || (ur==n && uc==n), BAD_SIZE); | ||
353 | char jobvl = up==NULL?'N':'V'; | ||
354 | REQUIRES(vp==NULL || (vr==n && vc==n), BAD_SIZE); | ||
355 | char jobvr = vp==NULL?'N':'V'; | ||
356 | DEBUGMSG("eig_l_C"); | ||
357 | doublecomplex *B = (doublecomplex*)malloc(n*n*sizeof(doublecomplex)); | ||
358 | CHECK(!B,MEM); | ||
359 | memcpy(B,ap,n*n*sizeof(doublecomplex)); | ||
360 | double *rwork = (double*) malloc(2*n*sizeof(double)); | ||
361 | CHECK(!rwork,MEM); | ||
362 | integer lwork = -1; | ||
363 | integer res; | ||
364 | // ask for optimal lwork | ||
365 | doublecomplex ans; | ||
366 | //printf("ask zgeev\n"); | ||
367 | zgeev_ (&jobvl,&jobvr, | ||
368 | &n,B,&n, | ||
369 | sp, | ||
370 | up,&n, | ||
371 | vp,&n, | ||
372 | &ans, &lwork, | ||
373 | rwork, | ||
374 | &res); | ||
375 | lwork = ceil(ans.r); | ||
376 | //printf("ans = %d\n",lwork); | ||
377 | doublecomplex * work = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
378 | CHECK(!work,MEM); | ||
379 | //printf("zgeev\n"); | ||
380 | zgeev_ (&jobvl,&jobvr, | ||
381 | &n,B,&n, | ||
382 | sp, | ||
383 | up,&n, | ||
384 | vp,&n, | ||
385 | work, &lwork, | ||
386 | rwork, | ||
387 | &res); | ||
388 | CHECK(res,res); | ||
389 | free(work); | ||
390 | free(rwork); | ||
391 | free(B); | ||
392 | OK | ||
393 | } | ||
394 | |||
395 | |||
396 | |||
397 | //////////////////// general real eigensystem //////////// | ||
398 | |||
399 | /* Subroutine */ int dgeev_(char *jobvl, char *jobvr, integer *n, doublereal * | ||
400 | a, integer *lda, doublereal *wr, doublereal *wi, doublereal *vl, | ||
401 | integer *ldvl, doublereal *vr, integer *ldvr, doublereal *work, | ||
402 | integer *lwork, integer *info); | ||
403 | |||
404 | int eig_l_R(KDMAT(a),DMAT(u), CVEC(s),DMAT(v)) { | ||
405 | integer n = ar; | ||
406 | REQUIRES(ac==n && sn==n, BAD_SIZE); | ||
407 | REQUIRES(up==NULL || (ur==n && uc==n), BAD_SIZE); | ||
408 | char jobvl = up==NULL?'N':'V'; | ||
409 | REQUIRES(vp==NULL || (vr==n && vc==n), BAD_SIZE); | ||
410 | char jobvr = vp==NULL?'N':'V'; | ||
411 | DEBUGMSG("eig_l_R"); | ||
412 | double *B = (double*)malloc(n*n*sizeof(double)); | ||
413 | CHECK(!B,MEM); | ||
414 | memcpy(B,ap,n*n*sizeof(double)); | ||
415 | integer lwork = -1; | ||
416 | integer res; | ||
417 | // ask for optimal lwork | ||
418 | double ans; | ||
419 | //printf("ask dgeev\n"); | ||
420 | dgeev_ (&jobvl,&jobvr, | ||
421 | &n,B,&n, | ||
422 | (double*)sp, (double*)sp+n, | ||
423 | up,&n, | ||
424 | vp,&n, | ||
425 | &ans, &lwork, | ||
426 | &res); | ||
427 | lwork = ceil(ans); | ||
428 | //printf("ans = %d\n",lwork); | ||
429 | double * work = (double*)malloc(lwork*sizeof(double)); | ||
430 | CHECK(!work,MEM); | ||
431 | //printf("dgeev\n"); | ||
432 | dgeev_ (&jobvl,&jobvr, | ||
433 | &n,B,&n, | ||
434 | (double*)sp, (double*)sp+n, | ||
435 | up,&n, | ||
436 | vp,&n, | ||
437 | work, &lwork, | ||
438 | &res); | ||
439 | CHECK(res,res); | ||
440 | free(work); | ||
441 | free(B); | ||
442 | OK | ||
443 | } | ||
444 | |||
445 | |||
446 | //////////////////// symmetric real eigensystem //////////// | ||
447 | |||
448 | /* Subroutine */ int dsyev_(char *jobz, char *uplo, integer *n, doublereal *a, | ||
449 | integer *lda, doublereal *w, doublereal *work, integer *lwork, | ||
450 | integer *info); | ||
451 | |||
452 | int eig_l_S(int wantV,KDMAT(a),DVEC(s),DMAT(v)) { | ||
453 | integer n = ar; | ||
454 | REQUIRES(ac==n && sn==n, BAD_SIZE); | ||
455 | REQUIRES(vr==n && vc==n, BAD_SIZE); | ||
456 | char jobz = wantV?'V':'N'; | ||
457 | DEBUGMSG("eig_l_S"); | ||
458 | memcpy(vp,ap,n*n*sizeof(double)); | ||
459 | integer lwork = -1; | ||
460 | char uplo = 'U'; | ||
461 | integer res; | ||
462 | // ask for optimal lwork | ||
463 | double ans; | ||
464 | //printf("ask dsyev\n"); | ||
465 | dsyev_ (&jobz,&uplo, | ||
466 | &n,vp,&n, | ||
467 | sp, | ||
468 | &ans, &lwork, | ||
469 | &res); | ||
470 | lwork = ceil(ans); | ||
471 | //printf("ans = %d\n",lwork); | ||
472 | double * work = (double*)malloc(lwork*sizeof(double)); | ||
473 | CHECK(!work,MEM); | ||
474 | dsyev_ (&jobz,&uplo, | ||
475 | &n,vp,&n, | ||
476 | sp, | ||
477 | work, &lwork, | ||
478 | &res); | ||
479 | CHECK(res,res); | ||
480 | free(work); | ||
481 | OK | ||
482 | } | ||
483 | |||
484 | //////////////////// hermitian complex eigensystem //////////// | ||
485 | |||
486 | /* Subroutine */ int zheev_(char *jobz, char *uplo, integer *n, doublecomplex | ||
487 | *a, integer *lda, doublereal *w, doublecomplex *work, integer *lwork, | ||
488 | doublereal *rwork, integer *info); | ||
489 | |||
490 | int eig_l_H(int wantV,KCMAT(a),DVEC(s),CMAT(v)) { | ||
491 | integer n = ar; | ||
492 | REQUIRES(ac==n && sn==n, BAD_SIZE); | ||
493 | REQUIRES(vr==n && vc==n, BAD_SIZE); | ||
494 | char jobz = wantV?'V':'N'; | ||
495 | DEBUGMSG("eig_l_H"); | ||
496 | memcpy(vp,ap,2*n*n*sizeof(double)); | ||
497 | double *rwork = (double*) malloc((3*n-2)*sizeof(double)); | ||
498 | CHECK(!rwork,MEM); | ||
499 | integer lwork = -1; | ||
500 | char uplo = 'U'; | ||
501 | integer res; | ||
502 | // ask for optimal lwork | ||
503 | doublecomplex ans; | ||
504 | //printf("ask zheev\n"); | ||
505 | zheev_ (&jobz,&uplo, | ||
506 | &n,vp,&n, | ||
507 | sp, | ||
508 | &ans, &lwork, | ||
509 | rwork, | ||
510 | &res); | ||
511 | lwork = ceil(ans.r); | ||
512 | //printf("ans = %d\n",lwork); | ||
513 | doublecomplex * work = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
514 | CHECK(!work,MEM); | ||
515 | zheev_ (&jobz,&uplo, | ||
516 | &n,vp,&n, | ||
517 | sp, | ||
518 | work, &lwork, | ||
519 | rwork, | ||
520 | &res); | ||
521 | CHECK(res,res); | ||
522 | free(work); | ||
523 | free(rwork); | ||
524 | OK | ||
525 | } | ||
526 | |||
527 | //////////////////// general real linear system //////////// | ||
528 | |||
529 | /* Subroutine */ int dgesv_(integer *n, integer *nrhs, doublereal *a, integer | ||
530 | *lda, integer *ipiv, doublereal *b, integer *ldb, integer *info); | ||
531 | |||
532 | int linearSolveR_l(KDMAT(a),KDMAT(b),DMAT(x)) { | ||
533 | integer n = ar; | ||
534 | integer nhrs = bc; | ||
535 | REQUIRES(n>=1 && ar==ac && ar==br,BAD_SIZE); | ||
536 | DEBUGMSG("linearSolveR_l"); | ||
537 | double*AC = (double*)malloc(n*n*sizeof(double)); | ||
538 | memcpy(AC,ap,n*n*sizeof(double)); | ||
539 | memcpy(xp,bp,n*nhrs*sizeof(double)); | ||
540 | integer * ipiv = (integer*)malloc(n*sizeof(integer)); | ||
541 | integer res; | ||
542 | dgesv_ (&n,&nhrs, | ||
543 | AC, &n, | ||
544 | ipiv, | ||
545 | xp, &n, | ||
546 | &res); | ||
547 | if(res>0) { | ||
548 | return SINGULAR; | ||
549 | } | ||
550 | CHECK(res,res); | ||
551 | free(ipiv); | ||
552 | free(AC); | ||
553 | OK | ||
554 | } | ||
555 | |||
556 | //////////////////// general complex linear system //////////// | ||
557 | |||
558 | /* Subroutine */ int zgesv_(integer *n, integer *nrhs, doublecomplex *a, | ||
559 | integer *lda, integer *ipiv, doublecomplex *b, integer *ldb, integer * | ||
560 | info); | ||
561 | |||
562 | int linearSolveC_l(KCMAT(a),KCMAT(b),CMAT(x)) { | ||
563 | integer n = ar; | ||
564 | integer nhrs = bc; | ||
565 | REQUIRES(n>=1 && ar==ac && ar==br,BAD_SIZE); | ||
566 | DEBUGMSG("linearSolveC_l"); | ||
567 | doublecomplex*AC = (doublecomplex*)malloc(n*n*sizeof(doublecomplex)); | ||
568 | memcpy(AC,ap,n*n*sizeof(doublecomplex)); | ||
569 | memcpy(xp,bp,n*nhrs*sizeof(doublecomplex)); | ||
570 | integer * ipiv = (integer*)malloc(n*sizeof(integer)); | ||
571 | integer res; | ||
572 | zgesv_ (&n,&nhrs, | ||
573 | AC, &n, | ||
574 | ipiv, | ||
575 | xp, &n, | ||
576 | &res); | ||
577 | if(res>0) { | ||
578 | return SINGULAR; | ||
579 | } | ||
580 | CHECK(res,res); | ||
581 | free(ipiv); | ||
582 | free(AC); | ||
583 | OK | ||
584 | } | ||
585 | |||
586 | //////// symmetric positive definite real linear system using Cholesky //////////// | ||
587 | |||
588 | /* Subroutine */ int dpotrs_(char *uplo, integer *n, integer *nrhs, | ||
589 | doublereal *a, integer *lda, doublereal *b, integer *ldb, integer * | ||
590 | info); | ||
591 | |||
592 | int cholSolveR_l(KDMAT(a),KDMAT(b),DMAT(x)) { | ||
593 | integer n = ar; | ||
594 | integer nhrs = bc; | ||
595 | REQUIRES(n>=1 && ar==ac && ar==br,BAD_SIZE); | ||
596 | DEBUGMSG("cholSolveR_l"); | ||
597 | memcpy(xp,bp,n*nhrs*sizeof(double)); | ||
598 | integer res; | ||
599 | dpotrs_ ("U", | ||
600 | &n,&nhrs, | ||
601 | (double*)ap, &n, | ||
602 | xp, &n, | ||
603 | &res); | ||
604 | CHECK(res,res); | ||
605 | OK | ||
606 | } | ||
607 | |||
608 | //////// Hermitian positive definite real linear system using Cholesky //////////// | ||
609 | |||
610 | /* Subroutine */ int zpotrs_(char *uplo, integer *n, integer *nrhs, | ||
611 | doublecomplex *a, integer *lda, doublecomplex *b, integer *ldb, | ||
612 | integer *info); | ||
613 | |||
614 | int cholSolveC_l(KCMAT(a),KCMAT(b),CMAT(x)) { | ||
615 | integer n = ar; | ||
616 | integer nhrs = bc; | ||
617 | REQUIRES(n>=1 && ar==ac && ar==br,BAD_SIZE); | ||
618 | DEBUGMSG("cholSolveC_l"); | ||
619 | memcpy(xp,bp,n*nhrs*sizeof(doublecomplex)); | ||
620 | integer res; | ||
621 | zpotrs_ ("U", | ||
622 | &n,&nhrs, | ||
623 | (doublecomplex*)ap, &n, | ||
624 | xp, &n, | ||
625 | &res); | ||
626 | CHECK(res,res); | ||
627 | OK | ||
628 | } | ||
629 | |||
630 | //////////////////// least squares real linear system //////////// | ||
631 | |||
632 | /* Subroutine */ int dgels_(char *trans, integer *m, integer *n, integer * | ||
633 | nrhs, doublereal *a, integer *lda, doublereal *b, integer *ldb, | ||
634 | doublereal *work, integer *lwork, integer *info); | ||
635 | |||
636 | int linearSolveLSR_l(KDMAT(a),KDMAT(b),DMAT(x)) { | ||
637 | integer m = ar; | ||
638 | integer n = ac; | ||
639 | integer nrhs = bc; | ||
640 | integer ldb = xr; | ||
641 | REQUIRES(m>=1 && n>=1 && ar==br && xr==MAX(m,n) && xc == bc, BAD_SIZE); | ||
642 | DEBUGMSG("linearSolveLSR_l"); | ||
643 | double*AC = (double*)malloc(m*n*sizeof(double)); | ||
644 | memcpy(AC,ap,m*n*sizeof(double)); | ||
645 | if (m>=n) { | ||
646 | memcpy(xp,bp,m*nrhs*sizeof(double)); | ||
647 | } else { | ||
648 | int k; | ||
649 | for(k = 0; k<nrhs; k++) { | ||
650 | memcpy(xp+ldb*k,bp+m*k,m*sizeof(double)); | ||
651 | } | ||
652 | } | ||
653 | integer res; | ||
654 | integer lwork = -1; | ||
655 | double ans; | ||
656 | dgels_ ("N",&m,&n,&nrhs, | ||
657 | AC,&m, | ||
658 | xp,&ldb, | ||
659 | &ans,&lwork, | ||
660 | &res); | ||
661 | lwork = ceil(ans); | ||
662 | //printf("ans = %d\n",lwork); | ||
663 | double * work = (double*)malloc(lwork*sizeof(double)); | ||
664 | dgels_ ("N",&m,&n,&nrhs, | ||
665 | AC,&m, | ||
666 | xp,&ldb, | ||
667 | work,&lwork, | ||
668 | &res); | ||
669 | if(res>0) { | ||
670 | return SINGULAR; | ||
671 | } | ||
672 | CHECK(res,res); | ||
673 | free(work); | ||
674 | free(AC); | ||
675 | OK | ||
676 | } | ||
677 | |||
678 | //////////////////// least squares complex linear system //////////// | ||
679 | |||
680 | /* Subroutine */ int zgels_(char *trans, integer *m, integer *n, integer * | ||
681 | nrhs, doublecomplex *a, integer *lda, doublecomplex *b, integer *ldb, | ||
682 | doublecomplex *work, integer *lwork, integer *info); | ||
683 | |||
684 | int linearSolveLSC_l(KCMAT(a),KCMAT(b),CMAT(x)) { | ||
685 | integer m = ar; | ||
686 | integer n = ac; | ||
687 | integer nrhs = bc; | ||
688 | integer ldb = xr; | ||
689 | REQUIRES(m>=1 && n>=1 && ar==br && xr==MAX(m,n) && xc == bc, BAD_SIZE); | ||
690 | DEBUGMSG("linearSolveLSC_l"); | ||
691 | doublecomplex*AC = (doublecomplex*)malloc(m*n*sizeof(doublecomplex)); | ||
692 | memcpy(AC,ap,m*n*sizeof(doublecomplex)); | ||
693 | if (m>=n) { | ||
694 | memcpy(xp,bp,m*nrhs*sizeof(doublecomplex)); | ||
695 | } else { | ||
696 | int k; | ||
697 | for(k = 0; k<nrhs; k++) { | ||
698 | memcpy(xp+ldb*k,bp+m*k,m*sizeof(doublecomplex)); | ||
699 | } | ||
700 | } | ||
701 | integer res; | ||
702 | integer lwork = -1; | ||
703 | doublecomplex ans; | ||
704 | zgels_ ("N",&m,&n,&nrhs, | ||
705 | AC,&m, | ||
706 | xp,&ldb, | ||
707 | &ans,&lwork, | ||
708 | &res); | ||
709 | lwork = ceil(ans.r); | ||
710 | //printf("ans = %d\n",lwork); | ||
711 | doublecomplex * work = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
712 | zgels_ ("N",&m,&n,&nrhs, | ||
713 | AC,&m, | ||
714 | xp,&ldb, | ||
715 | work,&lwork, | ||
716 | &res); | ||
717 | if(res>0) { | ||
718 | return SINGULAR; | ||
719 | } | ||
720 | CHECK(res,res); | ||
721 | free(work); | ||
722 | free(AC); | ||
723 | OK | ||
724 | } | ||
725 | |||
726 | //////////////////// least squares real linear system using SVD //////////// | ||
727 | |||
728 | /* Subroutine */ int dgelss_(integer *m, integer *n, integer *nrhs, | ||
729 | doublereal *a, integer *lda, doublereal *b, integer *ldb, doublereal * | ||
730 | s, doublereal *rcond, integer *rank, doublereal *work, integer *lwork, | ||
731 | integer *info); | ||
732 | |||
733 | int linearSolveSVDR_l(double rcond,KDMAT(a),KDMAT(b),DMAT(x)) { | ||
734 | integer m = ar; | ||
735 | integer n = ac; | ||
736 | integer nrhs = bc; | ||
737 | integer ldb = xr; | ||
738 | REQUIRES(m>=1 && n>=1 && ar==br && xr==MAX(m,n) && xc == bc, BAD_SIZE); | ||
739 | DEBUGMSG("linearSolveSVDR_l"); | ||
740 | double*AC = (double*)malloc(m*n*sizeof(double)); | ||
741 | double*S = (double*)malloc(MIN(m,n)*sizeof(double)); | ||
742 | memcpy(AC,ap,m*n*sizeof(double)); | ||
743 | if (m>=n) { | ||
744 | memcpy(xp,bp,m*nrhs*sizeof(double)); | ||
745 | } else { | ||
746 | int k; | ||
747 | for(k = 0; k<nrhs; k++) { | ||
748 | memcpy(xp+ldb*k,bp+m*k,m*sizeof(double)); | ||
749 | } | ||
750 | } | ||
751 | integer res; | ||
752 | integer lwork = -1; | ||
753 | integer rank; | ||
754 | double ans; | ||
755 | dgelss_ (&m,&n,&nrhs, | ||
756 | AC,&m, | ||
757 | xp,&ldb, | ||
758 | S, | ||
759 | &rcond,&rank, | ||
760 | &ans,&lwork, | ||
761 | &res); | ||
762 | lwork = ceil(ans); | ||
763 | //printf("ans = %d\n",lwork); | ||
764 | double * work = (double*)malloc(lwork*sizeof(double)); | ||
765 | dgelss_ (&m,&n,&nrhs, | ||
766 | AC,&m, | ||
767 | xp,&ldb, | ||
768 | S, | ||
769 | &rcond,&rank, | ||
770 | work,&lwork, | ||
771 | &res); | ||
772 | if(res>0) { | ||
773 | return NOCONVER; | ||
774 | } | ||
775 | CHECK(res,res); | ||
776 | free(work); | ||
777 | free(S); | ||
778 | free(AC); | ||
779 | OK | ||
780 | } | ||
781 | |||
782 | //////////////////// least squares complex linear system using SVD //////////// | ||
783 | |||
784 | // not in clapack.h | ||
785 | |||
786 | int zgelss_(integer *m, integer *n, integer *nhrs, | ||
787 | doublecomplex *a, integer *lda, doublecomplex *b, integer *ldb, doublereal *s, | ||
788 | doublereal *rcond, integer* rank, | ||
789 | doublecomplex *work, integer* lwork, doublereal* rwork, | ||
790 | integer *info); | ||
791 | |||
792 | int linearSolveSVDC_l(double rcond, KCMAT(a),KCMAT(b),CMAT(x)) { | ||
793 | integer m = ar; | ||
794 | integer n = ac; | ||
795 | integer nrhs = bc; | ||
796 | integer ldb = xr; | ||
797 | REQUIRES(m>=1 && n>=1 && ar==br && xr==MAX(m,n) && xc == bc, BAD_SIZE); | ||
798 | DEBUGMSG("linearSolveSVDC_l"); | ||
799 | doublecomplex*AC = (doublecomplex*)malloc(m*n*sizeof(doublecomplex)); | ||
800 | double*S = (double*)malloc(MIN(m,n)*sizeof(double)); | ||
801 | double*RWORK = (double*)malloc(5*MIN(m,n)*sizeof(double)); | ||
802 | memcpy(AC,ap,m*n*sizeof(doublecomplex)); | ||
803 | if (m>=n) { | ||
804 | memcpy(xp,bp,m*nrhs*sizeof(doublecomplex)); | ||
805 | } else { | ||
806 | int k; | ||
807 | for(k = 0; k<nrhs; k++) { | ||
808 | memcpy(xp+ldb*k,bp+m*k,m*sizeof(doublecomplex)); | ||
809 | } | ||
810 | } | ||
811 | integer res; | ||
812 | integer lwork = -1; | ||
813 | integer rank; | ||
814 | doublecomplex ans; | ||
815 | zgelss_ (&m,&n,&nrhs, | ||
816 | AC,&m, | ||
817 | xp,&ldb, | ||
818 | S, | ||
819 | &rcond,&rank, | ||
820 | &ans,&lwork, | ||
821 | RWORK, | ||
822 | &res); | ||
823 | lwork = ceil(ans.r); | ||
824 | //printf("ans = %d\n",lwork); | ||
825 | doublecomplex * work = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
826 | zgelss_ (&m,&n,&nrhs, | ||
827 | AC,&m, | ||
828 | xp,&ldb, | ||
829 | S, | ||
830 | &rcond,&rank, | ||
831 | work,&lwork, | ||
832 | RWORK, | ||
833 | &res); | ||
834 | if(res>0) { | ||
835 | return NOCONVER; | ||
836 | } | ||
837 | CHECK(res,res); | ||
838 | free(work); | ||
839 | free(RWORK); | ||
840 | free(S); | ||
841 | free(AC); | ||
842 | OK | ||
843 | } | ||
844 | |||
845 | //////////////////// Cholesky factorization ///////////////////////// | ||
846 | |||
847 | /* Subroutine */ int zpotrf_(char *uplo, integer *n, doublecomplex *a, | ||
848 | integer *lda, integer *info); | ||
849 | |||
850 | int chol_l_H(KCMAT(a),CMAT(l)) { | ||
851 | integer n = ar; | ||
852 | REQUIRES(n>=1 && ac == n && lr==n && lc==n,BAD_SIZE); | ||
853 | DEBUGMSG("chol_l_H"); | ||
854 | memcpy(lp,ap,n*n*sizeof(doublecomplex)); | ||
855 | char uplo = 'U'; | ||
856 | integer res; | ||
857 | zpotrf_ (&uplo,&n,lp,&n,&res); | ||
858 | CHECK(res>0,NODEFPOS); | ||
859 | CHECK(res,res); | ||
860 | doublecomplex zero = {0.,0.}; | ||
861 | int r,c; | ||
862 | for (r=0; r<lr-1; r++) { | ||
863 | for(c=r+1; c<lc; c++) { | ||
864 | lp[r*lc+c] = zero; | ||
865 | } | ||
866 | } | ||
867 | OK | ||
868 | } | ||
869 | |||
870 | |||
871 | /* Subroutine */ int dpotrf_(char *uplo, integer *n, doublereal *a, integer * | ||
872 | lda, integer *info); | ||
873 | |||
874 | int chol_l_S(KDMAT(a),DMAT(l)) { | ||
875 | integer n = ar; | ||
876 | REQUIRES(n>=1 && ac == n && lr==n && lc==n,BAD_SIZE); | ||
877 | DEBUGMSG("chol_l_S"); | ||
878 | memcpy(lp,ap,n*n*sizeof(double)); | ||
879 | char uplo = 'U'; | ||
880 | integer res; | ||
881 | dpotrf_ (&uplo,&n,lp,&n,&res); | ||
882 | CHECK(res>0,NODEFPOS); | ||
883 | CHECK(res,res); | ||
884 | int r,c; | ||
885 | for (r=0; r<lr-1; r++) { | ||
886 | for(c=r+1; c<lc; c++) { | ||
887 | lp[r*lc+c] = 0.; | ||
888 | } | ||
889 | } | ||
890 | OK | ||
891 | } | ||
892 | |||
893 | //////////////////// QR factorization ///////////////////////// | ||
894 | |||
895 | /* Subroutine */ int dgeqr2_(integer *m, integer *n, doublereal *a, integer * | ||
896 | lda, doublereal *tau, doublereal *work, integer *info); | ||
897 | |||
898 | int qr_l_R(KDMAT(a), DVEC(tau), DMAT(r)) { | ||
899 | integer m = ar; | ||
900 | integer n = ac; | ||
901 | integer mn = MIN(m,n); | ||
902 | REQUIRES(m>=1 && n >=1 && rr== m && rc == n && taun == mn, BAD_SIZE); | ||
903 | DEBUGMSG("qr_l_R"); | ||
904 | double *WORK = (double*)malloc(n*sizeof(double)); | ||
905 | CHECK(!WORK,MEM); | ||
906 | memcpy(rp,ap,m*n*sizeof(double)); | ||
907 | integer res; | ||
908 | dgeqr2_ (&m,&n,rp,&m,taup,WORK,&res); | ||
909 | CHECK(res,res); | ||
910 | free(WORK); | ||
911 | OK | ||
912 | } | ||
913 | |||
914 | /* Subroutine */ int zgeqr2_(integer *m, integer *n, doublecomplex *a, | ||
915 | integer *lda, doublecomplex *tau, doublecomplex *work, integer *info); | ||
916 | |||
917 | int qr_l_C(KCMAT(a), CVEC(tau), CMAT(r)) { | ||
918 | integer m = ar; | ||
919 | integer n = ac; | ||
920 | integer mn = MIN(m,n); | ||
921 | REQUIRES(m>=1 && n >=1 && rr== m && rc == n && taun == mn, BAD_SIZE); | ||
922 | DEBUGMSG("qr_l_C"); | ||
923 | doublecomplex *WORK = (doublecomplex*)malloc(n*sizeof(doublecomplex)); | ||
924 | CHECK(!WORK,MEM); | ||
925 | memcpy(rp,ap,m*n*sizeof(doublecomplex)); | ||
926 | integer res; | ||
927 | zgeqr2_ (&m,&n,rp,&m,taup,WORK,&res); | ||
928 | CHECK(res,res); | ||
929 | free(WORK); | ||
930 | OK | ||
931 | } | ||
932 | |||
933 | /* Subroutine */ int dorgqr_(integer *m, integer *n, integer *k, doublereal * | ||
934 | a, integer *lda, doublereal *tau, doublereal *work, integer *lwork, | ||
935 | integer *info); | ||
936 | |||
937 | int c_dorgqr(KDMAT(a), KDVEC(tau), DMAT(r)) { | ||
938 | integer m = ar; | ||
939 | integer n = MIN(ac,ar); | ||
940 | integer k = taun; | ||
941 | DEBUGMSG("c_dorgqr"); | ||
942 | integer lwork = 8*n; // FIXME | ||
943 | double *WORK = (double*)malloc(lwork*sizeof(double)); | ||
944 | CHECK(!WORK,MEM); | ||
945 | memcpy(rp,ap,m*k*sizeof(double)); | ||
946 | integer res; | ||
947 | dorgqr_ (&m,&n,&k,rp,&m,(double*)taup,WORK,&lwork,&res); | ||
948 | CHECK(res,res); | ||
949 | free(WORK); | ||
950 | OK | ||
951 | } | ||
952 | |||
953 | /* Subroutine */ int zungqr_(integer *m, integer *n, integer *k, | ||
954 | doublecomplex *a, integer *lda, doublecomplex *tau, doublecomplex * | ||
955 | work, integer *lwork, integer *info); | ||
956 | |||
957 | int c_zungqr(KCMAT(a), KCVEC(tau), CMAT(r)) { | ||
958 | integer m = ar; | ||
959 | integer n = MIN(ac,ar); | ||
960 | integer k = taun; | ||
961 | DEBUGMSG("z_ungqr"); | ||
962 | integer lwork = 8*n; // FIXME | ||
963 | doublecomplex *WORK = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
964 | CHECK(!WORK,MEM); | ||
965 | memcpy(rp,ap,m*k*sizeof(doublecomplex)); | ||
966 | integer res; | ||
967 | zungqr_ (&m,&n,&k,rp,&m,(doublecomplex*)taup,WORK,&lwork,&res); | ||
968 | CHECK(res,res); | ||
969 | free(WORK); | ||
970 | OK | ||
971 | } | ||
972 | |||
973 | |||
974 | //////////////////// Hessenberg factorization ///////////////////////// | ||
975 | |||
976 | /* Subroutine */ int dgehrd_(integer *n, integer *ilo, integer *ihi, | ||
977 | doublereal *a, integer *lda, doublereal *tau, doublereal *work, | ||
978 | integer *lwork, integer *info); | ||
979 | |||
980 | int hess_l_R(KDMAT(a), DVEC(tau), DMAT(r)) { | ||
981 | integer m = ar; | ||
982 | integer n = ac; | ||
983 | integer mn = MIN(m,n); | ||
984 | REQUIRES(m>=1 && n == m && rr== m && rc == n && taun == mn-1, BAD_SIZE); | ||
985 | DEBUGMSG("hess_l_R"); | ||
986 | integer lwork = 5*n; // fixme | ||
987 | double *WORK = (double*)malloc(lwork*sizeof(double)); | ||
988 | CHECK(!WORK,MEM); | ||
989 | memcpy(rp,ap,m*n*sizeof(double)); | ||
990 | integer res; | ||
991 | integer one = 1; | ||
992 | dgehrd_ (&n,&one,&n,rp,&n,taup,WORK,&lwork,&res); | ||
993 | CHECK(res,res); | ||
994 | free(WORK); | ||
995 | OK | ||
996 | } | ||
997 | |||
998 | |||
999 | /* Subroutine */ int zgehrd_(integer *n, integer *ilo, integer *ihi, | ||
1000 | doublecomplex *a, integer *lda, doublecomplex *tau, doublecomplex * | ||
1001 | work, integer *lwork, integer *info); | ||
1002 | |||
1003 | int hess_l_C(KCMAT(a), CVEC(tau), CMAT(r)) { | ||
1004 | integer m = ar; | ||
1005 | integer n = ac; | ||
1006 | integer mn = MIN(m,n); | ||
1007 | REQUIRES(m>=1 && n == m && rr== m && rc == n && taun == mn-1, BAD_SIZE); | ||
1008 | DEBUGMSG("hess_l_C"); | ||
1009 | integer lwork = 5*n; // fixme | ||
1010 | doublecomplex *WORK = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
1011 | CHECK(!WORK,MEM); | ||
1012 | memcpy(rp,ap,m*n*sizeof(doublecomplex)); | ||
1013 | integer res; | ||
1014 | integer one = 1; | ||
1015 | zgehrd_ (&n,&one,&n,rp,&n,taup,WORK,&lwork,&res); | ||
1016 | CHECK(res,res); | ||
1017 | free(WORK); | ||
1018 | OK | ||
1019 | } | ||
1020 | |||
1021 | //////////////////// Schur factorization ///////////////////////// | ||
1022 | |||
1023 | /* Subroutine */ int dgees_(char *jobvs, char *sort, L_fp select, integer *n, | ||
1024 | doublereal *a, integer *lda, integer *sdim, doublereal *wr, | ||
1025 | doublereal *wi, doublereal *vs, integer *ldvs, doublereal *work, | ||
1026 | integer *lwork, logical *bwork, integer *info); | ||
1027 | |||
1028 | int schur_l_R(KDMAT(a), DMAT(u), DMAT(s)) { | ||
1029 | integer m = ar; | ||
1030 | integer n = ac; | ||
1031 | REQUIRES(m>=1 && n==m && ur==n && uc==n && sr==n && sc==n, BAD_SIZE); | ||
1032 | DEBUGMSG("schur_l_R"); | ||
1033 | //int k; | ||
1034 | //printf("---------------------------\n"); | ||
1035 | //printf("%p: ",ap); for(k=0;k<n*n;k++) printf("%f ",ap[k]); printf("\n"); | ||
1036 | //printf("%p: ",up); for(k=0;k<n*n;k++) printf("%f ",up[k]); printf("\n"); | ||
1037 | //printf("%p: ",sp); for(k=0;k<n*n;k++) printf("%f ",sp[k]); printf("\n"); | ||
1038 | memcpy(sp,ap,n*n*sizeof(double)); | ||
1039 | integer lwork = 6*n; // fixme | ||
1040 | double *WORK = (double*)malloc(lwork*sizeof(double)); | ||
1041 | double *WR = (double*)malloc(n*sizeof(double)); | ||
1042 | double *WI = (double*)malloc(n*sizeof(double)); | ||
1043 | // WR and WI not really required in this call | ||
1044 | logical *BWORK = (logical*)malloc(n*sizeof(logical)); | ||
1045 | integer res; | ||
1046 | integer sdim; | ||
1047 | dgees_ ("V","N",NULL,&n,sp,&n,&sdim,WR,WI,up,&n,WORK,&lwork,BWORK,&res); | ||
1048 | //printf("%p: ",ap); for(k=0;k<n*n;k++) printf("%f ",ap[k]); printf("\n"); | ||
1049 | //printf("%p: ",up); for(k=0;k<n*n;k++) printf("%f ",up[k]); printf("\n"); | ||
1050 | //printf("%p: ",sp); for(k=0;k<n*n;k++) printf("%f ",sp[k]); printf("\n"); | ||
1051 | if(res>0) { | ||
1052 | return NOCONVER; | ||
1053 | } | ||
1054 | CHECK(res,res); | ||
1055 | free(WR); | ||
1056 | free(WI); | ||
1057 | free(BWORK); | ||
1058 | free(WORK); | ||
1059 | OK | ||
1060 | } | ||
1061 | |||
1062 | |||
1063 | /* Subroutine */ int zgees_(char *jobvs, char *sort, L_fp select, integer *n, | ||
1064 | doublecomplex *a, integer *lda, integer *sdim, doublecomplex *w, | ||
1065 | doublecomplex *vs, integer *ldvs, doublecomplex *work, integer *lwork, | ||
1066 | doublereal *rwork, logical *bwork, integer *info); | ||
1067 | |||
1068 | int schur_l_C(KCMAT(a), CMAT(u), CMAT(s)) { | ||
1069 | integer m = ar; | ||
1070 | integer n = ac; | ||
1071 | REQUIRES(m>=1 && n==m && ur==n && uc==n && sr==n && sc==n, BAD_SIZE); | ||
1072 | DEBUGMSG("schur_l_C"); | ||
1073 | memcpy(sp,ap,n*n*sizeof(doublecomplex)); | ||
1074 | integer lwork = 6*n; // fixme | ||
1075 | doublecomplex *WORK = (doublecomplex*)malloc(lwork*sizeof(doublecomplex)); | ||
1076 | doublecomplex *W = (doublecomplex*)malloc(n*sizeof(doublecomplex)); | ||
1077 | // W not really required in this call | ||
1078 | logical *BWORK = (logical*)malloc(n*sizeof(logical)); | ||
1079 | double *RWORK = (double*)malloc(n*sizeof(double)); | ||
1080 | integer res; | ||
1081 | integer sdim; | ||
1082 | zgees_ ("V","N",NULL,&n,sp,&n,&sdim,W, | ||
1083 | up,&n, | ||
1084 | WORK,&lwork,RWORK,BWORK,&res); | ||
1085 | if(res>0) { | ||
1086 | return NOCONVER; | ||
1087 | } | ||
1088 | CHECK(res,res); | ||
1089 | free(W); | ||
1090 | free(BWORK); | ||
1091 | free(WORK); | ||
1092 | OK | ||
1093 | } | ||
1094 | |||
1095 | //////////////////// LU factorization ///////////////////////// | ||
1096 | |||
1097 | /* Subroutine */ int dgetrf_(integer *m, integer *n, doublereal *a, integer * | ||
1098 | lda, integer *ipiv, integer *info); | ||
1099 | |||
1100 | int lu_l_R(KDMAT(a), DVEC(ipiv), DMAT(r)) { | ||
1101 | integer m = ar; | ||
1102 | integer n = ac; | ||
1103 | integer mn = MIN(m,n); | ||
1104 | REQUIRES(m>=1 && n >=1 && ipivn == mn, BAD_SIZE); | ||
1105 | DEBUGMSG("lu_l_R"); | ||
1106 | integer* auxipiv = (integer*)malloc(mn*sizeof(integer)); | ||
1107 | memcpy(rp,ap,m*n*sizeof(double)); | ||
1108 | integer res; | ||
1109 | dgetrf_ (&m,&n,rp,&m,auxipiv,&res); | ||
1110 | if(res>0) { | ||
1111 | res = 0; // fixme | ||
1112 | } | ||
1113 | CHECK(res,res); | ||
1114 | int k; | ||
1115 | for (k=0; k<mn; k++) { | ||
1116 | ipivp[k] = auxipiv[k]; | ||
1117 | } | ||
1118 | free(auxipiv); | ||
1119 | OK | ||
1120 | } | ||
1121 | |||
1122 | |||
1123 | /* Subroutine */ int zgetrf_(integer *m, integer *n, doublecomplex *a, | ||
1124 | integer *lda, integer *ipiv, integer *info); | ||
1125 | |||
1126 | int lu_l_C(KCMAT(a), DVEC(ipiv), CMAT(r)) { | ||
1127 | integer m = ar; | ||
1128 | integer n = ac; | ||
1129 | integer mn = MIN(m,n); | ||
1130 | REQUIRES(m>=1 && n >=1 && ipivn == mn, BAD_SIZE); | ||
1131 | DEBUGMSG("lu_l_C"); | ||
1132 | integer* auxipiv = (integer*)malloc(mn*sizeof(integer)); | ||
1133 | memcpy(rp,ap,m*n*sizeof(doublecomplex)); | ||
1134 | integer res; | ||
1135 | zgetrf_ (&m,&n,rp,&m,auxipiv,&res); | ||
1136 | if(res>0) { | ||
1137 | res = 0; // fixme | ||
1138 | } | ||
1139 | CHECK(res,res); | ||
1140 | int k; | ||
1141 | for (k=0; k<mn; k++) { | ||
1142 | ipivp[k] = auxipiv[k]; | ||
1143 | } | ||
1144 | free(auxipiv); | ||
1145 | OK | ||
1146 | } | ||
1147 | |||
1148 | |||
1149 | //////////////////// LU substitution ///////////////////////// | ||
1150 | |||
1151 | /* Subroutine */ int dgetrs_(char *trans, integer *n, integer *nrhs, | ||
1152 | doublereal *a, integer *lda, integer *ipiv, doublereal *b, integer * | ||
1153 | ldb, integer *info); | ||
1154 | |||
1155 | int luS_l_R(KDMAT(a), KDVEC(ipiv), KDMAT(b), DMAT(x)) { | ||
1156 | integer m = ar; | ||
1157 | integer n = ac; | ||
1158 | integer mrhs = br; | ||
1159 | integer nrhs = bc; | ||
1160 | |||
1161 | REQUIRES(m==n && m==mrhs && m==ipivn,BAD_SIZE); | ||
1162 | integer* auxipiv = (integer*)malloc(n*sizeof(integer)); | ||
1163 | int k; | ||
1164 | for (k=0; k<n; k++) { | ||
1165 | auxipiv[k] = (integer)ipivp[k]; | ||
1166 | } | ||
1167 | integer res; | ||
1168 | memcpy(xp,bp,mrhs*nrhs*sizeof(double)); | ||
1169 | dgetrs_ ("N",&n,&nrhs,(/*no const (!?)*/ double*)ap,&m,auxipiv,xp,&mrhs,&res); | ||
1170 | CHECK(res,res); | ||
1171 | free(auxipiv); | ||
1172 | OK | ||
1173 | } | ||
1174 | |||
1175 | |||
1176 | /* Subroutine */ int zgetrs_(char *trans, integer *n, integer *nrhs, | ||
1177 | doublecomplex *a, integer *lda, integer *ipiv, doublecomplex *b, | ||
1178 | integer *ldb, integer *info); | ||
1179 | |||
1180 | int luS_l_C(KCMAT(a), KDVEC(ipiv), KCMAT(b), CMAT(x)) { | ||
1181 | integer m = ar; | ||
1182 | integer n = ac; | ||
1183 | integer mrhs = br; | ||
1184 | integer nrhs = bc; | ||
1185 | |||
1186 | REQUIRES(m==n && m==mrhs && m==ipivn,BAD_SIZE); | ||
1187 | integer* auxipiv = (integer*)malloc(n*sizeof(integer)); | ||
1188 | int k; | ||
1189 | for (k=0; k<n; k++) { | ||
1190 | auxipiv[k] = (integer)ipivp[k]; | ||
1191 | } | ||
1192 | integer res; | ||
1193 | memcpy(xp,bp,mrhs*nrhs*sizeof(doublecomplex)); | ||
1194 | zgetrs_ ("N",&n,&nrhs,(doublecomplex*)ap,&m,auxipiv,xp,&mrhs,&res); | ||
1195 | CHECK(res,res); | ||
1196 | free(auxipiv); | ||
1197 | OK | ||
1198 | } | ||
1199 | |||
1200 | //////////////////// Matrix Product ///////////////////////// | ||
1201 | |||
1202 | void dgemm_(char *, char *, integer *, integer *, integer *, | ||
1203 | double *, const double *, integer *, const double *, | ||
1204 | integer *, double *, double *, integer *); | ||
1205 | |||
1206 | int multiplyR(int ta, int tb, KDMAT(a),KDMAT(b),DMAT(r)) { | ||
1207 | //REQUIRES(ac==br && ar==rr && bc==rc,BAD_SIZE); | ||
1208 | DEBUGMSG("dgemm_"); | ||
1209 | CHECKNANR(a,"NaN multR Input\n") | ||
1210 | CHECKNANR(b,"NaN multR Input\n") | ||
1211 | integer m = ta?ac:ar; | ||
1212 | integer n = tb?br:bc; | ||
1213 | integer k = ta?ar:ac; | ||
1214 | integer lda = ar; | ||
1215 | integer ldb = br; | ||
1216 | integer ldc = rr; | ||
1217 | double alpha = 1; | ||
1218 | double beta = 0; | ||
1219 | dgemm_(ta?"T":"N",tb?"T":"N",&m,&n,&k,&alpha,ap,&lda,bp,&ldb,&beta,rp,&ldc); | ||
1220 | CHECKNANR(r,"NaN multR Output\n") | ||
1221 | OK | ||
1222 | } | ||
1223 | |||
1224 | void zgemm_(char *, char *, integer *, integer *, integer *, | ||
1225 | doublecomplex *, const doublecomplex *, integer *, const doublecomplex *, | ||
1226 | integer *, doublecomplex *, doublecomplex *, integer *); | ||
1227 | |||
1228 | int multiplyC(int ta, int tb, KCMAT(a),KCMAT(b),CMAT(r)) { | ||
1229 | //REQUIRES(ac==br && ar==rr && bc==rc,BAD_SIZE); | ||
1230 | DEBUGMSG("zgemm_"); | ||
1231 | CHECKNANC(a,"NaN multC Input\n") | ||
1232 | CHECKNANC(b,"NaN multC Input\n") | ||
1233 | integer m = ta?ac:ar; | ||
1234 | integer n = tb?br:bc; | ||
1235 | integer k = ta?ar:ac; | ||
1236 | integer lda = ar; | ||
1237 | integer ldb = br; | ||
1238 | integer ldc = rr; | ||
1239 | doublecomplex alpha = {1,0}; | ||
1240 | doublecomplex beta = {0,0}; | ||
1241 | zgemm_(ta?"T":"N",tb?"T":"N",&m,&n,&k,&alpha, | ||
1242 | ap,&lda, | ||
1243 | bp,&ldb,&beta, | ||
1244 | rp,&ldc); | ||
1245 | CHECKNANC(r,"NaN multC Output\n") | ||
1246 | OK | ||
1247 | } | ||
1248 | |||
1249 | void sgemm_(char *, char *, integer *, integer *, integer *, | ||
1250 | float *, const float *, integer *, const float *, | ||
1251 | integer *, float *, float *, integer *); | ||
1252 | |||
1253 | int multiplyF(int ta, int tb, KFMAT(a),KFMAT(b),FMAT(r)) { | ||
1254 | //REQUIRES(ac==br && ar==rr && bc==rc,BAD_SIZE); | ||
1255 | DEBUGMSG("sgemm_"); | ||
1256 | integer m = ta?ac:ar; | ||
1257 | integer n = tb?br:bc; | ||
1258 | integer k = ta?ar:ac; | ||
1259 | integer lda = ar; | ||
1260 | integer ldb = br; | ||
1261 | integer ldc = rr; | ||
1262 | float alpha = 1; | ||
1263 | float beta = 0; | ||
1264 | sgemm_(ta?"T":"N",tb?"T":"N",&m,&n,&k,&alpha,ap,&lda,bp,&ldb,&beta,rp,&ldc); | ||
1265 | OK | ||
1266 | } | ||
1267 | |||
1268 | void cgemm_(char *, char *, integer *, integer *, integer *, | ||
1269 | complex *, const complex *, integer *, const complex *, | ||
1270 | integer *, complex *, complex *, integer *); | ||
1271 | |||
1272 | int multiplyQ(int ta, int tb, KQMAT(a),KQMAT(b),QMAT(r)) { | ||
1273 | //REQUIRES(ac==br && ar==rr && bc==rc,BAD_SIZE); | ||
1274 | DEBUGMSG("cgemm_"); | ||
1275 | integer m = ta?ac:ar; | ||
1276 | integer n = tb?br:bc; | ||
1277 | integer k = ta?ar:ac; | ||
1278 | integer lda = ar; | ||
1279 | integer ldb = br; | ||
1280 | integer ldc = rr; | ||
1281 | complex alpha = {1,0}; | ||
1282 | complex beta = {0,0}; | ||
1283 | cgemm_(ta?"T":"N",tb?"T":"N",&m,&n,&k,&alpha, | ||
1284 | ap,&lda, | ||
1285 | bp,&ldb,&beta, | ||
1286 | rp,&ldc); | ||
1287 | OK | ||
1288 | } | ||
1289 | |||
1290 | |||
1291 | int multiplyI(KOIMAT(a), KOIMAT(b), OIMAT(r)) { | ||
1292 | { TRAV(r,i,j) { | ||
1293 | int k; | ||
1294 | AT(r,i,j) = 0; | ||
1295 | for (k=0;k<ac;k++) { | ||
1296 | AT(r,i,j) += AT(a,i,k) * AT(b,k,j); | ||
1297 | } | ||
1298 | } | ||
1299 | } | ||
1300 | OK | ||
1301 | } | ||
1302 | |||
1303 | //////////////////// transpose ///////////////////////// | ||
1304 | |||
1305 | int transF(KFMAT(x),FMAT(t)) { | ||
1306 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1307 | DEBUGMSG("transF"); | ||
1308 | int i,j; | ||
1309 | for (i=0; i<tr; i++) { | ||
1310 | for (j=0; j<tc; j++) { | ||
1311 | tp[i*tc+j] = xp[j*xc+i]; | ||
1312 | } | ||
1313 | } | ||
1314 | OK | ||
1315 | } | ||
1316 | |||
1317 | int transR(KDMAT(x),DMAT(t)) { | ||
1318 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1319 | DEBUGMSG("transR"); | ||
1320 | int i,j; | ||
1321 | for (i=0; i<tr; i++) { | ||
1322 | for (j=0; j<tc; j++) { | ||
1323 | tp[i*tc+j] = xp[j*xc+i]; | ||
1324 | } | ||
1325 | } | ||
1326 | OK | ||
1327 | } | ||
1328 | |||
1329 | int transQ(KQMAT(x),QMAT(t)) { | ||
1330 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1331 | DEBUGMSG("transQ"); | ||
1332 | int i,j; | ||
1333 | for (i=0; i<tr; i++) { | ||
1334 | for (j=0; j<tc; j++) { | ||
1335 | tp[i*tc+j] = xp[j*xc+i]; | ||
1336 | } | ||
1337 | } | ||
1338 | OK | ||
1339 | } | ||
1340 | |||
1341 | int transC(KCMAT(x),CMAT(t)) { | ||
1342 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1343 | DEBUGMSG("transC"); | ||
1344 | int i,j; | ||
1345 | for (i=0; i<tr; i++) { | ||
1346 | for (j=0; j<tc; j++) { | ||
1347 | tp[i*tc+j] = xp[j*xc+i]; | ||
1348 | } | ||
1349 | } | ||
1350 | OK | ||
1351 | } | ||
1352 | |||
1353 | int transP(KPMAT(x), PMAT(t)) { | ||
1354 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1355 | REQUIRES(xs==ts,NOCONVER); | ||
1356 | DEBUGMSG("transP"); | ||
1357 | int i,j; | ||
1358 | for (i=0; i<tr; i++) { | ||
1359 | for (j=0; j<tc; j++) { | ||
1360 | memcpy(tp+(i*tc+j)*xs,xp +(j*xc+i)*xs,xs); | ||
1361 | } | ||
1362 | } | ||
1363 | OK | ||
1364 | } | ||
1365 | |||
1366 | int transI(KIMAT(x),IMAT(t)) { | ||
1367 | REQUIRES(xr==tc && xc==tr,BAD_SIZE); | ||
1368 | DEBUGMSG("transI"); | ||
1369 | int i,j; | ||
1370 | for (i=0; i<tr; i++) { | ||
1371 | for (j=0; j<tc; j++) { | ||
1372 | tp[i*tc+j] = xp[j*xc+i]; | ||
1373 | } | ||
1374 | } | ||
1375 | OK | ||
1376 | } | ||
1377 | |||
1378 | |||
1379 | //////////////////// constant ///////////////////////// | ||
1380 | |||
1381 | int constantF(float * pval, FVEC(r)) { | ||
1382 | DEBUGMSG("constantF") | ||
1383 | int k; | ||
1384 | double val = *pval; | ||
1385 | for(k=0;k<rn;k++) { | ||
1386 | rp[k]=val; | ||
1387 | } | ||
1388 | OK | ||
1389 | } | ||
1390 | |||
1391 | int constantR(double * pval, DVEC(r)) { | ||
1392 | DEBUGMSG("constantR") | ||
1393 | int k; | ||
1394 | double val = *pval; | ||
1395 | for(k=0;k<rn;k++) { | ||
1396 | rp[k]=val; | ||
1397 | } | ||
1398 | OK | ||
1399 | } | ||
1400 | |||
1401 | int constantQ(complex* pval, QVEC(r)) { | ||
1402 | DEBUGMSG("constantQ") | ||
1403 | int k; | ||
1404 | complex val = *pval; | ||
1405 | for(k=0;k<rn;k++) { | ||
1406 | rp[k]=val; | ||
1407 | } | ||
1408 | OK | ||
1409 | } | ||
1410 | |||
1411 | int constantC(doublecomplex* pval, CVEC(r)) { | ||
1412 | DEBUGMSG("constantC") | ||
1413 | int k; | ||
1414 | doublecomplex val = *pval; | ||
1415 | for(k=0;k<rn;k++) { | ||
1416 | rp[k]=val; | ||
1417 | } | ||
1418 | OK | ||
1419 | } | ||
1420 | |||
1421 | int constantP(void* pval, PVEC(r)) { | ||
1422 | DEBUGMSG("constantP") | ||
1423 | int k; | ||
1424 | for(k=0;k<rn;k++) { | ||
1425 | memcpy(rp+k*rs,pval,rs); | ||
1426 | } | ||
1427 | OK | ||
1428 | } | ||
1429 | |||
1430 | |||
1431 | int constantI(int * pval, IVEC(r)) { | ||
1432 | DEBUGMSG("constantI") | ||
1433 | int k; | ||
1434 | int val = *pval; | ||
1435 | for(k=0;k<rn;k++) { | ||
1436 | rp[k]=val; | ||
1437 | } | ||
1438 | OK | ||
1439 | } | ||
1440 | |||
1441 | |||
1442 | //////////////////// float-double conversion ///////////////////////// | ||
1443 | |||
1444 | int float2double(FVEC(x),DVEC(y)) { | ||
1445 | DEBUGMSG("float2double") | ||
1446 | int k; | ||
1447 | for(k=0;k<xn;k++) { | ||
1448 | yp[k]=xp[k]; | ||
1449 | } | ||
1450 | OK | ||
1451 | } | ||
1452 | |||
1453 | int float2int(KFVEC(x),IVEC(y)) { | ||
1454 | DEBUGMSG("float2int") | ||
1455 | int k; | ||
1456 | for(k=0;k<xn;k++) { | ||
1457 | yp[k]=xp[k]; | ||
1458 | } | ||
1459 | OK | ||
1460 | } | ||
1461 | |||
1462 | |||
1463 | int double2float(DVEC(x),FVEC(y)) { | ||
1464 | DEBUGMSG("double2float") | ||
1465 | int k; | ||
1466 | for(k=0;k<xn;k++) { | ||
1467 | yp[k]=xp[k]; | ||
1468 | } | ||
1469 | OK | ||
1470 | } | ||
1471 | |||
1472 | |||
1473 | int double2int(KDVEC(x),IVEC(y)) { | ||
1474 | DEBUGMSG("double2int") | ||
1475 | int k; | ||
1476 | for(k=0;k<xn;k++) { | ||
1477 | yp[k]=xp[k]; | ||
1478 | } | ||
1479 | OK | ||
1480 | } | ||
1481 | |||
1482 | |||
1483 | int int2float(KIVEC(x),FVEC(y)) { | ||
1484 | DEBUGMSG("int2float") | ||
1485 | int k; | ||
1486 | for(k=0;k<xn;k++) { | ||
1487 | yp[k]=xp[k]; | ||
1488 | } | ||
1489 | OK | ||
1490 | } | ||
1491 | |||
1492 | |||
1493 | int int2double(KIVEC(x),DVEC(y)) { | ||
1494 | DEBUGMSG("int2double") | ||
1495 | int k; | ||
1496 | for(k=0;k<xn;k++) { | ||
1497 | yp[k]=xp[k]; | ||
1498 | } | ||
1499 | OK | ||
1500 | } | ||
1501 | |||
1502 | |||
1503 | //////////////////// conjugate ///////////////////////// | ||
1504 | |||
1505 | int conjugateQ(KQVEC(x),QVEC(t)) { | ||
1506 | REQUIRES(xn==tn,BAD_SIZE); | ||
1507 | DEBUGMSG("conjugateQ"); | ||
1508 | int k; | ||
1509 | for(k=0;k<xn;k++) { | ||
1510 | tp[k].r = xp[k].r; | ||
1511 | tp[k].i = -xp[k].i; | ||
1512 | } | ||
1513 | OK | ||
1514 | } | ||
1515 | |||
1516 | int conjugateC(KCVEC(x),CVEC(t)) { | ||
1517 | REQUIRES(xn==tn,BAD_SIZE); | ||
1518 | DEBUGMSG("conjugateC"); | ||
1519 | int k; | ||
1520 | for(k=0;k<xn;k++) { | ||
1521 | tp[k].r = xp[k].r; | ||
1522 | tp[k].i = -xp[k].i; | ||
1523 | } | ||
1524 | OK | ||
1525 | } | ||
1526 | |||
1527 | //////////////////// step ///////////////////////// | ||
1528 | |||
1529 | #define STEP_IMP \ | ||
1530 | int k; \ | ||
1531 | for(k=0;k<xn;k++) { \ | ||
1532 | yp[k]=xp[k]>0; \ | ||
1533 | } \ | ||
1534 | OK | ||
1535 | |||
1536 | int stepF(KFVEC(x),FVEC(y)) { | ||
1537 | STEP_IMP | ||
1538 | } | ||
1539 | |||
1540 | int stepD(KDVEC(x),DVEC(y)) { | ||
1541 | STEP_IMP | ||
1542 | } | ||
1543 | |||
1544 | int stepI(KIVEC(x),IVEC(y)) { | ||
1545 | STEP_IMP | ||
1546 | } | ||
1547 | |||
1548 | //////////////////// cond ///////////////////////// | ||
1549 | |||
1550 | #define COMPARE_IMP \ | ||
1551 | REQUIRES(xn==yn && xn==rn ,BAD_SIZE); \ | ||
1552 | int k; \ | ||
1553 | for(k=0;k<xn;k++) { \ | ||
1554 | rp[k] = xp[k]<yp[k]?-1:(xp[k]>yp[k]?1:0); \ | ||
1555 | } \ | ||
1556 | OK | ||
1557 | |||
1558 | |||
1559 | int compareF(KFVEC(x),KFVEC(y),IVEC(r)) { | ||
1560 | COMPARE_IMP | ||
1561 | } | ||
1562 | |||
1563 | int compareD(KDVEC(x),KDVEC(y),IVEC(r)) { | ||
1564 | COMPARE_IMP | ||
1565 | } | ||
1566 | |||
1567 | int compareI(KIVEC(x),KIVEC(y),IVEC(r)) { | ||
1568 | COMPARE_IMP | ||
1569 | } | ||
1570 | |||
1571 | |||
1572 | #define COND_IMP \ | ||
1573 | REQUIRES(xn==yn && xn==ltn && xn==eqn && xn==gtn && xn==rn ,BAD_SIZE); \ | ||
1574 | int k; \ | ||
1575 | for(k=0;k<xn;k++) { \ | ||
1576 | rp[k] = xp[k]<yp[k]?ltp[k]:(xp[k]>yp[k]?gtp[k]:eqp[k]); \ | ||
1577 | } \ | ||
1578 | OK | ||
1579 | |||
1580 | int condF(FVEC(x),FVEC(y),FVEC(lt),FVEC(eq),FVEC(gt),FVEC(r)) { | ||
1581 | COND_IMP | ||
1582 | } | ||
1583 | |||
1584 | int condD(DVEC(x),DVEC(y),DVEC(lt),DVEC(eq),DVEC(gt),DVEC(r)) { | ||
1585 | COND_IMP | ||
1586 | } | ||
1587 | |||
1588 | int condI(KIVEC(x),KIVEC(y),KIVEC(lt),KIVEC(eq),KIVEC(gt),IVEC(r)) { | ||
1589 | COND_IMP | ||
1590 | } | ||
1591 | |||
1592 | |||
1593 | #define CHOOSE_IMP \ | ||
1594 | REQUIRES(condn==ltn && ltn==eqn && ltn==gtn && ltn==rn ,BAD_SIZE); \ | ||
1595 | int k; \ | ||
1596 | for(k=0;k<condn;k++) { \ | ||
1597 | rp[k] = condp[k]<0?ltp[k]:(condp[k]>0?gtp[k]:eqp[k]); \ | ||
1598 | } \ | ||
1599 | OK | ||
1600 | |||
1601 | int chooseF(KIVEC(cond),KFVEC(lt),KFVEC(eq),KFVEC(gt),FVEC(r)) { | ||
1602 | CHOOSE_IMP | ||
1603 | } | ||
1604 | |||
1605 | int chooseD(KIVEC(cond),KDVEC(lt),KDVEC(eq),KDVEC(gt),DVEC(r)) { | ||
1606 | CHOOSE_IMP | ||
1607 | } | ||
1608 | |||
1609 | int chooseI(KIVEC(cond),KIVEC(lt),KIVEC(eq),KIVEC(gt),IVEC(r)) { | ||
1610 | CHOOSE_IMP | ||
1611 | } | ||
1612 | |||
1613 | int chooseC(KIVEC(cond),KCVEC(lt),KCVEC(eq),KCVEC(gt),CVEC(r)) { | ||
1614 | CHOOSE_IMP | ||
1615 | } | ||
1616 | |||
1617 | int chooseQ(KIVEC(cond),KQVEC(lt),KQVEC(eq),KQVEC(gt),QVEC(r)) { | ||
1618 | CHOOSE_IMP | ||
1619 | } | ||
1620 | |||
1621 | //////////////////////// extract ///////////////////////////////// | ||
1622 | |||
1623 | #define EXTRACT_IMP \ | ||
1624 | int i,j,si,sj,ni,nj; \ | ||
1625 | ni = modei ? in : ip[1]-ip[0]+1; \ | ||
1626 | nj = modej ? jn : jp[1]-jp[0]+1; \ | ||
1627 | \ | ||
1628 | for (i=0; i<ni; i++) { \ | ||
1629 | si = modei ? ip[i] : i+ip[0]; \ | ||
1630 | \ | ||
1631 | for (j=0; j<nj; j++) { \ | ||
1632 | sj = modej ? jp[j] : j+jp[0]; \ | ||
1633 | \ | ||
1634 | AT(r,i,j) = AT(m,si,sj); \ | ||
1635 | } \ | ||
1636 | } \ | ||
1637 | OK | ||
1638 | |||
1639 | int extractD(int modei, int modej, KIVEC(i), KIVEC(j), KODMAT(m), ODMAT(r)) { | ||
1640 | EXTRACT_IMP | ||
1641 | } | ||
1642 | |||
1643 | int extractF(int modei, int modej, KIVEC(i), KIVEC(j), KOFMAT(m), OFMAT(r)) { | ||
1644 | EXTRACT_IMP | ||
1645 | } | ||
1646 | |||
1647 | int extractC(int modei, int modej, KIVEC(i), KIVEC(j), KOCMAT(m), OCMAT(r)) { | ||
1648 | EXTRACT_IMP | ||
1649 | } | ||
1650 | |||
1651 | int extractQ(int modei, int modej, KIVEC(i), KIVEC(j), KOQMAT(m), OQMAT(r)) { | ||
1652 | EXTRACT_IMP | ||
1653 | } | ||
1654 | |||
1655 | int extractI(int modei, int modej, KIVEC(i), KIVEC(j), KOIMAT(m), OIMAT(r)) { | ||
1656 | EXTRACT_IMP | ||
1657 | } | ||
1658 | |||
1659 | //////////////////////// remap ///////////////////////////////// | ||
1660 | |||
1661 | #define REMAP_IMP \ | ||
1662 | REQUIRES(ir==jr && ic==jc && ir==rr && ic==rc ,BAD_SIZE); \ | ||
1663 | { TRAV(r,a,b) { AT(r,a,b) = AT(m,AT(i,a,b),AT(j,a,b)); } \ | ||
1664 | } \ | ||
1665 | OK | ||
1666 | |||
1667 | int remapD(KOIMAT(i), KOIMAT(j), KODMAT(m), ODMAT(r)) { | ||
1668 | REMAP_IMP | ||
1669 | } | ||
1670 | |||
1671 | int remapF(KOIMAT(i), KOIMAT(j), KOFMAT(m), OFMAT(r)) { | ||
1672 | REMAP_IMP | ||
1673 | } | ||
1674 | |||
1675 | int remapI(KOIMAT(i), KOIMAT(j), KOIMAT(m), OIMAT(r)) { | ||
1676 | REMAP_IMP | ||
1677 | } | ||
1678 | |||
1679 | int remapC(KOIMAT(i), KOIMAT(j), KOCMAT(m), OCMAT(r)) { | ||
1680 | REMAP_IMP | ||
1681 | } | ||
1682 | |||
1683 | int remapQ(KOIMAT(i), KOIMAT(j), KOQMAT(m), OQMAT(r)) { | ||
1684 | REMAP_IMP | ||
1685 | } | ||
1686 | |||
diff --git a/packages/base/src/Internal/C/lapack-aux.h b/packages/base/src/Internal/C/lapack-aux.h new file mode 100644 index 0000000..6ffbef1 --- /dev/null +++ b/packages/base/src/Internal/C/lapack-aux.h | |||
@@ -0,0 +1,82 @@ | |||
1 | /* | ||
2 | * We have copied the definitions in f2c.h required | ||
3 | * to compile clapack.h, modified to support both | ||
4 | * 32 and 64 bit | ||
5 | |||
6 | http://opengrok.creo.hu/dragonfly/xref/src/contrib/gcc-3.4/libf2c/readme.netlib | ||
7 | http://www.ibm.com/developerworks/library/l-port64.html | ||
8 | */ | ||
9 | |||
10 | #ifdef _LP64 | ||
11 | typedef int integer; | ||
12 | typedef unsigned int uinteger; | ||
13 | typedef int logical; | ||
14 | typedef long longint; /* system-dependent */ | ||
15 | typedef unsigned long ulongint; /* system-dependent */ | ||
16 | #else | ||
17 | typedef long int integer; | ||
18 | typedef unsigned long int uinteger; | ||
19 | typedef long int logical; | ||
20 | typedef long long longint; /* system-dependent */ | ||
21 | typedef unsigned long long ulongint; /* system-dependent */ | ||
22 | #endif | ||
23 | |||
24 | typedef char *address; | ||
25 | typedef short int shortint; | ||
26 | typedef float real; | ||
27 | typedef double doublereal; | ||
28 | typedef struct { real r, i; } complex; | ||
29 | typedef struct { doublereal r, i; } doublecomplex; | ||
30 | typedef short int shortlogical; | ||
31 | typedef char logical1; | ||
32 | typedef char integer1; | ||
33 | |||
34 | typedef logical (*L_fp)(); | ||
35 | typedef short ftnlen; | ||
36 | |||
37 | /********************************************************/ | ||
38 | |||
39 | #define IVEC(A) int A##n, int*A##p | ||
40 | #define FVEC(A) int A##n, float*A##p | ||
41 | #define DVEC(A) int A##n, double*A##p | ||
42 | #define QVEC(A) int A##n, complex*A##p | ||
43 | #define CVEC(A) int A##n, doublecomplex*A##p | ||
44 | #define PVEC(A) int A##n, void* A##p, int A##s | ||
45 | |||
46 | #define IMAT(A) int A##r, int A##c, int* A##p | ||
47 | #define FMAT(A) int A##r, int A##c, float* A##p | ||
48 | #define DMAT(A) int A##r, int A##c, double* A##p | ||
49 | #define QMAT(A) int A##r, int A##c, complex* A##p | ||
50 | #define CMAT(A) int A##r, int A##c, doublecomplex* A##p | ||
51 | #define PMAT(A) int A##r, int A##c, void* A##p, int A##s | ||
52 | |||
53 | #define OIMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, int* A##p | ||
54 | #define OFMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, float* A##p | ||
55 | #define ODMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, double* A##p | ||
56 | #define OQMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, complex* A##p | ||
57 | #define OCMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, doublecomplex* A##p | ||
58 | |||
59 | |||
60 | #define KIVEC(A) int A##n, const int*A##p | ||
61 | #define KFVEC(A) int A##n, const float*A##p | ||
62 | #define KDVEC(A) int A##n, const double*A##p | ||
63 | #define KQVEC(A) int A##n, const complex*A##p | ||
64 | #define KCVEC(A) int A##n, const doublecomplex*A##p | ||
65 | #define KPVEC(A) int A##n, const void* A##p, int A##s | ||
66 | |||
67 | #define KIMAT(A) int A##r, int A##c, const int* A##p | ||
68 | #define KFMAT(A) int A##r, int A##c, const float* A##p | ||
69 | #define KDMAT(A) int A##r, int A##c, const double* A##p | ||
70 | #define KQMAT(A) int A##r, int A##c, const complex* A##p | ||
71 | #define KCMAT(A) int A##r, int A##c, const doublecomplex* A##p | ||
72 | #define KPMAT(A) int A##r, int A##c, const void* A##p, int A##s | ||
73 | |||
74 | #define KOIMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, const int* A##p | ||
75 | #define KOFMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, const float* A##p | ||
76 | #define KODMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, const double* A##p | ||
77 | #define KOQMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, const complex* A##p | ||
78 | #define KOCMAT(A) int A##r, int A##c, int A##Xr, int A##Xc, const doublecomplex* A##p | ||
79 | |||
80 | #define AT(m,i,j) (m##p[(i)*m##Xr + (j)*m##Xc]) | ||
81 | #define TRAV(m,i,j) int i,j; for (i=0;i<m##r;i++) for (j=0;j<m##c;j++) | ||
82 | |||
diff --git a/packages/base/src/Internal/C/vector-aux.c b/packages/base/src/Internal/C/vector-aux.c new file mode 100644 index 0000000..5662697 --- /dev/null +++ b/packages/base/src/Internal/C/vector-aux.c | |||
@@ -0,0 +1,1134 @@ | |||
1 | #include <complex.h> | ||
2 | |||
3 | typedef double complex TCD; | ||
4 | typedef float complex TCF; | ||
5 | |||
6 | #undef complex | ||
7 | |||
8 | #include "lapack-aux.h" | ||
9 | |||
10 | #define V(x) x##n,x##p | ||
11 | |||
12 | #include <string.h> | ||
13 | #include <math.h> | ||
14 | #include <stdio.h> | ||
15 | #include <stdlib.h> | ||
16 | #include <stdint.h> | ||
17 | |||
18 | #define MACRO(B) do {B} while (0) | ||
19 | #define ERROR(CODE) MACRO(return CODE;) | ||
20 | #define REQUIRES(COND, CODE) MACRO(if(!(COND)) {ERROR(CODE);}) | ||
21 | #define OK return 0; | ||
22 | |||
23 | #define MIN(A,B) ((A)<(B)?(A):(B)) | ||
24 | #define MAX(A,B) ((A)>(B)?(A):(B)) | ||
25 | |||
26 | #ifdef DBG | ||
27 | #define DEBUGMSG(M) printf("*** calling aux C function: %s\n",M); | ||
28 | #else | ||
29 | #define DEBUGMSG(M) | ||
30 | #endif | ||
31 | |||
32 | #define CHECK(RES,CODE) MACRO(if(RES) return CODE;) | ||
33 | |||
34 | #define BAD_SIZE 2000 | ||
35 | #define BAD_CODE 2001 | ||
36 | #define MEM 2002 | ||
37 | #define BAD_FILE 2003 | ||
38 | |||
39 | |||
40 | int sumF(KFVEC(x),FVEC(r)) { | ||
41 | DEBUGMSG("sumF"); | ||
42 | REQUIRES(rn==1,BAD_SIZE); | ||
43 | int i; | ||
44 | float res = 0; | ||
45 | for (i = 0; i < xn; i++) res += xp[i]; | ||
46 | rp[0] = res; | ||
47 | OK | ||
48 | } | ||
49 | |||
50 | int sumR(KDVEC(x),DVEC(r)) { | ||
51 | DEBUGMSG("sumR"); | ||
52 | REQUIRES(rn==1,BAD_SIZE); | ||
53 | int i; | ||
54 | double res = 0; | ||
55 | for (i = 0; i < xn; i++) res += xp[i]; | ||
56 | rp[0] = res; | ||
57 | OK | ||
58 | } | ||
59 | |||
60 | int sumI(KIVEC(x),IVEC(r)) { | ||
61 | REQUIRES(rn==1,BAD_SIZE); | ||
62 | int i; | ||
63 | int res = 0; | ||
64 | for (i = 0; i < xn; i++) res += xp[i]; | ||
65 | rp[0] = res; | ||
66 | OK | ||
67 | } | ||
68 | |||
69 | |||
70 | int sumQ(KQVEC(x),QVEC(r)) { | ||
71 | DEBUGMSG("sumQ"); | ||
72 | REQUIRES(rn==1,BAD_SIZE); | ||
73 | int i; | ||
74 | complex res; | ||
75 | res.r = 0; | ||
76 | res.i = 0; | ||
77 | for (i = 0; i < xn; i++) { | ||
78 | res.r += xp[i].r; | ||
79 | res.i += xp[i].i; | ||
80 | } | ||
81 | rp[0] = res; | ||
82 | OK | ||
83 | } | ||
84 | |||
85 | int sumC(KCVEC(x),CVEC(r)) { | ||
86 | DEBUGMSG("sumC"); | ||
87 | REQUIRES(rn==1,BAD_SIZE); | ||
88 | int i; | ||
89 | doublecomplex res; | ||
90 | res.r = 0; | ||
91 | res.i = 0; | ||
92 | for (i = 0; i < xn; i++) { | ||
93 | res.r += xp[i].r; | ||
94 | res.i += xp[i].i; | ||
95 | } | ||
96 | rp[0] = res; | ||
97 | OK | ||
98 | } | ||
99 | |||
100 | |||
101 | int prodF(KFVEC(x),FVEC(r)) { | ||
102 | DEBUGMSG("prodF"); | ||
103 | REQUIRES(rn==1,BAD_SIZE); | ||
104 | int i; | ||
105 | float res = 1; | ||
106 | for (i = 0; i < xn; i++) res *= xp[i]; | ||
107 | rp[0] = res; | ||
108 | OK | ||
109 | } | ||
110 | |||
111 | int prodR(KDVEC(x),DVEC(r)) { | ||
112 | DEBUGMSG("prodR"); | ||
113 | REQUIRES(rn==1,BAD_SIZE); | ||
114 | int i; | ||
115 | double res = 1; | ||
116 | for (i = 0; i < xn; i++) res *= xp[i]; | ||
117 | rp[0] = res; | ||
118 | OK | ||
119 | } | ||
120 | |||
121 | int prodI(KIVEC(x),IVEC(r)) { | ||
122 | REQUIRES(rn==1,BAD_SIZE); | ||
123 | int i; | ||
124 | int res = 1; | ||
125 | for (i = 0; i < xn; i++) res *= xp[i]; | ||
126 | rp[0] = res; | ||
127 | OK | ||
128 | } | ||
129 | |||
130 | |||
131 | |||
132 | int prodQ(KQVEC(x),QVEC(r)) { | ||
133 | DEBUGMSG("prodQ"); | ||
134 | REQUIRES(rn==1,BAD_SIZE); | ||
135 | int i; | ||
136 | complex res; | ||
137 | float temp; | ||
138 | res.r = 1; | ||
139 | res.i = 0; | ||
140 | for (i = 0; i < xn; i++) { | ||
141 | temp = res.r * xp[i].r - res.i * xp[i].i; | ||
142 | res.i = res.r * xp[i].i + res.i * xp[i].r; | ||
143 | res.r = temp; | ||
144 | } | ||
145 | rp[0] = res; | ||
146 | OK | ||
147 | } | ||
148 | |||
149 | int prodC(KCVEC(x),CVEC(r)) { | ||
150 | DEBUGMSG("prodC"); | ||
151 | REQUIRES(rn==1,BAD_SIZE); | ||
152 | int i; | ||
153 | doublecomplex res; | ||
154 | double temp; | ||
155 | res.r = 1; | ||
156 | res.i = 0; | ||
157 | for (i = 0; i < xn; i++) { | ||
158 | temp = res.r * xp[i].r - res.i * xp[i].i; | ||
159 | res.i = res.r * xp[i].i + res.i * xp[i].r; | ||
160 | res.r = temp; | ||
161 | } | ||
162 | rp[0] = res; | ||
163 | OK | ||
164 | } | ||
165 | |||
166 | |||
167 | double dnrm2_(integer*, const double*, integer*); | ||
168 | double dasum_(integer*, const double*, integer*); | ||
169 | |||
170 | double vector_max(KDVEC(x)) { | ||
171 | double r = xp[0]; | ||
172 | int k; | ||
173 | for (k = 1; k<xn; k++) { | ||
174 | if(xp[k]>r) { | ||
175 | r = xp[k]; | ||
176 | } | ||
177 | } | ||
178 | return r; | ||
179 | } | ||
180 | |||
181 | double vector_min(KDVEC(x)) { | ||
182 | double r = xp[0]; | ||
183 | int k; | ||
184 | for (k = 1; k<xn; k++) { | ||
185 | if(xp[k]<r) { | ||
186 | r = xp[k]; | ||
187 | } | ||
188 | } | ||
189 | return r; | ||
190 | } | ||
191 | |||
192 | double vector_max_index(KDVEC(x)) { | ||
193 | int k, r = 0; | ||
194 | for (k = 1; k<xn; k++) { | ||
195 | if(xp[k]>xp[r]) { | ||
196 | r = k; | ||
197 | } | ||
198 | } | ||
199 | return r; | ||
200 | } | ||
201 | |||
202 | double vector_min_index(KDVEC(x)) { | ||
203 | int k, r = 0; | ||
204 | for (k = 1; k<xn; k++) { | ||
205 | if(xp[k]<xp[r]) { | ||
206 | r = k; | ||
207 | } | ||
208 | } | ||
209 | return r; | ||
210 | } | ||
211 | |||
212 | int toScalarR(int code, KDVEC(x), DVEC(r)) { | ||
213 | REQUIRES(rn==1,BAD_SIZE); | ||
214 | DEBUGMSG("toScalarR"); | ||
215 | double res; | ||
216 | integer one = 1; | ||
217 | integer n = xn; | ||
218 | switch(code) { | ||
219 | case 0: { res = dnrm2_(&n,xp,&one); break; } | ||
220 | case 1: { res = dasum_(&n,xp,&one); break; } | ||
221 | case 2: { res = vector_max_index(V(x)); break; } | ||
222 | case 3: { res = vector_max(V(x)); break; } | ||
223 | case 4: { res = vector_min_index(V(x)); break; } | ||
224 | case 5: { res = vector_min(V(x)); break; } | ||
225 | default: ERROR(BAD_CODE); | ||
226 | } | ||
227 | rp[0] = res; | ||
228 | OK | ||
229 | } | ||
230 | |||
231 | |||
232 | float snrm2_(integer*, const float*, integer*); | ||
233 | float sasum_(integer*, const float*, integer*); | ||
234 | |||
235 | float vector_max_f(KFVEC(x)) { | ||
236 | float r = xp[0]; | ||
237 | int k; | ||
238 | for (k = 1; k<xn; k++) { | ||
239 | if(xp[k]>r) { | ||
240 | r = xp[k]; | ||
241 | } | ||
242 | } | ||
243 | return r; | ||
244 | } | ||
245 | |||
246 | float vector_min_f(KFVEC(x)) { | ||
247 | float r = xp[0]; | ||
248 | int k; | ||
249 | for (k = 1; k<xn; k++) { | ||
250 | if(xp[k]<r) { | ||
251 | r = xp[k]; | ||
252 | } | ||
253 | } | ||
254 | return r; | ||
255 | } | ||
256 | |||
257 | float vector_max_index_f(KFVEC(x)) { | ||
258 | int k, r = 0; | ||
259 | for (k = 1; k<xn; k++) { | ||
260 | if(xp[k]>xp[r]) { | ||
261 | r = k; | ||
262 | } | ||
263 | } | ||
264 | return r; | ||
265 | } | ||
266 | |||
267 | float vector_min_index_f(KFVEC(x)) { | ||
268 | int k, r = 0; | ||
269 | for (k = 1; k<xn; k++) { | ||
270 | if(xp[k]<xp[r]) { | ||
271 | r = k; | ||
272 | } | ||
273 | } | ||
274 | return r; | ||
275 | } | ||
276 | |||
277 | |||
278 | int toScalarF(int code, KFVEC(x), FVEC(r)) { | ||
279 | REQUIRES(rn==1,BAD_SIZE); | ||
280 | DEBUGMSG("toScalarF"); | ||
281 | float res; | ||
282 | integer one = 1; | ||
283 | integer n = xn; | ||
284 | switch(code) { | ||
285 | case 0: { res = snrm2_(&n,xp,&one); break; } | ||
286 | case 1: { res = sasum_(&n,xp,&one); break; } | ||
287 | case 2: { res = vector_max_index_f(V(x)); break; } | ||
288 | case 3: { res = vector_max_f(V(x)); break; } | ||
289 | case 4: { res = vector_min_index_f(V(x)); break; } | ||
290 | case 5: { res = vector_min_f(V(x)); break; } | ||
291 | default: ERROR(BAD_CODE); | ||
292 | } | ||
293 | rp[0] = res; | ||
294 | OK | ||
295 | } | ||
296 | |||
297 | int vector_max_i(KIVEC(x)) { | ||
298 | int r = xp[0]; | ||
299 | int k; | ||
300 | for (k = 1; k<xn; k++) { | ||
301 | if(xp[k]>r) { | ||
302 | r = xp[k]; | ||
303 | } | ||
304 | } | ||
305 | return r; | ||
306 | } | ||
307 | |||
308 | int vector_min_i(KIVEC(x)) { | ||
309 | float r = xp[0]; | ||
310 | int k; | ||
311 | for (k = 1; k<xn; k++) { | ||
312 | if(xp[k]<r) { | ||
313 | r = xp[k]; | ||
314 | } | ||
315 | } | ||
316 | return r; | ||
317 | } | ||
318 | |||
319 | int vector_max_index_i(KIVEC(x)) { | ||
320 | int k, r = 0; | ||
321 | for (k = 1; k<xn; k++) { | ||
322 | if(xp[k]>xp[r]) { | ||
323 | r = k; | ||
324 | } | ||
325 | } | ||
326 | return r; | ||
327 | } | ||
328 | |||
329 | int vector_min_index_i(KIVEC(x)) { | ||
330 | int k, r = 0; | ||
331 | for (k = 1; k<xn; k++) { | ||
332 | if(xp[k]<xp[r]) { | ||
333 | r = k; | ||
334 | } | ||
335 | } | ||
336 | return r; | ||
337 | } | ||
338 | |||
339 | |||
340 | int toScalarI(int code, KIVEC(x), IVEC(r)) { | ||
341 | REQUIRES(rn==1,BAD_SIZE); | ||
342 | int res; | ||
343 | switch(code) { | ||
344 | case 2: { res = vector_max_index_i(V(x)); break; } | ||
345 | case 3: { res = vector_max_i(V(x)); break; } | ||
346 | case 4: { res = vector_min_index_i(V(x)); break; } | ||
347 | case 5: { res = vector_min_i(V(x)); break; } | ||
348 | default: ERROR(BAD_CODE); | ||
349 | } | ||
350 | rp[0] = res; | ||
351 | OK | ||
352 | } | ||
353 | |||
354 | |||
355 | double dznrm2_(integer*, const doublecomplex*, integer*); | ||
356 | double dzasum_(integer*, const doublecomplex*, integer*); | ||
357 | |||
358 | int toScalarC(int code, KCVEC(x), DVEC(r)) { | ||
359 | REQUIRES(rn==1,BAD_SIZE); | ||
360 | DEBUGMSG("toScalarC"); | ||
361 | double res; | ||
362 | integer one = 1; | ||
363 | integer n = xn; | ||
364 | switch(code) { | ||
365 | case 0: { res = dznrm2_(&n,xp,&one); break; } | ||
366 | case 1: { res = dzasum_(&n,xp,&one); break; } | ||
367 | default: ERROR(BAD_CODE); | ||
368 | } | ||
369 | rp[0] = res; | ||
370 | OK | ||
371 | } | ||
372 | |||
373 | |||
374 | double scnrm2_(integer*, const complex*, integer*); | ||
375 | double scasum_(integer*, const complex*, integer*); | ||
376 | |||
377 | int toScalarQ(int code, KQVEC(x), FVEC(r)) { | ||
378 | REQUIRES(rn==1,BAD_SIZE); | ||
379 | DEBUGMSG("toScalarQ"); | ||
380 | float res; | ||
381 | integer one = 1; | ||
382 | integer n = xn; | ||
383 | switch(code) { | ||
384 | case 0: { res = scnrm2_(&n,xp,&one); break; } | ||
385 | case 1: { res = scasum_(&n,xp,&one); break; } | ||
386 | default: ERROR(BAD_CODE); | ||
387 | } | ||
388 | rp[0] = res; | ||
389 | OK | ||
390 | } | ||
391 | |||
392 | |||
393 | inline double sign(double x) { | ||
394 | if(x>0) { | ||
395 | return +1.0; | ||
396 | } else if (x<0) { | ||
397 | return -1.0; | ||
398 | } else { | ||
399 | return 0.0; | ||
400 | } | ||
401 | } | ||
402 | |||
403 | inline float float_sign(float x) { | ||
404 | if(x>0) { | ||
405 | return +1.0; | ||
406 | } else if (x<0) { | ||
407 | return -1.0; | ||
408 | } else { | ||
409 | return 0.0; | ||
410 | } | ||
411 | } | ||
412 | |||
413 | |||
414 | #define OP(C,F) case C: { for(k=0;k<xn;k++) rp[k] = F(xp[k]); OK } | ||
415 | #define OPV(C,E) case C: { for(k=0;k<xn;k++) rp[k] = E; OK } | ||
416 | int mapR(int code, KDVEC(x), DVEC(r)) { | ||
417 | int k; | ||
418 | REQUIRES(xn == rn,BAD_SIZE); | ||
419 | DEBUGMSG("mapR"); | ||
420 | switch (code) { | ||
421 | OP(0,sin) | ||
422 | OP(1,cos) | ||
423 | OP(2,tan) | ||
424 | OP(3,fabs) | ||
425 | OP(4,asin) | ||
426 | OP(5,acos) | ||
427 | OP(6,atan) | ||
428 | OP(7,sinh) | ||
429 | OP(8,cosh) | ||
430 | OP(9,tanh) | ||
431 | OP(10,asinh) | ||
432 | OP(11,acosh) | ||
433 | OP(12,atanh) | ||
434 | OP(13,exp) | ||
435 | OP(14,log) | ||
436 | OP(15,sign) | ||
437 | OP(16,sqrt) | ||
438 | default: ERROR(BAD_CODE); | ||
439 | } | ||
440 | } | ||
441 | |||
442 | int mapF(int code, KFVEC(x), FVEC(r)) { | ||
443 | int k; | ||
444 | REQUIRES(xn == rn,BAD_SIZE); | ||
445 | DEBUGMSG("mapF"); | ||
446 | switch (code) { | ||
447 | OP(0,sin) | ||
448 | OP(1,cos) | ||
449 | OP(2,tan) | ||
450 | OP(3,fabs) | ||
451 | OP(4,asin) | ||
452 | OP(5,acos) | ||
453 | OP(6,atan) | ||
454 | OP(7,sinh) | ||
455 | OP(8,cosh) | ||
456 | OP(9,tanh) | ||
457 | OP(10,asinh) | ||
458 | OP(11,acosh) | ||
459 | OP(12,atanh) | ||
460 | OP(13,exp) | ||
461 | OP(14,log) | ||
462 | OP(15,sign) | ||
463 | OP(16,sqrt) | ||
464 | default: ERROR(BAD_CODE); | ||
465 | } | ||
466 | } | ||
467 | |||
468 | |||
469 | int mapI(int code, KIVEC(x), IVEC(r)) { | ||
470 | int k; | ||
471 | REQUIRES(xn == rn,BAD_SIZE); | ||
472 | switch (code) { | ||
473 | OP(3,abs) | ||
474 | OP(15,sign) | ||
475 | default: ERROR(BAD_CODE); | ||
476 | } | ||
477 | } | ||
478 | |||
479 | |||
480 | |||
481 | inline double abs_complex(doublecomplex z) { | ||
482 | return sqrt(z.r*z.r + z.i*z.i); | ||
483 | } | ||
484 | |||
485 | inline doublecomplex complex_abs_complex(doublecomplex z) { | ||
486 | doublecomplex r; | ||
487 | r.r = abs_complex(z); | ||
488 | r.i = 0; | ||
489 | return r; | ||
490 | } | ||
491 | |||
492 | inline doublecomplex complex_signum_complex(doublecomplex z) { | ||
493 | doublecomplex r; | ||
494 | double mag; | ||
495 | if (z.r == 0 && z.i == 0) { | ||
496 | r.r = 0; | ||
497 | r.i = 0; | ||
498 | } else { | ||
499 | mag = abs_complex(z); | ||
500 | r.r = z.r/mag; | ||
501 | r.i = z.i/mag; | ||
502 | } | ||
503 | return r; | ||
504 | } | ||
505 | |||
506 | #define OPb(C,F) case C: { for(k=0;k<xn;k++) r2p[k] = F(x2p[k]); OK } | ||
507 | int mapC(int code, KCVEC(x), CVEC(r)) { | ||
508 | TCD* x2p = (TCD*)xp; | ||
509 | TCD* r2p = (TCD*)rp; | ||
510 | int k; | ||
511 | REQUIRES(xn == rn,BAD_SIZE); | ||
512 | DEBUGMSG("mapC"); | ||
513 | switch (code) { | ||
514 | OPb(0,csin) | ||
515 | OPb(1,ccos) | ||
516 | OPb(2,ctan) | ||
517 | OP(3,complex_abs_complex) | ||
518 | OPb(4,casin) | ||
519 | OPb(5,cacos) | ||
520 | OPb(6,catan) | ||
521 | OPb(7,csinh) | ||
522 | OPb(8,ccosh) | ||
523 | OPb(9,ctanh) | ||
524 | OPb(10,casinh) | ||
525 | OPb(11,cacosh) | ||
526 | OPb(12,catanh) | ||
527 | OPb(13,cexp) | ||
528 | OPb(14,clog) | ||
529 | OP(15,complex_signum_complex) | ||
530 | OPb(16,csqrt) | ||
531 | default: ERROR(BAD_CODE); | ||
532 | } | ||
533 | } | ||
534 | |||
535 | |||
536 | |||
537 | inline complex complex_f_math_fun(doublecomplex (*cf)(doublecomplex), complex a) | ||
538 | { | ||
539 | doublecomplex c; | ||
540 | doublecomplex r; | ||
541 | |||
542 | complex float_r; | ||
543 | |||
544 | c.r = a.r; | ||
545 | c.i = a.i; | ||
546 | |||
547 | r = (*cf)(c); | ||
548 | |||
549 | float_r.r = r.r; | ||
550 | float_r.i = r.i; | ||
551 | |||
552 | return float_r; | ||
553 | } | ||
554 | |||
555 | |||
556 | #define OPC(C,F) case C: { for(k=0;k<xn;k++) rp[k] = complex_f_math_fun(&F,xp[k]); OK } | ||
557 | int mapQ(int code, KQVEC(x), QVEC(r)) { | ||
558 | TCF* x2p = (TCF*)xp; | ||
559 | TCF* r2p = (TCF*)rp; | ||
560 | int k; | ||
561 | REQUIRES(xn == rn,BAD_SIZE); | ||
562 | DEBUGMSG("mapQ"); | ||
563 | switch (code) { | ||
564 | OPb(0,csinf) | ||
565 | OPb(1,ccosf) | ||
566 | OPb(2,ctanf) | ||
567 | OPC(3,complex_abs_complex) | ||
568 | OPb(4,casinf) | ||
569 | OPb(5,cacosf) | ||
570 | OPb(6,catanf) | ||
571 | OPb(7,csinhf) | ||
572 | OPb(8,ccoshf) | ||
573 | OPb(9,ctanhf) | ||
574 | OPb(10,casinhf) | ||
575 | OPb(11,cacoshf) | ||
576 | OPb(12,catanhf) | ||
577 | OPb(13,cexpf) | ||
578 | OPb(14,clogf) | ||
579 | OPC(15,complex_signum_complex) | ||
580 | OPb(16,csqrtf) | ||
581 | default: ERROR(BAD_CODE); | ||
582 | } | ||
583 | } | ||
584 | |||
585 | |||
586 | int mapValR(int code, double* pval, KDVEC(x), DVEC(r)) { | ||
587 | int k; | ||
588 | double val = *pval; | ||
589 | REQUIRES(xn == rn,BAD_SIZE); | ||
590 | DEBUGMSG("mapValR"); | ||
591 | switch (code) { | ||
592 | OPV(0,val*xp[k]) | ||
593 | OPV(1,val/xp[k]) | ||
594 | OPV(2,val+xp[k]) | ||
595 | OPV(3,val-xp[k]) | ||
596 | OPV(4,pow(val,xp[k])) | ||
597 | OPV(5,pow(xp[k],val)) | ||
598 | default: ERROR(BAD_CODE); | ||
599 | } | ||
600 | } | ||
601 | |||
602 | int mapValF(int code, float* pval, KFVEC(x), FVEC(r)) { | ||
603 | int k; | ||
604 | float val = *pval; | ||
605 | REQUIRES(xn == rn,BAD_SIZE); | ||
606 | DEBUGMSG("mapValF"); | ||
607 | switch (code) { | ||
608 | OPV(0,val*xp[k]) | ||
609 | OPV(1,val/xp[k]) | ||
610 | OPV(2,val+xp[k]) | ||
611 | OPV(3,val-xp[k]) | ||
612 | OPV(4,pow(val,xp[k])) | ||
613 | OPV(5,pow(xp[k],val)) | ||
614 | default: ERROR(BAD_CODE); | ||
615 | } | ||
616 | } | ||
617 | |||
618 | int mod (int a, int b) { | ||
619 | int m = a % b; | ||
620 | if (b>0) { | ||
621 | return m >=0 ? m : m+b; | ||
622 | } else { | ||
623 | return m <=0 ? m : m+b; | ||
624 | } | ||
625 | } | ||
626 | |||
627 | int mapValI(int code, int* pval, KIVEC(x), IVEC(r)) { | ||
628 | int k; | ||
629 | int val = *pval; | ||
630 | REQUIRES(xn == rn,BAD_SIZE); | ||
631 | DEBUGMSG("mapValI"); | ||
632 | switch (code) { | ||
633 | OPV(0,val*xp[k]) | ||
634 | OPV(1,val/xp[k]) | ||
635 | OPV(2,val+xp[k]) | ||
636 | OPV(3,val-xp[k]) | ||
637 | OPV(6,mod(val,xp[k])) | ||
638 | OPV(7,mod(xp[k],val)) | ||
639 | default: ERROR(BAD_CODE); | ||
640 | } | ||
641 | } | ||
642 | |||
643 | |||
644 | |||
645 | inline doublecomplex complex_add(doublecomplex a, doublecomplex b) { | ||
646 | doublecomplex r; | ||
647 | r.r = a.r+b.r; | ||
648 | r.i = a.i+b.i; | ||
649 | return r; | ||
650 | } | ||
651 | |||
652 | #define OPVb(C,E) case C: { for(k=0;k<xn;k++) r2p[k] = E; OK } | ||
653 | int mapValC(int code, doublecomplex* pval, KCVEC(x), CVEC(r)) { | ||
654 | TCD* x2p = (TCD*)xp; | ||
655 | TCD* r2p = (TCD*)rp; | ||
656 | int k; | ||
657 | TCD val = * (TCD*)pval; | ||
658 | REQUIRES(xn == rn,BAD_SIZE); | ||
659 | DEBUGMSG("mapValC"); | ||
660 | switch (code) { | ||
661 | OPVb(0,val*x2p[k]) | ||
662 | OPVb(1,val/x2p[k]) | ||
663 | OPVb(2,val+x2p[k]) | ||
664 | OPVb(3,val-x2p[k]) | ||
665 | OPVb(4,cpow(val,x2p[k])) | ||
666 | OPVb(5,cpow(x2p[k],val)) | ||
667 | default: ERROR(BAD_CODE); | ||
668 | } | ||
669 | } | ||
670 | |||
671 | |||
672 | int mapValQ(int code, complex* pval, KQVEC(x), QVEC(r)) { | ||
673 | TCF* x2p = (TCF*)xp; | ||
674 | TCF* r2p = (TCF*)rp; | ||
675 | int k; | ||
676 | TCF val = *(TCF*)pval; | ||
677 | REQUIRES(xn == rn,BAD_SIZE); | ||
678 | DEBUGMSG("mapValQ"); | ||
679 | switch (code) { | ||
680 | OPVb(0,val*x2p[k]) | ||
681 | OPVb(1,val/x2p[k]) | ||
682 | OPVb(2,val+x2p[k]) | ||
683 | OPVb(3,val-x2p[k]) | ||
684 | OPVb(4,cpow(val,x2p[k])) | ||
685 | OPVb(5,cpow(x2p[k],val)) | ||
686 | default: ERROR(BAD_CODE); | ||
687 | } | ||
688 | } | ||
689 | |||
690 | |||
691 | |||
692 | #define OPZE(C,msg,E) case C: {DEBUGMSG(msg) for(k=0;k<an;k++) rp[k] = E(ap[k],bp[k]); OK } | ||
693 | #define OPZV(C,msg,E) case C: {DEBUGMSG(msg) res = E(V(r),V(b)); CHECK(res,res); OK } | ||
694 | #define OPZO(C,msg,O) case C: {DEBUGMSG(msg) for(k=0;k<an;k++) rp[k] = ap[k] O bp[k]; OK } | ||
695 | |||
696 | int zipR(int code, KDVEC(a), KDVEC(b), DVEC(r)) { | ||
697 | REQUIRES(an == bn && an == rn, BAD_SIZE); | ||
698 | int k; | ||
699 | switch(code) { | ||
700 | OPZO(0,"zipR Add",+) | ||
701 | OPZO(1,"zipR Sub",-) | ||
702 | OPZO(2,"zipR Mul",*) | ||
703 | OPZO(3,"zipR Div",/) | ||
704 | OPZE(4,"zipR Pow", pow) | ||
705 | OPZE(5,"zipR ATan2",atan2) | ||
706 | default: ERROR(BAD_CODE); | ||
707 | } | ||
708 | } | ||
709 | |||
710 | int zipF(int code, KFVEC(a), KFVEC(b), FVEC(r)) { | ||
711 | REQUIRES(an == bn && an == rn, BAD_SIZE); | ||
712 | int k; | ||
713 | switch(code) { | ||
714 | OPZO(0,"zipR Add",+) | ||
715 | OPZO(1,"zipR Sub",-) | ||
716 | OPZO(2,"zipR Mul",*) | ||
717 | OPZO(3,"zipR Div",/) | ||
718 | OPZE(4,"zipR Pow", pow) | ||
719 | OPZE(5,"zipR ATan2",atan2) | ||
720 | default: ERROR(BAD_CODE); | ||
721 | } | ||
722 | } | ||
723 | |||
724 | |||
725 | int zipI(int code, KIVEC(a), KIVEC(b), IVEC(r)) { | ||
726 | REQUIRES(an == bn && an == rn, BAD_SIZE); | ||
727 | int k; | ||
728 | switch(code) { | ||
729 | OPZO(0,"zipI Add",+) | ||
730 | OPZO(1,"zipI Sub",-) | ||
731 | OPZO(2,"zipI Mul",*) | ||
732 | OPZO(3,"zipI Div",/) | ||
733 | OPZO(6,"zipI Mod",%) | ||
734 | default: ERROR(BAD_CODE); | ||
735 | } | ||
736 | } | ||
737 | |||
738 | |||
739 | |||
740 | #define OPZOb(C,msg,O) case C: {DEBUGMSG(msg) for(k=0;k<an;k++) r2p[k] = a2p[k] O b2p[k]; OK } | ||
741 | #define OPZEb(C,msg,E) case C: {DEBUGMSG(msg) for(k=0;k<an;k++) r2p[k] = E(a2p[k],b2p[k]); OK } | ||
742 | int zipC(int code, KCVEC(a), KCVEC(b), CVEC(r)) { | ||
743 | REQUIRES(an == bn && an == rn, BAD_SIZE); | ||
744 | TCD* a2p = (TCD*)ap; | ||
745 | TCD* b2p = (TCD*)bp; | ||
746 | TCD* r2p = (TCD*)rp; | ||
747 | int k; | ||
748 | switch(code) { | ||
749 | OPZOb(0,"zipC Add",+) | ||
750 | OPZOb(1,"zipC Sub",-) | ||
751 | OPZOb(2,"zipC Mul",*) | ||
752 | OPZOb(3,"zipC Div",/) | ||
753 | OPZEb(4,"zipC Pow",cpow) | ||
754 | default: ERROR(BAD_CODE); | ||
755 | } | ||
756 | } | ||
757 | |||
758 | |||
759 | |||
760 | |||
761 | |||
762 | #define OPCZE(C,msg,E) case C: {DEBUGMSG(msg) for(k=0;k<an;k++) rp[k] = complex_f_math_op(&E,ap[k],bp[k]); OK } | ||
763 | |||
764 | int zipQ(int code, KQVEC(a), KQVEC(b), QVEC(r)) { | ||
765 | REQUIRES(an == bn && an == rn, BAD_SIZE); | ||
766 | TCF* a2p = (TCF*)ap; | ||
767 | TCF* b2p = (TCF*)bp; | ||
768 | TCF* r2p = (TCF*)rp; | ||
769 | |||
770 | int k; | ||
771 | switch(code) { | ||
772 | OPZOb(0,"zipC Add",+) | ||
773 | OPZOb(1,"zipC Sub",-) | ||
774 | OPZOb(2,"zipC Mul",*) | ||
775 | OPZOb(3,"zipC Div",/) | ||
776 | OPZEb(4,"zipC Pow",cpowf) | ||
777 | default: ERROR(BAD_CODE); | ||
778 | } | ||
779 | } | ||
780 | |||
781 | //////////////////////////////////////////////////////////////////////////////// | ||
782 | |||
783 | int vectorScan(char * file, int* n, double**pp){ | ||
784 | FILE * fp; | ||
785 | fp = fopen (file, "r"); | ||
786 | if(!fp) { | ||
787 | ERROR(BAD_FILE); | ||
788 | } | ||
789 | int nbuf = 100*100; | ||
790 | double * p = (double*)malloc(nbuf*sizeof(double)); | ||
791 | int k=0; | ||
792 | double d; | ||
793 | int ok; | ||
794 | for (;;) { | ||
795 | ok = fscanf(fp,"%lf",&d); | ||
796 | if (ok<1) { | ||
797 | break; | ||
798 | } | ||
799 | if (k==nbuf) { | ||
800 | nbuf = nbuf * 2; | ||
801 | p = (double*)realloc(p,nbuf*sizeof(double)); | ||
802 | // printf("R\n"); | ||
803 | } | ||
804 | p[k++] = d; | ||
805 | } | ||
806 | *n = k; | ||
807 | *pp = p; | ||
808 | fclose(fp); | ||
809 | OK | ||
810 | } | ||
811 | |||
812 | int saveMatrix(char * file, char * format, KDMAT(a)){ | ||
813 | FILE * fp; | ||
814 | fp = fopen (file, "w"); | ||
815 | int r, c; | ||
816 | for (r=0;r<ar; r++) { | ||
817 | for (c=0; c<ac; c++) { | ||
818 | fprintf(fp,format,ap[r*ac+c]); | ||
819 | if (c<ac-1) { | ||
820 | fprintf(fp," "); | ||
821 | } else { | ||
822 | fprintf(fp,"\n"); | ||
823 | } | ||
824 | } | ||
825 | } | ||
826 | fclose(fp); | ||
827 | OK | ||
828 | } | ||
829 | |||
830 | //////////////////////////////////////////////////////////////////////////////// | ||
831 | |||
832 | #if defined (__APPLE__) || (__FreeBSD__) | ||
833 | /* FreeBSD and Mac OS X do not provide random_r(), thread safety cannot be | ||
834 | guaranteed. | ||
835 | For FreeBSD and Mac OS X, nrand48() is much better than random(). | ||
836 | See: http://www.evanjones.ca/random-thread-safe.html | ||
837 | */ | ||
838 | #pragma message "randomVector is not thread-safe in OSX and FreeBSD" | ||
839 | |||
840 | inline double urandom() { | ||
841 | /* the probalility of matching will be theoretically p^3(in fact, it is not) | ||
842 | p is matching probalility of random(). | ||
843 | using the test there, only 3 matches, using random(), 13783 matches | ||
844 | */ | ||
845 | unsigned short state[3]; | ||
846 | state[0] = random(); | ||
847 | state[1] = random(); | ||
848 | state[2] = random(); | ||
849 | |||
850 | const long max_random = 2147483647; // 2**31 - 1 | ||
851 | return (double)nrand48(state) / (double)max_random; | ||
852 | } | ||
853 | |||
854 | double gaussrand(int *phase, double *pV1, double *pV2, double *pS) | ||
855 | { | ||
856 | double V1=*pV1, V2=*pV2, S=*pS; | ||
857 | double X; | ||
858 | |||
859 | if(*phase == 0) { | ||
860 | do { | ||
861 | double U1 = urandom(); | ||
862 | double U2 = urandom(); | ||
863 | |||
864 | V1 = 2 * U1 - 1; | ||
865 | V2 = 2 * U2 - 1; | ||
866 | S = V1 * V1 + V2 * V2; | ||
867 | } while(S >= 1 || S == 0); | ||
868 | |||
869 | X = V1 * sqrt(-2 * log(S) / S); | ||
870 | } else | ||
871 | X = V2 * sqrt(-2 * log(S) / S); | ||
872 | |||
873 | *phase = 1 - *phase; | ||
874 | *pV1=V1; *pV2=V2; *pS=S; | ||
875 | |||
876 | return X; | ||
877 | |||
878 | } | ||
879 | |||
880 | int random_vector(unsigned int seed, int code, DVEC(r)) { | ||
881 | int phase = 0; | ||
882 | double V1,V2,S; | ||
883 | |||
884 | srandom(seed); | ||
885 | |||
886 | int k; | ||
887 | switch (code) { | ||
888 | case 0: { // uniform | ||
889 | for (k=0; k<rn; k++) { | ||
890 | rp[k] = urandom(); | ||
891 | } | ||
892 | OK | ||
893 | } | ||
894 | case 1: { // gaussian | ||
895 | for (k=0; k<rn; k++) { | ||
896 | rp[k] = gaussrand(&phase,&V1,&V2,&S); | ||
897 | } | ||
898 | OK | ||
899 | } | ||
900 | |||
901 | default: ERROR(BAD_CODE); | ||
902 | } | ||
903 | } | ||
904 | |||
905 | #else | ||
906 | |||
907 | inline double urandom(struct random_data * buffer) { | ||
908 | int32_t res; | ||
909 | random_r(buffer,&res); | ||
910 | return (double)res/RAND_MAX; | ||
911 | } | ||
912 | |||
913 | |||
914 | // http://c-faq.com/lib/gaussian.html | ||
915 | double gaussrand(struct random_data *buffer, | ||
916 | int *phase, double *pV1, double *pV2, double *pS) | ||
917 | { | ||
918 | double V1=*pV1, V2=*pV2, S=*pS; | ||
919 | double X; | ||
920 | |||
921 | if(*phase == 0) { | ||
922 | do { | ||
923 | double U1 = urandom(buffer); | ||
924 | double U2 = urandom(buffer); | ||
925 | |||
926 | V1 = 2 * U1 - 1; | ||
927 | V2 = 2 * U2 - 1; | ||
928 | S = V1 * V1 + V2 * V2; | ||
929 | } while(S >= 1 || S == 0); | ||
930 | |||
931 | X = V1 * sqrt(-2 * log(S) / S); | ||
932 | } else | ||
933 | X = V2 * sqrt(-2 * log(S) / S); | ||
934 | |||
935 | *phase = 1 - *phase; | ||
936 | *pV1=V1; *pV2=V2; *pS=S; | ||
937 | |||
938 | return X; | ||
939 | |||
940 | } | ||
941 | |||
942 | int random_vector(unsigned int seed, int code, DVEC(r)) { | ||
943 | struct random_data buffer; | ||
944 | char random_state[128]; | ||
945 | memset(&buffer, 0, sizeof(struct random_data)); | ||
946 | memset(random_state, 0, sizeof(random_state)); | ||
947 | |||
948 | initstate_r(seed,random_state,sizeof(random_state),&buffer); | ||
949 | // setstate_r(random_state,&buffer); | ||
950 | // srandom_r(seed,&buffer); | ||
951 | |||
952 | int phase = 0; | ||
953 | double V1,V2,S; | ||
954 | |||
955 | int k; | ||
956 | switch (code) { | ||
957 | case 0: { // uniform | ||
958 | for (k=0; k<rn; k++) { | ||
959 | rp[k] = urandom(&buffer); | ||
960 | } | ||
961 | OK | ||
962 | } | ||
963 | case 1: { // gaussian | ||
964 | for (k=0; k<rn; k++) { | ||
965 | rp[k] = gaussrand(&buffer,&phase,&V1,&V2,&S); | ||
966 | } | ||
967 | OK | ||
968 | } | ||
969 | |||
970 | default: ERROR(BAD_CODE); | ||
971 | } | ||
972 | } | ||
973 | |||
974 | #endif | ||
975 | |||
976 | //////////////////////////////////////////////////////////////////////////////// | ||
977 | |||
978 | int smXv(KDVEC(vals),KIVEC(cols),KIVEC(rows),KDVEC(x),DVEC(r)) { | ||
979 | int r, c; | ||
980 | for (r = 0; r < rowsn - 1; r++) { | ||
981 | rp[r] = 0; | ||
982 | for (c = rowsp[r]; c < rowsp[r+1]; c++) { | ||
983 | rp[r] += valsp[c-1] * xp[colsp[c-1]-1]; | ||
984 | } | ||
985 | } | ||
986 | OK | ||
987 | } | ||
988 | |||
989 | int smTXv(KDVEC(vals),KIVEC(cols),KIVEC(rows),KDVEC(x),DVEC(r)) { | ||
990 | int r,c; | ||
991 | for (c = 0; c < rn; c++) { | ||
992 | rp[c] = 0; | ||
993 | } | ||
994 | for (r = 0; r < rowsn - 1; r++) { | ||
995 | for (c = rowsp[r]; c < rowsp[r+1]; c++) { | ||
996 | rp[colsp[c-1]-1] += valsp[c-1] * xp[r]; | ||
997 | } | ||
998 | } | ||
999 | OK | ||
1000 | } | ||
1001 | |||
1002 | //////////////////////////////////////////////////////////////////////////////// | ||
1003 | |||
1004 | int | ||
1005 | compare_doubles (const void *a, const void *b) { | ||
1006 | return *(double*)a > *(double*)b; | ||
1007 | } | ||
1008 | |||
1009 | int sort_valuesD(KDVEC(v),DVEC(r)) { | ||
1010 | memcpy(rp,vp,vn*sizeof(double)); | ||
1011 | qsort(rp,rn,sizeof(double),compare_doubles); | ||
1012 | OK | ||
1013 | } | ||
1014 | |||
1015 | int | ||
1016 | compare_floats (const void *a, const void *b) { | ||
1017 | return *(float*)a > *(float*)b; | ||
1018 | } | ||
1019 | |||
1020 | int sort_valuesF(KFVEC(v),FVEC(r)) { | ||
1021 | memcpy(rp,vp,vn*sizeof(float)); | ||
1022 | qsort(rp,rn,sizeof(float),compare_floats); | ||
1023 | OK | ||
1024 | } | ||
1025 | |||
1026 | int | ||
1027 | compare_ints(const void *a, const void *b) { | ||
1028 | return *(int*)a > *(int*)b; | ||
1029 | } | ||
1030 | |||
1031 | int sort_valuesI(KIVEC(v),IVEC(r)) { | ||
1032 | memcpy(rp,vp,vn*sizeof(int)); | ||
1033 | qsort(rp,rn,sizeof(int),compare_ints); | ||
1034 | OK | ||
1035 | } | ||
1036 | |||
1037 | //////////////////////////////////////// | ||
1038 | |||
1039 | |||
1040 | #define SORTIDX_IMP(T,C) \ | ||
1041 | T* x = (T*)malloc(sizeof(T)*vn); \ | ||
1042 | int k; \ | ||
1043 | for (k=0;k<vn;k++) { \ | ||
1044 | x[k].pos = k; \ | ||
1045 | x[k].val = vp[k]; \ | ||
1046 | } \ | ||
1047 | \ | ||
1048 | qsort(x,vn,sizeof(T),C); \ | ||
1049 | \ | ||
1050 | for (k=0;k<vn;k++) { \ | ||
1051 | rp[k] = x[k].pos; \ | ||
1052 | } \ | ||
1053 | free(x); \ | ||
1054 | OK | ||
1055 | |||
1056 | |||
1057 | typedef struct SDI { int pos; double val;} DI; | ||
1058 | |||
1059 | int compare_doubles_i (const void *a, const void *b) { | ||
1060 | return ((DI*)a)->val > ((DI*)b)->val; | ||
1061 | } | ||
1062 | |||
1063 | int sort_indexD(KDVEC(v),IVEC(r)) { | ||
1064 | SORTIDX_IMP(DI,compare_doubles_i) | ||
1065 | } | ||
1066 | |||
1067 | |||
1068 | typedef struct FI { int pos; float val;} FI; | ||
1069 | |||
1070 | int compare_floats_i (const void *a, const void *b) { | ||
1071 | return ((FI*)a)->val > ((FI*)b)->val; | ||
1072 | } | ||
1073 | |||
1074 | int sort_indexF(KFVEC(v),IVEC(r)) { | ||
1075 | SORTIDX_IMP(FI,compare_floats_i) | ||
1076 | } | ||
1077 | |||
1078 | |||
1079 | typedef struct II { int pos; int val;} II; | ||
1080 | |||
1081 | int compare_ints_i (const void *a, const void *b) { | ||
1082 | return ((II*)a)->val > ((II*)b)->val; | ||
1083 | } | ||
1084 | |||
1085 | int sort_indexI(KIVEC(v),IVEC(r)) { | ||
1086 | SORTIDX_IMP(II,compare_ints_i) | ||
1087 | } | ||
1088 | |||
1089 | |||
1090 | //////////////////////////////////////////////////////////////////////////////// | ||
1091 | |||
1092 | int round_vector(KDVEC(v),DVEC(r)) { | ||
1093 | int k; | ||
1094 | for(k=0; k<vn; k++) { | ||
1095 | rp[k] = round(vp[k]); | ||
1096 | } | ||
1097 | OK | ||
1098 | } | ||
1099 | |||
1100 | //////////////////////////////////////////////////////////////////////////////// | ||
1101 | |||
1102 | int round_vector_i(KDVEC(v),IVEC(r)) { | ||
1103 | int k; | ||
1104 | for(k=0; k<vn; k++) { | ||
1105 | rp[k] = round(vp[k]); | ||
1106 | } | ||
1107 | OK | ||
1108 | } | ||
1109 | |||
1110 | |||
1111 | int mod_vector(int m, KIVEC(v), IVEC(r)) { | ||
1112 | int k; | ||
1113 | for(k=0; k<vn; k++) { | ||
1114 | rp[k] = vp[k] % m; | ||
1115 | } | ||
1116 | OK | ||
1117 | } | ||
1118 | |||
1119 | int div_vector(int m, KIVEC(v), IVEC(r)) { | ||
1120 | int k; | ||
1121 | for(k=0; k<vn; k++) { | ||
1122 | rp[k] = vp[k] / m; | ||
1123 | } | ||
1124 | OK | ||
1125 | } | ||
1126 | |||
1127 | int range_vector(IVEC(r)) { | ||
1128 | int k; | ||
1129 | for(k=0; k<rn; k++) { | ||
1130 | rp[k] = k; | ||
1131 | } | ||
1132 | OK | ||
1133 | } | ||
1134 | |||