Context Navigation

matrix.c @ 103c026

Visit:

stereo-2025

Last change on this file since 103c026 was 103c026, checked in by Olly Betts <olly@…>, 12 months ago

Store stn_tab index in stn->colour for matrix build

This avoids a linear search for every station to find the index
while building the matrix (though this doesn't change doesn't
improve the O() behaviour of the matrix build).

Property mode set to 100644

File size: 12.2 KB

Rev	Line
[421b7d2]	1	/* matrix.c
[d1b1380]	2	* Matrix building and solving routines
[a4adf09]	3	* Copyright (C) 1993-2003,2010,2013 Olly Betts
[846746e]	4	*
[89231c4]	5	* This program is free software; you can redistribute it and/or modify
	6	* it under the terms of the GNU General Public License as published by
	7	* the Free Software Foundation; either version 2 of the License, or
	8	* (at your option) any later version.
[846746e]	9	*
	10	* This program is distributed in the hope that it will be useful,
	11	* but WITHOUT ANY WARRANTY; without even the implied warranty of
[89231c4]	12	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	13	* GNU General Public License for more details.
[846746e]	14	*
[89231c4]	15	* You should have received a copy of the GNU General Public License
	16	* along with this program; if not, write to the Free Software
[ecbc6c18]	17	* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
[d1b1380]	18	*/
	19
[2164fa4]	20	/#define SOR 1/
[702f518]	21
[032ed06]	22	#if 0
	23	# define DEBUG_INVALID 1
	24	#endif
	25
[4c83f84]	26	#include <config.h>
[d1b1380]	27
	28	#include "debug.h"
[a420b49]	29	#include "cavern.h"
[c082b69]	30	#include "filename.h"
	31	#include "message.h"
[d1b1380]	32	#include "netbits.h"
	33	#include "matrix.h"
	34	#include "out.h"
	35
	36	#undef PRINT_MATRICES
	37	#define PRINT_MATRICES 0
	38
	39	#undef DEBUG_MATRIX_BUILD
	40	#define DEBUG_MATRIX_BUILD 0
	41
	42	#undef DEBUG_MATRIX
	43	#define DEBUG_MATRIX 0
	44
	45	#if PRINT_MATRICES
[9965b2b]	46	static void print_matrix(real M, real B, long n);
[d1b1380]	47	#endif
	48
[9965b2b]	49	static void choleski(real M, real B, long n);
[3fde384f]	50
[d1b1380]	51	#ifdef SOR
[9965b2b]	52	static void sor(real M, real B, long n);
[d1b1380]	53	#endif
	54
[a420b49]	55	/* for M(row, col) col must be <= row, so Y <= X */
[9965b2b]	56	# define M(X, Y) ((real )M)[((((OSSIZE_T)(X)) ((X) + 1)) >> 1) + (Y)]
[421b7d2]	57	/* +(Y>X?0printf("row<col (line %d)\n",__LINE__):0) /
[9965b2b]	58	/#define M_(X, Y) ((real )M)[((((OSSIZE_T)(Y)) * ((Y) + 1)) >> 1) + (X)]*/
[d1b1380]	59
[eb18f4d]	60	static void build_matrix(node *list);
[d1b1380]	61
	62	static long n_stn_tab;
	63
[c19f129]	64	static pos **stn_tab;
[d1b1380]	65
[032ed06]	66	extern void
[d9b5db53]	67	solve_matrix(node *list)
[032ed06]	68	{
	69	node *stn;
[702f518]	70	long n = 0;
[d9b5db53]	71	FOR_EACH_STN(stn, list) {
[103c026]	72	if (!fixed(stn))
	73	n++;
[032ed06]	74	}
	75	if (n == 0) return;
	76
[86907b0]	77	/* We need to allocate stn_tab with one entry per unfixed cluster of equated
	78	* stations, but it's much simpler to count the number of unfixed nodes.
	79	* This will over-count stations with more than 3 legs and equated stations
	80	* but in a typical survey that's a small minority of stations.
[032ed06]	81	*/
[66de220]	82	stn_tab = osmalloc((OSSIZE_T)(n * ossizeof(pos*)));
[4f613e0]	83	n_stn_tab = 0;
[cb3d1e2]	84
[103c026]	85	/* We store the stn_tab index in stn->colour for quick and easy lookup in
	86	* build_matrix().
	87	*/
[d9b5db53]	88	FOR_EACH_STN(stn, list) {
[103c026]	89	if (!fixed(stn)) {
	90	int i;
	91	pos *p = stn->name->pos;
	92	for (i = 0; i < n_stn_tab; i++) {
	93	if (stn_tab[i] == p)
	94	break;
	95	}
	96	if (i == n_stn_tab)
	97	stn_tab[n_stn_tab++] = p;
	98	stn->colour = i;
	99	} else {
	100	stn->colour = -1;
	101	}
[032ed06]	102	}
	103
[eb18f4d]	104	build_matrix(list);
[2c9c3ff]	105	#if DEBUG_MATRIX
[2164fa4]	106	FOR_EACH_STN(stn, list) {
[2aa930f]	107	printf("(%8.2f, %8.2f, %8.2f ) ", POS(stn, 0), POS(stn, 1), POS(stn, 2));
[2164fa4]	108	print_prefix(stn->name);
[2aa930f]	109	putnl();
[2164fa4]	110	}
[2c9c3ff]	111	#endif
[4f613e0]	112
	113	osfree(stn_tab);
[032ed06]	114	}
[d1b1380]	115
[3fde384f]	116	#ifdef NO_COVARIANCES
[702f518]	117	# define FACTOR 1
[3fde384f]	118	#else
[702f518]	119	# define FACTOR 3
[3fde384f]	120	#endif
	121
[a420b49]	122	static void
[eb18f4d]	123	build_matrix(node *list)
[a420b49]	124	{
[eb18f4d]	125	if (n_stn_tab == 0) {
[5b68ae1]	126	if (!fQuiet)
	127	puts(msg(/Network solved by reduction - no simultaneous equations to solve./74));
[dbd68203]	128	return;
	129	}
[eb18f4d]	130	/* (OSSIZE_T) cast may be needed if n_stn_tab>=181 */
[5bb3dc4]	131	real M = osmalloc((OSSIZE_T)((((OSSIZE_T)n_stn_tab FACTOR * (n_stn_tab * FACTOR + 1)) >> 1)) * ossizeof(real));
	132	real B = osmalloc((OSSIZE_T)(n_stn_tab FACTOR * ossizeof(real)));
[dbd68203]	133
[647407d]	134	if (!fQuiet) {
[a4adf09]	135	if (n_stn_tab == 1)
	136	out_current_action(msg(/Solving one equation/78));
	137	else
	138	out_current_action1(msg(/Solving %d simultaneous equations/75), n_stn_tab);
[dbd68203]	139	}
	140
[3fde384f]	141	#ifdef NO_COVARIANCES
[5bb3dc4]	142	int dim = 2;
[3fde384f]	143	#else
[5bb3dc4]	144	int dim = 0; /* fudge next loop for now */
[3fde384f]	145	#endif
[a420b49]	146	for ( ; dim >= 0; dim--) {
[2164fa4]	147	node *stn;
	148	int row;
	149
[907fe10]	150	/* Initialise M and B to zero - zeroing "linearly" will minimise
[421b7d2]	151	* paging when the matrix is large */
[66de220]	152	{
	153	int end = n_stn_tab * FACTOR;
	154	for (row = 0; row < end; row++) B[row] = (real)0.0;
	155	end = ((OSSIZE_T)n_stn_tab * FACTOR * (n_stn_tab * FACTOR + 1)) >> 1;
	156	for (row = 0; row < end; row++) M[row] = (real)0.0;
	157	}
[dbd68203]	158
[3c7ab9a]	159	/* Construct matrix by going through the stn list.
[421b7d2]	160	*
[907fe10]	161	* All legs between two fixed stations can be ignored here.
[421b7d2]	162	*
[3c7ab9a]	163	* Other legs we want to add exactly once to M. To achieve this we
	164	* wan to:
	165	*
	166	* - add forward legs between two unfixed stations,
	167	*
	168	* - add legs from unfixed stations to fixed stations (we do them from
	169	* the unfixed end so we don't need to detect when we're at a fixed
	170	* point cut line and determine which side we're currently dealing
	171	* with).
	172	*
	173	* To implement this, we only look at legs from unfixed stations and add
	174	* a leg if to a fixed station, or to an unfixed station and it's a
	175	* forward leg.
	176	*/
[d9b5db53]	177	FOR_EACH_STN(stn, list) {
[2164fa4]	178	#ifdef NO_COVARIANCES
	179	real e;
	180	#else
[dac18d8]	181	svar e;
[eb18f4d]	182	delta a;
[2164fa4]	183	#endif
[b5d3988]	184	#if DEBUG_MATRIX_BUILD
[dbd68203]	185	print_prefix(stn->name);
[b5d3988]	186	printf(" used: %d colour %ld\n",
[a420b49]	187	(!!stn->leg[2]) << 2 \| (!!stn -> leg[1]) << 1 \| (!!stn->leg[0]),
[b5d3988]	188	stn->colour);
[3fde384f]	189
[5bb3dc4]	190	for (int dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
[b5d3988]	191	#ifdef NO_COVARIANCES
[907fe10]	192	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
	193	stn->leg[dirn]->v[0], stn->leg[dirn]->l.reverse);
[b5d3988]	194	#else
[907fe10]	195	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
	196	stn->leg[dirn]->v[0][0], stn->leg[dirn]->l.reverse);
[b5d3988]	197	#endif
[907fe10]	198	print_prefix(stn->leg[dirn]->l.to->name);
	199	putnl();
	200	}
[dbd68203]	201	putnl();
[d1b1380]	202	#endif /* DEBUG_MATRIX_BUILD */
[b5d3988]	203
[907fe10]	204	if (!fixed(stn)) {
[103c026]	205	int f = stn->colour;
[5bb3dc4]	206	for (int dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
[907fe10]	207	linkfor *leg = stn->leg[dirn];
	208	node *to = leg->l.to;
	209	if (fixed(to)) {
	210	bool fRev = !data_here(leg);
	211	if (fRev) leg = reverse_leg(leg);
	212	/* Ignore equated nodes */
[3fde384f]	213	#ifdef NO_COVARIANCES
[907fe10]	214	e = leg->v[dim];
	215	if (e != (real)0.0) {
	216	e = ((real)1.0) / e;
	217	M(f,f) += e;
[f52dcc7]	218	B[f] += e * POS(to, dim);
[907fe10]	219	if (fRev) {
[f52dcc7]	220	B[f] += leg->d[dim];
[907fe10]	221	} else {
[f52dcc7]	222	B[f] -= leg->d[dim];
[564f471]	223	}
[907fe10]	224	}
[3fde384f]	225	#else
[907fe10]	226	if (invert_svar(&e, &leg->v)) {
	227	if (fRev) {
	228	adddd(&a, &POSD(to), &leg->d);
	229	} else {
	230	subdd(&a, &POSD(to), &leg->d);
	231	}
[5bb3dc4]	232	delta b;
[907fe10]	233	mulsd(&b, &e, &a);
[5bb3dc4]	234	for (int i = 0; i < 3; i++) {
[907fe10]	235	M(f * FACTOR + i, f * FACTOR + i) += e[i];
	236	B[f * FACTOR + i] += b[i];
[564f471]	237	}
[907fe10]	238	M(f * FACTOR + 1, f * FACTOR) += e[3];
	239	M(f * FACTOR + 2, f * FACTOR) += e[4];
	240	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
	241	}
[3fde384f]	242	#endif
[907fe10]	243	} else if (data_here(leg)) {
	244	/* forward leg, unfixed -> unfixed */
[103c026]	245	int t = to->colour;
[d1b1380]	246	#if DEBUG_MATRIX
[907fe10]	247	printf("Leg %d to %d, var %f, delta %f\n", f, t, e,
	248	leg->d[dim]);
[d1b1380]	249	#endif
[907fe10]	250	/* Ignore equated nodes & lollipops */
[3fde384f]	251	#ifdef NO_COVARIANCES
[907fe10]	252	e = leg->v[dim];
	253	if (t != f && e != (real)0.0) {
	254	e = ((real)1.0) / e;
	255	M(f,f) += e;
	256	M(t,t) += e;
	257	if (f < t) M(t,f) -= e; else M(f,t) -= e;
[5bb3dc4]	258	real a = e * leg->d[dim];
[907fe10]	259	B[f] -= a;
	260	B[t] += a;
	261	}
[3fde384f]	262	#else
[907fe10]	263	if (t != f && invert_svar(&e, &leg->v)) {
	264	mulsd(&a, &e, &leg->d);
[5bb3dc4]	265	for (int i = 0; i < 3; i++) {
[907fe10]	266	M(f * FACTOR + i, f * FACTOR + i) += e[i];
	267	M(t * FACTOR + i, t * FACTOR + i) += e[i];
	268	if (f < t)
	269	M(t * FACTOR + i, f * FACTOR + i) -= e[i];
	270	else
	271	M(f * FACTOR + i, t * FACTOR + i) -= e[i];
	272	B[f * FACTOR + i] -= a[i];
	273	B[t * FACTOR + i] += a[i];
	274	}
	275	M(f * FACTOR + 1, f * FACTOR) += e[3];
	276	M(t * FACTOR + 1, t * FACTOR) += e[3];
	277	M(f * FACTOR + 2, f * FACTOR) += e[4];
	278	M(t * FACTOR + 2, t * FACTOR) += e[4];
	279	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
	280	M(t * FACTOR + 2, t * FACTOR + 1) += e[5];
	281	if (f < t) {
	282	M(t * FACTOR + 1, f * FACTOR) -= e[3];
	283	M(t * FACTOR, f * FACTOR + 1) -= e[3];
	284	M(t * FACTOR + 2, f * FACTOR) -= e[4];
	285	M(t * FACTOR, f * FACTOR + 2) -= e[4];
	286	M(t * FACTOR + 2, f * FACTOR + 1) -= e[5];
	287	M(t * FACTOR + 1, f * FACTOR + 2) -= e[5];
	288	} else {
	289	M(f * FACTOR + 1, t * FACTOR) -= e[3];
	290	M(f * FACTOR, t * FACTOR + 1) -= e[3];
	291	M(f * FACTOR + 2, t * FACTOR) -= e[4];
	292	M(f * FACTOR, t * FACTOR + 2) -= e[4];
	293	M(f * FACTOR + 2, t * FACTOR + 1) -= e[5];
	294	M(f * FACTOR + 1, t * FACTOR + 2) -= e[5];
[dbd68203]	295	}
	296	}
[907fe10]	297	#endif
[564f471]	298	}
[907fe10]	299	}
[dbd68203]	300	}
[d1b1380]	301	}
	302
	303	#if PRINT_MATRICES
[eb18f4d]	304	print_matrix(M, B, n_stn_tab * FACTOR); /* 'ave a look! */
[d1b1380]	305	#endif
	306
	307	#ifdef SOR
[032ed06]	308	/* defined in network.c, may be altered by -z<letters> on command line */
[a420b49]	309	if (optimize & BITA('i'))
[eb18f4d]	310	sor(M, B, n_stn_tab * FACTOR);
[dbd68203]	311	else
[d1b1380]	312	#endif
[eb18f4d]	313	choleski(M, B, n_stn_tab * FACTOR);
[d1b1380]	314
[dbd68203]	315	{
[5bb3dc4]	316	for (int m = (int)(n_stn_tab - 1); m >= 0; m--) {
[3fde384f]	317	#ifdef NO_COVARIANCES
[c19f129]	318	stn_tab[m]->p[dim] = B[m];
[032ed06]	319	if (dim == 0) {
[4c07c51]	320	SVX_ASSERT2(pos_fixed(stn_tab[m]),
[032ed06]	321	"setting station coordinates didn't mark pos as fixed");
	322	}
[3fde384f]	323	#else
[5bb3dc4]	324	for (int i = 0; i < 3; i++) {
[c19f129]	325	stn_tab[m]->p[i] = B[m * FACTOR + i];
[702f518]	326	}
[4c07c51]	327	SVX_ASSERT2(pos_fixed(stn_tab[m]),
[032ed06]	328	"setting station coordinates didn't mark pos as fixed");
[3fde384f]	329	#endif
[a420b49]	330	}
[d1b1380]	331	#if EXPLICIT_FIXED_FLAG
[5bb3dc4]	332	for (int m = n_stn_tab - 1; m >= 0; m--) fixpos(stn_tab[m]);
[d1b1380]	333	#endif
[dbd68203]	334	}
	335	}
	336	osfree(B);
	337	osfree(M);
[d1b1380]	338	}
	339
[702f518]	340	/* Solve MX=B for X by Choleski factorisation - modified Choleski actually
	341	* since we factor into LDL' while Choleski is just LL'
	342	*/
[d1b1380]	343	/* Note M must be symmetric positive definite */
	344	/* routine is entitled to scribble on M and B if it wishes */
[a420b49]	345	static void
[9965b2b]	346	choleski(real M, real B, long n)
[a420b49]	347	{
[5bb3dc4]	348	for (int j = 1; j < n; j++) {
[3fde384f]	349	real V;
[5bb3dc4]	350	for (int i = 0; i < j; i++) {
[421b7d2]	351	V = (real)0.0;
[5bb3dc4]	352	for (int k = 0; k < i; k++) V += M(i,k) * M(j,k) * M(k,k);
[a420b49]	353	M(j,i) = (M(j,i) - V) / M(i,i);
[dbd68203]	354	}
	355	V = (real)0.0;
[5bb3dc4]	356	for (int k = 0; k < j; k++) V += M(j,k) * M(j,k) * M(k,k);
[3fde384f]	357	M(j,j) -= V; /* may be best to add M() last for numerical reasons too */
[dbd68203]	358	}
[d1b1380]	359
[dbd68203]	360	/* Multiply x by L inverse */
[5bb3dc4]	361	for (int i = 0; i < n - 1; i++) {
	362	for (int j = i + 1; j < n; j++) {
[dbd68203]	363	B[j] -= M(j,i) * B[i];
[3fde384f]	364	}
[dbd68203]	365	}
[d1b1380]	366
[dbd68203]	367	/* Multiply x by D inverse */
[5bb3dc4]	368	for (int i = 0; i < n; i++) {
[dbd68203]	369	B[i] /= M(i,i);
[3fde384f]	370	}
	371
	372	/* Multiply x by (L transpose) inverse */
[5bb3dc4]	373	for (int i = (int)(n - 1); i > 0; i--) {
	374	for (int j = i - 1; j >= 0; j--) {
[421b7d2]	375	B[j] -= M(i,j) * B[i];
[3fde384f]	376	}
[dbd68203]	377	}
[d1b1380]	378
[dbd68203]	379	/* printf("\n%ld/%ld\n\n",flops,flopsTot); */
[d1b1380]	380	}
	381
	382	#ifdef SOR
	383	/* factor to use for SOR (must have 1 <= SOR_factor < 2) */
[702f518]	384	#define SOR_factor 1.93 /* 1.95 */
[d1b1380]	385
	386	/* Solve MX=B for X by SOR of Gauss-Siedel */
	387	/* routine is entitled to scribble on M and B if it wishes */
[a420b49]	388	static void
[9965b2b]	389	sor(real M, real B, long n)
[a420b49]	390	{
[dbd68203]	391	long it = 0;
[d1b1380]	392
[5bb3dc4]	393	real X = osmalloc(n ossizeof(real));
[d1b1380]	394
[5bb3dc4]	395	const real threshold = 0.00001;
[d1b1380]	396
[647407d]	397	printf("reciprocating diagonal\n"); /* TRANSLATE */
[d1b1380]	398
[3fde384f]	399	/* munge diagonal so we can multiply rather than divide */
[5bb3dc4]	400	for (int row = n - 1; row >= 0; row--) {
[dbd68203]	401	M(row,row) = 1 / M(row,row);
[702f518]	402	X[row] = 0;
[dbd68203]	403	}
[d1b1380]	404
[647407d]	405	printf("starting iteration\n"); /* TRANSLATE */
[d1b1380]	406
[5bb3dc4]	407	real t;
[dbd68203]	408	do {
	409	/printf("");*/
	410	it++;
	411	t = 0.0;
[5bb3dc4]	412	for (int row = 0; row < n; row++) {
	413	real x = B[row];
	414	int col;
[a420b49]	415	for (col = 0; col < row; col++) x -= M(row,col) * X[col];
	416	for (col++; col < n; col++) x -= M(col,row) * X[col];
[dbd68203]	417	x *= M(row,row);
[5bb3dc4]	418	real delta = (x - X[row]) * SOR_factor;
[dbd68203]	419	X[row] += delta;
[5bb3dc4]	420	real t2 = fabs(delta);
[dbd68203]	421	if (t2 > t) t = t2;
	422	}
[702f518]	423	printf("% 6d: %8.6f\n", it, t);
[dbd68203]	424	} while (t >= threshold && it < 100000);
[d1b1380]	425
[dbd68203]	426	if (t >= threshold) {
	427	fprintf(stderr, "not converged after %ld iterations\n", it);
	428	BUG("iteration stinks");
	429	}
[d1b1380]	430
[647407d]	431	printf("%ld iterations\n", it); /* TRANSLATE */
[d1b1380]	432
	433	#if 0
[dbd68203]	434	putnl();
[5bb3dc4]	435	for (int row = n - 1; row >= 0; row--) {
[dbd68203]	436	t = 0.0;
[5bb3dc4]	437	for (int col = 0; col < row; col++) t += M(row, col) * X[col];
[a420b49]	438	t += X[row] / M(row, row);
	439	for (col = row + 1; col < n; col++)
	440	t += M(col, row) * X[col];
[b5d3988]	441	printf("[ %f %f ]\n", t, B[row]);
[dbd68203]	442	}
[d1b1380]	443	#endif
	444
[5bb3dc4]	445	for (int row = n - 1; row >= 0; row--) B[row] = X[row];
[d1b1380]	446
[dbd68203]	447	osfree(X);
[647407d]	448	printf("\ndone\n"); /* TRANSLATE */
[dbd68203]	449	}
[d1b1380]	450	#endif
	451
	452	#if PRINT_MATRICES
[a420b49]	453	static void
[9965b2b]	454	print_matrix(real M, real B, long n)
[a420b49]	455	{
[dbd68203]	456	printf("Matrix, M and vector, B:\n");
[5bb3dc4]	457	for (long row = 0; row < n; row++) {
	458	long col;
[a420b49]	459	for (col = 0; col <= row; col++) printf("%6.2f\t", M(row, col));
	460	for (; col <= n; col++) printf(" \t");
[dbd68203]	461	printf("\t%6.2f\n", B[row]);
	462	}
	463	putnl();
	464	return;
[d1b1380]	465	}
	466	#endif

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: git/src/matrix.c @ 103c026

Download in other formats: