Context Navigation

message.c @ 7bdf66d

Visit:

RELEASE/1.2, debug-ci, debug-ci-sanitisers, faster-cavernlog, log-select, stereo, stereo-2025, walls-data, walls-data-hanging-as-warning, warn-only-for-hanging-survey

Last change on this file since 7bdf66d was 7bdf66d, checked in by Olly Betts <olly@…>, 15 years ago

lib/messages.txt,src/: Remove things we no longer need now we've
dropped support for RISC OS and DOS.

git-svn-id: file:///home/survex-svn/survex/trunk@3505 4b37db11-9a0c-4f06-9ece-9ab7cdaee568

Property mode set to 100644

File size: 34.0 KB

Line
1	/* message.c
2	* Fairly general purpose message and error routines
3	* Copyright (C) 1993-2003,2004,2005,2006,2007,2010 Olly Betts
4	*
5	* This program is free software; you can redistribute it and/or modify
6	* it under the terms of the GNU General Public License as published by
7	* the Free Software Foundation; either version 2 of the License, or
8	* (at your option) any later version.
9	*
10	* This program is distributed in the hope that it will be useful,
11	* but WITHOUT ANY WARRANTY; without even the implied warranty of
12	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13	* GNU General Public License for more details.
14	*
15	* You should have received a copy of the GNU General Public License
16	* along with this program; if not, write to the Free Software
17	* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
18	*/
19
/*#define DEBUG 1*/
21
22	#ifdef HAVE_CONFIG_H
23	# include <config.h>
24	#endif
25
26	#include <stdio.h>
27	#include <stdlib.h>
28	#include <string.h>
29	#include <ctype.h>
30	#include <limits.h>
31	#include <errno.h>
32	#include <locale.h>
33
34	#include "cmdline.h"
35	#include "whichos.h"
36	#include "filename.h"
37	#include "message.h"
38	#include "osdepend.h"
39	#include "filelist.h"
40	#include "debug.h"
41
42	#ifdef AVEN
43	# include "aven.h"
44	#endif
45
46	#ifdef HAVE_SIGNAL
47	# ifdef HAVE_SETJMP_H
48	# include <setjmp.h>
49	static jmp_buf jmpbufSignal;
50	# include <signal.h>
51	# else
52	# undef HAVE_SIGNAL
53	# endif
54	#endif
55
56	#if OS_WIN32
57	# define WIN32_LEAN_AND_MEAN
58	# include <windows.h>
59	#elif OS_UNIX
60	# include <sys/types.h>
61	# include <sys/stat.h>
62	#endif
63
64	/* For funcs which want to be immune from messing around with different
65	* calling conventions */
66	#ifndef CDECL
67	# define CDECL
68	#endif
69
70	int msg_warnings = 0; /* keep track of how many warnings we've given */
71	int msg_errors = 0; /* and how many (non-fatal) errors */
72
73	/* in case osmalloc() fails before appname_copy is set up */
74	static const char *appname_copy = "anonymous program";
75
76	/* Path to use to look for executables (used by aven to find cavern). */
77	static const char *exe_pth = "";
78
79	/* error code for failed osmalloc and osrealloc calls */
80	static void
81	outofmem(OSSIZE_T size)
82	{
83	fatalerror(/Out of memory (couldn't find %lu bytes)./1,
84	(unsigned long)size);
85	}
86
87	#ifdef TOMBSTONES
88	#define TOMBSTONE_SIZE 16
89	static const char tombstone[TOMBSTONE_SIZE] = "012345\xfftombstone";
90	#endif
91
92	/* malloc with error catching if it fails. Also allows us to write special
93	* versions easily eg for MS Windows.
94	*/
95	void *
96	osmalloc(OSSIZE_T size)
97	{
98	void *p;
99	#ifdef TOMBSTONES
100	size += TOMBSTONE_SIZE * 2;
101	p = malloc(size);
102	#else
103	p = xosmalloc(size);
104	#endif
105	if (p == NULL) outofmem(size);
106	#ifdef TOMBSTONES
107	printf("osmalloc truep=%p truesize=%d\n", p, size);
108	memcpy(p, tombstone, TOMBSTONE_SIZE);
109	memcpy(p + size - TOMBSTONE_SIZE, tombstone, TOMBSTONE_SIZE);
110	(size_t )p = size;
111	p += TOMBSTONE_SIZE;
112	#endif
113	return p;
114	}
115
116	/* realloc with error catching if it fails. */
117	void *
118	osrealloc(void *p, OSSIZE_T size)
119	{
120	/* some pre-ANSI realloc implementations don't cope with a NULL pointer */
121	if (p == NULL) {
122	p = xosmalloc(size);
123	} else {
124	#ifdef TOMBSTONES
125	int true_size;
126	size += TOMBSTONE_SIZE * 2;
127	p -= TOMBSTONE_SIZE;
128	true_size = (size_t )p;
129	printf("osrealloc (in truep=%p truesize=%d)\n", p, true_size);
130	if (memcmp(p + sizeof(size_t), tombstone + sizeof(size_t),
131	TOMBSTONE_SIZE - sizeof(size_t)) != 0) {
132	printf("start tombstone for block %p, size %d corrupted!",
133	p + TOMBSTONE_SIZE, true_size - TOMBSTONE_SIZE * 2);
134	}
135	if (memcmp(p + true_size - TOMBSTONE_SIZE, tombstone,
136	TOMBSTONE_SIZE) != 0) {
137	printf("end tombstone for block %p, size %d corrupted!",
138	p + TOMBSTONE_SIZE, true_size - TOMBSTONE_SIZE * 2);
139	}
140	p = realloc(p, size);
141	if (p == NULL) outofmem(size);
142	printf("osrealloc truep=%p truesize=%d\n", p, size);
143	memcpy(p, tombstone, TOMBSTONE_SIZE);
144	memcpy(p + size - TOMBSTONE_SIZE, tombstone, TOMBSTONE_SIZE);
145	(size_t )p = size;
146	p += TOMBSTONE_SIZE;
147	#else
148	p = xosrealloc(p, size);
149	#endif
150	}
151	if (p == NULL) outofmem(size);
152	return p;
153	}
154
155	char *
156	osstrdup(const char *str)
157	{
158	char *p;
159	OSSIZE_T len;
160	len = strlen(str) + 1;
161	p = osmalloc(len);
162	memcpy(p, str, len);
163	return p;
164	}
165
/* osfree is usually just a macro in osalloc.h */
#ifdef TOMBSTONES
/* Debugging version of osfree(): check both tombstones around the block
 * (reporting any corruption on stdout) and then release it.
 *
 * p is a pointer returned by the tombstoning osmalloc()/osrealloc(), or
 * NULL, in which case nothing is done.
 */
void
osfree(void *p)
{
    unsigned char *raw;
    size_t true_size;

    if (!p) return;
    /* The true start of the block is TOMBSTONE_SIZE bytes before the
     * pointer handed out, and begins with the padded size. */
    raw = (unsigned char *)p - TOMBSTONE_SIZE;
    memcpy(&true_size, raw, sizeof true_size);
    printf("osfree truep=%p truesize=%lu\n", (void *)raw,
           (unsigned long)true_size);
    /* The first sizeof(size_t) bytes of the leading tombstone hold the size,
     * so only the remainder can be compared. */
    if (memcmp(raw + sizeof(size_t), tombstone + sizeof(size_t),
               TOMBSTONE_SIZE - sizeof(size_t)) != 0) {
        printf("start tombstone for block %p, size %lu corrupted!",
               p, (unsigned long)(true_size - TOMBSTONE_SIZE * 2));
    }
    if (memcmp(raw + true_size - TOMBSTONE_SIZE, tombstone,
               TOMBSTONE_SIZE) != 0) {
        printf("end tombstone for block %p, size %lu corrupted!",
               p, (unsigned long)(true_size - TOMBSTONE_SIZE * 2));
    }
    free(raw);
}
#endif
189
190	#ifdef HAVE_SIGNAL
191
192	static int sigReceived;
193
194	/* for systems not using autoconf, assume the signal handler returns void
195	* unless specified elsewhere */
196	#ifndef RETSIGTYPE
197	# define RETSIGTYPE void
198	#endif
199
200	static CDECL RETSIGTYPE
201	report_sig(int sig)
202	{
203	sigReceived = sig;
204	longjmp(jmpbufSignal, 1);
205	}
206
207	static void
208	init_signals(void)
209	{
210	int en;
211	if (!setjmp(jmpbufSignal)) {
212	signal(SIGABRT, report_sig); /* abnormal termination eg abort() */
213	signal(SIGFPE, report_sig); /* arithmetic error eg /0 or overflow */
214	signal(SIGILL, report_sig); /* illegal function image eg illegal instruction */
215	signal(SIGSEGV, report_sig); /* illegal storage access eg access outside memory limits */
216	return;
217	}
218
219	/* Remove that signal handler to avoid the possibility of an infinite loop.
220	*/
221	signal(sigReceived, SIG_DFL);
222
223	switch (sigReceived) {
224	case SIGABRT: en = /Abnormal termination/90; break;
225	case SIGFPE: en = /Arithmetic error/91; break;
226	case SIGILL: en = /Illegal instruction/92; break;
227	case SIGSEGV: en = /Bad memory access/94; break;
228	default: en = /Unknown signal received/97; break;
229	}
230	fputsnl(msg(en), STDERR);
231
232	/* Any of the signals we catch indicates a bug */
233	fatalerror(/Bug in program detected! Please report this to the authors/11);
234
235	exit(EXIT_FAILURE);
236	}
237	#endif
238
239	static int
240	default_charset(void)
241	{
242	if (getenv("SURVEX_UTF8")) return CHARSET_UTF8;
243	#if OS_WIN32
244	# ifdef AVEN
245	# define CODEPAGE GetACP()
246	# else
247	# define CODEPAGE GetConsoleOutputCP()
248	# endif
249	switch (CODEPAGE) {
250	case 0: return CHARSET_UTF8;
251	case 1252: return CHARSET_WINCP1252;
252	case 1250: return CHARSET_WINCP1250;
253	case 850: return CHARSET_DOSCP850;
254	}
255	return CHARSET_USASCII;
256	#elif OS_UNIX
257	#ifdef AVEN
258	return CHARSET_UTF8;
259	#else
260	const char *p = getenv("LC_ALL");
261	if (p == NULL \|\| p[0] == '\0') {
262	p = getenv("LC_CTYPE");
263	if (p == NULL \|\| p[0] == '\0') {
264	p = msg_lang;
265	}
266	}
267
268	if (p) {
269	char *q = strchr(p, '.');
270	if (q) p = q + 1;
271	}
272
273	if (p) {
274	const char *chset = p;
275	size_t name_len;
276
277	while (p != '\0' && p != '@') p++;
278
279	name_len = p - chset;
280
281	if (name_len) {
282	int only_digit = 1;
283	size_t cnt;
284
285	for (cnt = 0; cnt < name_len; ++cnt)
286	if (isalpha((unsigned char)chset[cnt])) {
287	only_digit = 0;
288	break;
289	}
290
291	if (only_digit) goto iso;
292
293	switch (tolower(chset[0])) {
294	case 'i':
295	if (tolower(chset[1]) == 's' && tolower(chset[2]) == 'o') {
296	chset += 3;
297	iso:
298	if (strncmp(chset, "8859", 4) == 0) {
299	chset += 4;
300	while (chset < p && chset && !isdigit((unsigned char)chset))
301	chset++;
302	switch (atoi(chset)) {
303	case 1: return CHARSET_ISO_8859_1;
304	case 2: return CHARSET_ISO_8859_2;
305	case 15: return CHARSET_ISO_8859_15;
306	default: return CHARSET_USASCII;
307	}
308	}
309	}
310	break;
311	case 'u':
312	if (tolower(chset[1]) == 't' && tolower(chset[2]) == 'f') {
313	chset += 3;
314	while (chset < p && chset && !isdigit((unsigned char)chset))
315	chset++;
316	switch (atoi(chset)) {
317	case 8: return CHARSET_UTF8;
318	default: return CHARSET_USASCII;
319	}
320	}
321	}
322	}
323	}
324	return CHARSET_USASCII;
325	#endif
326	#else
327	# error Do not know operating system!
328	#endif
329	}
330
/* It seems that Swedish and maybe some other Scandinavian languages don't
 * transliterate ä to ae - but it seems there may be conflicting views
 * on this...
 */
335	#define umlaut_to_e() 1
336
337	/* values <= 127 already dealt with */
338	static int
339	add_unicode(int charset, unsigned char *p, int value)
340	{
341	#ifdef DEBUG
342	fprintf(stderr, "add_unicode(%d, %p, %d)\n", charset, p, value);
343	#endif
344	if (value == 0) return 0;
345	switch (charset) {
346	case CHARSET_USASCII:
347	if (value < 0x80) {
348	*p = value;
349	return 1;
350	}
351	break;
352	case CHARSET_ISO_8859_1:
353	if (value < 0x100) {
354	*p = value;
355	return 1;
356	}
357	break;
358	case CHARSET_ISO_8859_2:
359	if (value >= 0xa0) {
360	int v = 0;
361	switch (value) {
362	case 0xa0: case 0xa4: case 0xa7: case 0xa8: case 0xad: case 0xb0:
363	case 0xb4: case 0xb8: case 0xc1: case 0xc2: case 0xc4: case 0xc7:
364	case 0xc9: case 0xcb: case 0xcd: case 0xce: case 0xd3: case 0xd4:
365	case 0xd6: case 0xd7: case 0xda: case 0xdc: case 0xdd: case 0xdf:
366	case 0xe1: case 0xe2: case 0xe4: case 0xe7: case 0xe9: case 0xeb:
367	case 0xed: case 0xee: case 0xf3: case 0xf4: case 0xf6: case 0xf7:
368	case 0xfa: case 0xfc: case 0xfd:
369	v = value; break;
370	case 0x104: v = '\xa1'; break;
371	case 0x2d8: v = '\xa2'; break;
372	case 0x141: v = '\xa3'; break;
373	case 0x13d: v = '\xa5'; break;
374	case 0x15a: v = '\xa6'; break;
375	case 0x160: v = '\xa9'; break;
376	case 0x15e: v = '\xaa'; break; /* Scedil */
377	case 0x164: v = '\xab'; break;
378	case 0x179: v = '\xac'; break;
379	case 0x17d: v = '\xae'; break;
380	case 0x17b: v = '\xaf'; break;
381	case 0x105: v = '\xb1'; break;
382	case 0x2db: v = '\xb2'; break;
383	case 0x142: v = '\xb3'; break;
384	case 0x13e: v = '\xb5'; break;
385	case 0x15b: v = '\xb6'; break;
386	case 0x2c7: v = '\xb7'; break;
387	case 0x161: v = '\xb9'; break;
388	case 0x15f: v = '\xba'; break; /* scedil */
389	case 0x165: v = '\xbb'; break;
390	case 0x17a: v = '\xbc'; break;
391	case 0x2dd: v = '\xbd'; break;
392	case 0x17e: v = '\xbe'; break;
393	case 0x17c: v = '\xbf'; break;
394	case 0x154: v = '\xc0'; break;
395	case 0x102: v = '\xc3'; break;
396	case 0x139: v = '\xc5'; break;
397	case 0x106: v = '\xc6'; break;
398	case 0x10c: v = '\xc8'; break;
399	case 0x118: v = '\xca'; break;
400	case 0x11a: v = '\xcc'; break;
401	case 0x10e: v = '\xcf'; break;
402	case 0x110: v = '\xd0'; break;
403	case 0x143: v = '\xd1'; break;
404	case 0x147: v = '\xd2'; break;
405	case 0x150: v = '\xd5'; break;
406	case 0x158: v = '\xd8'; break;
407	case 0x16e: v = '\xd9'; break;
408	case 0x170: v = '\xdb'; break;
409	case 0x162: v = '\xde'; break; /* &Tcedil; */
410	case 0x155: v = '\xe0'; break;
411	case 0x103: v = '\xe3'; break;
412	case 0x13a: v = '\xe5'; break;
413	case 0x107: v = '\xe6'; break;
414	case 0x10d: v = '\xe8'; break;
415	case 0x119: v = '\xea'; break;
416	case 0x11b: v = '\xec'; break;
417	case 0x10f: v = '\xef'; break;
418	case 0x111: v = '\xf0'; break;
419	case 0x144: v = '\xf1'; break;
420	case 0x148: v = '\xf2'; break;
421	case 0x151: v = '\xf5'; break;
422	case 0x159: v = '\xf8'; break;
423	case 0x16f: v = '\xf9'; break;
424	case 0x171: v = '\xfb'; break;
425	case 0x163: v = '\xfe'; break; /* tcedil */
426	case 0x2d9: v = '\xff'; break;
427	}
428	if (v == 0) break;
429	value = v;
430	}
431	*p = value;
432	return 1;
433	case CHARSET_ISO_8859_15:
434	switch (value) {
435	case 0xa4: case 0xa6: case 0xb0: case 0xc4:
436	case 0xd0: case 0xd4: case 0xd5: case 0xd6:
437	goto donthave;
438	case 0x152: value = 0xd4; break; /* &OElig; */
439	case 0x153: value = 0xd5; break; /* &oelig; */
440	#if 0
441	case 0x0: value = 0xa4; break; /* euro */
442	#endif
443	case 0x160: value = 0xa6; break; /* Scaron */
444	case 0x161: value = 0xb0; break; /* scaron */
445	case 0x17d: value = 0xc4; break; /* Zcaron */
446	case 0x17e: value = 0xd0; break; /* zcaron */
447	#if 0
448	case 0x0: value = 0xd6; break; /* Ydiersis */
449	#endif
450	}
451	if (value < 0x100) {
452	*p = value;
453	return 1;
454	}
455	donthave:
456	break;
457	#if OS_WIN32
458	case CHARSET_WINCP1250:
459	/* MS Windows rough equivalent to ISO-8859-2 */
460	if (value >= 0x80) {
461	int v = 0;
462	switch (value) {
463	case 0xa0: case 0xa4: case 0xa6: case 0xa7: case 0xa8: case 0xa9:
464	case 0xab: case 0xac: case 0xad: case 0xae: case 0xb0: case 0xb1:
465	case 0xb4: case 0xb5: case 0xb6: case 0xb7: case 0xb8: case 0xbb:
466	case 0xc1: case 0xc2: case 0xc4: case 0xc7: case 0xc9: case 0xcb:
467	case 0xcd: case 0xce: case 0xd3: case 0xd4: case 0xd6: case 0xd7:
468	case 0xda: case 0xdc: case 0xdd: case 0xdf: case 0xe1: case 0xe2:
469	case 0xe4: case 0xe7: case 0xe9: case 0xeb: case 0xed: case 0xee:
470	case 0xf3: case 0xf4: case 0xf6: case 0xf7: case 0xfa: case 0xfc:
471	case 0xfd:
472	v = value; break;
473	case 0x20ac: v = '\x80'; break;
474	case 0x201a: v = '\x82'; break;
475	case 0x201e: v = '\x84'; break;
476	case 0x2026: v = '\x85'; break;
477	case 0x2020: v = '\x86'; break;
478	case 0x2021: v = '\x87'; break;
479	case 0x2030: v = '\x89'; break;
480	case 0x0160: v = '\x8a'; break;
481	case 0x2039: v = '\x8b'; break;
482	case 0x015a: v = '\x8c'; break;
483	case 0x0164: v = '\x8d'; break;
484	case 0x017d: v = '\x8e'; break;
485	case 0x0179: v = '\x8f'; break;
486	case 0x2018: v = '\x91'; break;
487	case 0x2019: v = '\x92'; break;
488	case 0x201c: v = '\x93'; break;
489	case 0x201d: v = '\x94'; break;
490	case 0x2022: v = '\x95'; break;
491	case 0x2013: v = '\x96'; break;
492	case 0x2014: v = '\x97'; break;
493	case 0x2122: v = '\x99'; break;
494	case 0x0161: v = '\x9a'; break;
495	case 0x203a: v = '\x9b'; break;
496	case 0x015b: v = '\x9c'; break;
497	case 0x0165: v = '\x9d'; break;
498	case 0x017e: v = '\x9e'; break;
499	case 0x017a: v = '\x9f'; break;
500	case 0x02c7: v = '\xa1'; break;
501	case 0x02d8: v = '\xa2'; break;
502	case 0x0141: v = '\xa3'; break;
503	case 0x0104: v = '\xa5'; break;
504	case 0x015e: v = '\xaa'; break; /* Scedil */
505	case 0x017b: v = '\xaf'; break;
506	case 0x02db: v = '\xb2'; break;
507	case 0x0142: v = '\xb3'; break;
508	case 0x0105: v = '\xb9'; break;
509	case 0x015f: v = '\xba'; break; /* scedil */
510	case 0x013d: v = '\xbc'; break;
511	case 0x02dd: v = '\xbd'; break;
512	case 0x013e: v = '\xbe'; break;
513	case 0x017c: v = '\xbf'; break;
514	case 0x0154: v = '\xc0'; break;
515	case 0x0102: v = '\xc3'; break;
516	case 0x0139: v = '\xc5'; break;
517	case 0x0106: v = '\xc6'; break;
518	case 0x010c: v = '\xc8'; break;
519	case 0x0118: v = '\xca'; break;
520	case 0x011a: v = '\xcc'; break;
521	case 0x010e: v = '\xcf'; break;
522	case 0x0110: v = '\xd0'; break;
523	case 0x0143: v = '\xd1'; break;
524	case 0x0147: v = '\xd2'; break;
525	case 0x0150: v = '\xd5'; break;
526	case 0x0158: v = '\xd8'; break;
527	case 0x016e: v = '\xd9'; break;
528	case 0x0170: v = '\xdb'; break;
529	case 0x0162: v = '\xde'; break; /* &Tcedil; */
530	case 0x0155: v = '\xe0'; break;
531	case 0x0103: v = '\xe3'; break;
532	case 0x013a: v = '\xe5'; break;
533	case 0x0107: v = '\xe6'; break;
534	case 0x010d: v = '\xe8'; break;
535	case 0x0119: v = '\xea'; break;
536	case 0x011b: v = '\xec'; break;
537	case 0x010f: v = '\xef'; break;
538	case 0x0111: v = '\xf0'; break;
539	case 0x0144: v = '\xf1'; break;
540	case 0x0148: v = '\xf2'; break;
541	case 0x0151: v = '\xf5'; break;
542	case 0x0159: v = '\xf8'; break;
543	case 0x016f: v = '\xf9'; break;
544	case 0x0171: v = '\xfb'; break;
545	case 0x0163: v = '\xfe'; break; /* tcedil */
546	case 0x02d9: v = '\xff'; break;
547	}
548	if (v == 0) break;
549	value = v;
550	}
551	*p = value;
552	return 1;
553	case CHARSET_WINCP1252:
554	/* MS Windows extensions to ISO-8859-1 */
555	switch (value) {
556	case 0x152: value = 0x8c; break; /* &OElig; */
557	case 0x153: value = 0x9c; break; /* &oelig; */
558	#if 0
559	/* there are a few other obscure ones we don't currently need */
560	#endif
561	}
562	if (value < 0x100) {
563	*p = value;
564	return 1;
565	}
566	break;
567	#endif
568	#if OS_WIN32
569	case CHARSET_DOSCP850: {
570	unsigned char uni2dostab[] = {
571	255, 173, 189, 156, 207, 190, 221, 245,
572	249, 184, 166, 174, 170, 240, 169, 238,
573	248, 241, 253, 252, 239, 230, 244, 250,
574	247, 251, 167, 175, 172, 171, 243, 168,
575	183, 181, 182, 199, 142, 143, 146, 128,
576	212, 144, 210, 211, 222, 214, 215, 216,
577	209, 165, 227, 224, 226, 229, 153, 158,
578	157, 235, 233, 234, 154, 237, 232, 225,
579	133, 160, 131, 198, 132, 134, 145, 135,
580	138, 130, 136, 137, 141, 161, 140, 139,
581	208, 164, 149, 162, 147, 228, 148, 246,
582	155, 151, 163, 150, 129, 236, 231, 152
583	};
584	if (value >= 160 && value < 256) {
585	*p = (int)uni2dostab[value - 160];
586	return 1;
587	}
588	#if 0
589	if (value == 305) { /* LATIN SMALL LETTER DOTLESS I */
590	*p = 213;
591	return 1;
592	}
593	if (value == 402) { /* LATIN SMALL LETTER F WITH HOOK */
594	*p = 159;
595	return 1;
596	}
597	#endif
598	break;
599	}
600	#endif
601	}
602	/* Transliterate characters we can't represent */
603	#ifdef DEBUG
604	fprintf(stderr, "transliterate `%c' 0x%x\n", value, value);
605	#endif
606	switch (value) {
607	case 160:
608	*p = ' '; return 1;
609	case 161 /* ¡ */:
610	*p = '!'; return 1;
611	case 171 /* « */:
612	p[1] = *p = '<'; return 2;
613	case 187 /* » */:
614	p[1] = *p = '>'; return 2;
615	case 191 /* ¿ */:
616	*p = '?'; return 1;
617	case 192 /* À /: case 193 / Á /: case 194 / Â /: case 195 / Ã */:
618	*p = 'A'; return 1;
619	case 197 /* Å */:
620	p[1] = *p = 'A'; return 2;
621	case 196 /* Ä /: / Ä */
622	*p = 'A';
623	if (!umlaut_to_e()) return 1;
624	p[1] = 'E'; return 2;
625	case 198 /* Æ */:
626	*p = 'A'; p[1] = 'E'; return 2;
627	case 199 /* Ç /: case 268: / &Ccaron; */
628	*p = 'C'; return 1;
629	case 270: /* &Dcaron; */
630	*p = 'D'; return 1;
631	case 200 /* È /: case 201 / É /: case 202 / Ê /: case 203 / Ë */:
632	*p = 'E'; return 1;
633	case 204 /* Ì /: case 205 / Í /: case 206 / Î /: case 207 / Ï */:
634	*p = 'I'; return 1;
635	case 208 /* Ð /: case 222 / Þ */:
636	*p = 'T'; p[1] = 'H'; return 2;
637	case 315: /* &Lacute; */
638	case 317: /* &Lcaron; */
639	*p = 'L'; return 1;
640	case 209 /* Ñ */:
641	*p = 'N'; return 1;
642	case 210 /* Ò /: case 211 / Ó /: case 212 / Ô /: case 213 / Õ */:
643	*p = 'O'; return 1;
644	case 214 /* Ö /: / Ö / case 0x152: / &OElig; */
645	*p = 'O'; p[1] = 'E'; return 2;
646	case 352: /* &Scaron; */
647	case 0x15e: /* &Scedil; */
648	*p = 'S'; return 1;
649	case 0x162: /* &Tcedil; */
650	case 0x164: /* &Tcaron; */
651	*p = 'T'; return 1;
652	case 217 /* Ù /: case 218 / Ú /: case 219 / Û */:
653	*p = 'U'; return 1;
654	case 220 /* Ü /: / Ü */
655	*p = 'U'; p[1] = 'E'; return 2;
656	case 221 /* Ý */:
657	*p = 'Y'; return 1;
658	case 381: /* &Zcaron; */
659	*p = 'Z'; return 1;
660	case 223 /* ß */:
661	p[1] = *p = 's'; return 2;
662	case 224 /* à /: case 225 / á /: case 226 / â /: case 227 / ã */:
663	case 259: /* &abreve; */
664	*p = 'a'; return 1;
665	case 228 /* ä /: / ä / case 230 / æ */:
666	*p = 'a'; p[1] = 'e'; return 2;
667	case 229 /* å */:
668	p[1] = *p = 'a'; return 2;
669	case 231 /* ç /: case 269 / &ccaron; */:
670	*p = 'c'; return 1;
671	case 271: /* &dcaron; */
672	*p = 'd'; return 1;
673	case 232 /* è /: case 233 / é /: case 234 / ê /: case 235 / ë */:
674	case 283 /* &ecaron; */:
675	*p = 'e'; return 1;
676	case 236 /* ì /: case 237 / í /: case 238 / î /: case 239 / ï */:
677	*p = 'i'; return 1;
678	case 316 /* &lacute; */:
679	case 318 /* &lcaron; */:
680	*p = 'l'; return 1;
681	case 241 /* ñ /: case 328 / &ncaron; */:
682	*p = 'n'; return 1;
683	case 345: /* &rcaron; */
684	*p = 'r'; return 1;
685	case 353: /* &scaron; */
686	case 0x15f: /* &scedil; */
687	*p = 's'; return 1;
688	case 357: /* &tcaron; */
689	case 0x163: /* &tcedil; */
690	*p = 't'; return 1;
691	case 240 /* ð /: case 254 / þ */:
692	*p = 't'; p[1] = 'h'; return 2;
693	case 242 /* ò /: case 243 / ó /: case 244 / ô /: case 245 / õ */:
694	*p = 'o'; return 1;
695	case 246 /* ö /: / ö / case 0x153: / &oelig; */
696	*p = 'o'; p[1] = 'e'; return 2;
697	case 249 /* ù /: case 250 / ú /: case 251 / û */:
698	case 367 /* &uring; */:
699	*p = 'u'; return 1;
700	case 252 /* ü /: / ü */
701	*p = 'u'; p[1] = 'e'; return 2;
702	case 253 /* ý /: case 255 / ÿ */:
703	*p = 'y'; return 1;
704	case 382: /* &zcaron; */
705	*p = 'z'; return 1;
706	}
707	#ifdef DEBUG
708	fprintf(stderr, "failed to transliterate\n");
709	#endif
710	return 0;
711	}
712
713	#if OS_UNIX && defined DATADIR && defined PACKAGE
714	/* Under Unix, we compile in the configured path */
715	static const char *pth_cfg_files = DATADIR "/" PACKAGE;
716	#else
717	/* On other platforms, we fall back on looking in the current directory */
718	static const char *pth_cfg_files = "";
719	#endif
720
721	static int num_msgs = 0;
722	static char **msg_array = NULL;
723
724	const char *msg_lang = NULL;
725	const char *msg_lang2 = NULL;
726
727	static char **
728	parse_msgs(int n, unsigned char *p, int charset_code) {
729	int i;
730
731	char *msgs = osmalloc(n sizeof(char *));
732
733	for (i = 0; i < n; i++) {
734	unsigned char *to = p;
735	int ch;
736	msgs[i] = (char *)p;
737
738	/* If we want UTF8 anyway, we just need to find the start of each
739	* message */
740	if (charset_code == CHARSET_UTF8) {
741	p += strlen((char *)p) + 1;
742	continue;
743	}
744
745	while ((ch = *p++) != 0) {
746	/* A byte in the range 0x80-0xbf or 0xf0-0xff isn't valid in
747	* this state, (0xf0-0xfd mean values > 0xffff) so treat as
748	* literal and try to resync so we cope better when fed
749	* non-utf-8 data. Similarly we abandon a multibyte sequence
750	* if we hit an invalid character. */
751	if (ch >= 0xc0 && ch < 0xf0) {
752	int ch1 = *p;
753	if ((ch1 & 0xc0) != 0x80) goto resync;
754
755	if (ch < 0xe0) {
756	/* 2 byte sequence */
757	ch = ((ch & 0x1f) << 6) \| (ch1 & 0x3f);
758	p++;
759	} else {
760	/* 3 byte sequence */
761	int ch2 = p[1];
762	if ((ch2 & 0xc0) != 0x80) goto resync;
763	ch = ((ch & 0x1f) << 12) \| ((ch1 & 0x3f) << 6) \| (ch2 & 0x3f);
764	p += 2;
765	}
766	}
767
768	resync:
769
770	if (ch < 127) {
771	*to++ = (char)ch;
772	} else {
773	/* We assume an N byte UTF-8 code never transliterates to more
774	* than N characters (so we can't transliterate © to (C) or
775	* ® to (R) for example) */
776	to += add_unicode(charset_code, to, ch);
777	}
778	}
779	*to++ = '\0';
780	}
781	return msgs;
782	}
783
/* This is the name of the default language, which can be set like so:
 * ./configure --enable-defaultlang=fr
 */
#ifdef DEFAULTLANG
/* No point extracting these errors as they won't get used if file opens */
# include "../lib/defaultlang.h"
#else
/* Built-in English text for messages 1000 to 1000 + N_DONTEXTRACTMSGS - 1.
 * These are needed before, or instead of, a successfully loaded message
 * file.  Each message is followed by an explicit NUL so that the whole
 * array can be handed to parse_msgs() as one buffer. */
#define N_DONTEXTRACTMSGS 5
static unsigned char dontextractmsgs[] =
    "Can't open message file `%s' using path `%s'\0"/*1000*/
    "Problem with message file `%s'\0"/*1001*/
    "I don't understand this message file version\0"/*1002*/
    "Message file truncated?\0"/*1003*/
    "Out of memory (couldn't find %lu bytes).\0"/*1004*/;
#endif
799
800	static char **dontextract = NULL;
801
802	static void
803	parse_msg_file(int charset_code)
804	{
805	FILE *fh;
806	unsigned char header[20];
807	int i;
808	unsigned len;
809	unsigned char *p;
810	char fnm, s;
811	int n;
812
813	#ifdef DEBUG
814	fprintf(stderr, "parse_msg_file(%d)\n", charset_code);
815	#endif
816
817	/* sort out messages we need to print if we can't open the message file */
818	dontextract = parse_msgs(N_DONTEXTRACTMSGS, dontextractmsgs, charset_code);
819
820	fnm = osstrdup(msg_lang);
821	/* trim off charset from stuff like "de_DE.iso8859_1" */
822	s = strchr(fnm, '.');
823	if (s) *s = '\0';
824
825	fh = fopenWithPthAndExt(pth_cfg_files, fnm, EXT_SVX_MSG, "rb", NULL);
826
827	if (!fh) {
828	/* e.g. if 'en_GB' is unknown, see if we know 'en' */
829	if (strlen(fnm) > 3 && fnm[2] == '_') {
830	fnm[2] = '\0';
831	fh = fopenWithPthAndExt(pth_cfg_files, fnm, EXT_SVX_MSG, "rb", NULL);
832	if (!fh) fnm[2] = '_'; /* for error reporting */
833	}
834	}
835
836	if (!fh) {
837	fatalerror(/Can't open message file `%s' using path `%s'/1000,
838	fnm, pth_cfg_files);
839	}
840
841	if (fread(header, 1, 20, fh) < 20 \|\|
842	memcmp(header, "Svx\nMsg\r\n\xfe\xff", 12) != 0) {
843	fatalerror(/Problem with message file `%s'/1001, fnm);
844	}
845
846	if (header[12] != 0)
847	fatalerror(/I don't understand this message file version/1002);
848
849	n = (header[14] << 8) \| header[15];
850
851	len = 0;
852	for (i = 16; i < 20; i++) len = (len << 8) \| header[i];
853
854	p = osmalloc(len);
855	if (fread(p, 1, len, fh) < len)
856	fatalerror(/Message file truncated?/1003);
857
858	fclose(fh);
859
860	#ifdef DEBUG
861	fprintf(stderr, "fnm = `%s', n = %d, len = %d\n", fnm, n, len);
862	#endif
863	osfree(fnm);
864
865	msg_array = parse_msgs(n, p, charset_code);
866	num_msgs = n;
867	}
868
869	const char *
870	msg_cfgpth(void)
871	{
872	return pth_cfg_files;
873	}
874
875	const char *
876	msg_exepth(void)
877	{
878	return exe_pth;
879	}
880
881	const char *
882	msg_appname(void)
883	{
884	return appname_copy;
885	}
886
887	void
888	msg_init(char * const *argv)
889	{
890	char *p;
891	SVX_ASSERT(argv);
892
893	#ifdef HAVE_SIGNAL
894	init_signals();
895	#endif
896	/* Point to argv[0] itself so we report a more helpful error if the
897	* code to work out the clean appname generates a signal */
898	appname_copy = argv[0];
899	#if OS_UNIX
900	/* use name as-is on Unix - programs run from path get name as supplied */
901	appname_copy = osstrdup(argv[0]);
902	#else
903	/* use the lower-cased leafname on other platforms */
904	p = leaf_from_fnm(argv[0]);
905	appname_copy = p;
906	while (*p) {
907	p = tolower(p);
908	++p;
909	}
910	#endif
911
912	/* shortcut --version so you can check the version number even when the
913	* correct message file can't be found... */
914	if (argv[1] && strcmp(argv[1], "--version") == 0) {
915	cmdline_version();
916	exit(0);
917	}
918	if (argv[0]) {
919	exe_pth = path_from_fnm(argv[0]);
920	#ifdef MACOSX_BUNDLE
921	/* If we're being built into a bundle, always look relative to
922	* the path to the binary. */
923	#ifdef AVEN
924	/* Aven is packaged as an application, so we must look inside there. */
925	pth_cfg_files = use_path(exe_pth, "../Resources");
926	#else
927	pth_cfg_files = use_path(exe_pth, "share/survex");
928	#endif
929	#elif OS_UNIX && defined DATADIR && defined PACKAGE
930	bool free_pth = fFalse;
931	char *pth = getenv("srcdir");
932	if (!pth \|\| !pth[0]) {
933	pth = path_from_fnm(argv[0]);
934	free_pth = fTrue;
935	}
936	if (pth[0]) {
937	struct stat buf;
938	#if OS_UNIX_MACOSX
939	/* On MacOS X the programs may be installed anywhere, with the
940	* share directory and the binaries in the same directory. */
941	p = use_path(pth, "share/survex/en.msg");
942	if (lstat(p, &buf) == 0 && S_ISREG(buf.st_mode)) {
943	pth_cfg_files = use_path(pth, "share/survex");
944	goto macosx_got_msg;
945	}
946	osfree(p);
947	#endif
948	/* If we're run with an explicit path, check if "../lib/en.msg"
949	* from the program's path exists, and if so look there for
950	* support files - this allows us to test binaries in the build
951	* tree easily. */
952	p = use_path(pth, "../lib/en.msg");
953	if (lstat(p, &buf) == 0) {
954	#ifdef S_ISREG
955	/* POSIX way */
956	if (S_ISREG(buf.st_mode)) {
957	pth_cfg_files = use_path(pth, "../lib");
958	}
959	#else
960	/* BSD way */
961	if ((buf.st_mode & S_IFMT) == S_IFREG) {
962	pth_cfg_files = use_path(pth, "../lib");
963	}
964	#endif
965	}
966	#if defined(__GNUC__) && defined(__APPLE_CC__)
967	macosx_got_msg:
968	#endif
969	osfree(p);
970	}
971
972	if (free_pth) osfree(pth);
973	#elif OS_WIN32
974	DWORD len = 256;
975	char buf = NULL, modname;
976	while (1) {
977	DWORD got;
978	buf = osrealloc(buf, len);
979	got = GetModuleFileName(NULL, buf, len);
980	if (got < len) break;
981	len += len;
982	}
983	modname = buf;
984	/* Strange Win32 nastiness - strip prefix "\\?\" if present */
985	if (strncmp(modname, "\\\\?\\", 4) == 0) modname += 4;
986	pth_cfg_files = path_from_fnm(modname);
987	osfree(buf);
988	#else
989	/* Get the path to the support files from argv[0] */
990	pth_cfg_files = path_from_fnm(argv[0]);
991	#endif
992	}
993
994	msg_lang = getenv("SURVEXLANG");
995	#ifdef DEBUG
996	fprintf(stderr, "msg_lang = %p (= \"%s\")\n", msg_lang, msg_lang?msg_lang:"(null)");
997	#endif
998
999	if (!msg_lang \|\| !*msg_lang) {
1000	msg_lang = getenv("LC_MESSAGES");
1001	if (!msg_lang \|\| !*msg_lang) {
1002	msg_lang = getenv("LANG");
1003	/* Something (AutoCAD?) on Microsoft Windows sets LANG to a number. */
1004	if (msg_lang && !isalpha(msg_lang[0])) msg_lang = NULL;
1005	}
1006	if (!msg_lang \|\| !*msg_lang) {
1007	#if OS_WIN32
1008	LCID locid;
1009	#endif
1010	#ifdef DEFAULTLANG
1011	msg_lang = STRING(DEFAULTLANG);
1012	#else
1013	msg_lang = "en";
1014	#endif
1015	#if OS_WIN32
1016	locid = GetUserDefaultLCID();
1017	if (locid) {
1018	WORD langid = LANGIDFROMLCID(locid);
1019	switch (PRIMARYLANGID(langid)) {
1020	/* older mingw compilers don't seem to supply this value */
1021	#ifndef LANG_CATALAN
1022	# define LANG_CATALAN 0x03
1023	#endif
1024	case LANG_CATALAN:
1025	msg_lang = "ca";
1026	break;
1027	case LANG_CHINESE:
1028	msg_lang = "zh";
1029	break;
1030	case LANG_ENGLISH:
1031	if (SUBLANGID(langid) == SUBLANG_ENGLISH_US)
1032	msg_lang = "en_US";
1033	else
1034	msg_lang = "en";
1035	break;
1036	case LANG_FRENCH:
1037	msg_lang = "fr";
1038	break;
1039	case LANG_GERMAN:
1040	switch (SUBLANGID(langid)) {
1041	case SUBLANG_GERMAN_SWISS:
1042	msg_lang = "de_CH";
1043	break;
1044	case SUBLANG_GERMAN:
1045	msg_lang = "de_DE";
1046	break;
1047	default:
1048	msg_lang = "de";
1049	}
1050	break;
1051	case LANG_ITALIAN:
1052	msg_lang = "it";
1053	break;
1054	case LANG_PORTUGUESE:
1055	if (SUBLANGID(langid) == SUBLANG_PORTUGUESE_BRAZILIAN)
1056	msg_lang = "pt_BR";
1057	else
1058	msg_lang = "pt";
1059	break;
1060	case LANG_ROMANIAN:
1061	msg_lang = "ro";
1062	break;
1063	case LANG_SLOVAK:
1064	msg_lang = "sk";
1065	break;
1066	case LANG_SPANISH:
1067	msg_lang = "es";
1068	break;
1069	}
1070	}
1071	#endif
1072	}
1073	}
1074	#ifdef DEBUG
1075	fprintf(stderr, "msg_lang = %p (= \"%s\")\n", msg_lang, msg_lang?msg_lang:"(null)");
1076	#endif
1077
1078	/* On Mandrake LANG defaults to C */
1079	if (strcmp(msg_lang, "C") == 0) msg_lang = "en";
1080
1081	msg_lang = osstrdup(msg_lang);
1082
1083	/* Convert en-us to en_US, etc */
1084	p = strchr(msg_lang, '-');
1085	if (p) {
1086	*p++ = '_';
1087	while (*p) {
1088	p = toupper(p);
1089	p++;
1090	}
1091	}
1092
1093	p = strchr(msg_lang, '_');
1094	if (p) {
1095	*p = '\0';
1096	msg_lang2 = osstrdup(msg_lang);
1097	*p = '_';
1098	}
1099
1100	int def_charset = default_charset();
1101
1102	#ifdef LC_MESSAGES
1103	/* try to setlocale() appropriately too */
1104	if (!setlocale(LC_MESSAGES, msg_lang)) {
1105	if (!msg_lang2 \|\| !setlocale(LC_MESSAGES, msg_lang2)) {
1106	def_charset = CHARSET_ISO_8859_1;
1107	}
1108	}
1109	#endif
1110
1111	select_charset(def_charset);
1112	}
1113
1114	/* Message may be overwritten by next call
1115	* (but not in current implementation) */
1116	const char *
1117	msg(int en)
1118	{
1119	/* NB can't use SVX_ASSERT here! */
1120	static char badbuf[256];
1121	if (en >= 1000 && en < 1000 + N_DONTEXTRACTMSGS)
1122	return dontextract[en - 1000];
1123	if (!msg_array) {
1124	if (en != 1) {
1125	sprintf(badbuf, "Message %d requested before msg_array initialised\n",
1126	en);
1127	return badbuf;
1128	}
1129	/* this should be the only other message which can be requested before
1130	* the message file is opened and read... */
1131	if (!dontextract) return "Out of memory (couldn't find %lu bytes).";
1132	return dontextract[(/Out of memory (couldn't find %lu bytes)./1004)
1133	- 1000];
1134	}
1135
1136	if (en < 0 \|\| en >= num_msgs) {
1137	sprintf(badbuf, "Message %d out of range\n", en);
1138	return badbuf;
1139	}
1140
1141	if (en == 0) {
1142	const char *p = msg_array[0];
1143	if (!*p) p = "(C)";
1144	return p;
1145	}
1146
1147	return msg_array[en];
1148	}
1149
/* Return the text of message en for callers that want to keep hold of it.
 * This forwards straight to msg() and hands back whatever it returns. */
const char *
msgPerm(int en)
{
    const char *text = msg(en);

    return text;
}
1156
1157	void
1158	v_report(int severity, const char *fnm, int line, int en, va_list ap)
1159	{
1160	#ifdef AVEN
1161	aven_v_report(severity, fnm, line, en, ap);
1162	#else
1163	if (fnm) {
1164	fputs(fnm, STDERR);
1165	if (line) fprintf(STDERR, ":%d", line);
1166	} else {
1167	fputs(appname_copy, STDERR);
1168	}
1169	fputs(": ", STDERR);
1170
1171	if (severity == 0) {
1172	fputs(msg(/warning/4), STDERR);
1173	fputs(": ", STDERR);
1174	}
1175
1176	vfprintf(STDERR, msg(en), ap);
1177	fputnl(STDERR);
1178	#endif
1179
1180	switch (severity) {
1181	case 0:
1182	msg_warnings++;
1183	break;
1184	case 1:
1185	msg_errors++;
1186	if (msg_errors == 50)
1187	fatalerror_in_file(fnm, 0, /Too many errors - giving up/19);
1188	break;
1189	case 2:
1190	exit(EXIT_FAILURE);
1191	}
1192	}
1193
/* Report message en as a warning (severity 0) with no file name or line
 * number attached.  The variadic arguments are passed on to v_report(). */
void
warning(int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(0, NULL, 0, en, args);
    va_end(args);
}
1202
/* Report message en as an error (severity 1) with no file name or line
 * number attached.  The variadic arguments are passed on to v_report(). */
void
error(int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(1, NULL, 0, en, args);
    va_end(args);
}
1211
/* Report message en as a fatal error (severity 2) with no file name or line
 * number attached.  The variadic arguments are passed on to v_report(). */
void
fatalerror(int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(2, NULL, 0, en, args);
    va_end(args);
}
1220
/* Report message en as a warning (severity 0) against file fnm at the given
 * line.  The variadic arguments are passed on to v_report(). */
void
warning_in_file(const char *fnm, int line, int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(0, fnm, line, en, args);
    va_end(args);
}
1229
/* Report message en as an error (severity 1) against file fnm at the given
 * line.  The variadic arguments are passed on to v_report(). */
void
error_in_file(const char *fnm, int line, int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(1, fnm, line, en, args);
    va_end(args);
}
1238
/* Report message en as a fatal error (severity 2) against file fnm at the
 * given line.  The variadic arguments are passed on to v_report(). */
void
fatalerror_in_file(const char *fnm, int line, int en, ...)
{
    va_list args;

    va_start(args, en);
    v_report(2, fnm, line, en, args);
    va_end(args);
}
1247
1248	/* Code to support switching character set at runtime (e.g. for a printer
1249	* driver to support different character sets on screen and on the printer)
1250	*/
1251	typedef struct charset_li {
1252	struct charset_li *next;
1253	int code;
1254	char **msg_array;
1255	} charset_li;
1256
1257	static charset_li *charset_head = NULL;
1258
1259	static int charset = CHARSET_BAD;
1260
1261	int
1262	select_charset(int charset_code)
1263	{
1264	int old_charset = charset;
1265	charset_li *p;
1266
1267	#ifdef DEBUG
1268	fprintf(stderr, "select_charset(%d), old charset = %d\n", charset_code,
1269	charset);
1270	#endif
1271
1272	charset = charset_code;
1273
1274	/* check if we've already parsed messages for new charset */
1275	for (p = charset_head; p; p = p->next) {
1276	#ifdef DEBUG
1277	printf("%p: code %d msg_array %p\n", p, p->code, p->msg_array);
1278	#endif
1279	if (p->code == charset) {
1280	msg_array = p->msg_array;
1281	return old_charset;
1282	}
1283	}
1284
1285	/* nope, got to reparse message file */
1286	parse_msg_file(charset_code);
1287
1288	/* add to list */
1289	p = osnew(charset_li);
1290	p->code = charset;
1291	p->msg_array = msg_array;
1292	p->next = charset_head;
1293	charset_head = p;
1294
1295	return old_charset;
1296	}

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: git/src/message.c @ 7bdf66d

Download in other formats: