/* lang.h -- declarations for language codes etc.
   $Id: lang.h,v 1.6 2004/04/11 17:56:47 karl Exp $

   Copyright (C) 1999, 2001, 2002, 2003 Free Software Foundation, Inc.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.

   Originally written by Karl Heinz Marbaise <kama@hippo.fido.de>. */
| 21 |
|
|---|
| 22 | #ifndef LANG_H
|
|---|
| 23 | #define LANG_H
|
|---|
| 24 |
|
|---|
/* Document language codes, which can be changed through
   @documentlanguage.  Changing the language is not actually supported
   at present (it may be in the future).

   The enumerators are the ISO 639 two-letter codes, listed in
   alphabetical order; each one's value is its position in this list.
   last_language_code equals the number of codes before it and must
   remain the final enumerator.

   NOTE: the enumerator `or' clashes with the `or' macro defined by
   <iso646.h> (and with the C++ alternative token of the same name), so
   this header cannot be used once <iso646.h> has been included.  */
typedef enum
{
  aa, ab, af, am, ar, as, ay, az,
  ba, be, bg, bh, bi, bn, bo, br,
  ca, co, cs, cy,
  da, de, dz,
  el, en, eo, es, et, eu,
  fa, fi, fj, fo, fr, fy,
  ga, gd, gl, gn, gu,
  ha, he, hi, hr, hu, hy,
  ia, id, ie, ik, is, it, iu,
  ja, jw,
  ka, kk, kl, km, kn, ko, ks, ku, ky,
  la, ln, lo, lt, lv,
  mg, mi, mk, ml, mn, mo, mr, ms, mt, my,
  na, ne, nl, no,
  oc, om, or,
  pa, pl, ps, pt,
  qu,
  rm, rn, ro, ru, rw,
  sa, sd, sg, sh, si, sk, sl, sm, sn, so, sq, sr, ss, st, su, sv, sw,
  ta, te, tg, th, ti, tk, tl, tn, to, tr, ts, tt, tw,
  ug, uk, ur, uz,
  vi, vo,
  wo,
  xh,
  yi, yo,
  za, zh, zu,
  last_language_code
} language_code_type;

/* The current language code.  */
extern language_code_type language_code;

/* Information for each language.  */
typedef struct
{
  language_code_type lc;        /* language code as enum value */
  char *abbrev;                 /* two-letter language code */
  char *desc;                   /* full name for the language code */
} language_type;

/* Table of language_type entries.  It is defined elsewhere, so its
   length and ordering cannot be determined from this header.  */
extern language_type language_table[];
| 73 |
|
|---|
| 74 |
|
|---|
| 75 | |
|---|
| 76 |
|
|---|
/* The document encoding.  Knowing it makes it possible to produce true
   8-bit characters according to @documentencoding.

   Enumerator values follow declaration order starting at 0;
   last_encoding_code equals the number of codes before it and must
   remain the final enumerator.  */
typedef enum
{
  no_encoding,
  US_ASCII,
  ISO_8859_1,
  ISO_8859_2,
  ISO_8859_3,   /* neither this nor any encoding below it is supported */
  ISO_8859_4,
  ISO_8859_5,
  ISO_8859_6,
  ISO_8859_7,
  ISO_8859_8,
  ISO_8859_9,
  ISO_8859_10,
  ISO_8859_11,
  ISO_8859_12,
  ISO_8859_13,
  ISO_8859_14,
  ISO_8859_15,
  last_encoding_code
} encoding_code_type;

/* The current document encoding.  This is an enum object, not a
   pointer, so the "not set" state is presumably no_encoding (value 0)
   rather than a null pointer -- confirm against the definition.  */
extern encoding_code_type document_encoding_code;

/* If an encoding is not supported, just keep it as a string.  */
extern char *unknown_encoding;

/* Types used to map an HTML abbreviation to the ISO and Unicode codes
   for a given character.  */

/* Should be 16 bits; unsigned short is guaranteed to hold at least
   that many.  */
typedef unsigned short int unicode_t;
typedef unsigned char byte_t;

typedef struct
{
  char *html;           /* HTML equivalent, e.g. auml => &auml; (a-umlaut) */
  byte_t bytecode;      /* 8-bit code (ISO 8859-1, ...) */
  unicode_t unicode;    /* Unicode code point, in U+ convention */
} iso_map_type;

/* Information about the document encoding.  */
typedef struct
{
  encoding_code_type ec;    /* document encoding type (see the enum above) */
  char *encname;            /* encoding name like "iso-8859-1", valid in
                               HTML and Emacs */
  iso_map_type *isotab;     /* address of the ISO translation table */
} encoding_type;

/* Table with all the encoding codes that we recognize.  */
extern encoding_type encoding_table[];
| 130 |
|
|---|
| 131 | |
|---|
| 132 |
|
|---|
/* The commands: handlers for @documentlanguage and
   @documentencoding.  */
extern void cm_documentlanguage (void);
extern void cm_documentencoding (void);

/* Accents, other non-English characters.  The meaning of ARG, START
   and END is fixed by the definitions, which are not part of this
   header.  */
extern void cm_accent (int arg);
extern void cm_special_char (int arg);
extern void cm_dotless (int arg, int start, int end);

/* One handler per accent; all share the same signature.  */
extern void cm_accent_umlaut (int arg, int start, int end);
extern void cm_accent_acute (int arg, int start, int end);
extern void cm_accent_cedilla (int arg, int start, int end);
extern void cm_accent_hat (int arg, int start, int end);
extern void cm_accent_grave (int arg, int start, int end);
extern void cm_accent_tilde (int arg, int start, int end);

/* Returns the current document encoding as a string.  Presumably this
   is the encoding's name; who owns the returned storage is decided by
   the definition -- confirm before modifying or freeing it.  */
extern char *current_document_encoding (void);
| 149 |
|
|---|
| 150 | #endif /* not LANG_H */
|
|---|