1 /* The lexer multiplexer for Gedcom.
2 Copyright (C) 2001,2002 The Genes Development Team
3 This file is part of the Gedcom parser library.
4 Contributed by Peter Verthez <Peter.Verthez@advalvas.be>, 2001.
6 The Gedcom parser library is free software; you can redistribute it
7 and/or modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The Gedcom parser library is distributed in the hope that it will be
12 useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the Gedcom parser library; if not, write to the
18 Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
24 #include "gedcom_internal.h"
/* Pointer to a lexer entry point: a function taking no arguments and
   returning int.  lexer_init() stores the address of gedcom_1byte_lex,
   gedcom_hilo_lex or gedcom_lohi_lex in lf; presumably lf has this type
   (its declaration is not visible here -- TODO confirm). */
31 typedef int (*lex_func)(void);
/* File name used by gedcom_new_model(): it is opened as given (relative
   to the current directory) and also joined onto PKGDATADIR as
   "<PKGDATADIR>/new.ged". */
34 #define NEW_MODEL_FILE "new.ged"
/* Select and set up the lexer that matches the encoding ENC of stream F.

   For each of the three encodings handled below the same four steps run:
     1. store the address of the encoding-specific lexer function in lf;
     2. hand the input stream F to that lexer's *_myinit() routine;
     3. call set_encoding_width(enc);
     4. return whatever open_conv_to_internal() returns for the source
        character set name ("ASCII" for ONE_BYTE, "UNICODE" for both
        two-byte byte orders).

   gedcom_parse_file() only goes on to parse when this function's result
   is non-zero, so a non-zero return appears to mean success.

   NOTE(review): what happens for any other ENC value is not visible in
   this extract -- confirm that a failure value is returned. */
36 int lexer_init(ENCODING enc, FILE* f)
38 if (enc == ONE_BYTE) {
39 lf = &gedcom_1byte_lex;
40 gedcom_1byte_myinit(f);
41 set_encoding_width(enc);
42 return open_conv_to_internal("ASCII");
44 else if (enc == TWO_BYTE_HILO) {
45 lf = &gedcom_hilo_lex;
46 gedcom_hilo_myinit(f);
47 set_encoding_width(enc);
/* Both two-byte variants request the same "UNICODE" conversion; the byte
   order is presumably dealt with by the lexer chosen above -- TODO
   confirm. */
48 return open_conv_to_internal("UNICODE");
50 else if (enc == TWO_BYTE_LOHI) {
51 lf = &gedcom_lohi_lex;
52 gedcom_lohi_myinit(f);
53 set_encoding_width(enc);
54 return open_conv_to_internal("UNICODE");
/* NOTE(review): the header of the function containing this call is not
   visible in this extract.  The call is the counterpart by name of the
   open_conv_to_internal() calls made in lexer_init(); presumably it
   releases the conversion state opened there -- confirm. */
63 close_conv_to_internal();
/* Guess the encoding of the GEDCOM stream F from its first two bytes.

   Two bytes are read with fread() and compared against these patterns:

     '0'  ' '    one-byte encoding
     '\0' '0'    two-byte, high byte first
     0xFE 0xFF   two-byte, high byte first, with byte order mark
     '0'  '\0'   two-byte, low byte first          -> TWO_BYTE_LOHI
     0xFF 0xFE   two-byte, low byte first, with BOM -> TWO_BYTE_LOHI
     otherwise   warning, fall back to one-byte

   In the branches without a byte order mark (and in the fallback) the
   stream is positioned back at offset 0 so the lexer sees the whole
   file; a failing fseek() is only reported as a warning.  In the
   low-byte-first BOM branch the stream is not repositioned, so it stays
   just past the two bytes consumed here.

   NOTE(review): the declarations of first/read, the condition guarding
   the read-error warning, and the return statements of every branch
   other than the two TWO_BYTE_LOHI ones are not visible in this extract
   -- confirm them against the full file. */
71 int determine_encoding(FILE* f)
76 read = fread(first, 1, 2, f);
/* NOTE(review): ISO C does not require fread() to set errno, and a short
   read at end-of-file is not an error at all, so strerror(errno) may
   describe an unrelated earlier failure -- confirm this is acceptable. */
78 gedcom_warning(_("Error reading from input file: %s"), strerror(errno));
81 else if ((first[0] == '0') && (first[1] == ' ')) {
82 gedcom_debug_print(_("One-byte encoding"));
/* NOTE(review): the third argument 0 is the "whence" value; SEEK_SET is
   the portable spelling (it is 0 on common platforms, but the C standard
   does not fix its value).  The same applies to every fseek() below. */
83 if (fseek(f, 0, 0) != 0)
84 gedcom_warning(_("Error positioning input file: %s"), strerror(errno));
87 else if ((first[0] == '\0') && (first[1] == '0'))
89 gedcom_debug_print(_("Two-byte encoding, high-low"));
90 if (fseek(f, 0, 0) != 0)
91 gedcom_warning(_("Error positioning input file: %s"), strerror(errno));
94 else if ((first[0] == '\xFE') && (first[1] == '\xFF'))
/* No fseek() is visible in this branch; presumably the byte order mark
   is meant to stay consumed, as in the low-high BOM branch below --
   TODO confirm. */
96 gedcom_debug_print(_("Two-byte encoding, high-low, with BOM"));
99 else if ((first[0] == '0') && (first[1] == '\0'))
101 gedcom_debug_print(_("Two-byte encoding, low-high"));
102 if (fseek(f, 0, 0) != 0)
103 gedcom_warning(_("Error positioning input file: %s"), strerror(errno));
104 return TWO_BYTE_LOHI;
106 else if ((first[0] == '\xFF') && (first[1] == '\xFE'))
/* The stream is deliberately left after the two BOM bytes: nothing
   rewinds it before the return. */
108 gedcom_debug_print(_("Two-byte encoding, low-high, with BOM"));
109 return TWO_BYTE_LOHI;
/* Fallback: none of the patterns matched. */
112 gedcom_warning(_("Unknown encoding, falling back to one-byte"));
113 if (fseek(f, 0, 0) != 0)
114 gedcom_warning(_("Error positioning input file: %s"), strerror(errno));
/* NOTE(review): the header of the function containing this call is not
   visible in this extract, and update_gconv_search_path() is defined
   elsewhere.  Presumably it adjusts where character-set conversion
   modules are looked up -- confirm against its definition. */
124 update_gconv_search_path();
/* Parse the GEDCOM file named FILE_NAME.

   Visible sequence of steps:
     1. remember the current locale and message domain;
     2. switch to the locale from the environment and select this
        package's message catalogue, with messages delivered in
        INTERNAL_ENCODING;
     3. open the file, detect its encoding with determine_encoding() and
        set up the matching lexer with lexer_init();
     4. run gedcom_parse(), then check_xref_table();
     5. restore the message domain and locale saved in step 1.

   Every failure seen here is reported through gedcom_error().

   NOTE(review): most of the conditions guarding these steps, the meaning
   of the returned int, and the cleanup (closing the file, closing the
   lexer, releasing save_locale) are not visible in this extract --
   confirm them against the full file. */
127 int gedcom_parse_file(const char* file_name)
132 char *locale, *save_locale, *save_textdom;
/* Passing NULL only queries the current locale; nothing is changed. */
134 locale = setlocale(LC_ALL, NULL);
136 gedcom_error(_("Could not retrieve locale information"));
/* The string returned by setlocale() may be overwritten by a later
   setlocale() call, so a private copy is kept for the restore step.
   NOTE(review): a check of the strdup() result and the matching free()
   are not visible here -- confirm both exist. */
140 save_locale = strdup(locale);
/* Passing NULL only queries the current message domain.
   NOTE(review): unlike the locale, this pointer is not copied.  It refers
   to storage owned by the gettext implementation; confirm it is still
   valid after the textdomain(PACKAGE) call below, otherwise the restore
   step uses a stale pointer. */
146 save_textdom = textdomain(NULL);
148 gedcom_error(_("Could not retrieve locale domain: %s"), strerror(errno));
/* Any single failing call aborts the whole locale switch. */
152 if (! setlocale(LC_ALL, "")
153 || ! bindtextdomain(PACKAGE, LOCALEDIR)
154 || ! bind_textdomain_codeset(PACKAGE, INTERNAL_ENCODING)
155 || ! textdomain(PACKAGE)) {
156 gedcom_error(_("Could not set locale: %s"), strerror(errno));
/* The condition that triggers this error is not visible in this extract. */
161 gedcom_error(_("Internal error: GEDCOM parser not initialized"));
/* NOTE(review): the file is opened in text mode although two-byte
   encodings are supported; on platforms whose text mode translates line
   endings, "rb" may be required -- confirm. */
164 file = fopen(file_name, "r");
166 gedcom_error(_("Could not open file '%s': %s"),
167 file_name, strerror(errno));
171 enc = determine_encoding(file);
/* Parsing only proceeds when lexer_init() returns non-zero. */
173 if (lexer_init(enc, file)) {
176 result = gedcom_parse();
/* result is assigned a second time here; the condition deciding whether
   the cross-reference check runs is not visible -- TODO confirm. */
179 result = check_xref_table();
/* Put back the message domain and locale remembered at the start. */
186 if (! textdomain(save_textdom)
187 || ! setlocale(LC_ALL, save_locale)) {
188 gedcom_error(_("Could not restore locale: %s"), strerror(errno));
/* Parse the file named by NEW_MODEL_FILE through gedcom_parse_file().

   Two locations are visible: the bare name NEW_MODEL_FILE, which is first
   probed with fopen() and then parsed by name, and the path
   "<PKGDATADIR>/<NEW_MODEL_FILE>", which is assembled in a heap buffer
   and parsed.

   NOTE(review): the branching that chooses between the two locations,
   the closing of the probe handle, and the return statement are not
   visible in this extract -- confirm them against the full file. */
195 int gedcom_new_model()
/* Probe only: the parse below reopens the file by name. */
200 file = fopen(NEW_MODEL_FILE, "r");
203 result = gedcom_parse_file(NEW_MODEL_FILE);
/* NOTE(review): the rest of the size expression is cut off here.  The
   buffer must hold both strings plus the '/' separator and the
   terminating NUL, i.e. the two strlen() values plus 2.  Also confirm
   that the malloc() result is checked and that filename is freed after
   use. */
206 char* filename = (char*) malloc(strlen(PKGDATADIR) + strlen(NEW_MODEL_FILE)
211 sprintf(filename, "%s/%s", PKGDATADIR, NEW_MODEL_FILE);
212 result = gedcom_parse_file(filename);