+/* Test program for the Gedcom library.
+ Copyright (C) 2001, 2002 The Genes Development Team
+ This file is part of the Gedcom parser library.
+ Contributed by Peter Verthez <Peter.Verthez@advalvas.be>, 2001.
+
+ The Gedcom parser library is free software; you can redistribute it
+ and/or modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The Gedcom parser library is distributed in the hope that it will be
+ useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the Gedcom parser library; if not, write to the
+ Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
+ 02111-1307 USA. */
+
/* $Id$ */
/* $Name$ */
+#include <stdio.h>
+#include <string.h>
+#include <stdlib.h>
+#include <stdarg.h>
+#include <locale.h>
+#include <errno.h>
+#include <iconv.h>
#include "gedcom.h"
+#include "utf8-locale.h"
+
+#define OUTFILE "testgedcom.out"
+FILE* outfile = NULL;
+int quiet = 0;
+
+void output(int to_stdout_too, char* format, ...)
+{
+ va_list ap;
+ va_start(ap, format);
+ if (outfile) {
+ vfprintf(outfile, format, ap);
+ }
+ if (to_stdout_too && !quiet) {
+ vprintf(format, ap);
+ }
+ va_end(ap);
+}
void show_help ()
{
printf("gedcom-parse test program for libgedcom\n\n");
- printf("Usage: gedcom-parse [options] file\n");
+ printf("Usage: testgedcom [options] file\n");
printf("Options:\n");
printf(" -h Show this help text\n");
printf(" -nc Disable compatibility mode\n");
printf(" -fn No fail on errors\n");
printf(" -dg Debug setting: only libgedcom debug messages\n");
printf(" -da Debug setting: libgedcom + yacc debug messages\n");
+ printf(" -2 Run the test parse 2 times instead of once\n");
+ printf(" -3 Run the test parse 3 times instead of once\n");
+ printf(" -q No output to standard output\n");
}
-int determine_encoding(FILE* f)
+Gedcom_ctxt header_start(int level, Gedcom_val xref, char *tag,
+ char *raw_value, int tag_value,
+ Gedcom_val parsed_value)
{
- char first[2];
+ output(1, "Header start\n");
+ return (Gedcom_ctxt)1;
+}
- fread(first, 1, 2, f);
- if ((first[0] == '0') && (first[1] == ' ')) {
- gedcom_warning("One-byte encoding");
- fseek(f, 0, 0);
- return ONE_BYTE;
- }
- else if ((first[0] == '\0') && (first[1] == '0'))
- {
- gedcom_warning("Two-byte encoding, high-low");
- fseek(f, 0, 0);
- return TWO_BYTE_HILO;
- }
- else if ((first[0] == '\xFE') && (first[1] == '\xFF'))
- {
- gedcom_warning("Two-byte encoding, high-low, with BOM");
- return TWO_BYTE_HILO;
- }
- else if ((first[0] == '0') && (first[1] == '\0'))
- {
- gedcom_warning("Two-byte encoding, low-high");
- fseek(f, 0, 0);
- return TWO_BYTE_LOHI;
- }
- else if ((first[0] == '\xFF') && (first[1] == '\xFE'))
- {
- gedcom_warning("Two-byte encoding, low-high, with BOM");
- return TWO_BYTE_LOHI;
- }
- else {
- gedcom_warning("Unknown encoding, falling back to one-byte");
- fseek(f, 0, 0);
- return ONE_BYTE;
- }
+void header_end(Gedcom_ctxt self)
+{
+ output(1, "Header end, context is %d\n", (int)self);
}
-int gedcom_xxx_parse(char* file_name)
+char family_xreftags[100][255];
+int family_nr = 1;
+
+Gedcom_ctxt family_start(int level, Gedcom_val xref, char *tag,
+ char *raw_value, int tag_value,
+ Gedcom_val parsed_value)
{
- ENCODING enc;
- FILE* file = fopen (file_name, "r");
- if (!file) {
- printf("Could not open file '%s'\n", file_name);
- exit(1);
- }
- enc = determine_encoding(file);
+ struct xref_value *xr = GEDCOM_XREF_PTR(xref);
+ output(1, "Family start, xref is %s\n", xr->string);
+ strcpy(family_xreftags[family_nr], xr->string);
+ xr->object = (Gedcom_ctxt)family_nr;
+ return (Gedcom_ctxt)(family_nr++);
+}
- if (enc == ONE_BYTE) {
- gedcom_in = file;
- return gedcom_parse();
- }
- else {
- printf("No parser yet for encoding\n");
- exit(1);
- }
+Gedcom_ctxt rec_start(int level, Gedcom_val xref, char *tag,
+ char *raw_value, int tag_value,
+ Gedcom_val parsed_value)
+{
+ char* xref_str = NULL;
+ if (! GEDCOM_IS_NULL(xref))
+ xref_str = GEDCOM_XREF_PTR(xref)->string;
+ output(1, "Rec %s start, xref is %s\n", tag, xref_str);
+ return (Gedcom_ctxt)tag_value;
+}
+
+Gedcom_ctxt note_start(int level, Gedcom_val xref, char *tag,
+ char *raw_value, int tag_value,
+ Gedcom_val parsed_value)
+{
+ output(1, "== %d %s (%d) %s (xref is %s)\n",
+ level, tag, tag_value, GEDCOM_STRING(parsed_value),
+ GEDCOM_XREF_PTR(xref)->string);
+ return (Gedcom_ctxt)tag_value;
+}
+
+void family_end(Gedcom_ctxt self)
+{
+ output(1, "Family end, xref is %s\n", family_xreftags[(int)self]);
+}
+
+Gedcom_ctxt submit_start(int level, Gedcom_val xref, char *tag,
+ char *raw_value, int tag_value,
+ Gedcom_val parsed_value)
+{
+ output(1, "Submitter, xref is %s\n", GEDCOM_XREF_PTR(xref)->string);
+ return (Gedcom_ctxt)10000;
+}
+
+Gedcom_ctxt source_start(Gedcom_ctxt parent, int level, char *tag,
+ char* raw_value,
+ int tag_value, Gedcom_val parsed_value)
+{
+ Gedcom_ctxt self = (Gedcom_ctxt)((int) parent + 1000);
+ output(1, "Source is %s (ctxt is %d, parent is %d)\n",
+ GEDCOM_STRING(parsed_value), (int) self, (int) parent);
+ return self;
+}
+
+void source_end(Gedcom_ctxt parent, Gedcom_ctxt self, Gedcom_val parsed_value)
+{
+ output(1, "Source context %d in parent %d\n", (int)self, (int)parent);
+}
+
+Gedcom_ctxt source_date_start(Gedcom_ctxt parent, int level, char *tag,
+ char* raw_value,
+ int tag_value, Gedcom_val parsed_value)
+{
+ struct date_value dv;
+ Gedcom_ctxt self = (Gedcom_ctxt)((int) parent + 1000);
+ dv = GEDCOM_DATE(parsed_value);
+ output(1, "Contents of the date_value:\n");
+ output(1, " raw value: %s\n", raw_value);
+ output(1, " type: %d\n", dv.type);
+ output(1, " date1:\n");
+ output(1, " calendar type: %d\n", dv.date1.cal);
+ output(1, " day: %s\n", dv.date1.day_str);
+ output(1, " month: %s\n", dv.date1.month_str);
+ output(1, " year: %s\n", dv.date1.year_str);
+ output(1, " date type: %d\n", dv.date1.type);
+ output(1, " sdn1: %ld\n", dv.date1.sdn1);
+ output(1, " sdn2: %ld\n", dv.date1.sdn2);
+ output(1, " date2:\n");
+ output(1, " calendar type: %d\n", dv.date2.cal);
+ output(1, " day: %s\n", dv.date2.day_str);
+ output(1, " month: %s\n", dv.date2.month_str);
+ output(1, " year: %s\n", dv.date2.year_str);
+ output(1, " date type: %d\n", dv.date2.type);
+ output(1, " sdn1: %ld\n", dv.date2.sdn1);
+ output(1, " sdn2: %ld\n", dv.date2.sdn2);
+ output(1, " phrase: %s\n", dv.phrase);
+ return self;
+}
+
+void default_cb(Gedcom_ctxt ctxt, int level, char *tag, char *raw_value,
+ int tag_value)
+{
+ char *converted = NULL;
+ int conv_fails = 0;
+ if (raw_value)
+ converted = convert_utf8_to_locale(raw_value, &conv_fails);
+ output(0, "== %d %s (%d) %s (ctxt is %d, conversion failures: %d)\n",
+ level, tag, tag_value, converted, (int)ctxt, conv_fails);
+}
+
+void subscribe_callbacks()
+{
+ gedcom_subscribe_to_record(REC_HEAD, header_start, header_end);
+ gedcom_subscribe_to_record(REC_FAM, family_start, family_end);
+ gedcom_subscribe_to_record(REC_INDI, rec_start, NULL);
+ gedcom_subscribe_to_record(REC_OBJE, rec_start, NULL);
+ gedcom_subscribe_to_record(REC_NOTE, note_start, NULL);
+ gedcom_subscribe_to_record(REC_REPO, rec_start, NULL);
+ gedcom_subscribe_to_record(REC_SOUR, rec_start, NULL);
+ gedcom_subscribe_to_record(REC_SUBN, rec_start, NULL);
+ gedcom_subscribe_to_record(REC_SUBM, submit_start, NULL);
+ gedcom_subscribe_to_record(REC_USER, rec_start, NULL);
+ gedcom_subscribe_to_element(ELT_HEAD_SOUR, source_start, source_end);
+ gedcom_subscribe_to_element(ELT_SOUR_DATA_EVEN_DATE,
+ source_date_start, NULL);
+}
+
+void gedcom_message_handler(Gedcom_msg_type type, char *msg)
+{
+ if (type == MESSAGE)
+ output(1, "MESSAGE: ");
+ else if (type == WARNING)
+ output(1, "WARNING: ");
+ else if (type == ERROR)
+ output(1, "ERROR: ");
+ output(1, "%s\n", msg);
}
int main(int argc, char* argv[])
{
- MECHANISM mech = IMMED_FAIL;
+ Gedcom_err_mech mech = IMMED_FAIL;
int compat_enabled = 1;
int debug_level = 0;
+ int run_times = 1;
+ int result = 0;
char* file_name = NULL;
if (argc > 1) {
show_help();
exit(1);
}
+ else if (!strncmp(argv[i], "-2", 3)) {
+ run_times = 2;
+ }
+ else if (!strncmp(argv[i], "-3", 3)) {
+ run_times = 3;
+ }
+ else if (!strncmp(argv[i], "-q", 3)) {
+ quiet = 1;
+ }
else if (strncmp(argv[i], "-", 1)) {
file_name = argv[i];
break;
exit(1);
}
- gedcom_set_debug_level(debug_level);
+ setlocale(LC_ALL, "");
+ gedcom_set_debug_level(debug_level, NULL);
gedcom_set_compat_handling(compat_enabled);
gedcom_set_error_handling(mech);
+ gedcom_set_message_handler(gedcom_message_handler);
+ gedcom_set_default_callback(default_cb);
- if (gedcom_xxx_parse(file_name) == 0) {
- printf("Parse succeeded\n");
+ subscribe_callbacks();
+ outfile = fopen(OUTFILE, "a");
+ if (!outfile) {
+ printf("Could not open %s for appending\n", OUTFILE);
+ }
+ while (run_times-- > 0) {
+ output(0, "\n=== Parsing file %s\n", file_name);
+ result |= gedcom_parse_file(file_name);
+ }
+ fclose(outfile);
+ if (result == 0) {
+ output(1, "Parse succeeded\n");
return 0;
}
else {
- printf("Parse failed\n");
+ output(1, "Parse failed\n");
return 1;
}
}
-
-int gedcom_warning(char* s, ...)
-{
- int res;
- va_list ap;
-
- va_start(ap, s);
- fprintf(stderr, "Warning on line %d: ", line_no);
- res = vfprintf(stderr, s, ap);
- fprintf(stderr, "\n");
- va_end(ap);
-
- return res;
-}
-
-int gedcom_error(char* s, ...)
-{
- int res;
- va_list ap;
-
- va_start(ap, s);
- fprintf(stderr, "Error on line %d: ", line_no);
- res = vfprintf(stderr, s, ap);
- fprintf(stderr, "\n");
- va_end(ap);
-
- return res;
-}