]> git.tdb.fi Git - ext/subsurface.git/blobdiff - parse.c
Start moving some of the non-parsing stuff out of 'parse.c'
[ext/subsurface.git] / parse.c
diff --git a/parse.c b/parse.c
index 2321f7d13a890b4fc085e818ce57ad9cf791654a..1a8e3ba6113064fb71a8273483941678f814df8c 100644 (file)
--- a/parse.c
+++ b/parse.c
@@ -1,9 +1,374 @@
 #include <stdio.h>
 #include <ctype.h>
 #include <string.h>
+#include <stdlib.h>
+#include <errno.h>
+#include <time.h>
 #include <libxml/parser.h>
 #include <libxml/tree.h>
 
+#include "dive.h"
+
+int verbose;
+
+struct dive_table dive_table;
+
+/*
+ * Add a dive into the dive_table array
+ */
+static void record_dive(struct dive *dive)
+{
+       int nr = dive_table.nr, allocated = dive_table.allocated;
+       struct dive **dives = dive_table.dives;
+
+       if (nr >= allocated) {
+               allocated = (nr + 32) * 3 / 2;
+               dives = realloc(dives, allocated * sizeof(struct dive *));
+               if (!dives)
+                       exit(1);
+               dive_table.dives = dives;
+               dive_table.allocated = allocated;
+       }
+       dives[nr] = dive;
+       dive_table.nr = nr+1;
+}
+
+static void nonmatch(const char *type, const char *fullname, const char *name, char *buffer)
+{
+       if (verbose > 1)
+               printf("Unable to match %s '(%.*s)%s' (%s)\n", type,
+                       (int) (name - fullname), fullname, name,
+                       buffer);
+       free(buffer);
+}
+
+static const char *last_part(const char *name)
+{
+       const char *p = strrchr(name, '.');
+       return p ? p+1 : name;
+}
+
+typedef void (*matchfn_t)(char *buffer, void *);
+
+static int match(const char *pattern, const char *name, matchfn_t fn, char *buf, void *data)
+{
+       if (strcasecmp(pattern, name))
+               return 0;
+       fn(buf, data);
+       return 1;
+}
+
+/*
+ * Dive info as it is being built up..
+ */
+static int alloc_samples;
+static struct dive *dive;
+static struct sample *sample;
+static struct tm tm;
+
+static time_t utc_mktime(struct tm *tm)
+{
+       static const int mdays[] = {
+           0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334
+       };
+       int year = tm->tm_year;
+       int month = tm->tm_mon;
+       int day = tm->tm_mday;
+
+       /* First normalize relative to 1900 */
+       if (year < 70)
+               year += 100;
+       else if (year > 1900)
+               year -= 1900;
+
+       /* Normalized to Jan 1, 1970: unix time */
+       year -= 70;
+
+       if (year < 0 || year > 129) /* algo only works for 1970-2099 */
+               return -1;
+       if (month < 0 || month > 11) /* array bounds */
+               return -1;
+       if (month < 2 || (year + 2) % 4)
+               day--;
+       if (tm->tm_hour < 0 || tm->tm_min < 0 || tm->tm_sec < 0)
+               return -1;
+       return (year * 365 + (year + 1) / 4 + mdays[month] + day) * 24*60*60UL +
+               tm->tm_hour * 60*60 + tm->tm_min * 60 + tm->tm_sec;
+}
+
+static void divedate(char *buffer, void *_when)
+{
+       int d,m,y;
+       time_t *when = _when;
+
+       if (sscanf(buffer, "%d.%d.%d", &d, &m, &y) == 3) {
+               tm.tm_year = y;
+               tm.tm_mon = m-1;
+               tm.tm_mday = d;
+               if (tm.tm_sec | tm.tm_min | tm.tm_hour)
+                       *when = utc_mktime(&tm);
+       }
+       free(buffer);
+}
+
+static void divetime(char *buffer, void *_when)
+{
+       int h,m,s = 0;
+       time_t *when = _when;
+
+       if (sscanf(buffer, "%d:%d:%d", &h, &m, &s) >= 2) {
+               tm.tm_hour = h;
+               tm.tm_min = m;
+               tm.tm_sec = s;
+               if (tm.tm_year)
+                       *when = utc_mktime(&tm);
+       }
+       free(buffer);
+}
+
+/* Libdivecomputer: "2011-03-20 10:22:38" */
+static void divedatetime(char *buffer, void *_when)
+{
+       int y,m,d;
+       int hr,min,sec;
+       time_t *when = _when;
+
+       if (sscanf(buffer, "%d-%d-%d %d:%d:%d",
+               &y, &m, &d, &hr, &min, &sec) == 6) {
+               tm.tm_year = y;
+               tm.tm_mon = m-1;
+               tm.tm_mday = d;
+               tm.tm_hour = hr;
+               tm.tm_min = min;
+               tm.tm_sec = sec;
+               *when = utc_mktime(&tm);
+       }
+       free(buffer);
+}
+
+union int_or_float {
+       long i;
+       double fp;
+};
+
+enum number_type {
+       NEITHER,
+       INTEGER,
+       FLOAT
+};
+
+static enum number_type integer_or_float(char *buffer, union int_or_float *res)
+{
+       char *end;
+       long val;
+       double fp;
+
+       /* Integer or floating point? */
+       val = strtol(buffer, &end, 10);
+       if (val < 0 || end == buffer)
+               return NEITHER;
+
+       /* Looks like it might be floating point? */
+       if (*end == '.') {
+               errno = 0;
+               fp = strtod(buffer, &end);
+               if (!errno) {
+                       res->fp = fp;
+                       return FLOAT;
+               }
+       }
+
+       res->i = val;
+       return INTEGER;
+}
+
+static void pressure(char *buffer, void *_press)
+{
+       pressure_t *pressure = _press;
+       union int_or_float val;
+
+       switch (integer_or_float(buffer, &val)) {
+       case FLOAT:
+               /* Maybe it's in Bar? */
+               if (val.fp < 500.0) {
+                       pressure->mbar = val.fp * 1000;
+                       break;
+               }
+               printf("Unknown fractional pressure reading %s\n", buffer);
+               break;
+
+       case INTEGER:
+               /*
+                * Random integer? Maybe in PSI? Or millibar already?
+                *
+                * We assume that 5 bar is a ridiculous tank pressure,
+                * so if it's smaller than 5000, it's in PSI..
+                */
+               if (val.i < 5000) {
+                       pressure->mbar = val.i * 68.95;
+                       break;
+               }
+               pressure->mbar = val.i;
+               break;
+       default:
+               printf("Strange pressure reading %s\n", buffer);
+       }
+       free(buffer);
+}
+
+static void depth(char *buffer, void *_depth)
+{
+       depth_t *depth = _depth;
+       union int_or_float val;
+
+       switch (integer_or_float(buffer, &val)) {
+       /* Integer values are probably in feet */
+       case INTEGER:
+               depth->mm = 304.8 * val.i;
+               break;
+       /* Float? Probably meters.. */
+       case FLOAT:
+               depth->mm = val.fp * 1000;
+               break;
+       default:
+               printf("Strange depth reading %s\n", buffer);
+       }
+       free(buffer);
+}
+
+static void temperature(char *buffer, void *_temperature)
+{
+       temperature_t *temperature = _temperature;
+       union int_or_float val;
+
+       switch (integer_or_float(buffer, &val)) {
+       /* C or F? Who knows? Let's default to Celsius */
+       case INTEGER:
+               val.fp = val.i;
+               /* Fallthrough */
+       case FLOAT:
+               /* Ignore zero. It means "none" */
+               if (!val.fp)
+                       break;
+               /* Celsius */
+               if (val.fp < 50.0) {
+                       temperature->mkelvin = (val.fp + 273.16) * 1000;
+                       break;
+               }
+               /* Fahrenheit */
+               if (val.fp < 212.0) {
+                       temperature->mkelvin = (val.fp + 459.67) * 5000/9;
+                       break;
+               }
+               /* Kelvin or already millikelvin */
+               if (val.fp < 1000.0)
+                       val.fp *= 1000;
+               temperature->mkelvin = val.fp;
+               break;
+       default:
+               printf("Strange temperature reading %s\n", buffer);
+       }
+       free(buffer);
+}
+
+static void sampletime(char *buffer, void *_time)
+{
+       int i;
+       int min, sec;
+       duration_t *time = _time;
+
+       i = sscanf(buffer, "%d:%d", &min, &sec);
+       switch (i) {
+       case 1:
+               sec = min;
+               min = 0;
+       /* fallthrough */
+       case 2:
+               time->seconds = sec + min*60;
+               break;
+       default:
+               printf("Strange sample time reading %s\n", buffer);
+       }
+       free(buffer);
+}
+
+static void duration(char *buffer, void *_time)
+{
+       sampletime(buffer, _time);
+}
+
+static void ignore(char *buffer, void *_time)
+{
+}
+
+/* We're in samples - try to convert the random xml value to something useful */
+static void try_to_fill_sample(struct sample *sample, const char *name, char *buf)
+{
+       const char *last = last_part(name);
+
+       if (match("pressure", last, pressure, buf, &sample->tankpressure))
+               return;
+       if (match("cylpress", last, pressure, buf, &sample->tankpressure))
+               return;
+       if (match("depth", last, depth, buf, &sample->depth))
+               return;
+       if (match("temperature", last, temperature, buf, &sample->temperature))
+               return;
+       if (match("sampletime", last, sampletime, buf, &sample->time))
+               return;
+       if (match("time", last, sampletime, buf, &sample->time))
+               return;
+
+       nonmatch("sample", name, last, buf);
+}
+
+/* We're in the top-level dive xml. Try to convert whatever value to a dive value */
+static void try_to_fill_dive(struct dive *dive, const char *name, char *buf)
+{
+       const char *last = last_part(name);
+
+       if (match("date", last, divedate, buf, &dive->when))
+               return;
+       if (match("time", last, divetime, buf, &dive->when))
+               return;
+       if (match("datetime", last, divedatetime, buf, &dive->when))
+               return;
+       if (match("maxdepth", last, depth, buf, &dive->maxdepth))
+               return;
+       if (match("meandepth", last, depth, buf, &dive->meandepth))
+               return;
+       if (match("divetime", last, duration, buf, &dive->duration))
+               return;
+       if (match("divetimesec", last, duration, buf, &dive->duration))
+               return;
+       if (match("surfacetime", last, duration, buf, &dive->surfacetime))
+               return;
+       if (match("airtemp", last, temperature, buf, &dive->airtemp))
+               return;
+       if (match("watertemp", last, temperature, buf, &dive->watertemp))
+               return;
+       if (match("cylinderstartpressure", last, pressure, buf, &dive->beginning_pressure))
+               return;
+       if (match("cylinderendpressure", last, pressure, buf, &dive->end_pressure))
+               return;
+       if (match("divenumber", last, ignore, buf, NULL))
+               return;
+       if (match("diveseries", last, ignore, buf, NULL))
+               return;
+       if (match("number", last, ignore, buf, NULL))
+               return;
+       if (match("size", last, ignore, buf, NULL))
+               return;
+       if (match("fingerprint", last, ignore, buf, NULL))
+               return;
+       nonmatch("dive", name, last, buf);
+}
+
+static unsigned int dive_size(int samples)
+{
+       return sizeof(struct dive) + samples*sizeof(struct sample);
+}
+
 /*
  * File boundaries are dive boundaries. But sometimes there are
  * multiple dives per file, so there can be other events too that
  */
 static void dive_start(void)
 {
-       printf("---\n");
+       unsigned int size;
+
+       if (dive)
+               return;
+
+       alloc_samples = 5;
+       size = dive_size(alloc_samples);
+       dive = malloc(size);
+       if (!dive)
+               exit(1);
+       memset(dive, 0, size);
+       memset(&tm, 0, sizeof(tm));
 }
 
 static void dive_end(void)
 {
+       if (!dive)
+               return;
+       record_dive(dive);
+       dive = NULL;
 }
 
 static void sample_start(void)
 {
-       printf("Sample:\n");
+       int nr;
+
+       if (!dive)
+               return;
+       nr = dive->samples;
+       if (nr >= alloc_samples) {
+               unsigned int size;
+
+               alloc_samples = (alloc_samples * 3)/2 + 10;
+               size = dive_size(alloc_samples);
+               dive = realloc(dive, size);
+               if (!dive)
+                       return;
+       }
+       sample = dive->sample + nr;
+       memset(sample, 0, sizeof(*sample));
 }
 
 static void sample_end(void)
 {
+       sample = NULL;
+       if (!dive)
+               return;
+       dive->samples++;
 }
 
-static void entry(const char *name, int size, const char *buffer)
+static void entry(const char *name, int size, const char *raw)
 {
-       printf("%s: %.*s\n", name, size, buffer);
+       char *buf = malloc(size+1);
+
+       if (!buf)
+               return;
+       memcpy(buf, raw, size);
+       buf[size] = 0;
+       if (sample) {
+               try_to_fill_sample(sample, name, buf);
+               return;
+       }
+       if (dive) {
+               try_to_fill_dive(dive, name, buf);
+               return;
+       }
 }
 
 static const char *nodename(xmlNode *node, char *buf, int len)
 {
-       /* Don't print out the node name if it is "text" */
-       if (!strcmp(node->name, "text")) {
-               node = node->parent;
-               if (!node || !node->name)
-                       return "root";
-       }
+       if (!node || !node->name)
+               return "root";
 
        buf += len;
        *--buf = 0;
@@ -89,6 +497,10 @@ static void visit_one_node(xmlNode *node)
        if (!len)
                return;
 
+       /* Don't print out the node name if it is "text" */
+       if (!strcmp(node->name, "text"))
+               node = node->parent;
+
        name = nodename(node, buffer, sizeof(buffer));
 
        entry(name, len, content);
@@ -126,7 +538,7 @@ static void traverse(xmlNode *node)
        }
 }
 
-static void parse(const char *filename)
+void parse_xml_file(const char *filename)
 {
        xmlDoc *doc;
 
@@ -143,13 +555,7 @@ static void parse(const char *filename)
        xmlCleanupParser();
 }
 
-int main(int argc, char **argv)
+void parse_xml_init(void)
 {
-       int i;
-
        LIBXML_TEST_VERSION
-
-       for (i = 1; i < argc; i++)
-               parse(argv[i]);
-       return 0;
 }