22 #include "utils/builtins.h"
24 #include <libxml/tree.h>
25 #include <libxml/parser.h>
28 #include "../postgis_config.h"
29 #include "lwgeom_pg.h"
58 xmlNodePtr xmlroot = NULL;
60 if (PG_ARGISNULL(0)) PG_RETURN_NULL();
62 xml_input = PG_GETARG_TEXT_P(0);
63 xml = text_to_cstring(xml_input);
64 xml_size = VARSIZE_ANY_EXHDR(xml_input);
67 xmldoc = xmlReadMemory(xml, xml_size, NULL, NULL, XML_PARSE_SAX1);
69 if (!xmldoc || (xmlroot = xmlDocGetRootElement(xmldoc)) == NULL) {
72 lwpgerror(
"invalid MARC21/XML document.");
87 geom = geometry_serialize(lwgeom);
91 PG_RETURN_POINTER(geom);
100 if(literal == NULL)
return LW_FALSE;
102 literal_length = strlen(literal);
104 POSTGIS_DEBUGF(2,
"is_literal_valid called (%s)", literal);
106 if (literal_length < 3)
return LW_FALSE;
120 if (literal[0] ==
'N' || literal[0] ==
'E' || literal[0] ==
'S' || literal[0] ==
'W' || literal[0] ==
'+' || literal[0] ==
'-') {
122 if (literal_length < 4) {
123 POSTGIS_DEBUGF(3,
" invalid literal length (%d): \"%s\"", literal_length, literal);
130 for (
int j = coord_start; j < literal_length; j++) {
132 if (!isdigit(literal[j])) {
141 POSTGIS_DEBUGF(3,
" invalid character '%c' at the degrees section: \"%s\"", literal[j], literal);
150 if (literal[j] ==
'.' || literal[j] ==
',') {
154 if (num_dec_sep > 1)
return LW_FALSE;
157 POSTGIS_DEBUGF(3,
" invalid character '%c' in %d: \"%s\"", literal[j], j, literal);
166 POSTGIS_DEBUGF(2,
"=> is_literal_valid returns LW_TRUE for \"%s\"", literal);
188 size_t literal_length;
190 char start_character = literal[0];
191 int start_literal = 0;
194 const size_t numdigits_degrees = 3;
195 const size_t numdigits_minutes = 2;
196 const size_t numdigits_seconds = 2;
198 POSTGIS_DEBUGF(2,
"parse_geo_literal called (%s)", literal);
199 POSTGIS_DEBUGF(2,
" start character: %c", start_character);
201 literal_length = strlen(literal);
203 if (!isdigit(start_character)) start_literal = 1;
205 POSTGIS_DEBUGF(2,
" start_literal=%d", start_literal);
207 dgr = palloc(
sizeof(
char)*numdigits_degrees+1);
208 snprintf(dgr, numdigits_degrees+1,
"%s", &literal[start_literal]);
210 if (strchr(literal,
'.') == NULL && strchr(literal,
',') == NULL) {
223 POSTGIS_DEBUG(2,
" lat/lon integer coordinates detected");
224 POSTGIS_DEBUGF(2,
" parsed degrees (lon/lat): %s", dgr);
231 if (literal_length > (start_literal + numdigits_degrees)) {
233 min = palloc(
sizeof(
char)*numdigits_minutes+1);
234 snprintf(min, numdigits_minutes+1,
"%s", &literal[start_literal+numdigits_degrees]);
235 POSTGIS_DEBUGF(2,
" parsed minutes (lon/lat): %s", min);
240 if (literal_length >= (start_literal + numdigits_degrees + numdigits_minutes)) {
242 sec = palloc(
sizeof(
char)*numdigits_seconds+1);
243 snprintf(sec, numdigits_seconds+1,
"%s", &literal[start_literal+numdigits_degrees+numdigits_minutes]);
244 POSTGIS_DEBUGF(2,
" parsed seconds (lon/lat): %s", sec);
257 POSTGIS_DEBUG(2,
" decimal coordinates detected");
259 if (strchr(literal,
',')) {
264 literal[literal_length-strlen(strchr(literal,
','))]=
'.';
265 POSTGIS_DEBUGF(2,
" decimal separator changed to '.': %s",literal);
270 if (literal[start_literal + numdigits_degrees] ==
'.') {
281 char *dec = palloc(
sizeof(
char)*literal_length+1);
282 snprintf(dec, literal_length+1,
"%s", &literal[start_literal]);
285 POSTGIS_DEBUGF(2,
" parsed decimal degrees: %s", dec);
289 }
else if (literal[start_literal + numdigits_degrees + numdigits_minutes] ==
'.') {
300 size_t len_decimal_minutes = literal_length - (start_literal + numdigits_degrees);
302 min = palloc(
sizeof(
char)*len_decimal_minutes+1);
303 snprintf(min, len_decimal_minutes+1,
"%s", &literal[start_literal + numdigits_degrees]);
305 POSTGIS_DEBUGF(2,
" parsed degrees: %s", dgr);
306 POSTGIS_DEBUGF(2,
" parsed decimal minutes: %s", min);
308 result = atof(dgr) + (atof(min) / 60);
313 }
else if (literal[start_literal + numdigits_degrees + numdigits_minutes + numdigits_seconds] ==
'.') {
325 size_t len_decimal_seconds = literal_length - (start_literal + numdigits_degrees + numdigits_minutes);
327 min = palloc(
sizeof(
char)*numdigits_minutes+1);
328 snprintf(min, numdigits_minutes+1,
"%s", &literal[start_literal + numdigits_degrees]);
330 sec = palloc(
sizeof(
char)*len_decimal_seconds+1);
331 snprintf(sec, len_decimal_seconds+1,
"%s", &literal[start_literal + numdigits_degrees + numdigits_minutes]);
333 result = atof(dgr) + (atof(min) / 60) + (atof(sec) / 3600);
335 POSTGIS_DEBUGF(2,
" parsed degrees: %s", dgr);
336 POSTGIS_DEBUGF(2,
" parsed minutes: %s", min);
337 POSTGIS_DEBUGF(2,
" parsed decimal seconds: %s", sec);
352 if (start_character ==
'S' || start_character ==
'W' || start_character ==
'-') {
354 POSTGIS_DEBUGF(2,
" switching sign due to start character: '%c'", start_character);
359 POSTGIS_DEBUGF(2,
"=> parse_geo_literal returns: %.*f (in decimal degrees)", literal_length-(3+start_literal),
result);
368 xmlNodePtr datafield;
372 uint8_t geometry_type;
377 POSTGIS_DEBUGF(2,
"parse_marc21 called: root '<%s>'", xnode->name);
384 if (xmlStrcmp(xnode->name, (xmlChar*)
"record")) lwpgerror(
"invalid MARC21/XML document. Root element <record> expected but <%s> found.",xnode->name);
389 for (datafield = xnode->children; datafield != NULL; datafield = datafield->next) {
396 if (datafield->type != XML_ELEMENT_NODE)
continue;
398 if (xmlStrcmp(datafield->name, (xmlChar*)
"datafield") != 0 || xmlStrcmp(xmlGetProp(datafield, (xmlChar*)
"tag"),(xmlChar*)
"034") != 0)
continue;
400 POSTGIS_DEBUG(3,
" datafield found");
402 for (subfield = datafield->children; subfield != NULL; subfield = subfield->next) {
404 if (subfield->type != XML_ELEMENT_NODE)
continue;
405 if (xmlStrcmp(subfield->name, (xmlChar*)
"subfield") != 0)
continue;
407 code = (
char*) xmlGetProp(subfield, (xmlChar*)
"code");
409 if ((strcmp(code,
"d") != 0 && strcmp(code,
"e") != 0 && strcmp(code,
"f") != 0 && strcmp(code,
"g")) != 0)
continue;
411 literal = (
char*) xmlNodeGetContent(subfield);
413 POSTGIS_DEBUGF(3,
" subfield code '%s': %s", code, literal);
417 if (strcmp(code,
"d") == 0) lw = literal;
418 else if (strcmp(code,
"e") == 0) le = literal;
419 else if (strcmp(code,
"f") == 0) ln = literal;
420 else if (strcmp(code,
"g") == 0) ls = literal;
424 lwpgerror(
"parse error - invalid literal at 034$%s: \"%s\"", code, literal);
430 xmlFreeNode(subfield);
432 if (lw && le && ln && ls) {
442 if (fabs(
w - e) < 0.0000001f && fabs(n -
s) < 0.0000001f) {
460 if (ngeoms && result_type != geometry_type) {
463 result_type = geometry_type;
470 if (lw || le || ln || ls) {
472 lwpgerror(
"parse error - the Coded Cartographic Mathematical Data (datafield:034) in the given MARC21/XML is incomplete. Coordinates for subfields \"$d\",\"$e\",\"$f\" and \"$g\" are expected.");
479 POSTGIS_DEBUG(5,
" xmlFreeNode(datafield)");
480 xmlFreeNode(datafield);
488 }
else if (ngeoms > 1) {
492 for (i = 0; i < ngeoms; i++) {
508 POSTGIS_DEBUG(2,
"=> parse_marc21 returns NULL");
char result[OUT_DOUBLE_BUFFER_SIZE]
LWPOINT * lwpoint_make2d(int32_t srid, double x, double y)
void lwgeom_free(LWGEOM *geom)
LWPOLY * lwpoly_construct_envelope(int32_t srid, double x1, double y1, double x2, double y2)
void * lwrealloc(void *mem, size_t size)
LWCOLLECTION * lwcollection_construct_empty(uint8_t type, int32_t srid, char hasz, char hasm)
const char * lwtype_name(uint8_t type)
Return the type name string associated with a type number (e.g.
void lwgeom_force_clockwise(LWGEOM *lwgeom)
Force Right-hand-rule on LWGEOM polygons.
LWCOLLECTION * lwcollection_add_lwgeom(LWCOLLECTION *col, const LWGEOM *geom)
Appends geom to the collection managed by col.
void * lwalloc(size_t size)
#define LW_TRUE
Return types for functions with status returns.
#define SRID_UNKNOWN
Unknown SRID value.
This library is the generic geometry handling section of PostGIS.
PG_FUNCTION_INFO_V1(ST_GeomFromMARC21)
static LWGEOM * parse_marc21(xmlNodePtr xnode)
Datum ST_GeomFromMARC21(PG_FUNCTION_ARGS)
static double parse_geo_literal(char *literal)
static int is_literal_valid(const char *literal)
static uint32_t lwgeom_get_type(const LWGEOM *geom)
Return LWTYPE number.