22 #include "utils/builtins.h"
24 #include <libxml/tree.h>
25 #include <libxml/parser.h>
28 #include "../postgis_config.h"
29 #include "lwgeom_pg.h"
58 xmlNodePtr xmlroot = NULL;
60 if (PG_ARGISNULL(0)) PG_RETURN_NULL();
62 xml_input = PG_GETARG_TEXT_P(0);
63 xml = text_to_cstring(xml_input);
64 xml_size = VARSIZE_ANY_EXHDR(xml_input);
67 xmldoc = xmlReadMemory(xml, xml_size, NULL, NULL, 0);
69 if (!xmldoc || (xmlroot = xmlDocGetRootElement(xmldoc)) == NULL) {
72 lwpgerror(
"invalid MARC21/XML document.");
87 geom = geometry_serialize(lwgeom);
91 PG_RETURN_POINTER(geom);
97 const char *colon_pos;
98 const char *node_name;
101 if (!xn || xn->type != XML_ELEMENT_NODE)
107 node_name = (
const char*)xn->name;
108 colon_pos = strchr(node_name,
':');
110 node_name = colon_pos + 1;
112 return strcmp(node_name, xml_name) == 0;
121 if(literal == NULL)
return LW_FALSE;
123 literal_length = strlen(literal);
125 POSTGIS_DEBUGF(2,
"is_literal_valid called (%s)", literal);
127 if (literal_length < 3)
return LW_FALSE;
141 if (literal[0] ==
'N' || literal[0] ==
'E' || literal[0] ==
'S' || literal[0] ==
'W' || literal[0] ==
'+' || literal[0] ==
'-') {
143 if (literal_length < 4) {
144 POSTGIS_DEBUGF(3,
" invalid literal length (%d): \"%s\"", literal_length, literal);
151 for (
int j = coord_start; j < literal_length; j++) {
153 if (!isdigit(literal[j])) {
162 POSTGIS_DEBUGF(3,
" invalid character '%c' at the degrees section: \"%s\"", literal[j], literal);
171 if (literal[j] ==
'.' || literal[j] ==
',') {
175 if (num_dec_sep > 1)
return LW_FALSE;
178 POSTGIS_DEBUGF(3,
" invalid character '%c' in %d: \"%s\"", literal[j], j, literal);
187 POSTGIS_DEBUGF(2,
"=> is_literal_valid returns LW_TRUE for \"%s\"", literal);
209 size_t literal_length;
211 char start_character = literal[0];
212 int start_literal = 0;
215 const size_t numdigits_degrees = 3;
216 const size_t numdigits_minutes = 2;
217 const size_t numdigits_seconds = 2;
219 POSTGIS_DEBUGF(2,
"parse_geo_literal called (%s)", literal);
220 POSTGIS_DEBUGF(2,
" start character: %c", start_character);
222 literal_length = strlen(literal);
224 if (!isdigit(start_character)) start_literal = 1;
226 POSTGIS_DEBUGF(2,
" start_literal=%d", start_literal);
228 dgr = palloc(
sizeof(
char)*numdigits_degrees+1);
229 snprintf(dgr, numdigits_degrees+1,
"%s", &literal[start_literal]);
231 if (strchr(literal,
'.') == NULL && strchr(literal,
',') == NULL) {
244 POSTGIS_DEBUG(2,
" lat/lon integer coordinates detected");
245 POSTGIS_DEBUGF(2,
" parsed degrees (lon/lat): %s", dgr);
252 if (literal_length > (start_literal + numdigits_degrees)) {
254 min = palloc(
sizeof(
char)*numdigits_minutes+1);
255 snprintf(min, numdigits_minutes+1,
"%s", &literal[start_literal+numdigits_degrees]);
256 POSTGIS_DEBUGF(2,
" parsed minutes (lon/lat): %s", min);
261 if (literal_length >= (start_literal + numdigits_degrees + numdigits_minutes)) {
263 sec = palloc(
sizeof(
char)*numdigits_seconds+1);
264 snprintf(sec, numdigits_seconds+1,
"%s", &literal[start_literal+numdigits_degrees+numdigits_minutes]);
265 POSTGIS_DEBUGF(2,
" parsed seconds (lon/lat): %s", sec);
278 POSTGIS_DEBUG(2,
" decimal coordinates detected");
280 if (strchr(literal,
',')) {
285 literal[literal_length-strlen(strchr(literal,
','))]=
'.';
286 POSTGIS_DEBUGF(2,
" decimal separator changed to '.': %s",literal);
291 if (literal[start_literal + numdigits_degrees] ==
'.') {
302 char *dec = palloc(
sizeof(
char)*literal_length+1);
303 snprintf(dec, literal_length+1,
"%s", &literal[start_literal]);
306 POSTGIS_DEBUGF(2,
" parsed decimal degrees: %s", dec);
310 }
else if (literal[start_literal + numdigits_degrees + numdigits_minutes] ==
'.') {
321 size_t len_decimal_minutes = literal_length - (start_literal + numdigits_degrees);
323 min = palloc(
sizeof(
char)*len_decimal_minutes+1);
324 snprintf(min, len_decimal_minutes+1,
"%s", &literal[start_literal + numdigits_degrees]);
326 POSTGIS_DEBUGF(2,
" parsed degrees: %s", dgr);
327 POSTGIS_DEBUGF(2,
" parsed decimal minutes: %s", min);
329 result = atof(dgr) + (atof(min) / 60);
334 }
else if (literal[start_literal + numdigits_degrees + numdigits_minutes + numdigits_seconds] ==
'.') {
346 size_t len_decimal_seconds = literal_length - (start_literal + numdigits_degrees + numdigits_minutes);
348 min = palloc(
sizeof(
char)*numdigits_minutes+1);
349 snprintf(min, numdigits_minutes+1,
"%s", &literal[start_literal + numdigits_degrees]);
351 sec = palloc(
sizeof(
char)*len_decimal_seconds+1);
352 snprintf(sec, len_decimal_seconds+1,
"%s", &literal[start_literal + numdigits_degrees + numdigits_minutes]);
354 result = atof(dgr) + (atof(min) / 60) + (atof(sec) / 3600);
356 POSTGIS_DEBUGF(2,
" parsed degrees: %s", dgr);
357 POSTGIS_DEBUGF(2,
" parsed minutes: %s", min);
358 POSTGIS_DEBUGF(2,
" parsed decimal seconds: %s", sec);
373 if (start_character ==
'S' || start_character ==
'W' || start_character ==
'-') {
375 POSTGIS_DEBUGF(2,
" switching sign due to start character: '%c'", start_character);
388 xmlNodePtr datafield;
392 uint8_t geometry_type;
397 POSTGIS_DEBUGF(2,
"parse_marc21 called: root '<%s>'", xnode->name);
405 lwpgerror(
"invalid MARC21/XML document. Root element <record> expected but <%s> found.",xnode->name);
410 for (datafield = xnode->children; datafield != NULL; datafield = datafield->next) {
417 if (datafield->type != XML_ELEMENT_NODE)
continue;
419 if (!
is_xml_element(datafield,
"datafield") || xmlStrcmp(xmlGetProp(datafield, (xmlChar*)
"tag"),(xmlChar*)
"034") != 0)
continue;
421 POSTGIS_DEBUG(3,
" datafield found");
423 for (subfield = datafield->children; subfield != NULL; subfield = subfield->next) {
425 if (subfield->type != XML_ELEMENT_NODE)
continue;
429 code = (
char*) xmlGetProp(subfield, (xmlChar*)
"code");
431 if ((strcmp(code,
"d") != 0 &&
432 strcmp(code,
"e") != 0 &&
433 strcmp(code,
"f") != 0 &&
434 strcmp(code,
"g")) != 0)
437 literal = (
char*) xmlNodeGetContent(subfield);
439 POSTGIS_DEBUGF(3,
" subfield code '%s': %s", code, literal);
443 if (strcmp(code,
"d") == 0) lw = literal;
444 else if (strcmp(code,
"e") == 0) le = literal;
445 else if (strcmp(code,
"f") == 0) ln = literal;
446 else if (strcmp(code,
"g") == 0) ls = literal;
450 lwpgerror(
"parse error - invalid literal at 034$%s: \"%s\"", code, literal);
456 xmlFreeNode(subfield);
458 if (lw && le && ln && ls) {
466 if (ngeoms > 0) lwgeoms = (
LWGEOM**)
469 if (fabs(
w - e) < 0.0000001f && fabs(n -
s) < 0.0000001f) {
487 if (ngeoms && result_type != geometry_type) {
490 result_type = geometry_type;
497 if (lw || le || ln || ls) {
499 lwpgerror(
"parse error - the Coded Cartographic Mathematical Data (datafield:034) in the given MARC21/XML is incomplete. Coordinates for subfields \"$d\",\"$e\",\"$f\" and \"$g\" are expected.");
506 POSTGIS_DEBUG(5,
" xmlFreeNode(datafield)");
507 xmlFreeNode(datafield);
515 }
else if (ngeoms > 1) {
519 for (i = 0; i < ngeoms; i++) {
535 POSTGIS_DEBUG(2,
"=> parse_marc21 returns NULL");
char result[OUT_DOUBLE_BUFFER_SIZE]
LWPOINT * lwpoint_make2d(int32_t srid, double x, double y)
void lwgeom_free(LWGEOM *geom)
LWPOLY * lwpoly_construct_envelope(int32_t srid, double x1, double y1, double x2, double y2)
void * lwrealloc(void *mem, size_t size)
LWCOLLECTION * lwcollection_construct_empty(uint8_t type, int32_t srid, char hasz, char hasm)
const char * lwtype_name(uint8_t type)
Return the type name string associated with a type number (e.g. "Point", "Polygon").
void lwgeom_force_clockwise(LWGEOM *lwgeom)
Force Right-hand-rule on LWGEOM polygons.
LWCOLLECTION * lwcollection_add_lwgeom(LWCOLLECTION *col, const LWGEOM *geom)
Appends geom to the collection managed by col.
void * lwalloc(size_t size)
#define LW_TRUE
Return types for functions with status returns.
#define SRID_UNKNOWN
Unknown SRID value.
This library is the generic geometry handling section of PostGIS.
static bool is_xml_element(xmlNodePtr xn, const char *xml_name)
PG_FUNCTION_INFO_V1(ST_GeomFromMARC21)
static LWGEOM * parse_marc21(xmlNodePtr xnode)
Datum ST_GeomFromMARC21(PG_FUNCTION_ARGS)
static double parse_geo_literal(char *literal)
static int is_literal_valid(const char *literal)
static uint32_t lwgeom_get_type(const LWGEOM *geom)
Return LWTYPE number.