BEGIN;
INSERT INTO config.upgrade_log (version) VALUES ('0035'); -- miker
CREATE FUNCTION version_specific_xpath () RETURNS TEXT AS $wrapper_function$
DECLARE
out_text TEXT;
BEGIN
IF REGEXP_REPLACE(VERSION(),E'^.+?(\\d+\\.\\d+).*?$',E'\\1')::FLOAT < 8.3 THEN
out_text := 'Creating XPath functions that work like the native XPATH function in 8.3+';
EXECUTE $create_82_funcs$
CREATE OR REPLACE FUNCTION oils_xpath ( xpath TEXT, xml TEXT, ns ANYARRAY ) RETURNS TEXT[] AS $func$
DECLARE
node_text TEXT;
ns_regexp TEXT;
munged_xpath TEXT;
BEGIN
munged_xpath := xpath;
IF ns IS NOT NULL THEN
FOR namespace IN 1 .. array_upper(ns, 1) LOOP
munged_xpath := REGEXP_REPLACE(
munged_xpath,
E'(' || ns[namespace][1] || E'):(\\w+)',
E'*[local-name() = "\\2" and namespace-uri() = "' || ns[namespace][2] || E'"]',
'g'
);
END LOOP;
munged_xpath := REGEXP_REPLACE( munged_xpath, E'\\]\\[(\\D)',E' and \\1', 'g');
END IF;
node_text := xpath_nodeset(xml, munged_xpath, 'XXX_OILS_NODESET');
node_text := REGEXP_REPLACE(node_text,'^', '');
node_text := REGEXP_REPLACE(node_text,'$', '');
RETURN STRING_TO_ARRAY(node_text, '');
END;
$func$ LANGUAGE PLPGSQL;
CREATE OR REPLACE FUNCTION oils_xpath ( TEXT, TEXT ) RETURNS TEXT[] AS 'SELECT oils_xpath( $1, $2, NULL::TEXT[] );' LANGUAGE SQL;
$create_82_funcs$;
ELSE
out_text := 'Creating XPath wrapper functions around the native XPATH function in 8.3+';
EXECUTE $create_83_funcs$
-- 8.3 or after
CREATE OR REPLACE FUNCTION oils_xpath ( TEXT, TEXT, ANYARRAY ) RETURNS TEXT[] AS 'SELECT XPATH( $1, $2::XML, $3 )::TEXT[];' LANGUAGE SQL;
CREATE OR REPLACE FUNCTION oils_xpath ( TEXT, TEXT ) RETURNS TEXT[] AS 'SELECT XPATH( $1, $2::XML )::TEXT[];' LANGUAGE SQL;
$create_83_funcs$;
END IF;
RETURN out_text;
END;
$wrapper_function$ LANGUAGE PLPGSQL;
SELECT version_specific_xpath();
DROP FUNCTION version_specific_xpath();
CREATE TYPE metabib.field_entry_template AS (
field_class TEXT,
field INT,
source BIGINT,
value TEXT
);
CREATE OR REPLACE FUNCTION biblio.extract_metabib_field_entry ( rid BIGINT, default_joiner TEXT ) RETURNS SETOF metabib.field_entry_template AS $func$
DECLARE
bib biblio.record_entry%ROWTYPE;
idx config.metabib_field%ROWTYPE;
xfrm config.xml_transform%ROWTYPE;
prev_xfrm TEXT;
transformed_xml TEXT;
xml_node TEXT;
xml_node_list TEXT[];
raw_text TEXT;
joiner TEXT := default_joiner; -- XXX will index defs supply a joiner?
output_row metabib.field_entry_template%ROWTYPE;
BEGIN
-- Get the record
SELECT INTO bib * FROM biblio.record_entry WHERE id = rid;
-- Loop over the indexing entries
FOR idx IN SELECT * FROM config.metabib_field ORDER BY format LOOP
SELECT INTO xfrm * from config.xml_transform WHERE name = idx.format;
-- See if we can skip the XSLT ... it's expensive
IF prev_xfrm IS NULL OR prev_xfrm <> xfrm.name THEN
-- Can't skip the transform
IF xfrm.xslt <> '---' THEN
transformed_xml := xslt_process(bib.marc,xfrm.xslt);
ELSE
transformed_xml := bib.marc;
END IF;
prev_xfrm := xfrm.name;
END IF;
xml_node_list := oils_xpath( idx.xpath, transformed_xml, ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]] );
raw_text := NULL;
FOR xml_node IN SELECT x FROM explode_array(xml_node_list) AS x LOOP
IF raw_text IS NOT NULL THEN
raw_text := raw_text || joiner;
END IF;
raw_text := COALESCE(raw_text,'') || ARRAY_TO_STRING(oils_xpath( '//text()', xml_node ), ' ');
END LOOP;
CONTINUE WHEN raw_text IS NULL;
output_row.field_class = idx.field_class;
output_row.field = idx.id;
output_row.source = rid;
output_row.value = BTRIM(REGEXP_REPLACE(raw_text, E'\\s+', ' ', 'gs'));
RETURN NEXT output_row;
END LOOP;
END;
$func$ LANGUAGE PLPGSQL;
-- default to a space joiner
CREATE OR REPLACE FUNCTION biblio.extract_metabib_field_entry ( BIGINT ) RETURNS SETOF metabib.field_entry_template AS $func$
SELECT * FROM biblio.extract_metabib_field_entry($1, ' ');
$func$ LANGUAGE SQL;
COMMIT;