-- Evergreen.git (git.evergreen-ils.org)
-- File: Open-ILS/src/sql/Pg/upgrade/1301.schema.fix-bre-upgrade-issue.sql
-- LP#1864516: (follow-up) install current version of function
-- Open the transaction for this upgrade script; it is closed by the COMMIT
-- at the end of the file.
BEGIN;

-- Upgrade bookkeeping call, made before any schema change.  It is passed this
-- script's id ('1301') and the psql variable eg_version (:eg_version is psql
-- variable interpolation, so the script must be run through psql with that
-- variable set).
-- NOTE(review): the function is defined elsewhere; presumably it validates
-- and/or records the upgrade -- confirm against its definition.
SELECT evergreen.upgrade_deps_block_check('1301', :eg_version);

-- biblio.extract_metabib_field_entry
--
-- Extracts index values from one bibliographic record and returns them as a
-- set of metabib.field_entry_template rows.
--
-- Parameters:
--   rid            id of the row in biblio.record_entry to extract from.
--   default_joiner string used to join text fragments when the field
--                  definition has no joiner of its own (idx.joiner IS NULL).
--   field_types    list of uses the caller is interested in; the values tested
--                  here are 'display', 'browse', 'search' and 'facet'.
--   only_fields    ids of the config.metabib_field definitions to process
--                  (matched with id = ANY (only_fields)).
--
-- Behaviour:
--   * Definitions with a NULL or empty xpath are skipped.
--   * field_types only decides WHETHER a definition is processed: it is
--     processed when at least one use it enables is listed.  Once processed,
--     rows are emitted for every use the definition enables, whether or not
--     that use was listed in field_types.
--   * Per matched XML node: one browse row (field = idx.id, with sort_value
--     and optional authority link), one facet row and one display row (both
--     with field = -1 * idx.id), as enabled on the definition.
--   * Per definition: one search row (field = idx.id) whose value is the text
--     of all matched nodes joined with the joiner.
--   * Every emitted value has runs of whitespace collapsed to a single space
--     and is trimmed.
--
-- NOTE(review): output_row.authority is reset to NULL only inside the browse
-- branch, so facet/display/search rows emitted afterwards still carry the
-- value left by the most recent browse row.  Left as-is here so this upgrade
-- installs the same logic as before; confirm that consumers ignore authority
-- on non-browse rows.
CREATE OR REPLACE FUNCTION biblio.extract_metabib_field_entry (
    rid BIGINT,
    default_joiner TEXT,
    field_types TEXT[],
    only_fields INT[]
) RETURNS SETOF metabib.field_entry_template AS $func$
DECLARE
    bib     biblio.record_entry%ROWTYPE;
    idx     config.metabib_field%ROWTYPE;
    xfrm        config.xml_transform%ROWTYPE;
    prev_xfrm   TEXT;
    transformed_xml TEXT;
    xml_node    TEXT;
    xml_node_list   TEXT[];
    facet_text  TEXT;
    display_text TEXT;
    browse_text TEXT;
    sort_value  TEXT;
    raw_text    TEXT;
    curr_text   TEXT;
    joiner      TEXT := default_joiner; -- XXX will index defs supply a joiner?
    authority_text TEXT;
    authority_link BIGINT;
    output_row  metabib.field_entry_template%ROWTYPE;
    process_idx BOOL;
BEGIN

    -- Start out with no field-use bools set
    output_row.browse_nocase = FALSE;
    output_row.browse_field = FALSE;
    output_row.facet_field = FALSE;
    output_row.display_field = FALSE;
    output_row.search_field = FALSE;

    -- Get the record
    SELECT INTO bib * FROM biblio.record_entry WHERE id = rid;

    -- Loop over the indexing entries.  Ordering by format keeps definitions
    -- that share a transform adjacent, which lets the prev_xfrm check below
    -- reuse the already-transformed XML.
    FOR idx IN SELECT * FROM config.metabib_field WHERE id = ANY (only_fields) ORDER BY format LOOP
        CONTINUE WHEN idx.xpath IS NULL OR idx.xpath = ''; -- pure virtual field

        -- Process this definition only if one of the uses it enables was
        -- requested through field_types.
        process_idx := FALSE;
        IF idx.display_field AND 'display' = ANY (field_types) THEN process_idx = TRUE; END IF;
        IF idx.browse_field AND 'browse' = ANY (field_types) THEN process_idx = TRUE; END IF;
        IF idx.search_field AND 'search' = ANY (field_types) THEN process_idx = TRUE; END IF;
        IF idx.facet_field AND 'facet' = ANY (field_types) THEN process_idx = TRUE; END IF;
        CONTINUE WHEN process_idx = FALSE; -- disabled for all types

        joiner := COALESCE(idx.joiner, default_joiner);

        SELECT INTO xfrm * from config.xml_transform WHERE name = idx.format;

        -- See if we can skip the XSLT ... it's expensive
        IF prev_xfrm IS NULL OR prev_xfrm <> xfrm.name THEN
            -- Can't skip the transform
            IF xfrm.xslt <> '---' THEN
                transformed_xml := oils_xslt_process(bib.marc,xfrm.xslt);
            ELSE
                -- An xslt of '---' means "no stylesheet": use the MARC as stored
                transformed_xml := bib.marc;
            END IF;

            prev_xfrm := xfrm.name;
        END IF;

        xml_node_list := oils_xpath( idx.xpath, transformed_xml, ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]] );

        -- raw_text accumulates the text of every matched node for the
        -- per-definition search row emitted after the node loop.
        raw_text := NULL;
        FOR xml_node IN SELECT x FROM unnest(xml_node_list) AS x LOOP
            -- Only handle results that begin (after optional whitespace) with '<'
            CONTINUE WHEN xml_node !~ E'^\\s*<';

            -- XXX much of this should be moved into oils_xpath_string...
            curr_text := ARRAY_TO_STRING(array_remove(array_remove(
                oils_xpath( '//text()', -- get the content of all the nodes within the main selected node
                    REGEXP_REPLACE( xml_node, E'\\s+', ' ', 'g' ) -- Translate adjacent whitespace to a single space
                ), ' '), ''),  -- throw away morally empty (bankrupt?) strings
                joiner
            );

            CONTINUE WHEN curr_text IS NULL OR curr_text = '';

            -- Put the joiner between nodes, but not before the first one
            IF raw_text IS NOT NULL THEN
                raw_text := raw_text || joiner;
            END IF;

            raw_text := COALESCE(raw_text,'') || curr_text;

            -- autosuggest/metabib.browse_entry
            IF idx.browse_field THEN
                output_row.browse_nocase = idx.browse_nocase;

                -- A browse-specific xpath overrides the node's full text
                IF idx.browse_xpath IS NOT NULL AND idx.browse_xpath <> '' THEN
                    browse_text := oils_xpath_string( idx.browse_xpath, xml_node, joiner, ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]] );
                ELSE
                    browse_text := curr_text;
                END IF;

                -- Sort on the dedicated sort xpath if there is one, otherwise
                -- on the browse text itself
                IF idx.browse_sort_xpath IS NOT NULL AND
                    idx.browse_sort_xpath <> '' THEN

                    sort_value := oils_xpath_string(
                        idx.browse_sort_xpath, xml_node, joiner,
                        ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]]
                    );
                ELSE
                    sort_value := browse_text;
                END IF;

                output_row.field_class = idx.field_class;
                output_row.field = idx.id;
                output_row.source = rid;
                output_row.value = BTRIM(REGEXP_REPLACE(browse_text, E'\\s+', ' ', 'g'));
                output_row.sort_value :=
                    public.naco_normalize(sort_value);

                output_row.authority := NULL;

                IF idx.authority_xpath IS NOT NULL AND idx.authority_xpath <> '' THEN
                    authority_text := oils_xpath_string(
                        idx.authority_xpath, xml_node, joiner,
                        ARRAY[
                            ARRAY[xfrm.prefix, xfrm.namespace_uri],
                            ARRAY['xlink','http://www.w3.org/1999/xlink']
                        ]
                    );

                    -- Link only when the extracted text is all digits and an
                    -- authority record with that id actually exists
                    IF authority_text ~ '^\d+$' THEN
                        authority_link := authority_text::BIGINT;
                        PERFORM * FROM authority.record_entry WHERE id = authority_link;
                        IF FOUND THEN
                            output_row.authority := authority_link;
                        END IF;
                    END IF;

                END IF;

                output_row.browse_field = TRUE;
                -- Returning browse rows with search_field = true for search+browse
                -- configs allows us to retain granularity of being able to search
                -- browse fields with "starts with" type operators (for example, for
                -- titles of songs in music albums)
                IF idx.search_field THEN
                    output_row.search_field = TRUE;
                END IF;
                RETURN NEXT output_row;
                -- Clear the browse-only state so it does not leak into later rows
                output_row.browse_nocase = FALSE;
                output_row.browse_field = FALSE;
                output_row.search_field = FALSE;
                output_row.sort_value := NULL;
            END IF;

            -- insert raw node text for faceting
            IF idx.facet_field THEN

                IF idx.facet_xpath IS NOT NULL AND idx.facet_xpath <> '' THEN
                    facet_text := oils_xpath_string( idx.facet_xpath, xml_node, joiner, ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]] );
                ELSE
                    facet_text := curr_text;
                END IF;

                output_row.field_class = idx.field_class;
                output_row.field = -1 * idx.id; -- facet rows carry the negated definition id
                output_row.source = rid;
                output_row.value = BTRIM(REGEXP_REPLACE(facet_text, E'\\s+', ' ', 'g'));

                output_row.facet_field = TRUE;
                RETURN NEXT output_row;
                output_row.facet_field = FALSE;
            END IF;

            -- insert raw node text for display
            IF idx.display_field THEN

                IF idx.display_xpath IS NOT NULL AND idx.display_xpath <> '' THEN
                    display_text := oils_xpath_string( idx.display_xpath, xml_node, joiner, ARRAY[ARRAY[xfrm.prefix, xfrm.namespace_uri]] );
                ELSE
                    display_text := curr_text;
                END IF;

                output_row.field_class = idx.field_class;
                output_row.field = -1 * idx.id; -- display rows carry the negated definition id
                output_row.source = rid;
                output_row.value = BTRIM(REGEXP_REPLACE(display_text, E'\\s+', ' ', 'g'));

                output_row.display_field = TRUE;
                RETURN NEXT output_row;
                output_row.display_field = FALSE;
            END IF;

        END LOOP;

        -- No usable text was found for this definition: no search row
        CONTINUE WHEN raw_text IS NULL OR raw_text = '';

        -- insert combined node text for searching
        IF idx.search_field THEN
            output_row.field_class = idx.field_class;
            output_row.field = idx.id;
            output_row.source = rid;
            output_row.value = BTRIM(REGEXP_REPLACE(raw_text, E'\\s+', ' ', 'g'));

            output_row.search_field = TRUE;
            RETURN NEXT output_row;
            output_row.search_field = FALSE;
        END IF;

    END LOOP;

END;
$func$ LANGUAGE PLPGSQL;

-- Close the transaction opened by BEGIN at the top of this script.
COMMIT;