2 * Copyright (C) 2007-2010 Equinox Software, Inc.
3 * Mike Rylander <miker@esilibrary.com>
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version 2
8 * of the License, or (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
18 DROP SCHEMA IF EXISTS search CASCADE;
24 CREATE OR REPLACE FUNCTION evergreen.pg_statistics (tab TEXT, col TEXT) RETURNS TABLE(element TEXT, frequency INT) AS $$
26 -- This query will die on PG < 9.2, but the function can be created. We just won't use it where we can't.
30 FROM (SELECT ROW_NUMBER() OVER (),
32 FROM (SELECT UNNEST(most_common_elem_freqs) AS f
38 JOIN (SELECT ROW_NUMBER() OVER (),
40 FROM (SELECT UNNEST(most_common_elems::text::text[]) AS e
45 ) AS elems USING (row_number);
49 CREATE OR REPLACE FUNCTION evergreen.query_int_wrapper (INT[],TEXT) RETURNS BOOL AS $$
51 RETURN $1 @@ $2::query_int;
53 $$ LANGUAGE PLPGSQL STABLE;
55 CREATE TABLE search.relevance_adjustment (
56 id SERIAL PRIMARY KEY,
57 active BOOL NOT NULL DEFAULT TRUE,
58 field INT NOT NULL REFERENCES config.metabib_field (id) DEFERRABLE INITIALLY DEFERRED,
59 bump_type TEXT NOT NULL CHECK (bump_type IN ('word_order','first_word','full_match')),
60 multiplier NUMERIC NOT NULL DEFAULT 1.0
62 CREATE UNIQUE INDEX bump_once_per_field_idx ON search.relevance_adjustment ( field, bump_type );
64 CREATE TYPE search.search_result AS ( id BIGINT, rel NUMERIC, record INT, total INT, checked INT, visible INT, deleted INT, excluded INT );
65 CREATE TYPE search.search_args AS ( id INT, field_class TEXT, field_name TEXT, table_alias TEXT, term TEXT, term_type TEXT );
67 CREATE OR REPLACE FUNCTION search.query_parser_fts (
73 param_locations INT[],
80 param_pref_ou INT DEFAULT NULL
81 ) RETURNS SETOF search.search_result AS $func$
84 current_res search.search_result%ROWTYPE;
85 search_org_list INT[];
95 core_cursor REFCURSOR;
100 deleted_count INT := 0;
101 visible_count INT := 0;
102 excluded_count INT := 0;
107 check_limit := COALESCE( param_check, 1000 );
108 core_limit := COALESCE( param_limit, 25000 );
109 core_offset := COALESCE( param_offset, 0 );
111 SELECT COALESCE( enabled, FALSE ) INTO luri_as_copy FROM config.global_flag WHERE name = 'opac.located_uri.act_as_copy';
113 -- core_skip_chk := COALESCE( param_skip_chk, 1 );
115 IF param_search_ou > 0 THEN
116 IF param_depth IS NOT NULL THEN
117 SELECT ARRAY_AGG(distinct id) INTO search_org_list FROM actor.org_unit_descendants( param_search_ou, param_depth );
119 SELECT ARRAY_AGG(distinct id) INTO search_org_list FROM actor.org_unit_descendants( param_search_ou );
123 SELECT ARRAY_AGG(distinct id) INTO luri_org_list FROM actor.org_unit_full_path( param_search_ou );
125 SELECT ARRAY_AGG(distinct id) INTO luri_org_list FROM actor.org_unit_ancestors( param_search_ou );
128 ELSIF param_search_ou < 0 THEN
129 SELECT ARRAY_AGG(distinct org_unit) INTO search_org_list FROM actor.org_lasso_map WHERE lasso = -param_search_ou;
131 FOR tmp_int IN SELECT * FROM UNNEST(search_org_list) LOOP
134 SELECT ARRAY_AGG(distinct id) INTO tmp_int_list FROM actor.org_unit_full_path( tmp_int );
136 SELECT ARRAY_AGG(distinct id) INTO tmp_int_list FROM actor.org_unit_ancestors( tmp_int );
139 luri_org_list := luri_org_list || tmp_int_list;
142 SELECT ARRAY_AGG(DISTINCT x.id) INTO luri_org_list FROM UNNEST(luri_org_list) x(id);
144 ELSIF param_search_ou = 0 THEN
145 -- reserved for user lassos (ou_buckets/type='lasso') with ID passed in depth ... hack? sure.
148 IF param_pref_ou IS NOT NULL THEN
150 SELECT ARRAY_AGG(distinct id) INTO tmp_int_list FROM actor.org_unit_full_path( param_pref_ou );
152 SELECT ARRAY_AGG(distinct id) INTO tmp_int_list FROM actor.org_unit_ancestors( param_pref_ou );
155 luri_org_list := luri_org_list || tmp_int_list;
158 OPEN core_cursor FOR EXECUTE param_query;
162 FETCH core_cursor INTO core_result;
164 EXIT WHEN total_count >= core_limit;
166 total_count := total_count + 1;
168 CONTINUE WHEN total_count NOT BETWEEN core_offset + 1 AND check_limit + core_offset;
170 check_count := check_count + 1;
172 IF NOT deleted_search THEN
174 PERFORM 1 FROM biblio.record_entry b WHERE NOT b.deleted AND b.id IN ( SELECT * FROM unnest( core_result.records ) );
176 -- RAISE NOTICE ' % were all deleted ... ', core_result.records;
177 deleted_count := deleted_count + 1;
182 FROM biblio.record_entry b
183 JOIN config.bib_source s ON (b.source = s.id)
185 AND b.id IN ( SELECT * FROM unnest( core_result.records ) );
188 -- RAISE NOTICE ' % were all transcendant ... ', core_result.records;
189 visible_count := visible_count + 1;
191 current_res.id = core_result.id;
192 current_res.rel = core_result.rel;
196 SELECT COUNT(DISTINCT s.source) INTO tmp_int FROM metabib.metarecord_source_map s WHERE s.metarecord = core_result.id;
200 current_res.record = core_result.records[1];
202 current_res.record = NULL;
205 RETURN NEXT current_res;
211 FROM asset.call_number cn
212 JOIN asset.uri_call_number_map map ON (map.call_number = cn.id)
213 JOIN asset.uri uri ON (map.uri = uri.id)
215 AND cn.label = '##URI##'
217 AND ( param_locations IS NULL OR array_upper(param_locations, 1) IS NULL )
218 AND cn.record IN ( SELECT * FROM unnest( core_result.records ) )
219 AND cn.owning_lib IN ( SELECT * FROM unnest( luri_org_list ) )
223 -- RAISE NOTICE ' % have at least one URI ... ', core_result.records;
224 visible_count := visible_count + 1;
226 current_res.id = core_result.id;
227 current_res.rel = core_result.rel;
231 SELECT COUNT(DISTINCT s.source) INTO tmp_int FROM metabib.metarecord_source_map s WHERE s.metarecord = core_result.id;
235 current_res.record = core_result.records[1];
237 current_res.record = NULL;
240 RETURN NEXT current_res;
245 IF param_statuses IS NOT NULL AND array_upper(param_statuses, 1) > 0 THEN
248 FROM asset.call_number cn
249 JOIN asset.copy cp ON (cp.call_number = cn.id)
252 AND cp.status IN ( SELECT * FROM unnest( param_statuses ) )
253 AND cn.record IN ( SELECT * FROM unnest( core_result.records ) )
254 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
259 FROM biblio.peer_bib_copy_map pr
260 JOIN asset.copy cp ON (cp.id = pr.target_copy)
262 AND cp.status IN ( SELECT * FROM unnest( param_statuses ) )
263 AND pr.peer_record IN ( SELECT * FROM unnest( core_result.records ) )
264 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
268 -- RAISE NOTICE ' % and multi-home linked records were all status-excluded ... ', core_result.records;
269 excluded_count := excluded_count + 1;
276 IF param_locations IS NOT NULL AND array_upper(param_locations, 1) > 0 THEN
279 FROM asset.call_number cn
280 JOIN asset.copy cp ON (cp.call_number = cn.id)
283 AND cp.location IN ( SELECT * FROM unnest( param_locations ) )
284 AND cn.record IN ( SELECT * FROM unnest( core_result.records ) )
285 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
290 FROM biblio.peer_bib_copy_map pr
291 JOIN asset.copy cp ON (cp.id = pr.target_copy)
293 AND cp.location IN ( SELECT * FROM unnest( param_locations ) )
294 AND pr.peer_record IN ( SELECT * FROM unnest( core_result.records ) )
295 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
299 -- RAISE NOTICE ' % and multi-home linked records were all copy_location-excluded ... ', core_result.records;
300 excluded_count := excluded_count + 1;
307 IF staff IS NULL OR NOT staff THEN
310 FROM asset.opac_visible_copies
311 WHERE circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
312 AND record IN ( SELECT * FROM unnest( core_result.records ) )
317 FROM biblio.peer_bib_copy_map pr
318 JOIN asset.opac_visible_copies cp ON (cp.copy_id = pr.target_copy)
319 WHERE cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
320 AND pr.peer_record IN ( SELECT * FROM unnest( core_result.records ) )
325 -- RAISE NOTICE ' % and multi-home linked records were all visibility-excluded ... ', core_result.records;
326 excluded_count := excluded_count + 1;
334 FROM asset.call_number cn
335 JOIN asset.copy cp ON (cp.call_number = cn.id)
338 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
339 AND cn.record IN ( SELECT * FROM unnest( core_result.records ) )
345 FROM biblio.peer_bib_copy_map pr
346 JOIN asset.copy cp ON (cp.id = pr.target_copy)
348 AND cp.circ_lib IN ( SELECT * FROM unnest( search_org_list ) )
349 AND pr.peer_record IN ( SELECT * FROM unnest( core_result.records ) )
355 FROM asset.call_number cn
356 JOIN asset.copy cp ON (cp.call_number = cn.id)
357 WHERE cn.record IN ( SELECT * FROM unnest( core_result.records ) )
362 -- Recheck Located URI visibility in the case of no "foreign" copies
364 FROM asset.call_number cn
365 JOIN asset.uri_call_number_map map ON (map.call_number = cn.id)
366 JOIN asset.uri uri ON (map.uri = uri.id)
368 AND cn.label = '##URI##'
370 AND cn.record IN ( SELECT * FROM unnest( core_result.records ) )
371 AND cn.owning_lib NOT IN ( SELECT * FROM unnest( luri_org_list ) )
375 -- RAISE NOTICE ' % were excluded for foreign located URIs... ', core_result.records;
376 excluded_count := excluded_count + 1;
380 -- RAISE NOTICE ' % and multi-home linked records were all visibility-excluded ... ', core_result.records;
381 excluded_count := excluded_count + 1;
392 visible_count := visible_count + 1;
394 current_res.id = core_result.id;
395 current_res.rel = core_result.rel;
399 SELECT COUNT(DISTINCT s.source) INTO tmp_int FROM metabib.metarecord_source_map s WHERE s.metarecord = core_result.id;
403 current_res.record = core_result.records[1];
405 current_res.record = NULL;
408 RETURN NEXT current_res;
410 IF visible_count % 1000 = 0 THEN
411 -- RAISE NOTICE ' % visible so far ... ', visible_count;
416 current_res.id = NULL;
417 current_res.rel = NULL;
418 current_res.record = NULL;
419 current_res.total = total_count;
420 current_res.checked = check_count;
421 current_res.deleted = deleted_count;
422 current_res.visible = visible_count;
423 current_res.excluded = excluded_count;
427 RETURN NEXT current_res;
430 $func$ LANGUAGE PLPGSQL;
432 CREATE OR REPLACE FUNCTION search.facets_for_record_set(ignore_facet_classes TEXT[], hits BIGINT[]) RETURNS TABLE (id INT, value TEXT, count BIGINT) AS $$
433 SELECT id, value, count FROM (
434 SELECT mfae.field AS id,
436 COUNT(DISTINCT mmrsm.source),
438 PARTITION BY mfae.field ORDER BY COUNT(distinct mmrsm.source) DESC
440 FROM metabib.facet_entry mfae
441 JOIN metabib.metarecord_source_map mmrsm ON (mfae.source = mmrsm.source)
442 JOIN config.metabib_field cmf ON (cmf.id = mfae.field)
443 WHERE mmrsm.source IN (SELECT * FROM unnest(hits))
445 AND cmf.field_class NOT IN (SELECT * FROM unnest(ignore_facet_classes))
448 WHERE rownum <= (SELECT COALESCE((SELECT value::INT FROM config.global_flag WHERE name = 'search.max_facets_per_field' AND enabled), 1000));
451 CREATE OR REPLACE FUNCTION search.facets_for_metarecord_set(ignore_facet_classes TEXT[], hits BIGINT[]) RETURNS TABLE (id INT, value TEXT, count BIGINT) AS $$
452 SELECT id, value, count FROM (
453 SELECT mfae.field AS id,
455 COUNT(DISTINCT mmrsm.metarecord),
457 PARTITION BY mfae.field ORDER BY COUNT(distinct mmrsm.metarecord) DESC
459 FROM metabib.facet_entry mfae
460 JOIN metabib.metarecord_source_map mmrsm ON (mfae.source = mmrsm.source)
461 JOIN config.metabib_field cmf ON (cmf.id = mfae.field)
462 WHERE mmrsm.metarecord IN (SELECT * FROM unnest(hits))
464 AND cmf.field_class NOT IN (SELECT * FROM unnest(ignore_facet_classes))
467 WHERE rownum <= (SELECT COALESCE((SELECT value::INT FROM config.global_flag WHERE name = 'search.max_facets_per_field' AND enabled), 1000));