1
|
-- NOTE(review): presumably adds the "util" schema to search_path so that the
-- unqualified create_if_not_exists() calls later in this script resolve;
-- confirm against the definition of util.search_path_append().
SELECT util.search_path_append('util');
|
2
|
|
3
|
-- Indexes on the columns tested by the cleanup DELETEs' WHERE clauses
-- (acronym, coll_year, country, long_deg).
--
-- Each index is requested exactly once: acronym is filtered on by both DELETE
-- statements (IS NULL and the IN list), so a single index serves both.
--
-- :table_str is interpolated by psql outside the $$...$$ quotes and is
-- concatenated into the CREATE INDEX text handed to create_if_not_exists().
-- NOTE(review): create_if_not_exists() is defined elsewhere; it presumably
-- skips creation when the index already exists, keeping reruns cheap -- confirm.
SELECT create_if_not_exists($$CREATE INDEX "Specimen.acronym" ON $$||:table_str||$$ (acronym)$$);
SELECT create_if_not_exists($$CREATE INDEX "Specimen.coll_year" ON $$||:table_str||$$ (coll_year)$$);
SELECT create_if_not_exists($$CREATE INDEX "Specimen.country" ON $$||:table_str||$$ (country)$$);
SELECT create_if_not_exists($$CREATE INDEX "Specimen.long_deg" ON $$||:table_str||$$ (long_deg)$$);
|
9
|
|
10
|
-- Purge frameshifted rows, i.e. rows whose values ended up in the wrong
-- columns. A row is treated as frameshifted when any of these holds:
--   * acronym is missing;
--   * coll_year is not a four-digit year in the range 1700-2099;
--   * country contains a digit;
--   * long_deg contains a letter and is not the literal 'RESTRINGIDO'.
-- A NULL coll_year, country or long_deg makes its test evaluate to NULL, so
-- that test alone never causes a row to be deleted.
-- Rerun time with the indexes in place: 6 s ("Time: 5537.211 ms").
DELETE FROM :table
WHERE acronym IS NULL
   OR coll_year !~ E'^(?:1[7-9]|20)\\d{2}$'
   OR country ~ E'\\d'
   OR (long_deg <> 'RESTRINGIDO' AND long_deg ~ E'[[:alpha:]]');
|
19
|
|
20
|
-- Drop the records of institutions that we already have direct data for.
--
-- The list of candidate institutions was obtained using the following on r9459:
--     SELECT DISTINCT dataprovider
--     FROM sourcelist
--     JOIN provider_count ON provider_count.dataprovider = sourcelist.name
--     WHERE source_id = source_by_shortname('REMIB')
--     ORDER BY dataprovider
--
-- The per-institution remarks are from an e-mail from Brad Boyle on 2013-1-16.
DELETE FROM :table
WHERE acronym IN (
    'MO',  -- "all MO records in REMIB are also available from MO's own website"
    'TEX'
    -- Intentionally NOT in the list (their REMIB rows are kept):
    --   'ARIZ' -- Some REMIB ARIZ specimens not yet in ARIZ itself
    --   'NY'   -- Some REMIB NY specimens not yet in NY itself
);
|