Project

General

Profile

-- Call the project helper util.search_path_append with 'util'.
-- NOTE(review): presumably this appends the util schema to search_path so that
-- unqualified helpers used later in this script (e.g. create_if_not_exists)
-- resolve -- confirm against the helper's definition.
SELECT util.search_path_append('util');

-- Create the index on acronym through the create_if_not_exists helper, which is
-- handed the CREATE INDEX statement as text.
-- The acronym-based DELETEs later in this script credit this index for their
-- short rerun time.
-- NOTE(review): :table_str is assumed to be a psql variable that expands to the
-- target table name as a SQL string literal (it is concatenated with ||) --
-- confirm against the calling script.
SELECT create_if_not_exists(
    $$CREATE INDEX "Specimen.acronym" ON $$||:table_str||$$ (acronym)$$
);

-- remove frameshifted rows
-- rerun time: 6 s ("Time: 5537.211 ms") thanks to index
-- Each DELETE below removes rows in which a column holds a value that does not
-- fit the pattern expected for that column.

-- Rows with no acronym at all.
DELETE FROM :table WHERE acronym IS NULL;

-- Rows whose coll_year is not exactly four digits beginning with 17, 18, 19
-- or 20. A NULL coll_year makes the !~ test yield NULL, so such rows are kept.
DELETE FROM :table WHERE coll_year !~ E'^(?:1[7-9]|20)\\d{2}$';

-- Rows whose country contains a digit.
DELETE FROM :table WHERE country ~ E'\\d';

-- Rows whose long_deg contains a letter, except the literal 'RESTRINGIDO'
-- (Spanish for "restricted"; presumably marks withheld coordinates -- confirm).
DELETE FROM :table WHERE long_deg ~ E'[[:alpha:]]' AND long_deg NOT IN ('RESTRINGIDO');

-- Remove institutions that we have direct data for
-- Comments are from e-mail from Brad Boyle on 2013-1-16
--
-- Deliberately kept (NOT deleted):
--   'ARIZ' -- Some REMIB ARIZ specimens not yet in ARIZ itself
--   'NY'   -- Some REMIB NY specimens not yet in NY itself
--
/* list obtained using the following on r9459:
SELECT DISTINCT dataprovider
FROM sourcelist
JOIN provider_count ON provider_count.dataprovider = sourcelist.name
WHERE source_id = source_by_shortname('REMIB')
ORDER BY dataprovider
*/
DELETE FROM :table
WHERE acronym IN (
    'MO' -- "all MO records in REMIB are also available from MO's own website"
    , 'TEX'
);
(7-7/9)