1 |
10245
|
aaronmk
|
-- Calls the util.search_path_append helper with 'util'.
-- NOTE(review): presumably this adds the util schema to search_path so that the
-- unqualified create_if_not_exists() call later in this script resolves --
-- confirm against the helper's definition.
SELECT util.search_path_append('util');
|
2 |
7249
|
aaronmk
|
|
3 |
10334
|
aaronmk
|
-- Builds a CREATE INDEX statement for the acronym column of the target table
-- (the table name is spliced in from the psql variable :table_str) and hands it
-- to create_if_not_exists().
-- NOTE(review): presumably the helper skips creation when the index already
-- exists, which would make this script safe to rerun -- confirm against its
-- definition.
SELECT create_if_not_exists($$CREATE INDEX "Specimen.acronym" ON $$||:table_str||$$ (acronym)$$);
|
4 |
10330
|
aaronmk
|
|
5 |
|
|
-- Remove frameshifted rows, i.e. rows whose column values fail the format checks below
|
6 |
|
|
-- Rerun time: 6 s ("Time: 5537.211 ms") thanks to the index on acronym
|
7 |
10333
|
aaronmk
|
-- Drop every row whose acronym is NULL.
DELETE FROM :table
WHERE acronym IS NULL;
|
8 |
10336
|
aaronmk
|
-- Drop rows whose coll_year is not exactly four digits in the range 1700-2099.
-- Rows with a NULL coll_year are left in place: NULL !~ ... is not true.
DELETE FROM :table
WHERE coll_year !~ '^(?:1[7-9]|20)\d{2}$';
|
9 |
|
|
-- Drop rows whose country value contains a digit anywhere.
DELETE FROM :table
WHERE country ~ '\d';
|
10 |
|
|
-- Drop rows whose long_deg contains a letter, except for the literal
-- placeholder value 'RESTRINGIDO', which is kept.
DELETE FROM :table
WHERE long_deg ~ '[[:alpha:]]'
  AND long_deg <> 'RESTRINGIDO';
|
11 |
10337
|
aaronmk
|
-- Drop rows whose long_min holds anything other than digits
-- (an empty value passes the check and is kept).
DELETE FROM :table
WHERE long_min !~ '^\d*$';
|
12 |
10338
|
aaronmk
|
-- Drop rows whose long_sec holds anything other than digits
-- (an empty value passes the check and is kept).
DELETE FROM :table
WHERE long_sec !~ '^\d*$';
|
13 |
|
|
-- Drop rows whose lat_min holds anything other than digits
-- (an empty value passes the check and is kept).
DELETE FROM :table
WHERE lat_min !~ '^\d*$';
|
14 |
|
|
-- Drop rows whose lat_sec holds anything other than digits
-- (an empty value passes the check and is kept).
DELETE FROM :table
WHERE lat_sec !~ '^\d*$';
|
15 |
10330
|
aaronmk
|
|
16 |
7249
|
aaronmk
|
-- Remove records from institutions for which we have direct data
|
17 |
|
|
-- Delete every row whose acronym appears in the list below. As written, the
-- list contains 'MO' and 'TEX'; the 'ARIZ' and 'NY' entries are commented out,
-- so rows carrying those acronyms are kept.
DELETE FROM :table
|
18 |
|
|
WHERE acronym IN (
|
19 |
7250
|
aaronmk
|
-- Comments are from e-mail from Brad Boyle on 2013-1-16
|
20 |
|
|
'MO' -- "all MO records in REMIB are also available from MO's own website"
|
21 |
|
|
--, 'ARIZ' -- Some REMIB ARIZ specimens not yet in ARIZ itself
|
22 |
|
|
--, 'NY' -- Some REMIB NY specimens not yet in NY itself
|
23 |
9502
|
aaronmk
|
, 'TEX' -- NOTE(review): no rationale is recorded here for excluding TEX
|
24 |
7249
|
aaronmk
|
)
|
25 |
9502
|
aaronmk
|
/* list obtained using the following on r9459:
|
26 |
9501
|
aaronmk
|
SELECT DISTINCT dataprovider
|
27 |
7249
|
aaronmk
|
FROM sourcelist
|
28 |
9501
|
aaronmk
|
JOIN provider_count ON provider_count.dataprovider = sourcelist.name
|
29 |
7249
|
aaronmk
|
WHERE source_id = source_by_shortname('REMIB')
|
30 |
9501
|
aaronmk
|
ORDER BY dataprovider
|
31 |
7249
|
aaronmk
|
*/
|
32 |
|
|
;
|