Revision 12055
Added by Aaron Marcuse-Kubitza almost 11 years ago
trunk/validation/aggregating/plots/_archive/bien3_validations_salvias_vegbien.by=Brad@iPlant.sql | ||
---|---|---|
1 |
-- ----------------------------------------------------------------------------- |
|
2 |
-- Quantitative validation queries on the BIEN database |
|
3 |
-- |
|
4 |
-- Applies to SALVIAS, or any datasource with all of the following attributes: |
|
5 |
-- - Plots |
|
6 |
-- - Comprised of multiple datasets organized as "projects" |
|
7 |
-- - Maximum 2-level nesting (subplots within plots) |
|
8 |
-- - One or more plots contain individual observations with stem measurements |
|
9 |
-- - One or more plots contain aggregate observations of counts of individuals within species |
|
10 |
-- - One or more plots contain aggregate observations of cover by species |
|
11 |
-- |
|
12 |
-- Requires list of projects from source db manager, in three groups: (1) individual observation |
|
13 |
-- plot, (2) aggregate individual count plots, (3) aggregate percent cover plots |
|
14 |
-- ------------------------------------------------------------------------- |
|
15 |
|
|
16 |
-- ------------------ |
|
17 |
-- Set variables specific to this source |
|
18 |
-- Currently configured for SALVIAS |
|
19 |
-- ------------------ |
|
20 |
|
|
21 |
-- datasource |
|
22 |
\set ds '\'SALVIAS\'' |
|
23 |
|
|
24 |
-- ------------------ |
|
25 |
-- 1. Count of projects |
|
26 |
-- Check: identical count in source db |
|
27 |
-- ------------------ |
|
28 |
SELECT COUNT(*) AS projects |
|
29 |
FROM project p JOIN source s |
|
30 |
ON p.source_id=s.source_id |
|
31 |
WHERE s.shortname=:ds; |
|
32 |
|
|
33 |
-- ------------------ |
|
34 |
-- 2. List of project names |
|
35 |
-- Check: join to source db returns same number of rows |
|
36 |
-- ------------------ |
|
37 |
SELECT p.projectname |
|
38 |
FROM project p JOIN source s |
|
39 |
ON p.source_id=s.source_id |
|
40 |
WHERE s.shortname=:ds; |
|
41 |
|
|
42 |
-- ------------------ |
|
43 |
-- 3. Count of all plots in this source |
|
44 |
-- Check: identical count in source db |
|
45 |
-- ------------------ |
|
46 |
SELECT COUNT(*) AS plots |
|
47 |
FROM location l JOIN locationevent le |
|
48 |
ON l.location_id=le.location_id |
|
49 |
JOIN project p |
|
50 |
ON p.project_id=le.project_id |
|
51 |
JOIN source s |
|
52 |
ON p.source_id=s.source_id |
|
53 |
WHERE s.shortname=:ds; |
|
54 |
|
|
55 |
-- ------------------ |
|
56 |
-- 4. Count of plots in each project in this source |
|
57 |
-- ------------------ |
|
58 |
SELECT p.projectname, COUNT(DISTINCT l.location_id) AS plots |
|
59 |
FROM location l JOIN locationevent le |
|
60 |
ON l.location_id=le.location_id |
|
61 |
JOIN project p |
|
62 |
ON p.project_id=le.project_id |
|
63 |
JOIN source s |
|
64 |
ON p.source_id=s.source_id |
|
65 |
WHERE s.shortname=:ds |
|
66 |
GROUP BY p.projectname; |
|
67 |
|
|
68 |
-- ------------------ |
|
69 |
-- 5.List of plot codes by project |
|
70 |
-- Check: join to source db by all columns returns same number of rows |
|
71 |
-- ------------------ |
|
72 |
SELECT p.projectname, l.authorlocationcode AS plotCode |
|
73 |
FROM location l JOIN locationevent le |
|
74 |
ON l.location_id=le.location_id |
|
75 |
JOIN project p |
|
76 |
ON p.project_id=le.project_id |
|
77 |
JOIN source s |
|
78 |
ON p.source_id=s.source_id |
|
79 |
WHERE s.shortname=:ds; |
|
80 |
|
|
81 |
-- ------------------ |
|
82 |
-- 6. List of plots with stem measurements |
|
83 |
-- ------------------ |
|
84 |
|
|
85 |
SET search_path TO "SALVIAS_VegBIEN"; |
|
86 |
SELECT |
|
87 |
authorlocationcode |
|
88 |
FROM (SELECT * FROM location WHERE parent_id IS NULL) top_plot |
|
89 |
WHERE source_id = source_by_shortname('SALVIAS') |
|
90 |
AND EXISTS( |
|
91 |
SELECT NULL |
|
92 |
FROM location |
|
93 |
JOIN locationevent USING (location_id) |
|
94 |
JOIN taxonoccurrence USING (locationevent_id) |
|
95 |
JOIN aggregateoccurrence USING (taxonoccurrence_id) |
|
96 |
JOIN plantobservation USING (aggregateoccurrence_id) |
|
97 |
JOIN stemobservation USING (plantobservation_id) |
|
98 |
WHERE location.top_plot = top_plot.location_id |
|
99 |
LIMIT 1 |
|
100 |
) |
|
101 |
ORDER BY authorlocationcode |
|
102 |
; |
|
103 |
|
|
104 |
-- ------------------ |
|
105 |
-- 7.List of plots with counts of individuals per species |
|
106 |
-- ------------------ |
|
107 |
|
|
108 |
|
|
109 |
|
|
110 |
-- ------------------ |
|
111 |
-- 8.List of plots which use percent cover |
|
112 |
-- ------------------ |
|
113 |
|
|
114 |
|
|
115 |
|
|
116 |
|
|
117 |
-- ------------------ |
|
118 |
-- 9.List of plots which use line-intercept |
|
119 |
-- ------------------ |
|
120 |
|
|
121 |
|
|
122 |
-- ------------------ |
|
123 |
-- 10. Count of individuals per plot in each project |
|
124 |
-- |
|
125 |
-- Method: count taxonObservations |
|
126 |
-- Note 1: `individuals` should be NULL for plots which use percent cover |
|
127 |
-- or line-intercept methods. |
|
128 |
-- Note 2: Does this method requires that plots have 2-level nesting of |
|
129 |
-- subplots within plots? |
|
130 |
-- ------------------ |
|
131 |
select p.projectname, l.authorlocationcode as plotcode, sum(ao.count) as individuals |
|
132 |
from project p join source s |
|
133 |
on p.source_id=s.source_id |
|
134 |
join locationevent le on p.project_id=le.project_id |
|
135 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
136 |
join location l on le.location_id=l.location_id |
|
137 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
138 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
139 |
where s.shortname=:ds |
|
140 |
group by p.projectname, l.authorlocationcode |
|
141 |
order by p.projectname, l.authorlocationcode; |
|
142 |
|
|
143 |
-- ------------------ |
|
144 |
-- 11. Count of stems per plot in each project |
|
145 |
-- |
|
146 |
-- Method: count records in stemobservation table |
|
147 |
-- ------------------ |
|
148 |
select p.projectname, l.authorlocationcode as plotcode, count(distinct stemobservation_id) as stems |
|
149 |
from project p join source s |
|
150 |
on p.source_id=s.source_id |
|
151 |
join locationevent le on p.project_id=le.project_id |
|
152 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
153 |
join location l on le.location_id=l.location_id |
|
154 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
155 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
156 |
join plantobservation po on po.aggregateoccurrence_id=ao.aggregateoccurrence_id |
|
157 |
join stemobservation so on so.plantobservation_id=po.plantobservation_id |
|
158 |
where s.shortname=:ds |
|
159 |
group by p.projectname, l.authorlocationcode |
|
160 |
order by p.projectname, l.authorlocationcode; |
|
161 |
|
|
162 |
-- ------------------ |
|
163 |
-- 12. Count of verbatim taxa per plot in each project |
|
164 |
-- Check: join to source db by all columns, returns same number of rows |
|
165 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
166 |
-- NOT YET READY, NEED TO INCLUDE SUBSPECIES, IF ANY |
|
167 |
-- ------------------ |
|
168 |
select p.projectname, l.authorlocationcode as plotcode, |
|
169 |
count(distinct trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,''))) |
|
170 |
as taxa |
|
171 |
from project p join source s |
|
172 |
on p.source_id=s.source_id |
|
173 |
join locationevent le on p.project_id=le.project_id |
|
174 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
175 |
join location l on le.location_id=l.location_id |
|
176 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
177 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
178 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
179 |
where s.shortname=:ds and td.isoriginal='t' |
|
180 |
group by p.projectname, l.authorlocationcode |
|
181 |
order by p.projectname, l.authorlocationcode 12; |
|
182 |
|
|
183 |
-- ------------------ |
|
184 |
-- 13. List of distinct verbatim taxa in each plot in each project |
|
185 |
-- |
|
186 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
187 |
-- ------------------ |
|
188 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
189 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon |
|
190 |
from project p join source s |
|
191 |
on p.source_id=s.source_id |
|
192 |
join locationevent le on p.project_id=le.project_id |
|
193 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
194 |
join location l on le.location_id=l.location_id |
|
195 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
196 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
197 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
198 |
where s.shortname=:ds and td.isoriginal='t' |
|
199 |
order by p.projectname, l.authorlocationcode, taxon; |
|
200 |
|
|
201 |
-- ------------------ |
|
202 |
-- 14. Count of individuals per (verbatim) taxon per plot in each project |
|
203 |
-- |
|
204 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
205 |
-- ------------------ |
|
206 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
207 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
208 |
sum(ao.count) as individuals |
|
209 |
from project p join source s |
|
210 |
on p.source_id=s.source_id |
|
211 |
join locationevent le on p.project_id=le.project_id |
|
212 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
213 |
join location l on le.location_id=l.location_id |
|
214 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
215 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
216 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
217 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
218 |
where s.shortname=:ds and td.isoriginal='t' |
|
219 |
group by p.projectname, l.authorlocationcode, taxon |
|
220 |
order by p.projectname, l.authorlocationcode, taxon; |
|
221 |
|
|
222 |
-- ------------------ |
|
223 |
-- 15. Percent cover of each (verbatim) taxon in each plot in each project |
|
224 |
-- Applies to: aggregate-cover plots only |
|
225 |
-- Method: sums percent cover in aggregateoccurrence (as recorded in coverindex) |
|
226 |
-- Check: join to source db by all columns, returns same number of rows |
|
227 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
228 |
-- ------------------ |
|
229 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
230 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
231 |
sum(ci.coverpercent) as totalpercentcover |
|
232 |
from project p join source s |
|
233 |
on p.source_id=s.source_id |
|
234 |
join locationevent le on p.project_id=le.project_id |
|
235 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
236 |
join location l on le.location_id=l.location_id |
|
237 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
238 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
239 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
240 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
241 |
join coverindex ci on ao.coverindex_id=ci.coverindex_id |
|
242 |
where s.shortname=:ds and td.isoriginal='t' |
|
243 |
and ci.coverpercent is not null |
|
244 |
group by p.projectname, l.authorlocationcode, taxon |
|
245 |
order by p.projectname, l.authorlocationcode, taxon; |
|
246 |
|
|
247 |
-- ------------------ |
|
248 |
-- 16. Intercept values for each (verbatim) taxon in each plot in each project |
|
249 |
-- where line-intercept values are recorded |
|
250 |
-- |
|
251 |
-- Note 1: Assumes identical concatenation of taxonomic fields |
|
252 |
-- to form verbatim taxon name in origina db |
|
253 |
-- Note 2: Grouping mean cover for entire plot combines plots with |
|
254 |
-- subplots (separate cover measure for each species in each subplot) with |
|
255 |
-- plots with strata (separate cover measures for each species in each |
|
256 |
-- stratum) with plots without subplots or strata (one cover measure |
|
257 |
-- per species per plot. |
|
258 |
-- ------------------ |
|
259 |
|
|
260 |
|
|
261 |
|
|
262 |
|
|
263 |
|
|
264 |
|
|
265 |
-- ------------------ |
|
266 |
-- 17. Count of subplots per plot, for each project |
|
267 |
-- ------------------ |
|
268 |
select p.projectname, l.authorlocationcode as plotcode, |
|
269 |
count(distinct sub_locationevent.locationevent_id) as subplots |
|
270 |
from project p join source s |
|
271 |
on p.source_id=s.source_id |
|
272 |
join locationevent le on p.project_id=le.project_id |
|
273 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
274 |
join location l on le.location_id=l.location_id |
|
275 |
where s.shortname=:ds |
|
276 |
group by p.projectname, l.authorlocationcode |
|
277 |
order by p.projectname, l.authorlocationcode; |
|
278 |
|
|
279 |
-- ------------------ |
|
280 |
-- 18. List of subplots codes for each plot for each project |
|
281 |
-- DOESN'T YET WORK PROPERLY |
|
282 |
-- ------------------ |
|
283 |
select p.projectname, |
|
284 |
l.authorlocationcode as plotcode, |
|
285 |
sub_locationevent.authoreventcode as subplotCode |
|
286 |
from project p join source s |
|
287 |
on p.source_id=s.source_id |
|
288 |
join locationevent le on p.project_id=le.project_id |
|
289 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
290 |
join location l on sub_locationevent.location_id=l.location_id |
|
291 |
where s.shortname=:ds |
|
292 |
order by p.projectname, l.authorlocationcode; |
trunk/validation/aggregating/plots/_archive/bien3_validations_salvias_and_similar.by=Brad@iPlant.sql | ||
---|---|---|
1 |
-- ----------------------------------------------------------------------------- |
|
2 |
-- Quantitative validation queries on the BIEN database |
|
3 |
-- |
|
4 |
-- Applies to SALVIAS, or any datasource with all of the following attributes: |
|
5 |
-- - Plots |
|
6 |
-- - Comprised of multiple datasets organized as "projects" |
|
7 |
-- - Maximum 2-level nesting (subplots within plots) |
|
8 |
-- - One or more plots contain individual observations with stem measurements |
|
9 |
-- - One or more plots contain aggregate observations of counts of individuals within species |
|
10 |
-- - One or more plots contain aggregate observations of cover by species |
|
11 |
-- |
|
12 |
-- Requires list of projects from source db manager, in three groups: (1) individual observation |
|
13 |
-- plot, (2) aggregate individual count plots, (3) aggregate percent cover plots |
|
14 |
-- ------------------------------------------------------------------------- |
|
15 |
|
|
16 |
-- ------------------ |
|
17 |
-- Set variables specific to this source |
|
18 |
-- Currently configured for SALVIAS |
|
19 |
-- ------------------ |
|
20 |
|
|
21 |
-- datasource |
|
22 |
\set ds '\'SALVIAS\'' |
|
23 |
|
|
24 |
-- list of projects with individual observations |
|
25 |
\set pio '\'Boyle Transects\',\'Enquist Lab Transect Dataset\',\'ACA Amazon Forest Inventories\',\'Bonifacino Forest Transects\',\'Cam Webb Borneo Plots\',\'DeWalt Bolivia forest plots\',\'La Selva Secondary Forest Plots\',\'Noel Kempff Forest Plots\',\'OTS Transects\',\'Pilon Lajas Treeplots Bolivia\',\'RAINFOR - 0.1 ha Madre de Dios, Peru\',\'RAINFOR - 1 ha Peru\'' |
|
26 |
|
|
27 |
-- list of projects with aggregate individual counts |
|
28 |
\set pai '\'Gentry Transect Dataset\'' |
|
29 |
|
|
30 |
-- list of projects with aggregate cover counts |
|
31 |
\set pac '\'Noel Kempff Savanna Plots\'' |
|
32 |
|
|
33 |
-- ------------------ |
|
34 |
-- 1. Count of projects |
|
35 |
-- Check: identical count in source db |
|
36 |
-- ------------------ |
|
37 |
SELECT COUNT(*) AS projects |
|
38 |
FROM project p JOIN source s |
|
39 |
ON p.source_id=s.source_id |
|
40 |
WHERE s.shortname=:ds; |
|
41 |
|
|
42 |
-- ------------------ |
|
43 |
-- 2. List of project names |
|
44 |
-- Check: join to source db returns same number of rows |
|
45 |
-- ------------------ |
|
46 |
SELECT p.projectname |
|
47 |
FROM project p JOIN source s |
|
48 |
ON p.source_id=s.source_id |
|
49 |
WHERE s.shortname=:ds; |
|
50 |
|
|
51 |
-- ------------------ |
|
52 |
-- 3. Count of all plots in this source |
|
53 |
-- Check: identical count in source db |
|
54 |
-- ------------------ |
|
55 |
SELECT COUNT(*) AS plots |
|
56 |
FROM source s JOIN location l |
|
57 |
ON s.source_id=l.source_id |
|
58 |
WHERE s.shortname=:ds; |
|
59 |
|
|
60 |
-- ------------------ |
|
61 |
-- 4. Count of plots in each project in this source |
|
62 |
-- Check: join to source db by all columns returns same number of rows |
|
63 |
-- ------------------ |
|
64 |
SELECT p.projectname, COUNT(DISTINCT l.location_id) AS plots |
|
65 |
FROM location l JOIN locationevent le |
|
66 |
ON l.location_id=le.location_id |
|
67 |
JOIN project p |
|
68 |
ON p.project_id=le.project_id |
|
69 |
JOIN source s |
|
70 |
ON p.source_id=s.source_id |
|
71 |
WHERE s.shortname=:ds |
|
72 |
AND p.projectname IN (:pio) |
|
73 |
GROUP BY p.projectname; |
|
74 |
|
|
75 |
-- ------------------ |
|
76 |
-- 5.List of plot codes by project |
|
77 |
-- Check: join to source db by all columns returns same number of rows |
|
78 |
-- ------------------ |
|
79 |
SELECT p.projectname, l.authorlocationcode AS plotCode |
|
80 |
FROM location l JOIN locationevent le |
|
81 |
ON l.location_id=le.location_id |
|
82 |
JOIN project p |
|
83 |
ON p.project_id=le.project_id |
|
84 |
JOIN source s |
|
85 |
ON p.source_id=s.source_id |
|
86 |
WHERE s.shortname=:ds |
|
87 |
AND p.projectname IN (:pio); |
|
88 |
|
|
89 |
-- ------------------ |
|
90 |
-- 6. Count of individuals per plot in each project |
|
91 |
-- Applies to: individual observation plots only |
|
92 |
-- Method: count taxonObservations |
|
93 |
-- Check: join to source db by all columns, returns same number of rows |
|
94 |
-- Note: I believe this method requires that plots have 2-level nesting of |
|
95 |
-- subplots within plots? |
|
96 |
-- ------------------ |
|
97 |
select p.projectname, l.authorlocationcode as plotcode, count(*) as individuals |
|
98 |
from project p join source s |
|
99 |
on p.source_id=s.source_id |
|
100 |
join locationevent le on p.project_id=le.project_id |
|
101 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
102 |
join location l on le.location_id=l.location_id |
|
103 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
104 |
where s.shortname=:ds and p.projectname IN (:pio) |
|
105 |
group by p.projectname, l.authorlocationcode |
|
106 |
order by p.projectname, l.authorlocationcode; |
|
107 |
|
|
108 |
-- ------------------ |
|
109 |
-- 7. Count of individuals per plot in each project |
|
110 |
-- Applies to: aggregate-individual plots only |
|
111 |
-- Method: sum column `count` in table aggregateoccurrence |
|
112 |
-- Check: join to source db by all columns, returns same number of rows |
|
113 |
-- Note: I believe this method requires that plots have 2-level nesting of |
|
114 |
-- subplots within plots? |
|
115 |
-- ------------------ |
|
116 |
select p.projectname, l.authorlocationcode as plotcode, sum(ao.count) as individuals |
|
117 |
from project p join source s |
|
118 |
on p.source_id=s.source_id |
|
119 |
join locationevent le on p.project_id=le.project_id |
|
120 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
121 |
join location l on le.location_id=l.location_id |
|
122 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
123 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
124 |
where s.shortname=:ds and p.projectname IN (:pai) |
|
125 |
group by p.projectname, l.authorlocationcode |
|
126 |
order by p.projectname, l.authorlocationcode; |
|
127 |
|
|
128 |
-- ------------------ |
|
129 |
-- 8. Count of stems per plot in each project |
|
130 |
-- Applies to: individual observation and aggregate individual count plots with |
|
131 |
-- stem counts |
|
132 |
-- Method: count records in stemobservation table |
|
133 |
-- Check: join to source db by all columns, returns same number of rows |
|
134 |
-- Note: I believe this method requires that plots have 2-level nesting of |
|
135 |
-- subplots within plots? |
|
136 |
-- ------------------ |
|
137 |
select p.projectname, l.authorlocationcode as plotcode, count(distinct stemobservation_id) as stems |
|
138 |
from project p join source s |
|
139 |
on p.source_id=s.source_id |
|
140 |
join locationevent le on p.project_id=le.project_id |
|
141 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
142 |
join location l on le.location_id=l.location_id |
|
143 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
144 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
145 |
join plantobservation po on po.aggregateoccurrence_id=ao.aggregateoccurrence_id |
|
146 |
join stemobservation so on so.plantobservation_id=po.plantobservation_id |
|
147 |
where s.shortname=:ds and (p.projectname IN (:pio) or p.projectname IN (:pai)) |
|
148 |
group by p.projectname, l.authorlocationcode |
|
149 |
order by p.projectname, l.authorlocationcode; |
|
150 |
|
|
151 |
-- ------------------ |
|
152 |
-- 9. Count of verbatim taxa per plot in each project |
|
153 |
-- Check: join to source db by all columns, returns same number of rows |
|
154 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
155 |
-- ------------------ |
|
156 |
select p.projectname, l.authorlocationcode as plotcode, |
|
157 |
count(distinct trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,''))) |
|
158 |
as taxa |
|
159 |
from project p join source s |
|
160 |
on p.source_id=s.source_id |
|
161 |
join locationevent le on p.project_id=le.project_id |
|
162 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
163 |
join location l on le.location_id=l.location_id |
|
164 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
165 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
166 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
167 |
where s.shortname=:ds and td.isoriginal='t' |
|
168 |
group by p.projectname, l.authorlocationcode |
|
169 |
order by p.projectname, l.authorlocationcode; |
|
170 |
|
|
171 |
-- ------------------ |
|
172 |
-- 10. List of verbatim taxa in each plot in each project |
|
173 |
-- Check: join to source db by all columns, returns same number of rows. |
|
174 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
175 |
-- ------------------ |
|
176 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
177 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon |
|
178 |
from project p join source s |
|
179 |
on p.source_id=s.source_id |
|
180 |
join locationevent le on p.project_id=le.project_id |
|
181 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
182 |
join location l on le.location_id=l.location_id |
|
183 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
184 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
185 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
186 |
where s.shortname=:ds and td.isoriginal='t' |
|
187 |
order by p.projectname, l.authorlocationcode, taxon; |
|
188 |
|
|
189 |
-- ------------------ |
|
190 |
-- 11. Count of individuals per (verbatim) taxon for each plot in each project |
|
191 |
-- Applies to: individual observation plots only |
|
192 |
-- Method: counts taxonoccurrence records |
|
193 |
-- Check: join to source db by all columns, returns same number of rows |
|
194 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
195 |
-- ------------------ |
|
196 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
197 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
198 |
count(distinct o.taxonoccurrence_id) as individuals |
|
199 |
from project p join source s |
|
200 |
on p.source_id=s.source_id |
|
201 |
join locationevent le on p.project_id=le.project_id |
|
202 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
203 |
join location l on le.location_id=l.location_id |
|
204 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
205 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
206 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
207 |
where s.shortname=:ds and td.isoriginal='t' |
|
208 |
and p.projectname IN (:pio) |
|
209 |
group by p.projectname, l.authorlocationcode, taxon |
|
210 |
order by p.projectname, l.authorlocationcode, taxon; |
|
211 |
|
|
212 |
-- ------------------ |
|
213 |
-- 12. Count of individuals per (verbatim) taxon for each plot in each project |
|
214 |
-- Applies to: aggregate-individual count plots only |
|
215 |
-- Method: sums column `count` in aggregateoccurrence |
|
216 |
-- Check: join to source db by all columns, returns same number of rows |
|
217 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
218 |
-- DOESN'T WORK YET |
|
219 |
-- ------------------ |
|
220 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
221 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
222 |
sum(ao.count) as individuals |
|
223 |
from project p join source s |
|
224 |
on p.source_id=s.source_id |
|
225 |
join locationevent le on p.project_id=le.project_id |
|
226 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
227 |
join location l on le.location_id=l.location_id |
|
228 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
229 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
230 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
231 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
232 |
where s.shortname=:ds and td.isoriginal='t' |
|
233 |
and p.projectname IN (:pai) |
|
234 |
group by p.projectname, l.authorlocationcode, taxon |
|
235 |
order by p.projectname, l.authorlocationcode, taxon; |
|
236 |
|
|
237 |
-- ------------------ |
|
238 |
-- 13. Percent cover of each (verbatim) taxon in each plot in each project |
|
239 |
-- Applies to: aggregate-cover plots only |
|
240 |
-- Method: sums percent cover in aggregateoccurrence (as recorded in coverindex) |
|
241 |
-- Check: join to source db by all columns, returns same number of rows |
|
242 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
243 |
-- DOESN'T WORK YET, ALSO MAY NEED LEFT JOINS |
|
244 |
-- ------------------ |
|
245 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
246 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
247 |
sum(ci.coverpercent) as totalpercentcover |
|
248 |
from project p join source s |
|
249 |
on p.source_id=s.source_id |
|
250 |
join locationevent le on p.project_id=le.project_id |
|
251 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
252 |
join location l on le.location_id=l.location_id |
|
253 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
254 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
255 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
256 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
257 |
join coverindex ci on ao.coverindex_id=ci.coverindex_id |
|
258 |
where s.shortname=:ds and td.isoriginal='t' |
|
259 |
and p.projectname IN (:pac) |
|
260 |
group by p.projectname, l.authorlocationcode, taxon |
|
261 |
order by p.projectname, l.authorlocationcode, taxon; |
|
262 |
|
|
263 |
-- ------------------ |
|
264 |
-- 14. Count of subplots per plot, for each project |
|
265 |
-- Check: identical count in source db |
|
266 |
-- ------------------ |
|
267 |
select p.projectname, l.authorlocationcode as plotcode, |
|
268 |
count(distinct sub_locationevent.locationevent_id) as subplots |
|
269 |
from project p join source s |
|
270 |
on p.source_id=s.source_id |
|
271 |
join locationevent le on p.project_id=le.project_id |
|
272 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
273 |
join location l on le.location_id=l.location_id |
|
274 |
where s.shortname=:ds |
|
275 |
group by p.projectname, l.authorlocationcode |
|
276 |
order by p.projectname, l.authorlocationcode; |
|
277 |
|
|
278 |
-- ------------------ |
|
279 |
-- 15. List of subplots codes for each plot for each project |
|
280 |
-- Check: join to source db by all columns, returns same number of rows |
|
281 |
-- DOESN'T WORK YET, NOT SURE HOW TO DISPLAY SUBPLOT CODES |
|
282 |
-- ------------------ |
|
283 |
select p.projectname, l.authorlocationcode as plotcode, |
|
284 |
sub_locationevent.authoreventcode as subplotCode |
|
285 |
from project p join source s |
|
286 |
on p.source_id=s.source_id |
|
287 |
join locationevent le on p.project_id=le.project_id |
|
288 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
289 |
join location l on le.location_id=l.location_id |
|
290 |
where s.shortname=:ds and (p.projectname IN (:pio) or p.projectname IN (:pai)) |
|
291 |
order by p.projectname, l.authorlocationcode; |
trunk/validation/aggregating/plots/SALVIAS/_archive/bien3_validations_salvias_db_original.by=Brad@iPlant.sql | ||
---|---|---|
1 |
-- ----------------------------------------------------------------------------- |
|
2 |
-- Quantitative validation queries against the original SALVIAS database |
|
3 |
-- ------------------------------------------------------------------------- |
|
4 |
|
|
5 |
-- ------------------ |
|
6 |
-- Set variables specific to this source |
|
7 |
-- Currently configured for SALVIAS |
|
8 |
-- ------------------ |
|
9 |
|
|
10 |
USE salvias_plots; |
|
11 |
|
|
12 |
-- SALVIAS projects in BIEN |
|
13 |
-- Must filter out all others as not all SALVIAS plots exported to BIEN |
|
14 |
SET @p = "'Gentry Transect Dataset','Boyle Transects','Enquist Lab Transect Dataset','ACA Amazon Forest Inventories','Bonifacino Forest Transects','Cam Webb Borneo Plots','DeWalt Bolivia forest plots','La Selva Secondary Forest Plots','Noel Kempff Forest Plots','Noel Kempff Savanna Plots','OTS Transects','Pilon Lajas Treeplots Bolivia','RAINFOR - 0.1 ha Madre de Dios, Peru','RAINFOR - 1 ha Peru'"; |
|
15 |
|
|
16 |
-- ------------------ |
|
17 |
-- 1. Count of projects |
|
18 |
-- ------------------ |
|
19 |
SET @sql= CONCAT(' |
|
20 |
SELECT COUNT(*) AS projects |
|
21 |
FROM projects |
|
22 |
WHERE project_name IN (',@p,') |
|
23 |
'); |
|
24 |
PREPARE stmt FROM @sql; |
|
25 |
EXECUTE stmt; |
|
26 |
|
|
27 |
-- ------------------ |
|
28 |
-- 2. List of project names |
|
29 |
-- ------------------ |
|
30 |
SET @sql= CONCAT(' |
|
31 |
SELECT project_name AS projectname |
|
32 |
FROM projects |
|
33 |
WHERE project_name IN (',@p,') |
|
34 |
'); |
|
35 |
PREPARE stmt FROM @sql; |
|
36 |
EXECUTE stmt; |
|
37 |
|
|
38 |
-- ------------------ |
|
39 |
-- 3. Count of all plots in this source |
|
40 |
-- ------------------ |
|
41 |
SET @sql= CONCAT(' |
|
42 |
SELECT COUNT(DISTINCT SiteCode) AS plots |
|
43 |
FROM projects p JOIN PlotMetadata pm |
|
44 |
ON p.project_id=pm.project_id |
|
45 |
WHERE p.project_name IN (',@p,') |
|
46 |
'); |
|
47 |
PREPARE stmt FROM @sql; |
|
48 |
EXECUTE stmt; |
|
49 |
|
|
50 |
-- ------------------ |
|
51 |
-- 4. Count of plots in each project in this source |
|
52 |
-- ------------------ |
|
53 |
SET @sql= CONCAT(' |
|
54 |
SELECT p.project_name, COUNT(*) AS plots |
|
55 |
FROM projects p JOIN PlotMetadata pm |
|
56 |
ON p.project_id=pm.project_id |
|
57 |
WHERE p.project_name IN (',@p,') |
|
58 |
GROUP BY p.project_name |
|
59 |
'); |
|
60 |
PREPARE stmt FROM @sql; |
|
61 |
EXECUTE stmt; |
|
62 |
|
|
63 |
-- ------------------ |
|
64 |
-- 5.List of plot codes by project |
|
65 |
-- ------------------ |
|
66 |
SET @sql= CONCAT(' |
|
67 |
SELECT p.project_name, pm.SiteCode |
|
68 |
FROM projects p JOIN PlotMetadata pm |
|
69 |
ON p.project_id=pm.project_id |
|
70 |
WHERE p.project_name IN (',@p,') |
|
71 |
'); |
|
72 |
PREPARE stmt FROM @sql; |
|
73 |
EXECUTE stmt; |
|
74 |
|
|
75 |
-- ------------------ |
|
76 |
-- 6. List of plots with stem measurements |
|
77 |
-- ------------------ |
|
78 |
SET @sql= CONCAT(' |
|
79 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
80 |
FROM projects p JOIN PlotMetadata pm |
|
81 |
JOIN PlotObservations po JOIN stems s |
|
82 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
83 |
AND po.PlotObsID=s.plotobs_id |
|
84 |
WHERE p.project_name IN (',@p,') |
|
85 |
GROUP BY p.project_name, SiteCode |
|
86 |
ORDER BY p.project_name, SiteCode |
|
87 |
'); |
|
88 |
PREPARE stmt FROM @sql; |
|
89 |
EXECUTE stmt; |
|
90 |
|
|
91 |
-- ------------------ |
|
92 |
-- 7.List of plots with counts of individuals per species |
|
93 |
-- ------------------ |
|
94 |
SET @sql= CONCAT(' |
|
95 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
96 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
97 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
98 |
WHERE p.project_name IN (',@p,') |
|
99 |
AND po.NoInd>1 |
|
100 |
GROUP BY p.project_name, SiteCode |
|
101 |
ORDER BY p.project_name, SiteCode |
|
102 |
'); |
|
103 |
PREPARE stmt FROM @sql; |
|
104 |
EXECUTE stmt; |
|
105 |
|
|
106 |
-- ------------------ |
|
107 |
-- 8.List of plots which use percent cover |
|
108 |
-- ------------------ |
|
109 |
SET @sql= CONCAT(' |
|
110 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
111 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
112 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
113 |
WHERE p.project_name IN (',@p,') |
|
114 |
AND cover_percent IS NOT NULL |
|
115 |
GROUP BY p.project_name, SiteCode |
|
116 |
ORDER BY p.project_name, SiteCode |
|
117 |
'); |
|
118 |
PREPARE stmt FROM @sql; |
|
119 |
EXECUTE stmt; |
|
120 |
|
|
121 |
-- ------------------ |
|
122 |
-- 9.List of plots which use line-intercept |
|
123 |
-- ------------------ |
|
124 |
SET @sql= CONCAT(' |
|
125 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
126 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
127 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
128 |
WHERE p.project_name IN (',@p,') |
|
129 |
AND intercept_cm IS NOT NULL |
|
130 |
GROUP BY p.project_name, SiteCode |
|
131 |
ORDER BY p.project_name, SiteCode |
|
132 |
'); |
|
133 |
PREPARE stmt FROM @sql; |
|
134 |
EXECUTE stmt; |
|
135 |
|
|
136 |
-- ------------------ |
|
137 |
-- 10. Count of individuals per plot in each project |
|
138 |
-- |
|
139 |
-- Method: Sum on NoInd (number of individuals) column. |
|
140 |
-- Note 1: `individuals` should be NULL for plots which use percent cover |
|
141 |
-- or line-intercept methods. |
|
142 |
-- Note 2: Do not count records in PlotObservations table, as this will give |
|
143 |
-- incorrect total for plots such as Gentry plot, which count individuals |
|
144 |
-- per species per subplot |
|
145 |
-- ------------------ |
|
146 |
SET @sql= CONCAT(' |
|
147 |
SELECT p.project_name, SiteCode AS plotcode, |
|
148 |
SUM(NoInd) AS individuals |
|
149 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
150 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
151 |
WHERE p.project_name IN (',@p,') |
|
152 |
GROUP BY p.project_name, SiteCode |
|
153 |
ORDER BY p.project_name, SiteCode |
|
154 |
'); |
|
155 |
PREPARE stmt FROM @sql; |
|
156 |
EXECUTE stmt; |
|
157 |
|
|
158 |
-- ------------------ |
|
159 |
-- 11. Count of stems per plot in each project |
|
160 |
-- |
|
161 |
-- Method: count records in stems table |
|
162 |
-- ------------------ |
|
163 |
SET @sql= CONCAT(' |
|
164 |
SELECT p.project_name, SiteCode AS plotcode, |
|
165 |
COUNT(DISTINCT stem_id) AS stems |
|
166 |
FROM projects p JOIN PlotMetadata pm |
|
167 |
JOIN PlotObservations po JOIN stems s |
|
168 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
169 |
AND po.PlotObsID=s.plotobs_id |
|
170 |
WHERE p.project_name IN (',@p,') |
|
171 |
GROUP BY p.project_name, SiteCode |
|
172 |
ORDER BY p.project_name, SiteCode |
|
173 |
'); |
|
174 |
PREPARE stmt FROM @sql; |
|
175 |
EXECUTE stmt; |
|
176 |
|
|
177 |
-- ------------------ |
|
178 |
-- 12. Count of verbatim taxa per plot in each project |
|
179 |
-- |
|
180 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
181 |
-- to form verbatim taxon name in vegBIEN |
|
182 |
-- ------------------ |
|
183 |
SET @sql= CONCAT(" |
|
184 |
SELECT project_name, plotcode, COUNT(taxon) AS taxa |
|
185 |
FROM |
|
186 |
( |
|
187 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
188 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
189 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
190 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
191 |
))) AS taxon |
|
192 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
193 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
194 |
WHERE p.project_name IN (",@p,") |
|
195 |
) AS a |
|
196 |
GROUP BY project_name, plotcode |
|
197 |
ORDER BY project_name, plotcode |
|
198 |
"); |
|
199 |
PREPARE stmt FROM @sql; |
|
200 |
EXECUTE stmt; |
|
201 |
|
|
202 |
-- ------------------ |
|
203 |
-- 13. List of distinct verbatim taxa in each plot in each project |
|
204 |
-- |
|
205 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
206 |
-- to form verbatim taxon name in vegBIEN. |
|
207 |
-- ------------------ |
|
208 |
SET @sql= CONCAT(" |
|
209 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
210 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
211 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
212 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
213 |
))) AS taxon |
|
214 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
215 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
216 |
WHERE p.project_name IN (",@p,") |
|
217 |
ORDER BY p.project_name, SiteCode, taxon |
|
218 |
"); |
|
219 |
PREPARE stmt FROM @sql; |
|
220 |
EXECUTE stmt; |
|
221 |
|
|
222 |
-- ------------------ |
|
223 |
-- 14. Count of individuals per (verbatim) taxon per plot in each project |
|
224 |
-- |
|
225 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
226 |
-- to form verbatim taxon name in vegBIEN |
|
227 |
-- ------------------ |
|
228 |
SET @sql= CONCAT(" |
|
229 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
230 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
231 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
232 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
233 |
))) AS taxon, |
|
234 |
SUM(NoInd) AS individuals |
|
235 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
236 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
237 |
WHERE p.project_name IN (",@p,") |
|
238 |
GROUP BY p.project_name, SiteCode, taxon |
|
239 |
ORDER BY p.project_name, SiteCode, taxon |
|
240 |
"); |
|
241 |
PREPARE stmt FROM @sql; |
|
242 |
EXECUTE stmt; |
|
243 |
|
|
244 |
-- ------------------ |
|
245 |
-- 15. Percent cover of each (verbatim) taxon in each plot in each project |
|
246 |
-- where percent cover is recorded |
|
247 |
-- |
|
248 |
-- Note 1: Assumes identical concatenation of taxonomic fields |
|
249 |
-- to form verbatim taxon name in vegbien |
|
250 |
-- Note 2: Grouping mean cover for entire plot allows inclusion of plots with |
|
251 |
-- subplots (separate cover measure for each species in each subplot), |
|
252 |
-- plots with strata (separate cover measures for each species in each |
|
253 |
-- stratum), and plots without subplots or strata (one cover measure |
|
254 |
-- per species per plot) in same query. |
|
255 |
-- Note 3: currently, there are no SALVIAS percent cover plots in BIEN |
|
256 |
-- ------------------ |
|
257 |
SET @sql= CONCAT(" |
|
258 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
259 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
260 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
261 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
262 |
))) AS taxon, |
|
263 |
AVG(cover_percent) AS mean_cover |
|
264 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
265 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
266 |
WHERE p.project_name IN (",@p,") |
|
267 |
AND cover_percent IS NOT NULL |
|
268 |
GROUP BY p.project_name, SiteCode, taxon |
|
269 |
ORDER BY p.project_name, SiteCode, taxon |
|
270 |
"); |
|
271 |
PREPARE stmt FROM @sql; |
|
272 |
EXECUTE stmt; |
|
273 |
|
|
274 |
-- ------------------ |
|
275 |
-- 16. Intercept values for each (verbatim) taxon in each plot in each project |
|
276 |
-- where line-intercept values are recorded |
|
277 |
-- |
|
278 |
-- Note 1: Assumes identical concatenation of taxonomic fields |
|
279 |
-- to form verbatim taxon name in vegbien |
|
280 |
-- Note 2: Grouping mean cover for entire plot combines plots with |
|
281 |
-- subplots (separate cover measure for each species in each subplot) with |
|
282 |
-- plots with strata (separate cover measures for each species in each |
|
283 |
-- stratum) with plots without subplots or strata (one cover measure |
|
284 |
-- per species per plot. |
|
285 |
-- ------------------ |
|
286 |
SET @sql= CONCAT(" |
|
287 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
288 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
289 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
290 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
291 |
))) AS taxon, |
|
292 |
intercept_cm |
|
293 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
294 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
295 |
WHERE p.project_name IN (",@p,") |
|
296 |
AND intercept_cm IS NOT NULL |
|
297 |
ORDER BY p.project_name, SiteCode, taxon |
|
298 |
"); |
|
299 |
PREPARE stmt FROM @sql; |
|
300 |
EXECUTE stmt; |
|
301 |
|
|
302 |
-- ------------------ |
|
303 |
-- 17. Count of subplots per plot, for each project |
|
304 |
-- ------------------ |
|
305 |
SET @sql= CONCAT(" |
|
306 |
SELECT project_name, pm.SiteCode AS plotcode, COUNT(DISTINCT Line) as subplots |
|
307 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
308 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
309 |
WHERE p.project_name IN (",@p,") |
|
310 |
GROUP BY project_name, pm.SiteCode |
|
311 |
ORDER BY project_name, pm.SiteCode |
|
312 |
"); |
|
313 |
PREPARE stmt FROM @sql; |
|
314 |
EXECUTE stmt; |
|
315 |
|
|
316 |
-- ------------------ |
|
317 |
-- 18. List of subplots codes for each plot for each project |
|
318 |
-- |
|
319 |
-- Note: includes plots with and without subplots |
|
320 |
-- ------------------ |
|
321 |
SET @sql= CONCAT(" |
|
322 |
SELECT DISTINCT project_name, pm.SiteCode AS plotcode, Line as subplot |
|
323 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
324 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
325 |
WHERE p.project_name IN (",@p,") |
|
326 |
AND pm.SiteCode IS NOT NULL |
|
327 |
ORDER BY project_name, pm.SiteCode, subplot |
|
328 |
"); |
|
329 |
PREPARE stmt FROM @sql; |
|
330 |
EXECUTE stmt; |
trunk/validation/aggregating/plots/SALVIAS/bien3_validations_salvias_db_original.by=Brad@iPlant,Aaron@UCSB.sql | ||
---|---|---|
1 |
-- ----------------------------------------------------------------------------- |
|
2 |
-- Quantitative validation queries against the original SALVIAS database |
|
3 |
-- ------------------------------------------------------------------------- |
|
4 |
|
|
5 |
-- ------------------ |
|
6 |
-- Set variables specific to this source |
|
7 |
-- Currently configured for SALVIAS |
|
8 |
-- ------------------ |
|
9 |
|
|
10 |
USE salvias_plots; |
|
11 |
|
|
12 |
-- SALVIAS projects in BIEN |
|
13 |
-- Must filter out all others as not all SALVIAS plots exported to BIEN |
|
14 |
SET @p = "'Gentry Transect Dataset','Boyle Transects','Enquist Lab Transect Dataset','ACA Amazon Forest Inventories','Bonifacino Forest Transects','Cam Webb Borneo Plots','DeWalt Bolivia forest plots','La Selva Secondary Forest Plots','Noel Kempff Forest Plots','Noel Kempff Savanna Plots','OTS Transects','Pilon Lajas Treeplots Bolivia','RAINFOR - 0.1 ha Madre de Dios, Peru','RAINFOR - 1 ha Peru'"; |
|
15 |
|
|
16 |
-- ------------------ |
|
17 |
-- 1. Count of projects |
|
18 |
-- ------------------ |
|
19 |
SET @sql= CONCAT(' |
|
20 |
SELECT COUNT(*) AS projects |
|
21 |
FROM projects |
|
22 |
WHERE project_name IN (',@p,') |
|
23 |
LIMIT 10 |
|
24 |
'); |
|
25 |
PREPARE stmt FROM @sql; |
|
26 |
EXECUTE stmt; |
|
27 |
|
|
28 |
-- ------------------ |
|
29 |
-- 2. List of project names |
|
30 |
-- ------------------ |
|
31 |
SET @sql= CONCAT(' |
|
32 |
SELECT project_name AS projectname |
|
33 |
FROM projects |
|
34 |
WHERE project_name IN (',@p,') |
|
35 |
LIMIT 10 |
|
36 |
'); |
|
37 |
PREPARE stmt FROM @sql; |
|
38 |
EXECUTE stmt; |
|
39 |
|
|
40 |
-- ------------------ |
|
41 |
-- 3. Count of all plots in this source |
|
42 |
-- ------------------ |
|
43 |
SET @sql= CONCAT(' |
|
44 |
SELECT COUNT(DISTINCT SiteCode) AS plots |
|
45 |
FROM projects p JOIN PlotMetadata pm |
|
46 |
ON p.project_id=pm.project_id |
|
47 |
WHERE p.project_name IN (',@p,') |
|
48 |
LIMIT 10 |
|
49 |
'); |
|
50 |
PREPARE stmt FROM @sql; |
|
51 |
EXECUTE stmt; |
|
52 |
|
|
53 |
-- ------------------ |
|
54 |
-- 4. Count of plots in each project in this source |
|
55 |
-- ------------------ |
|
56 |
SET @sql= CONCAT(' |
|
57 |
SELECT p.project_name, COUNT(*) AS plots |
|
58 |
FROM projects p JOIN PlotMetadata pm |
|
59 |
ON p.project_id=pm.project_id |
|
60 |
WHERE p.project_name IN (',@p,') |
|
61 |
GROUP BY p.project_name |
|
62 |
LIMIT 10 |
|
63 |
'); |
|
64 |
PREPARE stmt FROM @sql; |
|
65 |
EXECUTE stmt; |
|
66 |
|
|
67 |
-- ------------------ |
|
68 |
-- 5.List of plot codes by project |
|
69 |
-- ------------------ |
|
70 |
SET @sql= CONCAT(' |
|
71 |
SELECT p.project_name, pm.SiteCode |
|
72 |
FROM projects p JOIN PlotMetadata pm |
|
73 |
ON p.project_id=pm.project_id |
|
74 |
WHERE p.project_name IN (',@p,') |
|
75 |
LIMIT 10 |
|
76 |
'); |
|
77 |
PREPARE stmt FROM @sql; |
|
78 |
EXECUTE stmt; |
|
79 |
|
|
80 |
-- ------------------ |
|
81 |
-- 6. List of plots with stem measurements |
|
82 |
-- ------------------ |
|
83 |
SET @sql= CONCAT(' |
|
84 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
85 |
FROM projects p JOIN PlotMetadata pm |
|
86 |
JOIN PlotObservations po JOIN stems s |
|
87 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
88 |
AND po.PlotObsID=s.plotobs_id |
|
89 |
WHERE p.project_name IN (',@p,') |
|
90 |
GROUP BY p.project_name, SiteCode |
|
91 |
ORDER BY p.project_name, SiteCode |
|
92 |
LIMIT 10 |
|
93 |
'); |
|
94 |
PREPARE stmt FROM @sql; |
|
95 |
EXECUTE stmt; |
|
96 |
|
|
97 |
-- ------------------ |
|
98 |
-- 7.List of plots with counts of individuals per species |
|
99 |
-- ------------------ |
|
100 |
SET @sql= CONCAT(' |
|
101 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
102 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
103 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
104 |
WHERE p.project_name IN (',@p,') |
|
105 |
AND po.NoInd>1 |
|
106 |
GROUP BY p.project_name, SiteCode |
|
107 |
ORDER BY p.project_name, SiteCode |
|
108 |
LIMIT 10 |
|
109 |
'); |
|
110 |
PREPARE stmt FROM @sql; |
|
111 |
EXECUTE stmt; |
|
112 |
|
|
113 |
-- ------------------ |
|
114 |
-- 8.List of plots which use percent cover |
|
115 |
-- ------------------ |
|
116 |
SET @sql= CONCAT(' |
|
117 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
118 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
119 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
120 |
WHERE p.project_name IN (',@p,') |
|
121 |
AND cover_percent IS NOT NULL |
|
122 |
GROUP BY p.project_name, SiteCode |
|
123 |
ORDER BY p.project_name, SiteCode |
|
124 |
LIMIT 10 |
|
125 |
'); |
|
126 |
PREPARE stmt FROM @sql; |
|
127 |
EXECUTE stmt; |
|
128 |
|
|
129 |
-- ------------------ |
|
130 |
-- 9.List of plots which use line-intercept |
|
131 |
-- ------------------ |
|
132 |
SET @sql= CONCAT(' |
|
133 |
SELECT DISTINCT p.project_name, pm.SiteCode |
|
134 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
135 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
136 |
WHERE p.project_name IN (',@p,') |
|
137 |
AND intercept_cm IS NOT NULL |
|
138 |
GROUP BY p.project_name, SiteCode |
|
139 |
ORDER BY p.project_name, SiteCode |
|
140 |
LIMIT 10 |
|
141 |
'); |
|
142 |
PREPARE stmt FROM @sql; |
|
143 |
EXECUTE stmt; |
|
144 |
|
|
145 |
-- ------------------ |
|
146 |
-- 10. Count of individuals per plot in each project |
|
147 |
-- |
|
148 |
-- Method: Sum on NoInd (number of individuals) column. |
|
149 |
-- Note 1: `individuals` should be NULL for plots which use percent cover |
|
150 |
-- or line-intercept methods. |
|
151 |
-- Note 2: Do not count records in PlotObservations table, as this will give |
|
152 |
-- incorrect total for plots such as Gentry plot, which count individuals |
|
153 |
-- per species per subplot |
|
154 |
-- ------------------ |
|
155 |
SET @sql= CONCAT(' |
|
156 |
SELECT p.project_name, SiteCode AS plotcode, |
|
157 |
SUM(NoInd) AS individuals |
|
158 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
159 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
160 |
WHERE p.project_name IN (',@p,') |
|
161 |
GROUP BY p.project_name, SiteCode |
|
162 |
ORDER BY p.project_name, SiteCode |
|
163 |
LIMIT 10 |
|
164 |
'); |
|
165 |
PREPARE stmt FROM @sql; |
|
166 |
EXECUTE stmt; |
|
167 |
|
|
168 |
-- ------------------ |
|
169 |
-- 11. Count of stems per plot in each project |
|
170 |
-- |
|
171 |
-- Method: count records in stems table |
|
172 |
-- ------------------ |
|
173 |
SET @sql= CONCAT(' |
|
174 |
SELECT p.project_name, SiteCode AS plotcode, |
|
175 |
COUNT(DISTINCT stem_id) AS stems |
|
176 |
FROM projects p JOIN PlotMetadata pm |
|
177 |
JOIN PlotObservations po JOIN stems s |
|
178 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
179 |
AND po.PlotObsID=s.plotobs_id |
|
180 |
WHERE p.project_name IN (',@p,') |
|
181 |
GROUP BY p.project_name, SiteCode |
|
182 |
ORDER BY p.project_name, SiteCode |
|
183 |
LIMIT 10 |
|
184 |
'); |
|
185 |
PREPARE stmt FROM @sql; |
|
186 |
EXECUTE stmt; |
|
187 |
|
|
188 |
-- ------------------ |
|
189 |
-- 12. Count of verbatim taxa per plot in each project |
|
190 |
-- |
|
191 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
192 |
-- to form verbatim taxon name in vegBIEN |
|
193 |
-- ------------------ |
|
194 |
SET @sql= CONCAT(" |
|
195 |
SELECT project_name, plotcode, COUNT(taxon) AS taxa |
|
196 |
FROM |
|
197 |
( |
|
198 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
199 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
200 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
201 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
202 |
))) AS taxon |
|
203 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
204 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
205 |
WHERE p.project_name IN (",@p,") |
|
206 |
) AS a |
|
207 |
GROUP BY project_name, plotcode |
|
208 |
ORDER BY project_name, plotcode |
|
209 |
LIMIT 10 |
|
210 |
"); |
|
211 |
PREPARE stmt FROM @sql; |
|
212 |
EXECUTE stmt; |
|
213 |
|
|
214 |
-- ------------------ |
|
215 |
-- 13. List of distinct verbatim taxa in each plot in each project |
|
216 |
-- |
|
217 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
218 |
-- to form verbatim taxon name in vegBIEN. |
|
219 |
-- ------------------ |
|
220 |
SET @sql= CONCAT(" |
|
221 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
222 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
223 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
224 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
225 |
))) AS taxon |
|
226 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
227 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
228 |
WHERE p.project_name IN (",@p,") |
|
229 |
ORDER BY p.project_name, SiteCode, taxon |
|
230 |
LIMIT 10 |
|
231 |
"); |
|
232 |
PREPARE stmt FROM @sql; |
|
233 |
EXECUTE stmt; |
|
234 |
|
|
235 |
-- ------------------ |
|
236 |
-- 14. Count of individuals per (verbatim) taxon per plot in each project |
|
237 |
-- |
|
238 |
-- Note: Assumes identical concatenation of taxonomic fields |
|
239 |
-- to form verbatim taxon name in vegBIEN |
|
240 |
-- ------------------ |
|
241 |
SET @sql= CONCAT(" |
|
242 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
243 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
244 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
245 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
246 |
))) AS taxon, |
|
247 |
SUM(NoInd) AS individuals |
|
248 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
249 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
250 |
WHERE p.project_name IN (",@p,") |
|
251 |
GROUP BY p.project_name, SiteCode, taxon |
|
252 |
ORDER BY p.project_name, SiteCode, taxon |
|
253 |
LIMIT 10 |
|
254 |
"); |
|
255 |
PREPARE stmt FROM @sql; |
|
256 |
EXECUTE stmt; |
|
257 |
|
|
258 |
-- ------------------ |
|
259 |
-- 15. Percent cover of each (verbatim) taxon in each plot in each project |
|
260 |
-- where percent cover is recorded |
|
261 |
-- |
|
262 |
-- Note 1: Assumes identical concatenation of taxonomic fields |
|
263 |
-- to form verbatim taxon name in vegbien |
|
264 |
-- Note 2: Grouping mean cover for entire plot allows inclusion of plots with |
|
265 |
-- subplots (separate cover measure for each species in each subplot), |
|
266 |
-- plots with strata (separate cover measures for each species in each |
|
267 |
-- stratum), and plots without subplots or strata (one cover measure |
|
268 |
-- per species per plot) in same query. |
|
269 |
-- Note 3: currently, there are no SALVIAS percent cover plots in BIEN |
|
270 |
-- ------------------ |
|
271 |
SET @sql= CONCAT(" |
|
272 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
273 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
274 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
275 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
276 |
))) AS taxon, |
|
277 |
AVG(cover_percent) AS mean_cover |
|
278 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
279 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
280 |
WHERE p.project_name IN (",@p,") |
|
281 |
AND cover_percent IS NOT NULL |
|
282 |
GROUP BY p.project_name, SiteCode, taxon |
|
283 |
ORDER BY p.project_name, SiteCode, taxon |
|
284 |
LIMIT 10 |
|
285 |
"); |
|
286 |
PREPARE stmt FROM @sql; |
|
287 |
EXECUTE stmt; |
|
288 |
|
|
289 |
-- ------------------ |
|
290 |
-- 16. Intercept values for each (verbatim) taxon in each plot in each project |
|
291 |
-- where line-intercept values are recorded |
|
292 |
-- |
|
293 |
-- Note 1: Assumes identical concatenation of taxonomic fields |
|
294 |
-- to form verbatim taxon name in vegbien |
|
295 |
-- Note 2: Grouping mean cover for entire plot combines plots with |
|
296 |
-- subplots (separate cover measure for each species in each subplot) with |
|
297 |
-- plots with strata (separate cover measures for each species in each |
|
298 |
-- stratum) with plots without subplots or strata (one cover measure |
|
299 |
-- per species per plot. |
|
300 |
-- ------------------ |
|
301 |
SET @sql= CONCAT(" |
|
302 |
SELECT DISTINCT p.project_name, SiteCode AS plotcode, |
|
303 |
TRIM(CONCAT_WS(' ',IFNULL(Family,''),IFNULL(Genus,''),IFNULL(Species,''), |
|
304 |
IF(infra_ep_1 IS NULL,IFNULL(auth,''), |
|
305 |
TRIM(CONCAT_WS(' ',IFNULL(infra_rank_1,''),IFNULL(infra_ep_1,''),IFNULL(infra_auth_1,''))) |
|
306 |
))) AS taxon, |
|
307 |
intercept_cm |
|
308 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
309 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
310 |
WHERE p.project_name IN (",@p,") |
|
311 |
AND intercept_cm IS NOT NULL |
|
312 |
ORDER BY p.project_name, SiteCode, taxon |
|
313 |
LIMIT 10 |
|
314 |
"); |
|
315 |
PREPARE stmt FROM @sql; |
|
316 |
EXECUTE stmt; |
|
317 |
|
|
318 |
-- ------------------ |
|
319 |
-- 17. Count of subplots per plot, for each project |
|
320 |
-- ------------------ |
|
321 |
SET @sql= CONCAT(" |
|
322 |
SELECT project_name, pm.SiteCode AS plotcode, COUNT(DISTINCT Line) as subplots |
|
323 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
324 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
325 |
WHERE p.project_name IN (",@p,") |
|
326 |
GROUP BY project_name, pm.SiteCode |
|
327 |
ORDER BY project_name, pm.SiteCode |
|
328 |
LIMIT 10 |
|
329 |
"); |
|
330 |
PREPARE stmt FROM @sql; |
|
331 |
EXECUTE stmt; |
|
332 |
|
|
333 |
-- ------------------ |
|
334 |
-- 18. List of subplots codes for each plot for each project |
|
335 |
-- |
|
336 |
-- Note: includes plots with and without subplots |
|
337 |
-- ------------------ |
|
338 |
SET @sql= CONCAT(" |
|
339 |
SELECT DISTINCT project_name, pm.SiteCode AS plotcode, Line as subplot |
|
340 |
FROM projects p JOIN PlotMetadata pm JOIN PlotObservations po |
|
341 |
ON p.project_id=pm.project_id AND pm.PlotID=po.PlotID |
|
342 |
WHERE p.project_name IN (",@p,") |
|
343 |
AND pm.SiteCode IS NOT NULL |
|
344 |
ORDER BY project_name, pm.SiteCode, subplot |
|
345 |
LIMIT 10 |
|
346 |
"); |
|
347 |
PREPARE stmt FROM @sql; |
|
348 |
EXECUTE stmt; |
trunk/validation/aggregating/plots/bien3_validations_salvias_vegbien.by=Brad@iPlant,Aaron@UCSB.sql | ||
---|---|---|
1 |
-- ----------------------------------------------------------------------------- |
|
2 |
-- Quantitative validation queries on the BIEN database |
|
3 |
-- |
|
4 |
-- Applies to SALVIAS, or any datasource with all of the following attributes: |
|
5 |
-- - Plots |
|
6 |
-- - Comprised of multiple datasets organized as "projects" |
|
7 |
-- - Maximum 2-level nesting (subplots within plots) |
|
8 |
-- - One or more plots contain individual observations with stem measurements |
|
9 |
-- - One or more plots contain aggregate observations of counts of individuals within species |
|
10 |
-- - One or more plots contain aggregate observations of cover by species |
|
11 |
-- |
|
12 |
-- Requires list of projects from source db manager, in three groups: (1) individual observation |
|
13 |
-- plot, (2) aggregate individual count plots, (3) aggregate percent cover plots |
|
14 |
-- ------------------------------------------------------------------------- |
|
15 |
|
|
16 |
-- ------------------ |
|
17 |
-- Set variables specific to this source |
|
18 |
-- Currently configured for SALVIAS |
|
19 |
-- ------------------ |
|
20 |
|
|
21 |
-- datasource |
|
22 |
\set ds '\'SALVIAS\'' |
|
23 |
|
|
24 |
-- ------------------ |
|
25 |
-- 1. Count of projects |
|
26 |
-- Check: identical count in source db |
|
27 |
-- ------------------ |
|
28 |
SELECT COUNT(*) AS projects |
|
29 |
FROM project p JOIN source s |
|
30 |
ON p.source_id=s.source_id |
|
31 |
WHERE s.shortname=:ds; |
|
32 |
|
|
33 |
-- ------------------ |
|
34 |
-- 2. List of project names |
|
35 |
-- Check: join to source db returns same number of rows |
|
36 |
-- ------------------ |
|
37 |
SELECT p.projectname |
|
38 |
FROM project p JOIN source s |
|
39 |
ON p.source_id=s.source_id |
|
40 |
WHERE s.shortname=:ds; |
|
41 |
|
|
42 |
-- ------------------ |
|
43 |
-- 3. Count of all plots in this source |
|
44 |
-- Check: identical count in source db |
|
45 |
-- ------------------ |
|
46 |
SELECT COUNT(*) AS plots |
|
47 |
FROM location l JOIN locationevent le |
|
48 |
ON l.location_id=le.location_id |
|
49 |
JOIN project p |
|
50 |
ON p.project_id=le.project_id |
|
51 |
JOIN source s |
|
52 |
ON p.source_id=s.source_id |
|
53 |
WHERE s.shortname=:ds; |
|
54 |
|
|
55 |
-- ------------------ |
|
56 |
-- 4. Count of plots in each project in this source |
|
57 |
-- ------------------ |
|
58 |
SELECT p.projectname, COUNT(DISTINCT l.location_id) AS plots |
|
59 |
FROM location l JOIN locationevent le |
|
60 |
ON l.location_id=le.location_id |
|
61 |
JOIN project p |
|
62 |
ON p.project_id=le.project_id |
|
63 |
JOIN source s |
|
64 |
ON p.source_id=s.source_id |
|
65 |
WHERE s.shortname=:ds |
|
66 |
GROUP BY p.projectname; |
|
67 |
|
|
68 |
-- ------------------ |
|
69 |
-- 5.List of plot codes by project |
|
70 |
-- Check: join to source db by all columns returns same number of rows |
|
71 |
-- ------------------ |
|
72 |
SELECT p.projectname, l.authorlocationcode AS plotCode |
|
73 |
FROM location l JOIN locationevent le |
|
74 |
ON l.location_id=le.location_id |
|
75 |
JOIN project p |
|
76 |
ON p.project_id=le.project_id |
|
77 |
JOIN source s |
|
78 |
ON p.source_id=s.source_id |
|
79 |
WHERE s.shortname=:ds; |
|
80 |
|
|
81 |
-- ------------------ |
|
82 |
-- 6. List of plots with stem measurements |
|
83 |
-- ------------------ |
|
84 |
|
|
85 |
SELECT authorlocationcode |
|
86 |
FROM top_plot |
|
87 |
WHERE source_id = source_by_shortname(:ds) |
|
88 |
AND EXISTS( |
|
89 |
SELECT NULL |
|
90 |
FROM location |
|
91 |
JOIN locationevent USING (location_id) |
|
92 |
JOIN taxonoccurrence USING (locationevent_id) |
|
93 |
JOIN aggregateoccurrence USING (taxonoccurrence_id) |
|
94 |
JOIN plantobservation USING (aggregateoccurrence_id) |
|
95 |
JOIN stemobservation USING (plantobservation_id) |
|
96 |
WHERE location.top_plot = top_plot.location_id |
|
97 |
LIMIT 1 |
|
98 |
) |
|
99 |
ORDER BY authorlocationcode |
|
100 |
; |
|
101 |
|
|
102 |
-- ------------------ |
|
103 |
-- 7.List of plots with counts of individuals per species |
|
104 |
-- ------------------ |
|
105 |
|
|
106 |
|
|
107 |
|
|
108 |
-- ------------------ |
|
109 |
-- 8.List of plots which use percent cover |
|
110 |
-- ------------------ |
|
111 |
|
|
112 |
|
|
113 |
|
|
114 |
|
|
115 |
-- ------------------ |
|
116 |
-- 9.List of plots which use line-intercept |
|
117 |
-- ------------------ |
|
118 |
|
|
119 |
|
|
120 |
-- ------------------ |
|
121 |
-- 10. Count of individuals per plot in each project |
|
122 |
-- |
|
123 |
-- Method: count taxonObservations |
|
124 |
-- Note 1: `individuals` should be NULL for plots which use percent cover |
|
125 |
-- or line-intercept methods. |
|
126 |
-- Note 2: Does this method requires that plots have 2-level nesting of |
|
127 |
-- subplots within plots? |
|
128 |
-- ------------------ |
|
129 |
select p.projectname, l.authorlocationcode as plotcode, sum(ao.count) as individuals |
|
130 |
from project p join source s |
|
131 |
on p.source_id=s.source_id |
|
132 |
join locationevent le on p.project_id=le.project_id |
|
133 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
134 |
join location l on le.location_id=l.location_id |
|
135 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
136 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
137 |
where s.shortname=:ds |
|
138 |
group by p.projectname, l.authorlocationcode |
|
139 |
order by p.projectname, l.authorlocationcode; |
|
140 |
|
|
141 |
-- ------------------ |
|
142 |
-- 11. Count of stems per plot in each project |
|
143 |
-- |
|
144 |
-- Method: count records in stemobservation table |
|
145 |
-- ------------------ |
|
146 |
select p.projectname, l.authorlocationcode as plotcode, count(distinct stemobservation_id) as stems |
|
147 |
from project p join source s |
|
148 |
on p.source_id=s.source_id |
|
149 |
join locationevent le on p.project_id=le.project_id |
|
150 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
151 |
join location l on le.location_id=l.location_id |
|
152 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
153 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
|
154 |
join plantobservation po on po.aggregateoccurrence_id=ao.aggregateoccurrence_id |
|
155 |
join stemobservation so on so.plantobservation_id=po.plantobservation_id |
|
156 |
where s.shortname=:ds |
|
157 |
group by p.projectname, l.authorlocationcode |
|
158 |
order by p.projectname, l.authorlocationcode; |
|
159 |
|
|
160 |
-- ------------------ |
|
161 |
-- 12. Count of verbatim taxa per plot in each project |
|
162 |
-- Check: join to source db by all columns, returns same number of rows |
|
163 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
164 |
-- NOT YET READY, NEED TO INCLUDE SUBSPECIES, IF ANY |
|
165 |
-- ------------------ |
|
166 |
select p.projectname, l.authorlocationcode as plotcode, |
|
167 |
count(distinct trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,''))) |
|
168 |
as taxa |
|
169 |
from project p join source s |
|
170 |
on p.source_id=s.source_id |
|
171 |
join locationevent le on p.project_id=le.project_id |
|
172 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
173 |
join location l on le.location_id=l.location_id |
|
174 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
175 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
176 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
177 |
where s.shortname=:ds and td.isoriginal='t' |
|
178 |
group by p.projectname, l.authorlocationcode |
|
179 |
order by p.projectname, l.authorlocationcode 12; |
|
180 |
|
|
181 |
-- ------------------ |
|
182 |
-- 13. List of distinct verbatim taxa in each plot in each project |
|
183 |
-- |
|
184 |
-- Note: Must perform equivalent concatenation of taxonomic field in source db. |
|
185 |
-- ------------------ |
|
186 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
187 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon |
|
188 |
from project p join source s |
|
189 |
on p.source_id=s.source_id |
|
190 |
join locationevent le on p.project_id=le.project_id |
|
191 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
192 |
join location l on le.location_id=l.location_id |
|
193 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
194 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
195 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
196 |
where s.shortname=:ds and td.isoriginal='t' |
|
197 |
order by p.projectname, l.authorlocationcode, taxon; |
|
198 |
|
|
199 |
-- ------------------ |
|
200 |
-- 14. Count of individuals per (verbatim) taxon per plot in each project |
|
201 |
-- |
|
202 |
-- Note: Must do equivalent concatenation of taxonomic field in source db. |
|
203 |
-- ------------------ |
|
204 |
select distinct p.projectname, l.authorlocationcode as plotcode, |
|
205 |
trim('' || coalesce(family::text,'') || ' ' || coalesce(genus::text,'') || ' ' || coalesce(specific_epithet::text,'') || ' ' || coalesce(morphospecies::text,'')) as taxon, |
|
206 |
sum(ao.count) as individuals |
|
207 |
from project p join source s |
|
208 |
on p.source_id=s.source_id |
|
209 |
join locationevent le on p.project_id=le.project_id |
|
210 |
join locationevent sub_locationevent on sub_locationevent.parent_id=le.locationevent_id |
|
211 |
join location l on le.location_id=l.location_id |
|
212 |
join taxonoccurrence o on sub_locationevent.locationevent_id=o.locationevent_id |
|
213 |
join taxondetermination td on td.taxonoccurrence_id=o.taxonoccurrence_id |
|
214 |
join taxonverbatim tv on td.taxonverbatim_id=tv.taxonverbatim_id |
|
215 |
join aggregateoccurrence ao on o.taxonoccurrence_id=ao.taxonoccurrence_id |
Also available in: Unified diff
validation/aggregating/*.by=Brad@iPlant*: placed under version control, since these are now open-source