/ - Diff - Environment and organisms - NCEAS Projects

« Previous | Next »

Revision 8c68c923

Added by Benoit Parmentier over 10 years ago

ID 8c68c923ad9be60e5c9ebd90b46da5f37a360c2b
Parent 7fe29b7e
Child bcfff168

global scalingup assessment modifications of stage 5 workflow code for diagnosis of issues

     #Part 2: Examine
     #AUTHOR: Benoit Parmentier
     #DATE: 08/05/2013
     #DATE MODIFIED: 05/21/2014
     #PROJECT: NCEAS INPLANT: Environment and Organisms --TASK#???--
-...
       #DATE: 08/05/2013
       #PROJECT: NCEAS INPLANT: Environment and Organisms --TASK#363--
       #1) in_path
       #1) in_path_tile: location of files, if NULL then code is run on NEX node or as stage 5
       #2) out_path
       #3) script_path
       #4) raster_prediction_obj
-...
       ### BEGIN SCRIPT
       #Parse input parameters
       #date_selected_results <- c("x")
       date_selected<-list_param$date_selected_results #dates for plot creation
       var<-list_param$var #variable being interpolated
       out_path <- list_param$out_path
       interpolation_method <- list_param$interpolation_method
       infile_covariates <- list_param$covar_obj$infile_covariates
       covar_names<-list_param$covar_obj$covar_names
       in_path_tile <- list_param$in_path_tile
       if(!is.null(in_path_tile)){
         covar_obj <- load_obj(list_param$covar_obj)
         infile_covariates <- file.path(in_path_tile,basename(covar_obj$infile_covariates))
         covar_names <- covar_obj$covar_names
       }else{ #we are on the node or running as stage 5
         infile_covariates <- list_param$covar_obj$infile_covariates #already loaded in memory
         covar_names<-list_param$covar_obj$covar_names
+      }
       #if raster_obj has not been loaded in memory then we have
       #the name of the RData object for a specific tile
       raster_prediction_obj<-list_param$raster_prediction_obj
       method_mod_obj<-raster_prediction_obj$method_mod_obj
       validation_mod_obj<-raster_prediction_obj$validation_mod_obj
       if(class(raster_prediction_obj)=="character"){
         raster_prediction_obj <- load_obj(raster_prediction_obj)
+      }
       method_mod_obj <- raster_prediction_obj$method_mod_obj
       validation_mod_obj <-raster_prediction_obj$validation_mod_obj
       if(interpolation_method %in% c("gam_CAI","kriging_CAI","gwr_CAI","gam_fusion","kriging_fusion","gwr_fusion")){
         multi_timescale <- TRUE
+      }
       #This should not be set here...? master script
       if (var=="TMAX"){
         y_var_name<-"dailyTmax"
-...
         y_var_name<-"dailyTmin"
         y_var_month <-"TMin"
+      }
       #add precip option later...
       ## Read covariate brick...
       s_raster<-brick(infile_covariates)
       names(s_raster)<-covar_names               #Assigning names to the raster layers: making sure it is included in the extraction
       s_raster <- brick(infile_covariates) #stack produced for specific tile
       names(s_raster)<- covar_names               #Assigning names to the raster layers: making sure it is included in the extraction
       ## Prepare study area  mask: based on LC12 (water)
       LC_mask<-subset(s_raster,"LC12")
       LC_mask[LC_mask==100]<-NA
       LC_mask <- subset(s_raster,"LC12")
       LC_mask[LC_mask==100]<- NA
       LC_mask <- LC_mask < 100
       LC_mask_rec<-LC_mask
       LC_mask_rec[is.na(LC_mask_rec)]<-0
       LC_mask_rec[is.na(LC_mask_rec)]<- 0
       #determine index position matching date selected
       i_dates<-vector("list",length(date_selected))
-...
+      }
       #Examine the first select date add loop or function later
       #j=1
       date<-strptime(date_selected[j], "%Y%m%d")   # interpolation date being processed
       month<-strftime(date, "%m")          # current month of the date being processed
       date <- strptime(date_selected[j], "%Y%m%d")   # interpolation date being processed
       month <- strftime(date, "%m")          # current month of the date being processed
       #Get raster stack of interpolated surfaces
       index<-i_dates[[j]]
       pred_temp<-as.character(method_mod_obj[[index]][[y_var_name]]) #list of daily prediction files with path included
       rast_pred_temp_s <-stack(pred_temp) #stack of temperature predictions from models (daily)
       rast_pred_temp <-mask(rast_pred_temp_s,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE)
       index <- i_dates[[j]]
       ##The path of production is not the same if input_path_tile is not NULL
       if(!is.null(in_path_tile)){
         #infile_covariates <- file.path(in_path_tile,basename(list_param$covar_obj$infile_covariates))
         pred_temp <- basename(as.character(method_mod_obj[[index]][[y_var_name]])) #list of daily prediction files with path included
         pred_temp <- file.path(in_path_tile,pred_temp)
       }else{
         pred_temp <- as.character(method_mod_obj[[index]][[y_var_name]]) #list of daily prediction files with path included
+      }
       rast_pred_temp_s <- stack(pred_temp) #stack of temperature predictions from models (daily)
       rast_pred_temp <- mask(rast_pred_temp_s,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE)
       #Get validation metrics, daily spdf training and testing stations, monthly spdf station input
       sampling_dat<-method_mod_obj[[index]]$sampling_dat
       metrics_v<-validation_mod_obj[[index]]$metrics_v
       metrics_s<-validation_mod_obj[[index]]$metrics_s
       data_v<-validation_mod_obj[[index]]$data_v
       data_v<-validation_mod_obj[[index]]$data_v #testing with residuals
       data_s<-validation_mod_obj[[index]]$data_s
       formulas<-method_mod_obj[[index]]$formulas
       #no formula if multi-timescale method
       if(multi_timescale==TRUE){
         formulas<- raster_prediction_obj$clim_method_mod_obj[[as.integer(month)]]$formulas #models ran
       }else{
         formulas<- method_mod_obj[[index]]$formulas #models ran
+      }
       #Adding layer LST to the raster stack of covariates
       #The names of covariates can be changed...
-...
       rmse_f<-metrics_s$rmse[nrow(metrics_s)]
       #Set as constant in master script ?? : c("gam_CAI","kriging_CAI","gwr_CAI","gam_fusion","kriging_fusion","gwr_fusion")
       if (interpolation_method %in% c("gam_CAI","kriging_CAI","gwr_CAI","gam_fusion","kriging_fusion","gwr_fusion")){
       #if (interpolation_method %in% c("gam_CAI","kriging_CAI","gwr_CAI","gam_fusion","kriging_fusion","gwr_fusion")){
       if (multi_timescale==TRUE){
         #if multi-time scale method then the raster prediction object contains a "clim_method_mod_obj"
         clim_method_mod_obj <- raster_prediction_obj$clim_method_mod_obj
         data_month<-clim_method_mod_obj[[index]]$data_month
         data_month <-clim_method_mod_obj[[mo]]$data_month
         png(file.path(out_path,paste("LST_",y_var_month,"_scatterplot_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
                                      out_prefix,".png", sep="")))
         plot(data_month[[y_var_month]],data_month$LST,xlab=paste("Station mo ",y_var_month,sep=""),ylab=paste("LST mo ",y_var_month,sep=""))
         title(paste("LST vs ", y_var_month,"for",datelabel,sep=" "))
         plot(data_month[[y_var_month]],data_month$LST,xlab=paste("Station mo ",y_var_month,sep=""),ylab=paste("LST month ",mo," ",sep=""))
         title(paste("LST vs ", y_var_month,"for month ",mo,sep=" "))
         abline(0,1)
         nb_point<-paste("n=",length(data_month[[y_var_month]]),sep="")
         LSTD_bias <- data_month$TMax - data_month$LST #in case it is a CAI method, calculate bias
-...
         dev.off()
         ## Figure 2: Daily_tmax_monthly_TMax_scatterplot, modify for TMin!!
         png(file.path(out_path,paste("Month_day_scatterplot_",y_var_name,"_",y_var_month,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
                                      out_prefix,".png", sep="")))
         plot(data_s[[y_var_name]]~data_s[[y_var_month]],xlab=paste("Month") ,ylab=paste("Daily for",datelabel),main="across stations in VE")
         nb_point<-paste("ns=",length(data_s[[y_var_month]]),sep="")
         nb_point2<-paste("ns_obs=",length(data_s[[y_var_month]])-sum(is.na(data_s[[y_var_name]])),sep="")
         nb_point3<-paste("n_month=",length(data_month[[y_var_month]]),sep="")
         #This is not stored in data_s$TMax?
         #png(file.path(out_path,paste("Month_day_scatterplot_",y_var_name,"_",y_var_month,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
         #                             out_prefix,".png", sep="")))
         #plot(data_s[[y_var_name]]~data_s[[y_var_month]],xlab=paste("Month") ,ylab=paste("Daily for",datelabel),main="across stations in VE")
         #nb_point<-paste("ns=",length(data_s[[y_var_month]]),sep="")
         #nb_point2<-paste("ns_obs=",length(data_s[[y_var_month]])-sum(is.na(data_s[[y_var_name]])),sep="")
         #nb_point3<-paste("n_month=",length(data_month[[y_var_month]]),sep="")
         #Add the number of data points on the plot
         legend("topleft",legend=c(nb_point,nb_point2,nb_point3),bty="n",cex=0.8)
         dev.off()
         #legend("topleft",legend=c(nb_point,nb_point2,nb_point3),bty="n",cex=0.8)
         #dev.off()
         ## Figure 3: monthly stations used
         png(file.path(out_path,paste("Monthly_data_study_area_", y_var_name,
                                      out_prefix,".png", sep="")))
         plot(raster(rast_pred_temp,layer=5))
         plot(raster(rast_pred_temp,layer=1))
         plot(data_month,col="black",cex=1.2,pch=4,add=TRUE)
         title("Monthly ghcn station in Venezuela for January")
         title("Monthly ghcn station in tile for January")
         dev.off()
+      }
       } #End of if multi_timescale=TRUE
       ## Figure 4: Predicted_tmax_versus_observed_scatterplot
       names_mod <- names(method_mod_obj[[index]][[y_var_name]]) #names of models to plot
-...
+      }
       ## Figure 5a: prediction raster images
       png(file.path(out_path,paste("Raster_prediction_",y_var_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
       png(file.path(out_path,paste("Raster_prediction_levelplot_",y_var_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
                 out_prefix,".png", sep="")))
       #paste(metrics_v$pred_mod,format(metrics_v$rmse,digits=3),sep=":")
       names(rast_pred_temp)<-paste(metrics_v$pred_mod,format(metrics_v$rmse,digits=3),sep=":")
-...
       dev.off()
       ## Figure 5b: prediction raster images
       png(file.path(out_path,paste("Raster_prediction_plot",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
       png(file.path(out_path,paste("Raster_prediction_plot_",y_var_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
                 out_prefix,".png", sep="")))
       #paste(metrics_v$pred_mod,format(metrics_v$rmse,digits=3),sep=":")
       names(rast_pred_temp)<-paste(metrics_v$pred_mod,format(metrics_v$rmse,digits=3),sep=":")
       plot(rast_pred_temp)
       dev.off()
       ## Figure 6: training and testing stations used
       ## Figure 6: training and testing daily stations used
       png(file.path(out_path,paste("Training_testing_stations_map_",y_var_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",sampling_dat$run_samp,
                 out_prefix,".png", sep="")))
       plot(raster(rast_pred_temp,layer=5))
       plot(raster(rast_pred_temp,layer=1))
       plot(data_s,col="black",cex=1.2,pch=2,add=TRUE)
       plot(data_v,col="red",cex=1.2,pch=1,add=TRUE)
       legend("topleft",legend=c("training stations", "testing stations"),
              cex=1, col=c("black","red"),
              pch=c(2,1),bty="n")
       title(paste("Daily stations ", datelabel,sep=""))
       nb_point1<-paste("ns_obs=",nrow(data_s),sep="")
       nb_point2<-paste("nv_obs=",nrow(data_v),sep="")
       legend("bottomright",legend=c(nb_point1,nb_point2),bty="n",cex=0.8)
       dev.off()
       ## Figure 7: delta surface and bias
-...
       if (interpolation_method%in% c("gam_fusion","kriging_fusion","gwr_fusion")){
         png(file.path(out_path,paste("Bias_delta_surface_",y_var_name,"_",sampling_dat$date[i],"_",sampling_dat$prop[i],
                   "_",sampling_dat$run_samp[i],out_prefix,".png", sep="")))
         bias_rast<-stack(clim_method_mod_obj[[index]]$bias)
         delta_rast<-raster(method_mod_obj[[index]]$delta) #only one delta image!!!
           ##The path of production is not the same if input_path_tile is not NULL
         if(!is.null(in_path_tile)){
           #infile_covariates <- file.path(in_path_tile,basename(list_param$covar_obj$infile_covariates))
           bias_lf <- basename(as.character(clim_method_mod_obj[[index]]$bias)) #list of daily prediction files with path included
           bias_lf <- file.path(in_path_tile,bias_lf)
           delta_lf <- basename(unlist(method_mod_obj[[index]]$delta))
           delta_lf <- file.path(in_path,delta_lf)
         }else{
           bias_lf <- clim_method_mod_obj[[index]]$bias #list of daily prediction files with path included
           delta_lf <- method_mod_obj[[index]]$delta
+        }
         bias_rast<-stack(bias_lf)
         delta_rast<-raster(delta_lf) #only one delta image!!!
         names(delta_rast)<-"delta"
         rast_temp_date<-stack(bias_rast,delta_rast)
         layers_names <- names(rast_temp_date)
-...
         plot(rast_temp_date)
         dev.off()
+      }
       #if CAI
       if (interpolation_method %in% c("gam_CAI","kriging_CAI","gwr_CAI","gam_fusion","kriging_fusion","gwr_fusion")){
         png(file.path(out_path,paste("clim_surface_",y_var_name,"_",sampling_dat$date[i],"_",sampling_dat$prop[i],
                   "_",sampling_dat$run_samp[i],out_prefix,".png", sep="")))
         clim_rast<-stack(clim_method_mod_obj[[index]]$clim)
         delta_rast<-raster(method_mod_obj[[index]]$delta) #only one delta image!!!
         names(delta_rast)<-"delta"
         layers_names <- c(names(clim_rast),"delta")
         rast_temp_date<-stack(clim_rast,delta_rast)
         rast_temp_date<-mask(rast_temp_date,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE) #loosing names here
           ##The path of production is not the same if input_path_tile is not NULL
         if(!is.null(in_path_tile)){
           #infile_covariates <- file.path(in_path_tile,basename(list_param$covar_obj$infile_covariates))
           clim_lf <- basename(as.character(clim_method_mod_obj[[mo]]$clim)) #list of daily prediction files with path included
           clim_lf <- file.path(in_path_tile,clim_lf)
           delta_lf <- basename(unlist(method_mod_obj[[index]]$delta))
           delta_lf <- file.path(in_path,delta_lf)
         }else{
           clim_lf <- clim_method_mod_obj[[index]]$clim #list of monthly prediction files with path included
           delta_lf <- method_mod_obj[[index]]$delta
+        }
         clim_rast<-stack(clim_lf)
         delta_rast<-stack(delta_lf) #this is a stack now... delta images!!!
         names(delta_rast)<- paste(names_mod,"_delta",sep="")
         names(clim_rast) <- paste(names_mod,"_month",mo,sep="")
         #layers_names <- c(names(clim_rast),"delta")
         #rast_temp_date<-stack(clim_rast,delta_rast)
         #rast_temp_date<-mask(rast_temp_date,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE) #loosing names here
         #bias_d_rast<-raster("fusion_bias_LST_20100103_30_1_10d_GAM_fus5_all_lstd_02082013.rst")
         names(rast_temp_date) <-layers_names
         plot(rast_temp_date)
         #names(rast_temp_date) <-layers_names
         #plot(rast_temp_date)
         plot(clim_rast)
         #title("Climatology for month ", mo, sep="")
         dev.off()
         png(file.path(out_path,paste("delta_surface_",y_var_name,"_",sampling_dat$date[i],"_",sampling_dat$prop[i],
                   "_",sampling_dat$run_samp[i],out_prefix,".png", sep="")))
         plot(delta_rast)
         dev.off()
+      }
       ### Figure 9: map of residuals...
       for (k in 1:length(names_mod)){
         model_name <- names_mod[k]
         #fig_name <- file.path(out_path,paste("Figure_residuals_map_",y_var_name,"_",model_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",
         #                             sampling_dat$run_samp,out_prefix,".png", sep=""))
         png(file.path(out_path,paste("Figure_residuals_map_",y_var_name,"_",model_name,"_",sampling_dat$date,"_",sampling_dat$prop,"_",
                                      sampling_dat$run_samp,out_prefix,".png", sep="")))
         res_model_name <- paste("res",model_name,sep="_")
         elev <- subset(s_raster,"elev_s")
         p1 <- levelplot(elev,scales = list(draw = FALSE), colorkey = FALSE,col.regions=rev(terrain.colors(255)))
         #add legend..
         cx <- ((data_v[[res_model_name]])^2)/10
         p2 <- spplot(data_v,res_model_name, cex=1 * cx,main=paste("Residuals for ",res_model_name," ",datelabel,sep=""))
         p3 <-p2+p1+p2 #to force legend...
         #p2
         print(p3)
         dev.off()
+      }
       #Figure 9: histogram for all images...
       #Figure 9: histogram for all images/residuals...
       ## Add later...? distance to closest fitting station?
       #tb_diagnostic_v <- raster_prediction_obj$tb_diagnostic_v

Also available in: Unified diff

Project

General

Profile

Revision 8c68c923

Added by Benoit Parmentier over 10 years ago