/ - Diff - Environment and organisms - NCEAS Projects

« Previous | Next »

Revision 08721acf

Added by Benoit Parmentier over 11 years ago

ID 08721acf112b52d746f96907f43c857161a52f82
Parent da7bcc4a
Child ba485f60

Changes to the validation script to handle the hold-out proportion at the monthly time scale

       #PARSING INPUT PARAMETERS
       out_path <- list_param$out_path
       day_list<- list_param$rast_day_year_list[[i]]
       day_list <- list_param$rast_day_year_list[[i]]
       #day_list <-rast_day_yearlist[[i]] #list of prediction for the current date...
       names_mod<-names(day_list)
       method_mod_obj<-list_param$method_mod_obj
       #Change to results_mod_obj[[i]]$data_s to make it less specific
       data_v <- method_mod_obj[[i]]$data_v
       data_s <- method_mod_obj[[i]]$data_s
       names_mod <- names(day_list)
       method_mod_obj <- list_param$method_mod_obj
       y_var_name <- list_param$y_var_name #missing--debugging
       multi_time_scale <- list_param$multi_time_scale
       if(multi_time_scale==TRUE){
         data_v <- method_mod_obj[[i]]$data_month_v
         data_s <- method_mod_obj[[i]]$data_month_s
         daily_dev_sampling_dat <- method_mod_obj[[i]]$daily_dev_sampling_dat
         sampling_dat_day <- method_mod_obj[[i]]$daily_dev_sampling_dat
       }else{
         #Change to results_mod_obj[[i]]$data_s to make it less specific
         data_v <- method_mod_obj[[i]]$data_v
         data_s <- method_mod_obj[[i]]$data_s
         sampling_dat_day <- (method_mod_obj[[i]])$sampling_dat
+      }
       ## Now create the stack
       rast_day_mod <- stack(day_list)
       names(rast_day_mod) <- names(day_list)
       extract_data_v<-extract(rast_day_mod,data_v,df=TRUE)
       extract_data_s<-extract(rast_day_mod,data_s,df=TRUE)
       data_v <-spCbind(data_v,extract_data_v) #should match IDs before joining for good practice
       data_s <-spCbind(data_s,extract_data_s)
       #Change to handle cases in which data_v is NULL!!!
       ns<-nrow(data_s) # some loss of data might have happened because of the averaging...
       nv<-nrow(data_v)
       sampling_dat_day<-(method_mod_obj[[i]])$sampling_dat
       metrics_v_obj<-calc_val_metrics_rast(data_v,y_var_name,names_mod)
       metrics_s_obj<-calc_val_metrics_rast(data_s,y_var_name,names_mod)
       #add sampling dat info...
       N=length(names_mod)
       run_info<-cbind(sampling_dat_day,n=nv)
       run_info[rep(seq_len(nrow(run_info)), each=N),] #repeating same row n times
       metrics_v_df<-cbind(metrics_v_obj$metrics,run_info)
       metrics_v_df["var_interp"]<-rep(y_var_name,times=nrow(metrics_v_df))
       #Name of the variable interpolated, useful for cross-comparison between methods at later stages
       run_info<-cbind(sampling_dat_day,n=ns)
       #Handle case of 0% hold out, monthly or daily
       if (nv > 0){
         run_info<-cbind(sampling_dat_day,n=nv)
         run_info[rep(seq_len(nrow(run_info)), each=N),] #repeating same row n times
         extract_data_v<-extract(rast_day_mod,data_v,df=TRUE)
         data_v <-spCbind(data_v,extract_data_v) #should match IDs before joining for good practice
         metrics_v_obj<-calc_val_metrics_rast(data_v,y_var_name,names_mod)
         metrics_v_df<-cbind(metrics_v_obj$metrics,run_info)
         metrics_v_df["var_interp"]<-rep(y_var_name,times=nrow(metrics_v_df))
         #Name of the variable interpolated, useful for cross-comparison between methods at later stages
         data_v<-spCbind(data_v,metrics_v_obj$residuals)
+      }
       extract_data_s<-extract(rast_day_mod,data_s,df=TRUE)
       data_s <-spCbind(data_s,extract_data_s)
       metrics_s_obj <- calc_val_metrics_rast(data_s,y_var_name,names_mod)
       run_info <- cbind(sampling_dat_day,n=ns)
       run_info[rep(seq_len(nrow(run_info)), each=N),]
       metrics_s_df<-cbind(metrics_s_obj$metrics,run_info)
       metrics_s_df["var_interp"]<-rep(y_var_name,times=nrow(metrics_s_df))
       metrics_s_df <- cbind(metrics_s_obj$metrics,run_info)
       metrics_s_df["var_interp"] <- rep(y_var_name,times=nrow(metrics_s_df))
       #Name of the variable interpolated, useful for cross-comparison between methods at later stages
       data_v<-spCbind(data_v,metrics_v_obj$residuals)
       data_s<-spCbind(data_s,metrics_s_obj$residuals)
       validation_obj<-list(metrics_s_df,metrics_v_df,data_s,data_v)
       names(validation_obj)<-c("metrics_s","metrics_v","data_s","data_v")
       data_s <- spCbind(data_s,metrics_s_obj$residuals)
       #prepare output object
       if (nv > 0){
         validation_obj<-list(metrics_s_df,metrics_v_df,data_s,data_v)
         names(validation_obj)<-c("metrics_s","metrics_v","data_s","data_v")
       }else{
         validation_obj<-list(metrics_s_df,data_s)
         names(validation_obj)<-c("metrics_s","data_s")
+      }
       return(validation_obj)
-...
       return(tb_list_tmp) #this is  a data.frame
+    }
     #### Function to create a list from an object made up of a list with names e.g. method_mod_obj or clim_method_mod_obj
     extract_list_from_list_obj <- function(obj_list, list_name) {
       # Extract the component named `list_name` from every element of `obj_list`.
       #
       # Args:
       #   obj_list:  list whose elements can be indexed by name with `[[`.
       #   list_name: name of the component to pull out of each element.
       #
       # Returns:
       #   An unnamed list with exactly length(obj_list) entries, in the same
       #   order as obj_list. Entry i is obj_list[[i]][[list_name]], or NULL
       #   when that element has no such component.
       #
       # seq_along() gives an empty sequence for an empty obj_list (1:length()
       # would iterate over c(1, 0) and fail), and lapply() keeps NULL results
       # in place, whereas `list_tmp[[i]] <- NULL` would delete an element and
       # shorten the output.
       list_tmp <- lapply(seq_along(obj_list), function(i) {
         obj_list[[i]][[list_name]] #double bracket to return the component itself
       })
       return(list_tmp) #this is a list, one entry per element of obj_list
     }
     #### Function to plot boxplot from data.frame table of accuracy metrics
     boxplot_from_tb <-function(tb_diagnostic,metric_names,out_prefix,out_path){

Also available in: Unified diff

Project

General

Profile

Revision 08721acf

Added by Benoit Parmentier over 11 years ago