/ - Diff - Environment and organisms - NCEAS Projects

« Previous | Next »

Revision 80363c49

Added by Benoit Parmentier over 11 years ago

ID 80363c49e7c215185b5f241c6c196f0232ef7702
Parent 280bb8d2
Child 7b9aba64

analyses paper, experimentation with correlograms in predictions

     ### Analyses and exploration of results for single time scale methods
     ### Loading R library and packages
     #library used in the workflow production:
     library(gtools)                              # loading some useful tools
     library(mgcv)                                # GAM package by Simon Wood
     library(sp)                                  # Spatial package with class definition by Bivand et al.
     library(spdep)                               # Spatial package with methods and spatial stat. by Bivand et al.
     library(rgdal)                               # GDAL wrapper for R, spatial utilities
     library(gstat)                               # Kriging and co-kriging by Pebesma et al.
     library(fields)                              # NCAR Spatial Interpolation methods such as kriging, splines
     library(raster)                              # Hijmans et al. package for raster processing
     library(gdata)                               # various tools with xls reading, cbindX
     library(rasterVis)                           # Raster plotting functions
     library(parallel)                            # Parallelization of processes with multiple cores
     library(maptools)                            # Tools and functions for sp and other spatial objects e.g. spCbind
     library(maps)                                # Tools and data for spatial/geographic objects
     library(reshape)                             # Change shape of object, summarize results
     library(plotrix)                             # Additional plotting functions
     library(plyr)                                # Various tools including rbind.fill
     library(spgwr)                               # GWR method
     library(automap)                             # Kriging automatic fitting of variogram using gstat
     library(rgeos)                               # Geometric, topologic library of functions
     #RPostgreSQL                                 # Interface R and Postgres, not used in this script
     #Additional libraries not used in workflow
     library(pgirmess)                            # Kruskal-Wallis test with multiple options, kruskalmc {pgirmess}
     library(ncf)
     #### FUNCTION USED IN SCRIPT
     function_analyses_paper <-"contribution_of_covariates_paper_interpolation_functions_10152013.R"
     # Load an object stored in an .RData file and return it, without writing
     # anything into the caller's workspace.
     #
     # f: path to a file created with save().
     # Returns the object whose name is listed first by load(); any other object
     # stored in the same file is ignored.
     load_obj <- function(f)
     {
       env <- new.env()                  # private environment: load() cannot overwrite existing variables
       nm <- load(f, envir = env)[1]     # load() returns the names of the restored objects
       env[[nm]]
     }
     ##############################
     #### Parameters and constants
     script_path<-"/home/parmentier/Data/IPLANT_project/env_layers_scripts/" #path to script
     source(file.path(script_path,function_analyses_paper)) #source all functions used in this script.
     in_dir1 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb3_08132013"
     in_dir2 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb4_08152013"
     #kriging results:
     in_dir3 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_day_lst_comb3_07112013"
     #gwr results:
     in_dir4 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gwr_day_lst_comb3_part1_07122013"
     #multisampling results (gam)
     #in_dir5<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_daily_mults10_lst_comb3_08082013"
     #in_dir6<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_daily_mults10_lst_comb3_08062013"
     #in_dir7<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gwr_daily_mults10_lst_comb3_08072013"
     #Hold-out every two days over 365 days
     in_dir5 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_daily_mults1_lst_comb3_10122013"
     in_dir6 <- "/data/project/layers/commons/Oregon_interpolation/output_data_365d_kriging_daily_mults1_lst_comb3_10112013"
     in_dir7 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_daily_mults1_lst_comb3_10132013"
     out_dir<-"/home/parmentier/Data/IPLANT_project/paper_analyses_tables_fig_08032013"
     setwd(out_dir)
     infile_reg_outline <- "/data/project/layers/commons/data_workflow/inputs/region_outlines_ref_files/OR83M_state_outline.shp"  #input region outline defined by polygon: Oregon
     met_stations_outfiles_obj_file<-"/data/project/layers/commons/data_workflow/output_data_365d_gam_fus_lst_test_run_07172013/met_stations_outfiles_obj_gam_fusion__365d_gam_fus_lst_test_run_07172013.RData"
     CRS_locs_WGS84<-CRS("+proj=longlat +ellps=WGS84 +datum=WGS84 +towgs84=0,0,0") #Station coords WGS84
     y_var_name <- "dailyTmax"
     out_prefix<-"analyses_10152013"
     #method_interpolation <- "gam_daily"
     covar_obj_file_1 <- "covar_obj__365d_gam_day_lst_comb3_08132013.RData"
     met_obj_file_1 <- "met_stations_outfiles_obj_gam_daily__365d_gam_day_lst_comb3_08132013.RData"
     #met_stations_outfiles_obj_gam_daily__365d_gam_day_lst_comb3_08132013.RData
     #raster_prediciton object for baseline 1 () s(lat,lon) + s(elev)) and baseline 2 (slat,lon))
     raster_obj_file_1 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_day_lst_comb3_08132013.RData"
     raster_obj_file_2 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_day_lst_comb4_08152013.RData"
     raster_obj_file_3 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_day_lst_comb3_07112013.RData"
     raster_obj_file_4 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_day_lst_comb3_part1_07122013.RData"
     #multisampling using baseline lat,lon + elev
     #raster_obj_file_5 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_daily_mults10_lst_comb3_08082013.RData"
     #raster_obj_file_6 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_daily_mults10_lst_comb3_08062013.RData"
     #raster_obj_file_7 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_daily_mults10_lst_comb3_08072013.RData"
     raster_obj_file_5 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_daily_mults1_lst_comb3_10122013.RData"
     raster_obj_file_6 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_daily_mults1_lst_comb3_10112013.RData"
     raster_obj_file_7 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_daily_mults1_lst_comb3_10132013.RData"
     #Load objects containing training, testing, models objects
     met_stations_obj <- load_obj(met_stations_outfiles_obj_file)
     covar_obj <-load_obj(file.path(in_dir1,covar_obj_file_1)) #Reading covariates object for GAM daily method
     infile_covariates <- covar_obj$infile_covariates
     infile_reg_outline <- covar_obj$infile_reg_outline
     covar_names<- covar_obj$covar_names
     #####
     s_raster <- brick(infile_covariates)
     names(s_raster)<-covar_names
     raster_prediction_obj_1 <-load_obj(file.path(in_dir1,raster_obj_file_1)) #comb3 (baseline 2)
     raster_prediction_obj_2 <-load_obj(file.path(in_dir2,raster_obj_file_2)) #comb4 (baseline 1)
     raster_prediction_obj_3 <-load_obj(file.path(in_dir3,raster_obj_file_3)) #comb3/mod1 baseline 2, kriging
     raster_prediction_obj_4 <-load_obj(file.path(in_dir4,raster_obj_file_4)) #comb3/mod1 baseline 2, gwr
     raster_prediction_obj_5 <-load_obj(file.path(in_dir5,raster_obj_file_5)) #gam daily multisampling 10 to 70%
     raster_prediction_obj_6 <-load_obj(file.path(in_dir6,raster_obj_file_6)) #kriging daily multisampling 10 to 70%
     raster_prediction_obj_7 <-load_obj(file.path(in_dir7,raster_obj_file_7)) #gwr daily multisampling 10 to 70%
     ############### BEGIN SCRIPT #################
     ############ PART 1: Exploration of surfaces bias, delta and climatology surfaces ###########
     #"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb4_07152013/"
     in_dir<-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_cai_lst_comb3_07312013"
     out_dir<-""
     setwd(in_dir)
     y_var_name <- "dailyTmax"
     y_var_month <- "TMax"
     #y_var_month <- "LSTD_bias"
     out_prefix<-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_GAM_fus_all_lst_05312013"
     method_interpolation <- "kriging_CAI"
     covar_obj_file <- "covar_obj__365d_kriging_cai_lst_comb3_07312013.RData"
     raster_obj_file <- "raster_prediction_obj_kriging_CAI_dailyTmax_365d_kriging_cai_lst_comb3_07312013.RData"
     script_path<-"/data/project/layers/commons/data_workflow/env_layers_scripts/"
     source(file.path(script_path,"interpolation_method_day_function_multisampling_07052013.R")) #Include GAM_day
     #Load objects containing training, testing, models objects
     covar_obj <-load_obj(covar_obj_file)
     infile_covariates <- covar_obj$infile_covariates
     infile_reg_outline <- covar_obj$infile_reg_outline
     covar_names<- covar_obj$covar_names
     raster_prediction_obj <-load_obj(raster_obj_file)
     names(raster_prediction_obj) #list of two objects
     raster_prediction_obj$summary_metrics_v
     j<-1 #selected month for climatology
     i<-1
     data_s <- raster_prediction_obj$method_mod_obj[[i]]$data_s #training data
     data_v <- raster_prediction_obj$method_mod_obj[[i]]$data_v #testing data
     method_mod_obj <- raster_prediction_obj$method_mod_obj #this object contains daily information, training, testing and images
     clim_method_mod_obj <- raster_prediction_obj$clim_method_mod_obj
     data_month1 <- clim_method_mod_obj[[1]]$data_month #monthly data
     data_month <- clim_method_mod_obj[[j]]$data_month #monthly data
     clim_mod_obj_month <- clim_method_mod_obj[[j]]
     names(clim_mod_obj_month)
     #####
     s_raster <- brick(infile_covariates)
     names(s_raster)<-covar_names
     #data_s$y_var <- data_s[[y_var_name]]
     #formula<-"y_var ~ s(lat,lon,elev_s)"
     #date<-strptime(sampling_dat$date[i], "%Y%m%d")   # interpolation date being processed
     # The strptime() call that would define the interpolation date is commented out above,
     # so strftime(date, "%m") would be applied to the base function `date` and fail
     # (unless `date` is defined by a sourced script). The month is set explicitly instead.
     #month<-strftime(date, "%m")          # current month of the date being processed
     month <- "01"                          # selected month
     LST_month <- paste0("mm_", month)      # name of LST month to be matched, i.e. "mm_01"
     pos<-match("LST",names(s_raster)) #Find the position of the layer with name "LST", if not present pos=NA
     s_raster<-dropLayer(s_raster,pos)      # If it exists drop layer
     LST<-subset(s_raster,LST_month)
     names(LST)<-"LST"
     s_raster<-addLayer(s_raster,LST)            #Adding current month
     ### MONTH MODELS
     index<-1
     data_month$y_var<-data_month[[y_var_month]]
     mod1 <- clim_method_mod_obj[[1]]$mod[[1]]
     clim_method_mod_obj[[1]]$clim #list of files containing model predictions...
     clim_rast<-stack(clim_method_mod_obj[[index]]$clim)
     delta_rast<-raster(method_mod_obj[[index]]$delta) #only one delta image!!!
     pred_temp<-as.character(method_mod_obj[[index]][[y_var_name]]) #list of files with path included
     rast_pred_temp_s <-stack(pred_temp) #stack of temperature predictions from models (daily)
     names(delta_rast)<-"delta"
     rast_temp_date<-stack(clim_rast,delta_rast)
     #rast_temp_date<-mask(rast_temp_date,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE)
     #bias_d_rast<-raster("fusion_bias_LST_20100103_30_1_10d_GAM_fus5_all_lstd_02082013.rst")
     plot(rast_temp_date)
     month_m_rast<-subset(clim_rast,"mod1")
     day_m_rast<-subset(rast_pred_temp_s,1)
     test<- month_m_rast + delta_rast
     diff <- test - day_m_rast  #this is roughly equal to zero...
     s_sgdf<-as(day_m_rast,"SpatialGridDataFrame") #Conversion to spatial grid data frame, only convert the necessary layers!!
     #s_spdf<-as(day_m_rast,"SpatialPointsDataFrame") #Conversion to spatial grid data frame, only convert the necessary layers!!
     names(s_sgdf)<-"var1.pred"
     mod1$krige_output<-s_sgdf
     plot(mod1) #does not work because we set krige_output to null!!!
     formula_mod<-formula("y_var~lat*lon + elev_s")
     col_names<-all.vars(formula_mod) #extract terms names from formula object
     # Choose the data used to fit the variogram/kriging model: with a single
     # variable in the formula the monthly data are used as they are, otherwise
     # they are passed through remove_na_spdf() together with the formula variables.
     if (length(col_names)==1){
       data_fit <-data_month
     }else{
       data_fit <- remove_na_spdf(col_names,data_month)
     }
     ref_rast<-as(subset(s_raster,1),"SpatialGridDataFrame")
     s_spdf<-select_var_stack(s_raster,formula_mod,spdf=TRUE) #This only works if s_raster is in memory!!! need to be modified
     proj4string(data_fit)<-proj4string(s_spdf)
     test_mod <- autoKrige(formula_mod, input_data=data_fit,new_data=s_spdf,data_variogram=data_fit)
     plot(test_mod)
     prediction_spdf = test_mod$krige_output
     sample_variogram = test_mod$exp_var
     variogram_model = test_mod$var_model
     #### CHECKING THE INPUTS FROM COVARIATES
     LC1 <- subset(s_raster,"LC1")
     plot(LC1,colNA=c("red"))
     LC2 <- subset(s_raster,"LC2")
     plot(LC2,colNA=c("red"))
     LC_names<- paste("LC",1:10,sep="")
     lc_reg_s <-subset(s_raster,LC_names)
     plot(lc_reg_s,colNA="red")
     plot(subset(s_raster,"CANHGHT"),colNA="red")
     #Now create mask based on water areas
     LC12<-raster(lc_reg_s,layer=nlayers(lc_reg_s)) #this is open water
     LC_mask<-LC12
     LC_mask[LC_mask==100]<-NA
     LC_mask <- LC_mask > 100
     CANHGHT <- subset(s_raster,"CANHGHT")
     lc_path<-"/data/project/layers/commons/data_workflow/inputs/lc-consensus-global"
     infile_modis_grid<-"/data/project/layers/commons/data_workflow/inputs/modis_grid/modis_sinusoidal_grid_world.shp" #modis grid tiling system, global
     infile_elev<-"/data/project/layers/commons/data_workflow/inputs/dem-cgiar-srtm-1km-tif/srtm_1km.tif"  #elevation at 1km, global extent to be replaced by the new fused product
     infile_canheight<-"/data/project/layers/commons/data_workflow/inputs/treeheight-simard2011/Simard_Pinto_3DGlobalVeg_JGR.tif"         #Canopy height, global extent
     infile_distoc <- "/data/project/layers/commons/data_workflow/inputs/distance_to_coast/GMT_intermediate_coast_distance_01d_rev.tif" #distance to coast, global extent at 0.01 deg
     CANH<-raster(infile_canheight)
     LC1_W<-raster(list.files(path=lc_path,full.names=T)[4])
     #Correlation matrix for a subset
     r<-subset(s_raster,5:8)
     t44<-layerStats(r,"pearson",na.rm=T)
     image(t44[[1]])
     ###########################################################################################
     ############ PART 2: Granularity-Autocorrelation analyses of predicted surfaces ###########
     #####
     lf2 <- raster_prediction_obj_2$method_mod_obj[[index]][[y_var_name]]
     lf2 #contains the models for gam
     pred_temp_s <-stack(lf2)
     # NOTE(review): "20109101" is not a valid YYYYMMDD date (month "91"); possibly "20100901" was intended -- confirm
     date_selected <- "20109101"
     #names_layers <-c("mod1=s(lat,long)+s(elev)","mod4=s(lat,long)+s(LST)","diff=mod1-mod4")
     names_layers <-c("mod1 = s(lat,long)","mod2 = s(lat,long)+s(elev)","mod3 = s(lat,long)+s(N_w)","mod4 = s(lat,long)+s(E_w)",
                      "mod5 = s(lat,long)+s(LST)","mod6 = s(lat,long)+s(DISTOC)","mod7 = s(lat,long)+s(LC1)",
                      "mod8 = s(lat,long)+s(LC1,LST)","mod9 = s(lat,long)+s(CANHGHT)","mod10 = s(lat,long)+s(LST,CANHGHT)")
     #names_layers<-names(pred_temp_s)
     #names(pred_temp_s)<-names_layers
     s.range <- c(min(minValue(pred_temp_s)), max(maxValue(pred_temp_s)))
     #s.range <- s.range+c(5,-5)
     col.breaks <- pretty(s.range, n=200)
     lab.breaks <- pretty(s.range, n=100)
     temp.colors <- colorRampPalette(c('blue', 'white', 'red'))
     max_val<-s.range[2]
     min_val <-s.range[1]
     #max_val<- -10
     #min_val <- 0
     layout_m<-c(4,3) #lattice layout is c(columns, rows): 4 columns, 3 rows
     # Panel plot of all predicted surfaces with a common blue-white-red colour scale.
     # The break points given to `at` must be increasing: seq() stops with
     # "wrong sign in 'by' argument" when called from the maximum to the minimum
     # with a positive step, so the sequence runs from min_val to max_val.
     # NOTE(review): `layout` is placed inside par.settings here; levelplot() normally
     # takes it as a direct argument -- confirm whether the 4x3 layout is actually applied.
     p<-levelplot(pred_temp_s,main="Interpolated Surfaces Model Comparison baseline 1", ylab=NULL,xlab=NULL,
               par.settings = list(axis.text = list(font = 2, cex = 1.3),layout=layout_m,
                                   par.main.text=list(font=2,cex=2),strip.background=list(col="white")),par.strip.text=list(font=2,cex=1.5),
               names.attr=names_layers,col.regions=temp.colors,at=seq(min_val,max_val,by=0.01))
     #col.regions=temp.colors(25))
     print(p)
     #####################################
     ### Create spatial correlogram ####
     r_mod5 <- subset(pred_temp_s,"mod5") #with LST
     r_mod1 <- subset(pred_temp_s,"mod1") #with lat,long
     r_mod2 <- subset(pred_temp_s,"mod2") #with elev
     df_mod5 <- as(r_mod5,"SpatialPointsDataFrame")
     df_mod1 <- as(r_mod1,"SpatialPointsDataFrame")
     df_mod2 <- as(r_mod2,"SpatialPointsDataFrame")
     r_stack <-stack(subset(s_raster,"mm_01"),pred_temp_s)
     df_rs <- as(r_stack,"SpatialPointsDataFrame")
     correg_t<-correlog(coordinates(df_mod5),df_mod5$mod5)
     correg_t<-correlog(coordinates(df_mod5)[,1],coordinates(df_mod5)[,2],df_mod5$mod5)
     data_s<-(as.data.frame((list_data_s[[1]])))
     data_v<-(list_data_v[[1]])
     data_s <-na.omit(data_s[,c("x","y","LST",y_var_name,"elev")])
     correg_t1 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s$LST)
     correg_t2 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s$elev)
     correg_t3 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s[[y_var_name]])
     correg_t4 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s[,c("LST",y_var_name,"elev")])
     plot(correg_t1)
     plot(correg_t2,add=T)
     correg_t1[,1]
     correg_t2[,1]
     # Gather the correlogram values of the three variables in one table and plot them
     # against distance. The column names follow the order in which the columns are
     # bound: distance, LST (correg_t1), elev (correg_t2), then the y variable (correg_t3).
     df_x <- as.data.frame(cbind(correg_t1[,1],correg_t1[,2],correg_t2[,2],correg_t3[,2]))
     names(df_x)<-c("dist","LST","elev",y_var_name)
     xyplot(LST+dailyTmax+elev~dist,df_x,type="b",
            auto.key=list(title="Var", space = "right", cex=1.0),
            par.settings = list(superpose.symbol=list(pch = 0:3, cex=1)))
     ### For the whole image:
     # Compute a spatial correlogram for one variable. Written to be called through
     # lapply()/mclapply(), with i selecting the per-variable entries of list_param.
     #
     # i          : index of the variable to process
     # list_param : named list with the elements
     #   list_df           - list of objects; the variable is extracted from element i with [[ ]]
     #   var_zname         - vector of variable names, one per element of list_df
     #   order_lag         - vector of maximum lag orders, one per element of list_df
     #   method_cor        - value passed as `method` to sp.correlogram()
     #   nb_obj            - neighbours object passed to sp.correlogram()
     #   randomisation_par - value passed as `randomisation`; a logical or the
     #                       string "TRUE"/"FALSE"
     # Returns the object produced by sp.correlogram().
     sp_correlogram_fun <- function(i,list_param){
       df <- list_param$list_df[[i]]
       var_zname <- list_param$var_zname[i]
       order_lag <- list_param$order_lag[i]
       method_cor <- list_param$method_cor
       nb_obj <- list_param$nb_obj
       # The script stores this flag as the string "FALSE"; convert it so that a
       # real logical is handed to sp.correlogram().
       randomisation_par <- as.logical(list_param$randomisation_par)

       sp.cor <- sp.correlogram(nb_obj, df[[var_zname]], order=order_lag,
                                method=method_cor, randomisation=randomisation_par)
       return(sp.cor)
     }
     # 'nb' - neighbourhood of each cell
     #r.nb <- dnearneigh(as.matrix(xy), d1=0.5, d2=1.5)
     # 'nb' - an alternative way to specify the neighbourhood
     # r.nb <- cell2nb(nrow=side, ncol=side, type="queen")
     #sp.cor <- sp.correlogram(r.nb, df_mod5$mod5, order=15,
     #                         method="I", randomisation=FALSE)
     r_stack <-stack(subset(s_raster,c("mm_01","mm_07")),pred_temp_s)
     names(r_stack)[1:2]<-c("mm01","mm_07")
     df_rs <- as(r_stack,"SpatialPointsDataFrame")
     r.nb <- dnearneigh(coordinates(df_rs), d1=res(s_raster)[1]/2, d2=1.5*res(s_raster)[1]) #lag1
     #Do not run... slow
     rk.nb14 <- knearneigh(coordinates(df_rs), k=14) #lag1
     #rk_nb14 <- knearneigh(coordinates(df_rs), k=14) #lag1
     #save(rk_nb14, file = "rk_nb14.RData")
     #rk_nb7 <- knearneigh(coordinates(df_rs), k=7) #lag1
     #save(rk_nb7, file = "rk_nb7.RData")
     #lrk_nb7 <- knn2nb(rk_nb7)
     #m_LST1 <- moran.test(df_rs$mm01,nb2listw(lrk_nb7),na.action=na.omit,zero.policy=TRUE)
     #sp.cor <- sp.correlogram(lrk_nb7, df_rs$mm01, order=7,
     #                         method="I", randomisation=FALSE)
     list_df <- list(df_rs,df_rs,df_rs,df_rs,df_rs)
     var_zname <- c("mm01","mm_07","mod1","mod2","mod5")
     order_lag <- c(14,14,14,14,14)
     method_cor <- "I"
     nb_obj <- r.nb
     randomisation_par <- "FALSE"
     list_param_spat_correlog <- list(list_df,var_zname,order_lag,method_cor,nb_obj,randomisation_par)
     names(list_param_spat_correlog) <- c("list_df","var_zname","order_lag","method_cor","nb_obj","randomisation_par")
     #debug(sp_correlogram_fun)
     #list_sp_correlog  <-sp_correlogram_fun(2,list_param_spat_correlog)
     #r_qc_s <- lapply(1:length(infile_var),FUN=import_list_modis_layers_fun,list_param=list_param_import_modis)
     #r_qc_s <-mclapply(1:11,FUN=import_list_modis_layers_fun,list_param=list_param_import_modis,mc.preschedule=FALSE,mc.cores = 11) #This is the end bracket from mclapply(...) statement
     list_sp_correlog <-mclapply(1:length(list_df),FUN=sp_correlogram_fun,list_param=list_param_spat_correlog ,mc.preschedule=FALSE,mc.cores = 5) #This is the end bracket from mclapply(...) statement
     #does not work...
     print(list_sp_correlog[[1]])
     plot(list_sp_correlog[[1]])
     print(list_sp_correlog[[2]])
     plot(list_sp_correlog[[2]])
     ##### Use filter option to compute lag Moran's I
     #Queen's case for 5 lags...: should do this in a function to generate filters...
     #lag 1: 2*1+1 rows
     # Square filters with 1 on the outer ring and 0 everywhere else (including the
     # focal cell at the centre); the filter for lag k has 2*k+1 rows and columns.
     f1 <- matrix(c(1,1,1,
                    1,0,1,
                    1,1,1), nrow=3)
     #lag 2: 2*2+1 rows
     f2 <- matrix(c(1,1,1,1,1,             #filter for lag 2
                    1,0,0,0,1,
                    1,0,0,0,1,
                    1,0,0,0,1,
                    1,1,1,1,1),nrow=5)
     #lag 3: 2*3+1 rows
     f3 <- matrix(c(1,1,1,1,1,1,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,1,1,1,1,1,1),nrow=7)
     #lag 4: 2*4+1 rows
     f4 <- matrix(c(1,1,1,1,1,1,1,1,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,1,1,1,1,1,1,1,1),nrow=9)
     r<- subset(s_raster,"mm_07")
     Moran(r,f1)
     Moran(r,f2)
     Moran(r,f3)
     #generate automatically filters for MORAN's I in the image...
     # Generate the square filter (weight matrix) used to compute Moran's I at a
     # given lag: a (2*no_lag+1) x (2*no_lag+1) matrix with 1 on the outer ring and
     # 0 everywhere else, including the focal cell at the centre.
     #
     # no_lag : lag of the filter, a single number >= 1 (default 1)
     # f_type : type of neighbourhood; only "queen" is implemented
     # Returns a numeric matrix. Stops with an explicit message when f_type is not
     # supported or no_lag is invalid.
     autocor_filter_fun <-function(no_lag=1,f_type="queen"){
       if(!isTRUE(f_type=="queen")){
         #"rook" could be added later
         stop("unsupported f_type: '", paste(f_type,collapse=","),
              "' (only \"queen\" is implemented)", call.=FALSE)
       }
       if(!is.numeric(no_lag) || length(no_lag)!=1 || is.na(no_lag) || no_lag<1){
         stop("no_lag must be a single number >= 1", call.=FALSE)
       }
       no_rows <- 2*no_lag +1
       autocor_filter <- matrix(0,nrow=no_rows,ncol=no_rows)
       autocor_filter[c(1,no_rows),] <- 1   #first and last rows
       autocor_filter[,c(1,no_rows)] <- 1   #first and last columns
       return(autocor_filter)
     }
     #moran_multipe_fun<-function(i,list_param)
     #  lapply(list_filters,FUN=Moran,x=r)
     r<- subset(r_stack,"mod1")
     Moran(r,f1)
     Moran(r,f2)
     list_filters<-lapply(1:5,FUN=autocor_filter_fun,f_type="queen")
     Moran(r,list_filters[[1]])
     Moran(r,list_filters[[2]])
     plot(subset(s_raster,"mm_09"))
     r_stack <-stack(subset(s_raster,c("mm_09")),pred_temp_s)
     names(r_stack)[1]<-c("mm_09")
     r<- subset(r_stack,"mod1")
     Moran(r) #with lag 1 and default rooks lag correlation
     list_filters<-lapply(1:5,FUN=autocor_filter_fun,f_type="queen")
     #calculate Moran's I for 5 lags for one layer
     moran_list <- lapply(list_filters,FUN=Moran,x=r)
     # Compute Moran's I for one layer of a raster stack with every filter of a list.
     # Written to be called through lapply()/mclapply() over the layers.
     #
     # i          : layer selector passed to subset()
     # list_param : named list with the elements
     #   list_filters - list of filters, each passed to Moran() as the weight argument
     #   r_stack      - stack from which layer i is taken
     # Returns a one-column data.frame with one row per filter; the column is named
     # after the selected layer.
     moran_multiple_fun<-function(i,list_param){
       list_filters <-list_param$list_filters
       r <- subset(list_param$r_stack,i)
       #x=r is matched by name, so each filter becomes the next argument of Moran()
       moran_list <- lapply(list_filters,FUN=Moran,x=r)
       moran_v <-as.data.frame(unlist(moran_list))
       names(moran_v)<-names(r)
       return(moran_v)
     }
     list_filters<-lapply(1:10,FUN=autocor_filter_fun,f_type="queen")
     list_param_moran <- list(list_filters=list_filters,r_stack=r_stack)
     #moran_r <-moran_multiple_fun(1,list_param=list_param_moran)
     nlayers(r_stack)
     moran_I_df <-mclapply(1:nlayers(r_stack), list_param=list_param_moran, FUN=moran_multiple_fun,mc.preschedule=FALSE,mc.cores = 11) #This is the end bracket from mclapply(...) statement
     moran_df <- do.call(cbind,moran_I_df)
     moran_df$lag <-1:nrow(moran_df)
     #melt(moran_df,id=names(moran_df))
     #moran_df <- do.call(rbind,moran_I_df)
     mydata<-moran_df
     dd <- do.call(make.groups, mydata[,-ncol(mydata)])
     dd$lag <- mydata$lag
     #names(dd)[2]<-"models"
     names_layers <-c("LST",names_layers)
     xyplot(data ~ lag | which, dd,type="b",strip=strip.custom(factor.levels=names_layers))
     #solve problem wiht name

     ######################################## Paper Methods_comparison: Analyses part 5 #######################################
     ############################ Scripts for figures and analyses for paper 2 #####################################
     #This script performs analyses and creates figures for the FSS paper.
     #It uses inputs from interpolation objects created at earlier stages...
     #Note that this is exploratory code i.e. not part of the workflow.
     #AUTHOR: Benoit Parmentier                                                                       #
     #DATE: 09/13/2013                                                                                #
     #PROJECT: NCEAS INPLANT: Environment and Organisms --TASK#491--                                  #
     ###################################################################################################
     ###Loading R library and packages
     #library(gtools)                                        # loading some useful tools
     library(mgcv)                   # GAM package by Wood 2006 (version 2012)
     library(sp)                     # Spatial pacakge with class definition by Bivand et al. 2008
     library(spdep)                  # Spatial package with methods and spatial stat. by Bivand et al. 2012
     library(rgdal)                  # GDAL wrapper for R, spatial utilities (Keitt et al. 2012)
     library(gstat)                  # Kriging and co-kriging by Pebesma et al. 2004
     library(automap)                # Automated Kriging based on gstat module by Hiemstra et al. 2008
     library(spgwr)
     library(maptools)
     library(graphics)
     library(parallel)               # Urbanek S. and Ripley B., package for multi cores & parallel processing
     library(raster)
     library(rasterVis)
     library(plotrix)                # Draw circle on graph and additional plotting options
     library(reshape)                # Data format and type transformation
     ##################### Function used in the script ##############
     ## Extract a list of object from an object: Useful to extract information from
     ## RData objects saved in the interpolation phase.
     ### Analyses and exploration of results for single time scale methods
     ### Loading R library and packages
     #library used in the workflow production:
     library(gtools)                              # loading some useful tools
     library(mgcv)                                # GAM package by Simon Wood
     library(sp)                                  # Spatial pacakge with class definition by Bivand et al.
     library(spdep)                               # Spatial pacakge with methods and spatial stat. by Bivand et al.
     library(rgdal)                               # GDAL wrapper for R, spatial utilities
     library(gstat)                               # Kriging and co-kriging by Pebesma et al.
     library(fields)                              # NCAR Spatial Interpolation methods such as kriging, splines
     library(raster)                              # Hijmans et al. package for raster processing
     library(gdata)                               # various tools with xls reading, cbindX
     library(rasterVis)                           # Raster plotting functions
     library(parallel)                            # Parallelization of processes with multiple cores
     library(maptools)                            # Tools and functions for sp and other spatial objects e.g. spCbind
     library(maps)                                # Tools and data for spatial/geographic objects
     library(reshape)                             # Change shape of object, summarize results
     library(plotrix)                             # Additional plotting functions
     library(plyr)                                # Various tools including rbind.fill
     library(spgwr)                               # GWR method
     library(automap)                             # Kriging automatic fitting of variogram using gstat
     library(rgeos)                               # Geometric, topologic library of functions
     #RPostgreSQL                                 # Interface R and Postgres, not used in this script
     #Additional libraries not used in workflow
     library(pgirmess)                            # Krusall Wallis test with mulitple options, Kruskalmc {pgirmess}
     library(ncf)
     #### FUNCTION USED IN SCRIPT
     function_analyses_paper <-"contribution_of_covariates_paper_interpolation_functions_10152013.R"
     load_obj <- function(f)
+    {
-...
       env[[nm]]
+    }
     ### Need to improve this function!!!
     # Summarize accuracy metrics for one model: mean, standard deviation and number
     # of values of mae, rmse, r, me and m50 for each combination of the id variables.
     #
     # names_mod : value of the pred_mod column selecting the model to summarize
     # names_id  : character vector with the names of the id columns (one or more)
     # tb        : table with a pred_mod column, the id columns and the metric columns
     # Returns a list with
     #   tb     - the input table, unchanged (not restricted to names_mod)
     #   avg_tb - mean of each metric per combination of id variables
     #   sd_tb  - standard deviation of each metric per combination of id variables
     #   n_tb   - number of values of each metric per combination of id variables
     calc_stat_prop_tb_diagnostic <-function(names_mod,names_id,tb){
       tb_long<-melt(subset(tb,pred_mod==names_mod),
                     measure=c("mae","rmse","r","me","m50"),
                     id=names_id,
                     na.rm=TRUE)

       #`collapse` must be one string: join the id names with "+" whatever their number
       var_summary <-paste(names_id,collapse="+")
       #left-hand side of the casting formula followed by the melted "variable" column
       var_summary_formula <-paste(var_summary,"~variable")
       avg_tb<-cast(tb_long,var_summary_formula,mean)
       sd_tb<-cast(tb_long,var_summary_formula,sd)
       n_tb<-cast(tb_long,var_summary_formula,length)
       #n_NA<-cast(t,dst_cat1~variable,is.na)

       #### prepare returning object
       prop_obj<-list(tb,avg_tb,sd_tb,n_tb)
       names(prop_obj) <-c("tb","avg_tb","sd_tb","n_tb")

       return(prop_obj)
     }
     #Calculate the difference between training and testing in two different data.frames. Columns to substract are provided.
     # Difference between two tables (e.g. training minus testing), column by column.
     #
     # tb_s              : first table (minuend)
     # tb_v              : second table (subtrahend), with rows matching those of tb_s
     # list_metric_names : names of the columns to subtract
     # Returns a data.frame with one column per metric holding tb_s - tb_v; an empty
     # data.frame is returned when no metric name is given.
     diff_df<-function(tb_s,tb_v,list_metric_names){
       metric_names <- as.character(unlist(list_metric_names))
       #lapply() iterates zero times on an empty input, unlike a 1:length() loop
       tb_diff <- lapply(metric_names,function(metric_name){
         tb_s[,metric_name] - tb_v[,metric_name]
       })
       names(tb_diff)<-metric_names
       tb_diff<-as.data.frame(do.call(cbind,tb_diff))
       return(tb_diff)
     }
     ##############################
     #### Parameters and constants
     ################## PARAMETERS ##########
     #path to gam CAI and kriging analyes with hold-out
     in_dir1 <- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_CAI_lst_comb3_08312013/"
     in_dir2 <- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_CAI_lst_comb3_09012013"
     in_dir3 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_CAI_lst_comb3_09032013"
     in_dir4 <- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_CAI_lst_comb3_09042013"
     #path to gam fusion and kriging fusion analyes with hold-out
     in_dir5 <- "/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_fus_lst_comb3_09092013"
     in_dir6 <- "/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_fus_lst_comb3_09102013"
     in_dir7 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_fus_lst_comb3_09112013"
     in_dir8 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_kriging_fus_lst_comb3_09122013"
     in_dir9 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_kriging_fus_lst_comb3_09132013"
     in_dir10 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_kriging_fus_lst_comb3_09142013"
     in_dir11 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_CAI_lst_comb3_09162013"
     in_dir12 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_CAI_lst_comb3_09172013"
     in_dir13 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_cai_lst_comb3_09282013"
     in_dir14 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_fus_lst_comb3_09232013"
     in_dir15 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_fus_lst_comb3_09262013"
     in_dir16 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_cai_lst_comb3_10042013"
     #better as list and load one by one specific element from the object
     raster_prediction_obj1 <-load_obj(file.path(in_dir1,"raster_prediction_obj_gam_CAI_dailyTmax_365d_gam_CAI_lst_comb3_08312013.RData"))
     raster_prediction_obj2 <-load_obj(file.path(in_dir2,"raster_prediction_obj_gam_CAI_dailyTmax_365d_gam_CAI_lst_comb3_09012013.RData"))
     raster_prediction_obj3 <-load_obj(file.path(in_dir3,"raster_prediction_obj_gam_CAI_dailyTmax_365d_gam_CAI_lst_comb3_09032013.RData"))
     raster_prediction_obj4 <-load_obj(file.path(in_dir4,"raster_prediction_obj_kriging_CAI_dailyTmax_365d_kriging_CAI_lst_comb3_09042013.RData"))
     raster_prediction_obj5 <-load_obj(file.path(in_dir5,"raster_prediction_obj_gam_fusion_dailyTmax_365d_gam_fus_lst_comb3_09092013.RData"))
     raster_prediction_obj6 <-load_obj(file.path(in_dir6,"raster_prediction_obj_gam_fusion_dailyTmax_365d_gam_fus_lst_comb3_09102013.RData"))
     raster_prediction_obj7 <-load_obj(file.path(in_dir7,"raster_prediction_obj_gam_fusion_dailyTmax_365d_gam_fus_lst_comb3_09112013.RData"))
     raster_prediction_obj8 <-load_obj(file.path(in_dir8,"raster_prediction_obj_kriging_fusion_dailyTmax_365d_kriging_fus_lst_comb3_09122013.RData"))
     raster_prediction_obj9 <-load_obj(file.path(in_dir9,"raster_prediction_obj_kriging_fusion_dailyTmax_365d_kriging_fus_lst_comb3_09132013.RData"))
     raster_prediction_obj10 <-load_obj(file.path(in_dir10,"raster_prediction_obj_kriging_fusion_dailyTmax_365d_kriging_fus_lst_comb3_09142013.RData"))
     raster_prediction_obj11 <-load_obj(file.path(in_dir11,"raster_prediction_obj_gwr_CAI_dailyTmax_365d_gwr_CAI_lst_comb3_09162013.RData"))
     raster_prediction_obj12 <-load_obj(file.path(in_dir12,"raster_prediction_obj_gwr_CAI_dailyTmax_365d_gwr_CAI_lst_comb3_09172013.RData"))
     raster_prediction_obj13 <-load_obj(file.path(in_dir13,"raster_prediction_obj_gwr_CAI_dailyTmax_365d_gwr_cai_lst_comb3_09282013.RData"))
     raster_prediction_obj14 <-load_obj(file.path(in_dir14,"raster_prediction_obj_gwr_fusion_dailyTmax_365d_gwr_fus_lst_comb3_09232013.RData"))
     raster_prediction_obj15 <-load_obj(file.path(in_dir15,"raster_prediction_obj_gwr_fusion_dailyTmax_365d_gwr_fus_lst_comb3_09262013.RData"))
     raster_prediction_obj16 <-load_obj(file.path(in_dir16,"raster_prediction_obj_gam_CAI_dailyTmax_365d_gam_cai_lst_comb3_10042013.RData"))
     out_dir<-"/home/parmentier/Data/IPLANT_project/paper_multitime_scale__analyses_tables_fig_09032013"
     script_path<-"/home/parmentier/Data/IPLANT_project/env_layers_scripts/" #path to script
     source(file.path(script_path,function_analyses_paper)) #source all functions used in this script.
     in_dir1 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb3_08132013"
     in_dir2 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb4_08152013"
     #kriging results:
     in_dir3 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_day_lst_comb3_07112013"
     #gwr results:
     in_dir4 <-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gwr_day_lst_comb3_part1_07122013"
     #multisampling results (gam)
     #in_dir5<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_daily_mults10_lst_comb3_08082013"
     #in_dir6<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_daily_mults10_lst_comb3_08062013"
     #in_dir7<- "/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gwr_daily_mults10_lst_comb3_08072013"
     #Hold-out every two days over 365 days
     in_dir5 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gam_daily_mults1_lst_comb3_10122013"
     in_dir6 <- "/data/project/layers/commons/Oregon_interpolation/output_data_365d_kriging_daily_mults1_lst_comb3_10112013"
     in_dir7 <-"/data/project/layers/commons/Oregon_interpolation/output_data_365d_gwr_daily_mults1_lst_comb3_10132013"
     out_dir<-"/home/parmentier/Data/IPLANT_project/paper_analyses_tables_fig_08032013"
     setwd(out_dir)
     infile_reg_outline <- "/data/project/layers/commons/data_workflow/inputs/region_outlines_ref_files/OR83M_state_outline.shp"  #input region outline defined by polygon: Oregon
     met_stations_outfiles_obj_file<-"/data/project/layers/commons/data_workflow/output_data_365d_gam_fus_lst_test_run_07172013/met_stations_outfiles_obj_gam_fusion__365d_gam_fus_lst_test_run_07172013.RData"
     CRS_locs_WGS84<-CRS("+proj=longlat +ellps=WGS84 +datum=WGS84 +towgs84=0,0,0") #Station coords WGS84
     y_var_name <- "dailyTmax"
     out_prefix<-"analyses_10152013"
     #method_interpolation <- "gam_daily"
     covar_obj_file_1 <- "covar_obj__365d_gam_day_lst_comb3_08132013.RData"
     met_obj_file_1 <- "met_stations_outfiles_obj_gam_daily__365d_gam_day_lst_comb3_08132013.RData"
     #met_stations_outfiles_obj_gam_daily__365d_gam_day_lst_comb3_08132013.RData
     #raster_prediction objects for baseline 1 (s(lat,lon) + s(elev)) and baseline 2 (s(lat,lon))
     raster_obj_file_1 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_day_lst_comb3_08132013.RData"
     raster_obj_file_2 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_day_lst_comb4_08152013.RData"
     raster_obj_file_3 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_day_lst_comb3_07112013.RData"
     raster_obj_file_4 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_day_lst_comb3_part1_07122013.RData"
     #multisampling using baseline lat,lon + elev
     #raster_obj_file_5 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_daily_mults10_lst_comb3_08082013.RData"
     #raster_obj_file_6 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_daily_mults10_lst_comb3_08062013.RData"
     #raster_obj_file_7 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_daily_mults10_lst_comb3_08072013.RData"
     raster_obj_file_5 <- "raster_prediction_obj_gam_daily_dailyTmax_365d_gam_daily_mults1_lst_comb3_10122013.RData"
     raster_obj_file_6 <- "raster_prediction_obj_kriging_daily_dailyTmax_365d_kriging_daily_mults1_lst_comb3_10112013.RData"
     raster_obj_file_7 <- "raster_prediction_obj_gwr_daily_dailyTmax_365d_gwr_daily_mults1_lst_comb3_10132013.RData"
     #Load objects containing training, testing, models objects
     met_stations_obj <- load_obj(met_stations_outfiles_obj_file)
     covar_obj <-load_obj(file.path(in_dir1,covar_obj_file_1)) #Reading covariates object for GAM daily method
     infile_covariates <- covar_obj$infile_covariates
     infile_reg_outline <- covar_obj$infile_reg_outline
     covar_names<- covar_obj$covar_names
     #####
     s_raster <- brick(infile_covariates)
     names(s_raster)<-covar_names
     raster_prediction_obj_1 <-load_obj(file.path(in_dir1,raster_obj_file_1)) #comb3 (baseline 2)
     raster_prediction_obj_2 <-load_obj(file.path(in_dir2,raster_obj_file_2)) #comb4 (baseline 1)
     raster_prediction_obj_3 <-load_obj(file.path(in_dir3,raster_obj_file_3)) #comb3/mod1 baseline 2, kriging
     raster_prediction_obj_4 <-load_obj(file.path(in_dir4,raster_obj_file_4)) #comb3/mod1 baseline 2, gwr
     raster_prediction_obj_5 <-load_obj(file.path(in_dir5,raster_obj_file_5)) #gam daily multisampling 10 to 70%
     raster_prediction_obj_6 <-load_obj(file.path(in_dir6,raster_obj_file_6)) #kriging daily multisampling 10 to 70%
     raster_prediction_obj_7 <-load_obj(file.path(in_dir7,raster_obj_file_7)) #gwr daily multisampling 10 to 70%
     ############### BEGIN SCRIPT #################
     ############ PART 1: Exploration of surfaces bias, delta and climatology surfaces ###########
     #"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_gam_day_lst_comb4_07152013/"
     in_dir<-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_kriging_cai_lst_comb3_07312013"
     out_dir<-""
     setwd(in_dir)
     y_var_name <- "dailyTmax"
     y_var_month <- "TMax"
     #y_var_month <- "LSTD_bias"
     out_suffix <- "_OR_10102013"
     #script_path<-"/data/project/layers/commons/data_workflow/env_layers_scripts/"
     #### FUNCTION USED IN SCRIPT
     function_analyses_paper <-"contribution_of_covariates_paper_interpolation_functions_09232013.R"
     out_prefix<-"/home/parmentier/Data/IPLANT_project/Oregon_interpolation/Oregon_03142013/output_data_365d_GAM_fus_all_lst_05312013"
     method_interpolation <- "kriging_CAI"
     covar_obj_file <- "covar_obj__365d_kriging_cai_lst_comb3_07312013.RData"
     raster_obj_file <- "raster_prediction_obj_kriging_CAI_dailyTmax_365d_kriging_cai_lst_comb3_07312013.RData"
     script_path<-"/data/project/layers/commons/data_workflow/env_layers_scripts/"
     script_path<-"/home/parmentier/Data/IPLANT_project/env_layers_scripts/" #path to script
     source(file.path(script_path,function_analyses_paper)) #source all functions used in this script.
     source(file.path(script_path,"interpolation_method_day_function_multisampling_07052013.R")) #Include GAM_day
     #################################################################################
     ############ ANALYSES 1: Average accuracy per proportion for monthly hold-out in multi-timescale methods... #######
     #Load objects containing training, testing, models objects
     covar_obj <-load_obj(covar_obj_file)
     infile_covariates <- covar_obj$infile_covariates
     infile_reg_outline <- covar_obj$infile_reg_outline
     covar_names<- covar_obj$covar_names
     tb_mv_gam_CAI <-rbind(raster_prediction_obj1$tb_month_diagnostic_v,raster_prediction_obj2$tb_month_diagnostic_v,raster_prediction_obj3$tb_month_diagnostic_v)
     tb_ms_gam_CAI <-rbind(raster_prediction_obj1$tb_month_diagnostic_s,raster_prediction_obj2$tb_month_diagnostic_s,raster_prediction_obj3$tb_month_diagnostic_s)
     raster_prediction_obj <-load_obj(raster_obj_file)
     tb_v_gam_CAI <-rbind(raster_prediction_obj1$tb_diagnostic_v,raster_prediction_obj2$tb_diagnostic_v,raster_prediction_obj3$tb_diagnostic_v)
     tb_s_gam_CAI <-rbind(raster_prediction_obj1$tb_diagnostic_s,raster_prediction_obj2$tb_diagnostic_s,raster_prediction_obj3$tb_diagnostic_s)
     #prop_obj_gam_CAI_v <- calc_stat_prop_tb_diagnostic(names_mod,names_id,tb_v)
     names(raster_prediction_obj) #list of two objects
     tb_mv_gwr_CAI <-rbind(raster_prediction_obj11$tb_month_diagnostic_v,raster_prediction_obj12$tb_month_diagnostic_v,raster_prediction_obj13$tb_month_diagnostic_v)
     tb_ms_gwr_CAI <-rbind(raster_prediction_obj11$tb_month_diagnostic_s,raster_prediction_obj12$tb_month_diagnostic_s,raster_prediction_obj13$tb_month_diagnostic_s)
     raster_prediction_obj$summary_metrics_v
     tb_v_gwr_CAI <-rbind(raster_prediction_obj11$tb_diagnostic_v,raster_prediction_obj12$tb_diagnostic_v,raster_prediction_obj13$tb_diagnostic_v)
     tb_s_gwr_CAI <-rbind(raster_prediction_obj11$tb_diagnostic_s,raster_prediction_obj12$tb_diagnostic_s,raster_prediction_obj13$tb_diagnostic_s)
     j<-1 #selected month for climatology
     i<-1
     data_s <- raster_prediction_obj$method_mod_obj[[i]]$data_s #training data
     data_v <- raster_prediction_obj$method_mod_obj[[i]]$data_v #testing data
     tb_mv_kriging_CAI <- raster_prediction_obj4$tb_month_diagnostic_v
     tb_ms_kriging_CAI <- raster_prediction_obj4$tb_month_diagnostic_s
     method_mod_obj <- raster_prediction_obj$method_mod_obj #this object contains daily information, training, testing and images
     tb_v_kriging_CAI <- raster_prediction_obj4$tb_diagnostic_v
     tb_s_kriging_CAI <- raster_prediction_obj4$tb_diagnostic_s
     clim_method_mod_obj <- raster_prediction_obj$clim_method_mod_obj
     data_month1 <- clim_method_mod_obj[[1]]$data_month #monthly data
     data_month <- clim_method_mod_obj[[j]]$data_month #monthly data
     clim_mod_obj_month <- clim_method_mod_obj[[j]]
     names(clim_mod_obj_month)
     ### SAME for gam fusion
     #####
     s_raster <- brick(infile_covariates)
     names(s_raster)<-covar_names
     #data_s$y_var <- data_s[[y_var_name]]
     #formula<-"y_var ~ s(lat,lon,elev_s)"
     #date<-strptime(sampling_dat$date[i], "%Y%m%d")   # interpolation date being processed
     # Select the monthly LST layer that matches the month being explored and
     # expose it in the covariate stack under the generic layer name "LST".
     # The month is fixed to January here. The former
     # `month<-strftime(date, "%m")` call was removed: the assignment of `date`
     # just above is commented out, and the result was overwritten on the next
     # line anyway.
     month <- "01"
     LST_month <- paste("mm_", month, sep="")   # name of LST month to be matched
     pos <- match("LST", names(s_raster))       # position of an existing "LST" layer, NA if absent
     s_raster <- dropLayer(s_raster, pos)       # if it exists drop layer
     LST <- subset(s_raster, LST_month)
     names(LST) <- "LST"
     s_raster <- addLayer(s_raster, LST)        # adding current month
     tb_mv_gam_fus <-rbind(raster_prediction_obj5$tb_month_diagnostic_v,raster_prediction_obj6$tb_month_diagnostic_v,raster_prediction_obj7$tb_month_diagnostic_v)
     tb_ms_gam_fus <-rbind(raster_prediction_obj5$tb_month_diagnostic_s,raster_prediction_obj6$tb_month_diagnostic_s,raster_prediction_obj7$tb_month_diagnostic_s)
     tb_v_gam_fus <-rbind(raster_prediction_obj5$tb_diagnostic_v,raster_prediction_obj6$tb_diagnostic_v,raster_prediction_obj7$tb_diagnostic_v)
     tb_s_gam_fus <-rbind(raster_prediction_obj5$tb_diagnostic_s,raster_prediction_obj6$tb_diagnostic_s,raster_prediction_obj7$tb_diagnostic_s)
     ### MONTH MODELS
     index<-1
     data_month$y_var<-data_month[[y_var_month]]
     mod1 <- clim_method_mod_obj[[1]]$mod[[1]]
     tb_mv_gwr_fus <-rbind(raster_prediction_obj14$tb_month_diagnostic_v,raster_prediction_obj15$tb_month_diagnostic_v)
     tb_ms_gwr_fus <-rbind(raster_prediction_obj14$tb_month_diagnostic_s,raster_prediction_obj15$tb_month_diagnostic_s)
     tb_v_gwr_fus <-rbind(raster_prediction_obj14$tb_diagnostic_v,raster_prediction_obj15$tb_diagnostic_v)
     tb_s_gwr_fus <-rbind(raster_prediction_obj14$tb_diagnostic_s,raster_prediction_obj15$tb_diagnostic_s)
     clim_method_mod_obj[[1]]$clim #list of files containing model predictions...
     clim_rast<-stack(clim_method_mod_obj[[index]]$clim)
     delta_rast<-raster(method_mod_obj[[index]]$delta) #only one delta image!!!
     pred_temp<-as.character(method_mod_obj[[index]][[y_var_name]]) #list of files with path included
     rast_pred_temp_s <-stack(pred_temp) #stack of temperature predictions from models (daily)
     tb_mv_kriging_fus <-rbind(raster_prediction_obj8$tb_month_diagnostic_v,raster_prediction_obj9$tb_month_diagnostic_v,raster_prediction_obj10$tb_month_diagnostic_v)
     tb_ms_kriging_fus <-rbind(raster_prediction_obj8$tb_month_diagnostic_s,raster_prediction_obj9$tb_month_diagnostic_s,raster_prediction_obj10$tb_month_diagnostic_s)
     names(delta_rast)<-"delta"
     rast_temp_date<-stack(clim_rast,delta_rast)
     #rast_temp_date<-mask(rast_temp_date,LC_mask,file=file.path(out_path,"test.tif"),overwrite=TRUE)
     #bias_d_rast<-raster("fusion_bias_LST_20100103_30_1_10d_GAM_fus5_all_lstd_02082013.rst")
     tb_v_kriging_fus <-rbind(raster_prediction_obj8$tb_diagnostic_v,raster_prediction_obj9$tb_diagnostic_v,raster_prediction_obj10$tb_diagnostic_v)
     tb_s_kriging_fus <-rbind(raster_prediction_obj8$tb_diagnostic_s,raster_prediction_obj9$tb_diagnostic_s,raster_prediction_obj10$tb_diagnostic_s)
     plot(rast_temp_date)
     list_tb <- list(tb_v_gam_CAI,tb_v_kriging_CAI,tb_v_gwr_CAI,tb_s_gam_CAI,tb_s_kriging_CAI,tb_s_gwr_CAI,
                tb_mv_gam_CAI,tb_mv_kriging_CAI,tb_mv_gwr_CAI,tb_ms_gam_CAI,tb_ms_kriging_CAI,tb_ms_gwr_CAI,
                tb_v_gam_fus,tb_v_kriging_fus,tb_v_gwr_fus,tb_s_gam_fus,tb_s_kriging_fus,tb_s_gwr_fus,
                tb_mv_gam_fus,tb_mv_kriging_fus,tb_mv_gwr_fus,tb_ms_gam_fus,tb_ms_kriging_fus,tb_ms_gwr_fus)
     month_m_rast<-subset(clim_rast,"mod1")
     day_m_rast<-subset(rast_pred_temp_s,1)
     names(list_tb) <- c("tb_v_gam_CAI","tb_v_kriging_CAI","tb_v_gwr_CAI","tb_s_gam_CAI","tb_s_kriging_CAI","tb_s_gwr_CAI",
             "tb_mv_gam_CAI","tb_mv_kriging_CAI","tb_mv_gwr_CAI","tb_ms_gam_CAI","tb_ms_kriging_CAI","tb_ms_gwr_CAI",
             "tb_v_gam_fus","tb_v_kriging_fus","tb_v_gwr_fus","tb_s_gam_fus","tb_s_kriging_fus","tb_s_gwr_fus",
             "tb_mv_gam_fus","tb_mv_kriging_fus","tb_mv_gwr_fus","tb_ms_gam_fus","tb_ms_kriging_fus","tb_ms_gwr_fus")
     test<- month_m_rast + delta_rast
     diff <- test - day_m_rast  #this is equal to zeor roughly...
     #list_tb <-list(tb_v_gam_CAI,tb_v_kriging_CAI,tb_v_gwr_CAI,tb_s_gam_CAI,tb_s_kriging_CAI,tb_s_gwr_CAI,tb_mv_gam_CAI,tb_mv_kriging_CAI,tb_ms_gam_CAI,tb_ms_kriging_CAI,tb_ms_gwr_CAI,tb_ms_gwr_CAI #Add fusion here
     #               tb_v_gam_fus,tb_v_kriging_fus,tb_s_gam_fus,tb_s_kriging_fus,tb_mv_gam_fus,tb_mv_kriging_fus,tb_ms_gam_fus,tb_ms_kriging_fus) #Add fusion here
     #names(list_tb) <- c("tb_v_gam_CAI","tb_v_kriging_CAI","tb_v_gwr_CAI","tb_s_gam_CAI","tb_s_kriging_CAI","tb_s_gwr_CAI","tb_mv_gam_CAI","tb_mv_kriging_CAI","tb_ms_gam_CAI","tb_ms_kriging_CAI","tb_ms_gwr_CAI","tb_ms_gwr_CAI" #Add fusion here
     #                   "tb_v_gam_fus","tb_v_kriging_fus","tb_s_gam_fus","tb_s_kriging_fus","tb_mv_gam_fus","tb_mv_kriging_fus","tb_ms_gam_fus","tb_ms_kriging_fus") #Add fusion here
     s_sgdf<-as(day_m_rast,"SpatialGridDataFrame") #Conversion to spatial grid data frame, only convert the necessary layers!!
     #s_spdf<-as(day_m_rast,"SpatialPointsDataFrame") #Conversion to spatial grid data frame, only convert the necessary layers!!
     ##### DAILY AVERAGE ACCURACY : PLOT AND DIFFERENCES...Cd
     names(s_sgdf)<-"var1.pred"
     # For every diagnostic table in list_tb, average the accuracy metrics per
     # model and hold-out proportion, then write one PNG of rmse against the
     # hold-out proportion (one line per model).
     for(i in seq_along(list_tb)){
       tb <- list_tb[[i]]
       plot_name <- names(list_tb)[i]

       # Tables whose name starts with "tb_m" use the column "prop";
       # all other tables use "prop_month".
       pat_str <- "tb_m"
       if(substr(plot_name,start=1,stop=4)== pat_str){
         names_id <- c("pred_mod","prop")
         plot_formula <- paste("rmse","~prop",sep="",collapse="")
       }else{
         names_id <- c("pred_mod","prop_month")
         plot_formula <- paste("rmse","~prop_month",collapse="")
       }

       names_mod <- unique(tb$pred_mod)
       prop_obj <- calc_stat_prop_tb_diagnostic(names_mod,names_id,tb)
       avg_tb <- prop_obj$avg_tb

       layout_m <- c(1,1) #single panel: one row, one column
       par(mfrow=layout_m)

       png(paste("Figure__accuracy_rmse_prop_month_",plot_name,out_suffix,".png", sep=""),
           height=480*layout_m[1],width=480*layout_m[2])
       p <- xyplot(as.formula(plot_formula),group=pred_mod,type="b",
               data=avg_tb,
               main=paste("rmse ",plot_name,sep=" "),
               pch=1:length(avg_tb$pred_mod),
               par.settings=list(superpose.symbol = list(
               pch=1:length(avg_tb$pred_mod))),
               auto.key=list(columns=5))
       print(p)   # lattice objects must be printed explicitly inside a loop
       dev.off()  # close the png device so the file is flushed before the next figure
     }
     mod1$krige_output<-s_sgdf
     plot(mod1) #does not work because we set krige_output to null!!!
     # Build the model formula and keep only the monthly records usable for it.
     formula_mod <- formula("y_var~lat*lon + elev_s")
     col_names <- all.vars(formula_mod) #extract variable names from formula object
     if (length(col_names)==1){
       # Only one variable in the formula: use the monthly data unchanged.
       data_fit <- data_month
     }else{
       # remove_na_spdf is defined in the sourced function file; presumably it
       # drops records with NA in any of col_names -- TODO confirm.
       data_fit <- remove_na_spdf(col_names,data_month)
     }
     ref_rast<-as(subset(s_raster,1),"SpatialGridDataFrame")
     s_spdf<-select_var_stack(s_raster,formula_mod,spdf=TRUE) #This only works if s_raster is in memory!!! need to be modified
     proj4string(data_fit)<-proj4string(s_spdf)
     test_mod <- autoKrige(formula_mod, input_data=data_fit,new_data=s_spdf,data_variogram=data_fit)
     plot(test_mod)
     prediction_spdf = test_mod$krige_output
     sample_variogram = test_mod$exp_var
     variogram_model = test_mod$var_model
     #### CHECKING THE INPUTS FROM COVARIATES
     LC1 <- subset(s_raster,"LC1")
     plot(LC1,colNA=c("red"))
     LC2 <- subset(s_raster,"LC2")
     plot(LC2,colNA=c("red"))
     LC_names<- paste("LC",1:10,sep="")
     lc_reg_s <-subset(s_raster,LC_names)
     plot(lc_reg_s,colNA="red")
     plot(subset(s_raster,"CANHGHT"),colNA="red")
     #Now create mask based on water areas
     LC12<-raster(lc_reg_s,layer=nlayers(lc_reg_s)) #this is open water
     LC_mask<-LC12
     LC_mask[LC_mask==100]<-NA
     LC_mask <- LC_mask > 100
     CANHGHT <- subset(s_raster,"CANHGHT")
     lc_path<-"/data/project/layers/commons/data_workflow/inputs/lc-consensus-global"
     infile_modis_grid<-"/data/project/layers/commons/data_workflow/inputs/modis_grid/modis_sinusoidal_grid_world.shp" #modis grid tiling system, global
     infile_elev<-"/data/project/layers/commons/data_workflow/inputs/dem-cgiar-srtm-1km-tif/srtm_1km.tif"  #elevation at 1km, global extent to be replaced by the new fused product
     infile_canheight<-"/data/project/layers/commons/data_workflow/inputs/treeheight-simard2011/Simard_Pinto_3DGlobalVeg_JGR.tif"         #Canopy height, global extent
     infile_distoc <- "/data/project/layers/commons/data_workflow/inputs/distance_to_coast/GMT_intermediate_coast_distance_01d_rev.tif" #distance to coast, global extent at 0.01 deg
     CANH<-raster(infile_canheight)
     LC1_W<-raster(list.files(path=lc_path,full.names=T)[4])
     #Correlation matrix for a subset
     r<-subset(s_raster,5:8)
     t44<-layerStats(r,"pearson",na.rm=T)
     image(t44[[1]])
     ###########################################################################################
     ############ PART 2: Granularity-Autocorrelation analyses of predicted surfaces ###########
     #####
     lf2 <- raster_prediction_obj_2$method_mod_obj[[index]][[y_var_name]]
     lf2 #contains the models for gam
     pred_temp_s <-stack(lf2)
     date_selected <- "20109101"
     #names_layers <-c("mod1=s(lat,long)+s(elev)","mod4=s(lat,long)+s(LST)","diff=mod1-mod4")
     names_layers <-c("mod1 = s(lat,long)","mod2 = s(lat,long)+s(elev)","mod3 = s(lat,long)+s(N_w)","mod4 = s(lat,long)+s(E_w)",
                      "mod5 = s(lat,long)+s(LST)","mod6 = s(lat,long)+s(DISTOC)","mod7 = s(lat,long)+s(LC1)",
                      "mod8 = s(lat,long)+s(LC1,LST)","mod9 = s(lat,long)+s(CANHGHT)","mod10 = s(lat,long)+s(LST,CANHGHT)")
     #names_layers<-names(pred_temp_s)
     #names(pred_temp_s)<-names_layers
     # Map all predicted surfaces of the stack with one shared colour scale.
     # The scale spans the overall min/max across layers.
     s.range <- c(min(minValue(pred_temp_s)), max(maxValue(pred_temp_s)))
     #s.range <- s.range+c(5,-5)
     col.breaks <- pretty(s.range, n=200)
     lab.breaks <- pretty(s.range, n=100)
     temp.colors <- colorRampPalette(c('blue', 'white', 'red'))
     max_val <- s.range[2]
     min_val <- s.range[1]
     #max_val<- -10
     #min_val <- 0
     layout_m <- c(4,3) #lattice layout is c(columns, rows): 4 columns by 3 rows
     # Breaks must run from min to max: seq(max_val, min_val, by=0.01) has the
     # wrong sign for 'by' whenever max_val > min_val, so it cannot build the breaks.
     p <- levelplot(pred_temp_s,main="Interpolated Surfaces Model Comparison baseline 1", ylab=NULL,xlab=NULL,
               par.settings = list(axis.text = list(font = 2, cex = 1.3),layout=layout_m,
                                   par.main.text=list(font=2,cex=2),strip.background=list(col="white")),par.strip.text=list(font=2,cex=1.5),
               names.attr=names_layers,col.regions=temp.colors,at=seq(min_val,max_val,by=0.01))
     #col.regions=temp.colors(25))
     print(p)
     #####################################
     ### Create spatial correlogram ####
     r_mod5 <- subset(pred_temp_s,"mod5") #wiht LST
     r_mod1 <- subset(pred_temp_s,"mod1") #wiht lat,long
     r_mod2 <- subset(pred_temp_s,"mod2") #wiht elev
     df_mod5 <- as(r_mod5,"SpatialPointsDataFrame")
     df_mod1 <- as(r_mod1,"SpatialPointsDataFrame")
     df_mod2 <- as(r_mod2,"SpatialPointsDataFrame")
     r_stack <-stack(subset(s_raster,"mm_01"),pred_temp_s)
     df_rs <- as(r_stack,"SpatialPointsDataFrame")
     correg_t<-correlog(coordinates(df_mod5),df_mod5$mod5)
     correg_t<-correlog(coordinates(df_mod5)[,1],coordinates(df_mod5)[,2],df_mod5$mod5)
     data_s<-(as.data.frame((list_data_s[[1]])))
     data_v<-(list_data_v[[1]])
     data_s <-na.omit(data_s[,c("x","y","LST",y_var_name,"elev")])
     correg_t1 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s$LST)
     correg_t2 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s$elev)
     correg_t3 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s[[y_var_name]])
     correg_t4 <- correlog(as.matrix(cbind(data_s$x,data_s$y)),z=data_s[,c("LST",y_var_name,"elev")])
     plot(correg_t1)
     plot(correg_t2,add=T)
     correg_t1[,1]
     correg_t2[,1]
     # Gather the three station correlograms in one table and plot them together.
     # correg_t1 was computed on LST, correg_t2 on elev and correg_t3 on the
     # response (y_var_name). Each column is named after the variable it
     # actually holds; the previous names labelled the elev coefficients as the
     # response and the response coefficients as elev.
     # Column 1 is used as the distance axis and column 2 as the coefficient.
     df_x <- data.frame(dist=correg_t1[,1],
                        LST=correg_t1[,2],
                        elev=correg_t2[,2])
     df_x[[y_var_name]] <- correg_t3[,2]
     # NOTE(review): the formula hard-codes "dailyTmax", so it only matches the
     # table when y_var_name is "dailyTmax".
     xyplot(LST+dailyTmax+elev~dist,df_x,type="b",
            auto.key=list(title="Var", space = "right", cex=1.0),
            par.settings = list(superpose.symbol=list(pch = 0:3, cex=1)))
     ### For the whole image:
     sp_correlogram_fun <- function(i,list_param){
       # Compute the spatial correlogram of one variable; written to be called
       # through lapply/mclapply over the index i.
       #
       # Arguments:
       #   i          : index of the variable to process
       #   list_param : list with elements
       #       list_df           - list of data objects, one per index
       #       var_zname         - vector of variable names, one per index
       #       order_lag         - vector of maximum lag orders, one per index
       #       method_cor        - correlogram method passed to sp.correlogram
       #       nb_obj            - neighbourhood object shared by all indices
       #       randomisation_par - logical flag passed as 'randomisation'
       # Returns:
       #   the object returned by sp.correlogram
       #
       # The function no longer calls dev.off(): it draws nothing, and closing
       # the caller's graphics device (or failing when no device is open) is
       # not part of computing a correlogram.
       df <- list_param$list_df[[i]]
       var_zname <- list_param$var_zname[i]
       order_lag <- list_param$order_lag[i]
       method_cor <- list_param$method_cor
       nb_obj <- list_param$nb_obj
       randomisation_par <- list_param$randomisation_par
       # Accept the flag given as text ("FALSE"/"TRUE") and hand over a logical.
       if (is.character(randomisation_par)) {
         randomisation_par <- as.logical(randomisation_par)
       }

       sp.cor <- sp.correlogram(nb_obj, df[[var_zname]], order=order_lag,
                                method=method_cor, randomisation=randomisation_par)
       return(sp.cor)
     }
     #xyplot( rmse ~ prop_month | pred_mod,type="b",data=as.data.frame(avg_tb))
     ##### Calculate differences between training and testing accuracy
     # diff_df is defined in the sourced function file; it is called with a
     # training table, a testing table and the metric names to compare.
     # Each figure gets its own file name. Previously all four boxplots used
     # the same name built from a leftover `plot_name`, so each one overwrote
     # the previous one.
     metric_names <- c("mae","rmse","me","r")
     diff_kriging_CAI <- diff_df(tb_s_kriging_CAI,tb_v_kriging_CAI,metric_names)
     # Row subsetting needs the trailing comma: without it the logical vector
     # indexes columns instead of rows.
     diff_gam_CAI <- diff_df(tb_s_gam_CAI[tb_s_gam_CAI$pred_mod!="mod_kr",],tb_v_gam_CAI,metric_names)
     diff_gwr_CAI <- diff_df(tb_s_gwr_CAI,tb_v_gwr_CAI,metric_names)
     layout_m <- c(1,1) #single panel: one row, one column
     par(mfrow=layout_m)
     png(paste("Figure__diff_training_testing_rmse_daily_CAI",out_suffix,".png", sep=""),
         height=480*layout_m[1],width=480*layout_m[2])
     boxplot(diff_kriging_CAI$rmse,diff_gam_CAI$rmse,diff_gwr_CAI$rmse,names=c("kriging_CAI","gam_CAI","gwr_CAI"),
             main="Difference between training and testing daily rmse")
     dev.off()
     #remove prop 0 (drawn on the current device, not saved to file)
     diff_kriging_CAI <- diff_df(tb_s_kriging_CAI[tb_s_kriging_CAI$prop_month!=0,],tb_v_kriging_CAI[tb_v_kriging_CAI$prop_month!=0,],metric_names)
     diff_gam_CAI <- diff_df(tb_s_gam_CAI[tb_s_gam_CAI$prop_month!=0,],tb_v_gam_CAI[tb_v_gam_CAI$prop_month!=0,],metric_names)
     diff_gwr_CAI <- diff_df(tb_s_gwr_CAI[tb_s_gwr_CAI$prop_month!=0,],tb_v_gwr_CAI[tb_v_gwr_CAI$prop_month!=0,],metric_names)
     boxplot(diff_kriging_CAI$rmse,diff_gam_CAI$rmse,diff_gwr_CAI$rmse,names=c("kriging_CAI","gam_CAI","gwr_CAI"),
             main="Difference between training and testing daily rmse")
     #now monthly accuracy
     metric_names <- c("mae","rmse","me","r")
     diff_kriging_m_CAI <- diff_df(tb_ms_kriging_CAI[tb_ms_kriging_CAI$prop!=0,],tb_mv_kriging_CAI,metric_names)
     diff_gam_m_CAI <- diff_df(tb_ms_gam_CAI[tb_ms_gam_CAI$prop!=0,],tb_mv_gam_CAI,metric_names)
     diff_gwr_m_CAI <- diff_df(tb_ms_gwr_CAI[tb_ms_gwr_CAI$prop!=0,],tb_mv_gwr_CAI,metric_names)
     layout_m <- c(1,1) #single panel: one row, one column
     par(mfrow=layout_m)
     png(paste("Figure__diff_training_testing_rmse_monthly_CAI",out_suffix,".png", sep=""),
         height=480*layout_m[1],width=480*layout_m[2])
     boxplot(diff_kriging_m_CAI$rmse,diff_gam_m_CAI$rmse,diff_gwr_m_CAI$rmse,names=c("kriging_CAI","gam_CAI","gwr_CAI"),
             main="Difference between training and monhtly testing rmse")
     dev.off()
     #boxplot(diff_kriging_m_CAI$rmse,diff_gam_m_CAI$rmse,diff_gwr_CAI,names=c("kriging_CAI","gam_CAI","gwr_CAI"),
     #        main="Difference between training and monhtly testing rmse")
     ### For fusion
     metric_names <- c("mae","rmse","me","r")
     diff_kriging_fus <- diff_df(tb_s_kriging_fus,tb_v_kriging_fus,metric_names)
     diff_gam_fus <- diff_df(tb_s_gam_fus,tb_v_gam_fus,metric_names)
     diff_gwr_fus <- diff_df(tb_s_gwr_fus,tb_v_gwr_fus,metric_names)
     layout_m <- c(1,1) #single panel: one row, one column
     par(mfrow=layout_m)
     png(paste("Figure__diff_training_testing_rmse_daily_fus",out_suffix,".png", sep=""),
         height=480*layout_m[1],width=480*layout_m[2])
     boxplot(diff_kriging_fus$rmse,diff_gam_fus$rmse,diff_gwr_fus$rmse,names=c("kriging_fus","gam_fus","gwr_fus"),
             main="Difference between training and testing daily rmse")
     dev.off()
     metric_names <- c("mae","rmse","me","r")
     diff_kriging_m_fus <- diff_df(tb_ms_kriging_fus[tb_ms_kriging_fus$prop!=0,],tb_mv_kriging_fus[tb_mv_kriging_fus$prop!=0,],metric_names)
     diff_gam_m_fus <- diff_df(tb_ms_gam_fus[tb_ms_gam_fus$prop!=0,],tb_mv_gam_fus[tb_mv_gam_fus$prop!=0,],metric_names)
     diff_gwr_m_fus <- diff_df(tb_ms_gwr_fus[tb_ms_gwr_fus$prop!=0,],tb_mv_gwr_fus[tb_mv_gwr_fus$prop!=0,],metric_names)
     layout_m <- c(1,1) #single panel: one row, one column
     par(mfrow=layout_m)
     png(paste("Figure__diff_training_testing_rmse_monthly_fus",out_suffix,".png", sep=""),
         height=480*layout_m[1],width=480*layout_m[2])
     boxplot(diff_kriging_m_fus$rmse,diff_gam_m_fus$rmse,diff_gwr_m_fus$rmse, names=c("kriging_fus","gam_fus","gwr_fus"),
             main="Difference between training and testing FUS rmse")
     dev.off()
     ### NOW PLOT OF COMPARISON BETWEEN Kriging and GAM
     #Now get variance and range for hold-out and methods.
     tb_v_gam_CAI
     tb_v_gam_fus
     tb_v_kriging_CAI
     tb_v_kriging_fus
     # Summarise the daily validation tables per model and hold-out proportion,
     # one summary object per interpolation method, stored under the table name.
     methods_names <- c("tb_v_gam_CAI","tb_v_gam_fus","tb_v_kriging_CAI","tb_v_kriging_fus","tb_v_gwr_CAI","tb_v_gwr_fus")
     list_prop_obj <- vector("list",length=length(methods_names))
     names(list_prop_obj) <- methods_names
     for(i in seq_along(methods_names)){
       tb <- list_tb[[methods_names[i]]]
       names_id <- c("pred_mod","prop_month")
       names_mod <- unique(tb$pred_mod)
       list_prop_obj[[i]] <- calc_stat_prop_tb_diagnostic(names_mod,names_id,tb)
       #avg_tb <- prop_obj$avg_tb
     }
     # 'nb' - neighbourhood of each cell
     #r.nb <- dnearneigh(as.matrix(xy), d1=0.5, d2=1.5)
     # 'nb' - an alternative way to specify the neighbourhood
     # r.nb <- cell2nb(nrow=side, ncol=side, type="queen")
     #sp.cor <- sp.correlogram(r.nb, df_mod5$mod5, order=15,
     #                         method="I", randomisation=FALSE)
     r_stack <-stack(subset(s_raster,c("mm_01","mm_07")),pred_temp_s)
     names(r_stack)[1:2]<-c("mm01","mm_07")
     df_rs <- as(r_stack,"SpatialPointsDataFrame")
     r.nb <- dnearneigh(coordinates(df_rs), d1=res(s_raster)[1]/2, d2=1.5*res(s_raster)[1]) #lag1
     #Do not run... slow
     rk.nb14 <- knearneigh(coordinates(df_rs), k=14) #lag1
     #rk_nb14 <- knearneigh(coordinates(df_rs), k=14) #lag1
     #save(rk_nb14, file = "rk_nb14.RData")
     #rk_nb7 <- knearneigh(coordinates(df_rs), k=7) #lag1
     #save(rk_nb7, file = "rk_nb7.RData")
     #lrk_nb7 <- knn2nb(rk_nb7)
     #m_LST1 <- moran.test(df_rs$mm01,nb2listw(lrk_nb7),na.action=na.omit,zero.policy=TRUE)
     #sp.cor <- sp.correlogram(lrk_nb7, df_rs$mm01, order=7,
     #                         method="I", randomisation=FALSE)
     # Parameters for sp_correlogram_fun: one entry per variable to process.
     # Every variable is read from the same point data frame (df_rs) and uses
     # the same maximum lag order.
     var_zname <- c("mm01","mm_07","mod1","mod2","mod5")
     list_df <- rep(list(df_rs), length(var_zname))
     order_lag <- rep(14, length(var_zname))
     method_cor <- "I"
     nb_obj <- r.nb
     randomisation_par <- FALSE  # logical flag, not the string "FALSE"
     list_param_spat_correlog <- list(list_df=list_df,
                                      var_zname=var_zname,
                                      order_lag=order_lag,
                                      method_cor=method_cor,
                                      nb_obj=nb_obj,
                                      randomisation_par=randomisation_par)
     #debug(sp_correlogram_fun)
     #list_sp_correlog  <-sp_correlogram_fun(2,list_param_spat_correlog)
     #r_qc_s <- lapply(1:length(infile_var),FUN=import_list_modis_layers_fun,list_param=list_param_import_modis)
     #r_qc_s <-mclapply(1:11,FUN=import_list_modis_layers_fun,list_param=list_param_import_modis,mc.preschedule=FALSE,mc.cores = 11) #This is the end bracket from mclapply(...) statement
     list_sp_correlog <-mclapply(1:length(list_df),FUN=sp_correlogram_fun,list_param=list_param_spat_correlog ,mc.preschedule=FALSE,mc.cores = 5) #This is the end bracket from mclapply(...) statement
     #does not work...
     print(list_sp_correlog[[1]])
     plot(list_sp_correlog[[1]])
     print(list_sp_correlog[[2]])
     plot(list_sp_correlog[[2]])
     ##### Use filter option to compute lag Moran's I
     # Hand-written queen's-case filters for lags 1 to 4. Each filter is a square
     # matrix with 2*lag+1 rows whose outer ring is 1 and whose interior is 0, so
     # only cells exactly `lag` cells away (queen's distance) receive a weight.
     # Every row is written out in full: a row starting with a bare comma hands an
     # empty argument to c() and makes the whole assignment fail.
     #lag 1: 2*1+1 rows
     f1 <- matrix(c(1,1,1,
                    1,0,1,
                    1,1,1), nrow=3)
     #lag 2: 2*2+1 rows
     f2 <- matrix(c(1,1,1,1,1,             #filter for lag 2
                    1,0,0,0,1,
                    1,0,0,0,1,
                    1,0,0,0,1,
                    1,1,1,1,1),nrow=5)
     #lag 3: 2*3+1 rows
     f3 <- matrix(c(1,1,1,1,1,1,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,0,0,0,0,0,1,
                    1,1,1,1,1,1,1),nrow=7)
     #lag 4: 2*4+1 rows
     f4 <- matrix(c(1,1,1,1,1,1,1,1,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,0,0,0,0,0,0,0,1,
                    1,1,1,1,1,1,1,1,1),nrow=9)
     # Moran's I of the "mm_07" layer of s_raster with the lag 1, 2 and 3 filters
     # (f4 is defined above but not used here). Each value is printed at top level.
     r<- subset(s_raster,"mm_07")
     Moran(r,f1)
     Moran(r,f2)
     Moran(r,f3)
     # Generate a weights matrix ("filter") for computing Moran's I at a given lag.
     #
     # Args:
     #   no_lag: lag in cells, a single whole number >= 1. The filter has
     #           2*no_lag+1 rows and columns.
     #   f_type: neighbourhood type; only "queen" is implemented.
     # Returns:
     #   A square numeric matrix with 1 on its outer ring and 0 everywhere else.
     # Stops with an error when no_lag is invalid or f_type is not supported.
     autocor_filter_fun <-function(no_lag=1,f_type="queen"){
       if(!is.numeric(no_lag) || length(no_lag)!=1 || is.na(no_lag) ||
          no_lag<1 || no_lag!=round(no_lag)){
         stop("no_lag must be a single whole number >= 1", call.=FALSE)
       }
       #if(f_type=="rook"){} #add later
       if(!identical(f_type,"queen")){
         # Fail with an explicit message instead of returning an undefined object.
         stop("unsupported f_type: only \"queen\" is implemented", call.=FALSE)
       }
       no_rows <- 2*no_lag +1
       border_row <- rep(1,no_rows)                 # first and last rows: all ones
       other_row <- c(1,rep(0,no_rows-2),1)         # middle rows: ones at both ends only
       other_rows <- rep(other_row,no_rows-2)
       mat_data <- c(border_row,other_rows,border_row)
       # The pattern is symmetric, so filling by column gives the same matrix as by row.
       autocor_filter <- matrix(mat_data,nrow=no_rows)
       return(autocor_filter)
     }
     # Pull the "avg_tb" tables out of list_prop_obj (presumably one table per
     # interpolation method -- confirm against extract_list_from_list_obj) and tag
     # every row of each table with the name of its method.
     ac_prop_tb_list <- extract_list_from_list_obj(list_prop_obj,"avg_tb")
     nb_rows <- sapply(ac_prop_tb_list,FUN=nrow)
     method_interp_names<-c("gam_CAI","gam_fus","kriging_CAI","kriging_fus","gwr_CAI","gwr_fus")
     # NOTE(review): the loop is bounded by methods_names (defined outside this
     # section) while the labels come from method_interp_names; confirm both have
     # the same length and order as ac_prop_tb_list.
     for(i in seq_along(methods_names)){
       avg_tb<-ac_prop_tb_list[[i]]
       avg_tb$method_interp <-rep(x=method_interp_names[i],times=nb_rows[i])
       ac_prop_tb_list[[i]] <- avg_tb
     } # closes the for loop; without it the loop swallowed the statements that follow
     # Draft of a multi-filter Moran function (see moran_multiple_fun further down):
     #moran_multipe_fun<-function(i,list_param)
     #  lapply(list_filters,FUN=Moran,x=r)
     # Moran's I of the "mod1" layer with the hand-written lag 1 and lag 2 filters.
     r<- subset(r_stack,"mod1")
     Moran(r,f1)
     Moran(r,f2)
     # Same computation with filters generated by autocor_filter_fun for lags 1 to 5.
     list_filters<-lapply(1:5,FUN=autocor_filter_fun,f_type="queen")
     Moran(r,list_filters[[1]])
     Moran(r,list_filters[[2]])
     plot(subset(s_raster,"mm_09"))
     # Rebuild r_stack with the single "mm_09" layer followed by the layers of pred_temp_s;
     # this replaces the r_stack built earlier in the script.
     r_stack <-stack(subset(s_raster,c("mm_09")),pred_temp_s)
     names(r_stack)[1]<-c("mm_09")
     r<- subset(r_stack,"mod1")
     Moran(r) # lag 1 with Moran()'s default weights; NOTE(review): the raster documentation describes the default 3x3 filter as queen's case, not rook's -- verify
     # Regenerates the same five filters as above.
     list_filters<-lapply(1:5,FUN=autocor_filter_fun,f_type="queen")
     # Calculate Moran's I for 5 lags for one layer
     moran_list <- lapply(list_filters,FUN=Moran,x=r)
     # Compute Moran's I for one layer of a raster stack with each filter in a list.
     #
     # Args:
     #   i: layer selector passed to subset() on list_param$r_stack.
     #   list_param: list with two elements:
     #     list_filters: list of weights matrices; each one is handed to Moran()
     #                   next to x=r, so it fills Moran()'s second argument.
     #     r_stack: the multi-layer object from which layer i is taken.
     # Returns:
     #   A data.frame with a single column named after the selected layer
     #   (names(r)); one row per filter when Moran() returns a single value.
     moran_multiple_fun<-function(i,list_param){
       list_filters <-list_param$list_filters
       r <- subset(list_param$r_stack,i)
       moran_list <- lapply(list_filters,FUN=Moran,x=r)
       # Flatten the per-filter results into one column.
       moran_v <-as.data.frame(unlist(moran_list))
       names(moran_v)<-names(r)
       return(moran_v)
     }
     #lapply(methods_names,function(i) {rep(x[i],nrows[i],times[i])},times=nb_rows)
     #names(ac_prop_tb_list) <- names(list_prop_obj)
     # Row-bind all tables of ac_prop_tb_list into a single table.
     t44 <- do.call(rbind,ac_prop_tb_list) #contains all accuracy by method, proportion, model, sample etc.
     # NOTE(review): View() needs an interactive session with a data viewer.
     View(t44)
     t44[which.min(t44$rmse),] #Find the minimum rmse across all models and methods...
     # Sort by increasing rmse and print the first 24 rows.
     test <- t44[order(t44$rmse),]
     test[1:24,]
     # Same ranking restricted to the two gam methods.
     test2<-test[test$method_interp%in% c("gam_fus","gam_CAI"),]
     test2[1:24,]
     #head(ac_prop_tb)
     # Same ranking restricted to gam_CAI rows with prop_month equal to 0.
     test3<-subset(test,prop_month==0 & method_interp%in%c("gam_CAI"))
     #test3<-test[test$method_interp%in% c("gam_CAI"),]
     test3[1:24,]
     #list_prop_obj$avg_tb
     # Plot template kept for reference (not run):
     #xyplot(as.formula(plot_formula),group=pred_mod,type="b",
     #       data=avg_tb,
     #       main=paste("rmse ",plot_name,sep=" "),
     #       pch=1:length(avg_tb$pred_mod),
     #       par.settings=list(superpose.symbol = list(
     #         pch=1:length(avg_tb$pred_mod))),
     #       auto.key=list(columns=5))
     ## DAILY DEVIATIONS WITH MODELS
     ### Examining results with models for daily deviation called 2: need to subset the models
     # Full list of deviation model names, kept for reference (the selections below leave out
     # the mod2.* and mod_kr.* entries):
     #c("mod1.dev_mod1","mod1.dev_mod2","mod2.dev_mod1","mod2.dev_mod2","mod3.dev_mod1","mod3.dev_mod2","mod4.dev_mod1",
     #  "mod4.dev_mod2","mod5.dev_mod1","mod5.dev_mod2","mod6.dev_mod1","mod6.dev_mod2","mod7.dev_mod1","mod7.dev_mod2",
     #  "mod_kr.dev_mod1","mod_kr.dev_mod2")
     # For each CAI method keep the rows with prop_month equal to 0 and the same six models.
     # tb_s_* / tb_v_* presumably hold training and validation diagnostics -- confirm.
     tb_s_gam_CAI_selected <-subset(tb_s_gam_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     tb_v_gam_CAI_selected <-subset(tb_v_gam_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     tb_s_gwr_CAI_selected <-subset(tb_s_gwr_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     tb_v_gwr_CAI_selected <-subset(tb_v_gwr_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     tb_s_kriging_CAI_selected <-subset(tb_s_kriging_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     tb_v_kriging_CAI_selected <-subset(tb_v_kriging_CAI,prop_month==0 & pred_mod%in%c("mod1","mod4","mod5","mod6","mod7","mod8"))
     # Deviation models taken from raster_prediction_obj16; no prop_month filter is applied here.
     tb_s_gam_CAI2_selected <- subset(raster_prediction_obj16$tb_diagnostic_s,pred_mod%in%c("mod1.dev_mod1","mod1.dev_mod2","mod3.dev_mod1",
                                                                                            "mod3.dev_mod2","mod4.dev_mod1",  "mod4.dev_mod2",
                                                                                            "mod5.dev_mod1","mod5.dev_mod2","mod6.dev_mod1",
                                                                                            "mod6.dev_mod2","mod7.dev_mod1","mod7.dev_mod2"))
     tb_v_gam_CAI2_selected <- subset(raster_prediction_obj16$tb_diagnostic_v,pred_mod%in%c("mod1.dev_mod1","mod1.dev_mod2","mod3.dev_mod1",
                                                                                            "mod3.dev_mod2","mod4.dev_mod1",  "mod4.dev_mod2",
                                                                                            "mod5.dev_mod1","mod5.dev_mod2","mod6.dev_mod1",
                                                                                            "mod6.dev_mod2","mod7.dev_mod1","mod7.dev_mod2"))
     # Compare each tb_s_* table with its tb_v_* counterpart on the four accuracy metrics
     # through diff_df (defined outside this section; its exact output is not visible here).
     metric_names <- c("mae","rmse","me","r")
     diff_gam_cai2 <- diff_df(tb_s_gam_CAI2_selected,tb_v_gam_CAI2_selected,metric_names)
     diff_kriging_CAI_selected <- diff_df(tb_s_kriging_CAI_selected,tb_v_kriging_CAI_selected,metric_names)
     diff_gam_CAI_selected <- diff_df(tb_s_gam_CAI_selected,tb_v_gam_CAI_selected,metric_names)
     diff_gwr_CAI_selected <- diff_df(tb_s_gwr_CAI_selected,tb_v_gwr_CAI_selected,metric_names)
     # Boxplots of the rmse column of the four diff_* tables, written to a PNG file
     # whose name is built from plot_name and out_suffix.
     layout_m<-c(1,1) #one row, one column
     # Open the PNG device first: par() acts on the current device, so setting
     # mfrow before png() would configure (or open) another device instead of the
     # file being written.
     png(paste("Figure__accuracy_rmse_prop_month_",plot_name,out_suffix,".png", sep=""),
         height=480*layout_m[1],width=480*layout_m[2])
     par(mfrow=layout_m)
     boxplot(diff_gam_cai2$rmse,diff_gam_CAI_selected$rmse,
             diff_kriging_CAI_selected$rmse,diff_gwr_CAI_selected$rmse,names=c("gam_cai2","gam_CAI","kriging","gwr"))
     dev.off()
     # Moran's I for lags 1 to 10 on every layer of r_stack, then one lattice panel per layer.
     list_filters<-lapply(1:10,FUN=autocor_filter_fun,f_type="queen")
     list_param_moran <- list(list_filters=list_filters,r_stack=r_stack)
     #moran_r <-moran_multiple_fun(1,list_param=list_param_moran)
     nlayers(r_stack)
     # One moran_multiple_fun call per layer; NOTE(review): mc.cores is hard-coded to 11.
     moran_I_df <-mclapply(1:nlayers(r_stack), list_param=list_param_moran, FUN=moran_multiple_fun,mc.preschedule=FALSE,mc.cores = 11) #This is the end bracket from mclapply(...) statement
     # Bind the per-layer columns side by side and add the lag index as the last column.
     moran_df <- do.call(cbind,moran_I_df)
     moran_df$lag <-1:nrow(moran_df)
     #melt(moran_df,id=names(moran_df))
     #moran_df <- do.call(rbind,moran_I_df)
     mydata<-moran_df
     # Pass every column except the last one (lag) to make.groups, then add lag back;
     # the plot below uses the resulting "data" and "which" columns.
     dd <- do.call(make.groups, mydata[,-ncol(mydata)])
     dd$lag <- mydata$lag
     #names(dd)[2]<-"models"
     # NOTE(review): names_layers must already exist; re-running this line prepends "LST" again.
     names_layers <-c("LST",names_layers)
     # One panel per level of "which", with strips relabelled from names_layers.
     xyplot(data ~ lag | which, dd,type="b",strip=strip.custom(factor.levels=names_layers))
     #solve problem with name

Also available in: Unified diff

Project

General

Profile

Revision 80363c49

Added by Benoit Parmentier over 11 years ago