/ - Diff - Environment and organisms - NCEAS Projects

« Previous | Next »

Revision c447e6b8

Added by Benoit Parmentier almost 9 years ago

ID c447e6b8527a477368cec487333330ede8c75e1f
Parent f1b2b657
Child 5f776b29

turning script into shell callable code for stage 7 mosaicing

     #AUTHOR: Benoit Parmentier
     #CREATED ON: 01/01/2016
     #MODIFIED ON: 04/08/2016
     #MODIFIED ON: 04/11/2016
     #PROJECT: NCEAS INPLANT: Environment and Organisms
     #First source these files:
-...
+    #
     ##################################################################################################
     ### PARAMETERS DEFINED IN THE SCRIPT
     #There are 21 parameters, 1 constant and 8 arguments (drawn from the parameters) for the Rscript call.
     #The arguments are passed directly from Rscript:
     #var <- args[1] # variable being interpolated #param 1, arg 1
     #in_dir1 <- args[2] # This is the output directory containing global prediction e.g./nobackupp6/aguzman4/climateLayers/out/ param 5, arg 2
     #region_name <- args[3] # region e.g. "reg4" param 6, arg 3
     #out_prefix <- args[4] # this is used in creating an output directory,include region name? param 7, arg 4
     #out_dir <- args[5] # output parent dir, can be home dir or other, param 8, arg 5)
     #create_out_dir_param <- args[6] # if TRUE create a output from "output"+out_prefix param 9, arg 6
     #list_year_predicted <- args[7] # enter as list but currently runs on the first element of the list, param 10, arg 7
     #num_cores <- args[8] #number of cores used # param 13, arg 8
     #max_mem <- args[9] # maximum memory, param 21
     ###Loading R library and packages  ou
     library(RPostgreSQL)
     library(maps)
-...
     #script_path <- "/home/parmentier/Data/IPLANT_project/env_layers_scripts"
     script_path <- "/nobackupp8/bparmen1/env_layers_scripts" #path to script
     function_mosaicing_functions <- "global_run_scalingup_mosaicing_function_04102016.R" #PARAM12
     function_mosaicing <-"global_run_scalingup_mosaicing_04082016.R"
     function_mosaicing_functions <- "global_run_scalingup_mosaicing_function_04112016.R" #PARAM12
     function_mosaicing <-"global_run_scalingup_mosaicing_04102016.R"
     source(file.path(script_path,function_mosaicing)) #source all functions used in this script
     source(file.path(script_path,function_mosaicing_functions)) #source all functions used in this script
-...
     #Data is on ATLAS or NASA NEX
     ### PARAMETERS DEFINED IN THE SCRIPT
     #There are 21 parameters, 1 constant and 8 arguments (drawn from the parameters) for the Rscript call.
     #The arguments are passed directly from Rscript:
     #var <- args[1] # variable being interpolated #param 1, arg 1
     #in_dir <- args[2] # This is the output directory containing global prediction e.g./nobackupp6/aguzman4/climateLayers/out/ param 5, arg 2
     #region_name <- args[3] # region e.g. "reg4" param 6, arg 3
     #out_suffix <- args[4] # formely out_prefix, this is used in creating an output directory, it is suggested to use "reg4" or same as region_name
     #out_dir <- args[5] # output parent dir, can be home dir or other, param 8, arg 5
     #create_out_dir_param <- args[6] # if TRUE create a output from "output"+out_prefix param 9, arg 6
     #year_predicted <- args[7] # enter as list but currently runs on the first element of the list, param 10, arg 7
     #num_cores <- args[8] #number of cores used # param 13, arg 8
     #max_mem <- args[9] # maximum memory, param 21
     #mosaicing_method <- arg[10] #PARAM5
     #metric_name <- arg[11] #"rmse" #RMSE, MAE etc. #PARAM 8
     #day_to_mosaic_range <- arg[12] #c("19910101","19910103") #if null run all year
     #infile_mask <- arg[12] # "/nobackupp8/bparmen1/NEX_data/regions_input_files/r_mask_reg4.tif"
     #df_assessment_files_name <- arg[13] #"/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991/df_assessment_files_reg4_1991_reg4_1991.txt" # data.frame with all files used in assessmnet, PARAM 21
     #algorithm <- arg[14] #"python" #PARAM 28 #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     #layers_option <- arg[15] #c("var_pred") #options are:
     #res_training, res_testing,ac_training, ac_testing, var_pred
     #tmp_files <- arg[16] #FALSE
     #mosaicing_method <- c("unweighted","use_edge_weights") #PARAM5
     #metric_name <- "rmse" #RMSE, MAE etc. #PARAM 8
     #day_to_mosaic_range <- c("19910101","19910103") #if null run all year
     #infile_mask <- "/nobackupp8/bparmen1/NEX_data/regions_input_files/r_mask_reg4.tif"
     #df_assessment_files_name <- "/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991/df_assessment_files_reg4_1991_reg4_1991.txt" # data.frame with all files used in assessmnet, PARAM 21
     #algorithm <- "python" #PARAM 28 #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     #layers_option <- c("var_pred") #options are:
     #res_training, res_testing,ac_training, ac_testing, var_pred
     #tmp_files <- FALSE
     var <- args[1] # variable being interpolated #param 1, arg 1
     var<-"TMAX" # variable being interpolated #param 1, arg 1
-...
     #PARAM 2
     #in_dir <- "/data/project/layers/commons/NEX_data/output_run10_1500x4500_global_analyses_pred_1992_12072015" #NCEAS
     #in_dir <- "/nobackupp8/bparmen1/output_run10_1500x4500_global_analyses_pred_1992_12072015" #NEX
     in_dir <- "/nobackupp6/aguzman4/climateLayers/out/"
     in_dir <- "/nobackupp6/aguzman4/climateLayers/out/"
     in_dir <- args[2]
     interpolation_method <- c("gam_CAI") #PARAM3
     #var <- args[1] # variable being interpolated #param 1, arg 1
     #in_dir <- args[2] # This is the output directory containing global prediction e.g./nobackupp6/aguzman4/climateLayers/out/ param 5, arg 2
     #region_name <- args[3] # region e.g. "reg4" param 6, arg 3
     #out_suffix <- args[4] # formely out_prefix, this is used in creating an output directory, it is suggested to use "reg4" or same as region_name
     #out_dir <- args[5] # output parent dir, can be home dir or other, param 8, arg 5
     #create_out_dir_param <- args[6] # if TRUE create a output from "output"+out_prefix param 9, arg 6
     #year_predicted <- args[7] # enter as list but currently runs on the first element of the list, param 10, arg 7
     #num_cores <- args[8] #number of cores used # param 13, arg 8
     #max_mem <- args[9] # maximum memory, param 21
     #mosaicing_method <- args[10] #PARAM5
     #metric_name <- args[11] #"rmse" #RMSE, MAE etc. #PARAM 8
     #day_to_mosaic_range <- arg[12] #c("19910101","19910103") #if null run all year
     #infile_mask <- args[13] # "/nobackupp8/bparmen1/NEX_data/regions_input_files/r_mask_reg4.tif"
     #df_assessment_files_name <- args[14] #"/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991/df_assessment_files_reg4_1991_reg4_1991.txt" # data.frame with all files used in assessmnet, PARAM 21
     #algorithm <- args[15] #"python" #PARAM 28 #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     #layers_option <- args[16] #c("var_pred") #options are:
     #res_training, res_testing,ac_training, ac_testing, var_pred
     #tmp_files <- args[17] #FALSE
     region_name <- args[3]
     region_name <- "reg4" #PARAM 4 #reg4 South America, Africa reg5,Europe reg2, North America reg1, Asia reg3
     mosaicing_method <- c("unweighted","use_edge_weights") #PARAM5
     #out_suffix <- paste(region_name,"_","run10_1500x4500_global_analyses_pred_1991_04052016",sep="") #PARAM 6
     #out_suffix_str <- "run10_1500x4500_global_analyses_pred_1991_04052016" #PARAM 7
     out_suffix <- args[4]
     out_suffix <- region_name #PARAM 6
     out_suffix_str <- region_name #PARAM 7
     metric_name <- "rmse" #RMSE, MAE etc. #PARAM 8
     pred_mod_name <- "mod1" #PARAM 9
     var_pred <- "res_mod1" #used in residuals mapping #PARAM 10
     #out_dir <- in_dir #PARAM 11
     out_dir <- args[5]
     out_dir <- "/nobackupp8/bparmen1/climateLayers/out/reg4" #PARAM 11, use this location for now
     create_out_dir_param <- args[6]
     create_out_dir_param <- TRUE #PARAM 12
     year_predicted <- args[7]
     year_predicted <- 1991 #PARAM 31
     num_cores <- args[8]
     num_cores <- 6 #PARAM 17
     #max number of cells to read in memory
     max_mem<-args[9]
     mosaicing_method <- c("unweighted","use_edge_weights") #PARAM5
     mosaicing_method <- args[10]
     metric_name <- args[11]
     metric_name <- "rmse" #RMSE, MAE etc. #PARAM 8
     #if daily mosaics NULL then mosaicas all days of the year #PARAM 13
     #day_to_mosaic <- c("19910101","19910102","19910103") #,"19920104","19920105") #PARAM9, two dates note in /tiles for now on NEX
     day_to_mosaic_range <- c("19910101","19910103") #if null run all year
     day_to_mosaic_range <- c("19910101","19910101") #if null run all year
     day_to_mosaic_range <- args[12]
     ###Separate folder for masks by regions, should be listed as just the dir!!... #PARAM 20
     infile_mask <- "/nobackupp8/bparmen1/NEX_data/regions_input_files/r_mask_reg4.tif"
     inflie_mask <- args[13]
     #infile_mask <- "/data/project/layers/commons/NEX_data/regions_input_files/r_mask_reg4.tif"
     ## All of this is interesting so use df_assessment!!
     #path_assessment <- "/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991"
     #path_assessment <- file.path(in_dir,region_name,"assessment",paste("output_",region_name,year_processed,sep=""))
     df_assessment_files_name <- args[14]
     df_assessment_files_name <- "/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991/df_assessment_files_reg4_1991_reg4_1991.txt" # data.frame with all files used in assessmnet, PARAM 21
     algorithm <- args[15]
     algorithm <- "python" #PARAM 28 #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     #algorithm <- "R" #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     layers_option <- c("var_pred") #options are:
     #res_training, res_testing,ac_training, ac_testing, var_pred
     tmp_files <- FALSE
     pred_mod_name <- "mod1" #PARAM 9
     var_pred <- "res_mod1" #used in residuals mapping #PARAM 10
     #CRS_WGS84 <- CRS("+proj=longlat +ellps=WGS84 +datum=WGS84 +towgs84=0,0,0") #Station coords WGS84 #CONSTANT1
     #CRS_locs_WGS84<-CRS("+proj=longlat +ellps=WGS84 +datum=WGS84 +towgs84=0,0,0") #Station coords WGS84
     #proj_str<- CRS_WGS84 #PARAM 8 #check this parameter
-...
     NA_value <- -9999 #PARAM 15
     NA_flag_val <- NA_value #PARAM 16
     num_cores <- 6 #PARAM 17
     #region_names <- c("reg23","reg4") #selected region names, ##PARAM 18
     use_autokrige <- F #PARAM 19
     proj_str <- CRS_locs_WGS84
     ###Separate folder for masks by regions, should be listed as just the dir!!... #PARAM 20
     infile_mask <- "/nobackupp8/bparmen1/NEX_data/regions_input_files/r_mask_reg4.tif"
     #infile_mask <- "/data/project/layers/commons/NEX_data/regions_input_files/r_mask_reg4.tif"
     ## All of this is interesting so use df_assessment!!
     year_processed <- 1991 #PARAM 31
     #path_assessment <- "/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991"
     #path_assessment <- file.path(in_dir,region_name,"assessment",paste("output_",region_name,year_processed,sep=""))
     df_assessment_files_name <- "/nobackupp6/aguzman4/climateLayers/out/reg4/assessment/output_reg4_1991/df_assessment_files_reg4_1991_reg4_1991.txt" # data.frame with all files used in assessmnet, PARAM 21
     #in_dir can be on NEX or Atlas
     #python script and gdal on NEX NASA:
-...
     #mosaic_python <- "/data/project/layers/commons/NEX_data/sharedCode" #PARAM 26
     #python_bin <- "/usr/bin" #PARAM 27
     algorithm <- "python" #PARAM 28 #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     #algorithm <- "R" #if R use mosaic function for R, if python use modified gdalmerge script from Alberto Guzmann
     match_extent <- "FALSE" #PARAM 29 #try without matching!!!
     #for residuals...
     list_models <- NULL #PARAM 30
     #list_models <- paste(var_pred,"~","1",sep=" ") #if null then this is the default...
     #max number of cells to read in memory
     max_mem<-args[11]
     #in_dir_tiles <- file.path(in_dir,"tiles") #this is valid both for Atlas and NEX
     layers_option <- c("var_pred") #options are:
     #res_training, res_testing,ac_training, ac_testing, var_pred
     tmp_files <- FALSE
     #rasterOptions(maxmemory=1e+07,timer=TRUE)
     list_param_run_mosaicing_prediction <- list(in_dir,y_var_name,interpolation_method,region_name,
                      mosaicing_method,out_suffix,out_suffix_str,metric_name,pred_mod_name,var_pred,
                      create_out_dir_param,day_to_mosaic_range,proj_str,file_format,NA_value,num_cores,
                      create_out_dir_param,day_to_mosaic_range,year_predicted,proj_str,file_format,NA_value,num_cores,
                      use_autokrige,infile_mask,df_assessment_files_name,mosaic_python,
                      python_bin,algorithm,match_extent,list_models,layers_option,tmp_files)
     param_names <- c("in_dir","y_var_name","interpolation_method","region_name",
                      "mosaicing_method","out_suffix","out_suffix_str","metric_name","pred_mod_name","var_pred",
                      "create_out_dir_param","day_to_mosaic_range","proj_str","file_format","NA_value","num_cores",
                      "create_out_dir_param","day_to_mosaic_range","year_predicted","proj_str","file_format","NA_value","num_cores",
                      "use_autokrige","infile_mask","df_assessment_files_name","mosaic_python",
                      "python_bin","algorithm","match_extent","list_models","layers_option","tmp_files")
     names(list_param_run_mosaicing_prediction) <- param_names
-...
       #list_param_run_mosaicing_prediction
+    }
     #runs in 42 minutes for 3 dates but note that beyond date 1, the process is about 11 minutes or so.
     ###############   END OF SCRIPT   ###################
     #####################################################

Also available in: Unified diff

Project

General

Profile

Revision c447e6b8

Added by Benoit Parmentier almost 9 years ago