Project

General

Profile

Download (8.88 KB) Statistics
| Branch: | Revision:
1 35d59dc1 Adam M. Wilson @ pfe
#### Script to facilitate processing of MOD06 data
2
  
3 c1352601 Adam M. Wilson @ pfe
setwd("/nobackupp1/awilso10/mod35")
4 35d59dc1 Adam M. Wilson @ pfe
5
library(rgdal)
6
library(raster)
7
library(RSQLite)
8
9
10
## print progress messages? (TRUE spelled out: T is an ordinary variable that can be reassigned)
verbose=TRUE
11
12
## get MODLAND tile information
13
tb=read.table("http://landweb.nascom.nasa.gov/developers/sn_tiles/sn_bound_10deg.txt",skip=6,nrows=648,header=T)
14
tb$tile=paste("h",sprintf("%02d",tb$ih),"v",sprintf("%02d",tb$iv),sep="")
15 aba23d60 Adam M. Wilson @ pfe
tb=tb[tb$lon_min!=-999,]
16 35d59dc1 Adam M. Wilson @ pfe
save(tb,file="modlandTiles.Rdata")
17
load("modlandTiles.Rdata")
18
19
## delete temporary log file that can grow to GB
20
## unlink() removes the log without spawning a shell and stays quiet when the
## file does not exist (plain "rm" reports an error and a non-zero status then)
unlink("/nobackupp1/awilso10/software/heg/TOOLKIT_MTD/runtime/LogStatus")
21
22
### list of tiles to process
23 aba23d60 Adam M. Wilson @ pfe
tiles=c("h10v08","h11v08","h12v08","h10v07","h11v07","h12v07")  # South America
24
25
## subset to MODLAND tiles
26 b3344197 Adam M. Wilson @ pfe
 modlandtiles=system("ls -r /nobackupp4/datapool/modis/MOD11A1.005/2010* | grep hdf$ | cut -c18-23 | sort | uniq - ",intern=T)
27 aba23d60 Adam M. Wilson @ pfe
 tb$land=tb$tile%in%modlandtiles
28
tiles=tb$tile[tb$land]
29
30
## subset tile corner matrix to tiles selected above
31 35d59dc1 Adam M. Wilson @ pfe
tile_bb=tb[tb$tile%in%tiles,]
32
33
### get list of files to process
34
datadir="/nobackupp4/datapool/modis/MOD35_L2.006/"
35
36
outdir="daily/" #paste("daily/",tile,sep="")
37
38
##find swaths in region from sqlite database for the specified date/tile
39 b3344197 Adam M. Wilson @ pfe
## this takes a while, about 30 minutes, so only rebuild if you need to update what's available...
40
## set to TRUE to re-query the swath database and rewrite swathtile.Rdata
rebuildswathtable=FALSE
41
if(rebuildswathtable){
42
  ## path to swath database
43
  db="/nobackupp4/pvotava/DB/export/swath_geo.sql.sqlite3.db"
44
  ## open the swath database; DBI documents the first argument as a driver
  ## object, so pass SQLite() rather than the driver name as a string
  con=dbConnect(SQLite(), dbname = db)
45
  fs=do.call(rbind.data.frame,lapply(1:nrow(tile_bb),function(i){
46
    d=dbGetQuery(con,paste("SELECT * from swath_geo6
47 35d59dc1 Adam M. Wilson @ pfe
            WHERE east>=",tile_bb$lon_min[i]," AND
48
                  west<=",tile_bb$lon_max[i]," AND
49
                  north>=",tile_bb$lat_min[i]," AND
50
                  south<=",tile_bb$lat_max[i])
51 b3344197 Adam M. Wilson @ pfe
      )
52
    d$tile=tile_bb$tile[i]
53
    print(paste("Finished tile",tile_bb$tile[i]))
54
    return(d)
55
  }))
56
  con=dbDisconnect(con)
57
  fs$id=substr(fs$id,7,19)
58
59
  ## Identify which swaths are available in the datapool
60
  ## every *.hdf file found anywhere below datadir, listed with its full path
  ## (argument names spelled out instead of relying on partial matching of "full")
  swaths=data.frame(path=list.files(datadir,pattern="hdf$",recursive=TRUE,full.names=TRUE),stringsAsFactors=FALSE)  #all swaths in data pool
61
  swaths$id=substr(basename(swaths$path),10,22)
62
  fs$exists=fs$id%in%swaths$id 
63
  fs$path=swaths$path[match(fs$id,swaths$id)]
64
65
  ## write tile-swath list to disk
66
  save(fs,swaths,file="swathtile.Rdata")
67
}
68
69
load("swathtile.Rdata")
70
71 35d59dc1 Adam M. Wilson @ pfe
if(verbose) print(paste("###############",nrow(fs)," swath IDs recieved from database"))
72
73
## get all unique dates
74
fs$dateid=format(as.Date(paste(fs$year,fs$day,sep=""),"%Y%j"),"%Y%m%d")
75 b3344197 Adam M. Wilson @ pfe
#alldates=unique(fs$dateid[fs$exists])
76 35d59dc1 Adam M. Wilson @ pfe
77
#### Generate submission file
78 aba23d60 Adam M. Wilson @ pfe
startdate="2000-03-01"
79
stopdate="2011-12-31"
80 b3344197 Adam M. Wilson @ pfe
## just 2009
81
startdate="2009-01-01"
82
stopdate="2009-12-31"
83 aba23d60 Adam M. Wilson @ pfe
84
## one YYYYMMDD string per calendar day from startdate through stopdate
alldates=format(seq(from=as.Date(startdate),to=as.Date(stopdate),by="day"),"%Y%m%d")
85
86 35d59dc1 Adam M. Wilson @ pfe
proclist=expand.grid(date=alldates,tile=tiles)
87
proclist$year=substr(proclist$date,1,4)
88 aba23d60 Adam M. Wilson @ pfe
89
## identify tile-dates with no available swaths
90
avail=unique(cbind.data.frame(tile=fs$tile,date=fs$dateid)[fs$exists, ])
91
proclist$avail=paste(proclist$tile,proclist$date,sep="_")%in%paste(avail$tile,avail$date,sep="_")
92
93 35d59dc1 Adam M. Wilson @ pfe
## identify which have been completed
94 b3344197 Adam M. Wilson @ pfe
#fdone=data.frame(path=system("ssh lou 'find MOD35/daily -name \"*.nc\"' ",intern=T))
95
fdone=data.frame(path=list.files(outdir,pattern="nc$",recursive=T))
96 35d59dc1 Adam M. Wilson @ pfe
fdone$date=substr(basename(as.character(fdone$path)),14,21)
97
fdone$tile=substr(basename(as.character(fdone$path)),7,12)
98
proclist$done=paste(proclist$tile,proclist$date,sep="_")%in%substr(basename(as.character(fdone$path)),7,21)
99
100
### report on what has already been processed
101
print(paste(sum(!proclist$done)," out of ",nrow(proclist)," (",round(100*sum(!proclist$done)/nrow(proclist),2),"%) remain"))
102
table(tile=proclist$tile[proclist$done],year=proclist$year[proclist$done])
103 b3344197 Adam M. Wilson @ pfe
table(table(tile=proclist$tile[!proclist$done],year=proclist$year[!proclist$done]))
104
105
### explore tile counts
106
#x=table(tile=proclist$tile[proclist$done],year=proclist$year[proclist$done])
107
#x=x[order(rownames(x)),]
108 35d59dc1 Adam M. Wilson @ pfe
109
script="/u/awilso10/environmental-layers/climate/procedures/MOD35_L2_process.r"
110
111
## write the table processed by mpiexec
112 be64daa8 Adam M. Wilson @ pfe
tp=((!proclist$done)&proclist$avail)  #date-tiles to process
113 aba23d60 Adam M. Wilson @ pfe
table(Available=proclist$avail,Completed=proclist$done)
114
115
write.table(paste("--verbose ",script," --date ",proclist$date[tp]," --verbose T --tile ",proclist$tile[tp],sep=""),
116 35d59dc1 Adam M. Wilson @ pfe
file=paste("notdone.txt",sep=""),row.names=F,col.names=F,quote=F)
117
118
### qsub script
119
cat(paste("
120
#PBS -S /bin/bash
121 171a4e16 Adam M. Wilson @ pfe
##PBS -l select=1:ncpus=8:mpiprocs=8
122
#PBS -l select=100:ncpus=8:mpiprocs=8
123
#PBS -l walltime=8:00:00
124
##PBS -l walltime=2:00:00
125 35d59dc1 Adam M. Wilson @ pfe
#PBS -j n
126
#PBS -m be
127
#PBS -N mod35
128 171a4e16 Adam M. Wilson @ pfe
#PBS -q normal
129
##PBS -q devel
130 35d59dc1 Adam M. Wilson @ pfe
#PBS -V
131
132 171a4e16 Adam M. Wilson @ pfe
CORES=800
133 be64daa8 Adam M. Wilson @ pfe
#CORES=160
134
135 35d59dc1 Adam M. Wilson @ pfe
HDIR=/u/armichae/pr/
136 5af36cdd Adam M. Wilson @ pfe
  source $HDIR/etc/environ.sh
137 35d59dc1 Adam M. Wilson @ pfe
  source /u/awilso10/environ.sh
138
  source /u/awilso10/.bashrc
139
IDIR=/nobackupp1/awilso10/mod35/
140
##WORKLIST=$HDIR/var/run/pxrRgrs/work.txt
141
WORKLIST=$IDIR/notdone.txt
142
EXE=Rscript
143
LOGSTDOUT=$IDIR/log/mod35_stdout
144
LOGSTDERR=$IDIR/log/mod35_stderr
145
### use mpiexec to parallelize across days
146
mpiexec -np $CORES pxargs -a $WORKLIST -p $EXE -v -v -v --work-analyze 1> $LOGSTDOUT 2> $LOGSTDERR
147
",sep=""),file=paste("mod35_qsub",sep=""))
148
149
### Check the files
150
system("cat mod35_qsub")   # print the generated submission script
151
system("cat notdone.txt | head")   # first lines of the work list
152
system("cat notdone.txt | wc -l ")   # number of entries in the work list
153
154
## Submit it
155
system("qsub mod35_qsub")   # hand the job script to PBS
156 b3344197 Adam M. Wilson @ pfe
157 c24e32a8 Adam M. Wilson @ pfe
system("qstat -u awilso10")
158 35d59dc1 Adam M. Wilson @ pfe
159
#######################################################
160
### Now submit the script to generate the climatologies
161
162 5af36cdd Adam M. Wilson @ pfe
163 35d59dc1 Adam M. Wilson @ pfe
tiles
164 b3344197 Adam M. Wilson @ pfe
ctiles=c("h10v08","h11v08","h12v08","h10v07","h11v07","h12v07")  # South America
165
166 be64daa8 Adam M. Wilson @ pfe
ctiles=tiles#[c(1:3)]  #subset to only some tiles (for example if some aren't finished yet)?
167 aba23d60 Adam M. Wilson @ pfe
climatescript="/pleiades/u/awilso10/environmental-layers/climate/procedures/MOD35_Climatology.r"
168 35d59dc1 Adam M. Wilson @ pfe
169 be64daa8 Adam M. Wilson @ pfe
## check which tiles have been processed and are on lou with a filename "MOD35_[tile].nc"
170 b3344197 Adam M. Wilson @ pfe
cdone=data.frame(path="",tile="")  #use this if you want to re-run everything
171 be64daa8 Adam M. Wilson @ pfe
cdone=data.frame(path=sapply(strsplit(basename(
172
                   system("ssh lou 'find MOD35/summary -name \"MOD35_h[0-9][0-9]v[0-9][0-9].nc\"' ",intern=T)),split="_"),function(x) x[2]))
173 5af36cdd Adam M. Wilson @ pfe
cdone=data.frame(path=sapply(strsplit(basename(
174
                   system("find summary -name \"MOD35_h[0-9][0-9]v[0-9][0-9].nc\"",intern=T)),split="_"),function(x) x[2]))
175 be64daa8 Adam M. Wilson @ pfe
cdone$tile=substr(basename(as.character(cdone$path)),1,6)
176 b3344197 Adam M. Wilson @ pfe
print(paste(length(ctiles[!ctiles%in%cdone$tile]),"Tiles still need to be processed"))
177 be64daa8 Adam M. Wilson @ pfe
178 35d59dc1 Adam M. Wilson @ pfe
## write the table processed by mpiexec
179 be64daa8 Adam M. Wilson @ pfe
write.table(paste("--verbose ",climatescript," --verbose T --tile ",ctiles[!ctiles%in%cdone$tile],sep=""),
180 35d59dc1 Adam M. Wilson @ pfe
file=paste("notdone_climate.txt",sep=""),row.names=F,col.names=F,quote=F)
181
182
## delay start until previous jobs have finished?
183
## set to TRUE to add a "depend=afterany" directive for the job ID given in `job`
delay=FALSE
184
## check running jobs to get JobID of job you want to wait for
185
system("qstat -u awilso10")
186
## enter JobID here:
187
job="881394.pbspl1.nas.nasa.gov"
188
189
### qsub script
190
cat(paste("
191
#PBS -S /bin/bash
192 5af36cdd Adam M. Wilson @ pfe
#PBS -l select=40:ncpus=8:mem=94
193
#PBS -l walltime=2:00:00
194 35d59dc1 Adam M. Wilson @ pfe
#PBS -j n
195
#PBS -m be
196
#PBS -N mod35_climate
197 5af36cdd Adam M. Wilson @ pfe
#PBS -q devel
198
##PBS -q normal
199 b3344197 Adam M. Wilson @ pfe
##PBS -q ldan
200 35d59dc1 Adam M. Wilson @ pfe
#PBS -V
201
",if(delay) paste("#PBS -W depend=afterany:",job,sep="")," 
202
203 5af36cdd Adam M. Wilson @ pfe
CORES=320
204 be64daa8 Adam M. Wilson @ pfe
HDIR=/u/armichae/pr/
205 aba23d60 Adam M. Wilson @ pfe
  source $HDIR/etc/environ.sh
206
  source /pleiades/u/awilso10/environ.sh
207
  source /pleiades/u/awilso10/.bashrc
208 35d59dc1 Adam M. Wilson @ pfe
IDIR=/nobackupp1/awilso10/mod35/
209
##WORKLIST=$HDIR/var/run/pxrRgrs/work.txt
210
WORKLIST=$IDIR/notdone_climate.txt
211
EXE=Rscript
212
LOGSTDOUT=$IDIR/log/climatology_stdout
213
LOGSTDERR=$IDIR/log/climatology_stderr
214 aba23d60 Adam M. Wilson @ pfe
### use mpiexec to parallelize across tiles
215 35d59dc1 Adam M. Wilson @ pfe
mpiexec -np $CORES pxargs -a $WORKLIST -p $EXE -v -v -v --work-analyze 1> $LOGSTDOUT 2> $LOGSTDERR
216
",sep=""),file=paste("mod35_climatology_qsub",sep=""))
217
218
## check files
219
system("cat mod35_climatology_qsub")        # print the qsub submission script
220
system("cat notdone_climate.txt | head")    # first lines of the job file
221
system("cat notdone_climate.txt | wc -l ")  # how many jobs will be run
222
223
## Submit it
224
system("qsub mod35_climatology_qsub")   # hand the climatology job script to PBS
225
226
## check progress
227
system("qstat -u awilso10")
228
229
## start interactive job on compute node for debugging
230
# system("qsub -I -l walltime=2:00:00 -lselect=2:ncpus=16:model=san -q devel")
231
232
233
#################################################################
234
### copy the files back to Yale
235
236 5af36cdd Adam M. Wilson @ pfe
237 be64daa8 Adam M. Wilson @ pfe
## NOTE(review): this launches an ssh client to host "lou" via system().
## Every later system() call starts its own shell, so those commands presumably
## run on the local host rather than on lou -- confirm the intended workflow.
system("ssh lou")
238
#scp `find MOD35/summary -name "MOD35_h[0-9][0-9]v[0-9][0-9].nc"` adamw@acrobates.eeb.yale.edu:/data/personal/adamw/projects/interp/data/modis/mod35/summary/
239 5af36cdd Adam M. Wilson @ pfe
system("rsync -cavv `find summary -name \"MOD35_h[0-9][0-9]v[0-9][0-9]_2009mean.nc\"` adamw@acrobates.eeb.yale.edu:/data/personal/adamw/projects/interp/data/modis/mod35/summary/")
240
system("rsync -cavv `find summary -name \"MOD35_h[0-9][0-9]v[0-9][0-9].nc\"` adamw@acrobates.eeb.yale.edu:/data/personal/adamw/projects/interp/data/modis/mod35/summary/")
241
242
243
system("gdalbuildvrt MOD35C6_2009.vrt summary/*2009mean.nc ") 
244
system("gdal_translate -stats -co \"COMPRESS=LZW\" -of GTiff MOD35C6_2009.vrt MOD35C6_2009.tif ")              
245
## NOTE(review): the target host "acrobates.eeb.24.177.10.190" mixes a hostname
## with an IP address and looks malformed -- confirm the intended destination.
system("scp MOD35C6_2009.tif adamw@acrobates.eeb.24.177.10.190:/Users/adamw/Downloads/")
246 be64daa8 Adam M. Wilson @ pfe
## "exit" is a shell command (presumably meant to close the ssh session opened
## above); it is not R code, and evaluating it as R fails with
## "object 'exit' not found", so it is kept only as a comment.
# exit
247 35d59dc1 Adam M. Wilson @ pfe