# Multiscale raster smoother function designed for use with noisy DEMs.
# Original algorithm and AML implementation by John Gallant. Translation
# to R (relying on raster package functionality) by Jim Regetz, based on
# AML script 'multiscalesmooth9a_clean.aml'.
#
# NOTE: it looks like Ming used sd=0.001 (based on the Arc 'log' file
# in the topo experimental directory)
#
# Jim Regetz
# NCEAS
# Created on 22-Mar-2012

library(raster)

# NB: using standard deviation as noise specification now, not variance!

multiscalesmooth <- function(ingrid, sd=0.0001, alpha=0.05, bbox) {
    # ingrid: RasterLayer to smooth
    # sd: noise standard deviation; numeric constant or RasterLayer
    # alpha: alpha level for chi-square critical value
    # bbox: optional extent object used to subset ingrid

    # subset ingrid if desired
    if (!missing(bbox)) {
        ingrid <- crop(ingrid, bbox)
    }

    # set number of aggregation levels and neighborhood size
    NUM.LEVELS <- 4
    NUM.CELLS <- 3
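    # (with NUM.LEVELS=4 and NUM.CELLS=3, a cell at the coarsest level
    # covers NUM.CELLS^NUM.LEVELS = 3^4 = 81 cells of the input grid)
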
    # expand grid to accommodate an integer number of cells at the
    # coarsest level, by adding a roughly equal number of cells on
    # either side (with one extra on top/right if an odd number of
    # cells is needed)
    max.size <- NUM.CELLS^NUM.LEVELS
    addx <- if (0 < (extra <- ncol(ingrid) %% max.size)) {
        (max.size-extra)/2
    } else {
        0
    }
    addy <- if (0 < (extra <- nrow(ingrid) %% max.size)) {
        (max.size-extra)/2
    } else {
        0
    }
    full.extent <- extent(
        xmin(ingrid) - floor(addx) * xres(ingrid),
        xmax(ingrid) + ceiling(addx) * xres(ingrid),
        ymin(ingrid) - floor(addy) * yres(ingrid),
        ymax(ingrid) + ceiling(addy) * yres(ingrid)
    )
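    # (e.g. a 100-column input with max.size = 81 gives extra = 19 and
    # addx = (81-19)/2 = 31, so floor(31) = 31 columns are added on the
    # left and ceiling(31) = 31 on the right, for 162 = 2*81 columns)
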
    # create grids

    # create lists to hold the series of successively coarsened grids
    # of values and variances, respectively; the first element of each
    # is the grid at the original input resolution
    ...

    # set initial "group variance" to individual msmt variance (noise)
    v.g <- v[[1]]
    # weights for aggregation, based on total variance
    w <- calc(v[[1]], function(x) ifelse(is.na(x), 0, 1/x))
    # squared weights
    wsq <- w^2
    # effective number of measurements
    n <- calc(z[[1]], function(x) ifelse(!is.na(x), 1, 0))
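    # (weights are inverse variances, so the weighted means below are
    # minimum-variance combinations; with unequal weights the effective
    # sample size is sum(w)^2/sum(w^2), presumably how the n.eff used
    # below is formed from w and wsq)
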
    # aggregate to broader scales
    for (i in 1+seq.int(NUM.LEVELS)) {

        ...

        # calc variance-weighted neighborhood mean
        z[[i]] <- aggregate(w.prev * z[[i-1]], 3, sum) / w
        # calc between-cell variance, taken over neighborhood
        zdiff <- z[[i-1]] - disaggregate(z[[i]], 3)
        v.bg <- aggregate(w.prev * zdiff^2, 3, sum) / w
        # calc wtd avg of within-cell variance, taken over neighborhood
        if (i==2) {
            v.wg <- n - n  # zero, but with correct window and cell size
        } else {
            v.wg <- aggregate(w.prev * v.g.prev, 3, sum) / w
        }
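        # (v.bg and v.wg are the between- and within-cell components of
        # a weighted variance decomposition over each 3x3 neighborhood)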
        ...

        mv <- n / w

        # calc chisq critical values
        chisq <- calc(n.eff, function(n) qchisq(alpha, n-1,
            lower.tail=FALSE)/(n-1))
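        # (i.e. the upper-tail critical value of a scaled chi-square
        # variance ratio with n-1 degrees of freedom: a one-sided test
        # of whether the observed group variance exceeds what
        # measurement noise alone would produce)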
        # set coarsened cell variances: if group variance is small
        # relative to noise variance, use variance of the mean instead
        ...

    }

    # get arbitrarily large value to fill null variance cells
    bigvar <- cellStats(v[[1]], max) * 10

    # prep for refinement phase
    z.smooth <- z[[NUM.LEVELS+1]]
    v.smooth <- v[[NUM.LEVELS+1]]
    # create weight matrix equivalent to ArcGIS circle with radius 2
    circle2 <- matrix(c(0,0,1,0,0,
                        0,1,1,1,0,
                        1,1,1,1,1,
                        0,1,1,1,0,
                        0,0,1,0,0), nrow=5)
    circle2[circle2==0] <- NA
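    # (the 13 cells within Euclidean distance 2 of the center are 1 and
    # the rest NA, so focal() averages over a quasi-circular window)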

    # refine, smooth, and combine each layer in turn
    for (j in 1+rev(seq.int(NUM.LEVELS))) {

        message("Refining from ", j, " to ", j-1)

        # create smoothed higher resolution versions of z and v
        zs <- focal(disaggregate(z.smooth, 3), w=circle2, fun=mean,
            pad=TRUE, padValue=NA, na.rm=TRUE)
        vs <- focal(disaggregate(v.smooth, 3), w=circle2, fun=mean,
            pad=TRUE, padValue=NA, na.rm=TRUE)
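        # (disaggregate() replicates each coarse cell into a 3x3 block,
        # and the focal mean then smooths across block boundaries to
        # approximate a smooth interpolation of the coarse surface)
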
        # create no-null versions of the finer z and v
        z_c <- calc(z[[j-1]], function(x) ifelse(is.na(x), 0, x))
        v_c <- calc(v[[j-1]], function(x) ifelse(is.na(x), bigvar, x))

        # explicitly clean up, in case it helps
        z[[j-1]] <- NULL
        v[[j-1]] <- NULL

        # combine two values using least variance
        z.smooth <- (z_c/v_c + zs/vs) / (1/v_c + 1/vs)
        v.smooth <- 1 / (1/v_c + 1/vs)
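        # (standard inverse-variance weighting: a combination of the
        # form (z1/v1 + z2/v2) / (1/v1 + 1/v2) has variance
        # 1/(1/v1 + 1/v2), the smallest achievable from two independent
        # estimates)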

    }

    result <- crop(stack(z.smooth, v.smooth), extent(ingrid))
    layerNames(result) <- c("zs", "vs")
    return(result)

}
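
## Example usage (a minimal illustrative sketch with synthetic data;
## the raster dimensions and noise level are arbitrary assumptions):
# r <- raster(nrows=162, ncols=162, xmn=0, xmx=162, ymn=0, ymx=162)
# xy <- xyFromCell(r, 1:ncell(r))
# r[] <- sin(xy[,1]/20) + cos(xy[,2]/30) + rnorm(ncell(r), sd=0.1)
# out <- multiscalesmooth(r, sd=0.1)
# plot(out[["zs"]])   # smoothed values; layer "vs" holds variances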