/ - Diff - Environment and organisms - NCEAS Projects

« Previous | Next »

Revision 9b850015

Added by Jim Regetz over 12 years ago

ID 9b85001515b7b57a831aa1ab988f09ac1db0671c
Parent fb35e17b
Child 86d73d7e

updated directory paths and related comments

     # R script for batch parsing and loading GHCN daily station files
     # (*.dly) into a PostgreSQL database. Script will process all such files
     # in the current working directory.
     # (*.dly) into a PostgreSQL database. The appropriate GHCN files are
     # assumed to have been downloaded to the location specified by
     # 'ghcndir', with the daily files themselves in a "ghcnd_all"
     # subdirectory exactly as generated by unpacking "ghcnd_all.tar.gz";
     # note that for the purposes of storage efficiency, we're not currently
     # keeping these uncompressed files on disk, so this tarball would need
     # to be unpacked again if for some reason this script needs to be
     # re-run.
+    #
     # As currently written, the script assumes that the 'ghcn' database
     # already exists locally but has no tables, and that it can be accessed
-...
     #-------------#
     # location of ghcn daily data (on atlas)
     datadir <- "/home/layers/data/climate/ghcn/ghcnd_all"
     ghcndir <- "/home/layers/data/climate/ghcn/v2.92-upd-2012052822"
     # output file
     logfile <- "~/ghcn-psql-load.log"
-...
             )"))
     # process and insert daily data
     dailies <- list.files(datadir, pattern="*.dly")
     dailies <- list.files(file.path(ghcndir, "ghcnd_all"), pattern="*.dly")
     for (file in dailies) {
         cat(date(), "\t", file=logfile, append=TRUE)
         if (loadAsCSV(file.path(datadir, file), VARS)) {
         if (loadAsCSV(file.path(ghcndir, "ghcnd_all", file), VARS)) {
             wideToLong(db)
             dbGetQuery(db, 'delete from ghcn_wide')
+        }
-...
     #BATCH.SIZE <- 10
     #counter <- 1
     #for (file in dailies) {
     #    loadAsCSV(file.path(datadir, file), VARS)
     #    loadAsCSV(file.path(ghcndir, "ghcnd_all", file), VARS)
     #    if (counter %% BATCH.SIZE == 0) {
     #        wideToLong(db)
     #        dbGetQuery(db, 'delete from ghcn_wide')

Also available in: Unified diff

Project

General

Profile

Revision 9b850015

Added by Jim Regetz over 12 years ago