v.rast.stats.py 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280
  1. #!/usr/bin/env python
  2. ############################################################################
  3. #
  4. # MODULE: v.rast.stats
  5. # AUTHOR(S): Markus Neteler, converted to Python by Glynn Clements
  6. # PURPOSE: Calculates univariate statistics from a GRASS raster map
  7. # only for areas covered by vector objects on a per-category basis
  8. # COPYRIGHT: (C) 2005-2008 by the GRASS Development Team
  9. #
  10. # This program is free software under the GNU General Public
  11. # License (>=v2). Read the file COPYING that comes with GRASS
  12. # for details.
  13. #
  14. # TODO: do we need layer= management?
  15. #############################################################################
  16. #%Module
  17. #% description: Calculates univariate statistics from a GRASS raster map based on vector polygons and uploads statistics to new attribute columns.
  18. #% keywords: vector, raster, statistics
  19. #%End
  20. #%flag
  21. #% key: c
  22. #% description: Continue if upload column(s) already exist
  23. #%END
  24. #%flag
  25. #% key: e
  26. #% description: Calculate extended statistics
  27. #%END
  28. #%option
  29. #% key: vector
  30. #% type: string
  31. #% key_desc: name
  32. #% gisprompt: old,vector,vector
  33. #% description: Name of vector polygon map
  34. #% required : yes
  35. #%End
  36. #%option
  37. #% key: layer
  38. #% type: integer
  39. #% description: Layer to which the table to be changed is connected
  40. #% answer: 1
  41. #% required : no
  42. #%end
  43. #%option
  44. #% key: raster
  45. #% type: string
  46. #% key_desc: name
  47. #% gisprompt: old,cell,raster
  48. #% description: Name of raster map to calculate statistics from
  49. #% required : yes
  50. #%END
  51. #%option
  52. #% key: colprefix
  53. #% type: string
  54. #% description: Column prefix for new attribute columns
  55. #% required : yes
  56. #%end
  57. #%option
  58. #% key: percentile
  59. #% type: integer
  60. #% description: Percentile to calculate (requires extended statistics flag)
  61. #% options: 0-100
  62. #% answer: 90
  63. #% required : no
  64. #%end
  65. import sys
  66. import os
  67. import atexit
  68. import grass
  69. def has_column(vector, col):
  70. s = grass.read_command('v.info', flags = 'c', map = vector, quiet = True)
  71. for l in s.splitlines():
  72. f = l.split('|')
  73. if len(f) < 2:
  74. continue
  75. if f[1] == col:
  76. return True
  77. return False
  78. def cleanup():
  79. grass.run_command('g.remove', rast = '%s_%s' % (vector, tmpname), quiet = True)
  80. grass.run_command('g.remove', rast = 'MASK', quiet = True, stderr = nuldev)
  81. if mask_found:
  82. grass.message("Restoring previous MASK...")
  83. grass.run_command('g.rename', rast = (tmpname + "_origmask", 'MASK'), quiet = True)
  84. for f in [tmp, tmpname, sqltmp]:
  85. grass.try_remove(f)
  86. def main():
  87. global tmp, sqltmp, tmpname, nuldev, vector, mask_found
  88. #### setup temporary files
  89. tmp = grass.tempfile()
  90. sqltmp = tmp + ".sql"
  91. # we need a random name
  92. tmpname = grass.basename(tmp)
  93. nuldev = file(os.devnull, 'w')
  94. raster = options['raster']
  95. colprefix = options['colprefix']
  96. vector = options['vector']
  97. layer = options['layer']
  98. percentile = options['percentile']
  99. ### setup enviro vars ###
  100. env = grass.gisenv()
  101. mapset = env['MAPSET']
  102. vs = vector.split('@')
  103. if len(vs) > 1:
  104. vect_mapset = vs[1]
  105. else:
  106. vect_mapset = mapset
  107. # does map exist in CURRENT mapset?
  108. if vect_mapset != mapset or not grass.find_file(vector, 'vector', mapset)['file']:
  109. grass.fatal("Vector map <%s> not found in current mapset" % vector)
  110. vector = vs[0]
  111. #check the input raster map
  112. if not grass.find_file(raster, 'cell')['file']:
  113. grass.fatal("Raster map <%s> not found" % raster)
  114. #check presence of raster MASK, put it aside
  115. mask_found = bool(grass.find_file('MASK', 'cell')['file'])
  116. if mask_found:
  117. grass.message("Raster MASK found, temporarily disabled")
  118. grass.run_command('g.rename', rast = ('MASK', tmpname + "_origmask"), quiet = True)
  119. #get RASTER resolution of map which we want to query:
  120. #fetch separated to permit for non-square cells (latlong etc)
  121. s = grass.read_command('r.info', flags = 's', map = raster)
  122. kv = grass.parse_key_val(s)
  123. nsres = float(kv['nsres'])
  124. ewres = float(kv['ewres'])
  125. #save current settings:
  126. grass.use_temp_region()
  127. #Temporarily setting raster resolution to $RASTER resolution
  128. #keep boundary settings
  129. grass.run_command('g.region', flags = 'a', nsres = nsres, ewres = ewres)
  130. #prepare raster MASK
  131. if grass.run_command('v.to.rast', input = vector, output = "%s_%s" % (vector, tmpname),
  132. use = 'cat', quiet = True) != 0:
  133. grass.fatal("An error occurred while converting vector to raster")
  134. #dump cats to file to avoid "too many argument" problem:
  135. p = grass.pipe_command('r.category', map = '%s_%s' % (vector, tmpname), fs = ';', quiet = True)
  136. cats = []
  137. for line in p.stdout:
  138. cats.append(line.rstrip('\r\n').split(';')[0])
  139. p.wait()
  140. #echo "List of categories found: $CATSLIST"
  141. number = len(cats)
  142. if number < 1:
  143. grass.fatal("No categories found in raster map")
  144. #check if DBF driver used, in this case cut to 10 chars col names:
  145. s = grass.read_command('v.db.connect', flags = 'g', map = vector, layer = layer)
  146. # we need this for non-DBF driver:
  147. f = s.split()
  148. table = f[1]
  149. db_database = f[3]
  150. db_sqldriver = f[4]
  151. dbfdriver = db_sqldriver == 'dbf'
  152. #Find out which table is linked to the vector map on the given layer
  153. if not table:
  154. grass.fatal('There is no table connected to this map! Run v.db.connect or v.db.addtable first.')
  155. basecols = ['n', 'min', 'max', 'range', 'mean', 'stddev', 'variance', 'cf_var', 'sum']
  156. # we need at least three chars to distinguish [mea]n from [med]ian
  157. # so colprefix can't be longer than 6 chars with DBF driver
  158. if dbfdriver:
  159. colprefix = colprefix[:6]
  160. # do extended stats?
  161. if flags['e']:
  162. # namespace is limited in DBF but the % value is important
  163. if dbfdriver:
  164. perccol = "per" + percentile
  165. else:
  166. perccol = "percentile_" + percentile
  167. extracols = ['first_quartile', 'median', 'third_quartile'] + [perccol]
  168. else:
  169. extracols = []
  170. addcols = []
  171. for i in basecols + extracols:
  172. #check if column already present
  173. currcolumn = ("%s_%s" % (colprefix, i))
  174. if dbfdriver:
  175. currcolumn = currcolumn[:10]
  176. if has_column(vector, currcolumn):
  177. if not flags['c']:
  178. grass.fatal(("Cannot create column <%s> (already present)." % currcolumn) +
  179. "Use -c flag to update values in this column.")
  180. else:
  181. if i == "n":
  182. coltype = "INTEGER"
  183. else:
  184. coltype = "DOUBLE PRECISION"
  185. addcols.append(currcolumn + ' ' + coltype)
  186. grass.verbose("Adding columns <%s>" % addcols)
  187. if grass.run_command('v.db.addcol', map = vector, columns = addcols) != 0:
  188. grass.fatal("Cannot continue (problem adding columns).")
  189. #loop over cats and calculate statistics:
  190. grass.verbose("Processing data ...")
  191. # get rid of any earlier attempts
  192. grass.try_remove(sqltmp)
  193. # do extended stats?
  194. if flags['e']:
  195. extstat = 'e'
  196. else:
  197. extstat = ""
  198. f = file(sqltmp, 'w')
  199. currnum = 1
  200. for i in cats:
  201. grass.verbose("Processing category %s (%d/%d)" % (i, currnum, number))
  202. grass.run_command('g.remove', rast = 'MASK', quiet = True, stderr = nuldev)
  203. grass.run_command('r.mapcalc', quiet = True,
  204. expression = "MASK = if(%s_%s == %s, 1, null())" % (vector, tmpname, i))
  205. #n, min, max, range, mean, stddev, variance, coeff_var, sum
  206. # How to test r.univar $? exit status? using -e creates the real possibility of out-of-memory errors
  207. s = grass.read_command('r.univar', flags = 'g' + extstat, map = raster, percentile = percentile)
  208. vars = grass.parse_key_val(s)
  209. vars['cf_var'] = vars['coeff_var']
  210. if flags['e'] and dbfdriver:
  211. percvar = 'percentile_' + percentile
  212. vars[perccol] = vars[percvar]
  213. for var in basecols + extracols:
  214. value = vars[var]
  215. if value.lower() == 'nan':
  216. value = 'NULL'
  217. colname = '%s_%s' % (colprefix, var)
  218. if dbfdriver:
  219. colname = colname[:10]
  220. f.write("UPDATE %s SET %s=%s WHERE cat=%s;\n" % (table, colname, value, i))
  221. currnum += 1
  222. f.close()
  223. grass.verbose("Updating the database ...")
  224. exitcode = grass.run_command('db.execute', input = sqltmp,
  225. database = db_database, driver = db_sqldriver)
  226. grass.run_command('g.remove', rast = 'MASK', quiet = True, stderr = nuldev)
  227. if exitcode == 0:
  228. grass.message(("Statistics calculated from raster map %s" % raster) +
  229. (" and uploaded to attribute table of vector map %s." % vector))
  230. grass.message("Done.")
  231. sys.exit(exitcode)
  232. if __name__ == "__main__":
  233. options, flags = grass.parser()
  234. atexit.register(cleanup)
  235. main()