v.rast.stats.py 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274
  1. #!/usr/bin/env python
  2. ############################################################################
  3. #
  4. # MODULE: v.rast.stats
  5. # AUTHOR(S): Markus Neteler
  6. # converted to Python by Glynn Clements
  7. # speed up by Markus Metz
  8. # PURPOSE: Calculates univariate statistics from a GRASS raster map
  9. # only for areas covered by vector objects on a per-category base
  10. # COPYRIGHT: (C) 2005-2010 by the GRASS Development Team
  11. #
  12. # This program is free software under the GNU General Public
  13. # License (>=v2). Read the file COPYING that comes with GRASS
  14. # for details.
  15. #
  16. #############################################################################
  17. #%module
  18. #% description: Calculates univariate statistics from a raster map based on vector polygon map and uploads statistics to new attribute columns.
  19. #% keywords: vector
  20. #% keywords: statistics
  21. #% keywords: raster
  22. #%end
  23. #%flag
  24. #% key: c
  25. #% description: Continue if upload column(s) already exist
  26. #%end
  27. #%flag
  28. #% key: e
  29. #% description: Calculate extended statistics
  30. #%end
  31. #%option G_OPT_V_MAP
  32. #% key: vector
  33. #%end
  34. #%option G_OPT_V_FIELD
  35. #%end
  36. #%option G_OPT_R_INPUT
  37. #% key: raster
  38. #% description: Name of input raster map to calculate statistics from
  39. #%end
  40. #%option
  41. #% key: column_prefix
  42. #% type: string
  43. #% description: Column prefix for new attribute columns
  44. #% required : yes
  45. #%end
  46. #%option
  47. #% key: percentile
  48. #% type: integer
  49. #% description: Percentile to calculate (requires extended statistics flag)
  50. #% options: 0-100
  51. #% answer: 90
  52. #% required : no
  53. #%end
  54. import sys
  55. import os
  56. import atexit
  57. import grass.script as grass
  58. def has_column(vector, col):
  59. return
  60. def cleanup():
  61. if rastertmp:
  62. grass.run_command('g.remove', rast = rastertmp, quiet = True)
  63. grass.run_command('g.remove', rast = 'MASK', quiet = True, stderr = nuldev)
  64. if mask_found:
  65. grass.message(_("Restoring previous MASK..."))
  66. grass.run_command('g.rename', rast = (tmpname + "_origmask", 'MASK'), quiet = True)
  67. # for f in [tmp, tmpname, sqltmp]:
  68. # grass.try_remove(f)
  69. def main():
  70. global tmp, sqltmp, tmpname, nuldev, vector, mask_found, rastertmp
  71. mask_found = False
  72. rastertmp = False
  73. #### setup temporary files
  74. tmp = grass.tempfile()
  75. sqltmp = tmp + ".sql"
  76. # we need a random name
  77. tmpname = grass.basename(tmp)
  78. nuldev = file(os.devnull, 'w')
  79. raster = options['raster']
  80. colprefix = options['column_prefix']
  81. vector = options['vector']
  82. layer = options['layer']
  83. percentile = options['percentile']
  84. ### setup enviro vars ###
  85. env = grass.gisenv()
  86. mapset = env['MAPSET']
  87. vs = vector.split('@')
  88. if len(vs) > 1:
  89. vect_mapset = vs[1]
  90. else:
  91. vect_mapset = mapset
  92. # does map exist in CURRENT mapset?
  93. if vect_mapset != mapset or not grass.find_file(vector, 'vector', mapset)['file']:
  94. grass.fatal(_("Vector map <%s> not found in current mapset") % vector)
  95. vector = vs[0]
  96. rastertmp = "%s_%s" % (vector, tmpname)
  97. # check the input raster map
  98. if not grass.find_file(raster, 'cell')['file']:
  99. grass.fatal(_("Raster map <%s> not found") % raster)
  100. # check presence of raster MASK, put it aside
  101. mask_found = bool(grass.find_file('MASK', 'cell')['file'])
  102. if mask_found:
  103. grass.message(_("Raster MASK found, temporarily disabled"))
  104. grass.run_command('g.rename', rast = ('MASK', tmpname + "_origmask"), quiet = True)
  105. # save current settings:
  106. grass.use_temp_region()
  107. # Temporarily aligning region resolution to $RASTER resolution
  108. # keep boundary settings
  109. grass.run_command('g.region', align = raster)
  110. # prepare raster MASK
  111. if grass.run_command('v.to.rast', input = vector, output = rastertmp,
  112. use = 'cat', quiet = True) != 0:
  113. grass.fatal(_("An error occurred while converting vector to raster"))
  114. # dump cats to file to avoid "too many argument" problem:
  115. p = grass.pipe_command('r.category', map = rastertmp, sep = ';', quiet = True)
  116. cats = []
  117. for line in p.stdout:
  118. cats.append(line.rstrip('\r\n').split(';')[0])
  119. p.wait()
  120. number = len(cats)
  121. if number < 1:
  122. grass.fatal(_("No categories found in raster map"))
  123. # check if DBF driver used, in this case cut to 10 chars col names:
  124. try:
  125. fi = grass.vector_db(map = vector)[int(layer)]
  126. except KeyError:
  127. grass.fatal(_('There is no table connected to this map. Run v.db.connect or v.db.addtable first.'))
  128. # we need this for non-DBF driver:
  129. dbfdriver = fi['driver'] == 'dbf'
  130. # Find out which table is linked to the vector map on the given layer
  131. if not fi['table']:
  132. grass.fatal(_('There is no table connected to this map. Run v.db.connect or v.db.addtable first.'))
  133. basecols = ['n', 'min', 'max', 'range', 'mean', 'stddev', 'variance', 'cf_var', 'sum']
  134. # we need at least three chars to distinguish [mea]n from [med]ian
  135. # so colprefix can't be longer than 6 chars with DBF driver
  136. if dbfdriver:
  137. colprefix = colprefix[:6]
  138. # do extended stats?
  139. if flags['e']:
  140. # namespace is limited in DBF but the % value is important
  141. if dbfdriver:
  142. perccol = "per" + percentile
  143. else:
  144. perccol = "percentile_" + percentile
  145. extracols = ['first_quartile', 'median', 'third_quartile'] + [perccol]
  146. else:
  147. extracols = []
  148. addcols = []
  149. for i in basecols + extracols:
  150. # check if column already present
  151. currcolumn = ("%s_%s" % (colprefix, i))
  152. if dbfdriver:
  153. currcolumn = currcolumn[:10]
  154. if currcolumn in grass.vector_columns(vector, layer).keys():
  155. if not flags['c']:
  156. grass.fatal((_("Cannot create column <%s> (already present). ") % currcolumn) +
  157. _("Use -c flag to update values in this column."))
  158. else:
  159. if i == "n":
  160. coltype = "INTEGER"
  161. else:
  162. coltype = "DOUBLE PRECISION"
  163. addcols.append(currcolumn + ' ' + coltype)
  164. if addcols:
  165. grass.verbose(_("Adding columns '%s'") % addcols)
  166. if grass.run_command('v.db.addcolumn', map = vector, columns = addcols) != 0:
  167. grass.fatal(_("Adding columns failed. Exiting."))
  168. # calculate statistics:
  169. grass.message(_("Processing data (%d categories)...") % number)
  170. # get rid of any earlier attempts
  171. grass.try_remove(sqltmp)
  172. colnames = []
  173. for var in basecols + extracols:
  174. colname = '%s_%s' % (colprefix, var)
  175. if dbfdriver:
  176. colname = colname[:10]
  177. colnames.append(colname)
  178. ntabcols = len(colnames)
  179. # do extended stats?
  180. if flags['e']:
  181. extstat = 'e'
  182. else:
  183. extstat = ""
  184. f = file(sqltmp, 'w')
  185. # do the stats
  186. p = grass.pipe_command('r.univar', flags = 't' + 'g' + extstat, map = raster,
  187. zones = rastertmp, percentile = percentile, sep = ';')
  188. first_line = 1
  189. for line in p.stdout:
  190. if first_line:
  191. first_line = 0
  192. continue
  193. vars = line.rstrip('\r\n').split(';')
  194. f.write("UPDATE %s SET" % fi['table'])
  195. i = 2
  196. first_var = 1
  197. for colname in colnames:
  198. value = vars[i]
  199. # convert nan, +nan, -nan to NULL
  200. if value.lower().endswith('nan'):
  201. value = 'NULL'
  202. if not first_var:
  203. f.write(" , ")
  204. else:
  205. first_var = 0
  206. f.write(" %s=%s" % (colname, value))
  207. i += 1
  208. # skip n_null_cells, mean_of_abs, sum_of_abs
  209. if i == 3 or i == 8 or i == 13:
  210. i += 1
  211. f.write(" WHERE %s=%s;\n" % (fi['key'], vars[0]))
  212. p.wait()
  213. f.close()
  214. grass.message(_("Updating the database ..."))
  215. exitcode = grass.run_command('db.execute', input = sqltmp,
  216. database = fi['database'], driver = fi['driver'])
  217. grass.run_command('g.remove', rast = 'MASK', quiet = True, stderr = nuldev)
  218. if exitcode == 0:
  219. grass.message((_("Statistics calculated from raster map <%s>") % raster) +
  220. (_(" and uploaded to attribute table of vector map <%s>.") % vector))
  221. else:
  222. grass.warning(_("Failed to upload statistics to attribute table of vector map <%s>.") % vector)
  223. sys.exit(exitcode)
  224. if __name__ == "__main__":
  225. options, flags = grass.parser()
  226. atexit.register(cleanup)
  227. main()