/* points.c - scan an ASCII points file for column types and import the points */
  #include <ctype.h>
  #include <errno.h>
  #include <stdio.h>
  #include <stdlib.h>
  #include <string.h>
  #include <grass/gis.h>
  #include <grass/dbmi.h>
  #include <grass/vector.h>
  #include <grass/glocale.h>
  #include "local_proto.h"
  /* Determine if the string is a base-10 integer, e.g. 123, +123, -123.
   *
   * Leading white space is accepted because strtol() skips it. An empty
   * string, a NULL pointer, any trailing character, or a value that does
   * not fit into a long (strtol() reports ERANGE) is not an integer.
   *
   * return 1 if integer, 0 otherwise */
  static int is_int(const char *str)
  {
      char *tail;

      if (str == NULL)
          return 0;

      /* strtol() only sets errno on failure, so clear it first */
      errno = 0;
      (void)strtol(str, &tail, 10);

      if (tail == str || *tail != '\0') {
          /* doesn't look like a number,
             or has extra characters after what looks to be a number */
          return 0;
      }

      if (errno == ERANGE) {
          /* all digits, but the value overflows a long */
          return 0;
      }

      return 1;
  }
  /* Determine if the string is a finite floating point number,
   * e.g. 123.456, +123.456, -123.456, 1.23456e2
   *
   * Leading white space is accepted because strtod() skips it. An empty
   * string, a NULL pointer or any trailing character is rejected.
   * Spellings that strtod() converts to infinity or NaN ("inf", "nan",
   * overflowing literals such as 1e999) are rejected as well: values of
   * numeric columns are written into SQL statements verbatim, where such
   * spellings are not numbers.
   *
   * return 1 if double, 0 otherwise */
  static int is_double(const char *str)
  {
      char *tail;
      double value;

      if (str == NULL)
          return 0;

      value = strtod(str, &tail);

      if (tail == str || *tail != '\0') {
          /* doesn't look like a number,
             or has extra characters after what looks to be a number */
          return 0;
      }

      /* x - x is 0 for every finite x, but NaN for +-infinity and NaN */
      if (value - value != 0.0)
          return 0;

      return 1;
  }
  34. /* Analyse points ascii file. Determine number of columns and column types.
  35. * ascii_tmp: write copy of tempfile to ascii_tmp:
  36. * rowlength: maximum row length
  37. * ncolumns: number of columns
  38. * minncolumns: minimum number of columns
  39. * nrows: number of rows
  40. * column_type: column types
  41. * column_length: column lengths (string only)
  42. */
  43. int points_analyse(FILE * ascii_in, FILE * ascii, char *fs,
  44. int *rowlength, int *ncolumns, int *minncolumns,
  45. int *nrows, int **column_type, int **column_length,
  46. int skip_lines, int xcol, int ycol, int region_flag)
  47. {
  48. int i;
  49. int buflen; /* buffer length */
  50. char *buf, *buf_raw; /* buffer */
  51. int row = 1; /* line number, first is 1 */
  52. int ncols = 0; /* number of columns */
  53. int minncols = -1;
  54. int *coltype = NULL; /* column types */
  55. int *collen = NULL; /* column lengths */
  56. char **tokens;
  57. int ntokens; /* number of tokens */
  58. int len, rowlen = 0; /* maximum row length */
  59. struct Cell_head window;
  60. double northing = .0;
  61. double easting = .0;
  62. char *coorbuf, *tmp_token, *sav_buf;
  63. int skip = FALSE, skipped = 0;
  64. buflen = 4000;
  65. buf = (char *)G_malloc(buflen);
  66. buf_raw = (char *)G_malloc(buflen);
  67. coorbuf = (char *)G_malloc(256);
  68. tmp_token = (char *)G_malloc(256);
  69. sav_buf = NULL;
  70. G_message(_("Scanning input for column types..."));
  71. /* fetch projection for LatLong test */
  72. G_get_window(&window);
  73. while (1) {
  74. len = 0; /* not really needed, but what the heck */
  75. skip = FALSE; /* reset out-of-region check */
  76. if (G_getl2(buf, buflen - 1, ascii_in) == 0)
  77. break; /* EOF */
  78. if (row <= skip_lines) {
  79. G_debug(3, "skipping header row %d : %d chars", row,
  80. (int)strlen(buf));
  81. /* this fn is read-only, write to hist with points_to_bin() */
  82. fprintf(ascii, "%s\n", buf);
  83. len = strlen(buf) + 1;
  84. if (len > rowlen)
  85. rowlen = len;
  86. row++;
  87. continue;
  88. }
  89. if ((buf[0] == '#') || (buf[0] == '\0')) {
  90. G_debug(3, "skipping comment row %d : %d chars", row,
  91. (int)strlen(buf));
  92. continue;
  93. }
  94. /* no G_chop() as first/last column may be empty fs=tab value */
  95. G_debug(3, "row %d : %d chars", row, (int)strlen(buf));
  96. /* G_tokenize() will modify the buffer, so we make a copy */
  97. strcpy(buf_raw, buf);
  98. len = strlen(buf) + 1;
  99. if (len > rowlen)
  100. rowlen = len;
  101. tokens = G_tokenize(buf, fs);
  102. ntokens = G_number_of_tokens(tokens);
  103. if (ntokens > ncols) {
  104. int c;
  105. coltype = (int *)G_realloc(coltype, ntokens * sizeof(int));
  106. collen = (int *)G_realloc(collen, ntokens * sizeof(int));
  107. for (c = ncols; c < ntokens; c++) {
  108. coltype[c] = DB_C_TYPE_INT; /* default type */
  109. collen[c] = 0;
  110. }
  111. ncols = ntokens;
  112. }
  113. if (minncols == -1 || minncols > ntokens)
  114. minncols = ntokens;
  115. /* Determine column types */
  116. for (i = 0; i < ntokens; i++) {
  117. if ((G_projection() == PROJECTION_LL)) {
  118. if (i == xcol || i == ycol) {
  119. if (i == 0) { /* Save position of original internal token buffer */
  120. /* Prevent memory leaks */
  121. sav_buf = tokens[0];
  122. }
  123. /* check if coordinates are DMS or decimal or not latlong at all */
  124. sprintf(coorbuf, "%s", tokens[i]);
  125. G_debug(4, "token: %s", coorbuf);
  126. if (i == xcol) {
  127. if (G_scan_easting(coorbuf, &easting, window.proj)) {
  128. G_debug(4, "is_latlong east: %f", easting);
  129. sprintf(tmp_token, "%.12f", easting);
  130. /* replace current DMS token by decimal degree */
  131. tokens[i] = tmp_token;
  132. if (region_flag) {
  133. if ((window.east < easting) ||
  134. (window.west > easting))
  135. skip = TRUE;
  136. }
  137. }
  138. else {
  139. fprintf(stderr, _("Current row %d:\n%s\n"), row, buf_raw);
  140. G_fatal_error(_("Unparsable longitude value in column num %d: %s"),
  141. i + 1, tokens[i]);
  142. }
  143. }
  144. if (i == ycol) {
  145. if (G_scan_northing(coorbuf, &northing, window.proj)) {
  146. G_debug(4, "is_latlong north: %f", northing);
  147. sprintf(tmp_token, "%.12f", northing);
  148. /* replace current DMS token by decimal degree */
  149. tokens[i] = tmp_token;
  150. if (region_flag) {
  151. if ((window.north < northing) ||
  152. (window.south > northing))
  153. skip = TRUE;
  154. }
  155. }
  156. else {
  157. fprintf(stderr, _("Current row %d:\n%s\n"), row, buf_raw);
  158. G_fatal_error(_("Unparsable latitude value in column num %d: %s"),
  159. i, tokens[i]);
  160. }
  161. }
  162. } /* if (x or y) */
  163. if (i == ntokens - 1 && sav_buf != NULL) {
  164. /* Restore original token buffer so free_tokens works */
  165. /* Only do this if tokens[0] was re-assigned */
  166. tokens[0] = sav_buf;
  167. sav_buf = NULL;
  168. }
  169. } /* PROJECTION_LL */
  170. else {
  171. if (region_flag) {
  172. /* consider z range if -z flag is used? */
  173. /* change to if(>= east,north){skip=1;} to allow correct tiling */
  174. /* don't "continue;" so multiple passes will have the
  175. same column types and length for patching */
  176. if (i == xcol) {
  177. easting = atof(tokens[i]);
  178. if ((window.east < easting) ||
  179. (window.west > easting))
  180. skip = TRUE;
  181. }
  182. if (i == ycol) {
  183. northing = atof(tokens[i]);
  184. if ((window.north < northing) ||
  185. (window.south > northing))
  186. skip = TRUE;
  187. }
  188. }
  189. }
  190. len = strlen(tokens[i]);
  191. /* do not guess column type for missing values */
  192. if (len == 0)
  193. continue;
  194. G_debug(4, "row %d col %d: '%s' is_int = %d is_double = %d",
  195. row, i, tokens[i], is_int(tokens[i]),
  196. is_double(tokens[i]));
  197. if (is_int(tokens[i])) {
  198. continue; /* integer */
  199. }
  200. if (is_double(tokens[i])) { /* double */
  201. if (coltype[i] == DB_C_TYPE_INT) {
  202. coltype[i] = DB_C_TYPE_DOUBLE;
  203. }
  204. continue;
  205. }
  206. /* string */
  207. coltype[i] = DB_C_TYPE_STRING;
  208. if (len > collen[i])
  209. collen[i] = len;
  210. }
  211. /* write dataline to tmp file */
  212. if (!skip)
  213. fprintf(ascii, "%s\n", buf_raw);
  214. else
  215. skipped++;
  216. G_free_tokens(tokens);
  217. row++;
  218. }
  219. *rowlength = rowlen;
  220. *ncolumns = ncols;
  221. *minncolumns = minncols;
  222. *column_type = coltype;
  223. *column_length = collen;
  224. *nrows = row - 1; /* including skipped lines */
  225. G_free(buf);
  226. G_free(buf_raw);
  227. G_free(coorbuf);
  228. G_free(tmp_token);
  229. if (region_flag)
  230. G_message(_n("Skipping %d of %d row falling outside of current region",
  231. "Skipping %d of %d rows falling outside of current region",
  232. row - 1),
  233. skipped, row - 1);
  234. return 0;
  235. }
  236. /* Import points from ascii file.
  237. *
  238. * fs: field separator
  239. * xcol, ycol, zcol, catcol: x,y,z,cat column in input file, first column is 1,
  240. * zcol and catcol may be 0 (do not use)
  241. * rowlen: maximum row length
  242. * Note: column types (both in header or coldef) must be supported by driver
  243. */
  244. int points_to_bin(FILE * ascii, int rowlen, struct Map_info *Map,
  245. dbDriver * driver, char *table, char *fs, int nrows,
  246. int ncols, int *coltype, int xcol, int ycol, int zcol,
  247. int catcol, int skip_lines)
  248. {
  249. char *buf, buf2[4000];
  250. int cat = 0;
  251. int row = 1;
  252. struct line_pnts *Points;
  253. struct line_cats *Cats;
  254. dbString sql, val;
  255. struct Cell_head window;
  256. G_message(_("Importing points..."));
  257. /* fetch projection for LatLong test */
  258. G_get_window(&window);
  259. rewind(ascii);
  260. Points = Vect_new_line_struct();
  261. Cats = Vect_new_cats_struct();
  262. /* actually last 2 characters won't be read */
  263. buf = (char *)G_malloc(rowlen + 2);
  264. db_init_string(&sql);
  265. db_init_string(&val);
  266. if (skip_lines > 0) {
  267. sprintf(buf2, "HEADER: (%d lines)\n", skip_lines);
  268. Vect_hist_write(Map, buf2);
  269. }
  270. /* rowlen + 2 to read till the end of line on both UNIX and Windows */
  271. while (G_getl2(buf, rowlen + 2, ascii) != 0) {
  272. int i, len;
  273. double x, y, z;
  274. char **tokens;
  275. int ntokens; /* number of tokens */
  276. if (row <= skip_lines) {
  277. G_debug(4, "writing skip line %d to hist : %d chars", row,
  278. (int)strlen(buf));
  279. Vect_hist_write(Map, buf);
  280. Vect_hist_write(Map, "\n");
  281. row++;
  282. continue;
  283. }
  284. len = strlen(buf);
  285. if (len == 0)
  286. continue; /* should not happen */
  287. G_debug(4, "row: %s", buf);
  288. tokens = G_tokenize(buf, fs);
  289. ntokens = G_number_of_tokens(tokens);
  290. if ((G_projection() == PROJECTION_LL)) {
  291. G_scan_easting(tokens[xcol], &x, window.proj);
  292. G_scan_northing(tokens[ycol], &y, window.proj);
  293. }
  294. else {
  295. x = atof(tokens[xcol]);
  296. y = atof(tokens[ycol]);
  297. }
  298. G_debug(4, "x: %f, y: %f", x, y);
  299. if (zcol >= 0)
  300. z = atof(tokens[zcol]);
  301. else
  302. z = 0.0;
  303. if (catcol >= 0)
  304. cat = atof(tokens[catcol]);
  305. else
  306. cat++;
  307. Vect_reset_line(Points);
  308. Vect_reset_cats(Cats);
  309. Vect_append_point(Points, x, y, z);
  310. Vect_cat_set(Cats, 1, cat);
  311. Vect_write_line(Map, GV_POINT, Points, Cats);
  312. /* Attributes */
  313. if (driver) {
  314. sprintf(buf2, "insert into %s values ( ", table);
  315. db_set_string(&sql, buf2);
  316. if (catcol < 0) {
  317. sprintf(buf2, "%d, ", cat);
  318. db_append_string(&sql, buf2);
  319. }
  320. for (i = 0; i < ntokens; i++) {
  321. if (i > 0)
  322. db_append_string(&sql, ", ");
  323. if (strlen(tokens[i]) > 0) {
  324. if (coltype[i] == DB_C_TYPE_INT ||
  325. coltype[i] == DB_C_TYPE_DOUBLE) {
  326. if (G_projection() == PROJECTION_LL &&
  327. (i == xcol || i == ycol)) {
  328. if (i == xcol)
  329. sprintf(buf2, "%.15g", x);
  330. else
  331. sprintf(buf2, "%.15g", y);
  332. }
  333. else
  334. sprintf(buf2, "%s", tokens[i]);
  335. }
  336. else {
  337. db_set_string(&val, tokens[i]);
  338. /* TODO: strip leading and trailing "quotes" from input string */
  339. db_double_quote_string(&val);
  340. sprintf(buf2, "'%s'", db_get_string(&val));
  341. }
  342. }
  343. else {
  344. sprintf(buf2, "null");
  345. }
  346. db_append_string(&sql, buf2);
  347. }
  348. db_append_string(&sql, ")");
  349. G_debug(3, db_get_string(&sql));
  350. if (db_execute_immediate(driver, &sql) != DB_OK) {
  351. G_fatal_error(_("Unable to insert new record: %s"),
  352. db_get_string(&sql));
  353. }
  354. }
  355. G_percent(row, nrows, 2);
  356. G_free_tokens(tokens);
  357. row++;
  358. }
  359. return 0;
  360. }