points.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463
#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include <ctype.h>
#include <errno.h>
#include <grass/gis.h>
#include <grass/dbmi.h>
#include <grass/vector.h>
#include <grass/glocale.h>
#include "local_proto.h"
  10. /* Determine if the string is integer, e.g. 123, +123, -123,
  11. * return 1 if integer, 0 otherwise */
  12. static int is_int(char *str)
  13. {
  14. char *tail;
  15. if (strtol(str, &tail, 10), tail == str || *tail != '\0') {
  16. /* doesn't look like a number,
  17. or has extra characters after what looks to be a number */
  18. return 0;
  19. }
  20. return 1;
  21. }
  22. /* Determine if the string is double, e.g. 123.456, +123.456, -123.456, 1.23456e2
  23. * return 1 if double, 0 otherwise */
  24. static int is_double(char *str)
  25. {
  26. char *tail;
  27. if (strtod(str, &tail), tail == str || *tail != '\0') {
  28. /* doesn't look like a number,
  29. or has extra characters after what looks to be a number */
  30. return 0;
  31. }
  32. return 1;
  33. }
  34. /* Analyse points ascii file. Determine number of columns and column types.
  35. * ascii_tmp: write copy of tempfile to ascii_tmp:
  36. * rowlength: maximum row length
  37. * ncolumns: number of columns
  38. * minncolumns: minimum number of columns
  39. * nrows: number of rows
  40. * column_type: column types
  41. * column_length: column lengths (string only)
  42. */
  43. int points_analyse(FILE * ascii_in, FILE * ascii, char *fs, char *td,
  44. int *rowlength, int *ncolumns, int *minncolumns,
  45. int *nrows, int **column_type, int **column_length,
  46. int skip_lines, int xcol, int ycol, int zcol, int catcol,
  47. int region_flag, int ignore_flag)
  48. {
  49. int i;
  50. int buflen; /* buffer length */
  51. char *buf; /* buffer */
  52. int row = 1; /* line number, first is 1 */
  53. int ncols = 0; /* number of columns */
  54. int minncols = -1;
  55. int *coltype = NULL; /* column types */
  56. int *collen = NULL; /* column lengths */
  57. char **tokens;
  58. int ntokens; /* number of tokens */
  59. int len, rowlen = 0; /* maximum row length */
  60. struct Cell_head window;
  61. double northing = .0;
  62. double easting = .0;
  63. char *xtoken, *ytoken, *sav_buf;
  64. int skip = FALSE, skipped = 0;
  65. buflen = 4000;
  66. buf = (char *)G_malloc(buflen);
  67. xtoken = (char *)G_malloc(256);
  68. ytoken = (char *)G_malloc(256);
  69. G_message(_("Scanning input for column types..."));
  70. /* fetch projection for LatLong test */
  71. G_get_window(&window);
  72. /* points_to_bin() would be faster if we would write out
  73. * clean data to ascii
  74. * points_to_bin() would then not need G_chop() and
  75. * for latlon not G_scan_[easting|northing]() */
  76. while (1) {
  77. len = 0; /* not really needed, but what the heck */
  78. skip = FALSE; /* reset out-of-region check */
  79. sav_buf = NULL;
  80. if (G_getl2(buf, buflen - 1, ascii_in) == 0)
  81. break; /* EOF */
  82. if (row <= skip_lines) {
  83. G_debug(3, "skipping header row %d : %d chars", row,
  84. (int)strlen(buf));
  85. /* this fn is read-only, write to hist with points_to_bin() */
  86. fprintf(ascii, "%s\n", buf);
  87. len = strlen(buf) + 1;
  88. if (len > rowlen)
  89. rowlen = len;
  90. row++;
  91. continue;
  92. }
  93. if ((buf[0] == '#') || (buf[0] == '\0')) {
  94. G_debug(3, "skipping comment row %d : %d chars", row,
  95. (int)strlen(buf));
  96. continue;
  97. }
  98. /* no G_chop() as first/last column may be empty fs=tab value */
  99. G_debug(3, "row %d : %d chars", row, (int)strlen(buf));
  100. tokens = G_tokenize2(buf, fs, td);
  101. ntokens = G_number_of_tokens(tokens);
  102. if (ntokens == 0) {
  103. continue;
  104. }
  105. if (ncols > 0 && ntokens != ncols) {
  106. /* these rows can not be imported into the attribute table */
  107. if (ignore_flag) {
  108. G_warning(_("Row %d: '%s' can not be imported into the attribute table"),
  109. row, buf);
  110. }
  111. else {
  112. G_fatal_error(_("Broken row %d: '%s'"), row, buf);
  113. }
  114. }
  115. if (xcol >= ntokens || ycol >= ntokens || zcol >= ntokens ||
  116. catcol >= ntokens) {
  117. if (ignore_flag) {
  118. G_debug(3, "Skipping broken row %d: '%s'", row, buf);
  119. continue;
  120. }
  121. else {
  122. G_fatal_error(_("Broken row %d: '%s'"), row, buf);
  123. }
  124. }
  125. len = strlen(buf) + 1;
  126. if (len > rowlen)
  127. rowlen = len;
  128. if (ntokens > ncols) {
  129. coltype = (int *)G_realloc(coltype, ntokens * sizeof(int));
  130. collen = (int *)G_realloc(collen, ntokens * sizeof(int));
  131. for (i = ncols; i < ntokens; i++) {
  132. coltype[i] = DB_C_TYPE_INT; /* default type */
  133. collen[i] = 0;
  134. }
  135. ncols = ntokens;
  136. }
  137. if (minncols == -1 || minncols > ntokens)
  138. minncols = ntokens;
  139. /* Determine column types */
  140. for (i = 0; i < ntokens; i++) {
  141. G_chop(tokens[i]);
  142. if ((G_projection() == PROJECTION_LL)) {
  143. if (i == xcol || i == ycol) {
  144. if (i == 0) { /* Save position of original internal token buffer */
  145. /* Prevent memory leaks */
  146. sav_buf = tokens[0];
  147. }
  148. /* check if coordinates are DMS or decimal or not latlong at all */
  149. if (i == xcol) {
  150. if (G_scan_easting(tokens[i], &easting, window.proj)) {
  151. G_debug(4, "is_latlong east: %g", easting);
  152. sprintf(xtoken, "%.15g", easting);
  153. /* replace current DMS token by decimal degree */
  154. tokens[i] = xtoken;
  155. if (region_flag) {
  156. if ((window.east < easting) ||
  157. (window.west > easting))
  158. skip = TRUE;
  159. }
  160. }
  161. else {
  162. fprintf(stderr, _("Current row %d:\n%s\n"), row, buf);
  163. G_fatal_error(_("Unparsable longitude value in column %d: %s"),
  164. i + 1, tokens[i]);
  165. }
  166. }
  167. if (i == ycol) {
  168. if (G_scan_northing(tokens[i], &northing, window.proj)) {
  169. G_debug(4, "is_latlong north: %g", northing);
  170. sprintf(ytoken, "%.15g", northing);
  171. /* replace current DMS token by decimal degree */
  172. tokens[i] = ytoken;
  173. if (region_flag) {
  174. if ((window.north < northing) ||
  175. (window.south > northing))
  176. skip = TRUE;
  177. }
  178. }
  179. else {
  180. fprintf(stderr, _("Current row %d:\n%s\n"), row, buf);
  181. G_fatal_error(_("Unparsable latitude value in column %d: %s"),
  182. i + 1, tokens[i]);
  183. }
  184. }
  185. } /* if (x or y) */
  186. } /* PROJECTION_LL */
  187. else {
  188. if (strlen(tokens[i]) == 0) {
  189. if (i == xcol) {
  190. G_fatal_error(_("Unparsable longitude value in column %d: %s"),
  191. i + 1, tokens[i]);
  192. }
  193. if (i == ycol) {
  194. G_fatal_error(_("Unparsable latitude value in column %d: %s"),
  195. i + 1, tokens[i]);
  196. }
  197. }
  198. if (region_flag) {
  199. /* consider z range if -z flag is used? */
  200. /* change to if(>= east,north){skip=1;} to allow correct tiling */
  201. /* don't "continue;" so multiple passes will have the
  202. same column types and length for patching */
  203. if (i == xcol) {
  204. easting = atof(tokens[i]);
  205. if ((window.east < easting) ||
  206. (window.west > easting))
  207. skip = TRUE;
  208. }
  209. if (i == ycol) {
  210. northing = atof(tokens[i]);
  211. if ((window.north < northing) ||
  212. (window.south > northing))
  213. skip = TRUE;
  214. }
  215. }
  216. }
  217. len = strlen(tokens[i]);
  218. /* do not guess column type for missing values */
  219. if (len == 0)
  220. continue;
  221. G_debug(4, "row %d col %d: '%s' is_int = %d is_double = %d",
  222. row + 1, i + 1, tokens[i], is_int(tokens[i]),
  223. is_double(tokens[i]));
  224. if (is_int(tokens[i])) {
  225. continue; /* integer */
  226. }
  227. if (is_double(tokens[i])) { /* double */
  228. if (coltype[i] == DB_C_TYPE_INT) {
  229. coltype[i] = DB_C_TYPE_DOUBLE;
  230. }
  231. continue;
  232. }
  233. /* string */
  234. coltype[i] = DB_C_TYPE_STRING;
  235. if (len > collen[i])
  236. collen[i] = len;
  237. }
  238. /* write dataline to tmp file */
  239. if (!skip)
  240. fprintf(ascii, "%s\n", buf);
  241. else
  242. skipped++;
  243. if (sav_buf != NULL) {
  244. /* Restore original token buffer so free_tokens works */
  245. /* Only do this if tokens[0] was re-assigned */
  246. tokens[0] = sav_buf;
  247. sav_buf = NULL;
  248. }
  249. G_free_tokens(tokens);
  250. row++;
  251. }
  252. *rowlength = rowlen;
  253. *ncolumns = ncols;
  254. *minncolumns = minncols;
  255. *column_type = coltype;
  256. *column_length = collen;
  257. *nrows = row - 1; /* including skipped lines */
  258. G_free(buf);
  259. G_free(xtoken);
  260. G_free(ytoken);
  261. if (region_flag)
  262. G_message(n_("Skipping %d of %d row falling outside of current region",
  263. "Skipping %d of %d rows falling outside of current region",
  264. row - 1),
  265. skipped, row - 1);
  266. return 0;
  267. }
  268. /* Import points from ascii file.
  269. *
  270. * fs: field separator
  271. * xcol, ycol, zcol, catcol: x,y,z,cat column in input file, first column is 1,
  272. * zcol and catcol may be 0 (do not use)
  273. * rowlen: maximum row length
  274. * Note: column types (both in header or coldef) must be supported by driver
  275. */
  276. int points_to_bin(FILE * ascii, int rowlen, struct Map_info *Map,
  277. dbDriver * driver, char *table, char *fs, char *td,
  278. int nrows, int *coltype, int xcol, int ycol, int zcol,
  279. int catcol, int skip_lines)
  280. {
  281. char *buf, buf2[4000];
  282. int cat = 0;
  283. int row = 0;
  284. struct line_pnts *Points;
  285. struct line_cats *Cats;
  286. dbString sql, val;
  287. struct Cell_head window;
  288. G_message(_("Importing points..."));
  289. /* fetch projection for LatLong test */
  290. G_get_window(&window);
  291. rewind(ascii);
  292. Points = Vect_new_line_struct();
  293. Cats = Vect_new_cats_struct();
  294. /* actually last 2 characters won't be read */
  295. buf = (char *)G_malloc(rowlen + 2);
  296. db_init_string(&sql);
  297. db_init_string(&val);
  298. if (skip_lines > 0) {
  299. sprintf(buf2, "HEADER: (%d lines)\n", skip_lines);
  300. Vect_hist_write(Map, buf2);
  301. }
  302. /* rowlen + 2 to read till the end of line on both UNIX and Windows */
  303. while (G_getl2(buf, rowlen + 2, ascii) != 0) {
  304. int i, len;
  305. double x, y, z;
  306. char **tokens;
  307. int ntokens; /* number of tokens */
  308. G_percent(row, nrows, 2);
  309. row++;
  310. if (row <= skip_lines) {
  311. G_debug(4, "writing skip line %d to hist : %d chars", row,
  312. (int)strlen(buf));
  313. Vect_hist_write(Map, buf);
  314. Vect_hist_write(Map, "\n");
  315. continue;
  316. }
  317. len = strlen(buf);
  318. if (len == 0)
  319. continue; /* should not happen */
  320. G_debug(4, "row: %s", buf);
  321. tokens = G_tokenize2(buf, fs, td);
  322. ntokens = G_number_of_tokens(tokens);
  323. G_chop(tokens[xcol]);
  324. G_chop(tokens[ycol]);
  325. if ((G_projection() == PROJECTION_LL)) {
  326. G_scan_easting(tokens[xcol], &x, window.proj);
  327. G_scan_northing(tokens[ycol], &y, window.proj);
  328. }
  329. else {
  330. x = atof(tokens[xcol]);
  331. y = atof(tokens[ycol]);
  332. }
  333. G_debug(4, "x: %f, y: %f", x, y);
  334. if (zcol >= 0) {
  335. G_chop(tokens[zcol]);
  336. z = atof(tokens[zcol]);
  337. }
  338. else
  339. z = 0.0;
  340. if (catcol >= 0) {
  341. G_chop(tokens[catcol]);
  342. cat = atof(tokens[catcol]);
  343. }
  344. else
  345. cat++;
  346. Vect_reset_line(Points);
  347. Vect_reset_cats(Cats);
  348. Vect_append_point(Points, x, y, z);
  349. Vect_cat_set(Cats, 1, cat);
  350. Vect_write_line(Map, GV_POINT, Points, Cats);
  351. /* Attributes */
  352. if (driver) {
  353. sprintf(buf2, "insert into %s values ( ", table);
  354. db_set_string(&sql, buf2);
  355. if (catcol < 0) {
  356. sprintf(buf2, "%d, ", cat);
  357. db_append_string(&sql, buf2);
  358. }
  359. for (i = 0; i < ntokens; i++) {
  360. G_chop(tokens[i]);
  361. if (i > 0)
  362. db_append_string(&sql, ", ");
  363. if (strlen(tokens[i]) > 0) {
  364. if (coltype[i] == DB_C_TYPE_INT ||
  365. coltype[i] == DB_C_TYPE_DOUBLE) {
  366. if (G_projection() == PROJECTION_LL &&
  367. (i == xcol || i == ycol)) {
  368. if (i == xcol)
  369. sprintf(buf2, "%.15g", x);
  370. else
  371. sprintf(buf2, "%.15g", y);
  372. }
  373. else
  374. sprintf(buf2, "%s", tokens[i]);
  375. }
  376. else {
  377. db_set_string(&val, tokens[i]);
  378. /* TODO: strip leading and trailing "quotes" from input string */
  379. db_double_quote_string(&val);
  380. sprintf(buf2, "'%s'", db_get_string(&val));
  381. }
  382. }
  383. else {
  384. sprintf(buf2, "null");
  385. }
  386. db_append_string(&sql, buf2);
  387. }
  388. db_append_string(&sql, ")");
  389. G_debug(3, db_get_string(&sql));
  390. if (db_execute_immediate(driver, &sql) != DB_OK) {
  391. G_fatal_error(_("Unable to insert new record: %s"),
  392. db_get_string(&sql));
  393. }
  394. }
  395. G_free_tokens(tokens);
  396. }
  397. G_percent(nrows, nrows, 2);
  398. return 0;
  399. }