#include "csv.hpp" #include "text.hpp" std::vector csv_split(const char *s) { std::vector ret; while (*s && *s != '\n' && *s != '\r') { const char *start = s; int within = 0; for (; *s && *s != '\n' && *s != '\r'; s++) { if (*s == '"') { within = !within; } if (*s == ',' && !within) { break; } } std::string v = std::string(start, s - start); ret.push_back(v); if (*s == ',') { s++; while (*s && isspace(*s)) { s++; } if (*s == '\0' || *s == '\r' || *s == '\n') { ret.push_back(std::string("")); break; } } } return ret; } std::string csv_dequote(std::string s) { std::string out; for (size_t i = 0; i < s.size(); i++) { if (s[i] == '"') { if (i + 1 < s.size() && s[i + 1] == '"') { out.push_back('"'); } } else { out.push_back(s[i]); } } return out; } std::string csv_getline(FILE *f) { std::string out; int c; while ((c = getc(f)) != EOF) { out.push_back(c); if (c == '\n') { break; } } return out; } void readcsv(const char *fn, std::vector &header, std::map> &mapping) { FILE *f = fopen(fn, "r"); if (f == NULL) { perror(fn); exit(EXIT_FAILURE); } std::string s; if ((s = csv_getline(f)).size() > 0) { std::string err = check_utf8(s); if (err != "") { fprintf(stderr, "%s: %s\n", fn, err.c_str()); exit(EXIT_FAILURE); } header = csv_split(s.c_str()); for (size_t i = 0; i < header.size(); i++) { header[i] = csv_dequote(header[i]); } } while ((s = csv_getline(f)).size() > 0) { std::string err = check_utf8(s); if (err != "") { fprintf(stderr, "%s: %s\n", fn, err.c_str()); exit(EXIT_FAILURE); } std::vector line = csv_split(s.c_str()); if (line.size() > 0) { line[0] = csv_dequote(line[0]); } for (size_t i = 0; i < line.size() && i < header.size(); i++) { // printf("putting %s\n", line[0].c_str()); mapping.insert(std::pair>(line[0], line)); } } if (fclose(f) != 0) { perror("fclose"); exit(EXIT_FAILURE); } } // Follow JSON rules for what looks like a number bool is_number(std::string const &s) { const char *cp = s.c_str(); char c = *(cp++); if (c == '-' || (c >= '0' && c <= '9')) { if (c == '-') { c = *(cp++); } if (c == '0') { ; } else if (c >= '1' && c <= '9') { c = *cp; while (c >= '0' && c <= '9') { cp++; c = *cp; } } if (*cp == '.') { cp++; c = *cp; if (c < '0' || c > '9') { return false; } while (c >= '0' && c <= '9') { cp++; c = *cp; } } c = *cp; if (c == 'e' || c == 'E') { cp++; c = *cp; if (c == '+' || c == '-') { cp++; } c = *cp; if (c < '0' || c > '9') { return false; } while (c >= '0' && c <= '9') { cp++; c = *cp; } } if (*cp == '\0') { return true; } else { // Something non-numeric at the end return false; } } return false; }