/***************************************************************************** * * This file is part of Mapnik (c++ mapping toolkit) * * Copyright (C) 2015 Artem Pavlenko * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA * *****************************************************************************/ #ifndef MAPNIK_CSV_UTILS_DATASOURCE_HPP #define MAPNIK_CSV_UTILS_DATASOURCE_HPP // mapnik #include #include #include #include #include #include // std #include #include #include namespace csv_utils { mapnik::csv_line parse_line(char const* start, char const* end, char separator, char quote, std::size_t num_columns); mapnik::csv_line parse_line(std::string const& line_str, char separator, char quote); bool is_likely_number(std::string const& value); bool ignore_case_equal(std::string const& s0, std::string const& s1); struct geometry_column_locator { geometry_column_locator() : type(UNKNOWN), index(-1), index2(-1) {} enum { UNKNOWN = 0, WKT, GEOJSON, LON_LAT } type; std::size_t index; std::size_t index2; }; namespace detail { std::size_t file_length(std::istream & stream); std::tuple autodect_csv_flavour(std::istream & stream, std::size_t file_length); void locate_geometry_column(std::string const& header, std::size_t index, geometry_column_locator & locator); bool valid(geometry_column_locator const& locator, std::size_t max_size); } // namespace detail mapnik::geometry::geometry extract_geometry(std::vector const& row, geometry_column_locator const& locator); template void process_properties(Feature & feature, Headers const& headers, Values const& values, Locator const& locator, Transcoder const& tr) { auto val_beg = values.begin(); auto val_end = values.end(); auto num_headers = headers.size(); for (std::size_t i = 0; i < num_headers; ++i) { std::string const& fld_name = headers.at(i); if (val_beg == val_end) { feature.put(fld_name,tr.transcode("")); continue; } std::string value = mapnik::util::trim_copy(*val_beg++); int value_length = value.length(); if (locator.index == i && (locator.type == geometry_column_locator::WKT || locator.type == geometry_column_locator::GEOJSON) ) continue; bool matched = false; bool has_dot = value.find(".") != std::string::npos; if (value.empty() || (value_length > 20) || (value_length > 1 && !has_dot && value[0] == '0')) { matched = true; feature.put(fld_name,std::move(tr.transcode(value.c_str()))); } else if (csv_utils::is_likely_number(value)) { bool has_e = value.find("e") != std::string::npos; if (has_dot || has_e) { double float_val = 0.0; if (mapnik::util::string2double(value,float_val)) { matched = true; feature.put(fld_name,float_val); } } else { mapnik::value_integer int_val = 0; if (mapnik::util::string2int(value,int_val)) { matched = true; feature.put(fld_name,int_val); } } } if (!matched) { if (csv_utils::ignore_case_equal(value, "true")) { feature.put(fld_name, true); } else if (csv_utils::ignore_case_equal(value, "false")) { feature.put(fld_name, false); } else // fallback to string { feature.put(fld_name,std::move(tr.transcode(value.c_str()))); } } } } struct csv_file_parser { using box_type = mapnik::box2d; using item_type = std::pair>; using boxes_type = std::vector; void parse_csv(std::istream & csv_file, boxes_type & boxes); virtual void add_feature(mapnik::value_integer index, mapnik::csv_line const & values); std::vector headers_; std::string manual_headers_; geometry_column_locator locator_; mapnik::box2d extent_; mapnik::value_integer row_limit_ = 0; char separator_ = '\0'; char quote_ = '\0'; bool strict_ = false; bool extent_initialized_ = false; bool has_disk_index_ = false; }; } // namespace csv_utils #endif // MAPNIK_CSV_UTILS_DATASOURCE_HPP