// Copyright 2013 Daniel Parker // Distributed under the Boost license, Version 1.0. // (See accompanying file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) // See https://github.com/danielaparker/jsoncons for latest version #ifndef JSONCONS_CSV_CSV_READER_HPP #define JSONCONS_CSV_CSV_READER_HPP #include <string> #include <vector> #include <stdexcept> #include <memory> // std::allocator #include <utility> // std::move #include <istream> // std::basic_istream #include <jsoncons/source.hpp> #include <jsoncons/json_exception.hpp> #include <jsoncons/json_visitor.hpp> #include <jsoncons_ext/csv/csv_error.hpp> #include <jsoncons_ext/csv/csv_parser.hpp> #include <jsoncons/json.hpp> #include <jsoncons/json_reader.hpp> #include <jsoncons/json_decoder.hpp> #include <jsoncons/source_adaptor.hpp> #include <jsoncons_ext/csv/csv_options.hpp> namespace jsoncons { namespace csv { template<class CharT,class Source=jsoncons::stream_source<CharT>,class Allocator=std::allocator<char>> class basic_csv_reader { struct stack_item { stack_item() noexcept : array_begun_(false) { } bool array_begun_; }; using char_type = CharT; using temp_allocator_type = Allocator; typedef typename std::allocator_traits<temp_allocator_type>:: template rebind_alloc<CharT> char_allocator_type; basic_csv_reader(const basic_csv_reader&) = delete; basic_csv_reader& operator = (const basic_csv_reader&) = delete; basic_default_json_visitor<CharT> default_visitor_; text_source_adaptor<Source> source_; basic_json_visitor<CharT>& visitor_; basic_csv_parser<CharT,Allocator> parser_; public: // Structural characters static constexpr size_t default_max_buffer_size = 16384; //! Parse an input stream of CSV text into a json object /*! \param is The input stream to read from */ template <class Sourceable> basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const Allocator& alloc = Allocator()) : basic_csv_reader(std::forward<Sourceable>(source), visitor, basic_csv_decode_options<CharT>(), default_csv_parsing(), alloc) { } template <class Sourceable> basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const basic_csv_decode_options<CharT>& options, const Allocator& alloc = Allocator()) : basic_csv_reader(std::forward<Sourceable>(source), visitor, options, default_csv_parsing(), alloc) { } template <class Sourceable> basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, std::function<bool(csv_errc,const ser_context&)> err_handler, const Allocator& alloc = Allocator()) : basic_csv_reader(std::forward<Sourceable>(source), visitor, basic_csv_decode_options<CharT>(), err_handler, alloc) { } template <class Sourceable> basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const basic_csv_decode_options<CharT>& options, std::function<bool(csv_errc,const ser_context&)> err_handler, const Allocator& alloc = Allocator()) : source_(std::forward<Sourceable>(source)), visitor_(visitor), parser_(options, err_handler, alloc) { } ~basic_csv_reader() noexcept = default; void read() { std::error_code ec; read(ec); if (ec) { JSONCONS_THROW(ser_error(ec,parser_.line(),parser_.column())); } } void read(std::error_code& ec) { read_internal(ec); } std::size_t line() const { return parser_.line(); } std::size_t column() const { return parser_.column(); } bool eof() const { return parser_.source_exhausted() && source_.eof(); } private: void read_internal(std::error_code& ec) { if (source_.is_error()) { ec = csv_errc::source_error; return; } while (!parser_.stopped()) { if (parser_.source_exhausted()) { auto s = source_.read_buffer(ec); if (ec) return; if (s.size() > 0) { parser_.update(s.data(),s.size()); } } parser_.parse_some(visitor_, ec); if (ec) return; } } }; template<class CharT,class Source=jsoncons::stream_source<CharT>,class Allocator=std::allocator<char>> class legacy_basic_csv_reader { struct stack_item { stack_item() noexcept : array_begun_(false) { } bool array_begun_; }; using char_type = CharT; using temp_allocator_type = Allocator; typedef typename std::allocator_traits<temp_allocator_type>:: template rebind_alloc<CharT> char_allocator_type; legacy_basic_csv_reader(const legacy_basic_csv_reader&) = delete; legacy_basic_csv_reader& operator = (const legacy_basic_csv_reader&) = delete; basic_default_json_visitor<CharT> default_visitor_; text_source_adaptor<Source> source_; basic_json_visitor<CharT>& visitor_; basic_csv_parser<CharT,Allocator> parser_; public: // Structural characters static constexpr size_t default_max_buffer_size = 16384; //! Parse an input stream of CSV text into a json object /*! \param is The input stream to read from */ template <class Sourceable> legacy_basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const Allocator& alloc = Allocator()) : legacy_basic_csv_reader(std::forward<Sourceable>(source), visitor, basic_csv_decode_options<CharT>(), default_csv_parsing(), alloc) { } template <class Sourceable> legacy_basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const basic_csv_decode_options<CharT>& options, const Allocator& alloc = Allocator()) : legacy_basic_csv_reader(std::forward<Sourceable>(source), visitor, options, default_csv_parsing(), alloc) { } template <class Sourceable> legacy_basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, std::function<bool(csv_errc,const ser_context&)> err_handler, const Allocator& alloc = Allocator()) : legacy_basic_csv_reader(std::forward<Sourceable>(source), visitor, basic_csv_decode_options<CharT>(), err_handler, alloc) { } template <class Sourceable> legacy_basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const basic_csv_decode_options<CharT>& options, std::function<bool(csv_errc,const ser_context&)> err_handler, const Allocator& alloc = Allocator(), typename std::enable_if<!std::is_constructible<jsoncons::basic_string_view<CharT>,Sourceable>::value>::type* = 0) : source_(std::forward<Sourceable>(source)), visitor_(visitor), parser_(options, err_handler, alloc) { } template <class Sourceable> legacy_basic_csv_reader(Sourceable&& source, basic_json_visitor<CharT>& visitor, const basic_csv_decode_options<CharT>& options, std::function<bool(csv_errc,const ser_context&)> err_handler, const Allocator& alloc = Allocator(), typename std::enable_if<std::is_constructible<jsoncons::basic_string_view<CharT>,Sourceable>::value>::type* = 0) : source_(), visitor_(visitor), parser_(options, err_handler, alloc) { jsoncons::basic_string_view<CharT> sv(std::forward<Sourceable>(source)); auto r = unicode_traits::detect_encoding_from_bom(sv.data(), sv.size()); if (!(r.encoding == unicode_traits::encoding_kind::utf8 || r.encoding == unicode_traits::encoding_kind::undetected)) { JSONCONS_THROW(ser_error(json_errc::illegal_unicode_character,parser_.line(),parser_.column())); } std::size_t offset = (r.ptr - sv.data()); parser_.update(sv.data()+offset,sv.size()-offset); } ~legacy_basic_csv_reader() noexcept = default; void read() { std::error_code ec; read(ec); if (ec) { JSONCONS_THROW(ser_error(ec,parser_.line(),parser_.column())); } } void read(std::error_code& ec) { read_internal(ec); } std::size_t line() const { return parser_.line(); } std::size_t column() const { return parser_.column(); } bool eof() const { return parser_.source_exhausted() && source_.eof(); } private: void read_internal(std::error_code& ec) { if (source_.is_error()) { ec = csv_errc::source_error; return; } while (!parser_.stopped()) { if (parser_.source_exhausted()) { auto s = source_.read_buffer(ec); if (ec) return; if (s.size() > 0) { parser_.update(s.data(),s.size()); } } parser_.parse_some(visitor_, ec); if (ec) return; } } }; #if !defined(JSONCONS_NO_DEPRECATED) using csv_reader = legacy_basic_csv_reader<char>; using wcsv_reader = legacy_basic_csv_reader<wchar_t>; #endif using csv_string_reader = basic_csv_reader<char,string_source<char>>; using wcsv_string_reader = basic_csv_reader<wchar_t,string_source<wchar_t>>; using csv_stream_reader = basic_csv_reader<char,stream_source<char>>; using wcsv_stream_reader = basic_csv_reader<wchar_t,stream_source<wchar_t>>; }} #endif