aboutsummaryrefslogtreecommitdiff
path: root/include/jsoncons_ext/csv/csv_reader.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'include/jsoncons_ext/csv/csv_reader.hpp')
-rw-r--r--include/jsoncons_ext/csv/csv_reader.hpp348
1 files changed, 348 insertions, 0 deletions
diff --git a/include/jsoncons_ext/csv/csv_reader.hpp b/include/jsoncons_ext/csv/csv_reader.hpp
new file mode 100644
index 0000000..f10211a
--- /dev/null
+++ b/include/jsoncons_ext/csv/csv_reader.hpp
@@ -0,0 +1,348 @@
+// Copyright 2013 Daniel Parker
+// Distributed under the Boost license, Version 1.0.
+// (See accompanying file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
+
+// See https://github.com/danielaparker/jsoncons for latest version
+
+#ifndef JSONCONS_CSV_CSV_READER_HPP
+#define JSONCONS_CSV_CSV_READER_HPP
+
+#include <string>
+#include <vector>
+#include <stdexcept>
+#include <memory> // std::allocator
+#include <utility> // std::move
+#include <istream> // std::basic_istream
+#include <jsoncons/source.hpp>
+#include <jsoncons/json_exception.hpp>
+#include <jsoncons/json_visitor.hpp>
+#include <jsoncons_ext/csv/csv_error.hpp>
+#include <jsoncons_ext/csv/csv_parser.hpp>
+#include <jsoncons/json.hpp>
+#include <jsoncons/json_reader.hpp>
+#include <jsoncons/json_decoder.hpp>
+#include <jsoncons/source_adaptor.hpp>
+#include <jsoncons_ext/csv/csv_options.hpp>
+
+namespace jsoncons { namespace csv {
+
+ template<class CharT,class Source=jsoncons::stream_source<CharT>,class Allocator=std::allocator<char>>
+ class basic_csv_reader
+ {
+ struct stack_item
+ {
+ stack_item() noexcept
+ : array_begun_(false)
+ {
+ }
+
+ bool array_begun_;
+ };
+ using char_type = CharT;
+ using temp_allocator_type = Allocator;
+ typedef typename std::allocator_traits<temp_allocator_type>:: template rebind_alloc<CharT> char_allocator_type;
+
+ basic_csv_reader(const basic_csv_reader&) = delete;
+ basic_csv_reader& operator = (const basic_csv_reader&) = delete;
+
+ basic_default_json_visitor<CharT> default_visitor_;
+ text_source_adaptor<Source> source_;
+ basic_json_visitor<CharT>& visitor_;
+ basic_csv_parser<CharT,Allocator> parser_;
+
+ public:
+ // Structural characters
+ static constexpr size_t default_max_buffer_size = 16384;
+ //! Parse an input stream of CSV text into a json object
+ /*!
+ \param is The input stream to read from
+ */
+
+ template <class Sourceable>
+ basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const Allocator& alloc = Allocator())
+
+ : basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ basic_csv_decode_options<CharT>(),
+ default_csv_parsing(),
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const basic_csv_decode_options<CharT>& options,
+ const Allocator& alloc = Allocator())
+
+ : basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ options,
+ default_csv_parsing(),
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ std::function<bool(csv_errc,const ser_context&)> err_handler,
+ const Allocator& alloc = Allocator())
+ : basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ basic_csv_decode_options<CharT>(),
+ err_handler,
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const basic_csv_decode_options<CharT>& options,
+ std::function<bool(csv_errc,const ser_context&)> err_handler,
+ const Allocator& alloc = Allocator())
+ : source_(std::forward<Sourceable>(source)),
+ visitor_(visitor),
+ parser_(options, err_handler, alloc)
+
+ {
+ }
+
+ ~basic_csv_reader() noexcept = default;
+
+ void read()
+ {
+ std::error_code ec;
+ read(ec);
+ if (ec)
+ {
+ JSONCONS_THROW(ser_error(ec,parser_.line(),parser_.column()));
+ }
+ }
+
+ void read(std::error_code& ec)
+ {
+ read_internal(ec);
+ }
+
+ std::size_t line() const
+ {
+ return parser_.line();
+ }
+
+ std::size_t column() const
+ {
+ return parser_.column();
+ }
+
+ bool eof() const
+ {
+ return parser_.source_exhausted() && source_.eof();
+ }
+
+ private:
+
+ void read_internal(std::error_code& ec)
+ {
+ if (source_.is_error())
+ {
+ ec = csv_errc::source_error;
+ return;
+ }
+ while (!parser_.stopped())
+ {
+ if (parser_.source_exhausted())
+ {
+ auto s = source_.read_buffer(ec);
+ if (ec) return;
+ if (s.size() > 0)
+ {
+ parser_.update(s.data(),s.size());
+ }
+ }
+ parser_.parse_some(visitor_, ec);
+ if (ec) return;
+ }
+ }
+ };
+
+ template<class CharT,class Source=jsoncons::stream_source<CharT>,class Allocator=std::allocator<char>>
+ class legacy_basic_csv_reader
+ {
+ struct stack_item
+ {
+ stack_item() noexcept
+ : array_begun_(false)
+ {
+ }
+
+ bool array_begun_;
+ };
+ using char_type = CharT;
+ using temp_allocator_type = Allocator;
+ typedef typename std::allocator_traits<temp_allocator_type>:: template rebind_alloc<CharT> char_allocator_type;
+
+ legacy_basic_csv_reader(const legacy_basic_csv_reader&) = delete;
+ legacy_basic_csv_reader& operator = (const legacy_basic_csv_reader&) = delete;
+
+ basic_default_json_visitor<CharT> default_visitor_;
+ text_source_adaptor<Source> source_;
+ basic_json_visitor<CharT>& visitor_;
+ basic_csv_parser<CharT,Allocator> parser_;
+
+ public:
+ // Structural characters
+ static constexpr size_t default_max_buffer_size = 16384;
+ //! Parse an input stream of CSV text into a json object
+ /*!
+ \param is The input stream to read from
+ */
+
+ template <class Sourceable>
+ legacy_basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const Allocator& alloc = Allocator())
+
+ : legacy_basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ basic_csv_decode_options<CharT>(),
+ default_csv_parsing(),
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ legacy_basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const basic_csv_decode_options<CharT>& options,
+ const Allocator& alloc = Allocator())
+
+ : legacy_basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ options,
+ default_csv_parsing(),
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ legacy_basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ std::function<bool(csv_errc,const ser_context&)> err_handler,
+ const Allocator& alloc = Allocator())
+ : legacy_basic_csv_reader(std::forward<Sourceable>(source),
+ visitor,
+ basic_csv_decode_options<CharT>(),
+ err_handler,
+ alloc)
+ {
+ }
+
+ template <class Sourceable>
+ legacy_basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const basic_csv_decode_options<CharT>& options,
+ std::function<bool(csv_errc,const ser_context&)> err_handler,
+ const Allocator& alloc = Allocator(),
+ typename std::enable_if<!std::is_constructible<jsoncons::basic_string_view<CharT>,Sourceable>::value>::type* = 0)
+ : source_(std::forward<Sourceable>(source)),
+ visitor_(visitor),
+ parser_(options, err_handler, alloc)
+ {
+ }
+
+ template <class Sourceable>
+ legacy_basic_csv_reader(Sourceable&& source,
+ basic_json_visitor<CharT>& visitor,
+ const basic_csv_decode_options<CharT>& options,
+ std::function<bool(csv_errc,const ser_context&)> err_handler,
+ const Allocator& alloc = Allocator(),
+ typename std::enable_if<std::is_constructible<jsoncons::basic_string_view<CharT>,Sourceable>::value>::type* = 0)
+ : source_(),
+ visitor_(visitor),
+ parser_(options, err_handler, alloc)
+ {
+ jsoncons::basic_string_view<CharT> sv(std::forward<Sourceable>(source));
+ auto r = unicode_traits::detect_encoding_from_bom(sv.data(), sv.size());
+ if (!(r.encoding == unicode_traits::encoding_kind::utf8 || r.encoding == unicode_traits::encoding_kind::undetected))
+ {
+ JSONCONS_THROW(ser_error(json_errc::illegal_unicode_character,parser_.line(),parser_.column()));
+ }
+ std::size_t offset = (r.ptr - sv.data());
+ parser_.update(sv.data()+offset,sv.size()-offset);
+ }
+
+ ~legacy_basic_csv_reader() noexcept = default;
+
+ void read()
+ {
+ std::error_code ec;
+ read(ec);
+ if (ec)
+ {
+ JSONCONS_THROW(ser_error(ec,parser_.line(),parser_.column()));
+ }
+ }
+
+ void read(std::error_code& ec)
+ {
+ read_internal(ec);
+ }
+
+ std::size_t line() const
+ {
+ return parser_.line();
+ }
+
+ std::size_t column() const
+ {
+ return parser_.column();
+ }
+
+ bool eof() const
+ {
+ return parser_.source_exhausted() && source_.eof();
+ }
+
+ private:
+
+ void read_internal(std::error_code& ec)
+ {
+ if (source_.is_error())
+ {
+ ec = csv_errc::source_error;
+ return;
+ }
+ while (!parser_.stopped())
+ {
+ if (parser_.source_exhausted())
+ {
+ auto s = source_.read_buffer(ec);
+ if (ec) return;
+ if (s.size() > 0)
+ {
+ parser_.update(s.data(),s.size());
+ }
+ }
+ parser_.parse_some(visitor_, ec);
+ if (ec) return;
+ }
+ }
+ };
+
+#if !defined(JSONCONS_NO_DEPRECATED)
+ using csv_reader = legacy_basic_csv_reader<char>;
+ using wcsv_reader = legacy_basic_csv_reader<wchar_t>;
+#endif
+
+ using csv_string_reader = basic_csv_reader<char,string_source<char>>;
+ using wcsv_string_reader = basic_csv_reader<wchar_t,string_source<wchar_t>>;
+ using csv_stream_reader = basic_csv_reader<char,stream_source<char>>;
+ using wcsv_stream_reader = basic_csv_reader<wchar_t,stream_source<wchar_t>>;
+
+}}
+
+#endif