pikotools/src/csv/csvparser.h

163 lines
3.9 KiB
C++

/*
* This file is a part of PikoTools
* and is distributed under the (new) BSD licence.
* Author: Tomasz Sowa <t.sowa@ttmath.org>
*/
/*
* Copyright (c) 2021, Tomasz Sowa
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* * Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
*
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* * Neither the name Tomasz Sowa nor the names of contributors to this
* project may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
* THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef headerfile_picotools_csv_csvparser
#define headerfile_picotools_csv_csvparser
#include "space/space.h"
#include <string>
#include <fstream>
namespace PT
{
/*
*
* https://datatracker.ietf.org/doc/html/rfc4180
*
*/
class CSVParser
{
public:
enum Status
{
ok,
cant_open_file,
};
Status parse_file(const char * file_name, Space & out_space);
Status parse_file(const std::string & file_name, Space & out_space);
Status parse_file(const wchar_t * file_name, Space & out_space);
Status parse_file(const std::wstring & file_name, Space & out_space);
Status parse(const char * str, Space & out_space);
Status parse(const std::string & str, Space & out_space);
Status parse(const wchar_t * str, Space & out_space);
Status parse(const std::wstring & str, Space & out_space);
protected:
/*
the last status of parsing, set by Parse() methods
*/
Status status;
Space * space;
/*
true if parse_file() method was called
false if parse() was called
*/
bool reading_from_file;
/*
true if parse(wchar_t *) or parse(std::wstring&) was called
*/
bool reading_from_wchar_string;
/*
pointers to the current character
if parse() is being used
*/
const char * pchar_ascii;
const wchar_t * pchar_unicode;
/*
last read char
or -1 if the end
*/
int lastc;
/*
a number of a line in which there is a syntax_error
*/
int line;
/*
current file
may it would be better to make a pointer?
if we parse only a string then there is no sense to have such an object
*/
std::ifstream file;
/*
input file is in UTF-8
default: true
*/
bool input_as_utf8;
void parse();
void parse_row(Space & row_space);
bool read_value_to(Space & row_space);
bool read_quoted_value_to(std::wstring & value);
bool read_non_quoted_value_to(std::wstring & value);
/*
* copied from SpaceParser
* may it would be better to have a class with those methods and inherit from it?
*/
int read_utf8_char();
int read_ascii_char();
int read_char_from_wchar_string();
int read_char_from_utf8_string();
int read_char_from_ascii_string();
int read_char_no_escape();
int read_char();
};
}
#endif