diff options
author | Dominick Allen <djallen@librehumanitas.org> | 2025-01-01 17:41:17 -0600 |
---|---|---|
committer | Dominick Allen <djallen@librehumanitas.org> | 2025-01-01 17:41:17 -0600 |
commit | 16379362c02a2472f00fac49cad62788547c9519 (patch) | |
tree | 9b7f42acbba8dd259a536287a2b130e92ad2e2c7 /include/fud_csv.hpp | |
parent | 012df4bc38777c9053353ec2c4213bba67d63ab4 (diff) |
Add CSV parsing, printing, fix buffered file reading.
Diffstat (limited to 'include/fud_csv.hpp')
-rw-r--r-- | include/fud_csv.hpp | 82 |
1 files changed, 82 insertions, 0 deletions
diff --git a/include/fud_csv.hpp b/include/fud_csv.hpp new file mode 100644 index 0000000..efd37e6 --- /dev/null +++ b/include/fud_csv.hpp @@ -0,0 +1,82 @@ +/* + * libfud + * Copyright 2025 Dominick Allen + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#ifndef FUD_CSV_HPP +#define FUD_CSV_HPP + +#include "fud_file.hpp" +#include "fud_status.hpp" +#include "fud_string_view.hpp" +#include "fud_text.hpp" +#include "fud_vector.hpp" + +#include <functional> // reference_wrapper + +namespace fud { + +using TextBuffer = Vector<std::byte>; +using CsvBuffer = Vector<std::byte>; +using CsvLine = Vector<StringView>; + +struct Csv { + /** \brief The number of lines of data in the CSV. */ + size_t numLines; + + /** \brief The number of columns in the CSV. */ + size_t numColumns; + + /** \brief Buffer for each line with numColumns of StringView. */ + Vector<CsvLine> lines; + + /** \brief Backing buffer for data. */ + CsvBuffer buffer; + + /** \separator for each column */ + Utf8 columnDelimiter{Ascii{','}}; + + /** \separator for each line */ + NewlineRepr newlineDelimiter{NewlineRepr::Posix}; + + bool strict; + + /** \brief Uses global Fud allocator for lines and backing buffer. */ + static Csv makeDefault(); + + /** \brief Specify allocator to use for both lines and backing buffer. */ + static Csv makeSingleAllocator(Allocator& allocator); + + /** \brief Specify allocator. */ + static Csv make(Allocator& lineAllocator, Allocator& bufferAllocator); + + /** Consume and return the CSV. */ + static FudStatus parseCsvFromFilename( + Csv& csv, + Option<TextBuffer&&> bufferOption, + StringView filename, + OpenFlags flags = OpenFlags{}, + Option<int> dirFdOption = NullOpt); + + // assumes file is at start + static FudStatus parseCsvFromUnbufferedFile(Csv& csv, RegularFile&& file); + + // assumes file is at start + static FudStatus parseCsvFromBufferedFile(Csv& csv, BufferedRegularFile& file); +}; + +} // namespace fud + +#endif |