From 32e14551a90e85000e41b3f0445d34d58a1431e4 Mon Sep 17 00:00:00 2001 From: Joel Klinghed Date: Wed, 10 Sep 2025 22:12:22 +0200 Subject: Add unicode general category lookup Generate the lookup tables from UnicodeData.txt, do to that, add gen_ugc, which uses csv, buffers, line, io and other modules to do the job. --- src/line.hh | 44 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 44 insertions(+) create mode 100644 src/line.hh (limited to 'src/line.hh') diff --git a/src/line.hh b/src/line.hh new file mode 100644 index 0000000..94e3646 --- /dev/null +++ b/src/line.hh @@ -0,0 +1,44 @@ +#ifndef LINE_HH +#define LINE_HH + +#include "io.hh" // IWYU pragma: export + +#include +#include +#include +#include +#include + +namespace line { + +struct ReadError { + bool eof; + std::optional io_error; + + ReadError(); + explicit ReadError(io::ReadError error); +}; + +class Reader { + public: + virtual ~Reader() = default; + + // Returned view is only valid until next call to read. + [[nodiscard]] virtual std::expected read() = 0; + // Starts at zero. Returns next line. + // So, before first read it is zero, after first read it is one. + [[nodiscard]] virtual uint64_t number() const = 0; + + protected: + Reader() = default; + + Reader(Reader const&) = delete; + Reader& operator=(Reader const&) = delete; +}; + +[[nodiscard]] std::unique_ptr open(std::unique_ptr reader, + size_t max_len = 8192); + +} // namespace line + +#endif // LINE_HH -- cgit v1.3