aboutsummaryrefslogtreecommitdiff
path: root/libbutl/tab-parser.mxx
blob: a7f7e01da60091ad3c1a136dbbe57cc4358ab03c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
// file      : libbutl/tab-parser.mxx -*- C++ -*-
// license   : MIT; see accompanying LICENSE file

#ifndef __cpp_modules_ts
#pragma once
#endif

// C includes.

#ifndef __cpp_lib_modules_ts
#include <iosfwd>
#include <string>
#include <vector>
#include <cstdint>   // uint64_t
#include <stdexcept> // runtime_error
#endif

// Other includes.

#ifdef __cpp_modules_ts
export module butl.tab_parser;
#ifdef __cpp_lib_modules_ts
import std.core;
import std.io;
#endif
#endif

#include <libbutl/export.hxx>

LIBBUTL_MODEXPORT namespace butl
{
  class LIBBUTL_SYMEXPORT tab_parsing: public std::runtime_error
  {
  public:
    tab_parsing (const std::string& name,
                 std::uint64_t line,
                 std::uint64_t column,
                 const std::string& description);

    std::string name;
    std::uint64_t line;
    std::uint64_t column;
    std::string description;
  };

  // Line and columns are useful for issuing diagnostics about invalid or
  // missing fields.
  //
  struct tab_field
  {
    std::string value;    // Field string (quoting preserved).
    std::uint64_t column; // Field start column number (one-based).
  };

  struct tab_fields: std::vector<tab_field>
  {
    std::uint64_t line;       // Line number (one-based).
    std::uint64_t end_column; // End-of-line column (line length).
  };

  // Read and parse lines consisting of space-separated fields. Field can
  // contain single or double quoted substrings (with spaces) which are
  // interpreted but preserved. No escaping of the quote characters is
  // supported. Blank lines and lines that start with # (collectively called
  // empty lines) are ignored.
  //
  class LIBBUTL_SYMEXPORT tab_parser
  {
  public:
    tab_parser (std::istream& is, const std::string& name)
        : is_ (is), name_ (name) {}

    // Return next line of fields. Skip empty lines. Empty result denotes the
    // end of stream.
    //
    tab_fields
    next ();

  private:
    std::istream& is_;
    const std::string name_;
    std::uint64_t line_ = 0;
  };
}