minori: dep/toml11/toml/lexer.hpp annotate

author	Paper <paper@paper.us.eu.org>
date	Wed, 12 Jun 2024 05:25:41 -0400
parents
children

rev	line source
318 3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	1 // Copyright Toru Niina 2017.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	2 // Distributed under the MIT License.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	3 #ifndef TOML11_LEXER_HPP
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	4 #define TOML11_LEXER_HPP
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	5 #include <istream>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	6 #include <sstream>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	7 #include <stdexcept>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	8
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	9 #include "combinator.hpp"
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	10
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	11 namespace toml
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	12 {
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	13 namespace detail
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	14 {
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	15
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	16 // Each lexer below scans the contents of a container of char from the current
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	17 // location and extracts the region that matches its own pattern.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	18 // For the implementation of each component, see combinator.hpp.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	19
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	20 using lex_wschar = either<character<' '>, character<'\t'>>; // one whitespace character: space or tab
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	21 using lex_ws = repeat<lex_wschar, at_least<1>>; // 1*wschar
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	22 using lex_newline = either<character<'\n'>, // LF, or ...
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	23 sequence<character<'\r'>, character<'\n'>>>; // ... CR followed by LF
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	24 using lex_lower = in_range<'a', 'z'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	25 using lex_upper = in_range<'A', 'Z'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	26 using lex_alpha = either<lex_lower, lex_upper>; // ASCII letters only
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	27 using lex_digit = in_range<'0', '9'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	28 using lex_nonzero = in_range<'1', '9'>; // a digit other than '0'
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	29 using lex_oct_dig = in_range<'0', '7'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	30 using lex_bin_dig = in_range<'0', '1'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	31 using lex_hex_dig = either<lex_digit, in_range<'A', 'F'>, in_range<'a', 'f'>>; // hex digit, either letter case
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	32
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	33 using lex_hex_prefix = sequence<character<'0'>, character<'x'>>; // "0x" (lower-case 'x' only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	34 using lex_oct_prefix = sequence<character<'0'>, character<'o'>>; // "0o" (lower-case 'o' only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	35 using lex_bin_prefix = sequence<character<'0'>, character<'b'>>; // "0b" (lower-case 'b' only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	36 using lex_underscore = character<'_'>; // separator allowed between digits in the numeric patterns of this file
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	37 using lex_plus = character<'+'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	38 using lex_minus = character<'-'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	39 using lex_sign = either<lex_plus, lex_minus>; // '+' | '-'
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	40
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	41 // digit | nonzero 1*(digit | _ digit)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	42 using lex_unsigned_dec_int = either<sequence<lex_nonzero, repeat<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	43 either<lex_digit, sequence<lex_underscore, lex_digit>>, at_least<1>>>, // multi-digit form: first digit is never '0', an underscore must be followed by a digit
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	44 lex_digit>; // single-digit form; the only alternative that can match "0"
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	45 // (+|-)? unsigned_dec_int
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	46 using lex_dec_int = sequence<maybe<lex_sign>, lex_unsigned_dec_int>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	47
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	48 // hex_prefix hex_dig *(hex_dig | _ hex_dig)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	49 using lex_hex_int = sequence<lex_hex_prefix, sequence<lex_hex_dig, repeat<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	50 either<lex_hex_dig, sequence<lex_underscore, lex_hex_dig>>, unlimited>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	51 // oct_prefix oct_dig *(oct_dig | _ oct_dig)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	52 using lex_oct_int = sequence<lex_oct_prefix, sequence<lex_oct_dig, repeat<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	53 either<lex_oct_dig, sequence<lex_underscore, lex_oct_dig>>, unlimited>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	54 // bin_prefix bin_dig *(bin_dig | _ bin_dig)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	55 using lex_bin_int = sequence<lex_bin_prefix, sequence<lex_bin_dig, repeat<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	56 either<lex_bin_dig, sequence<lex_underscore, lex_bin_dig>>, unlimited>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	57
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	58 // (dec_int | hex_int | oct_int | bin_int)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	59 using lex_integer = either<lex_bin_int, lex_oct_int, lex_hex_int, lex_dec_int>; // NOTE(review): prefixed forms are listed before lex_dec_int, presumably so the '0' of a prefix is not consumed as a decimal integer; confirm against either<> in combinator.hpp
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	60
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	61 // ===========================================================================
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	62
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	63 using lex_inf = sequence<character<'i'>, character<'n'>, character<'f'>>; // literal "inf" (lower case only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	64 using lex_nan = sequence<character<'n'>, character<'a'>, character<'n'>>; // literal "nan" (lower case only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	65 using lex_special_float = sequence<maybe<lex_sign>, either<lex_inf, lex_nan>>; // (+|-)? (inf | nan)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	66
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	67 using lex_zero_prefixable_int = sequence<lex_digit, repeat<either<lex_digit, // digit *(digit | _ digit); unlike lex_unsigned_dec_int,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	68 sequence<lex_underscore, lex_digit>>, unlimited>>; // the first digit may be '0'
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	69
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	70 using lex_fractional_part = sequence<character<'.'>, lex_zero_prefixable_int>; // "." zero_prefixable_int (at least one digit after the dot)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	71
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	72 using lex_exponent_part = sequence<either<character<'e'>, character<'E'>>, // (e|E) (+|-)? zero_prefixable_int
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	73 maybe<lex_sign>, lex_zero_prefixable_int>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	74
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	75 using lex_float = either<lex_special_float, // special_float | dec_int (exponent_part | fractional_part exponent_part?)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	76 sequence<lex_dec_int, either<lex_exponent_part, // a bare dec_int with neither part is not a float
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	77 sequence<lex_fractional_part, maybe<lex_exponent_part>>>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	78
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	79 // ===========================================================================
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	80
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	81 using lex_true = sequence<character<'t'>, character<'r'>, // literal "true" (lower case only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	82 character<'u'>, character<'e'>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	83 using lex_false = sequence<character<'f'>, character<'a'>, character<'l'>, // literal "false" (lower case only)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	84 character<'s'>, character<'e'>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	85 using lex_boolean = either<lex_true, lex_false>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	86
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	87 // ===========================================================================
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	88
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	89 using lex_date_fullyear = repeat<lex_digit, exactly<4>>; // 4 digits; these date/time field patterns check digit count only, not value range
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	90 using lex_date_month = repeat<lex_digit, exactly<2>>; // 2 digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	91 using lex_date_mday = repeat<lex_digit, exactly<2>>; // 2 digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	92 using lex_time_delim = either<character<'T'>, character<'t'>, character<' '>>; // separator between the date and time parts: 'T', 't' or one space
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	93 using lex_time_hour = repeat<lex_digit, exactly<2>>; // 2 digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	94 using lex_time_minute = repeat<lex_digit, exactly<2>>; // 2 digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	95 using lex_time_second = repeat<lex_digit, exactly<2>>; // 2 digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	96 using lex_time_secfrac = sequence<character<'.'>, // "." 1*digit (fractional seconds, any number of digits)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	97 repeat<lex_digit, at_least<1>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	98
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	99 using lex_time_numoffset = sequence<either<character<'+'>, character<'-'>>, // (+|-) hour ":" minute; the sign is mandatory here
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	100 sequence<lex_time_hour, character<':'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	101 lex_time_minute>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	102 using lex_time_offset = either<character<'Z'>, character<'z'>, // 'Z' | 'z' | numoffset
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	103 lex_time_numoffset>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	104
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	105 using lex_partial_time = sequence<lex_time_hour, character<':'>, // hour ":" minute ":" second secfrac? (seconds are required)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	106 lex_time_minute, character<':'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	107 lex_time_second, maybe<lex_time_secfrac>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	108 using lex_full_date = sequence<lex_date_fullyear, character<'-'>, // fullyear "-" month "-" mday
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	109 lex_date_month, character<'-'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	110 lex_date_mday>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	111 using lex_full_time = sequence<lex_partial_time, lex_time_offset>; // partial_time followed by a mandatory offset
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	112
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	113 using lex_offset_date_time = sequence<lex_full_date, lex_time_delim, lex_full_time>; // date, delimiter, time with offset
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	114 using lex_local_date_time = sequence<lex_full_date, lex_time_delim, lex_partial_time>; // same as above but without the offset
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	115 using lex_local_date = lex_full_date;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	116 using lex_local_time = lex_partial_time;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	117
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	118 // ===========================================================================
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	119
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	120 using lex_quotation_mark = character<'"'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	121 using lex_basic_unescaped = exclude<either<in_range<0x00, 0x08>, // 0x09 (tab) is allowed
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	122 in_range<0x0A, 0x1F>, // remaining control characters, including LF and CR
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	123 character<0x22>, character<0x5C>, // quotation mark and backslash
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	124 character<0x7F>>>; // DEL
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	125
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	126 using lex_escape = character<'\\'>; // the backslash that introduces an escape sequence
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	127 using lex_escape_unicode_short = sequence<character<'u'>, // 'u' followed by exactly 4 hex digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	128 repeat<lex_hex_dig, exactly<4>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	129 using lex_escape_unicode_long = sequence<character<'U'>, // 'U' followed by exactly 8 hex digits
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	130 repeat<lex_hex_dig, exactly<8>>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	131 using lex_escape_seq_char = either<character<'"'>, character<'\\'>, // what may follow the backslash of an escape
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	132 character<'b'>, character<'f'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	133 character<'n'>, character<'r'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	134 character<'t'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	135 #ifdef TOML11_USE_UNRELEASED_TOML_FEATURES
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	136 character<'e'>, // ESC (0x1B); only accepted when the macro above is defined
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	137 #endif
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	138 lex_escape_unicode_short,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	139 lex_escape_unicode_long
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	140 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	141 using lex_escaped = sequence<lex_escape, lex_escape_seq_char>; // backslash + escape_seq_char
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	142 using lex_basic_char = either<lex_basic_unescaped, lex_escaped>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	143 using lex_basic_string = sequence<lex_quotation_mark, // quotation mark, any number of basic_char (possibly none), quotation mark
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	144 repeat<lex_basic_char, unlimited>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	145 lex_quotation_mark>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	146
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	147 // After toml post-v0.5.0, it is explicitly clarified how quotes in ml-strings
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	148 // are allowed to be used.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	149 // After this, the following strings are explicitly allowed.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	150 // - One or two `"`s in a multi-line basic string is allowed wherever it is.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	151 // - Three consecutive `"`s in a multi-line basic string is considered as a delimiter.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	152 // - One or two `"`s can appear just before or after the delimiter.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	153 // ```toml
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	154 // str4 = """Here are two quotation marks: "". Simple enough."""
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	155 // str5 = """Here are three quotation marks: ""\"."""
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	156 // str6 = """Here are fifteen quotation marks: ""\"""\"""\"""\"""\"."""
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	157 // str7 = """"This," she said, "is just a pointless statement.""""
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	158 // ```
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	159 // In the current implementation (v3.3.0), it is difficult to parse `str7` in
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	160 // the above example. It is difficult to recognize `"` at the end of string body
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	161 // correctly. It will be misunderstood as a `"""` delimiter and an additional,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	162 // invalid `"`. Like this:
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	163 // ```console
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	164 // what(): [error] toml::parse_table: invalid line format
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	165 // --> hoge.toml
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	166 //     |
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	167 //  13 | str7 = """"This," she said, "is just a pointless statement.""""
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	168 //     |                                                               ^- expected newline, but got '"'.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	169 // ```
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	170 // As a quick workaround for this problem, `lex_ml_basic_string_delim` was
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	171 // split into two, `lex_ml_basic_string_open` and `lex_ml_basic_string_close`.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	172 // `lex_ml_basic_string_open` allows only `"""`. `_close` allows 3-5 `"`s.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	173 // In parse_ml_basic_string() function, the trailing `"`s will be attached to
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	174 // the string body.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	175 //
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	176 using lex_ml_basic_string_delim = repeat<lex_quotation_mark, exactly<3>>; // exactly three quotation marks
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	177 using lex_ml_basic_string_open = lex_ml_basic_string_delim;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	178 using lex_ml_basic_string_close = sequence<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	179 repeat<lex_quotation_mark, exactly<3>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	180 maybe<lex_quotation_mark>, maybe<lex_quotation_mark> // up to two extra quotation marks, i.e. 3-5 in total
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	181 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	182
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	183 using lex_ml_basic_unescaped = exclude<either<in_range<0x00, 0x08>, // 0x09 is tab
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	184 in_range<0x0A, 0x1F>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	185 character<0x5C>, // backslash
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	186 character<0x7F>, // DEL
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	187 lex_ml_basic_string_delim>>; // the three-quote delimiter is excluded; a lone quotation mark is not (compare lex_basic_unescaped, which excludes 0x22)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	188
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	189 using lex_ml_basic_escaped_newline = sequence< // backslash, optional whitespace, a newline,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	190 lex_escape, maybe<lex_ws>, lex_newline,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	191 repeat<either<lex_ws, lex_newline>, unlimited>>; // then any further run of whitespace and newlines
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	192
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	193 using lex_ml_basic_char = either<lex_ml_basic_unescaped, lex_escaped>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	194 using lex_ml_basic_body = repeat<either<lex_ml_basic_char, lex_newline, // any number of chars, raw newlines and escaped newlines (possibly none)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	195 lex_ml_basic_escaped_newline>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	196 unlimited>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	197 using lex_ml_basic_string = sequence<lex_ml_basic_string_open, // open (3 quotes), body, close (3-5 quotes)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	198 lex_ml_basic_body,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	199 lex_ml_basic_string_close>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	200
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	201 using lex_literal_char = exclude<either<in_range<0x00, 0x08>, in_range<0x0A, 0x1F>, // control characters except 0x09 (tab)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	202 character<0x7F>, character<0x27>>>; // DEL and apostrophe; backslash is not excluded here
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	203 using lex_apostrophe = character<'\''>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	204 using lex_literal_string = sequence<lex_apostrophe, // apostrophe, any number of literal_char (possibly none), apostrophe
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	205 repeat<lex_literal_char, unlimited>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	206 lex_apostrophe>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	207
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	208 // The delimiter is split into open/close for the same reason as for multi-line basic strings: the close pattern accepts 3-5 apostrophes.
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	209 using lex_ml_literal_string_delim = repeat<lex_apostrophe, exactly<3>>; // exactly three apostrophes
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	210 using lex_ml_literal_string_open = lex_ml_literal_string_delim;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	211 using lex_ml_literal_string_close = sequence<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	212 repeat<lex_apostrophe, exactly<3>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	213 maybe<lex_apostrophe>, maybe<lex_apostrophe> // up to two extra apostrophes
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	214 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	215
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	216 using lex_ml_literal_char = exclude<either<in_range<0x00, 0x08>, // control characters except 0x09 (tab)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	217 in_range<0x0A, 0x1F>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	218 character<0x7F>, // DEL
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	219 lex_ml_literal_string_delim>>; // the three-apostrophe delimiter is excluded; a lone apostrophe is not
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	220 using lex_ml_literal_body = repeat<either<lex_ml_literal_char, lex_newline>, // any number of chars and raw newlines; no escape sequences
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	221 unlimited>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	222 using lex_ml_literal_string = sequence<lex_ml_literal_string_open, // open (3 apostrophes), body, close (3-5 apostrophes)
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	223 lex_ml_literal_body,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	224 lex_ml_literal_string_close>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	225
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	226 using lex_string = either<lex_ml_basic_string, lex_basic_string,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	227 lex_ml_literal_string, lex_literal_string>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	228
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	229 // ===========================================================================
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	230 using lex_dot_sep = sequence<maybe<lex_ws>, character<'.'>, maybe<lex_ws>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	231
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	232 using lex_unquoted_key = repeat<either<lex_alpha, lex_digit,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	233 character<'-'>, character<'_'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	234 at_least<1>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	235 using lex_quoted_key = either<lex_basic_string, lex_literal_string>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	236 using lex_simple_key = either<lex_unquoted_key, lex_quoted_key>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	237 using lex_dotted_key = sequence<lex_simple_key,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	238 repeat<sequence<lex_dot_sep, lex_simple_key>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	239 at_least<1>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	240 >
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	241 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	242 using lex_key = either<lex_dotted_key, lex_simple_key>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	243
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	244 using lex_keyval_sep = sequence<maybe<lex_ws>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	245 character<'='>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	246 maybe<lex_ws>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	247
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	248 using lex_std_table_open = character<'['>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	249 using lex_std_table_close = character<']'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	250 using lex_std_table = sequence<lex_std_table_open,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	251 maybe<lex_ws>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	252 lex_key,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	253 maybe<lex_ws>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	254 lex_std_table_close>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	255
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	256 using lex_array_table_open = sequence<lex_std_table_open, lex_std_table_open>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	257 using lex_array_table_close = sequence<lex_std_table_close, lex_std_table_close>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	258 using lex_array_table = sequence<lex_array_table_open,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	259 maybe<lex_ws>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	260 lex_key,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	261 maybe<lex_ws>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	262 lex_array_table_close>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	263
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	264 using lex_utf8_1byte = in_range<0x00, 0x7F>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	265 using lex_utf8_2byte = sequence<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	266 in_range<'\xC2', '\xDF'>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	267 in_range<'\x80', '\xBF'>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	268 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	269 using lex_utf8_3byte = sequence<either<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	270 sequence<character<'\xE0'>, in_range<'\xA0', '\xBF'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	271 sequence<in_range<'\xE1', '\xEC'>, in_range<'\x80', '\xBF'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	272 sequence<character<'\xED'>, in_range<'\x80', '\x9F'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	273 sequence<in_range<'\xEE', '\xEF'>, in_range<'\x80', '\xBF'>>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	274 >, in_range<'\x80', '\xBF'>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	275 using lex_utf8_4byte = sequence<either<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	276 sequence<character<'\xF0'>, in_range<'\x90', '\xBF'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	277 sequence<in_range<'\xF1', '\xF3'>, in_range<'\x80', '\xBF'>>,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	278 sequence<character<'\xF4'>, in_range<'\x80', '\x8F'>>
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	279 >, in_range<'\x80', '\xBF'>, in_range<'\x80', '\xBF'>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	280 using lex_utf8_code = either<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	281 lex_utf8_1byte,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	282 lex_utf8_2byte,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	283 lex_utf8_3byte,
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	284 lex_utf8_4byte
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	285 >;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	286
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	287 using lex_comment_start_symbol = character<'#'>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	288 using lex_non_eol_ascii = either<character<0x09>, in_range<0x20, 0x7E>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	289 using lex_comment = sequence<lex_comment_start_symbol, repeat<either<
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	290 lex_non_eol_ascii, lex_utf8_2byte, lex_utf8_3byte, lex_utf8_4byte>, unlimited>>;
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	291
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	292 } // detail
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	293 } // toml
3b355fa948c7 config: use TOML instead of INI Paper <paper@paper.us.eu.org> parents: diff changeset	294 #endif // TOML11_LEXER_HPP

318

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

1 // Copyright Toru Niina 2017.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

2 // Distributed under the MIT License.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

3 #ifndef TOML11_LEXER_HPP

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

4 #define TOML11_LEXER_HPP

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

5 #include <istream>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

6 #include <sstream>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

7 #include <stdexcept>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

8

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

9 #include "combinator.hpp"

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

10

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

11 namespace toml

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

12 {

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

13 namespace detail

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

14 {

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

15

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

16 // these scan contents from the current location in a container of char

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

17 // and extract a region that matches their own pattern.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

18 // to see the implementation of each component, see combinator.hpp.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

19

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

20 using lex_wschar = either<character<' '>, character<'\t'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

21 using lex_ws = repeat<lex_wschar, at_least<1>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

22 using lex_newline = either<character<'\n'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

23 sequence<character<'\r'>, character<'\n'>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

24 using lex_lower = in_range<'a', 'z'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

25 using lex_upper = in_range<'A', 'Z'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

26 using lex_alpha = either<lex_lower, lex_upper>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

27 using lex_digit = in_range<'0', '9'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

28 using lex_nonzero = in_range<'1', '9'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

29 using lex_oct_dig = in_range<'0', '7'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

30 using lex_bin_dig = in_range<'0', '1'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

31 using lex_hex_dig = either<lex_digit, in_range<'A', 'F'>, in_range<'a', 'f'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

32

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

33 using lex_hex_prefix = sequence<character<'0'>, character<'x'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

34 using lex_oct_prefix = sequence<character<'0'>, character<'o'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

35 using lex_bin_prefix = sequence<character<'0'>, character<'b'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

36 using lex_underscore = character<'_'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

37 using lex_plus = character<'+'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

38 using lex_minus = character<'-'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

39 using lex_sign = either<lex_plus, lex_minus>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

40

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

41 // digit | nonzero 1*(digit | _ digit)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

42 using lex_unsigned_dec_int = either<sequence<lex_nonzero, repeat<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

43 either<lex_digit, sequence<lex_underscore, lex_digit>>, at_least<1>>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

44 lex_digit>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

45 // (+|-)? unsigned_dec_int

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

46 using lex_dec_int = sequence<maybe<lex_sign>, lex_unsigned_dec_int>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

47

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

48 // hex_prefix hex_dig *(hex_dig | _ hex_dig)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

49 using lex_hex_int = sequence<lex_hex_prefix, sequence<lex_hex_dig, repeat<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

50 either<lex_hex_dig, sequence<lex_underscore, lex_hex_dig>>, unlimited>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

51 // oct_prefix oct_dig *(oct_dig | _ oct_dig)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

52 using lex_oct_int = sequence<lex_oct_prefix, sequence<lex_oct_dig, repeat<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

53 either<lex_oct_dig, sequence<lex_underscore, lex_oct_dig>>, unlimited>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

54 // bin_prefix bin_dig *(bin_dig | _ bin_dig)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

55 using lex_bin_int = sequence<lex_bin_prefix, sequence<lex_bin_dig, repeat<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

56 either<lex_bin_dig, sequence<lex_underscore, lex_bin_dig>>, unlimited>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

57

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

58 // (dec_int | hex_int | oct_int | bin_int)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

59 using lex_integer = either<lex_bin_int, lex_oct_int, lex_hex_int, lex_dec_int>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

60

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

61 // ===========================================================================

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

62

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

63 using lex_inf = sequence<character<'i'>, character<'n'>, character<'f'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

64 using lex_nan = sequence<character<'n'>, character<'a'>, character<'n'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

65 using lex_special_float = sequence<maybe<lex_sign>, either<lex_inf, lex_nan>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

66

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

67 using lex_zero_prefixable_int = sequence<lex_digit, repeat<either<lex_digit,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

68 sequence<lex_underscore, lex_digit>>, unlimited>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

69

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

70 using lex_fractional_part = sequence<character<'.'>, lex_zero_prefixable_int>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

71

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

72 using lex_exponent_part = sequence<either<character<'e'>, character<'E'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

73 maybe<lex_sign>, lex_zero_prefixable_int>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

74

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

75 using lex_float = either<lex_special_float,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

76 sequence<lex_dec_int, either<lex_exponent_part,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

77 sequence<lex_fractional_part, maybe<lex_exponent_part>>>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

78

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

79 // ===========================================================================

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

80

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

81 using lex_true = sequence<character<'t'>, character<'r'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

82 character<'u'>, character<'e'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

83 using lex_false = sequence<character<'f'>, character<'a'>, character<'l'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

84 character<'s'>, character<'e'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

85 using lex_boolean = either<lex_true, lex_false>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

86

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

87 // ===========================================================================

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

88

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

89 using lex_date_fullyear = repeat<lex_digit, exactly<4>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

90 using lex_date_month = repeat<lex_digit, exactly<2>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

91 using lex_date_mday = repeat<lex_digit, exactly<2>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

92 using lex_time_delim = either<character<'T'>, character<'t'>, character<' '>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

93 using lex_time_hour = repeat<lex_digit, exactly<2>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

94 using lex_time_minute = repeat<lex_digit, exactly<2>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

95 using lex_time_second = repeat<lex_digit, exactly<2>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

96 using lex_time_secfrac = sequence<character<'.'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

97 repeat<lex_digit, at_least<1>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

98

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

99 using lex_time_numoffset = sequence<either<character<'+'>, character<'-'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

100 sequence<lex_time_hour, character<':'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

101 lex_time_minute>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

102 using lex_time_offset = either<character<'Z'>, character<'z'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

103 lex_time_numoffset>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

104

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

105 using lex_partial_time = sequence<lex_time_hour, character<':'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

106 lex_time_minute, character<':'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

107 lex_time_second, maybe<lex_time_secfrac>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

108 using lex_full_date = sequence<lex_date_fullyear, character<'-'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

109 lex_date_month, character<'-'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

110 lex_date_mday>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

111 using lex_full_time = sequence<lex_partial_time, lex_time_offset>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

112

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

113 using lex_offset_date_time = sequence<lex_full_date, lex_time_delim, lex_full_time>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

114 using lex_local_date_time = sequence<lex_full_date, lex_time_delim, lex_partial_time>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

115 using lex_local_date = lex_full_date;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

116 using lex_local_time = lex_partial_time;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

117

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

118 // ===========================================================================

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

119

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

120 using lex_quotation_mark = character<'"'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

121 using lex_basic_unescaped = exclude<either<in_range<0x00, 0x08>, // 0x09 (tab) is allowed

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

122 in_range<0x0A, 0x1F>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

123 character<0x22>, character<0x5C>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

124 character<0x7F>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

125

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

126 using lex_escape = character<'\\'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

127 using lex_escape_unicode_short = sequence<character<'u'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

128 repeat<lex_hex_dig, exactly<4>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

129 using lex_escape_unicode_long = sequence<character<'U'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

130 repeat<lex_hex_dig, exactly<8>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

131 using lex_escape_seq_char = either<character<'"'>, character<'\\'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

132 character<'b'>, character<'f'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

133 character<'n'>, character<'r'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

134 character<'t'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

135 #ifdef TOML11_USE_UNRELEASED_TOML_FEATURES

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

136 character<'e'>, // ESC (0x1B)

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

137 #endif

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

138 lex_escape_unicode_short,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

139 lex_escape_unicode_long

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

140 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

141 using lex_escaped = sequence<lex_escape, lex_escape_seq_char>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

142 using lex_basic_char = either<lex_basic_unescaped, lex_escaped>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

143 using lex_basic_string = sequence<lex_quotation_mark,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

144 repeat<lex_basic_char, unlimited>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

145 lex_quotation_mark>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

146

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

147 // After toml post-v0.5.0, it is explicitly clarified how quotes in ml-strings

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

148 // are allowed to be used.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

149 // After this, the following strings are *explicitly* allowed.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

150 // - One or two `"`s in a multi-line basic string are allowed wherever they appear.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

151 // - Three consecutive `"`s in a multi-line basic string are considered a delimiter.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

152 // - One or two `"`s can appear just before or after the delimiter.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

153 // ```toml

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

154 // str4 = """Here are two quotation marks: "". Simple enough."""

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

155 // str5 = """Here are three quotation marks: ""\"."""

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

156 // str6 = """Here are fifteen quotation marks: ""\"""\"""\"""\"""\"."""

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

157 // str7 = """"This," she said, "is just a pointless statement.""""

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

158 // ```

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

159 // In the current implementation (v3.3.0), it is difficult to parse `str7` in

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

160 // the above example. It is difficult to recognize `"` at the end of string body

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

161 // correctly. It will be misunderstood as a `"""` delimiter and an additional,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

162 // invalid `"`. Like this:

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

163 // ```console

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

164 // what(): [error] toml::parse_table: invalid line format

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

165 // --> hoge.toml

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

166 // |

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

167 // 13 | str7 = """"This," she said, "is just a pointless statement.""""

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

168 // | ^- expected newline, but got '"'.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

169 // ```

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

170 // As a quick workaround for this problem, `lex_ml_basic_string_delim` was

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

171 // split into two, `lex_ml_basic_string_open` and `lex_ml_basic_string_close`.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

172 // `lex_ml_basic_string_open` allows only `"""`. `_close` allows 3-5 `"`s.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

173 // In parse_ml_basic_string() function, the trailing `"`s will be attached to

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

174 // the string body.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

175 //

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

176 using lex_ml_basic_string_delim = repeat<lex_quotation_mark, exactly<3>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

177 using lex_ml_basic_string_open = lex_ml_basic_string_delim;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

178 using lex_ml_basic_string_close = sequence<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

179 repeat<lex_quotation_mark, exactly<3>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

180 maybe<lex_quotation_mark>, maybe<lex_quotation_mark>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

181 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

182

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

183 using lex_ml_basic_unescaped = exclude<either<in_range<0x00, 0x08>, // 0x09 is tab

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

184 in_range<0x0A, 0x1F>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

185 character<0x5C>, // backslash

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

186 character<0x7F>, // DEL

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

187 lex_ml_basic_string_delim>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

188

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

189 using lex_ml_basic_escaped_newline = sequence<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

190 lex_escape, maybe<lex_ws>, lex_newline,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

191 repeat<either<lex_ws, lex_newline>, unlimited>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

192

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

193 using lex_ml_basic_char = either<lex_ml_basic_unescaped, lex_escaped>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

194 using lex_ml_basic_body = repeat<either<lex_ml_basic_char, lex_newline,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

195 lex_ml_basic_escaped_newline>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

196 unlimited>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

197 using lex_ml_basic_string = sequence<lex_ml_basic_string_open,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

198 lex_ml_basic_body,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

199 lex_ml_basic_string_close>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

200

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

201 using lex_literal_char = exclude<either<in_range<0x00, 0x08>, in_range<0x0A, 0x1F>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

202 character<0x7F>, character<0x27>>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

203 using lex_apostrophe = character<'\''>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

204 using lex_literal_string = sequence<lex_apostrophe,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

205 repeat<lex_literal_char, unlimited>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

206 lex_apostrophe>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

207

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

208 // The delimiter is split into open/close for the same reason as lex_ml_basic_string above.

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

209 using lex_ml_literal_string_delim = repeat<lex_apostrophe, exactly<3>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

210 using lex_ml_literal_string_open = lex_ml_literal_string_delim;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

211 using lex_ml_literal_string_close = sequence<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

212 repeat<lex_apostrophe, exactly<3>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

213 maybe<lex_apostrophe>, maybe<lex_apostrophe>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

214 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

215

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

216 using lex_ml_literal_char = exclude<either<in_range<0x00, 0x08>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

217 in_range<0x0A, 0x1F>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

218 character<0x7F>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

219 lex_ml_literal_string_delim>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

220 using lex_ml_literal_body = repeat<either<lex_ml_literal_char, lex_newline>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

221 unlimited>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

222 using lex_ml_literal_string = sequence<lex_ml_literal_string_open,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

223 lex_ml_literal_body,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

224 lex_ml_literal_string_close>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

225

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

226 using lex_string = either<lex_ml_basic_string, lex_basic_string,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

227 lex_ml_literal_string, lex_literal_string>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

228

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

229 // ===========================================================================

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

230 using lex_dot_sep = sequence<maybe<lex_ws>, character<'.'>, maybe<lex_ws>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

231

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

232 using lex_unquoted_key = repeat<either<lex_alpha, lex_digit,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

233 character<'-'>, character<'_'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

234 at_least<1>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

235 using lex_quoted_key = either<lex_basic_string, lex_literal_string>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

236 using lex_simple_key = either<lex_unquoted_key, lex_quoted_key>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

237 using lex_dotted_key = sequence<lex_simple_key,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

238 repeat<sequence<lex_dot_sep, lex_simple_key>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

239 at_least<1>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

240 >

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

241 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

242 using lex_key = either<lex_dotted_key, lex_simple_key>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

243

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

244 using lex_keyval_sep = sequence<maybe<lex_ws>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

245 character<'='>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

246 maybe<lex_ws>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

247

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

248 using lex_std_table_open = character<'['>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

249 using lex_std_table_close = character<']'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

250 using lex_std_table = sequence<lex_std_table_open,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

251 maybe<lex_ws>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

252 lex_key,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

253 maybe<lex_ws>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

254 lex_std_table_close>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

255

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

256 using lex_array_table_open = sequence<lex_std_table_open, lex_std_table_open>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

257 using lex_array_table_close = sequence<lex_std_table_close, lex_std_table_close>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

258 using lex_array_table = sequence<lex_array_table_open,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

259 maybe<lex_ws>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

260 lex_key,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

261 maybe<lex_ws>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

262 lex_array_table_close>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

263

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

264 using lex_utf8_1byte = in_range<0x00, 0x7F>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

265 using lex_utf8_2byte = sequence<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

266 in_range<'\xC2', '\xDF'>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

267 in_range<'\x80', '\xBF'>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

268 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

269 using lex_utf8_3byte = sequence<either<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

270 sequence<character<'\xE0'>, in_range<'\xA0', '\xBF'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

271 sequence<in_range<'\xE1', '\xEC'>, in_range<'\x80', '\xBF'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

272 sequence<character<'\xED'>, in_range<'\x80', '\x9F'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

273 sequence<in_range<'\xEE', '\xEF'>, in_range<'\x80', '\xBF'>>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

274 >, in_range<'\x80', '\xBF'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

275 using lex_utf8_4byte = sequence<either<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

276 sequence<character<'\xF0'>, in_range<'\x90', '\xBF'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

277 sequence<in_range<'\xF1', '\xF3'>, in_range<'\x80', '\xBF'>>,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

278 sequence<character<'\xF4'>, in_range<'\x80', '\x8F'>>

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

279 >, in_range<'\x80', '\xBF'>, in_range<'\x80', '\xBF'>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

280 using lex_utf8_code = either<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

281 lex_utf8_1byte,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

282 lex_utf8_2byte,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

283 lex_utf8_3byte,

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

284 lex_utf8_4byte

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

285 >;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

286

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

287 using lex_comment_start_symbol = character<'#'>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

288 using lex_non_eol_ascii = either<character<0x09>, in_range<0x20, 0x7E>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

289 using lex_comment = sequence<lex_comment_start_symbol, repeat<either<

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

290 lex_non_eol_ascii, lex_utf8_2byte, lex_utf8_3byte, lex_utf8_4byte>, unlimited>>;

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

291

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

292 } // detail

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

293 } // toml

3b355fa948c7 config: use TOML instead of INI

Paper <paper@paper.us.eu.org>

parents:

diff changeset

294 #endif // TOML11_LEXER_HPP

Mercurial > minori

annotate dep/toml11/toml/lexer.hpp @ 318:3b355fa948c7