feat: get region info when parsing keys

Error messages related to dotted keys looks weird. like:
 1 | a.b.c = 42
   |         ~~ in this table
The underlined token is not a table. This should be like the following.
 1 | a.b.c = 42
   | ~~~ in this table
To implement this, the region information is needed when the keys are
read. This commit add this functionality, though currently the region
information is not used yet.
This commit is contained in:
ToruNiina 2019-02-26 00:17:28 +09:00
parent 83bf83b6dd
commit 679b365cf7
2 changed files with 35 additions and 29 deletions

View File

@ -13,23 +13,23 @@ using namespace detail;
BOOST_AUTO_TEST_CASE(test_bare_key) BOOST_AUTO_TEST_CASE(test_bare_key)
{ {
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "barekey", std::vector<key>(1, "barekey")); TOML11_TEST_PARSE_EQUAL(parse_key, "barekey", std::vector<key>(1, "barekey"));
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "bare-key", std::vector<key>(1, "bare-key")); TOML11_TEST_PARSE_EQUAL(parse_key, "bare-key", std::vector<key>(1, "bare-key"));
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "bare_key", std::vector<key>(1, "bare_key")); TOML11_TEST_PARSE_EQUAL(parse_key, "bare_key", std::vector<key>(1, "bare_key"));
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "1234", std::vector<key>(1, "1234")); TOML11_TEST_PARSE_EQUAL(parse_key, "1234", std::vector<key>(1, "1234"));
} }
BOOST_AUTO_TEST_CASE(test_quoted_key) BOOST_AUTO_TEST_CASE(test_quoted_key)
{ {
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "\"127.0.0.1\"", std::vector<key>(1, "127.0.0.1" )); TOML11_TEST_PARSE_EQUAL(parse_key, "\"127.0.0.1\"", std::vector<key>(1, "127.0.0.1" ));
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "\"character encoding\"", std::vector<key>(1, "character encoding")); TOML11_TEST_PARSE_EQUAL(parse_key, "\"character encoding\"", std::vector<key>(1, "character encoding"));
#if defined(_MSC_VER) || defined(__INTEL_COMPILER) #if defined(_MSC_VER) || defined(__INTEL_COMPILER)
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "\"\xCA\x8E\xC7\x9D\xCA\x9E\"", std::vector<key>(1, "\xCA\x8E\xC7\x9D\xCA\x9E")); TOML11_TEST_PARSE_EQUAL(parse_key, "\"\xCA\x8E\xC7\x9D\xCA\x9E\"", std::vector<key>(1, "\xCA\x8E\xC7\x9D\xCA\x9E"));
#else #else
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "\"ʎǝʞ\"", std::vector<key>(1, "ʎǝʞ" )); TOML11_TEST_PARSE_EQUAL(parse_key, "\"ʎǝʞ\"", std::vector<key>(1, "ʎǝʞ" ));
#endif #endif
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "'key2'", std::vector<key>(1, "key2" )); TOML11_TEST_PARSE_EQUAL(parse_key, "'key2'", std::vector<key>(1, "key2" ));
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "'quoted \"value\"'", std::vector<key>(1, "quoted \"value\"" )); TOML11_TEST_PARSE_EQUAL(parse_key, "'quoted \"value\"'", std::vector<key>(1, "quoted \"value\"" ));
} }
BOOST_AUTO_TEST_CASE(test_dotted_key) BOOST_AUTO_TEST_CASE(test_dotted_key)
@ -38,13 +38,13 @@ BOOST_AUTO_TEST_CASE(test_dotted_key)
std::vector<key> keys(2); std::vector<key> keys(2);
keys[0] = "physical"; keys[0] = "physical";
keys[1] = "color"; keys[1] = "color";
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "physical.color", keys); TOML11_TEST_PARSE_EQUAL(parse_key, "physical.color", keys);
} }
{ {
std::vector<key> keys(2); std::vector<key> keys(2);
keys[0] = "physical"; keys[0] = "physical";
keys[1] = "shape"; keys[1] = "shape";
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "physical.shape", keys); TOML11_TEST_PARSE_EQUAL(parse_key, "physical.shape", keys);
} }
{ {
std::vector<key> keys(4); std::vector<key> keys(4);
@ -52,12 +52,12 @@ BOOST_AUTO_TEST_CASE(test_dotted_key)
keys[1] = "y"; keys[1] = "y";
keys[2] = "z"; keys[2] = "z";
keys[3] = "w"; keys[3] = "w";
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "x.y.z.w", keys); TOML11_TEST_PARSE_EQUAL(parse_key, "x.y.z.w", keys);
} }
{ {
std::vector<key> keys(2); std::vector<key> keys(2);
keys[0] = "site"; keys[0] = "site";
keys[1] = "google.com"; keys[1] = "google.com";
TOML11_TEST_PARSE_EQUAL_VALUE(parse_key, "site.\"google.com\"", keys); TOML11_TEST_PARSE_EQUAL(parse_key, "site.\"google.com\"", keys);
} }
} }

View File

@ -754,19 +754,21 @@ parse_offset_datetime(location<Container>& loc)
} }
template<typename Container> template<typename Container>
result<key, std::string> parse_simple_key(location<Container>& loc) result<std::pair<key, region<Container>>, std::string>
parse_simple_key(location<Container>& loc)
{ {
if(const auto bstr = parse_basic_string(loc)) if(const auto bstr = parse_basic_string(loc))
{ {
return ok(bstr.unwrap().first.str); return ok(std::make_pair(bstr.unwrap().first.str, bstr.unwrap().second));
} }
if(const auto lstr = parse_literal_string(loc)) if(const auto lstr = parse_literal_string(loc))
{ {
return ok(lstr.unwrap().first.str); return ok(std::make_pair(lstr.unwrap().first.str, lstr.unwrap().second));
} }
if(const auto bare = lex_unquoted_key::invoke(loc)) if(const auto bare = lex_unquoted_key::invoke(loc))
{ {
return ok(bare.unwrap().str()); const auto reg = bare.unwrap();
return ok(std::make_pair(reg.str(), reg));
} }
return err(std::string("[error] toml::parse_simple_key: " return err(std::string("[error] toml::parse_simple_key: "
"the next token is not a simple key")); "the next token is not a simple key"));
@ -774,13 +776,15 @@ result<key, std::string> parse_simple_key(location<Container>& loc)
// dotted key become vector of keys // dotted key become vector of keys
template<typename Container> template<typename Container>
result<std::vector<key>, std::string> parse_key(location<Container>& loc) result<std::pair<std::vector<key>, region<Container>>, std::string>
parse_key(location<Container>& loc)
{ {
const auto first = loc.iter(); const auto first = loc.iter();
// dotted key -> foo.bar.baz whitespaces are allowed // dotted key -> foo.bar.baz whitespaces are allowed
if(const auto token = lex_dotted_key::invoke(loc)) if(const auto token = lex_dotted_key::invoke(loc))
{ {
location<std::string> inner_loc(loc.name(), token.unwrap().str()); const auto reg = token.unwrap();
location<std::string> inner_loc(loc.name(), reg.str());
std::vector<key> keys; std::vector<key> keys;
while(inner_loc.iter() != inner_loc.end()) while(inner_loc.iter() != inner_loc.end())
@ -788,7 +792,7 @@ result<std::vector<key>, std::string> parse_key(location<Container>& loc)
lex_ws::invoke(inner_loc); lex_ws::invoke(inner_loc);
if(const auto k = parse_simple_key(inner_loc)) if(const auto k = parse_simple_key(inner_loc))
{ {
keys.push_back(k.unwrap()); keys.push_back(k.unwrap().first);
} }
else else
{ {
@ -813,14 +817,15 @@ result<std::vector<key>, std::string> parse_key(location<Container>& loc)
"should be `.`")); "should be `.`"));
} }
} }
return ok(keys); return ok(std::make_pair(keys, reg));
} }
loc.iter() = first; loc.iter() = first;
// simple key -> foo // simple key -> foo
if(const auto smpl = parse_simple_key(loc)) if(const auto smpl = parse_simple_key(loc))
{ {
return ok(std::vector<key>(1, smpl.unwrap())); return ok(std::make_pair(std::vector<key>(1, smpl.unwrap().first),
smpl.unwrap().second));
} }
return err(std::string("[error] toml::parse_key: " return err(std::string("[error] toml::parse_key: "
"the next token is not a key")); "the next token is not a key"));
@ -904,10 +909,10 @@ result<std::pair<std::vector<key>, value>, std::string>
parse_key_value_pair(location<Container>& loc) parse_key_value_pair(location<Container>& loc)
{ {
const auto first = loc.iter(); const auto first = loc.iter();
auto key = parse_key(loc); auto key_reg = parse_key(loc);
if(!key) if(!key_reg)
{ {
std::string msg = std::move(key.unwrap_err()); std::string msg = std::move(key_reg.unwrap_err());
// if the next token is keyvalue-separator, it means that there are no // if the next token is keyvalue-separator, it means that there are no
// key. then we need to show error as "empty key is not allowed". // key. then we need to show error as "empty key is not allowed".
if(const auto keyval_sep = lex_keyval_sep::invoke(loc)) if(const auto keyval_sep = lex_keyval_sep::invoke(loc))
@ -963,7 +968,8 @@ parse_key_value_pair(location<Container>& loc)
loc.iter() = first; loc.iter() = first;
return err(msg); return err(msg);
} }
return ok(std::make_pair(std::move(key.unwrap()), std::move(val.unwrap()))); return ok(std::make_pair(std::move(key_reg.unwrap().first),
std::move(val.unwrap())));
} }
// for error messages. // for error messages.
@ -1289,7 +1295,7 @@ parse_table_key(location<Container>& loc)
throw internal_error(format_underline("[error] " throw internal_error(format_underline("[error] "
"toml::parse_table_key: no `]`", inner_loc, "should be `]`")); "toml::parse_table_key: no `]`", inner_loc, "should be `]`"));
} }
return ok(std::make_pair(keys.unwrap(), token.unwrap())); return ok(std::make_pair(keys.unwrap().first, token.unwrap()));
} }
else else
{ {
@ -1327,7 +1333,7 @@ parse_array_table_key(location<Container>& loc)
throw internal_error(format_underline("[error] " throw internal_error(format_underline("[error] "
"toml::parse_table_key: no `]]`", inner_loc, "should be `]]`")); "toml::parse_table_key: no `]]`", inner_loc, "should be `]]`"));
} }
return ok(std::make_pair(keys.unwrap(), token.unwrap())); return ok(std::make_pair(keys.unwrap().first, token.unwrap()));
} }
else else
{ {