Commit 1b141940 authored by Kenton Varda's avatar Kenton Varda

Add Parser combinator framework to KJ (WIP).

parent d534ef9b
...@@ -242,6 +242,9 @@ public: ...@@ -242,6 +242,9 @@ public:
inline ArrayPtr<T> asPtr() { inline ArrayPtr<T> asPtr() {
return arrayPtr(ptr, pos); return arrayPtr(ptr, pos);
} }
inline ArrayPtr<const T> asPtr() const {
return arrayPtr(ptr, pos);
}
inline size_t size() const { return pos - ptr; } inline size_t size() const { return pos - ptr; }
inline size_t capacity() const { return endPtr - ptr; } inline size_t capacity() const { return endPtr - ptr; }
...@@ -305,6 +308,10 @@ public: ...@@ -305,6 +308,10 @@ public:
return result; return result;
} }
inline bool isFull() const {
return pos == endPtr;
}
private: private:
T* ptr; T* ptr;
RemoveConst<T>* pos; RemoveConst<T>* pos;
......
// Copyright (c) 2013, Kenton Varda <temporal@gmail.com>
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice, this
// list of conditions and the following disclaimer.
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
// ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
// (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
// ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#include "parse.h"
#include "string.h"
#include <gtest/gtest.h>
namespace kj {
namespace parse {
namespace {
TEST(Tuple, Flatten) {
int output = 0;
Tuple<int, int, int> t =
tuple(tuple(tuple(), tuple(1)), tuple(), 20, tuple(tuple(tuple(), 300)));
applyTuple([&](int i, int j, int k) { output = i + j + k; }, t);
EXPECT_EQ(321, output);
EXPECT_EQ(321, applyTuple([](int i, int j, int k) { return i + j + k; }, t));
Tuple<Maybe<int>, String> t2 = tuple(Maybe<int>(123), heapString("foo"));
String t3 = tuple(heapString("foo"));
String t4 = tuple(heapString("foo"), Void());
}
typedef IteratorInput<char, const char*> Input;
ExactElementParser<Input> exactChar(char c) {
return exactElement<Input>(mv(c));
}
typedef Span<const char*> TestLocation;
TEST(Parsers, ExactElementParser) {
StringPtr text = "foo";
Input input(text.begin(), text.end());
Maybe<Void> result = exactChar('f')(input);
EXPECT_TRUE(result != nullptr);
EXPECT_FALSE(input.atEnd());
result = exactChar('o')(input);
EXPECT_TRUE(result != nullptr);
EXPECT_FALSE(input.atEnd());
result = exactChar('x')(input);
EXPECT_TRUE(result == nullptr);
EXPECT_FALSE(input.atEnd());
Parser<Input, Void> wrapped = exactChar('o');
result = wrapped(input);
EXPECT_TRUE(result != nullptr);
EXPECT_TRUE(input.atEnd());
}
TEST(Parsers, SequenceParser) {
StringPtr text = "foo";
{
Input input(text.begin(), text.end());
Maybe<Void> result = sequence(exactChar('f'), exactChar('o'), exactChar('o'))(input);
EXPECT_TRUE(result != nullptr);
EXPECT_TRUE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<Void> result = sequence(exactChar('f'), exactChar('o'))(input);
EXPECT_TRUE(result != nullptr);
EXPECT_FALSE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<Void> result = sequence(exactChar('x'), exactChar('o'), exactChar('o'))(input);
EXPECT_TRUE(result == nullptr);
EXPECT_FALSE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<Void> result = sequence(sequence(exactChar('f'), exactChar('o')), exactChar('o'))(input);
EXPECT_TRUE(result != nullptr);
EXPECT_TRUE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<Void> result = sequence(sequence(exactChar('f')), exactChar('o'), exactChar('o'))(input);
EXPECT_TRUE(result != nullptr);
EXPECT_TRUE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<int> result = sequence(transform(exactChar('f'), [](TestLocation){return 123;}),
exactChar('o'), exactChar('o'))(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(123, *i);
} else {
ADD_FAILURE() << "Expected 123, got null.";
}
EXPECT_TRUE(input.atEnd());
}
}
TEST(Parsers, TransformParser) {
StringPtr text = "foo";
auto parser = transform(
sequence(exactChar('f'), exactChar('o'), exactChar('o')),
[](TestLocation location) -> int {
EXPECT_EQ("foo", StringPtr(location.begin(), location.end()));
return 123;
});
{
Input input(text.begin(), text.end());
Maybe<int> result = parser(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(123, *i);
} else {
ADD_FAILURE() << "Expected 123, got null.";
}
EXPECT_TRUE(input.atEnd());
}
}
TEST(Parsers, TransformParser_MaybeRef) {
struct Transform {
int value;
Transform(int value): value(value) {}
int operator()(TestLocation) const { return value; }
};
// Don't use auto for the TransformParsers here because we're trying to make sure that MaybeRef
// is working correctly. When transform() is given an lvalue, it should wrap the type in
// ParserRef.
TransformParser<ExactElementParser<Input>, Transform> parser1 =
transform(exactChar('f'), Transform(12));
auto otherParser = exactChar('o');
TransformParser<ParserRef<ExactElementParser<Input>>, Transform> parser2 =
transform(otherParser, Transform(34));
auto otherParser2 = exactChar('b');
TransformParser<ExactElementParser<Input>, Transform> parser3 =
transform(mv(otherParser2), Transform(56));
StringPtr text = "foob";
auto parser = transform(
sequence(parser1, parser2, exactChar('o'), parser3),
[](TestLocation, int i, int j, int k) { return i + j + k; });
{
Input input(text.begin(), text.end());
Maybe<int> result = parser(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(12 + 34 + 56, *i);
} else {
ADD_FAILURE() << "Expected 12 + 34 + 56, got null.";
}
EXPECT_TRUE(input.atEnd());
}
}
TEST(Parsers, RepeatedParser) {
StringPtr text = "foooob";
auto parser = transform(
sequence(exactChar('f'), repeated(exactChar('o'))),
[](TestLocation, ArrayPtr<Void> values) -> int { return values.size(); });
{
Input input(text.begin(), text.begin() + 3);
Maybe<int> result = parser(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(2, *i);
} else {
ADD_FAILURE() << "Expected 2, got null.";
}
EXPECT_TRUE(input.atEnd());
}
{
Input input(text.begin(), text.begin() + 5);
Maybe<int> result = parser(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(4, *i);
} else {
ADD_FAILURE() << "Expected 4, got null.";
}
EXPECT_TRUE(input.atEnd());
}
{
Input input(text.begin(), text.end());
Maybe<int> result = parser(input);
KJ_IF_MAYBE(i, result) {
EXPECT_EQ(4, *i);
} else {
ADD_FAILURE() << "Expected 4, got null.";
}
EXPECT_FALSE(input.atEnd());
}
}
TEST(Parsers, OneOfParser) {
auto parser = oneOf(
transform(sequence(exactChar('f'), exactChar('o'), exactChar('o')),
[](TestLocation) -> StringPtr { return "foo"; }),
transform(sequence(exactChar('b'), exactChar('a'), exactChar('r')),
[](TestLocation) -> StringPtr { return "bar"; }));
{
StringPtr text = "foo";
Input input(text.begin(), text.end());
Maybe<StringPtr> result = parser(input);
KJ_IF_MAYBE(s, result) {
EXPECT_EQ("foo", *s);
} else {
ADD_FAILURE() << "Expected 'foo', got null.";
}
EXPECT_TRUE(input.atEnd());
}
{
StringPtr text = "bar";
Input input(text.begin(), text.end());
Maybe<StringPtr> result = parser(input);
KJ_IF_MAYBE(s, result) {
EXPECT_EQ("bar", *s);
} else {
ADD_FAILURE() << "Expected 'bar', got null.";
}
EXPECT_TRUE(input.atEnd());
}
}
} // namespace
} // namespace parse
} // namespace kj
// Copyright (c) 2013, Kenton Varda <temporal@gmail.com>
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice, this
// list of conditions and the following disclaimer.
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
// ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
// (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
// ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#ifndef KJ_PARSER_H_
#define KJ_PARSER_H_
#include "common.h"
#include "memory.h"
#include "array.h"
namespace kj {
namespace parse {
// I don't understand std::tuple.
template <typename... T>
struct Tuple;
template <>
struct Tuple<> {
Tuple() {}
};
template <typename First, typename... Rest>
struct Tuple<First, Rest...> {
Tuple() {}
Tuple(Tuple&& other): first(kj::mv(other.first)), rest(kj::mv(other.rest)) {}
Tuple(const Tuple& other): first(other.first), rest(other.rest) {}
Tuple(Tuple& other): first(other.first), rest(other.rest) {}
template <typename First2, typename Rest2>
explicit Tuple(First2&& first2, Rest2&& rest2)
: first(kj::fwd<First2>(first2)),
rest(kj::fwd<Rest2>(rest2)) {}
First first;
Tuple<Rest...> rest;
};
typedef Tuple<> Void;
template <typename T, typename U>
struct ConsTuple {
typedef Tuple<Decay<T>, Decay<U>> Type;
};
template <typename T, typename... U>
struct ConsTuple<T, Tuple<U...>> {
typedef Tuple<Decay<T>, U...> Type;
};
template <typename T>
struct ConsTuple<T, Tuple<>> {
typedef Decay<T> Type;
};
template <typename... T>
struct MakeTuple;
template <>
struct MakeTuple<> {
typedef Tuple<> Type;
};
template <typename T>
struct MakeTuple<T> {
typedef Decay<T> Type;
};
template <typename T, typename U, typename... V>
struct MakeTuple<T, U, V...> {
typedef typename ConsTuple<T, typename MakeTuple<U, V...>::Type>::Type Type;
};
template <typename T, typename... U>
struct MakeTuple<Tuple<>, T, U...> {
typedef typename MakeTuple<T, U...>::Type Type;
};
template <typename T, typename... U, typename V, typename... W>
struct MakeTuple<Tuple<T, U...>, V, W...> {
typedef typename ConsTuple<T, typename MakeTuple<Tuple<U...>, V, W...>::Type>::Type Type;
};
template <typename T, typename U>
typename ConsTuple<T, U>::Type
inline consTuple(T&& t, U&& u) {
return typename ConsTuple<T, U>::Type(
kj::fwd<T>(t),
Tuple<Decay<U>>(kj::fwd<U>(u), Void()));
}
template <typename T, typename... U>
typename ConsTuple<T, Tuple<U...>>::Type
inline consTuple(T&& t, Tuple<U...>&& u) {
return typename ConsTuple<T, Tuple<U...>>::Type(kj::mv(t), kj::mv(u));
}
template <typename T>
typename ConsTuple<T, Tuple<>>::Type
inline consTuple(T&& t, Tuple<>&& u) {
return kj::fwd<T>(t);
}
typename MakeTuple<>::Type
inline tuple() {
return Tuple<>();
}
template <typename T>
typename MakeTuple<T>::Type
inline tuple(T&& first) {
return kj::fwd<T>(first);
}
template <typename T, typename U, typename... V>
typename MakeTuple<T, U, V...>::Type
inline tuple(T&& first, U&& second, V&&... rest) {
return consTuple(kj::fwd<T>(first),
tuple(kj::fwd<U>(second), kj::fwd<V>(rest)...));
}
template <typename T, typename... U>
typename MakeTuple<Tuple<>, T, U...>::Type
inline tuple(Tuple<>&&, T&& first, U&&... rest) {
return tuple(kj::fwd<T>(first), kj::fwd<U>(rest)...);
}
template <typename T, typename... U>
typename MakeTuple<Tuple<>, T, U...>::Type
inline tuple(const Tuple<>&, T&& first, U&&... rest) {
return tuple(kj::fwd<T>(first), kj::fwd<U>(rest)...);
}
template <typename T, typename... U, typename V, typename... W>
typename MakeTuple<Tuple<T, U...>, V, W...>::Type
inline tuple(Tuple<T, U...>&& first, V&& second, W&&... rest) {
return consTuple(kj::mv(first.first),
tuple(kj::mv(first.rest), kj::fwd<V>(second), kj::fwd<W>(rest)...));
}
template <typename T, typename... U, typename V, typename... W>
typename MakeTuple<Tuple<T, U...>, V, W...>::Type
inline tuple(const Tuple<T, U...>& first, V&& second, W&&... rest) {
return consTuple(first.first,
tuple(first.rest, kj::fwd<V>(second), kj::fwd<W>(rest)...));
}
template <typename Func, typename T, typename... Params>
inline auto applyTuple(Func&& func, T&& t, Params&&... params) ->
decltype(func(kj::fwd<Params>(params)..., kj::fwd<T>(t))) {
return func(kj::fwd<Params>(params)..., kj::fwd<T>(t));
}
template <typename Func, typename... Params>
inline auto applyTuple(Func&& func, Tuple<> t, Params&&... params) ->
decltype(func(kj::fwd<Params>(params)...)) {
return func(kj::fwd<Params>(params)...);
}
template <typename Func, typename T, typename... U, typename... Params>
inline auto applyTuple(Func&& func, Tuple<T, U...>&& t, Params&&... params) ->
decltype(func(kj::fwd<Params>(params)..., instance<T&&>(), instance<U&&>()...)) {
return applyTuple(kj::fwd<Func>(func), kj::mv(t.rest),
kj::fwd<Params>(params)..., kj::mv(t.first));
}
template <typename Func, typename T, typename... U, typename... Params>
inline auto applyTuple(Func&& func, const Tuple<T, U...>& t, Params&&... params) ->
decltype(func(kj::fwd<Params>(params)..., instance<const T&>(), instance<const U&>()...)) {
return applyTuple(kj::fwd<Func>(func), t.rest,
kj::fwd<Params>(params)..., t.first);
}
// =======================================================================================
template <typename Element, typename Iterator>
class IteratorInput {
public:
typedef Element ElementType;
IteratorInput(Iterator begin, Iterator end)
: parent(nullptr), pos(begin), end(end), best(begin) {}
IteratorInput(IteratorInput& parent)
: parent(&parent), pos(parent.pos), end(parent.end), best(parent.pos) {}
~IteratorInput() {
if (parent != nullptr) {
parent->best = kj::max(kj::max(pos, best), parent->best);
}
}
void advanceParent() {
parent->pos = pos;
}
bool atEnd() { return pos == end; }
const Element& current() {
KJ_IREQUIRE(!atEnd());
return *pos;
}
const Element& consume() {
assert(!atEnd());
return *pos++;
}
void next() {
KJ_IREQUIRE(!atEnd());
++pos;
}
Iterator getBest() { return kj::max(pos, best); }
Iterator getPosition() { return pos; }
private:
IteratorInput* parent;
Iterator pos;
Iterator end;
Iterator best; // furthest we got with any sub-input
IteratorInput(IteratorInput&&) = delete;
IteratorInput& operator=(const IteratorInput&) = delete;
IteratorInput& operator=(IteratorInput&&) = delete;
};
template <typename T>
struct ExtractParseFuncType;
template <typename I, typename O, typename Object>
struct ExtractParseFuncType<Maybe<O> (Object::*)(I&) const> {
typedef I InputType;
typedef typename I::ElementType ElementType;
typedef O OutputType;
};
template <typename I, typename O, typename Object>
struct ExtractParseFuncType<Maybe<O> (Object::*)(I&)> {
typedef I InputType;
typedef typename I::ElementType ElementType;
typedef O OutputType;
};
template <typename T>
struct ExtractParserType: public ExtractParseFuncType<decltype(&T::operator())> {};
template <typename T>
struct ExtractParserType<T&>: public ExtractParserType<T> {};
template <typename T>
struct ExtractParserType<T&&>: public ExtractParserType<T> {};
template <typename T>
struct ExtractParserType<const T>: public ExtractParserType<T> {};
template <typename T>
struct ExtractParserType<const T&>: public ExtractParserType<T> {};
template <typename T>
struct ExtractParserType<const T&&>: public ExtractParserType<T> {};
// =======================================================================================
template <typename Input, typename Output>
class ParserWrapper {
public:
virtual ~ParserWrapper() {}
typedef Input InputType;
typedef typename Input::ElementType ElementType;
typedef Output OutputType;
virtual Maybe<Output> operator()(Input& input) const = 0;
virtual Own<ParserWrapper> clone() = 0;
};
template <typename Input, typename Output>
class Parser {
public:
Parser(const Parser& other): wrapper(other.wrapper->clone()) {}
Parser(Parser& other): wrapper(other.wrapper->clone()) {}
Parser(const Parser&& other): wrapper(other.wrapper->clone()) {}
Parser(Parser&& other): wrapper(kj::mv(other.wrapper)) {}
Parser(Own<ParserWrapper<Input, Output>> wrapper): wrapper(kj::mv(wrapper)) {}
template <typename Other>
Parser(Other&& other): wrapper(heap<WrapperImpl<Other>>(kj::mv(other))) {}
Parser& operator=(const Parser& other) { wrapper = other.wrapper->clone(); }
Parser& operator=(Parser&& other) { wrapper = kj::mv(other.wrapper); }
// Always inline in the hopes that this allows branch prediction to kick in so the virtual call
// doesn't hurt so much.
inline Maybe<Output> operator()(Input& input) const __attribute__((always_inline)) {
return (*wrapper)(input);
}
private:
Own<ParserWrapper<Input, Output>> wrapper;
template <typename Other>
struct WrapperImpl: public ParserWrapper<Input, Output> {
WrapperImpl(Other&& impl): impl(kj::mv(impl)) {};
~WrapperImpl() {}
Maybe<Output> operator()(Input& input) const {
return impl(input);
}
Own<ParserWrapper<Input, Output>> clone() {
return heap<WrapperImpl>(*this);
}
Other impl;
};
};
template <typename ParserImpl>
Parser<typename ExtractParserType<ParserImpl>::InputType,
typename ExtractParserType<ParserImpl>::OutputType>
wrap(ParserImpl&& impl) {
typedef typename ExtractParserType<ParserImpl>::InputType Input;
typedef typename ExtractParserType<ParserImpl>::OutputType Output;
return Parser<Input, Output>(kj::mv(impl));
}
template <typename SubParser>
class ParserRef {
public:
explicit ParserRef(const SubParser& parser): parser(&parser) {}
Maybe<typename ExtractParserType<SubParser>::OutputType> operator()(
typename ExtractParserType<SubParser>::InputType& input) const {
return (*parser)(input);
}
private:
const SubParser* parser;
};
template <typename SubParser>
ParserRef<Decay<SubParser>> ref(const SubParser& impl) {
return ParserRef<Decay<SubParser>>(impl);
}
template <typename T>
struct MaybeRef {
typedef Decay<T> Type;
template <typename U>
static Type from(U&& parser) {
return static_cast<Type&&>(parser);
}
};
template <typename T>
struct MaybeRef<T&> {
typedef ParserRef<Decay<T>> Type;
template <typename U>
static Type from(U& parser) {
return parse::ref(parser);
}
};
template <template <typename SubParser> class WrapperParser>
struct WrapperParserConstructor {
template <typename SubParser, typename... Args>
WrapperParser<typename MaybeRef<SubParser>::Type> operator()(
SubParser&& subParser, Args&&... args) {
return WrapperParser<typename MaybeRef<SubParser>::Type>(
MaybeRef<SubParser>::from(subParser),
kj::fwd(args)...);
}
};
// -------------------------------------------------------------------
// ExactElementParser
// Output = Void
template <typename Input>
class ExactElementParser {
public:
explicit ExactElementParser(typename Input::ElementType&& expected): expected(expected) {}
virtual Maybe<Void> operator()(Input& input) const {
if (input.atEnd() || input.current() != expected) {
return nullptr;
} else {
input.next();
return Void();
}
}
private:
typename Input::ElementType expected;
};
template <typename Input>
ExactElementParser<Input> exactElement(typename Input::ElementType&& expected) {
return ExactElementParser<Decay<Input>>(kj::mv(expected));
}
// -------------------------------------------------------------------
// SequenceParser
// Output = Flattened Tuple of outputs of sub-parsers.
template <typename Input, typename... SubParsers> class SequenceParser;
template <typename Input, typename FirstSubParser, typename... SubParsers>
class SequenceParser<Input, FirstSubParser, SubParsers...> {
public:
template <typename T, typename... U>
explicit SequenceParser(T&& firstSubParser, U&&... rest)
: first(kj::fwd<T>(firstSubParser)), rest(kj::fwd<U>(rest)...) {}
auto operator()(Input& input) const ->
Maybe<decltype(tuple(
instance<typename ExtractParserType<FirstSubParser>::OutputType>(),
instance<typename ExtractParserType<SubParsers>::OutputType>()...))> {
return parseNext(input);
}
template <typename... InitialParams>
auto parseNext(Input& input, InitialParams&&... initialParams) const ->
Maybe<decltype(tuple(
kj::fwd<InitialParams>(initialParams)...,
instance<typename ExtractParserType<FirstSubParser>::OutputType>(),
instance<typename ExtractParserType<SubParsers>::OutputType>()...))> {
KJ_IF_MAYBE(firstResult, first(input)) {
return rest.parseNext(input, kj::fwd<InitialParams>(initialParams)...,
kj::mv(*firstResult));
} else {
return nullptr;
}
}
private:
FirstSubParser first;
SequenceParser<Input, SubParsers...> rest;
};
template <typename Input>
class SequenceParser<Input> {
public:
Maybe<Void> operator()(Input& input) const {
return parseNext(input);
}
template <typename... Params>
auto parseNext(Input& input, Params&&... params) const ->
Maybe<decltype(tuple(kj::fwd<Params>(params)...))> {
return tuple(kj::fwd<Params>(params)...);
}
};
template <typename FirstSubParser, typename... MoreSubParsers>
SequenceParser<typename ExtractParserType<FirstSubParser>::InputType,
typename MaybeRef<FirstSubParser>::Type,
typename MaybeRef<MoreSubParsers>::Type...>
sequence(FirstSubParser&& first, MoreSubParsers&&... rest) {
return SequenceParser<typename ExtractParserType<FirstSubParser>::InputType,
typename MaybeRef<FirstSubParser>::Type,
typename MaybeRef<MoreSubParsers>::Type...>(
MaybeRef<FirstSubParser>::from(first), MaybeRef<MoreSubParsers>::from(rest)...);
}
// -------------------------------------------------------------------
// RepeatedParser
// Output = Array of output of sub-parser.
template <typename T>
class Vector {
// Similar to std::vector, but based on KJ framework.
//
// This implementation always uses move constructors when growing the backing array. If the
// move constructor throws, the Vector is left in an inconsistent state. This is acceptable
// under KJ exception theory which assumes that exceptions leave things in inconsistent states.
public:
inline Vector() = default;
inline explicit Vector(size_t capacity): builder(heapArrayBuilder<T>(capacity)) {}
inline operator ArrayPtr<T>() { return builder; }
inline operator ArrayPtr<const T>() const { return builder; }
inline ArrayPtr<T> asPtr() { return builder.asPtr(); }
inline ArrayPtr<const T> asPtr() const { return builder.asPtr(); }
inline size_t size() const { return builder.size(); }
inline bool empty() const { return size() == 0; }
inline size_t capacity() const { return builder.capacity(); }
inline T& operator[](size_t index) const { return builder[index]; }
inline const T* begin() const { return builder.begin(); }
inline const T* end() const { return builder.end(); }
inline const T& front() const { return builder.front(); }
inline const T& back() const { return builder.back(); }
inline T* begin() { return builder.begin(); }
inline T* end() { return builder.end(); }
inline T& front() { return builder.front(); }
inline T& back() { return builder.back(); }
template <typename... Params>
inline void add(Params&&... params) {
if (builder.isFull()) grow();
builder.add(kj::fwd<Params>(params)...);
}
private:
ArrayBuilder<T> builder;
void grow() {
size_t newSize = capacity() == 0 ? 4 : capacity() * 2;
ArrayBuilder<T> newBuilder = heapArrayBuilder<T>(newSize);
for (T& element: builder) {
newBuilder.add(kj::mv(element));
}
builder = kj::mv(newBuilder);
}
};
template <typename SubParser, bool atLeastOne>
class RepeatedParser {
public:
explicit RepeatedParser(SubParser&& subParser)
: subParser(kj::mv(subParser)) {}
Maybe<Vector<typename ExtractParserType<SubParser>::OutputType>> operator()(
typename ExtractParserType<SubParser>::InputType& input) const {
typedef Vector<typename ExtractParserType<SubParser>::OutputType> Results;
Results results;
while (!input.atEnd()) {
typename ExtractParserType<SubParser>::InputType subInput(input);
KJ_IF_MAYBE(subResult, subParser(subInput)) {
subInput.advanceParent();
results.add(kj::mv(*subResult));
} else {
break;
}
}
if (atLeastOne && results.empty()) {
return nullptr;
}
return kj::mv(results);
}
private:
SubParser subParser;
};
template <typename SubParser>
RepeatedParser<typename MaybeRef<SubParser>::Type, false>
repeated(SubParser&& subParser) {
return RepeatedParser<typename MaybeRef<SubParser>::Type, false>(
MaybeRef<SubParser>::from(subParser));
}
template <typename SubParser>
RepeatedParser<typename MaybeRef<SubParser>::Type, true>
oneOrMore(SubParser&& subParser) {
return RepeatedParser<typename MaybeRef<SubParser>::Type, true>(
MaybeRef<SubParser>::from(subParser));
}
// -------------------------------------------------------------------
// OptionalParser
// Output = Maybe<output of sub-parser>
template <typename SubParser>
class OptionalParser {
public:
explicit OptionalParser(SubParser&& subParser)
: subParser(kj::mv(subParser)) {}
Maybe<Maybe<typename ExtractParserType<SubParser>::OutputType>> operator()(
typename ExtractParserType<SubParser>::InputType& input) const {
typedef Maybe<typename ExtractParserType<SubParser>::OutputType> Result;
typename ExtractParserType<SubParser>::InputType subInput(input);
auto subResult = subParser(subInput);
if (subResult == nullptr) {
return Result(nullptr);
} else {
subInput.advanceParent();
return Result(kj::mv(*subResult));
}
}
private:
SubParser subParser;
};
template <typename SubParser>
OptionalParser<typename MaybeRef<SubParser>::Type>
optional(SubParser&& subParser) {
return OptionalParser<typename MaybeRef<SubParser>::Type>(
MaybeRef<SubParser>::from(subParser));
}
// -------------------------------------------------------------------
// OneOfParser
// All SubParsers must have same output type, which becomes the output type of the
// OneOfParser.
template <typename Input, typename Output, typename... SubParsers>
class OneOfParser;
template <typename Input, typename Output, typename FirstSubParser, typename... SubParsers>
class OneOfParser<Input, Output, FirstSubParser, SubParsers...> {
public:
template <typename T, typename... U>
explicit OneOfParser(T&& firstSubParser, U&&... rest)
: first(kj::fwd<T>(firstSubParser)), rest(kj::fwd<U>(rest)...) {}
Maybe<Output> operator()(Input& input) const {
{
Input subInput(input);
Maybe<Output> firstResult = first(subInput);
if (firstResult != nullptr) {
// MAYBE: Should we try parsing with "rest" in order to check for ambiguities?
subInput.advanceParent();
return kj::mv(firstResult);
}
}
// Hoping for some tail recursion here...
return rest(input);
}
private:
FirstSubParser first;
OneOfParser<Input, Output, SubParsers...> rest;
};
template <typename Input, typename Output>
class OneOfParser<Input, Output> {
public:
Maybe<Output> operator()(Input& input) const {
return nullptr;
}
};
template <typename FirstSubParser, typename... MoreSubParsers>
OneOfParser<typename ExtractParserType<FirstSubParser>::InputType,
typename ExtractParserType<FirstSubParser>::OutputType,
typename MaybeRef<FirstSubParser>::Type,
typename MaybeRef<MoreSubParsers>::Type...>
oneOf(FirstSubParser&& first, MoreSubParsers&&... rest) {
return OneOfParser<typename ExtractParserType<FirstSubParser>::InputType,
typename ExtractParserType<FirstSubParser>::OutputType,
typename MaybeRef<FirstSubParser>::Type,
typename MaybeRef<MoreSubParsers>::Type...>(
MaybeRef<FirstSubParser>::from(first), MaybeRef<MoreSubParsers>::from(rest)...);
}
// -------------------------------------------------------------------
// TransformParser
// Output = Result of applying transform functor to input value. If input is a tuple, it is
// unpacked to form the transformation parameters.
template <typename Position>
struct Span {
public:
inline const Position& begin() { return begin_; }
inline const Position& end() { return end_; }
Span() = default;
inline Span(Position&& begin, Position&& end): begin_(mv(begin)), end_(mv(end)) {}
private:
Position begin_;
Position end_;
};
template <typename SubParser, typename Transform>
class TransformParser {
public:
explicit TransformParser(SubParser&& subParser, Transform&& transform)
: subParser(kj::mv(subParser)), transform(kj::mv(transform)) {}
typedef typename ExtractParserType<SubParser>::InputType InputType;
typedef Decay<decltype(instance<InputType>().getPosition())> Position;
typedef typename ExtractParserType<SubParser>::OutputType SubOutput;
typedef decltype(applyTuple(instance<Transform&>(), instance<SubOutput&&>(),
instance<Span<Position>>())) Output;
Maybe<Output> operator()(InputType& input) const {
auto start = input.getPosition();
KJ_IF_MAYBE(subResult, subParser(input)) {
return applyTuple(transform, kj::mv(*subResult),
Span<Position>(kj::mv(start), input.getPosition()));
} else {
return nullptr;
}
}
private:
SubParser subParser;
Transform transform;
};
template <typename SubParser, typename Transform>
TransformParser<typename MaybeRef<SubParser>::Type, Decay<Transform>>
transform(SubParser&& subParser, Transform&& transform) {
return TransformParser<typename MaybeRef<SubParser>::Type, Decay<Transform>>(
MaybeRef<SubParser>::from(subParser), kj::fwd<Transform>(transform));
}
// -------------------------------------------------------------------
// AcceptIfParser
// Output = Same as SubParser
template <typename SubParser, typename Condition>
class AcceptIfParser {
public:
explicit AcceptIfParser(SubParser&& subParser, Condition&& condition)
: subParser(kj::mv(subParser)), condition(kj::mv(condition)) {}
Maybe<typename ExtractParserType<SubParser>::OutputType>
operator()(typename ExtractParserType<SubParser>::InputType& input) const {
Maybe<typename ExtractParserType<SubParser>::OutputType> subResult = subParser(input);
if (subResult && !condition(*subResult)) {
subResult = nullptr;
}
return subResult;
}
private:
SubParser subParser;
Condition condition;
};
template <typename SubParser, typename Condition>
AcceptIfParser<typename MaybeRef<SubParser>::Type, Decay<Condition>>
acceptIf(SubParser&& subParser, Condition&& condition) {
return AcceptIfParser<typename MaybeRef<SubParser>::Type, Decay<Condition>>(
MaybeRef<SubParser>::from(subParser), kj::fwd<Condition>(condition));
}
// -------------------------------------------------------------------
// EndOfInputParser
// Output = Void, only succeeds if at end-of-input
template <typename Input>
class EndOfInputParser {
public:
Maybe<Void> operator()(Input& input) const {
if (input.atEnd()) {
return Void();
} else {
return nullptr;
}
}
};
template <typename T>
EndOfInputParser<T> endOfInput() {
return EndOfInputParser<T>();
}
} // namespace parse
} // namespace kj
#endif // KJ_PARSER_H_
...@@ -48,6 +48,7 @@ public: ...@@ -48,6 +48,7 @@ public:
inline StringPtr(const char* value, size_t size): content(value, size + 1) { inline StringPtr(const char* value, size_t size): content(value, size + 1) {
KJ_IREQUIRE(value[size] == '\0', "StringPtr must be NUL-terminated."); KJ_IREQUIRE(value[size] == '\0', "StringPtr must be NUL-terminated.");
} }
inline StringPtr(const char* begin, const char* end): StringPtr(begin, end - begin) {}
inline StringPtr(const String& value); inline StringPtr(const String& value);
inline operator ArrayPtr<const char>() const; inline operator ArrayPtr<const char>() const;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment