aboutsummaryrefslogtreecommitdiff
path: root/src/openvic-dataloader/v2script/SimpleGrammar.hpp
blob: c91935eace15b86bad6a1969ec5e2eecfad05e8d (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
#pragma once

#include <memory>
#include <string>
#include <vector>

#include <openvic-dataloader/v2script/AbstractSyntaxTree.hpp>

#include <lexy/callback.hpp>
#include <lexy/dsl.hpp>

#include "detail/LexyLitRange.hpp"

// Grammar Definitions //
namespace ovdl::v2script::grammar {
   // Declared up front because the assignment rules below recurse into it
   // before its definition appears.
   struct StatementListBlock;

   // Characters skipped between tokens: the ASCII blank and newline classes.
   static constexpr auto whitespace_specifier =
      lexy::dsl::ascii::blank / lexy::dsl::ascii::newline;

   // A comment begins with '#' and extends through the next newline,
   // or to the end of input when no newline follows.
   static constexpr auto comment_specifier =
      LEXY_LIT("#") >> lexy::dsl::until(lexy::dsl::newline).or_eof();

   static constexpr auto data_specifier =
      lexy::dsl::ascii::alpha_digit_underscore /
      LEXY_ASCII_ONE_OF("%&'") / lexy::dsl::lit_c<0x2B> / LEXY_ASCII_ONE_OF("-.") /
      lexy::dsl::ascii::digit / lexy::dsl::lit_c<0x3A> /
      lexy::dsl::lit_c<0x40> / lexy::dsl::ascii::upper / lexy::dsl::lit_c<0x5F> /
      lexy::dsl::ascii::lower / lexy::dsl::lit_b<0x8A> / lexy::dsl::lit_b<0x8C> / lexy::dsl::lit_b<0x8E> /
      lexy::dsl::lit_b<0x92> / lexy::dsl::lit_b<0x97> / lexy::dsl::lit_b<0x9A> / lexy::dsl::lit_b<0x9C> / lexy::dsl::lit_b<0x9E> / lexy::dsl::lit_b<0x9F> /
      lexy::dsl::lit_b<0xC0> /
      ovdl::detail::lexydsl::make_range<0xC0, 0xD6>() / ovdl::detail::lexydsl::make_range<0xD8, 0xF6>() / ovdl::detail::lexydsl::make_range<0xF8, 0xFF>();

   static constexpr auto data_char_class = LEXY_CHAR_CLASS("DataSpecifier", data_specifier);

   // An unquoted token made of DataSpecifier characters, produced as an
   // ast::IdentifierNode.
   struct Identifier {
      static constexpr auto rule =
         lexy::dsl::identifier(data_char_class);

      // The matched text is converted to a std::string, which is then used to
      // construct the IdentifierNode handed back as an ast::NodePtr.
      static constexpr auto value =
         lexy::as_string<std::string> |
         lexy::new_<ast::IdentifierNode, ast::NodePtr>;
   };

   // A quoted string literal, produced as an ast::StringNode.
   struct StringExpression {
      // Characters that may follow a backslash inside a string, each mapped to
      // the character the escape sequence stands for.
      static constexpr auto escaped_symbols =
         lexy::symbol_table<char> //
            .map<'"'>('"')
            .map<'\''>('\'')
            .map<'\\'>('\\')
            .map<'/'>('/')
            .map<'b'>('\b')
            .map<'f'>('\f')
            .map<'n'>('\n')
            .map<'r'>('\r')
            .map<'t'>('\t');

      static constexpr auto rule = [] {
         // Content accepted verbatim: the 0x20..0xFF range with the ASCII
         // control characters removed.
         auto plain_char = ovdl::detail::lexydsl::make_range<0x20, 0xFF>() - lexy::dsl::ascii::control;

         // A backslash starts an escape sequence, which must be one of the
         // entries in escaped_symbols; no other escape forms are defined here.
         return lexy::dsl::quoted(plain_char, lexy::dsl::backslash_escape.symbol<escaped_symbols>());
      }();

      // The string content is collected into a std::string, which is then used
      // to construct the StringNode handed back as an ast::NodePtr.
      static constexpr auto value =
         lexy::as_string<std::string> >>
         lexy::new_<ast::StringNode, ast::NodePtr>;
   };

   // `name = value`, where value is an Identifier, a StringExpression or a
   // StatementListBlock. The `= value` part is mandatory in this production.
   struct SimpleAssignmentStatement {
      static constexpr auto rule =
         lexy::dsl::p<Identifier> >>
         lexy::dsl::equal_sign +
            (lexy::dsl::p<Identifier> | lexy::dsl::p<StringExpression> | lexy::dsl::recurse_branch<StatementListBlock>);

      // Combines the parsed name and initializer into an ast::AssignNode.
      static constexpr auto value = lexy::callback<ast::NodePtr>(
         [](auto name, auto&& initializer) {
            // Call is namespace-qualified so it does not depend on argument-dependent
            // lookup of a function template with explicit template arguments.
            return ast::make_node_ptr<ast::AssignNode>(LEXY_MOV(name), LEXY_MOV(initializer));
         });
   };

   // One statement inside a file or block. Accepted forms:
   //   name = value   (value: Identifier, StringExpression or StatementListBlock)
   //   name           (no '=' follows; the production ends right after the name)
   //   "string"       (a bare StringExpression)
   struct AssignmentStatement {
      static constexpr auto rule =
         lexy::dsl::p<Identifier> >>
            (lexy::dsl::equal_sign >>
                  (lexy::dsl::p<Identifier> | lexy::dsl::p<StringExpression> | lexy::dsl::recurse_branch<StatementListBlock>) |
               lexy::dsl::else_ >> lexy::dsl::return_) |
         lexy::dsl::p<StringExpression>;

      static constexpr auto value = lexy::callback<ast::NodePtr>(
         // A lone value (bare name or bare string) is passed through unchanged.
         [](auto name, lexy::nullopt = {}) {
            return LEXY_MOV(name);
         },
         // A name plus an initializer becomes an ast::AssignNode.
         [](auto name, auto&& initializer) {
            // Call is namespace-qualified so it does not depend on argument-dependent
            // lookup of a function template with explicit template arguments.
            return ast::make_node_ptr<ast::AssignNode>(LEXY_MOV(name), LEXY_MOV(initializer));
         });
   };

   // A `{ ... }` block: an optional list of AssignmentStatement followed by an
   // optional ';' before the closing brace. Produced as an ast::ListNode.
   struct StatementListBlock {
      static constexpr auto rule =
         lexy::dsl::curly_bracketed(
            lexy::dsl::opt(lexy::dsl::list(lexy::dsl::p<AssignmentStatement>)) + lexy::dsl::opt(lexy::dsl::semicolon));

      // Statements are gathered into a std::vector<ast::NodePtr>; the callback
      // then wraps whatever was produced in a ListNode. All overloads use the
      // namespace-qualified ast::make_node_ptr so they resolve the same way.
      static constexpr auto value =
         lexy::as_list<std::vector<ast::NodePtr>> >>
         lexy::callback<ast::NodePtr>(
            // No statement list was produced: build an empty ListNode.
            [](lexy::nullopt = {}, lexy::nullopt = {}) {
               return ast::make_node_ptr<ast::ListNode>();
            },
            // A statement list was produced: hand it over to the ListNode.
            [](auto&& list, lexy::nullopt = {}) {
               return ast::make_node_ptr<ast::ListNode>(LEXY_MOV(list));
            },
            // NOTE(review): this overload passes the list as an lvalue (no move);
            // confirm whether it is ever selected and whether the list is copyable.
            [](auto& list) {
               return ast::make_node_ptr<ast::ListNode>(list);
            });
   };

   // Top-level production: a list of AssignmentStatement terminated by the end
   // of input, produced as an ast::FileNode.
   struct File {
      // Whitespace and '#' comments may appear between individual tokens.
      static constexpr auto whitespace = whitespace_specifier | comment_specifier;

      static constexpr auto rule =
         lexy::dsl::terminator(lexy::dsl::eof).list(lexy::dsl::p<AssignmentStatement>);

      // Statements are gathered into a std::vector<ast::NodePtr>, which is then
      // used to construct the FileNode handed back as an ast::NodePtr.
      static constexpr auto value =
         lexy::as_list<std::vector<ast::NodePtr>> >>
         lexy::new_<ast::FileNode, ast::NodePtr>;
   };
}