catala/compiler/surface/parser.mly

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

735 lines
19 KiB
OCaml
Raw Normal View History

(*
This file is part of the Catala compiler, a specification language for tax and social benefits
computation rules.
Copyright (C) 2020 Inria, contributors: Denis Merigoux <denis.merigoux@inria.fr>,
Emile Rolley <emile.rolley@tuta.io>
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*)
%{
(* Brings the contents of [Catala_utils] into scope for the semantic actions. *)
open Catala_utils
%}

(* The generated parser is parameterised by a [Localisation] module whose
   [lex_builtin] tells whether an identifier string denotes a builtin
   expression (it is called by [atomic_expression] and [ident]). *)
%parameter<Localisation: sig
  val lex_builtin: string -> Ast.builtin_expression option
end>

(* Single entry point of the grammar. *)
%type <Ast.source_file> source_file
%start source_file
(* The token is returned for every line of law text, make them right-associative
so that we concat them efficiently as much as possible. *)
%right LAW_TEXT
%%
(* Base types: one of the primitive type keywords, or a constructor kept as a
   [Named] type. Each alternative is paired with the position of the whole
   production. *)
let typ_base :=
| INTEGER ; { (Integer, Pos.from_lpos $sloc) }
| BOOLEAN ; { (Boolean, Pos.from_lpos $sloc) }
| MONEY ; { (Money, Pos.from_lpos $sloc) }
| DURATION ; { (Duration, Pos.from_lpos $sloc) }
| TEXT ; { (Text, Pos.from_lpos $sloc) }
| DECIMAL ; { (Decimal, Pos.from_lpos $sloc) }
| DATE ; { (Date, Pos.from_lpos $sloc) }
| c = constructor ; {
  (* Only the constructor's name is kept; its own position is replaced by the
     position computed here. *)
  let (s, _) = c in
  (Named s, Pos.from_lpos $sloc)
}
(* A type: either a base type wrapped in [Primitive] (keeping the position
   computed by [typ_base]), or COLLECTION followed by a recursively parsed
   element type. *)
let typ :=
| t = typ_base ; {
  let t, loc = t in
  (Primitive t, loc)
}
| COLLECTION ; t = typ ; {
  (Collection t, Pos.from_lpos $sloc)
}
2020-03-08 07:01:26 +03:00
(* Qualified identifier: a non-empty, DOT-separated list of identifiers,
   paired with the position of the whole list. *)
let qident :=
| b = separated_nonempty_list(DOT, ident) ; {
  (b, Pos.from_lpos $sloc)
}
(* Atomic expressions: an identifier (resolved to a builtin when
   [Localisation.lex_builtin] recognises it), a literal, or a parenthesised
   expression. *)
let atomic_expression :=
| q = IDENT ; {
  (match Localisation.lex_builtin q with
   | Some b -> Builtin b
   | None -> Ident q),
  Pos.from_lpos $sloc }
| l = literal ; { let (l, l_pos) = l in (Literal l, l_pos) }
  (* Parentheses only group: the inner expression is returned unchanged. *)
| LPAREN ; e = expression ; RPAREN ; { e }
(* Small expressions: atomic expressions, dotted accesses (with an optional
   constructor qualifier before the final identifier), the CARDINAL, DECIMAL
   and MONEY builtins, and array literals. *)
let small_expression :=
| ~ = atomic_expression ; <>
| e = small_expression ; DOT ; c = option(terminated(constructor,DOT)) ; i = ident ; {
  (Dotted (e, c, i), Pos.from_lpos $sloc)
}
| CARDINAL ; {
  (Builtin Cardinal, Pos.from_lpos $sloc)
}
  (* In expression position the DECIMAL and MONEY tokens yield the
     [ToDecimal] and [ToMoney] builtins. *)
| DECIMAL ; { Builtin ToDecimal, Pos.from_lpos $sloc }
| MONEY ; { Builtin ToMoney, Pos.from_lpos $sloc }
  (* Array literal: possibly empty, SEMICOLON-separated, between square
     brackets. *)
| LSQUARE ; l = separated_list(SEMICOLON, expression) ; RSQUARE ; {
  (ArrayLit l, Pos.from_lpos $sloc)
}
(* One [field : expression] binding, as used in structure literals and scope
   call arguments. *)
let struct_content_field :=
| field = ident ; COLON ; e = logical_expression ; {
  (field, e)
}
(* Payload of an enum injection: CONTENT followed by a small expression,
   which is returned as is. *)
let enum_inject_content :=
| CONTENT ; ~ = small_expression ; <>
2020-03-08 07:01:26 +03:00
(* Body of a structure literal: a non-empty list of ALT-prefixed field
   bindings enclosed between LBRACKET and RBRACKET. *)
let struct_inject_content :=
| LBRACKET ;
  bindings = nonempty_list(preceded(ALT, struct_content_field)) ;
  RBRACKET ; { bindings }
(* Enum injection or structure literal. *)
let struct_or_enum_inject :=
| first = constructor ;
  second = option(preceded(DOT, constructor)) ;
  payload = option(enum_inject_content) ; {
  (* Logically the qualifying enum name is the optional part, but writing the
     grammar that way causes shift/reduce conflicts. So the second
     constructor is the optional one, and the roles are swapped here. *)
  let pos = Pos.from_lpos $sloc in
  match second with
  | Some case -> (EnumInject (Some first, case, payload), pos)
  | None -> (EnumInject (None, first, payload), pos)
}
| name = constructor ;
  fields = struct_inject_content ; {
  (StructLit (name, fields), Pos.from_lpos $sloc)
}
(* Primitive expressions: small expressions plus enum injections and
   structure literals. *)
let primitive_expression :=
| ~ = small_expression ; <>
| e = struct_or_enum_inject ; {
  e
}
(* Numeric literal: an INT_LITERAL becomes [Int], and the two components
   carried by a DECIMAL_LITERAL become [Dec]. *)
let num_literal :=
| n = INT_LITERAL ; { Int n, Pos.from_lpos $sloc }
| dec = DECIMAL_LITERAL ; {
  let (left, right) = dec in
  Dec (left, right), Pos.from_lpos $sloc
}
2020-04-14 20:13:20 +03:00
(* Unit that may follow a numeric literal (see [literal]). *)
let unit_literal :=
| PERCENT ; { Percent, Pos.from_lpos $sloc }
| YEAR ; { Year, Pos.from_lpos $sloc }
| MONTH ; { Month, Pos.from_lpos $sloc }
| DAY ; { Day, Pos.from_lpos $sloc }
2020-04-11 19:16:15 +03:00
(* Literals: a number with an optional unit, a money amount, a date enclosed
   between two VERTICAL tokens, or a boolean. *)
let literal :=
| l = num_literal; u = option(unit_literal) ; {
  (LNumber (l, u), Pos.from_lpos $sloc)
}
| money = MONEY_AMOUNT ; {
  let (units, cents) = money in
  (LMoneyAmount {
    money_amount_units = units;
    money_amount_cents = cents;
  }, Pos.from_lpos $sloc)
}
| VERTICAL ; d = DATE_LITERAL ; VERTICAL ; {
  (* [d] is deliberately shadowed: token payload first, then the day. *)
  let (y,m,d) = d in
  (LDate {
    literal_date_year = y;
    literal_date_month = m;
    literal_date_day = d;
  }, Pos.from_lpos $sloc)
}
| TRUE ; { (LBool true, Pos.from_lpos $sloc) }
| FALSE ; { (LBool false, Pos.from_lpos $sloc) }
(* Comparison operators. The ordering operators are built with the [KPoly]
   kind; equality and disequality take no kind. *)
let compare_op :=
| LESSER ; { Lt KPoly, Pos.from_lpos $sloc }
| LESSER_EQUAL ; { Lte KPoly, Pos.from_lpos $sloc }
| GREATER ; { Gt KPoly, Pos.from_lpos $sloc }
| GREATER_EQUAL ; { Gte KPoly, Pos.from_lpos $sloc }
| EQUAL ; { Eq, Pos.from_lpos $sloc }
| NOT_EQUAL ; { Neq, Pos.from_lpos $sloc }
(* Arguments of a scope call: WITH_V followed by a possibly empty list of
   ALT-prefixed field bindings between LBRACKET and RBRACKET. *)
let scope_call_args :=
| WITH_V ; LBRACKET ;
  args = list(preceded(ALT, struct_content_field)) ;
  RBRACKET ; { args }
(* Extremum selector: [true] for MAXIMUM, [false] for MINIMUM. The boolean
   is used as the [max] field of the aggregation operators. *)
let minmax :=
| MAXIMUM ; { true }
| MINIMUM ; { false }
2022-12-12 18:02:07 +03:00
(* Base expressions: primitive expressions, function calls, scope calls,
   constructor tests, collection membership and the collection operators
   sum, map and minimum/maximum. *)
let base_expression :=
| ~ = primitive_expression ; <>
  (* Function application: [e1 OF e2]. *)
| e1 = small_expression ;
  OF ;
  e2 = base_expression ; {
  (FunCall (e1, e2), Pos.from_lpos $sloc)
}
  (* Scope call: omitted arguments are treated as an empty list. *)
| OUTPUT ; OF ;
  c = constructor ;
  fields = option(scope_call_args) ; {
  let fields = Option.value ~default:[] fields in
  (ScopeCall (c, fields), Pos.from_lpos $sloc)
}
  (* Constructor test: the pattern gets the position of the whole
     production. *)
| e = primitive_expression ;
  WITH ; c = constructor_binding ; {
  (TestMatchCase (e, (c, Pos.from_lpos $sloc)), Pos.from_lpos $sloc)
}
  (* [e1 CONTAINS e2]: note that [MemCollection] takes [e2] first. *)
| e1 = primitive_expression ;
  CONTAINS ;
  e2 = base_expression ; {
  (MemCollection (e2, e1), Pos.from_lpos $sloc)
}
| SUM ; typ = typ_base ;
  OF ; coll = base_expression ; {
  CollectionOp (AggregateSum { typ = Marked.unmark typ }, coll), Pos.from_lpos $sloc
}
  (* Map: [f FOR i IN coll]. The record field [f] holds the pair
     (bound identifier, body expression). *)
| f = primitive_expression ;
  FOR ; i = ident ;
  IN ; coll = base_expression ; {
  CollectionOp (Map {f = (i, f)}, coll), Pos.from_lpos $sloc
}
  (* Extremum of a collection, with a mandatory default expression. *)
| max = minmax ;
  OF ; coll = base_expression ;
  OR ; IF ; COLLECTION ; IS ; EMPTY ; THEN ;
  default = base_expression ; {
  CollectionOp (AggregateExtremum { max; default }, coll), Pos.from_lpos $sloc
}
2020-03-08 07:12:12 +03:00
(* Unary operators: NOT, and MINUS applied to the payload [kind] carried by
   the MINUS token. *)
let unop :=
| NOT ; { Not, Pos.from_lpos $sloc }
| kind = MINUS ; { Minus kind, Pos.from_lpos $sloc }
(* A base expression preceded by any number of unary operators. *)
let unop_expression :=
| ~ = base_expression ; <>
| op = unop ; e = unop_expression ; {
  (Unop (op, e), Pos.from_lpos $sloc)
}
(* Multiplicative operators. Each token carries a payload [kind] that is
   passed on to the operator constructor. *)
let mult_op :=
| kind = MULT ; { Mult kind, Pos.from_lpos $sloc }
| kind = DIV ; { Div kind, Pos.from_lpos $sloc }
(* Multiplicative expressions. The rule is left-recursive, so chains of
   multiplications and divisions associate to the left. *)
let mult_expression :=
| ~ = unop_expression ; <>
| e1 = mult_expression ;
  binop = mult_op ;
  e2 = unop_expression ; {
  (Binop (binop, e1, e2), Pos.from_lpos $sloc)
}
2020-03-08 08:06:32 +03:00
(* Additive operators. PLUS and MINUS carry a payload [kind]; PLUSPLUS is
   concatenation and carries none. *)
let sum_op :=
| kind = PLUS ; { Add kind, Pos.from_lpos $sloc }
| kind = MINUS ; { Sub kind, Pos.from_lpos $sloc }
| PLUSPLUS ; { Concat, Pos.from_lpos $sloc }
(* Additive expressions. The rule is left-recursive, so chains of additive
   operators associate to the left. *)
let sum_expression :=
| ~ = mult_expression ; <>
| e1 = sum_expression ;
  binop = sum_op ;
  e2 = mult_expression ; {
  (Binop (binop, e1, e2), Pos.from_lpos $sloc)
}
(* Conjunction operator, paired with its position. *)
let logical_and_op :=
| AND ; { And, Pos.from_lpos $sloc }
2021-11-12 11:43:23 +03:00
(* Disjunction operators (inclusive and exclusive), paired with their
   position. *)
let logical_or_op :=
| OR ; { Or, Pos.from_lpos $sloc }
| XOR ; { Xor, Pos.from_lpos $sloc }
(* Comparisons between additive expressions. The rule is right-recursive, so
   a chain [a op b op c] is read as [a op (b op c)]. *)
let compare_expression :=
| ~ = sum_expression ; <>
| lhs = sum_expression ;
  op = compare_op ;
  rhs = compare_expression ; {
  Binop (op, lhs, rhs), Pos.from_lpos $sloc
}
(* Operand of the logical operators: currently just a comparison
   expression. *)
let logical_atom :=
| e = compare_expression ; { e }
2021-11-12 11:43:23 +03:00
(* Disjunctions (OR / XOR) of logical atoms. The rule is right-recursive, so
   chains associate to the right. *)
let logical_or_expression :=
| ~ = logical_atom ; <>
| e1 = logical_atom ;
  binop = logical_or_op ;
  e2 = logical_or_expression ; {
  (Binop (binop, e1, e2), Pos.from_lpos $sloc)
}
(* Conjunctions (AND) of disjunctions. The rule is right-recursive.
   NOTE(review): because AND is the outermost level, [a or b and c] is read
   as [(a or b) and c]. That is, OR/XOR bind tighter than AND, the reverse
   of the usual convention. Confirm this is intended. *)
let logical_expression :=
| ~ = logical_or_expression ; <>
| e1 = logical_or_expression ;
  binop = logical_and_op ;
  e2 = logical_expression ; {
  (Binop (binop, e1, e2), Pos.from_lpos $sloc)
}
(* A constructor, optionally followed by DOT and a second constructor.
   Returns [(None, c)] for a lone constructor and [(Some path, c)] when a
   second one follows. *)
let maybe_qualified_constructor :=
| head = constructor ;
  tail = option(preceded(DOT, constructor)) ; {
  match tail with
  | Some c -> (Some head, c)
  | None -> (None, head)
}
(* What may follow a constructor in a pattern: nothing, [OF ident] (a bound
   variable), or [OF] followed by further nested constructors. Returns the
   list of remaining constructors and the optional bound identifier.
   Mutually recursive with [constructor_binding]. *)
let optional_binding :=
| { ([], None)}
| OF ; i = ident ; {([], Some i)}
| OF ;
  c = maybe_qualified_constructor ;
  cs_and_i = constructor_binding ; {
  let (cs, i) = cs_and_i in
  (c::cs, i)
}
2020-03-08 08:49:29 +03:00
(* Constructor pattern: a possibly qualified constructor followed by an
   optional binding. The leading constructor is consed onto the constructors
   returned by [optional_binding]. *)
let constructor_binding :=
| head = maybe_qualified_constructor ;
  rest = optional_binding ; {
  let (others, binder) = rest in
  (head :: others, binder)
}
2020-03-08 08:06:32 +03:00
(* One arm of a pattern matching: a wildcard arm or a constructor pattern,
   each followed by COLON and the arm's expression. *)
let match_arm :=
| WILDCARD ; COLON ; body = logical_expression ; {
  WildCard body, Pos.from_lpos $sloc
}
| pattern = constructor_binding ; COLON ; body = logical_expression ; {
  let pos = Pos.from_lpos $sloc in
  (* DM 14/04/2020 : I can't have the $sloc in constructor_binding... so the
     pattern is given the position of the whole arm. *)
  (MatchCase {
    match_case_pattern = (pattern, pos);
    match_case_expr = body;
  }, pos)
}
2020-03-08 08:06:32 +03:00
(* A possibly empty sequence of ALT-prefixed match arms. The position
   returned by the recursive call is dropped and recomputed for the whole
   sequence. *)
let match_arms :=
| ALT ; arm = match_arm ; rest = match_arms ; {
  let (tail, _) = rest in
  (arm :: tail, Pos.from_lpos $sloc)
}
| { ([], Pos.from_lpos $sloc) }
2020-03-08 08:06:32 +03:00
(* Logical expressions plus the keyword-introduced constructs: existential
   and universal tests over a collection, pattern matching, conditionals and
   local definitions. *)
let let_expression :=
| ~ = logical_expression ; <>
  (* The [predicate] record field holds the pair (bound identifier,
     predicate expression). *)
| EXISTS ; i = ident ;
  IN ; coll = compare_expression ;
  SUCH ; THAT ; predicate = compare_expression ; {
  CollectionOp (Exists {predicate = (i, predicate)}, coll), Pos.from_lpos $sloc
}
| FOR ; ALL ; i = ident ;
  IN ; coll = compare_expression ;
  WE_HAVE ; predicate = compare_expression ; {
  CollectionOp (Forall {predicate = (i, predicate)}, coll), Pos.from_lpos $sloc
}
| MATCH ; e = primitive_expression ;
  WITH ; arms = match_arms ; {
  (MatchWith (e, arms), Pos.from_lpos $sloc)
}
| IF ; e1 = let_expression ;
  THEN ; e2 = let_expression ;
  ELSE ; e3 = let_expression ; {
  (IfThenElse (e1, e2, e3), Pos.from_lpos $sloc)
}
| LET ; id = ident ;
  DEFINED_AS ; e1 = let_expression ;
  IN ; e2 = let_expression ; {
  (LetIn (id, e1, e2), Pos.from_lpos $sloc)
}
2022-12-12 18:02:07 +03:00
(* Top-level expressions: [let_expression] plus the two forms that start
   with a bare identifier, namely collection filtering and arg-min/arg-max
   with a default expression. *)
let expression :=
| ~ = let_expression ; <>
  (* Filter. The [f] record field holds the pair (bound identifier,
     predicate expression). *)
| i = ident ;
  IN ; coll = compare_expression ;
  SUCH ; THAT ; f = compare_expression ; {
  CollectionOp (Filter {f = (i, f)}, coll), Pos.from_lpos $sloc
}
| i = ident ;
  IN ; coll = compare_expression ;
  SUCH ; THAT ; f = compare_expression ;
  IS ; max = minmax ;
  OR ; IF ; COLLECTION ; IS ; EMPTY ; THEN ; default = expression ; {
  CollectionOp (AggregateArgExtremum { max; default; f = (i, f) }, coll),
  Pos.from_lpos $sloc
}
(* A condition: UNDER_CONDITION followed by an expression, which is returned
   as is. *)
let condition :=
| UNDER_CONDITION ; ~ = expression ; <>
2020-03-08 07:01:26 +03:00
(* A condition followed by the CONSEQUENCE keyword. Only the condition is
   returned. *)
let condition_consequence :=
| ~ = condition ; CONSEQUENCE ; <>
(* Head of a rule: the qualified name being defined and its optional
   parameter. *)
let rule_expr :=
| name = qident ;
  param = option(definition_parameters) ; {
  (name, param)
}
2020-04-14 20:16:40 +03:00
(* Consequence of a rule: FILLED yields [true], NOT FILLED yields [false].
   The boolean is paired with the position of the production. *)
let rule_consequence :=
| flag = option(NOT); FILLED ; {
  (* The consequence is positive exactly when no NOT precedes FILLED. *)
  (Option.is_none flag, Pos.from_lpos $sloc)
}
2020-08-07 11:57:57 +03:00
(* A rule: optional label and exception marker, RULE, the name with its
   optional parameter, an optional condition, an optional state, and the
   consequence. Returns the rule record paired with the raw [$sloc]. *)
let rule :=
| label = option(label) ;
  except = option(exception_to) ;
  RULE ;
  name_and_param = rule_expr ;
  cond = option(condition_consequence) ;
  state = option(state) ;
  consequence = rule_consequence ; {
  let (name, param_applied) = name_and_param in
  (* The fresh rule identifier is named after the dot-joined components of
     the qualified name. *)
  let dotted_name =
    name |> Marked.unmark |> List.map Marked.unmark |> String.concat "."
  in
  {
    rule_label = label;
    (* A rule without an exception marker is [NotAnException]. *)
    rule_exception_to = Option.value ~default:NotAnException except;
    rule_parameter = param_applied;
    rule_condition = cond;
    rule_name = name;
    rule_id = Shared_ast.RuleName.fresh (dotted_name, Pos.from_lpos $sloc);
    rule_consequence = (consequence : bool Marked.pos);
    rule_state = state;
  }, $sloc
}
(* Parameter of a definition or rule: OF followed by an identifier. *)
let definition_parameters :=
| OF ; param = ident ; { param }
(* Label attached to a rule or definition: LABEL followed by an
   identifier. *)
let label :=
| LABEL ; name = ident ; { name }
(* State annotation: STATE followed by an identifier. *)
let state :=
| STATE ; name = ident ; { name }
(* Exception marker: EXCEPTION alone is an unlabeled exception, and
   EXCEPTION followed by an identifier is an exception to that label. *)
let exception_to :=
| EXCEPTION ; target = option(ident) ; {
  match target with
  | Some lbl -> ExceptionToLabel lbl
  | None -> UnlabeledException
}
(* A definition: optional label and exception marker, DEFINITION, the
   qualified name, an optional parameter, an optional state, an optional
   condition, DEFINED_AS and the defining expression. Returns the definition
   record paired with the raw [$sloc]. *)
let definition :=
| label = option(label);
  except = option(exception_to) ;
  DEFINITION ;
  name = qident ;
  param = option(definition_parameters) ;
  state = option(state) ;
  cond = option(condition_consequence) ;
  DEFINED_AS ;
  e = expression ; {
  (* The fresh identifier is named after the dot-joined components of the
     qualified name. *)
  let dotted_name =
    name |> Marked.unmark |> List.map Marked.unmark |> String.concat "."
  in
  {
    definition_label = label;
    (* A definition without an exception marker is [NotAnException]. *)
    definition_exception_to = Option.value ~default:NotAnException except;
    definition_name = name;
    definition_parameter = param;
    definition_condition = cond;
    definition_id =
      Shared_ast.RuleName.fresh (dotted_name, Pos.from_lpos $sloc);
    definition_expr = e;
    definition_state = state;
  }, $sloc
}
(* Direction of variation used by the "varies with" meta-assertion. *)
let variation_type :=
| INCREASING ; { Increasing, Pos.from_lpos $sloc }
| DECREASING ; { Decreasing, Pos.from_lpos $sloc }
(* Asserted expression. The position carried by the parsed expression is
   dropped and replaced by the position computed here. *)
let assertion_base :=
| marked = expression ; {
  let (content, _) = marked in
  (content, Pos.from_lpos $sloc)
}
(* Body of an assertion: a plain (optionally conditional) assertion, or one
   of the two meta-assertions "fixed by" and "varies with". *)
let assertion :=
| guard = option(condition_consequence) ;
  content = assertion_base ; {
  Assertion {
    assertion_condition = guard;
    assertion_content = content;
  }
}
| FIXED ; target = qident ; BY ; by = ident ; {
  MetaAssertion (FixedBy (target, by))
}
| VARIES ; target = qident ;
  WITH_V ; wrt = base_expression ;
  direction = option(variation_type) ; {
  MetaAssertion (VariesWith (target, wrt, direction))
}
2020-03-08 08:06:32 +03:00
(* One item of a scope use: a rule, a definition or an assertion. The raw
   location returned by [rule] and [definition] is discarded, and every item
   is given the position computed here. *)
let scope_item :=
| rule_and_loc = rule ; {
  let (r, _) = rule_and_loc in
  Rule r, Pos.from_lpos $sloc
}
| def_and_loc = definition ; {
  let (d, _) = def_and_loc in
  Definition d, Pos.from_lpos $sloc
}
| ASSERTION ; a = assertion ; {
  a, Pos.from_lpos $sloc
}
2020-03-08 06:28:45 +03:00
(* A user identifier. An IDENT that [Localisation.lex_builtin] recognises as
   a builtin is rejected through [Errors.raise_spanned_error]. Otherwise the
   identifier is returned with its position. *)
let ident :=
| i = IDENT ; {
  match Localisation.lex_builtin i with
  | Some _ ->
    Errors.raise_spanned_error
      (Pos.from_lpos $sloc)
      "Reserved builtin name"
  | None ->
    (i, Pos.from_lpos $sloc)
}
2020-04-14 12:46:48 +03:00
(* The CONDITION keyword, reduced to its source position only. *)
let condition_pos :=
| CONDITION ; {
  Pos.from_lpos $sloc
}
2020-04-14 12:46:48 +03:00
(* Name and base type of a structure field: either [DATA name CONTENT typ],
   or the CONDITION keyword followed by a name. *)
let struct_scope_base :=
| DATA ; name = ident ;
  CONTENT ; marked_typ = typ ; {
  let (ty, ty_pos) = marked_typ in
  (name, (Data ty, ty_pos))
}
| cond_pos = condition_pos ; name = ident ; {
  (* A condition field takes the position of the CONDITION keyword. *)
  (name, (Condition, cond_pos))
}
2020-04-03 23:58:34 +03:00
(* Optional functional part of a declaration: DEPENDS followed by the
   argument type. *)
let struct_scope_func :=
| DEPENDS ; ~ = typ ; <>
2020-04-03 23:58:34 +03:00
(* A structure field declaration: a name and base type, optionally turned
   into a function type by a trailing [DEPENDS typ]. *)
let struct_scope :=
| name_and_typ = struct_scope_base ;
  func_typ = option(struct_scope_func) ; {
  let (name, typ) = name_and_typ in
  let (typ, typ_pos) = typ in
  {
    struct_decl_field_name = name;
    struct_decl_field_typ =
      (match func_typ with
       | None -> (Base typ, typ_pos)
       | Some (arg_typ, arg_pos) ->
         (* The declared type becomes the return type, and the DEPENDS type
            becomes the argument type. *)
         Func {
           arg_typ = (Data arg_typ, arg_pos);
           return_typ = (typ, typ_pos);
         }, Pos.from_lpos $sloc);
  }, Pos.from_lpos $sloc
}
2020-04-03 23:58:34 +03:00
(* Input part of a scope variable attribute: CONTEXT or INPUT. *)
let scope_decl_item_attribute_input :=
| CONTEXT ; { (Context, Pos.from_lpos $sloc) }
| INPUT ; { (Input, Pos.from_lpos $sloc) }
(* Output part of a scope variable attribute: [true] when OUTPUT is
   present, [false] for the empty production. *)
let scope_decl_item_attribute_output :=
| OUTPUT ; { (true, Pos.from_lpos $sloc) }
| { (false, Pos.from_lpos $sloc) }
(* Full input/output attribute of a scope variable. It is one of:
   - CONTEXT or INPUT, optionally followed by OUTPUT;
   - INTERNAL alone (internal input, not an output);
   - OUTPUT alone (internal input, is an output). *)
let scope_decl_item_attribute :=
| io_in = scope_decl_item_attribute_input ;
  io_out = scope_decl_item_attribute_output ; {
  {
    scope_decl_context_io_input = io_in;
    scope_decl_context_io_output = io_out
  }
}
| INTERNAL ; {
  let pos = Pos.from_lpos $sloc in
  {
    scope_decl_context_io_input = (Internal, pos);
    scope_decl_context_io_output = (false, pos)
  }
}
| OUTPUT ; {
  let pos = Pos.from_lpos $sloc in
  {
    scope_decl_context_io_input = (Internal, pos);
    scope_decl_context_io_output = (true, pos)
  }
}
(* One item of a scope declaration: a data variable, a sub-scope, or a
   condition variable. Data and condition variables may be functions
   ([DEPENDS typ]) and may list states. *)
let scope_decl_item :=
  (* Data variable: [attr name CONTENT typ [DEPENDS typ] states]. *)
| attr = scope_decl_item_attribute ;
  i = ident ;
  CONTENT ; t = typ ;
  func_typ = option(struct_scope_func) ;
  states = list(state) ; {
  (ContextData {
    scope_decl_context_item_name = i;
    scope_decl_context_item_attribute = attr;
    scope_decl_context_item_typ =
      (let (typ, typ_pos) = t in
       match func_typ with
       | None -> (Base (Data typ), typ_pos)
       | Some (arg_typ, arg_pos) ->
         Func {
           arg_typ = (Data arg_typ, arg_pos);
           return_typ = (Data typ, typ_pos);
         }, Pos.from_lpos $sloc);
    scope_decl_context_item_states = states;
  }, Pos.from_lpos $sloc)
}
  (* Sub-scope: always given an internal, non-output attribute. *)
| i = ident ; SCOPE ; c = constructor ; {
  (ContextScope{
    scope_decl_context_scope_name = i;
    scope_decl_context_scope_sub_scope = c;
    scope_decl_context_scope_attribute = {
      scope_decl_context_io_input = (Internal, Pos.from_lpos $sloc);
      scope_decl_context_io_output = (false, Pos.from_lpos $sloc);
    };
  }, Pos.from_lpos $sloc)
}
  (* Condition variable: the [Condition] type takes the position of the
     CONDITION keyword. *)
| attr = scope_decl_item_attribute ;
  i = ident ;
  _condition = CONDITION ;
  func_typ = option(struct_scope_func) ;
  states = list(state) ; {
  ContextData {
    scope_decl_context_item_name = i;
    scope_decl_context_item_attribute = attr;
    scope_decl_context_item_typ =
      (match func_typ with
       | None -> (Base (Condition), Pos.from_lpos $loc(_condition))
       | Some (arg_typ, arg_pos) ->
         Func {
           arg_typ = (Data arg_typ, arg_pos);
           return_typ = (Condition, Pos.from_lpos $loc(_condition));
         }, Pos.from_lpos $sloc);
    scope_decl_context_item_states = states;
  }, Pos.from_lpos $sloc
}
2020-04-03 23:58:34 +03:00
(* Payload type of an enum case: CONTENT followed by a type, wrapped as a
   base data type that keeps the type's position. *)
let enum_decl_line_payload :=
| CONTENT ; marked_typ = typ ; {
  let (ty, ty_pos) = marked_typ in
  (Base (Data ty), ty_pos)
}
2020-04-10 13:55:18 +03:00
(* One case of an enum declaration: ALT, the case constructor and an
   optional payload type. *)
let enum_decl_line :=
| ALT ; c = constructor ;
  t = option(enum_decl_line_payload) ; {
  ({
    enum_decl_case_name = c;
    enum_decl_case_typ = t;
  }, Pos.from_lpos $sloc)
}
2020-04-14 12:46:48 +03:00
(* A CONSTRUCTOR token paired with its source position. *)
let constructor :=
| name = CONSTRUCTOR ; {
  (name, Pos.from_lpos $sloc)
}
2020-04-10 13:55:18 +03:00
(* Optional condition of a scope use: UNDER_CONDITION followed by an
   expression, which is returned as is. *)
let scope_use_condition :=
| UNDER_CONDITION ; ~ = expression ; <>
(* Top-level code items: a scope use, or a structure, scope or enum
   declaration. *)
let code_item :=
  (* Scope use: needs at least one item. *)
| SCOPE ; c = constructor ;
  e = option(scope_use_condition) ;
  COLON ; items = nonempty_list(scope_item) ; {
  (ScopeUse {
    scope_use_name = c;
    scope_use_condition = e;
    scope_use_items = items;
  }, Pos.from_lpos $sloc)
}
  (* Structure declaration: the field list may be empty. *)
| DECLARATION ; STRUCT ; c = constructor ;
  COLON ; scopes = list(struct_scope) ; {
  (StructDecl {
    struct_decl_name = c;
    struct_decl_fields = scopes;
  }, Pos.from_lpos $sloc)
}
  (* Scope declaration: needs at least one item. *)
| DECLARATION ; SCOPE ; c = constructor ;
  COLON ; context = nonempty_list(scope_decl_item) ; {
  (ScopeDecl {
    scope_decl_name = c;
    scope_decl_context = context;
  }, Pos.from_lpos $sloc)
}
  (* Enum declaration: the case list may be empty. *)
| DECLARATION ; ENUM ; c = constructor ;
  COLON ; cases = list(enum_decl_line) ; {
  (EnumDecl {
    enum_decl_name = c;
    enum_decl_cases = cases;
  }, Pos.from_lpos $sloc)
}
(* A possibly empty sequence of code items, paired with its position. *)
let code :=
| items = list(code_item) ; {
  (items, Pos.from_lpos $sloc)
}
(* A metadata block: BEGIN_METADATA, optional law text (parsed and
   discarded), code, then END_CODE. Returns the code items together with the
   END_CODE payload paired with the block's position. *)
let metadata_block :=
| BEGIN_METADATA ; option(law_text) ;
  code_and_pos = code ;
  text = END_CODE ; {
  let (code, _) = code_and_pos in
  (code, (text, Pos.from_lpos $sloc))
}
(* A law heading: the four components carried by the LAW_HEADING token are
   unpacked into a heading record. Only the title is paired with a
   position. *)
let law_heading :=
| title = LAW_HEADING ; {
  let (title, id, is_archive, precedence) = title in {
    law_heading_name = (title, Pos.from_lpos $sloc);
    law_heading_id = id;
    law_heading_is_archive = is_archive;
    law_heading_precedence = precedence;
  }
}
(* A run of one or more LAW_TEXT tokens, concatenated without separator and
   then trimmed. *)
let law_text :=
| chunks = nonempty_list(LAW_TEXT) ; {
  chunks |> String.concat "" |> String.trim
}
(* One item of a source file: law text, a code block, a law heading, a
   metadata block or an include directive. *)
let source_file_item :=
| text = law_text ; { LawText text }
  (* Regular code block: the last component of [CodeBlock] is [false]. *)
| BEGIN_CODE ;
  code_and_pos = code ;
  text = END_CODE ; {
  let (code, _) = code_and_pos in
  CodeBlock (code, (text, Pos.from_lpos $sloc), false)
}
| heading = law_heading ; {
  LawHeading (heading, [])
}
  (* Metadata block: the last component of [CodeBlock] is [true]. *)
| code = metadata_block ; {
  let (code, source_repr) = code in
  CodeBlock (code, source_repr, true)
}
  (* Include directive. The arguments are concatenated and trimmed into a
     file name, which is then classified:
     - contains "JORFTEXT" followed by 12 digits, with no page: legislative
       text;
     - has a ".pdf" extension, or a page is given: PDF file;
     - anything else: Catala file. *)
| BEGIN_DIRECTIVE ; LAW_INCLUDE ; COLON ;
  args = nonempty_list(DIRECTIVE_ARG) ;
  page = option(AT_PAGE) ;
  END_DIRECTIVE ; {
  let filename = String.trim (String.concat "" args) in
  let pos = Pos.from_lpos $sloc in
  (* The pattern used to read "JORFTEXT\\d; {12}" (a digit, a semicolon and
     twelve spaces), which no JORFTEXT identifier matches. *)
  let jorftext = Re.Pcre.regexp "JORFTEXT\\d{12}" in
  if Re.Pcre.pmatch ~rex:jorftext filename && Option.is_none page then
    LawInclude (Ast.LegislativeText (filename, pos))
  else if Filename.extension filename = ".pdf" || Option.is_some page then
    LawInclude (Ast.PdfFile ((filename, pos), page))
  else
    LawInclude (Ast.CatalaFile (filename, pos))
}
(* Entry point: a sequence of source file items terminated by EOF, returned
   as a list in source order. *)
let source_file :=
| item = source_file_item ; rest = source_file ; {
  item :: rest
}
| EOF ; { [] }