2017-01-06 15:15:57 +00:00
|
|
|
/* vim: set filetype=rust.rustpeg */
|
|
|
|
|
|
|
|
// Copyright 2016 Mozilla
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use
|
|
|
|
// this file except in compliance with the License. You may obtain a copy of the
|
|
|
|
// License at http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
// Unless required by applicable law or agreed to in writing, software distributed
|
|
|
|
// under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
|
|
|
|
// CONDITIONS OF ANY KIND, either express or implied. See the License for the
|
|
|
|
// specific language governing permissions and limitations under the License.
|
|
|
|
|
|
|
|
use std::collections::{BTreeSet, BTreeMap, LinkedList};
|
|
|
|
use std::iter::FromIterator;
|
2017-02-03 18:14:23 +00:00
|
|
|
use std::f64::{NAN, INFINITY, NEG_INFINITY};
|
2017-01-11 21:51:34 +00:00
|
|
|
|
2017-01-06 15:15:57 +00:00
|
|
|
use num::BigInt;
|
|
|
|
use ordered_float::OrderedFloat;
|
2017-01-11 21:51:34 +00:00
|
|
|
use types;
|
|
|
|
use types::Value;
|
2017-01-06 15:15:57 +00:00
|
|
|
|
|
|
|
// Goal: Be able to parse https://github.com/edn-format/edn
|
|
|
|
// Also extensible to help parse http://docs.datomic.com/query.html
|
|
|
|
|
|
|
|
// Debugging hint: test using `cargo test --features peg/trace -- --nocapture`
|
|
|
|
// to trace where the parser is failing
|
|
|
|
|
|
|
|
// TODO: Support tagged elements
|
|
|
|
// TODO: Support discard
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses the EDN literal `nil` into `Value::Nil`.
//
// The negative lookahead rejects the match when another symbol character
// follows, so that a longer symbol such as `nilly` is left for `symbol`
// instead of being split into `nil` plus trailing input.
pub nil -> Value =
    "nil" !symbol_char_subsequent { Value::Nil }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-03 18:14:23 +00:00
|
|
|
// Parses the tagged float `#f NaN`: the `#f` tag, one or more whitespace
// characters, then the literal `NaN`.
pub nan -> Value =
    "#f" whitespace+ "NaN" {
        let not_a_number = OrderedFloat(NAN);
        Value::Float(not_a_number)
    }
|
2017-02-03 18:14:23 +00:00
|
|
|
|
|
|
|
// Parses the tagged floats `#f +Infinity` and `#f -Infinity`.
// The sign is mandatory; `+` yields positive infinity and anything else
// accepted by `sign` yields negative infinity.
pub infinity -> Value =
    "#f" whitespace+ polarity:$(sign) "Infinity" {
        let magnitude = match polarity {
            "+" => INFINITY,
            _ => NEG_INFINITY,
        };
        Value::Float(OrderedFloat(magnitude))
    }
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses the EDN literals `true` and `false` into `Value::Boolean`.
//
// Each alternative carries a negative lookahead so that the literal is not
// matched as the prefix of a longer symbol (for example `trueish` or
// `falsey`); such input is left for `symbol` to consume whole.
pub boolean -> Value =
    "true" !symbol_char_subsequent { Value::Boolean(true) } /
    "false" !symbol_char_subsequent { Value::Boolean(false) }
|
|
|
|
|
|
|
|
// A single ASCII decimal digit.
digit = [0-9]
|
2017-02-11 00:03:35 +00:00
|
|
|
// A single ASCII digit or letter; used for the digits of `basedinteger`.
alphanumeric = [0-9a-zA-Z]
|
|
|
|
// A single octal digit.
octaldigit = [0-7]
|
|
|
|
// A decimal radix in the range 2-36. The two-digit alternatives (30-36, then
// 10-29) are tried before the single-digit one (2-9) so that the longest
// spelling wins under PEG ordered choice.
validbase = [3][0-6] / [12][0-9] / [2-9]
|
|
|
|
// A single hexadecimal digit, either case.
hex = [0-9a-fA-F]
|
2017-01-06 15:15:57 +00:00
|
|
|
// An explicit numeric sign.
sign = "-" / "+"
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses an arbitrary-precision integer: an optionally signed run of decimal
// digits followed by the suffix `N`. The suffix is not part of the captured
// text handed to the BigInt parser.
// NOTE(review): the unwrap assumes BigInt's parser accepts every string
// matched by `sign? digit+`, including a leading `+` - confirm.
pub bigint -> Value =
    digits:$( sign? digit+ ) "N" {
        let parsed = digits.parse::<BigInt>().unwrap();
        Value::BigInteger(parsed)
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-11 00:03:35 +00:00
|
|
|
// Parses an octal integer: a leading `0` followed by one or more octal digits.
//
// A conditional action is used so that a literal too large for an i64 makes
// this rule fail to match instead of panicking inside the parser. When the
// rule fails, the enclosing alternation in `value` moves on to its later
// alternatives.
pub octalinteger -> Value =
    "0" i:$( octaldigit+ ) {?
        i64::from_str_radix(i, 8)
            .map(Value::Integer)
            .map_err(|_| "octal integer that fits in 64 bits")
    }
|
|
|
|
|
|
|
|
// Parses a hexadecimal integer: the prefix `0x` followed by one or more hex
// digits. No sign is accepted by this rule.
//
// A conditional action is used so that a literal too large for an i64 makes
// this rule fail to match instead of panicking inside the parser.
pub hexinteger -> Value =
    "0x" i:$( hex+ ) {?
        i64::from_str_radix(i, 16)
            .map(Value::Integer)
            .map_err(|_| "hexadecimal integer that fits in 64 bits")
    }
|
|
|
|
|
|
|
|
// Parses an integer written in an explicit radix, e.g. `2r1010` or `36rZZ`:
// a decimal radix, the letter `r`, then one or more alphanumeric digits.
//
// `alphanumeric+` accepts digits that are not valid for the chosen radix
// (such as `2r9`), and the value may not fit in an i64. Both cases used to
// panic; the conditional action turns them into an ordinary match failure.
pub basedinteger -> Value =
    // Only allow values 2-36
    b:$( validbase ) "r" i:$( alphanumeric+ ) {?
        // validbase only matches the decimal numbers 2 through 36, so parsing
        // the radix itself cannot fail.
        let radix = b.parse::<u32>().unwrap();
        i64::from_str_radix(i, radix)
            .map(Value::Integer)
            .map_err(|_| "digits valid for the given base that fit in 64 bits")
    }
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a decimal integer: an optional sign followed by one or more digits.
//
// The digit run is unbounded, so the text may not fit in an i64. A
// conditional action reports that as a match failure instead of panicking
// on untrusted input. When the rule fails, the enclosing alternation in
// `value` moves on to its later alternatives.
pub integer -> Value =
    i:$( sign? digit+ ) {?
        i.parse::<i64>()
            .map(Value::Integer)
            .map_err(|_| "integer that fits in 64 bits")
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
|
|
|
// The three textual shapes a float may take. None of them returns a value;
// `float` captures the matched text and converts it.
//
//   frac      optional sign, digits, `.`, digits            e.g. -1.5
//   exp       optional sign, digits, exponent               e.g. 1e10
//   frac_exp  a `frac` immediately followed by an exponent  e.g. 1.5E-3
//
// An exponent is `e` or `E`, an optional sign, and one or more digits.
frac = sign? digit+ "." digit+
exp = sign? digit+ ("e" / "E") sign? digit+
frac_exp = frac ("e" / "E") sign? digit+
|
|
|
|
|
|
|
|
// The order here is important - frac_exp must come before (exp / frac) or the
|
|
|
|
// parser assumes exp or frac when the float is really a frac_exp and fails
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a floating-point literal and wraps it in an OrderedFloat.
// The alternatives are tried longest shape first: fraction-with-exponent,
// then exponent-only, then fraction-only.
pub float -> Value =
    literal:$( frac_exp / exp / frac ) {
        let number = literal.parse::<f64>().unwrap();
        Value::Float(OrderedFloat(number))
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
|
|
|
// TODO: \newline, \return, \space and \tab
|
|
|
|
// An escape sequence recognised inside a string: an escaped quote or `\tab`.
special_char = quote / tab
|
|
|
|
// The two-character sequence backslash + double quote.
quote = "\\\""
|
|
|
|
// The four-character sequence backslash + `tab`.
tab = "\\tab"
|
|
|
|
// One unit of string content: either an escape sequence or any single
// character other than a double quote.
//
// The escape alternative must be tried first. PEG choice is ordered, so if
// the negated class came first it would consume the backslash on its own,
// leaving the following quote to terminate the string, and an escaped quote
// could never appear inside text.
char = special_char / [^"]
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a double-quoted string. The text between the quotes is stored
// exactly as written; escape sequences are recognised by `char` but are not
// decoded here.
pub text -> Value =
    "\"" body:$( char* ) "\"" {
        Value::Text(String::from(body))
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-01-11 21:51:34 +00:00
|
|
|
// Separates the segments of a namespace, as in `foo.bar`.
namespace_divider = "."
|
|
|
|
// Separates a namespace from the name that follows it, as in `foo/bar`.
namespace_separator = "/"
|
|
|
|
|
2017-01-06 15:15:57 +00:00
|
|
|
// TODO: Be more picky here
|
2017-02-02 10:52:34 +00:00
|
|
|
// Keywords follow the rules of symbols, except they can (and must) begin with :
|
|
|
|
// e.g. :fred or :my/fred. See https://github.com/edn-format/edn#keywords
|
2017-01-11 21:51:34 +00:00
|
|
|
// Characters accepted at the start of a symbol or namespace: ASCII letters,
// digits, and the punctuation listed in the final class. `-` is not included.
symbol_char_initial = [a-z] / [A-Z] / [0-9] / [*!_?$%&=<>]
|
|
|
|
// Characters accepted after the first one: everything in
// `symbol_char_initial` plus `-`.
symbol_char_subsequent = [a-z] / [A-Z] / [0-9] / [-*!_?$%&=<>]
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:52:34 +00:00
|
|
|
// A namespace: one initial character, any number of subsequent characters,
// then zero or more further segments, each introduced by `.` and containing
// at least one subsequent character (so a trailing or doubled `.` is not
// matched).
symbol_namespace = symbol_char_initial symbol_char_subsequent* (namespace_divider symbol_char_subsequent+)*
|
2017-01-11 21:51:34 +00:00
|
|
|
// The name part of a symbol or keyword: an initial symbol character or `.`,
// followed by any number of subsequent symbol characters or `.`.
//
// The repetition wraps the whole choice. Written as
// `( symbol_char_subsequent* / "." )`, the `.` alternative is unreachable
// because the starred branch always succeeds, so a dotted name such as
// `foo.bar` would stop matching at the first `.`.
symbol_name = ( symbol_char_initial / "." ) ( symbol_char_subsequent / "." )*
|
|
|
|
|
|
|
|
// The leading colon that distinguishes a keyword from a symbol.
keyword_prefix = ":"
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a symbol, optionally qualified as `namespace/name`.
// The namespace group matches only when it is followed by `/`; otherwise it
// yields None and the whole input is matched by `symbol_name`. Both parts
// are handed to `types::to_symbol` as captured text.
pub symbol -> Value =
    namespace:( prefix:$(symbol_namespace) namespace_separator { prefix } )?
    name:$(symbol_name) {
        types::to_symbol(namespace, name)
    }
|
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a keyword: a `:` followed by the same optional `namespace/` and
// name structure that `symbol` accepts. The colon is not part of either
// captured piece passed to `types::to_keyword`.
pub keyword -> Value =
    keyword_prefix
    namespace:( prefix:$(symbol_namespace) namespace_separator { prefix } )?
    name:$(symbol_name) {
        types::to_keyword(namespace, name)
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a parenthesised list of zero or more values into a LinkedList,
// preserving the order in which the elements were written.
pub list -> Value =
    "(" __ elements:(value)* __ ")" {
        Value::List(elements.into_iter().collect())
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a square-bracketed vector of zero or more values. The parsed
// elements are stored directly, in source order.
pub vector -> Value =
    "[" __ elements:(value)* __ "]" {
        Value::Vector(elements)
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a `#{ ... }` set of zero or more values into a BTreeSet, so
// duplicate elements collapse and iteration order follows Value's ordering.
pub set -> Value =
    "#{" __ members:(value)* __ "}" {
        Value::Set(members.into_iter().collect())
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// One map entry: two consecutive values, returned as a (key, value) tuple.
pair -> (Value, Value) =
    key:(value) val:(value) {
        (key, val)
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses a brace-delimited map of zero or more key/value pairs into a
// BTreeMap. Entries are inserted in source order, so a later entry replaces
// an earlier one that has an equal key.
pub map -> Value =
    "{" __ entries:(pair)* __ "}" {
        Value::Map(entries.into_iter().collect())
    }
|
2017-01-06 15:15:57 +00:00
|
|
|
|
|
|
|
// It's important that float comes before integer or the parser assumes that
|
|
|
|
// floats are integers and fails to parse
|
2017-02-02 10:36:53 +00:00
|
|
|
// Parses any single EDN value, skipping whitespace and comments on both
// sides. The alternatives are tried strictly in the order written, grouped
// here as: constants, numbers, text and identifiers, then collections.
pub value -> Value =
    __ parsed:(
        nil / nan / infinity / boolean /
        float / octalinteger / hexinteger / basedinteger / bigint / integer /
        text / keyword / symbol /
        list / vector / map / set
    ) __ {
        parsed
    }
|
2017-01-17 19:26:45 +00:00
|
|
|
|
|
|
|
// Clojure (and thus EDN) regards commas as whitespace, and thus the two-element vectors [1 2] and
|
|
|
|
// [1,,,,2] are equivalent, as are the maps {:a 1, :b 2} and {:a 1 :b 2}.
|
|
|
|
// A single whitespace character: space, carriage return, newline, tab, or comma.
whitespace = (" " / "\r" / "\n" / "\t" / ",")
|
2017-01-17 19:25:31 +00:00
|
|
|
// A line comment: `;` followed by everything up to the end of the line,
// plus at most one terminating `\r` or `\n` character. The terminator is
// optional so that a comment on the last line of input still matches.
comment = ";" [^\r\n]* ("\r" / "\n")?
|
2017-01-06 15:15:57 +00:00
|
|
|
|
2017-01-17 19:25:31 +00:00
|
|
|
// Skippable filler between tokens: any run (possibly empty) of whitespace
// characters and comments.
__ = (whitespace / comment)*
|