use std::{fmt, hash::Hash};
use combine::combinator::{choice, many, many1, optional, position};
use combine::easy::Error;
use combine::error::StreamError;
use combine::{parser, ParseResult, Parser};
use indexmap::IndexMap;
use crate::helpers::{ident, kind, name, punct};
use crate::position::Pos;
use crate::tokenizer::{Kind as T, Token, TokenStream};
/// Selects the string representation used for names inside the parsed AST.
///
/// Implementors pick a concrete [`Text::Value`] type; this file provides
/// implementations for `&str`, `String` and `Cow<str>`.
pub trait Text<'a>: 'a {
    /// String-like type stored in AST nodes.
    ///
    /// It must be constructible from a `&'a str` slice, viewable as `str`,
    /// and usable as a comparable, hashable, cloneable map key.
    type Value: 'a
        + Clone
        + fmt::Debug
        + Hash
        + Eq
        + PartialEq
        + Ord
        + PartialOrd
        + AsRef<str>
        + std::borrow::Borrow<str>
        + From<&'a str>;
}
/// Borrowed text: AST values are slices of the original input.
impl<'a> Text<'a> for &'a str {
    type Value = &'a str;
}
/// Owned text: AST values are freshly allocated `String`s.
impl<'a> Text<'a> for String {
    type Value = Self;
}
/// Copy-on-write text: AST values are `Cow<'a, str>`.
impl<'a> Text<'a> for std::borrow::Cow<'a, str> {
    type Value = std::borrow::Cow<'a, str>;
}
/// A directive annotation: `@name` optionally followed by a parenthesized argument list.
#[derive(Debug, Clone, PartialEq)]
pub struct Directive<'a, T: Text<'a>> {
/// Source position captured by the `directives` parser just before the `@` punctuator.
pub position: Pos,
/// Directive name (the name token following `@`).
pub name: T::Value,
/// Arguments as `(name, value)` pairs in the order they were parsed;
/// empty when the directive has no argument list.
pub arguments: Vec<(T::Value, Value<'a, T>)>,
}
/// Integer payload of `Value::Int`, wrapping an `i64`.
///
/// The inner field is crate-private; use `as_i64` to read it and `From<i32>` to build one.
#[derive(Debug, Clone, PartialEq)]
pub struct Number(pub(crate) i64);
/// An input value as produced by the `value` / `default_value` parsers in this file.
#[derive(Debug, Clone, PartialEq)]
pub enum Value<'a, T: Text<'a>> {
/// Variable reference written as `$name`; holds the name that follows the `$`.
Variable(T::Value),
/// Integer literal, parsed from an `IntValue` token.
Int(Number),
/// Floating point literal, parsed from a `FloatValue` token into an `f64`.
Float(f64),
/// Decoded contents of a quoted string or block string token.
String(String),
/// The keywords `true` / `false`.
Boolean(bool),
/// The keyword `null`.
Null,
/// Any other bare name (tried after `true`, `false` and `null`).
Enum(T::Value),
/// Values enclosed in `[` ... `]`.
List(Vec<Value<'a, T>>),
/// `name: value` entries enclosed in `{` ... `}`, collected into an `IndexMap`.
Object(IndexMap<T::Value, Value<'a, T>>),
}
/// A type reference as produced by `parse_type`.
#[derive(Debug, Clone, PartialEq)]
pub enum Type<'a, T: Text<'a>> {
/// A plain type name.
NamedType(T::Value),
/// A type wrapped in `[` ... `]`.
ListType(Box<Type<'a, T>>),
/// A named or list type followed by `!`.
NonNullType(Box<Type<'a, T>>),
}
impl Number {
pub fn as_i64(&self) -> Option<i64> {
Some(self.0)
}
}
/// Lossless widening conversion from `i32`.
impl From<i32> for Number {
    fn from(i: i32) -> Self {
        Number(i64::from(i))
    }
}
/// Parses zero or more directives of the form `@name` followed by optional arguments.
///
/// Each resulting [`Directive`] stores the stream position observed right
/// before its `@` punctuator.
pub fn directives<'a, T>(
    input: &mut TokenStream<'a>,
) -> ParseResult<Vec<Directive<'a, T>>, TokenStream<'a>>
where
    T: Text<'a>,
{
    // One directive: position, `@`, name, then the (possibly empty) argument list.
    let single_directive = position()
        .skip(punct("@"))
        .and(name::<'a, T>())
        .and(parser(arguments))
        .map(|((at, directive_name), args)| Directive {
            position: at,
            name: directive_name,
            arguments: args,
        });
    many(single_directive).parse_stream(input)
}
/// Parses an optional argument list: `(` one or more `name: value` pairs `)`.
///
/// Returns an empty vector when no opening parenthesis is present.
pub fn arguments<'a, T>(
    input: &mut TokenStream<'a>,
) -> ParseResult<Vec<(T::Value, Value<'a, T>)>, TokenStream<'a>>
where
    T: Text<'a>,
{
    let pair = name::<'a, T>().skip(punct(":")).and(parser(value));
    let parenthesized = punct("(").with(many1(pair)).skip(punct(")"));
    optional(parenthesized)
        .map(|found| match found {
            Some(pairs) => pairs,
            None => Vec::new(),
        })
        .parse_stream(input)
}
pub fn int_value<'a, S>(input: &mut TokenStream<'a>) -> ParseResult<Value<'a, S>, TokenStream<'a>>
where
S: Text<'a>,
{
kind(T::IntValue)
.and_then(|tok| tok.value.parse())
.map(Number)
.map(Value::Int)
.parse_stream(input)
}
/// Parses a `FloatValue` token into `Value::Float`.
///
/// The token text is converted with `str::parse::<f64>`; a conversion failure
/// is reported as a parse error.
pub fn float_value<'a, S>(input: &mut TokenStream<'a>) -> ParseResult<Value<'a, S>, TokenStream<'a>>
where
    S: Text<'a>,
{
    let float = kind(T::FloatValue).and_then(|token| token.value.parse::<f64>());
    float
        .map(|x| Value::Float(x))
        .parse_stream(input)
}
/// Converts the raw text of a block string token (including its `"""` delimiters)
/// into the string it denotes.
///
/// Processing steps:
/// * The common indentation is the smallest leading-whitespace width (in bytes)
///   among the lines after the first that contain non-whitespace characters.
///   It is cut from every line after the first; a line that is not longer than
///   the indentation becomes empty.
/// * The first line is trimmed on both sides and dropped entirely when blank.
/// * Every emitted line is terminated by `\n`; a final whitespace-only line is dropped.
/// * The escape sequence `\"""` is replaced by `"""` on every line, including the first.
///
/// `src` must start and end with `"""` (asserted in debug builds only); input
/// shorter than the two delimiters panics when they are sliced off.
///
/// This function currently always returns `Ok`.
fn unquote_block_string<'a>(src: &'a str) -> Result<String, Error<Token<'a>, Token<'a>>> {
    const ESCAPED_TRIPLE_QUOTE: &str = r#"\""""#;
    const TRIPLE_QUOTE: &str = r#"""""#;

    debug_assert!(src.starts_with("\"\"\"") && src.ends_with("\"\"\""));
    let body = &src[3..src.len() - 3];

    let indent = body
        .lines()
        .skip(1)
        .filter_map(|line| {
            let content_len = line.trim_start().len();
            if content_len > 0 {
                Some(line.len() - content_len)
            } else {
                None
            }
        })
        .min()
        .unwrap_or(0);

    let mut result = String::with_capacity(body.len());
    let mut lines = body.lines();
    if let Some(first) = lines.next() {
        let stripped = first.trim();
        if !stripped.is_empty() {
            // The first line can contain an escaped delimiter too (e.g. a
            // single-line block string), so it must be unescaped as well.
            result.push_str(&stripped.replace(ESCAPED_TRIPLE_QUOTE, TRIPLE_QUOTE));
            result.push('\n');
        }
    }

    // Byte offset in `result` where the most recently emitted line starts.
    let mut last_line = 0;
    for line in lines {
        last_line = result.len();
        if line.len() > indent {
            // `indent` is a byte count taken from another line. If this line's
            // leading whitespace contains multi-byte characters the offset may
            // fall inside one of them; back up to the previous character
            // boundary instead of panicking on the slice.
            let mut cut = indent;
            while !line.is_char_boundary(cut) {
                cut -= 1;
            }
            result.push_str(&line[cut..].replace(ESCAPED_TRIPLE_QUOTE, TRIPLE_QUOTE));
        }
        result.push('\n');
    }
    if result[last_line..].trim().is_empty() {
        result.truncate(last_line);
    }
    Ok(result)
}
fn unquote_string<'a>(s: &'a str) -> Result<String, Error<Token, Token>> {
let mut res = String::with_capacity(s.len());
debug_assert!(s.starts_with('"') && s.ends_with('"'));
let mut chars = s[1..s.len() - 1].chars();
let mut temp_code_point = String::with_capacity(4);
while let Some(c) = chars.next() {
match c {
'\\' => {
match chars.next().expect("slash cant be at the end") {
c @ '"' | c @ '\\' | c @ '/' => res.push(c),
'b' => res.push('\u{0010}'),
'f' => res.push('\u{000C}'),
'n' => res.push('\n'),
'r' => res.push('\r'),
't' => res.push('\t'),
'u' => {
temp_code_point.clear();
for _ in 0..4 {
match chars.next() {
Some(inner_c) => temp_code_point.push(inner_c),
None => {
return Err(Error::unexpected_message(format_args!(
"\\u must have 4 characters after it, only found '{}'",
temp_code_point
)))
}
}
}
match u32::from_str_radix(&temp_code_point, 16).map(std::char::from_u32) {
Ok(Some(unicode_char)) => res.push(unicode_char),
_ => {
return Err(Error::unexpected_message(format_args!(
"{} is not a valid unicode code point",
temp_code_point
)))
}
}
}
c => {
return Err(Error::unexpected_message(format_args!(
"bad escaped char {:?}",
c
)));
}
}
}
c => res.push(c),
}
}
Ok(res)
}
/// Parses either a quoted string token or a block string token and returns
/// its decoded contents.
pub fn string<'a>(input: &mut TokenStream<'a>) -> ParseResult<String, TokenStream<'a>> {
    let quoted = kind(T::StringValue).and_then(|token| unquote_string(token.value));
    let block = kind(T::BlockString).and_then(|token| unquote_block_string(token.value));
    choice((quoted, block)).parse_stream(input)
}
/// Parses a quoted `StringValue` token into `Value::String` holding the decoded text.
pub fn string_value<'a, S>(
    input: &mut TokenStream<'a>,
) -> ParseResult<Value<'a, S>, TokenStream<'a>>
where
    S: Text<'a>,
{
    let decoded = kind(T::StringValue).and_then(|token| unquote_string(token.value));
    decoded
        .map(|text| Value::String(text))
        .parse_stream(input)
}
/// Parses a `BlockString` token into `Value::String` holding the decoded text.
pub fn block_string_value<'a, S>(
    input: &mut TokenStream<'a>,
) -> ParseResult<Value<'a, S>, TokenStream<'a>>
where
    S: Text<'a>,
{
    let decoded = kind(T::BlockString).and_then(|token| unquote_block_string(token.value));
    decoded
        .map(|text| Value::String(text))
        .parse_stream(input)
}
/// Parses a non-composite value.
///
/// Alternatives are tried in this order: `true`, `false`, `null`, any other
/// name (as an enum value), integer, float, quoted string, block string.
pub fn plain_value<'a, T>(input: &mut TokenStream<'a>) -> ParseResult<Value<'a, T>, TokenStream<'a>>
where
    T: Text<'a>,
{
    // Keywords must come before the generic name parser so that they are not
    // reported as enum values.
    let keyword_or_enum = ident("true")
        .map(|_| Value::Boolean(true))
        .or(ident("false").map(|_| Value::Boolean(false)))
        .or(ident("null").map(|_| Value::Null))
        .or(name::<'a, T>().map(Value::Enum));
    keyword_or_enum
        .or(parser(int_value))
        .or(parser(float_value))
        .or(parser(string_value))
        .or(parser(block_string_value))
        .parse_stream(input)
}
/// Parses any value: a plain value, a `$variable`, a `[...]` list or a
/// `{name: value ...}` object. Nested values may themselves contain variables.
pub fn value<'a, T>(input: &mut TokenStream<'a>) -> ParseResult<Value<'a, T>, TokenStream<'a>>
where
    T: Text<'a>,
{
    let variable = punct("$").with(name::<'a, T>()).map(Value::Variable);
    let list = punct("[")
        .with(many(parser(value)))
        .skip(punct("]"))
        .map(Value::List);
    let entry = name::<'a, T>().skip(punct(":")).and(parser(value));
    let object = punct("{")
        .with(many(entry))
        .skip(punct("}"))
        .map(Value::Object);
    parser(plain_value)
        .or(variable)
        .or(list)
        .or(object)
        .parse_stream(input)
}
/// Parses a value in a position where variables are not accepted: a plain
/// value, a `[...]` list or a `{name: value ...}` object, recursively.
pub fn default_value<'a, T>(
    input: &mut TokenStream<'a>,
) -> ParseResult<Value<'a, T>, TokenStream<'a>>
where
    T: Text<'a>,
{
    let list = punct("[")
        .with(many(parser(default_value)))
        .skip(punct("]"))
        .map(Value::List);
    let entry = name::<'a, T>().skip(punct(":")).and(parser(default_value));
    let object = punct("{")
        .with(many(entry))
        .skip(punct("}"))
        .map(Value::Object);
    parser(plain_value)
        .or(list)
        .or(object)
        .parse_stream(input)
}
/// Parses a type reference: a name or a `[`type`]` list, optionally followed
/// by `!`, which wraps the result in `Type::NonNullType`.
pub fn parse_type<'a, T>(input: &mut TokenStream<'a>) -> ParseResult<Type<'a, T>, TokenStream<'a>>
where
    T: Text<'a>,
{
    let named = name::<'a, T>().map(Type::NamedType);
    let list = punct("[")
        .with(parser(parse_type))
        .skip(punct("]"))
        .map(|inner| Type::ListType(Box::new(inner)));
    let non_null_marker = optional(punct("!")).map(|bang| bang.is_some());
    named
        .or(list)
        .and(non_null_marker)
        .map(|(base, non_null)| {
            if !non_null {
                return base;
            }
            Type::NonNullType(Box::new(base))
        })
        .parse_stream(input)
}
#[cfg(test)]
mod tests {
    use super::unquote_string;
    use super::Number;

    /// `Number::from(i32)` followed by `as_i64` must round-trip, including at
    /// the `i32` extremes.
    #[test]
    fn number_from_i32_and_to_i64_conversion() {
        let inputs = [1, 584, i32::min_value(), i32::max_value()];
        for &input in inputs.iter() {
            assert_eq!(Number::from(input).as_i64(), Some(input as i64));
        }
    }

    /// `\uXXXX` escapes decode to the corresponding characters, alone and
    /// embedded in surrounding text.
    #[test]
    fn unquote_unicode_string() {
        let cases = [
            (r#""\u0009""#, "\u{0009}"),
            (r#""\u000A""#, "\u{000A}"),
            (r#""\u000D""#, "\u{000D}"),
            (r#""\u0020""#, "\u{0020}"),
            (r#""\uFFFF""#, "\u{FFFF}"),
            (
                r#""\u0009 hello \u000A there""#,
                "\u{0009} hello \u{000A} there",
            ),
        ];
        for &(quoted, expected) in cases.iter() {
            assert_eq!(unquote_string(quoted).expect(""), expected);
        }
    }
}