aboutsummaryrefslogtreecommitdiffstats
path: root/askama_shared/src/parser.rs
diff options
context:
space:
mode:
Diffstat (limited to 'askama_shared/src/parser.rs')
-rw-r--r--askama_shared/src/parser.rs471
1 files changed, 471 insertions, 0 deletions
diff --git a/askama_shared/src/parser.rs b/askama_shared/src/parser.rs
new file mode 100644
index 0000000..8732f0e
--- /dev/null
+++ b/askama_shared/src/parser.rs
@@ -0,0 +1,471 @@
+use nom::{self, IResult};
+use std::str;
+
+#[derive(Debug)]
+pub enum Expr<'a> {
+ NumLit(&'a str),
+ StrLit(&'a str),
+ Var(&'a str),
+ Attr(Box<Expr<'a>>, &'a str),
+ Filter(&'a str, Vec<Expr<'a>>),
+ BinOp(&'a str, Box<Expr<'a>>, Box<Expr<'a>>),
+ Group(Box<Expr<'a>>),
+ MethodCall(Box<Expr<'a>>, &'a str, Vec<Expr<'a>>),
+}
+
+#[derive(Debug)]
+pub enum Target<'a> {
+ Name(&'a str),
+}
+
+#[derive(Clone, Copy, Debug)]
+pub struct WS(pub bool, pub bool);
+
+#[derive(Debug)]
+pub enum Node<'a> {
+ Lit(&'a str, &'a str, &'a str),
+ Comment(),
+ Expr(WS, Expr<'a>),
+ Call(WS, &'a str, Vec<Expr<'a>>),
+ LetDecl(WS, Target<'a>),
+ Let(WS, Target<'a>, Expr<'a>),
+ Cond(Vec<(WS, Option<Expr<'a>>, Vec<Node<'a>>)>, WS),
+ Loop(WS, Target<'a>, Expr<'a>, Vec<Node<'a>>, WS),
+ Extends(Expr<'a>),
+ BlockDef(WS, &'a str, Vec<Node<'a>>, WS),
+ Block(WS, &'a str, WS),
+ Include(WS, &'a str),
+ Macro(WS, &'a str, Vec<&'a str>, Vec<Node<'a>>, WS),
+}
+
+pub type Cond<'a> = (WS, Option<Expr<'a>>, Vec<Node<'a>>);
+
+fn split_ws_parts(s: &[u8]) -> Node {
+ if s.is_empty() {
+ let rs = str::from_utf8(s).unwrap();
+ return Node::Lit(rs, rs, rs);
+ }
+ let is_ws = |c: &u8| {
+ *c != b' ' && *c != b'\t' && *c != b'\r' && *c != b'\n'
+ };
+ let start = s.iter().position(&is_ws);
+ let res = if start.is_none() {
+ (s, &s[0..0], &s[0..0])
+ } else {
+ let start = start.unwrap();
+ let end = s.iter().rposition(&is_ws);
+ if end.is_none() {
+ (&s[..start], &s[start..], &s[0..0])
+ } else {
+ let end = end.unwrap();
+ (&s[..start], &s[start..end + 1], &s[end + 1..])
+ }
+ };
+ Node::Lit(str::from_utf8(res.0).unwrap(),
+ str::from_utf8(res.1).unwrap(),
+ str::from_utf8(res.2).unwrap())
+}
+
+enum ContentState {
+ Any,
+ Brace(usize),
+ End(usize),
+}
+
+fn take_content(i: &[u8]) -> IResult<&[u8], Node> {
+ use parser::ContentState::*;
+ let mut state = Any;
+ for (idx, c) in i.iter().enumerate() {
+ state = match (state, *c) {
+ (Any, b'{') => Brace(idx),
+ (Any, _) => Any,
+ (Brace(start), b'{') |
+ (Brace(start), b'%') |
+ (Brace(start), b'#') => End(start),
+ (Brace(_), _) => Any,
+ (End(_), _) => panic!("cannot happen"),
+ };
+ if let End(_) = state {
+ break;
+ }
+ }
+ match state {
+ Any |
+ Brace(_) => IResult::Done(&i[..0], split_ws_parts(i)),
+ End(0) => IResult::Error(nom::ErrorKind::Custom(0)),
+ End(start) => IResult::Done(&i[start..], split_ws_parts(&i[..start])),
+ }
+}
+
+fn identifier(input: &[u8]) -> IResult<&[u8], &str> {
+ if !nom::is_alphabetic(input[0]) && input[0] != b'_' {
+ return IResult::Error(nom::ErrorKind::Custom(0));
+ }
+ for (i, ch) in input.iter().enumerate() {
+ if i == 0 || nom::is_alphanumeric(*ch) || *ch == b'_' {
+ continue;
+ }
+ return IResult::Done(&input[i..],
+ str::from_utf8(&input[..i]).unwrap());
+ }
+ IResult::Done(&input[1..], str::from_utf8(&input[..1]).unwrap())
+}
+
+named!(expr_num_lit<Expr>, map!(nom::digit,
+ |s| Expr::NumLit(str::from_utf8(s).unwrap())
+));
+
+named!(expr_str_lit<Expr>, map!(
+ delimited!(char!('"'), is_not!("\""), char!('"')),
+ |s| Expr::StrLit(str::from_utf8(s).unwrap())
+));
+
+named!(expr_var<Expr>, map!(identifier,
+ |s| Expr::Var(s))
+);
+
+named!(target_single<Target>, map!(identifier,
+ |s| Target::Name(s)
+));
+
+named!(arguments<Vec<Expr>>, do_parse!(
+ tag_s!("(") >>
+ args: opt!(do_parse!(
+ arg0: ws!(expr_any) >>
+ args: many0!(do_parse!(
+ tag_s!(",") >>
+ argn: ws!(expr_any) >>
+ (argn)
+ )) >>
+ ({
+ let mut res = vec![arg0];
+ res.extend(args);
+ res
+ })
+ )) >>
+ tag_s!(")") >>
+ (args.unwrap_or(Vec::new()))
+));
+
+named!(parameters<Vec<&'a str>>, do_parse!(
+ tag_s!("(") >>
+ vals: opt!(do_parse!(
+ arg0: ws!(identifier) >>
+ args: many0!(do_parse!(
+ tag_s!(",") >>
+ argn: ws!(identifier) >>
+ (argn)
+ )) >>
+ ({
+ let mut res = vec![arg0];
+ res.extend(args);
+ res
+ })
+ )) >>
+ tag_s!(")") >>
+ (vals.unwrap_or(Vec::new()))
+));
+
+named!(expr_group<Expr>, map!(
+ delimited!(char!('('), expr_any, char!(')')),
+ |s| Expr::Group(Box::new(s))
+));
+
+named!(expr_single<Expr>, alt!(
+ expr_num_lit |
+ expr_str_lit |
+ expr_var |
+ expr_group
+));
+
+named!(attr<(&str, Option<Vec<Expr>>)>, do_parse!(
+ tag_s!(".") >>
+ attr: identifier >>
+ args: opt!(arguments) >>
+ (attr, args)
+));
+
+named!(expr_attr<Expr>, do_parse!(
+ obj: expr_single >>
+ attrs: many0!(attr) >>
+ ({
+ let mut res = obj;
+ for (aname, args) in attrs {
+ res = if args.is_some() {
+ Expr::MethodCall(Box::new(res), aname, args.unwrap())
+ } else {
+ Expr::Attr(Box::new(res), aname)
+ };
+ }
+ res
+ })
+));
+
+named!(filter<(&str, Option<Vec<Expr>>)>, do_parse!(
+ tag_s!("|") >>
+ fname: identifier >>
+ args: opt!(arguments) >>
+ (fname, args)
+));
+
+named!(expr_filtered<Expr>, do_parse!(
+ obj: expr_attr >>
+ filters: many0!(filter) >>
+ ({
+ let mut res = obj;
+ for (fname, args) in filters {
+ res = Expr::Filter(fname, {
+ let mut args = match args {
+ Some(inner) => inner,
+ None => Vec::new(),
+ };
+ args.insert(0, res);
+ args
+ });
+ }
+ res
+ })
+));
+
+macro_rules! expr_prec_layer {
+ ( $name:ident, $inner:ident, $( $op:expr ),* ) => {
+ named!($name<Expr>, alt!(
+ do_parse!(
+ left: $inner >>
+ op: ws!(alt!($( tag_s!($op) )|*)) >>
+ right: $inner >>
+ (Expr::BinOp(str::from_utf8(op).unwrap(),
+ Box::new(left), Box::new(right)))
+ ) | $inner
+ ));
+ }
+}
+
+expr_prec_layer!(expr_muldivmod, expr_filtered, "*", "/", "%");
+expr_prec_layer!(expr_addsub, expr_muldivmod, "+", "-");
+expr_prec_layer!(expr_shifts, expr_addsub, ">>", "<<");
+expr_prec_layer!(expr_band, expr_shifts, "&");
+expr_prec_layer!(expr_bxor, expr_band, "^");
+expr_prec_layer!(expr_bor, expr_bxor, "|");
+expr_prec_layer!(expr_compare, expr_bor,
+ "==", "!=", ">=", ">", "<=", "<"
+);
+expr_prec_layer!(expr_and, expr_compare, "&&");
+expr_prec_layer!(expr_any, expr_and, "||");
+
+named!(expr_node<Node>, do_parse!(
+ tag_s!("{{") >>
+ pws: opt!(tag_s!("-")) >>
+ expr: ws!(expr_any) >>
+ nws: opt!(tag_s!("-")) >>
+ tag_s!("}}") >>
+ (Node::Expr(WS(pws.is_some(), nws.is_some()), expr))
+));
+
+named!(block_call<Node>, do_parse!(
+ pws: opt!(tag_s!("-")) >>
+ ws!(tag_s!("call")) >>
+ name: ws!(identifier) >>
+ args: ws!(arguments) >>
+ nws: opt!(tag_s!("-")) >>
+ (Node::Call(WS(pws.is_some(), nws.is_some()), name, args))
+));
+
+named!(cond_if<Expr>, do_parse!(
+ ws!(tag_s!("if")) >>
+ cond: ws!(expr_any) >>
+ (cond)
+));
+
+named!(cond_block<Cond>, do_parse!(
+ tag_s!("{%") >>
+ pws: opt!(tag_s!("-")) >>
+ ws!(tag_s!("else")) >>
+ cond: opt!(cond_if) >>
+ nws: opt!(tag_s!("-")) >>
+ tag_s!("%}") >>
+ block: parse_template >>
+ (WS(pws.is_some(), nws.is_some()), cond, block)
+));
+
+named!(block_if<Node>, do_parse!(
+ pws1: opt!(tag_s!("-")) >>
+ cond: ws!(cond_if) >>
+ nws1: opt!(tag_s!("-")) >>
+ tag_s!("%}") >>
+ block: parse_template >>
+ elifs: many0!(cond_block) >>
+ tag_s!("{%") >>
+ pws2: opt!(tag_s!("-")) >>
+ ws!(tag_s!("endif")) >>
+ nws2: opt!(tag_s!("-")) >>
+ ({
+ let mut res = Vec::new();
+ res.push((WS(pws1.is_some(), nws1.is_some()), Some(cond), block));
+ res.extend(elifs);
+ Node::Cond(res, WS(pws2.is_some(), nws2.is_some()))
+ })
+));
+
+named!(block_let<Node>, do_parse!(
+ pws: opt!(tag_s!("-")) >>
+ ws!(tag_s!("let")) >>
+ var: ws!(target_single) >>
+ val: opt!(do_parse!(
+ ws!(tag_s!("=")) >>
+ val: ws!(expr_any) >>
+ (val)
+ )) >>
+ nws: opt!(tag_s!("-")) >>
+ (if val.is_some() {
+ Node::Let(WS(pws.is_some(), nws.is_some()), var, val.unwrap())
+ } else {
+ Node::LetDecl(WS(pws.is_some(), nws.is_some()), var)
+ })
+));
+
+named!(block_for<Node>, do_parse!(
+ pws1: opt!(tag_s!("-")) >>
+ ws!(tag_s!("for")) >>
+ var: ws!(target_single) >>
+ ws!(tag_s!("in")) >>
+ iter: ws!(expr_any) >>
+ nws1: opt!(tag_s!("-")) >>
+ tag_s!("%}") >>
+ block: parse_template >>
+ tag_s!("{%") >>
+ pws2: opt!(tag_s!("-")) >>
+ ws!(tag_s!("endfor")) >>
+ nws2: opt!(tag_s!("-")) >>
+ (Node::Loop(WS(pws1.is_some(), nws1.is_some()),
+ var, iter, block,
+ WS(pws2.is_some(), pws2.is_some())))
+));
+
+named!(block_extends<Node>, do_parse!(
+ ws!(tag_s!("extends")) >>
+ name: ws!(expr_str_lit) >>
+ (Node::Extends(name))
+));
+
+named!(block_block<Node>, do_parse!(
+ pws1: opt!(tag_s!("-")) >>
+ ws!(tag_s!("block")) >>
+ name: ws!(identifier) >>
+ nws1: opt!(tag_s!("-")) >>
+ tag_s!("%}") >>
+ contents: parse_template >>
+ tag_s!("{%") >>
+ pws2: opt!(tag_s!("-")) >>
+ ws!(tag_s!("endblock")) >>
+ opt!(ws!(tag_s!(name))) >>
+ nws2: opt!(tag_s!("-")) >>
+ (Node::BlockDef(WS(pws1.is_some(), nws1.is_some()),
+ name, contents,
+ WS(pws2.is_some(), pws2.is_some())))
+));
+
+named!(block_include<Node>, do_parse!(
+ pws: opt!(tag_s!("-")) >>
+ ws!(tag_s!("include")) >>
+ name: ws!(expr_str_lit) >>
+ nws: opt!(tag_s!("-")) >>
+ (Node::Include(WS(pws.is_some(), nws.is_some()), match name {
+ Expr::StrLit(s) => s,
+ _ => panic!("include path must be a string literal"),
+ }))
+));
+
+named!(block_macro<Node>, do_parse!(
+ pws1: opt!(tag_s!("-")) >>
+ ws!(tag_s!("macro")) >>
+ name: ws!(identifier) >>
+ params: ws!(parameters) >>
+ nws1: opt!(tag_s!("-")) >>
+ tag_s!("%}") >>
+ contents: parse_template >>
+ tag_s!("{%") >>
+ pws2: opt!(tag_s!("-")) >>
+ ws!(tag_s!("endmacro")) >>
+ nws2: opt!(tag_s!("-")) >>
+ (Node::Macro(
+ WS(pws1.is_some(), nws1.is_some()),
+ name,
+ params,
+ contents,
+ WS(pws2.is_some(), nws2.is_some())
+ ))
+));
+
+named!(block_node<Node>, do_parse!(
+ tag_s!("{%") >>
+ contents: alt!(
+ block_call |
+ block_let |
+ block_if |
+ block_for |
+ block_extends |
+ block_include |
+ block_block |
+ block_macro
+ ) >>
+ tag_s!("%}") >>
+ (contents)
+));
+
+named!(block_comment<Node>, do_parse!(
+ tag_s!("{#") >>
+ take_until_s!("#}") >>
+ tag_s!("#}") >>
+ (Node::Comment())
+));
+
+named!(parse_template<Vec<Node<'a>>>, many0!(alt!(
+ take_content |
+ block_comment |
+ expr_node |
+ block_node
+)));
+
+pub fn parse(src: &str) -> Vec<Node> {
+ match parse_template(src.as_bytes()) {
+ IResult::Done(left, res) => {
+ if left.len() > 0 {
+ let s = str::from_utf8(left).unwrap();
+ panic!("unable to parse template:\n\n{:?}", s);
+ } else {
+ res
+ }
+ },
+ IResult::Error(err) => panic!("problems parsing template source: {}", err),
+ IResult::Incomplete(_) => panic!("parsing incomplete"),
+ }
+}
+
+#[cfg(test)]
+mod tests {
+ fn check_ws_split(s: &str, res: &(&str, &str, &str)) {
+ let node = super::split_ws_parts(s.as_bytes());
+ match node {
+ super::Node::Lit(lws, s, rws) => {
+ assert_eq!(lws, res.0);
+ assert_eq!(s, res.1);
+ assert_eq!(rws, res.2);
+ },
+ _ => { panic!("fail"); },
+ }
+ }
+ #[test]
+ fn test_ws_splitter() {
+ check_ws_split("", &("", "", ""));
+ check_ws_split("a", &("", "a", ""));
+ check_ws_split("\ta", &("\t", "a", ""));
+ check_ws_split("b\n", &("", "b", "\n"));
+ check_ws_split(" \t\r\n", &(" \t\r\n", "", ""));
+ }
+ #[test]
+ #[should_panic]
+ fn test_invalid_block() {
+ super::parse("{% extend \"blah\" %}");
+ }
+}