// Copyright 2012 The Rust Project Developers. See the COPYRIGHT // file at the top-level directory of this distribution and at // http://rust-lang.org/COPYRIGHT. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. use ast; use ast::{TokenTree, TTDelim, TTTok, TTSeq, TTNonterminal, Ident}; use codemap::{Span, DUMMY_SP}; use diagnostic::SpanHandler; use ext::tt::macro_parser::{NamedMatch, MatchedSeq, MatchedNonterminal}; use parse::token::{EOF, INTERPOLATED, IDENT, Token, NtIdent}; use parse::token; use parse::lexer::TokenAndSpan; use std::rc::Rc; use std::collections::HashMap; ///an unzipping of `TokenTree`s #[deriving(Clone)] struct TtFrame { forest: Rc>, idx: uint, dotdotdoted: bool, sep: Option, } #[deriving(Clone)] pub struct TtReader<'a> { pub sp_diag: &'a SpanHandler, /// the unzipped tree: stack: Vec, /* for MBE-style macro transcription */ interpolations: HashMap>, repeat_idx: Vec, repeat_len: Vec, /* cached: */ pub cur_tok: Token, pub cur_span: Span, } /// This can do Macro-By-Example transcription. On the other hand, if /// `src` contains no `TTSeq`s and `TTNonterminal`s, `interp` can (and /// should) be none. pub fn new_tt_reader<'a>(sp_diag: &'a SpanHandler, interp: Option>>, src: Vec ) -> TtReader<'a> { let mut r = TtReader { sp_diag: sp_diag, stack: vec!(TtFrame { forest: Rc::new(src), idx: 0, dotdotdoted: false, sep: None, }), interpolations: match interp { /* just a convenience */ None => HashMap::new(), Some(x) => x, }, repeat_idx: Vec::new(), repeat_len: Vec::new(), /* dummy values, never read: */ cur_tok: EOF, cur_span: DUMMY_SP, }; tt_next_token(&mut r); /* get cur_tok and cur_span set up */ r } fn lookup_cur_matched_by_matched(r: &TtReader, start: Rc) -> Rc { r.repeat_idx.iter().fold(start, |ad, idx| { match *ad { MatchedNonterminal(_) => { // end of the line; duplicate henceforth ad.clone() } MatchedSeq(ref ads, _) => ads.get(*idx).clone() } }) } fn lookup_cur_matched(r: &TtReader, name: Ident) -> Rc { let matched_opt = r.interpolations.find_copy(&name); match matched_opt { Some(s) => lookup_cur_matched_by_matched(r, s), None => { r.sp_diag .span_fatal(r.cur_span, format!("unknown macro variable `{}`", token::get_ident(name)).as_slice()); } } } #[deriving(Clone)] enum LockstepIterSize { LisUnconstrained, LisConstraint(uint, Ident), LisContradiction(String), } fn lis_merge(lhs: LockstepIterSize, rhs: LockstepIterSize) -> LockstepIterSize { match lhs { LisUnconstrained => rhs.clone(), LisContradiction(_) => lhs.clone(), LisConstraint(l_len, l_id) => match rhs { LisUnconstrained => lhs.clone(), LisContradiction(_) => rhs.clone(), LisConstraint(r_len, _) if l_len == r_len => lhs.clone(), LisConstraint(r_len, r_id) => { let l_n = token::get_ident(l_id); let r_n = token::get_ident(r_id); LisContradiction(format!("inconsistent lockstep iteration: \ '{}' has {} items, but '{}' has {}", l_n, l_len, r_n, r_len).to_string()) } } } } fn lockstep_iter_size(t: &TokenTree, r: &TtReader) -> LockstepIterSize { match *t { TTDelim(ref tts) | TTSeq(_, ref tts, _, _) => { tts.iter().fold(LisUnconstrained, |lis, tt| { lis_merge(lis, lockstep_iter_size(tt, r)) }) } TTTok(..) => LisUnconstrained, TTNonterminal(_, name) => match *lookup_cur_matched(r, name) { MatchedNonterminal(_) => LisUnconstrained, MatchedSeq(ref ads, _) => LisConstraint(ads.len(), name) } } } /// Return the next token from the TtReader. /// EFFECT: advances the reader's token field pub fn tt_next_token(r: &mut TtReader) -> TokenAndSpan { // FIXME(pcwalton): Bad copy? let ret_val = TokenAndSpan { tok: r.cur_tok.clone(), sp: r.cur_span.clone(), }; loop { let should_pop = match r.stack.last() { None => { assert_eq!(ret_val.tok, EOF); return ret_val; } Some(frame) => { if frame.idx < frame.forest.len() { break; } !frame.dotdotdoted || *r.repeat_idx.last().unwrap() == *r.repeat_len.last().unwrap() - 1 } }; /* done with this set; pop or repeat? */ if should_pop { let prev = r.stack.pop().unwrap(); match r.stack.mut_last() { None => { r.cur_tok = EOF; return ret_val; } Some(frame) => { frame.idx += 1; } } if prev.dotdotdoted { r.repeat_idx.pop(); r.repeat_len.pop(); } } else { /* repeat */ *r.repeat_idx.mut_last().unwrap() += 1u; r.stack.mut_last().unwrap().idx = 0; match r.stack.last().unwrap().sep.clone() { Some(tk) => { r.cur_tok = tk; /* repeat same span, I guess */ return ret_val; } None => {} } } } loop { /* because it's easiest, this handles `TTDelim` not starting with a `TTTok`, even though it won't happen */ let t = { let frame = r.stack.last().unwrap(); // FIXME(pcwalton): Bad copy. (*frame.forest.get(frame.idx)).clone() }; match t { TTDelim(tts) => { r.stack.push(TtFrame { forest: tts, idx: 0, dotdotdoted: false, sep: None }); // if this could be 0-length, we'd need to potentially recur here } TTTok(sp, tok) => { r.cur_span = sp; r.cur_tok = tok; r.stack.mut_last().unwrap().idx += 1; return ret_val; } TTSeq(sp, tts, sep, zerok) => { // FIXME(pcwalton): Bad copy. match lockstep_iter_size(&TTSeq(sp, tts.clone(), sep.clone(), zerok), r) { LisUnconstrained => { r.sp_diag.span_fatal( sp.clone(), /* blame macro writer */ "attempted to repeat an expression \ containing no syntax \ variables matched as repeating at this depth"); } LisContradiction(ref msg) => { // FIXME #2887 blame macro invoker instead r.sp_diag.span_fatal(sp.clone(), msg.as_slice()); } LisConstraint(len, _) => { if len == 0 { if !zerok { // FIXME #2887 blame invoker r.sp_diag.span_fatal(sp.clone(), "this must repeat at least once"); } r.stack.mut_last().unwrap().idx += 1; return tt_next_token(r); } r.repeat_len.push(len); r.repeat_idx.push(0); r.stack.push(TtFrame { forest: tts, idx: 0, dotdotdoted: true, sep: sep.clone() }); } } } // FIXME #2887: think about span stuff here TTNonterminal(sp, ident) => { r.stack.mut_last().unwrap().idx += 1; match *lookup_cur_matched(r, ident) { /* sidestep the interpolation tricks for ident because (a) idents can be in lots of places, so it'd be a pain (b) we actually can, since it's a token. */ MatchedNonterminal(NtIdent(box sn, b)) => { r.cur_span = sp; r.cur_tok = IDENT(sn,b); return ret_val; } MatchedNonterminal(ref other_whole_nt) => { // FIXME(pcwalton): Bad copy. r.cur_span = sp; r.cur_tok = INTERPOLATED((*other_whole_nt).clone()); return ret_val; } MatchedSeq(..) => { r.sp_diag.span_fatal( r.cur_span, /* blame the macro writer */ format!("variable '{}' is still repeating at this depth", token::get_ident(ident)).as_slice()); } } } } } }