blob: f5ecb50cf1a7be41a7482361112e6b5be0c30d9f [file] [log] [blame]
// Copyright 2018 Syn Developers
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.

//! Parsing interface for parsing a token stream into a syntax tree node.
//!
//! Parsing in Syn is built on parser functions that take in a [`ParseStream`]
//! and produce a [`Result<T>`] where `T` is some syntax tree node. Underlying
//! these parser functions is a lower level mechanism built around the
//! [`Cursor`] type. `Cursor` is a cheaply copyable cursor over a range of
//! tokens in a token stream.
//!
//! [`ParseStream`]: type.ParseStream.html
//! [`Result<T>`]: type.Result.html
//! [`Cursor`]: ../buffer/index.html
//!
//! The `ParseStream`-based interface is convenient for parser implementations,
//! but not necessarily when you just have some tokens that you want to parse.
//! For that we expose the following two entry points.
//!
//! ## The `syn::parse*` functions
//!
//! The [`syn::parse`], [`syn::parse2`], and [`syn::parse_str`] functions serve
//! as an entry point for parsing syntax tree nodes that can be parsed in an
//! obvious default way. These functions can return any syntax tree node that
//! implements the [`Parse`] trait, which includes most types in Syn.
//!
//! [`syn::parse`]: ../fn.parse.html
//! [`syn::parse2`]: ../fn.parse2.html
//! [`syn::parse_str`]: ../fn.parse_str.html
//! [`Parse`]: trait.Parse.html
//!
//! ```
//! use syn::Type;
//!
//! # fn run_parser() -> Result<(), syn::parse::Error> {
//! let t: Type = syn::parse_str("std::collections::HashMap<String, Value>")?;
//! # Ok(())
//! # }
//! #
//! # fn main() {
//! #     run_parser().unwrap();
//! # }
//! ```
//!
//! The [`parse_quote!`] macro also uses this approach.
//!
//! [`parse_quote!`]: ../macro.parse_quote.html
//!
//! ## The `Parser` trait
//!
//! Some types can be parsed in several ways depending on context. For example
//! an [`Attribute`] can be either "outer" like `#[...]` or "inner" like
//! `#![...]` and parsing the wrong one would be a bug. Similarly [`Punctuated`]
//! may or may not allow trailing punctuation, and parsing it the wrong way
//! would either reject valid input or accept invalid input.
//!
//! [`Attribute`]: ../struct.Attribute.html
//! [`Punctuated`]: ../punctuated/index.html
//!
//! The `Parse` trait is not implemented in these cases because there is no good
//! behavior to consider the default.
//!
//! ```ignore
//! // Can't parse `Punctuated` without knowing whether trailing punctuation
//! // should be allowed in this context.
//! let path: Punctuated<PathSegment, Token![::]> = syn::parse(tokens)?;
//! ```
//!
//! In these cases the types provide a choice of parser functions rather than a
//! single `Parse` implementation, and those parser functions can be invoked
//! through the [`Parser`] trait.
//!
//! [`Parser`]: trait.Parser.html
//!
//! ```
//! # extern crate syn;
//! #
//! # extern crate proc_macro2;
//! # use proc_macro2::TokenStream;
//! #
//! use syn::parse::Parser;
//! use syn::punctuated::Punctuated;
//! use syn::{Attribute, Expr, PathSegment, Token};
//!
//! # fn run_parsers() -> Result<(), syn::parse::Error> {
//! #     let tokens = TokenStream::new().into();
//! // Parse a nonempty sequence of path segments separated by `::` punctuation
//! // with no trailing punctuation.
//! let parser = Punctuated::<PathSegment, Token![::]>::parse_separated_nonempty;
//! let path = parser.parse(tokens)?;
//!
//! #     let tokens = TokenStream::new().into();
//! // Parse a possibly empty sequence of expressions terminated by commas with
//! // an optional trailing punctuation.
//! let parser = Punctuated::<Expr, Token![,]>::parse_terminated;
//! let args = parser.parse(tokens)?;
//!
//! #     let tokens = TokenStream::new().into();
//! // Parse zero or more outer attributes but not inner attributes.
//! let parser = Attribute::parse_outer;
//! let attrs = parser.parse(tokens)?;
//! #
//! #     Ok(())
//! # }
//! #
//! # fn main() {}
//! ```
//!
//! ---
//!
//! *This module is available if Syn is built with the `"parsing"` feature.*

118use std::cell::Cell;
119use std::fmt::Display;
120use std::marker::PhantomData;
121use std::mem;
122use std::ops::Deref;
David Tolnayeafc8052018-08-25 16:33:53 -0400123use std::rc::Rc;
David Tolnay80a914f2018-08-30 23:49:53 -0700124use std::str::FromStr;
David Tolnayeafc8052018-08-25 16:33:53 -0400125
David Tolnay80a914f2018-08-30 23:49:53 -0700126#[cfg(all(
127 not(all(target_arch = "wasm32", target_os = "unknown")),
128 feature = "proc-macro"
129))]
130use proc_macro;
131use proc_macro2::{self, Delimiter, Group, Ident, Literal, Punct, Span, TokenStream, TokenTree};
David Tolnay18c754c2018-08-21 23:26:58 -0400132
David Tolnay80a914f2018-08-30 23:49:53 -0700133use buffer::{Cursor, TokenBuffer};
David Tolnayb6254182018-08-25 08:44:54 -0400134use error;
David Tolnay94f06632018-08-31 10:17:17 -0700135use lookahead;
136use private;
David Tolnay577d0332018-08-25 21:45:24 -0400137use punctuated::Punctuated;
David Tolnay4fb71232018-08-25 23:14:50 -0400138use token::Token;
David Tolnay18c754c2018-08-21 23:26:58 -0400139
David Tolnayb6254182018-08-25 08:44:54 -0400140pub use error::{Error, Result};
141pub use lookahead::{Lookahead1, Peek};
David Tolnay18c754c2018-08-21 23:26:58 -0400142
143/// Parsing interface implemented by all types that can be parsed in a default
144/// way from a token stream.
145pub trait Parse: Sized {
146 fn parse(input: ParseStream) -> Result<Self>;
147}
148
149/// Input to a Syn parser function.
David Tolnaya0daa482018-09-01 02:09:40 -0700150///
151/// See the methods of this type under the documentation of [`ParseBuffer`]. For
152/// an overview of parsing in Syn, refer to the [module documentation].
153///
154/// [module documentation]: index.html
David Tolnay18c754c2018-08-21 23:26:58 -0400155pub type ParseStream<'a> = &'a ParseBuffer<'a>;
156
157/// Cursor position within a buffered token stream.
David Tolnay18c754c2018-08-21 23:26:58 -0400158pub struct ParseBuffer<'a> {
159 scope: Span,
160 cell: Cell<Cursor<'static>>,
161 marker: PhantomData<Cursor<'a>>,
David Tolnayeafc8052018-08-25 16:33:53 -0400162 unexpected: Rc<Cell<Option<Span>>>,
163}
164
165impl<'a> Drop for ParseBuffer<'a> {
166 fn drop(&mut self) {
167 if !self.is_empty() && self.unexpected.get().is_none() {
168 self.unexpected.set(Some(self.cursor().span()));
169 }
170 }
David Tolnay18c754c2018-08-21 23:26:58 -0400171}
172
David Tolnay18c754c2018-08-21 23:26:58 -0400173#[derive(Copy, Clone)]
174pub struct StepCursor<'c, 'a> {
175 scope: Span,
176 cursor: Cursor<'c>,
177 marker: PhantomData<fn(Cursor<'c>) -> Cursor<'a>>,
178}
179
180impl<'c, 'a> Deref for StepCursor<'c, 'a> {
181 type Target = Cursor<'c>;
182
183 fn deref(&self) -> &Self::Target {
184 &self.cursor
185 }
186}
187
188impl<'c, 'a> StepCursor<'c, 'a> {
David Tolnay18c754c2018-08-21 23:26:58 -0400189 pub fn advance(self, other: Cursor<'c>) -> Cursor<'a> {
190 unsafe { mem::transmute::<Cursor<'c>, Cursor<'a>>(other) }
191 }
192
David Tolnay18c754c2018-08-21 23:26:58 -0400193 pub fn error<T: Display>(self, message: T) -> Error {
194 error::new_at(self.scope, self.cursor, message)
195 }
196}
197
David Tolnay66cb0c42018-08-31 09:01:30 -0700198fn skip(input: ParseStream) -> bool {
David Tolnay4ac232d2018-08-31 10:18:03 -0700199 input
200 .step(|cursor| {
201 if let Some((_lifetime, rest)) = cursor.lifetime() {
202 Ok((true, rest))
203 } else if let Some((_token, rest)) = cursor.token_tree() {
204 Ok((true, rest))
205 } else {
206 Ok((false, *cursor))
207 }
208 }).unwrap()
David Tolnay66cb0c42018-08-31 09:01:30 -0700209}
210
David Tolnay10951d52018-08-31 10:27:39 -0700211impl private {
David Tolnay70f30e92018-09-01 02:04:17 -0700212 pub fn new_parse_buffer(
213 scope: Span,
214 cursor: Cursor,
215 unexpected: Rc<Cell<Option<Span>>>,
216 ) -> ParseBuffer {
David Tolnay94f06632018-08-31 10:17:17 -0700217 let extend = unsafe { mem::transmute::<Cursor, Cursor<'static>>(cursor) };
David Tolnay18c754c2018-08-21 23:26:58 -0400218 ParseBuffer {
219 scope: scope,
220 cell: Cell::new(extend),
221 marker: PhantomData,
David Tolnayeafc8052018-08-25 16:33:53 -0400222 unexpected: unexpected,
David Tolnay18c754c2018-08-21 23:26:58 -0400223 }
224 }
225
David Tolnay94f06632018-08-31 10:17:17 -0700226 pub fn get_unexpected(buffer: &ParseBuffer) -> Rc<Cell<Option<Span>>> {
227 buffer.unexpected.clone()
228 }
229}
230
231impl<'a> ParseBuffer<'a> {
David Tolnay18c754c2018-08-21 23:26:58 -0400232 pub fn parse<T: Parse>(&self) -> Result<T> {
233 T::parse(self)
234 }
235
David Tolnay3a515a02018-08-25 21:08:27 -0400236 pub fn call<T>(&self, function: fn(ParseStream) -> Result<T>) -> Result<T> {
237 function(self)
238 }
239
David Tolnayb77c8b62018-08-25 16:39:41 -0400240 pub fn peek<T: Peek>(&self, token: T) -> bool {
241 self.lookahead1().peek(token)
242 }
243
David Tolnay4fb71232018-08-25 23:14:50 -0400244 pub fn peek2<T: Peek>(&self, token: T) -> bool {
David Tolnay4fb71232018-08-25 23:14:50 -0400245 let ahead = self.fork();
David Tolnay66cb0c42018-08-31 09:01:30 -0700246 skip(&ahead) && ahead.peek(token)
David Tolnay4fb71232018-08-25 23:14:50 -0400247 }
248
249 pub fn peek3<T: Peek>(&self, token: T) -> bool {
David Tolnay4fb71232018-08-25 23:14:50 -0400250 let ahead = self.fork();
David Tolnay66cb0c42018-08-31 09:01:30 -0700251 skip(&ahead) && skip(&ahead) && ahead.peek(token)
David Tolnay4fb71232018-08-25 23:14:50 -0400252 }
253
David Tolnay577d0332018-08-25 21:45:24 -0400254 pub fn parse_terminated<T, P: Parse>(
255 &self,
256 parser: fn(ParseStream) -> Result<T>,
257 ) -> Result<Punctuated<T, P>> {
David Tolnayd0f80212018-08-30 18:32:14 -0700258 Punctuated::parse_terminated_with(self, parser)
David Tolnay577d0332018-08-25 21:45:24 -0400259 }
260
David Tolnayf5d30452018-09-01 02:29:04 -0700261 pub fn is_empty(&self) -> bool {
262 self.cursor().eof()
263 }
264
265 pub fn lookahead1(&self) -> Lookahead1<'a> {
266 lookahead::new(self.scope, self.cursor())
267 }
268
David Tolnayb77c8b62018-08-25 16:39:41 -0400269 pub fn fork(&self) -> Self {
David Tolnay6456a9d2018-08-26 08:11:18 -0400270 ParseBuffer {
271 scope: self.scope,
272 cell: self.cell.clone(),
273 marker: PhantomData,
274 // Not the parent's unexpected. Nothing cares whether the clone
275 // parses all the way.
276 unexpected: Rc::new(Cell::new(None)),
277 }
David Tolnayb77c8b62018-08-25 16:39:41 -0400278 }
279
David Tolnay4fb71232018-08-25 23:14:50 -0400280 pub fn error<T: Display>(&self, message: T) -> Error {
281 error::new_at(self.scope, self.cursor(), message)
282 }
283
David Tolnayb50c65a2018-08-30 21:14:57 -0700284 pub fn step<F, R>(&self, function: F) -> Result<R>
David Tolnay18c754c2018-08-21 23:26:58 -0400285 where
286 F: for<'c> FnOnce(StepCursor<'c, 'a>) -> Result<(R, Cursor<'c>)>,
287 {
288 match function(StepCursor {
289 scope: self.scope,
290 cursor: self.cell.get(),
291 marker: PhantomData,
292 }) {
293 Ok((ret, cursor)) => {
294 self.cell.set(cursor);
295 Ok(ret)
296 }
297 Err(err) => Err(err),
298 }
299 }
David Tolnayeafc8052018-08-25 16:33:53 -0400300
David Tolnayf5d30452018-09-01 02:29:04 -0700301 pub fn cursor(&self) -> Cursor<'a> {
302 self.cell.get()
303 }
304
David Tolnay94f06632018-08-31 10:17:17 -0700305 fn check_unexpected(&self) -> Result<()> {
David Tolnayeafc8052018-08-25 16:33:53 -0400306 match self.unexpected.get() {
307 Some(span) => Err(Error::new(span, "unexpected token")),
308 None => Ok(()),
309 }
310 }
David Tolnay18c754c2018-08-21 23:26:58 -0400311}
312
313impl Parse for Ident {
314 fn parse(input: ParseStream) -> Result<Self> {
David Tolnayb50c65a2018-08-30 21:14:57 -0700315 input.step(|cursor| {
David Tolnay18c754c2018-08-21 23:26:58 -0400316 if let Some((ident, rest)) = cursor.ident() {
David Tolnayc4fdb1a2018-08-24 21:11:07 -0400317 match ident.to_string().as_str() {
318 "_"
319 // Based on https://doc.rust-lang.org/grammar.html#keywords
320 // and https://github.com/rust-lang/rfcs/blob/master/text/2421-unreservations-2018.md
321 | "abstract" | "as" | "become" | "box" | "break" | "const"
322 | "continue" | "crate" | "do" | "else" | "enum" | "extern" | "false" | "final"
323 | "fn" | "for" | "if" | "impl" | "in" | "let" | "loop" | "macro" | "match"
324 | "mod" | "move" | "mut" | "override" | "priv" | "proc" | "pub"
325 | "ref" | "return" | "Self" | "self" | "static" | "struct"
326 | "super" | "trait" | "true" | "type" | "typeof" | "unsafe" | "unsized" | "use"
327 | "virtual" | "where" | "while" | "yield" => {}
328 _ => return Ok((ident, rest)),
329 }
David Tolnay18c754c2018-08-21 23:26:58 -0400330 }
David Tolnayc4fdb1a2018-08-24 21:11:07 -0400331 Err(cursor.error("expected identifier"))
David Tolnay18c754c2018-08-21 23:26:58 -0400332 })
333 }
334}
335
David Tolnaya7d69fc2018-08-26 13:30:24 -0400336impl<T: Parse> Parse for Box<T> {
337 fn parse(input: ParseStream) -> Result<Self> {
338 input.parse().map(Box::new)
339 }
340}
341
David Tolnay4fb71232018-08-25 23:14:50 -0400342impl<T: Parse + Token> Parse for Option<T> {
David Tolnay18c754c2018-08-21 23:26:58 -0400343 fn parse(input: ParseStream) -> Result<Self> {
David Tolnay00f81fd2018-09-01 10:50:12 -0700344 if T::peek(input.cursor()) {
David Tolnay4fb71232018-08-25 23:14:50 -0400345 Ok(Some(input.parse()?))
346 } else {
347 Ok(None)
David Tolnay18c754c2018-08-21 23:26:58 -0400348 }
David Tolnay18c754c2018-08-21 23:26:58 -0400349 }
350}
David Tolnay4ac232d2018-08-31 10:18:03 -0700351
David Tolnay80a914f2018-08-30 23:49:53 -0700352impl Parse for TokenStream {
353 fn parse(input: ParseStream) -> Result<Self> {
354 input.step(|cursor| Ok((cursor.token_stream(), Cursor::empty())))
355 }
356}
357
358impl Parse for TokenTree {
359 fn parse(input: ParseStream) -> Result<Self> {
360 input.step(|cursor| match cursor.token_tree() {
361 Some((tt, rest)) => Ok((tt, rest)),
362 None => Err(cursor.error("expected token tree")),
363 })
364 }
365}
366
367impl Parse for Group {
368 fn parse(input: ParseStream) -> Result<Self> {
369 input.step(|cursor| {
370 for delim in &[Delimiter::Parenthesis, Delimiter::Brace, Delimiter::Bracket] {
371 if let Some((inside, span, rest)) = cursor.group(*delim) {
372 let mut group = Group::new(*delim, inside.token_stream());
373 group.set_span(span);
374 return Ok((group, rest));
375 }
376 }
377 Err(cursor.error("expected group token"))
378 })
379 }
380}
381
382impl Parse for Punct {
383 fn parse(input: ParseStream) -> Result<Self> {
384 input.step(|cursor| match cursor.punct() {
385 Some((punct, rest)) => Ok((punct, rest)),
386 None => Err(cursor.error("expected punctuation token")),
387 })
388 }
389}
390
391impl Parse for Literal {
392 fn parse(input: ParseStream) -> Result<Self> {
393 input.step(|cursor| match cursor.literal() {
394 Some((literal, rest)) => Ok((literal, rest)),
395 None => Err(cursor.error("expected literal token")),
396 })
397 }
398}
399
400/// Parser that can parse Rust tokens into a particular syntax tree node.
401///
402/// Refer to the [module documentation] for details about parsing in Syn.
403///
404/// [module documentation]: index.html
405///
406/// *This trait is available if Syn is built with the `"parsing"` feature.*
407pub trait Parser: Sized {
408 type Output;
409
410 /// Parse a proc-macro2 token stream into the chosen syntax tree node.
411 fn parse2(self, tokens: TokenStream) -> Result<Self::Output>;
412
413 /// Parse tokens of source code into the chosen syntax tree node.
414 ///
415 /// *This method is available if Syn is built with both the `"parsing"` and
416 /// `"proc-macro"` features.*
417 #[cfg(all(
418 not(all(target_arch = "wasm32", target_os = "unknown")),
419 feature = "proc-macro"
420 ))]
421 fn parse(self, tokens: proc_macro::TokenStream) -> Result<Self::Output> {
422 self.parse2(proc_macro2::TokenStream::from(tokens))
423 }
424
425 /// Parse a string of Rust code into the chosen syntax tree node.
426 ///
427 /// # Hygiene
428 ///
429 /// Every span in the resulting syntax tree will be set to resolve at the
430 /// macro call site.
431 fn parse_str(self, s: &str) -> Result<Self::Output> {
432 self.parse2(proc_macro2::TokenStream::from_str(s)?)
433 }
434}
435
David Tolnay7b07aa12018-09-01 11:41:12 -0700436fn tokens_to_parse_buffer(tokens: &TokenBuffer) -> ParseBuffer {
437 let scope = Span::call_site();
438 let cursor = tokens.begin();
439 let unexpected = Rc::new(Cell::new(None));
440 private::new_parse_buffer(scope, cursor, unexpected)
441}
442
David Tolnay80a914f2018-08-30 23:49:53 -0700443impl<F, T> Parser for F
444where
445 F: FnOnce(ParseStream) -> Result<T>,
446{
447 type Output = T;
448
449 fn parse2(self, tokens: TokenStream) -> Result<T> {
450 let buf = TokenBuffer::new2(tokens);
David Tolnay7b07aa12018-09-01 11:41:12 -0700451 let state = tokens_to_parse_buffer(&buf);
David Tolnay80a914f2018-08-30 23:49:53 -0700452 let node = self(&state)?;
453 state.check_unexpected()?;
454 if state.is_empty() {
455 Ok(node)
456 } else {
457 Err(state.error("unexpected token"))
458 }
459 }
460}