1 // Copyright 2012-2013 The Rust Project Developers. See the COPYRIGHT
2 // file at the top-level directory of this distribution and at
3 // http://rust-lang.org/COPYRIGHT.
5 // Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
6 // http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
7 // <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
8 // option. This file may not be copied, modified, or distributed
9 // except according to those terms.
11 pub use self::BinOpToken
::*;
12 pub use self::Nonterminal
::*;
13 pub use self::DelimToken
::*;
14 pub use self::IdentStyle
::*;
16 pub use self::Token
::*;
21 use util
::interner
::{RcStr, StrInterner}
;
24 use serialize
::{Decodable, Decoder, Encodable, Encoder}
;
29 #[allow(non_camel_case_types)]
30 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug, Copy)]
45 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug, Copy)]
47 /// A round parenthesis: `(` or `)`
49 /// A square bracket: `[` or `]`
51 /// A curly brace: `{` or `}`
55 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug, Copy)]
57 /// `::` follows the identifier with no whitespace in-between.
62 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug, Copy)]
63 pub enum SpecialMacroVar
{
64 /// `$crate` will be filled in with the name of the crate a macro was
65 /// imported from, if any.
69 impl SpecialMacroVar
{
70 pub fn as_str(self) -> &'
static str {
72 SpecialMacroVar
::CrateMacroVar
=> "crate",
77 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug, Copy)]
84 StrRaw(ast
::Name
, usize), /* raw str delimited by n hash symbols */
86 BinaryRaw(ast
::Name
, usize), /* raw binary str delimited by n hash symbols */
90 pub fn short_name(&self) -> &'
static str {
94 Integer(_
) => "integer",
96 Str_(_
) | StrRaw(..) => "str",
97 Binary(_
) | BinaryRaw(..) => "binary str"
102 #[allow(non_camel_case_types)]
103 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash, Debug)]
105 /* Expression-operator symbols. */
120 /* Structural symbols */
135 /// An opening delimiter, eg. `{`
136 OpenDelim(DelimToken
),
137 /// A closing delimiter, eg. `}`
138 CloseDelim(DelimToken
),
141 Literal(Lit
, Option
<ast
::Name
>),
143 /* Name components */
144 Ident(ast
::Ident
, IdentStyle
),
146 Lifetime(ast
::Ident
),
148 /* For interpolation */
149 Interpolated(Nonterminal
),
150 // Can be expanded into several tokens.
152 DocComment(ast
::Name
),
153 // In left-hand-sides of MBE macros:
154 /// Parse a nonterminal (name to bind, name of NT, styles of their idents)
155 MatchNt(ast
::Ident
, ast
::Ident
, IdentStyle
, IdentStyle
),
156 // In right-hand-sides of MBE macros:
157 /// A syntactic variable that will be filled in by macro expansion.
158 SubstNt(ast
::Ident
, IdentStyle
),
159 /// A macro variable with special meaning.
160 SpecialVarNt(SpecialMacroVar
),
162 // Junk. These carry no data because we don't really care about the data
163 // they *would* carry, and don't really want to allocate a new ident for
164 // them. Instead, users could extract that from the associated span.
176 /// Returns `true` if the token starts with '>'.
177 pub fn is_like_gt(&self) -> bool
{
179 BinOp(Shr
) | BinOpEq(Shr
) | Gt
| Ge
=> true,
184 /// Returns `true` if the token can appear at the start of an expression.
185 pub fn can_begin_expr(&self) -> bool
{
187 OpenDelim(_
) => true,
191 Literal(_
, _
) => true,
193 BinOp(Minus
) => true,
196 BinOp(Or
) => true, // in lambda syntax
197 OrOr
=> true, // in lambda syntax
198 AndAnd
=> true, // double borrow
199 DotDot
=> true, // range notation
201 Interpolated(NtExpr(..)) => true,
202 Interpolated(NtIdent(..)) => true,
203 Interpolated(NtBlock(..)) => true,
204 Interpolated(NtPath(..)) => true,
209 /// Returns `true` if the token is any literal
210 pub fn is_lit(&self) -> bool
{
212 Literal(_
, _
) => true,
217 /// Returns `true` if the token is an identifier.
218 pub fn is_ident(&self) -> bool
{
225 /// Returns `true` if the token is an interpolated path.
226 pub fn is_path(&self) -> bool
{
228 Interpolated(NtPath(..)) => true,
233 /// Returns `true` if the token is a path that is not followed by a `::`
235 #[allow(non_upper_case_globals)]
236 pub fn is_plain_ident(&self) -> bool
{
238 Ident(_
, Plain
) => true,
243 /// Returns `true` if the token is a lifetime.
244 pub fn is_lifetime(&self) -> bool
{
246 Lifetime(..) => true,
251 /// Returns `true` if the token is either the `mut` or `const` keyword.
252 pub fn is_mutability(&self) -> bool
{
253 self.is_keyword(keywords
::Mut
) ||
254 self.is_keyword(keywords
::Const
)
257 /// Maps a token to its corresponding binary operator.
258 pub fn to_binop(&self) -> Option
<ast
::BinOp_
> {
260 BinOp(Star
) => Some(ast
::BiMul
),
261 BinOp(Slash
) => Some(ast
::BiDiv
),
262 BinOp(Percent
) => Some(ast
::BiRem
),
263 BinOp(Plus
) => Some(ast
::BiAdd
),
264 BinOp(Minus
) => Some(ast
::BiSub
),
265 BinOp(Shl
) => Some(ast
::BiShl
),
266 BinOp(Shr
) => Some(ast
::BiShr
),
267 BinOp(And
) => Some(ast
::BiBitAnd
),
268 BinOp(Caret
) => Some(ast
::BiBitXor
),
269 BinOp(Or
) => Some(ast
::BiBitOr
),
270 Lt
=> Some(ast
::BiLt
),
271 Le
=> Some(ast
::BiLe
),
272 Ge
=> Some(ast
::BiGe
),
273 Gt
=> Some(ast
::BiGt
),
274 EqEq
=> Some(ast
::BiEq
),
275 Ne
=> Some(ast
::BiNe
),
276 AndAnd
=> Some(ast
::BiAnd
),
277 OrOr
=> Some(ast
::BiOr
),
282 /// Returns `true` if the token is a given keyword, `kw`.
283 #[allow(non_upper_case_globals)]
284 pub fn is_keyword(&self, kw
: keywords
::Keyword
) -> bool
{
286 Ident(sid
, Plain
) => kw
.to_name() == sid
.name
,
291 pub fn is_keyword_allow_following_colon(&self, kw
: keywords
::Keyword
) -> bool
{
293 Ident(sid
, _
) => { kw.to_name() == sid.name }
298 /// Returns `true` if the token is either a special identifier, or a strict
299 /// or reserved keyword.
300 #[allow(non_upper_case_globals)]
301 pub fn is_any_keyword(&self) -> bool
{
303 Ident(sid
, Plain
) => {
306 n
== SELF_KEYWORD_NAME
307 || n
== STATIC_KEYWORD_NAME
308 || n
== SUPER_KEYWORD_NAME
309 || n
== SELF_TYPE_KEYWORD_NAME
310 || STRICT_KEYWORD_START
<= n
311 && n
<= RESERVED_KEYWORD_FINAL
317 /// Returns `true` if the token may not appear as an identifier.
318 #[allow(non_upper_case_globals)]
319 pub fn is_strict_keyword(&self) -> bool
{
321 Ident(sid
, Plain
) => {
324 n
== SELF_KEYWORD_NAME
325 || n
== STATIC_KEYWORD_NAME
326 || n
== SUPER_KEYWORD_NAME
327 || n
== SELF_TYPE_KEYWORD_NAME
328 || STRICT_KEYWORD_START
<= n
329 && n
<= STRICT_KEYWORD_FINAL
331 Ident(sid
, ModName
) => {
334 n
!= SELF_KEYWORD_NAME
335 && n
!= SUPER_KEYWORD_NAME
336 && STRICT_KEYWORD_START
<= n
337 && n
<= STRICT_KEYWORD_FINAL
343 /// Returns `true` if the token is a keyword that has been reserved for
344 /// possible future use.
345 #[allow(non_upper_case_globals)]
346 pub fn is_reserved_keyword(&self) -> bool
{
348 Ident(sid
, Plain
) => {
351 RESERVED_KEYWORD_START
<= n
352 && n
<= RESERVED_KEYWORD_FINAL
358 /// Hygienic identifier equality comparison.
360 /// See `styntax::ext::mtwt`.
361 pub fn mtwt_eq(&self, other
: &Token
) -> bool
{
362 match (self, other
) {
363 (&Ident(id1
,_
), &Ident(id2
,_
)) | (&Lifetime(id1
), &Lifetime(id2
)) =>
364 mtwt
::resolve(id1
) == mtwt
::resolve(id2
),
370 #[derive(Clone, RustcEncodable, RustcDecodable, PartialEq, Eq, Hash)]
371 /// For interpolation during macro expansion.
372 pub enum Nonterminal
{
373 NtItem(P
<ast
::Item
>),
374 NtBlock(P
<ast
::Block
>),
375 NtStmt(P
<ast
::Stmt
>),
377 NtExpr(P
<ast
::Expr
>),
379 NtIdent(Box
<ast
::Ident
>, IdentStyle
),
380 /// Stuff inside brackets for attributes
381 NtMeta(P
<ast
::MetaItem
>),
382 NtPath(Box
<ast
::Path
>),
383 NtTT(P
<ast
::TokenTree
>), // needs P'ed to break a circularity
386 impl fmt
::Debug
for Nonterminal
{
387 fn fmt(&self, f
: &mut fmt
::Formatter
) -> fmt
::Result
{
389 NtItem(..) => f
.pad("NtItem(..)"),
390 NtBlock(..) => f
.pad("NtBlock(..)"),
391 NtStmt(..) => f
.pad("NtStmt(..)"),
392 NtPat(..) => f
.pad("NtPat(..)"),
393 NtExpr(..) => f
.pad("NtExpr(..)"),
394 NtTy(..) => f
.pad("NtTy(..)"),
395 NtIdent(..) => f
.pad("NtIdent(..)"),
396 NtMeta(..) => f
.pad("NtMeta(..)"),
397 NtPath(..) => f
.pad("NtPath(..)"),
398 NtTT(..) => f
.pad("NtTT(..)"),
404 // Get the first "argument"
406 ( $first
:expr
, $
( $remainder
:expr
, )* ) => ( $first
)
409 // Get the last "argument" (has to be done recursively to avoid phoney local ambiguity error)
411 ( $first
:expr
, $
( $remainder
:expr
, )+ ) => ( last
!( $
( $remainder
, )+ ) );
412 ( $first
:expr
, ) => ( $first
)
415 // In this macro, there is the requirement that the name (the number) must be monotonically
416 // increasing by one in the special identifiers, starting at 0; the same holds for the keywords,
417 // except starting from the next number instead of zero, and with the additional exception that
418 // special identifiers are *also* allowed (they are deduplicated in the important place, the
419 // interner), an exception which is demonstrated by "static" and "self".
420 macro_rules
! declare_special_idents_and_keywords
{(
421 // So now, in these rules, why is each definition parenthesised?
422 // Answer: otherwise we get a spurious local ambiguity bug on the "}"
423 pub mod special_idents
{
424 $
( ($si_name
:expr
, $si_static
:ident
, $si_str
:expr
); )*
429 $
( ($sk_name
:expr
, $sk_variant
:ident
, $sk_str
:expr
); )*
431 $
( ($rk_name
:expr
, $rk_variant
:ident
, $rk_str
:expr
); )*
434 const STRICT_KEYWORD_START
: ast
::Name
= first
!($
( ast
::Name($sk_name
), )*);
435 const STRICT_KEYWORD_FINAL
: ast
::Name
= last
!($
( ast
::Name($sk_name
), )*);
436 const RESERVED_KEYWORD_START
: ast
::Name
= first
!($
( ast
::Name($rk_name
), )*);
437 const RESERVED_KEYWORD_FINAL
: ast
::Name
= last
!($
( ast
::Name($rk_name
), )*);
439 pub mod special_idents
{
442 #[allow(non_upper_case_globals)]
443 pub const $si_static
: ast
::Ident
= ast
::Ident
{
444 name
: ast
::Name($si_name
),
450 pub mod special_names
{
453 #[allow(non_upper_case_globals)]
454 pub const $si_static
: ast
::Name
= ast
::Name($si_name
);
458 /// All the valid words that have meaning in the Rust language.
460 /// Rust keywords are either 'strict' or 'reserved'. Strict keywords may not
461 /// appear as identifiers at all. Reserved keywords are not used anywhere in
462 /// the language and may not appear as identifiers.
464 pub use self::Keyword
::*;
467 #[derive(Copy, Clone, PartialEq, Eq)]
474 pub fn to_name(&self) -> ast
::Name
{
476 $
( $sk_variant
=> ast
::Name($sk_name
), )*
477 $
( $rk_variant
=> ast
::Name($rk_name
), )*
483 fn mk_fresh_ident_interner() -> IdentInterner
{
484 // The indices here must correspond to the numbers in
485 // special_idents, in Keyword to_name(), and in static
487 let mut init_vec
= Vec
::new();
488 $
(init_vec
.push($si_str
);)*
489 $
(init_vec
.push($sk_str
);)*
490 $
(init_vec
.push($rk_str
);)*
491 interner
::StrInterner
::prefill(&init_vec
[..])
495 // If the special idents get renumbered, remember to modify these two as appropriate
496 pub const SELF_KEYWORD_NAME
: ast
::Name
= ast
::Name(SELF_KEYWORD_NAME_NUM
);
497 const STATIC_KEYWORD_NAME
: ast
::Name
= ast
::Name(STATIC_KEYWORD_NAME_NUM
);
498 const SUPER_KEYWORD_NAME
: ast
::Name
= ast
::Name(SUPER_KEYWORD_NAME_NUM
);
499 const SELF_TYPE_KEYWORD_NAME
: ast
::Name
= ast
::Name(SELF_TYPE_KEYWORD_NAME_NUM
);
501 pub const SELF_KEYWORD_NAME_NUM
: u32 = 1;
502 const STATIC_KEYWORD_NAME_NUM
: u32 = 2;
503 const SUPER_KEYWORD_NAME_NUM
: u32 = 3;
504 const SELF_TYPE_KEYWORD_NAME_NUM
: u32 = 10;
506 // NB: leaving holes in the ident table is bad! a different ident will get
507 // interned with the id from the hole, but it will be between the min and max
508 // of the reserved words, and thus tagged as "reserved".
510 declare_special_idents_and_keywords
! {
511 pub mod special_idents
{
512 // These ones are statics
514 (super::SELF_KEYWORD_NAME_NUM
, self_
, "self");
515 (super::STATIC_KEYWORD_NAME_NUM
, statik
, "static");
516 (super::SUPER_KEYWORD_NAME_NUM
, super_
, "super");
517 (4, static_lifetime
, "'static");
521 (6, matchers
, "matchers");
523 // outside of libsyntax
524 (7, clownshoe_abi
, "__rust_abi");
525 (8, opaque
, "<opaque>");
526 (9, unnamed_field
, "<unnamed_field>");
527 (super::SELF_TYPE_KEYWORD_NAME_NUM
, type_self
, "Self");
528 (11, prelude_import
, "prelude_import");
532 // These ones are variants of the Keyword enum
536 (13, Break
, "break");
537 (14, Crate
, "crate");
540 (17, Extern
, "extern");
541 (18, False
, "false");
549 (26, Match
, "match");
555 (32, Return
, "return");
556 // Static and Self are also special idents (prefill de-dupes)
557 (super::STATIC_KEYWORD_NAME_NUM
, Static
, "static");
558 (super::SELF_KEYWORD_NAME_NUM
, SelfValue
, "self");
559 (super::SELF_TYPE_KEYWORD_NAME_NUM
, SelfType
, "Self");
560 (33, Struct
, "struct");
561 (super::SUPER_KEYWORD_NAME_NUM
, Super
, "super");
563 (35, Trait
, "trait");
565 (37, Unsafe
, "unsafe");
567 (39, Virtual
, "virtual");
568 (40, While
, "while");
569 (41, Continue
, "continue");
571 (43, Const
, "const");
572 (44, Where
, "where");
575 (46, Alignof
, "alignof");
576 (47, Become
, "become");
577 (48, Offsetof
, "offsetof");
580 (51, Sizeof
, "sizeof");
581 (52, Typeof
, "typeof");
582 (53, Unsized
, "unsized");
583 (54, Yield
, "yield");
585 (56, Abstract
, "abstract");
586 (57, Final
, "final");
587 (58, Override
, "override");
588 (59, Macro
, "macro");
592 // looks like we can get rid of this completely...
593 pub type IdentInterner
= StrInterner
;
595 // if an interner exists in TLS, return it. Otherwise, prepare a
597 // FIXME(eddyb) #8726 This should probably use a thread-local reference.
598 pub fn get_ident_interner() -> Rc
<IdentInterner
> {
599 thread_local
!(static KEY
: Rc
<::parse
::token
::IdentInterner
> = {
600 Rc
::new(mk_fresh_ident_interner())
602 KEY
.with(|k
| k
.clone())
605 /// Reset the ident interner to its initial state.
606 pub fn reset_ident_interner() {
607 let interner
= get_ident_interner();
608 interner
.reset(mk_fresh_ident_interner());
611 /// Represents a string stored in the thread-local interner. Because the
612 /// interner lives for the life of the thread, this can be safely treated as an
613 /// immortal string, as long as it never crosses between threads.
615 /// FIXME(pcwalton): You must be careful about what you do in the destructors
616 /// of objects stored in TLS, because they may run after the interner is
617 /// destroyed. In particular, they must not access string contents. This can
618 /// be fixed in the future by just leaking all strings until thread death
620 #[derive(Clone, PartialEq, Hash, PartialOrd, Eq, Ord)]
621 pub struct InternedString
{
625 impl InternedString
{
627 pub fn new(string
: &'
static str) -> InternedString
{
629 string
: RcStr
::new(string
),
634 fn new_from_rc_str(string
: RcStr
) -> InternedString
{
641 impl Deref
for InternedString
{
644 fn deref(&self) -> &str { &*self.string }
647 impl fmt
::Debug
for InternedString
{
648 fn fmt(&self, f
: &mut fmt
::Formatter
) -> fmt
::Result
{
649 fmt
::Debug
::fmt(&self.string
, f
)
653 impl fmt
::Display
for InternedString
{
654 fn fmt(&self, f
: &mut fmt
::Formatter
) -> fmt
::Result
{
655 fmt
::Display
::fmt(&self.string
, f
)
659 impl<'a
> PartialEq
<&'a
str> for InternedString
{
661 fn eq(&self, other
: & &'a
str) -> bool
{
662 PartialEq
::eq(&self.string
[..], *other
)
665 fn ne(&self, other
: & &'a
str) -> bool
{
666 PartialEq
::ne(&self.string
[..], *other
)
670 impl<'a
> PartialEq
<InternedString
> for &'a
str {
672 fn eq(&self, other
: &InternedString
) -> bool
{
673 PartialEq
::eq(*self, &other
.string
[..])
676 fn ne(&self, other
: &InternedString
) -> bool
{
677 PartialEq
::ne(*self, &other
.string
[..])
681 impl Decodable
for InternedString
{
682 fn decode
<D
: Decoder
>(d
: &mut D
) -> Result
<InternedString
, D
::Error
> {
683 Ok(get_name(get_ident_interner().intern(&try
!(d
.read_str())[..])))
687 impl Encodable
for InternedString
{
688 fn encode
<S
: Encoder
>(&self, s
: &mut S
) -> Result
<(), S
::Error
> {
689 s
.emit_str(&self.string
)
693 /// Returns the string contents of a name, using the thread-local interner.
695 pub fn get_name(name
: ast
::Name
) -> InternedString
{
696 let interner
= get_ident_interner();
697 InternedString
::new_from_rc_str(interner
.get(name
))
700 /// Returns the string contents of an identifier, using the thread-local
703 pub fn get_ident(ident
: ast
::Ident
) -> InternedString
{
707 /// Interns and returns the string contents of an identifier, using the
708 /// thread-local interner.
710 pub fn intern_and_get_ident(s
: &str) -> InternedString
{
714 /// Maps a string to its interned representation.
716 pub fn intern(s
: &str) -> ast
::Name
{
717 get_ident_interner().intern(s
)
720 /// gensym's a new usize, using the current interner.
722 pub fn gensym(s
: &str) -> ast
::Name
{
723 get_ident_interner().gensym(s
)
726 /// Maps a string to an identifier with an empty syntax context.
728 pub fn str_to_ident(s
: &str) -> ast
::Ident
{
729 ast
::Ident
::new(intern(s
))
732 /// Maps a string to a gensym'ed identifier.
734 pub fn gensym_ident(s
: &str) -> ast
::Ident
{
735 ast
::Ident
::new(gensym(s
))
738 // create a fresh name that maps to the same string as the old one.
739 // note that this guarantees that str_ptr_eq(ident_to_string(src),interner_get(fresh_name(src)));
740 // that is, that the new name and the old one are connected to ptr_eq strings.
741 pub fn fresh_name(src
: &ast
::Ident
) -> ast
::Name
{
742 let interner
= get_ident_interner();
743 interner
.gensym_copy(src
.name
)
744 // following: debug version. Could work in final except that it's incompatible with
745 // good error messages and uses of struct names in ambiguous could-be-binding
746 // locations. Also definitely destroys the guarantee given above about ptr_eq.
747 /*let num = rand::thread_rng().gen_uint_range(0,0xffff);
748 gensym(format!("{}_{}",ident_to_string(src),num))*/
751 // create a fresh mark.
752 pub fn fresh_mark() -> ast
::Mrk
{
753 gensym("mark").usize() as u32
762 fn mark_ident(id
: ast
::Ident
, m
: ast
::Mrk
) -> ast
::Ident
{
763 ast
::Ident { name: id.name, ctxt:mtwt::apply_mark(m, id.ctxt) }
766 #[test] fn mtwt_token_eq_test() {
767 assert
!(Gt
.mtwt_eq(&Gt
));
768 let a
= str_to_ident("bac");
769 let a1
= mark_ident(a
,92);
770 assert
!(Ident(a
, ModName
).mtwt_eq(&Ident(a1
, Plain
)));