@@ -101,7 +101,14 @@ struct MatcherTtFrame<'tt> {
101
101
idx : usize ,
102
102
}
103
103
104
- type NamedMatchVec = SmallVec < [ NamedMatch ; 4 ] > ;
104
+ // One element is enough to cover 95-99% of vectors for most benchmarks. Also,
105
+ // vectors longer than one frequently have many elements, not just two or
106
+ // three.
107
+ type NamedMatchVec = SmallVec < [ NamedMatch ; 1 ] > ;
108
+
109
+ // This type is used a lot. Make sure it doesn't unintentionally get bigger.
110
+ #[ cfg( all( target_arch = "x86_64" , target_pointer_width = "64" ) ) ]
111
+ rustc_data_structures:: static_assert_size!( NamedMatchVec , 48 ) ;
105
112
106
113
/// Represents a single "position" (aka "matcher position", aka "item"), as
107
114
/// described in the module documentation.
@@ -153,7 +160,7 @@ struct MatcherPos<'tt> {
153
160
154
161
// This type is used a lot. Make sure it doesn't unintentionally get bigger.
155
162
#[ cfg( all( target_arch = "x86_64" , target_pointer_width = "64" ) ) ]
156
- rustc_data_structures:: static_assert_size!( MatcherPos <' _>, 136 ) ;
163
+ rustc_data_structures:: static_assert_size!( MatcherPos <' _>, 112 ) ;
157
164
158
165
impl < ' tt > MatcherPos < ' tt > {
159
166
/// `len` `Vec`s (initially shared and empty) that will store matches of metavars.
@@ -202,11 +209,7 @@ impl<'tt> MatcherPos<'tt> {
202
209
match_lo : up. match_cur ,
203
210
match_cur : up. match_cur ,
204
211
match_hi : up. match_cur + seq. num_captures ,
205
- repetition : Some ( MatcherPosRepetition {
206
- up,
207
- sep : seq. separator . clone ( ) ,
208
- seq_op : seq. kleene . op ,
209
- } ) ,
212
+ repetition : Some ( MatcherPosRepetition { up, seq } ) ,
210
213
stack : smallvec ! [ ] ,
211
214
}
212
215
}
@@ -220,15 +223,12 @@ impl<'tt> MatcherPos<'tt> {
220
223
221
224
#[ derive( Clone ) ]
222
225
struct MatcherPosRepetition < ' tt > {
223
- /// The KleeneOp of this sequence.
224
- seq_op : mbe:: KleeneOp ,
225
-
226
- /// The separator.
227
- sep : Option < Token > ,
228
-
229
226
/// The "parent" matcher position. That is, the matcher position just before we enter the
230
227
/// sequence.
231
228
up : Box < MatcherPos < ' tt > > ,
229
+
230
+ /// The sequence itself.
231
+ seq : & ' tt SequenceRepetition ,
232
232
}
233
233
234
234
enum EofItems < ' tt > {
@@ -274,22 +274,20 @@ pub(super) fn count_names(ms: &[TokenTree]) -> usize {
274
274
} )
275
275
}
276
276
277
- /// `NamedMatch` is a pattern-match result for a single `token::MATCH_NONTERMINAL`:
278
- /// so it is associated with a single ident in a parse, and all
279
- /// `MatchedNonterminal`s in the `NamedMatch` have the same non-terminal type
280
- /// (expr, item, etc). Each leaf in a single `NamedMatch` corresponds to a
281
- /// single `token::MATCH_NONTERMINAL` in the `TokenTree` that produced it.
277
+ /// `NamedMatch` is a pattern-match result for a single metavar. All
278
+ /// `MatchedNtNonTt`s in the `NamedMatch` have the same non-terminal type
279
+ /// (expr, item, etc).
282
280
///
283
281
/// The in-memory structure of a particular `NamedMatch` represents the match
284
282
/// that occurred when a particular subset of a matcher was applied to a
285
283
/// particular token tree.
286
284
///
287
285
/// The width of each `MatchedSeq` in the `NamedMatch`, and the identity of
288
- /// the `MatchedNonterminal `s, will depend on the token tree it was applied
289
- /// to: each `MatchedSeq` corresponds to a single `TTSeq` in the originating
286
+ /// the `MatchedNtNonTts `s, will depend on the token tree it was applied
287
+ /// to: each `MatchedSeq` corresponds to a single repetition in the originating
290
288
/// token tree. The depth of the `NamedMatch` structure will therefore depend
291
- /// only on the nesting depth of `ast::TTSeq`s in the originating
292
- /// token tree it was derived from.
289
+ /// only on the nesting depth of repetitions in the originating token tree it
290
+ /// was derived from.
293
291
///
294
292
/// In layman's terms: `NamedMatch` will form a tree representing nested matches of a particular
295
293
/// meta variable. For example, if we are matching the following macro against the following
@@ -308,24 +306,32 @@ pub(super) fn count_names(ms: &[TokenTree]) -> usize {
308
306
/// ```rust
309
307
/// MatchedSeq([
310
308
/// MatchedSeq([
311
- /// MatchedNonterminal (a),
312
- /// MatchedNonterminal (b),
313
- /// MatchedNonterminal (c),
314
- /// MatchedNonterminal (d),
309
+ /// MatchedNtNonTt (a),
310
+ /// MatchedNtNonTt (b),
311
+ /// MatchedNtNonTt (c),
312
+ /// MatchedNtNonTt (d),
315
313
/// ]),
316
314
/// MatchedSeq([
317
- /// MatchedNonterminal (a),
318
- /// MatchedNonterminal (b),
319
- /// MatchedNonterminal (c),
320
- /// MatchedNonterminal (d),
321
- /// MatchedNonterminal (e),
315
+ /// MatchedNtNonTt (a),
316
+ /// MatchedNtNonTt (b),
317
+ /// MatchedNtNonTt (c),
318
+ /// MatchedNtNonTt (d),
319
+ /// MatchedNtNonTt (e),
322
320
/// ])
323
321
/// ])
324
322
/// ```
325
323
#[ derive( Debug , Clone ) ]
326
324
crate enum NamedMatch {
327
325
MatchedSeq ( Lrc < NamedMatchVec > ) ,
328
- MatchedNonterminal ( Lrc < Nonterminal > ) ,
326
+
327
+ // This variant should never hold an `NtTT`. `MatchedNtTt` should be used
328
+ // for that case.
329
+ MatchedNtNonTt ( Lrc < Nonterminal > ) ,
330
+
331
+ // `NtTT` is handled without any cloning when transcribing, unlike other
332
+ // nonterminals. Therefore, an `Lrc` isn't helpful and causes unnecessary
333
+ // allocations. Hence this separate variant.
334
+ MatchedNtTt ( rustc_ast:: tokenstream:: TokenTree ) ,
329
335
}
330
336
331
337
/// Takes a slice of token trees `ms` representing a matcher which successfully matched input
@@ -546,14 +552,19 @@ impl<'tt> TtParser<'tt> {
546
552
self . cur_items . push ( new_pos) ;
547
553
}
548
554
549
- if idx == len && repetition. sep . is_some ( ) {
550
- if repetition. sep . as_ref ( ) . map_or ( false , |sep| token_name_eq ( token, sep) ) {
555
+ if idx == len && repetition. seq . separator . is_some ( ) {
556
+ if repetition
557
+ . seq
558
+ . separator
559
+ . as_ref ( )
560
+ . map_or ( false , |sep| token_name_eq ( token, sep) )
561
+ {
551
562
// The matcher has a separator, and it matches the current token. We can
552
563
// advance past the separator token.
553
564
item. idx += 1 ;
554
565
self . next_items . push ( item) ;
555
566
}
556
- } else if repetition. seq_op != mbe:: KleeneOp :: ZeroOrOne {
567
+ } else if repetition. seq . kleene . op != mbe:: KleeneOp :: ZeroOrOne {
557
568
// We don't need a separator. Move the "dot" back to the beginning of the
558
569
// matcher and try to match again UNLESS we are only allowed to have _one_
559
570
// repetition.
@@ -665,7 +676,11 @@ impl<'tt> TtParser<'tt> {
665
676
}
666
677
Ok ( nt) => nt,
667
678
} ;
668
- item. push_match ( match_cur, MatchedNonterminal ( Lrc :: new ( nt) ) ) ;
679
+ let m = match nt {
680
+ Nonterminal :: NtTT ( tt) => MatchedNtTt ( tt) ,
681
+ _ => MatchedNtNonTt ( Lrc :: new ( nt) ) ,
682
+ } ;
683
+ item. push_match ( match_cur, m) ;
669
684
item. idx += 1 ;
670
685
item. match_cur += 1 ;
671
686
} else {
0 commit comments