cranelift_reader/
parser.rs

1//! Parser for .clif files.
2
3use crate::error::{Location, ParseError, ParseResult};
4use crate::isaspec;
5use crate::lexer::{LexError, Lexer, LocatedError, LocatedToken, Token};
6use crate::run_command::{Comparison, Invocation, RunCommand};
7use crate::sourcemap::SourceMap;
8use crate::testcommand::TestCommand;
9use crate::testfile::{Comment, Details, Feature, TestFile};
10use cranelift_codegen::data_value::DataValue;
11use cranelift_codegen::entity::{EntityRef, PrimaryMap};
12use cranelift_codegen::ir::entities::{AnyEntity, DynamicType, MemoryType};
13use cranelift_codegen::ir::immediates::{
14    Ieee16, Ieee32, Ieee64, Ieee128, Imm64, Offset32, Uimm32, Uimm64,
15};
16use cranelift_codegen::ir::instructions::{InstructionData, InstructionFormat, VariableArgs};
17use cranelift_codegen::ir::pcc::{BaseExpr, Expr, Fact};
18use cranelift_codegen::ir::{self, StackSlotKey, UserExternalNameRef};
19use cranelift_codegen::ir::{DebugTag, types::*};
20
21use cranelift_codegen::ir::{
22    AbiParam, ArgumentExtension, ArgumentPurpose, Block, BlockArg, Constant, ConstantData,
23    DynamicStackSlot, DynamicStackSlotData, DynamicTypeData, ExtFuncData, ExternalName, FuncRef,
24    Function, GlobalValue, GlobalValueData, JumpTableData, MemFlags, MemoryTypeData,
25    MemoryTypeField, Opcode, SigRef, Signature, StackSlot, StackSlotData, StackSlotKind,
26    UserFuncName, Value, types,
27};
28use cranelift_codegen::isa::{self, CallConv};
29use cranelift_codegen::packed_option::ReservedValue;
30use cranelift_codegen::{settings, settings::Configurable, timing};
31use smallvec::SmallVec;
32use std::mem;
33use std::str::FromStr;
34use std::{u16, u32};
35use target_lexicon::Triple;
36
37macro_rules! match_imm {
38    ($signed:ty, $unsigned:ty, $parser:expr, $err_msg:expr) => {{
39        if let Some(Token::Integer(text)) = $parser.token() {
40            $parser.consume();
41            let negative = text.starts_with('-');
42            let positive = text.starts_with('+');
43            let text = if negative || positive {
44                // Strip sign prefix.
45                &text[1..]
46            } else {
47                text
48            };
49
50            // Parse the text value; the lexer gives us raw text that looks like an integer.
51            let value = if text.starts_with("0x") {
52                // Skip underscores.
53                let text = text.replace("_", "");
54                // Parse it in hexadecimal form.
55                <$unsigned>::from_str_radix(&text[2..], 16).map_err(|_| {
56                    $parser.error(&format!(
57                        "unable to parse '{}' value as a hexadecimal {} immediate",
58                        &text[2..],
59                        stringify!($unsigned),
60                    ))
61                })?
62            } else {
63                // Parse it as a signed type to check for overflow and other issues.
64                text.parse()
65                    .map_err(|_| $parser.error("expected decimal immediate"))?
66            };
67
68            // Apply sign if necessary.
69            let signed = if negative {
70                let value = value.wrapping_neg() as $signed;
71                if value > 0 {
72                    return Err($parser.error("negative number too small"));
73                }
74                value
75            } else {
76                value as $signed
77            };
78
79            Ok(signed)
80        } else {
81            err!($parser.loc, $err_msg)
82        }
83    }};
84}
85
86/// After some quick benchmarks a program should never have more than 100,000 blocks.
87const MAX_BLOCKS_IN_A_FUNCTION: u32 = 100_000;
88
89/// Parse the entire `text` into a list of functions.
90///
91/// Any test commands or target declarations are ignored.
92pub fn parse_functions(text: &str) -> ParseResult<Vec<Function>> {
93    let _tt = timing::parse_text();
94    parse_test(text, ParseOptions::default())
95        .map(|file| file.functions.into_iter().map(|(func, _)| func).collect())
96}
97
98/// Options for configuring the parsing of filetests.
99pub struct ParseOptions<'a> {
100    /// Compiler passes to run on the parsed functions.
101    pub passes: Option<&'a [String]>,
102    /// Target ISA for compiling the parsed functions, e.g. "x86_64 skylake".
103    pub target: Option<&'a str>,
104    /// Default calling convention used when none is specified for a parsed function.
105    pub default_calling_convention: CallConv,
106    /// Default for unwind-info setting (enabled or disabled).
107    pub unwind_info: bool,
108    /// Default for machine_code_cfg_info setting (enabled or disabled).
109    pub machine_code_cfg_info: bool,
110}
111
112impl Default for ParseOptions<'_> {
113    fn default() -> Self {
114        Self {
115            passes: None,
116            target: None,
117            default_calling_convention: CallConv::Fast,
118            unwind_info: false,
119            machine_code_cfg_info: false,
120        }
121    }
122}
123
124/// Parse the entire `text` as a test case file.
125///
126/// The returned `TestFile` contains direct references to substrings of `text`.
127pub fn parse_test<'a>(text: &'a str, options: ParseOptions<'a>) -> ParseResult<TestFile<'a>> {
128    let _tt = timing::parse_text();
129    let mut parser = Parser::new(text);
130
131    // Gather the preamble comments.
132    parser.start_gathering_comments();
133
134    let isa_spec: isaspec::IsaSpec;
135    let commands: Vec<TestCommand<'a>>;
136
137    // Check for specified passes and target, if present throw out test commands/targets specified
138    // in file.
139    match options.passes {
140        Some(pass_vec) => {
141            parser.parse_test_commands();
142            commands = parser.parse_cmdline_passes(pass_vec);
143            parser.parse_target_specs(&options)?;
144            isa_spec = parser.parse_cmdline_target(options.target)?;
145        }
146        None => {
147            commands = parser.parse_test_commands();
148            isa_spec = parser.parse_target_specs(&options)?;
149        }
150    };
151    let features = parser.parse_cranelift_features()?;
152
153    // Decide between using the calling convention passed in the options or using the
154    // host's calling convention--if any tests are to be run on the host we should default to the
155    // host's calling convention.
156    parser = if commands.iter().any(|tc| tc.command == "run") {
157        let host_default_calling_convention = CallConv::triple_default(&Triple::host());
158        parser.with_default_calling_convention(host_default_calling_convention)
159    } else {
160        parser.with_default_calling_convention(options.default_calling_convention)
161    };
162
163    parser.token();
164    parser.claim_gathered_comments(AnyEntity::Function);
165
166    let preamble_comments = parser.take_comments();
167    let functions = parser.parse_function_list()?;
168
169    Ok(TestFile {
170        commands,
171        isa_spec,
172        features,
173        preamble_comments,
174        functions,
175    })
176}
177
178/// Parse a CLIF comment `text` as a run command.
179///
180/// Return:
181///  - `Ok(None)` if the comment is not intended to be a `RunCommand` (i.e. does not start with `run`
182///    or `print`
183///  - `Ok(Some(command))` if the comment is intended as a `RunCommand` and can be parsed to one
184///  - `Err` otherwise.
185pub fn parse_run_command(text: &str, signature: &Signature) -> ParseResult<Option<RunCommand>> {
186    let _tt = timing::parse_text();
187    // We remove leading spaces and semi-colons for convenience here instead of at the call sites
188    // since this function will be attempting to parse a RunCommand from a CLIF comment.
189    let trimmed_text = text.trim_start_matches(|c| c == ' ' || c == ';');
190    let mut parser = Parser::new(trimmed_text);
191    match parser.token() {
192        Some(Token::Identifier("run")) | Some(Token::Identifier("print")) => {
193            parser.parse_run_command(signature).map(|c| Some(c))
194        }
195        Some(_) | None => Ok(None),
196    }
197}
198
199pub struct Parser<'a> {
200    lex: Lexer<'a>,
201
202    lex_error: Option<LexError>,
203
204    /// Current lookahead token.
205    lookahead: Option<Token<'a>>,
206
207    /// Location of lookahead.
208    loc: Location,
209
210    /// Are we gathering any comments that we encounter?
211    gathering_comments: bool,
212
213    /// The gathered comments; claim them with `claim_gathered_comments`.
214    gathered_comments: Vec<&'a str>,
215
216    /// Comments collected so far.
217    comments: Vec<Comment<'a>>,
218
219    /// Maps inlined external names to a ref value, so they can be declared before parsing the rest
220    /// of the function later.
221    ///
222    /// This maintains backward compatibility with previous ways for declaring external names.
223    predeclared_external_names: PrimaryMap<UserExternalNameRef, ir::UserExternalName>,
224
225    /// Default calling conventions; used when none is specified.
226    default_calling_convention: CallConv,
227}
228
229/// Context for resolving references when parsing a single function.
230struct Context {
231    function: Function,
232    map: SourceMap,
233
234    /// Aliases to resolve once value definitions are known.
235    aliases: Vec<Value>,
236}
237
238impl Context {
239    fn new(f: Function) -> Self {
240        Self {
241            function: f,
242            map: SourceMap::new(),
243            aliases: Vec::new(),
244        }
245    }
246
247    // Allocate a new stack slot.
248    fn add_ss(&mut self, ss: StackSlot, data: StackSlotData, loc: Location) -> ParseResult<()> {
249        self.map.def_ss(ss, loc)?;
250        while self.function.sized_stack_slots.next_key().index() <= ss.index() {
251            self.function.create_sized_stack_slot(StackSlotData::new(
252                StackSlotKind::ExplicitSlot,
253                0,
254                0,
255            ));
256        }
257        self.function.sized_stack_slots[ss] = data;
258        Ok(())
259    }
260
261    // Resolve a reference to a stack slot.
262    fn check_ss(&self, ss: StackSlot, loc: Location) -> ParseResult<()> {
263        if !self.map.contains_ss(ss) {
264            err!(loc, "undefined stack slot {}", ss)
265        } else {
266            Ok(())
267        }
268    }
269
270    // Allocate a new stack slot.
271    fn add_dss(
272        &mut self,
273        ss: DynamicStackSlot,
274        data: DynamicStackSlotData,
275        loc: Location,
276    ) -> ParseResult<()> {
277        self.map.def_dss(ss, loc)?;
278        while self.function.dynamic_stack_slots.next_key().index() <= ss.index() {
279            self.function
280                .create_dynamic_stack_slot(DynamicStackSlotData::new(
281                    StackSlotKind::ExplicitDynamicSlot,
282                    data.dyn_ty,
283                ));
284        }
285        self.function.dynamic_stack_slots[ss] = data;
286        Ok(())
287    }
288
289    // Resolve a reference to a dynamic stack slot.
290    fn check_dss(&self, dss: DynamicStackSlot, loc: Location) -> ParseResult<()> {
291        if !self.map.contains_dss(dss) {
292            err!(loc, "undefined dynamic stack slot {}", dss)
293        } else {
294            Ok(())
295        }
296    }
297
298    // Allocate a new dynamic type.
299    fn add_dt(&mut self, dt: DynamicType, data: DynamicTypeData, loc: Location) -> ParseResult<()> {
300        self.map.def_dt(dt, loc)?;
301        while self.function.dfg.dynamic_types.next_key().index() <= dt.index() {
302            self.function.dfg.make_dynamic_ty(DynamicTypeData::new(
303                data.base_vector_ty,
304                data.dynamic_scale,
305            ));
306        }
307        self.function.dfg.dynamic_types[dt] = data;
308        Ok(())
309    }
310
311    // Allocate a global value slot.
312    fn add_gv(
313        &mut self,
314        gv: GlobalValue,
315        data: GlobalValueData,
316        maybe_fact: Option<Fact>,
317        loc: Location,
318    ) -> ParseResult<()> {
319        self.map.def_gv(gv, loc)?;
320        while self.function.global_values.next_key().index() <= gv.index() {
321            self.function.create_global_value(GlobalValueData::Symbol {
322                name: ExternalName::testcase(""),
323                offset: Imm64::new(0),
324                colocated: false,
325                tls: false,
326            });
327        }
328        self.function.global_values[gv] = data;
329        if let Some(fact) = maybe_fact {
330            self.function.global_value_facts[gv] = Some(fact);
331        }
332        Ok(())
333    }
334
335    // Allocate a memory-type slot.
336    fn add_mt(&mut self, mt: MemoryType, data: MemoryTypeData, loc: Location) -> ParseResult<()> {
337        self.map.def_mt(mt, loc)?;
338        while self.function.memory_types.next_key().index() <= mt.index() {
339            self.function.create_memory_type(MemoryTypeData::default());
340        }
341        self.function.memory_types[mt] = data;
342        Ok(())
343    }
344
345    // Resolve a reference to a global value.
346    fn check_gv(&self, gv: GlobalValue, loc: Location) -> ParseResult<()> {
347        if !self.map.contains_gv(gv) {
348            err!(loc, "undefined global value {}", gv)
349        } else {
350            Ok(())
351        }
352    }
353
354    // Allocate a new signature.
355    fn add_sig(
356        &mut self,
357        sig: SigRef,
358        data: Signature,
359        loc: Location,
360        defaultcc: CallConv,
361    ) -> ParseResult<()> {
362        self.map.def_sig(sig, loc)?;
363        while self.function.dfg.signatures.next_key().index() <= sig.index() {
364            self.function.import_signature(Signature::new(defaultcc));
365        }
366        self.function.dfg.signatures[sig] = data;
367        Ok(())
368    }
369
370    // Resolve a reference to a signature.
371    fn check_sig(&self, sig: SigRef, loc: Location) -> ParseResult<()> {
372        if !self.map.contains_sig(sig) {
373            err!(loc, "undefined signature {}", sig)
374        } else {
375            Ok(())
376        }
377    }
378
379    // Allocate a new external function.
380    fn add_fn(&mut self, fn_: FuncRef, data: ExtFuncData, loc: Location) -> ParseResult<()> {
381        self.map.def_fn(fn_, loc)?;
382        while self.function.dfg.ext_funcs.next_key().index() <= fn_.index() {
383            self.function.import_function(ExtFuncData {
384                name: ExternalName::testcase(""),
385                signature: SigRef::reserved_value(),
386                colocated: false,
387                patchable: false,
388            });
389        }
390        self.function.dfg.ext_funcs[fn_] = data;
391        Ok(())
392    }
393
394    // Resolve a reference to a function.
395    fn check_fn(&self, fn_: FuncRef, loc: Location) -> ParseResult<()> {
396        if !self.map.contains_fn(fn_) {
397            err!(loc, "undefined function {}", fn_)
398        } else {
399            Ok(())
400        }
401    }
402
403    // Allocate a new constant.
404    fn add_constant(
405        &mut self,
406        constant: Constant,
407        data: ConstantData,
408        loc: Location,
409    ) -> ParseResult<()> {
410        self.map.def_constant(constant, loc)?;
411        self.function.dfg.constants.set(constant, data);
412        Ok(())
413    }
414
415    // Configure the stack limit of the current function.
416    fn add_stack_limit(&mut self, limit: GlobalValue, loc: Location) -> ParseResult<()> {
417        if self.function.stack_limit.is_some() {
418            return err!(loc, "stack limit defined twice");
419        }
420        self.function.stack_limit = Some(limit);
421        Ok(())
422    }
423
424    // Resolve a reference to a constant.
425    fn check_constant(&self, c: Constant, loc: Location) -> ParseResult<()> {
426        if !self.map.contains_constant(c) {
427            err!(loc, "undefined constant {}", c)
428        } else {
429            Ok(())
430        }
431    }
432
433    // Allocate a new block.
434    fn add_block(&mut self, block: Block, loc: Location) -> ParseResult<Block> {
435        self.map.def_block(block, loc)?;
436        while self.function.dfg.num_blocks() <= block.index() {
437            self.function.dfg.make_block();
438        }
439        self.function.layout.append_block(block);
440        Ok(block)
441    }
442
443    /// Set a block as cold.
444    fn set_cold_block(&mut self, block: Block) {
445        self.function.layout.set_cold(block);
446    }
447}
448
449impl<'a> Parser<'a> {
450    /// Create a new `Parser` which reads `text`. The referenced text must outlive the parser.
451    pub fn new(text: &'a str) -> Self {
452        Self {
453            lex: Lexer::new(text),
454            lex_error: None,
455            lookahead: None,
456            loc: Location { line_number: 0 },
457            gathering_comments: false,
458            gathered_comments: Vec::new(),
459            comments: Vec::new(),
460            default_calling_convention: CallConv::Fast,
461            predeclared_external_names: Default::default(),
462        }
463    }
464
465    /// Modify the default calling convention; returns a new parser with the changed calling
466    /// convention.
467    pub fn with_default_calling_convention(self, default_calling_convention: CallConv) -> Self {
468        Self {
469            default_calling_convention,
470            ..self
471        }
472    }
473
474    // Consume the current lookahead token and return it.
475    fn consume(&mut self) -> Token<'a> {
476        self.lookahead.take().expect("No token to consume")
477    }
478
479    // Consume the whole line following the current lookahead token.
480    // Return the text of the line tail.
481    fn consume_line(&mut self) -> &'a str {
482        let rest = self.lex.rest_of_line();
483        self.consume();
484        rest
485    }
486
487    // Get the current lookahead token, after making sure there is one.
488    fn token(&mut self) -> Option<Token<'a>> {
489        while self.lookahead.is_none() {
490            match self.lex.next() {
491                Some(Ok(LocatedToken { token, location })) => {
492                    match token {
493                        Token::Comment(text) => {
494                            if self.gathering_comments {
495                                self.gathered_comments.push(text);
496                            }
497                        }
498                        _ => self.lookahead = Some(token),
499                    }
500                    self.loc = location;
501                }
502                Some(Err(LocatedError { error, location })) => {
503                    self.lex_error = Some(error);
504                    self.loc = location;
505                    break;
506                }
507                None => break,
508            }
509        }
510        self.lookahead
511    }
512
513    // Enable gathering of all comments encountered.
514    fn start_gathering_comments(&mut self) {
515        debug_assert!(!self.gathering_comments);
516        self.gathering_comments = true;
517        debug_assert!(self.gathered_comments.is_empty());
518    }
519
520    // Claim the comments gathered up to the current position for the
521    // given entity.
522    fn claim_gathered_comments<E: Into<AnyEntity>>(&mut self, entity: E) {
523        debug_assert!(self.gathering_comments);
524        let entity = entity.into();
525        self.comments.extend(
526            self.gathered_comments
527                .drain(..)
528                .map(|text| Comment { entity, text }),
529        );
530        self.gathering_comments = false;
531    }
532
533    // Get the comments collected so far, clearing out the internal list.
534    fn take_comments(&mut self) -> Vec<Comment<'a>> {
535        debug_assert!(!self.gathering_comments);
536        mem::replace(&mut self.comments, Vec::new())
537    }
538
539    // Match and consume a token without payload.
540    fn match_token(&mut self, want: Token<'a>, err_msg: &str) -> ParseResult<Token<'a>> {
541        if self.token() == Some(want) {
542            Ok(self.consume())
543        } else {
544            err!(self.loc, err_msg)
545        }
546    }
547
548    // If the next token is a `want`, consume it, otherwise do nothing.
549    fn optional(&mut self, want: Token<'a>) -> bool {
550        if self.token() == Some(want) {
551            self.consume();
552            true
553        } else {
554            false
555        }
556    }
557
558    // Match and consume a specific identifier string.
559    // Used for pseudo-keywords like "stack_slot" that only appear in certain contexts.
560    fn match_identifier(&mut self, want: &'static str, err_msg: &str) -> ParseResult<Token<'a>> {
561        if self.token() == Some(Token::Identifier(want)) {
562            Ok(self.consume())
563        } else {
564            err!(self.loc, err_msg)
565        }
566    }
567
568    // Match and consume a type.
569    fn match_type(&mut self, err_msg: &str) -> ParseResult<Type> {
570        if let Some(Token::Type(t)) = self.token() {
571            self.consume();
572            Ok(t)
573        } else {
574            err!(self.loc, err_msg)
575        }
576    }
577
578    // Match and consume a stack slot reference.
579    fn match_ss(&mut self, err_msg: &str) -> ParseResult<StackSlot> {
580        if let Some(Token::StackSlot(ss)) = self.token() {
581            self.consume();
582            if let Some(ss) = StackSlot::with_number(ss) {
583                return Ok(ss);
584            }
585        }
586        err!(self.loc, err_msg)
587    }
588
589    // Match and consume a dynamic stack slot reference.
590    fn match_dss(&mut self, err_msg: &str) -> ParseResult<DynamicStackSlot> {
591        if let Some(Token::DynamicStackSlot(ss)) = self.token() {
592            self.consume();
593            if let Some(ss) = DynamicStackSlot::with_number(ss) {
594                return Ok(ss);
595            }
596        }
597        err!(self.loc, err_msg)
598    }
599
600    // Match and consume a dynamic type reference.
601    fn match_dt(&mut self, err_msg: &str) -> ParseResult<DynamicType> {
602        if let Some(Token::DynamicType(dt)) = self.token() {
603            self.consume();
604            if let Some(dt) = DynamicType::with_number(dt) {
605                return Ok(dt);
606            }
607        }
608        err!(self.loc, err_msg)
609    }
610
611    // Extract Type from DynamicType
612    fn concrete_from_dt(&mut self, dt: DynamicType, ctx: &mut Context) -> Option<Type> {
613        ctx.function.get_concrete_dynamic_ty(dt)
614    }
615
616    // Match and consume a global value reference.
617    fn match_gv(&mut self, err_msg: &str) -> ParseResult<GlobalValue> {
618        if let Some(Token::GlobalValue(gv)) = self.token() {
619            self.consume();
620            if let Some(gv) = GlobalValue::with_number(gv) {
621                return Ok(gv);
622            }
623        }
624        err!(self.loc, err_msg)
625    }
626
627    // Match and consume a function reference.
628    fn match_fn(&mut self, err_msg: &str) -> ParseResult<FuncRef> {
629        if let Some(Token::FuncRef(fnref)) = self.token() {
630            self.consume();
631            if let Some(fnref) = FuncRef::with_number(fnref) {
632                return Ok(fnref);
633            }
634        }
635        err!(self.loc, err_msg)
636    }
637
638    // Match and consume a signature reference.
639    fn match_sig(&mut self, err_msg: &str) -> ParseResult<SigRef> {
640        if let Some(Token::SigRef(sigref)) = self.token() {
641            self.consume();
642            if let Some(sigref) = SigRef::with_number(sigref) {
643                return Ok(sigref);
644            }
645        }
646        err!(self.loc, err_msg)
647    }
648
649    // Match and consume a memory-type reference.
650    fn match_mt(&mut self, err_msg: &str) -> ParseResult<MemoryType> {
651        if let Some(Token::MemoryType(mt)) = self.token() {
652            self.consume();
653            if let Some(mt) = MemoryType::with_number(mt) {
654                return Ok(mt);
655            }
656        }
657        err!(self.loc, err_msg)
658    }
659
660    // Match and consume a constant reference.
661    fn match_constant(&mut self) -> ParseResult<Constant> {
662        if let Some(Token::Constant(c)) = self.token() {
663            self.consume();
664            if let Some(c) = Constant::with_number(c) {
665                return Ok(c);
666            }
667        }
668        err!(self.loc, "expected constant number: const«n»")
669    }
670
671    // Match and consume a stack limit token
672    fn match_stack_limit(&mut self) -> ParseResult<()> {
673        if let Some(Token::Identifier("stack_limit")) = self.token() {
674            self.consume();
675            return Ok(());
676        }
677        err!(self.loc, "expected identifier: stack_limit")
678    }
679
680    // Match and consume a block reference.
681    fn match_block(&mut self, err_msg: &str) -> ParseResult<Block> {
682        if let Some(Token::Block(block)) = self.token() {
683            self.consume();
684            Ok(block)
685        } else {
686            err!(self.loc, err_msg)
687        }
688    }
689
690    // Match and consume a value reference.
691    fn match_value(&mut self, err_msg: &str) -> ParseResult<Value> {
692        if let Some(Token::Value(v)) = self.token() {
693            self.consume();
694            Ok(v)
695        } else {
696            err!(self.loc, err_msg)
697        }
698    }
699
700    fn error(&self, message: &str) -> ParseError {
701        ParseError {
702            location: self.loc,
703            message: message.to_string(),
704            is_warning: false,
705        }
706    }
707
708    // Match and consume an Imm64 immediate.
709    fn match_imm64(&mut self, err_msg: &str) -> ParseResult<Imm64> {
710        if let Some(Token::Integer(text)) = self.token() {
711            self.consume();
712            // Lexer just gives us raw text that looks like an integer.
713            // Parse it as an Imm64 to check for overflow and other issues.
714            text.parse().map_err(|e| self.error(e))
715        } else {
716            err!(self.loc, err_msg)
717        }
718    }
719
720    // Match and consume a hexadeximal immediate
721    fn match_hexadecimal_constant(&mut self, err_msg: &str) -> ParseResult<ConstantData> {
722        if let Some(Token::Integer(text)) = self.token() {
723            self.consume();
724            text.parse().map_err(|e| {
725                self.error(&format!(
726                    "expected hexadecimal immediate, failed to parse: {e}"
727                ))
728            })
729        } else {
730            err!(self.loc, err_msg)
731        }
732    }
733
734    // Match and consume either a hexadecimal Uimm128 immediate (e.g. 0x000102...) or its literal
735    // list form (e.g. [0 1 2...]). For convenience, since uimm128 values are stored in the
736    // `ConstantPool`, this returns `ConstantData`.
737    fn match_uimm128(&mut self, controlling_type: Type) -> ParseResult<ConstantData> {
738        let expected_size = controlling_type.bytes() as usize;
739        let constant_data = if self.optional(Token::LBracket) {
740            // parse using a list of values, e.g. vconst.i32x4 [0 1 2 3]
741            let uimm128 = self.parse_literals_to_constant_data(controlling_type)?;
742            self.match_token(Token::RBracket, "expected a terminating right bracket")?;
743            uimm128
744        } else {
745            // parse using a hexadecimal value, e.g. 0x000102...
746            let uimm128 =
747                self.match_hexadecimal_constant("expected an immediate hexadecimal operand")?;
748            uimm128.expand_to(expected_size)
749        };
750
751        if constant_data.len() == expected_size {
752            Ok(constant_data)
753        } else {
754            Err(self.error(&format!(
755                "expected parsed constant to have {expected_size} bytes"
756            )))
757        }
758    }
759
760    // Match and consume a Uimm64 immediate.
761    fn match_uimm64(&mut self, err_msg: &str) -> ParseResult<Uimm64> {
762        if let Some(Token::Integer(text)) = self.token() {
763            self.consume();
764            // Lexer just gives us raw text that looks like an integer.
765            // Parse it as an Uimm64 to check for overflow and other issues.
766            text.parse()
767                .map_err(|_| self.error("expected u64 decimal immediate"))
768        } else {
769            err!(self.loc, err_msg)
770        }
771    }
772
773    // Match and consume a Uimm32 immediate.
774    fn match_uimm32(&mut self, err_msg: &str) -> ParseResult<Uimm32> {
775        if let Some(Token::Integer(text)) = self.token() {
776            self.consume();
777            // Lexer just gives us raw text that looks like an integer.
778            // Parse it as an Uimm32 to check for overflow and other issues.
779            text.parse().map_err(|e| self.error(e))
780        } else {
781            err!(self.loc, err_msg)
782        }
783    }
784
785    // Match and consume a u8 immediate.
786    // This is used for lane numbers in SIMD vectors.
787    fn match_uimm8(&mut self, err_msg: &str) -> ParseResult<u8> {
788        if let Some(Token::Integer(text)) = self.token() {
789            self.consume();
790            // Lexer just gives us raw text that looks like an integer.
791            if let Some(num) = text.strip_prefix("0x") {
792                // Parse it as a u8 in hexadecimal form.
793                u8::from_str_radix(num, 16)
794                    .map_err(|_| self.error("unable to parse u8 as a hexadecimal immediate"))
795            } else {
796                // Parse it as a u8 to check for overflow and other issues.
797                text.parse()
798                    .map_err(|_| self.error("expected u8 decimal immediate"))
799            }
800        } else {
801            err!(self.loc, err_msg)
802        }
803    }
804
805    // Match and consume an i8 immediate.
806    fn match_imm8(&mut self, err_msg: &str) -> ParseResult<i8> {
807        match_imm!(i8, u8, self, err_msg)
808    }
809
810    // Match and consume a signed 16-bit immediate.
811    fn match_imm16(&mut self, err_msg: &str) -> ParseResult<i16> {
812        match_imm!(i16, u16, self, err_msg)
813    }
814
815    // Match and consume an i32 immediate.
816    // This is used for stack argument byte offsets.
817    fn match_imm32(&mut self, err_msg: &str) -> ParseResult<i32> {
818        match_imm!(i32, u32, self, err_msg)
819    }
820
821    // Match and consume an i128 immediate.
822    fn match_imm128(&mut self, err_msg: &str) -> ParseResult<i128> {
823        match_imm!(i128, u128, self, err_msg)
824    }
825
826    // Match and consume an optional offset32 immediate.
827    //
828    // Note that this will match an empty string as an empty offset, and that if an offset is
829    // present, it must contain a sign.
830    fn optional_offset32(&mut self) -> ParseResult<Offset32> {
831        if let Some(Token::Integer(text)) = self.token() {
832            if text.starts_with('+') || text.starts_with('-') {
833                self.consume();
834                // Lexer just gives us raw text that looks like an integer.
835                // Parse it as an `Offset32` to check for overflow and other issues.
836                return text.parse().map_err(|e| self.error(e));
837            }
838        }
839        // An offset32 operand can be absent.
840        Ok(Offset32::new(0))
841    }
842
843    // Match and consume an optional offset32 immediate.
844    //
845    // Note that this will match an empty string as an empty offset, and that if an offset is
846    // present, it must contain a sign.
847    fn optional_offset_imm64(&mut self) -> ParseResult<Imm64> {
848        if let Some(Token::Integer(text)) = self.token() {
849            if text.starts_with('+') || text.starts_with('-') {
850                self.consume();
851                // Lexer just gives us raw text that looks like an integer.
852                // Parse it as an `Offset32` to check for overflow and other issues.
853                return text.parse().map_err(|e| self.error(e));
854            }
855        }
856        // If no explicit offset is present, the offset is 0.
857        Ok(Imm64::new(0))
858    }
859
860    // Match and consume an Ieee16 immediate.
861    fn match_ieee16(&mut self, err_msg: &str) -> ParseResult<Ieee16> {
862        if let Some(Token::Float(text)) = self.token() {
863            self.consume();
864            // Lexer just gives us raw text that looks like a float.
865            // Parse it as an Ieee16 to check for the right number of digits and other issues.
866            text.parse().map_err(|e| self.error(e))
867        } else {
868            err!(self.loc, err_msg)
869        }
870    }
871
872    // Match and consume an Ieee32 immediate.
873    fn match_ieee32(&mut self, err_msg: &str) -> ParseResult<Ieee32> {
874        if let Some(Token::Float(text)) = self.token() {
875            self.consume();
876            // Lexer just gives us raw text that looks like a float.
877            // Parse it as an Ieee32 to check for the right number of digits and other issues.
878            text.parse().map_err(|e| self.error(e))
879        } else {
880            err!(self.loc, err_msg)
881        }
882    }
883
884    // Match and consume an Ieee64 immediate.
885    fn match_ieee64(&mut self, err_msg: &str) -> ParseResult<Ieee64> {
886        if let Some(Token::Float(text)) = self.token() {
887            self.consume();
888            // Lexer just gives us raw text that looks like a float.
889            // Parse it as an Ieee64 to check for the right number of digits and other issues.
890            text.parse().map_err(|e| self.error(e))
891        } else {
892            err!(self.loc, err_msg)
893        }
894    }
895
896    // Match and consume an Ieee128 immediate.
897    fn match_ieee128(&mut self, err_msg: &str) -> ParseResult<Ieee128> {
898        if let Some(Token::Float(text)) = self.token() {
899            self.consume();
900            // Lexer just gives us raw text that looks like a float.
901            // Parse it as an Ieee128 to check for the right number of digits and other issues.
902            text.parse().map_err(|e| self.error(e))
903        } else {
904            err!(self.loc, err_msg)
905        }
906    }
907
908    // Match and consume an enumerated immediate, like one of the condition codes.
909    fn match_enum<T: FromStr>(&mut self, err_msg: &str) -> ParseResult<T> {
910        if let Some(Token::Identifier(text)) = self.token() {
911            self.consume();
912            text.parse().map_err(|_| self.error(err_msg))
913        } else {
914            err!(self.loc, err_msg)
915        }
916    }
917
918    // Match and a consume a possibly empty sequence of memory operation flags.
919    fn optional_memflags(&mut self) -> ParseResult<MemFlags> {
920        let mut flags = MemFlags::new();
921        while let Some(Token::Identifier(text)) = self.token() {
922            match flags.set_by_name(text) {
923                Ok(true) => {
924                    self.consume();
925                }
926                Ok(false) => break,
927                Err(msg) => return err!(self.loc, msg),
928            }
929        }
930        Ok(flags)
931    }
932
933    // Match and consume an identifier.
934    fn match_any_identifier(&mut self, err_msg: &str) -> ParseResult<&'a str> {
935        if let Some(Token::Identifier(text)) = self.token() {
936            self.consume();
937            Ok(text)
938        } else {
939            err!(self.loc, err_msg)
940        }
941    }
942
943    /// Parse an optional source location.
944    ///
945    /// Return an optional source location if no real location is present.
946    fn optional_srcloc(&mut self) -> ParseResult<ir::SourceLoc> {
947        if let Some(Token::SourceLoc(text)) = self.token() {
948            match u32::from_str_radix(text, 16) {
949                Ok(num) => {
950                    self.consume();
951                    Ok(ir::SourceLoc::new(num))
952                }
953                Err(_) => return err!(self.loc, "invalid source location: {}", text),
954            }
955        } else {
956            Ok(Default::default())
957        }
958    }
959
960    /// Parse an optional list of debug tags.
961    fn optional_debug_tags(&mut self) -> ParseResult<Vec<DebugTag>> {
962        if self.optional(Token::LAngle) {
963            let mut tags = vec![];
964            while !self.optional(Token::RAngle) {
965                match self.token() {
966                    Some(Token::Integer(_)) => {
967                        let value: u32 = self.match_uimm32("expected a u32 value")?.into();
968                        tags.push(DebugTag::User(value));
969                    }
970                    Some(Token::StackSlot(slot)) => {
971                        self.consume();
972                        tags.push(DebugTag::StackSlot(StackSlot::from_u32(slot)));
973                    }
974                    _ => {
975                        return err!(
976                            self.loc,
977                            "expected integer user value or stack slot in debug tags"
978                        );
979                    }
980                }
981                if !self.optional(Token::Comma) {
982                    self.match_token(Token::RAngle, "expected `,` or `>`")?;
983                    break;
984                }
985            }
986            Ok(tags)
987        } else {
988            Ok(vec![])
989        }
990    }
991
992    /// Parse a list of literals (i.e. integers, floats, booleans); e.g. `0 1 2 3`, usually as
993    /// part of something like `vconst.i32x4 [0 1 2 3]`.
994    fn parse_literals_to_constant_data(&mut self, ty: Type) -> ParseResult<ConstantData> {
995        macro_rules! consume {
996            ( $ty:ident, $match_fn:expr ) => {{
997                assert!($ty.is_vector());
998                let mut data = ConstantData::default();
999                for _ in 0..$ty.lane_count() {
1000                    data = data.append($match_fn);
1001                }
1002                data
1003            }};
1004        }
1005
1006        if !ty.is_vector() && !ty.is_dynamic_vector() {
1007            err!(self.loc, "Expected a controlling vector type, not {}", ty)
1008        } else {
1009            let constant_data = match ty.lane_type() {
1010                I8 => consume!(ty, self.match_imm8("Expected an 8-bit integer")?),
1011                I16 => consume!(ty, self.match_imm16("Expected a 16-bit integer")?),
1012                I32 => consume!(ty, self.match_imm32("Expected a 32-bit integer")?),
1013                I64 => consume!(ty, self.match_imm64("Expected a 64-bit integer")?),
1014                F32 => consume!(ty, self.match_ieee32("Expected a 32-bit float")?),
1015                F64 => consume!(ty, self.match_ieee64("Expected a 64-bit float")?),
1016                _ => return err!(self.loc, "Expected a type of: float, int, bool"),
1017            };
1018            Ok(constant_data)
1019        }
1020    }
1021
1022    /// Parse a list of test command passes specified in command line.
1023    pub fn parse_cmdline_passes(&mut self, passes: &'a [String]) -> Vec<TestCommand<'a>> {
1024        let mut list = Vec::new();
1025        for pass in passes {
1026            list.push(TestCommand::new(pass));
1027        }
1028        list
1029    }
1030
1031    /// Parse a list of test commands.
1032    pub fn parse_test_commands(&mut self) -> Vec<TestCommand<'a>> {
1033        let mut list = Vec::new();
1034        while self.token() == Some(Token::Identifier("test")) {
1035            list.push(TestCommand::new(self.consume_line()));
1036        }
1037        list
1038    }
1039
1040    /// Parse a target spec.
1041    ///
1042    /// Accept the target from the command line for pass command.
1043    ///
1044    fn parse_cmdline_target(&mut self, target_pass: Option<&str>) -> ParseResult<isaspec::IsaSpec> {
1045        // Were there any `target` commands specified?
1046        let mut specified_target = false;
1047
1048        let mut targets = Vec::new();
1049        let flag_builder = settings::builder();
1050
1051        if let Some(targ) = target_pass {
1052            let loc = self.loc;
1053            let triple = match Triple::from_str(targ) {
1054                Ok(triple) => triple,
1055                Err(err) => return err!(loc, err),
1056            };
1057            let isa_builder = match isa::lookup(triple) {
1058                Err(isa::LookupError::SupportDisabled) => {
1059                    return err!(loc, "support disabled target '{}'", targ);
1060                }
1061                Err(isa::LookupError::Unsupported) => {
1062                    return warn!(loc, "unsupported target '{}'", targ);
1063                }
1064                Ok(b) => b,
1065            };
1066            specified_target = true;
1067
1068            // Construct a trait object with the aggregate settings.
1069            targets.push(
1070                isa_builder
1071                    .finish(settings::Flags::new(flag_builder.clone()))
1072                    .map_err(|e| ParseError {
1073                        location: loc,
1074                        message: format!("invalid ISA flags for '{targ}': {e:?}"),
1075                        is_warning: false,
1076                    })?,
1077            );
1078        }
1079
1080        if !specified_target {
1081            // No `target` commands.
1082            Ok(isaspec::IsaSpec::None(settings::Flags::new(flag_builder)))
1083        } else {
1084            Ok(isaspec::IsaSpec::Some(targets))
1085        }
1086    }
1087
1088    /// Parse a list of target specs.
1089    ///
1090    /// Accept a mix of `target` and `set` command lines. The `set` commands are cumulative.
1091    ///
1092    fn parse_target_specs(&mut self, options: &ParseOptions) -> ParseResult<isaspec::IsaSpec> {
1093        // Were there any `target` commands?
1094        let mut seen_target = false;
1095        // Location of last `set` command since the last `target`.
1096        let mut last_set_loc = None;
1097
1098        let mut targets = Vec::new();
1099        let mut flag_builder = settings::builder();
1100
1101        let bool_to_str = |val: bool| {
1102            if val { "true" } else { "false" }
1103        };
1104
1105        // default to enabling cfg info
1106        flag_builder
1107            .set(
1108                "machine_code_cfg_info",
1109                bool_to_str(options.machine_code_cfg_info),
1110            )
1111            .expect("machine_code_cfg_info option should be present");
1112
1113        flag_builder
1114            .set("unwind_info", bool_to_str(options.unwind_info))
1115            .expect("unwind_info option should be present");
1116
1117        while let Some(Token::Identifier(command)) = self.token() {
1118            match command {
1119                "set" => {
1120                    last_set_loc = Some(self.loc);
1121                    isaspec::parse_options(
1122                        self.consume_line().trim().split_whitespace(),
1123                        &mut flag_builder,
1124                        self.loc,
1125                    )
1126                    .map_err(|err| ParseError::from(err))?;
1127                }
1128                "target" => {
1129                    let loc = self.loc;
1130                    // Grab the whole line so the lexer won't go looking for tokens on the
1131                    // following lines.
1132                    let mut words = self.consume_line().trim().split_whitespace().peekable();
1133                    // Look for `target foo`.
1134                    let target_name = match words.next() {
1135                        Some(w) => w,
1136                        None => return err!(loc, "expected target triple"),
1137                    };
1138                    let triple = match Triple::from_str(target_name) {
1139                        Ok(triple) => triple,
1140                        Err(err) => return err!(loc, err),
1141                    };
1142                    let mut isa_builder = match isa::lookup(triple) {
1143                        Err(isa::LookupError::SupportDisabled) => {
1144                            continue;
1145                        }
1146                        Err(isa::LookupError::Unsupported) => {
1147                            return warn!(loc, "unsupported target '{}'", target_name);
1148                        }
1149                        Ok(b) => b,
1150                    };
1151                    last_set_loc = None;
1152                    seen_target = true;
1153                    // Apply the target-specific settings to `isa_builder`.
1154                    isaspec::parse_options(words, &mut isa_builder, self.loc)?;
1155
1156                    // Construct a trait object with the aggregate settings.
1157                    targets.push(
1158                        isa_builder
1159                            .finish(settings::Flags::new(flag_builder.clone()))
1160                            .map_err(|e| ParseError {
1161                                location: loc,
1162                                message: format!("invalid ISA flags for '{target_name}': {e:?}"),
1163                                is_warning: false,
1164                            })?,
1165                    );
1166                }
1167                _ => break,
1168            }
1169        }
1170
1171        if !seen_target {
1172            // No `target` commands, but we allow for `set` commands.
1173            Ok(isaspec::IsaSpec::None(settings::Flags::new(flag_builder)))
1174        } else if let Some(loc) = last_set_loc {
1175            err!(
1176                loc,
1177                "dangling 'set' command after ISA specification has no effect."
1178            )
1179        } else {
1180            Ok(isaspec::IsaSpec::Some(targets))
1181        }
1182    }
1183
1184    /// Parse a list of expected features that Cranelift should be compiled with, or without.
1185    pub fn parse_cranelift_features(&mut self) -> ParseResult<Vec<Feature<'a>>> {
1186        let mut list = Vec::new();
1187        while self.token() == Some(Token::Identifier("feature")) {
1188            self.consume();
1189            let has = !self.optional(Token::Bang);
1190            match (self.token(), has) {
1191                (Some(Token::String(flag)), true) => list.push(Feature::With(flag)),
1192                (Some(Token::String(flag)), false) => list.push(Feature::Without(flag)),
1193                (tok, _) => {
1194                    return err!(
1195                        self.loc,
1196                        format!("Expected feature flag string, got {:?}", tok)
1197                    );
1198                }
1199            }
1200            self.consume();
1201        }
1202        Ok(list)
1203    }
1204
1205    /// Parse a list of function definitions.
1206    ///
1207    /// This is the top-level parse function matching the whole contents of a file.
1208    pub fn parse_function_list(&mut self) -> ParseResult<Vec<(Function, Details<'a>)>> {
1209        let mut list = Vec::new();
1210        while self.token().is_some() {
1211            list.push(self.parse_function()?);
1212        }
1213        if let Some(err) = self.lex_error {
1214            return match err {
1215                LexError::InvalidChar => err!(self.loc, "invalid character"),
1216            };
1217        }
1218        Ok(list)
1219    }
1220
1221    // Parse a whole function definition.
1222    //
1223    // function ::= * "function" name signature "{" preamble function-body "}"
1224    //
1225    fn parse_function(&mut self) -> ParseResult<(Function, Details<'a>)> {
1226        // Begin gathering comments.
1227        // Make sure we don't include any comments before the `function` keyword.
1228        self.token();
1229        debug_assert!(self.comments.is_empty());
1230        self.start_gathering_comments();
1231
1232        self.match_identifier("function", "expected 'function'")?;
1233
1234        let location = self.loc;
1235
1236        // function ::= "function" * name signature "{" preamble function-body "}"
1237        let name = self.parse_user_func_name()?;
1238
1239        // function ::= "function" name * signature "{" preamble function-body "}"
1240        let sig = self.parse_signature()?;
1241
1242        let mut ctx = Context::new(Function::with_name_signature(name, sig));
1243
1244        // function ::= "function" name signature * "{" preamble function-body "}"
1245        self.match_token(Token::LBrace, "expected '{' before function body")?;
1246
1247        self.token();
1248        self.claim_gathered_comments(AnyEntity::Function);
1249
1250        // function ::= "function" name signature "{" * preamble function-body "}"
1251        self.parse_preamble(&mut ctx)?;
1252        // function ::= "function" name signature "{"  preamble * function-body "}"
1253        self.parse_function_body(&mut ctx)?;
1254        // function ::= "function" name signature "{" preamble function-body * "}"
1255        self.match_token(Token::RBrace, "expected '}' after function body")?;
1256
1257        // Collect any comments following the end of the function, then stop gathering comments.
1258        self.start_gathering_comments();
1259        self.token();
1260        self.claim_gathered_comments(AnyEntity::Function);
1261
1262        // Claim all the declared user-defined function names.
1263        for (user_func_ref, user_external_name) in
1264            std::mem::take(&mut self.predeclared_external_names)
1265        {
1266            let actual_ref = ctx
1267                .function
1268                .declare_imported_user_function(user_external_name);
1269            assert_eq!(user_func_ref, actual_ref);
1270        }
1271
1272        let details = Details {
1273            location,
1274            comments: self.take_comments(),
1275            map: ctx.map,
1276        };
1277
1278        Ok((ctx.function, details))
1279    }
1280
1281    // Parse a user-defined function name
1282    //
1283    // For example, in a function decl, the parser would be in this state:
1284    //
1285    // function ::= "function" * name signature { ... }
1286    //
1287    fn parse_user_func_name(&mut self) -> ParseResult<UserFuncName> {
1288        match self.token() {
1289            Some(Token::Name(s)) => {
1290                self.consume();
1291                Ok(UserFuncName::testcase(s))
1292            }
1293            Some(Token::UserRef(namespace)) => {
1294                self.consume();
1295                match self.token() {
1296                    Some(Token::Colon) => {
1297                        self.consume();
1298                        match self.token() {
1299                            Some(Token::Integer(index_str)) => {
1300                                self.consume();
1301                                let index: u32 =
1302                                    u32::from_str_radix(index_str, 10).map_err(|_| {
1303                                        self.error("the integer given overflows the u32 type")
1304                                    })?;
1305                                Ok(UserFuncName::user(namespace, index))
1306                            }
1307                            _ => err!(self.loc, "expected integer"),
1308                        }
1309                    }
1310                    _ => {
1311                        err!(self.loc, "expected user function name in the form uX:Y")
1312                    }
1313                }
1314            }
1315            _ => err!(self.loc, "expected external name"),
1316        }
1317    }
1318
1319    // Parse an external name.
1320    //
1321    // For example, in a function reference decl, the parser would be in this state:
1322    //
1323    // fn0 = * name signature
1324    //
1325    fn parse_external_name(&mut self) -> ParseResult<ExternalName> {
1326        match self.token() {
1327            Some(Token::Name(s)) => {
1328                self.consume();
1329                s.parse()
1330                    .map_err(|_| self.error("invalid test case or libcall name"))
1331            }
1332
1333            Some(Token::UserNameRef(name_ref)) => {
1334                self.consume();
1335                Ok(ExternalName::user(UserExternalNameRef::new(
1336                    name_ref as usize,
1337                )))
1338            }
1339
1340            Some(Token::UserRef(namespace)) => {
1341                self.consume();
1342                if let Some(Token::Colon) = self.token() {
1343                    self.consume();
1344                    match self.token() {
1345                        Some(Token::Integer(index_str)) => {
1346                            let index: u32 = u32::from_str_radix(index_str, 10).map_err(|_| {
1347                                self.error("the integer given overflows the u32 type")
1348                            })?;
1349                            self.consume();
1350
1351                            // Deduplicate the reference (O(n), but should be fine for tests),
1352                            // to follow `FunctionParameters::declare_imported_user_function`,
1353                            // otherwise this will cause ref mismatches when asserted below.
1354                            let name_ref = self
1355                                .predeclared_external_names
1356                                .iter()
1357                                .find_map(|(reff, name)| {
1358                                    if name.index == index && name.namespace == namespace {
1359                                        Some(reff)
1360                                    } else {
1361                                        None
1362                                    }
1363                                })
1364                                .unwrap_or_else(|| {
1365                                    self.predeclared_external_names
1366                                        .push(ir::UserExternalName { namespace, index })
1367                                });
1368
1369                            Ok(ExternalName::user(name_ref))
1370                        }
1371                        _ => err!(self.loc, "expected integer"),
1372                    }
1373                } else {
1374                    err!(self.loc, "expected colon")
1375                }
1376            }
1377
1378            _ => err!(self.loc, "expected external name"),
1379        }
1380    }
1381
1382    // Parse a function signature.
1383    //
1384    // signature ::=  * "(" [paramlist] ")" ["->" retlist] [callconv]
1385    //
1386    fn parse_signature(&mut self) -> ParseResult<Signature> {
1387        // Calling convention defaults to `fast`, but can be changed.
1388        let mut sig = Signature::new(self.default_calling_convention);
1389
1390        self.match_token(Token::LPar, "expected function signature: ( args... )")?;
1391        // signature ::=  "(" * [abi-param-list] ")" ["->" retlist] [callconv]
1392        if self.token() != Some(Token::RPar) {
1393            sig.params = self.parse_abi_param_list()?;
1394        }
1395        self.match_token(Token::RPar, "expected ')' after function arguments")?;
1396        if self.optional(Token::Arrow) {
1397            sig.returns = self.parse_abi_param_list()?;
1398        }
1399
1400        // The calling convention is optional.
1401        match self.token() {
1402            Some(Token::Identifier(text)) => match text.parse() {
1403                Ok(cc) => {
1404                    self.consume();
1405                    sig.call_conv = cc;
1406                }
1407                _ => return err!(self.loc, "unknown calling convention: {}", text),
1408            },
1409            _ => {}
1410        }
1411
1412        Ok(sig)
1413    }
1414
1415    // Parse list of function parameter / return value types.
1416    //
1417    // paramlist ::= * param { "," param }
1418    //
1419    fn parse_abi_param_list(&mut self) -> ParseResult<Vec<AbiParam>> {
1420        let mut list = Vec::new();
1421
1422        // abi-param-list ::= * abi-param { "," abi-param }
1423        list.push(self.parse_abi_param()?);
1424
1425        // abi-param-list ::= abi-param * { "," abi-param }
1426        while self.optional(Token::Comma) {
1427            // abi-param-list ::= abi-param { "," * abi-param }
1428            list.push(self.parse_abi_param()?);
1429        }
1430
1431        Ok(list)
1432    }
1433
1434    // Parse a single argument type with flags.
1435    fn parse_abi_param(&mut self) -> ParseResult<AbiParam> {
1436        // abi-param ::= * type { flag }
1437        let mut arg = AbiParam::new(self.match_type("expected parameter type")?);
1438
1439        // abi-param ::= type * { flag }
1440        while let Some(Token::Identifier(s)) = self.token() {
1441            match s {
1442                "uext" => arg.extension = ArgumentExtension::Uext,
1443                "sext" => arg.extension = ArgumentExtension::Sext,
1444                "sarg" => {
1445                    self.consume();
1446                    self.match_token(Token::LPar, "expected '(' to begin sarg size")?;
1447                    let size = self.match_uimm32("expected byte-size in sarg decl")?;
1448                    self.match_token(Token::RPar, "expected ')' to end sarg size")?;
1449                    arg.purpose = ArgumentPurpose::StructArgument(size.into());
1450                    continue;
1451                }
1452                _ => {
1453                    if let Ok(purpose) = s.parse() {
1454                        arg.purpose = purpose;
1455                    } else {
1456                        break;
1457                    }
1458                }
1459            }
1460            self.consume();
1461        }
1462
1463        Ok(arg)
1464    }
1465
1466    // Parse the function preamble.
1467    //
1468    // preamble      ::= * { preamble-decl }
1469    // preamble-decl ::= * stack-slot-decl
1470    //                   * function-decl
1471    //                   * signature-decl
1472    //                   * jump-table-decl
1473    //                   * stack-limit-decl
1474    //
1475    // The parsed decls are added to `ctx` rather than returned.
1476    fn parse_preamble(&mut self, ctx: &mut Context) -> ParseResult<()> {
1477        loop {
1478            match self.token() {
1479                Some(Token::StackSlot(..)) => {
1480                    self.start_gathering_comments();
1481                    let loc = self.loc;
1482                    self.parse_stack_slot_decl()
1483                        .and_then(|(ss, dat)| ctx.add_ss(ss, dat, loc))
1484                }
1485                Some(Token::DynamicStackSlot(..)) => {
1486                    self.start_gathering_comments();
1487                    let loc = self.loc;
1488                    self.parse_dynamic_stack_slot_decl()
1489                        .and_then(|(dss, dat)| ctx.add_dss(dss, dat, loc))
1490                }
1491                Some(Token::DynamicType(..)) => {
1492                    self.start_gathering_comments();
1493                    let loc = self.loc;
1494                    self.parse_dynamic_type_decl()
1495                        .and_then(|(dt, dat)| ctx.add_dt(dt, dat, loc))
1496                }
1497                Some(Token::GlobalValue(..)) => {
1498                    self.start_gathering_comments();
1499                    self.parse_global_value_decl()
1500                        .and_then(|(gv, dat, maybe_fact)| ctx.add_gv(gv, dat, maybe_fact, self.loc))
1501                }
1502                Some(Token::MemoryType(..)) => {
1503                    self.start_gathering_comments();
1504                    self.parse_memory_type_decl()
1505                        .and_then(|(mt, dat)| ctx.add_mt(mt, dat, self.loc))
1506                }
1507                Some(Token::SigRef(..)) => {
1508                    self.start_gathering_comments();
1509                    self.parse_signature_decl().and_then(|(sig, dat)| {
1510                        ctx.add_sig(sig, dat, self.loc, self.default_calling_convention)
1511                    })
1512                }
1513                Some(Token::FuncRef(..)) => {
1514                    self.start_gathering_comments();
1515                    self.parse_function_decl(ctx)
1516                        .and_then(|(fn_, dat)| ctx.add_fn(fn_, dat, self.loc))
1517                }
1518                Some(Token::Constant(..)) => {
1519                    self.start_gathering_comments();
1520                    self.parse_constant_decl()
1521                        .and_then(|(c, v)| ctx.add_constant(c, v, self.loc))
1522                }
1523                Some(Token::Identifier("stack_limit")) => {
1524                    self.start_gathering_comments();
1525                    self.parse_stack_limit_decl()
1526                        .and_then(|gv| ctx.add_stack_limit(gv, self.loc))
1527                }
1528                // More to come..
1529                _ => return Ok(()),
1530            }?;
1531        }
1532    }
1533
1534    // Parse a stack slot decl.
1535    //
1536    // stack-slot-decl ::= * StackSlot(ss) "=" stack-slot-kind Bytes {"," stack-slot-flag}
1537    // stack-slot-kind ::= "explicit_slot"
1538    //                   | "spill_slot"
1539    //                   | "incoming_arg"
1540    //                   | "outgoing_arg"
1541    // stack-slot-flag ::= "align" "=" Bytes | "key" "=" uimm64
1542    fn parse_stack_slot_decl(&mut self) -> ParseResult<(StackSlot, StackSlotData)> {
1543        let ss = self.match_ss("expected stack slot number: ss«n»")?;
1544        self.match_token(Token::Equal, "expected '=' in stack slot declaration")?;
1545        let kind = self.match_enum("expected stack slot kind")?;
1546
1547        // stack-slot-decl ::= StackSlot(ss) "=" stack-slot-kind * Bytes {"," stack-slot-flag}
1548        let bytes: i64 = self
1549            .match_imm64("expected byte-size in stack_slot decl")?
1550            .into();
1551        if bytes < 0 {
1552            return err!(self.loc, "negative stack slot size");
1553        }
1554        if bytes > i64::from(u32::MAX) {
1555            return err!(self.loc, "stack slot too large");
1556        }
1557
1558        let mut align = 1;
1559        let mut key = None;
1560
1561        while self.token() == Some(Token::Comma) {
1562            self.consume();
1563            match self.token() {
1564                Some(Token::Identifier("align")) => {
1565                    self.consume();
1566                    self.match_token(Token::Equal, "expected `=` after flag")?;
1567                    let align64: i64 = self
1568                        .match_imm64("expected alignment-size after `align` flag")?
1569                        .into();
1570                    align = u32::try_from(align64)
1571                        .map_err(|_| self.error("alignment must be a 32-bit unsigned integer"))?;
1572                }
1573                Some(Token::Identifier("key")) => {
1574                    self.consume();
1575                    self.match_token(Token::Equal, "expected `=` after flag")?;
1576                    let value = self.match_uimm64("expected `u64` value for `key` flag")?;
1577                    key = Some(StackSlotKey::new(value.into()));
1578                }
1579                _ => {
1580                    return Err(self.error("invalid flag for stack slot"));
1581                }
1582            }
1583        }
1584
1585        if !align.is_power_of_two() {
1586            return err!(self.loc, "stack slot alignment is not a power of two");
1587        }
1588        let align_shift = u8::try_from(align.ilog2()).unwrap(); // Always succeeds: range 0..=31.
1589
1590        let data = match key {
1591            Some(key) => StackSlotData::new_with_key(kind, bytes as u32, align_shift, key),
1592            None => StackSlotData::new(kind, bytes as u32, align_shift),
1593        };
1594
1595        // Collect any trailing comments.
1596        self.token();
1597        self.claim_gathered_comments(ss);
1598
1599        // TBD: stack-slot-decl ::= StackSlot(ss) "=" stack-slot-kind Bytes * {"," stack-slot-flag}
1600        Ok((ss, data))
1601    }
1602
1603    fn parse_dynamic_stack_slot_decl(
1604        &mut self,
1605    ) -> ParseResult<(DynamicStackSlot, DynamicStackSlotData)> {
1606        let dss = self.match_dss("expected stack slot number: dss«n»")?;
1607        self.match_token(Token::Equal, "expected '=' in stack slot declaration")?;
1608        let kind = self.match_enum("expected stack slot kind")?;
1609        let dt = self.match_dt("expected dynamic type")?;
1610        let data = DynamicStackSlotData::new(kind, dt);
1611        // Collect any trailing comments.
1612        self.token();
1613        self.claim_gathered_comments(dss);
1614
1615        // TBD: stack-slot-decl ::= StackSlot(ss) "=" stack-slot-kind Bytes * {"," stack-slot-flag}
1616        Ok((dss, data))
1617    }
1618
1619    fn parse_dynamic_type_decl(&mut self) -> ParseResult<(DynamicType, DynamicTypeData)> {
1620        let dt = self.match_dt("expected dynamic type number: dt«n»")?;
1621        self.match_token(Token::Equal, "expected '=' in stack slot declaration")?;
1622        let vector_base_ty = self.match_type("expected base type")?;
1623        assert!(vector_base_ty.is_vector(), "expected vector type");
1624        self.match_token(
1625            Token::Multiply,
1626            "expected '*' followed by a dynamic scale value",
1627        )?;
1628        let dyn_scale = self.match_gv("expected dynamic scale global value")?;
1629        let data = DynamicTypeData::new(vector_base_ty, dyn_scale);
1630        // Collect any trailing comments.
1631        self.token();
1632        self.claim_gathered_comments(dt);
1633        Ok((dt, data))
1634    }
1635
1636    // Parse a global value decl.
1637    //
1638    // global-val-decl ::= * GlobalValue(gv) [ "!" fact ] "=" global-val-desc
1639    // global-val-desc ::= "vmctx"
1640    //                   | "load" "." type "notrap" "aligned" GlobalValue(base) [offset]
1641    //                   | "iadd_imm" "(" GlobalValue(base) ")" imm64
1642    //                   | "symbol" ["colocated"] name + imm64
1643    //                   | "dyn_scale_target_const" "." type
1644    //
1645    fn parse_global_value_decl(
1646        &mut self,
1647    ) -> ParseResult<(GlobalValue, GlobalValueData, Option<Fact>)> {
1648        let gv = self.match_gv("expected global value number: gv«n»")?;
1649
1650        let fact = if self.token() == Some(Token::Bang) {
1651            self.consume();
1652            Some(self.parse_fact()?)
1653        } else {
1654            None
1655        };
1656
1657        self.match_token(Token::Equal, "expected '=' in global value declaration")?;
1658
1659        let data = match self.match_any_identifier("expected global value kind")? {
1660            "vmctx" => GlobalValueData::VMContext,
1661            "load" => {
1662                self.match_token(
1663                    Token::Dot,
1664                    "expected '.' followed by type in load global value decl",
1665                )?;
1666                let global_type = self.match_type("expected load type")?;
1667                let flags = self.optional_memflags()?;
1668                let base = self.match_gv("expected global value: gv«n»")?;
1669                let offset = self.optional_offset32()?;
1670
1671                if !(flags.notrap() && flags.aligned()) {
1672                    return err!(self.loc, "global-value load must be notrap and aligned");
1673                }
1674                GlobalValueData::Load {
1675                    base,
1676                    offset,
1677                    global_type,
1678                    flags,
1679                }
1680            }
1681            "iadd_imm" => {
1682                self.match_token(
1683                    Token::Dot,
1684                    "expected '.' followed by type in iadd_imm global value decl",
1685                )?;
1686                let global_type = self.match_type("expected iadd type")?;
1687                let base = self.match_gv("expected global value: gv«n»")?;
1688                self.match_token(
1689                    Token::Comma,
1690                    "expected ',' followed by rhs in iadd_imm global value decl",
1691                )?;
1692                let offset = self.match_imm64("expected iadd_imm immediate")?;
1693                GlobalValueData::IAddImm {
1694                    base,
1695                    offset,
1696                    global_type,
1697                }
1698            }
1699            "symbol" => {
1700                let colocated = self.optional(Token::Identifier("colocated"));
1701                let tls = self.optional(Token::Identifier("tls"));
1702                let name = self.parse_external_name()?;
1703                let offset = self.optional_offset_imm64()?;
1704                GlobalValueData::Symbol {
1705                    name,
1706                    offset,
1707                    colocated,
1708                    tls,
1709                }
1710            }
1711            "dyn_scale_target_const" => {
1712                self.match_token(
1713                    Token::Dot,
1714                    "expected '.' followed by type in dynamic scale global value decl",
1715                )?;
1716                let vector_type = self.match_type("expected load type")?;
1717                assert!(vector_type.is_vector(), "Expected vector type");
1718                GlobalValueData::DynScaleTargetConst { vector_type }
1719            }
1720            other => return err!(self.loc, "Unknown global value kind '{}'", other),
1721        };
1722
1723        // Collect any trailing comments.
1724        self.token();
1725        self.claim_gathered_comments(gv);
1726
1727        Ok((gv, data, fact))
1728    }
1729
1730    // Parse one field definition in a memory-type struct decl.
1731    //
1732    // memory-type-field ::=  offset ":" type ["readonly"] [ "!" fact ]
1733    // offset ::= uimm64
1734    fn parse_memory_type_field(&mut self) -> ParseResult<MemoryTypeField> {
1735        let offset: u64 = self
1736            .match_uimm64(
1737                "expected u64 constant value for field offset in struct memory-type declaration",
1738            )?
1739            .into();
1740        self.match_token(
1741            Token::Colon,
1742            "expected colon after field offset in struct memory-type declaration",
1743        )?;
1744        let ty = self.match_type("expected type for field in struct memory-type declaration")?;
1745        let readonly = if self.token() == Some(Token::Identifier("readonly")) {
1746            self.consume();
1747            true
1748        } else {
1749            false
1750        };
1751        let fact = if self.token() == Some(Token::Bang) {
1752            self.consume();
1753            let fact = self.parse_fact()?;
1754            Some(fact)
1755        } else {
1756            None
1757        };
1758        Ok(MemoryTypeField {
1759            offset,
1760            ty,
1761            readonly,
1762            fact,
1763        })
1764    }
1765
1766    // Parse a memory-type decl.
1767    //
1768    // memory-type-decl ::= MemoryType(mt) "=" memory-type-desc
1769    // memory-type-desc ::= "struct" size "{" memory-type-field,* "}"
1770    //                    | "memory" size
1771    //                    | "dynamic_memory" GlobalValue "+" offset
1772    //                    | "empty"
1773    // size ::= uimm64
1774    // offset ::= uimm64
1775    fn parse_memory_type_decl(&mut self) -> ParseResult<(MemoryType, MemoryTypeData)> {
1776        let mt = self.match_mt("expected memory type number: mt«n»")?;
1777        self.match_token(Token::Equal, "expected '=' in memory type declaration")?;
1778
1779        let data = match self.token() {
1780            Some(Token::Identifier("struct")) => {
1781                self.consume();
1782                let size: u64 = self.match_uimm64("expected u64 constant value for struct size in struct memory-type declaration")?.into();
1783                self.match_token(Token::LBrace, "expected opening brace to start struct fields in struct memory-type declaration")?;
1784                let mut fields = vec![];
1785                while self.token() != Some(Token::RBrace) {
1786                    let field = self.parse_memory_type_field()?;
1787                    fields.push(field);
1788                    if self.token() == Some(Token::Comma) {
1789                        self.consume();
1790                    } else {
1791                        break;
1792                    }
1793                }
1794                self.match_token(
1795                    Token::RBrace,
1796                    "expected closing brace after struct fields in struct memory-type declaration",
1797                )?;
1798                MemoryTypeData::Struct { size, fields }
1799            }
1800            Some(Token::Identifier("memory")) => {
1801                self.consume();
1802                let size: u64 = self.match_uimm64("expected u64 constant value for size in static-memory memory-type declaration")?.into();
1803                MemoryTypeData::Memory { size }
1804            }
1805            Some(Token::Identifier("dynamic_memory")) => {
1806                self.consume();
1807                let gv = self.match_gv(
1808                    "expected a global value for `dynamic_memory` memory-type declaration",
1809                )?;
1810                self.match_token(
1811                    Token::Plus,
1812                    "expected `+` after global value in `dynamic_memory` memory-type declaration",
1813                )?;
1814                let size: u64 = self.match_uimm64("expected u64 constant value for size offset in `dynamic_memory` memory-type declaration")?.into();
1815                MemoryTypeData::DynamicMemory { gv, size }
1816            }
1817            Some(Token::Identifier("empty")) => {
1818                self.consume();
1819                MemoryTypeData::Empty
1820            }
1821            other => {
1822                return err!(
1823                    self.loc,
1824                    "Unknown memory type declaration kind '{:?}'",
1825                    other
1826                );
1827            }
1828        };
1829
1830        // Collect any trailing comments.
1831        self.token();
1832        self.claim_gathered_comments(mt);
1833
1834        Ok((mt, data))
1835    }
1836
1837    // Parse a signature decl.
1838    //
1839    // signature-decl ::= SigRef(sigref) "=" signature
1840    //
1841    fn parse_signature_decl(&mut self) -> ParseResult<(SigRef, Signature)> {
1842        let sig = self.match_sig("expected signature number: sig«n»")?;
1843        self.match_token(Token::Equal, "expected '=' in signature decl")?;
1844        let data = self.parse_signature()?;
1845
1846        // Collect any trailing comments.
1847        self.token();
1848        self.claim_gathered_comments(sig);
1849
1850        Ok((sig, data))
1851    }
1852
1853    // Parse a function decl.
1854    //
1855    // Two variants:
1856    //
1857    // function-decl ::= FuncRef(fnref) "=" ["colocated"] ["patchable"] name function-decl-sig
1858    // function-decl-sig ::= SigRef(sig) | signature
1859    //
1860    // The first variant allocates a new signature reference. The second references an existing
1861    // signature which must be declared first.
1862    //
1863    fn parse_function_decl(&mut self, ctx: &mut Context) -> ParseResult<(FuncRef, ExtFuncData)> {
1864        let fn_ = self.match_fn("expected function number: fn«n»")?;
1865        self.match_token(Token::Equal, "expected '=' in function decl")?;
1866
1867        let loc = self.loc;
1868
1869        // function-decl ::= FuncRef(fnref) "=" * ["colocated"] ["patchable"] name function-decl-sig
1870        let colocated = self.optional(Token::Identifier("colocated"));
1871        // function-decl ::= FuncRef(fnref) "=" ["colocated"] * ["patchable"] name function-decl-sig
1872        let patchable = self.optional(Token::Identifier("patchable"));
1873
1874        // function-decl ::= FuncRef(fnref) "=" ["colocated"] ["patchable"] * name function-decl-sig
1875        let name = self.parse_external_name()?;
1876
1877        // function-decl ::= FuncRef(fnref) "=" ["colocated"] ["patchable"] name * function-decl-sig
1878        let data = match self.token() {
1879            Some(Token::LPar) => {
1880                // function-decl ::= FuncRef(fnref) "=" ["colocated"] ["patchable"] name * signature
1881                let sig = self.parse_signature()?;
1882                let sigref = ctx.function.import_signature(sig);
1883                ctx.map
1884                    .def_entity(sigref.into(), loc)
1885                    .expect("duplicate SigRef entities created");
1886                ExtFuncData {
1887                    name,
1888                    signature: sigref,
1889                    colocated,
1890                    patchable,
1891                }
1892            }
1893            Some(Token::SigRef(sig_src)) => {
1894                let sig = match SigRef::with_number(sig_src) {
1895                    None => {
1896                        return err!(self.loc, "attempted to use invalid signature ss{}", sig_src);
1897                    }
1898                    Some(sig) => sig,
1899                };
1900                ctx.check_sig(sig, self.loc)?;
1901                self.consume();
1902                ExtFuncData {
1903                    name,
1904                    signature: sig,
1905                    colocated,
1906                    patchable,
1907                }
1908            }
1909            _ => return err!(self.loc, "expected 'function' or sig«n» in function decl"),
1910        };
1911
1912        // Collect any trailing comments.
1913        self.token();
1914        self.claim_gathered_comments(fn_);
1915
1916        Ok((fn_, data))
1917    }
1918
1919    // Parse a jump table literal.
1920    //
1921    // jump-table-lit ::= "[" block(args) {"," block(args) } "]"
1922    //                  | "[]"
1923    fn parse_jump_table(
1924        &mut self,
1925        ctx: &mut Context,
1926        def: ir::BlockCall,
1927    ) -> ParseResult<ir::JumpTable> {
1928        self.match_token(Token::LBracket, "expected '[' before jump table contents")?;
1929
1930        let mut data = Vec::new();
1931
1932        match self.token() {
1933            Some(Token::Block(dest)) => {
1934                self.consume();
1935                let args = self.parse_opt_block_call_args()?;
1936                data.push(ctx.function.dfg.block_call(dest, &args));
1937
1938                loop {
1939                    match self.token() {
1940                        Some(Token::Comma) => {
1941                            self.consume();
1942                            if let Some(Token::Block(dest)) = self.token() {
1943                                self.consume();
1944                                let args = self.parse_opt_block_call_args()?;
1945                                data.push(ctx.function.dfg.block_call(dest, &args));
1946                            } else {
1947                                return err!(self.loc, "expected jump_table entry");
1948                            }
1949                        }
1950                        Some(Token::RBracket) => break,
1951                        _ => return err!(self.loc, "expected ']' after jump table contents"),
1952                    }
1953                }
1954            }
1955            Some(Token::RBracket) => (),
1956            _ => return err!(self.loc, "expected jump_table entry"),
1957        }
1958
1959        self.consume();
1960
1961        Ok(ctx
1962            .function
1963            .dfg
1964            .jump_tables
1965            .push(JumpTableData::new(def, &data)))
1966    }
1967
1968    // Parse an exception-table decl.
1969    //
1970    // exception-table ::= * SigRef(sig) "," BlockCall "," "[" (exception-table-entry ( "," exception-table-entry )*)? "]"
1971    // exception-table-entry ::=   ExceptionTag(tag) ":" BlockCall
1972    //                           | "default" ":" BlockCall
1973    //                           | "context" value
1974    fn parse_exception_table(&mut self, ctx: &mut Context) -> ParseResult<ir::ExceptionTable> {
1975        let sig = self.match_sig("expected signature of called function")?;
1976        self.match_token(Token::Comma, "expected comma after signature argument")?;
1977
1978        let mut handlers = vec![];
1979
1980        let block_num = self.match_block("expected branch destination block")?;
1981        let args = self.parse_opt_block_call_args()?;
1982        let normal_return = ctx.function.dfg.block_call(block_num, &args);
1983
1984        self.match_token(
1985            Token::Comma,
1986            "expected comma after normal-return destination",
1987        )?;
1988
1989        self.match_token(
1990            Token::LBracket,
1991            "expected an open-bracket for exception table list",
1992        )?;
1993        loop {
1994            match self.token() {
1995                Some(Token::RBracket) => {
1996                    break;
1997                }
1998                Some(Token::ExceptionTag(tag)) => {
1999                    self.consume();
2000                    self.match_token(Token::Colon, "expected ':' after exception tag")?;
2001                    let tag = ir::ExceptionTag::from_u32(tag);
2002                    let block_num = self.match_block("expected branch destination block")?;
2003                    let args = self.parse_opt_block_call_args()?;
2004                    let block_call = ctx.function.dfg.block_call(block_num, &args);
2005                    handlers.push(ir::ExceptionTableItem::Tag(tag, block_call));
2006                }
2007                Some(Token::Identifier("default")) => {
2008                    self.consume();
2009                    self.match_token(Token::Colon, "expected ':' after 'default'")?;
2010                    let block_num = self.match_block("expected branch destination block")?;
2011                    let args = self.parse_opt_block_call_args()?;
2012                    let block_call = ctx.function.dfg.block_call(block_num, &args);
2013                    handlers.push(ir::ExceptionTableItem::Default(block_call));
2014                }
2015                Some(Token::Identifier("context")) => {
2016                    self.consume();
2017                    let val = self.match_value("expected value for exception-handler context")?;
2018                    handlers.push(ir::ExceptionTableItem::Context(val));
2019                }
2020                _ => return err!(self.loc, "invalid token"),
2021            }
2022
2023            if let Some(Token::Comma) = self.token() {
2024                self.consume();
2025            } else {
2026                break;
2027            }
2028        }
2029        self.match_token(Token::RBracket, "expected closing bracket")?;
2030
2031        Ok(ctx
2032            .function
2033            .dfg
2034            .exception_tables
2035            .push(ir::ExceptionTableData::new(sig, normal_return, handlers)))
2036    }
2037
2038    // Parse a constant decl.
2039    //
2040    // constant-decl ::= * Constant(c) "=" ty? "[" literal {"," literal} "]"
2041    fn parse_constant_decl(&mut self) -> ParseResult<(Constant, ConstantData)> {
2042        let name = self.match_constant()?;
2043        self.match_token(Token::Equal, "expected '=' in constant decl")?;
2044        let data = if let Some(Token::Type(_)) = self.token() {
2045            let ty = self.match_type("expected type of constant")?;
2046            self.match_uimm128(ty)
2047        } else {
2048            self.match_hexadecimal_constant("expected an immediate hexadecimal operand")
2049        }?;
2050
2051        // Collect any trailing comments.
2052        self.token();
2053        self.claim_gathered_comments(name);
2054
2055        Ok((name, data))
2056    }
2057
2058    // Parse a stack limit decl
2059    //
2060    // stack-limit-decl ::= * StackLimit "=" GlobalValue(gv)
2061    fn parse_stack_limit_decl(&mut self) -> ParseResult<GlobalValue> {
2062        self.match_stack_limit()?;
2063        self.match_token(Token::Equal, "expected '=' in stack limit decl")?;
2064        let limit = match self.token() {
2065            Some(Token::GlobalValue(base_num)) => match GlobalValue::with_number(base_num) {
2066                Some(gv) => gv,
2067                None => return err!(self.loc, "invalid global value number for stack limit"),
2068            },
2069            _ => return err!(self.loc, "expected global value"),
2070        };
2071        self.consume();
2072
2073        // Collect any trailing comments.
2074        self.token();
2075        self.claim_gathered_comments(AnyEntity::StackLimit);
2076
2077        Ok(limit)
2078    }
2079
2080    // Parse a function body, add contents to `ctx`.
2081    //
2082    // function-body ::= * { extended-basic-block }
2083    //
2084    fn parse_function_body(&mut self, ctx: &mut Context) -> ParseResult<()> {
2085        while self.token() != Some(Token::RBrace) {
2086            self.parse_basic_block(ctx)?;
2087        }
2088
2089        // Now that we've seen all defined values in the function, ensure that
2090        // all references refer to a definition.
2091        for block in &ctx.function.layout {
2092            for inst in ctx.function.layout.block_insts(block) {
2093                for value in ctx.function.dfg.inst_values(inst) {
2094                    if !ctx.map.contains_value(value) {
2095                        return err!(
2096                            ctx.map.location(AnyEntity::Inst(inst)).unwrap(),
2097                            "undefined operand value {}",
2098                            value
2099                        );
2100                    }
2101                }
2102            }
2103        }
2104
2105        for alias in &ctx.aliases {
2106            if !ctx.function.dfg.set_alias_type_for_parser(*alias) {
2107                let loc = ctx.map.location(AnyEntity::Value(*alias)).unwrap();
2108                return err!(loc, "alias cycle involving {}", alias);
2109            }
2110        }
2111
2112        Ok(())
2113    }
2114
2115    // Parse a basic block, add contents to `ctx`.
2116    //
2117    // extended-basic-block ::= * block-header { instruction }
2118    // block-header         ::= Block(block) [block-params] [block-flags] ":"
2119    // block-flags          ::= [Cold]
2120    //
2121    fn parse_basic_block(&mut self, ctx: &mut Context) -> ParseResult<()> {
2122        // Collect comments for the next block.
2123        self.start_gathering_comments();
2124
2125        let block_num = self.match_block("expected block header")?;
2126        let block = ctx.add_block(block_num, self.loc)?;
2127
2128        if block_num.as_u32() >= MAX_BLOCKS_IN_A_FUNCTION {
2129            return Err(self.error("too many blocks"));
2130        }
2131
2132        if self.token() == Some(Token::LPar) {
2133            self.parse_block_params(ctx, block)?;
2134        }
2135
2136        if self.optional(Token::Cold) {
2137            ctx.set_cold_block(block);
2138        }
2139
2140        self.match_token(Token::Colon, "expected ':' after block parameters")?;
2141
2142        // Collect any trailing comments.
2143        self.token();
2144        self.claim_gathered_comments(block);
2145
2146        // extended-basic-block ::= block-header * { instruction }
2147        while match self.token() {
2148            Some(Token::Value(_))
2149            | Some(Token::Identifier(_))
2150            | Some(Token::LBracket)
2151            | Some(Token::SourceLoc(_))
2152            | Some(Token::LAngle) => true,
2153            _ => false,
2154        } {
2155            let srcloc = self.optional_srcloc()?;
2156
2157            let debug_tags = self.optional_debug_tags()?;
2158
2159            // We need to parse instruction results here because they are shared
2160            // between the parsing of value aliases and the parsing of instructions.
2161            //
2162            // inst-results ::= Value(v) { "," Value(v) }
2163            let results = self.parse_inst_results(ctx)?;
2164
2165            for result in &results {
2166                while ctx.function.dfg.num_values() <= result.index() {
2167                    ctx.function.dfg.make_invalid_value_for_parser();
2168                }
2169            }
2170
2171            match self.token() {
2172                Some(Token::Arrow) => {
2173                    self.consume();
2174                    self.parse_value_alias(&results, ctx)?;
2175                }
2176                Some(Token::Equal) => {
2177                    self.consume();
2178                    self.parse_instruction(&results, srcloc, debug_tags, ctx, block)?;
2179                }
2180                _ if !results.is_empty() => return err!(self.loc, "expected -> or ="),
2181                _ => self.parse_instruction(&results, srcloc, debug_tags, ctx, block)?,
2182            }
2183        }
2184
2185        Ok(())
2186    }
2187
2188    // Parse parenthesized list of block parameters.
2189    //
2190    // block-params ::= * "(" ( block-param { "," block-param } )? ")"
2191    fn parse_block_params(&mut self, ctx: &mut Context, block: Block) -> ParseResult<()> {
2192        // block-params ::= * "(" ( block-param { "," block-param } )? ")"
2193        self.match_token(Token::LPar, "expected '(' before block parameters")?;
2194
2195        // block-params ::= "(" * ")"
2196        if self.token() == Some(Token::RPar) {
2197            self.consume();
2198            return Ok(());
2199        }
2200
2201        // block-params ::= "(" * block-param { "," block-param } ")"
2202        self.parse_block_param(ctx, block)?;
2203
2204        // block-params ::= "(" block-param * { "," block-param } ")"
2205        while self.optional(Token::Comma) {
2206            // block-params ::= "(" block-param { "," * block-param } ")"
2207            self.parse_block_param(ctx, block)?;
2208        }
2209
2210        // block-params ::= "(" block-param { "," block-param } * ")"
2211        self.match_token(Token::RPar, "expected ')' after block parameters")?;
2212
2213        Ok(())
2214    }
2215
2216    // Parse a single block parameter declaration, and append it to `block`.
2217    //
2218    // block-param ::= * Value(v) [ "!" fact ]  ":" Type(t) arg-loc?
2219    // arg-loc ::= "[" value-location "]"
2220    //
2221    fn parse_block_param(&mut self, ctx: &mut Context, block: Block) -> ParseResult<()> {
2222        // block-param ::= * Value(v) [ "!" fact ] ":" Type(t) arg-loc?
2223        let v = self.match_value("block argument must be a value")?;
2224        let v_location = self.loc;
2225        // block-param ::= Value(v) * [ "!" fact ]  ":" Type(t) arg-loc?
2226        let fact = if self.token() == Some(Token::Bang) {
2227            self.consume();
2228            // block-param ::= Value(v) [ "!" * fact ]  ":" Type(t) arg-loc?
2229            Some(self.parse_fact()?)
2230        } else {
2231            None
2232        };
2233        self.match_token(Token::Colon, "expected ':' after block argument")?;
2234        // block-param ::= Value(v) [ "!" fact ] ":" * Type(t) arg-loc?
2235
2236        while ctx.function.dfg.num_values() <= v.index() {
2237            ctx.function.dfg.make_invalid_value_for_parser();
2238        }
2239
2240        let t = self.match_type("expected block argument type")?;
2241        // Allocate the block argument.
2242        ctx.function.dfg.append_block_param_for_parser(block, t, v);
2243        ctx.map.def_value(v, v_location)?;
2244        ctx.function.dfg.facts[v] = fact;
2245
2246        Ok(())
2247    }
2248
2249    // Parse a "fact" for proof-carrying code, attached to a value.
2250    //
2251    // fact ::= "range" "(" bit-width "," min-value "," max-value ")"
2252    //        | "dynamic_range" "(" bit-width "," expr "," expr ")"
2253    //        | "mem" "(" memory-type "," mt-offset "," mt-offset [ "," "nullable" ] ")"
2254    //        | "dynamic_mem" "(" memory-type "," expr "," expr [ "," "nullable" ] ")"
2255    //        | "conflict"
2256    // bit-width ::= uimm64
2257    // min-value ::= uimm64
2258    // max-value ::= uimm64
2259    // valid-range ::= uimm64
2260    // mt-offset ::= uimm64
2261    fn parse_fact(&mut self) -> ParseResult<Fact> {
2262        match self.token() {
2263            Some(Token::Identifier("range")) => {
2264                self.consume();
2265                self.match_token(Token::LPar, "`range` fact needs an opening `(`")?;
2266                let bit_width: u64 = self
2267                    .match_uimm64("expected a bit-width value for `range` fact")?
2268                    .into();
2269                self.match_token(Token::Comma, "expected a comma")?;
2270                let min: u64 = self
2271                    .match_uimm64("expected a min value for `range` fact")?
2272                    .into();
2273                self.match_token(Token::Comma, "expected a comma")?;
2274                let max: u64 = self
2275                    .match_uimm64("expected a max value for `range` fact")?
2276                    .into();
2277                self.match_token(Token::RPar, "`range` fact needs a closing `)`")?;
2278                let bit_width_max = match bit_width {
2279                    x if x > 64 => {
2280                        return Err(self.error("bitwidth must be <= 64 bits on a `range` fact"));
2281                    }
2282                    64 => u64::MAX,
2283                    x => (1u64 << x) - 1,
2284                };
2285                if min > max {
2286                    return Err(self.error(
2287                        "min value must be less than or equal to max value on a `range` fact",
2288                    ));
2289                }
2290                if max > bit_width_max {
2291                    return Err(
2292                        self.error("max value is out of range for bitwidth on a `range` fact")
2293                    );
2294                }
2295                Ok(Fact::Range {
2296                    bit_width: u16::try_from(bit_width).unwrap(),
2297                    min,
2298                    max,
2299                })
2300            }
2301            Some(Token::Identifier("dynamic_range")) => {
2302                self.consume();
2303                self.match_token(Token::LPar, "`dynamic_range` fact needs an opening `(`")?;
2304                let bit_width: u64 = self
2305                    .match_uimm64("expected a bit-width value for `dynamic_range` fact")?
2306                    .into();
2307                self.match_token(Token::Comma, "expected a comma")?;
2308                let min = self.parse_expr()?;
2309                self.match_token(Token::Comma, "expected a comma")?;
2310                let max = self.parse_expr()?;
2311                self.match_token(Token::RPar, "`dynamic_range` fact needs a closing `)`")?;
2312                Ok(Fact::DynamicRange {
2313                    bit_width: u16::try_from(bit_width).unwrap(),
2314                    min,
2315                    max,
2316                })
2317            }
2318            Some(Token::Identifier("mem")) => {
2319                self.consume();
2320                self.match_token(Token::LPar, "expected a `(`")?;
2321                let ty = self.match_mt("expected a memory type for `mem` fact")?;
2322                self.match_token(
2323                    Token::Comma,
2324                    "expected a comma after memory type in `mem` fact",
2325                )?;
2326                let min_offset: u64 = self
2327                    .match_uimm64("expected a uimm64 minimum pointer offset for `mem` fact")?
2328                    .into();
2329                self.match_token(Token::Comma, "expected a comma after offset in `mem` fact")?;
2330                let max_offset: u64 = self
2331                    .match_uimm64("expected a uimm64 maximum pointer offset for `mem` fact")?
2332                    .into();
2333                let nullable = if self.token() == Some(Token::Comma) {
2334                    self.consume();
2335                    self.match_token(
2336                        Token::Identifier("nullable"),
2337                        "expected `nullable` in last optional field of `dynamic_mem`",
2338                    )?;
2339                    true
2340                } else {
2341                    false
2342                };
2343                self.match_token(Token::RPar, "expected a `)`")?;
2344                Ok(Fact::Mem {
2345                    ty,
2346                    min_offset,
2347                    max_offset,
2348                    nullable,
2349                })
2350            }
2351            Some(Token::Identifier("dynamic_mem")) => {
2352                self.consume();
2353                self.match_token(Token::LPar, "expected a `(`")?;
2354                let ty = self.match_mt("expected a memory type for `dynamic_mem` fact")?;
2355                self.match_token(
2356                    Token::Comma,
2357                    "expected a comma after memory type in `dynamic_mem` fact",
2358                )?;
2359                let min = self.parse_expr()?;
2360                self.match_token(
2361                    Token::Comma,
2362                    "expected a comma after offset in `dynamic_mem` fact",
2363                )?;
2364                let max = self.parse_expr()?;
2365                let nullable = if self.token() == Some(Token::Comma) {
2366                    self.consume();
2367                    self.match_token(
2368                        Token::Identifier("nullable"),
2369                        "expected `nullable` in last optional field of `dynamic_mem`",
2370                    )?;
2371                    true
2372                } else {
2373                    false
2374                };
2375                self.match_token(Token::RPar, "expected a `)`")?;
2376                Ok(Fact::DynamicMem {
2377                    ty,
2378                    min,
2379                    max,
2380                    nullable,
2381                })
2382            }
2383            Some(Token::Identifier("def")) => {
2384                self.consume();
2385                self.match_token(Token::LPar, "expected a `(`")?;
2386                let value = self.match_value("expected a value number in `def` fact")?;
2387                self.match_token(Token::RPar, "expected a `)`")?;
2388                Ok(Fact::Def { value })
2389            }
2390            Some(Token::Identifier("compare")) => {
2391                self.consume();
2392                self.match_token(Token::LPar, "expected a `(`")?;
2393                let kind = self.match_enum("expected intcc condition code in `compare` fact")?;
2394                self.match_token(
2395                    Token::Comma,
2396                    "expected comma in `compare` fact after condition code",
2397                )?;
2398                let lhs = self.parse_expr()?;
2399                self.match_token(Token::Comma, "expected comma in `compare` fact after LHS")?;
2400                let rhs = self.parse_expr()?;
2401                self.match_token(Token::RPar, "expected a `)`")?;
2402                Ok(Fact::Compare { kind, lhs, rhs })
2403            }
2404            Some(Token::Identifier("conflict")) => {
2405                self.consume();
2406                Ok(Fact::Conflict)
2407            }
2408            _ => Err(self.error(
2409                "expected a `range`, 'dynamic_range', `mem`, `dynamic_mem`, `def`, `compare` or `conflict` fact",
2410            )),
2411        }
2412    }
2413
2414    // Parse a dynamic expression used in some kinds of PCC facts.
2415    //
2416    // expr ::= base-expr
2417    //        | base-expr + uimm64  // but in-range for imm64
2418    //        | base-expr - uimm64  // but in-range for imm64
2419    //        | imm64
2420    fn parse_expr(&mut self) -> ParseResult<Expr> {
2421        if let Some(Token::Integer(_)) = self.token() {
2422            let offset: i64 = self
2423                .match_imm64("expected imm64 for dynamic expression")?
2424                .into();
2425            Ok(Expr {
2426                base: BaseExpr::None,
2427                offset,
2428            })
2429        } else {
2430            let base = self.parse_base_expr()?;
2431            match self.token() {
2432                Some(Token::Plus) => {
2433                    self.consume();
2434                    let offset: u64 = self
2435                        .match_uimm64(
2436                            "expected uimm64 in imm64 range for offset in dynamic expression",
2437                        )?
2438                        .into();
2439                    let offset: i64 = i64::try_from(offset).map_err(|_| {
2440                        self.error("integer offset in dynamic expression is out of range")
2441                    })?;
2442                    Ok(Expr { base, offset })
2443                }
2444                Some(Token::Integer(x)) if x.starts_with("-") => {
2445                    let offset: i64 = self
2446                        .match_imm64("expected an imm64 range for offset in dynamic expression")?
2447                        .into();
2448                    Ok(Expr { base, offset })
2449                }
2450                _ => Ok(Expr { base, offset: 0 }),
2451            }
2452        }
2453    }
2454
2455    // Parse the base part of a dynamic expression, used in some PCC facts.
2456    //
2457    // base-expr ::= GlobalValue(base)
2458    //             | Value(base)
2459    //             | "max"
2460    //             | (epsilon)
2461    fn parse_base_expr(&mut self) -> ParseResult<BaseExpr> {
2462        match self.token() {
2463            Some(Token::Identifier("max")) => {
2464                self.consume();
2465                Ok(BaseExpr::Max)
2466            }
2467            Some(Token::GlobalValue(..)) => {
2468                let gv = self.match_gv("expected global value")?;
2469                Ok(BaseExpr::GlobalValue(gv))
2470            }
2471            Some(Token::Value(..)) => {
2472                let value = self.match_value("expected value")?;
2473                Ok(BaseExpr::Value(value))
2474            }
2475            _ => Ok(BaseExpr::None),
2476        }
2477    }
2478
2479    // Parse instruction results and return them.
2480    //
2481    // inst-results ::= Value(v) { "," Value(v) }
2482    //
2483    fn parse_inst_results(&mut self, ctx: &mut Context) -> ParseResult<SmallVec<[Value; 1]>> {
2484        // Result value numbers.
2485        let mut results = SmallVec::new();
2486
2487        // instruction  ::=  * [inst-results "="] Opcode(opc) ["." Type] ...
2488        // inst-results ::= * Value(v) { "," Value(v) }
2489        if let Some(Token::Value(v)) = self.token() {
2490            self.consume();
2491
2492            results.push(v);
2493
2494            let fact = if self.token() == Some(Token::Bang) {
2495                self.consume();
2496                // block-param ::= Value(v) [ "!" * fact ]  ":" Type(t) arg-loc?
2497                Some(self.parse_fact()?)
2498            } else {
2499                None
2500            };
2501            ctx.function.dfg.facts[v] = fact;
2502
2503            // inst-results ::= Value(v) * { "," Value(v) }
2504            while self.optional(Token::Comma) {
2505                // inst-results ::= Value(v) { "," * Value(v) }
2506                let v = self.match_value("expected result value")?;
2507                results.push(v);
2508
2509                let fact = if self.token() == Some(Token::Bang) {
2510                    self.consume();
2511                    // block-param ::= Value(v) [ "!" * fact ]  ":" Type(t) arg-loc?
2512                    Some(self.parse_fact()?)
2513                } else {
2514                    None
2515                };
2516                ctx.function.dfg.facts[v] = fact;
2517            }
2518        }
2519
2520        Ok(results)
2521    }
2522
2523    // Parse a value alias, and append it to `block`.
2524    //
2525    // value_alias ::= [inst-results] "->" Value(v)
2526    //
2527    fn parse_value_alias(&mut self, results: &[Value], ctx: &mut Context) -> ParseResult<()> {
2528        if results.len() != 1 {
2529            return err!(self.loc, "wrong number of aliases");
2530        }
2531        let result = results[0];
2532        let dest = self.match_value("expected value alias")?;
2533
2534        // Allow duplicate definitions of aliases, as long as they are identical.
2535        if ctx.map.contains_value(result) {
2536            if let Some(old) = ctx.function.dfg.value_alias_dest_for_serialization(result) {
2537                if old != dest {
2538                    return err!(
2539                        self.loc,
2540                        "value {} is already defined as an alias with destination {}",
2541                        result,
2542                        old
2543                    );
2544                }
2545            } else {
2546                return err!(self.loc, "value {} is already defined");
2547            }
2548        } else {
2549            ctx.map.def_value(result, self.loc)?;
2550        }
2551
2552        if !ctx.map.contains_value(dest) {
2553            return err!(self.loc, "value {} is not yet defined", dest);
2554        }
2555
2556        ctx.function
2557            .dfg
2558            .make_value_alias_for_serialization(dest, result);
2559
2560        ctx.aliases.push(result);
2561        Ok(())
2562    }
2563
2564    // Parse an instruction, append it to `block`.
2565    //
2566    // instruction ::= [inst-results "="] Opcode(opc) ["." Type] ...
2567    //
2568    fn parse_instruction(
2569        &mut self,
2570        results: &[Value],
2571        srcloc: ir::SourceLoc,
2572        debug_tags: Vec<DebugTag>,
2573        ctx: &mut Context,
2574        block: Block,
2575    ) -> ParseResult<()> {
2576        // Define the result values.
2577        for val in results {
2578            ctx.map.def_value(*val, self.loc)?;
2579        }
2580
2581        // Collect comments for the next instruction.
2582        self.start_gathering_comments();
2583
2584        // instruction ::=  [inst-results "="] * Opcode(opc) ["." Type] ...
2585        let opcode = if let Some(Token::Identifier(text)) = self.token() {
2586            match text.parse() {
2587                Ok(opc) => opc,
2588                Err(msg) => return err!(self.loc, "{}: '{}'", msg, text),
2589            }
2590        } else {
2591            return err!(self.loc, "expected instruction opcode");
2592        };
2593        let opcode_loc = self.loc;
2594        self.consume();
2595
2596        // Look for a controlling type variable annotation.
2597        // instruction ::=  [inst-results "="] Opcode(opc) * ["." Type] ...
2598        let explicit_ctrl_type = if self.optional(Token::Dot) {
2599            if let Some(Token::Type(_t)) = self.token() {
2600                Some(self.match_type("expected type after 'opcode.'")?)
2601            } else {
2602                let dt = self.match_dt("expected dynamic type")?;
2603                self.concrete_from_dt(dt, ctx)
2604            }
2605        } else {
2606            None
2607        };
2608
2609        // instruction ::=  [inst-results "="] Opcode(opc) ["." Type] * ...
2610        let inst_data = self.parse_inst_operands(ctx, opcode, explicit_ctrl_type)?;
2611
2612        let ctrl_typevar = self.infer_typevar(ctx, opcode, explicit_ctrl_type, &inst_data)?;
2613        let inst = ctx.function.dfg.make_inst(inst_data);
2614
2615        // Attach stack map, if present.
2616        if self.optional(Token::Comma) {
2617            self.match_token(
2618                Token::Identifier("stack_map"),
2619                "expected `stack_map = [...]`",
2620            )?;
2621            if !opcode.is_call() || opcode.is_return() {
2622                return err!(
2623                    self.loc,
2624                    "stack map can only be attached to a (non-tail) call"
2625                );
2626            }
2627
2628            self.match_token(Token::Equal, "expected `= [...]`")?;
2629            self.match_token(Token::LBracket, "expected `[...]`")?;
2630            while !self.optional(Token::RBracket) {
2631                let ty = self.match_type("expected `<type> @ <slot> + <offset>`")?;
2632                self.match_token(Token::At, "expected `@ <slot> + <offset>`")?;
2633                let slot = self.match_ss("expected `<slot> + <offset>`")?;
2634                let offset: u32 = match self.token() {
2635                    Some(Token::Integer(s)) if s.starts_with('+') => {
2636                        self.match_uimm32("expected a u32 offset")?.into()
2637                    }
2638                    _ => {
2639                        self.match_token(Token::Plus, "expected `+ <offset>`")?;
2640                        self.match_uimm32("expected a u32 offset")?.into()
2641                    }
2642                };
2643                ctx.function
2644                    .dfg
2645                    .append_user_stack_map_entry(inst, ir::UserStackMapEntry { ty, slot, offset });
2646                if !self.optional(Token::Comma) {
2647                    self.match_token(Token::RBracket, "expected `,` or `]`")?;
2648                    break;
2649                }
2650            }
2651        }
2652
2653        // We're done parsing the instruction data itself.
2654        //
2655        // We still need to check that the number of result values in
2656        // the source matches the opcode or function call
2657        // signature. We also need to create values with the right
2658        // type for all the instruction results.
2659        let num_results =
2660            ctx.function
2661                .dfg
2662                .make_inst_results_for_parser(inst, ctrl_typevar, results);
2663        ctx.function.layout.append_inst(inst, block);
2664        ctx.map
2665            .def_entity(inst.into(), opcode_loc)
2666            .expect("duplicate inst references created");
2667
2668        if !srcloc.is_default() {
2669            ctx.function.set_srcloc(inst, srcloc);
2670        }
2671        if !debug_tags.is_empty() {
2672            ctx.function.debug_tags.set(inst, debug_tags);
2673        }
2674
2675        if results.len() != num_results {
2676            return err!(
2677                self.loc,
2678                "instruction produces {} result values, {} given",
2679                num_results,
2680                results.len()
2681            );
2682        }
2683
2684        // Collect any trailing comments.
2685        self.token();
2686        self.claim_gathered_comments(inst);
2687
2688        Ok(())
2689    }
2690
2691    // Type inference for polymorphic instructions.
2692    //
2693    // The controlling type variable can be specified explicitly as 'splat.i32x4 v5', or it can be
2694    // inferred from `inst_data.typevar_operand` for some opcodes.
2695    //
2696    // Returns the controlling typevar for a polymorphic opcode, or `INVALID` for a non-polymorphic
2697    // opcode.
2698    fn infer_typevar(
2699        &self,
2700        ctx: &Context,
2701        opcode: Opcode,
2702        explicit_ctrl_type: Option<Type>,
2703        inst_data: &InstructionData,
2704    ) -> ParseResult<Type> {
2705        let constraints = opcode.constraints();
2706        let ctrl_type = match explicit_ctrl_type {
2707            Some(t) => t,
2708            None => {
2709                if constraints.use_typevar_operand() {
2710                    // This is an opcode that supports type inference, AND there was no
2711                    // explicit type specified. Look up `ctrl_value` to see if it was defined
2712                    // already.
2713                    // TBD: If it is defined in another block, the type should have been
2714                    // specified explicitly. It is unfortunate that the correctness of IR
2715                    // depends on the layout of the blocks.
2716                    let ctrl_src_value = inst_data
2717                        .typevar_operand(&ctx.function.dfg.value_lists)
2718                        .expect("Constraints <-> Format inconsistency");
2719                    if !ctx.map.contains_value(ctrl_src_value) {
2720                        return err!(
2721                            self.loc,
2722                            "type variable required for polymorphic opcode, e.g. '{}.{}'; \
2723                             can't infer from {} which is not yet defined",
2724                            opcode,
2725                            constraints.ctrl_typeset().unwrap().example(),
2726                            ctrl_src_value
2727                        );
2728                    }
2729                    if !ctx.function.dfg.value_is_valid_for_parser(ctrl_src_value) {
2730                        return err!(
2731                            self.loc,
2732                            "type variable required for polymorphic opcode, e.g. '{}.{}'; \
2733                             can't infer from {} which is not yet resolved",
2734                            opcode,
2735                            constraints.ctrl_typeset().unwrap().example(),
2736                            ctrl_src_value
2737                        );
2738                    }
2739                    ctx.function.dfg.value_type(ctrl_src_value)
2740                } else if constraints.is_polymorphic() {
2741                    // This opcode does not support type inference, so the explicit type
2742                    // variable is required.
2743                    return err!(
2744                        self.loc,
2745                        "type variable required for polymorphic opcode, e.g. '{}.{}'",
2746                        opcode,
2747                        constraints.ctrl_typeset().unwrap().example()
2748                    );
2749                } else {
2750                    // This is a non-polymorphic opcode. No typevar needed.
2751                    INVALID
2752                }
2753            }
2754        };
2755
2756        // Verify that `ctrl_type` is valid for the controlling type variable. We don't want to
2757        // attempt deriving types from an incorrect basis.
2758        // This is not a complete type check. The verifier does that.
2759        if let Some(typeset) = constraints.ctrl_typeset() {
2760            // This is a polymorphic opcode.
2761            if !typeset.contains(ctrl_type) {
2762                return err!(
2763                    self.loc,
2764                    "{} is not a valid typevar for {}",
2765                    ctrl_type,
2766                    opcode
2767                );
2768            }
2769        // Treat it as a syntax error to specify a typevar on a non-polymorphic opcode.
2770        } else if ctrl_type != INVALID {
2771            return err!(self.loc, "{} does not take a typevar", opcode);
2772        }
2773
2774        Ok(ctrl_type)
2775    }
2776
2777    // Parse comma-separated value list into a VariableArgs struct.
2778    //
2779    // value_list ::= [ value { "," value } ]
2780    //
2781    fn parse_value_list(&mut self) -> ParseResult<VariableArgs> {
2782        let mut args = VariableArgs::new();
2783
2784        if let Some(Token::Value(v)) = self.token() {
2785            args.push(v);
2786            self.consume();
2787        } else {
2788            return Ok(args);
2789        }
2790
2791        while self.optional(Token::Comma) {
2792            args.push(self.match_value("expected value in argument list")?);
2793        }
2794
2795        Ok(args)
2796    }
2797
2798    /// Parse an optional list of block-call arguments enclosed in
2799    /// parentheses.
2800    fn parse_opt_block_call_args(&mut self) -> ParseResult<Vec<BlockArg>> {
2801        if !self.optional(Token::LPar) {
2802            return Ok(vec![]);
2803        }
2804
2805        let mut args = vec![];
2806        while self.token() != Some(Token::RPar) {
2807            args.push(self.parse_block_call_arg()?);
2808            if self.token() == Some(Token::Comma) {
2809                self.consume();
2810            } else {
2811                break;
2812            }
2813        }
2814
2815        self.match_token(Token::RPar, "expected ')' after arguments")?;
2816
2817        Ok(args)
2818    }
2819
2820    fn parse_block_call_arg(&mut self) -> ParseResult<BlockArg> {
2821        match self.token() {
2822            Some(Token::Value(v)) => {
2823                self.consume();
2824                Ok(BlockArg::Value(v))
2825            }
2826            Some(Token::TryCallRet(i)) => {
2827                self.consume();
2828                Ok(BlockArg::TryCallRet(i))
2829            }
2830            Some(Token::TryCallExn(i)) => {
2831                self.consume();
2832                Ok(BlockArg::TryCallExn(i))
2833            }
2834            tok => Err(self.error(&format!("unexpected token: {tok:?}"))),
2835        }
2836    }
2837
2838    /// Parse a CLIF run command.
2839    ///
2840    /// run-command ::= "run" [":" invocation comparison expected]
2841    ///               \ "print" [":" invocation]
2842    fn parse_run_command(&mut self, sig: &Signature) -> ParseResult<RunCommand> {
2843        // skip semicolon
2844        match self.token() {
2845            Some(Token::Identifier("run")) => {
2846                self.consume();
2847                if self.optional(Token::Colon) {
2848                    let invocation = self.parse_run_invocation(sig)?;
2849                    let comparison = self.parse_run_comparison()?;
2850                    let expected = self.parse_run_returns(sig)?;
2851                    Ok(RunCommand::Run(invocation, comparison, expected))
2852                } else if sig.params.is_empty()
2853                    && sig.returns.len() == 1
2854                    && sig.returns[0].value_type.is_int()
2855                {
2856                    // To match the existing run behavior that does not require an explicit
2857                    // invocation, we create an invocation from a function like `() -> i*` and
2858                    // require the result to be non-zero.
2859                    let invocation = Invocation::new("default", vec![]);
2860                    let expected = vec![DataValue::I8(0)];
2861                    let comparison = Comparison::NotEquals;
2862                    Ok(RunCommand::Run(invocation, comparison, expected))
2863                } else {
2864                    Err(self.error("unable to parse the run command"))
2865                }
2866            }
2867            Some(Token::Identifier("print")) => {
2868                self.consume();
2869                if self.optional(Token::Colon) {
2870                    Ok(RunCommand::Print(self.parse_run_invocation(sig)?))
2871                } else if sig.params.is_empty() {
2872                    // To allow printing of functions like `() -> *`, we create a no-arg invocation.
2873                    let invocation = Invocation::new("default", vec![]);
2874                    Ok(RunCommand::Print(invocation))
2875                } else {
2876                    Err(self.error("unable to parse the print command"))
2877                }
2878            }
2879            _ => Err(self.error("expected a 'run:' or 'print:' command")),
2880        }
2881    }
2882
2883    /// Parse the invocation of a CLIF function.
2884    ///
2885    /// This is different from parsing a CLIF `call`; it is used in parsing run commands like
2886    /// `run: %fn(42, 4.2) == false`.
2887    ///
2888    /// invocation ::= name "(" [data-value-list] ")"
2889    fn parse_run_invocation(&mut self, sig: &Signature) -> ParseResult<Invocation> {
2890        if let Some(Token::Name(name)) = self.token() {
2891            self.consume();
2892            self.match_token(
2893                Token::LPar,
2894                "expected invocation parentheses, e.g. %fn(...)",
2895            )?;
2896
2897            let arg_types = sig
2898                .params
2899                .iter()
2900                .map(|abi| abi.value_type)
2901                .collect::<Vec<_>>();
2902            let args = self.parse_data_value_list(&arg_types)?;
2903
2904            self.match_token(
2905                Token::RPar,
2906                "expected invocation parentheses, e.g. %fn(...)",
2907            )?;
2908            Ok(Invocation::new(name, args))
2909        } else {
2910            Err(self.error("expected a function name, e.g. %my_fn"))
2911        }
2912    }
2913
2914    /// Parse a comparison operator for run commands.
2915    ///
2916    /// comparison ::= "==" | "!="
2917    fn parse_run_comparison(&mut self) -> ParseResult<Comparison> {
2918        if self.optional(Token::Equal) {
2919            self.match_token(Token::Equal, "expected another =")?;
2920            Ok(Comparison::Equals)
2921        } else if self.optional(Token::Bang) {
2922            self.match_token(Token::Equal, "expected a =")?;
2923            Ok(Comparison::NotEquals)
2924        } else {
2925            Err(self.error("unable to parse a valid comparison operator"))
2926        }
2927    }
2928
2929    /// Parse the expected return values of a run invocation.
2930    ///
2931    /// expected ::= "[" "]"
2932    ///            | data-value
2933    ///            | "[" data-value-list "]"
2934    fn parse_run_returns(&mut self, sig: &Signature) -> ParseResult<Vec<DataValue>> {
2935        if sig.returns.len() != 1 {
2936            self.match_token(Token::LBracket, "expected a left bracket [")?;
2937        }
2938
2939        let returns = self
2940            .parse_data_value_list(&sig.returns.iter().map(|a| a.value_type).collect::<Vec<_>>())?;
2941
2942        if sig.returns.len() != 1 {
2943            self.match_token(Token::RBracket, "expected a right bracket ]")?;
2944        }
2945        Ok(returns)
2946    }
2947
2948    /// Parse a comma-separated list of data values.
2949    ///
2950    /// data-value-list ::= [data-value {"," data-value-list}]
2951    fn parse_data_value_list(&mut self, types: &[Type]) -> ParseResult<Vec<DataValue>> {
2952        let mut values = vec![];
2953        for ty in types.iter().take(1) {
2954            values.push(self.parse_data_value(*ty)?);
2955        }
2956        for ty in types.iter().skip(1) {
2957            self.match_token(
2958                Token::Comma,
2959                "expected a comma between invocation arguments",
2960            )?;
2961            values.push(self.parse_data_value(*ty)?);
2962        }
2963        Ok(values)
2964    }
2965
2966    /// Parse a data value; e.g. `42`, `4.2`, `true`.
2967    ///
2968    /// data-value-list ::= [data-value {"," data-value-list}]
2969    fn parse_data_value(&mut self, ty: Type) -> ParseResult<DataValue> {
2970        let dv = match ty {
2971            I8 => DataValue::from(self.match_imm8("expected a i8")?),
2972            I16 => DataValue::from(self.match_imm16("expected an i16")?),
2973            I32 => DataValue::from(self.match_imm32("expected an i32")?),
2974            I64 => DataValue::from(Into::<i64>::into(self.match_imm64("expected an i64")?)),
2975            I128 => DataValue::from(self.match_imm128("expected an i128")?),
2976            F16 => DataValue::from(self.match_ieee16("expected an f16")?),
2977            F32 => DataValue::from(self.match_ieee32("expected an f32")?),
2978            F64 => DataValue::from(self.match_ieee64("expected an f64")?),
2979            F128 => DataValue::from(self.match_ieee128("expected an f128")?),
2980            _ if (ty.is_vector() || ty.is_dynamic_vector()) => {
2981                let as_vec = self.match_uimm128(ty)?.into_vec();
2982                let slice = as_vec.as_slice();
2983                match slice.len() {
2984                    16 => DataValue::V128(slice.try_into().unwrap()),
2985                    8 => DataValue::V64(slice.try_into().unwrap()),
2986                    4 => DataValue::V32(slice.try_into().unwrap()),
2987                    2 => DataValue::V16(slice.try_into().unwrap()),
2988                    _ => {
2989                        return Err(
2990                            self.error("vectors larger than 128 bits are not currently supported")
2991                        );
2992                    }
2993                }
2994            }
2995            _ => return Err(self.error(&format!("don't know how to parse data values of: {ty}"))),
2996        };
2997        Ok(dv)
2998    }
2999
3000    // Parse the operands following the instruction opcode.
3001    // This depends on the format of the opcode.
3002    fn parse_inst_operands(
3003        &mut self,
3004        ctx: &mut Context,
3005        opcode: Opcode,
3006        explicit_control_type: Option<Type>,
3007    ) -> ParseResult<InstructionData> {
3008        let idata = match opcode.format() {
3009            InstructionFormat::Unary => InstructionData::Unary {
3010                opcode,
3011                arg: self.match_value("expected SSA value operand")?,
3012            },
3013            InstructionFormat::UnaryImm => {
3014                let msg = |bits| format!("expected immediate {bits}-bit integer operand");
3015                let unsigned = match explicit_control_type {
3016                    Some(types::I8) => self.match_imm8(&msg(8))? as u8 as i64,
3017                    Some(types::I16) => self.match_imm16(&msg(16))? as u16 as i64,
3018                    Some(types::I32) => self.match_imm32(&msg(32))? as u32 as i64,
3019                    Some(types::I64) => self.match_imm64(&msg(64))?.bits(),
3020                    _ => {
3021                        return err!(
3022                            self.loc,
3023                            "expected one of the following type: i8, i16, i32 or i64"
3024                        );
3025                    }
3026                };
3027                InstructionData::UnaryImm {
3028                    opcode,
3029                    imm: Imm64::new(unsigned),
3030                }
3031            }
3032            InstructionFormat::UnaryIeee16 => InstructionData::UnaryIeee16 {
3033                opcode,
3034                imm: self.match_ieee16("expected immediate 16-bit float operand")?,
3035            },
3036            InstructionFormat::UnaryIeee32 => InstructionData::UnaryIeee32 {
3037                opcode,
3038                imm: self.match_ieee32("expected immediate 32-bit float operand")?,
3039            },
3040            InstructionFormat::UnaryIeee64 => InstructionData::UnaryIeee64 {
3041                opcode,
3042                imm: self.match_ieee64("expected immediate 64-bit float operand")?,
3043            },
3044            InstructionFormat::UnaryConst => {
3045                let constant_handle = if let Some(Token::Constant(_)) = self.token() {
3046                    // If handed a `const?`, use that.
3047                    let c = self.match_constant()?;
3048                    ctx.check_constant(c, self.loc)?;
3049                    c
3050                } else if opcode == Opcode::F128const {
3051                    let ieee128 = self.match_ieee128("expected immediate 128-bit float operand")?;
3052                    ctx.function.dfg.constants.insert(ieee128.into())
3053                } else if let Some(controlling_type) = explicit_control_type {
3054                    // If an explicit control type is present, we expect a sized value and insert
3055                    // it in the constant pool.
3056                    let uimm128 = self.match_uimm128(controlling_type)?;
3057                    ctx.function.dfg.constants.insert(uimm128)
3058                } else {
3059                    return err!(
3060                        self.loc,
3061                        "Expected either a const entity or a typed value, e.g. inst.i32x4 [...]"
3062                    );
3063                };
3064                InstructionData::UnaryConst {
3065                    opcode,
3066                    constant_handle,
3067                }
3068            }
3069            InstructionFormat::UnaryGlobalValue => {
3070                let gv = self.match_gv("expected global value")?;
3071                ctx.check_gv(gv, self.loc)?;
3072                InstructionData::UnaryGlobalValue {
3073                    opcode,
3074                    global_value: gv,
3075                }
3076            }
3077            InstructionFormat::Binary => {
3078                let lhs = self.match_value("expected SSA value first operand")?;
3079                self.match_token(Token::Comma, "expected ',' between operands")?;
3080                let rhs = self.match_value("expected SSA value second operand")?;
3081                InstructionData::Binary {
3082                    opcode,
3083                    args: [lhs, rhs],
3084                }
3085            }
3086            InstructionFormat::BinaryImm8 => {
3087                let arg = self.match_value("expected SSA value first operand")?;
3088                self.match_token(Token::Comma, "expected ',' between operands")?;
3089                let imm = self.match_uimm8("expected unsigned 8-bit immediate")?;
3090                InstructionData::BinaryImm8 { opcode, arg, imm }
3091            }
3092            InstructionFormat::BinaryImm64 => {
3093                let lhs = self.match_value("expected SSA value first operand")?;
3094                self.match_token(Token::Comma, "expected ',' between operands")?;
3095                let rhs = self.match_imm64("expected immediate integer second operand")?;
3096                InstructionData::BinaryImm64 {
3097                    opcode,
3098                    arg: lhs,
3099                    imm: rhs,
3100                }
3101            }
3102            InstructionFormat::Ternary => {
3103                // Names here refer to the `select` instruction.
3104                // This format is also use by `fma`.
3105                let ctrl_arg = self.match_value("expected SSA value control operand")?;
3106                self.match_token(Token::Comma, "expected ',' between operands")?;
3107                let true_arg = self.match_value("expected SSA value true operand")?;
3108                self.match_token(Token::Comma, "expected ',' between operands")?;
3109                let false_arg = self.match_value("expected SSA value false operand")?;
3110                InstructionData::Ternary {
3111                    opcode,
3112                    args: [ctrl_arg, true_arg, false_arg],
3113                }
3114            }
3115            InstructionFormat::MultiAry => {
3116                let args = self.parse_value_list()?;
3117                InstructionData::MultiAry {
3118                    opcode,
3119                    args: args.into_value_list(&[], &mut ctx.function.dfg.value_lists),
3120                }
3121            }
3122            InstructionFormat::NullAry => InstructionData::NullAry { opcode },
3123            InstructionFormat::Jump => {
3124                // Parse the destination block number.
3125                let block_num = self.match_block("expected jump destination block")?;
3126                let args = self.parse_opt_block_call_args()?;
3127                let destination = ctx.function.dfg.block_call(block_num, &args);
3128                InstructionData::Jump {
3129                    opcode,
3130                    destination,
3131                }
3132            }
3133            InstructionFormat::Brif => {
3134                let arg = self.match_value("expected SSA value control operand")?;
3135                self.match_token(Token::Comma, "expected ',' between operands")?;
3136                let block_then = {
3137                    let block_num = self.match_block("expected branch then block")?;
3138                    let args = self.parse_opt_block_call_args()?;
3139                    ctx.function.dfg.block_call(block_num, &args)
3140                };
3141                self.match_token(Token::Comma, "expected ',' between operands")?;
3142                let block_else = {
3143                    let block_num = self.match_block("expected branch else block")?;
3144                    let args = self.parse_opt_block_call_args()?;
3145                    ctx.function.dfg.block_call(block_num, &args)
3146                };
3147                InstructionData::Brif {
3148                    opcode,
3149                    arg,
3150                    blocks: [block_then, block_else],
3151                }
3152            }
3153            InstructionFormat::BranchTable => {
3154                let arg = self.match_value("expected SSA value operand")?;
3155                self.match_token(Token::Comma, "expected ',' between operands")?;
3156                let block_num = self.match_block("expected branch destination block")?;
3157                let args = self.parse_opt_block_call_args()?;
3158                let destination = ctx.function.dfg.block_call(block_num, &args);
3159                self.match_token(Token::Comma, "expected ',' between operands")?;
3160                let table = self.parse_jump_table(ctx, destination)?;
3161                InstructionData::BranchTable { opcode, arg, table }
3162            }
3163            InstructionFormat::TernaryImm8 => {
3164                let lhs = self.match_value("expected SSA value first operand")?;
3165                self.match_token(Token::Comma, "expected ',' between operands")?;
3166                let rhs = self.match_value("expected SSA value last operand")?;
3167                self.match_token(Token::Comma, "expected ',' between operands")?;
3168                let imm = self.match_uimm8("expected 8-bit immediate")?;
3169                InstructionData::TernaryImm8 {
3170                    opcode,
3171                    imm,
3172                    args: [lhs, rhs],
3173                }
3174            }
3175            InstructionFormat::Shuffle => {
3176                let a = self.match_value("expected SSA value first operand")?;
3177                self.match_token(Token::Comma, "expected ',' between operands")?;
3178                let b = self.match_value("expected SSA value second operand")?;
3179                self.match_token(Token::Comma, "expected ',' between operands")?;
3180                let uimm128 = self.match_uimm128(I8X16)?;
3181                let imm = ctx.function.dfg.immediates.push(uimm128);
3182                InstructionData::Shuffle {
3183                    opcode,
3184                    imm,
3185                    args: [a, b],
3186                }
3187            }
3188            InstructionFormat::IntCompare => {
3189                let cond = self.match_enum("expected intcc condition code")?;
3190                let lhs = self.match_value("expected SSA value first operand")?;
3191                self.match_token(Token::Comma, "expected ',' between operands")?;
3192                let rhs = self.match_value("expected SSA value second operand")?;
3193                InstructionData::IntCompare {
3194                    opcode,
3195                    cond,
3196                    args: [lhs, rhs],
3197                }
3198            }
3199            InstructionFormat::IntCompareImm => {
3200                let cond = self.match_enum("expected intcc condition code")?;
3201                let lhs = self.match_value("expected SSA value first operand")?;
3202                self.match_token(Token::Comma, "expected ',' between operands")?;
3203                let rhs = self.match_imm64("expected immediate second operand")?;
3204                InstructionData::IntCompareImm {
3205                    opcode,
3206                    cond,
3207                    arg: lhs,
3208                    imm: rhs,
3209                }
3210            }
3211            InstructionFormat::FloatCompare => {
3212                let cond = self.match_enum("expected floatcc condition code")?;
3213                let lhs = self.match_value("expected SSA value first operand")?;
3214                self.match_token(Token::Comma, "expected ',' between operands")?;
3215                let rhs = self.match_value("expected SSA value second operand")?;
3216                InstructionData::FloatCompare {
3217                    opcode,
3218                    cond,
3219                    args: [lhs, rhs],
3220                }
3221            }
3222            InstructionFormat::Call => {
3223                let func_ref = self.match_fn("expected function reference")?;
3224                ctx.check_fn(func_ref, self.loc)?;
3225                self.match_token(Token::LPar, "expected '(' before arguments")?;
3226                let args = self.parse_value_list()?;
3227                self.match_token(Token::RPar, "expected ')' after arguments")?;
3228                InstructionData::Call {
3229                    opcode,
3230                    func_ref,
3231                    args: args.into_value_list(&[], &mut ctx.function.dfg.value_lists),
3232                }
3233            }
3234            InstructionFormat::CallIndirect => {
3235                let sig_ref = self.match_sig("expected signature reference")?;
3236                ctx.check_sig(sig_ref, self.loc)?;
3237                self.match_token(Token::Comma, "expected ',' between operands")?;
3238                let callee = self.match_value("expected SSA value callee operand")?;
3239                self.match_token(Token::LPar, "expected '(' before arguments")?;
3240                let args = self.parse_value_list()?;
3241                self.match_token(Token::RPar, "expected ')' after arguments")?;
3242                InstructionData::CallIndirect {
3243                    opcode,
3244                    sig_ref,
3245                    args: args.into_value_list(&[callee], &mut ctx.function.dfg.value_lists),
3246                }
3247            }
3248            InstructionFormat::TryCall => {
3249                let func_ref = self.match_fn("expected function reference")?;
3250                ctx.check_fn(func_ref, self.loc)?;
3251                self.match_token(Token::LPar, "expected '(' before arguments")?;
3252                let args = self.parse_value_list()?;
3253                self.match_token(Token::RPar, "expected ')' after arguments")?;
3254                self.match_token(Token::Comma, "expected ',' after argument list")?;
3255                let exception = self.parse_exception_table(ctx)?;
3256                InstructionData::TryCall {
3257                    opcode,
3258                    func_ref,
3259                    args: args.into_value_list(&[], &mut ctx.function.dfg.value_lists),
3260                    exception,
3261                }
3262            }
3263            InstructionFormat::TryCallIndirect => {
3264                let callee = self.match_value("expected SSA value callee operand")?;
3265                self.match_token(Token::LPar, "expected '(' before arguments")?;
3266                let args = self.parse_value_list()?;
3267                self.match_token(Token::RPar, "expected ')' after arguments")?;
3268                self.match_token(Token::Comma, "expected ',' after argument list")?;
3269                let exception = self.parse_exception_table(ctx)?;
3270                InstructionData::TryCallIndirect {
3271                    opcode,
3272                    args: args.into_value_list(&[callee], &mut ctx.function.dfg.value_lists),
3273                    exception,
3274                }
3275            }
3276            InstructionFormat::FuncAddr => {
3277                let func_ref = self.match_fn("expected function reference")?;
3278                ctx.check_fn(func_ref, self.loc)?;
3279                InstructionData::FuncAddr { opcode, func_ref }
3280            }
3281            InstructionFormat::StackLoad => {
3282                let ss = self.match_ss("expected stack slot number: ss«n»")?;
3283                ctx.check_ss(ss, self.loc)?;
3284                let offset = self.optional_offset32()?;
3285                InstructionData::StackLoad {
3286                    opcode,
3287                    stack_slot: ss,
3288                    offset,
3289                }
3290            }
3291            InstructionFormat::StackStore => {
3292                let arg = self.match_value("expected SSA value operand")?;
3293                self.match_token(Token::Comma, "expected ',' between operands")?;
3294                let ss = self.match_ss("expected stack slot number: ss«n»")?;
3295                ctx.check_ss(ss, self.loc)?;
3296                let offset = self.optional_offset32()?;
3297                InstructionData::StackStore {
3298                    opcode,
3299                    arg,
3300                    stack_slot: ss,
3301                    offset,
3302                }
3303            }
3304            InstructionFormat::DynamicStackLoad => {
3305                let dss = self.match_dss("expected dynamic stack slot number: dss«n»")?;
3306                ctx.check_dss(dss, self.loc)?;
3307                InstructionData::DynamicStackLoad {
3308                    opcode,
3309                    dynamic_stack_slot: dss,
3310                }
3311            }
3312            InstructionFormat::DynamicStackStore => {
3313                let arg = self.match_value("expected SSA value operand")?;
3314                self.match_token(Token::Comma, "expected ',' between operands")?;
3315                let dss = self.match_dss("expected dynamic stack slot number: dss«n»")?;
3316                ctx.check_dss(dss, self.loc)?;
3317                InstructionData::DynamicStackStore {
3318                    opcode,
3319                    arg,
3320                    dynamic_stack_slot: dss,
3321                }
3322            }
3323            InstructionFormat::Load => {
3324                let flags = self.optional_memflags()?;
3325                let addr = self.match_value("expected SSA value address")?;
3326                let offset = self.optional_offset32()?;
3327                InstructionData::Load {
3328                    opcode,
3329                    flags,
3330                    arg: addr,
3331                    offset,
3332                }
3333            }
3334            InstructionFormat::Store => {
3335                let flags = self.optional_memflags()?;
3336                let arg = self.match_value("expected SSA value operand")?;
3337                self.match_token(Token::Comma, "expected ',' between operands")?;
3338                let addr = self.match_value("expected SSA value address")?;
3339                let offset = self.optional_offset32()?;
3340                InstructionData::Store {
3341                    opcode,
3342                    flags,
3343                    args: [arg, addr],
3344                    offset,
3345                }
3346            }
3347            InstructionFormat::Trap => {
3348                let code = self.match_enum("expected trap code")?;
3349                InstructionData::Trap { opcode, code }
3350            }
3351            InstructionFormat::CondTrap => {
3352                let arg = self.match_value("expected SSA value operand")?;
3353                self.match_token(Token::Comma, "expected ',' between operands")?;
3354                let code = self.match_enum("expected trap code")?;
3355                InstructionData::CondTrap { opcode, arg, code }
3356            }
3357            InstructionFormat::AtomicCas => {
3358                let flags = self.optional_memflags()?;
3359                let addr = self.match_value("expected SSA value address")?;
3360                self.match_token(Token::Comma, "expected ',' between operands")?;
3361                let expected = self.match_value("expected SSA value address")?;
3362                self.match_token(Token::Comma, "expected ',' between operands")?;
3363                let replacement = self.match_value("expected SSA value address")?;
3364                InstructionData::AtomicCas {
3365                    opcode,
3366                    flags,
3367                    args: [addr, expected, replacement],
3368                }
3369            }
3370            InstructionFormat::AtomicRmw => {
3371                let flags = self.optional_memflags()?;
3372                let op = self.match_enum("expected AtomicRmwOp")?;
3373                let addr = self.match_value("expected SSA value address")?;
3374                self.match_token(Token::Comma, "expected ',' between operands")?;
3375                let arg2 = self.match_value("expected SSA value address")?;
3376                InstructionData::AtomicRmw {
3377                    opcode,
3378                    flags,
3379                    op,
3380                    args: [addr, arg2],
3381                }
3382            }
3383            InstructionFormat::LoadNoOffset => {
3384                let flags = self.optional_memflags()?;
3385                let addr = self.match_value("expected SSA value address")?;
3386                InstructionData::LoadNoOffset {
3387                    opcode,
3388                    flags,
3389                    arg: addr,
3390                }
3391            }
3392            InstructionFormat::StoreNoOffset => {
3393                let flags = self.optional_memflags()?;
3394                let arg = self.match_value("expected SSA value operand")?;
3395                self.match_token(Token::Comma, "expected ',' between operands")?;
3396                let addr = self.match_value("expected SSA value address")?;
3397                InstructionData::StoreNoOffset {
3398                    opcode,
3399                    flags,
3400                    args: [arg, addr],
3401                }
3402            }
3403            InstructionFormat::IntAddTrap => {
3404                let a = self.match_value("expected SSA value operand")?;
3405                self.match_token(Token::Comma, "expected ',' between operands")?;
3406                let b = self.match_value("expected SSA value operand")?;
3407                self.match_token(Token::Comma, "expected ',' between operands")?;
3408                let code = self.match_enum("expected trap code")?;
3409                InstructionData::IntAddTrap {
3410                    opcode,
3411                    args: [a, b],
3412                    code,
3413                }
3414            }
3415            InstructionFormat::ExceptionHandlerAddress => {
3416                let block = self.match_block("expected block")?;
3417                self.match_token(Token::Comma, "expected ',' between operands")?;
3418                let imm = self.match_imm64("expected immediate handler index")?;
3419                InstructionData::ExceptionHandlerAddress { opcode, block, imm }
3420            }
3421        };
3422        Ok(idata)
3423    }
3424}
3425
3426#[cfg(test)]
3427mod tests {
3428    use super::*;
3429    use crate::isaspec::IsaSpec;
3430
3431    #[test]
3432    fn argument_type() {
3433        let mut p = Parser::new("i32 sext");
3434        let arg = p.parse_abi_param().unwrap();
3435        assert_eq!(arg.value_type, types::I32);
3436        assert_eq!(arg.extension, ArgumentExtension::Sext);
3437        assert_eq!(arg.purpose, ArgumentPurpose::Normal);
3438        let ParseError {
3439            location,
3440            message,
3441            is_warning,
3442        } = p.parse_abi_param().unwrap_err();
3443        assert_eq!(location.line_number, 1);
3444        assert_eq!(message, "expected parameter type");
3445        assert!(!is_warning);
3446    }
3447
3448    #[test]
3449    fn aliases() {
3450        let (func, details) = Parser::new(
3451            "function %qux() system_v {
3452                                           block0:
3453                                             v4 = iconst.i8 6
3454                                             v3 -> v4
3455                                             v1 = iadd_imm v3, 17
3456                                           }",
3457        )
3458        .parse_function()
3459        .unwrap();
3460        assert_eq!(func.name.to_string(), "%qux");
3461        let v4 = details.map.lookup_str("v4").unwrap();
3462        assert_eq!(v4.to_string(), "v4");
3463        let v3 = details.map.lookup_str("v3").unwrap();
3464        assert_eq!(v3.to_string(), "v3");
3465        match v3 {
3466            AnyEntity::Value(v3) => {
3467                let aliased_to = func.dfg.resolve_aliases(v3);
3468                assert_eq!(aliased_to.to_string(), "v4");
3469            }
3470            _ => panic!("expected value: {v3}"),
3471        }
3472    }
3473
3474    #[test]
3475    fn signature() {
3476        let sig = Parser::new("()system_v").parse_signature().unwrap();
3477        assert_eq!(sig.params.len(), 0);
3478        assert_eq!(sig.returns.len(), 0);
3479        assert_eq!(sig.call_conv, CallConv::SystemV);
3480
3481        let sig2 =
3482            Parser::new("(i8 uext, f16, f32, f64, f128, i32 sret) -> i32 sext, f64 system_v")
3483                .parse_signature()
3484                .unwrap();
3485        assert_eq!(
3486            sig2.to_string(),
3487            "(i8 uext, f16, f32, f64, f128, i32 sret) -> i32 sext, f64 system_v"
3488        );
3489        assert_eq!(sig2.call_conv, CallConv::SystemV);
3490
3491        // Old-style signature without a calling convention.
3492        assert_eq!(
3493            Parser::new("()").parse_signature().unwrap().to_string(),
3494            "() fast"
3495        );
3496        assert_eq!(
3497            Parser::new("() notacc")
3498                .parse_signature()
3499                .unwrap_err()
3500                .to_string(),
3501            "1: unknown calling convention: notacc"
3502        );
3503
3504        // `void` is not recognized as a type by the lexer. It should not appear in files.
3505        assert_eq!(
3506            Parser::new("() -> void")
3507                .parse_signature()
3508                .unwrap_err()
3509                .to_string(),
3510            "1: expected parameter type"
3511        );
3512        assert_eq!(
3513            Parser::new("i8 -> i8")
3514                .parse_signature()
3515                .unwrap_err()
3516                .to_string(),
3517            "1: expected function signature: ( args... )"
3518        );
3519        assert_eq!(
3520            Parser::new("(i8 -> i8")
3521                .parse_signature()
3522                .unwrap_err()
3523                .to_string(),
3524            "1: expected ')' after function arguments"
3525        );
3526    }
3527
3528    #[test]
3529    fn stack_slot_decl() {
3530        let (func, _) = Parser::new(
3531            "function %foo() system_v {
3532                                       ss3 = explicit_slot 13
3533                                       ss1 = explicit_slot 1
3534                                     }",
3535        )
3536        .parse_function()
3537        .unwrap();
3538        assert_eq!(func.name.to_string(), "%foo");
3539        let mut iter = func.sized_stack_slots.keys();
3540        let _ss0 = iter.next().unwrap();
3541        let ss1 = iter.next().unwrap();
3542        assert_eq!(ss1.to_string(), "ss1");
3543        assert_eq!(
3544            func.sized_stack_slots[ss1].kind,
3545            StackSlotKind::ExplicitSlot
3546        );
3547        assert_eq!(func.sized_stack_slots[ss1].size, 1);
3548        let _ss2 = iter.next().unwrap();
3549        let ss3 = iter.next().unwrap();
3550        assert_eq!(ss3.to_string(), "ss3");
3551        assert_eq!(
3552            func.sized_stack_slots[ss3].kind,
3553            StackSlotKind::ExplicitSlot
3554        );
3555        assert_eq!(func.sized_stack_slots[ss3].size, 13);
3556        assert_eq!(iter.next(), None);
3557
3558        // Catch duplicate definitions.
3559        assert_eq!(
3560            Parser::new(
3561                "function %bar() system_v {
3562                                    ss1  = explicit_slot 13
3563                                    ss1  = explicit_slot 1
3564                                }",
3565            )
3566            .parse_function()
3567            .unwrap_err()
3568            .to_string(),
3569            "3: duplicate entity: ss1"
3570        );
3571    }
3572
3573    #[test]
3574    fn block_header() {
3575        let (func, _) = Parser::new(
3576            "function %blocks() system_v {
3577                                     block0:
3578                                     block4(v3: i32):
3579                                     }",
3580        )
3581        .parse_function()
3582        .unwrap();
3583        assert_eq!(func.name.to_string(), "%blocks");
3584
3585        let mut blocks = func.layout.blocks();
3586
3587        let block0 = blocks.next().unwrap();
3588        assert_eq!(func.dfg.block_params(block0), &[]);
3589
3590        let block4 = blocks.next().unwrap();
3591        let block4_args = func.dfg.block_params(block4);
3592        assert_eq!(block4_args.len(), 1);
3593        assert_eq!(func.dfg.value_type(block4_args[0]), types::I32);
3594    }
3595
3596    #[test]
3597    fn duplicate_block() {
3598        let ParseError {
3599            location,
3600            message,
3601            is_warning,
3602        } = Parser::new(
3603            "function %blocks() system_v {
3604                block0:
3605                block0:
3606                    return 2",
3607        )
3608        .parse_function()
3609        .unwrap_err();
3610
3611        assert_eq!(location.line_number, 3);
3612        assert_eq!(message, "duplicate entity: block0");
3613        assert!(!is_warning);
3614    }
3615
3616    #[test]
3617    fn number_of_blocks() {
3618        let ParseError {
3619            location,
3620            message,
3621            is_warning,
3622        } = Parser::new(
3623            "function %a() {
3624                block100000:",
3625        )
3626        .parse_function()
3627        .unwrap_err();
3628
3629        assert_eq!(location.line_number, 2);
3630        assert_eq!(message, "too many blocks");
3631        assert!(!is_warning);
3632    }
3633
3634    #[test]
3635    fn duplicate_ss() {
3636        let ParseError {
3637            location,
3638            message,
3639            is_warning,
3640        } = Parser::new(
3641            "function %blocks() system_v {
3642                ss0 = explicit_slot 8
3643                ss0 = explicit_slot 8",
3644        )
3645        .parse_function()
3646        .unwrap_err();
3647
3648        assert_eq!(location.line_number, 3);
3649        assert_eq!(message, "duplicate entity: ss0");
3650        assert!(!is_warning);
3651    }
3652
3653    #[test]
3654    fn duplicate_gv() {
3655        let ParseError {
3656            location,
3657            message,
3658            is_warning,
3659        } = Parser::new(
3660            "function %blocks() system_v {
3661                gv0 = vmctx
3662                gv0 = vmctx",
3663        )
3664        .parse_function()
3665        .unwrap_err();
3666
3667        assert_eq!(location.line_number, 3);
3668        assert_eq!(message, "duplicate entity: gv0");
3669        assert!(!is_warning);
3670    }
3671
3672    #[test]
3673    fn duplicate_sig() {
3674        let ParseError {
3675            location,
3676            message,
3677            is_warning,
3678        } = Parser::new(
3679            "function %blocks() system_v {
3680                sig0 = ()
3681                sig0 = ()",
3682        )
3683        .parse_function()
3684        .unwrap_err();
3685
3686        assert_eq!(location.line_number, 3);
3687        assert_eq!(message, "duplicate entity: sig0");
3688        assert!(!is_warning);
3689    }
3690
3691    #[test]
3692    fn duplicate_fn() {
3693        let ParseError {
3694            location,
3695            message,
3696            is_warning,
3697        } = Parser::new(
3698            "function %blocks() system_v {
3699                sig0 = ()
3700                fn0 = %foo sig0
3701                fn0 = %foo sig0",
3702        )
3703        .parse_function()
3704        .unwrap_err();
3705
3706        assert_eq!(location.line_number, 4);
3707        assert_eq!(message, "duplicate entity: fn0");
3708        assert!(!is_warning);
3709    }
3710
3711    #[test]
3712    fn comments() {
3713        let (func, Details { comments, .. }) = Parser::new(
3714            "; before
3715                         function %comment() system_v { ; decl
3716                            ss10  = explicit_slot 13 ; stackslot.
3717                            ; Still stackslot.
3718                         block0: ; Basic block
3719                         trap user42; Instruction
3720                         } ; Trailing.
3721                         ; More trailing.",
3722        )
3723        .parse_function()
3724        .unwrap();
3725        assert_eq!(func.name.to_string(), "%comment");
3726        assert_eq!(comments.len(), 7); // no 'before' comment.
3727        assert_eq!(
3728            comments[0],
3729            Comment {
3730                entity: AnyEntity::Function,
3731                text: "; decl",
3732            }
3733        );
3734        assert_eq!(comments[1].entity.to_string(), "ss10");
3735        assert_eq!(comments[2].entity.to_string(), "ss10");
3736        assert_eq!(comments[2].text, "; Still stackslot.");
3737        assert_eq!(comments[3].entity.to_string(), "block0");
3738        assert_eq!(comments[3].text, "; Basic block");
3739
3740        assert_eq!(comments[4].entity.to_string(), "inst0");
3741        assert_eq!(comments[4].text, "; Instruction");
3742
3743        assert_eq!(comments[5].entity, AnyEntity::Function);
3744        assert_eq!(comments[6].entity, AnyEntity::Function);
3745    }
3746
3747    #[test]
3748    fn test_file() {
3749        let tf = parse_test(
3750            r#"; before
3751                             test cfg option=5
3752                             test verify
3753                             set unwind_info=false
3754                             feature "foo"
3755                             feature !"bar"
3756                             ; still preamble
3757                             function %comment() system_v {}"#,
3758            ParseOptions::default(),
3759        )
3760        .unwrap();
3761        assert_eq!(tf.commands.len(), 2);
3762        assert_eq!(tf.commands[0].command, "cfg");
3763        assert_eq!(tf.commands[1].command, "verify");
3764        match tf.isa_spec {
3765            IsaSpec::None(s) => {
3766                assert!(s.enable_verifier());
3767                assert!(!s.unwind_info());
3768            }
3769            _ => panic!("unexpected ISAs"),
3770        }
3771        assert_eq!(tf.features[0], Feature::With(&"foo"));
3772        assert_eq!(tf.features[1], Feature::Without(&"bar"));
3773        assert_eq!(tf.preamble_comments.len(), 2);
3774        assert_eq!(tf.preamble_comments[0].text, "; before");
3775        assert_eq!(tf.preamble_comments[1].text, "; still preamble");
3776        assert_eq!(tf.functions.len(), 1);
3777        assert_eq!(tf.functions[0].0.name.to_string(), "%comment");
3778    }
3779
3780    #[test]
3781    fn isa_spec() {
3782        assert!(
3783            parse_test(
3784                "target
3785                            function %foo() system_v {}",
3786                ParseOptions::default()
3787            )
3788            .is_err()
3789        );
3790
3791        assert!(
3792            parse_test(
3793                "target x86_64
3794                            set unwind_info=false
3795                            function %foo() system_v {}",
3796                ParseOptions::default()
3797            )
3798            .is_err()
3799        );
3800
3801        match parse_test(
3802            "set unwind_info=false
3803                          target x86_64
3804                          function %foo() system_v {}",
3805            ParseOptions::default(),
3806        )
3807        .unwrap()
3808        .isa_spec
3809        {
3810            IsaSpec::None(_) => panic!("Expected some ISA"),
3811            IsaSpec::Some(v) => {
3812                assert_eq!(v.len(), 1);
3813                assert!(v[0].name() == "x64" || v[0].name() == "x86");
3814            }
3815        }
3816    }
3817
3818    #[test]
3819    fn user_function_name() {
3820        // Valid characters in the name:
3821        let func = Parser::new(
3822            "function u1:2() system_v {
3823                                           block0:
3824                                             trap int_divz
3825                                           }",
3826        )
3827        .parse_function()
3828        .unwrap()
3829        .0;
3830        assert_eq!(func.name.to_string(), "u1:2");
3831
3832        // Invalid characters in the name:
3833        let mut parser = Parser::new(
3834            "function u123:abc() system_v {
3835                                           block0:
3836                                             trap stk_ovf
3837                                           }",
3838        );
3839        assert!(parser.parse_function().is_err());
3840
3841        // Incomplete function names should not be valid:
3842        let mut parser = Parser::new(
3843            "function u() system_v {
3844                                           block0:
3845                                             trap int_ovf
3846                                           }",
3847        );
3848        assert!(parser.parse_function().is_err());
3849
3850        let mut parser = Parser::new(
3851            "function u0() system_v {
3852                                           block0:
3853                                             trap int_ovf
3854                                           }",
3855        );
3856        assert!(parser.parse_function().is_err());
3857
3858        let mut parser = Parser::new(
3859            "function u0:() system_v {
3860                                           block0:
3861                                             trap int_ovf
3862                                           }",
3863        );
3864        assert!(parser.parse_function().is_err());
3865    }
3866
3867    #[test]
3868    fn change_default_calling_convention() {
3869        let code = "function %test() {
3870        block0:
3871            return
3872        }";
3873
3874        // By default the parser will use the fast calling convention if none is specified.
3875        let mut parser = Parser::new(code);
3876        assert_eq!(
3877            parser.parse_function().unwrap().0.signature.call_conv,
3878            CallConv::Fast
3879        );
3880
3881        // However, we can specify a different calling convention to be the default.
3882        let mut parser = Parser::new(code).with_default_calling_convention(CallConv::PreserveAll);
3883        assert_eq!(
3884            parser.parse_function().unwrap().0.signature.call_conv,
3885            CallConv::PreserveAll
3886        );
3887    }
3888
3889    #[test]
3890    fn u8_as_hex() {
3891        fn parse_as_uimm8(text: &str) -> ParseResult<u8> {
3892            Parser::new(text).match_uimm8("unable to parse u8")
3893        }
3894
3895        assert_eq!(parse_as_uimm8("0").unwrap(), 0);
3896        assert_eq!(parse_as_uimm8("0xff").unwrap(), 255);
3897        assert!(parse_as_uimm8("-1").is_err());
3898        assert!(parse_as_uimm8("0xffa").is_err());
3899    }
3900
3901    #[test]
3902    fn i16_as_hex() {
3903        fn parse_as_imm16(text: &str) -> ParseResult<i16> {
3904            Parser::new(text).match_imm16("unable to parse i16")
3905        }
3906
3907        assert_eq!(parse_as_imm16("0x8000").unwrap(), -32768);
3908        assert_eq!(parse_as_imm16("0xffff").unwrap(), -1);
3909        assert_eq!(parse_as_imm16("0").unwrap(), 0);
3910        assert_eq!(parse_as_imm16("0x7fff").unwrap(), 32767);
3911        assert_eq!(
3912            parse_as_imm16("-0x0001").unwrap(),
3913            parse_as_imm16("0xffff").unwrap()
3914        );
3915        assert_eq!(
3916            parse_as_imm16("-0x7fff").unwrap(),
3917            parse_as_imm16("0x8001").unwrap()
3918        );
3919        assert!(parse_as_imm16("0xffffa").is_err());
3920    }
3921
3922    #[test]
3923    fn i32_as_hex() {
3924        fn parse_as_imm32(text: &str) -> ParseResult<i32> {
3925            Parser::new(text).match_imm32("unable to parse i32")
3926        }
3927
3928        assert_eq!(parse_as_imm32("0x80000000").unwrap(), -2147483648);
3929        assert_eq!(parse_as_imm32("0xffffffff").unwrap(), -1);
3930        assert_eq!(parse_as_imm32("0").unwrap(), 0);
3931        assert_eq!(parse_as_imm32("0x7fffffff").unwrap(), 2147483647);
3932        assert_eq!(
3933            parse_as_imm32("-0x00000001").unwrap(),
3934            parse_as_imm32("0xffffffff").unwrap()
3935        );
3936        assert_eq!(
3937            parse_as_imm32("-0x7fffffff").unwrap(),
3938            parse_as_imm32("0x80000001").unwrap()
3939        );
3940        assert!(parse_as_imm32("0xffffffffa").is_err());
3941    }
3942
3943    #[test]
3944    fn i64_as_hex() {
3945        fn parse_as_imm64(text: &str) -> ParseResult<Imm64> {
3946            Parser::new(text).match_imm64("unable to parse Imm64")
3947        }
3948
3949        assert_eq!(
3950            parse_as_imm64("0x8000000000000000").unwrap(),
3951            Imm64::new(-9223372036854775808)
3952        );
3953        assert_eq!(
3954            parse_as_imm64("0xffffffffffffffff").unwrap(),
3955            Imm64::new(-1)
3956        );
3957        assert_eq!(parse_as_imm64("0").unwrap(), Imm64::new(0));
3958        assert_eq!(
3959            parse_as_imm64("0x7fffffffffffffff").unwrap(),
3960            Imm64::new(9223372036854775807)
3961        );
3962        assert_eq!(
3963            parse_as_imm64("-0x0000000000000001").unwrap(),
3964            parse_as_imm64("0xffffffffffffffff").unwrap()
3965        );
3966        assert_eq!(
3967            parse_as_imm64("-0x7fffffffffffffff").unwrap(),
3968            parse_as_imm64("0x8000000000000001").unwrap()
3969        );
3970        assert!(parse_as_imm64("0xffffffffffffffffa").is_err());
3971    }
3972
3973    #[test]
3974    fn uimm128() {
3975        macro_rules! parse_as_constant_data {
3976            ($text:expr, $type:expr) => {{ Parser::new($text).parse_literals_to_constant_data($type) }};
3977        }
3978        macro_rules! can_parse_as_constant_data {
3979            ($text:expr, $type:expr) => {{ assert!(parse_as_constant_data!($text, $type).is_ok()) }};
3980        }
3981        macro_rules! cannot_parse_as_constant_data {
3982            ($text:expr, $type:expr) => {{ assert!(parse_as_constant_data!($text, $type).is_err()) }};
3983        }
3984
3985        can_parse_as_constant_data!("1 2 3 4", I32X4);
3986        can_parse_as_constant_data!("1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16", I8X16);
3987        can_parse_as_constant_data!("0x1.1 0x2.2 0x3.3 0x4.4", F32X4);
3988        can_parse_as_constant_data!("0x0 0x1 0x2 0x3", I32X4);
3989        can_parse_as_constant_data!("-1 0 -1 0 -1 0 -1 0", I16X8);
3990        can_parse_as_constant_data!("0 -1", I64X2);
3991        can_parse_as_constant_data!("-1 0", I64X2);
3992        can_parse_as_constant_data!("-1 -1 -1 -1 -1", I32X4); // note that parse_literals_to_constant_data will leave extra tokens unconsumed
3993
3994        cannot_parse_as_constant_data!("1 2 3", I32X4);
3995        cannot_parse_as_constant_data!(" ", F32X4);
3996    }
3997
3998    #[test]
3999    fn parse_constant_from_booleans() {
4000        let c = Parser::new("-1 0 -1 0")
4001            .parse_literals_to_constant_data(I32X4)
4002            .unwrap();
4003        assert_eq!(
4004            c.into_vec(),
4005            [
4006                0xFF, 0xFF, 0xFF, 0xFF, 0, 0, 0, 0, 0xFF, 0xFF, 0xFF, 0xFF, 0, 0, 0, 0
4007            ]
4008        )
4009    }
4010
4011    #[test]
4012    fn parse_unbounded_constants() {
4013        // Unlike match_uimm128, match_hexadecimal_constant can parse byte sequences of any size:
4014        assert_eq!(
4015            Parser::new("0x0100")
4016                .match_hexadecimal_constant("err message")
4017                .unwrap(),
4018            vec![0, 1].into()
4019        );
4020
4021        // Only parse hexadecimal constants:
4022        assert!(
4023            Parser::new("228")
4024                .match_hexadecimal_constant("err message")
4025                .is_err()
4026        );
4027    }
4028
4029    #[test]
4030    fn parse_run_commands() {
4031        // Helper for creating signatures.
4032        fn sig(ins: &[Type], outs: &[Type]) -> Signature {
4033            let mut sig = Signature::new(CallConv::Fast);
4034            for i in ins {
4035                sig.params.push(AbiParam::new(*i));
4036            }
4037            for o in outs {
4038                sig.returns.push(AbiParam::new(*o));
4039            }
4040            sig
4041        }
4042
4043        // Helper for parsing run commands.
4044        fn parse(text: &str, sig: &Signature) -> ParseResult<RunCommand> {
4045            Parser::new(text).parse_run_command(sig)
4046        }
4047
4048        // Check that we can parse and display the same set of run commands.
4049        fn assert_roundtrip(text: &str, sig: &Signature) {
4050            assert_eq!(parse(text, sig).unwrap().to_string(), text);
4051        }
4052        assert_roundtrip("run: %fn0() == 42", &sig(&[], &[I32]));
4053        assert_roundtrip(
4054            "run: %fn0(8, 16, 32, 64) == 1",
4055            &sig(&[I8, I16, I32, I64], &[I8]),
4056        );
4057        assert_roundtrip(
4058            "run: %my_func(1) == 0x0f0e0d0c0b0a09080706050403020100",
4059            &sig(&[I32], &[I8X16]),
4060        );
4061
4062        // Verify that default invocations are created when not specified.
4063        assert_eq!(
4064            parse("run", &sig(&[], &[I32])).unwrap().to_string(),
4065            "run: %default() != 0"
4066        );
4067        assert_eq!(
4068            parse("print", &sig(&[], &[F32X4, I16X8]))
4069                .unwrap()
4070                .to_string(),
4071            "print: %default()"
4072        );
4073
4074        // Demonstrate some unparsable cases.
4075        assert!(parse("print", &sig(&[I32], &[I32])).is_err());
4076        assert!(parse("print:", &sig(&[], &[])).is_err());
4077        assert!(parse("run: ", &sig(&[], &[])).is_err());
4078    }
4079
4080    #[test]
4081    fn parse_data_values() {
4082        fn parse(text: &str, ty: Type) -> DataValue {
4083            Parser::new(text).parse_data_value(ty).unwrap()
4084        }
4085
4086        assert_eq!(parse("8", I8).to_string(), "8");
4087        assert_eq!(parse("16", I16).to_string(), "16");
4088        assert_eq!(parse("32", I32).to_string(), "32");
4089        assert_eq!(parse("64", I64).to_string(), "64");
4090        assert_eq!(
4091            parse("0x01234567_01234567_01234567_01234567", I128).to_string(),
4092            "1512366032949150931280199141537564007"
4093        );
4094        assert_eq!(parse("1234567", I128).to_string(), "1234567");
4095        assert_eq!(parse("0x16.1", F16).to_string(), "0x1.610p4");
4096        assert_eq!(parse("0x32.32", F32).to_string(), "0x1.919000p5");
4097        assert_eq!(parse("0x64.64", F64).to_string(), "0x1.9190000000000p6");
4098        assert_eq!(
4099            parse("0x128.128", F128).to_string(),
4100            "0x1.2812800000000000000000000000p8"
4101        );
4102        assert_eq!(
4103            parse("[0 1 2 3]", I32X4).to_string(),
4104            "0x00000003000000020000000100000000"
4105        );
4106        assert_eq!(parse("[1 2]", I32X2).to_string(), "0x0000000200000001");
4107        assert_eq!(parse("[1 2 3 4]", I8X4).to_string(), "0x04030201");
4108        assert_eq!(parse("[1 2]", I8X2).to_string(), "0x0201");
4109    }
4110
4111    #[test]
4112    fn parse_cold_blocks() {
4113        let code = "function %test() {
4114        block0 cold:
4115            return
4116        block1(v0: i32) cold:
4117            return
4118        block2(v1: i32):
4119            return
4120        }";
4121
4122        let mut parser = Parser::new(code);
4123        let func = parser.parse_function().unwrap().0;
4124        assert_eq!(func.layout.blocks().count(), 3);
4125        assert!(func.layout.is_cold(Block::from_u32(0)));
4126        assert!(func.layout.is_cold(Block::from_u32(1)));
4127        assert!(!func.layout.is_cold(Block::from_u32(2)));
4128    }
4129}