/- Copyright (c) 2019 Microsoft Corporation. All rights reserved. Released under Apache 2.0 license as described in the file LICENSE. Authors: Sebastian Ullrich Elaboration of syntax quotations as terms and patterns (in `match_syntax`). See also `./Hygiene.lean` for the basic hygiene workings and data types. -/ import Lean.Syntax import Lean.Elab.ResolveName import Lean.Elab.Term import Lean.Parser -- TODO: remove after removing old elaborator /- TODO Quotations are currently integrated hackily into the old frontend. This implies the following restrictions: * quotations have to fit in a single line, because that's how the old scanner works :) * `open` commands are not respected (but `export`, `namespace` are) * antiquotation terms have to be trivial (locals, consts (w/ projections), and apps, basically) After removing the old frontend, quotations in this and other files should be cleaned up. -/ namespace Lean namespace Elab namespace Term namespace Quotation -- antiquotation node kinds are formed from the original node kind (if any) plus "antiquot" def isAntiquot : Syntax → Bool | Syntax.node (Name.str _ "antiquot" _) _ => true | _ => false -- Antiquotations can be escaped as in `$$x`, which is useful for nesting macros. def isEscapedAntiquot (stx : Syntax) : Bool := !(stx.getArg 1).getArgs.isEmpty def unescapeAntiquot (stx : Syntax) : Syntax := if isAntiquot stx then stx.setArg 1 $ mkNullNode (stx.getArg 1).getArgs.pop else stx def getAntiquotTerm (stx : Syntax) : Syntax := let e := stx.getArg 2; if e.isIdent then mkTermIdFromIdent e else -- `e` is from `"(" >> termParser >> ")"` e.getArg 1 def antiquotKind? : Syntax → Option SyntaxNodeKind | Syntax.node (Name.str k "antiquot" _) args => if (args.get! 3).isOfKind `antiquotName then some k else -- we treat all antiquotations where the kind was left implicit (`$e`) the same (see `elimAntiquotChoices`) some Name.anonymous | _ => none -- `$e*` is an antiquotation "splice" matching an arbitrary number of syntax nodes def isAntiquotSplice (stx : Syntax) : Bool := isAntiquot stx && (stx.getArg 4).getOptional?.isSome -- If any item of a `many` node is an antiquotation splice, its result should -- be substituted into the `many` node's children def isAntiquotSplicePat (stx : Syntax) : Bool := stx.isOfKind nullKind && stx.getArgs.any (fun arg => isAntiquotSplice arg && !isEscapedAntiquot arg) /-- A term like `($e) is actually ambiguous: the antiquotation could be of kind `term`, or `ident`, or ... . But it shouldn't really matter because antiquotations without explicit kinds behave the same at runtime. So we replace `choice` nodes that contain at least one implicit antiquotation with that antiquotation. -/ private partial def elimAntiquotChoices : Syntax → Syntax | Syntax.node `choice args => match args.find? (fun arg => antiquotKind? arg == Name.anonymous) with | some anti => anti | none => Syntax.node `choice $ args.map elimAntiquotChoices | Syntax.node k args => Syntax.node k $ args.map elimAntiquotChoices | stx => stx -- Elaborate the content of a syntax quotation term private partial def quoteSyntax : Syntax → TermElabM Syntax | Syntax.ident info rawVal val preresolved => do -- Add global scopes at compilation time (now), add macro scope at runtime (in the quotation). -- See the paper for details. r ← resolveGlobalName val; let preresolved := r ++ preresolved; let val := quote val; -- `scp` is bound in stxQuot.expand `(Syntax.ident (SourceInfo.mk none none none) $(quote rawVal) (addMacroScope mainModule $val scp) $(quote preresolved)) -- if antiquotation, insert contents as-is, else recurse | stx@(Syntax.node k _) => if isAntiquot stx && !isEscapedAntiquot stx then -- splices must occur in a `many` node if isAntiquotSplice stx then throwErrorAt stx "unexpected antiquotation splice" else pure $ getAntiquotTerm stx else do empty ← `(Array.empty); -- if escaped antiquotation, decrement by one escape level let stx := unescapeAntiquot stx; args ← stx.getArgs.foldlM (fun args arg => if k == nullKind && isAntiquotSplice arg then -- antiquotation splice pattern: inject args array `(Array.append $args $(getAntiquotTerm arg)) else do arg ← quoteSyntax arg; `(Array.push $args $arg)) empty; `(Syntax.node $(quote k) $args) | Syntax.atom info val => `(Syntax.atom (SourceInfo.mk none none none) $(quote val)) | Syntax.missing => unreachable! def stxQuot.expand (stx : Syntax) : TermElabM Syntax := do let quoted := stx.getArg 1; /- Syntax quotations are monadic values depending on the current macro scope. For efficiency, we bind the macro scope once for each quotation, then build the syntax tree in a completely pure computation depending on this binding. Note that regular function calls do not introduce a new macro scope (i.e. we preserve referential transparency), so we can refer to this same `scp` inside `quoteSyntax` by including it literally in a syntax quotation. -/ -- TODO: simplify to `(do scp ← getCurrMacroScope; pure $(quoteSyntax quoted)) stx ← quoteSyntax (elimAntiquotChoices quoted); `(bind getCurrMacroScope (fun scp => bind getMainModule (fun mainModule => pure $stx))) /- NOTE: It may seem like the newly introduced binding `scp` may accidentally capture identifiers in an antiquotation introduced by `quoteSyntax`. However, note that the syntax quotation above enjoys the same hygiene guarantees as anywhere else in Lean; that is, we implement hygienic quotations by making use of the hygienic quotation support of the bootstrapped Lean compiler! Aside: While this might sound "dangerous", it is in fact less reliant on a "chain of trust" than other bootstrapping parts of Lean: because this implementation itself never uses `scp` (or any other identifier) both inside and outside quotations, it can actually correctly be compiled by an unhygienic (but otherwise correct) implementation of syntax quotations. As long as it is then compiled again with the resulting executable (i.e. up to stage 2), the result is a correct hygienic implementation. In this sense the implementation is "self-stabilizing". It was in fact originally compiled by an unhygienic prototype implementation. -/ @[builtinTermElab stxQuot] def elabStxQuot : TermElab := adaptExpander stxQuot.expand /- match_syntax -/ -- an "alternative" of patterns plus right-hand side private abbrev Alt := List Syntax × Syntax /-- Information on a pattern's head that influences the compilation of a single match step. -/ structure HeadInfo := -- Node kind to match, if any (kind : Option SyntaxNodeKind := none) -- Nested patterns for each argument, if any. In a single match step, we only -- check that the arity matches. The arity is usually implied by the node kind, -- but not in the case of `many` nodes. (argPats : Option (Array Syntax) := none) -- Function to apply to the right-hand side in case the match succeeds. Used to -- bind pattern variables. (rhsFn : Syntax → TermElabM Syntax := pure) instance HeadInfo.Inhabited : Inhabited HeadInfo := ⟨{}⟩ /-- `h1.generalizes h2` iff h1 is equal to or more general than h2, i.e. it matches all nodes h2 matches. This induces a partial ordering. -/ def HeadInfo.generalizes : HeadInfo → HeadInfo → Bool | { kind := none, .. }, _ => true | { kind := some k1, argPats := none, .. }, { kind := some k2, .. } => k1 == k2 | { kind := some k1, argPats := some ps1, .. }, { kind := some k2, argPats := some ps2, .. } => k1 == k2 && ps1.size == ps2.size | _, _ => false private def getHeadInfo (alt : Alt) : HeadInfo := let pat := alt.fst.head!; let unconditional (rhsFn) := { rhsFn := rhsFn : HeadInfo }; -- variable pattern if pat.isOfKind `Lean.Parser.Term.id then unconditional $ fun rhs => `(let $pat := discr; $rhs) -- wildcard pattern else if pat.isOfKind `Lean.Parser.Term.hole then unconditional pure -- quotation pattern else if pat.isOfKind `Lean.Parser.Term.stxQuot then let quoted := pat.getArg 1; if quoted.isAtom then -- We assume that atoms are uniquely determined by the node kind and never have to be checked unconditional pure else if isAntiquot quoted && !isEscapedAntiquot quoted then -- quotation contains a single antiquotation let k := antiquotKind? quoted; -- Antiquotation kinds like `$id:id` influence the parser, but also need to be considered by -- match_syntax (but not by quotation terms). For example, `($id:id) and `($e) are not -- distinguishable without checking the kind of the node to be captured. Note that some -- antiquotations like the latter one for terms do not correspond to any actual node kind -- (signified by `k == Name.anonymous`), so we would only check for `Term.id` here. -- -- if stx.isOfKind `Lean.Parser.Term.id then -- let id := stx; ... -- else -- let e := stx; ... let kind := if k == Name.anonymous then none else k; let anti := getAntiquotTerm quoted; -- Splices should only appear inside a nullKind node, see next case if isAntiquotSplice quoted then unconditional $ fun _ => throwErrorAt quoted "unexpected antiquotation splice" else if anti.isOfKind `Lean.Parser.Term.id then { kind := kind, rhsFn := fun rhs => `(let $anti := discr; $rhs) } else unconditional $ fun _ => throwErrorAt anti ("match_syntax: antiquotation must be variable " ++ toString anti) else if isAntiquotSplicePat quoted && quoted.getArgs.size == 1 then -- quotation is a single antiquotation splice => bind args array let anti := getAntiquotTerm (quoted.getArg 0); unconditional $ fun rhs => `(let $anti := Syntax.getArgs discr; $rhs) -- TODO: support for more complex antiquotation splices else -- not an antiquotation or escaped antiquotation: match head shape let quoted := unescapeAntiquot quoted; let argPats := quoted.getArgs.map $ fun arg => Syntax.node `Lean.Parser.Term.stxQuot #[mkAtom "`(", arg, mkAtom ")"]; { kind := quoted.getKind, argPats := argPats } else unconditional $ fun _ => throwErrorAt pat ("match_syntax: unexpected pattern kind " ++ toString pat) -- Assuming that the first pattern of the alternative is taken, replace it with patterns (if any) for its -- child nodes. -- Ex: `($a + (- $b)) => `($a), `(+), `(- $b) -- Note: The atom pattern `(+) will be discarded in a later step private def explodeHeadPat (numArgs : Nat) : HeadInfo × Alt → TermElabM Alt | (info, (pat::pats, rhs)) => do let newPats := match info.argPats with | some argPats => argPats.toList | none => List.replicate numArgs $ Unhygienic.run `(_); rhs ← info.rhsFn rhs; pure (newPats ++ pats, rhs) | _ => unreachable! private partial def compileStxMatch : List Syntax → List Alt → TermElabM Syntax | [], ([], rhs)::_ => pure rhs -- nothing left to match | _, [] => throwError "non-exhaustive 'match_syntax'" | discr::discrs, alts => do let alts := (alts.map getHeadInfo).zip alts; -- Choose a most specific pattern, ie. a minimal element according to `generalizes`. -- If there are multiple minimal elements, the choice does not matter. let (info, alt) := alts.tail!.foldl (fun (min : HeadInfo × Alt) (alt : HeadInfo × Alt) => if min.1.generalizes alt.1 then alt else min) alts.head!; -- introduce pattern matches on the discriminant's children if there are any nested patterns newDiscrs ← match info.argPats with | some pats => (List.range pats.size).mapM $ fun i => `(Syntax.getArg discr $(quote i)) | none => pure []; -- collect matching alternatives and explode them let yesAlts := alts.filter $ fun (alt : HeadInfo × Alt) => alt.1.generalizes info; yesAlts ← yesAlts.mapM $ explodeHeadPat newDiscrs.length; -- NOTE: use fresh macro scopes for recursive call so that different `discr`s introduced by the quotations below do not collide yes ← withFreshMacroScope $ compileStxMatch (newDiscrs ++ discrs) yesAlts; some kind ← pure info.kind -- unconditional match step | `(let discr := $discr; $yes); -- conditional match step let noAlts := (alts.filter $ fun (alt : HeadInfo × Alt) => !info.generalizes alt.1).map Prod.snd; no ← withFreshMacroScope $ compileStxMatch (discr::discrs) noAlts; cond ← match info.argPats with | some pats => `(Syntax.isOfKind discr $(quote kind) && Array.size (Syntax.getArgs discr) == $(quote pats.size)) | none => `(Syntax.isOfKind discr $(quote kind)); `(let discr := $discr; if $cond = true then $yes else $no) | _, _ => unreachable! private partial def getPatternVarsAux : Syntax → List Syntax | stx@(Syntax.node k args) => if isAntiquot stx && !isEscapedAntiquot stx then let anti := getAntiquotTerm stx; if anti.isOfKind `Lean.Parser.Term.id then [anti] else [] else List.join $ args.toList.map getPatternVarsAux | _ => [] -- Get all pattern vars (as Term.id nodes) in `stx` partial def getPatternVars (stx : Syntax) : List Syntax := if stx.isOfKind `Lean.Parser.Term.stxQuot then do let quoted := stx.getArg 1; getPatternVarsAux stx else if stx.isOfKind `Lean.Parser.Term.id then [stx] else [] -- Transform alternatives by binding all right-hand sides to outside the match_syntax in order to prevent -- code duplication during match_syntax compilation private def letBindRhss (cont : List Alt → TermElabM Syntax) : List Alt → List Alt → TermElabM Syntax | [], altsRev' => cont altsRev'.reverse | (pats, rhs)::alts, altsRev' => do let vars := List.join $ pats.map getPatternVars; match vars with -- no antiquotations => introduce Unit parameter to preserve evaluation order | [] => do -- NOTE: references binding below rhs' ← `(rhs ()); -- NOTE: new macro scope so that introduced bindings do not collide stx ← withFreshMacroScope $ letBindRhss alts ((pats, rhs')::altsRev'); `(let rhs := fun _ => $rhs; $stx) | _ => do -- rhs ← `(fun $vars* => $rhs) let rhs := Syntax.node `Lean.Parser.Term.fun #[mkAtom "fun", Syntax.node `null vars.toArray, mkAtom "=>", rhs]; rhs' ← `(rhs); stx ← withFreshMacroScope $ letBindRhss alts ((pats, rhs')::altsRev'); `(let rhs := $rhs; $stx) def match_syntax.expand (stx : Syntax) : TermElabM Syntax := do let discr := stx.getArg 1; let alts := stx.getArg 4; alts ← alts.getArgs.getSepElems.mapM $ fun alt => do { let pats := alt.getArg 0; pat ← if pats.getArgs.size == 1 then pure $ pats.getArg 0 else throwError "match_syntax: expected exactly one pattern per alternative"; let pat := if pat.isOfKind `Lean.Parser.Term.stxQuot then pat.setArg 1 $ elimAntiquotChoices $ pat.getArg 1 else pat; match pat.find? $ fun stx => stx.getKind == choiceKind with | some choiceStx => throwErrorAt choiceStx "invalid pattern, nested syntax has multiple interpretations" | none => let rhs := alt.getArg 2; pure ([pat], rhs) }; -- letBindRhss (compileStxMatch stx [discr]) alts.toList [] compileStxMatch [discr] alts.toList @[builtinTermElab «match_syntax»] def elabMatchSyntax : TermElab := adaptExpander match_syntax.expand -- REMOVE with old frontend private def exprPlaceholder := mkMVar Name.anonymous private unsafe partial def toPreterm : Syntax → TermElabM Expr | stx => withRef stx $ let args := stx.getArgs; match stx.getKind with | `Lean.Parser.Term.id => match args.get! 0 with | Syntax.ident _ _ val preresolved => do resolved ← resolveName val preresolved []; match resolved with | (pre,projs)::_ => let pre := match pre with | Expr.const c _ _ => Lean.mkConst c -- remove universes confusing the old frontend | _ => pre; pure $ projs.foldl (fun e proj => mkMData (MData.empty.setName `fieldNotation proj) e) pre | [] => unreachable! | _ => unreachable! | `Lean.Parser.Term.fun => do let params := (args.get! 1).getArgs; let body := args.get! 3; if params.size == 0 then toPreterm body else do let param := params.get! 0; (n, ty) ← if param.isOfKind `Lean.Parser.Term.id then pure (param.getIdAt 0, exprPlaceholder) else if param.isOfKind `Lean.Parser.Term.hole then pure (`_a, exprPlaceholder) else do { let n := ((param.getArg 1).getArg 0).getIdAt 0; ty ← toPreterm $ (((param.getArg 1).getArg 1).getArg 0).getArg 1; pure (n, ty) }; lctx ← getLCtx; let lctx := lctx.mkLocalDecl n n ty; let params := params.eraseIdx 0; stx ← `(fun $params* => $body); adaptReader (fun (ctx : Context) => { ctx with lctx := lctx }) $ do e ← toPreterm stx; pure $ lctx.mkLambda #[mkFVar n] e | `Lean.Parser.Term.let => do let decl := args.get! 1; let n := if (decl.getArg 0).isIdent then (decl.getArg 0).getId else (decl.getArg 0).getIdAt 0; let val := decl.getArg 4; let body := args.get! 3; val ← toPreterm val; lctx ← getLCtx; let lctx := lctx.mkLetDecl n n exprPlaceholder val; adaptReader (fun (ctx : Context) => { ctx with lctx := lctx }) $ do e ← toPreterm $ body; pure $ lctx.mkLambda #[mkFVar n] e | `Lean.Parser.Term.app => do fn ← toPreterm $ args.get! 0; as ← (args.get! 1).getArgs.mapM toPreterm; pure $ mkAppN fn as | `Lean.Parser.Term.if => do let con := args.get! 2; let yes := args.get! 4; let no := args.get! 6; toPreterm $ Unhygienic.run `(ite $con $yes $no) | `Lean.Parser.Term.paren => let inner := (args.get! 1).getArgs; if inner.size == 0 then pure $ Lean.mkConst `Unit.unit else toPreterm $ inner.get! 0 | `Lean.Parser.Term.band => let lhs := args.get! 0; let rhs := args.get! 2; toPreterm $ Unhygienic.run `(and $lhs $rhs) | `Lean.Parser.Term.beq => let lhs := args.get! 0; let rhs := args.get! 2; toPreterm $ Unhygienic.run `(HasBeq.beq $lhs $rhs) | `Lean.Parser.Term.eq => let lhs := args.get! 0; let rhs := args.get! 2; toPreterm $ Unhygienic.run `(Eq $lhs $rhs) | `Lean.Parser.Term.str => pure $ mkStrLit $ (stx.getArg 0).isStrLit?.getD "" | `Lean.Parser.Term.num => pure $ mkNatLit $ (stx.getArg 0).isNatLit?.getD 0 | `expr => pure $ unsafeCast $ stx.getArg 0 -- HACK: see below | k => throwError $ "stxQuot: unimplemented kind " ++ toString k @[export lean_parse_expr] def oldParseExpr (env : Environment) (input : String) (pos : String.Pos) : Except String (Syntax × String.Pos) := do let c := Parser.mkParserContext env (Parser.mkInputContext input ""); let s := Parser.mkParserState c.input; let s := s.setPos pos; let s := (Parser.termParser Parser.maxPrec : Parser.Parser).fn { c with prec := Parser.maxPrec } s; let stx := s.stxStack.back; match s.errorMsg with | some errorMsg => Except.error $ toString errorMsg | none => Except.ok (stx, s.pos) structure OldContext := (env : Environment) (locals : List Name) (open_nss : List Name) private def oldRunTermElabM {α} (ctx : OldContext) (x : TermElabM α) : Except String α := do match x {fileName := "foo", fileMap := FileMap.ofString "", currNamespace := ctx.env.getNamespace, currRecDepth := 0, maxRecDepth := 10000, openDecls := ctx.open_nss.map $ fun n => OpenDecl.simple n [], lctx := ctx.locals.foldl (fun lctx l => LocalContext.mkLocalDecl lctx l l exprPlaceholder) $ LocalContext.mkEmpty ()} {env := ctx.env} with | EStateM.Result.ok a _ => Except.ok a | EStateM.Result.error msg _ => Except.error $ toString msg @[export lean_expand_stx_quot] unsafe def oldExpandStxQuot (ctx : OldContext) (stx : Syntax) : Except String Expr := oldRunTermElabM ctx $ do stx ← stxQuot.expand stx; toPreterm stx @[export lean_get_antiquot_vars] def oldGetPatternVars (ctx : OldContext) (pats : List Syntax) : Except String (List Name) := oldRunTermElabM ctx $ do let vars := List.join $ pats.map getPatternVars; pure $ vars.map $ fun var => var.getIdAt 0 @[export lean_expand_match_syntax] unsafe def oldExpandMatchSyntax (ctx : OldContext) (discr : Syntax) (alts : List (List Syntax × Syntax)) : Except String Expr := oldRunTermElabM ctx $ do -- HACK: discr and the RHSs are actually `Expr` let discr := Syntax.node `expr #[discr]; let alts := alts.map $ fun alt => let pats := alt.1.map elimAntiquotChoices; (pats, Syntax.node `expr #[alt.2]); -- letBindRhss (compileStxMatch Syntax.missing [discr]) alts [] stx ← compileStxMatch [discr] alts; toPreterm stx end Quotation end Term end Elab end Lean