diff options
Diffstat (limited to 'compiler/types/Unify.lhs')
-rw-r--r-- | compiler/types/Unify.lhs | 536 |
1 files changed, 536 insertions, 0 deletions
diff --git a/compiler/types/Unify.lhs b/compiler/types/Unify.lhs new file mode 100644 index 0000000000..f60c7bee61 --- /dev/null +++ b/compiler/types/Unify.lhs @@ -0,0 +1,536 @@ +\begin{code} +module Unify ( + -- Matching and unification + tcMatchTys, tcMatchTyX, ruleMatchTyX, tcMatchPreds, MatchEnv(..), + + tcUnifyTys, + + gadtRefineTys, BindFlag(..), + + coreRefineTys, TypeRefinement, + + -- Re-export + MaybeErr(..) + ) where + +#include "HsVersions.h" + +import Var ( Var, TyVar, tyVarKind ) +import VarEnv +import VarSet +import Kind ( isSubKind ) +import Type ( typeKind, tyVarsOfType, tyVarsOfTypes, tyVarsOfTheta, mkTyVarTys, + TvSubstEnv, emptyTvSubstEnv, TvSubst(..), substTy, tcEqTypeX, + mkOpenTvSubst, tcView ) +import TypeRep ( Type(..), PredType(..), funTyCon ) +import DataCon ( DataCon, dataConInstResTy ) +import Util ( snocView ) +import ErrUtils ( Message ) +import Outputable +import Maybes +\end{code} + + +%************************************************************************ +%* * + Matching +%* * +%************************************************************************ + + +Matching is much tricker than you might think. + +1. The substitution we generate binds the *template type variables* + which are given to us explicitly. + +2. We want to match in the presence of foralls; + e.g (forall a. t1) ~ (forall b. t2) + + That is what the RnEnv2 is for; it does the alpha-renaming + that makes it as if a and b were the same variable. + Initialising the RnEnv2, so that it can generate a fresh + binder when necessary, entails knowing the free variables of + both types. + +3. We must be careful not to bind a template type variable to a + locally bound variable. E.g. + (forall a. x) ~ (forall b. b) + where x is the template type variable. Then we do not want to + bind x to a/b! This is a kind of occurs check. + The necessary locals accumulate in the RnEnv2. + + +\begin{code} +data MatchEnv + = ME { me_tmpls :: VarSet -- Template tyvars + , me_env :: RnEnv2 -- Renaming envt for nested foralls + } -- In-scope set includes template tyvars + +tcMatchTys :: TyVarSet -- Template tyvars + -> [Type] -- Template + -> [Type] -- Target + -> Maybe TvSubst -- One-shot; in principle the template + -- variables could be free in the target + +tcMatchTys tmpls tys1 tys2 + = case match_tys menv emptyTvSubstEnv tys1 tys2 of + Just subst_env -> Just (TvSubst in_scope subst_env) + Nothing -> Nothing + where + menv = ME { me_tmpls = tmpls, me_env = mkRnEnv2 in_scope } + in_scope = mkInScopeSet (tmpls `unionVarSet` tyVarsOfTypes tys2) + -- We're assuming that all the interesting + -- tyvars in tys1 are in tmpls + +-- This is similar, but extends a substitution +tcMatchTyX :: TyVarSet -- Template tyvars + -> TvSubst -- Substitution to extend + -> Type -- Template + -> Type -- Target + -> Maybe TvSubst +tcMatchTyX tmpls (TvSubst in_scope subst_env) ty1 ty2 + = case match menv subst_env ty1 ty2 of + Just subst_env -> Just (TvSubst in_scope subst_env) + Nothing -> Nothing + where + menv = ME {me_tmpls = tmpls, me_env = mkRnEnv2 in_scope} + +tcMatchPreds + :: [TyVar] -- Bind these + -> [PredType] -> [PredType] + -> Maybe TvSubstEnv +tcMatchPreds tmpls ps1 ps2 + = match_list (match_pred menv) emptyTvSubstEnv ps1 ps2 + where + menv = ME { me_tmpls = mkVarSet tmpls, me_env = mkRnEnv2 in_scope_tyvars } + in_scope_tyvars = mkInScopeSet (tyVarsOfTheta ps1 `unionVarSet` tyVarsOfTheta ps2) + +-- This one is called from the expression matcher, which already has a MatchEnv in hand +ruleMatchTyX :: MatchEnv + -> TvSubstEnv -- Substitution to extend + -> Type -- Template + -> Type -- Target + -> Maybe TvSubstEnv + +ruleMatchTyX menv subst ty1 ty2 = match menv subst ty1 ty2 -- Rename for export +\end{code} + +Now the internals of matching + +\begin{code} +match :: MatchEnv -- For the most part this is pushed downwards + -> TvSubstEnv -- Substitution so far: + -- Domain is subset of template tyvars + -- Free vars of range is subset of + -- in-scope set of the RnEnv2 + -> Type -> Type -- Template and target respectively + -> Maybe TvSubstEnv +-- This matcher works on source types; that is, +-- it respects NewTypes and PredType + +match menv subst ty1 ty2 | Just ty1' <- tcView ty1 = match menv subst ty1' ty2 +match menv subst ty1 ty2 | Just ty2' <- tcView ty2 = match menv subst ty1 ty2' + +match menv subst (TyVarTy tv1) ty2 + | tv1 `elemVarSet` me_tmpls menv + = case lookupVarEnv subst tv1' of + Nothing | any (inRnEnvR rn_env) (varSetElems (tyVarsOfType ty2)) + -> Nothing -- Occurs check + | not (typeKind ty2 `isSubKind` tyVarKind tv1) + -> Nothing -- Kind mis-match + | otherwise + -> Just (extendVarEnv subst tv1 ty2) + + Just ty1' | tcEqTypeX (nukeRnEnvL rn_env) ty1' ty2 + -- ty1 has no locally-bound variables, hence nukeRnEnvL + -- Note tcEqType...we are doing source-type matching here + -> Just subst + + other -> Nothing + + | otherwise -- tv1 is not a template tyvar + = case ty2 of + TyVarTy tv2 | tv1' == rnOccR rn_env tv2 -> Just subst + other -> Nothing + where + rn_env = me_env menv + tv1' = rnOccL rn_env tv1 + +match menv subst (ForAllTy tv1 ty1) (ForAllTy tv2 ty2) + = match menv' subst ty1 ty2 + where -- Use the magic of rnBndr2 to go under the binders + menv' = menv { me_env = rnBndr2 (me_env menv) tv1 tv2 } + +match menv subst (PredTy p1) (PredTy p2) + = match_pred menv subst p1 p2 +match menv subst (TyConApp tc1 tys1) (TyConApp tc2 tys2) + | tc1 == tc2 = match_tys menv subst tys1 tys2 +match menv subst (FunTy ty1a ty1b) (FunTy ty2a ty2b) + = do { subst' <- match menv subst ty1a ty2a + ; match menv subst' ty1b ty2b } +match menv subst (AppTy ty1a ty1b) ty2 + | Just (ty2a, ty2b) <- repSplitAppTy_maybe ty2 + = do { subst' <- match menv subst ty1a ty2a + ; match menv subst' ty1b ty2b } + +match menv subst ty1 ty2 + = Nothing + +-------------- +match_tys menv subst tys1 tys2 = match_list (match menv) subst tys1 tys2 + +-------------- +match_list :: (TvSubstEnv -> a -> a -> Maybe TvSubstEnv) + -> TvSubstEnv -> [a] -> [a] -> Maybe TvSubstEnv +match_list fn subst [] [] = Just subst +match_list fn subst (ty1:tys1) (ty2:tys2) = do { subst' <- fn subst ty1 ty2 + ; match_list fn subst' tys1 tys2 } +match_list fn subst tys1 tys2 = Nothing + +-------------- +match_pred menv subst (ClassP c1 tys1) (ClassP c2 tys2) + | c1 == c2 = match_tys menv subst tys1 tys2 +match_pred menv subst (IParam n1 t1) (IParam n2 t2) + | n1 == n2 = match menv subst t1 t2 +match_pred menv subst p1 p2 = Nothing +\end{code} + + +%************************************************************************ +%* * + Unification +%* * +%************************************************************************ + +\begin{code} +tcUnifyTys :: (TyVar -> BindFlag) + -> [Type] -> [Type] + -> Maybe TvSubst -- A regular one-shot substitution +-- The two types may have common type variables, and indeed do so in the +-- second call to tcUnifyTys in FunDeps.checkClsFD +tcUnifyTys bind_fn tys1 tys2 + = maybeErrToMaybe $ initUM bind_fn $ + do { subst_env <- unify_tys emptyTvSubstEnv tys1 tys2 + + -- Find the fixed point of the resulting non-idempotent substitution + ; let in_scope = mkInScopeSet (tvs1 `unionVarSet` tvs2) + subst = TvSubst in_scope subst_env_fixpt + subst_env_fixpt = mapVarEnv (substTy subst) subst_env + ; return subst } + where + tvs1 = tyVarsOfTypes tys1 + tvs2 = tyVarsOfTypes tys2 + +---------------------------- +coreRefineTys :: DataCon -> [TyVar] -- Case pattern (con tv1 .. tvn ...) + -> Type -- Type of scrutinee + -> Maybe TypeRefinement + +type TypeRefinement = (TvSubstEnv, Bool) + -- The Bool is True iff all the bindings in the + -- env are for the pattern type variables + -- In this case, there is no type refinement + -- for already-in-scope type variables + +-- Used by Core Lint and the simplifier. +coreRefineTys con tvs scrut_ty + = maybeErrToMaybe $ initUM (tryToBind tv_set) $ + do { -- Run the unifier, starting with an empty env + ; subst_env <- unify emptyTvSubstEnv pat_res_ty scrut_ty + + -- Find the fixed point of the resulting non-idempotent substitution + ; let subst = mkOpenTvSubst subst_env_fixpt + subst_env_fixpt = mapVarEnv (substTy subst) subst_env + + ; return (subst_env_fixpt, all_bound_here subst_env) } + where + pat_res_ty = dataConInstResTy con (mkTyVarTys tvs) + + -- 'tvs' are the tyvars bound by the pattern + tv_set = mkVarSet tvs + all_bound_here env = all bound_here (varEnvKeys env) + bound_here uniq = elemVarSetByKey uniq tv_set + +-- This version is used by the type checker +gadtRefineTys :: TvSubst + -> DataCon -> [TyVar] + -> [Type] -> [Type] + -> MaybeErr Message (TvSubst, Bool) +-- The bool is True <=> the only *new* bindings are for pat_tvs + +gadtRefineTys (TvSubst in_scope env1) con pat_tvs pat_tys ctxt_tys + = initUM (tryToBind tv_set) $ + do { -- Run the unifier, starting with an empty env + ; env2 <- unify_tys env1 pat_tys ctxt_tys + + -- Find the fixed point of the resulting non-idempotent substitution + ; let subst2 = TvSubst in_scope subst_env_fixpt + subst_env_fixpt = mapVarEnv (substTy subst2) env2 + + ; return (subst2, all_bound_here env2) } + where + -- 'tvs' are the tyvars bound by the pattern + tv_set = mkVarSet pat_tvs + all_bound_here env = all bound_here (varEnvKeys env) + bound_here uniq = elemVarEnvByKey uniq env1 || elemVarSetByKey uniq tv_set + -- The bool is True <=> the only *new* bindings are for pat_tvs + +---------------------------- +tryToBind :: TyVarSet -> TyVar -> BindFlag +tryToBind tv_set tv | tv `elemVarSet` tv_set = BindMe + | otherwise = AvoidMe +\end{code} + + +%************************************************************************ +%* * + The workhorse +%* * +%************************************************************************ + +\begin{code} +unify :: TvSubstEnv -- An existing substitution to extend + -> Type -> Type -- Types to be unified + -> UM TvSubstEnv -- Just the extended substitution, + -- Nothing if unification failed +-- We do not require the incoming substitution to be idempotent, +-- nor guarantee that the outgoing one is. That's fixed up by +-- the wrappers. + +-- Respects newtypes, PredTypes + +unify subst ty1 ty2 = -- pprTrace "unify" (ppr subst <+> pprParendType ty1 <+> pprParendType ty2) $ + unify_ subst ty1 ty2 + +-- in unify_, any NewTcApps/Preds should be taken at face value +unify_ subst (TyVarTy tv1) ty2 = uVar False subst tv1 ty2 +unify_ subst ty1 (TyVarTy tv2) = uVar True subst tv2 ty1 + +unify_ subst ty1 ty2 | Just ty1' <- tcView ty1 = unify subst ty1' ty2 +unify_ subst ty1 ty2 | Just ty2' <- tcView ty2 = unify subst ty1 ty2' + +unify_ subst (PredTy p1) (PredTy p2) = unify_pred subst p1 p2 + +unify_ subst t1@(TyConApp tyc1 tys1) t2@(TyConApp tyc2 tys2) + | tyc1 == tyc2 = unify_tys subst tys1 tys2 + +unify_ subst (FunTy ty1a ty1b) (FunTy ty2a ty2b) + = do { subst' <- unify subst ty1a ty2a + ; unify subst' ty1b ty2b } + + -- Applications need a bit of care! + -- They can match FunTy and TyConApp, so use splitAppTy_maybe + -- NB: we've already dealt with type variables and Notes, + -- so if one type is an App the other one jolly well better be too +unify_ subst (AppTy ty1a ty1b) ty2 + | Just (ty2a, ty2b) <- repSplitAppTy_maybe ty2 + = do { subst' <- unify subst ty1a ty2a + ; unify subst' ty1b ty2b } + +unify_ subst ty1 (AppTy ty2a ty2b) + | Just (ty1a, ty1b) <- repSplitAppTy_maybe ty1 + = do { subst' <- unify subst ty1a ty2a + ; unify subst' ty1b ty2b } + +unify_ subst ty1 ty2 = failWith (misMatch ty1 ty2) + +------------------------------ +unify_pred subst (ClassP c1 tys1) (ClassP c2 tys2) + | c1 == c2 = unify_tys subst tys1 tys2 +unify_pred subst (IParam n1 t1) (IParam n2 t2) + | n1 == n2 = unify subst t1 t2 +unify_pred subst p1 p2 = failWith (misMatch (PredTy p1) (PredTy p2)) + +------------------------------ +unify_tys = unifyList unify + +unifyList :: Outputable a + => (TvSubstEnv -> a -> a -> UM TvSubstEnv) + -> TvSubstEnv -> [a] -> [a] -> UM TvSubstEnv +unifyList unifier subst orig_xs orig_ys + = go subst orig_xs orig_ys + where + go subst [] [] = return subst + go subst (x:xs) (y:ys) = do { subst' <- unifier subst x y + ; go subst' xs ys } + go subst _ _ = failWith (lengthMisMatch orig_xs orig_ys) + +------------------------------ +uVar :: Bool -- Swapped + -> TvSubstEnv -- An existing substitution to extend + -> TyVar -- Type variable to be unified + -> Type -- with this type + -> UM TvSubstEnv + +uVar swap subst tv1 ty + = -- Check to see whether tv1 is refined by the substitution + case (lookupVarEnv subst tv1) of + -- Yes, call back into unify' + Just ty' | swap -> unify subst ty ty' + | otherwise -> unify subst ty' ty + -- No, continue + Nothing -> uUnrefined subst tv1 ty ty + + +uUnrefined :: TvSubstEnv -- An existing substitution to extend + -> TyVar -- Type variable to be unified + -> Type -- with this type + -> Type -- (de-noted version) + -> UM TvSubstEnv + +-- We know that tv1 isn't refined + +uUnrefined subst tv1 ty2 ty2' + | Just ty2'' <- tcView ty2' + = uUnrefined subst tv1 ty2 ty2'' -- Unwrap synonyms + -- This is essential, in case we have + -- type Foo a = a + -- and then unify a :=: Foo a + +uUnrefined subst tv1 ty2 (TyVarTy tv2) + | tv1 == tv2 -- Same type variable + = return subst + + -- Check to see whether tv2 is refined + | Just ty' <- lookupVarEnv subst tv2 + = uUnrefined subst tv1 ty' ty' + + -- So both are unrefined; next, see if the kinds force the direction + | k1 == k2 -- Can update either; so check the bind-flags + = do { b1 <- tvBindFlag tv1 + ; b2 <- tvBindFlag tv2 + ; case (b1,b2) of + (BindMe, _) -> bind tv1 ty2 + + (AvoidMe, BindMe) -> bind tv2 ty1 + (AvoidMe, _) -> bind tv1 ty2 + + (WildCard, WildCard) -> return subst + (WildCard, Skolem) -> return subst + (WildCard, _) -> bind tv2 ty1 + + (Skolem, WildCard) -> return subst + (Skolem, Skolem) -> failWith (misMatch ty1 ty2) + (Skolem, _) -> bind tv2 ty1 + } + + | k1 `isSubKind` k2 = bindTv subst tv2 ty1 -- Must update tv2 + | k2 `isSubKind` k1 = bindTv subst tv1 ty2 -- Must update tv1 + + | otherwise = failWith (kindMisMatch tv1 ty2) + where + ty1 = TyVarTy tv1 + k1 = tyVarKind tv1 + k2 = tyVarKind tv2 + bind tv ty = return (extendVarEnv subst tv ty) + +uUnrefined subst tv1 ty2 ty2' -- ty2 is not a type variable + | tv1 `elemVarSet` substTvSet subst (tyVarsOfType ty2') + = failWith (occursCheck tv1 ty2) -- Occurs check + | not (k2 `isSubKind` k1) + = failWith (kindMisMatch tv1 ty2) -- Kind check + | otherwise + = bindTv subst tv1 ty2 -- Bind tyvar to the synonym if poss + where + k1 = tyVarKind tv1 + k2 = typeKind ty2' + +substTvSet :: TvSubstEnv -> TyVarSet -> TyVarSet +-- Apply the non-idempotent substitution to a set of type variables, +-- remembering that the substitution isn't necessarily idempotent +substTvSet subst tvs + = foldVarSet (unionVarSet . get) emptyVarSet tvs + where + get tv = case lookupVarEnv subst tv of + Nothing -> unitVarSet tv + Just ty -> substTvSet subst (tyVarsOfType ty) + +bindTv subst tv ty -- ty is not a type variable + = do { b <- tvBindFlag tv + ; case b of + Skolem -> failWith (misMatch (TyVarTy tv) ty) + WildCard -> return subst + other -> return (extendVarEnv subst tv ty) + } +\end{code} + +%************************************************************************ +%* * + Unification monad +%* * +%************************************************************************ + +\begin{code} +data BindFlag + = BindMe -- A regular type variable + | AvoidMe -- Like BindMe but, given the choice, avoid binding it + + | Skolem -- This type variable is a skolem constant + -- Don't bind it; it only matches itself + + | WildCard -- This type variable matches anything, + -- and does not affect the substitution + +newtype UM a = UM { unUM :: (TyVar -> BindFlag) + -> MaybeErr Message a } + +instance Monad UM where + return a = UM (\tvs -> Succeeded a) + fail s = UM (\tvs -> Failed (text s)) + m >>= k = UM (\tvs -> case unUM m tvs of + Failed err -> Failed err + Succeeded v -> unUM (k v) tvs) + +initUM :: (TyVar -> BindFlag) -> UM a -> MaybeErr Message a +initUM badtvs um = unUM um badtvs + +tvBindFlag :: TyVar -> UM BindFlag +tvBindFlag tv = UM (\tv_fn -> Succeeded (tv_fn tv)) + +failWith :: Message -> UM a +failWith msg = UM (\tv_fn -> Failed msg) + +maybeErrToMaybe :: MaybeErr fail succ -> Maybe succ +maybeErrToMaybe (Succeeded a) = Just a +maybeErrToMaybe (Failed m) = Nothing + +------------------------------ +repSplitAppTy_maybe :: Type -> Maybe (Type,Type) +-- Like Type.splitAppTy_maybe, but any coreView stuff is already done +repSplitAppTy_maybe (FunTy ty1 ty2) = Just (TyConApp funTyCon [ty1], ty2) +repSplitAppTy_maybe (AppTy ty1 ty2) = Just (ty1, ty2) +repSplitAppTy_maybe (TyConApp tc tys) = case snocView tys of + Just (tys', ty') -> Just (TyConApp tc tys', ty') + Nothing -> Nothing +repSplitAppTy_maybe other = Nothing +\end{code} + + +%************************************************************************ +%* * + Error reporting + We go to a lot more trouble to tidy the types + in TcUnify. Maybe we'll end up having to do that + here too, but I'll leave it for now. +%* * +%************************************************************************ + +\begin{code} +misMatch t1 t2 + = ptext SLIT("Can't match types") <+> quotes (ppr t1) <+> + ptext SLIT("and") <+> quotes (ppr t2) + +lengthMisMatch tys1 tys2 + = sep [ptext SLIT("Can't match unequal length lists"), + nest 2 (ppr tys1), nest 2 (ppr tys2) ] + +kindMisMatch tv1 t2 + = vcat [ptext SLIT("Can't match kinds") <+> quotes (ppr (tyVarKind tv1)) <+> + ptext SLIT("and") <+> quotes (ppr (typeKind t2)), + ptext SLIT("when matching") <+> quotes (ppr tv1) <+> + ptext SLIT("with") <+> quotes (ppr t2)] + +occursCheck tv ty + = hang (ptext SLIT("Can't construct the infinite type")) + 2 (ppr tv <+> equals <+> ppr ty) +\end{code}
\ No newline at end of file |