-instance toString SemError where
- toString (ParseError p e) = concat [
- toString p,"SemError: ParseError: ", e]
- toString (Error e) = "SemError: " +++ e
- toString (UnifyErrorStub t1 t2) = toString (UnifyError {line=0,col=0} t1 t2)
- toString (UnifyError p t1 t2) = concat [
- toString p,
- "SemError: Cannot unify types. Expected: ",
- toString t1, ". Given: ", toString t2]
-
-sem :: AST -> SemOutput
-sem (AST vd fd) = case runStateT m ('Map'.newMap, getRandomStream 1) of
- Left e = Left [e]
- Right ((vds, fds), gamma) = Right ((AST vds fds), gamma)
-where
- m :: Env ([VarDecl], [FunDecl])
- m = (mapM semVarDecl vd) >>= \vds ->
- mapM semFunDecl fd >>= \fds ->
- pure (vds, fds)
-
-semFunDecl :: FunDecl -> Env FunDecl
-semFunDecl f = pure f
-
-semVarDecl :: VarDecl -> Env VarDecl
-semVarDecl (VarDecl pos type ident ex) = unify type ex
- >>= \t-> putIdent ident t >>| (pure $ VarDecl pos t ident ex)
-
-typeExpr :: Expr -> Env Type
-typeExpr (IntExpr _ _) = pure IntType
-typeExpr (CharExpr _ _) = pure CharType
-typeExpr (BoolExpr _ _) = pure BoolType
-typeExpr (Op1Expr p UnNegation expr) = unify BoolType expr
-typeExpr (Op1Expr p UnMinus expr) = unify IntType expr
-typeExpr (TupleExpr p (e1, e2)) = typeExpr e1
- >>= \t1-> typeExpr e2 >>= \t2-> pure $ TupleType (t1, t2)
-//Int
-typeExpr (Op2Expr p e1 BiPlus e2) = unify IntType e1 >>| unify IntType e2
-typeExpr (Op2Expr p e1 BiMinus e2) = unify IntType e1 >>| unify IntType e2
-typeExpr (Op2Expr p e1 BiTimes e2) = unify IntType e1 >>| unify IntType e2
-typeExpr (Op2Expr p e1 BiDivide e2) = unify IntType e1 >>| unify IntType e2
-typeExpr (Op2Expr p e1 BiMod e2) = unify IntType e1 >>| unify IntType e2
-//bool, char of int
-typeExpr (Op2Expr p e1 BiEquals e2) = typeExpr e1 >>= \t1 -> unify t1 e2
- >>| pure BoolType //todo, actually check t1 in Char,Bool,Int
-typeExpr (Op2Expr p e1 BiUnEqual e2) = typeExpr (Op2Expr p e1 BiEquals e2)
-//char of int
-typeExpr (Op2Expr p e1 BiLesser e2) = typeExpr e1 >>= \t1 -> unify t1 e2
- >>| pure BoolType //todo, actually check t1 in Char, Int
-typeExpr (Op2Expr p e1 BiGreater e2) = typeExpr (Op2Expr p e1 BiLesser e2)
-typeExpr (Op2Expr p e1 BiLesserEq e2) = typeExpr (Op2Expr p e1 BiLesser e2)
-typeExpr (Op2Expr p e1 BiGreaterEq e2) = typeExpr (Op2Expr p e1 BiLesser e2)
-//bool
-typeExpr (Op2Expr p e1 BiAnd e2) = unify BoolType e1 >>| unify BoolType e2
-typeExpr (Op2Expr p e1 BiOr e2) = unify BoolType e1 >>| unify BoolType e2
-//a
-typeExpr (Op2Expr p e1 BiCons e2) = typeExpr e1 >>= \t1-> typeExpr e2
- >>= \t2-> unify (ListType t1) t2
-typeExpr (EmptyListExpr p) = freshIdent >>= \frsh-> let t = IdType frsh in
- putIdent frsh t >>| pure t
-//typeExpr (FunExpr p FunCall) = undef
-//typeExpr (VarExpr Pos VarDef) = undef //when checking var-expr, be sure to
- //put the infered type in the context
-
-class unify a :: Type a -> Env Type
-
-instance unify Expr where
- unify (_ ->> _) e = liftT $ Left $ ParseError (extrPos e)
- "Expression cannot be a higher order function. Yet..."
- unify VoidType e = liftT $ Left $ ParseError (extrPos e)
- "Expression cannot be a Void type."
- unify (IdType _) e = liftT $ Left $ ParseError (extrPos e)
- "Expression cannot be an polymorf type."
- unify VarType e = typeExpr e
- unify (IdType i) e = undef
- //we have to cheat to decorate the error, can be done nicer?
- unify t e = StateT $ \s0 -> let res = runStateT m s0 in case res of
- Left err = Left $ decErr e err
- Right t = Right t //note, t :: (Type, Gamma)
- where m = typeExpr e >>= \tex-> unify t tex
-
-replace :: String Type -> Env Void
-replace _ _ = undef
-
-instance unify Type where
- unify IntType IntType = pure IntType
- unify BoolType BoolType = pure BoolType
- unify CharType CharType = pure CharType
- unify (IdType i) t=:(IdType j) = replace i t >>| pure t
- unify t (IdType i) = unify (IdType i) t
- unify (IdType i) t = replace i t >>| pure t
- //unify (ListType t1) (ListType t2) = unify t1 t2
- unify t1 t2 = liftT $ Left $ UnifyError zero t1 t2
-
-instance zero Pos where
- zero = {line=0,col=0}
-
-decErr :: Expr SemError -> SemError
-decErr e (UnifyError _ t1 t2) = UnifyError (extrPos e) t1 t2
-decErr e (ParseError _ s) = ParseError (extrPos e) s
-decErr e err = err
-
-dc2 :: Expr (Either SemError a) -> Either SemError a
-dc2 e (Right t) = Right t
-dc2 e (Left err) = Left err
-
-extrPos :: Expr -> Pos
-extrPos (VarExpr p _) = p
-extrPos (Op2Expr p _ _ _) = p
-extrPos (Op1Expr p _ _) = p
-extrPos (IntExpr p _) = p
-extrPos (CharExpr p _) = p
-extrPos (BoolExpr p _) = p
-extrPos (FunExpr p _) = p
-extrPos (EmptyListExpr p) = p
-extrPos (TupleExpr p _) = p
+ isNiceMain :: FunDecl -> Either SemError ()
+ isNiceMain (FunDecl p "main" as mt _ _) = case (as, mt) of
+ ([_:_], _) = Left $ SanityError p "main must have arity 0"
+ ([], t) = (case t of
+ Nothing = pure ()
+ Just VoidType = pure ()
+ _ = Left $ SanityError p "main has to return Void")
+ isNiceMain _ = pure ()
+
+class Typeable a where
+ ftv :: a -> [TVar]
+ subst :: Substitution a -> a
+
+instance Typeable Scheme where
+ ftv (Forall bound t) = difference (ftv t) bound
+ subst s (Forall bound t) = Forall bound $ subst s_ t
+ where s_ = 'Map'.filterWithKey (\k _ -> not (elem k bound)) s
+
+instance Typeable [a] | Typeable a where
+ ftv types = foldr (\t ts-> ftv t ++ ts) [] types
+ subst s ts = map (\t->subst s t) ts
+
+instance Typeable Type where
+ ftv (TupleType (t1, t2)) = ftv t1 ++ ftv t2
+ ftv (ListType t) = ftv t
+ ftv (IdType tvar) = [tvar]
+ ftv (FuncType t) = ftv t
+ ftv (t1 ->> t2) = ftv t1 ++ ftv t2
+ ftv _ = []
+ subst s (TupleType (t1, t2))= TupleType (subst s t1, subst s t2)
+ subst s (ListType t1) = ListType (subst s t1)
+ subst s (FuncType t) = FuncType (subst s t)
+ subst s (t1 ->> t2) = (subst s t1) ->> (subst s t2)
+ subst s t1=:(IdType tvar) = 'Map'.findWithDefault t1 tvar s
+ subst s t = t
+
+instance Typeable Gamma where
+ ftv gamma = concatMap id $ map ftv ('Map'.elems gamma)
+ subst s gamma = Mapmap (subst s) gamma
+
+extend :: String Scheme Gamma -> Gamma
+extend k t g = 'Map'.put k t g
+
+//// ------------------------
+//// algorithm U, Unification
+//// ------------------------
+instance zero Substitution where zero = 'Map'.newMap
+
+compose :: Substitution Substitution -> Substitution
+compose s1 s2 = 'Map'.union (Mapmap (subst s1) s2) s1
+//Note: just like function compositon compose does snd first
+
+occurs :: TVar a -> Bool | Typeable a
+occurs tvar a = elem tvar (ftv a)
+
+unify :: Type Type -> Either SemError Substitution
+unify t1 t2=:(IdType tv) | t1 == (IdType tv) = Right zero
+ | occurs tv t1 = Left $ InfiniteTypeError zero t1
+ | otherwise = Right $ 'Map'.singleton tv t1
+unify t1=:(IdType tv) t2 = unify t2 t1
+unify (ta1->>ta2) (tb1->>tb2) = unify ta1 tb1 >>= \s1->
+ unify ta2 tb2 >>= \s2->
+ Right $ compose s1 s2
+unify (TupleType (ta1,ta2)) (TupleType (tb1,tb2)) = unify ta1 tb1 >>= \s1->
+ unify ta2 tb2 >>= \s2->
+ Right $ compose s1 s2
+unify (ListType t1) (ListType t2) = unify t1 t2
+unify (FuncType t1) (FuncType t2) = unify t1 t2
+unify t1 t2 | t1 == t2 = Right zero
+ | otherwise = Left $ UnifyError zero t1 t2
+
+//// ------------------------
+//// Algorithm M, Inference and Solving
+//// ------------------------
+gamma :: Typing Gamma
+gamma = gets fst
+putGamma :: Gamma -> Typing ()
+putGamma g = modify (appFst $ const g) >>| pure ()
+changeGamma :: (Gamma -> Gamma) -> Typing Gamma
+changeGamma f = modify (appFst f) >>| gamma
+withGamma :: (Gamma -> a) -> Typing a
+withGamma f = f <$> gamma
+fresh :: Typing Type
+fresh = gets snd >>= \vars->
+ modify (appSnd $ const $ tail vars) >>|
+ pure (IdType (head vars))
+
+lift :: (Either SemError a) -> Typing a
+lift (Left e) = liftT $ Left e
+lift (Right v) = pure v
+
+//instantiate maps a schemes type variables to variables with fresh names
+//and drops the quantification: i.e. forall a,b.a->[b] becomes c->[d]
+instantiate :: Scheme -> Typing Type
+instantiate (Forall bound t) =
+ mapM (const fresh) bound >>= \newVars->
+ let s = 'Map'.fromList (zip (bound,newVars)) in
+ pure (subst s t)
+
+//generalize quentifies all free type variables in a type which are not
+//in the gamma
+generalize :: Type -> Typing Scheme
+generalize t = gamma >>= \g-> pure $ Forall (difference (ftv t) (ftv g)) t
+
+lookup :: String -> Typing Type
+lookup k = gamma >>= \g-> case 'Map'.member k g of
+ False = liftT (Left $ UndeclaredVariableError zero k)
+ True = instantiate $ 'Map'.find k g
+
+//The inference class
+//When tying it all together we will treat the program is a big
+//let x=e1 in let y=e2 in ....
+class infer a :: a -> Typing (Substitution, Type, a)
+
+////---- Inference for Expressions ----
+
+instance infer Expr where
+ infer e = case e of
+ VarExpr _ (VarDef k fs) = lookup k >>= \t ->
+ foldM foldFieldSelectors t fs >>= \finalT ->
+ pure (zero, finalT, e)
+
+ Op2Expr p e1 op e2 =
+ infer e1 >>= \(s1, t1, e1_) ->
+ infer e2 >>= \(s2, t2, e2_) ->
+ fresh >>= \tv ->
+ let given = t1 ->> t2 ->> tv in
+ op2Type op >>= \expected ->
+ lift (unify expected given) >>= \s3 ->
+ pure ((compose s3 $ compose s2 s1), subst s3 tv, Op2Expr p e1_ op e2_)
+
+ Op1Expr p op e1 =
+ infer e1 >>= \(s1, t1, e1_) ->
+ fresh >>= \tv ->
+ let given = t1 ->> tv in
+ op1Type op >>= \expected ->
+ lift (unify expected given) >>= \s2 ->
+ pure (compose s2 s1, subst s2 tv, Op1Expr p op e1)
+
+ EmptyListExpr _ = (\tv->(zero,tv,e)) <$> fresh
+
+ TupleExpr p (e1, e2) =
+ infer e1 >>= \(s1, t1, e1_) ->
+ infer e2 >>= \(s2, t2, e2_) ->
+ pure (compose s2 s1, TupleType (t1,t2), TupleExpr p (e1_,e2_))
+
+ LambdaExpr _ _ _ = liftT $ Left $ Error "PANIC: lambdas should be tasnformed"
+
+ FunExpr p f args fs =
+ lookup f >>= \expected ->
+ let accST = (\(s,ts,es) e->infer e >>= \(s_,et,e_)-> pure (compose s_ s,ts++[et],es++[e_])) in
+ foldM accST (zero,[],[]) args >>= \(s1, argTs, args_)->
+ fresh >>= \tv->case expected of
+ FuncType t = pure (s1, t, e)
+ _ = (let given = foldr (->>) tv argTs in
+ lift (unify expected given) >>= \s2->
+ let fReturnType = subst s2 tv in
+ foldM foldFieldSelectors fReturnType fs >>= \returnType ->
+ (case f of
+ "print" = case head argTs of
+ IntType = pure "1printint"
+ CharType = pure "1printchar"
+ BoolType = pure "1printbool"
+ ListType (CharType) = pure "1printstr"
+ t = liftT $ Left $ SanityError p ("can not print " +++ toString t)
+ _ = pure f) >>= \newF->
+ pure (compose s2 s1, returnType, FunExpr p newF args_ fs))
+
+ IntExpr _ _ = pure $ (zero, IntType, e)
+ BoolExpr _ _ = pure $ (zero, BoolType, e)
+ CharExpr _ _ = pure $ (zero, CharType, e)
+
+foldFieldSelectors :: Type FieldSelector -> Typing Type
+foldFieldSelectors (ListType t) (FieldHd) = pure t
+foldFieldSelectors t=:(ListType _) (FieldTl) = pure t
+foldFieldSelectors (TupleType (t1, _)) (FieldFst) = pure t1
+foldFieldSelectors (TupleType (_, t2)) (FieldSnd) = pure t2
+foldFieldSelectors t fs = liftT $ Left $ FieldSelectorError zero t fs
+
+op2Type :: Op2 -> Typing Type
+op2Type op
+| elem op [BiPlus, BiMinus, BiTimes, BiDivide, BiMod]
+ = pure (IntType ->> IntType ->> IntType)
+| elem op [BiEquals, BiUnEqual]
+ = fresh >>= \t1-> fresh >>= \t2-> pure (t1 ->> t2 ->> BoolType)
+| elem op [BiLesser, BiGreater, BiLesserEq, BiGreaterEq]
+ = pure (IntType ->> IntType ->> BoolType)
+| elem op [BiAnd, BiOr]
+ = pure (BoolType ->> BoolType ->> BoolType)
+| op == BiCons
+ = fresh >>= \t1-> pure (t1 ->> ListType t1 ->> ListType t1)
+
+op1Type :: Op1 -> Typing Type
+op1Type UnNegation = pure $ (BoolType ->> BoolType)
+op1Type UnMinus = pure $ (IntType ->> IntType)
+
+////----- Inference for Statements -----
+applySubst :: Substitution -> Typing Gamma
+applySubst s = changeGamma (subst s)
+
+instance infer Stmt where
+ infer s = case s of
+ IfStmt e th el =
+ infer e >>= \(s1, et, e_)->
+ lift (unify et BoolType) >>= \s2 ->
+ applySubst (compose s2 s1) >>|
+ infer th >>= \(s3, tht, th_)->
+ applySubst s3 >>|
+ infer el >>= \(s4, elt, el_)->
+ applySubst s4 >>|
+ lift (unify tht elt) >>= \s5->
+ let sub = compose s5 $ compose s4 $ compose s3 $ compose s2 s1 in
+ pure (sub, subst s5 tht, IfStmt e_ th_ el_)
+
+ WhileStmt e wh =
+ infer e >>= \(s1, et, e_)->
+ lift (unify et BoolType) >>= \s2 ->
+ applySubst (compose s2 s1) >>|
+ infer wh >>= \(s3, wht, wh_)->
+ pure (compose s3 $ compose s2 s1, subst s3 wht, WhileStmt e_ wh_)
+
+ AssStmt vd=:(VarDef k fs) e =
+ lookup k >>= \expected ->
+ infer e >>= \(s1, given, e_)->
+ foldM reverseFs given (reverse fs) >>= \varType->
+ lift (unify expected varType) >>= \s2->
+ let s = compose s2 s1 in
+ applySubst s >>|
+ changeGamma (extend k (Forall [] (subst s varType))) >>|
+ pure (s, VoidType, AssStmt vd e_)
+
+ FunStmt f args fs =
+ lookup f >>= \expected ->
+ let accST = (\(s,ts,es) e->infer e >>= \(s_,et,e_)-> pure (compose s_ s,ts++[et],es++[e_])) in
+ foldM accST (zero,[],[]) args >>= \(s1, argTs, args_)->
+ fresh >>= \tv->
+ let given = foldr (->>) tv argTs in
+ lift (unify expected given) >>= \s2->
+ let fReturnType = subst s2 tv in
+ foldM foldFieldSelectors fReturnType fs >>= \returnType ->
+ (case f of
+ "print" = case head argTs of
+ IntType = pure "1printint"
+ CharType = pure "1printchar"
+ BoolType = pure "1printbool"
+ ListType (CharType) = pure "1printstr"
+ t = liftT $ Left $ SanityError zero ("can not print " +++ toString t)
+ _ = pure f) >>= \newF->
+ pure (compose s2 s1, VoidType, FunStmt newF args_ fs)
+
+ ReturnStmt Nothing = pure (zero, VoidType, s)
+ ReturnStmt (Just e) = infer e >>= \(sub, t, _)-> pure (sub, t, s)
+
+reverseFs :: Type FieldSelector -> Typing Type
+reverseFs t FieldHd = pure $ ListType t
+reverseFs t FieldTl = pure $ ListType t
+reverseFs t FieldFst = fresh >>= \tv -> pure $ TupleType (t, tv)
+reverseFs t FieldSnd = fresh >>= \tv -> pure $ TupleType (tv, t)
+
+//The type of a list of statements is either an encountered
+//return, or VoidType
+instance infer [a] | infer a where
+ infer [] = pure (zero, VoidType, [])
+ infer [stmt:ss] =
+ infer stmt >>= \(s1, t1, s_) ->
+ applySubst s1 >>|
+ infer ss >>= \(s2, t2, ss_) ->
+ applySubst s2 >>|
+ case t1 of
+ VoidType = pure (compose s2 s1, t2, [s_:ss_])
+ _ = case t2 of
+ VoidType = pure (compose s2 s1, t1, [s_:ss_])
+ _ = lift (unify t1 t2) >>= \s3 ->
+ pure (compose s3 $ compose s2 s1, t1, [s_:ss_])
+
+//the type class inferes the type of an AST element (VarDecl or FunDecl)
+//and adds it to the AST element
+class type a :: a -> Typing (Substitution, a)
+
+instance type VarDecl where
+ type (VarDecl p expected k e) =
+ infer e >>= \(s1, given, e_) ->
+ applySubst s1 >>|
+ case expected of
+ Nothing = pure zero
+ Just expected_ = lift (unify expected_ given)
+ >>= \s2->
+ applySubst s2 >>|
+ let vtype = subst (compose s2 s1) given in
+ generalize vtype >>= \t ->
+ changeGamma (extend k t) >>|
+ pure (compose s2 s1, VarDecl p (Just vtype) k e_)
+
+instance type FunDecl where
+ type (FunDecl p f args expected vds stmts) =
+ gamma >>= \outerScope-> //functions are infered in their own scopde
+ introduce f >>|
+ mapM introduce args >>= \argTs->
+ type vds >>= \(s1, tVds)->
+ applySubst s1 >>|
+ infer stmts >>= \(s2, result, stmts_)->
+ applySubst s1 >>|
+ let argTs_ = map (subst $ compose s2 s1) argTs in
+ let given = foldr (->>) result argTs_ in
+ (case expected of
+ Nothing = pure zero
+ Just (FuncType expected_) = lift (unify expected_ given)
+ Just expected_ = lift (unify expected_ given)
+ ) >>= \s3 ->
+ let ftype = subst (compose s3 $ compose s2 s1) given in
+ (case ftype of
+ _ ->> _ = pure ftype
+ _ = pure $ FuncType ftype
+ ) >>= \ftype_->
+ generalize ftype_ >>= \t->
+ putGamma outerScope >>|
+ changeGamma (extend f t) >>|
+ pure (compose s3 $ compose s2 s1, FunDecl p f args (Just ftype_) tVds stmts_)
+
+instance type [a] | type a where
+ type [] = pure (zero, [])
+ type [v:vs] =
+ type v >>= \(s1, v_)->
+ applySubst s1 >>|
+ type vs >>= \(s2, vs_)->
+ applySubst (compose s2 s1) >>|
+ pure (compose s2 s1, [v_:vs_])
+
+introduce :: String -> Typing Type
+introduce k =
+ fresh >>= \tv ->
+ changeGamma (extend k (Forall [] tv)) >>|
+ pure tv
+
+instance toString Scheme where
+ toString (Forall x t) =
+ concat ["Forall ": intersperse "," x] +++ concat [". ", toString t];