Difference between revisions of "IO inside"

putStrLn "Press any key to begin formatting"

getchar :: Char

get2chars = [getchar, getchar]

get2chars = let x = getchar in [x, x]  -- this should be a legitimate optimisation!

getchar :: Int -> Char

get2chars = [getchar 1, getchar 2]

-- | Decide between "Now" and "Later" from one character obtained with
-- 'getchar'.  Case alternatives (guarded or not) are introduced with @->@,
-- not @=@.
now_or_later :: String
now_or_later = case getchar 0 of
                 c | c == 'y'  -> "Now"
                   | c == 'Y'  -> "Now"
                 _             -> "Later"

getchar :: Time -> Char

get2chars (t1, t2) = [getchar t1, getchar t2]

-- | Decide between "Now" and "Later" from the character that 'getchar'
-- yields for the given time.  Case alternatives use @->@, not @=@.
now_or_later :: Time -> String
now_or_later t = case getchar t of
                   c | c == 'y'  -> "Now"
                     | c == 'Y'  -> "Now"
                   _             -> "Later"

getchar :: Val -> Char

-- | Decide between "Now" and "Later" from the character that 'getchar'
-- yields for the given 'Val'.  Case alternatives use @->@, not @=@.
now_or_later :: Val -> String
now_or_later u = case getchar u of
                 c | c == 'y'  -> "Now"
                   | c == 'Y'  -> "Now"
                 _             -> "Later"

get2chars :: (Val, Val) -> String
get2chars (u1, u2) = [getchar u1, getchar u2]

getchar :: Val -> (Char, Val)

get2chars :: (Val, Val) -> String
get2chars (u1, u2) = [a, b]  where (a, u3) = getchar u1
                                   (b, _ ) = getchar u3

-- | Decide between "Now" and "Later" from one character.  At this stage
-- 'getchar' returns a @(Char, Val)@ pair, so the character is taken out of
-- the pair and the returned 'Val' is ignored.  Case alternatives use @->@.
now_or_later :: Val -> String
now_or_later u = case getchar u of
                   (c, _) | c == 'y'  -> "Now"
                          | c == 'Y'  -> "Now"
                   _                  -> "Later"

get2chars :: Val -> String
get2chars u1 = [a, b]  where (a, u2) = getchar u1
                             (b, _ ) = getchar u2

get2chars    :: Val -> String
now_or_later :: Val -> String

get4chars (u1, u2) = [get2chars u1, get2chars u2]  -- order of calls to 'get2chars' isn't defined

get2chars :: Val -> (String, Val)

get4chars u0 = (a++b)  where (a, u1) = get2chars u0
                             (b, _ ) = get2chars u1

getchar :: Val -> (Char, Val)

get2chars :: Val -> (String, Val)
get2chars u0 = ([a, b], u2)  where (a, u1) = getchar u0
                                   (b, u2) = getchar u1
-- | Read four characters by running 'get2chars' twice; the 'Val' returned by
-- the first call is the input of the second, which fixes the order of calls.
get4chars :: Val -> (String, Val)
get4chars u0 = (a++b, u2)    where (a, u1) = get2chars u0
                                   (b, u2) = get2chars u1

-- | Decide between "Now" and "Later" from one character, and pass on the
-- 'Val' returned by 'getchar'.  Case alternatives use @->@, not @=@.
now_or_later :: Val -> (String, Val)
now_or_later u = case getchar u of
                   (c, u') | c == 'y'  -> ("Now",   u')
                           | c == 'Y'  -> ("Now",   u')
                   (_, u')             -> ("Later", u')

-- Deliberately broken example: the first 'getchar' call takes @u2@, which is
-- only produced by the second call, which in turn needs @u1@ from the first.
-- The two bindings depend on each other, and @u0@ is never used.
get2chars :: Val -> (String, Val)
get2chars u0 = ([a, b], u2)  where (a, u1) = getchar u2  -- this might take
                                   (b, u2) = getchar u1  --    a while...

-- Deliberately broken example: with nested @let@s, @u2@ is not in scope at
-- the point where the first 'getchar' call uses it.
get2chars :: Val -> (String, Val)
get2chars u0 = let (a, u1) = getchar u2 in  -- error: u2 is undefined!
               let (b, u2) = getchar u1 in
               ([a, b], u2)

-- Deliberately broken example: the second binding defines @u2@ in terms of
-- itself, and @u1@ (returned by the first call) is never used.
get2chars :: Val -> (String, Val)
get2chars u0 = let (a, u1) = getchar u0 in
               let (b, u2) = getchar u2 in  -- here we go again...
               ([a, b], u2)

class Monad m where
    unit :: a -> m a
    bind :: m a -> (a -> m b) -> m b

-- | An action is modelled as a function that takes a 'Val' and returns a
-- result paired with a 'Val'.
type IO' a =  Val -> (a, Val)

-- | Wrap a plain value: the incoming 'Val' is handed back unchanged.
unit       :: a -> IO' a
unit x     =  \u0 -> (x, u0)

-- | Run @m@, feed its result to @k@, and pass the 'Val' returned by @m@ to
-- the action produced by @k@.
bind       :: IO' a -> (a -> IO' b) -> IO' b
bind m k   =  \u0 -> let (x, u1) =  m u0 in
                     let (y, u2) =  k x u1 in
                     (y, u2)

getchar      :: IO' Char    {-  = Val -> (Char, Val)  -}

get2chars    :: IO' String  {-  = Val -> (String, Val)  -}

get2chars =  \u0 -> let (a, u1) =  getchar u0 in
                    let (b, u2) =  getchar u1 in
                    let r       =  [a, b] in
                    (r, u2)

get4chars    :: IO' String  {-  = Val -> (String, Val)  -}

get4chars =  \u0 -> let (a, u1) = get2chars u0 in
                    let (b, u2) = get2chars u1 in
                    let r       = a++b in
                    (r, u2)

now_or_later :: IO' String  {-  = Val -> (String, Val) -}
now_or_later = \u -> let (c, u') = getchar u in
                     let r = if elem c "yY" then "Now" else "Later" in
                     (r, u')

getchar   :: IO' Char

get2chars :: IO' String
get2chars =  getchar `bind` \a ->
             getchar `bind` \b ->
             unit [a, b]

get4chars :: IO' String
get4chars =  get2chars `bind` \a ->
             get2chars `bind` \b ->
             unit (a++b)

now_or_later :: IO' String
now_or_later = getchar `bind` \c ->
               unit (if elem c "yY" then "Now" else "Later")

main :: RealWorld -> ((), RealWorld)

type IO a  =  RealWorld -> (a, RealWorld)

getChar :: RealWorld -> (Char, RealWorld)

main :: RealWorld -> ((), RealWorld)
main world0 = let (a, world1) = getChar world0
                  (b, world2) = getChar world1
              in ((), world2)

main = do a <- ask "What is your name?"
          b <- ask "How old are you?"
          return ()

ask s = do putStr s
           readLn

-- | Run @action@ on the given world only if @condition@ holds; otherwise
-- return @()@ together with the world unchanged.
when :: Bool -> IO () -> IO ()
when condition action world =
    if condition
      then action world
      else ((), world)

  main = do putStr "Hello!"

  main = putStr "Hello!"

main = do putStr "What is your name?"
          putStr "How old are you?"
          putStr "Nice day!"

main = (putStr "What is your name?")
       >> ( (putStr "How old are you?")
            >> (putStr "Nice day!")
          )

(>>) :: IO a -> IO b -> IO b
(action1 >> action2) world0 =
   let (a, world1) = action1 world0
       (b, world2) = action2 world1
   in (b, world2)

action1 >> action2 = action
  where
    action world0 = let (a, world1) = action1 world0
                        (b, world2) = action2 world1
                    in (b, world2)

main = do a <- readLn
          print a

main = readLn
       >>= (\a -> print a)

(>>=) :: IO a -> (a -> IO b) -> IO b
(action >>= reaction) world0 =
   let (a, world1) = action world0
       (b, world2) = reaction a world1
   in (b, world2)

type IO a  =  RealWorld -> (a, RealWorld)

main = readLn >>= print

 do x <- action1
    action2

 action1 >>= (\x -> action2)

main = do putStr "What is your name?"
          a <- readLn
          putStr "How old are you?"
          b <- readLn
          print (a,b)

main = putStr "What is your name?"
       >> readLn
       >>= \a -> putStr "How old are you?"
       >> readLn
       >>= \b -> print (a,b)

-- | An action that does nothing with the world: it yields @a@ and hands back
-- the world it was given.
return :: a -> IO a
return a world0  =  (a, world0)

main = do a <- readLn
          return (a*2)

main = do a <- readLn
          when (a>=0) $ do
              return ()
          print "a is negative"

main = do a <- readLn
          if (a>=0)
            then return ()
            else print "a is negative"

main = do a <- readLn
          if (a>=0) then return ()
            else do
          print "a is negative"
          ...

-- | Lift a pure function so that it transforms the result of an I/O action.
liftM :: (a -> b) -> (IO a -> IO b)

liftM f action = action >>= \x -> return (f x)

-- Illustrative (non-working) example built on hypothetical pure operations
-- 'readVariable' / 'writeVariable'.  The write is bound to @_@ in a @let@, so
-- nothing ever demands it, and @a0@ and @a1@ are the very same expression.
main = do let a0 = readVariable varA
              _  = writeVariable varA 1
              a1 = readVariable varA
          print (a0, a1)

import Data.IORef
main = do varA <- newIORef 0  -- Create and initialize a new variable
          a0 <- readIORef varA
          writeIORef varA 1
          a1 <- readIORef varA
          print (a0, a1)

import Data.Array.IO
main = do arr <- newArray (1,10) 37 :: IO (IOArray Int Int)
          a <- readArray arr 1
          writeArray arr 1 64
          b <- readArray arr 1
          print (a, b)

rand :: IO Int

foreign import ccall
   sin :: Double -> Double

foreign import ccall
   tell :: Int -> IO Int

runST :: (forall s . ST s a) -> a

newSTRef :: a -> ST s (STRef s a)
newArray_ :: Ix i => (i, i) -> ST s (STArray s i e)

-- Illustrative example that the type checker is expected to reject: 'runST'
-- requires its argument to be polymorphic in @s@ (@forall s . ST s a@), so
-- the result type may not mention @s@ -- but here it would be @STRef s a@.
makeSTRef :: a -> STRef s a
makeSTRef a = runST (newSTRef a)

stToIO :: ST RealWorld a -> IO a

-- | Create a reference holding 0, increment it once, and read it back.
oneST :: ST s Integer -- note that this works correctly for any s
oneST = do var <- newSTRef 0
           modifySTRef var (+1)
           readSTRef var

-- | Pure result of running 'oneST'.  The type is 'Integer' so that it agrees
-- with the result type of 'oneST'.
one :: Integer
one = runST oneST

main world0 = let get2chars = getChar >> getChar
                  ((), world1) = putStr "Press two keys" world0
                  (answer, world2) = get2chars world1
              in ((), world2)

main = do let get2chars = getChar >> getChar
          putStr "Press two keys"
          get2chars
          return ()

ioActions :: [IO ()]
ioActions = [(print "Hello!"),
             (putStr "just kidding"),
             (getChar >> return ())
            ]

ioActions :: [RealWorld -> ((), RealWorld)]

main = do head ioActions
          ioActions !! 1
          last ioActions

-- | Run every action of the list from left to right, discarding the results.
sequence_ :: [IO a] -> IO ()
sequence_ = foldr (>>) (return ())

main = sequence_ ioActions

while :: IO Bool -> IO ()
while action = ???

-- The @let@ only gives names to these actions; the only action that is part
-- of @main@'s sequence is the final 'putStr'.
-- 'when' takes an @IO ()@, so the 'Char' result of 'getChar' is discarded
-- before the action is passed to it.
main = do let a = sequence ioActions
              b = when True (getChar >> return ())
              c = getChar >> getChar
          putStr "These let-bindings are not executed!"

readi h i = do hSeek h AbsoluteSeek i
               hGetChar h

readfilei :: String -> IO (Integer -> IO Char)
readfilei name = do h <- openFile name ReadMode
                    return (readi h)

readfilei name = do h <- openFile name ReadMode
                    let readi h i = do hSeek h AbsoluteSeek i
                                       hGetChar h
                    return (readi h)

readfilei name = do h <- openFile name ReadMode
                    let readi i = do hSeek h AbsoluteSeek i
                                     hGetChar h
                    return readi

main = do myfile <- readfilei "test"
          a <- myfile 0
          b <- myfile 1
          print (a,b)

memoryAllocator :: Ptr a -> Int -> IO (Int -> IO (Ptr b),
                                       Ptr c -> IO ())

memoryAllocator buf size = do ......
                              let alloc size = do ...
                                                  ...
                                  free ptr = do ...
                                                ...
                              return (alloc, free)

memoryAllocator buf size = do start <- newIORef buf
                              end <- newIORef (buf `plusPtr` size)
                              ...

      ...
      let alloc size = do addr <- readIORef start
                          writeIORef start (addr `plusPtr` size)
                          return addr
                          
      let free ptr = do writeIORef start ptr

main = do buf1 <- mallocBytes (2^16)
          buf2 <- mallocBytes (2^20)
          (alloc1, free1) <- memoryAllocator buf1 (2^16)
          (alloc2, free2) <- memoryAllocator buf2 (2^20)
          ptr11 <- alloc1 100
          ptr21 <- alloc2 1000
          free1 ptr11
          free2 ptr21
          ptr12 <- alloc1 100
          ptr22 <- alloc2 1000

data Figure = Figure { draw :: IO (),
                       move :: Displacement -> IO ()
                     }

type Displacement = (Int, Int)  -- horizontal and vertical displacement in points

circle    :: Point -> Radius -> IO Figure
rectangle :: Point -> Point -> IO Figure

type Point = (Int, Int)  -- point coordinates
type Radius = Int        -- circle radius in points

circle center radius = do
    let description = "  Circle at "++show center++" with radius "++show radius
    return $ Figure { draw = putStrLn description }

-- | Build a rectangle 'Figure' whose 'draw' action prints a one-line
-- description made from the two given corner points.
rectangle from to = do
    let description = "  Rectangle "++show from++"-"++show to
    return $ Figure { draw = putStrLn description }

-- | Print a heading, then run the 'draw' action of each figure in list order.
drawAll :: [Figure] -> IO ()
drawAll figures =
    putStrLn "Drawing figures:" >> mapM_ draw figures

main = do figures <- sequence [circle (10,10) 5,
                               circle (20,20) 3,
                               rectangle (10,10) (20,20),
                               rectangle (15,15) (40,40)]
          drawAll figures

-- | Build a movable circle 'Figure'.  The centre is kept in an 'IORef' so
-- that 'move' can update it and a later 'draw' sees the new position.
circle center radius = do
    centerVar <- newIORef center
    
    -- Reads the current centre each time it runs, then prints the description.
    let drawF = do center <- readIORef centerVar
                   putStrLn ("  Circle at "++show center
                             ++" with radius "++show radius)
                   
    -- Shifts the stored centre by the given displacement.
    let moveF (addX,addY) = do (x,y) <- readIORef centerVar
                               writeIORef centerVar (x+addX, y+addY)
                               
    return $ Figure { draw=drawF, move=moveF }
   
-- | Build a movable rectangle 'Figure'.  Both corners are kept in 'IORef's so
-- that 'move' can update them and a later 'draw' sees the new position.
rectangle from to = do
    fromVar <- newIORef from
    toVar   <- newIORef to

    -- Reads both corners each time it runs, then prints the description.
    let drawF = do from <- readIORef fromVar
                   to   <- readIORef toVar
                   putStrLn ("  Rectangle "++show from++"-"++show to)
                   
    -- Shifts both stored corners by the same displacement.
    let moveF (addX,addY) = do (fromX,fromY) <- readIORef fromVar
                               (toX,toY)     <- readIORef toVar
                               writeIORef fromVar (fromX+addX, fromY+addY)
                               writeIORef toVar   (toX+addX, toY+addY)

    return $ Figure { draw=drawF, move=moveF }

main = do figures <- sequence [circle (10,10) 5,
                               rectangle (10,10) (20,20)]
          drawAll figures
          mapM_ (\fig -> move fig (10,10)) figures
          drawAll figures

data Figure = Figure { draw :: IO (),
                       move :: Displacement -> IO (),
                       area :: Double,
                       origin :: IORef Point
                     }

main = print (f 2)

f 0 = "zero"
f 1 = "one"

main = print (head [])

main = print (1 + (error "Value that wasn't initialized or cannot be computed"))

{-# LANGUAGE ForeignFunctionInterface #-}

main = do print "Hello from main"
          c_function

haskell_function = print "Hello from haskell_function"

foreign import ccall safe "prototypes.h"
    c_function :: IO ()

foreign export ccall
    haskell_function :: IO ()

#include <stdio.h>
#include "prototypes.h"

/* Prints a greeting, then calls haskell_function(). */
void c_function (void)
{
  printf("Hello from c_function\n");
  haskell_function();
}

extern void c_function (void);
extern void haskell_function (void);

 ghc --make main.hs vile.c

 ghc -c vile.c
 ghc --make main.hs vile.o

#ifdef __cplusplus
extern "C" {
#endif

extern void c_function (void);
extern void haskell_function (void);

#ifdef __cplusplus
}
#endif

 ghc --make main.hs vile.cpp

foreign import ccall safe "prototypes.h CFunction"
    c_function :: IO ()

foreign export ccall "HaskellFunction"
    haskell_function :: IO ()

foreign import stdcall unsafe "windows.h SetFileApisToOEM"
  setFileApisToOEM :: IO ()

import Foreign.C.Types (               -- equivalent to the following C type:
         CChar, CUChar,                --  char/unsigned char
         CShort, CUShort,              --  short/unsigned short
         CInt, CUInt, CLong, CULong,   --  int/unsigned/long/unsigned long
         CFloat, CDouble...)           --  float/double

-- The entity string names the header and the C function ("sin").  With the
-- header alone, the C name would default to the Haskell name @c_sin@, which
-- math.h does not provide.
foreign import ccall unsafe "math.h sin"
    c_sin :: CDouble -> CDouble

-- |Type-conversion wrapper around c_sin
-- ('realToFrac' converts between 'Double' and 'CDouble' in both directions).
sin :: Double -> Double
sin = realToFrac . c_sin . realToFrac

import Foreign.C.String (   -- representation of strings in C
         CString,           -- = Ptr CChar
         CStringLen)        -- = (Ptr CChar, Int)

-- The entity string names the header and the C function ("strlen").  With
-- the header alone, the C name would default to the Haskell name @c_strlen@.
foreign import ccall unsafe "string.h strlen"
    c_strlen :: CString -> IO CSize     -- CSize defined in Foreign.C.Types and is equal to size_t

-- |Type-conversion wrapper around c_strlen 
strlen :: String -> Int
strlen = ....

getchar :: Char

get2chars = [getchar, getchar]

void putchar(char c);

putchar :: Char -> ()
putchar c = ...

readContents :: Filename -> String

unsafePerformIO :: IO a -> a

unsafePerformIO :: (RealWorld -> (a, RealWorld)) -> a
unsafePerformIO action = let (a, world1) = action createNewWorld
                         in a

one :: Integer
one = unsafePerformIO $ do var <- newIORef 0
                           modifyIORef var (+1)
                           readIORef var

unsafePerformIO action = let (a,world1) = action createNewWorld
                         in (world1 `seq` a)

-- | Just like unsafePerformIO, but we inline it. Big performance gains as
-- it exposes lots of things to further inlining
{-# INLINE inlinePerformIO #-}
inlinePerformIO action = let (a, world1) = action createNewWorld
                         in (world1 `seq` a)
#endif

-- | Run @body@ on a pointer into the buffer and continue with a buffer in
-- which @n@ more bytes are accounted for.  If @n <= l@ the current buffer is
-- used; otherwise the continuation goes through @flushOld@ and a buffer from
-- @newBuffer@ is used with the three counters reset to 0.
-- NOTE(review): presumably @o@/@u@/@l@ are offset, used and remaining
-- lengths of the buffer -- confirm against the 'Buffer' definition.
write :: Int -> (Ptr Word8 -> IO ()) -> Put ()
write !n body = Put $ \c buf@(Buffer fp o u l) ->
  if n <= l
    then write' c fp o u l
    else write' (flushOld c n fp o u) (newBuffer c n) 0 0 0

  where {-# NOINLINE write' #-}
        -- The result of 'inlinePerformIO' is forced with 'seq' before the
        -- continuation @c@ is applied to the updated buffer.
        write' c !fp !o !u !l =
          -- warning: this is a tad hardcore
          inlinePerformIO
            (withForeignPtr fp
              (\p -> body $! (p `plusPtr` (o+u))))
          `seq` c () (Buffer fp o (u+n) (l-n))

word8 w = write 1 (\p -> poke p w)

unsafeInterleaveIO :: IO a -> IO a

unsafeInterleaveIO   :: IO a -> IO a
unsafeInterleaveIO a =  return (unsafePerformIO a)

do let c = unsafePerformIO getChar
   do_proc c

do let s = [unsafePerformIO getChar, unsafePerformIO getChar, unsafePerformIO getChar]
   do_proc s

do str <- unsafeInterleaveIO myGetContents

-- | Read one character with 'getChar' and put it in front of the remaining
-- input; the recursive call for the rest is wrapped in 'unsafeInterleaveIO'.
myGetContents = do
   c <- getChar
   s <- unsafeInterleaveIO myGetContents
   return (c:s)

myGetContents = do
   c <- replicateM 512 getChar
   s <- unsafeInterleaveIO myGetContents
   return (c++s)

myGetContents = unsafeInterleaveIO $ do
   c <- replicateM 512 getChar
   s <- myGetContents
   return (c++s)

newtype IO a = IO (State# RealWorld -> (# State# RealWorld, a #))

data World = World
newtype IO a = IO (World -> Either IOError a)

Difference between revisions of "IO inside"

Revision as of 04:58, 8 January 2022

Contents

Haskell is a pure language

I/O in Haskell, simplified

A matter of time

A change of input

One step after another

The fun of plumbing

Enter the monad

Running with the `RealWorld`

`(>>=)` and `do` notation

Mutable data (references, arrays, hash tables...)

Encapsulated mutable data: ST

I/O actions as values

Example: a list of I/O actions

Example: returning an I/O action as a result

Example: a memory allocator generator

Example: emulating OOP with record types

Exception handling (under development)

Interfacing with C/C++ and foreign libraries (under development)

Calling functions

All about the `foreign` declaration

Marshalling simple types

Memory management

Marshalling strings

Marshalling composite types

Dynamic calls

DLLs

The dark side of the I/O monad

unsafePerformIO

inlinePerformIO

unsafeInterleaveIO

Welcome to the machine: the actual GHC implementation

The Yhc/nhc98 implementation

Further reading

To-do list

Navigation menu

Search

@@ Line 17: / Line 17: @@
 Compared to an optimizing C compiler, a Haskell compiler is a set of pure mathematical transformations. This results in much better high-level optimization facilities. Moreover, pure mathematical computations can be much more easily divided into several threads that may be executed in parallel, which is increasingly important in these days of multi-core CPUs. Finally, pure computations are less error-prone and easier to verify, which adds to Haskell's robustness and to the speed of program development using Haskell.
-Haskell's purity allows the compiler to call only functions whose results are really required to calculate the final value of a top-level function (e.g. <code>main</code>) - this is called lazy evaluation. It's a great thing for pure mathematical computations, but how about I/O actions? A function like
+Haskell's purity allows the compiler to call only functions whose results are really required to calculate the final value of a top-level definition (e.g. <code>main</code>) - this is called lazy evaluation. It's a great thing for pure mathematical computations, but how about I/O actions? A function like
 <haskell>
@@ Line 51: / Line 51: @@
 </haskell>
-Right away, this solves the first problem mentioned above - now the compiler will make two calls because it sees that the calls have different parameters. But there's another problem:
+That solves the first problem mentioned above - now the compiler will make two calls because it sees that the calls have different parameters. So a single call to <code>getchar</code> should be even easier:
+<haskell>
+now_or_later :: String
+now_or_later = case getchar 0 of
+                 c | c == 'y'  -> "Now"
+                   | c == 'Y'  -> "Now"
+                 _             -> "Later"
+</haskell>
+...or not - depending on when the program is running (and how interested the user is :-) <code>getchar 0</code> could equal:
+* <code>'y'</code>
+* <code>'Y'</code>
+* ...or any other possible character: ''ouch!''
+=== A matter of time ===
+The problem is that while <code>getchar</code> looks like a function, it breaks one of the rules of being a function:
+* if a function's result changes, it '''should be''' because its arguments have changed.
+Instead of arbitrary <code>Int</code> values, what about using an ever-changing quantity as the input to <code>getchar</code>...like time? We just need to modify <code>get2chars</code> and <code>now_or_later</code> accordingly:
+<haskell>
+getchar :: Time -> Char
+get2chars (t1, t2) = [getchar t1, getchar t2]
+now_or_later :: Time -> String
+now_or_later t = case getchar t of
+                   c | c == 'y'  -> "Now"
+                     | c == 'Y'  -> "Now"
+                   _             -> "Later"
+</haskell>
+Now the result of calling <code>getchar</code> is free to change along with its input, irrespective of when the user runs the program - one user, that is.
+What if the program supports multiple users, and:
+* one presses <code>'y'</code>,
+* another presses <code>'n'</code>,
+* the rest press the space bar: <code> </code>,
+at exactly the same time - what should the result of <code>getchar</code> be equal to then?
+We could try to avoid the problem by measuring time down to the nearest millisecond, microsecond, nanosecond, etc - however, these days humans aren't the only users: a program can also use another program. It's happening right now in the operating system running on your computer.
+=== A change of input ===
+So, what was the problem with <code>getchar</code> again? Oh, right - it breaks one of the rules of being a function:
+* if a function's result changes, it should be because its arguments have changed.
+This rule ''works'' - just ask your nearest mathematician, physicist, engineer, chemist, geologist, biologist ''et al''. That means the problem must be with what we've tried using as an argument to <code>getchar</code>. To avoid further distraction (and annoyance!), let's just make a really big assumption:
+* each call to <code>getchar</code> will use a unique argument, of type <code>Val</code>.
+Based on that assumption:
+<haskell>
+getchar :: Val -> Char
+now_or_later :: Val -> String
+now_or_later u = case getchar u of
+                 c | c == 'y'  -> "Now"
+                   | c == 'Y'  -> "Now"
+                 _             -> "Later"
+get2chars :: (Val, Val) -> String
+get2chars (u1, u2) = [getchar u1, getchar u2]
+</haskell>
+At some point, we will have to define what <code>Val</code> is. For now, we'll see how far we can go using our assumption.
+=== One step after another ===
+We now face another problem:
 * even if it does make two calls, there is no way to determine which call should be performed first. Do you want to return the two characters in the order in which they were read, or in the opposite order? Nothing in the definition of <code>get2chars</code> answers this question.
-We need to give the compiler some clue to determine which function it should call first. The Haskell language doesn't provide any way to specify the sequence needed to evaluate <code>getchar 1</code> and <code>getchar 2</code> - except for data dependencies! How about adding an artificial data dependency which prevents evaluation of the second <code>getchar</code> before the first one? In order to achieve this, we will return an additional fake result from <code>getchar</code> that will be used as a parameter for the next <code>getchar</code> call:
+We need to give the compiler some clue to determine which function it should call first. The Haskell language doesn't provide any way to specify the sequence needed to evaluate <code>getchar u1</code> and <code>getchar u2</code> - except for data dependencies! How about adding an artificial data dependency which prevents evaluation of the second <code>getchar</code> before the first one? In order to achieve this, we will return an additional abstract result from <code>getchar</code> that will be used as a parameter for the next <code>getchar</code> call:
 <haskell>
-getchar :: Int -> (Char, Int)
+getchar :: Val -> (Char, Val)
-get2chars _ = [a, b]  where (a, i) = getchar 1
+get2chars :: (Val, Val) -> String
-                            (b, _) = getchar i
+get2chars (u1, u2) = [a, b]  where (a, u3) = getchar u1
+                                   (b, _ ) = getchar u3
+now_or_later :: Val -> String
+now_or_later u = case getchar u of
+                   (c, _) | c == 'y'  -> "Now"
+                          | c == 'Y'  -> "Now"
+                   _                  -> "Later"
 </haskell>
-So far so good - now we can guarantee that <code>a</code> is read before <code>b</code> because reading <code>b</code> needs the value (<code>i</code>) that is returned by reading <code>a</code>!
+So far, so good - now we can guarantee that <code>a</code> is read before <code>b</code> because reading <code>b</code> needs the value (<code>u3</code>) that is returned by reading <code>a</code>! As a bonus,
+we can simplify <code>get2chars</code>:
+<haskell>
-We've added a fake parameter to <code>get2chars</code> but the problem is that the Haskell compiler is too smart! It can believe that the external <code>getchar</code> function is really dependent on its parameter but for <code>get2chars</code> it will see that we're just cheating because we throw it away! Therefore it won't feel obliged to execute the calls in the order we want.
+get2chars :: Val -> String
+get2chars u1 = [a, b]  where (a, u2) = getchar u1
+                             (b, _ ) = getchar u2
+</haskell>
+Note the similarity of type signatures for <code>get2chars</code> and <code>now_or_later</code>:
-How can we fix this? How about passing this fake parameter to the <code>getchar</code> function? In this case the compiler can't guess that it is really unused.
 <haskell>
-get2chars i0 = [a, b]  where (a, i1) = getchar i0
+get2chars    :: Val -> String
+now_or_later :: Val -> String
-                             (b, i2) = getchar i1
 </haskell>
+...which brings us to the next problem - what if e.g. <code>get2chars</code> is called twice:
-Furthermore, <code>get2chars</code> has the same purity problems as the <code>getchar</code> function. If you need to call it two times, you need a way to describe the order of these calls. Consider this:
 <haskell>
-get4chars = [get2chars 1, get2chars 2]  -- order of calls to 'get2chars' isn't defined
+get4chars (u1, u2) = [get2chars u1, get2chars u2]  -- order of calls to 'get2chars' isn't defined
 </haskell>
-We already know how to deal with this problem: <code>get2chars</code> should also return some fake value that can be used to order calls:
+But we already know how to deal with this problem: <code>get2chars</code> should also return an abstract value that can be used to order calls:
 <haskell>
-get2chars :: Int -> (String, Int)
+get2chars :: Val -> (String, Val)
-get4chars i0 = (a++b)  where (a, i1) = get2chars i0
+get4chars u0 = (a++b)  where (a, u1) = get2chars u0
-                             (b, i2) = get2chars i1
+                             (b, _ ) = get2chars u1
 </haskell>
-But what should the fake return value of <code>get2chars</code> be? If we use some integer constant, the excessively smart Haskell compiler will guess that we're cheating again. What about returning the value returned by <code>getchar</code>? See:
+...but what should the abstract value returned by <code>get2chars</code> be? Or <code>get4chars</code>,
+<code>get8chars</code>, <code>get16chars</code>...? Let's try going in the opposite direction:
+* <code>get4chars</code> calls <code>get2chars :: Val -> (String, Val)</code>
+* <code>get2chars</code> calls <code>getchar   :: Val -> (Char, Val)</code>
+So in a call to <code>get4chars</code>, <code>getchar</code> is the very last definition to use ''and return'' one of those abstract values - it's that returned value we need:
 <haskell>
-get2chars :: Int -> (String, Int)
+getchar :: Val -> (Char, Val)
-get2chars i0 = ([a, b], i2)  where (a, i1) = getchar i0
+get2chars :: Val -> (String, Val)
-                                   (b, i2) = getchar i1
+get2chars u0 = ([a, b], u2)  where (a, u1) = getchar u0
+                                   (b, u2) = getchar u1
+get4chars :: Val -> (String, Val)
+get4chars u0 = (a++b, u2)    where (a, u1) = get2chars u0
+                                   (b, u2) = get2chars u1
+now_or_later :: Val -> (String, Val)
+now_or_later u = case getchar u of
+                   (c, u') | c == 'y'  -> ("Now",   u')
+                           | c == 'Y'  -> ("Now",   u')
+                   (_, u')             -> ("Later", u')
 </haskell>
+=== The fun of plumbing ===
-While that does work, it's error-prone:
+While that does work, it's error-prone, e.g.:
 <haskell>
-get2chars :: Int -> (String, Int)
+get2chars :: Val -> (String, Val)
-get2chars i0 = ([a, b], i2)  where (a, i1) = getchar i2  -- this might take a while...
+get2chars u0 = ([a, b], u2)  where (a, u1) = getchar u2  -- this might take
-                                   (b, i2) = getchar i1
+                                   (b, u2) = getchar u1  --    a while...
 </haskell>
@@ Line 109: / Line 212: @@
 <haskell>
-get2chars :: Int -> (String, Int)
+get2chars :: Val -> (String, Val)
-get2chars i0 = let (a, i1) = getchar i2 in  -- error: i2 is undefined!
+get2chars u0 = let (a, u1) = getchar u2 in  -- error: u2 is undefined!
-               let (b, i2) = getchar i1 in
+               let (b, u2) = getchar u1 in
-               ([a, b], i2)
+               ([a, b], u2)
 </haskell>
@@ Line 118: / Line 221: @@
 <haskell>
-get2chars :: Int -> (String, Int)
+get2chars :: Val -> (String, Val)
-get2chars i0 = let (a, i1) = getchar i0 in
+get2chars u0 = let (a, u1) = getchar u0 in
-               let (b, i2) = getchar i2 in  -- here we go again...
+               let (b, u2) = getchar u2 in  -- here we go again...
-               ([a, b], i2)
+               ([a, b], u2)
 </haskell>
+We need some way to automate the chore of passing around all those abstract values...
-So how in Haskell shall we prevent such mistakes from happening? With a [[monad]]!
-=== What is a monad? ===
+=== Enter the monad ===
 But what is a monad? For Haskell, it's a three-way partnership between:
@@ Line 133: / Line 236: @@
 * an operator <code>bind(M) :: M a -> (a -> M b) -> M b</code>
-where <code>unit(M)</code> and <code>bind(M)</code> satisify the [[monad laws]].
+where <code>unit(M)</code> and <code>bind(M)</code> satisfy the [[monad laws]].
 This would translate literally into Haskell as:
@@ Line 145: / Line 248: @@
 For now, we'll just define <code>unit</code> and <code>bind</code> directly - no type classes.
-So how does something so <strike>vague</strike> abstract help us with I/O? Because this abstraction allows us to hide the manipulation of all those fake values - the ones we've been using to maintain the correct sequence of evaluation. We just need a suitable type:
+So how does something so <strike>vague</strike> abstract help us with I/O? Because this abstraction allows us to hide the manipulation of all those abstract values - the ones we've been using to maintain the correct sequence of evaluation. We just need a suitable type:
 <haskell>
-type IO' a =  Int -> (a, Int)
+type IO' a =  Val -> (a, Val)
 </haskell>
-and appropriate defintions for <code>unit</code> and <code>bind</code>:
+and appropriate definitions for <code>unit</code> and <code>bind</code>:
 <haskell>
 unit       :: a -> IO' a
-unit x     =  \i0 -> (x, i0)
+unit x     =  \u0 -> (x, u0)
 bind       :: IO' a -> (a -> IO' b) -> IO' b
-bind m k   =  \i0 -> let (x, i1) =  m i0 in
+bind m k   =  \u0 -> let (x, u1) =  m u0 in
-                     let (y, i2) =  k x i1 in
+                     let (y, u2) =  k x u1 in
-                     (y, i2)
+                     (y, u2)
 </haskell>
-Now for some extra changes to <code>getchar</code> and <code>get2chars</code>:
+Now for some extra changes to <code>getchar</code>, along with <code>get2chars</code> & co:
 <haskell>
-getchar      :: IO' Char    {-  = Int -> (Char, Int)  -}
+getchar      :: IO' Char    {-  = Val -> (Char, Val)  -}
-get2chars    :: IO' String  {-  = Int -> (String, Int)  -}
+get2chars    :: IO' String  {-  = Val -> (String, Val)  -}
-get2chars =  \i0 -> let (a, i1) =  getchar i0 in
+get2chars =  \u0 -> let (a, u1) =  getchar u0 in
-                    let (b, i2) =  getchar i1 in
+                    let (b, u2) =  getchar u1 in
                     let r       =  [a, b] in
-                    (r, i2)
+                    (r, u2)
+get4chars    :: IO' String  {-  = Val -> (String, Val)  -}
+get4chars =  \u0 -> let (a, u1) = get2chars u0 in
+                    let (b, u2) = get2chars u1 in
+                    let r       = a++b in
+                    (r, u2)
+now_or_later :: IO' String  {-  = Val -> (String, Val) -}
+now_or_later = \u -> let (c, u') = getchar u in
+                     let r = if elem c "yY" then "Now" else "Later" in
+                     (r, u')
 </haskell>
@@ Line 185: / Line 300: @@
              getchar `bind` \b ->
              unit [a, b]
+get4chars :: IO' String
+get4chars =  get2chars `bind` \a ->
+             get2chars `bind` \b ->
+             unit (a++b)
+now_or_later :: IO' String
+now_or_later = getchar `bind` \c ->
+               unit (if elem c "yY" then "Now" else "Later")
 </haskell>
-We no longer have to mess <strike>up</strike> with those fake values directly! We just need to be sure that all the operations on I/O actions like <code>unit</code> and <code>bind</code> use them correctly. We can then make <code>IO'</code>, <code>unit</code>, <code>bind</code> and (in this example) <code>getchar</code> into an ''abstract data type'' and just use those abstract I/O operations instead -
+We no longer have to mess <strike>up</strike> with those abstract values directly! We just need to be sure that all the operations on I/O actions like <code>unit</code> and <code>bind</code> use them correctly. We can then make <code>IO'</code>, <code>unit</code>, <code>bind</code> and (in this example) <code>getchar</code> into an ''abstract data type'' and just use those abstract I/O operations instead -
 only the Haskell implementation (e.g. compilers like ghc or jhc) needs to know how I/O actions actually work.
-So there you have it - a miniature monadic I/O system in Haskell!
+So there you have it - a miniature monadic I/O system in Haskell! Just one question remains: ''what in the world is ''<code>Val</code>''?''
 == Running with the <code>RealWorld</code> ==
@@ Line 202: / Line 326: @@
 </haskell>
-where <code>RealWorld</code> is a fake type used instead of our Int. It's something
+where <code>RealWorld</code> [[Output/Input|really is a fake type]] used instead of our <code>Val</code>. It's something
 like the baton passed in a relay race. When <code>main</code> calls some I/O action,
 it passes the <code>RealWorld</code> it received as a parameter. All I/O actions have
@@ Line 1,055: / Line 1,179: @@
 We also need to interact with the C world to use Windows/Linux APIs and to link to various libraries and DLLs. Even interfacing with other languages often requires going through the C world as a "common denominator". [https://www.haskell.org/onlinereport/haskell2010/haskellch8.html Chapter 8 of the Haskell 2010 report] provides a complete description of interfacing with C.
-We will learn FFI via a series of examples. These examples include C/C++ code, so they need C/C++ compilers to be installed, the same will be true if you need to include code written in C/C++ in your program (C/C++ compilers are not required when you just need to link with existing libraries providing APIs with C calling convention). On Unix (and Mac OS?) systems, the system-wide default C/C++ compiler is typically used by GHC installation. On Windows, no default compilers exist, so GHC is typically shipped with a C compiler, and you may find on the download page a GHC distribution bundled with C and C++ compilers. Alternatively, you may find and install a GCC/MinGW version compatible with your GHC installation.
+We will learn to use the FFI via a series of examples. These examples include C/C++ code, so they need C/C++ compilers to be installed; the same will be true if you need to include code written in C/C++ in your program (C/C++ compilers are not required when you just need to link with existing libraries providing APIs with the C calling convention). On Unix (and Mac OS?) systems, the system-wide default C/C++ compiler is typically used by the GHC installation. On Windows, no default compilers exist, so GHC is typically shipped with a C compiler, and you may find on the download page a GHC distribution bundled with C and C++ compilers. Alternatively, you may find and install a GCC/MinGW version compatible with your GHC installation.
 If you need to make your C/C++ code as fast as possible, you may compile your code with Intel compilers instead of GCC. However, these compilers are not free; moreover, on Windows, code compiled by Intel compilers may not interact correctly with GHC-compiled code unless one of them is put into DLLs (due to object file incompatibility).
@@ Line 1,065: / Line 1,189: @@
 ;[[HSFFIG]]
-:Haskell FFI Binding Modules Generator (HSFFIG) is a tool that takes a C library header (".h") and generates Haskell Foreign Functions Interface import declarations for items (functions, structures, etc.) the header defines.
+:The Haskell FFI Binding Modules Generator (HSFFIG) is a tool that takes a C library header (".h") and generates Haskell Foreign Functions Interface import declarations for items (functions, structures, etc.) the header defines.
 ;[http://quux.org/devel/missingpy MissingPy]
@@ Line 1,238: / Line 1,362: @@
 == '''The dark side of the I/O monad''' ==
-Unless you are a systems developer, postgraduate CS student, or have alternate (and eminent!) verificable qualifications you should have '''no need whatsoever''' for this section - [https://stackoverflow.com/questions/9449239/unsafeperformio-in-threaded-applications-does-not-work here] is just one tiny example of what can go wrong if you don't know what you are doing. Look for other solutions!
+Unless you are a systems developer, postgraduate CS student, or have alternate (and eminent!) verifiable qualifications you should have '''no need whatsoever''' for this section - [https://stackoverflow.com/questions/9449239/unsafeperformio-in-threaded-applications-does-not-work here] is just one tiny example of what can go wrong if you don't know what you are doing. Look for other solutions!
 === '''unsafePerformIO''' ===
@@ Line 1,545: / Line 1,669: @@
 == <span id="readmore"></span>Further reading ==
-[1] This tutorial is largely based on Simon Peyton Jones's paper [https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.13.9123&rep=rep1&type=pdf Tackling the awkward squad: monadic input/output, concurrency, exceptions, and foreign-language calls in Haskell]. I hope that my tutorial improves his original explanation of the Haskell I/O system and brings it closer to the point of view of new Haskell programmers. But if you need to learn about concurrency, exceptions and FFI in Haskell/GHC, the original paper is the best source of information.
+[1] This tutorial is largely based on Simon Peyton Jones's paper [https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.13.9123&rep=rep1&type=pdf Tackling the awkward squad: monadic input/output, concurrency, exceptions, and foreign-language calls in Haskell]. I hope that my tutorial improves his original explanation of the Haskell I/O system and brings it closer to the point of view of new Haskell programmers. But if you need to learn about concurrency, exceptions and the FFI in Haskell/GHC, the original paper is the best source of information.
-[2] You can find more information about concurrency, FFI and STM at the [[GHC/Concurrency#Starting points]] page.
+[2] You can find more information about concurrency, the FFI and STM at the [[GHC/Concurrency#Starting points]] page.
 [3] The [[Arrays]] page contains exhaustive explanations about using mutable arrays.
@@ Line 1,557: / Line 1,681: @@
 [6] Official FFI specifications can be found on the page [http://www.cse.unsw.edu.au/~chak/haskell/ffi/ The Haskell 98 Foreign Function Interface 1.0: An Addendum to the Haskell 98 Report]
-[7] Using FFI in multithreaded programs described in paper [http://www.haskell.org/~simonmar/bib/concffi04_abstract.html Extending the Haskell Foreign Function Interface with Concurrency]
+[7] Using the FFI in multithreaded programs is described in [http://www.haskell.org/~simonmar/bib/concffi04_abstract.html Extending the Haskell Foreign Function Interface with Concurrency]
 [8] This particular behaviour is not a requirement of Haskell 2010, so the operation of <code>seq</code> may differ between various Haskell implementations - if you're not sure, staying within the I/O monad is the safest option.
@@ Line 1,583: / Line 1,707: @@
 * how <code>unsafeInterleaveIO</code> can be seen as a kind of concurrency, and therefore isn't so unsafe (unlike <code>unsafeInterleaveST</code> which really is unsafe)
 * discussion about different senses of <code>safe</code>/<code>unsafe</code> (like breaking equational reasoning vs. invoking undefined behaviour (so can corrupt the run-time system))
-* actual GHC implementation - how to write low-level routines based on example of <code>newIORef</code> implementation
+* actual GHC implementation - how to write low-level routines based on the example of <code>newIORef</code>'s implementation
 This manual is a collective work, so feel free to add more information to it yourself. The final goal is to collectively develop a comprehensive manual for using the I/O monad.

Difference between revisions of "IO inside"

Revision as of 04:58, 8 January 2022

Haskell is a pure language

I/O in Haskell, simplified

A matter of time

A change of input

One step after another

The fun of plumbing

Enter the monad

Running with the RealWorld

(>>=) and do notation

Mutable data (references, arrays, hash tables...)

Encapsulated mutable data: ST

I/O actions as values

Example: a list of I/O actions

Example: returning an I/O action as a result

Example: a memory allocator generator

Example: emulating OOP with record types

Exception handling (under development)

Interfacing with C/C++ and foreign libraries (under development)

Calling functions

All about the foreign declaration

Marshalling simple types

Memory management

Marshalling strings

Marshalling composite types

Dynamic calls

DLLs

The dark side of the I/O monad

unsafePerformIO

inlinePerformIO

unsafeInterleaveIO

Welcome to the machine: the actual GHC implementation

The Yhc/nhc98 implementation

Further reading

To-do list

Navigation menu

Search

Running with the `RealWorld`

`(>>=)` and `do` notation

All about the `foreign` declaration