Difference between revisions of "IO inside"

guarantees

putStrLn "Press any key to begin formatting"

class Monad m where
    unit :: a -> m a
    bind :: m a -> (a -> m b) -> m b

getchar :: Char

get2chars = [getchar, getchar]

get2chars = let x = getchar in [x, x]  -- this should be a legitimate optimisation!

getchar :: Int -> Char

get2chars = [getchar 1, getchar 2]

getchar :: Int -> (Char, Int)

get2chars _ = [a, b]  where (a, i) = getchar 1
                            (b, _) = getchar i

get2chars i0 = [a, b]  where (a, i1) = getchar i0
                             (b, i2) = getchar i1

get4chars = [get2chars 1, get2chars 2]  -- order of calls to 'get2chars' isn't defined

get2chars :: Int -> (String, Int)

get4chars i0 = (a++b)  where (a, i1) = get2chars i0
                             (b, i2) = get2chars i1

get2chars :: Int -> (String, Int)
get2chars i0 = ([a, b], i2)  where (a, i1) = getchar i0
                                   (b, i2) = getchar i1

get2chars :: Int -> (String, Int)
get2chars i0 = ([a, b], i2)  where (a, i1) = getchar i2  -- this might take a while...
                                   (b, i2) = getchar i1

getchar   :: IO' Char

get2chars :: IO' String
get2chars =  getchar `bind` \a ->
             getchar `bind` \b ->
             unit [a, b]

get4chars :: IO' String
get4chars =  get2chars `bind` \a ->
             get2chars `bind` \b ->
             unit (a++b)

-- | A toy I/O action: a function that threads a fake 'Int' token through
-- the computation, so that data dependencies fix the evaluation order.
type IO' a =  Int -> (a, Int)  -- IO' is kept private!

-- | Wrap a pure value as an action; the token is passed through untouched.
unit       :: a -> IO' a
unit x     =  \i0 -> (x, i0)

-- | Sequence two actions: run @m@ on the incoming token, then hand both its
-- result and the token it produced to the continuation @k@.
bind       :: IO' a -> (a -> IO' b) -> IO' b
bind m k   =  \i0 -> let (x, i1) = m i0
                         (y, i2) = k x i1  -- 'k' receives the token produced by 'm'
                     in (y, i2)

getchar    :: IO' Char
getchar    =  \i0 -> case primGetChar i0 of (i1, c) -> (c, i1)

primitive primGetChar :: Int -> (Int, Char)  -- also kept private!

main :: RealWorld -> ((), RealWorld)

type IO a  =  RealWorld -> (a, RealWorld)

getChar :: RealWorld -> (Char, RealWorld)

main :: RealWorld -> ((), RealWorld)
main world0 = let (a, world1) = getChar world0
                  (b, world2) = getChar world1
              in ((), world2)

main = do a <- ask "What is your name?"
          b <- ask "How old are you?"
          return ()

ask s = do putStr s
           readLn

when :: Bool -> IO () -> IO ()
when condition action world =
    if condition
      then action world
      else ((), world)

  main = do putStr "Hello!"

  main = putStr "Hello!"

main = do putStr "What is your name?"
          putStr "How old are you?"
          putStr "Nice day!"

main = (putStr "What is your name?")
       >> ( (putStr "How old are you?")
            >> (putStr "Nice day!")
          )

(>>) :: IO a -> IO b -> IO b
(action1 >> action2) world0 =
   let (a, world1) = action1 world0
       (b, world2) = action2 world1
   in (b, world2)

action1 >> action2 = action
  where
    action world0 = let (a, world1) = action1 world0
                        (b, world2) = action2 world1
                    in (b, world2)

main = do a <- readLn
          print a

main = readLn
       >>= (\a -> print a)

(>>=) :: IO a -> (a -> IO b) -> IO b
(action >>= reaction) world0 =
   let (a, world1) = action world0
       (b, world2) = reaction a world1
   in (b, world2)

type IO a  =  RealWorld -> (a, RealWorld)

main = readLn >>= print

 do x <- action1
    action2

 action1 >>= (\x -> action2)

main = do putStr "What is your name?"
          a <- readLn
          putStr "How old are you?"
          b <- readLn
          print (a,b)

main = putStr "What is your name?"
       >> readLn
       >>= \a -> putStr "How old are you?"
       >> readLn
       >>= \b -> print (a,b)

return :: a -> IO a
return a world0  =  (a, world0)

main = do a <- readLn
          return (a*2)

main = do a <- readLn
          when (a>=0) $ do
              return ()
          print "a is negative"

main = do a <- readLn
          if (a>=0)
            then return ()
            else print "a is negative"

main = do a <- readLn
          if (a>=0) then return ()
            else do
          print "a is negative"
          ...

liftM :: (a -> b) -> (IO a -> IO b)

liftM f action = do x <- action
                    return (f x)

main = do let a0 = readVariable varA
              _  = writeVariable varA 1
              a1 = readVariable varA
          print (a0, a1)

import Data.IORef
main = do varA <- newIORef 0  -- Create and initialize a new variable
          a0 <- readIORef varA
          writeIORef varA 1
          a1 <- readIORef varA
          print (a0, a1)

import Data.Array.IO
main = do arr <- newArray (1,10) 37 :: IO (IOArray Int Int)
          a <- readArray arr 1
          writeArray arr 1 64
          b <- readArray arr 1
          print (a, b)

rand :: IO Int

foreign import ccall
   sin :: Double -> Double

foreign import ccall
   tell :: Int -> IO Int

main world0 = let get2chars = getChar >> getChar
                  ((), world1) = putStr "Press two keys" world0
                  (answer, world2) = get2chars world1
              in ((), world2)

main = do let get2chars = getChar >> getChar
          putStr "Press two keys"
          get2chars
          return ()

ioActions :: [IO ()]
ioActions = [(print "Hello!"),
             (putStr "just kidding"),
             (getChar >> return ())
            ]

ioActions :: [RealWorld -> ((), RealWorld)]

main = do head ioActions
          ioActions !! 1
          last ioActions

sequence_ :: [IO a] -> IO ()
sequence_ [] = return ()
sequence_ (x:xs) = do x
                      sequence_ xs

main = sequence_ ioActions

while :: IO Bool -> IO ()
while action = ???

-- Binding an action with 'let' only gives it a name; of everything below,
-- only the final 'putStr' is actually performed.
main = do let a = sequence ioActions
              b = when True (getChar >> return ())  -- 'when' takes an IO (), so the Char is discarded
              c = getChar >> getChar
          putStr "These let-statements are not executed!"

readi h i = do hSeek h AbsoluteSeek i
               hGetChar h

readfilei :: String -> IO (Integer -> IO Char)
readfilei name = do h <- openFile name ReadMode
                    return (readi h)

readfilei name = do h <- openFile name ReadMode
                    let readi h i = do hSeek h AbsoluteSeek i
                                       hGetChar h
                    return (readi h)

readfilei name = do h <- openFile name ReadMode
                    let readi i = do hSeek h AbsoluteSeek i
                                     hGetChar h
                    return readi

main = do myfile <- readfilei "test"
          a <- myfile 0
          b <- myfile 1
          print (a,b)

memoryAllocator :: Ptr a -> Int -> IO (Int -> IO (Ptr b),
                                       Ptr c -> IO ())

memoryAllocator buf size = do ......
                              let alloc size = do ...
                                                  ...
                                  free ptr = do ...
                                                ...
                              return (alloc, free)

memoryAllocator buf size = do start <- newIORef buf
                              end <- newIORef (buf `plusPtr` size)
                              ...

      ...
      let alloc size = do addr <- readIORef start
                          writeIORef start (addr `plusPtr` size)
                          return addr

      let free ptr = do writeIORef start ptr

-- Two independent allocators, each managing its own buffer: allocate from
-- both, release, and allocate again.
main = do buf1 <- mallocBytes (2^16)
          buf2 <- mallocBytes (2^20)
          (alloc1, free1) <- memoryAllocator buf1 (2^16)
          (alloc2, free2) <- memoryAllocator buf2 (2^20)
          ptr11 <- alloc1 100
          ptr21 <- alloc2 1000
          free1 ptr11
          free2 ptr21
          ptr12 <- alloc1 100
          ptr22 <- alloc2 1000
          return ()  -- a 'do' block must end with an expression, not a bind

data Figure = Figure { draw :: IO (),
                       move :: Displacement -> IO ()
                     }

type Displacement = (Int, Int)  -- horizontal and vertical displacement in points

circle    :: Point -> Radius -> IO Figure
rectangle :: Point -> Point -> IO Figure

type Point = (Int, Int)  -- point coordinates
type Radius = Int        -- circle radius in points

circle center radius = do
    let description = "  Circle at "++show center++" with radius "++show radius
    return $ Figure { draw = putStrLn description }

-- | Build a rectangle figure from two points; drawing it prints a one-line
-- description.  Only the 'draw' field is populated here.
rectangle from to = do
    let description = "  Rectangle "++show from++"-"++show to
    return $ Figure { draw = putStrLn description }

drawAll :: [Figure] -> IO ()
drawAll figures = do putStrLn "Drawing figures:"
                     mapM_ draw figures

main = do figures <- sequence [circle (10,10) 5,
                               circle (20,20) 3,
                               rectangle (10,10) (20,20),
                               rectangle (15,15) (40,40)]
          drawAll figures

circle center radius = do
    centerVar <- newIORef center

    let drawF = do center <- readIORef centerVar
                   putStrLn ("  Circle at "++show center
                             ++" with radius "++show radius)

    let moveF (addX,addY) = do (x,y) <- readIORef centerVar
                               writeIORef centerVar (x+addX, y+addY)

    return $ Figure { draw=drawF, move=moveF }

rectangle from to = do
    fromVar <- newIORef from
    toVar   <- newIORef to

    let drawF = do from <- readIORef fromVar
                   to   <- readIORef toVar
                   putStrLn ("  Rectangle "++show from++"-"++show to)

    let moveF (addX,addY) = do (fromX,fromY) <- readIORef fromVar
                               (toX,toY)     <- readIORef toVar
                               writeIORef fromVar (fromX+addX, fromY+addY)
                               writeIORef toVar   (toX+addX, toY+addY)

    return $ Figure { draw=drawF, move=moveF }

main = do figures <- sequence [circle (10,10) 5,
                               rectangle (10,10) (20,20)]
          drawAll figures
          mapM_ (\fig -> move fig (10,10)) figures
          drawAll figures

data Figure = Figure { draw :: IO (),
                       move :: Displacement -> IO (),
                       area :: Double,
                       origin :: IORef Point
                     }

main = print (f 2)

f 0 = "zero"
f 1 = "one"

main = print (head [])

main = print (1 + (error "Value that wasn't initialized or cannot be computed"))

{-# LANGUAGE ForeignFunctionInterface #-}

main = do print "Hello from main"
          c_function

haskell_function = print "Hello from haskell_function"

foreign import ccall safe "prototypes.h"
    c_function :: IO ()

foreign export ccall
    haskell_function :: IO ()

#include <stdio.h>
#include "prototypes.h"

void c_function (void)
{
  printf("Hello from c_function\n");
  haskell_function();
}

extern void c_function (void);
extern void haskell_function (void);

 ghc --make main.hs evil.c

 ghc -c evil.c
 ghc --make main.hs evil.o

#ifdef __cplusplus
extern "C" {
#endif

extern void c_function (void);
extern void haskell_function (void);

#ifdef __cplusplus
}
#endif

 ghc --make main.hs evil.cpp

foreign import ccall safe "prototypes.h CFunction"
    c_function :: IO ()

foreign export ccall "HaskellFunction"
    haskell_function :: IO ()

foreign import stdcall unsafe "windows.h SetFileApisToOEM"
  setFileApisToOEM :: IO ()

import Foreign.C.Types (               -- equivalent to the following C type:
         CChar, CUChar,                --  char/unsigned char
         CShort, CUShort,              --  short/unsigned short
         CInt, CUInt, CLong, CULong,   --  int/unsigned/long/unsigned long
         CFloat, CDouble...)           --  float/double

-- The entity string has to name the C function explicitly: with only the
-- header given, the C symbol defaults to the Haskell name @c_sin@, which
-- math.h does not provide.
foreign import ccall unsafe "math.h sin"
    c_sin :: CDouble -> CDouble

-- |Type-conversion wrapper around c_sin
sin :: Double -> Double
sin = realToFrac . c_sin . realToFrac  -- Double <-> CDouble; a Rational cannot be passed to c_sin

import Foreign.C.String (   -- representation of strings in C
         CString,           -- = Ptr CChar
         CStringLen)        -- = (Ptr CChar, Int)

-- Name the C symbol explicitly; with only the header in the entity string
-- the import would refer to a C function called @c_strlen@.
foreign import ccall unsafe "string.h strlen"
    c_strlen :: CString -> IO CSize     -- CSize defined in Foreign.C.Types and is equal to size_t

-- |Type-conversion wrapper around c_strlen 
strlen :: String -> Int
strlen = ....

readContents :: Filename -> String

unsafePerformIO :: IO a -> a

unsafePerformIO :: (RealWorld -> (a, RealWorld)) -> a
unsafePerformIO action = let (a, world1) = action (createNewWorld action)
                         in a

one :: Integer
one = unsafePerformIO $ do var <- newIORef 0
                           modifyIORef var (+1)
                           readIORef var

unsafePerformIO action = let (a,world1) = action (createNewWorld action)
                         in (world1 `seq` a)

-- | Just like unsafePerformIO, but we inline it. Big performance gains as
-- it exposes lots of things to further inlining
{-# INLINE inlinePerformIO #-}
inlinePerformIO action = let (a, world1) = action createNewWorld
                         in (world1 `seq` a)  -- force the resulting world before handing back the value

-- | Run @body@ against a pointer into the output buffer and continue with
-- the buffer's counters advanced by @n@.
write :: Int -> (Ptr Word8 -> IO ()) -> Put ()
write !n body = Put $ \c buf@(Buffer fp o u l) ->
  -- NOTE(review): 'l' looks like the space left in the buffer; when @n@ does
  -- not fit, the old buffer is flushed and a new one is used -- confirm
  -- against the definitions of 'flushOld' and 'newBuffer'.
  if n <= l
    then write' c fp o u l
    else write' (flushOld c n fp o u) (newBuffer c n) 0 0 0

  where {-# NOINLINE write' #-}
        -- Performs the write, then calls the continuation @c@ with a buffer
        -- whose third field grew by @n@ and whose fourth shrank by @n@.
        write' c !fp !o !u !l =
          -- warning: this is a tad hardcore
          inlinePerformIO
            (withForeignPtr fp
              (\p -> body $! (p `plusPtr` (o+u))))
          `seq` c () (Buffer fp o (u+n) (l-n))

word8 w = write 1 (\p -> poke p w)

unsafeInterleaveIO :: IO a -> IO a

unsafeInterleaveIO   :: IO a -> IO a
unsafeInterleaveIO a =  return (unsafePerformIO a)

do let c = unsafePerformIO getChar
   do_proc c

do let s = [unsafePerformIO getChar, unsafePerformIO getChar, unsafePerformIO getChar]
   do_proc s

do str <- unsafeInterleaveIO myGetContents

myGetContents = do
   c <- getChar
   s <- unsafeInterleaveIO myGetContents
   return (c:s)

myGetContents = do
   c <- replicateM 512 getChar
   s <- unsafeInterleaveIO myGetContents
   return (c++s)

myGetContents = unsafeInterleaveIO $ do
   c <- replicateM 512 getChar
   s <- myGetContents
   return (c++s)

runST :: (forall s . ST s a) -> a

newSTRef :: a -> ST s (STRef s a)
newArray_ :: Ix i => (i, i) -> ST s (STArray s i e)

makeSTRef :: a -> STRef s a
makeSTRef a = runST (newSTRef a)

stToIO :: ST RealWorld a -> IO a

oneST :: ST s Int -- note that this works correctly for any s
oneST = do var <- newSTRef 0
           modifySTRef var (+1)
           readSTRef var

one :: Int
one = runST oneST

newtype IO a = IO (State# RealWorld -> (# State# RealWorld, a #))

data World = World
newtype IO a = IO (World -> Either IOError a)

Difference between revisions of "IO inside"

Revision as of 13:59, 10 December 2020

Contents

Haskell is a pure language

What is a monad?

Welcome to the `RealWorld`, baby

`(>>=)` and `do` notation

Mutable data (references, arrays, hash tables...)

I/O actions as values

Example: a list of I/O actions

Example: returning an I/O action as a result

Example: a memory allocator generator

Example: emulating OOP with record types

Exception handling (under development)

Interfacing with C/C++ and foreign libraries (under development)

Calling functions

All about the `foreign` statement

Marshalling simple types

Memory management

Marshalling strings

Marshalling composite types

Dynamic calls

DLLs

Dark side of I/O monad

`unsafePerformIO`

`inlinePerformIO`

`unsafeInterleaveIO`

A safer approach: the ST monad

Welcome to the machine: the actual GHC implementation

The Yhc/nhc98 implementation

Further reading

To-do list

Navigation menu

Search

@@ Line 6: / Line 6: @@
 mess. This is because Haskell I/O is really very different in how it actually works.
-The following text is an attempt to explain the details of Haskell I/O implementations. This explanation should help you eventually learn all the smart I/O tricks.
+The following text is an attempt to explain the details of Haskell I/O implementations. This explanation should help you eventually learn all the smart I/O tips.
-Moreover, I've added a detailed explanation of various traps you might encounter along the way. After reading this text, you will be well on your way towards mastering I/O
+Moreover, I've added a detailed explanation of various traps you might encounter along the way. After reading this text, you will be well on your way towards mastering I/O in Haskell.
-in Haskell.
 == Haskell is a pure language ==
-Haskell is a pure language and even the I/O system can't break this purity. Being pure means that the result of any function call is fully determined by its arguments. Pseudo-functions like rand() or getchar() in C, which return different results on each call, are simply impossible to write in Haskell. Moreover, Haskell functions can't have side effects, which means that they can't effect any changes to the "real world", like changing files, writing to the screen, printing, sending data over the network, and so on. These two restrictions together mean that any function call can be replaced by the result of a previous call with the same parameters, and the language ''guarantees'' that all these rearrangements will not change the program result!
+Haskell is a pure language and even the I/O system can't break this purity. Being pure means that the result of any function call is fully determined by its arguments. Procedural entities like <code>rand()</code> or <code>getchar()</code> in C, which return different results on each call, are simply impossible to write in Haskell. Moreover, Haskell functions can't have side effects, which means that they can't effect any changes to the "real world", like changing files, writing to the screen, printing, sending data over the network, and so on. These two restrictions together mean that any function call can be replaced by the result of a previous call with the same parameters, and the language ''guarantees'' that all these rearrangements will not change the program result!
 Let's compare this to C: optimizing C compilers try to guess which functions have no side effects and don't depend on mutable global variables. If this guess is wrong, an optimization can change the program's semantics! To avoid this kind of disaster, C optimizers are conservative in their guesses or require hints from the programmer about the purity of functions.
@@ Line 18: / Line 17: @@
 Compared to an optimizing C compiler, a Haskell compiler is a set of pure mathematical transformations. This results in much better high-level optimization facilities. Moreover, pure mathematical computations can be much more easily divided into several threads that may be executed in parallel, which is increasingly important in these days of multi-core CPUs. Finally, pure computations are less error-prone and easier to verify, which adds to Haskell's robustness and to the speed of program development using Haskell.
-Haskell's purity allows the compiler to call only functions whose results are really required to calculate the final value of a top-level function (e.g., main) - this is called lazy evaluation. It's a great thing for pure mathematical computations, but how about I/O actions? A function like
+Haskell's purity allows the compiler to call only functions whose results are really required to calculate the final value of a top-level function (e.g. <code>main</code>) - this is called lazy evaluation. It's a great thing for pure mathematical computations, but how about I/O actions? A function like
 <haskell>
@@ Line 41: / Line 40: @@
 </haskell>
-For now, we'll just define 'unit' and 'bind' directly - no type classes.
+For now, we'll just define <code>unit</code> and <code>bind</code> directly - no type classes.
-So how does something so <strike>abstract</strike> vague help us with I/O? Well, let's imagine that we want to implement the well-known 'getchar' function in Haskell. What type should it have?  Let's try:
+So how does something so <strike>abstract</strike> vague help us with I/O? Well, let's imagine that we want to implement the well-known <code>getchar</code> I/O operation in Haskell. What type should it have?  Let's try:
 <haskell>
@@ Line 51: / Line 50: @@
 </haskell>
-What will we get with 'getchar' having just the 'Char' type? You can see one problem in the definition of 'get2chars' immediately:
+What will we get with <code>getchar</code> having just the <code>Char</code> type? You can see one problem in the definition of <code>get2chars</code> immediately:
+* because the Haskell compiler treats all functions as pure (not having side effects), it can avoid "unnecessary" calls to <code>getchar</code> and use one returned value twice:
-* because the Haskell compiler treats all functions as pure (not having side effects), it can avoid "unnecessary" calls to 'getchar' and use one returned value twice:
 <haskell>
@@ Line 59: / Line 59: @@
 </haskell>
-How can this problem be solved from the programmer's perspective? Let's introduce a fake parameter of 'getchar' to make each call "different" from the compiler's point of view:
+How can this problem be solved from the programmer's perspective? Let's introduce a fake parameter of <code>getchar</code> to make each call "different" from the compiler's point of view:
 <haskell>
@@ Line 69: / Line 69: @@
 Right away, this solves the first problem mentioned above - now the compiler will make two calls because it sees that the calls have different parameters. But there's another problem:
-* even if it does make two calls, there is no way to determine which call should be performed first. Do you want to return the two chars in the order in which they were read, or in the opposite order? Nothing in the definition of 'get2chars' answers this question.
+* even if it does make two calls, there is no way to determine which call should be performed first. Do you want to return the two chars in the order in which they were read, or in the opposite order? Nothing in the definition of <code>get2chars</code> answers this question.
-We need to give the compiler some clue to determine which function it should call first. The Haskell language doesn't provide any way to specify the sequence needed to evaluate 'getchar 1' and getchar '2' - except for data dependencies! How about adding an artificial data dependency which prevents evaluation of the second 'getchar' before the first one? In order to achieve this, we will return an additional fake result from 'getchar' that will be used as a parameter for the next 'getchar' call:
+We need to give the compiler some clue to determine which function it should call first. The Haskell language doesn't provide any way to specify the sequence needed to evaluate <code>getchar 1</code> and <code>getchar 2</code> - except for data dependencies! How about adding an artificial data dependency which prevents evaluation of the second <code>getchar</code> before the first one? In order to achieve this, we will return an additional fake result from <code>getchar</code> that will be used as a parameter for the next <code>getchar</code> call:
 <haskell>
@@ Line 80: / Line 80: @@
 </haskell>
-So far so good - now we can guarantee that 'a' is read before 'b' because reading 'b' needs the value ('i') that is returned by reading 'a'!
+So far so good - now we can guarantee that <code>a</code> is read before <code>b</code> because reading <code>b</code> needs the value (<code>i</code>) that is returned by reading <code>a</code>!
-We've added a fake parameter to 'get2chars' but the problem is that the Haskell compiler is too smart! It can believe that the external 'getchar' function is really dependent on its parameter but for 'get2chars' it will see that we're just cheating because we throw it away! Therefore it won't feel obliged to execute the calls in the order we want.
+We've added a fake parameter to <code>get2chars</code> but the problem is that the Haskell compiler is too smart! It can believe that the external <code>getchar</code> function is really dependent on its parameter but for <code>get2chars</code> it will see that we're just cheating because we throw it away! Therefore it won't feel obliged to execute the calls in the order we want.
-How can we fix this? How about passing this fake parameter to the 'getchar' function? In this case the compiler can't guess that it is really unused.
+How can we fix this? How about passing this fake parameter to the <code>getchar</code> function? In this case the compiler can't guess that it is really unused.
 <haskell>
@@ Line 91: / Line 91: @@
 </haskell>
-Furthermore, 'get2chars' has the same purity problems as the 'getchar' function. If you need to call it two times, you need a way to describe the order of these calls. Consider this:
+Furthermore, <code>get2chars</code> has the same purity problems as the <code>getchar</code> function. If you need to call it two times, you need a way to describe the order of these calls. Consider this:
 <haskell>
-get4chars = [get2chars 1, get2chars 2]  -- order of 'get2chars' calls isn't defined
+get4chars = [get2chars 1, get2chars 2]  -- order of calls to 'get2chars' isn't defined
 </haskell>
-We already know how to deal with this problem: 'get2chars' should also return some fake value that can be used to order calls:
+We already know how to deal with this problem: <code>get2chars</code> should also return some fake value that can be used to order calls:
 <haskell>
@@ Line 106: / Line 106: @@
 </haskell>
-But what should the fake return value of 'get2chars' be? If we use some integer constant, the excessively smart Haskell compiler will guess that we're cheating again. What about returning the value returned by 'getchar'? See:
+But what should the fake return value of <code>get2chars</code> be? If we use some integer constant, the excessively smart Haskell compiler will guess that we're cheating again. What about returning the value returned by <code>getchar</code>? See:
 <haskell>
@@ Line 159: / Line 159: @@
 There you have it - the whole "monadic" Haskell I/O system!
-== Welcome to the RealWorld, baby ==
+== Welcome to the <code>RealWorld</code>, baby ==
-Warning: The following story about IO is incorrect in that it cannot actually explain some important aspects of IO (including interaction and concurrency). However, some people find it useful to begin developing an understanding.
+Warning: The following story about I/O is incorrect in that it cannot actually explain some important aspects of I/O (including interaction and concurrency). However, some people find it useful to begin developing an understanding.
-The 'main' Haskell function has the type:
+The <code>main</code> Haskell function has the type:
 <haskell>
@@ Line 169: / Line 169: @@
 </haskell>
-where 'RealWorld' is a fake type used instead of our Int. It's something
+where <code>RealWorld</code> is a fake type used instead of our Int. It's something
-like the baton passed in a relay race. When 'main' calls some IO function,
+like the baton passed in a relay race. When <code>main</code> calls some I/O action,
-it passes the "RealWorld" it received as a parameter. All IO functions have
+it passes the <code>RealWorld</code> it received as a parameter. All I/O actions have
-similar types involving RealWorld as a parameter and result. To be
+similar types involving <code>RealWorld</code> as a parameter and result. To be
-exact, "IO" is a type synonym defined in the following way:
+exact, <code>IO</code> is a type synonym defined in the following way:
 <haskell>
@@ Line 179: / Line 179: @@
 </haskell>
-So, 'main' just has type "IO ()", 'getChar' has type "IO Char" and so
+So, <code>main</code> just has type <code>IO ()</code>, <code>getChar</code> has type <code>IO Char</code> and so
-on.  You can think of the type "IO Char" as meaning "take the current RealWorld, do something to it, and return a Char and a (possibly changed) RealWorld".  Let's look at 'main' calling 'getChar' two times:
+on.  You can think of the type <code>IO Char</code> as meaning "take the current <code>RealWorld</code>, do something to it, and return a <code>Char</code> and a (possibly changed) <code>RealWorld</code>".  Let's look at <code>main</code> calling <code>getChar</code> two times:
 <haskell>
@@ Line 191: / Line 191: @@
 </haskell>
-Look at this closely: 'main' passes the "world" it received to the first 'getChar'. This 'getChar' returns some new value of type RealWorld
+Look at this closely: <code>main</code> passes the "world" it received to the first <code>getChar</code>. This <code>getChar</code> returns some new value of type <code>RealWorld</code>
-that gets used in the next call. Finally, 'main' returns the "world" it got
+that gets used in the next call. Finally, <code>main</code> returns the "world" it got
-from the second 'getChar'.
+from the second <code>getChar</code>.
-* Is it possible here to omit any call of 'getChar' if the Char it read is not used? No: we need to return the "world" that is the result of the second 'getChar' and this in turn requires the "world" returned from the first 'getChar'.
+* Is it possible here to omit any call of <code>getChar</code> if the <code>Char</code> it read is not used? No: we need to return the "world" that is the result of the second <code>getChar</code> and this in turn requires the "world" returned from the first <code>getChar</code>.
-* Is it possible to reorder the 'getChar' calls? No: the second 'getChar' can't be called before the first one because it uses the "world" returned from the first call.
+* Is it possible to reorder the <code>getChar</code> calls? No: the second <code>getChar</code> can't be called before the first one because it uses the "world" returned from the first call.
 * Is it possible to duplicate calls? In Haskell semantics - yes, but real compilers never duplicate work in such simple cases (otherwise, the programs generated will not have any speed guarantees).
-As we already said, RealWorld values are used like a baton which gets passed
+As we already said, <code>RealWorld</code> values are used like a baton which gets passed
-between all routines called by 'main' in strict order. Inside each
+between all routines called by <code>main</code> in strict order. Inside each
-routine called, RealWorld values are used in the same way. Overall, in
+routine called, <code>RealWorld</code> values are used in the same way. Overall, in
-order to "compute" the world to be returned from 'main', we should perform
+order to "compute" the world to be returned from <code>main</code>, we should perform
-each IO procedure that is called from 'main', directly or indirectly.
+each I/O action that is called from <code>main</code>, directly or indirectly.
-This means that each procedure inserted in the chain will be performed
+This means that each action inserted in the chain will be performed
-just at the moment (relative to the other IO actions) when we intended it
+just at the moment (relative to the other I/O actions) when we intended it
 to be called. Let's consider the following program:
@@ Line 224: / Line 224: @@
 But what about conditional execution? No problem. Let's define the
-well-known 'when' operation:
+well-known <code>when</code> operation:
 <haskell>
@@ Line 235: / Line 235: @@
 As you can see, we can easily include or exclude from the execution chain
-IO procedures (actions) depending on the data values. If 'condition'
+I/O actions depending on the data values. If <code>condition</code>
-will be False on the call of 'when', 'action' will never be called because
+will be <code>False</code> on the call of <code>when</code>, <code>action</code> will never be called because real Haskell compilers, again, never call functions whose results
+are not required to calculate the final result (''i.e.'' here, the final "world" value of <code>main</code>).
-real Haskell compilers, again, never call functions whose results
-are not required to calculate the final result (''i.e.'', here, the final "world" value of 'main').
 Loops and more complex control structures can be implemented in
 the same way. Try it as an exercise!
-Finally, you may want to know how much passing these RealWorld
+Finally, you may want to know how much passing these <code>RealWorld</code>
-values around the program costs. It's free! These fake values exist solely for the compiler while it analyzes and optimizes the code, but when it gets to assembly code generation, it "suddenly" realize that this type is like "()", so
+values around the program costs. It's free! These fake values exist solely for the compiler while it analyzes and optimizes the code, but when it gets to assembly code generation, it notices that this type is like <code>()</code>, so
 all these parameters and result values can be omitted from the final generated code - they're not needed any more!
-== '>>=' and 'do' notation ==
+== <code>(>>=)</code> and <code>do</code> notation ==
-All beginners (including me) start by thinking that 'do' is some
+All beginners (including me) start by thinking that <code>do</code> is some
-super-awesome statement that executes IO actions. That's wrong - 'do' is just
+super-awesome statement that executes I/O actions. That's wrong - <code>do</code> is just
-syntactic sugar that simplifies the writing of procedures that use IO (and also other monads, but that's beyond the scope of this tutorial). 'do' notation eventually gets translated to
+syntactic sugar that simplifies the writing of definitions that use I/O (and also other monads, but that's beyond the scope of this tutorial). <code>do</code> notation eventually gets translated to
 a series of I/O actions passing "world" values around like we've manually written above.
-This simplifies the gluing of several IO actions together.
+This simplifies the gluing of several I/O actions together.
-You don't need to use 'do' for just one statement; for example,
+You don't need to use <code>do</code> for just one statement; for example,
 <haskell>
@@ Line 267: / Line 266: @@
 </haskell>
-Let's examine how to desugar a 'do' with multiple statements in the
+Let's examine how to desugar a <code>do</code> with multiple statements in the
 following example:
@@ Line 276: / Line 275: @@
 </haskell>
-The 'do' statement here just joins several IO actions that should be
+The <code>do</code> statement here just joins several I/O actions that should be
 performed sequentially. It's translated to sequential applications
-of one of the so-called "binding operators", namely '>>':
+of one of the so-called "binding operators", namely <code>(>>)</code>:
 <haskell>
@@ Line 287: / Line 286: @@
 </haskell>
-This binding operator just combines two IO actions, executing them
+This binding operator just combines two I/O actions, executing them
 sequentially by passing the "world" between them:
@@ Line 309: / Line 308: @@
 </haskell>
-Now you can substitute the definition of '>>' at the places of its usage
+Now you can substitute the definition of <code>(>>)</code> at the places of its usage
-and check that program constructed by the 'do' desugaring is actually the
+and check that the program constructed by the <code>do</code> desugaring is actually the
 same as we could write by manually manipulating "world" values.
-A more complex example involves the binding of variables using "<-":
+A more complex example involves the binding of variables using <code><-</code>:
 <haskell>
@@ Line 327: / Line 326: @@
 </haskell>
-As you should remember, the '>>' binding operator silently ignores
+As you should remember, the <code>(>>)</code> binding operator silently ignores
 the value of its first action and returns as an overall result
-the result of its second action only. On the other hand, the '>>=' binding operator (note the extra '=' at the end) allows us to use the result of its first action - it gets passed as an additional parameter to the second one! Look at the definition:
+the result of its second action only. On the other hand, the <code>(>>=)</code> binding operator (note the extra <code>=</code> at the end) allows us to use the result of its first action - it gets passed as an additional parameter to the second one! Look at the definition:
 <haskell>
@@ Line 339: / Line 338: @@
 </haskell>
-* What does the type of "reaction" - namely "a -> IO b" - mean? By substituting the "IO" definition, we get "a -> RealWorld -> (b, RealWorld)". This means that "reaction" actually has two parameters - the type 'a' actually used inside it, and the value of type RealWorld used for sequencing of IO actions. That's always the case - any IO procedure has one more parameter compared to what you see in its type signature. This parameter is hidden inside the definition of the type synonym "IO":
+* What does the type of <code>reaction</code> - namely <code>a -> IO b</code> - mean? By substituting the <code>IO</code> definition, we get <code>a -> RealWorld -> (b, RealWorld)</code>. This means that <code>reaction</code> actually has two parameters - the type <code>a</code> actually used inside it, and the value of type <code>RealWorld</code> used for sequencing of I/O actions. That's always the case - any I/O definition has one more parameter compared to what you see in its type signature. This parameter is hidden inside the definition of the type synonym <code>IO</code>:
 <haskell>
@@ Line 345: / Line 344: @@
 </haskell>
-* You can use these '>>' and '>>=' operations to simplify your program. For example, in the code above we don't need to introduce the variable, because the result of 'readLn' can be send directly to 'print':
+* You can use these <code>(>>)</code> and <code>(>>=)</code> operations to simplify your program. For example, in the code above we don't need to introduce the variable, because the result of <code>readLn</code> can be sent directly to <code>print</code>:
 <haskell>
@@ Line 358: / Line 357: @@
 </haskell>
-where 'action1' has type "IO a" and 'action2' has type "IO b",
+where <code>action1</code> has type <code>IO a</code> and <code>action2</code> has type <code>IO b</code>,
 translates into:
@@ Line 365: / Line 364: @@
 </haskell>
-where the second argument of '>>=' has the type "a -> IO b". It's the way
+where the second argument of <code>(>>=)</code> has the type <code>a -> IO b</code>. It's the way
-the '<-' binding is processed - the name on the left-hand side of '<-' just becomes a parameter of subsequent operations represented as one large IO action.  Note also that if 'action1' has type "IO a" then 'x' will just have type "a"; you can think of the effect of '<-' as "unpacking" the IO value of 'action1' into 'x'.  Note also that '<-' is not a true operator; it's pure syntax, just like 'do' itself.  Its meaning results only from the way it gets desugared.
+the <code><-</code> binding is processed - the name on the left-hand side of <code><-</code> just becomes a parameter of subsequent operations represented as one large I/O action.  Note also that if <code>action1</code> has type <code>IO a</code> then <code>x</code> will just have type <code>a</code>; you can think of the effect of <code><-</code> as "unpacking" the I/O value of <code>action1</code> into <code>x</code>.  Note also that <code><-</code> is not a true operator; it's pure syntax, just like <code>do</code> itself.  Its meaning results only from the way it gets desugared.
 Look at the next example:
@@ Line 388: / Line 387: @@
 </haskell>
-I omitted the parentheses here; both the '>>' and the '>>=' operators are
+I omitted the parentheses here; both the <code>(>>)</code> and the <code>(>>=)</code> operators are
-left-associative, but lambda-bindings always stretches as far to the right as possible, which means that the 'a' and 'b' bindings introduced
+left-associative, but lambda-bindings always stretch as far to the right as possible, which means that the <code>a</code> and <code>b</code> bindings introduced
 here are valid for all remaining actions. As an exercise, add the
-parentheses yourself and translate this procedure into the low-level
+parentheses yourself and translate this definition into the low-level
-code that explicitly passes "world" values. I think it should be enough to help you finally realize how the 'do' translation and binding operators work.
+code that explicitly passes "world" values. I think it should be enough to help you finally realize how the <code>do</code> translation and binding operators work.
-Oh, no! I forgot the third monadic operator - 'return'. It just
+Oh, no! I forgot the third monadic operator - <code>return</code>. It just
 combines its two parameters - the value passed and "world":
@@ Line 402: / Line 401: @@
 </haskell>
-How about translating a simple example of 'return' usage? Say,
+How about translating a simple example of <code>return</code> usage? Say,
 <haskell>
@@ Line 410: / Line 409: @@
 Programmers with an imperative language background often think that
-'return' in Haskell, as in other languages, immediately returns from
+<code>return</code> in Haskell, as in other languages, immediately returns from
-the IO procedure. As you can see in its definition (and even just from its
+the I/O definition. As you can see in its definition (and even just from its
 type!), such an assumption is totally wrong. The only purpose of using
-'return' is to "lift" some value (of type 'a') into the result of
+<code>return</code> is to "lift" some value (of type <code>a</code>) into the result of
-a whole action (of type "IO a") and therefore it should generally be used only as the last executed statement of some IO sequence. For example try to
+a whole action (of type <code>IO a</code>) and therefore it should generally
+be used only as the last executed statement of some I/O sequence. For example try to
-translate the following procedure into the corresponding low-level code:
+translate the following definition into the corresponding low-level code:
 <haskell>
@@ Line 424: / Line 424: @@
 </haskell>
-and you will realize that the 'print' statement is executed even for non-negative values of 'a'. If you need to escape from the middle of an IO procedure, you can use the 'if' statement:
+and you will realize that the <code>print</code> statement is executed even for non-negative values of <code>a</code>. If you need to escape from the middle of an I/O definition, you can use the <code>if</code> statement:
 <haskell>
@@ Line 443: / Line 443: @@
 </haskell>
-that may be useful for escaping from the middle of a longish 'do' statement.
+that may be useful for escaping from the middle of a longish <code>do</code> statement.
-Last exercise: implement a function 'liftM' that lifts operations on
+Last exercise: implement a function <code>liftM</code> that lifts operations on
 plain values to the operations on monadic ones. Its type signature:
@@ Line 476: / Line 476: @@
 Does this look strange?
-# The two calls to 'readVariable' look the same, so the compiler can just reuse the value returned by the first call.
+# The two calls to <code>readVariable</code> look the same, so the compiler can just reuse the value returned by the first call.
-# The result of the 'writeVariable' call isn't used so the compiler can (and will!) omit this call completely.
+# The result of the <code>writeVariable</code> call isn't used so the compiler can (and will!) omit this call completely.
 # These three calls may be rearranged in any order because they appear to be independent of each other.
-This is obviously not what was intended.  What's the solution? You already know this - use IO actions!  Using IO actions guarantees that:
+This is obviously not what was intended.  What's the solution? You already know this - use I/O actions! Doing that guarantees:
-# the result of the "same" action (such as "readVariable varA") will not be reused
+# the result of the "same" action (such as <code>readVariable varA</code>) will not be reused
 # each action will have to be executed
 # the execution order will be retained as written
@@ Line 497: / Line 497: @@
 </haskell>
-Here, 'varA' has the type "IORef Int" which means "a variable (reference) in
+Here, <code>varA</code> has the type <code>IORef Int</code> which means "a variable (reference) in
-the IO monad holding a value of type Int". newIORef creates a new variable
+the I/O monad holding a value of type <code>Int</code>". <code>newIORef</code> creates a new variable
 (reference) and returns it, and then read/write actions use this
-reference. The value returned by the "readIORef varA" action depends not
+reference. The value returned by the <code>readIORef varA</code> action depends not
 only on the variable involved but also on the moment this operation is performed so it can return different values on each call.
 Arrays, hash tables and any other ''mutable'' data structures are
 defined in the same way - for each of them, there's an operation that creates a new "mutable value" and returns a reference to it. Then value-specific read and write
-operations in the IO monad are used. The following code shows an example
+operations in the I/O monad are used. The following code shows an example
 using mutable arrays:
@@ Line 517: / Line 517: @@
 </haskell>
-Here, an array of 10 elements with 37 as the initial value at each location is created. After reading the value of the first element (index 1) into 'a' this element's value is changed to 64 and then read again into 'b'. As you can see by executing this code, 'a' will be set to 37 and 'b' to 64.
+Here, an array of 10 elements with 37 as the initial value at each location is created. After reading the value of the first element (index 1) into <code>a</code> this element's value is changed to 64 and then read again into <code>b</code>. As you can see by executing this code, <code>a</code> will be set to 37 and <code>b</code> to 64.
-Other state-dependent operations are also often implemented as IO
+Other state-dependent operations are also often implemented with I/O
 actions. For example, a random number generator should return a different
-value on each call. It looks natural to give it a type involving IO:
+value on each call. It looks natural to give it a type involving <code>IO</code>:
 <haskell>
@@ Line 530: / Line 530: @@
 routine is impure, i.e. its result depends on something in the "real
 world" (file system, memory contents...), internal state and so on,
-you should give it an IO type. Otherwise, the compiler can
+you should give it an <code>IO</code> type. Otherwise, the compiler can
-"optimize" repetitive calls of this procedure with the same parameters!
+"optimize" repetitive calls to the definition with the same parameters!
-For example, we can write a non-IO type for:
+For example, we can write a non-<code>IO</code> type for:
 <haskell>
@@ Line 540: / Line 540: @@
 </haskell>
-because the result of 'sin' depends only on its argument, but
+because the result of <code>sin</code> depends only on its argument, but
 <haskell>
@@ Line 547: / Line 547: @@
 </haskell>
-If you will declare 'tell' as a pure function (without IO) then you may
+If you declare <code>tell</code> as a pure function (without <code>IO</code>) then you may
 get the same position on each call!
-== IO actions as values ==
+== I/O actions as values ==
-By this point you should understand why it's impossible to use IO
+By this point you should understand why it's impossible to use I/O
-actions inside non-IO (pure) procedures. Such procedures just don't
+actions inside non-I/O (pure) functions. Such functions just don't
-get a "baton"; they don't know any "world" value to pass to an IO action.
+get a "baton"; they don't know any "world" value to pass to an I/O action.
+The <code>RealWorld</code> type is an abstract datatype, so pure functions
-The RealWorld type is an abstract datatype, so pure functions also can't construct RealWorld values by themselves, and it's a strict type, so 'undefined' also can't be used. So, the prohibition of using IO actions inside pure procedures is just a type system trick (as it usually is in Haskell).
+also can't construct <code>RealWorld</code> values by themselves, and it's
+a strict type, so <code>undefined</code> also can't be used. So, the
+prohibition of using I/O actions inside pure functions is maintained by the
+type system (as it usually is in Haskell).
-But while pure code can't ''execute'' IO actions, it can work with them
+But while pure code can't ''execute'' I/O actions, it can work with them
 as with any other functional values - they can be stored in data
 structures, passed as parameters, returned as results, collected in
-lists, and partially applied. But an IO action will remain a
+lists, and partially applied. But an I/O action will remain a
 functional value because we can't apply it to the last argument - of
-type RealWorld.
+type <code>RealWorld</code>.
-In order to ''execute'' the IO action we need to apply it to some
+In order to ''execute'' the I/O action we need to apply it to some
-RealWorld value.  That can be done only inside some IO procedure,
+<code>RealWorld</code> value.  That can be done only inside other I/O actions,
-in its "actions chain". And real execution of this action will take
+in their "actions chains". And real execution of this action will take
-place only when this procedure is called as part of the process of
+place only when this action is called as part of the process of
-"calculating the final value of world" for 'main'. Look at this example:
+"calculating the final value of world" for <code>main</code>. Look at this example:
 <haskell>
@@ Line 577: / Line 581: @@
 </haskell>
-Here we first bind a value to 'get2chars' and then write a binding
+Here we first bind a value to <code>get2chars</code> and then write a binding
-involving 'putStr'. But what's the execution order? It's not defined
+involving <code>putStr</code>. But what's the execution order? It's not defined
-by the order of the 'let' bindings, it's defined by the order of processing
+by the order of the <code>let</code> bindings, it's defined by the order of processing
 "world" values! You can arbitrarily reorder the binding statements - the execution order will be defined by the data dependency with respect to the
-"world" values that get passed around. Let's see what this 'main' looks like in the 'do' notation:
+"world" values that get passed around. Let's see what this <code>main</code> looks like in the <code>do</code> notation:
 <haskell>
@@ Line 590: / Line 594: @@
 </haskell>
-As you can see, we've eliminated two of the 'let' bindings and left only the one defining 'get2chars'.  The non-'let' statements are executed in the exact order in which they're written, because they pass the "world" value from statement to statement as we described above.  Thus, this version of the function is much easier to understand because we don't have to mentally figure out the data dependency of the "world" value.
+As you can see, we've eliminated two of the <code>let</code> bindings and left only the one defining <code>get2chars</code>. The non-<code>let</code> statements are executed in the exact order in which they're written, because they pass the "world" value from statement to statement as we described above.  Thus, this version of the function is much easier to understand because we don't have to mentally figure out the data dependency of the "world" value.
-Moreover, IO actions like 'get2chars' can't be executed directly
+Moreover, I/O actions like <code>get2chars</code> can't be executed directly
-because they are functions with a RealWorld parameter. To execute them,
+because they are functions with a <code>RealWorld</code> parameter. To execute them,
-we need to supply the RealWorld parameter, i.e. insert them in the 'main'
+we need to supply the <code>RealWorld</code> parameter, i.e. insert them in the <code>main</code>
-chain, placing them in some 'do' sequence executed from 'main' (either directly in the 'main' function, or indirectly in an IO function called from 'main'). Until that's done, they will remain like any function, in partially
+chain, placing them in some <code>do</code> sequence executed from <code>main</code> (either directly in the <code>main</code> function, or indirectly in an
+I/O function called from <code>main</code>). Until that's done, they will remain like any function, in partially
-evaluated form. And we can work with IO actions as with any other
+evaluated form. And we can work with I/O actions as with any other
 functions - bind them to names (as we did above), save them in data
 structures, pass them as function parameters and return them as results - and
-they won't be performed until you give them that inaugural RealWorld
+they won't be performed until you give them that inaugural <code>RealWorld</code>
 parameter!
-=== Example: a list of IO actions ===
+=== Example: a list of I/O actions ===
-Let's try defining a list of IO actions:
+Let's try defining a list of I/O actions:
 <haskell>
@@ Line 621: / Line 626: @@
 Well, now we want to execute some of these actions. No problem, just
-insert them into the 'main' chain:
+insert them into the <code>main</code> chain:
 <haskell>
@@ Line 629: / Line 634: @@
 </haskell>
-Looks strange, right? Really, any IO action that you write in a 'do'
+Looks strange, right? Really, any I/O action that you write in a <code>do</code>
-statement (or use as a parameter for the '>>'/'>>=' operators) is an expression
+statement (or use as a parameter for the <code>(>>)</code>/<code>(>>=)</code> operators) is an expression
-returning a result of type 'IO a' for some type 'a'. Typically, you use some function that has the type 'x -> y -> ... -> IO a' and provide all the x, y, etc. parameters. But you're not limited to this standard scenario -
+returning a result of type <code>IO a</code> for some type <code>a</code>. Typically, you use some function that has the type <code>x -> y -> ... -> IO a</code> and provide all the x, y, etc. parameters. But you're not limited to this standard scenario -
 don't forget that Haskell is a functional language and you're free to
-compute the functional value required (recall that "IO a" is really a function
+compute the functional value required (recall that <code>IO a</code> is really a function
 type) in any possible way. Here we just extracted several functions
 from the list - no problem. This functional value can also be
 constructed on-the-fly, as we've done in the previous example - that's also
 OK. Want to see this functional value passed as a parameter?
-Just look at the definition of 'when'.  Hey, we can buy, sell, and rent
+Just look at the definition of <code>when</code>.  Hey, we can buy, sell, and rent
-these IO actions just like we can with any other functional values! For example, let's define a function that executes all the IO actions in the list:
+these I/O actions just like we can with any other functional values! For example,
+let's define a function that executes all the I/O actions in the list:
 <haskell>
@@ Line 648: / Line 654: @@
 </haskell>
-No mirrors or smoke - we just extract IO actions from the list and insert
+No mirrors or smoke - we just extract I/O actions from the list and insert
-them into a chain of IO operations that should be performed one after another (in the same order that they occurred in the list) to "compute the final world value" of the entire 'sequence_' call.
+them into a chain of I/O operations that should be performed one after another (in the same order that they occurred in the list) to "compute the final world value" of the entire <code>sequence_</code> call.
-With the help of 'sequence_', we can rewrite our last 'main' function as:
+With the help of <code>sequence_</code>, we can rewrite our last <code>main</code> function as:
 <haskell>
@@ Line 657: / Line 663: @@
 </haskell>
-Haskell's ability to work with IO actions as with any other
+Haskell's ability to work with I/O actions as with any other
 (functional and non-functional) values allows us to define control
 structures of arbitrary complexity. Try, for example, to define a control
-structure that repeats an action until it returns the 'False' result:
+structure that repeats an action until it returns the <code>False</code> result:
 <haskell>
@@ Line 669: / Line 675: @@
 Most programming languages don't allow you to define control structures at all, and those that do often require you to use a macro-expansion system.  In Haskell, control structures are just trivial functions anyone can write.
-=== Example: returning an IO action as a result ===
+=== Example: returning an I/O action as a result ===
-How about returning an IO action as the result of a function?  Well, we've done
+How about returning an I/O action as the result of a function?  Well, we've done
-this each time we've defined an IO procedure - they all return IO actions
+this for each I/O definition - they all return I/O actions
-that need a RealWorld value to be performed. While we usually just
+that need a <code>RealWorld</code> value to be performed. While we usually just
-execute them as part of a higher-level IO procedure, it's also
+execute them as part of a higher-level I/O definition, it's also
 possible to just collect them without actual execution:
@@ Line 681: / Line 687: @@
               b = when True getChar
               c = getChar >> getChar
-          putStr "These 'let' statements are not executed!"
+          putStr "These let-statements are not executed!"
 </haskell>
-These assigned IO procedures can be used as parameters to other
+These assigned I/O actions can be used as parameters to other
-procedures, or written to global variables, or processed in some other
+definitions, or written to global variables, or processed in some other
-way, or just executed later, as we did in the example with 'get2chars'.
+way, or just executed later, as we did in the example with <code>get2chars</code>.
-But how about returning a parameterized IO action from an IO procedure?  Let's define a procedure that returns the i'th byte from a file represented as a Handle:
+But how about returning a parameterized I/O action from an I/O definition?
+Here's a definition that returns the i'th byte from a file represented as a Handle:
 <haskell>
@@ Line 695: / Line 702: @@
 </haskell>
-So far so good. But how about a procedure that returns the i'th byte of a file
+So far so good. But how about a definition that returns the i'th byte of a file
 with a given name without reopening it each time?
@@ Line 704: / Line 711: @@
 </haskell>
-As you can see, it's an IO procedure that opens a file and returns...
+As you can see, it's an I/O definition that opens a file and returns...an
-another IO procedure that will read the specified byte. But we can go
+I/O action that will read the specified byte. But we can go
-further and include the 'readi' body in 'readfilei':
+further and include the <code>readi</code> body in <code>readfilei</code>:
 <haskell>
@@ Line 715: / Line 722: @@
 </haskell>
-That's a little better.  But why do we add 'h' as a parameter to 'readi' if it can be obtained from the environment where 'readi' is now defined?  An even shorter version is this:
+That's a little better.  But why do we add <code>h</code> as a parameter to <code>readi</code> if it can be obtained from the environment where <code>readi</code> is now defined?  An even shorter version is this:
 <haskell>
@@ Line 724: / Line 731: @@
 </haskell>
-What have we done here? We've build a parameterized IO action involving local
+What have we done here? We've built a parameterized I/O action involving local
-names inside 'readfilei' and returned it as the result. Now it can be
+names inside <code>readfilei</code> and returned it as the result. Now it can be
 used in the following way:
@@ Line 735: / Line 742: @@
 </haskell>
-This way of using IO actions is very typical for Haskell programs - you
+This way of using I/O actions is very typical for Haskell programs - you
-just construct one or more IO actions that you need,
+just construct one or more I/O actions that you need,
 with or without parameters, possibly involving the parameters that your
-"constructor" received, and return them to the caller. Then these IO actions
+"constructor" received, and return them to the caller. Then these I/O actions
 can be used in the rest of the program without any knowledge about your
 internal implementation strategy. One thing this can be used for is to
@@ Line 745: / Line 752: @@
 === Example: a memory allocator generator ===
-As an example, one of my programs has a module which is a memory suballocator. It receives the address and size of a large memory block and returns two
+As an example, one of my programs has a module which is a memory suballocator.
+It receives the address and size of a large memory block and returns two
-procedures - one to allocate a subblock of a given size and the other to
+specialised I/O operations - one to allocate a subblock of a given size
-free the allocated subblock:
+and the other to free the allocated subblock:
 <haskell>
@@ Line 761: / Line 769: @@
 </haskell>
-How this is implemented? 'alloc' and 'free' work with references
+How is this implemented? <code>alloc</code> and <code>free</code> work with references
-created inside the memoryAllocator procedure. Because the creation of these references is a part of the memoryAllocator IO actions chain, a new independent set of references will be created for each memory block for which
+created inside the <code>memoryAllocator</code> definition. Because the creation of these references is a part of the
+<code>memoryAllocator</code> I/O-action chain, a new independent set of references will be created for each memory block for which
-memoryAllocator is called:
+<code>memoryAllocator</code> is called:
 <haskell>
@@ Line 771: / Line 780: @@
 </haskell>
-These two references are read and written in the 'alloc' and 'free' definitions (we'll implement a very simple memory allocator for this example):
+These two references are read and written in the <code>alloc</code> and <code>free</code> definitions (we'll implement a very simple memory allocator for this example):
 <haskell>
@@ Line 787: / Line 796: @@
 of direct support for impure functions.
-The following example uses procedures, returned by memoryAllocator, to
+The following example uses the operations returned by <code>memoryAllocator</code> to
 simultaneously allocate/free blocks in two independent memory buffers:
@@ Line 809: / Line 818: @@
 to create a heterogeneous list of figures. All figures in this list should
 support the same set of operations: draw, move and so on. We will
-represent these operations as IO procedures. Instead of a "class" let's
+define these operations using I/O actions. Instead of a "class" let's
-define a structure containing implementations of all the procedures
+define a structure containing implementations of all the operations
 required:
@@ Line 832: / Line 841: @@
 We will "draw" figures by just printing their current parameters.
-Let's start with a simplified implementation of the 'circle' and 'rectangle'
+Let's start with a simplified implementation of the <code>circle</code> and <code>rectangle</code>
-constructors, without actual 'move' support:
+constructors, without actual <code>move</code> support:
 <haskell>
@@ Line 845: / Line 854: @@
 </haskell>
-As you see, each constructor just returns a fixed 'draw' procedure that prints
+As you see, each constructor just returns a fixed <code>draw</code> operation that prints
 parameters with which the concrete figure was created. Let's test it:
@@ Line 864: / Line 873: @@
 moved around. In order to achieve this, we should provide each figure
 with a mutable variable that holds each figure's current screen location. The
-type of this variable will be "IORef Point". This variable should be created in the figure constructor and manipulated in IO procedures (closures) enclosed in
+type of this variable will be <code>IORef Point</code>. This variable should
+be created in the figure constructor and manipulated in I/O operations (closures) enclosed in
 the Figure record:
@@ Line 906: / Line 916: @@
 </haskell>
-It's important to realize that we are not limited to including only IO actions
+It's important to realize that we are not limited to including only I/O actions
-in a record that's intended to simulate a C++/Java-style interface. The record can also include values, IORefs, pure functions - in short, any type of data. For example, we can easily add to the Figure interface fields for area and origin:
+in a record that's intended to simulate a C++/Java-style interface. The record can also include values, <code>IORef</code>s, pure functions - in short, any type of data. For example, we can easily add to the Figure interface fields for area and origin:
 <haskell>
@@ Line 921: / Line 931: @@
 Although Haskell provides a set of exception raising/handling features comparable to those in popular OOP languages (C++, Java, C#), this part of the language receives much less attention. This is for two reasons. First, you just don't need to worry as much about them - most of the time it just works "behind the scenes". The second reason is that Haskell, lacking OOP inheritance, doesn't allow the programmer to easily subclass exception types, therefore limiting flexibility of exception handling.
-The Haskell RTS raises more exceptions than traditional languages - pattern match failures, calls with invalid arguments (such as '''head []''') and computations whose results depend on special values '''undefined''' and '''error "...."''' all raise their own exceptions:
+The Haskell RTS raises more exceptions than traditional languages - pattern match failures, calls with invalid arguments (such as <code>head []</code>) and computations whose results depend on special values <code>undefined</code> and <code>error "...."</code> all raise their own exceptions:
 * example 1:
@@ Line 1,008: / Line 1,018: @@
   ghc --make main.hs evil.c
-Or, you may compile C module(s) separately and link in .o files (this may be preferable if you use <code>make</code> and don't want to recompile unchanged sources; ghc's --make option provides smart recompilation only for .hs files):
+Or, you may compile C module(s) separately and link in ".o" files (this may be preferable if you use <code>make</code> and don't want to recompile unchanged sources; ghc's --make option provides smart recompilation only for .hs files):
   ghc -c evil.c
   ghc --make main.hs evil.o
-You may use gcc/g++ directly to compile your C/C++ files but I recommend to do linking via ghc because it adds a lot of libraries required for execution of Haskell code. For the same reason, even if your main routine is written in C/C++, I recommend calling it from the Haskell function <hask>main</hask> - otherwise you'll have to explicitly init/shutdown the GHC RTS (run-time system).
+You may use gcc/g++ directly to compile your C/C++ files but I recommend linking via ghc because it adds a lot of libraries required for execution of Haskell code. For the same reason, even if your <code>main</code> routine is written in C/C++, I recommend calling it from the Haskell function <code>main</code> - otherwise you'll have to explicitly init/shutdown the GHC RTS (run-time system).
-We use the "foreign import" specification to import foreign routines into our Haskell world, and "foreign export" to export Haskell routines into the external world. Note that the import statement creates a new Haskell symbol (from the external one), while the export statement uses a Haskell symbol previously defined. Technically speaking, both types of statements create a wrapper that converts the names and calling conventions from C to Haskell or vice versa.
+We use the <code>foreign import</code> specification to import foreign routines into our Haskell world, and <code>foreign export</code> to export Haskell routines into the external world. Note that the import statement creates a new Haskell symbol (from the external one), while the export statement uses a Haskell symbol previously defined. Technically speaking, both types of statements create a wrapper that converts the names and calling conventions from C to Haskell or vice versa.
-=== All about the "foreign" statement ===
+=== All about the <code>foreign</code> statement ===
-The "ccall" specifier in foreign statements means the use of C (not C++ !) calling convention. This means that if you want to write the external function in C++ (instead of C) you should add '''export "C"''' specification to its declaration - otherwise you'll get linking errors. Let's rewrite our first example to use C++ instead of C:
+The <code>ccall</code> specifier in foreign statements means the use of the C (not C++ !) calling convention. This means that if you want to write the external function in C++ (instead of C) you should add an <code>extern "C"</code> specification to its declaration - otherwise you'll get linking errors. Let's rewrite our first example to use C++ instead of C:
 prototypes.h:
@@ Line 1,038: / Line 1,048: @@
   ghc --make main.hs evil.cpp
-where evil.cpp is just a renamed copy of evil.c from the first example. Note that the new prototypes.h is written to allow compiling it both as C and C++ code. When it's included from evil.cpp, it's compiled as C++ code. When GHC compiles main.hs via the C compiler (enabled by -fvia-C option), it also includes prototypes.h but compiles it in C mode. It's why you need to specify .h files in "foreign" declarations - depending on which Haskell compiler you use, these files may be included to check consistency of C and Haskell declarations.
+where "evil.cpp" is just a renamed copy of "evil.c" from the first example. Note that the new "prototypes.h" is written to allow compiling it both as C and C++ code. When it's included from evil.cpp, it's compiled as C++ code. When GHC compiles "main.hs" via the C compiler (enabled by -fvia-C option), it also includes prototypes.h but compiles it in C mode. It's why you need to specify ".h" files in <code>foreign</code> declarations - depending on which Haskell compiler you use, these files may be included to check consistency of C and Haskell declarations.
 The quoted part of the foreign statement may also be used to import or export a function under another name--for example,
@@ Line 1,050: / Line 1,060: @@
 </haskell>
-specifies that the C function called CFunction will become known as the Haskell function c_function, while the Haskell function haskell_function will be known in the C world as HaskellFunction. It's required when the C name doesn't conform to Haskell naming requirements.
+specifies that the C function called <code>CFunction</code> will become known as the Haskell function <code>c_function</code>, while the Haskell function <code>haskell_function</code> will be known in the C world as <code>HaskellFunction</code>. It's required when the C name doesn't conform to Haskell naming requirements.
-Although the Haskell FFI standard tells about many other calling conventions in addition to ccall (e.g. cplusplus, jvm, net) current Haskell implementations support only ccall and stdcall. The latter, also called the "Pascal" calling convention, is used to interface with WinAPI:
+Although the Haskell FFI standard describes many other calling conventions in addition to <code>ccall</code> (e.g. <code>cplusplus</code>, <code>jvm</code>, <code>net</code>), current Haskell implementations support only <code>ccall</code> and <code>stdcall</code>. The latter, also called the "Pascal" calling convention, is used to interface with WinAPI:
 <haskell>
@@ Line 1,059: / Line 1,069: @@
 </haskell>
-And finally, about the safe/unsafe specifier: a C function imported with the "unsafe" keyword is called directly and the Haskell runtime is stopped while the C function is executed (when there are several OS threads executing the Haskell program, only the current OS thread is delayed). This call doesn't allow recursively entering into the Haskell world by calling any Haskell function - the Haskell RTS is just not prepared for such an event. However, unsafe calls are as quick as calls in C world. It's ideal for "momentary" calls that quickly return back to the caller.
+And finally, about the <code>safe</code>/<code>unsafe</code> specifier: a C function imported with the <code>unsafe</code> keyword is called directly and the Haskell runtime is stopped while the C function is executed (when there are several OS threads executing the Haskell program, only the current OS thread is delayed). This call doesn't allow recursively entering into the Haskell world by calling any Haskell function - the Haskell RTS is just not prepared for such an event. However, <code>unsafe</code> calls are as quick as calls in C world. It's ideal for "momentary" calls that quickly return back to the caller.
-When "safe" is specified, the C function is called in safe environment - the Haskell execution context is saved, so it's possible to call back to Haskell and, if the C call takes a long time, another OS thread may be started to execute Haskell code (of course, in threads other than the one that called the C code). This has its own price, though - around 1000 CPU ticks per call.
+When <code>safe</code> is specified, the C function is called in safe environment - the Haskell execution context is saved, so it's possible to call back to Haskell and, if the C call takes a long time, another OS thread may be started to execute Haskell code (of course, in threads other than the one that called the C code). This has its own price, though - around 1000 CPU ticks per call.
 You can read more about interaction between FFI calls and Haskell concurrency in [[#readmore|[7]]].
@@ Line 1,083: / Line 1,093: @@
 </haskell>
-Note that pure C functions (those whose results depend only on their arguments) are imported without IO in their return type. The "const" specifier in C is not reflected in Haskell types, so appropriate compiler checks are not performed. <!-- What would these be? -->
+Note that pure C functions (those whose results depend only on their arguments) are imported without <code>IO</code> in their return type. The <code>const</code> specifier in C is not reflected in Haskell types, so appropriate compiler checks are not performed. <!-- What would these be? -->
-All these numeric types are instances of the same classes as their Haskell cousins (Ord, Num, Show and so on), so you may perform calculations on these data directly. Alternatively, you may convert them to native Haskell types. It's very typical to write simple wrappers around imported and exported functions just to provide interfaces having native Haskell types:
+All these numeric types are instances of the same classes as their Haskell cousins (<code>Ord</code>, <code>Num</code>, <code>Show</code> and so on), so you may perform calculations on these data directly. Alternatively, you may convert them to native Haskell types. It's very typical to write simple wrappers around imported and exported functions just to provide interfaces having native Haskell types:
 <haskell>
@@ Line 1,130: / Line 1,140: @@
 * putting Haskell code into a DLL which may be called from C code
-== Dark side of IO monad ==
+== Dark side of I/O monad ==
-=== unsafePerformIO ===
+=== <code>unsafePerformIO</code> ===
-Programmers coming from an imperative language background often look for a way to execute IO actions inside a pure procedure. But what does this mean?
+Programmers coming from an imperative language background often look for a way to execute I/O actions inside a pure function. But what does this mean?
-Imagine that you're trying to write a procedure that reads the contents of a file with a given name, and you try to write it as a pure (non-IO) function:
+Imagine that you're trying to write a function that reads the contents of a file with a given name, and you try to write it as a pure (non-<code>IO</code>) function:
 <haskell>
@@ Line 1,144: / Line 1,154: @@
 * This call is not inserted in a sequence of "world transformations", so the compiler doesn't know at what exact moment you want to execute this action. For example, if the file has one kind of contents at the beginning of the program and another at the end - which contents do you want to see?  You have no idea when (or even if) this function is going to get invoked, because Haskell sees this function as pure and feels free to reorder the execution of any or all pure functions as needed.
-* Attempts to read the contents of files with the same name can be factored (''i.e.'' reduced to a single call) despite the fact that the file (or the current directory) can be changed between calls. Again, Haskell considers all non-IO functions to be pure and feels free to omit multiple calls with the same parameters.
+* Attempts to read the contents of files with the same name can be factored (''i.e.'' reduced to a single call) despite the fact that the file (or the current directory) can be changed between calls. Again, Haskell considers all non-<code>IO</code> functions to be pure and feels free to omit multiple calls with the same parameters.
-So, implementing pure functions that interact with the Real World is
+So, implementing supposedly-pure functions that interact with the '''Real World''' is
-considered to be Bad Behavior. Nice programmers never do it ;)
+considered to be '''Bad Behavior'''. Nice programmers never do it ;-)
-Nevertheless, there are (semi-official) ways to use IO actions inside
+Nevertheless, there are (semi-official) ways to use I/O actions inside
 of pure functions. As you should remember this is prohibited by
-requiring the RealWorld "baton" in order to call an IO action. Pure functions don't have the baton, but there is a ''(ahem)'' "special" procedure that produces this baton from nowhere, uses it to call an IO action and then throws the resulting "world" away!  It's a little low-level mirror-smoke. This particular (and dangerous) procedure is:
+requiring the <code>RealWorld</code> "baton" in order to call an I/O action. Pure functions don't have the baton, but there is a ''(ahem)'' "special" definition that produces this baton from nowhere, uses it to call an I/O action and then throws the resulting "world" away!  It's a little low-level mirror-smoke. This particular (and dangerous) definition is:
 <haskell>
@@ Line 1,165: / Line 1,175: @@
 </haskell>
-where 'createNewWorld' is an internal function producing a new value of
+where <code>createNewWorld</code> is an internal function producing a new value of
-the RealWorld type.
+the <code>RealWorld</code> type.
-Using unsafePerformIO, you can easily write pure functions that do
+Using <code>unsafePerformIO</code>, you could easily write pure functions that do
 I/O inside. But don't do this without a real need, and remember to
 follow this rule: the compiler doesn't know that you are cheating; it still
-considers each non-IO function to be a pure one. Therefore, all the usual
+considers each non-<code>IO</code> function to be a pure one. Therefore, all the usual
 optimization rules can (and will!) be applied to its execution. So
 you must ensure that:
@@ Line 1,179: / Line 1,189: @@
 Let's investigate this problem more deeply. Function evaluation in Haskell
-is determined by a value's necessity - the language computes only the values that are really required to calculate the final result. But what does this mean with respect to the 'main' function?  To "calculate the final world's" value, you need to perform all the intermediate IO actions that are included in the 'main' chain. By using 'unsafePerformIO' we call IO actions outside of this chain.  What guarantee do we have that they will be run at all? None. The only time they will be run is if running them is required to compute the overall function result (which in turn should be required to perform some action in the
+is determined by a value's necessity - the language computes only the values that are really required to calculate the final result. But what does this mean with respect to the <code>main</code> function?  To "calculate the final world's" value, you need to perform all the intermediate I/O actions that are included in the <code>main</code> chain. By using <code>unsafePerformIO</code> we call I/O actions outside of this chain.  What guarantee do we have that they will be run at all? None. The only time they will be run is if running them is required to compute the overall function result (which in turn should be required to perform some action in the <code>main</code> chain). This is an example of Haskell's evaluation-by-need strategy. Now you should clearly see the difference:
-'main' chain). This is an example of Haskell's evaluation-by-need strategy. Now you should clearly see the difference:
-* An IO action inside an IO procedure is guaranteed to execute as long as it is (directly or indirectly) inside the 'main' chain - even when its result isn't used (because the implicit "world" value it returns ''will'' be used). You directly specify the order of the action's execution inside the IO procedure. Data dependencies are simulated via the implicit "world" values that are passed from each IO action to the next.
+* An I/O action inside an I/O definition is guaranteed to execute as long as it is (directly or indirectly) inside the <code>main</code> chain - even when its result isn't used (because the implicit "world" value it returns ''will'' be used). You directly specify the order of the action's execution inside the I/O definition. Data dependencies are simulated via the implicit "world" values that are passed from each I/O action to the next.
-* An IO action inside 'unsafePerformIO' will be performed only if the result of this operation is really used. The evaluation order is not guaranteed and you should not rely on it (except when you're sure about
+* An I/O action inside <code>unsafePerformIO</code> will be performed only if the result of this operation is really used. The evaluation order is not guaranteed and you should not rely on it (except when you're sure about
 whatever data dependencies may exist).
-I should also say that inside 'unsafePerformIO' call you can organize
+I should also say that inside an <code>unsafePerformIO</code> call you can organize
-a small internal chain of IO actions with the help of the same binding
+a small internal chain of I/O actions with the help of the same binding
-operators and/or 'do' syntactic sugar we've seen above.  For example, here's a particularly convoluted way to compute the integer that comes after zero:
+operators and/or <code>do</code> syntactic sugar we've seen above.  For example, here's a particularly convoluted way to compute the integer that comes after zero:
 <haskell>
-one :: Int
+one :: Integer
 one = unsafePerformIO $ do var <- newIORef 0
                            modifyIORef var (+1)
@@ Line 1,199: / Line 1,208: @@
 and in this case ALL the operations in this chain will be performed as
-long as the result of the 'unsafePerformIO' call is needed. To ensure this,
+long as the result of the <code>unsafePerformIO</code> call is needed. To ensure this,
-the actual 'unsafePerformIO' implementation evaluates the "world" returned
+the actual <code>unsafePerformIO</code> implementation evaluates the "world" returned
-by the 'action':
+by the <code>action</code>:
 <haskell>
@@ Line 1,208: / Line 1,217: @@
 </haskell>
-(The 'seq' operation strictly evaluates its first argument before
+(The <code>seq</code> operation strictly evaluates its first argument before
 returning the value of the second one [[#readmore|[8]]]).
-=== inlinePerformIO ===
+=== <code>inlinePerformIO</code> ===
-inlinePerformIO has the same definition as unsafePerformIO but with addition of an INLINE pragma:
+<code>inlinePerformIO</code> has the same definition as <code>unsafePerformIO</code> but with addition of an <code>INLINE</code> pragma:
 <haskell>
 -- | Just like unsafePerformIO, but we inline it. Big performance gains as
@@ Line 1,223: / Line 1,232: @@
 </haskell>
-Semantically inlinePerformIO = unsafePerformIO
+Semantically <code>inlinePerformIO</code> = <code>unsafePerformIO</code>
 in as much as either of those have any semantics at all.
-The difference of course is that inlinePerformIO is even less safe than
+The difference of course is that <code>inlinePerformIO</code> is even less safe than
-unsafePerformIO. While ghc will try not to duplicate or common up
+<code>unsafePerformIO</code>. While ghc will try not to duplicate or common up
-different uses of unsafePerformIO, we aggressively inline
+different uses of <code>unsafePerformIO</code>, we aggressively inline
-inlinePerformIO. So you can really only use it where the IO content is
+<code>inlinePerformIO</code>. So you can really only use it where the I/O content is
 really properly pure, like reading from an immutable memory buffer (as
-in the case of ByteStrings). However things like allocating new buffers
+in the case of <code>ByteString</code>s). However things like allocating new buffers
-should not be done inside inlinePerformIO since that can easily be
+should not be done inside <code>inlinePerformIO</code> since that can easily be
 floated out and performed just once for the whole program, so you end up
 with many things sharing the same buffer, which would be bad.
-So the rule of thumb is that IO things wrapped in unsafePerformIO have
+So the rule of thumb is that I/O actions wrapped in <code>unsafePerformIO</code> have
-to be externally pure while with inlinePerformIO it has to be really
+to be externally pure while with <code>inlinePerformIO</code> it has to be really,
-really pure or it'll all go horribly wrong.
+''really'' pure or it'll all go horribly wrong.
 That said, here's some really hairy code. This should frighten any pure
@@ Line 1,247: / Line 1,256: @@
 write !n body = Put $ \c buf@(Buffer fp o u l) ->
   if n <= l
-    then write' c fp o u l
+    then write' c fp o u l
-    else write' (flushOld c n fp o u) (newBuffer c n) 0 0 0
+    else write' (flushOld c n fp o u) (newBuffer c n) 0 0 0
-  where {-# NOINLINE write' #-}
+  where {-# NOINLINE write' #-}
-        write' c !fp !o !u !l =
+        write' c !fp !o !u !l =
           -- warning: this is a tad hardcore
           inlinePerformIO
@@ Line 1,266: / Line 1,275: @@
 This does not adhere to my rule of thumb above. Don't ask exactly why we
 claim it's safe :-) (and if anyone really wants to know, ask Ross
-Paterson who did it first in the Builder monoid)
+Paterson who did it first in the <code>Builder</code> monoid)
-=== unsafeInterleaveIO ===
+=== <code>unsafeInterleaveIO</code> ===
 But there is an even stranger operation:
@@ Line 1,276: / Line 1,285: @@
 </haskell>
-Don't let that type signature fool you - 'unsafeInterleaveIO' also uses
+Don't let that type signature fool you - <code>unsafeInterleaveIO</code> also uses
 a dubiously-acquired baton which it uses to set up an underground
 relay-race for its unsuspecting parameter. If it happens, this seedy race
-then occurs alongside the offical 'main' relay-race - if they collide,
+then occurs alongside the official <code>main</code> relay-race - if they collide,
 things will get ugly!
-So how does 'unsafeInterleaveIO' get that bootleg baton? Typically by
+So how does <code>unsafeInterleaveIO</code> get that bootleg baton? Typically by
 making a forgery of the official one to keep for itself - it can do
-this because the I/O action 'unsafeInterleaveIO' returns will be
+this because the I/O action <code>unsafeInterleaveIO</code> returns will be
-handed the offical baton in the 'main' relay-race. But one
+handed the official baton in the <code>main</code> relay-race. But one
 miscreant realised there was a simpler way:
@@ Line 1,295: / Line 1,304: @@
 Why bother with counterfeit copies of batons if you can just make them up?
-At least you have some appreciation as to why 'unsafeInterleaveIO' is, well
+At least you have some appreciation as to why <code>unsafeInterleaveIO</code> is, well
-''unsafe!'' Just don't ask - to talk further is bound to cause grief and
+'''unsafe!''' Just don't ask - to talk further is bound to cause grief and
 indignation. I won't say anything more about this ruffian I...use
 all the time (darn it!)
-One can use unsafePerformIO (not unsafeInterleaveIO) to perform I/O
+One can use <code>unsafePerformIO</code> (not <code>unsafeInterleaveIO</code>) to perform I/O
 operations not in predefined order but by demand. For example, the
 following code:
@@ Line 1,324: / Line 1,333: @@
 is not what we usually need.
+<code>unsafeInterleaveIO</code> solves this problem - it performs I/O only on
+demand but allows you to define the exact ''internal'' execution order for parts
-unsafeInterleaveIO solves this problem - it performs I/O only on
+of your datastructure. It is why I wrote that <code>unsafeInterleaveIO</code> makes
-demand but allows to define exact ''internal'' execution order for parts
-of your datastructure. It is why I wrote that unsafeInterleaveIO makes
 an illegal copy of the baton:
-* unsafeInterleaveIO accepts an I/O action as a parameter and returns
+* <code>unsafeInterleaveIO</code> accepts an I/O action as a parameter and returns another I/O action as the result:
-another I/O action as the result:
 <haskell>
@@ Line 1,337: / Line 1,345: @@
 </haskell>
-* unsafeInterleaveIO doesn't perform any action immediately, it
+* <code>unsafeInterleaveIO</code> doesn't perform any action immediately; it only creates a box of type <code>a</code> which, when its value is requested, will perform the action specified as a parameter.
-only creates a box of type 'a' which on requesting this value will
-perform action specified as a parameter.
-* this action by itself may compute the whole value immediately
+* this action by itself may compute the whole value immediately or...use <code>unsafeInterleaveIO</code> again to defer calculation of some sub-components:
-or... use unsafeInterleaveIO again to defer calculation of some
-sub-components:
 <haskell>
@@ Line 1,353: / Line 1,357: @@
 This code will be executed only at the moment when value of str is
-really demanded. In this moment, getChar will be performed (with
+really demanded. In this moment, <code>getChar</code> will be performed (with
-result assigned to c) and one more lazy IO box will be created - for s.
+result assigned to <code>c</code>) and one more lazy I/O box will be created - for <code>s</code>.
-This box again contains link to the myGetContents call
+This box again contains a link to the <code>myGetContents</code> call.
 Then a list cell is returned that contains the one char read and a link to the
-myGetContents call as a way to compute rest of the list. Only at the
+<code>myGetContents</code> call as a way to compute rest of the list. Only at the
 moment when the next value in the list is required, this operation will be
 performed again.
@@ Line 1,373: / Line 1,377: @@
    c <- replicateM 512 getChar
    s <- unsafeInterleaveIO myGetContents
+   return (c++s)
+</haskell>
+and we can rewrite <code>myGetContents</code> to avoid needing to
+use <code>unsafeInterleaveIO</code> where it's called:
+<haskell>
+myGetContents = unsafeInterleaveIO $ do
+   c <- replicateM 512 getChar
+   s <- myGetContents
    return (c++s)
 </haskell>
@@ Line 1,378: / Line 1,392: @@
 == A safer approach: the ST monad ==
-We said earlier that we can use unsafePerformIO to perform computations that are totally pure but nevertheless interact with the Real World in some way.  There is, however, a better way!  One that remains totally pure and yet allows the use of references, arrays, and so on -- and it's done using, you guessed it, Haskell's versatile type system (and one extension). This is the ST monad.
+We said earlier that we can use <code>unsafePerformIO</code> to perform computations that are totally pure but nevertheless interact with the real world in some way.  There is, however, a better way!  One that remains totally pure and yet allows the use of references, arrays, and so on - and it's done using, you guessed it, Haskell's versatile type system (and one extension). This is the ST monad.
-The ST monad's version of unsafePerformIO is called runST, and it has a very unusual type.
+The ST monad's version of <code>unsafePerformIO</code> is called <code>runST</code>, and it has a very unusual type.
 <haskell>
 runST :: (forall s . ST s a) -> a
 </haskell>
-The s variable in the ST monad is the state type.  Moreover, all the fun mutable stuff available in the ST monad is quantified over s:
+The <code>s</code> variable in the ST monad is the state type.  Moreover, all the fun mutable stuff available in the ST monad is quantified over <code>s</code>:
 <haskell>
 newSTRef :: a -> ST s (STRef s a)
@@ Line 1,391: / Line 1,405: @@
 </haskell>
-So why does runST have such a funky type? Let's see what would happen if we wrote
+So why does <code>runST</code> have such a funky type? Let's see what would happen if we wrote
 <haskell>
 makeSTRef :: a -> STRef s a
 makeSTRef a = runST (newSTRef a)
 </haskell>
-This fails, because newSTRef a doesn't work for all state types s -- it only works for the s from the return type STRef s a.
+This fails, because <code>newSTRef a</code> doesn't work for all state types <code>s</code> - it only works for the <code>s</code> from the return type <code>STRef s a</code>.
-This is all sort of wacky, but the result is that you can only run an ST computation where the output type is functionally pure, and makes no references to the internal mutable state of the computation.  The ST monad doesn't have access to I/O operations like writing to the console, either -- only references, arrays, and suchlike that come in handy for pure computations.
+This is all sort of wacky, but the result is that you can only run an ST computation where the output type is functionally pure, and makes no references to the internal mutable state of the computation.  The ST monad doesn't have access to I/O operations like writing to the console, either - only references, arrays, and such that come in handy for pure computations.
-Important note -- the state type doesn't actually mean anything.  We never have a value of type s, for instance.  It's just a way of getting the type system to do the work of ensuring purity for us, with smoke and mirrors.
+Important note - the state type doesn't actually mean anything.  We never have a value of type <code>s</code>, for instance.  It's just a way of getting the type system to do the work of ensuring purity is preserved.
-On the inside, runST runs a computation with the real world baton just like unsafePerformIO.  Their internal implementations are almost identical: in fact, there's a function
+On the inside, <code>runST</code> runs a computation with the real world baton just like <code>unsafePerformIO</code>.  Their internal implementations are almost identical: in fact, there's a function
 <haskell>
 stToIO :: ST RealWorld a -> IO a
@@ Line 1,409: / Line 1,423: @@
 The difference is that ST uses the type system to forbid unsafe behavior like extracting mutable objects from their safe ST wrapping, while still allowing purely functional outputs to be computed with all the handy access to mutable references and arrays.
-So here's how we'd rewrite our function using unsafePerformIO from above:
+So here's how we'd rewrite our function using <code>unsafePerformIO</code> from above:
 <haskell>
@@ Line 1,424: / Line 1,438: @@
 A little disclaimer: I should say that I'm not describing
-here exactly what a monad is (I don't even completely understand it myself) and my explanation shows only one ''possible'' way to implement the IO monad in
+here exactly what a monad is (I don't even completely understand it myself) and my explanation shows only one ''possible'' way to implement the I/O monad in
 Haskell. For example, the hbc compiler and the Hugs interpreter
-implements the IO monad via continuations [[#readmore|[9]]]. I also haven't said anything about
+implement the I/O monad via continuations [[#readmore|[9]]]. I also haven't said anything about
 exception handling, which is a natural part of the "monad" concept. You can
 read the "All About Monads" guide to learn more about these topics.
-But there is some good news: first, the IO monad understanding you've just acquired will work with any implementation and with many other monads. You just can't work with RealWorld
+But there is some good news: first, the I/O monad understanding you've just acquired will work with any implementation and with many other monads. You just can't work with <code>RealWorld</code>
 values directly.
-Second, the IO monad implementation described here is really used in the GHC,
+Second, the I/O monad implementation described here is really used in the GHC,
-yhc/nhc (jhc, too?) compilers. Here is the actual IO definition
+yhc/nhc (jhc, too?) compilers. Here is the actual <code>IO</code> definition
 from the GHC sources:
@@ Line 1,441: / Line 1,455: @@
 </haskell>
-It uses the "State# RealWorld" type instead of our RealWorld, it uses the "(# #)" strict tuple for optimization, and it adds an IO data constructor
+It uses the <code>State# RealWorld</code> type instead of our <code>RealWorld</code>, it uses the <code>(# ... #)</code> unboxed tuple for optimization, and it adds an <code>IO</code> data constructor
-around the type. Nevertheless, there are no significant changes from the standpoint of our explanation. Knowing the principle of "chaining" IO actions via fake "state of the world" values, you can now easily understand and write low-level implementations of GHC I/O operations.
+around the type. Nevertheless, there are no significant changes from the standpoint of our explanation. Knowing the principle of "chaining" I/O actions via fake "state of the world" values, you can now easily understand and write low-level implementations of GHC I/O operations.
 === The [[Yhc]]/nhc98 implementation ===
@@ Line 1,451: / Line 1,465: @@
 </haskell>
-This implementation makes the "World" disappear somewhat[[#readmore|[10]]], and returns Either a
+This implementation makes the <code>World</code> disappear somewhat[[#readmore|[10]]], and returns <code>Either</code> a
-result of type "a", or if an error occurs then "IOError". The lack of the World on the right-hand side of the function can only be done because the compiler knows special things about the IO type, and won't overoptimise it.
+result of type <code>a</code>, or if an error occurs then <code>IOError</code>. The lack of the <code>World</code> on the right-hand side of the function is only possible because the compiler knows special things about the <code>IO</code> type, and won't overoptimise it.
 == <span id="readmore"></span>Further reading ==
-[1] This tutorial is largely based on the Simon Peyton Jones' paper [http://research.microsoft.com/%7Esimonpj/Papers/marktoberdorf Tackling the awkward squad: monadic input/output, concurrency, exceptions, and foreign-language calls in Haskell]. I hope that my tutorial improves his original explanation of the Haskell I/O system and brings it closer to the point of view of beginning Haskell programmers. But if you need to learn about concurrency, exceptions and FFI in Haskell/GHC, the original paper is the best source of information.
+[1] This tutorial is largely based on Simon Peyton Jones's paper [http://research.microsoft.com/%7Esimonpj/Papers/marktoberdorf Tackling the awkward squad: monadic input/output, concurrency, exceptions, and foreign-language calls in Haskell]. I hope that my tutorial improves his original explanation of the Haskell I/O system and brings it closer to the point of view of beginning Haskell programmers. But if you need to learn about concurrency, exceptions and FFI in Haskell/GHC, the original paper is the best source of information.
 [2] You can find more information about concurrency, FFI and STM at the [[GHC/Concurrency#Starting points]] page.
@@ Line 1,470: / Line 1,484: @@
 [7] Using FFI in multithreaded programs is described in the paper [http://www.haskell.org/~simonmar/bib/concffi04_abstract.html Extending the Haskell Foreign Function Interface with Concurrency]
-[8] This particular behaviour is not a requirement of Haskell 2010, so the operation of 'seq' may differ between various Haskell implementations - if you're not sure, staying within the IO monad is the safest option.
+[8] This particular behaviour is not a requirement of Haskell 2010, so the operation of <code>seq</code> may differ between various Haskell implementations - if you're not sure, staying within the I/O monad is the safest option.
 [9] [http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.91.3579&rep=rep1&type=pdf How to Declare an Imperative] by Phil Wadler provides an explanation of how this can be done.
-[10] The RealWorld type can even be replaced e.g. <span style="color:darkred;">Functional I/O Using System Tokens</span> by Lennart Augustsson.
+[10] The <code>RealWorld</code> type can even be replaced - see e.g. <span style="color:darkred;">Functional I/O Using System Tokens</span> by Lennart Augustsson.
 Do you have more questions? Ask in the [http://www.haskell.org/mailman/listinfo/haskell-cafe haskell-cafe mailing list].
@@ Line 1,483: / Line 1,497: @@
 Topics:
-* fixIO and 'mdo'
+* <code>fixIO</code> and <code>mdo</code>
-* Q monad
+* <code>Q</code> monad
 Questions:
-* split '>>='/'>>'/return section and 'do' section, more examples of using binding operators
+* split <code>(>>=)</code>/<code>(>>)</code>/return section and <code>do</code> section, more examples of using binding operators
-* IORef detailed explanation (==const*), usage examples, syntax sugar, unboxed refs
+* <code>IORef</code> detailed explanation (==<code>const*</code>), usage examples, syntax sugar, unboxed refs
-* explanation of how the actual data "in" mutable references are inside 'RealWorld', rather than inside the references themselves ('IORef','IOArray',&c.)
+* explanation of how the actual data "in" mutable references are inside <code>RealWorld</code>, rather than inside the references themselves (<code>IORef</code>, <code>IOArray</code> & co.)
 * developing control structures - many more examples
-* unsafePerformIO usage examples: global variable, ByteString, other examples
+* <code>unsafePerformIO</code> usage examples: global variable, <code>ByteString</code>, other examples
-* how 'unsafeInterLeaveIO' can be seen as a kind of concurrency, and therefore isn't so unsafe (unlike 'unsafeInterleaveST' which really is unsafe)
+* how <code>unsafeInterleaveIO</code> can be seen as a kind of concurrency, and therefore isn't so unsafe (unlike <code>unsafeInterleaveST</code> which really is unsafe)
-* discussion about different senses of "safe"/"unsafe" (like breaking equational reasoning vs. invoking undefined behaviour (so can corrupt the run-time system))
+* discussion about different senses of <code>safe</code>/<code>unsafe</code> (like breaking equational reasoning vs. invoking undefined behaviour (so can corrupt the run-time system))
-* actual GHC implementation - how to write low-level routines on example of newIORef implementation
+* actual GHC implementation - how to write low-level routines, using the <code>newIORef</code> implementation as an example
-This manual is collective work, so feel free to add more information to it yourself. The final goal is to collectively develop a comprehensive manual for using the IO monad.
+This manual is a collective work, so feel free to add more information to it yourself. The final goal is to collectively develop a comprehensive manual for using the I/O monad.
 ----

Difference between revisions of "IO inside"

Revision as of 13:59, 10 December 2020

Haskell is a pure language

What is a monad?

Welcome to the RealWorld, baby

(>>=) and do notation

Mutable data (references, arrays, hash tables...)

I/O actions as values

Example: a list of I/O actions

Example: returning an I/O action as a result

Example: a memory allocator generator

Example: emulating OOP with record types

Exception handling (under development)

Interfacing with C/C++ and foreign libraries (under development)

Calling functions

All about the foreign statement

Marshalling simple types

Memory management

Marshalling strings

Marshalling composite types

Dynamic calls

DLLs

Dark side of I/O monad

unsafePerformIO

inlinePerformIO

unsafeInterleaveIO

A safer approach: the ST monad

Welcome to the machine: the actual GHC implementation

The Yhc/nhc98 implementation

Further reading

To-do list

Navigation menu

Search

Welcome to the `RealWorld`, baby

`(>>=)` and `do` notation

All about the `foreign` statement

`unsafePerformIO`

`inlinePerformIO`

`unsafeInterleaveIO`