aboutsummaryrefslogtreecommitdiffhomepage
diff options
context:
space:
mode:
authormichaelt <what_is_it_to_do_anything@yahoo.com>2014-02-05 00:42:35 -0500
committermichaelt <what_is_it_to_do_anything@yahoo.com>2014-02-05 00:42:35 -0500
commit167f880504e05b19d3487c7ba701afa9633a2f41 (patch)
tree23eecc37d471915254d6ef6f3314e14b6bb2719f
parent4da91c37355b3d688c9dfc6f92ae92266ad4e883 (diff)
downloadtext-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.gz
text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.zst
text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.zip
scrapped stdinLn etc. Improved haddocks
-rw-r--r--Pipes/Text.hs103
1 files changed, 29 insertions, 74 deletions
diff --git a/Pipes/Text.hs b/Pipes/Text.hs
index 796f672..bbf200f 100644
--- a/Pipes/Text.hs
+++ b/Pipes/Text.hs
@@ -66,11 +66,9 @@ module Pipes.Text (
66 , stdin 66 , stdin
67 , fromHandle 67 , fromHandle
68 , readFile 68 , readFile
69 , stdinLn
70 69
71 -- * Consumers 70 -- * Consumers
72 , stdout 71 , stdout
73 , stdoutLn
74 , toHandle 72 , toHandle
75 , writeFile 73 , writeFile
76 74
@@ -275,27 +273,6 @@ readFile :: MonadSafe m => FilePath -> Producer Text m ()
275readFile file = Safe.withFile file IO.ReadMode fromHandle 273readFile file = Safe.withFile file IO.ReadMode fromHandle
276{-# INLINE readFile #-} 274{-# INLINE readFile #-}
277 275
278{-| Crudely stream lines of input from stdin in the style of Pipes.Prelude.
279 This is for testing in ghci etc.; obviously it will be unsound if used to recieve
280 the contents of immense files with few newlines.
281
282>>> let safely = runSafeT . runEffect
283>>> safely $ for Text.stdinLn (lift . lift . print . T.length)
284hello
2855
286world
2875
288
289-}
290stdinLn :: MonadIO m => Producer' Text m ()
291stdinLn = go where
292 go = do
293 eof <- liftIO (IO.hIsEOF IO.stdin)
294 unless eof $ do
295 txt <- liftIO (T.hGetLine IO.stdin)
296 yield txt
297 go
298{-# INLINABLE stdinLn #-}
299 276
300{-| Stream text to 'stdout' 277{-| Stream text to 'stdout'
301 278
@@ -319,20 +296,6 @@ stdout = go
319 Right () -> go 296 Right () -> go
320{-# INLINABLE stdout #-} 297{-# INLINABLE stdout #-}
321 298
322stdoutLn :: (MonadIO m) => Consumer' Text m ()
323stdoutLn = go
324 where
325 go = do
326 str <- await
327 x <- liftIO $ try (T.putStrLn str)
328 case x of
329 Left (G.IOError { G.ioe_type = G.ResourceVanished
330 , G.ioe_errno = Just ioe })
331 | Errno ioe == ePIPE
332 -> return ()
333 Left e -> liftIO (throwIO e)
334 Right () -> go
335{-# INLINABLE stdoutLn #-}
336 299
337{-| Convert a text stream into a 'Handle' 300{-| Convert a text stream into a 'Handle'
338 301
@@ -723,8 +686,9 @@ isEndOfChars = do
723{-# INLINABLE isEndOfChars #-} 686{-# INLINABLE isEndOfChars #-}
724 687
725 688
726-- | An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated 689{- | An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated
727-- stream of Text ends by returning a stream of ByteStrings beginning at the point of failure. 690 stream of Text ends by returning a stream of ByteStrings beginning at the point of failure.
691 -}
728 692
729decodeUtf8 :: Monad m => Lens' (Producer ByteString m r) 693decodeUtf8 :: Monad m => Lens' (Producer ByteString m r)
730 (Producer Text m (Producer ByteString m r)) 694 (Producer Text m (Producer ByteString m r))
@@ -1010,7 +974,6 @@ lines = Data.Profunctor.dimap _lines (fmap _unlines)
1010{-# INLINABLE lines #-} 974{-# INLINABLE lines #-}
1011 975
1012 976
1013
1014-- | Split a text stream into 'FreeT'-delimited words 977-- | Split a text stream into 'FreeT'-delimited words
1015words 978words
1016 :: (Monad m) => Iso' (Producer Text m r) (FreeT (Producer Text m) m r) 979 :: (Monad m) => Iso' (Producer Text m r) (FreeT (Producer Text m) m r)
@@ -1090,6 +1053,16 @@ unwords = intercalate (yield $ T.singleton ' ')
1090 @Pipes.Parse@ re-exports 'input', 'concat', 'FreeT' (the type) and the 'Parse' synonym. 1053 @Pipes.Parse@ re-exports 'input', 'concat', 'FreeT' (the type) and the 'Parse' synonym.
1091-} 1054-}
1092 1055
1056{- | Use a 'Codec' as a pipes-style 'Lens' into a byte stream; the available 'Codec' s are
1057 'utf8', 'utf16_le', 'utf16_be', 'utf32_le', 'utf32_be' . The 'Codec' concept and the
1058 individual 'Codec' definitions follow the enumerator and conduit libraries.
1059
1060 Utf8 is handled differently in this library -- without the use of 'unsafePerformIO' &co
1061 to catch 'Text' exceptions; but the same 'mypipe ^. codec utf8' interface can be used.
1062 'mypipe ^. decodeUtf8' should be the same, but has a somewhat more direct and thus perhaps
1063 better implementation.
1064
1065 -}
1093codec :: Monad m => Codec -> Lens' (Producer ByteString m r) (Producer Text m (Producer ByteString m r)) 1066codec :: Monad m => Codec -> Lens' (Producer ByteString m r) (Producer Text m (Producer ByteString m r))
1094codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc))) 1067codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))
1095 (k (decoder (dec B.empty) p0) ) where 1068 (k (decoder (dec B.empty) p0) ) where
@@ -1104,9 +1077,13 @@ codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))
1104 return r) 1077 return r)
1105 Right (chunk,p1) -> decoder (dec chunk) p1 1078 Right (chunk,p1) -> decoder (dec chunk) p1
1106 1079
1107-- decodeUtf8 k p0 = fmap (\p -> join (for p (yield . TE.encodeUtf8))) 1080{- | ascii and latin encodings only represent a small fragment of 'Text'; thus we cannot
1108-- (k (go B.empty PI.streamDecodeUtf8 p0)) where 1081 use the pipes 'Lens' style to work with them. Rather we simply define functions
1082 each way.
1109 1083
1084 'encodeAscii' : Reduce as much of your stream of 'Text' actually is ascii to a byte stream,
1085 returning the rest of the 'Text' at the first non-ascii 'Char'
1086-}
1110encodeAscii :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r) 1087encodeAscii :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
1111encodeAscii = go where 1088encodeAscii = go where
1112 go p = do echunk <- lift (next p) 1089 go p = do echunk <- lift (next p)
@@ -1121,7 +1098,9 @@ encodeAscii = go where
1121 then go p' 1098 then go p'
1122 else return $ do yield unsafe 1099 else return $ do yield unsafe
1123 p' 1100 p'
1124 1101{- | Reduce as much of your stream of 'Text' actually is iso8859 or latin1 to a byte stream,
1102 returning the rest of the 'Text' upon hitting any non-latin 'Char'
1103 -}
1125encodeIso8859_1 :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r) 1104encodeIso8859_1 :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
1126encodeIso8859_1 = go where 1105encodeIso8859_1 = go where
1127 go p = do etxt <- lift (next p) 1106 go p = do etxt <- lift (next p)
@@ -1137,6 +1116,9 @@ encodeIso8859_1 = go where
1137 else return $ do yield unsafe 1116 else return $ do yield unsafe
1138 p' 1117 p'
1139 1118
1119{- | Reduce a byte stream to a corresponding stream of ascii chars, returning the
1120 unused 'ByteString' upon hitting an un-ascii byte.
1121 -}
1140decodeAscii :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r) 1122decodeAscii :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
1141decodeAscii = go where 1123decodeAscii = go where
1142 go p = do echunk <- lift (next p) 1124 go p = do echunk <- lift (next p)
@@ -1152,7 +1134,9 @@ decodeAscii = go where
1152 else return $ do yield unsafe 1134 else return $ do yield unsafe
1153 p' 1135 p'
1154 1136
1155 1137{- | Reduce a byte stream to a corresponding stream of ascii chars, returning the
1138 unused 'ByteString' upon hitting the rare un-latinizable byte.
1139 -}
1156decodeIso8859_1 :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r) 1140decodeIso8859_1 :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
1157decodeIso8859_1 = go where 1141decodeIso8859_1 = go where
1158 go p = do echunk <- lift (next p) 1142 go p = do echunk <- lift (next p)
@@ -1170,34 +1154,5 @@ decodeIso8859_1 = go where
1170 1154
1171 1155
1172 1156
1173{- 1157
1174 ascii :: Codec
1175 ascii = Codec name enc (toDecoding dec) where
1176 name = T.pack "ASCII"
1177 enc text = (bytes, extra) where
1178 (safe, unsafe) = T.span (\c -> ord c <= 0x7F) text
1179 bytes = B8.pack (T.unpack safe)
1180 extra = if T.null unsafe
1181 then Nothing
1182 else Just (EncodeException ascii (T.head unsafe), unsafe)
1183
1184 dec bytes = (text, extra) where
1185 (safe, unsafe) = B.span (<= 0x7F) bytes
1186 text = T.pack (B8.unpack safe)
1187 extra = if B.null unsafe
1188 then Right B.empty
1189 else Left (DecodeException ascii (B.head unsafe), unsafe)
1190
1191 iso8859_1 :: Codec
1192 iso8859_1 = Codec name enc (toDecoding dec) where
1193 name = T.pack "ISO-8859-1"
1194 enc text = (bytes, extra) where
1195 (safe, unsafe) = T.span (\c -> ord c <= 0xFF) text
1196 bytes = B8.pack (T.unpack safe)
1197 extra = if T.null unsafe
1198 then Nothing
1199 else Just (EncodeException iso8859_1 (T.head unsafe), unsafe)
1200
1201 dec bytes = (T.pack (B8.unpack bytes), Right B.empty)
1202-}
1203 \ No newline at end of file 1158 \ No newline at end of file