scrapped stdinLn etc. Improved haddocks

author: michaelt <what_is_it_to_do_anything@yahoo.com> 2014-02-05 00:42:35 -0500
committer: michaelt <what_is_it_to_do_anything@yahoo.com> 2014-02-05 00:42:35 -0500
commit: 167f880504e05b19d3487c7ba701afa9633a2f41 (patch)
tree: 23eecc37d471915254d6ef6f3314e14b6bb2719f /Pipes
parent: 4da91c37355b3d688c9dfc6f92ae92266ad4e883 (diff)
download: text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.gz
text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.zst
text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.zip
1 files changed, 29 insertions, 74 deletions
diff --git a/Pipes/Text.hs b/Pipes/Text.hs
index 796f672..bbf200f 100644
--- a/Pipes/Text.hs
+++ b/Pipes/Text.hs
@@ -66,11 +66,9 @@ module Pipes.Text  (
    , stdin
    , fromHandle
    , readFile
-    , stdinLn
    -- * Consumers
    , stdout
-    , stdoutLn
    , toHandle
    , writeFile
@@ -275,27 +273,6 @@ readFile :: MonadSafe m => FilePath -> Producer Text m ()
 readFile file = Safe.withFile file IO.ReadMode fromHandle
 {-# INLINE readFile #-}
-{-| Crudely stream lines of input from stdin in the style of Pipes.Prelude. 
-    This is for testing in ghci etc.; obviously it will be unsound if used to recieve
-    the contents of immense files with few newlines.
->>> let safely = runSafeT . runEffect
->>> safely $ for Text.stdinLn (lift . lift . print . T.length)
-hello
-5
-world
-5
-}
-stdinLn :: MonadIO m => Producer' Text m ()
-stdinLn = go where
-    go = do
-        eof <- liftIO (IO.hIsEOF IO.stdin)
-        unless eof $ do
-            txt <- liftIO (T.hGetLine IO.stdin)
-            yield txt
-            go
-{-# INLINABLE stdinLn #-}
 {-| Stream text to 'stdout'
@@ -319,20 +296,6 @@ stdout = go
            Right () -> go
 {-# INLINABLE stdout #-}
-stdoutLn :: (MonadIO m) => Consumer' Text m ()
-stdoutLn = go
-  where
-    go = do
-        str <- await
-        x   <- liftIO $ try (T.putStrLn str)
-        case x of
-           Left (G.IOError { G.ioe_type  = G.ResourceVanished
-                           , G.ioe_errno = Just ioe })
-                | Errno ioe == ePIPE
-                    -> return ()
-           Left  e  -> liftIO (throwIO e)
-           Right () -> go
-{-# INLINABLE stdoutLn #-}
 {-| Convert a text stream into a 'Handle'
@@ -723,8 +686,9 @@ isEndOfChars = do
 {-# INLINABLE isEndOfChars #-}
-- | An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated
+{- | An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated
-- stream of Text ends by returning a stream of ByteStrings beginning at the point of failure.
+   stream of Text ends by returning a stream of ByteStrings beginning at the point of failure. 
+   -}
 decodeUtf8 :: Monad m => Lens' (Producer ByteString m r) 
                               (Producer Text m (Producer ByteString m r))
@@ -1010,7 +974,6 @@ lines = Data.Profunctor.dimap _lines (fmap _unlines)
 {-# INLINABLE lines #-}
 -- | Split a text stream into 'FreeT'-delimited words
 words
    :: (Monad m) => Iso' (Producer Text m r) (FreeT (Producer Text m) m r)
@@ -1090,6 +1053,16 @@ unwords = intercalate (yield $ T.singleton ' ')
    @Pipes.Parse@ re-exports 'input', 'concat', 'FreeT' (the type) and the 'Parse' synonym. 
 -}
+{- | Use a 'Codec' as a pipes-style 'Lens' into a byte stream; the available 'Codec' s are
+     'utf8', 'utf16_le', 'utf16_be', 'utf32_le', 'utf32_be' . The 'Codec' concept and the 
+     individual 'Codec' definitions follow the enumerator and conduit libraries. 
+     
+     Utf8 is handled differently in this library -- without the use of 'unsafePerformIO' &co 
+     to catch 'Text' exceptions; but the same 'mypipe ^. codec utf8' interface can be used.
+     'mypipe ^. decodeUtf8' should be the same, but has a somewhat more direct and thus perhaps
+     better implementation.  
+     -}
 codec :: Monad m => Codec -> Lens' (Producer ByteString m r) (Producer Text m (Producer ByteString m r))
 codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc))) 
                                     (k (decoder (dec B.empty) p0) ) where 
@@ -1104,9 +1077,13 @@ codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))
                                                                 return r)
                                            Right (chunk,p1) -> decoder (dec chunk) p1
-- decodeUtf8 k p0 = fmap (\p -> join  (for p (yield . TE.encodeUtf8))) 
+{- | ascii and latin encodings only represent a small fragment of 'Text'; thus we cannot
--                        (k (go B.empty PI.streamDecodeUtf8 p0)) where
+     use the pipes 'Lens' style to work with them. Rather we simply define functions 
+     each way. 
+     'encodeAscii' : Reduce as much of your stream of 'Text' actually is ascii to a byte stream,
+     returning the rest of the 'Text' at the first non-ascii 'Char'
+-}
 encodeAscii :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
 encodeAscii = go where
  go p = do echunk <- lift (next p)
@@ -1121,7 +1098,9 @@ encodeAscii = go where
                                then go p'
                                else return $ do yield unsafe 
                                                 p'
+{- | Reduce as much of your stream of 'Text' actually is iso8859 or latin1 to a byte stream,
+     returning the rest of the 'Text' upon hitting any non-latin 'Char'
+   -}
 encodeIso8859_1 :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
 encodeIso8859_1 = go where
  go p = do etxt <- lift (next p)
@@ -1137,6 +1116,9 @@ encodeIso8859_1 = go where
                                else return $ do yield unsafe 
                                                 p'
+{- | Reduce a byte stream to a corresponding stream of ascii chars, returning the
+     unused 'ByteString' upon hitting an un-ascii byte.
+   -}
 decodeAscii :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
 decodeAscii = go where
  go p = do echunk <- lift (next p)
@@ -1152,7 +1134,9 @@ decodeAscii = go where
                                else return $ do yield unsafe 
                                                 p'
+{- | Reduce a byte stream to a corresponding stream of ascii chars, returning the
+     unused 'ByteString' upon hitting the rare un-latinizable byte.
+     -}
 decodeIso8859_1 :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
 decodeIso8859_1 = go where
  go p = do echunk <- lift (next p)
@@ -1170,34 +1154,5 @@ decodeIso8859_1 = go where
-{-
-  ascii :: Codec
-  ascii = Codec name enc (toDecoding dec) where
-      name = T.pack "ASCII"
-      enc text = (bytes, extra) where
-          (safe, unsafe) = T.span (\c -> ord c <= 0x7F) text
-          bytes = B8.pack (T.unpack safe)
-          extra = if T.null unsafe
-              then Nothing
-              else Just (EncodeException ascii (T.head unsafe), unsafe)
-      dec bytes = (text, extra) where
-          (safe, unsafe) = B.span (<= 0x7F) bytes
-          text = T.pack (B8.unpack safe)
-          extra = if B.null unsafe
-              then Right B.empty
-              else Left (DecodeException ascii (B.head unsafe), unsafe)
-  iso8859_1 :: Codec
-  iso8859_1 = Codec name enc (toDecoding dec) where
-      name = T.pack "ISO-8859-1"
-      enc text = (bytes, extra) where
-          (safe, unsafe) = T.span (\c -> ord c <= 0xFF) text
-          bytes = B8.pack (T.unpack safe)
-          extra = if T.null unsafe
-              then Nothing
-              else Just (EncodeException iso8859_1 (T.head unsafe), unsafe)
-      dec bytes = (T.pack (B8.unpack bytes), Right B.empty)
-}
                                            
 \ No newline at end of file
author	michaelt <what_is_it_to_do_anything@yahoo.com>	2014-02-05 00:42:35 -0500
committer	michaelt <what_is_it_to_do_anything@yahoo.com>	2014-02-05 00:42:35 -0500
commit	167f880504e05b19d3487c7ba701afa9633a2f41 (patch)
tree	23eecc37d471915254d6ef6f3314e14b6bb2719f /Pipes
parent	4da91c37355b3d688c9dfc6f92ae92266ad4e883 (diff)
download	text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.gz text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.tar.zst text-pipes-167f880504e05b19d3487c7ba701afa9633a2f41.zip

diff --git a/Pipes/Text.hs b/Pipes/Text.hs index 796f672..bbf200f 100644 --- a/Pipes/Text.hs +++ b/Pipes/Text.hs
@@ -66,11 +66,9 @@ module Pipes.Text (
66	, stdin	66	, stdin
67	, fromHandle	67	, fromHandle
68	, readFile	68	, readFile
69	, stdinLn
70		69
71	-- * Consumers	70	-- * Consumers
72	, stdout	71	, stdout
73	, stdoutLn
74	, toHandle	72	, toHandle
75	, writeFile	73	, writeFile
76		74
@@ -275,27 +273,6 @@ readFile :: MonadSafe m => FilePath -> Producer Text m ()
275	readFile file = Safe.withFile file IO.ReadMode fromHandle	273	readFile file = Safe.withFile file IO.ReadMode fromHandle
276	{-# INLINE readFile #-}	274	{-# INLINE readFile #-}
277		275
278	{-\| Crudely stream lines of input from stdin in the style of Pipes.Prelude.
279	This is for testing in ghci etc.; obviously it will be unsound if used to recieve
280	the contents of immense files with few newlines.
281
282	>>> let safely = runSafeT . runEffect
283	>>> safely $ for Text.stdinLn (lift . lift . print . T.length)
284	hello
285	5
286	world
287	5
288
289	-}
290	stdinLn :: MonadIO m => Producer' Text m ()
291	stdinLn = go where
292	go = do
293	eof <- liftIO (IO.hIsEOF IO.stdin)
294	unless eof $ do
295	txt <- liftIO (T.hGetLine IO.stdin)
296	yield txt
297	go
298	{-# INLINABLE stdinLn #-}
299		276
300	{-\| Stream text to 'stdout'	277	{-\| Stream text to 'stdout'
301		278
@@ -319,20 +296,6 @@ stdout = go
319	Right () -> go	296	Right () -> go
320	{-# INLINABLE stdout #-}	297	{-# INLINABLE stdout #-}
321		298
322	stdoutLn :: (MonadIO m) => Consumer' Text m ()
323	stdoutLn = go
324	where
325	go = do
326	str <- await
327	x <- liftIO $ try (T.putStrLn str)
328	case x of
329	Left (G.IOError { G.ioe_type = G.ResourceVanished
330	, G.ioe_errno = Just ioe })
331	\| Errno ioe == ePIPE
332	-> return ()
333	Left e -> liftIO (throwIO e)
334	Right () -> go
335	{-# INLINABLE stdoutLn #-}
336		299
337	{-\| Convert a text stream into a 'Handle'	300	{-\| Convert a text stream into a 'Handle'
338		301
@@ -723,8 +686,9 @@ isEndOfChars = do
723	{-# INLINABLE isEndOfChars #-}	686	{-# INLINABLE isEndOfChars #-}
724		687
725		688
726	-- \| An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated	689	{- \| An improper lens into a stream of 'ByteString' expected to be UTF-8 encoded; the associated
727	-- stream of Text ends by returning a stream of ByteStrings beginning at the point of failure.	690	stream of Text ends by returning a stream of ByteStrings beginning at the point of failure.
		691	-}
728		692
729	decodeUtf8 :: Monad m => Lens' (Producer ByteString m r)	693	decodeUtf8 :: Monad m => Lens' (Producer ByteString m r)
730	(Producer Text m (Producer ByteString m r))	694	(Producer Text m (Producer ByteString m r))
@@ -1010,7 +974,6 @@ lines = Data.Profunctor.dimap _lines (fmap _unlines)
1010	{-# INLINABLE lines #-}	974	{-# INLINABLE lines #-}
1011		975
1012		976
1013
1014	-- \| Split a text stream into 'FreeT'-delimited words	977	-- \| Split a text stream into 'FreeT'-delimited words
1015	words	978	words
1016	:: (Monad m) => Iso' (Producer Text m r) (FreeT (Producer Text m) m r)	979	:: (Monad m) => Iso' (Producer Text m r) (FreeT (Producer Text m) m r)
@@ -1090,6 +1053,16 @@ unwords = intercalate (yield $ T.singleton ' ')
1090	@Pipes.Parse@ re-exports 'input', 'concat', 'FreeT' (the type) and the 'Parse' synonym.	1053	@Pipes.Parse@ re-exports 'input', 'concat', 'FreeT' (the type) and the 'Parse' synonym.
1091	-}	1054	-}
1092		1055
		1056	{- \| Use a 'Codec' as a pipes-style 'Lens' into a byte stream; the available 'Codec' s are
		1057	'utf8', 'utf16_le', 'utf16_be', 'utf32_le', 'utf32_be' . The 'Codec' concept and the
		1058	individual 'Codec' definitions follow the enumerator and conduit libraries.
		1059
		1060	Utf8 is handled differently in this library -- without the use of 'unsafePerformIO' &co
		1061	to catch 'Text' exceptions; but the same 'mypipe ^. codec utf8' interface can be used.
		1062	'mypipe ^. decodeUtf8' should be the same, but has a somewhat more direct and thus perhaps
		1063	better implementation.
		1064
		1065	-}
1093	codec :: Monad m => Codec -> Lens' (Producer ByteString m r) (Producer Text m (Producer ByteString m r))	1066	codec :: Monad m => Codec -> Lens' (Producer ByteString m r) (Producer Text m (Producer ByteString m r))
1094	codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))	1067	codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))
1095	(k (decoder (dec B.empty) p0) ) where	1068	(k (decoder (dec B.empty) p0) ) where
@@ -1104,9 +1077,13 @@ codec (Codec _ enc dec) k p0 = fmap (\p -> join (for p (yield . fst . enc)))
1104	return r)	1077	return r)
1105	Right (chunk,p1) -> decoder (dec chunk) p1	1078	Right (chunk,p1) -> decoder (dec chunk) p1
1106		1079
1107	-- decodeUtf8 k p0 = fmap (\p -> join (for p (yield . TE.encodeUtf8)))	1080	{- \| ascii and latin encodings only represent a small fragment of 'Text'; thus we cannot
1108	-- (k (go B.empty PI.streamDecodeUtf8 p0)) where	1081	use the pipes 'Lens' style to work with them. Rather we simply define functions
		1082	each way.
1109		1083
		1084	'encodeAscii' : Reduce as much of your stream of 'Text' actually is ascii to a byte stream,
		1085	returning the rest of the 'Text' at the first non-ascii 'Char'
		1086	-}
1110	encodeAscii :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)	1087	encodeAscii :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
1111	encodeAscii = go where	1088	encodeAscii = go where
1112	go p = do echunk <- lift (next p)	1089	go p = do echunk <- lift (next p)
@@ -1121,7 +1098,9 @@ encodeAscii = go where
1121	then go p'	1098	then go p'
1122	else return $ do yield unsafe	1099	else return $ do yield unsafe
1123	p'	1100	p'
1124		1101	{- \| Reduce as much of your stream of 'Text' actually is iso8859 or latin1 to a byte stream,
		1102	returning the rest of the 'Text' upon hitting any non-latin 'Char'
		1103	-}
1125	encodeIso8859_1 :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)	1104	encodeIso8859_1 :: Monad m => Producer Text m r -> Producer ByteString m (Producer Text m r)
1126	encodeIso8859_1 = go where	1105	encodeIso8859_1 = go where
1127	go p = do etxt <- lift (next p)	1106	go p = do etxt <- lift (next p)
@@ -1137,6 +1116,9 @@ encodeIso8859_1 = go where
1137	else return $ do yield unsafe	1116	else return $ do yield unsafe
1138	p'	1117	p'
1139		1118
		1119	{- \| Reduce a byte stream to a corresponding stream of ascii chars, returning the
		1120	unused 'ByteString' upon hitting an un-ascii byte.
		1121	-}
1140	decodeAscii :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)	1122	decodeAscii :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
1141	decodeAscii = go where	1123	decodeAscii = go where
1142	go p = do echunk <- lift (next p)	1124	go p = do echunk <- lift (next p)
@@ -1152,7 +1134,9 @@ decodeAscii = go where
1152	else return $ do yield unsafe	1134	else return $ do yield unsafe
1153	p'	1135	p'
1154		1136
1155		1137	{- \| Reduce a byte stream to a corresponding stream of ascii chars, returning the
		1138	unused 'ByteString' upon hitting the rare un-latinizable byte.
		1139	-}
1156	decodeIso8859_1 :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)	1140	decodeIso8859_1 :: Monad m => Producer ByteString m r -> Producer Text m (Producer ByteString m r)
1157	decodeIso8859_1 = go where	1141	decodeIso8859_1 = go where
1158	go p = do echunk <- lift (next p)	1142	go p = do echunk <- lift (next p)
@@ -1170,34 +1154,5 @@ decodeIso8859_1 = go where
1170		1154
1171		1155
1172		1156
1173	{-	1157
1174	ascii :: Codec
1175	ascii = Codec name enc (toDecoding dec) where
1176	name = T.pack "ASCII"
1177	enc text = (bytes, extra) where
1178	(safe, unsafe) = T.span (\c -> ord c <= 0x7F) text
1179	bytes = B8.pack (T.unpack safe)
1180	extra = if T.null unsafe
1181	then Nothing
1182	else Just (EncodeException ascii (T.head unsafe), unsafe)
1183
1184	dec bytes = (text, extra) where
1185	(safe, unsafe) = B.span (<= 0x7F) bytes
1186	text = T.pack (B8.unpack safe)
1187	extra = if B.null unsafe
1188	then Right B.empty
1189	else Left (DecodeException ascii (B.head unsafe), unsafe)
1190
1191	iso8859_1 :: Codec
1192	iso8859_1 = Codec name enc (toDecoding dec) where
1193	name = T.pack "ISO-8859-1"
1194	enc text = (bytes, extra) where
1195	(safe, unsafe) = T.span (\c -> ord c <= 0xFF) text
1196	bytes = B8.pack (T.unpack safe)
1197	extra = if T.null unsafe
1198	then Nothing
1199	else Just (EncodeException iso8859_1 (T.head unsafe), unsafe)
1200
1201	dec bytes = (T.pack (B8.unpack bytes), Right B.empty)
1202	-}
1203	\ No newline at end of file	1158	\ No newline at end of file