From d3c20b21c97b88b5ab49ce07d18778c1ef563b62 Mon Sep 17 00:00:00 2001 From: Li-yao Xia Date: Thu, 14 Mar 2024 01:32:39 +0100 Subject: [PATCH] Improve lazy performance of `Data.Text.Lazy.inits` MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The previous implementation, itself based on an earlier version of `Data.List.inits`, inherited the flaw that accessing the i-th element took quadratic time O(i²). This now takes linear time O(i) as expected. The current version of `Data.List.inits` uses a banker's queue to obtain good performance when generating very long lists. For lazy text, consisting of a few big chunks, that benefit seems negligible. So I chose a simpler implementation. --- benchmarks/haskell/Benchmarks.hs | 2 ++ benchmarks/haskell/Benchmarks/Micro.hs | 22 ++++++++++++++++++++++ src/Data/Text/Lazy.hs | 16 ++++++++++++---- text.cabal | 1 + 4 files changed, 37 insertions(+), 4 deletions(-) create mode 100644 benchmarks/haskell/Benchmarks/Micro.hs diff --git a/benchmarks/haskell/Benchmarks.hs b/benchmarks/haskell/Benchmarks.hs index 7b3aa17c6..33e6a0259 100644 --- a/benchmarks/haskell/Benchmarks.hs +++ b/benchmarks/haskell/Benchmarks.hs @@ -20,6 +20,7 @@ import qualified Benchmarks.EncodeUtf8 as EncodeUtf8 import qualified Benchmarks.Equality as Equality import qualified Benchmarks.FileRead as FileRead import qualified Benchmarks.FoldLines as FoldLines +import qualified Benchmarks.Micro as Micro import qualified Benchmarks.Multilang as Multilang import qualified Benchmarks.Pure as Pure import qualified Benchmarks.ReadNumbers as ReadNumbers @@ -61,6 +62,7 @@ main = do defaultMain [ Builder.benchmark , Concat.benchmark + , Micro.benchmark , bgroup "DecodeUtf8" [ env (DecodeUtf8.initEnv (tf "libya-chinese.html")) (DecodeUtf8.benchmark "html") , env (DecodeUtf8.initEnv (tf "yiwiki.xml")) (DecodeUtf8.benchmark "xml") diff --git a/benchmarks/haskell/Benchmarks/Micro.hs b/benchmarks/haskell/Benchmarks/Micro.hs new file mode 100644 index 000000000..5462393a5 --- /dev/null +++ b/benchmarks/haskell/Benchmarks/Micro.hs @@ -0,0 +1,22 @@ +-- | Benchmarks on artificial data. + +module Benchmarks.Micro (benchmark) where + +import qualified Data.Text.Lazy as TL +import qualified Data.Text as T +import Test.Tasty.Bench (Benchmark, bgroup, bench, nf) + +benchmark :: Benchmark +benchmark = bgroup "Micro" + [ -- Accessing i-th element should take O(i) time. + -- The 2k case should run in 2x the time of the 1k case. + bgroup "Lazy.inits" + [ bench "last 1k" $ nf (last . TL.inits) (chunks 1000) + , bench "last 2k" $ nf (last . TL.inits) (chunks 2000) + , bench "map-take1 1k" $ nf (map (TL.take 1) . TL.inits) (chunks 1000) + , bench "map-take1 2k" $ nf (map (TL.take 1) . TL.inits) (chunks 2000) + ] + ] + +chunks :: Int -> TL.Text +chunks n = TL.fromChunks (replicate n (T.pack "a")) diff --git a/src/Data/Text/Lazy.hs b/src/Data/Text/Lazy.hs index 41e6885da..b93c37f99 100644 --- a/src/Data/Text/Lazy.hs +++ b/src/Data/Text/Lazy.hs @@ -1443,10 +1443,18 @@ inits = (NE.toList P.$!) . initsNE -- -- @since 2.1.2 initsNE :: Text -> NonEmpty Text -initsNE = (Empty NE.:|) . inits' - where inits' Empty = [] - inits' (Chunk t ts) = L.map (\t' -> Chunk t' Empty) (NE.tail (T.initsNE t)) - ++ L.map (Chunk t) (inits' ts) +initsNE ts0 = Empty NE.:| inits' 0 ts0 + where + inits' :: Int64 -- Number of previous chunks i + -> Text -- The remainder after dropping i chunks from ts0 + -> [Text] -- Prefixes longer than the first i chunks of ts0. + inits' _ Empty = [] + inits' i (Chunk t ts) = L.map (takeChunks i ts0) (NE.tail (T.initsNE t)) + ++ inits' (i + 1) ts + +takeChunks :: Int64 -> Text -> T.Text -> Text +takeChunks !i (Chunk t ts) lastChunk | i > 0 = Chunk t (takeChunks (i - 1) ts lastChunk) +takeChunks _ _ lastChunk = Chunk lastChunk Empty -- | /O(n)/ Return all final segments of the given 'Text', longest -- first. diff --git a/text.cabal b/text.cabal index af868d222..9b10c97c2 100644 --- a/text.cabal +++ b/text.cabal @@ -333,6 +333,7 @@ benchmark text-benchmarks Benchmarks.Equality Benchmarks.FileRead Benchmarks.FoldLines + Benchmarks.Micro Benchmarks.Multilang Benchmarks.Programs.BigTable Benchmarks.Programs.Cut