Skip to content

Commit

Permalink
Fix RAM usage upon big dump-hi files parsing
Browse files Browse the repository at this point in the history
See #4027
  • Loading branch information
k-bx committed Jun 6, 2018
1 parent 8ba673f commit a93e630
Show file tree
Hide file tree
Showing 2 changed files with 32 additions and 13 deletions.
2 changes: 2 additions & 0 deletions ChangeLog.md
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,8 @@ Bug fixes:
was tried to be registered. This is now fixed by always building internal
libraries. See
[#3996](https://github.com/commercialhaskell/stack/issues/3996).
* Fix a regression which might use a lot of RAM. See
[#4027](https://github.com/commercialhaskell/stack/issues/4027).


## v1.7.1
Expand Down
43 changes: 30 additions & 13 deletions src/Stack/Package.hs
Original file line number Diff line number Diff line change
Expand Up @@ -40,13 +40,14 @@ module Stack.Package
where

import qualified Data.ByteString as BS
import qualified Data.ByteString.Char8 as C8
import qualified Data.ByteString.Lazy.Char8 as CL8
import Data.List (isSuffixOf, isPrefixOf)
import Data.Maybe (maybe)
import qualified Data.Map.Strict as M
import qualified Data.Set as S
import qualified Data.Text as T
import Data.Text.Encoding (decodeUtf8)
import qualified Data.Text.Lazy as TL
import qualified Data.Text.Lazy.Encoding as TLE
import Distribution.Compiler
import Distribution.ModuleName (ModuleName)
import qualified Distribution.ModuleName as Cabal
Expand Down Expand Up @@ -1213,24 +1214,24 @@ parseDumpHI
:: FilePath -> RIO Ctx (Set ModuleName, [Path Abs File])
parseDumpHI dumpHIPath = do
dir <- asks (parent . ctxFile)
dumpHI <- liftIO $ fmap C8.lines (C8.readFile dumpHIPath)
dumpHI <- liftIO $ filterDumpHi <$> fmap CL8.lines (CL8.readFile dumpHIPath)
let startModuleDeps =
dropWhile (not . ("module dependencies:" `C8.isPrefixOf`)) dumpHI
dropWhile (not . ("module dependencies:" `CL8.isPrefixOf`)) dumpHI
moduleDeps =
S.fromList $
mapMaybe (D.simpleParse . T.unpack . decodeUtf8) $
C8.words $
C8.concat $
C8.dropWhile (/= ' ') (fromMaybe "" $ listToMaybe startModuleDeps) :
takeWhile (" " `C8.isPrefixOf`) (drop 1 startModuleDeps)
mapMaybe (D.simpleParse . TL.unpack . TLE.decodeUtf8) $
CL8.words $
CL8.concat $
CL8.dropWhile (/= ' ') (fromMaybe "" $ listToMaybe startModuleDeps) :
takeWhile (" " `CL8.isPrefixOf`) (drop 1 startModuleDeps)
thDeps =
-- The dependent file path is surrounded by quotes but is not escaped.
-- It can be an absolute or relative path.
mapMaybe
(fmap T.unpack .
(T.stripSuffix "\"" <=< T.stripPrefix "\"") .
T.dropWhileEnd (== '\r') . decodeUtf8 . C8.dropWhile (/= '"')) $
filter ("addDependentFile \"" `C8.isPrefixOf`) dumpHI
(fmap TL.unpack .
(TL.stripSuffix "\"" <=< TL.stripPrefix "\"") .
TL.dropWhileEnd (== '\r') . TLE.decodeUtf8 . CL8.dropWhile (/= '"')) $
filter ("addDependentFile \"" `CL8.isPrefixOf`) dumpHI
thDepsResolved <- liftM catMaybes $ forM thDeps $ \x -> do
mresolved <- liftIO (forgivingAbsence (resolveFile dir x)) >>= rejectMissingFile
when (isNothing mresolved) $
Expand All @@ -1242,6 +1243,22 @@ parseDumpHI dumpHIPath = do
]
return mresolved
return (moduleDeps, thDepsResolved)
where
-- | Filtering step fixing RAM usage upon a big dump-hi file. See
-- https://github.com/commercialhaskell/stack/issues/4027 It is
-- an optional step from a functionality stand-point.
filterDumpHi dumpHI =
let dl x xs = x ++ xs
isLineInteresting (acc, moduleDepsStarted) l
| moduleDepsStarted && " " `CL8.isPrefixOf` l =
(acc . dl [l], True)
| "module dependencies:" `CL8.isPrefixOf` l =
(acc . dl [l], True)
| "addDependentFile \"" `CL8.isPrefixOf` l =
(acc . dl [l], False)
| otherwise = (acc, False)
in fst (foldl' isLineInteresting (dl [], False) dumpHI) []


-- | Try to resolve the list of base names in the given directory by
-- looking for unique instances of base names applied with the given
Expand Down

0 comments on commit a93e630

Please sign in to comment.