From be3637354df8185ba56930ed556ae5104f056b9f Mon Sep 17 00:00:00 2001 From: Simon Hengel Date: Tue, 14 Aug 2018 10:02:33 +0800 Subject: [PATCH 1/4] Add support for detecting duplicate keys (see #142) --- ChangeLog.md | 4 ++ package.yaml | 2 + src/Data/Yaml.hs | 19 ++++++--- src/Data/Yaml/Include.hs | 20 ++++++++-- src/Data/Yaml/Internal.hs | 74 ++++++++++++++++++++++------------- test/Data/Yaml/IncludeSpec.hs | 66 +++++++++++++++++++++++++++++++ 6 files changed, 149 insertions(+), 36 deletions(-) diff --git a/ChangeLog.md b/ChangeLog.md index 602df50..b4347da 100644 --- a/ChangeLog.md +++ b/ChangeLog.md @@ -1,5 +1,9 @@ # ChangeLog for yaml +## next + +* Add `decodeFileWithWarnings` which returns warnings for duplicate fields + ## 0.9.0 * Expose style and tags on mappings and sequences in Text.Libyaml [#141](https://github.com/snoyberg/yaml/pull/141) diff --git a/package.yaml b/package.yaml index 4a15f68..8d0e9ac 100644 --- a/package.yaml +++ b/package.yaml @@ -49,6 +49,7 @@ dependencies: - base >=4.9.1 && <5 # GHC 8.0.2 and later - bytestring >=0.9.1.4 - transformers >=0.1 +- mtl - conduit >=1.2.8 && <1.4 - resourcet >=0.3 && <1.3 - aeson >=0.11 @@ -133,3 +134,4 @@ tests: - mockery - base-compat - temporary + - raw-strings-qq diff --git a/src/Data/Yaml.hs b/src/Data/Yaml.hs index 076f1ad..497b403 100644 --- a/src/Data/Yaml.hs +++ b/src/Data/Yaml.hs @@ -32,6 +32,7 @@ module Data.Yaml -- * Decoding , decodeEither' , decodeFileEither + , decodeFileWithWarnings , decodeThrow , decodeFileThrow -- ** More control over decoding @@ -163,14 +164,14 @@ decode :: FromJSON a => ByteString -> Maybe a decode bs = unsafePerformIO - $ either (const Nothing) id + $ either (const Nothing) snd <$> decodeHelper_ (Y.decode bs) {-# DEPRECATED decode "Please use decodeEither or decodeThrow, which provide information on how the decode failed" #-} decodeFile :: FromJSON a => FilePath -> IO (Maybe a) -decodeFile fp = decodeHelper (Y.decodeFile fp) >>= either throwIO (return . either (const Nothing) id) +decodeFile fp = (fmap snd <$> decodeHelper (Y.decodeFile fp)) >>= either throwIO (return . either (const Nothing) id) {-# DEPRECATED decodeFile "Please use decodeFileEither, which does not confused type-directed and runtime exceptions." #-} -- | A version of 'decodeFile' which should not throw runtime exceptions. @@ -180,12 +181,20 @@ decodeFileEither :: FromJSON a => FilePath -> IO (Either ParseException a) -decodeFileEither = decodeHelper_ . Y.decodeFile +decodeFileEither = fmap (fmap snd) . decodeFileWithWarnings + +-- | +-- @since 0.10.0 +decodeFileWithWarnings + :: FromJSON a + => FilePath + -> IO (Either ParseException ([Warning], a)) +decodeFileWithWarnings = decodeHelper_ . Y.decodeFile decodeEither :: FromJSON a => ByteString -> Either String a decodeEither bs = unsafePerformIO $ either (Left . prettyPrintParseException) id - <$> decodeHelper (Y.decode bs) + <$> (fmap snd <$> decodeHelper (Y.decode bs)) {-# DEPRECATED decodeEither "Please use decodeEither' or decodeThrow, which provide more useful failures" #-} -- | More helpful version of 'decodeEither' which returns the 'YamlException'. @@ -194,7 +203,7 @@ decodeEither bs = unsafePerformIO decodeEither' :: FromJSON a => ByteString -> Either ParseException a decodeEither' = either Left (either (Left . AesonException) Right) . unsafePerformIO - . decodeHelper + . fmap (fmap snd) . decodeHelper . Y.decode -- | A version of 'decodeEither'' lifted to MonadThrow diff --git a/src/Data/Yaml/Include.hs b/src/Data/Yaml/Include.hs index 6dd7a41..494dbac 100644 --- a/src/Data/Yaml/Include.hs +++ b/src/Data/Yaml/Include.hs @@ -1,6 +1,10 @@ {-# LANGUAGE CPP #-} {-# LANGUAGE RankNTypes #-} -module Data.Yaml.Include (decodeFile, decodeFileEither) where +module Data.Yaml.Include ( + decodeFile +, decodeFileEither +, decodeFileWithWarnings +) where #if !MIN_VERSION_directory(1, 2, 3) import Control.Exception (handleJust) @@ -20,7 +24,7 @@ import Data.Text.Encoding (decodeUtf8) import System.Directory import System.FilePath -import Data.Yaml.Internal (ParseException(..), decodeHelper_, decodeHelper) +import Data.Yaml.Internal (ParseException(..), Warning(..), decodeHelper_, decodeHelper) import Text.Libyaml hiding (decodeFile) import qualified Text.Libyaml as Y @@ -65,7 +69,7 @@ decodeFile :: FromJSON a => FilePath -> IO (Maybe a) -decodeFile fp = decodeHelper (eventsFromFile fp) >>= either throwIO (return . either (const Nothing) id) +decodeFile fp = (fmap snd <$> decodeHelper (eventsFromFile fp)) >>= either throwIO (return . either (const Nothing) id) -- | Like `Data.Yaml.decodeFileEither` but with support for relative and -- absolute includes. @@ -77,4 +81,12 @@ decodeFileEither :: FromJSON a => FilePath -> IO (Either ParseException a) -decodeFileEither = decodeHelper_ . eventsFromFile +decodeFileEither = fmap (fmap snd) . decodeFileWithWarnings + +-- | +-- @since 0.10.0 +decodeFileWithWarnings + :: FromJSON a + => FilePath + -> IO (Either ParseException ([Warning], a)) +decodeFileWithWarnings = decodeHelper_ . eventsFromFile diff --git a/src/Data/Yaml/Internal.hs b/src/Data/Yaml/Internal.hs index 7df2bfe..ffcfb62 100644 --- a/src/Data/Yaml/Internal.hs +++ b/src/Data/Yaml/Internal.hs @@ -6,6 +6,7 @@ module Data.Yaml.Internal ( ParseException(..) , prettyPrintParseException + , Warning(..) , parse , decodeHelper , decodeHelper_ @@ -19,23 +20,27 @@ import Control.Applicative ((<$>), Applicative(..)) #endif import Control.Applicative ((<|>)) import Control.Exception -import Control.Monad (liftM, ap, unless) +import Control.Monad (liftM, ap, when, unless) import Control.Monad.IO.Class (MonadIO, liftIO) import Control.Monad.Trans.Class (MonadTrans, lift) import Control.Monad.Trans.Resource (ResourceT, runResourceT) -import Control.Monad.Trans.State +import Control.Monad.RWS import Data.Aeson +import Data.Aeson.Internal (JSONPath, JSONPathElement(..)) import Data.Aeson.Types hiding (parse) import qualified Data.Attoparsec.Text as Atto import Data.Bits (shiftL, (.|.)) import Data.ByteString (ByteString) import Data.Char (toUpper, ord) +import Data.List import Data.Conduit ((.|), ConduitM, runConduit) import qualified Data.Conduit.List as CL import qualified Data.HashMap.Strict as M import qualified Data.HashSet as HashSet import Data.Map (Map) import qualified Data.Map as Map +import Data.Set (Set) +import qualified Data.Set as Set import Data.Scientific (Scientific) import Data.Text (Text, pack) import qualified Data.Text as T @@ -125,15 +130,21 @@ instance Monad m => Monad (PErrorT m) where instance MonadTrans PErrorT where lift = PErrorT . liftM Right instance MonadIO m => MonadIO (PErrorT m) where - liftIO = lift . liftIO + liftIO = liftIO defineAnchor :: Value -> String -> ConduitM e o Parse () -defineAnchor value name = lift $ modify $ Map.insert name value +defineAnchor value name = modify $ Map.insert name value lookupAnchor :: String -> ConduitM e o Parse (Maybe Value) -lookupAnchor name = lift $ gets (Map.lookup name) +lookupAnchor name = gets (Map.lookup name) -type Parse = StateT (Map String Value) (ResourceT IO) +data Warning = DuplicateKey JSONPath + deriving (Eq, Show) + +addWarning :: Warning -> ConduitM e o Parse () +addWarning = tell . return + +type Parse = RWST JSONPath [Warning] (Map String Value) (ResourceT IO) requireEvent :: Event -> ConduitM Event o Parse () requireEvent e = do @@ -199,8 +210,8 @@ parseO = do me <- CL.head case me of Just (EventScalar v tag style a) -> textToValue style tag <$> parseScalar v a style tag - Just (EventSequenceStart _ _ a) -> parseS a id - Just (EventMappingStart _ _ a) -> parseM a M.empty + Just (EventSequenceStart _ _ a) -> parseS 0 a id + Just (EventMappingStart _ _ a) -> parseM mempty a M.empty Just (EventAlias an) -> do m <- lookupAnchor an case m of @@ -208,10 +219,11 @@ parseO = do Just v -> return v _ -> liftIO $ throwIO $ UnexpectedEvent me Nothing -parseS :: Y.Anchor +parseS :: Int + -> Y.Anchor -> ([Value] -> [Value]) -> ConduitM Event o Parse Value -parseS a front = do +parseS n a front = do me <- CL.peek case me of Just EventSequenceEnd -> do @@ -220,13 +232,14 @@ parseS a front = do mapM_ (defineAnchor res) a return res _ -> do - o <- parseO - parseS a $ front . (:) o + o <- local (Index n :) parseO + parseS (succ n) a $ front . (:) o -parseM :: Y.Anchor +parseM :: Set Text + -> Y.Anchor -> M.HashMap Text Value -> ConduitM Event o Parse Value -parseM a front = do +parseM mergedKeys a front = do me <- CL.head case me of Just EventMappingEnd -> do @@ -243,48 +256,55 @@ parseM a front = do Just (String t) -> return t Just v -> liftIO $ throwIO $ NonStringKeyAlias an v _ -> liftIO $ throwIO $ UnexpectedEvent me Nothing - o <- parseO - let al = M.insert s o front - al' = if s == pack "<<" + (mergedKeys', al') <- local (Key s :) $ do + o <- parseO + let al = do + when (M.member s front && Set.notMember s mergedKeys) $ do + path <- reverse <$> ask + addWarning (DuplicateKey path) + return (Set.delete s mergedKeys, M.insert s o front) + if s == pack "<<" then case o of - Object l -> M.union front l - Array l -> M.union front $ foldl mergeObjects M.empty $ V.toList l + Object l -> return (merge l) + Array l -> return $ merge $ foldl mergeObjects M.empty $ V.toList l _ -> al else al - parseM a al' + parseM mergedKeys' a al' where mergeObjects al (Object om) = M.union al om mergeObjects al _ = al + merge xs = (Set.fromList (M.keys xs \\ M.keys front), M.union front xs) + decodeHelper :: FromJSON a => ConduitM () Y.Event Parse () - -> IO (Either ParseException (Either String a)) + -> IO (Either ParseException ([Warning], Either String a)) decodeHelper src = do -- This used to be tryAny, but the fact is that catching async -- exceptions is fine here. We'll rethrow them immediately in the -- otherwise clause. - x <- try $ runResourceT $ flip evalStateT Map.empty $ runConduit $ src .| parse + x <- try $ runResourceT $ evalRWST (runConduit $ src .| parse) [] Map.empty case x of Left e | Just pe <- fromException e -> return $ Left pe | Just ye <- fromException e -> return $ Left $ InvalidYaml $ Just (ye :: YamlException) | otherwise -> throwIO e - Right y -> return $ Right $ parseEither parseJSON y + Right (y, warnings) -> return $ Right (warnings, parseEither parseJSON y) decodeHelper_ :: FromJSON a => ConduitM () Event Parse () - -> IO (Either ParseException a) + -> IO (Either ParseException ([Warning], a)) decodeHelper_ src = do - x <- try $ runResourceT $ flip evalStateT Map.empty $ runConduit $ src .| parse + x <- try $ runResourceT $ evalRWST (runConduit $ src .| parse) [] Map.empty return $ case x of Left e | Just pe <- fromException e -> Left pe | Just ye <- fromException e -> Left $ InvalidYaml $ Just (ye :: YamlException) | otherwise -> Left $ OtherParseException e - Right y -> either + Right (y, warnings) -> either (Left . AesonException) Right - (parseEither parseJSON y) + ((,) warnings <$> parseEither parseJSON y) -- | Strings which must be escaped so as not to be treated as non-string scalars. specialStrings :: HashSet.HashSet Text diff --git a/test/Data/Yaml/IncludeSpec.hs b/test/Data/Yaml/IncludeSpec.hs index 52aab67..39ea24a 100644 --- a/test/Data/Yaml/IncludeSpec.hs +++ b/test/Data/Yaml/IncludeSpec.hs @@ -1,12 +1,18 @@ +{-# LANGUAGE QuasiQuotes #-} {-# LANGUAGE OverloadedStrings #-} module Data.Yaml.IncludeSpec (main, spec) where import Test.Hspec import Data.List (isPrefixOf) import Data.Aeson +import Data.Aeson.Internal (JSONPathElement(..)) import Data.Yaml (ParseException(InvalidYaml)) import Data.Yaml.Include +import Data.Yaml.Internal import Text.Libyaml (YamlException(YamlException)) +import Test.Mockery.Directory +import Text.RawString.QQ +import Data.Yaml.TH (yamlQQ) main :: IO () main = hspec spec @@ -52,6 +58,66 @@ spec = do (decodeFileEither "./does_not_exist.yaml" :: IO (Either ParseException Value)) >>= (`shouldSatisfy` either isYamlFileNotFoundException (const False)) + describe "decodeFileWithWarnings" $ around_ inTempDirectory $ do + it "warns on duplicate keys" $ do + writeFile "foo.yaml" [r| + foo: 23 + foo: bar + |] + Right result <- decodeFileWithWarnings "foo.yaml" + result `shouldBe` ([DuplicateKey [Key "foo"]], [yamlQQ| + foo: bar + |]) + + it "warns on nested duplicate keys" $ do + writeFile "foo.yaml" [r| + foo: + - 42 + - bar: 23 + bar: baz + |] + Right result <- decodeFileWithWarnings "foo.yaml" + result `shouldBe` ([DuplicateKey [Key "foo", Index 1, Key "bar"]], [yamlQQ| + foo: + - 42 + - bar: baz + |]) + + context "when overriding a merged key" $ do + it "does not warn" $ do + writeFile "foo.yaml" [r| + foo-1: &my-ref + bar: 23 + foo-2: + <<: *my-ref + bar: 42 + |] + Right result <- decodeFileWithWarnings "foo.yaml" + result `shouldBe` ([], [yamlQQ| + foo-1: + bar: 23 + foo-2: + bar: 42 + |]) + + context "when overriding twice" $ do + it "warns" $ do + writeFile "foo.yaml" [r| + foo-1: &my-ref + bar: 23 + foo-2: + <<: *my-ref + bar: 42 + bar: 65 + |] + Right result <- decodeFileWithWarnings "foo.yaml" + result `shouldBe` ([DuplicateKey [Key "foo-2", Key "bar"]], [yamlQQ| + foo-1: + bar: 23 + foo-2: + bar: 65 + |]) + isYamlFileNotFoundException :: ParseException -> Bool isYamlFileNotFoundException (InvalidYaml (Just (YamlException msg))) | "Yaml file not found: " `isPrefixOf` msg = True From 11f9f3f375860c566a7e73cbf86f9c587dadd635 Mon Sep 17 00:00:00 2001 From: Simon Hengel Date: Wed, 15 Aug 2018 13:41:49 +0800 Subject: [PATCH 2/4] Bump version --- ChangeLog.md | 2 +- package.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/ChangeLog.md b/ChangeLog.md index b4347da..f429ad9 100644 --- a/ChangeLog.md +++ b/ChangeLog.md @@ -1,6 +1,6 @@ # ChangeLog for yaml -## next +## 0.10.0 * Add `decodeFileWithWarnings` which returns warnings for duplicate fields diff --git a/package.yaml b/package.yaml index 8d0e9ac..4b78543 100644 --- a/package.yaml +++ b/package.yaml @@ -1,5 +1,5 @@ name: yaml -version: 0.9.0 +version: 0.10.0 synopsis: Support for parsing and rendering YAML documents. description: README and API documentation are available at category: Data From 8d491e4772f6678208b5fd0ee3e8180788a7a751 Mon Sep 17 00:00:00 2001 From: Simon Hengel Date: Sun, 19 Aug 2018 11:40:22 +0800 Subject: [PATCH 3/4] Remove dead code --- src/Data/Yaml/Internal.hs | 22 +--------------------- 1 file changed, 1 insertion(+), 21 deletions(-) diff --git a/src/Data/Yaml/Internal.hs b/src/Data/Yaml/Internal.hs index ffcfb62..cf58f19 100644 --- a/src/Data/Yaml/Internal.hs +++ b/src/Data/Yaml/Internal.hs @@ -20,9 +20,7 @@ import Control.Applicative ((<$>), Applicative(..)) #endif import Control.Applicative ((<|>)) import Control.Exception -import Control.Monad (liftM, ap, when, unless) -import Control.Monad.IO.Class (MonadIO, liftIO) -import Control.Monad.Trans.Class (MonadTrans, lift) +import Control.Monad (when, unless) import Control.Monad.Trans.Resource (ResourceT, runResourceT) import Control.Monad.RWS import Data.Aeson @@ -114,24 +112,6 @@ prettyPrintParseException pe = case pe of ] CyclicIncludes -> "Cyclic includes" -newtype PErrorT m a = PErrorT { runPErrorT :: m (Either ParseException a) } -instance Monad m => Functor (PErrorT m) where - fmap = liftM -instance Monad m => Applicative (PErrorT m) where - pure = PErrorT . return . Right - (<*>) = ap -instance Monad m => Monad (PErrorT m) where - return = pure - (PErrorT m) >>= f = PErrorT $ do - e <- m - case e of - Left e' -> return $ Left e' - Right a -> runPErrorT $ f a -instance MonadTrans PErrorT where - lift = PErrorT . liftM Right -instance MonadIO m => MonadIO (PErrorT m) where - liftIO = liftIO - defineAnchor :: Value -> String -> ConduitM e o Parse () defineAnchor value name = modify $ Map.insert name value From 3d29d0bf87f25936c80b29ad4cefe0afc4f7c326 Mon Sep 17 00:00:00 2001 From: Simon Hengel Date: Sun, 19 Aug 2018 12:06:08 +0800 Subject: [PATCH 4/4] Add haddocks for decodeFileWithWarnings --- src/Data/Yaml.hs | 4 +++- src/Data/Yaml/Include.hs | 4 +++- 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/src/Data/Yaml.hs b/src/Data/Yaml.hs index 497b403..bdc7edd 100644 --- a/src/Data/Yaml.hs +++ b/src/Data/Yaml.hs @@ -183,7 +183,9 @@ decodeFileEither -> IO (Either ParseException a) decodeFileEither = fmap (fmap snd) . decodeFileWithWarnings --- | +-- | A version of `decodeFileEither` that returns warnings along with the parse +-- result. +-- -- @since 0.10.0 decodeFileWithWarnings :: FromJSON a diff --git a/src/Data/Yaml/Include.hs b/src/Data/Yaml/Include.hs index 494dbac..640131a 100644 --- a/src/Data/Yaml/Include.hs +++ b/src/Data/Yaml/Include.hs @@ -83,7 +83,9 @@ decodeFileEither -> IO (Either ParseException a) decodeFileEither = fmap (fmap snd) . decodeFileWithWarnings --- | +-- | A version of `decodeFileEither` that returns warnings along with the parse +-- result. +-- -- @since 0.10.0 decodeFileWithWarnings :: FromJSON a