{-# LANGUAGE DeriveGeneric #-}
{-# LANGUAGE GeneralizedNewtypeDeriving #-}
module Source.Source
( Source
, bytes
, fromUTF8
, Source.Source.length
, Source.Source.null
, totalRange
, totalSpan
, fromText
, toText
, slice
, drop
, take
, Source.Source.lines
, lineRanges
, lineRangesWithin
, newlineIndices
) where
import Prelude hiding (drop, take)
import Control.Arrow ((&&&))
import Control.DeepSeq (NFData)
import Data.Aeson (FromJSON (..), withText)
import qualified Data.ByteString as B
import Data.Char (ord)
import Data.Maybe (fromMaybe)
import Data.Monoid (Last (..))
import Data.Semilattice.Lower
import Data.String (IsString (..))
import qualified Data.Text as T
import qualified Data.Text.Encoding as T
import Data.Text.Encoding.Error (lenientDecode)
import GHC.Generics (Generic)
import Source.Range
import Source.Span (Pos (..), Span (Span))
newtype Source = Source { Source -> ByteString
bytes :: B.ByteString }
deriving (Source -> Source -> Bool
(Source -> Source -> Bool)
-> (Source -> Source -> Bool) -> Eq Source
forall a. (a -> a -> Bool) -> (a -> a -> Bool) -> Eq a
$c== :: Source -> Source -> Bool
== :: Source -> Source -> Bool
$c/= :: Source -> Source -> Bool
/= :: Source -> Source -> Bool
Eq, NonEmpty Source -> Source
Source -> Source -> Source
(Source -> Source -> Source)
-> (NonEmpty Source -> Source)
-> (forall b. Integral b => b -> Source -> Source)
-> Semigroup Source
forall b. Integral b => b -> Source -> Source
forall a.
(a -> a -> a)
-> (NonEmpty a -> a)
-> (forall b. Integral b => b -> a -> a)
-> Semigroup a
$c<> :: Source -> Source -> Source
<> :: Source -> Source -> Source
$csconcat :: NonEmpty Source -> Source
sconcat :: NonEmpty Source -> Source
$cstimes :: forall b. Integral b => b -> Source -> Source
stimes :: forall b. Integral b => b -> Source -> Source
Semigroup, Semigroup Source
Source
Semigroup Source
-> Source
-> (Source -> Source -> Source)
-> ([Source] -> Source)
-> Monoid Source
[Source] -> Source
Source -> Source -> Source
forall a.
Semigroup a -> a -> (a -> a -> a) -> ([a] -> a) -> Monoid a
$cmempty :: Source
mempty :: Source
$cmappend :: Source -> Source -> Source
mappend :: Source -> Source -> Source
$cmconcat :: [Source] -> Source
mconcat :: [Source] -> Source
Monoid, String -> Source
(String -> Source) -> IsString Source
forall a. (String -> a) -> IsString a
$cfromString :: String -> Source
fromString :: String -> Source
IsString, Int -> Source -> ShowS
[Source] -> ShowS
Source -> String
(Int -> Source -> ShowS)
-> (Source -> String) -> ([Source] -> ShowS) -> Show Source
forall a.
(Int -> a -> ShowS) -> (a -> String) -> ([a] -> ShowS) -> Show a
$cshowsPrec :: Int -> Source -> ShowS
showsPrec :: Int -> Source -> ShowS
$cshow :: Source -> String
show :: Source -> String
$cshowList :: [Source] -> ShowS
showList :: [Source] -> ShowS
Show, (forall x. Source -> Rep Source x)
-> (forall x. Rep Source x -> Source) -> Generic Source
forall x. Rep Source x -> Source
forall x. Source -> Rep Source x
forall a.
(forall x. a -> Rep a x) -> (forall x. Rep a x -> a) -> Generic a
$cfrom :: forall x. Source -> Rep Source x
from :: forall x. Source -> Rep Source x
$cto :: forall x. Rep Source x -> Source
to :: forall x. Rep Source x -> Source
Generic, Source -> ()
(Source -> ()) -> NFData Source
forall a. (a -> ()) -> NFData a
$crnf :: Source -> ()
rnf :: Source -> ()
NFData)
fromUTF8 :: B.ByteString -> Source
fromUTF8 :: ByteString -> Source
fromUTF8 = ByteString -> Source
Source
instance FromJSON Source where
parseJSON :: Value -> Parser Source
parseJSON = String -> (Text -> Parser Source) -> Value -> Parser Source
forall a. String -> (Text -> Parser a) -> Value -> Parser a
withText String
"Source" (Source -> Parser Source
forall a. a -> Parser a
forall (f :: * -> *) a. Applicative f => a -> f a
pure (Source -> Parser Source)
-> (Text -> Source) -> Text -> Parser Source
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Text -> Source
fromText)
length :: Source -> Int
length :: Source -> Int
length = ByteString -> Int
B.length (ByteString -> Int) -> (Source -> ByteString) -> Source -> Int
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
null :: Source -> Bool
null :: Source -> Bool
null = ByteString -> Bool
B.null (ByteString -> Bool) -> (Source -> ByteString) -> Source -> Bool
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
totalRange :: Source -> Range
totalRange :: Source -> Range
totalRange = Int -> Int -> Range
Range Int
0 (Int -> Range) -> (Source -> Int) -> Source -> Range
forall b c a. (b -> c) -> (a -> b) -> a -> c
. ByteString -> Int
B.length (ByteString -> Int) -> (Source -> ByteString) -> Source -> Int
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
totalSpan :: Source -> Span
totalSpan :: Source -> Span
totalSpan Source
source = Pos -> Pos -> Span
Span (Int -> Int -> Pos
Pos Int
1 Int
1) (Int -> Int -> Pos
Pos ([Range] -> Int
forall a. [a] -> Int
forall (t :: * -> *) a. Foldable t => t a -> Int
Prelude.length [Range]
ranges) (Int -> Int
forall a. Enum a => a -> a
succ (Range -> Int
end Range
lastRange Int -> Int -> Int
forall a. Num a => a -> a -> a
- Range -> Int
start Range
lastRange))) where
ranges :: [Range]
ranges = Source -> [Range]
lineRanges Source
source
lastRange :: Range
lastRange = Range -> Maybe Range -> Range
forall a. a -> Maybe a -> a
fromMaybe Range
forall s. Lower s => s
lowerBound (Last Range -> Maybe Range
forall a. Last a -> Maybe a
getLast ((Range -> Last Range) -> [Range] -> Last Range
forall m a. Monoid m => (a -> m) -> [a] -> m
forall (t :: * -> *) m a.
(Foldable t, Monoid m) =>
(a -> m) -> t a -> m
foldMap (Maybe Range -> Last Range
forall a. Maybe a -> Last a
Last (Maybe Range -> Last Range)
-> (Range -> Maybe Range) -> Range -> Last Range
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Range -> Maybe Range
forall a. a -> Maybe a
Just) [Range]
ranges))
fromText :: T.Text -> Source
fromText :: Text -> Source
fromText = ByteString -> Source
Source (ByteString -> Source) -> (Text -> ByteString) -> Text -> Source
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Text -> ByteString
T.encodeUtf8
toText :: Source -> T.Text
toText :: Source -> Text
toText = OnDecodeError -> ByteString -> Text
T.decodeUtf8With OnDecodeError
lenientDecode (ByteString -> Text) -> (Source -> ByteString) -> Source -> Text
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
slice :: Source -> Range -> Source
slice :: Source -> Range -> Source
slice Source
source Range
range = Source -> Source
taking (Source -> Source) -> Source -> Source
forall a b. (a -> b) -> a -> b
$ Source -> Source
dropping Source
source where
dropping :: Source -> Source
dropping = Int -> Source -> Source
drop (Range -> Int
start Range
range)
taking :: Source -> Source
taking = Int -> Source -> Source
take (Range -> Int
rangeLength Range
range)
drop :: Int -> Source -> Source
drop :: Int -> Source -> Source
drop Int
i = ByteString -> Source
Source (ByteString -> Source)
-> (Source -> ByteString) -> Source -> Source
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Int -> ByteString -> ByteString
B.drop Int
i (ByteString -> ByteString)
-> (Source -> ByteString) -> Source -> ByteString
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
take :: Int -> Source -> Source
take :: Int -> Source -> Source
take Int
i = ByteString -> Source
Source (ByteString -> Source)
-> (Source -> ByteString) -> Source -> Source
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Int -> ByteString -> ByteString
B.take Int
i (ByteString -> ByteString)
-> (Source -> ByteString) -> Source -> ByteString
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
lines :: Source -> [Source]
lines :: Source -> [Source]
lines Source
source = Source -> Range -> Source
slice Source
source (Range -> Source) -> [Range] -> [Source]
forall (f :: * -> *) a b. Functor f => (a -> b) -> f a -> f b
<$> Source -> [Range]
lineRanges Source
source
lineRanges :: Source -> [Range]
lineRanges :: Source -> [Range]
lineRanges Source
source = Source -> Range -> [Range]
lineRangesWithin Source
source (Source -> Range
totalRange Source
source)
lineRangesWithin :: Source -> Range -> [Range]
lineRangesWithin :: Source -> Range -> [Range]
lineRangesWithin Source
source Range
range
= ([Int] -> [Int] -> [Range]) -> ([Int], [Int]) -> [Range]
forall a b c. (a -> b -> c) -> (a, b) -> c
uncurry ((Int -> Int -> Range) -> [Int] -> [Int] -> [Range]
forall a b c. (a -> b -> c) -> [a] -> [b] -> [c]
zipWith Int -> Int -> Range
Range)
(([Int], [Int]) -> [Range])
-> (Source -> ([Int], [Int])) -> Source -> [Range]
forall b c a. (b -> c) -> (a -> b) -> a -> c
. ((Range -> Int
start Range
rangeInt -> [Int] -> [Int]
forall a. a -> [a] -> [a]
:) ([Int] -> [Int]) -> ([Int] -> [Int]) -> [Int] -> ([Int], [Int])
forall b c c'. (b -> c) -> (b -> c') -> b -> (c, c')
forall (a :: * -> * -> *) b c c'.
Arrow a =>
a b c -> a b c' -> a b (c, c')
&&& ([Int] -> [Int] -> [Int]
forall a. Semigroup a => a -> a -> a
<> [ Range -> Int
end Range
range ]))
([Int] -> ([Int], [Int]))
-> (Source -> [Int]) -> Source -> ([Int], [Int])
forall b c a. (b -> c) -> (a -> b) -> a -> c
. (Int -> Int) -> [Int] -> [Int]
forall a b. (a -> b) -> [a] -> [b]
forall (f :: * -> *) a b. Functor f => (a -> b) -> f a -> f b
fmap (Int -> Int -> Int
forall a. Num a => a -> a -> a
+ Int -> Int
forall a. Enum a => a -> a
succ (Range -> Int
start Range
range))
([Int] -> [Int]) -> (Source -> [Int]) -> Source -> [Int]
forall b c a. (b -> c) -> (a -> b) -> a -> c
. ByteString -> [Int]
newlineIndices
(ByteString -> [Int]) -> (Source -> ByteString) -> Source -> [Int]
forall b c a. (b -> c) -> (a -> b) -> a -> c
. Source -> ByteString
bytes
(Source -> [Range]) -> Source -> [Range]
forall a b. (a -> b) -> a -> b
$ Source -> Range -> Source
slice Source
source Range
range
newlineIndices :: B.ByteString -> [Int]
newlineIndices :: ByteString -> [Int]
newlineIndices = Int -> ByteString -> [Int]
go Int
0 where
go :: Int -> ByteString -> [Int]
go Int
n ByteString
bs
| ByteString -> Bool
B.null ByteString
bs = []
| Bool
otherwise = case (ByteString -> Maybe Int
searchCR ByteString
bs, ByteString -> Maybe Int
searchLF ByteString
bs) of
(Maybe Int
Nothing, Maybe Int
Nothing) -> []
(Just Int
i, Maybe Int
Nothing) -> Int -> Int -> ByteString -> [Int]
recur Int
n Int
i ByteString
bs
(Maybe Int
Nothing, Just Int
i) -> Int -> Int -> ByteString -> [Int]
recur Int
n Int
i ByteString
bs
(Just Int
crI, Just Int
lfI)
| Int -> Int
forall a. Enum a => a -> a
succ Int
crI Int -> Int -> Bool
forall a. Eq a => a -> a -> Bool
== Int
lfI -> Int -> Int -> ByteString -> [Int]
recur Int
n Int
lfI ByteString
bs
| Bool
otherwise -> Int -> Int -> ByteString -> [Int]
recur Int
n (Int -> Int -> Int
forall a. Ord a => a -> a -> a
min Int
crI Int
lfI) ByteString
bs
recur :: Int -> Int -> ByteString -> [Int]
recur Int
n Int
i ByteString
bs = let j :: Int
j = Int
n Int -> Int -> Int
forall a. Num a => a -> a -> a
+ Int
i in Int
j Int -> [Int] -> [Int]
forall a. a -> [a] -> [a]
: Int -> ByteString -> [Int]
go (Int -> Int
forall a. Enum a => a -> a
succ Int
j) (Int -> ByteString -> ByteString
B.drop (Int -> Int
forall a. Enum a => a -> a
succ Int
i) ByteString
bs)
searchLF :: ByteString -> Maybe Int
searchLF = Word8 -> ByteString -> Maybe Int
B.elemIndex (Int -> Word8
forall a. Enum a => Int -> a
toEnum (Char -> Int
ord Char
'\n'))
searchCR :: ByteString -> Maybe Int
searchCR = Word8 -> ByteString -> Maybe Int
B.elemIndex (Int -> Word8
forall a. Enum a => Int -> a
toEnum (Char -> Int
ord Char
'\r'))
{-# INLINE newlineIndices #-}