{-# LANGUAGE BangPatterns #-} {-# LANGUAGE MagicHash #-} {-# LANGUAGE NoImplicitPrelude #-} {-# LANGUAGE TypeFamilies #-} {-# LANGUAGE FlexibleContexts #-} {-# LANGUAGE ScopedTypeVariables #-} {-# LANGUAGE CPP #-} module Basement.Alg.String ( copyFilter , validate , findIndexPredicate , revFindIndexPredicate ) where import GHC.Prim import GHC.ST import Basement.Alg.Class import Basement.Alg.UTF8 import Basement.Compat.Base import Basement.Numerical.Additive import Basement.Types.OffsetSize import Basement.PrimType import Basement.Block (MutableBlock(..)) import Basement.UTF8.Helper import Basement.UTF8.Table import Basement.UTF8.Types copyFilter :: forall s container . Indexable container Word8 => (Char -> Bool) -> CountOf Word8 -> MutableByteArray# s -> container -> Offset Word8 -> ST s (CountOf Word8) copyFilter :: forall s container. Indexable container Word8 => (Char -> Bool) -> CountOf Word8 -> MutableByteArray# s -> container -> Offset Word8 -> ST s (CountOf Word8) copyFilter Char -> Bool predicate !CountOf Word8 sz MutableByteArray# s dst container src Offset Word8 start = Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop (Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 0) Offset Word8 start where !end :: Offset Word8 end = Offset Word8 start Offset Word8 -> CountOf Word8 -> Offset Word8 forall ty. Offset ty -> CountOf ty -> Offset ty `offsetPlusE` CountOf Word8 sz loop :: Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop !Offset Word8 d !Offset Word8 s | Offset Word8 s Offset Word8 -> Offset Word8 -> Bool forall a. Eq a => a -> a -> Bool == Offset Word8 end = CountOf Word8 -> ST s (CountOf Word8) forall a. a -> ST s a forall (f :: * -> *) a. Applicative f => a -> f a pure (Offset Word8 -> CountOf Word8 forall a. Offset a -> CountOf a offsetAsSize Offset Word8 d) | Bool otherwise = let !h :: StepASCII h = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container src Offset Word8 s in case StepASCII -> Bool headerIsAscii StepASCII h of Bool True | Char -> Bool predicate (StepASCII -> Char toChar1 StepASCII h) -> MutableByteArray# (PrimState (ST s)) -> Offset Word8 -> Word8 -> ST s () forall ty (prim :: * -> *). (PrimType ty, PrimMonad prim) => MutableByteArray# (PrimState prim) -> Offset ty -> ty -> prim () primMbaWrite MutableByteArray# s MutableByteArray# (PrimState (ST s)) dst Offset Word8 d (StepASCII -> Word8 stepAsciiRawValue StepASCII h) ST s () -> ST s (CountOf Word8) -> ST s (CountOf Word8) forall a b. ST s a -> ST s b -> ST s b forall (m :: * -> *) a b. Monad m => m a -> m b -> m b >> Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop (Offset Word8 d Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 1) (Offset Word8 s Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 1) | Bool otherwise -> Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop Offset Word8 d (Offset Word8 s Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 1) Bool False -> case container -> Offset Word8 -> Step forall container. Indexable container Word8 => container -> Offset Word8 -> Step next container src Offset Word8 s of Step Char c Offset Word8 s' | Char -> Bool predicate Char c -> MutableBlock Word8 s -> Offset Word8 -> Char -> ST s (Offset Word8) forall (prim :: * -> *) container. (PrimMonad prim, RandomAccess container prim Word8) => container -> Offset Word8 -> Char -> prim (Offset Word8) writeUTF8 (MutableByteArray# s -> MutableBlock Word8 s forall ty st. MutableByteArray# st -> MutableBlock ty st MutableBlock MutableByteArray# s dst :: MutableBlock Word8 s) Offset Word8 d Char c ST s (Offset Word8) -> (Offset Word8 -> ST s (CountOf Word8)) -> ST s (CountOf Word8) forall a b. ST s a -> (a -> ST s b) -> ST s b forall (m :: * -> *) a b. Monad m => m a -> (a -> m b) -> m b >>= \Offset Word8 d' -> Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop Offset Word8 d' Offset Word8 s' | Bool otherwise -> Offset Word8 -> Offset Word8 -> ST s (CountOf Word8) loop Offset Word8 d Offset Word8 s' {-# INLINE copyFilter #-} validate :: Indexable container Word8 => Offset Word8 -> container -> Offset Word8 -> (Offset Word8, Maybe ValidationFailure) validate :: forall container. Indexable container Word8 => Offset Word8 -> container -> Offset Word8 -> (Offset Word8, Maybe ValidationFailure) validate Offset Word8 end container ba Offset Word8 ofsStart = Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop4 Offset Word8 ofsStart where loop4 :: Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop4 !Offset Word8 ofs | Offset Word8 ofs4 Offset Word8 -> Offset Word8 -> Bool forall a. Ord a => a -> a -> Bool < Offset Word8 end = let h1 :: StepASCII h1 = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container ba Offset Word8 ofs h2 :: StepASCII h2 = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container ba (Offset Word8 ofsOffset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a +Offset Word8 1) h3 :: StepASCII h3 = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container ba (Offset Word8 ofsOffset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a +Offset Word8 2) h4 :: StepASCII h4 = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container ba (Offset Word8 ofsOffset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a +Offset Word8 3) in if StepASCII -> Bool headerIsAscii StepASCII h1 Bool -> Bool -> Bool && StepASCII -> Bool headerIsAscii StepASCII h2 Bool -> Bool -> Bool && StepASCII -> Bool headerIsAscii StepASCII h3 Bool -> Bool -> Bool && StepASCII -> Bool headerIsAscii StepASCII h4 then Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop4 Offset Word8 ofs4 else Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop Offset Word8 ofs | Bool otherwise = Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop Offset Word8 ofs where !ofs4 :: Offset Word8 ofs4 = Offset Word8 ofsOffset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a +Offset Word8 4 loop :: Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop !Offset Word8 ofs | Offset Word8 ofs Offset Word8 -> Offset Word8 -> Bool forall a. Eq a => a -> a -> Bool == Offset Word8 end = (Offset Word8 end, Maybe ValidationFailure forall a. Maybe a Nothing) | StepASCII -> Bool headerIsAscii StepASCII h = Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop (Offset Word8 ofs Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 1) | Bool otherwise = CountOf Word8 -> Offset Word8 -> (Offset Word8, Maybe ValidationFailure) multi (Int -> CountOf Word8 forall ty. Int -> CountOf ty CountOf (Int -> CountOf Word8) -> Int -> CountOf Word8 forall a b. (a -> b) -> a -> b $ StepASCII -> Int getNbBytes StepASCII h) Offset Word8 ofs where h :: StepASCII h = container -> Offset Word8 -> StepASCII forall container. Indexable container Word8 => container -> Offset Word8 -> StepASCII nextAscii container ba Offset Word8 ofs multi :: CountOf Word8 -> Offset Word8 -> (Offset Word8, Maybe ValidationFailure) multi (CountOf Int 0xff) Offset Word8 pos = (Offset Word8 pos, ValidationFailure -> Maybe ValidationFailure forall a. a -> Maybe a Just ValidationFailure InvalidHeader) multi CountOf Word8 nbConts Offset Word8 pos | (Offset Word8 posNext Offset Word8 -> CountOf Word8 -> Offset Word8 forall ty. Offset ty -> CountOf ty -> Offset ty `offsetPlusE` CountOf Word8 nbConts) Offset Word8 -> Offset Word8 -> Bool forall a. Ord a => a -> a -> Bool > Offset Word8 end = (Offset Word8 pos, ValidationFailure -> Maybe ValidationFailure forall a. a -> Maybe a Just ValidationFailure MissingByte) | Bool otherwise = case CountOf Word8 nbConts of CountOf Int 1 -> let c1 :: Word8 c1 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba Offset Word8 posNext in if Word8 -> Bool isContinuation Word8 c1 then Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 2) else (Offset Word8 pos, ValidationFailure -> Maybe ValidationFailure forall a. a -> Maybe a Just ValidationFailure InvalidContinuation) CountOf Int 2 -> let c1 :: Word8 c1 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba Offset Word8 posNext c2 :: Word8 c2 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 2) in if Word8 -> Word8 -> Bool isContinuation2 Word8 c1 Word8 c2 then Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 3) else (Offset Word8 pos, ValidationFailure -> Maybe ValidationFailure forall a. a -> Maybe a Just ValidationFailure InvalidContinuation) CountOf Int _ -> let c1 :: Word8 c1 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba Offset Word8 posNext c2 :: Word8 c2 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 2) c3 :: Word8 c3 = container -> Offset Word8 -> Word8 forall container ty. Indexable container ty => container -> Offset ty -> ty index container ba (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 3) in if Word8 -> Word8 -> Word8 -> Bool isContinuation3 Word8 c1 Word8 c2 Word8 c3 then Offset Word8 -> (Offset Word8, Maybe ValidationFailure) loop (Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 4) else (Offset Word8 pos, ValidationFailure -> Maybe ValidationFailure forall a. a -> Maybe a Just ValidationFailure InvalidContinuation) where posNext :: Offset Word8 posNext = Offset Word8 pos Offset Word8 -> Offset Word8 -> Offset Word8 forall a. Additive a => a -> a -> a + Int -> Offset Word8 forall ty. Int -> Offset ty Offset Int 1 {-# INLINE validate #-} findIndexPredicate :: Indexable container Word8 => (Char -> Bool) -> container -> Offset Word8 -> Offset Word8 -> Offset Word8 findIndexPredicate :: forall container. Indexable container Word8 => (Char -> Bool) -> container -> Offset Word8 -> Offset Word8 -> Offset Word8 findIndexPredicate Char -> Bool predicate container ba !Offset Word8 startIndex !Offset Word8 endIndex = Offset Word8 -> Offset Word8 loop Offset Word8 startIndex where loop :: Offset Word8 -> Offset Word8 loop !Offset Word8 i | Offset Word8 i Offset Word8 -> Offset Word8 -> Bool forall a. Ord a => a -> a -> Bool < Offset Word8 endIndex Bool -> Bool -> Bool && Bool -> Bool not (Char -> Bool predicate Char c) = Offset Word8 -> Offset Word8 loop (Offset Word8 i') | Bool otherwise = Offset Word8 i where Step Char c Offset Word8 i' = container -> Offset Word8 -> Step forall container. Indexable container Word8 => container -> Offset Word8 -> Step next container ba Offset Word8 i {-# INLINE findIndexPredicate #-} revFindIndexPredicate :: Indexable container Word8 => (Char -> Bool) -> container -> Offset Word8 -> Offset Word8 -> Offset Word8 revFindIndexPredicate :: forall container. Indexable container Word8 => (Char -> Bool) -> container -> Offset Word8 -> Offset Word8 -> Offset Word8 revFindIndexPredicate Char -> Bool predicate container ba Offset Word8 startIndex Offset Word8 endIndex | Offset Word8 endIndex Offset Word8 -> Offset Word8 -> Bool forall a. Ord a => a -> a -> Bool > Offset Word8 startIndex = Offset Word8 -> Offset Word8 loop Offset Word8 endIndex | Bool otherwise = Offset Word8 endIndex where loop :: Offset Word8 -> Offset Word8 loop !Offset Word8 i | Char -> Bool predicate Char c = Offset Word8 i' | Offset Word8 i' Offset Word8 -> Offset Word8 -> Bool forall a. Ord a => a -> a -> Bool > Offset Word8 startIndex = Offset Word8 -> Offset Word8 loop Offset Word8 i' | Bool otherwise = Offset Word8 endIndex where StepBack Char c Offset Word8 i' = container -> Offset Word8 -> StepBack forall container. Indexable container Word8 => container -> Offset Word8 -> StepBack prev container ba Offset Word8 i {-# INLINE revFindIndexPredicate #-}