@@ -17,11 +17,13 @@ module Regex.Internal.Num
17
17
import Control.Applicative ((<|>) , empty )
18
18
import qualified Control.Applicative as Ap
19
19
import Control.Monad (replicateM_ , void )
20
- import Data.Primitive.PrimArray
21
- (PrimArray (.. ), newPrimArray , runPrimArray , writePrimArray )
22
20
import Data.Bits ((.&.) , countLeadingZeros , unsafeShiftL , unsafeShiftR )
23
21
import Numeric.Natural (Natural )
22
+ #ifdef __GLASGOW_HASKELL__
23
+ import Data.Primitive.PrimArray
24
+ (PrimArray (.. ), newPrimArray , runPrimArray , writePrimArray )
24
25
import qualified GHC.Num.Natural as Nat
26
+ #endif
25
27
26
28
import Regex.Internal.Regex (RE )
27
29
import qualified Regex.Internal.Regex as R
@@ -221,10 +223,14 @@ mkWordRangeBase base quotRemPowBase powBase baseLen d low high
221
223
-- Parsing hexadecimal is simple, there is no base conversion involved.
222
224
--
223
225
-- Step 1: Accumulate the hex digits, packed into Words
224
- -- Step 2: Initialize a ByteArray and fill it with the Words
225
- --
226
- -- Because we create a Nat directly, this makes us depend on ghc-bignum and
227
- -- GHC>=9.0.
226
+ -- Step 2:
227
+ -- * GHC: Initialize a ByteArray and fill it with the Words. This takes
228
+ -- O(n) time. Because we create a Nat directly, this makes us depend on
229
+ -- ghc-bignum and GHC>=9.0.
230
+ -- * Not GHC: Do it like we do for decimal, without being aware of the
231
+ -- representation of Naturals, but replace the base multiplications with
232
+ -- shifts. If it is a binary representation, this takes O(n log n) time
233
+ -- instead of O(n^2).
228
234
229
235
stepHex :: NatParseState -> Word -> NatParseState
230
236
stepHex (NatParseState acc len ns) d
@@ -235,6 +241,7 @@ finishHex
235
241
:: Word -- ^ Leading digit
236
242
-> NatParseState -- ^ Everything else
237
243
-> Natural
244
+ #ifdef __GLASGOW_HASKELL__
238
245
finishHex ! ld (NatParseState acc0 len0 ns0) = case ns0 of
239
246
WNil -> Nat. naturalFromWord (ld `unsafeShiftL` (4 * (len0- 1 )) + acc0)
240
247
WCons n ns1 ->
@@ -268,6 +275,37 @@ finishHex !ld (NatParseState acc0 len0 ns0) = case ns0 of
268
275
-- * Natural invariants:
269
276
-- * If the value fits in a word, it must be NS (via naturalFromWord here).
270
277
-- * Otherwise, use a ByteArray# with NB. The highest Word must not be 0.
278
+ #else
279
+ finishHex ! ld (NatParseState acc0 len0 ns0) = combine acc0 len0 ns0
280
+ where
281
+ combine ! acc ! len ns = case ns of
282
+ WNil -> mul16Pow (w2n ld) (len- 1 ) + w2n acc
283
+ WCons n ns1 ->
284
+ mul16Pow (combine1 maxBoundWordHexLen (go n ns1)) len + w2n acc
285
+ where
286
+ go n WNil =
287
+ let ! n' = mul16Pow (w2n ld) (maxBoundWordHexLen - 1 ) + w2n n
288
+ in [n']
289
+ go n (WCons m WNil ) =
290
+ let ! n' = mul16Pow (w2n ld) (2 * maxBoundWordHexLen - 1 ) +
291
+ mul16Pow (w2n m) maxBoundWordHexLen +
292
+ w2n n
293
+ in [n']
294
+ go n (WCons m (WCons n1 ns1)) =
295
+ let ! n' = mul16Pow (w2n m) maxBoundWordHexLen + w2n n
296
+ in n' : go n1 ns1
297
+
298
+ combine1 :: Int -> [Natural ] -> Natural
299
+ combine1 ! _ [n] = n
300
+ combine1 ! numDigs ns1 = combine1 numDigs1 (go ns1)
301
+ where
302
+ numDigs1 = 2 * numDigs
303
+ go (n: m: ns) = let ! n' = mul16Pow m numDigs1 + n in n' : go ns
304
+ go ns = ns
305
+
306
+ mul16Pow :: Natural -> Int -> Natural
307
+ mul16Pow x p = unsafeShiftL x (4 * p)
308
+ #endif
271
309
272
310
-----------------------------
273
311
-- Parsing decimal Naturals
@@ -282,9 +320,10 @@ finishHex !ld (NatParseState acc0 len0 ns0) = case ns0 of
282
320
--
283
321
-- The obvious foldl approach is O(n^2) for n digits. The combine approach
284
322
-- performs O(n/2^i) multiplications of size O(2^i), for i in [0..log_2(n)].
285
- -- If multiplication is O(n^k), this is also O(n^k). We have k < 2,
286
- -- thanks to subquadratic multiplication of GMP-backed Naturals:
287
- -- https://gmplib.org/manual/Multiplication-Algorithms.
323
+ -- If multiplication is O(n^k), this is also O(n^k).
324
+ --
325
+ -- On GHC, we have k < 2, thanks to subquadratic multiplication of GMP-backed
326
+ -- Naturals: https://gmplib.org/manual/Multiplication-Algorithms.
288
327
--
289
328
-- For reference, here's how GMP converts any base (including 10) to a natural
290
329
-- using broadly the same approach.
@@ -311,6 +350,7 @@ finishDec !ld (NatParseState acc0 len0 ns0) = combine acc0 len0 ns0
311
350
go n (WCons m (WCons n1 ns1)) =
312
351
let ! n' = w2n m * safeBaseDec + w2n n in n' : go n1 ns1
313
352
353
+ combine1 :: Natural -> [Natural ] -> Natural
314
354
combine1 _ [n] = n
315
355
combine1 base ns1 = combine1 base1 (go ns1)
316
356
where
@@ -412,7 +452,7 @@ pow10 p = case p of
412
452
18 -> 1000000000000000000
413
453
19 -> 10000000000000000000
414
454
#endif
415
- _ -> errorWithoutStackTrace " Regex.Internal.Int.pow10: p too large"
455
+ _ -> error " Regex.Internal.Int.pow10: p too large"
416
456
#else
417
457
#error "unsupported word size"
418
458
#endif
0 commit comments