fork download
  1. {-# OPTIONS_GHC -O2 #-}
  2. {-# LANGUAGE BangPatterns #-}
  3.  
  4. -- forked ideone.com/q3fma: use Int in nthHam for speed
  5.  
  6. -- rosettacode.org/wiki/Hamming_numbers#Haskell
  7. -- stackoverflow.com/a/10160054/849891
  8. -- stackoverflow.com/a/12041774/849891
  9. -- stackoverflow.com/a/60805693/849891
  10.  
  11. module Main where -- cf. ideone.com/k8PU3, GXh4P0, 01dpQu
  12.  
  13. import Data.List
  14. import Data.Function
  15.  
  16. hamming :: [Integer]
  17. hamming = 1 : map (2*) hamming `union` map (3*) hamming `union` map (5*) hamming
  18. where
  19. union a@(x:xs) b@(y:ys) = case compare x y of
  20. LT -> x : union xs b
  21. EQ -> x : union xs ys
  22. GT -> y : union a ys
  23.  
  24. main :: IO ()
  25. main =
  26. do
  27. s <- getLine
  28. case s of
  29. "a" -> do print $ take 20 hamming
  30. print (hamming !! 1690, hamming !! 1691)
  31. print $ hamming !! (1000000-1) -- 9 MB: releases the prefix of the list
  32. "b" -> do
  33. print $ hamming !! (1000000-1)
  34. print $ hamming !! 1000000 -- 77 MB: does NOT release the prefix (is needed twice)
  35. "c" -> do
  36. mapM_ print $ take 2 $ drop 999999 hamming -- 9 MB: used once, prefix gc-d
  37. "d" -> do
  38. let (_ ,(r,t)) = nthHam (1000000) -- 4 MB: stores upper band only
  39. (_ ,(r2,t2)) = nthHam (1000001)
  40. print (t,trival t)
  41. print (t2,trival t2)
  42. _ -> do -- 10^8: 4 MB 0.27 sec
  43. let (nb,(r,t)) = nthHam (read s) -- 10^9: 6 MB (-4=2) 1.42 sec ~n^0.7
  44. print (nb, t, showLogVal 2 r) -- 10^10: 14 MB (-4=10) 7.20 sec ~n^0.7
  45. -- print (case t of (i,j,k) -> 2^i*3^j*5^k)
  46. -- print (case t of (i,j,k) -> 2^i*3^j*5^k)
  47.  
  48. showLogVal :: Double -> Double -> String
  49. showLogVal base logval = show (10**y) ++ "E+" ++ show x
  50. where (x,y) = properFraction (logBase 10 base * logval)
  51.  
  52. trival (i,j,k) = 2^i * 3^j * 5^k
  53.  
  54. -- directly find n-th Hamming number (base 1, from 2), in ~ O(n^{2/3}) time
  55. -- based on "top band" idea by Louis Klauder from DDJ discussion,
  56. -- by Will Ness, my original post: drdobbs.com/blogs/architecture-and-design/228700538
  57. {-
  58. ln2 = log 2; ln3 = log 3; ln5 = log 5
  59. logval (i,j,k) = fromIntegral i*ln2 + fromIntegral j*ln3 + fromIntegral k*ln5
  60. estval n = (6*ln2*ln3*ln5* fromIntegral n)**(1/3) -- estimated logval
  61. rngval n
  62.   | n > 500000 = (1.698 , 0.0050) -- empirical
  63.   | n > 50000 = (1.693 , 0.0100) -- estimation
  64.   | n > 500 = (1.66 , 0.0500) -- correction
  65.   | n > 1 = (1.56 , 0.2000) -- (dist,width)
  66.   | otherwise = (1.56 , 0.4000)
  67.  
  68.  -- estval(n) = log (M[n]) = ln2 * logBase 2 (M[n])
  69. -}
  70. ww = logBase 2 30 / 2
  71. -- lb3 :: Double
  72. lb3 = logBase 2 3; lb5 = logBase 2 5 -- lb3 == log 3/log 2, lb5 == log 5/log 2
  73. -- logval2 :: (Int,Int,Int) -> Double
  74. logval2 (i,j,k) = fromIntegral i + fromIntegral j*lb3 + fromIntegral k*lb5
  75. -- estval2 :: Integer -> Double
  76. estval2 n = (6*lb3*lb5* fromIntegral n)**(1/3) -- estimated logval **Base 2**
  77. rngval2 n -- -1/v +2/v seems to works too
  78. | n > 500000 = (ww-(3/estval2 n), 6/estval2 n) -- space tweak !!! (thx, GBG!)
  79. | n > 500000 = (2.4496 , 0.0076 ) -- empirical
  80. | n > 50000 = (2.4424 , 0.0146 ) -- estimation
  81. | n > 500 = (2.3948 , 0.0723 ) -- correction - base 2
  82. | n > 1 = (2.2506 , 0.2887 ) -- (dist,width)
  83. | otherwise = (2.2506 , 0.5771 )
  84.  
  85. -- nthHam :: Integer -> ( (Int,Int), (Double, (Int, Int, Int))) -- ( 64-bits: use Int!! NB! )
  86. -- _band size stuff_ ---------------- (*1*)
  87.  
  88. nthHam :: Int -> ( (Bool, Double, Double), (Double, (Int, Int, Int)))
  89. -- _max logval, min delta in band_
  90. nthHam n -- n: 1-based 1,2,3...
  91. | w >= 1 = error $ "Breach of contract: (w < 1): " ++ show (w)
  92. | m < 0 = error $ "Not enough triples generated: " ++ show (c,n)
  93. | m >= nb = error $ "Generated band is too narrow: " ++ show (m,nb)
  94. | True = -- ((m,nb),res) -- m=target index in band from top, nb=band's length
  95. ( ( isTrulySorted ,
  96. fst (head s), ---------------- (*1*)
  97. minimum -- By (compare `on` abs)
  98. (zipWith (-) (map fst s) (tail (map fst s))) )
  99. , res)
  100. where
  101. isTrulySorted = and [a>b | let z=map (trival.snd) s, (a,b)<-zip z (tail z)]
  102. (d,w) = rngval2 n -- correction dist, width
  103. hi = estval2 n - d -- hi > logval2 > hi-w
  104. (c,b) = foldl_ -- total count, the band
  105. (\(!c,!b) (i,t) -> case t of [] -> (i+c,b)
  106. [x] -> (i+c,x:b))
  107. (0::Int,[]) -- ( 64bit: use Int!!! NB! )
  108. -- (sum *** concat) . unzip $
  109. [ ( fromIntegral i+1, -- total triples w/ this (j,k)
  110. [ (r,(i,j,k)) | frac < w ] ) -- store it, if inside band
  111. | k <- [ 0 .. floor ( hi /lb5) ], let p = fromIntegral k*lb5,
  112. j <- [ 0 .. floor ((hi-p)/lb3) ], let q = fromIntegral j*lb3 + p,
  113. let (i,frac) = pr (hi-q) ; r = hi - frac -- r = i + q
  114. ] where pr = properFraction -- pr 1.24 => (1,0.24)
  115. (m,nb) = ( fromIntegral $ c - n, length b ) -- m 0-based from top, |band|
  116. (s,res) = ( sortBy (flip compare `on` fst) b, s!!m ) -- sorted decreasing, result
  117. foldl_ = foldl'
Success #stdin #stdout 2.85s 15132KB
stdin
1000000000000

to print the full value as well, uncomment one of the
  `-- print (case t of (i,j,k) -> 2^i*3^j*5^k)`
lines in `main`, at its very end

------
2020-03-24: use `Int` in nthHam, now on 64 bit, for speed:

1B  0.02s 6.0MB
((True,2803.022191612378,1.325179255218245e-7),(1334,335,404),"6.216075755562335E+843")
1T  2.01s 15.1MB
((True,28052.292341476037,2.979504643008113e-9),(1126,16930,40),"3.814325005007765E+8444")
4T  5.81s 22.2MB   16 digits used.... 
                  still good (as evidenced by the `True` below), but really pushing it.
((True,44531.67942695671,7.275957614183426e-11),(16348,16503,873),"2.3509832704071347E+13405")
10T   11.13s 26.4MB
((True,60439.66391703062,7.275957614183426e-11),(18187,23771,1971),"1.4182592613214273E+18194")
13T   14.44s 30.4MB    ...still good
((True,65963.64327239885,5.820766091346741e-11),(28648,21308,1526),"1.0845209980457384E+19857")

same code on tio:
10T   16.77s
35T   38.84s 
((True,91766.48002166452,5.820766091346741e-11),(13824,2133,32112),"2.904528312044042E+27624")
60T   53.76s
((True,109828.1626252908,5.820766091346741e-11),(28123,45913,3848),"3.7265992051315013E+33061")
65T   53.98s
((True,112797.98518694332,5.820766091346741e-11),(26349,21177,22776),"3.7755976376763294E+33955")
68T   55.88s
((True,114507.3424180621,5.820766091346741e-11),(28179,16558,25877),"1.395679394278755E+34470")
70T   59.57s
((True,115619.15754088841,5.820766091346741e-11),(13125,13687,34799),"6.831047840502602E+34804")

on home machine:
100T: 368.13s     n^0.708
((True,130216.14085518729,5.820766091346741e-11),(88324,876,17444),"9.211106366443564E+39198")

140T: 466.69s     n^0.705
((True,145671.64804685948,5.820766091346741e-11),(9918,24002,42082),"3.432221006522245E+43851")

170T: 383.26s     n^0.076   ---FAULTY---
((False,155411.25012054382,0.0),(77201,27980,14584),"2.8050819114774215E+46783")
------

c  0.85s-8.0MB
a  0.87s-8.0MB 

is Double precision enough?
1T:   (28052.292341476037,2.983142621815205e-9) 14 significant digits needed.   iffy... but OK
100B: (13019.406212824639,4.964022082276642e-9) 14 significant digits needed. 
10B:   (6041.758782302383,2.292654244229198e-8) 12 significant digits needed. 
1B:    (2803.022191612377,1.325179255218245e-7) 11 significant digits needed.  


1T   (1126,16930, 40), "3.814325005007765E+8444"            ( GXh4P0 20% faster,  
100B (10178,1384,279), "1.705075482875041E+3919"                with explicit loops)
10B  (2177,  8, 1659), "5.629992181012814E+1818" 
1B   (1334, 335, 404), "6.216075755565590E+843"  
100M (  2,  454, 249), "1.814014330961032E+391"
____
old (32-bit) TIMINGS, without the isTrulySorted calculation, which slows it down by ~20% for 100B:
----
             target idx    
            (  from top,band size ) 
1T   13.39s-7.9MB (8609,22872)   37.63%    ~ n^0.69 time, n^0.33 space
100B  2.74s-6.9MB (3993,10609)   37.64%          --------    (no tweak: ~3.2s; ~175,000 band size)
50B   1.66s-6.9MB (3167,8421 )   37.61%             |
10B   0.49s-5.9MB (1854,4928 )   37.62%             n^(1/3) -- band size
1B    0.05s-4.9MB ( 862,2288 )   37.67%             |
100M  0.01s-4.9MB ( 399,1061 )   37.61%          --------
10M   0.00s-4.9MB ( 183,492  )   37.20% 
5M    0.00s-4.9MB ( 150,391  )   38.36%     ( no tweak:  5M 0-4.9  (74,238) 0.311%  )
1M    0.00s-4.9MB (  86,231  )   37.23%     ( no tweak:  1M 0-4.9  (12,79)  0.1519% )


stdout
((True,28052.292341476037,2.979504643008113e-9),(1126,16930,40),"3.814325005007765E+8444")
