time-to-botec/ocaml/samples.ml

72 lines
2.2 KiB
OCaml

(* Constants *)
let pi = acos (-1.)
let normal_95_ci_length = 1.6448536269514722
(* Array manipulation helpers *)
let sumFloats xs = Array.fold_left(fun acc x -> acc +. x) 0.0 xs
let normalizeXs xs =
let sum_xs = sumFloats xs in
Array.map(fun x -> x /. sum_xs) xs
let cumsumXs xs =
let _, cum_sum = Array.fold_left(fun (sum, ys) x ->
let new_sum = sum +. x in
new_sum, ys @ [new_sum]
) (0.0, []) xs in
cum_sum
let findIndex xs test =
let rec recursiveHelper ys i =
match ys with
| [] -> None
| z :: zs -> if test z then Some i else recursiveHelper zs (i+1)
in
recursiveHelper xs 0
(* Basic samplers *)
let sampleZeroToOne () : float = Random.float 1.0
let sampleStandardNormal (): float =
let u1 = sampleZeroToOne () in
let u2 = sampleZeroToOne () in
let z = sqrt(-2.0 *. log(u1)) *. sin(2.0 *. pi *. u2) in
z
let sampleNormal mean std = mean +. std *. (sampleStandardNormal ())
let sampleLognormal logmean logstd = exp(sampleNormal logmean logstd)
let sampleTo low high =
let loglow = log(low) in
let loghigh = log(high) in
let logmean = (loglow +. loghigh) /. 2.0 in
let logstd = (loghigh -. loglow) /. (2.0 -. normal_95_ci_length ) in
sampleLognormal logmean logstd
let mixture (samplers: (unit -> float) array) (weights: float array): float option =
if (Array.length samplers == Array.length weights)
then None
else
let normalized_weights = normalizeXs weights in
let cumsummed_normalized_weights = cumsumXs normalized_weights in
let p = sampleZeroToOne () in
let chosenSamplerIndex = findIndex cumsummed_normalized_weights (fun x -> x < p) in
let sample = match chosenSamplerIndex with
| None -> None
| Some(i) -> Some (samplers.(i) ())
in
sample
let () =
let sample0 () = 0. in
let sample1 () = 1. in
let sampleFew () = sampleTo 1. 3. in
let sampleMany () = sampleTo 2. 10. in
let p1 = 0.8 in
let p2 = 0.5 in
let p3 = p1 *. p2 in
let weights = [| 1. -. p3; p3 /. 2.; p3 /. 4.; p3/. 4. |] in
let sampler () = mixture [| sample0; sample1; sampleFew; sampleMany |] weights in
let n = 1_000_000 in
let samples = Array.init n (fun _ -> sampler ()) in
(* let mean = sumFloats samples /. n in *)
Printf.printf "Hello world\n"