2022-04-29 22:38:55 +00:00
|
|
|
import { expectErrorToBeBounded, failDefault, testRun } from "./TestHelpers";
|
2022-04-20 00:52:53 +00:00
|
|
|
import * as fc from "fast-check";
|
|
|
|
|
|
|
|
// Beware: float64Array makes it appear in an infinite loop.
|
|
|
|
/**
 * Arbitrary producing Float64Arrays of 10 to 10000 finite, non-NaN values in
 * [-999999999999999, 999999999999999], rejecting arrays whose smallest and
 * largest elements are equal (i.e. arrays with no spread).
 */
let arrayGen = () => {
  const boundedFloats = fc.float64Array({
    minLength: 10,
    max: 999999999999999,
    min: -999999999999999,
    maxLength: 10000,
    noDefaultInfinity: true,
    noNaN: true,
  });
  return boundedFloats.filter((candidate) => {
    // Convert once and reuse for both extrema.
    const values = Array.from(candidate);
    return Math.min(...values) !== Math.max(...values);
  });
};
|
2022-04-20 22:48:04 +00:00
|
|
|
|
2022-08-29 02:50:51 +00:00
|
|
|
/**
 * Builds a sample-set distribution by running the Squiggle program
 * `SampleSet.fromList([...])` through `testRun`.
 *
 * @param samples Values to embed in the program; each is rendered with
 *   `toFixed(20)` (presumably to keep the literals in plain decimal
 *   notation — confirm against the interpreter's number syntax).
 * @returns The `value` of the result when its tag is "Distribution".
 * @throws Error when the interpreter returns anything other than a
 *   distribution.
 */
let makeSampleSet = (samples: number[]) => {
  const sampleList = samples.map((sample) => sample.toFixed(20)).join(",");
  const result = testRun(`SampleSet.fromList([${sampleList}])`);
  if (result.tag !== "Distribution") {
    // Throw explicitly rather than relying on the legacy `fail` global, which
    // is not defined under every Jest runner and would then surface as a
    // ReferenceError instead of this message.
    throw new Error("Expected to be distribution");
  }
  return result.value;
};
|
|
|
|
|
|
|
|
// Module-level environment handed to the `cdf` calls in the suite below.
const env = {
  sampleCount: 10000,
  xyPointLength: 100,
};
|
|
|
|
|
|
|
|
// Property tests for the CDF of a sample-set distribution. Every test in this
// suite is currently skipped.
describe("cumulative density function", () => {
  // Known failure; we should fix this.
  test.skip("'s codomain is bounded above", () => {
    const tolerance = 5e-7;
    const boundedAbove = fc.property(arrayGen(), fc.float(), (samples, x) => {
      // Should compute with squiggle strings once interpreter has `sample`
      const dist = makeSampleSet(Array.from(samples));
      const cdfAtX = dist.cdf(env, x).value;
      expect(cdfAtX).toBeLessThanOrEqual(1 + tolerance);
    });
    fc.assert(boundedAbove);
  });

  test.skip("'s codomain is bounded below", () => {
    const boundedBelow = fc.property(arrayGen(), fc.float(), (samples, x) => {
      // Should compute with squiggle strings once interpreter has `sample`
      const dist = makeSampleSet(Array.from(samples));
      const cdfAtX = dist.cdf(env, x).value;
      expect(cdfAtX).toBeGreaterThanOrEqual(0);
    });
    fc.assert(boundedBelow);
  });

  // This may not hold because KDE can estimate there to be mass above the
  // highest value. These tests fail.
  test.skip("at the highest number in the sample is close to 1", () => {
    const nearOneAtMax = fc.property(arrayGen(), (samples) => {
      const values = Array.from(samples);
      const highest = Math.max(...values);
      // Should compute with squiggle strings once interpreter has `sample`
      const dist = makeSampleSet(values);
      const cdfAtHighest = dist.cdf(env, highest).value;
      expect(cdfAtHighest).toBeCloseTo(1.0, 2);
    });
    fc.assert(nearOneAtMax);
  });

  // I may simply be mistaken about the math here.
  test.skip("at the lowest number in the distribution is within epsilon of 0", () => {
    const epsilon = 5e-3;
    const threshold = 4 * epsilon;
    const nearZeroAtMin = fc.property(arrayGen(), (samples) => {
      const values = Array.from(samples);
      const lowest = Math.min(...values);
      // Should compute with squiggle strings once interpreter has `sample`
      const dist = makeSampleSet(values);
      const cdfAtLowest = dist.cdf(env, lowest).value;
      const highest = Math.max(...values);
      // When the whole sample sits within epsilon, the CDF at the minimum is
      // expected to exceed the threshold; otherwise to stay below it.
      if (highest - lowest < epsilon) {
        expect(cdfAtLowest).toBeGreaterThan(threshold);
      } else {
        expect(cdfAtLowest).toBeLessThan(threshold);
      }
    });
    fc.assert(nearZeroAtMin);
  });

  // I believe this is true, but due to bugs can't get the test to pass.
  test.skip("is <= 1 everywhere with equality when x is higher than the max", () => {
    const atMostOne = fc.property(arrayGen(), fc.float(), (samples, x) => {
      const values = Array.from(samples);
      const dist = makeSampleSet(values);
      const cdfAtX = dist.cdf(env, x).value;
      const highest = Math.max(...values);

      if (x > highest) {
        // Relative distance of x beyond the sample maximum.
        const slack = (x - highest) / x;
        expect(cdfAtX).toBeGreaterThan(1 - slack);
        return;
      }
      if (typeof cdfAtX !== "number") {
        failDefault();
        return;
      }
      // Round to five decimals before comparing against 1.
      expect(Math.round(1e5 * cdfAtX) / 1e5).toBeLessThanOrEqual(1);
    });
    fc.assert(atMostOne);
  });

  // NOTE: only non-negativity is asserted here; the "zero when x is lower
  // than the min" part of the title is not checked.
  test.skip("is non-negative everywhere with zero when x is lower than the min", () => {
    const nonNegative = fc.property(arrayGen(), fc.float(), (samples, x) => {
      const dist = makeSampleSet(Array.from(samples));
      const cdfAtX = dist.cdf(env, x).value;
      expect(cdfAtX).toBeGreaterThanOrEqual(0);
    });
    fc.assert(nonNegative);
  });
});
|
|
|
|
|
2022-04-20 23:07:25 +00:00
|
|
|
// I no longer believe this is true.
|
|
|
|
// Property test for the PDF of a sample-set distribution (currently skipped).
describe("probability density function", () => {
  // Suite-local environment; shadows any outer `env` inside this suite.
  const env = { sampleCount: 1000, xyPointLength: 100 };

  test.skip("assigns to the max at most the weight of the mean", () => {
    const maxNoDenserThanMean = fc.property(arrayGen(), (samples) => {
      const values = Array.from(samples);
      const highest = Math.max(...values);

      // Arithmetic mean, accumulated left to right from zero.
      let total = 0.0;
      for (const value of values) {
        total = total + value;
      }
      const average = total / values.length;

      // Should be from squiggleString once interpreter exposes sampleset
      const dist = makeSampleSet(values);
      const densityAtMean = dist.pdf(env, average).value;
      const densityAtMax = dist.pdf(env, highest).value;

      if (typeof densityAtMean !== "number" || typeof densityAtMax !== "number") {
        // At least one result is not numeric: require them to be equal.
        expect(densityAtMax).toEqual(densityAtMean);
        return;
      }
      expect(densityAtMax).toBeLessThanOrEqual(densityAtMean);
    });
    fc.assert(maxNoDenserThanMean);
  });
});
|
|
|
|
|
|
|
|
// This should be true, but I can't get it to work.
|
|
|
|
// Checks that the mean reported by a sample-set distribution stays close to
// the arithmetic mean of the samples it was built from (both tests skipped).
describe("mean is mean", () => {
  // Builds the property body shared by both tests. `sampleCountFor` maps the
  // input length n to the `sampleCount` used in the environment passed to
  // `mean`; `xyPointLength` is always 4 * n.
  const meanTracksInput =
    (sampleCountFor: (n: number) => number) => (generated: Float64Array) => {
      const values = Array.from(generated);
      const n = values.length;
      const dist = makeSampleSet(values);
      const myEnv = { sampleCount: sampleCountFor(n), xyPointLength: 4 * n };
      const mean = dist.mean(myEnv);

      if (typeof mean.value !== "number") {
        failDefault();
        return;
      }
      const expectedMean = values.reduce((acc, value) => acc + value, 0.0) / n;
      expectErrorToBeBounded(mean.value, expectedMean, 5e-1, 1);
    };

  test.skip("when sampling twice as widely as the input", () => {
    fc.assert(
      fc.property(
        fc.float64Array({ minLength: 10, maxLength: 100000 }),
        meanTracksInput((n) => 2 * n)
      )
    );
  });

  test.skip("when sampling half as widely as the input", () => {
    fc.assert(
      fc.property(
        fc.float64Array({ minLength: 10, maxLength: 100000 }),
        meanTracksInput((n) => Math.floor(n / 2))
      )
    );
  });
});
|
2022-04-29 22:38:55 +00:00
|
|
|
|
|
|
|
// Runs a Squiggle program that builds a distribution with `fromSamples` and
// compares the reported mean with the arithmetic mean of the inputs (skipped).
describe("fromSamples function", () => {
  test.skip("gives a mean near the mean of the input", () => {
    const meanIsPreserved = fc.property(arrayGen(), (samples) => {
      const values = Array.from(samples);
      // Comma-separated rendering of the samples, spliced into the program.
      const program = `x = fromSamples([${values.join(",")}]); mean(x)`;
      const outcome = testRun(program);
      const expectedMean =
        values.reduce((acc, value) => acc + value, 0.0) / values.length;
      expect(outcome.value).toBeCloseTo(expectedMean, 4);
    });
    fc.assert(meanIsPreserved);
  });
});
|