jvmTest.plot.builder.sampling.method.GroupSystematicSamplingTest.kt Maven / Gradle / Ivy
/*
* Copyright (c) 2019. JetBrains s.r.o.
* Use of this source code is governed by the MIT license that can be found in the LICENSE file.
*/
package jetbrains.datalore.plot.builder.sampling.method
import jetbrains.datalore.plot.base.DataFrame
import jetbrains.datalore.plot.builder.sampling.GroupAwareSampling
import kotlin.test.*
internal class GroupSystematicSamplingTest : GroupSamplingTestBase() {
@BeforeTest
fun setUp() {
setUp(
N_POINTS,
N_GROUPS
)
}
private fun assertThat(sampleSize: Int): SamplingAssert {
return SamplingAssert(sampleSize)
}
@Test
fun noop() {
// not applicable with steps < 1.5
assertThat(N_GROUPS + 1).isNotApplicable
assertThat(N_GROUPS).isNotApplicable
assertThat(N_GROUPS - 1).isNotApplicable
assertThat(sampleSize(1.1)).isNotApplicable
// applicable with steps >= 1.5
assertThat(N_GROUPS / 2).isApplicable
val napSampling = assertThat(N_GROUPS).isNotApplicable.sampling
assertFailsWith(RuntimeException::class) {
napSampling.apply(data!!, groupMapper!!)
}
}
@Test
fun exactStep() {
// step 3 is a perfect fit when last data index in 9, 99... (i.e. that size of data is 10, 100...)
assertThat(sampleSize(3.0))
.hasGroupCount(sampleSize(3.0))
.hasGroup(0)
.hasGroup(N_GROUPS - 1)
}
@Test
fun roundDownStep() {
// rounded to closest lesser int
val targetStep = 3.1
val expectedStep = 3
assertThat(sampleSize(targetStep))
.hasGroupCount(sampleSize(expectedStep.toDouble()))
.hasGroup(0)
.hasGroup(N_GROUPS - 1)
}
@Test
fun roundUpStep() {
// rounded to closest greater int
val targetStep = 2.9
val expectedStep = 3
assertThat(sampleSize(targetStep))
.hasGroupCount(sampleSize(expectedStep.toDouble()))
.hasGroup(0)
.hasGroup(N_GROUPS - 1)
}
@Test
fun unfitStep() {
assertThat(sampleSize(2.0))
.hasGroupCount(sampleSize(2.0))
.hasGroup(0)
.hasNoGroup(N_GROUPS - 1)
}
private inner class SamplingAssert internal constructor(sampleSize: Int) {
internal val sampling: GroupAwareSampling
private val mySample: DataFrame?
internal val isApplicable: SamplingAssert
get() {
assertTrue(sampling.isApplicable(data!!, groupMapper!!))
return this
}
internal val isNotApplicable: SamplingAssert
get() {
assertFalse(sampling.isApplicable(data!!, groupMapper!!))
return this
}
init {
sampling = GroupSystematicSampling(sampleSize)
if (sampling.isApplicable(data!!, groupMapper!!)) {
mySample = sampling.apply(data!!, groupMapper!!)
} else {
mySample = null
}
}
internal fun hasGroupCount(expected: Int): SamplingAssert {
val groupCount = mySample!![GROUP_SERIE_VAR].distinct().count()
assertEquals(expected, groupCount, "Group count")
return this
}
internal fun hasGroup(distinctGroupIndex: Int): SamplingAssert {
val b = checkGroup(distinctGroupIndex)
assertTrue(b, "Group [$distinctGroupIndex]")
return this
}
internal fun hasNoGroup(distinctGroupIndex: Int): SamplingAssert {
val b = checkGroup(distinctGroupIndex)
assertFalse(b, "Group [$distinctGroupIndex]")
return this
}
private fun checkGroup(distinctGroupIndex: Int): Boolean {
val originalDistinctGroups = data!![GROUP_SERIE_VAR].distinct()
val v = originalDistinctGroups[distinctGroupIndex]
return mySample!![GROUP_SERIE_VAR].any { v == it }
}
}
companion object {
private const val N_GROUPS = 100
private const val POINTS_PER_GROUP = 100
private const val N_POINTS = N_GROUPS * POINTS_PER_GROUP
private fun sampleSize(step: Double): Int {
return SystematicSamplingTest.sampleSize(
step,
N_GROUPS
)
}
}
}