1
0
mirror of https://github.com/sjwhitworth/golearn.git synced 2025-04-25 13:48:49 +08:00
golearn/base/util_test.go
Richard Townsend 527c6476e1 Optimised version of KNN for Euclidean distances
This patch also:
   * Completes removal of the edf/ package
   * Corrects an erroneous print statement
   * Introduces two new CSV functions
      * ParseCSVToInstancesTemplated makes sure that
        reading a second CSV file maintains strict Attribute
        compatibility with an existing DenseInstances
      * ParseCSVToInstancesWithAttributeGroups gives more control
        over where Attributes end up in memory, important for
        gaining predictable control over the KNN optimisation
      * Decouples BinaryAttributeGroup from FixedAttributeGroup for
        better casting support
2014-09-30 23:10:22 +01:00

112 lines
3.7 KiB
Go

package base
import (
. "github.com/smartystreets/goconvey/convey"
"testing"
)
func TestClassDistributionAfterSplit(t *testing.T) {
Convey("Given the PlayTennis dataset", t, func() {
inst, err := ParseCSVToInstances("../examples/datasets/tennis.csv", true)
So(err, ShouldEqual, nil)
Convey("Splitting on Sunny should give the right result...", func() {
result := GetClassDistributionAfterSplit(inst, inst.AllAttributes()[0])
So(result["sunny"]["no"], ShouldEqual, 3)
So(result["sunny"]["yes"], ShouldEqual, 2)
So(result["overcast"]["yes"], ShouldEqual, 4)
So(result["rainy"]["yes"], ShouldEqual, 3)
So(result["rainy"]["no"], ShouldEqual, 2)
})
})
}
func TestPackAndUnpack(t *testing.T) {
Convey("Given some uint64", t, func() {
x := uint64(0xDEADBEEF)
Convey("When the integer is packed", func() {
packed := PackU64ToBytes(x)
Convey("And then unpacked", func() {
unpacked := UnpackBytesToU64(packed)
Convey("The unpacked version should be the same", func() {
So(x, ShouldEqual, unpacked)
})
})
})
})
Convey("Given another uint64", t, func() {
x := uint64(1)
Convey("When the integer is packed", func() {
packed := PackU64ToBytes(x)
Convey("And then unpacked", func() {
unpacked := UnpackBytesToU64(packed)
Convey("The unpacked version should be the same", func() {
So(x, ShouldEqual, unpacked)
})
})
})
})
}
func TestPackAndUnpackFloat(t *testing.T) {
Convey("Given some float", t, func() {
x := 1.2011
Convey("When the float gets packed", func() {
packed := PackFloatToBytes(x)
Convey("And then unpacked", func() {
unpacked := UnpackBytesToFloat(packed)
Convey("The unpacked version should be the same", func() {
So(unpacked, ShouldEqual, x)
})
})
})
})
}
func TestStrictlyCompatable(t *testing.T) {
Convey("Given two datasets...", t, func() {
Convey("Given two identical datasets", func() {
// Violates the requirement that both CategoricalAttributes
// must have values in the same order
d1, err := ParseCSVToInstances("../examples/datasets/exam.csv", true)
So(err, ShouldEqual, nil)
d2, err := ParseCSVToInstances("../examples/datasets/exams.csv", true)
So(err, ShouldEqual, nil)
So(CheckStrictlyCompatible(d1, d2), ShouldEqual, true)
})
Convey("Given two identical datasets (apart from sorting)", func() {
// Violates the requirement that both CategoricalAttributes
// must have values in the same order
d1, err := ParseCSVToInstances("../examples/datasets/iris_sorted_asc.csv", true)
So(err, ShouldEqual, nil)
d2, err := ParseCSVToInstances("../examples/datasets/iris_sorted_desc.csv", true)
So(err, ShouldEqual, nil)
So(CheckStrictlyCompatible(d1, d2), ShouldEqual, false)
})
Convey("Given two different datasets...", func() {
// Violates verything
d1, err := ParseCSVToInstances("../examples/datasets/tennis.csv", true)
So(err, ShouldEqual, nil)
d2, err := ParseCSVToInstances("../examples/datasets/iris_sorted_desc.csv", true)
So(err, ShouldEqual, nil)
So(CheckStrictlyCompatible(d1, d2), ShouldEqual, false)
})
})
}
func TestCategoricalEquality(t *testing.T) {
Convey("Given two outwardly identical class Attributes...", t, func() {
d1, err := ParseCSVToInstances("../examples/datasets/iris_sorted_asc.csv", true)
So(err, ShouldEqual, nil)
d2, err := ParseCSVToInstances("../examples/datasets/iris_sorted_desc.csv", true)
So(err, ShouldEqual, nil)
c1 := d1.AllClassAttributes()[0]
c2 := d2.AllClassAttributes()[0]
So(c1.GetName(), ShouldEqual, c2.GetName())
So(c1.Equals(c2), ShouldBeFalse)
So(c2.Equals(c1), ShouldBeFalse) // Violates the fact that Attributes must appear in the same order
})
}