2017-02-17 01:23:55 +03:00
|
|
|
<?php
|
|
|
|
|
|
|
|
declare(strict_types=1);
|
|
|
|
|
2017-09-02 21:39:59 +02:00
|
|
|
namespace tests\Phpml\Classification\Linear;
|
2017-02-17 01:23:55 +03:00
|
|
|
|
|
|
|
use Phpml\Classification\Linear\DecisionStump;
|
|
|
|
use Phpml\ModelManager;
|
|
|
|
use PHPUnit\Framework\TestCase;
|
|
|
|
|
|
|
|
/**
 * Tests for the DecisionStump classifier: prediction on small 2D datasets
 * and persistence of a trained model through ModelManager.
 */
class DecisionStumpTest extends TestCase
{
    /**
     * Trains a fresh DecisionStump on three small 2D datasets in turn and
     * checks the labels predicted for points near each training cluster.
     *
     * @return DecisionStump the classifier trained on the last (three-class) dataset
     */
    public function testPredictSingleSample(): DecisionStump
    {
        // Samples should be separable with a line perpendicular
        // to any dimension given in the dataset
        //
        // First: horizontal test (the label follows the second coordinate)
        $samples = [[0, 0], [1, 0], [0, 1], [1, 1]];
        $targets = [0, 0, 1, 1];
        $classifier = new DecisionStump();
        $classifier->train($samples, $targets);
        $this->assertEquals(0, $classifier->predict([0.1, 0.2]));
        $this->assertEquals(0, $classifier->predict([1.1, 0.2]));
        $this->assertEquals(1, $classifier->predict([0.1, 0.99]));
        $this->assertEquals(1, $classifier->predict([1.1, 0.8]));

        // Then: vertical test (the label follows the first coordinate)
        $samples = [[0, 0], [1, 0], [0, 1], [1, 1]];
        $targets = [0, 1, 0, 1];
        $classifier = new DecisionStump();
        $classifier->train($samples, $targets);
        $this->assertEquals(0, $classifier->predict([0.1, 0.2]));
        $this->assertEquals(0, $classifier->predict([0.1, 1.1]));
        $this->assertEquals(1, $classifier->predict([1.0, 0.99]));
        $this->assertEquals(1, $classifier->predict([1.1, 0.1]));

        // By use of One-v-Rest, DecisionStump can perform multi-class classification
        // The samples should be separable by lines perpendicular to the dimensions
        $samples = [
            [0, 0], [0, 1], [1, 0], [1, 1], // First group : a cluster at bottom-left corner in 2D
            [5, 5], [6, 5], [5, 6], [7, 5], // Second group: another cluster at the middle-right
            [3, 10], [3, 10], [3, 8], [3, 9], // Third group : cluster at the top-middle
        ];
        $targets = [0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2];

        $classifier = new DecisionStump();
        $classifier->train($samples, $targets);
        $this->assertEquals(0, $classifier->predict([0.5, 0.5]));
        $this->assertEquals(1, $classifier->predict([6.0, 5.0]));
        $this->assertEquals(2, $classifier->predict([3.5, 9.5]));

        return $classifier;
    }

    /**
     * Saves a trained DecisionStump to a temporary file, restores it, and
     * checks that the restored object equals the original and yields the
     * same predictions for the same samples.
     */
    public function testSaveAndRestore(): void
    {
        // Instantiate a new DecisionStump trained on the OR problem
        $samples = [[0, 0], [1, 0], [0, 1], [1, 1]];
        $targets = [0, 1, 1, 1];
        $classifier = new DecisionStump();
        $classifier->train($samples, $targets);
        $testSamples = [[0, 1], [1, 1], [0.2, 0.1]];
        $predicted = $classifier->predict($testSamples);

        $filename = 'dstump-test-'.random_int(100, 999).'-'.uniqid();
        $filepath = tempnam(sys_get_temp_dir(), $filename);
        // tempnam() returns false on failure; fail here with a clear message
        // rather than with a type error further down.
        $this->assertNotFalse($filepath, 'Could not create a temporary file for the model');

        try {
            $modelManager = new ModelManager();
            $modelManager->saveToFile($classifier, $filepath);

            $restoredClassifier = $modelManager->restoreFromFile($filepath);
            $this->assertEquals($classifier, $restoredClassifier);
            $this->assertEquals($predicted, $restoredClassifier->predict($testSamples));
        } finally {
            // tempnam() creates the file on disk, so remove it even when an
            // assertion above fails to avoid leaking temp files between runs.
            if (is_file($filepath)) {
                unlink($filepath);
            }
        }
    }
}
|