2016-04-14 20:56:54 +00:00
|
|
|
<?php
|
|
|
|
|
2016-11-20 21:53:17 +00:00
|
|
|
declare(strict_types=1);
|
2016-04-14 20:56:54 +00:00
|
|
|
|
2018-01-06 12:09:33 +00:00
|
|
|
namespace Phpml\Tests\Classification;
|
2016-04-14 20:56:54 +00:00
|
|
|
|
2016-04-30 21:45:21 +00:00
|
|
|
use Phpml\Classification\NaiveBayes;
|
2018-11-07 08:39:51 +00:00
|
|
|
use Phpml\Exception\InvalidArgumentException;
|
2017-02-02 08:03:09 +00:00
|
|
|
use Phpml\ModelManager;
|
2017-02-03 11:58:25 +00:00
|
|
|
use PHPUnit\Framework\TestCase;
|
2016-04-14 20:56:54 +00:00
|
|
|
|
2017-02-03 11:58:25 +00:00
|
|
|
/**
 * Tests for the NaiveBayes classifier: single-sample and batch prediction,
 * training in several passes, persistence through ModelManager, and rejection
 * of samples whose feature count differs from the training data.
 */
class NaiveBayesTest extends TestCase
{
    /**
     * Trains on three samples (one per label) and checks that a single sample
     * passed to predict() yields the expected label.
     */
    public function testPredictSingleSample(): void
    {
        $samples = [[5, 1, 1], [1, 5, 1], [1, 1, 5]];
        $labels = ['a', 'b', 'c'];

        $classifier = new NaiveBayes();
        $classifier->train($samples, $labels);

        self::assertEquals('a', $classifier->predict([3, 1, 1]));
        self::assertEquals('b', $classifier->predict([1, 4, 1]));
        self::assertEquals('c', $classifier->predict([1, 1, 6]));
    }

    /**
     * Checks batch prediction, then calls train() a second time with a new
     * label and checks that both the new and a previously trained label are
     * predicted.
     */
    public function testPredictArrayOfSamples(): void
    {
        $trainSamples = [[5, 1, 1], [1, 5, 1], [1, 1, 5]];
        $trainLabels = ['a', 'b', 'c'];

        $testSamples = [[3, 1, 1], [5, 1, 1], [4, 3, 8], [1, 1, 2], [2, 3, 2], [1, 2, 1], [9, 5, 1], [3, 1, 2]];
        $testLabels = ['a', 'a', 'c', 'c', 'b', 'b', 'a', 'a'];

        $classifier = new NaiveBayes();
        $classifier->train($trainSamples, $trainLabels);
        $predicted = $classifier->predict($testSamples);

        self::assertEquals($testLabels, $predicted);

        // Feed an extra set of training data.
        $samples = [[1, 1, 6]];
        $labels = ['d'];
        $classifier->train($samples, $labels);

        $testSamples = [[1, 1, 6], [5, 1, 1]];
        $testLabels = ['d', 'a'];

        self::assertEquals($testLabels, $classifier->predict($testSamples));
    }

    /**
     * A classifier saved to a file and restored from it must equal the original
     * and produce the same predictions.
     */
    public function testSaveAndRestore(): void
    {
        $this->assertSurvivesSaveAndRestore(
            [[5, 1, 1], [1, 5, 1], [1, 1, 5]],
            ['a', 'b', 'c'],
            [[3, 1, 1], [5, 1, 1], [4, 3, 8]]
        );
    }

    /**
     * Same scenario as testPredictSingleSample(), with numeric-string labels.
     */
    public function testPredictSimpleNumericLabels(): void
    {
        $samples = [[5, 1, 1], [1, 5, 1], [1, 1, 5]];
        $labels = ['1996', '1997', '1998'];

        $classifier = new NaiveBayes();
        $classifier->train($samples, $labels);

        self::assertEquals('1996', $classifier->predict([3, 1, 1]));
        self::assertEquals('1997', $classifier->predict([1, 4, 1]));
        self::assertEquals('1998', $classifier->predict([1, 1, 6]));
    }

    /**
     * Same scenario as testPredictArrayOfSamples(), with numeric-string labels.
     */
    public function testPredictArrayOfSamplesNumericalLabels(): void
    {
        $trainSamples = [[5, 1, 1], [1, 5, 1], [1, 1, 5]];
        $trainLabels = ['1996', '1997', '1998'];

        $testSamples = [[3, 1, 1], [5, 1, 1], [4, 3, 8], [1, 1, 2], [2, 3, 2], [1, 2, 1], [9, 5, 1], [3, 1, 2]];
        $testLabels = ['1996', '1996', '1998', '1998', '1997', '1997', '1996', '1996'];

        $classifier = new NaiveBayes();
        $classifier->train($trainSamples, $trainLabels);
        $predicted = $classifier->predict($testSamples);

        self::assertEquals($testLabels, $predicted);

        // Feed an extra set of training data.
        $samples = [[1, 1, 6]];
        $labels = ['1999'];
        $classifier->train($samples, $labels);

        $testSamples = [[1, 1, 6], [5, 1, 1]];
        $testLabels = ['1999', '1996'];

        self::assertEquals($testLabels, $classifier->predict($testSamples));
    }

    /**
     * Same scenario as testSaveAndRestore(), with numeric-string labels.
     */
    public function testSaveAndRestoreNumericLabels(): void
    {
        $this->assertSurvivesSaveAndRestore(
            [[5, 1, 1], [1, 5, 1], [1, 1, 5]],
            ['1996', '1997', '1998'],
            [[3, 1, 1], [5, 1, 1], [4, 3, 8]]
        );
    }

    /**
     * predict() must throw InvalidArgumentException when one of the samples
     * (here [5, 1]) has fewer features than the training samples.
     */
    public function testInconsistentFeaturesInSamples(): void
    {
        $trainSamples = [[5, 1, 1], [1, 5, 1], [1, 1, 5]];
        $trainLabels = ['1996', '1997', '1998'];

        $testSamples = [[3, 1, 1], [5, 1], [4, 3, 8]];

        $classifier = new NaiveBayes();
        $classifier->train($trainSamples, $trainLabels);

        // Registered after train() so that only predict() can satisfy the expectation.
        $this->expectException(InvalidArgumentException::class);

        $classifier->predict($testSamples);
    }

    /**
     * Trains a classifier, saves it to a temporary file through ModelManager,
     * restores it, and asserts that the restored instance equals the original
     * and predicts the same labels for $testSamples.
     *
     * The temporary file is always removed, including when saving, restoring
     * or an assertion fails.
     *
     * NOTE(review): the assertions in this class use assertEquals (loose
     * comparison), so an int 1996 would also match '1996'. Confirm that
     * predict() returns labels with their original type before tightening
     * any of them to assertSame.
     *
     * @param array $trainSamples samples passed to train()
     * @param array $trainLabels  labels passed to train(), one per sample
     * @param array $testSamples  samples predicted before and after the round trip
     */
    private function assertSurvivesSaveAndRestore(array $trainSamples, array $trainLabels, array $testSamples): void
    {
        $classifier = new NaiveBayes();
        $classifier->train($trainSamples, $trainLabels);
        $predicted = $classifier->predict($testSamples);

        $filename = 'naive-bayes-test-'.random_int(100, 999).'-'.uniqid('', false);
        // tempnam() creates the file on disk; the cast turns a `false` failure into ''.
        $filepath = (string) tempnam(sys_get_temp_dir(), $filename);

        try {
            $modelManager = new ModelManager();
            $modelManager->saveToFile($classifier, $filepath);

            $restoredClassifier = $modelManager->restoreFromFile($filepath);

            self::assertEquals($classifier, $restoredClassifier);
            self::assertEquals($predicted, $restoredClassifier->predict($testSamples));
        } finally {
            // Guarded so a failed tempnam() ('' path) does not raise an unlink warning.
            if (is_file($filepath)) {
                unlink($filepath);
            }
        }
    }
}
|