mirror of
https://github.com/Llewellynvdm/php-ml.git
synced 2024-11-11 16:15:50 +00:00
138 lines
3.4 KiB
PHP
138 lines
3.4 KiB
PHP
<?php
|
|
|
|
declare(strict_types=1);
|
|
|
|
namespace Phpml\Tests\Preprocessing;
|
|
|
|
use Phpml\Exception\NormalizerException;
|
|
use Phpml\Preprocessing\Normalizer;
|
|
use PHPUnit\Framework\TestCase;
|
|
|
|
class NormalizerTest extends TestCase
|
|
{
|
|
public function testThrowExceptionOnInvalidNorm(): void
|
|
{
|
|
$this->expectException(NormalizerException::class);
|
|
new Normalizer(99);
|
|
}
|
|
|
|
public function testNormalizeSamplesWithL2Norm(): void
|
|
{
|
|
$samples = [
|
|
[1, -1, 2],
|
|
[2, 0, 0],
|
|
[0, 1, -1],
|
|
];
|
|
|
|
$normalized = [
|
|
[0.4, -0.4, 0.81],
|
|
[1.0, 0.0, 0.0],
|
|
[0.0, 0.7, -0.7],
|
|
];
|
|
|
|
$normalizer = new Normalizer();
|
|
$normalizer->transform($samples);
|
|
|
|
self::assertEqualsWithDelta($normalized, $samples, $delta = 0.01);
|
|
}
|
|
|
|
public function testNormalizeSamplesWithL1Norm(): void
|
|
{
|
|
$samples = [
|
|
[1, -1, 2],
|
|
[2, 0, 0],
|
|
[0, 1, -1],
|
|
];
|
|
|
|
$normalized = [
|
|
[0.25, -0.25, 0.5],
|
|
[1.0, 0.0, 0.0],
|
|
[0.0, 0.5, -0.5],
|
|
];
|
|
|
|
$normalizer = new Normalizer(Normalizer::NORM_L1);
|
|
$normalizer->transform($samples);
|
|
|
|
self::assertEqualsWithDelta($normalized, $samples, $delta = 0.01);
|
|
}
|
|
|
|
public function testFitNotChangeNormalizerBehavior(): void
|
|
{
|
|
$samples = [
|
|
[1, -1, 2],
|
|
[2, 0, 0],
|
|
[0, 1, -1],
|
|
];
|
|
|
|
$normalized = [
|
|
[0.4, -0.4, 0.81],
|
|
[1.0, 0.0, 0.0],
|
|
[0.0, 0.7, -0.7],
|
|
];
|
|
|
|
$normalizer = new Normalizer();
|
|
$normalizer->transform($samples);
|
|
|
|
self::assertEqualsWithDelta($normalized, $samples, $delta = 0.01);
|
|
|
|
$normalizer->fit($samples);
|
|
|
|
self::assertEqualsWithDelta($normalized, $samples, $delta = 0.01);
|
|
}
|
|
|
|
public function testL1NormWithZeroSumCondition(): void
|
|
{
|
|
$samples = [
|
|
[0, 0, 0],
|
|
[2, 0, 0],
|
|
[0, 1, -1],
|
|
];
|
|
|
|
$normalized = [
|
|
[0.33, 0.33, 0.33],
|
|
[1.0, 0.0, 0.0],
|
|
[0.0, 0.5, -0.5],
|
|
];
|
|
|
|
$normalizer = new Normalizer(Normalizer::NORM_L1);
|
|
$normalizer->transform($samples);
|
|
|
|
self::assertEqualsWithDelta($normalized, $samples, $delta = 0.01);
|
|
}
|
|
|
|
public function testStandardNorm(): void
|
|
{
|
|
// Generate 10 random vectors of length 3
|
|
$samples = [];
|
|
srand(time());
|
|
for ($i = 0; $i < 10; ++$i) {
|
|
$sample = array_fill(0, 3, 0);
|
|
for ($k = 0; $k < 3; ++$k) {
|
|
$sample[$k] = random_int(1, 100);
|
|
}
|
|
|
|
// Last feature's value shared across samples.
|
|
$sample[] = 1;
|
|
|
|
$samples[] = $sample;
|
|
}
|
|
|
|
// Use standard normalization
|
|
$normalizer = new Normalizer(Normalizer::NORM_STD);
|
|
$normalizer->transform($samples);
|
|
|
|
// Values in the vector should be some value between -3 and +3
|
|
self::assertCount(10, $samples);
|
|
foreach ($samples as $sample) {
|
|
$errors = array_filter(
|
|
$sample,
|
|
function ($element): bool {
|
|
return $element < -3 || $element > 3;
|
|
}
|
|
);
|
|
self::assertCount(0, $errors);
|
|
self::assertEquals(0, $sample[3]);
|
|
}
|
|
}
|
|
}
|