<?php

declare(strict_types=1);

namespace Phpml\Tests\Dataset;

use Phpml\Dataset\FilesDataset;
use Phpml\Exception\DatasetException;
use PHPUnit\Framework\TestCase;

/**
 * Tests for FilesDataset: construction from a directory tree and the
 * samples/targets it exposes.
 */
class FilesDatasetTest extends TestCase
{
    /**
     * Constructing the dataset with a root path that does not exist must
     * raise a DatasetException.
     */
    public function testThrowExceptionOnMissingRootFolder(): void
    {
        // The expectation has to be registered before the throwing call.
        $this->expectException(DatasetException::class);

        new FilesDataset('some/not/existed/path');
    }

    /**
     * Loads the BBC fixture stored next to this test file and checks the
     * number of samples/targets, the set of distinct targets, and the
     * first and last sample/target pairs.
     */
    public function testLoadFilesDatasetWithBBCData(): void
    {
        $rootPath = __DIR__.'/Resources/bbc';

        $dataset = new FilesDataset($rootPath);

        self::assertCount(50, $dataset->getSamples());
        self::assertCount(50, $dataset->getTargets());

        // array_unique() keeps the original keys, so re-index before comparing.
        $targets = ['business', 'entertainment', 'politics', 'sport', 'tech'];
        self::assertSame($targets, array_values(array_unique($dataset->getTargets())));

        // assertSame() is used for the string comparisons so that a failed
        // fixture read (false) can never loosely match an empty sample.
        $firstSample = file_get_contents($rootPath.'/business/001.txt');
        self::assertSame($firstSample, $dataset->getSamples()[0][0]);

        $firstTarget = 'business';
        self::assertSame($firstTarget, $dataset->getTargets()[0]);

        $lastSample = file_get_contents($rootPath.'/tech/010.txt');
        self::assertSame($lastSample, $dataset->getSamples()[49][0]);

        $lastTarget = 'tech';
        self::assertSame($lastTarget, $dataset->getTargets()[49]);
    }
}