php-ml/tests/Phpml/FeatureExtraction/StopWordsTest.php

49 lines
1.3 KiB
PHP
Raw Normal View History

2016-06-14 09:54:04 +00:00
<?php
2016-11-20 21:53:17 +00:00
declare(strict_types=1);
2016-06-14 09:54:04 +00:00
namespace tests\Phpml\FeatureExtraction;
use Phpml\FeatureExtraction\StopWords;
2017-02-03 11:58:25 +00:00
use PHPUnit\Framework\TestCase;
2016-06-14 09:54:04 +00:00
2017-02-03 11:58:25 +00:00
class StopWordsTest extends TestCase
2016-06-14 09:54:04 +00:00
{
/**
 * Checks a StopWords instance built from an explicit word list: the supplied
 * words are asserted to be stop words, other words are asserted not to be.
 */
public function testCustomStopWords()
{
    $listed = ['lorem', 'ipsum', 'dolor'];
    $unlisted = ['consectetur', 'adipiscing', 'amet'];

    $filter = new StopWords($listed);

    // Each word handed to the constructor must be reported as a stop word.
    foreach ($listed as $word) {
        $this->assertTrue($filter->isStopWord($word));
    }

    // Words that were never supplied must be rejected.
    foreach ($unlisted as $word) {
        $this->assertFalse($filter->isStopWord($word));
    }
}
/**
 * Asking the factory for the unknown language 'Lorem' must throw
 * \Phpml\Exception\InvalidArgumentException.
 *
 * The expectation is declared with the expectException() method instead of
 * the docblock-annotation form, which PHPUnit deprecated in 8.0 and removed
 * in 9.0.
 */
public function testThrowExceptionOnInvalidLanguage()
{
    // Fully qualified so that no additional `use` statement is required.
    $this->expectException(\Phpml\Exception\InvalidArgumentException::class);

    StopWords::factory('Lorem');
}
/**
 * Checks the StopWords instance returned by the factory for 'English':
 * 'again' is asserted to be a stop word, 'strategy' is asserted not to be.
 */
public function testEnglishStopWords()
{
    $english = StopWords::factory('English');

    $againIsStopWord = $english->isStopWord('again');
    $this->assertTrue($againIsStopWord);

    $strategyIsStopWord = $english->isStopWord('strategy');
    $this->assertFalse($strategyIsStopWord);
}
/**
 * Checks the StopWords instance returned by the factory for 'Polish':
 * 'wam' is asserted to be a stop word, 'transhumanizm' is asserted not to be.
 */
public function testPolishStopWords()
{
    $polish = StopWords::factory('Polish');

    $wamIsStopWord = $polish->isStopWord('wam');
    $this->assertTrue($wamIsStopWord);

    $transhumanizmIsStopWord = $polish->isStopWord('transhumanizm');
    $this->assertFalse($transhumanizmIsStopWord);
}
}