2016-06-14 11:54:04 +02:00
|
|
|
<?php
|
|
|
|
|
2016-11-20 22:53:17 +01:00
|
|
|
declare(strict_types=1);
|
2016-06-14 11:54:04 +02:00
|
|
|
|
|
|
|
namespace tests\Phpml\FeatureExtraction;
|
|
|
|
|
|
|
|
use Phpml\FeatureExtraction\StopWords;
|
2017-02-03 12:58:25 +01:00
|
|
|
use PHPUnit\Framework\TestCase;
|
2016-06-14 11:54:04 +02:00
|
|
|
|
2017-02-03 12:58:25 +01:00
|
|
|
class StopWordsTest extends TestCase
|
2016-06-14 11:54:04 +02:00
|
|
|
{
|
|
|
|
public function testCustomStopWords()
|
|
|
|
{
|
|
|
|
$stopWords = new StopWords(['lorem', 'ipsum', 'dolor']);
|
|
|
|
|
|
|
|
$this->assertTrue($stopWords->isStopWord('lorem'));
|
|
|
|
$this->assertTrue($stopWords->isStopWord('ipsum'));
|
|
|
|
$this->assertTrue($stopWords->isStopWord('dolor'));
|
|
|
|
|
|
|
|
$this->assertFalse($stopWords->isStopWord('consectetur'));
|
|
|
|
$this->assertFalse($stopWords->isStopWord('adipiscing'));
|
|
|
|
$this->assertFalse($stopWords->isStopWord('amet'));
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @expectedException \Phpml\Exception\InvalidArgumentException
|
|
|
|
*/
|
|
|
|
public function testThrowExceptionOnInvalidLanguage()
|
|
|
|
{
|
|
|
|
StopWords::factory('Lorem');
|
|
|
|
}
|
|
|
|
|
|
|
|
public function testEnglishStopWords()
|
|
|
|
{
|
|
|
|
$stopWords = StopWords::factory('English');
|
|
|
|
|
|
|
|
$this->assertTrue($stopWords->isStopWord('again'));
|
|
|
|
$this->assertFalse($stopWords->isStopWord('strategy'));
|
|
|
|
}
|
|
|
|
|
|
|
|
public function testPolishStopWords()
|
|
|
|
{
|
|
|
|
$stopWords = StopWords::factory('Polish');
|
|
|
|
|
|
|
|
$this->assertTrue($stopWords->isStopWord('wam'));
|
|
|
|
$this->assertFalse($stopWords->isStopWord('transhumanizm'));
|
|
|
|
}
|
2017-05-22 23:18:27 +02:00
|
|
|
|
|
|
|
public function testFrenchStopWords()
|
|
|
|
{
|
|
|
|
$stopWords = StopWords::factory('French');
|
|
|
|
|
|
|
|
$this->assertTrue($stopWords->isStopWord('alors'));
|
|
|
|
$this->assertFalse($stopWords->isStopWord('carte'));
|
|
|
|
}
|
2016-06-14 11:54:04 +02:00
|
|
|
}
|