php-ml/src/Tokenization/WordTokenizer.php
2018-02-10 12:08:58 +01:00

17 lines
273 B
PHP

<?php
declare(strict_types=1);
namespace Phpml\Tokenization;
class WordTokenizer implements Tokenizer
{
    /**
     * Extracts word tokens from the given text.
     *
     * A token is any run of two or more consecutive word characters (`\w`),
     * matched with the `u` (UTF-8) pattern modifier. Isolated single word
     * characters and all non-word characters are left out of the result.
     *
     * @param string $text Text to split into tokens.
     *
     * @return string[] The matched tokens, in the order they occur in $text.
     */
    public function tokenize(string $text): array
    {
        $matches = [];
        preg_match_all('/\w\w+/u', $text, $matches, PREG_PATTERN_ORDER);

        // In pattern order, index 0 holds the full-pattern matches.
        $words = $matches[0];

        return $words;
    }
}