mirror of
https://github.com/Llewellynvdm/php-ml.git
synced 2024-06-20 09:02:25 +00:00
17 lines
273 B
PHP
17 lines
273 B
PHP
<?php
|
|
|
|
declare(strict_types=1);
|
|
|
|
namespace Phpml\Tokenization;
|
|
|
|
/**
 * Tokenizer that extracts word-like tokens from a text.
 *
 * A token is a run of at least two consecutive word characters (`\w`), so an
 * isolated single word character is never returned. The pattern carries the
 * `u` modifier, meaning pattern and subject are handled as UTF-8.
 */
class WordTokenizer implements Tokenizer
{
    /**
     * Collects every word token found in the given text.
     *
     * @param string $text Text to scan for tokens.
     *
     * @return array Full-pattern matches, in the order they occur in $text.
     */
    public function tokenize(string $text): array
    {
        $matches = [];

        // PREG_PATTERN_ORDER (the default) puts all full-pattern matches at index 0.
        preg_match_all('/\w\w+/u', $text, $matches, PREG_PATTERN_ORDER);

        [$words] = $matches;

        return $words;
    }
}
|