Documentation: add the vectorizer->fit() call required to build the dictionary (#155)

2025-02-13 17:38:36 +00:00 · 2017-11-16 21:40:11 +01:00 · 2017-11-16 21:40:11 +01:00 · f7537c049a
commit f7537c049a
parent a11e3f69c3
1 changed files with 8 additions and 3 deletions
--- a/docs/machine-learning/feature-extraction/token-count-vectorizer.md
+++ b/docs/machine-learning/feature-extraction/token-count-vectorizer.md
@@ -26,13 +26,18 @@ $samples = [
 ];

 $vectorizer = new TokenCountVectorizer(new WhitespaceTokenizer());
-$vectorizer->transform($samples)
-// return $vector = [
+
+// Build the dictionary.
+$vectorizer->fit($samples);
+
+// Transform the provided text samples into a vectorized list.
+$vectorizer->transform($samples);
+// $samples is modified in place and now equals [
 //    [0 => 1, 1 => 1, 2 => 2, 3 => 1, 4 => 1],
 //    [5 => 1, 6 => 1, 1 => 1, 2 => 1],
 //    [5 => 1, 7 => 2, 8 => 1, 9 => 1],
 //];
-        
+
 ```

 ### Vocabulary