You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
@@ -396,8 +394,7 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
396
394
/// <param name="seed">Hashing seed.</param>
397
395
/// <param name="ordered">Whether the position of each source column should be included in the hash (when there are multiple source columns).</param>
398
396
/// <param name="invertHash">Limit the number of keys used to generate the slot name to this many. 0 means no invert hashing, -1 means no limit.</param>
@@ -467,20 +464,19 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
467
464
}
468
465
469
466
/// <summary>
470
-
/// Produces a bag of counts of ngrams (sequences of consecutive words ) in a given text.
467
+
/// Produces a bag of counts of ngrams (sequences of consecutive words) in a given tokenized text.
471
468
/// It does so by building a dictionary of ngrams and using the id in the dictionary as the index in the bag.
472
469
///
473
-
/// /// <see cref="Ngrams"/> is different from <see cref="WordBagEstimatorExtensions.BagofWords"/>
474
-
/// in a way that <see cref="Ngrams"/> takes tokenized text as input while <see cref="WordBagEstimatorExtensions.BagofWords"/> tokenizes text internally.
470
+
/// <see cref="ToNgrams"/> is different from <see cref="WordBagEstimatorExtensions.ToBagofWords"/>
471
+
/// in that <see cref="ToNgrams"/> takes tokenized text as input while <see cref="WordBagEstimatorExtensions.ToBagofWords"/> tokenizes text internally.
475
472
/// </summary>
476
473
/// <param name="input">The column to apply to.</param>
@@ -553,11 +549,11 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
553
549
}
554
550
555
551
/// <summary>
556
-
/// Produces a bag of counts of ngrams (sequences of consecutive words of length 1-n) in a given text.
552
+
/// Produces a bag of counts of ngrams (sequences of consecutive words of length 1-n) in a given tokenized text.
557
553
/// It does so by hashing each ngram and using the hash value as the index in the bag.
558
554
///
559
-
/// <see cref="NgramsHash"/> is different from <see cref="WordHashBagEstimatorExtensions.BagofHashedWords"/>
560
-
/// in a way that <see cref="NgramsHash"/> takes tokenized text as input while <see cref="WordHashBagEstimatorExtensions.BagofHashedWords"/> tokenizes text internally.
555
+
/// <see cref="ToNgramsHash"/> is different from <see cref="WordHashBagEstimatorExtensions.ToBagofHashedWords"/>
556
+
/// in that <see cref="ToNgramsHash"/> takes tokenized text as input while <see cref="WordHashBagEstimatorExtensions.ToBagofHashedWords"/> tokenizes text internally.
561
557
/// </summary>
562
558
/// <param name="input">The column to apply to.</param>
563
559
/// <param name="hashBits">Number of bits to hash into. Must be between 1 and 30, inclusive.</param>
@@ -567,8 +563,7 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
567
563
/// <param name="seed">Hashing seed.</param>
568
564
/// <param name="ordered">Whether the position of each source column should be included in the hash (when there are multiple source columns).</param>
569
565
/// <param name="invertHash">Limit the number of keys used to generate the slot name to this many. 0 means no invert hashing, -1 means no limit.</param>
0 commit comments