You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
* Typos as described in #3491
Changing "ngrams" to "n-gram"
* changing ngram -> n-gram
* typos
* addressing PR comments
* regenerating the manifest
* restoring the argument short name
* regenerating the manifest
/// <param name="skipLength">Maximum number of tokens to skip when constructing an ngram.</param>
312
-
/// <param name="useAllLengths">Whether to include all ngram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
313
-
/// <param name="maximumNgramsCount">Maximum number of ngrams to store in the dictionary.</param>
311
+
/// <param name="skipLength">Maximum number of tokens to skip when constructing an n-gram.</param>
312
+
/// <param name="useAllLengths">Whether to include all n-gram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
313
+
/// <param name="maximumNgramsCount">Maximum number of n-grams to store in the dictionary.</param>
314
314
/// <param name="weighting">Statistical measure used to evaluate how important a word is to a document in a corpus.</param>
/// <param name="skipLength">Maximum number of tokens to skip when constructing an ngram.</param>
403
-
/// <param name="useAllLengths">Whether to include all ngram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
402
+
/// <param name="skipLength">Maximum number of tokens to skip when constructing an n-gram.</param>
403
+
/// <param name="useAllLengths">Whether to include all n-gram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
404
404
/// <param name="seed">Hashing seed.</param>
405
405
/// <param name="useOrderedHashing">Whether the position of each source column should be included in the hash (when there are multiple source columns).</param>
406
406
/// <param name="maximumNumberOfInverts">During hashing we construct mappings between original values and the produced hash values.
@@ -418,7 +418,7 @@ public static Vector<float> ProduceHashedWordBags(this Scalar<string> input,
418
418
}
419
419
420
420
/// <summary>
421
-
/// Extensions for statically typed ngram estimator.
421
+
/// Extensions for statically typed n-gram estimator.
422
422
/// </summary>
423
423
public static class NgramEstimatorStaticExtensions
424
424
{
@@ -482,16 +482,16 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
482
482
}
483
483
484
484
/// <summary>
485
-
/// Produces a bag of counts of ngrams (sequences of consecutive words ) in a given tokenized text.
486
-
/// It does so by building a dictionary of ngrams and using the id in the dictionary as the index in the bag.
485
+
/// Produces a bag of counts of n-grams (sequences of consecutive words) in a given tokenized text.
486
+
/// It does so by building a dictionary of n-grams and using the id in the dictionary as the index in the bag.
487
487
///
488
488
/// <see cref="ProduceNgrams"/> is different from <see cref="WordBagEstimatorStaticExtensions.ProduceWordBags"/>
489
489
/// in a way that <see cref="ProduceNgrams"/> takes tokenized text as input while <see cref="WordBagEstimatorStaticExtensions.ProduceWordBags"/> tokenizes text internally.
490
490
/// </summary>
491
491
/// <param name="input">The column to apply to.</param>
/// <param name="skipLength">Maximum number of tokens to skip when constructing an ngram.</param>
494
-
/// <param name="useAllLengths">Whether to include all ngram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
493
+
/// <param name="skipLength">Maximum number of tokens to skip when constructing an n-gram.</param>
494
+
/// <param name="useAllLengths">Whether to include all n-gram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
495
495
/// <param name="maximumNgramsCount">Maximum number of n-grams to store in the dictionary.</param>
496
496
/// <param name="weighting">Statistical measure used to evaluate how important a word is to a document in a corpus.</param>
@@ -568,17 +568,17 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
568
568
}
569
569
570
570
/// <summary>
571
-
/// Produces a bag of counts of ngrams (sequences of consecutive words of length 1-n) in a given tokenized text.
572
-
/// It does so by hashing each ngram and using the hash value as the index in the bag.
571
+
/// Produces a bag of counts of n-grams (sequences of 1 to n consecutive words) in a given tokenized text.
572
+
/// It does so by hashing each n-gram and using the hash value as the index in the bag.
573
573
///
574
574
/// <see cref="ProduceHashedNgrams"/> is different from <see cref="WordHashBagEstimatorStaticExtensions.ProduceHashedWordBags"/>
575
575
/// in a way that <see cref="ProduceHashedNgrams"/> takes tokenized text as input while <see cref="WordHashBagEstimatorStaticExtensions.ProduceHashedWordBags"/> tokenizes text internally.
576
576
/// </summary>
577
577
/// <param name="input">The column to apply to.</param>
578
578
/// <param name="numberOfBits">Number of bits to hash into. Must be between 1 and 30, inclusive.</param>
/// <param name="skipLength">Maximum number of tokens to skip when constructing an ngram.</param>
581
-
/// <param name="useAllLengths">Whether to include all ngram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
580
+
/// <param name="skipLength">Maximum number of tokens to skip when constructing an n-gram.</param>
581
+
/// <param name="useAllLengths">Whether to include all n-gram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
582
582
/// <param name="seed">Hashing seed.</param>
583
583
/// <param name="useOrderedHashing">Whether the position of each source column should be included in the hash (when there are multiple source columns).</param>
584
584
/// <param name="maximumNumberOfInverts">During hashing we construct mappings between original values and the produced hash values.
0 commit comments