You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
64
-
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
64
+
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.
65
+
/// This column's data type will be a vector of keys.</param>
66
+
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the
67
+
/// <paramref name="outputColumnName"/> will be used as source.
68
+
/// This estimator operates over text data type.</param>
65
69
/// <param name="useMarkerCharacters">Whether to prepend a marker character, <see langword="0x02"/>, to the beginning,
66
70
/// and append another marker character, <see langword="0x03"/>, to the end of the output vector of characters.</param>
67
71
/// <example>
@@ -85,7 +89,6 @@ public static TokenizingByCharactersEstimator TokenizeIntoCharactersAsKeys(this
85
89
/// <param name="useMarkerCharacters">Whether to prepend a marker character, <see langword="0x02"/>, to the beginning,
86
90
/// and append another marker character, <see langword="0x03"/>, to the end of the output vector of characters.</param>
87
91
/// <param name="columns">Pairs of columns to run the tokenization on.</param>
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
105
-
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
107
+
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.
108
+
/// This column's data type will remain scalar of text or a vector of text depending on the input column data type.</param>
109
+
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>,
110
+
/// the value of the <paramref name="outputColumnName"/> will be used as source.
111
+
/// This estimator operates on text and vector of text data types.</param>
106
112
/// <param name="caseMode">Casing text using the rules of the invariant culture.</param>
107
113
/// <param name="keepDiacritics">Whether to keep diacritical marks or remove them.</param>
108
114
/// <param name="keepPunctuations">Whether to keep punctuation marks or remove them.</param>
@@ -124,10 +130,16 @@ public static TextNormalizingEstimator NormalizeText(this TransformsCatalog.Text
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
130
-
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
138
+
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.
139
+
/// This column's data type will be a vector of <see cref="System.Single"/>.</param>
140
+
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>,
141
+
/// the value of the <paramref name="outputColumnName"/> will be used as source.
142
+
/// This estimator operates over vector of text data type.</param>
131
143
/// <param name="modelKind">The embeddings <see cref="WordEmbeddingEstimator.PretrainedModelKind"/> to use. </param>
132
144
/// <example>
133
145
/// <format type="text/markdown">
@@ -142,11 +154,17 @@ public static WordEmbeddingEstimator ApplyWordEmbedding(this TransformsCatalog.T
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
187
-
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
206
+
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.
207
+
/// This column's data type will be a vector of text.</param>
208
+
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.
209
+
/// This estimator operates over text data type.</param>
188
210
/// <param name="separators">The separators to use (uses space character by default).</param>
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
218
-
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
239
+
/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.
240
+
/// This column's data type will be a vector of <see cref="System.Single"/>.</param>
241
+
/// <param name="inputColumnName">Name of the column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.
242
+
/// This estimator operates over vectors of keys data type.</param>
/// <param name="skipLength">Maximum number of tokens to skip when constructing an ngram.</param>
244
+
/// <param name="skipLength">Number of tokens to skip between each ngram. By default no token is skipped.</param>
221
245
/// <param name="useAllLengths">Whether to include all ngram lengths up to <paramref name="ngramLength"/> or only <paramref name="ngramLength"/>.</param>
222
246
/// <param name="maximumNgramsCount">Maximum number of n-grams to store in the dictionary.</param>
223
-
/// <param name="weighting">Statistical measure used to evaluate how important a word is to a document in a corpus.</param>
247
+
/// <param name="weighting">Statistical measure used to evaluate how important a word or ngram is to a document in a corpus.
248
+
/// When <paramref name="maximumNgramsCount"/> is smaller than the total number of encountered ngrams this measure is used
0 commit comments