We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 08c2763 commit 141c6c0 · Copy full SHA for 141c6c0
src/Microsoft.ML.Auto/ColumnInference/PurposeInference.cs
@@ -145,7 +145,7 @@ public void Apply(IntermediateColumn[] columns)
145
Double avgLength = 1.0 * sumLength / data.Length;
146
Double cardinalityRatio = 1.0 * seen.Count / data.Length;
147
Double avgSpaces = 1.0 * sumSpaces / data.Length;
148
- if (cardinalityRatio < 0.7 || seen.Count < 100)
+ if (cardinalityRatio < 0.7)
149
column.SuggestedPurpose = ColumnPurpose.CategoricalFeature;
150
// (note: the columns.Count() == 1 condition below, in case a dataset has only
151
// a 'name' and a 'label' column, forces what would be an 'ignore' column to become a text feature)
0 commit comments