Skip to content

Commit 1508c2e

Browse files
smk2007Sheil Kumar
and
Sheil Kumar
authored
Restrict L2 Cache Core check to Intel devices (#19483)
### Description Limit SoC core detection via 2 level cache core logic to Intel and Hybrid processors. ### Motivation and Context The following code was added to add support for a new class of CPU cores present in Intel’s next generation Intel Core Ultra mobile processors. This code is essential to avoid placing threads on low performing SoC cores that don’t have L3 cache. SoC cores are meant to specialize in system bringup and help improve responsiveness and power usage, in other words they are not meant to run compute heavy AI workloads. In order to avoid broad exposure of this logic, it is currently designed to be restricted to Intel platforms that have hybrid enabled. --------- Co-authored-by: Sheil Kumar <[email protected]>
1 parent fbff99a commit 1508c2e

File tree

1 file changed

+21
-4
lines changed

1 file changed

+21
-4
lines changed

winml/lib/Api/HardwareCoreEnumerator.cpp

+21-4
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ struct LogicalProcessorInformation {
1414

1515
struct CoreCounter {
1616
uint32_t PhysicalCores = 0;
17-
uint32_t SocDieCores = 0;
17+
uint32_t Num2CacheCores = 0;
1818
};
1919

2020
static LogicalProcessorInformation GetLogicalProcessorInfos(LOGICAL_PROCESSOR_RELATIONSHIP relationship) {
@@ -75,16 +75,33 @@ static CoreCounter GetNumberOPhysicalAndEngineeringCores() {
7575
read += currentProcessorInfo->Size;
7676
}
7777

78-
cores.SocDieCores = CountSetBits(dwLevel2GroupMask & ~dwLevel3GroupMask);
78+
cores.Num2CacheCores = CountSetBits(dwLevel2GroupMask & ~dwLevel3GroupMask);
7979
return cores;
8080
}
8181

8282
uint32_t HardwareCoreEnumerator::DefaultIntraOpNumThreads() {
8383
// # of physical cores = # of P cores + # of E Cores + # of Soc Cores.
8484
// # of logical cores = # of P cores x 2 (if hyper threading is enabled) + # of E cores + # of Soc Cores.
8585
auto cores = GetNumberOPhysicalAndEngineeringCores();
86-
// We want to use the number of physical cores, but exclude soc cores
87-
return cores.PhysicalCores - cores.SocDieCores;
86+
87+
const int kVendorID_Intel[3] = {0x756e6547, 0x6c65746e, 0x49656e69}; // "GenuntelineI"
88+
int regs_leaf0[4];
89+
int regs_leaf7[4];
90+
__cpuid(regs_leaf0, 0);
91+
__cpuid(regs_leaf7, 0x7);
92+
93+
auto isIntel = (kVendorID_Intel[0] == regs_leaf0[1]) && (kVendorID_Intel[1] == regs_leaf0[2]) &&
94+
(kVendorID_Intel[2] == regs_leaf0[3]);
95+
96+
auto isHybrid = (regs_leaf7[3] & (1 << 15));
97+
98+
if (isIntel && isHybrid) {
99+
// We want to use the number of physical cores, but exclude soc cores
100+
// On Intel Hybrid processors, numSocCores == cores.Num2CacheCores
101+
return cores.PhysicalCores - cores.Num2CacheCores;
102+
}
103+
104+
return cores.PhysicalCores;
88105
}
89106

90107
} // namespace WINMLP

0 commit comments

Comments
 (0)