60 references to LoadVector256
Microsoft.ML.CpuMath (59)
AvxIntrinsics.cs (50)
152
return Fma.MultiplyAdd(Avx.
LoadVector256
(psrc1), src2, src3);
156
Vector256<float> product = Avx.Multiply(src2, Avx.
LoadVector256
(psrc1));
215
Vector256<float> x01 = Avx.
LoadVector256
(pMatTemp);
216
Vector256<float> x11 = Avx.
LoadVector256
(pMatTemp += ccol);
217
Vector256<float> x21 = Avx.
LoadVector256
(pMatTemp += ccol);
218
Vector256<float> x31 = Avx.
LoadVector256
(pMatTemp += ccol);
219
Vector256<float> x02 = Avx.
LoadVector256
(pSrcCurrent);
345
Vector256<float> x02 = Avx.
LoadVector256
(pMatTemp);
346
Vector256<float> x12 = Avx.
LoadVector256
(pMatTemp += crow);
347
Vector256<float> x22 = Avx.
LoadVector256
(pMatTemp += crow);
348
Vector256<float> x32 = Avx.
LoadVector256
(pMatTemp += crow);
393
Vector256<float> x02 = Avx.
LoadVector256
(pMatTemp);
394
Vector256<float> x12 = Avx.
LoadVector256
(pMatTemp += crow);
395
Vector256<float> x22 = Avx.
LoadVector256
(pMatTemp += crow);
396
Vector256<float> x32 = Avx.
LoadVector256
(pMatTemp += crow);
397
Vector256<float> x3 = Avx.
LoadVector256
(pDstCurrent);
432
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
482
Vector256<float> temp = Avx.
LoadVector256
(pDstCurrent);
497
Vector256<float> result = Avx.
LoadVector256
(pDstCurrent);
499
Vector256<float> leadingMask = Avx.
LoadVector256
(((float*)(pLeadingAlignmentMask)) + (misalignment * 8));
500
Vector256<float> trailingMask = Avx.
LoadVector256
(((float*)(pTrailingAlignmentMask)) + ((8 - misalignment) * 8));
530
Vector256<float> temp = Avx.
LoadVector256
(pDstCurrent);
551
Vector256<float> result = Avx.
LoadVector256
(pDstCurrent);
553
Vector256<float> trailingMask = Avx.
LoadVector256
(((float*)(pTrailingAlignmentMask)) + (remainder * 8));
554
Vector256<float> leadingMask = Avx.
LoadVector256
(((float*)(pLeadingAlignmentMask)) + ((8 - remainder) * 8));
584
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
630
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
678
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
735
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
838
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
839
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
891
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
938
Vector256<float> src1Vector = Avx.
LoadVector256
(pSrc1Current);
939
Vector256<float> src2Vector = Avx.
LoadVector256
(pSrc2Current);
996
result = Avx.Add(result, Avx.
LoadVector256
(pValues));
1009
Vector256<float> mask = Avx.
LoadVector256
(((float*)(pLeadingAlignmentMask)) + (misalignment * 8));
1010
Vector256<float> temp = Avx.And(mask, Avx.
LoadVector256
(pValues));
1032
result = Avx.Add(result, Avx.
LoadVector256
(pValues));
1051
Vector256<float> mask = Avx.
LoadVector256
(((float*)(pTrailingAlignmentMask)) + (remainder * 8));
1052
Vector256<float> temp = Avx.And(mask, Avx.
LoadVector256
(pValues));
1073
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1118
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1165
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1210
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1258
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1303
Vector256<float> srcVector = Avx.
LoadVector256
(pSrcCurrent);
1355
Vector256<float> dstVector = Avx.
LoadVector256
(pDstCurrent);
1466
Vector256<float> distanceVector = Avx.Subtract(Avx.
LoadVector256
(pSrcCurrent),
1467
Avx.
LoadVector256
(pDstCurrent));
1521
Vector256<float> xDst1 = Avx.
LoadVector256
(pDst1Current);
FactorizationMachine\AvxIntrinsics.cs (9)
89
Vector256<float> vjfBuffer = Avx.
LoadVector256
(vjf + k);
103
Vector256<float> vjfprimeBuffer = Avx.
LoadVector256
(vjfprime + k);
104
Vector256<float> q = Avx.
LoadVector256
(qffprime + k);
117
Vector256<float> qffBuffer = Avx.
LoadVector256
(qff + k);
132
Vector256<float> qffprimeBuffer = Avx.
LoadVector256
(qffprime + k);
133
Vector256<float> qfprimefBuffer = Avx.
LoadVector256
(qfprimef + k);
198
Vector256<float> v = Avx.
LoadVector256
(vjfprime + k);
199
Vector256<float> q = Avx.
LoadVector256
(qfprimef + k);
213
Vector256<float> h = MultiplyAdd(gLatent, gLatent, Avx.
LoadVector256
(hvjfprime + k));
System.Private.CoreLib (1)
src\libraries\System.Private.CoreLib\src\System\Runtime\Intrinsics\X86\Avx.cs (1)
727
public static unsafe Vector256<float> LoadVector256(float* address) =>
LoadVector256
(address);