60 references to LoadVector256
Microsoft.ML.CpuMath (59)
AvxIntrinsics.cs (50)
152return Fma.MultiplyAdd(Avx.LoadVector256(psrc1), src2, src3); 156Vector256<float> product = Avx.Multiply(src2, Avx.LoadVector256(psrc1)); 215Vector256<float> x01 = Avx.LoadVector256(pMatTemp); 216Vector256<float> x11 = Avx.LoadVector256(pMatTemp += ccol); 217Vector256<float> x21 = Avx.LoadVector256(pMatTemp += ccol); 218Vector256<float> x31 = Avx.LoadVector256(pMatTemp += ccol); 219Vector256<float> x02 = Avx.LoadVector256(pSrcCurrent); 345Vector256<float> x02 = Avx.LoadVector256(pMatTemp); 346Vector256<float> x12 = Avx.LoadVector256(pMatTemp += crow); 347Vector256<float> x22 = Avx.LoadVector256(pMatTemp += crow); 348Vector256<float> x32 = Avx.LoadVector256(pMatTemp += crow); 393Vector256<float> x02 = Avx.LoadVector256(pMatTemp); 394Vector256<float> x12 = Avx.LoadVector256(pMatTemp += crow); 395Vector256<float> x22 = Avx.LoadVector256(pMatTemp += crow); 396Vector256<float> x32 = Avx.LoadVector256(pMatTemp += crow); 397Vector256<float> x3 = Avx.LoadVector256(pDstCurrent); 432Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 482Vector256<float> temp = Avx.LoadVector256(pDstCurrent); 497Vector256<float> result = Avx.LoadVector256(pDstCurrent); 499Vector256<float> leadingMask = Avx.LoadVector256(((float*)(pLeadingAlignmentMask)) + (misalignment * 8)); 500Vector256<float> trailingMask = Avx.LoadVector256(((float*)(pTrailingAlignmentMask)) + ((8 - misalignment) * 8)); 530Vector256<float> temp = Avx.LoadVector256(pDstCurrent); 551Vector256<float> result = Avx.LoadVector256(pDstCurrent); 553Vector256<float> trailingMask = Avx.LoadVector256(((float*)(pTrailingAlignmentMask)) + (remainder * 8)); 554Vector256<float> leadingMask = Avx.LoadVector256(((float*)(pLeadingAlignmentMask)) + ((8 - remainder) * 8)); 584Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 630Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 678Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 735Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 838Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 839Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 891Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 938Vector256<float> src1Vector = Avx.LoadVector256(pSrc1Current); 939Vector256<float> src2Vector = Avx.LoadVector256(pSrc2Current); 996result = Avx.Add(result, Avx.LoadVector256(pValues)); 1009Vector256<float> mask = Avx.LoadVector256(((float*)(pLeadingAlignmentMask)) + (misalignment * 8)); 1010Vector256<float> temp = Avx.And(mask, Avx.LoadVector256(pValues)); 1032result = Avx.Add(result, Avx.LoadVector256(pValues)); 1051Vector256<float> mask = Avx.LoadVector256(((float*)(pTrailingAlignmentMask)) + (remainder * 8)); 1052Vector256<float> temp = Avx.And(mask, Avx.LoadVector256(pValues)); 1073Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1118Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1165Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1210Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1258Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1303Vector256<float> srcVector = Avx.LoadVector256(pSrcCurrent); 1355Vector256<float> dstVector = Avx.LoadVector256(pDstCurrent); 1466Vector256<float> distanceVector = Avx.Subtract(Avx.LoadVector256(pSrcCurrent), 1467Avx.LoadVector256(pDstCurrent)); 1521Vector256<float> xDst1 = Avx.LoadVector256(pDst1Current);
FactorizationMachine\AvxIntrinsics.cs (9)
89Vector256<float> vjfBuffer = Avx.LoadVector256(vjf + k); 103Vector256<float> vjfprimeBuffer = Avx.LoadVector256(vjfprime + k); 104Vector256<float> q = Avx.LoadVector256(qffprime + k); 117Vector256<float> qffBuffer = Avx.LoadVector256(qff + k); 132Vector256<float> qffprimeBuffer = Avx.LoadVector256(qffprime + k); 133Vector256<float> qfprimefBuffer = Avx.LoadVector256(qfprimef + k); 198Vector256<float> v = Avx.LoadVector256(vjfprime + k); 199Vector256<float> q = Avx.LoadVector256(qfprimef + k); 213Vector256<float> h = MultiplyAdd(gLatent, gLatent, Avx.LoadVector256(hvjfprime + k));
System.Private.CoreLib (1)
src\libraries\System.Private.CoreLib\src\System\Runtime\Intrinsics\X86\Avx.cs (1)
727public static unsafe Vector256<float> LoadVector256(float* address) => LoadVector256(address);