74 references to SseIntrinsics
Microsoft.ML.CpuMath (49)
AvxIntrinsics.cs (34)
94tmp = SseIntrinsics.Rotate(in tmp); 96tmp = SseIntrinsics.Rotate(in tmp); 98tmp = SseIntrinsics.Rotate(in tmp); 102tmp = SseIntrinsics.Rotate(in tmp); 104tmp = SseIntrinsics.Rotate(in tmp); 106tmp = SseIntrinsics.Rotate(in tmp); 805Vector128<float> dstVector = SseIntrinsics.Load4(pDstCurrent, pIdxCurrent); 809SseIntrinsics.Store4(in dstVector, pDstCurrent, pIdxCurrent); 902Vector128<float> dstVector = SseIntrinsics.Load4(pDstCurrent, pIdxCurrent); 906SseIntrinsics.Store4(in dstVector, pDstCurrent, pIdxCurrent); 1092result128 = SseIntrinsics.VectorSum128(in result128); 1139result128 = SseIntrinsics.VectorSum128(in result128); 1179result128 = Sse.Add(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1184result128 = SseIntrinsics.VectorSum128(in result128); 1189result128 = Sse.AddScalar(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1227result128 = Sse.Add(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1232result128 = SseIntrinsics.VectorSum128(in result128); 1238result128 = Sse.AddScalar(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1272result128 = Sse.Max(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1277result128 = SseIntrinsics.VectorMax128(in result128); 1282result128 = Sse.MaxScalar(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1320result128 = Sse.Max(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1325result128 = SseIntrinsics.VectorMax128(in result128); 1331result128 = Sse.MaxScalar(result128, Sse.And(srcVector, SseIntrinsics.AbsMask128)); 1377result128 = SseIntrinsics.VectorSum128(in result128); 1425Vector128<float> srcVector = SseIntrinsics.Load4(pSrcCurrent, pIdxCurrent); 1434result128 = SseIntrinsics.VectorSum128(in result128); 1438Vector128<float> srcVector = SseIntrinsics.Load1(pSrcCurrent, pIdxCurrent); 1489sqDistanceVector128 = SseIntrinsics.VectorSum128(in sqDistanceVector128); 1542Vector128<float> xDst2 = SseIntrinsics.GetNewDst128(xDst1, xThreshold128); 1599Vector128<float> xDst1 = SseIntrinsics.Load4(pdst1, pIdxCurrent); 1601Vector128<float> xDst2 = SseIntrinsics.GetNewDst128(xDst1, xThreshold128); 1603SseIntrinsics.Store4(in xDst1, pdst1, pIdxCurrent); 1604SseIntrinsics.Store4(in xDst2, pdst2, pIdxCurrent);
CpuMathUtils.netcoreapp.cs (15)
62SseIntrinsics.MatMul(matrix, source, destination, stride, source.Size); 67SseIntrinsics.MatMulTran(matrix, source, destination, destination.Size, stride); 139SseIntrinsics.MatMulP(matrix, rgposSrc, sourceValues, posMin, iposMin, iposLimit, destination, stride, sourceValues.Size); 184SseIntrinsics.ScaleAddU(scale, addend, destination); 221SseIntrinsics.AddScaleSU(scale, source, indices, destination, count); 257SseIntrinsics.AddSU(source, indices, destination, count); 287return (mean == 0) ? SseIntrinsics.SumSqU(source) : SseIntrinsics.SumSqDiffU(mean, source); 317return (mean == 0) ? SseIntrinsics.SumAbsU(source) : SseIntrinsics.SumAbsDiffU(mean, source); 350return SseIntrinsics.MaxAbsU(source); 384return SseIntrinsics.MaxAbsDiffU(mean, source); 423return SseIntrinsics.DotSU(left, right, indices, count); 554SseIntrinsics.SdcaL1UpdateU(primalUpdate, count, source, threshold, v, w); 597SseIntrinsics.SdcaL1UpdateSU(primalUpdate, count, source, indices, threshold, v, w);
Microsoft.ML.CpuMath.PerformanceTests (25)
SsePerformanceTests.cs (25)
15=> SseIntrinsics.AddScalarU(DefaultScale, new Span<float>(dst, 0, Length)); 19=> SseIntrinsics.Scale(DefaultScale, new Span<float>(dst, 0, Length)); 23=> SseIntrinsics.ScaleSrcU(DefaultScale, src, dst, Length); 27=> SseIntrinsics.ScaleAddU(DefaultScale, DefaultScale, new Span<float>(dst, 0, Length)); 31=> SseIntrinsics.AddScaleU(DefaultScale, src, dst, Length); 35=> SseIntrinsics.AddScaleSU(DefaultScale, src, idx, dst, IndexLength); 39=> SseIntrinsics.AddScaleCopyU(DefaultScale, src, dst, result, Length); 43=> SseIntrinsics.AddU(src, dst, Length); 47=> SseIntrinsics.AddSU(src, idx, dst, IndexLength); 51=> SseIntrinsics.MulElementWiseU(src1, src2, dst, Length); 55=> SseIntrinsics.Sum(new Span<float>(src, 0, Length)); 59=> SseIntrinsics.SumSqU(new Span<float>(src, 0, Length)); 63=> SseIntrinsics.SumSqDiffU(DefaultScale, new Span<float>(src, 0, Length)); 67=> SseIntrinsics.SumAbsU(new Span<float>(src, 0, Length)); 71=> SseIntrinsics.SumAbsDiffU(DefaultScale, new Span<float>(src, 0, Length)); 75=> SseIntrinsics.MaxAbsU(new Span<float>(src, 0, Length)); 79=> SseIntrinsics.MaxAbsDiffU(DefaultScale, new Span<float>(src, 0, Length)); 83=> SseIntrinsics.DotU(src, dst, Length); 87=> SseIntrinsics.DotSU(src, dst, idx, IndexLength); 91=> SseIntrinsics.Dist2(src, dst, Length); 95=> SseIntrinsics.SdcaL1UpdateU(DefaultScale, Length, src, DefaultScale, dst, result); 99=> SseIntrinsics.SdcaL1UpdateSU(DefaultScale, IndexLength, src, idx, DefaultScale, dst, result); 103=> SseIntrinsics.MatMul(testMatrixAligned, testSrcVectorAligned, testDstVectorAligned, matrixLength, matrixLength); 107=> SseIntrinsics.MatMulTran(testMatrixAligned, testSrcVectorAligned, testDstVectorAligned, matrixLength, matrixLength); 111=> SseIntrinsics.MatMulP(testMatrixAligned, matrixIdx, testSrcVectorAligned, 0, 0, MatrixIndexLength, testDstVectorAligned, matrixLength, matrixLength);