You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: Library/Raisr_AVX512FP16.cpp
+25 -8. Lines changed: 25 additions & 8 deletions
Original file line number
Diff line number
Diff line change
@@ -150,6 +150,7 @@ void computeGTWG_Segment_AVX512FP16_16f(const _Float16 *img, const int nrows, co
150
150
// process patchSize rows
151
151
// load next row
152
152
p1 += ncols;
153
+
153
154
__m512h c = _mm512_zextph256_ph512(_mm256_loadu_ph(p1));
154
155
c = _mm512_castps_ph(_mm512_insertf32x8(_mm512_castph_ps(c), _mm256_castph_ps(_mm512_castph512_ph256(c)), 1)); // duplicate high & low to compute GTWG for 2 pixels
155
156
__m512h w = _mm512_loadu_ph(gGaussian2DOriginal_fp16_doubled_w1w3[i]); // pixels 1,3
@@ -158,14 +159,15 @@ void computeGTWG_Segment_AVX512FP16_16f(const _Float16 *img, const int nrows, co
0 commit comments