diff --git a/SYCL/ESIMD/histogram_256_slm.cpp b/SYCL/ESIMD/histogram_256_slm.cpp index 2a5d5953a2..1042153500 100644 --- a/SYCL/ESIMD/histogram_256_slm.cpp +++ b/SYCL/ESIMD/histogram_256_slm.cpp @@ -37,7 +37,6 @@ ESIMD_INLINE void histogram_atomic(const uint32_t *input_ptr, uint32_t *output, slm_offset *= sizeof(int); simd slm_data = 0; slm_store(slm_data, slm_offset); - esimd_fence(ESIMD_GLOBAL_COHERENT_FENCE); esimd_barrier(); // Each thread handles NUM_BLOCKSxBLOCK_WIDTH pixel blocks @@ -56,7 +55,6 @@ ESIMD_INLINE void histogram_atomic(const uint32_t *input_ptr, uint32_t *output, } start_off += BLOCK_WIDTH; } - esimd_fence(ESIMD_GLOBAL_COHERENT_FENCE); esimd_barrier(); // Update global sum by atomically adding each local histogram diff --git a/SYCL/ESIMD/histogram_256_slm_spec.cpp b/SYCL/ESIMD/histogram_256_slm_spec.cpp index f6c569760e..9cb37e9224 100644 --- a/SYCL/ESIMD/histogram_256_slm_spec.cpp +++ b/SYCL/ESIMD/histogram_256_slm_spec.cpp @@ -38,7 +38,6 @@ ESIMD_INLINE void histogram_atomic(const uint32_t *input_ptr, uint32_t *output, slm_offset *= sizeof(int); simd slm_data = 0; slm_store(slm_data, slm_offset); - esimd_fence(ESIMD_GLOBAL_COHERENT_FENCE); esimd_barrier(); // Each thread handles NUM_BLOCKSxBLOCK_WIDTH pixel blocks @@ -57,7 +56,6 @@ ESIMD_INLINE void histogram_atomic(const uint32_t *input_ptr, uint32_t *output, } start_off += BLOCK_WIDTH; } - esimd_fence(ESIMD_GLOBAL_COHERENT_FENCE); esimd_barrier(); // Update global sum by atomically adding each local histogram diff --git a/SYCL/ESIMD/linear/linear.cpp b/SYCL/ESIMD/linear/linear.cpp index 79219fea5e..b7d4b2c090 100644 --- a/SYCL/ESIMD/linear/linear.cpp +++ b/SYCL/ESIMD/linear/linear.cpp @@ -104,17 +104,15 @@ int main(int argc, char *argv[]) { in = media_block_load(accInput, h_pos * 24, v_pos * 6); - simd vin_float = vin; - auto in_float = vin_float.format(); - m = in_float.select<6, 1, 24, 1>(1, 3); - m += in_float.select<6, 1, 24, 1>(0, 0); - m += in_float.select<6, 1, 24, 1>(0, 3); - m += in_float.select<6, 1, 24, 1>(0, 6); - m += in_float.select<6, 1, 24, 1>(1, 0); - m += in_float.select<6, 1, 24, 1>(1, 6); - m += in_float.select<6, 1, 24, 1>(2, 0); - m += in_float.select<6, 1, 24, 1>(2, 3); - m += in_float.select<6, 1, 24, 1>(2, 6); + m = in.select<6, 1, 24, 1>(1, 3); + m += in.select<6, 1, 24, 1>(0, 0); + m += in.select<6, 1, 24, 1>(0, 3); + m += in.select<6, 1, 24, 1>(0, 6); + m += in.select<6, 1, 24, 1>(1, 0); + m += in.select<6, 1, 24, 1>(1, 6); + m += in.select<6, 1, 24, 1>(2, 0); + m += in.select<6, 1, 24, 1>(2, 3); + m += in.select<6, 1, 24, 1>(2, 6); m = m * 0.111f; vout = vm; diff --git a/SYCL/ESIMD/slm_barrier.cpp b/SYCL/ESIMD/slm_barrier.cpp index 5dffc5c0d5..5d0a6e8cf5 100644 --- a/SYCL/ESIMD/slm_barrier.cpp +++ b/SYCL/ESIMD/slm_barrier.cpp @@ -68,7 +68,6 @@ void load_to_slm(uint grpSize, uint localId, uint slmOffset, char *addr, vOffsets += (grpSize * 256); } - esimd_fence(ESIMD_GLOBAL_COHERENT_FENCE); esimd_barrier(); }