diff options
| author | Bond_009 <bond.009@outlook.com> | 2021-01-05 14:42:25 +0100 |
|---|---|---|
| committer | Bond_009 <bond.009@outlook.com> | 2021-01-05 14:42:25 +0100 |
| commit | a50c55c1e4e9d1f981f0563ab72471de1ddf2501 (patch) | |
| tree | f301948922e78b9e46498f0008cfb55bf04e3063 /1/part2_fast.c | |
| parent | e6efc41e26ffc1a93c29f1710bbb9dac18d162a4 (diff) | |
Optimize repair_avx_inner
Diffstat (limited to '1/part2_fast.c')
| -rw-r--r-- | 1/part2_fast.c | 6 |
1 file changed, 2 insertions, 4 deletions
```diff
diff --git a/1/part2_fast.c b/1/part2_fast.c
index ffb4504..67cd6c5 100644
--- a/1/part2_fast.c
+++ b/1/part2_fast.c
@@ -12,11 +12,10 @@ int repair_avx_inner(int i, const int *arr, __m256i search);
 #else
 int repair_avx_inner(int i, const int *arr, __m256i search)
 {
-    __m256i start = _mm256_set1_epi32(i);
+    __m256i cmp = _mm256_sub_epi32(search, _mm256_set1_epi32(i));
     for (int k = 0; k < INPUT_LEN; k += 8) {
         __m256i new = _mm256_loadu_si256((__m256i *)(&arr[k]));
-        new = _mm256_add_epi32(start, new);
-        int mask = _mm256_movemask_epi8(_mm256_cmpeq_epi32(new, search));
+        int mask = _mm256_movemask_epi8(_mm256_cmpeq_epi32(new, cmp));
         if (mask == 0) {
             continue;
         }
@@ -125,7 +124,6 @@ int repair_avx(const int *arr)
     return 0;
 }
 
-
 int main(int argc, char *argv[])
 {
     FILE *file = fopen(argv[argc - 1], "r");
```
