@@ -53,20 +53,13 @@ void RsFnt<uint16_t>::encode_post_process(
5353 uint16_t threshold = this ->gf ->card_minus_one ();
5454 unsigned code_len = this ->n_outputs ;
5555
56- // number of elements per vector register
57- unsigned vec_size = simd::countof <uint16_t >();
58- // number of vector registers per fragment packet
59- size_t vecs_nb = size / vec_size;
60- // odd number of elements not vectorized
61- size_t last_len = size - vecs_nb * vec_size;
62-
6356 simd::encode_post_process (
64- output, props, offset, code_len, threshold, vecs_nb );
57+ output, props, offset, code_len, threshold, simd_vec_len );
6558
66- if (last_len > 0 ) {
59+ if (simd_trailing_len > 0 ) {
6760 for (unsigned i = 0 ; i < code_len; ++i) {
6861 uint16_t * chunk = output.get (i);
69- for (size_t j = vecs_nb * vec_size ; j < size; ++j) {
62+ for (size_t j = simd_offset ; j < size; ++j) {
7063 if (chunk[j] == threshold) {
7164 props[i].add (offset + j, OOR_MARK);
7265 }
@@ -85,20 +78,13 @@ void RsFnt<uint32_t>::encode_post_process(
8578 const uint32_t threshold = this ->gf ->card_minus_one ();
8679 const unsigned code_len = this ->n_outputs ;
8780
88- // number of elements per vector register
89- const unsigned vec_size = simd::countof <uint32_t >();
90- // number of vector registers per fragment packet
91- const size_t vecs_nb = size / vec_size;
92- // odd number of elements not vectorized
93- const size_t last_len = size - vecs_nb * vec_size;
94-
9581 simd::encode_post_process (
96- output, props, offset, code_len, threshold, vecs_nb );
82+ output, props, offset, code_len, threshold, simd_vec_len );
9783
98- if (last_len > 0 ) {
84+ if (simd_trailing_len > 0 ) {
9985 for (unsigned i = 0 ; i < code_len; ++i) {
10086 uint32_t * chunk = output.get (i);
101- for (size_t j = vecs_nb * vec_size ; j < size; ++j) {
87+ for (size_t j = simd_offset ; j < size; ++j) {
10288 if (chunk[j] == threshold) {
10389 props[i].add (offset + j, OOR_MARK);
10490 }
0 commit comments