Lines Matching defs:utf16
4331 /* begin file src/scalar/utf16.h */
4338 namespace utf16 {
4449 } // utf16 namespace
4455 /* end file src/scalar/utf16.h */
5616 return scalar::utf16::trim_partial_utf16<BIG>(input, length);
5620 return scalar::utf16::trim_partial_utf16<LITTLE>(input, length);
10953 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(uint16_t(word))) : char16_t(word);
10961 high_surrogate = utf16::swap_bytes(high_surrogate);
10962 low_surrogate = utf16::swap_bytes(low_surrogate);
10998 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(uint16_t(word))) : char16_t(word);
11006 high_surrogate = utf16::swap_bytes(high_surrogate);
11007 low_surrogate = utf16::swap_bytes(low_surrogate);
11027 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(uint16_t(word))) : char16_t(word);
11035 high_surrogate = utf16::swap_bytes(high_surrogate);
11036 low_surrogate = utf16::swap_bytes(low_surrogate);
11077 *utf8_output++ = !match_system(big_endian) ? char(utf16::swap_bytes(buf[pos])) : char(buf[pos]);
11084 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11106 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11151 *utf8_output++ = !match_system(big_endian) ? char(utf16::swap_bytes(buf[pos])) : char(buf[pos]);
11157 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11180 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11210 *utf8_output++ = !match_system(big_endian) ? char(utf16::swap_bytes(buf[pos])) : char(buf[pos]);
11216 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11239 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11278 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11287 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11319 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11329 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11346 uint16_t word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
11356 uint16_t next_word = !match_system(big_endian) ? utf16::swap_bytes(data[pos + 1]) : data[pos + 1];
11397 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(buf[pos])) : char16_t(buf[pos]);
11406 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(leading_byte)) : char16_t(leading_byte);
11414 code_point = utf16::swap_bytes(uint16_t(code_point));
11424 code_point = utf16::swap_bytes(uint16_t(code_point));
11437 high_surrogate = utf16::swap_bytes(high_surrogate);
11438 low_surrogate = utf16::swap_bytes(low_surrogate);
11484 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(buf[pos])) : char16_t(buf[pos]);
11494 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(leading_byte)): char16_t(leading_byte);
11505 code_point = uint32_t(utf16::swap_bytes(uint16_t(code_point)));
11525 code_point = uint32_t(utf16::swap_bytes(uint16_t(code_point)));
11545 high_surrogate = utf16::swap_bytes(high_surrogate);
11546 low_surrogate = utf16::swap_bytes(low_surrogate);
11574 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(buf[pos])) : char16_t(buf[pos]);
11583 *utf16_output++ = !match_system(big_endian) ? char16_t(utf16::swap_bytes(leading_byte)): char16_t(leading_byte);
11594 code_point = uint32_t(utf16::swap_bytes(uint16_t(code_point)));
11612 code_point = uint32_t(utf16::swap_bytes(uint16_t(code_point)));
11633 high_surrogate = utf16::swap_bytes(high_surrogate);
11634 low_surrogate = utf16::swap_bytes(low_surrogate);
12055 *utf16_output++ = char16_t(match_system(big_endian) ? word : utf16::swap_bytes(word));
12070 *utf16_output++ = char16_t(match_system(big_endian) ? word : utf16::swap_bytes(word));
12301 word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
12337 *latin_output++ = !match_system(big_endian) ? char(utf16::swap_bytes(data[pos])) : char(data[pos]);
12343 word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
12497 word = !match_system(big_endian) ? utf16::swap_bytes(data[pos]) : data[pos];
12864 if (is_utf16 && scalar::utf16::validate<endianness::LITTLE>(reinterpret_cast<const char16_t*>(buf), (len - (buf - start))/2)) {
13201 // Convert up to 16 bytes from utf8 to utf16 using a mask indicating the
13637 // Convert up to 16 bytes from utf8 to utf16 using a mask indicating the
13747 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
14026 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
14039 uint16_t next_word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k + 1]) : buf[k + 1];
14280 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
14293 uint16_t next_word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k + 1]) : buf[k + 1];
14394 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
14400 uint16_t next_word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k + 1]) : buf[k + 1];
14452 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
14458 uint16_t next_word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k + 1]) : buf[k + 1];
16292 /* begin file src/generic/utf16.h */
16296 namespace utf16 {
16308 return count + scalar::utf16::count_code_points<big_endian>(in + pos, size - pos);
16329 return count + scalar::utf16::utf8_length_from_utf16<big_endian>(in + pos, size - pos);
16348 scalar::utf16::change_endianness_utf16(in + pos, size - pos, output);
16351 } // utf16
16355 /* end file src/generic/utf16.h */
16774 return scalar::utf16::validate<endianness::LITTLE>(tail, len - (tail - buf));
16783 return scalar::utf16::validate<endianness::BIG>(tail, len - (tail - buf));
16792 result scalar_res = scalar::utf16::validate_with_errors<endianness::LITTLE>(buf + res.count, len - res.count);
16802 result scalar_res = scalar::utf16::validate_with_errors<endianness::BIG>(buf + res.count, len - res.count);
17292 utf16::change_endianness_utf16(input, length, output);
17296 return utf16::count_code_points<endianness::LITTLE>(input, length);
17300 return utf16::count_code_points<endianness::BIG>(input, length);
17312 return scalar::utf16::latin1_length_from_utf16(length);
17340 return utf16::utf8_length_from_utf16<endianness::LITTLE>(input, length);
17344 return utf16::utf8_length_from_utf16<endianness::BIG>(input, length);
17360 return utf16::utf32_length_from_utf16<endianness::LITTLE>(input, length);
17364 return utf16::utf32_length_from_utf16<endianness::BIG>(input, length);
17479 return scalar::utf16::validate<endianness::LITTLE>(buf, len);
17483 return scalar::utf16::validate<endianness::BIG>(buf, len);
17487 return scalar::utf16::validate_with_errors<endianness::LITTLE>(buf, len);
17491 return scalar::utf16::validate_with_errors<endianness::BIG>(buf, len);
17688 scalar::utf16::change_endianness_utf16(input, length, output);
17692 return scalar::utf16::count_code_points<endianness::LITTLE>(input, length);
17696 return scalar::utf16::count_code_points<endianness::BIG>(input, length);
17708 return scalar::utf16::latin1_length_from_utf16(length);
17720 return scalar::utf16::utf8_length_from_utf16<endianness::LITTLE>(input, length);
17724 return scalar::utf16::utf8_length_from_utf16<endianness::BIG>(input, length);
17728 return scalar::utf16::utf32_length_from_utf16<endianness::LITTLE>(input, length);
17732 return scalar::utf16::utf32_length_from_utf16<endianness::BIG>(input, length);
19393 while ((word = (big_endian ? scalar::utf16::swap_bytes(uint16_t(*buf))
19416 while ((word = (big_endian ? scalar::utf16::swap_bytes(uint16_t(*buf))
20762 if (is_utf16 && scalar::utf16::validate<endianness::LITTLE>(
21629 __m512i utf16 = _mm512_loadu_si512((const __m512i*)(input + pos));
21630 utf16 = _mm512_shuffle_epi8(utf16, byteflip);
21631 _mm512_storeu_si512(output + pos, utf16);
21636 __m512i utf16 = _mm512_maskz_loadu_epi16(m, (const __m512i*)(input + pos));
21637 utf16 = _mm512_shuffle_epi8(utf16, byteflip);
21638 _mm512_mask_storeu_epi16(output + pos, m, utf16);
21653 __m512i utf16 = _mm512_loadu_si512((const __m512i*)ptr);
21655 uint64_t not_high_surrogate = static_cast<uint64_t>(_mm512_cmpgt_epu16_mask(utf16, high) | _mm512_cmplt_epu16_mask(utf16, low));
21659 return count + scalar::utf16::count_code_points<endianness::LITTLE>(ptr, length - (ptr - input));
21681 __m512i utf16 = _mm512_shuffle_epi8(_mm512_loadu_si512((__m512i*)ptr), byteflip);
21683 uint64_t not_high_surrogate = static_cast<uint64_t>(_mm512_cmpgt_epu16_mask(utf16, high) | _mm512_cmplt_epu16_mask(utf16, low));
21687 return count + scalar::utf16::count_code_points<endianness::BIG>(ptr, length - (ptr - input));
21755 return scalar::utf16::latin1_length_from_utf16(length);
21774 __m512i utf16 = _mm512_loadu_si512((const __m512i*)ptr);
21776 __mmask32 ascii_bitmask = _mm512_cmple_epu16_mask(utf16, v_007f);
21777 __mmask32 two_bytes_bitmask = _mm512_mask_cmple_epu16_mask(~ascii_bitmask, utf16, v_07ff);
21779 __mmask32 surrogates_bitmask = _mm512_mask_cmple_epu16_mask(not_one_two_bytes, utf16, v_dfff) & _mm512_mask_cmpge_epu16_mask(not_one_two_bytes, utf16, v_d800);
21789 return count + scalar::utf16::utf8_length_from_utf16<endianness::LITTLE>(ptr, length - (ptr - input));
21813 __m512i utf16 = _mm512_loadu_si512((const __m512i*)ptr);
21814 utf16 = _mm512_shuffle_epi8(utf16, byteflip);
21816 __mmask32 ascii_bitmask = _mm512_cmple_epu16_mask(utf16, v_007f);
21817 __mmask32 two_bytes_bitmask = _mm512_mask_cmple_epu16_mask(~ascii_bitmask, utf16, v_07ff);
21819 __mmask32 surrogates_bitmask = _mm512_mask_cmple_epu16_mask(not_one_two_bytes, utf16, v_dfff) & _mm512_mask_cmpge_epu16_mask(not_one_two_bytes, utf16, v_d800);
21828 return count + scalar::utf16::utf8_length_from_utf16<endianness::BIG>(ptr, length - (ptr - input));
22210 if (is_utf16 && scalar::utf16::validate<endianness::LITTLE>(reinterpret_cast<const char16_t*>(buf), (len - (buf - start))/2)) {
22634 // Convert up to 12 bytes from utf8 to utf16 using a mask indicating the
23010 ? scalar::utf16::swap_bytes(buf[k])
23286 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
23299 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
23529 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
23542 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
23653 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
23660 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
23721 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
23728 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
25703 /* begin file src/generic/utf16.h */
25707 namespace utf16 {
25719 return count + scalar::utf16::count_code_points<big_endian>(in + pos, size - pos);
25740 return count + scalar::utf16::utf8_length_from_utf16<big_endian>(in + pos, size - pos);
25759 scalar::utf16::change_endianness_utf16(in + pos, size - pos, output);
25762 } // utf16
25766 /* end file src/generic/utf16.h */
26182 return scalar::utf16::validate<endianness::LITTLE>(tail, len - (tail - buf));
26191 return scalar::utf16::validate<endianness::BIG>(tail, len - (tail - buf));
26200 result scalar_res = scalar::utf16::validate_with_errors<endianness::LITTLE>(buf + res.count, len - res.count);
26210 result scalar_res = scalar::utf16::validate_with_errors<endianness::BIG>(buf + res.count, len - res.count);
26696 utf16::change_endianness_utf16(input, length, output);
26700 return utf16::count_code_points<endianness::LITTLE>(input, length);
26704 return utf16::count_code_points<endianness::BIG>(input, length);
26716 return scalar::utf16::latin1_length_from_utf16(length);
26724 return utf16::utf8_length_from_utf16<endianness::LITTLE>(input, length);
26728 return utf16::utf8_length_from_utf16<endianness::BIG>(input, length);
26732 return utf16::utf32_length_from_utf16<endianness::LITTLE>(input, length);
26736 return utf16::utf32_length_from_utf16<endianness::BIG>(input, length);
28075 /* begin file src/generic/utf16.h */
28079 namespace utf16 {
28091 return count + scalar::utf16::count_code_points<big_endian>(in + pos, size - pos);
28112 return count + scalar::utf16::utf8_length_from_utf16<big_endian>(in + pos, size - pos);
28131 scalar::utf16::change_endianness_utf16(in + pos, size - pos, output);
28134 } // utf16
28138 /* end file src/generic/utf16.h */
28179 return scalar::utf16::validate<endianness::LITTLE>(buf, len);
28183 return scalar::utf16::validate<endianness::BIG>(buf, len);
28187 return scalar::utf16::validate_with_errors<endianness::LITTLE>(buf, len);
28191 return scalar::utf16::validate_with_errors<endianness::BIG>(buf, len);
28323 scalar::utf16::change_endianness_utf16(input, length, output);
28327 return scalar::utf16::count_code_points<endianness::LITTLE>(input, length);
28331 return scalar::utf16::count_code_points<endianness::BIG>(input, length);
28339 return scalar::utf16::utf8_length_from_utf16<endianness::LITTLE>(input, length);
28343 return scalar::utf16::utf8_length_from_utf16<endianness::BIG>(input, length);
28347 return scalar::utf16::utf32_length_from_utf16<endianness::LITTLE>(input, length);
28351 return scalar::utf16::utf32_length_from_utf16<endianness::BIG>(input, length);
28687 if (is_utf16 && scalar::utf16::validate<endianness::LITTLE>(reinterpret_cast<const char16_t*>(buf), (len - (buf - start))/2)) {
29109 // Convert up to 12 bytes from utf8 to utf16 using a mask indicating the
29525 uint16_t word = !match_system(big_endian) ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
29758 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
29771 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
29962 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
29975 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
30087 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
30093 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
30155 uint16_t word = big_endian ? scalar::utf16::swap_bytes(buf[k]) : buf[k];
30161 uint16_t next_word = big_endian ? scalar::utf16::swap_bytes(buf[k+1]) : buf[k+1];
32082 /* begin file src/generic/utf16.h */
32086 namespace utf16 {
32098 return count + scalar::utf16::count_code_points<big_endian>(in + pos, size - pos);
32119 return count + scalar::utf16::utf8_length_from_utf16<big_endian>(in + pos, size - pos);
32138 scalar::utf16::change_endianness_utf16(in + pos, size - pos, output);
32141 } // utf16
32145 /* end file src/generic/utf16.h */
32564 return scalar::utf16::validate<endianness::LITTLE>(tail, len - (tail - buf));
32573 return scalar::utf16::validate<endianness::BIG>(tail, len - (tail - buf));
32582 result scalar_res = scalar::utf16::validate_with_errors<endianness::LITTLE>(buf + res.count, len - res.count);
32592 result scalar_res = scalar::utf16::validate_with_errors<endianness::BIG>(buf + res.count, len - res.count);
33085 utf16::change_endianness_utf16(input, length, output);
33089 return utf16::count_code_points<endianness::LITTLE>(input, length);
33093 return utf16::count_code_points<endianness::BIG>(input, length);
33105 return scalar::utf16::latin1_length_from_utf16(length);
33113 return utf16::utf8_length_from_utf16<endianness::LITTLE>(input, length);
33117 return utf16::utf8_length_from_utf16<endianness::BIG>(input, length);
33176 return utf16::utf32_length_from_utf16<endianness::LITTLE>(input, length);
33180 return utf16::utf32_length_from_utf16<endianness::BIG>(input, length);