src/utils/SkUTF.h - platform/external/skqp - Gitiles

 // Copyright 2018 Google LLC.
 // Use of this source code is governed by a BSD-style license that can be found in the LICENSE file.
 #ifndef SkUTF_DEFINED
 #define SkUTF_DEFINED

 #include <cstddef>
 #include <cstdint>

 typedef int32_t SkUnichar;

 namespace SkUTF {

 /** Given a sequence of UTF-8 bytes, return the number of unicode codepoints.
     If the sequence is invalid UTF-8, return -1.
 */
 int CountUTF8(const char* utf8, size_t byteLength);

 /** Given a sequence of aligned UTF-16 characters in machine-endian form,
     return the number of unicode codepoints.  If the sequence is invalid
     UTF-16, return -1.
 */
 int CountUTF16(const uint16_t* utf16, size_t byteLength);

 /** Given a sequence of aligned UTF-32 characters in machine-endian form,
     return the number of unicode codepoints.  If the sequence is invalid
     UTF-32, return -1.
 */
 int CountUTF32(const int32_t* utf32, size_t byteLength);

 /** Given a sequence of UTF-8 bytes, return the first unicode codepoint.
     The pointer will be incremented to point at the next codepoint's start.  If
     invalid UTF-8 is encountered, set *ptr to end and return -1.
 */
 SkUnichar NextUTF8(const char** ptr, const char* end);

 /** Given a sequence of aligned UTF-16 characters in machine-endian form,
     return the first unicode codepoint.  The pointer will be incremented to
     point at the next codepoint's start.  If invalid UTF-16 is encountered,
     set *ptr to end and return -1.
 */
 SkUnichar NextUTF16(const uint16_t** ptr, const uint16_t* end);

 /** Given a sequence of aligned UTF-32 characters in machine-endian form,
     return the first unicode codepoint.  The pointer will be incremented to
     point at the next codepoint's start.  If invalid UTF-32 is encountered,
     set *ptr to end and return -1.
 */
 SkUnichar NextUTF32(const int32_t** ptr, const int32_t* end);

 constexpr unsigned kMaxBytesInUTF8Sequence = 4;

 /** Convert the unicode codepoint into UTF-8.  If `utf8` is non-null, place the
     result in that array.  Return the number of bytes in the result.  If `utf8`
     is null, simply return the number of bytes that would be used.  For invalid
     unicode codepoints, return 0.
 */
 size_t ToUTF8(SkUnichar uni, char utf8[kMaxBytesInUTF8Sequence] = nullptr);

 /** Convert the unicode codepoint into UTF-16.  If `utf16` is non-null, place
     the result in that array.  Return the number of UTF-16 code units in the
     result (1 or 2).  If `utf16` is null, simply return the number of code
     units that would be used.  For invalid unicode codepoints, return 0.
 */
 size_t ToUTF16(SkUnichar uni, uint16_t utf16[2] = nullptr);

 }  // namespace SkUTF

 #endif  // SkUTF_DEFINED
	// Copyright 2018 Google LLC.
	// Use of this source code is governed by a BSD-style license that can be found in the LICENSE file.
	#ifndef SkUTF_DEFINED
	#define SkUTF_DEFINED

	#include <cstddef>
	#include <cstdint>

	typedef int32_t SkUnichar;

	namespace SkUTF {

	/** Given a sequence of UTF-8 bytes, return the number of unicode codepoints.
	If the sequence is invalid UTF-8, return -1.
	*/
	int CountUTF8(const char* utf8, size_t byteLength);

	/** Given a sequence of aligned UTF-16 characters in machine-endian form,
	return the number of unicode codepoints. If the sequence is invalid
	UTF-16, return -1.
	*/
	int CountUTF16(const uint16_t* utf16, size_t byteLength);

	/** Given a sequence of aligned UTF-32 characters in machine-endian form,
	return the number of unicode codepoints. If the sequence is invalid
	UTF-32, return -1.
	*/
	int CountUTF32(const int32_t* utf32, size_t byteLength);

	/** Given a sequence of UTF-8 bytes, return the first unicode codepoint.
	The pointer will be incremented to point at the next codepoint's start. If
	invalid UTF-8 is encountered, set *ptr to end and return -1.
	*/
	SkUnichar NextUTF8(const char** ptr, const char* end);

	/** Given a sequence of aligned UTF-16 characters in machine-endian form,
	return the first unicode codepoint. The pointer will be incremented to
	point at the next codepoint's start. If invalid UTF-16 is encountered,
	set *ptr to end and return -1.
	*/
	SkUnichar NextUTF16(const uint16_t** ptr, const uint16_t* end);

	/** Given a sequence of aligned UTF-32 characters in machine-endian form,
	return the first unicode codepoint. The pointer will be incremented to
	point at the next codepoint's start. If invalid UTF-32 is encountered,
	set *ptr to end and return -1.
	*/
	SkUnichar NextUTF32(const int32_t** ptr, const int32_t* end);

	constexpr unsigned kMaxBytesInUTF8Sequence = 4;

	/** Convert the unicode codepoint into UTF-8. If `utf8` is non-null, place the
	result in that array. Return the number of bytes in the result. If `utf8`
	is null, simply return the number of bytes that would be used. For invalid
	unicode codepoints, return 0.
	*/
	size_t ToUTF8(SkUnichar uni, char utf8[kMaxBytesInUTF8Sequence] = nullptr);

	/** Convert the unicode codepoint into UTF-16. If `utf16` is non-null, place
	the result in that array. Return the number of UTF-16 code units in the
	result (1 or 2). If `utf16` is null, simply return the number of code
	units that would be used. For invalid unicode codepoints, return 0.
	*/
	size_t ToUTF16(SkUnichar uni, uint16_t utf16[2] = nullptr);

	} // namespace SkUTF

	#endif // SkUTF_DEFINED