| // Protocol Buffers - Google's data interchange format |
| // Copyright 2023 Google LLC. All rights reserved. |
| // |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file or at |
| // https://developers.google.com/open-source/licenses/bsd |
| |
| #include "upb/lex/unicode.h" |
| |
| // Must be last. |
| #include "upb/port/def.inc" |
| |
| int upb_Unicode_ToUTF8(uint32_t cp, char* out) { |
| if (cp <= 0x7f) { |
| out[0] = cp; |
| return 1; |
| } |
| if (cp <= 0x07ff) { |
| out[0] = (cp >> 6) | 0xc0; |
| out[1] = (cp & 0x3f) | 0x80; |
| return 2; |
| } |
| if (cp <= 0xffff) { |
| out[0] = (cp >> 12) | 0xe0; |
| out[1] = ((cp >> 6) & 0x3f) | 0x80; |
| out[2] = (cp & 0x3f) | 0x80; |
| return 3; |
| } |
| if (cp <= 0x10ffff) { |
| out[0] = (cp >> 18) | 0xf0; |
| out[1] = ((cp >> 12) & 0x3f) | 0x80; |
| out[2] = ((cp >> 6) & 0x3f) | 0x80; |
| out[3] = (cp & 0x3f) | 0x80; |
| return 4; |
| } |
| return 0; |
| } |