Utf16Encoder.h 2.5 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667
  1. /**
  2. * @file Utf16Encoder.h
  3. * @author Ambroz Bizjak <ambrop7@gmail.com>
  4. *
  5. * @section LICENSE
  6. *
  7. * Redistribution and use in source and binary forms, with or without
  8. * modification, are permitted provided that the following conditions are met:
  9. * 1. Redistributions of source code must retain the above copyright
  10. * notice, this list of conditions and the following disclaimer.
  11. * 2. Redistributions in binary form must reproduce the above copyright
  12. * notice, this list of conditions and the following disclaimer in the
  13. * documentation and/or other materials provided with the distribution.
  14. * 3. Neither the name of the author nor the
  15. * names of its contributors may be used to endorse or promote products
  16. * derived from this software without specific prior written permission.
  17. *
  18. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
  19. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  20. * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  21. * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
  22. * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
  23. * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  24. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
  25. * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  26. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  27. * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  28. */
  29. #ifndef BADVPN_UTF16ENCODER_H
  30. #define BADVPN_UTF16ENCODER_H
  31. #include <stdint.h>
  /**
   * Converts one Unicode code point to its UTF-16 representation.
   *
   * Code points up to U+FFFF (excluding the surrogate range U+D800..U+DFFF)
   * are stored as a single 16-bit unit. Code points from U+10000 to U+10FFFF
   * are stored as two units: a high surrogate followed by a low surrogate.
   *
   * @param ch code point to convert
   * @param out destination for the 16-bit units. Must have room for 2 units.
   *            Left untouched when the function returns 0.
   * @return how many 16-bit units were stored: 1 or 2 on success, 0 if ch is
   *         a surrogate or lies above U+10FFFF and therefore cannot be encoded
   */
  static int Utf16Encoder_EncodeCharacter (uint32_t ch, uint16_t *out);

  int Utf16Encoder_EncodeCharacter (uint32_t ch, uint16_t *out)
  {
      // beyond the last valid code point
      if (ch > UINT32_C(0x10FFFF)) {
          return 0;
      }

      // supplementary planes: split the 20-bit offset into a surrogate pair
      if (ch > UINT32_C(0xFFFF)) {
          uint32_t offset = ch - UINT32_C(0x10000);
          uint32_t high = UINT32_C(0xD800) | (offset >> 10);
          uint32_t low = UINT32_C(0xDC00) | (offset & UINT32_C(0x3FF));
          out[0] = (uint16_t)high;
          out[1] = (uint16_t)low;
          return 2;
      }

      // lone surrogates are not characters and have no encoding
      if (ch >= UINT32_C(0xD800) && ch <= UINT32_C(0xDFFF)) {
          return 0;
      }

      // basic multilingual plane: the code point is its own encoding
      out[0] = (uint16_t)ch;
      return 1;
  }
  59. #endif