You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

128 line
3.6 KiB

  1. static const char hexvals[256] = {
  2. -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  3. -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  4. -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  5. 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1,
  6. -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  7. -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  8. -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1,
  9. -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1
  10. };
  11. static const char hexdigits[16] = {
  12. '0', '1', '2', '3',
  13. '4', '5', '6', '7',
  14. '8', '9', 'A', 'B',
  15. 'C', 'D', 'E', 'F'
  16. };
  17. int
  18. int_from_hex(const unsigned char* p)
  19. {
  20. unsigned char* h = (unsigned char*) p;
  21. int ret;
  22. if(hexvals[*(h+0)] < 0) return -1;
  23. if(hexvals[*(h+1)] < 0) return -1;
  24. if(hexvals[*(h+2)] < 0) return -1;
  25. if(hexvals[*(h+3)] < 0) return -1;
  26. ret = (hexvals[*(h+0)] << 12)
  27. + (hexvals[*(h+1)] << 8)
  28. + (hexvals[*(h+2)] << 4)
  29. + (hexvals[*(h+3)] << 0);
  30. return ret;
  31. }
  32. int
  33. int_to_hex(int val, char* p)
  34. {
  35. if(val < 0 || val > 65535)
  36. return 0;
  37. p[0] = hexdigits[(val >> 12) & 0xF];
  38. p[1] = hexdigits[(val >> 8) & 0xF];
  39. p[2] = hexdigits[(val >> 4) & 0xF];
  40. p[3] = hexdigits[val & 0xF];
  41. return 1;
  42. }
  43. int
  44. utf8_len(int c)
  45. {
  46. if(c < 128) {
  47. return 1;
  48. } else if(c < 0x800) {
  49. return 2;
  50. } else if(c < 0x10000) {
  51. if(c < 0xD800 || (c > 0xDFFF && c < 0xFFFE)) {
  52. return 3;
  53. } else {
  54. return -1;
  55. }
  56. } else if(c < 0x200000) {
  57. return 4;
  58. } else if(c < 0x4000000) {
  59. return 5;
  60. } else if(c < 0x80000000) {
  61. return 6;
  62. } else {
  63. return -1;
  64. }
  65. }
  66. int
  67. utf8_from_pair(int hi, int lo)
  68. {
  69. if(hi < 0xD800 || hi >= 0xDC00) return -1;
  70. if(lo < 0xDC00 || lo > 0xDFFF) return -1;
  71. return ((hi & 0x3FF) << 10) + (lo & 0x3FF) + 0x10000;
  72. }
  73. int
  74. utf8_to_binary(int c, unsigned char* buf)
  75. {
  76. if(c < 0x80) {
  77. buf[0] = (unsigned char) c;
  78. return 1;
  79. } else if(c < 0x800) {
  80. buf[0] = (unsigned char) 0xC0 + (c >> 6);
  81. buf[1] = (unsigned char) 0x80 + (c & 0x3F);
  82. return 2;
  83. } else if(c < 0x10000) {
  84. if(c < 0xD800 || (c > 0xDFFF && c < 0xFFFE)) {
  85. buf[0] = (unsigned char) 0xE0 + (c >> 12);
  86. buf[1] = (unsigned char) 0x80 + ((c >> 6) & 0x3F);
  87. buf[2] = (unsigned char) 0x80 + (c & 0x3F);
  88. return 3;
  89. } else {
  90. return -1;
  91. }
  92. } else if(c < 0x200000) {
  93. buf[0] = (unsigned char) 0xF0 + (c >> 18);
  94. buf[1] = (unsigned char) 0x80 + ((c >> 12) & 0x3F);
  95. buf[2] = (unsigned char) 0x80 + ((c >> 6) & 0x3F);
  96. buf[3] = (unsigned char) 0x80 + (c & 0x3F);
  97. return 4;
  98. } else if(c < 0x4000000) {
  99. buf[0] = (unsigned char) 0xF8 + (c >> 24);
  100. buf[1] = (unsigned char) 0x80 + ((c >> 18) & 0x3F);
  101. buf[2] = (unsigned char) 0x80 + ((c >> 12) & 0x3F);
  102. buf[3] = (unsigned char) 0x80 + ((c >> 6) & 0x3F);
  103. buf[4] = (unsigned char) 0x80 + (c & 0x3F);
  104. return 5;
  105. } else if(c < 0x80000000) {
  106. buf[0] = (unsigned char) 0xFC + (c >> 30);
  107. buf[1] = (unsigned char) 0x80 + ((c >> 24) & 0x3F);
  108. buf[2] = (unsigned char) 0x80 + ((c >> 18) & 0x3F);
  109. buf[3] = (unsigned char) 0x80 + ((c >> 12) & 0x3F);
  110. buf[4] = (unsigned char) 0x80 + ((c >> 6) & 0x3F);
  111. buf[5] = (unsigned char) 0x80 + (c & 0x3F);
  112. return 6;
  113. }
  114. return -1;
  115. }