istereo2

annotate libs/drawtext/utf8.c @ 35:643f4ab609a4

added readme and license
author John Tsiombikas <nuclear@member.fsf.org>
date Sat, 31 Oct 2015 05:45:35 +0200
parents
children
rev   line source
nuclear@7 1 /*
nuclear@7 2 libdrawtext - a simple library for fast text rendering in OpenGL
nuclear@7 3 Copyright (C) 2011 John Tsiombikas <nuclear@member.fsf.org>
nuclear@7 4
nuclear@7 5 This program is free software: you can redistribute it and/or modify
nuclear@7 6 it under the terms of the GNU Lesser General Public License as published by
nuclear@7 7 the Free Software Foundation, either version 3 of the License, or
nuclear@7 8 (at your option) any later version.
nuclear@7 9
nuclear@7 10 This program is distributed in the hope that it will be useful,
nuclear@7 11 but WITHOUT ANY WARRANTY; without even the implied warranty of
nuclear@7 12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
nuclear@7 13 GNU Lesser General Public License for more details.
nuclear@7 14
nuclear@7 15 You should have received a copy of the GNU Lesser General Public License
nuclear@7 16 along with this program. If not, see <http://www.gnu.org/licenses/>.
nuclear@7 17 */
nuclear@7 18 #include "drawtext.h"
nuclear@7 19
/* Non-zero when byte x can start a UTF-8 sequence, i.e. it is anything but a
 * continuation byte (10xxxxxx). The cast makes the test independent of
 * whether plain char is signed.
 */
#define U8_IS_FIRST(x)	((((unsigned char)(x)) & 0xc0) != 0x80)

/* payload mask of the lead byte, indexed by sequence length in bytes */
static const char first_mask[] = {
	0,
	0x7f,	/* single byte, 7 bits valid */
	0x1f,	/* two-bytes, 5 bits valid */
	0xf,	/* three-bytes, 4 bits valid */
	0x7		/* four-bytes, 3 bits valid */
};
/* number of payload bits in the lead byte, indexed like first_mask */
static const char first_shift[] = { 0, 7, 5, 4, 3 };

/* continuation bytes: 10xxxxxx, 6 payload bits each */
#define CONT_PREFIX	0x80
#define CONT_MASK	0x3f
#define CONT_SHIFT	6

/* last charcodes for 1, 2, 3 or 4-byte utf8 chars
 * (7, 5+6, 4+6+6 and 3+6+6+6 payload bits respectively)
 */
static const int utf8_lastcode[] = { 0x7f, 0x7ff, 0xffff, 0x1fffff };

/* prefix_mask(x): every bit that is not payload in the lead byte of an x-byte
 * sequence. prefix(x): the lead byte's marker bits (0x00, 0xc0, 0xe0, 0xf0).
 * The arithmetic is done on unsigned values so that no negative int is ever
 * left-shifted.
 */
#define prefix_mask(x)	(~(unsigned int)first_mask[x])
#define prefix(x)		((prefix_mask(x) << 1) & 0xff)
nuclear@7 40
nuclear@7 41
/* Returns a pointer to the character following the one at str.
 *
 * The distance to advance comes from dtx_utf8_nbytes(). The first byte is
 * always consumed (so an empty string still yields str + 1, as before), but
 * the remaining bytes are only skipped while they are not the NUL terminator,
 * so a truncated multi-byte sequence at the end of the string can no longer
 * carry the pointer past the terminator.
 */
char *dtx_utf8_next_char(char *str)
{
	int left = dtx_utf8_nbytes(str);

	if(left > 0) {
		str++;
		left--;
	}
	while(left > 0 && *str) {
		str++;
		left--;
	}
	return str;
}
nuclear@7 46
nuclear@7 47 int dtx_utf8_char_code(const char *str)
nuclear@7 48 {
nuclear@7 49 int i, nbytes, shift, code = 0;
nuclear@7 50 int mask;
nuclear@7 51
nuclear@7 52 if(!U8_IS_FIRST(*str)) {
nuclear@7 53 return -1;
nuclear@7 54 }
nuclear@7 55
nuclear@7 56 nbytes = dtx_utf8_nbytes(str);
nuclear@7 57 mask = first_mask[nbytes];
nuclear@7 58 shift = 0;
nuclear@7 59
nuclear@7 60 for(i=0; i<nbytes; i++) {
nuclear@7 61 if(!*str) {
nuclear@7 62 break;
nuclear@7 63 }
nuclear@7 64
nuclear@7 65 code = (code << shift) | (*str++ & mask);
nuclear@7 66 mask = 0x3f;
nuclear@7 67 shift = 6;
nuclear@7 68 }
nuclear@7 69 return code;
nuclear@7 70 }
nuclear@7 71
/* Returns the number of bytes to skip from str to reach the next character.
 *
 * - If str points at a lead byte, this is the sequence length announced by
 *   its leading 1 bits (capped at 4); a plain 7-bit byte, including the NUL
 *   terminator, counts as 1.
 * - If str points at a continuation byte (10xxxxxx), this is the number of
 *   consecutive continuation bytes starting at str.
 *
 * All bit tests are done on unsigned bytes so the result does not depend on
 * the signedness of plain char or on how negative values are right-shifted.
 */
int dtx_utf8_nbytes(const char *str)
{
	const unsigned char *bytes = (const unsigned char*)str;
	unsigned int lead = bytes[0];
	int n;

	if((lead & 0xc0) == 0x80) {
		/* in the middle of a character: count up to the next lead byte */
		for(n=1; (bytes[n] & 0xc0) == 0x80; n++);
		return n;
	}

	if(!(lead & 0x80)) {
		return 1;	/* 0xxxxxxx */
	}

	/* 11xxxxxx: two leading 1s are known, count any further ones up to 4 */
	for(n=2; n<4 && (lead & (0x80u >> n)); n++);
	return n;
}
nuclear@7 95
/* Returns the number of characters in the NUL-terminated string str, found by
 * stepping through it with dtx_utf8_next_char() until the terminator.
 */
int dtx_utf8_char_count(const char *str)
{
	const char *cur;
	int count = 0;

	for(cur = str; *cur; cur = dtx_utf8_next_char((char*)cur)) {
		count++;
	}
	return count;
}
nuclear@7 106
nuclear@7 107 size_t dtx_utf8_from_char_code(int code, char *buf)
nuclear@7 108 {
nuclear@7 109 size_t nbytes = 0;
nuclear@7 110 int i;
nuclear@7 111
nuclear@7 112 for(i=0; i<4; i++) {
nuclear@7 113 if(code <= utf8_lastcode[i]) {
nuclear@7 114 nbytes = i + 1;
nuclear@7 115 break;
nuclear@7 116 }
nuclear@7 117 }
nuclear@7 118
nuclear@7 119 if(!nbytes && buf) {
nuclear@7 120 for(i=0; i<(int)nbytes; i++) {
nuclear@7 121 int idx = nbytes - i - 1;
nuclear@7 122 int mask, shift, prefix;
nuclear@7 123
nuclear@7 124 if(idx > 0) {
nuclear@7 125 mask = CONT_MASK;
nuclear@7 126 shift = CONT_SHIFT;
nuclear@7 127 prefix = CONT_PREFIX;
nuclear@7 128 } else {
nuclear@7 129 mask = first_mask[nbytes];
nuclear@7 130 shift = first_shift[nbytes];
nuclear@7 131 prefix = prefix(nbytes);
nuclear@7 132 }
nuclear@7 133
nuclear@7 134 buf[idx] = (code & mask) | (prefix & ~mask);
nuclear@7 135 code >>= shift;
nuclear@7 136 }
nuclear@7 137 }
nuclear@7 138 return nbytes;
nuclear@7 139 }
nuclear@7 140
/* Converts the NUL-terminated wide string str to UTF-8, one character at a
 * time through dtx_utf8_from_char_code().
 *
 * buf may be NULL, in which case nothing is stored and only the length is
 * computed. Returns the sum of the per-character byte counts; this function
 * itself does not append a terminator.
 */
size_t dtx_utf8_from_string(const wchar_t *str, char *buf)
{
	size_t total = 0;
	char *out = buf;
	const wchar_t *wc;

	for(wc = str; *wc; wc++) {
		int len = dtx_utf8_from_char_code(*wc, out);

		total += len;
		if(out) {
			out += len;
		}
	}
	return total;
}