/*
* Copyright (C) 2005 Stefan Kleine Stegemann
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
*/
#import "NSString+PopplerKitAdditions.h"
/*
 * Lookup table indexed by the value of a byte (0..255). Each entry is the
 * number of bytes to advance when that byte is found at the start of a
 * character in a UTF-8 string:
 *
 *   0x00 - 0xBF : 1   (first six rows)
 *   0xC0 - 0xDF : 2   (seventh row)
 *   0xE0 - 0xEF : 3   (last row, in order)
 *   0xF0 - 0xF7 : 4
 *   0xF8 - 0xFB : 5
 *   0xFC - 0xFD : 6
 *   0xFE - 0xFF : 1
 */
static const char kUTF8OffsetValues [256] = {
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,5,5,5,5,6,6,1,1
};
// Helpers used only inside this file.
@interface NSString (PopplerKitAdditionsPrivate)
// Returns the number of characters found in the receiver's UTF8String,
// counted by stepping from one character's first byte to the next until
// the terminating NUL byte is reached.
- (unsigned) myUTF8Length;
@end
@implementation NSString (PopplerKitAdditions)

/*
 * Decodes the receiver's UTF-8 representation into a newly allocated,
 * zero-terminated array of 32-bit code points.
 *
 * length - optional out-parameter (may be NULL); receives the number of
 *          code points stored in the returned array, not counting the
 *          terminating 0.
 *
 * Returns a buffer obtained from NSZoneMalloc(NSDefaultMallocZone(), ...).
 * This method never frees it, so the caller is responsible for releasing
 * it (e.g. with NSZoneFree on the same zone). Returns NULL, with *length
 * set to 0, only if the allocation itself fails. If the receiver has no
 * UTF-8 representation, an empty (terminator-only) buffer is returned.
 *
 * The UTF8String method is expected to return a valid UTF-8 sequence, so
 * no validation of the encoding is done. The decoder nevertheless never
 * reads beyond the terminating NUL byte, even when a sequence is cut short.
 * Besides the 1-4 byte forms, the legacy 5 and 6 byte forms are accepted.
 */
- (unsigned int*) getUTF32String: (unsigned*)length
{
    unsigned int* result;
    unsigned count = 0;
    unsigned i = 0;

    // -UTF8String is declared nullable; only count characters when there
    // is actually a buffer to look at.
    const unsigned char* ch = (const unsigned char*)[self UTF8String];
    if (ch != NULL) {
        count = [self myUTF8Length];
    }

    // One extra slot for the terminating 0.
    result = NSZoneMalloc(NSDefaultMallocZone(),
                          sizeof(unsigned int) * ((size_t)count + 1));
    if (result == NULL) {
        if (length) {
            *length = 0;
        }
        return NULL;
    }

    // The "*ch != 0" test is a safety net: for well-formed input the loop
    // always ends because i reaches count. (ch is not dereferenced when it
    // is NULL, because count is 0 in that case.)
    while (i < count && *ch != 0) {
        unsigned int wc = *ch;
        unsigned charlen;
        unsigned j;

        // The lead byte determines the sequence length; the mask keeps
        // only the payload bits of the lead byte.
        if (wc < 0x80) {
            charlen = 1;
        } else if (wc < 0xe0) {
            charlen = 2;
            wc &= 0x1f;
        } else if (wc < 0xf0) {
            charlen = 3;
            wc &= 0x0f;
        } else if (wc < 0xf8) {
            charlen = 4;
            wc &= 0x07;
        } else if (wc < 0xfc) {
            charlen = 5;
            wc &= 0x03;
        } else {
            charlen = 6;
            wc &= 0x01;
        }

        // Every continuation byte contributes its low 6 bits. Stop early
        // at a NUL byte so a truncated sequence cannot run off the buffer.
        for (j = 1; j < charlen && ch[j] != 0; j++) {
            wc = (wc << 6) | (ch[j] & 0x3f);
        }

        result[i++] = wc;
        ch += j;  // j == charlen unless the sequence was cut short
    }

    result[i] = 0;
    if (length) {
        *length = i;
    }
    return result;
}
@end
/* ----------------------------------------------------- */
/* Category PopplerKitAdditionsPrivate */
/* ----------------------------------------------------- */
@implementation NSString (PopplerKitAdditionsPrivate)

/*
 * Returns the number of characters in the receiver's UTF-8 representation
 * (not the number of bytes). Returns 0 when the receiver has no UTF-8
 * representation.
 *
 * The byte that starts each character is looked up in kUTF8OffsetValues to
 * find out how many bytes that character occupies.
 */
- (unsigned) myUTF8Length
{
    unsigned length = 0;
    const unsigned char* ch = (const unsigned char*)[self UTF8String];

    // -UTF8String is declared nullable.
    if (ch == NULL) {
        return 0;
    }

    // The buffer is NUL terminated, so the terminator ends the scan.
    while (*ch) {
        unsigned remaining = (unsigned)kUTF8OffsetValues[*ch];

        // Advance one byte at a time instead of jumping by the whole
        // offset, so that a sequence cut short by the terminator cannot
        // carry the pointer past the end of the buffer.
        do {
            ch++;
            remaining--;
        } while (remaining > 0 && *ch);

        ++length;
    }

    return length;
}
@end
|