File: unichar.py

package info (click to toggle)
pypy 7.0.0%2Bdfsg-3
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 107,216 kB
  • sloc: python: 1,201,787; ansic: 62,419; asm: 5,169; cpp: 3,017; sh: 2,534; makefile: 545; xml: 243; lisp: 45; awk: 4
file content (54 lines) | stat: -rw-r--r-- 1,751 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
"""
Helpers to pack and unpack a unicode character into raw bytes.
"""

import sys
from rpython.rlib.runicode import MAXUNICODE

# Number of raw bytes used for one unicode character: 2 when every code
# point fits in 16 bits (MAXUNICODE <= 65535), otherwise 4.
UNICODE_SIZE = 2 if MAXUNICODE <= 65535 else 4
# True when sys.byteorder reports "big", i.e. most significant byte first.
BIGENDIAN = (sys.byteorder == "big")

def pack_unichar(unich, buf, pos):
    """Store the code point of 'unich' into 'buf' as raw bytes.

    UNICODE_SIZE one-character strings are written with buf.setitem(),
    at indices pos, pos+1, ... in that order.  BIGENDIAN selects whether
    the most significant or the least significant byte is written first.
    """
    code = ord(unich)
    if UNICODE_SIZE == 2:
        low = code & 0xFF
        high = code >> 8      # passed to chr() unmasked
        if BIGENDIAN:
            first, second = high, low
        else:
            first, second = low, high
        buf.setitem(pos, chr(first))
        buf.setitem(pos + 1, chr(second))
        return

    # 4-byte layout: b0 is the least significant byte, b3 the most
    # significant one (b3 is passed to chr() unmasked).
    b0 = code & 0xFF
    b1 = (code >> 8) & 0xFF
    b2 = (code >> 16) & 0xFF
    b3 = code >> 24
    if BIGENDIAN:
        buf.setitem(pos, chr(b3))
        buf.setitem(pos + 1, chr(b2))
        buf.setitem(pos + 2, chr(b1))
        buf.setitem(pos + 3, chr(b0))
    else:
        buf.setitem(pos, chr(b0))
        buf.setitem(pos + 1, chr(b1))
        buf.setitem(pos + 2, chr(b2))
        buf.setitem(pos + 3, chr(b3))

def unpack_unichar(rawstring):
    """Rebuild a unicode character from its raw byte representation.

    'rawstring' must contain exactly UNICODE_SIZE characters; their
    ordinals are combined according to BIGENDIAN and the resulting
    integer is turned into a character with unichr().
    """
    assert len(rawstring) == UNICODE_SIZE
    code = 0
    if BIGENDIAN:
        # Most significant byte first: shift what we have, append the next.
        for index in range(UNICODE_SIZE):
            code = (code << 8) | ord(rawstring[index])
    else:
        # Least significant byte first: byte i contributes bits 8*i and up.
        for index in range(UNICODE_SIZE):
            code |= ord(rawstring[index]) << (8 * index)
    return unichr(code)