1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
|
#cython: c_string_type = unicode
#cython: c_string_encoding = ascii
auto_string_type = unicode
from libc.string cimport strcmp
def _as_string(x):
try:
return x.decode('latin1')
except AttributeError:
return x
def as_objects(char* ascii_data):
"""
>>> x = as_objects('abc')
>>> isinstance(x, auto_string_type) or type(x)
True
>>> _as_string(x) == 'abc' or repr(x)
True
"""
assert isinstance(<object>ascii_data, auto_string_type)
assert isinstance(<bytes>ascii_data, bytes)
assert isinstance(<str>ascii_data, str)
assert isinstance(<unicode>ascii_data, unicode)
return ascii_data
def from_object():
"""
>>> from_object()
"""
cdef bytes b = b"abc"
cdef str s = "abc"
cdef unicode u = u"abc"
assert strcmp(<char*>b, "abc") == 0
assert strcmp(<char*>s, "abc") == 0
assert strcmp(<char*>u, "abc") == 0
def slice_as_objects(char* ascii_data, int start, int end):
"""
>>> x = slice_as_objects('grok', 1, 3)
>>> isinstance(x, auto_string_type) or type(x)
True
>>> _as_string(x) == 'ro' or repr(x)
True
"""
assert isinstance(<object>ascii_data[start:end], auto_string_type)
assert isinstance(<bytes>ascii_data[start:end], bytes)
assert isinstance(<str>ascii_data[start:end], str)
assert isinstance(<unicode>ascii_data[start:end], unicode)
assert isinstance(<object>ascii_data[start:], auto_string_type)
assert isinstance(<bytes>ascii_data[start:], bytes)
assert isinstance(<str>ascii_data[start:], str)
assert isinstance(<unicode>ascii_data[start:], unicode)
return ascii_data[start:end]
|