Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Labels
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Commits
Open sidebar
nexedi
cython
Commits
6a9d1db4
Commit
6a9d1db4
authored
Apr 19, 2019
by
Stefan Behnel
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Update test_unicode.py from Py3.8.
parent
97b9193a
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
26 additions
and
22 deletions
+26
-22
tests/run/test_unicode.pyx
tests/run/test_unicode.pyx
+26
-22
No files found.
tests/run/test_unicode.pyx
View file @
6a9d1db4
...
...
@@ -1666,6 +1666,11 @@ class UnicodeTest(CommonTest,
for
c
in
set_o
:
self
.
assertEqual
(
c
.
encode
(
'ascii'
).
decode
(
'utf7'
),
c
)
if
sys
.
version_info
>=
(
3
,
8
):
with
self
.
assertRaisesRegex
(
UnicodeDecodeError
,
'ill-formed sequence'
):
b'+@'
.
decode
(
'utf-7'
)
def
test_codecs_utf8
(
self
):
self
.
assertEqual
(
''
.
encode
(
'utf-8'
),
b''
)
self
.
assertEqual
(
'
\
u20ac
'
.
encode
(
'utf-8'
),
b'
\
xe2
\
x82
\
xac
'
)
...
...
@@ -1771,7 +1776,7 @@ class UnicodeTest(CommonTest,
# Issue #8271: during the decoding of an invalid UTF-8 byte sequence,
# only the start byte and the continuation byte(s) are now considered
# invalid, instead of the number of bytes specified by the start byte.
# See http
s
://www.unicode.org/versions/Unicode5.2.0/ch03.pdf (page 95,
# See http://www.unicode.org/versions/Unicode5.2.0/ch03.pdf (page 95,
# table 3-8, Row 2) for more information about the algorithm used.
FFFD
=
'
\
ufffd
'
sequences
=
[
...
...
@@ -2136,11 +2141,7 @@ class UnicodeTest(CommonTest,
u
=
chr
(
c
)
for
encoding
in
(
'utf-7'
,
'utf-8'
,
'utf-16'
,
'utf-16-le'
,
'utf-16-be'
,
'raw_unicode_escape'
,
'unicode_escape'
,
'unicode_internal'
):
with
warnings
.
catch_warnings
():
# unicode-internal has been deprecated
warnings
.
simplefilter
(
"ignore"
,
DeprecationWarning
)
'unicode_escape'
):
self
.
assertEqual
(
str
(
u
.
encode
(
encoding
),
encoding
),
u
)
# Roundtrip safety for BMP (just the first 256 chars)
...
...
@@ -2157,13 +2158,9 @@ class UnicodeTest(CommonTest,
# Roundtrip safety for non-BMP (just a few chars)
with
warnings
.
catch_warnings
():
# unicode-internal has been deprecated
warnings
.
simplefilter
(
"ignore"
,
DeprecationWarning
)
u
=
'
\
U00010001
\
U00020002
\
U00030003
\
U00040004
\
U00050005
'
for
encoding
in
(
'utf-8'
,
'utf-16'
,
'utf-16-le'
,
'utf-16-be'
,
'raw_unicode_escape'
,
'unicode_escape'
,
'unicode_internal'
):
'raw_unicode_escape'
,
'unicode_escape'
):
self
.
assertEqual
(
str
(
u
.
encode
(
encoding
),
encoding
),
u
)
# UTF-8 must be roundtrip safe for all code points
...
...
@@ -2382,22 +2379,23 @@ class UnicodeTest(CommonTest,
self
.
assertEqual
(
args
[
0
],
text
)
self
.
assertEqual
(
len
(
args
),
1
)
@
unittest
.
skipIf
(
sys
.
version_info
<
(
3
,
8
),
'resize test requires Py3.8+'
)
@
support
.
cpython_only
def
test_resize
(
self
):
from
_testcapi
import
getargs_u
for
length
in
range
(
1
,
100
,
7
):
# generate a fresh string (refcount=1)
text
=
'a'
*
length
+
'b'
with
support
.
check_warnings
((
'unicode_internal codec has been '
'deprecated'
,
DeprecationWarning
)):
# fill wstr internal field
abc
=
text
.
encode
(
'unicode_internal'
)
self
.
assertEqual
(
abc
.
decode
(
'unicode_internal'
)
,
text
)
abc
=
getargs_u
(
text
)
self
.
assertEqual
(
abc
,
text
)
# resize text: wstr field must be cleared and then recomputed
text
+=
'c'
abcdef
=
text
.
encode
(
'unicode_internal'
)
abcdef
=
getargs_u
(
text
)
self
.
assertNotEqual
(
abc
,
abcdef
)
self
.
assertEqual
(
abcdef
.
decode
(
'unicode_internal'
)
,
text
)
self
.
assertEqual
(
abcdef
,
text
)
def
test_compare
(
self
):
# Issue #17615
...
...
@@ -2714,6 +2712,12 @@ class CAPITest(unittest.TestCase):
check_format('%.%s',
b'%.%s', b'abc')
# Issue #33817: empty strings
check_format('',
b'')
check_format('',
b'%s', b'')
# Test PyUnicode_AsWideChar()
@support.cpython_only
def test_aswidechar(self):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment