Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
erp5
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kasra Jamshidi
erp5
Commits
c73b4e5f
Commit
c73b4e5f
authored
Sep 15, 2011
by
Nicolas Delaby
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Check trustability of given encoding, otherwise guess a better one
Use helper function to test given encoding
parent
dd95b33a
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
29 additions
and
38 deletions
+29
-38
product/ERP5/Document/EmailDocument.py
product/ERP5/Document/EmailDocument.py
+29
-38
No files found.
product/ERP5/Document/EmailDocument.py
View file @
c73b4e5f
...
@@ -230,20 +230,7 @@ class EmailDocument(TextDocument):
...
@@ -230,20 +230,7 @@ class EmailDocument(TextDocument):
'Failed to decode %s header of %s with error: %s'
%
'Failed to decode %s header of %s with error: %s'
%
(
name
,
self
.
getPath
(),
error_message
))
(
name
,
self
.
getPath
(),
error_message
))
for
text
,
encoding
in
decoded_header
:
for
text
,
encoding
in
decoded_header
:
try
:
text
,
encoding
=
testCharsetAndConvert
(
text
,
'text/plain'
,
encoding
)
if
encoding
is
not
None
:
text
=
text
.
decode
(
encoding
).
encode
(
'utf-8'
)
else
:
text
=
text
.
decode
().
encode
(
'utf-8'
)
except
(
UnicodeDecodeError
,
LookupError
),
error_message
:
encoding
=
guessEncodingFromText
(
text
,
content_type
=
'text/plain'
)
if
encoding
is
not
None
:
try
:
text
=
text
.
decode
(
encoding
).
encode
(
'utf-8'
)
except
(
UnicodeDecodeError
,
LookupError
),
error_message
:
text
=
repr
(
text
)[
1
:
-
1
]
else
:
text
=
repr
(
text
)[
1
:
-
1
]
if
name
in
result
:
if
name
in
result
:
result
[
name
]
=
'%s %s'
%
(
result
[
name
],
text
)
result
[
name
]
=
'%s %s'
%
(
result
[
name
],
text
)
else
:
else
:
...
@@ -322,9 +309,15 @@ class EmailDocument(TextDocument):
...
@@ -322,9 +309,15 @@ class EmailDocument(TextDocument):
RESPONSE
.
setHeader
(
'Content-disposition'
,
RESPONSE
.
setHeader
(
'Content-disposition'
,
'attachment; filename="%s"'
%
filename
)
'attachment; filename="%s"'
%
filename
)
if
'text/html'
in
content_type
:
if
'text/html'
in
content_type
:
part_encoding
=
part
.
get_content_charset
()
message_text
=
part
.
get_payload
(
decode
=
1
)
text_result
,
encoding
=
testCharsetAndConvert
(
message_text
,
content_type
,
part_encoding
)
# Strip out html content in safe mode.
# Strip out html content in safe mode.
mime
,
content
=
self
.
convert
(
format
=
'html'
,
mime
,
content
=
self
.
convert
(
format
=
'html'
,
text_content
=
part
.
get_payload
(
decode
=
1
),
text_content
=
text_result
,
encoding
=
part_encoding
,
index
=
index
)
# add index to generate
index
=
index
)
# add index to generate
# a unique cache key per attachment
# a unique cache key per attachment
else
:
else
:
...
@@ -465,32 +458,13 @@ class EmailDocument(TextDocument):
...
@@ -465,32 +458,13 @@ class EmailDocument(TextDocument):
else
:
else
:
part_encoding
=
part
.
get_content_charset
()
part_encoding
=
part
.
get_content_charset
()
message_text
=
part
.
get_payload
(
decode
=
1
)
message_text
=
part
.
get_payload
(
decode
=
1
)
text_result
,
encoding
=
testCharsetAndConvert
(
message_text
,
part
.
get_content_type
(),
part_encoding
)
if
part
.
get_content_type
()
==
'text/html'
:
if
part
.
get_content_type
()
==
'text/html'
:
mime
,
text_result
=
self
.
convert
(
format
=
'html'
,
mime
,
text_result
=
self
.
convert
(
format
=
'html'
,
text_content
=
message_tex
t
,
text_content
=
text_resul
t
,
charset
=
part_encoding
)
charset
=
part_encoding
)
else
:
if
part_encoding
!=
'utf-8'
:
try
:
if
part_encoding
is
not
None
:
text_result
=
message_text
.
decode
(
part_encoding
).
encode
(
'utf-8'
)
else
:
text_result
=
message_text
.
decode
().
encode
(
'utf-8'
)
except
(
UnicodeDecodeError
,
LookupError
),
error_message
:
LOG
(
'EmailDocument.getTextContent'
,
INFO
,
'Failed to decode %s TEXT message of %s with error: %s'
%
(
part_encoding
,
self
.
getPath
(),
error_message
))
codec
=
guessEncodingFromText
(
message_text
,
content_type
=
part
.
get_content_type
())
if
codec
is
not
None
:
try
:
text_result
=
message_text
.
decode
(
codec
).
encode
(
'utf-8'
)
except
(
UnicodeDecodeError
,
LookupError
):
text_result
=
repr
(
message_text
)
else
:
text_result
=
repr
(
message_text
)
else
:
text_result
=
message_text
if
default
is
_MARKER
:
if
default
is
_MARKER
:
return
text_result
return
text_result
...
@@ -765,3 +739,20 @@ class EmailDocument(TextDocument):
...
@@ -765,3 +739,20 @@ class EmailDocument(TextDocument):
# getData must be implemented like File.getData is.
# getData must be implemented like File.getData is.
security.declareProtected(Permissions.AccessContentsInformation, '
getData
')
security.declareProtected(Permissions.AccessContentsInformation, '
getData
')
getData = File.getData
getData = File.getData
def testCharsetAndConvert(text_content, content_type, encoding):
    """Re-encode text_content as UTF-8, checking that encoding really fits.

    The declared encoding is tried first. If it does not decode the text,
    or is not a known codec, guessEncodingFromText is asked for a
    replacement based on the text and its content type.

    Parameters:
      text_content -- the raw text to convert; it must provide .decode()
                      (presumably a byte string -- confirm against callers).
      content_type -- content type forwarded to guessEncodingFromText.
      encoding     -- declared charset name, or None when none is declared.

    Returns a (text_content, encoding) tuple:
      * declared encoding works: UTF-8 re-encoded text and the encoding
        unchanged (None stays None).
      * declared encoding fails, guess works: UTF-8 re-encoded text and the
        guessed encoding.
      * guess is None or also fails: repr() of the original text with its
        first and last characters removed, and whatever the guess was
        (possibly None).
    """
    try:
        if encoding is not None:
            text_content = text_content.decode(encoding).encode('utf-8')
        else:
            # No charset declared: fall back on the default codec of decode().
            text_content = text_content.decode().encode('utf-8')
    except (UnicodeDecodeError, LookupError):
        # UnicodeDecodeError: the text does not fit the declared charset.
        # LookupError: the declared charset name is not a known codec.
        # text_content is still the original input here, because the
        # assignment above never completed.
        encoding = guessEncodingFromText(text_content, content_type)
        if encoding is not None:
            try:
                text_content = text_content.decode(encoding).encode('utf-8')
            except (UnicodeDecodeError, LookupError):
                # The guess did not work either: keep an escaped rendering.
                # NOTE(review): [1:-1] drops the surrounding quotes of a
                # Python 2 str repr; a Python 3 bytes repr has a leading
                # "b" prefix, so this slice would need revisiting there.
                text_content = repr(text_content)[1:-1]
        else:
            # Nothing could be guessed: same escaped rendering as above.
            text_content = repr(text_content)[1:-1]
    return text_content, encoding
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment