Python 将 HTML 文件转成指定的编码
# Convert the HTML file "test.html" to utf-8 with Chilkat's CkCharset
# component, writing the result to "test_utf8.html".
#
# On any failure the component's last error text is printed and the script
# exits with a non-zero status so that calling shells/tools can detect it.
import sys

import chilkat

charset = chilkat.CkCharset()

# Any string argument automatically begins the 30-day trial.
success = charset.UnlockComponent("30-day trial")
if not success:
    print(charset.lastErrorText())
    # A bare sys.exit() would report status 0 (success); signal the failure.
    sys.exit(1)

# If the charset is not specified within an HTML META tag,
# then assume it's iso-8859-1 (i.e. ANSI for Western-European languages)
charset.put_FromCharset("iso-8859-1")

# Convert to utf-8. The file is converted, and the
# HTML META tag is updated to indicate utf-8.
charset.put_ToCharset("utf-8")

# Convert the HTML file:
success = charset.ConvertHtmlFile("test.html", "test_utf8.html")
if not success:
    print(charset.lastErrorText())
    # Propagate the conversion failure through the exit status as well.
    sys.exit(1)

print("Success")
Python 将 HTML 文件转成指定的编码