From de65bec43448bd09bc85f40076cc4732d683b7e3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A9rome=20Perrin?= <jerome@nexedi.com> Date: Wed, 2 Apr 2014 18:34:17 +0200 Subject: [PATCH] html to text: configure w3m not to use ascii equivalent for entities --- product/PortalTransforms/transforms/w3m_dump.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/product/PortalTransforms/transforms/w3m_dump.py b/product/PortalTransforms/transforms/w3m_dump.py index bd8f434a97..0f7d10f461 100644 --- a/product/PortalTransforms/transforms/w3m_dump.py +++ b/product/PortalTransforms/transforms/w3m_dump.py @@ -44,7 +44,7 @@ class w3m_dump(subprocesstransform): __version__ = '2008.07.11-1' binaryName = "w3m" - binaryArgs = "-dump -T text/html -o document_charset=utf-8 -o display_charset=utf-8 -o ignore_null_img_alt=0 " + binaryArgs = "-dump -T text/html -o alt_entity=0 -o document_charset=utf-8 -o display_charset=utf-8 -o ignore_null_img_alt=0 " useStdin = True -- 2.30.9