summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Christine Koppelt <ch.ko123@googlemail.com> 2013-04-27 13:32:59 +0200
committer Christine Koppelt <ch.ko123@googlemail.com> 2013-04-27 13:32:59 +0200
commit 9d461351349ce5bfa5706cbe6dede4db403cd3a3 (patch)
tree e78180a1523b90e88d95a94ee37b97bd3fdff1bc
parent 524b97999c8e6cfdc80c32fc4e84c3cb685dbadc (diff)
download python-lxml-9d461351349ce5bfa5706cbe6dede4db403cd3a3.tar.gz
slightly extended documentation
-rw-r--r-- src/lxml/html/clean.py 5
1 files changed, 4 insertions, 1 deletions
diff --git a/src/lxml/html/clean.py b/src/lxml/html/clean.py
index 4a6912f0..2bdb76bf 100644
--- a/src/lxml/html/clean.py
+++ b/src/lxml/html/clean.py
@@ -97,7 +97,8 @@ class Cleaner(object):
Removes any ``<script>`` tags.
``javascript``:
- Removes any Javascript, like an ``onclick`` attribute.
+ Removes any Javascript, like an ``onclick`` attribute. Also removes stylesheets
+ as they could contain Javascript.
``comments``:
Removes any comments.
@@ -166,6 +167,8 @@ class Cleaner(object):
Note that this parameter might not work as intended if you do not
make the links absolute before doing the cleaning.
+ Note that you may also need to set ``whitelist_tags``.
+
``whitelist_tags``:
A set of tags that can be included with ``host_whitelist``.
The default is ``iframe`` and ``embed``; you may wish to