summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--lisp/ChangeLog7
-rw-r--r--lisp/xml.el37
-rw-r--r--test/ChangeLog4
-rw-r--r--test/automated/xml-parse-tests.el19
4 files changed, 59 insertions, 8 deletions
diff --git a/lisp/ChangeLog b/lisp/ChangeLog
index 58cb7e69688..dd136f5b053 100644
--- a/lisp/ChangeLog
+++ b/lisp/ChangeLog
@@ -1,3 +1,10 @@
+2012-07-03 Chong Yidong <cyd@gnu.org>
+
+ * xml.el: Protect parser against XML bombs.
+ (xml-entity-expansion-limit): New variable.
+ (xml-parse-string, xml-substitute-special): Use it.
+ (xml-parse-dtd): Avoid infloop if the DTD is not terminated.
+
2012-07-03 Glenn Morris <rgm@gnu.org>
* progmodes/bug-reference.el (bug-reference-bug-regexp):
diff --git a/lisp/xml.el b/lisp/xml.el
index a3e279b41bd..2595fd572f4 100644
--- a/lisp/xml.el
+++ b/lisp/xml.el
@@ -98,6 +98,13 @@
("amp" . "&#38;"))
"Alist mapping XML entities to their replacement text.")
+(defvar xml-entity-expansion-limit 20000
+ "The maximum size of entity reference expansions.
+If the size of the buffer increases by this many characters while
+expanding entity references in a segment of character data, the
+XML parser signals an error. Setting this to nil removes the
+limit (making the parser vulnerable to XML bombs).")
+
(defvar xml-parameter-entity-alist nil
"Alist of defined XML parametric entities.")
@@ -471,7 +478,7 @@ Return one of:
(while (not (looking-at end))
(cond
((eobp)
- (error "XML: (Not Well-Formed) End of buffer while reading element `%s'"
+ (error "XML: (Not Well-Formed) End of document while reading element `%s'"
node-name))
((looking-at "</")
(forward-char 2)
@@ -517,6 +524,8 @@ Leave point at the start of the next thing to parse. This
function can modify the buffer by expanding entity and character
references."
(let ((start (point))
+ ;; Keep track of the size of the rest of the buffer:
+ (old-remaining-size (- (buffer-size) (point)))
ref val)
(while (and (not (eobp))
(not (looking-at "<")))
@@ -557,7 +566,13 @@ references."
xml-validating-parser
(error "XML: (Validity) Undefined entity `%s'" ref))
(replace-match (cdr val) t t)
- (goto-char (match-beginning 0))))))
+ (goto-char (match-beginning 0))))
+ ;; Check for XML bombs.
+ (and xml-entity-expansion-limit
+ (> (- (buffer-size) (point))
+ (+ old-remaining-size xml-entity-expansion-limit))
+ (error "XML: Entity reference expansion \
+surpassed `xml-entity-expansion-limit'"))))
;; [2.11] Clean up line breaks.
(let ((end-marker (point-marker)))
(goto-char start)
@@ -689,6 +704,8 @@ This follows the rule [28] in the XML specifications."
(while (not (looking-at "\\s-*\\]"))
(skip-syntax-forward " ")
(cond
+ ((eobp)
+ (error "XML: (Well-Formed) End of document while reading DTD"))
;; Element declaration [45]:
((and (looking-at (eval-when-compile
(concat "<!ELEMENT\\s-+\\(" xml-name-re
@@ -797,9 +814,11 @@ This follows the rule [28] in the XML specifications."
(if (re-search-forward parameter-entity-re nil t)
(match-beginning 0)))))
- ;; Anything else:
+ ;; Anything else is garbage (ignored if not validating).
(xml-validating-parser
- (error "XML: (Validity) Invalid DTD item"))))
+ (error "XML: (Validity) Invalid DTD item"))
+ (t
+ (skip-chars-forward "^]"))))
(if (looking-at "\\s-*]>")
(goto-char (match-end 0))))
@@ -876,6 +895,7 @@ STRING is assumed to occur in an XML attribute value."
(let ((ref-re (eval-when-compile
(concat "&\\(?:#\\(x\\)?\\([0-9]+\\)\\|\\("
xml-name-re "\\)\\);")))
+ (strlen (length string))
children)
(while (string-match ref-re string)
(push (substring string 0 (match-beginning 0)) children)
@@ -891,7 +911,8 @@ STRING is assumed to occur in an XML attribute value."
(error "XML: (Validity) Undefined character `x%s'" ref))
(t xml-undefined-entity))
children)
- (setq string remainder))
+ (setq string remainder
+ strlen (length string)))
;; [4.4.5] Entity references are "included in literal".
;; Note that we don't need do anything special to treat
;; quotes as normal data characters.
@@ -900,7 +921,11 @@ STRING is assumed to occur in an XML attribute value."
(if xml-validating-parser
(error "XML: (Validity) Undefined entity `%s'" ref)
xml-undefined-entity))))
- (setq string (concat val remainder))))))
+ (setq string (concat val remainder)))
+ (and xml-entity-expansion-limit
+ (> (length string) (+ strlen xml-entity-expansion-limit))
+ (error "XML: Passed `xml-entity-expansion-limit' while expanding `&%s;'"
+ ref)))))
(mapconcat 'identity (nreverse (cons string children)) "")))
(defun xml-substitute-numeric-entities (string)
diff --git a/test/ChangeLog b/test/ChangeLog
index 3ff7124893a..1e77f972965 100644
--- a/test/ChangeLog
+++ b/test/ChangeLog
@@ -1,3 +1,7 @@
+2012-07-03 Chong Yidong <cyd@gnu.org>
+
+ * automated/xml-parse-tests.el (xml-parse-tests--bad-data): New.
+
2012-07-02 Chong Yidong <cyd@gnu.org>
* automated/xml-parse-tests.el (xml-parse-tests--data): More
diff --git a/test/automated/xml-parse-tests.el b/test/automated/xml-parse-tests.el
index ec3d7ca3065..ada9bbd4074 100644
--- a/test/automated/xml-parse-tests.el
+++ b/test/automated/xml-parse-tests.el
@@ -55,14 +55,29 @@
("<foo>&#38;amp;</foo>" . ((foo () "&amp;"))))
"Alist of XML strings and their expected parse trees.")
+(defvar xml-parse-tests--bad-data
+ '(;; XML bomb in content
+ "<!DOCTYPE foo [<!ENTITY lol \"lol\"><!ENTITY lol1 \"&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;\"><!ENTITY lol2 \"&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;\">]><foo>&lol2;</foo>"
+ ;; XML bomb in attribute value
+ "<!DOCTYPE foo [<!ENTITY lol \"lol\"><!ENTITY lol1 \"&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;&lol;\"><!ENTITY lol2 \"&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;&lol1;\">]><foo a=\"&lol2;\">!</foo>"
+ ;; Non-terminating DTD
+ "<!DOCTYPE foo [ <!ENTITY b \"B\"><!ENTITY abc \"a&b;c\">"
+ "<!DOCTYPE foo [ <!ENTITY b \"B\"><!ENTITY abc \"a&b;c\">asdf"
+ "<!DOCTYPE foo [ <!ENTITY b \"B\"><!ENTITY abc \"a&b;c\">asdf&abc;")
+ "List of XML strings that should signal an error in the parser")
+
(ert-deftest xml-parse-tests ()
"Test XML parsing."
(with-temp-buffer
(dolist (test xml-parse-tests--data)
(erase-buffer)
(insert (car test))
- (should (equal (cdr test)
- (xml-parse-region (point-min) (point-max)))))))
+ (should (equal (cdr test) (xml-parse-region))))
+ (let ((xml-entity-expansion-limit 50))
+ (dolist (test xml-parse-tests--bad-data)
+ (erase-buffer)
+ (insert test)
+ (should-error (xml-parse-region))))))
;; Local Variables:
;; no-byte-compile: t