(set-buffer (get-file-buffer file))
(setq keep (point)))
(find-file file))
-
+
(let ((xml (xml-parse-region (point-min)
(point-max)
(current-buffer)
;; beginning of a document)
((looking-at "<\\?")
(search-forward "?>" end)
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
(xml-parse-tag end))
;; Character data (CDATA) sections, in which no tag should be interpreted
((looking-at "<!\\[CDATA\\[")
(if parse-dtd
(setq dtd (xml-parse-dtd end))
(xml-skip-dtd end))
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
(if dtd
(cons dtd (xml-parse-tag end))
(xml-parse-tag end))))
((looking-at "</")
'())
;; opening tag
- ((looking-at "<\\([^/> \t\n]+\\)")
+ ((looking-at "<\\([^/>[:space:]]+\\)")
(goto-char (match-end 1))
(let* ((case-fold-search nil) ;; XML is case-sensitive.
(node-name (match-string 1))
pos)
;; is this an empty element ?
- (if (looking-at "/>")
+ (if (looking-at "/[[:space:]]*>")
(progn
(forward-char 2)
(nreverse (cons '("") children)))
(forward-char 1)
;; Now check that we have the right end-tag. Note that this
;; one might contain spaces after the tag name
- (while (not (looking-at (concat "</" node-name "[ \t\n]*>")))
+ (while (not (looking-at (concat "</" node-name "[[:space:]]*>")))
(cond
((looking-at "</")
(error (concat
(forward-char -1)
(let ((string (buffer-substring-no-properties pos (point)))
(pos 0))
-
+
;; Clean up the string (no newline characters)
;; Not done, since as per XML specifications, the XML processor
;; should always pass the whole string to the application.
Leaves the point on the first non-blank character after the tag."
(let ((attlist ())
name)
- (skip-chars-forward " \t\n")
- (while (looking-at "\\([a-zA-Z_:][-a-zA-Z0-9._:]*\\)[ \t\n]*=[ \t\n]*")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
+ (while (looking-at "\\([a-zA-Z_:][-a-zA-Z0-9._:]*\\)[[:space:]]*=[[:space:]]*")
(setq name (intern (match-string 1)))
(goto-char (match-end 0))
;; Do we have a string between quotes (or double-quotes),
;; or a simple word ?
- (unless (looking-at "\"\\([^\"]+\\)\"")
- (unless (looking-at "'\\([^']+\\)'")
+ (unless (looking-at "\"\\([^\"]*\\)\"")
+ (unless (looking-at "'\\([^']*\\)'")
(error "XML: Attribute values must be given between quotes")))
;; Each attribute must be unique within a given element
(if (assoc name attlist)
(error "XML: each attribute must be unique within an element"))
-
+
(push (cons name (match-string-no-properties 1)) attlist)
(goto-char (match-end 0))
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
(if (> (point) end)
(error "XML: end of attribute list not found before end of region"))
)
The point must be just before the starting tag of the DTD.
This follows the rule [28] in the XML specifications."
(forward-char (length "<!DOCTYPE"))
- (if (looking-at "[ \t\n]*>")
+ (if (looking-at "[[:space:]]*>")
(error "XML: invalid DTD (excepting name of the document)"))
(condition-case nil
(progn
(forward-word 1) ;; name of the document
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
(if (looking-at "\\[")
- (re-search-forward "\\][ \t\n]*>" end)
+ (re-search-forward "\\][[:space:]]*>" end)
(search-forward ">" end)))
(error (error "XML: No end to the DTD"))))
"Parse the DTD that point is looking at.
The DTD must end before the position END in the current buffer."
(forward-char (length "<!DOCTYPE"))
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
(if (looking-at ">")
(error "XML: invalid DTD (excepting name of the document)"))
-
+
;; Get the name of the document
(looking-at "\\sw+")
(let ((dtd (list (match-string-no-properties 0) 'dtd))
type element end-pos)
(goto-char (match-end 0))
- (skip-chars-forward " \t\n")
+ (goto-char (- (re-search-forward "[^[:space:]]") 1))
;; External DTDs => don't know how to handle them yet
(if (looking-at "SYSTEM")
(error "XML: Don't know how to handle external DTDs"))
-
+
(if (not (= (char-after) ?\[))
(error "XML: Unknown declaration in the DTD"))
;; Parse the rest of the DTD
(forward-char 1)
- (while (and (not (looking-at "[ \t\n]*\\]"))
+ (while (and (not (looking-at "[[:space:]]*\\]"))
(<= (point) end))
(cond
;; Translation of rule [45] of XML specifications
((looking-at
- "[\t \n]*<!ELEMENT[ \t\n]+\\([a-zA-Z0-9.%;]+\\)[ \t\n]+\\([^>]+\\)>")
+ "[[:space:]]*<!ELEMENT[[:space:]]+\\([a-zA-Z0-9.%;]+\\)[[:space:]]+\\([^>]+\\)>")
(setq element (intern (match-string-no-properties 1))
type (match-string-no-properties 2))
(setq end-pos (match-end 0))
-
+
;; Translation of rule [46] of XML specifications
(cond
- ((string-match "^EMPTY[ \t\n]*$" type) ;; empty declaration
+ ((string-match "^EMPTY[[:space:]]*$" type) ;; empty declaration
(setq type 'empty))
- ((string-match "^ANY[ \t\n]*$" type) ;; any type of contents
+ ((string-match "^ANY[[:space:]]*$" type) ;; any type of contents
(setq type 'any))
- ((string-match "^(\\(.*\\))[ \t\n]*$" type) ;; children ([47])
+ ((string-match "^(\\(.*\\))[[:space:]]*$" type) ;; children ([47])
(setq type (xml-parse-elem-type (match-string-no-properties 1 type))))
- ((string-match "^%[^;]+;[ \t\n]*$" type) ;; substitution
+ ((string-match "^%[^;]+;[[:space:]]*$" type) ;; substitution
nil)
(t
(error "XML: Invalid element type in the DTD")))
(if (assoc element dtd)
(error "XML: elements declaration must be unique in a DTD (<%s>)"
(symbol-name element)))
-
+
;; Store the element in the DTD
(push (list element type) dtd)
(goto-char end-pos))
(mapcar 'xml-parse-elem-type
(split-string elem ","))))
)))
- (if (string-match "[ \t\n]*\\([^+*?]+\\)\\([+*?]?\\)" string)
+ (if (string-match "[[:space:]]*\\([^+*?]+\\)\\([+*?]?\\)" string)
(setq elem (match-string 1 string)
modifier (match-string 2 string))))
(if (and (stringp elem) (string= elem "#PCDATA"))
(setq elem 'pcdata))
-
+
(cond
((string= modifier "+")
(list '+ elem))
(defun xml-substitute-special (string)
  "Return STRING, after substituting special XML sequences.
The five predefined XML entity references &lt;, &gt;, &apos;, &quot;
and &amp; are replaced by the characters they stand for.  Every other
part of STRING, including unknown references, is left unchanged.

STRING is scanned exactly once, so text produced by one replacement is
never decoded a second time: the input &amp;lt; yields the text &lt;
and not the character <."
  (replace-regexp-in-string
   "&\\(amp\\|lt\\|gt\\|apos\\|quot\\);"
   (lambda (reference)
     ;; REFERENCE is the whole match, e.g. "&lt;"; strip the leading
     ;; "&" and the trailing ";" to get the entity name.  The name is
     ;; downcased because the match itself honours `case-fold-search'.
     (cdr (assoc (downcase (substring reference 1 -1))
                 '(("amp" . "&")
                   ("lt" . "<")
                   ("gt" . ">")
                   ("apos" . "'")
                   ("quot" . "\"")))))
   string
   ;; FIXEDCASE and LITERAL: insert the replacement verbatim.
   t t))
;;*******************************************************************
(let ((tree xml)
attlist)
(insert indent-string "<" (symbol-name (xml-node-name tree)))
-
+
;; output the attribute list
(setq attlist (xml-node-attributes tree))
(while attlist
(insert " ")
(insert (symbol-name (caar attlist)) "=\"" (cdar attlist) "\"")
(setq attlist (cdr attlist)))
-
+
(insert ">")
-
+
(setq tree (xml-node-children tree))
;; output the children