Merge from origin/emacs-24

[gnu-emacs] / doc / lispref / text.texi
diff --git a/doc/lispref/text.texi b/doc/lispref/text.texi

index 27ea8bcbd91f9fc0da65456f3b382750a0b1b877..379fb295654da995c042492437065cc566734f3d 100644 (file)
--- a/doc/lispref/text.texi
+++ b/doc/lispref/text.texi
@@ -220,6 +220,12 @@ This function returns the contents of the entire accessible portion of
  the current buffer, as a string.
  @end defun
  
+  If you need to make sure the resulting string, when copied to a
+different location, will not change its visual appearance due to
+reordering of bidirectional text, use the
+@code{buffer-substring-with-bidi-context} function
+(@pxref{Bidirectional Display, buffer-substring-with-bidi-context}).
+
  @defun filter-buffer-substring start end &optional delete
  This function filters the buffer text between @var{start} and @var{end}
  using a function specified by the variable
@@ -3248,6 +3254,11 @@ possible to remove a @code{read-only} property unless you know the
  special trick: bind @code{inhibit-read-only} to a non-@code{nil} value
  and then remove the property.  @xref{Read Only Buffers}.
  
+@item inhibit-read-only
+@kindex inhibit-read-only @r{(text property)}
+If a character has the property @code{inhibit-read-only}, and the
+buffer is read-only, editing the character in question is allowed.
+
  @item invisible
  @kindex invisible @r{(text property)}
  A non-@code{nil} @code{invisible} property can make a character invisible
@@ -4123,8 +4134,9 @@ buffer.
  Normally, this command puts point before the inserted text, and the
  mark after it.  However, if the optional second argument @var{beforep}
  is non-@code{nil}, it puts the mark before and point after.
-You can pass a non-@code{nil} second argument @var{beforep} to this
-function interactively by supplying any prefix argument.
+
+When called interactively, the command defaults to putting point after
+text, and a prefix argument inverts this behavior.
  
  If the register contains a rectangle, then the rectangle is inserted
  with its upper left corner at point.  This means that text is inserted
@@ -4327,7 +4339,7 @@ coding instead.
  When Emacs is compiled with libxml2 support, the following functions
  are available to parse HTML or XML text into Lisp object trees.
  
-@defun libxml-parse-html-region start end &optional base-url
+@defun libxml-parse-html-region start end &optional base-url discard-comments
  This function parses the text between @var{start} and @var{end} as
  HTML, and returns a list representing the HTML @dfn{parse tree}.  It
  attempts to handle ``real world'' HTML by robustly coping with syntax
@@ -4336,6 +4348,9 @@ mistakes.
  The optional argument @var{base-url}, if non-@code{nil}, should be a
  string specifying the base URL for relative URLs occurring in links.
  
+If the optional argument @var{discard-comments} is non-@code{nil},
+then the parse tree is created without any comments.
+
  In the parse tree, each HTML node is represented by a list in which
  the first element is a symbol representing the node name, the second
  element is an alist of node attributes, and the remaining elements are
@@ -4349,16 +4364,17 @@ document:
  @end example
  
  @noindent
-A call to @code{libxml-parse-html-region} returns this:
+A call to @code{libxml-parse-html-region} returns this @acronym{DOM}
+(document object model):
  
  @example
-(html ()
-  (head ())
-  (body ((width . "101"))
-   (div ((class . "thing"))
-    "Foo"
-    (div ()
-      "Yes"))))
+(html nil
+ (head nil)
+ (body ((width . "101"))
+  (div ((class . "thing"))
+   "Foo"
+   (div nil
+    "Yes"))))
  @end example
  @end defun
  
@@ -4371,12 +4387,137 @@ buffer.  The argument @var{dom} should be a list as generated by
  @end defun
  
  @cindex parsing xml
-@defun libxml-parse-xml-region start end &optional base-url
+@defun libxml-parse-xml-region start end &optional base-url discard-comments
  This function is the same as @code{libxml-parse-html-region}, except
  that it parses the text as XML rather than HTML (so it is stricter
  about syntax).
  @end defun
  
+@menu
+* Document Object Model:: Access, manipulate and search the @acronym{DOM}.
+@end menu
+
+@node Document Object Model
+@subsection Document Object Model
+@cindex HTML DOM
+@cindex XML DOM
+@cindex DOM
+@cindex Document Object Model
+
+The @acronym{DOM} returned by @code{libxml-parse-html-region} (and the
+other @acronym{XML} parsing functions) is a tree structure where each
+node has a node name (called a @dfn{tag}), and optional key/value
+@dfn{attribute} list, and then a list of @dfn{child nodes}.  The child
+nodes are either strings or @acronym{DOM} objects.
+
+@example
+(body ((width . "101"))
+ (div ((class . "thing"))
+  "Foo"
+  (div nil
+   "Yes")))
+@end example
+
+@defun dom-node tag &optional attributes &rest children
+This function creates a @acronym{DOM} node of type @var{tag}.  If
+given, @var{attributes} should be a key/value pair list.
+If given, @var{children} should be @acronym{DOM} nodes.
+@end defun
+
+The following functions can be used to work with this structure.  Each
+function takes a @acronym{DOM} node, or a list of nodes.  In the
+latter case, only the first node in the list is used.
+
+Simple accessors:
+
+@table @code
+@item dom-tag @var{node}
+Return the @dfn{tag} (also called ``node name'') of the node.
+
+@item dom-attr @var{node} @var{attribute}
+Return the value of @var{attribute} in the node.  A common usage
+would be:
+
+@lisp
+(dom-attr img 'href)
+=> "http://fsf.org/logo.png"
+@end lisp
+
+@item dom-children @var{node}
+Return all the children of the node.
+
+@item dom-non-text-children @var{node}
+Return all the non-string children of the node.
+
+@item dom-attributes @var{node}
+Return the key/value pair list of attributes of the node.
+
+@item dom-text @var{node}
+Return all the textual elements of the node as a concatenated string.
+
+@item dom-texts @var{node}
+Return all the textual elements of the node, as well as the textual
+elements of all the children of the node, recursively, as a
+concatenated string.  This function also takes an optional separator
+to be inserted between the textual elements.
+
+@item dom-parent @var{dom} @var{node}
+Return the parent of @var{node} in @var{dom}.
+@end table
+
+The following are functions for altering the @acronym{DOM}.
+
+@table @code
+@item dom-set-attribute @var{node} @var{attribute} @var{value}
+Set the @var{attribute} of the node to @var{value}.
+
+@item dom-append-child @var{node} @var{child}
+Append @var{child} as the last child of @var{node}.
+
+@item dom-add-child-before @var{node} @var{child} @var{before}
+Add @var{child} to @var{node}'s child list before the @var{before}
+node.  If @var{before} is @code{nil}, make @var{child} the first child.
+
+@item dom-set-attributes @var{node} @var{attributes}
+Replace all the attributes of the node with a new key/value list.
+@end table
+
+The following are functions for searching for elements in the
+@acronym{DOM}.  They all return lists of matching nodes.
+
+@table @code
+@item dom-by-tag @var{dom} @var{tag}
+Return all nodes in @var{dom} that are of type @var{tag}.  A typical
+use would be:
+
+@lisp
+(dom-by-tag dom 'td)
+=> '((td ...) (td ...) (td ...))
+@end lisp
+
+@item dom-by-class @var{dom} @var{match}
+Return all nodes in @var{dom} that have class names that match
+@var{match}, which is a regular expression.
+
+@item dom-by-style @var{dom} @var{style}
+Return all nodes in @var{dom} that have styles that match @var{match},
+which is a regular expression.
+
+@item dom-by-id @var{dom} @var{style}
+Return all nodes in @var{dom} that have IDs that match @var{match},
+which is a regular expression.
+
+@end table
+
+Utility functions:
+
+@table @code
+@item dom-pp @var{dom} &optional @var{remove-empty}
+Pretty-print @var{dom} at point.  If @var{remove-empty}, don't print
+textual nodes that just contain white-space.
+@end table
+
+
  @node Atomic Changes
  @section Atomic Change Groups
  @cindex atomic changes