summaryrefslogtreecommitdiff
path: root/lisp/dom.el
diff options
context:
space:
mode:
authorLars Magne Ingebrigtsen <larsi@gnus.org>2014-11-26 19:39:49 +0100
committerLars Magne Ingebrigtsen <larsi@gnus.org>2014-11-26 19:42:29 +0100
commit115178cd46b10383a12bd865739d0d55eea20251 (patch)
tree378d42edbcee5494d69ed1ab7a72c7e486b65153 /lisp/dom.el
parent549a1bae4a54c56c4c8d212f1441ac44aac89a4b (diff)
downloademacs-115178cd46b10383a12bd865739d0d55eea20251.tar.gz
* dom.el: New file.
Diffstat (limited to 'lisp/dom.el')
-rw-r--r--lisp/dom.el176
1 files changed, 176 insertions, 0 deletions
diff --git a/lisp/dom.el b/lisp/dom.el
new file mode 100644
index 00000000000..3157e0b2f2a
--- /dev/null
+++ b/lisp/dom.el
@@ -0,0 +1,176 @@
+;;; dom.el --- XML/HTML (etc.) DOM manipulation and searching functions
+
+;; Copyright (C) 2014 Free Software Foundation, Inc.
+
+;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
+;; Keywords: xml, html
+
+;; This file is part of GNU Emacs.
+
+;; GNU Emacs is free software: you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation, either version 3 of the License, or
+;; (at your option) any later version.
+
+;; GNU Emacs is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
+
+;;; Commentary:
+
+;;; Code:
+
+(require 'cl-lib)
+
+(defsubst dom-tag (node)
+ "Return the NODE tag."
+ ;; Called on a list of nodes. Use the first.
+ (if (consp (car node))
+ (caar node)
+ (car node)))
+
+(defsubst dom-attributes (node)
+ "Return the NODE attributes."
+ ;; Called on a list of nodes. Use the first.
+ (if (consp (car node))
+ (cadr (car node))
+ (cadr node)))
+
+(defsubst dom-children (node)
+ "Return the NODE children."
+ ;; Called on a list of nodes. Use the first.
+ (if (consp (car node))
+ (cddr (car node))
+ (cddr node)))
+
+(defun dom-set-attributes (node attributes)
+ "Set the attributes of NODE to ATTRIBUTES."
+ (setq node (dom-ensure-node node))
+ (setcar (cdr node) attributes))
+
+(defun dom-set-attribute (node attribute value)
+ "Set ATTRIBUTE in NODE to VALUE."
+ (setq node (dom-ensure-node node))
+ (let ((old (assoc attribute (cadr node))))
+ (if old
+ (setcdr old value)
+ (setcar (cdr node) (nconc (cadr node) (list (cons attribute value)))))))
+
+(defmacro dom-attr (node attr)
+ "Return the attribute ATTR from NODE.
+A typical attribute is `href'."
+ `(cdr (assq ,attr (dom-attributes ,node))))
+
+(defun dom-text (node)
+ "Return all the text bits in the current node concatenated."
+ (mapconcat 'identity (cl-remove-if-not 'stringp (dom-children node)) " "))
+
+(defun dom-texts (node &optional separator)
+ "Return all textual data under NODE concatenated with SEPARATOR in-between."
+ (mapconcat
+ 'identity
+ (mapcar
+ (lambda (elem)
+ (if (stringp elem)
+ elem
+ (dom-texts elem separator)))
+ (dom-children node))
+ (or separator " ")))
+
+(defun dom-child-by-tag (dom tag)
+ "Return the first child of DOM that is of type TAG."
+ (assoc tag (dom-children dom)))
+
+(defun dom-by-tag (dom tag)
+ "Return elements in DOM that is of type TAG.
+A name is a symbol like `td'."
+ (let ((matches (cl-loop for child in (dom-children dom)
+ for matches = (and (not (stringp child))
+ (dom-by-tag child tag))
+ when matches
+ append matches)))
+ (if (eq (dom-tag dom) tag)
+ (cons dom matches)
+ matches)))
+
+(defun dom-by-class (dom match)
+ "Return elements in DOM that have a class name that matches regexp MATCH."
+ (dom-elements dom 'class match))
+
+(defun dom-by-style (dom match)
+ "Return elements in DOM that have a style that matches regexp MATCH."
+ (dom-elements dom 'style match))
+
+(defun dom-by-id (dom match)
+ "Return elements in DOM that have an ID that matches regexp MATCH."
+ (dom-elements dom 'id match))
+
+(defun dom-elements (dom attribute match)
+ "Find elements matching MATCH (a regexp) in ATTRIBUTE.
+ATTRIBUTE would typically be `class', `id' or the like."
+ (let ((matches (cl-loop for child in (dom-children dom)
+ for matches = (dom-elements child attribute match)
+ when matches
+ append matches))
+ (attr (dom-attr dom attribute)))
+ (if (and attr
+ (string-match match attr))
+ (cons dom matches)
+ matches)))
+
+(defun dom-parent (dom node)
+ "Return the parent of NODE in DOM."
+ (if (memq node (dom-children dom))
+ dom
+ (let ((result nil))
+ (dolist (elem (dom-children dom))
+ (when (and (not result)
+ (not (stringp elem)))
+ (setq result (dom-parent elem node))))
+ result)))
+
+(defun dom-node (tag &optional attributes &rest children)
+ "Return a DOM node with TAG and ATTRIBUTES."
+ (if children
+ `(,tag ,attributes ,@children)
+ (list tag attributes)))
+
+(defun dom-append-child (node child)
+ "Append CHILD to the end of NODE's children."
+ (setq node (dom-ensure-node node))
+ (nconc node (list child)))
+
+(defun dom-add-child-before (node child &optional before)
+ "Add CHILD to NODE's children before child BEFORE.
+If BEFORE is nil, make CHILD NODE's first child."
+ (setq node (dom-ensure-node node))
+ (let ((children (dom-children node)))
+ (when (and before
+ (not (memq before children)))
+ (error "%s does not exist as a child" before))
+ (let ((pos (if before
+ (cl-position before children)
+ 0)))
+ (if (zerop pos)
+ ;; First child.
+ (setcdr (cdr node) (cons child (cddr node)))
+ (setcdr (nthcdr (1- pos) children)
+ (cons child (nthcdr pos children))))))
+ node)
+
+(defun dom-ensure-node (node)
+ "Ensure that NODE is a proper DOM node."
+ ;; Add empty attributes, if none.
+ (when (consp (car node))
+ (setq node (car node)))
+ (when (= (length node) 1)
+ (setcdr node (list nil)))
+ node)
+
+(provide 'dom)
+
+;;; dom.el ends here