如何使用javascript从特定的标签获取HTML文档中的所有textNodes?

问题描述:

如何在不使用 XPath 或 TreeWalker 的情况下(IE 不支持 XPath 和 TreeWalker),从一组特定的标签(例如 blockquote、em、h4、h6、p)中获取所有文本节点,并将它们放入单个数组中?请帮帮我……如果脚本只能在 IE 中运行也没关系。

How can I get all text nodes from a group of specific tags, say "blockquote, em, h4, h6, p", in a single array without using XPath or TreeWalker (IE doesn't support XPath or TreeWalker)? Please help me... It's OK if the script is IE-only.

以下代码将获取包含在匹配元素中的所有文本节点:

The following will get you all text nodes that are contained within a matching element:

/**
 * Collects every text node that lies inside (at any depth) an element whose
 * tag name appears in tagNamesArray, in document order.
 *
 * Uses only nodeType / nodeName / firstChild / nextSibling, so it does not
 * rely on XPath or TreeWalker.
 *
 * @param {Node} root - Node at which the walk starts. If root itself matches,
 *     its text descendants are included. A null/undefined root yields [].
 * @param {string[]} tagNamesArray - Tag names to match, case-insensitively.
 *     The names are inserted into a regular expression unescaped, so regex
 *     metacharacters in a name are interpreted as pattern syntax.
 * @returns {Node[]} The matching text nodes.
 */
function getTextNodes(root, tagNamesArray) {
    var textNodes = [];
    // Anchored alternation so "p" matches only <p>, not <pre> or <span>.
    var regex = new RegExp("^(" + tagNamesArray.join("|") + ")$", "i");

    function getNodes(node, insideMatchingElement) {
        if (node.nodeType === 3) {
            // Text node: keep it only when some ancestor matched.
            if (insideMatchingElement) {
                textNodes.push(node);
            }
        } else if (node.nodeType === 1) {
            // Once inside a matching element, every descendant stays "inside".
            var childrenInsideMatchingElement = insideMatchingElement || regex.test(node.nodeName);
            for (var child = node.firstChild; child; child = child.nextSibling) {
                getNodes(child, childrenInsideMatchingElement);
            }
        }
    }

    // document.body is null while a script in <head> runs, so tolerate a
    // missing root instead of throwing on node.nodeType.
    if (root) {
        getNodes(root, false);
    }
    return textNodes;
}

// Gather the text nodes under <body> that sit inside any of the listed tags.
var textNodes = getTextNodes(document.body, [
    "blockquote",
    "em",
    "h4",
    "h6",
    "p"
]);