ansaurus

Question

Answer 1

+1 A:

/**
 * xmlsimplify simplifies an XML object by copying it into a plain
 * javascript object with only a subset of the attributes of the original.
 * This makes it suitable for output as JSON, or for further processing by
 * other functions.
 *
 * Shape of the result:
 *  - an element becomes { nodeName: ..., <attribute name>: <value>, ...,
 *    childNodes: [...] }; childNodes is omitted when no child survives;
 *  - text and CDATA nodes become their string value;
 *  - a document is represented by its root element;
 *  - every other node type (comments, processing instructions, ...) is
 *    dropped.
 *
 * Known limitation: attributes are copied onto the same object as nodeName
 * and childNodes, so an attribute literally named "nodeName" or
 * "childNodes" collides with those keys.
 *
 * @param {Object|String} xml a DOM node, or an XML string; a string is
 *        first converted with getXmlDocument (defined outside this function)
 * @param {Boolean} strip if true, strip empty (whitespace) text nodes
 * @return {Object|String|null} the simplified copy, or null when there is
 *         nothing to represent (no node, empty document, stripped text)
 */
var xmlsimplify = function(xml, strip) {
    if (typeof xml === "string") {
        xml = getXmlDocument(xml);
    }
    var traverse = function(node) {
        var i, l, n, a, j, o;
        // null is the "nothing to emit" signal; guarding here also keeps an
        // empty document or a trailing doctype from throwing on null.
        if (!node || !node.nodeType) {
            return null;
        }
        switch (node.nodeType) {
        case 1:
            //element node
            o = {
                nodeName: node.nodeName
            }; //record nodename
            for (i = 0, n = node.attributes, l = n.length; i < l; i++) { //append attributes
                a = traverse(n.item(i));
                for (j in a) {
                    if (a.hasOwnProperty(j)) {
                        o[j] = a[j];
                    }
                }
            }
            if (node.childNodes.length) {
                o.childNodes = [];
                for (i = 0, n = node.childNodes, l = n.length; i < l; i++) {
                    a = traverse(n.item(i));
                    if (a !== null) {
                        o.childNodes.push(a);
                    }
                }
                //every child was dropped, so do not emit an empty list
                if (o.childNodes.length === 0) {
                    delete o.childNodes;
                }
            }
            return o;
        case 2:
            //attribute node: return a single-key { name: value } object
            o = {};
            o[node.nodeName] = node.nodeValue;
            return o;
        case 3:
            //text node: when stripping, drop whitespace-only text
            if (strip === true && !/[^\s]/.test(node.nodeValue)) {
                return null;
            }
            return node.nodeValue;
        case 4:
            //cdata section node (never stripped)
            return node.nodeValue;
        case 9:
            //document node: use the root element rather than firstChild,
            //which may be a comment, processing instruction or doctype
            return traverse(node.documentElement);
        case 10:
            //document type node: carries no data, continue with its sibling
            return traverse(node.nextSibling);
        default:
            //comments, processing instructions, etc. are not represented
            return null;
        }
    };
    return traverse(xml);
};

Breton 2009-12-14 02:49:03

Why does the regex use "[^\s]" instead of "\S"?

Raul Agrait 2009-12-15 05:26:00

I suppose the two are equivalent, but I find the former to be clearer. I'm a bit hazy on my character classes. Code clarity is generally important. I might know that \S is any non whitespace character today, but I may forget it again in 6 months time.

Breton 2009-12-15 05:58:59

ansaurus

tags:

views:

answers:

Ignoring empty XML nodes in JavaScript

related questions