我正在尝试解析一个XML文档,并使用这些数据构建一个(更简单的)以下形式的json对象:
{id: '1', name: 'content-types', children: [{id: '2', name: 'requirements', children: [... and so on ...]}]}
我的XML包含如下所示的节点(这里只列出了一个节点,实际上它们可以任意嵌套):
<?xml version="1.0" encoding="utf-8"?>
<html xmlns="http://www.w3.org/1999/xhtml">
<head/>
<body class="taxonomies">
<div class="taxonomy">
<span class="id">3484069771</span>
<span class="name">Content Types</span>
<span class="locale">en</span>
<div class="concepts">
<div class="concept">
<span class="id">3484058507</span>
<span class="name">Promotional Publications</span>
<div class="concepts">
<div class="concept">
<span class="id">3551765771</span>
<span class="name">Datasheets</span>
</div>
</div>
</div>
</div>
</div>
</body>
</html>
我使用以下代码从XML构建JSON树:
// Builds an array of { id, name, children } objects from an XML string by
// repeatedly running XPath queries against the parsed document.
// `dom` and `xpath` are not defined in this snippet — presumably an
// xmldom-style DOMParser and the `xpath` package; confirm against the imports.
// Parameter: xml — the XML source text handed to parseFromString.
// Returns: whatever the first recurse() call returns (an array of objects).
buildConceptTree: function(xml){
const doc = new dom().parseFromString(xml)
// NOTE: `tree` is declared again near the end of this function; this initial
// empty array is never read.
var tree = []
var selector = "//*[@class='taxonomies']"
var count = 0 // this should keep track of the depth of the node being used
// recurse(s, odd): evaluates XPath selector `s` against `doc` and returns one
// object per accepted child of every matched node. `odd` decides whether the
// next selector segment appended is 'concepts' (odd falsy) or 'concept'.
function recurse(s, odd){
var nodes
console.log(count)
console.log(s)
var arr = []
nodes = xpath.select(s, doc)
nodes.forEach(node => {
try {
var children = node.childNodes
// Number(x) is 0 (falsy) for the key "0" and NaN for non-numeric keys, so
// this filter drops the first child as well as any non-index property.
// Assumes childNodes exposes its indices as own enumerable keys — TODO confirm.
var keys = Object.keys(children).filter(x => {return Number(x)})
keys.forEach(key => {
var child = children[key]
console.log('child is: ')
console.log(child)
var obj = {}
var grandchildren = child.childNodes
// Same filter as above: index 0 of the grandchildren is skipped too.
var grandkeys = Object.keys(grandchildren).filter(x => {return Number(x)})
grandkeys.forEach(gk => {
var gc = grandchildren[gk]
try {
// Reads the value of the first attribute only; if `gc` has no attributes
// this line throws and the empty catch below swallows the error.
var nodevalue = gc['attributes'][0]['nodeValue']
switch(nodevalue){
// NOTE: none of the cases ends with `break`, so 'id' falls through into
// 'name' and 'concepts', and 'name' falls through into 'concepts'. Every
// id/name element therefore also extends the selector and recurses.
case 'id':
obj['id'] = gc['textContent']
case 'name':
obj['name'] = gc['textContent']
case 'concepts':
// `count` is only ever incremented, never decremented, so it counts
// how many times this branch ran rather than the current depth.
count++
var rx = /taxonomy/
if(!rx.test(s)){
s = s+"/*[@class='taxonomy']"
}
else{
// No-op self-assignment.
s = s
}
// `s` and `odd` are the enclosing recurse() call's parameters; mutating
// them here means later loop iterations in this same call start from
// the already-extended selector and the flipped flag.
if (!odd){
s += "/*[@class='concepts']"
}
else {
s += "/*[@class='concept']"
}
odd = !odd
obj['children'] = recurse(s, odd)
}
}
catch(e){
// Errors from the attribute lookup or from the recursion are silently ignored.
}
})
// `obj` is pushed even when none of the cases above populated it.
arr.push(obj)
})
}
catch(e){
// Errors while processing a matched node are silently ignored.
}
})
return arr
}
var tree = recurse(selector, false)
return tree
},按照原样,此函数生成类似于我提到的JSON表单,但缺少许多节点。
而且,我的递归函数在沿着XML树向更深的分支递归时,似乎没有在基本情况(最简单的情况)下终止。例如,我在控制台中记录到了以下内容,但文档中并不存在191层深的节点:
191
parser.js?d3c4:83 //*[@class='taxonomies']/*[@class='taxonomy']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']/*[@class='concept']/*[@class='concepts']
parser.js?d3c4:92 child is:
有没有人能帮我弄清楚应该如何修改这个函数,才能得到我想要的数据?
发布于 2018-08-23 23:48:44
我可能错过了一些需求,但是一旦你停止遍历所有元素并开始查询你期望的确切元素,这个问题似乎就不那么复杂了:
// Turn the sample XML markup into a DOM document that can be queried
const parser = new DOMParser();
const xmlDoc = parser.parseFromString(getXML(), "text/xml");
// The main logic to go from an xml element to an object
/**
 * Converts a taxonomy/concept element into a plain `{ id, name, children }` tree.
 *
 * Ids are handed out in depth-first (pre-order) sequence starting at `id`, so
 * every node in the resulting tree gets a distinct id.
 *
 * @param {Element} taxonomy - Element with a `.name` descendant and, optionally,
 *   a `.concepts` container whose element children are the nested concepts.
 * @param {number} [id=1] - Id assigned to this node.
 * @param {{last: number}} [counter] - Internal bookkeeping: the highest id
 *   issued so far, shared by the whole recursion. Callers normally omit it.
 * @returns {{id: number, name: string, children: Array<Object>}} The node and
 *   its recursively converted children.
 */
const parseTaxonomy = (taxonomy, id = 1, counter = { last: id }) => ({
  id,
  // textContent is defined on every Node, so this also works for XML
  // elements that are not HTMLElements (where innerText is undefined).
  name: taxonomy.querySelector(".name")
    .textContent
    .trim()
    .toLowerCase()
    .replace(/\s+/g, "-"),
  children: Array.from(
    (taxonomy.querySelector(".concepts") || { children: [] })
      .children
    // Increment the shared counter rather than the local `id`; a per-call
    // counter would reuse the same ids in sibling branches.
  ).map(t => parseTaxonomy(t, ++counter.last, counter))
});
// Convert only the first taxonomy element and print the resulting tree.
// When the top level holds several taxonomies, select them all and use .map instead.
const firstTaxonomy = xmlDoc.querySelector(".taxonomy");
console.log(parseTaxonomy(firstTaxonomy));
// The data
/**
 * Supplies the sample taxonomy document used by this example.
 *
 * @returns {string} The XML markup as a single multi-line string.
 */
function getXML() {
  const sampleMarkup = `<?xml version="1.0" encoding="utf-8"?>
<html xmlns="http://www.w3.org/1999/xhtml">
<head/>
<body class="taxonomies">
<div class="taxonomy">
<span class="id">3484069771</span>
<span class="name">Content Types</span>
<span class="locale">en</span>
<div class="concepts">
<div class="concept">
<span class="id">3484058507</span>
<span class="name">Promotional Publications</span>
<div class="concepts">
<div class="concept">
<span class="id">3551765771</span>
<span class="name">Datasheets</span>
</div>
</div>
</div>
</div>
</div>
</body>
</html>`;
  return sampleMarkup;
}
注意:我修改了XML中您放置注释的那一部分,因为该注释没有闭合,而且我推测那里应该还有一层用来包裹子分类的元素。
https://stackoverflow.com/questions/51986159
复制相似问题