I am trying to convert
JavaScript
x
6
1
myHtml = `
2
<span style="font-family: "Open Sans", Arial, sans-serif; font-size: 14px; text-align: justify;">
3
4
In nec <i>convallis</i> justo. Quisque egestas mollis nibh non hendrerit. <strong>Phasellus</strong> tempus sapien in ultricies aliquet. Maecenas nec risus viverra tortor rhoncus venenatis in sit amet enim. Integer id ipsum non leo finibus sagittis in eu velit. Curabitur sed dolor dui. <span>Mauris <strong>aliquam <i>magna</i></strong> a ipsum</span> tincidunt tempor vitae sit amet ante. Maecenas pellentesque augue vitae quam faucibus, vel convallis dolor placerat. Pellentesque semper justo a turpis euismod, ac gravida enim suscipit.</span>
5
`;
6
into
JavaScript
1
38
38
1
data = [
2
{
3
openTag:
4
'<span style="font-family: "Open Sans", Arial, sans-serif; font-size: 14px; text-align: justify;">',
5
closingTag: "</span>",
6
children: [
7
{ value: "In nec" },
8
{ openTag: "<i>", value: "convallis", closingTag: "</i>" },
9
{ value: " justo. Quisque egestas mollis nibh non hendrerit. " },
10
{ openTag: "<strong>", value: "Phasellus", closingTag: "</strong>" },
11
{
12
value:
13
" tempus sapien in ultricies aliquet. Maecenas nec risus viverra tortor rhoncus venenatis in sit amet enim. Integer id ipsum non leo finibus sagittis in eu velit. Curabitur sed dolor dui. "
14
},
15
{
16
opentag: "<span>",
17
children: [
18
{ value: "Mauris " },
19
{
20
opentag: "<strong>",
21
childeren: [
22
{ value: "aliquam" },
23
{ opentag: "<i>", value: "magna", closingTag: "</i>" }
24
],
25
closingTag: "</strong>"
26
},
27
{ value: " a ipsum" }
28
],
29
closingTag: "</span>"
30
},
31
{
32
value:
33
" tincidunt tempor vitae sit amet ante. Maecenas pellentesque augue vitae quam faucibus, vel convallis dolor placerat. Pellentesque semper justo a turpis euismod, ac gravida enim suscipit."
34
}
35
]
36
}
37
];
38
Current Output
JavaScript
1
60
60
1
{
2
"rawTagName": null,
3
"children": [
4
{
5
"children": []
6
},
7
{
8
"rawTagName": "span",
9
"children": [
10
{
11
"value": "n n In nec "
12
},
13
{
14
"rawTagName": "i",
15
"value": "convallis"
16
},
17
{
18
"value": " justo. Quisque egestas mollis nibh non hendrerit. "
19
},
20
{
21
"rawTagName": "strong",
22
"value": "Phasellus"
23
},
24
{
25
"value": " tempus sapien in ultricies aliquet. Maecenas nec risus viverra tortor rhoncus venenatis in sit amet enim. Integer id ipsum non leo finibus sagittis in eu velit. Curabitur sed dolor dui. "
26
},
27
{
28
"rawTagName": "span",
29
"children": [
30
{
31
"children": []
32
},
33
{
34
"rawTagName": "strong",
35
"children": [
36
{
37
"value": "aliquam "
38
},
39
{
40
"rawTagName": "i",
41
"value": "magna"
42
}
43
]
44
},
45
{
46
"children": []
47
}
48
]
49
},
50
{
51
"value": " tincidunt tempor vitae sit amet ante. Maecenas pellentesque augue vitae quam faucibus, vel convallis dolor placerat. Pellentesque semper justo a turpis euismod, ac gravida enim suscipit."
52
}
53
]
54
},
55
{
56
"children": []
57
}
58
]
59
}
60
Below is my current approach using recursion
JavaScript
1
45
45
1
import { parse } from "node-html-parser";
2
3
// Write Javascript code!
4
5
const myHtml = `
6
<span style="font-family: "Open Sans", Arial, sans-serif; font-size: 14px; text-align: justify;">
7
8
In nec <i>convallis</i> justo. Quisque egestas mollis nibh non hendrerit. <strong>Phasellus</strong> tempus sapien in ultricies aliquet. Maecenas nec risus viverra tortor rhoncus venenatis in sit amet enim. Integer id ipsum non leo finibus sagittis in eu velit. Curabitur sed dolor dui. <span>Mauris <strong>aliquam <i>magna</i></strong> a ipsum</span> tincidunt tempor vitae sit amet ante. Maecenas pellentesque augue vitae quam faucibus, vel convallis dolor placerat. Pellentesque semper justo a turpis euismod, ac gravida enim suscipit.</span>
9
`;
10
11
const tranform = str => {
12
const nodeAsObject = root => {
13
if (root.childNodes.length === 0) {
14
return { value: root.rawText };
15
}
16
if (
17
root.childNodes.length === 1 &&
18
root.childNodes[0].childNodes.length === 0
19
) {
20
return {
21
rawTagName: root.rawTagName,
22
value: root.rawText
23
};
24
}
25
return {
26
rawTagName: root.rawTagName,
27
children: root.childNodes.map(x => {
28
return {
29
rawTagName: x.rawTagName,
30
children: x.childNodes.map(y => {
31
return nodeAsObject(y);
32
})
33
};
34
})
35
};
36
};
37
return nodeAsObject(parse(str));
38
};
39
40
console.log(tranform(myHtml));
41
42
const pre = document.getElementById("pre");
43
pre.innerHTML = JSON.stringify(tranform(myHtml), null, " ");
44
45
Advertisement
Answer
I went for the recursive approach and created an output that is similar to your expected output.
JavaScript
1
45
45
1
const myHtml = `
2
<span style="font-family: "Open Sans", Arial, sans-serif; font-size: 14px; text-align: justify;">
3
4
In nec <i>convallis</i> justo. Quisque egestas mollis nibh non hendrerit. <strong>Phasellus</strong> tempus sapien in ultricies aliquet. Maecenas nec risus viverra tortor rhoncus venenatis in sit amet enim. Integer id ipsum non leo finibus sagittis in eu velit. Curabitur sed dolor dui. <span>Mauris <strong>aliquam <i>magna</i></strong> a ipsum</span> tincidunt tempor vitae sit amet ante. Maecenas pellentesque augue vitae quam faucibus, vel convallis dolor placerat. Pellentesque semper justo a turpis euismod, ac gravida enim suscipit.</span>
5
`;
6
7
let revisedHtml;
8
9
const parser = htmlStr => {
10
let htmlElements = parse(htmlStr);
11
revisedHtml = htmlElements.childNodes.map(node => {
12
return createTranslatedNode(node);
13
});
14
return htmlElements;
15
};
16
17
const createTranslatedNode = node => {
18
let currentNode = {};
19
// This is a textNode.
20
if (!node.rawTagName) {
21
currentNode = { value: node?.rawText?.trim() };
22
}
23
// This is a tagNode
24
if (node.rawTagName) {
25
currentNode = {
26
openTag: `<${node.rawTagName} ${node.rawAttrs}>`,
27
closingTag: `</${node.rawTagName}>`
28
};
29
}
30
31
if (node?.childNodes?.length === 1 && !node?.childNodes[0].rawTagName) {
32
currentNode.value = node?.childNodes[0].rawText?.trim();
33
}
34
35
if (node?.childNodes?.length > 1) {
36
currentNode.children = node.childNodes.map(childNode => {
37
return createTranslatedNode(childNode);
38
});
39
}
40
41
return currentNode;
42
};
43
44
console.log(revisedHtml);
45
I do some assumptions with the open and close tags since I just do some string concatination to add the <>
around the tags.
Other than that I trim()
the value inputs to remove the unwanted whitespace around the value.
This does make some assumptions about the html, like it always having start and closing tags, and such. A further improvement that could be done would be to test for that also.