htmlflatten
v0.1.0
Published
Flatten your html source, and generate json text data
Downloads
3
Readme
HTMLToJSON
Flatten your HTML source and generate JSON text data
This project is still under development.
Platform
Browser or jsdom
What It Is Used For
Suppose we have some HTML code:
<div>
<p>helloworld</p>
<span>
text
<span>text3</span>
<span>text4</span>
</span>
<p>123456<span>78</span>90<br/><span>2333333</span></p>
<img width="50" height="50" src="https://avatars3.githubusercontent.com/u/4409743?v=3&s=460"/>
</div>
wwwww
<span>12323</span>
1232323
213123123
<br />
Without CSS stylesheets, this code should look like this:
This project helps generate JSON from that data while preserving the newlines in the text:
{ image_num: 1,
items:
[ { type: 'text', data: 'helloworld' },
{ type: 'text', data: 'text\n text3\n text4' },
{ type: 'text', data: '1234567890' },
{ type: 'text', data: '2333333' },
{ type: 'image',
data: { src: 'https://avatars3.githubusercontent.com/u/4409743?v=3&s=460' } },
{ type: 'text', data: 'wwwww123231232323\n213123123' },
[length]: 6 ] }
How to Use
let jsdom = require('jsdom');
let html = `
<div>
<p>helloworld</p>
<span>
text
<span>text3</span>
<span>text4</span>
</span>
<p>123456<span>78</span>90<br/><span>2333333</span></p>
</div>
<img src="https://avatars3.githubusercontent.com/u/4409743?v=3&s=460"/>
wwwww
<span>12323</span>
1232323
213123123
<br />
`
let document = jsdom(html, {
features: {
FetchExternalResources: false,
ProcessExternalResources: false
}
});
let DOMParser = require('html-to-json');
let parser = new DOMParser(document.body);
let json = parser.toJSON();
console.log(json);