如何使用 jquery 选择器构建具有兄弟标签的分层对象
How to build hierarchical objects with siblings tags using jquery selectors
我有以下 html 片段。我想通过网络抓取页面以获取主题和子主题并将其存储在对象中。
想要的结果是:
{
'topic': 'Java Basics',
'subtopics':['Define the scope of variables', 'Define the structure of a Java class', ...]
}
我尝试在 Node.js 中结合 jsdom 和 jQuery 来实现：
// Question's attempt: read topic.html, hand it to jsdom together with jQuery,
// and print the text of every element the selector matches.
var jsdom = require('jsdom');
var fs = require("fs");
// Despite its name, topicos holds the raw text read from topic.html.
var topicos = fs.readFileSync("topic.html", "utf-8");
// Arguments: the markup, an array with the jQuery URL (presumably scripts for
// jsdom to load into the page), and a callback receiving (error, window).
jsdom.env(topicos, ["http://code.jquery.com/jquery.js"], function (error, window) {
// NOTE(review): `error` is never checked before `window` is used.
var $ = window.$;
// NOTE(review): the selector 'div ~ ' ends in a sibling combinator with nothing
// after it, so it looks incomplete - confirm how jQuery handles it.
// `length` receives the return value of .each() and is not read again here.
var length = $('div ~ ').each(function () {
//???
var topic = $(this);
var text = topic.text();
// Print the matched element's text with leading/trailing whitespace removed.
console.log(text.trim())
});
})
但由于我在 jQuery 方面缺乏经验,我无法正确组织层次结构。
Html 片段:
<div>
<strong>Java Basics </strong></div>
<ul>
<li>
Define the scope of variables </li>
<li>
Define the structure of a Java class
</li>
<li>
Create executable Java applications with a main method; run a Java program from the command line; including
console output.
</li>
<li>
Import other Java packages to make them accessible in your code
</li>
<li>
Compare and contrast the features and components of Java such as:
platform independence, object orientation, encapsulation, etc.
</li>
</ul>
<div>
<strong>Working With Java Data Types </strong></div>
<ul>
<li>
Declare and initialize variables (including casting of primitive data types)
</li>
<li>
Differentiate between object reference variables and primitive variables
</li>
<li>
Know how to read or write to object fields
</li>
<li>
Explain an Object's Lifecycle (creation, "dereference by reassignment" and garbage collection)
</li>
<li>
Develop code that uses wrapper classes such as Boolean, Double, and Integer. </li>
</ul>
...
下面是一个可以运行的代码片段（fiddle）：
// Build one { topic, subtopics } record per <div>, pairing each heading <div>
// with the <ul> that directly follows it, and log the resulting array.
var topicos = [];
jQuery('div').each(function () {
    var heading = jQuery(this);
    var data = {
        // Collapse runs of whitespace and trim, so the markup's line breaks and
        // trailing spaces do not leak into the result ('Java Basics ', etc.).
        topic: heading.find('strong').text().replace(/\s+/g, ' ').trim(),
        subtopics: []
    };
    // .next('ul') yields the element right after this <div>, and only when
    // that element is a <ul>; a <div> without a list gets no subtopics.
    heading.next('ul').find('li').each(function () {
        data.subtopics.push(jQuery(this).text().replace(/\s+/g, ' ').trim());
    });
    topicos.push(data);
});
console.log(topicos);
但我强烈建议在标记中添加类（class），并用这些类而不是标签名作为选择器：
<div class="js-topic-data">
<div>
<strong class="js-topic">Java Basics </strong>
</div>
<ul>
<li class="js-sub-topic">
Define the scope of variables </li>
<li class="js-sub-topic">
Define the structure of a Java class </li>
</ul>
</div>
然后你可以这样做:
// Build one { topic, subtopics } record per .js-topic-data wrapper using the
// js-* hook classes instead of tag names.
// Declared here so the snippet runs on its own.
var topicos = [];
jQuery('.js-topic-data').each(function () {
    var wrapper = jQuery(this);
    var data = {
        // Collapse runs of whitespace and trim, so the markup's line breaks and
        // trailing spaces do not leak into the result.
        topic: wrapper.find('.js-topic').text().replace(/\s+/g, ' ').trim(),
        subtopics: []
    };
    // The .js-sub-topic items live inside the wrapper, so they must be looked
    // up with .find(). .next() only inspects the wrapper's following sibling
    // and therefore never matched any of them.
    wrapper.find('.js-sub-topic').each(function () {
        data.subtopics.push(jQuery(this).text().replace(/\s+/g, ' ').trim());
    });
    topicos.push(data);
});
这样在标记结构发生变化时，代码会更加稳健。
我有以下 html 片段。我想通过网络抓取页面以获取主题和子主题并将其存储在对象中。
想要的结果是:
{
'topic': 'Java Basics',
'subtopics':['Define the scope of variables', 'Define the structure of a Java class', ...]
}
我尝试在 Node.js 中结合 jsdom 和 jQuery 来实现：
// Question's attempt: read topic.html, hand it to jsdom together with jQuery,
// and print the text of every element the selector matches.
var jsdom = require('jsdom');
var fs = require("fs");
// Despite its name, topicos holds the raw text read from topic.html.
var topicos = fs.readFileSync("topic.html", "utf-8");
// Arguments: the markup, an array with the jQuery URL (presumably scripts for
// jsdom to load into the page), and a callback receiving (error, window).
jsdom.env(topicos, ["http://code.jquery.com/jquery.js"], function (error, window) {
// NOTE(review): `error` is never checked before `window` is used.
var $ = window.$;
// NOTE(review): the selector 'div ~ ' ends in a sibling combinator with nothing
// after it, so it looks incomplete - confirm how jQuery handles it.
// `length` receives the return value of .each() and is not read again here.
var length = $('div ~ ').each(function () {
//???
var topic = $(this);
var text = topic.text();
// Print the matched element's text with leading/trailing whitespace removed.
console.log(text.trim())
});
})
但由于我在 jQuery 方面缺乏经验,我无法正确组织层次结构。
Html 片段:
<div>
<strong>Java Basics </strong></div>
<ul>
<li>
Define the scope of variables </li>
<li>
Define the structure of a Java class
</li>
<li>
Create executable Java applications with a main method; run a Java program from the command line; including
console output.
</li>
<li>
Import other Java packages to make them accessible in your code
</li>
<li>
Compare and contrast the features and components of Java such as:
platform independence, object orientation, encapsulation, etc.
</li>
</ul>
<div>
<strong>Working With Java Data Types </strong></div>
<ul>
<li>
Declare and initialize variables (including casting of primitive data types)
</li>
<li>
Differentiate between object reference variables and primitive variables
</li>
<li>
Know how to read or write to object fields
</li>
<li>
Explain an Object's Lifecycle (creation, "dereference by reassignment" and garbage collection)
</li>
<li>
Develop code that uses wrapper classes such as Boolean, Double, and Integer. </li>
</ul>
...
下面是一个可以运行的代码片段（fiddle）：
// Build one { topic, subtopics } record per <div>, pairing each heading <div>
// with the <ul> that directly follows it, and log the resulting array.
var topicos = [];
jQuery('div').each(function () {
    var heading = jQuery(this);
    var data = {
        // Collapse runs of whitespace and trim, so the markup's line breaks and
        // trailing spaces do not leak into the result ('Java Basics ', etc.).
        topic: heading.find('strong').text().replace(/\s+/g, ' ').trim(),
        subtopics: []
    };
    // .next('ul') yields the element right after this <div>, and only when
    // that element is a <ul>; a <div> without a list gets no subtopics.
    heading.next('ul').find('li').each(function () {
        data.subtopics.push(jQuery(this).text().replace(/\s+/g, ' ').trim());
    });
    topicos.push(data);
});
console.log(topicos);
但我强烈建议在标记中添加类（class），并用这些类而不是标签名作为选择器：
<div class="js-topic-data">
<div>
<strong class="js-topic">Java Basics </strong>
</div>
<ul>
<li class="js-sub-topic">
Define the scope of variables </li>
<li class="js-sub-topic">
Define the structure of a Java class </li>
</ul>
</div>
然后你可以这样做:
// Build one { topic, subtopics } record per .js-topic-data wrapper using the
// js-* hook classes instead of tag names.
// Declared here so the snippet runs on its own.
var topicos = [];
jQuery('.js-topic-data').each(function () {
    var wrapper = jQuery(this);
    var data = {
        // Collapse runs of whitespace and trim, so the markup's line breaks and
        // trailing spaces do not leak into the result.
        topic: wrapper.find('.js-topic').text().replace(/\s+/g, ' ').trim(),
        subtopics: []
    };
    // The .js-sub-topic items live inside the wrapper, so they must be looked
    // up with .find(). .next() only inspects the wrapper's following sibling
    // and therefore never matched any of them.
    wrapper.find('.js-sub-topic').each(function () {
        data.subtopics.push(jQuery(this).text().replace(/\s+/g, ' ').trim());
    });
    topicos.push(data);
});
这样在标记结构发生变化时，代码会更加稳健。