-
Notifications
You must be signed in to change notification settings - Fork 5
Expand file tree
/
Copy pathjsoup_extract_example.js
More file actions
43 lines (40 loc) · 1.42 KB
/
jsoup_extract_example.js
File metadata and controls
43 lines (40 loc) · 1.42 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
/*
* To change this license header, choose License Headers in Project Properties.
* To change this template file, choose Tools | Templates
* and open the template in the editor.
*/
/**
 * Copies the own text of every <div> found in a document's "body" field
 * into repeated "div" fields on that same document.
 *
 * The HTML is parsed with jsoup through the host's Java interop globals
 * (`org.jsoup.Jsoup`); errors raised while parsing or adding fields are
 * reported through the host-provided `logger` and do not propagate.
 *
 * NOTE(review): `doc` is presumably a pipeline document supplied by the
 * hosting Java application; only `getFirstFieldValue` and `addField` are
 * required of it here — confirm against the caller.
 *
 * @param {Object} doc - Document exposing `getFirstFieldValue(name)` and
 *     `addField(name, value)`; may be null.
 * @returns {Object} The same `doc` that was passed in (null/undefined is
 *     returned unchanged).
 */
var extract = function (doc) {
    // `== null` deliberately matches both null and undefined.
    if (doc == null) {
        return doc;
    }

    var content = doc.getFirstFieldValue("body");
    if (content == null) {
        return doc;
    }

    try {
        // Keep the parsed HTML in its own variable: reusing the name `doc`
        // would overwrite the input document, so addField() would be called
        // on the jsoup Document and the wrong object would be returned.
        var parsed = org.jsoup.Jsoup.parse(content);
        var iter = parsed.select("div").iterator();
        while (iter.hasNext()) {
            // ownText() yields only the div's direct text, not that of its children.
            doc.addField("div", iter.next().ownText());
        }
    } catch (e) {
        // Best effort: log and still hand the document back to the caller.
        logger.error(e);
    }

    return doc;
};