-
Notifications
You must be signed in to change notification settings - Fork 5
/
Jsoup_Extract.js
51 lines (47 loc) · 1.6 KB
/
Jsoup_Extract.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
/*
* To change this license header, choose License Headers in Project Properties.
* To change this template file, choose Tools | Templates
* and open the template in the editor.
*/
/**
 * Copies the featured-image reference found in a document's HTML body into
 * the document's "post_image" field.
 *
 * The "body" field is parsed with Jsoup; the first <div id="featured-img"> is
 * located, and the "data-orig-file" attribute of that div's first child
 * element is added to the document as "post_image". When the body, the div,
 * or its child element is missing, a warning is logged and the document is
 * left unchanged.
 *
 * Relies on names supplied by the hosting script environment: the Java
 * package global `org` (for `org.jsoup.Jsoup`) and a `logger` object with
 * info/warn/error methods.
 *
 * @param {Object} doc - document exposing getFirstFieldValue(name) and
 *     addField(name, value).
 * @returns {Object} the same `doc` that was passed in.
 */
var extract = function (doc) {
    var Jsoup = org.jsoup.Jsoup;
    var content = doc.getFirstFieldValue("body");

    // Nothing to parse; Jsoup.parse would reject a null input.
    if (content == null) {
        logger.warn("Body was null");
        return doc;
    }

    try {
        // Keep the parsed HTML in its own variable so the incoming document
        // is never overwritten and remains the target of addField().
        var parsed = Jsoup.parse(content);

        // Select only a div carrying the exact id; first() yields null when
        // nothing matches, so an unrelated div can never be picked up.
        var featuredDiv = parsed.select("div#featured-img").first();
        if (featuredDiv == null) {
            logger.warn("Div was null");
            return doc;
        }

        // children().first() yields null for an empty div instead of throwing
        // the way child(0) does.
        var img = featuredDiv.children().first();
        if (img == null) {
            logger.warn("Featured image div has no child element");
            return doc;
        }

        logger.info("SRC: " + img.attr("src"));
        logger.info("ORIG FILE: " + img.attr("data-orig-file"));
        doc.addField("post_image", img.attr("data-orig-file"));
    } catch (e) {
        // Best effort: a parsing/extraction failure must not drop the document.
        logger.error(e);
    }
    return doc;
};