From 81880d3dc64a9f765cfdc9123d9b1446ac059d75 Mon Sep 17 00:00:00 2001 From: VATALU <2507978950@qq.com> Date: Wed, 20 Dec 2017 16:42:29 +0800 Subject: [PATCH] =?UTF-8?q?Html=E6=96=B0=E5=A2=9Etext()=E6=96=B9=E6=B3=95?= =?UTF-8?q?=EF=BC=8C=E4=BE=BF=E4=BA=8E=E8=8E=B7=E5=8F=96=E5=85=A8=E9=83=A8?= =?UTF-8?q?=E6=96=87=E6=9C=AC?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../java/us/codecraft/webmagic/selector/Html.java | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java index f2218f126..56828bcac 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java @@ -19,11 +19,12 @@ public class Html extends HtmlNode { private Logger logger = LoggerFactory.getLogger(getClass()); - /** - * Disable jsoup html entity escape. It can be set just before any Html instance is created. + /** + * Disable jsoup html entity escape. It can be set just before any Html instance is created. + * * @deprecated - */ - public static boolean DISABLE_HTML_ENTITY_ESCAPE = false; + */ + public static boolean DISABLE_HTML_ENTITY_ESCAPE = false; /** * Store parsed document for better performance when only one text exist. @@ -83,6 +84,10 @@ public List selectDocumentForList(Selector selector) { } } + public String text() { + return document.text(); + } + public static Html create(String text) { return new Html(text); }