From a5a9b141b3e8f91538099cb6c335c20f166363ff Mon Sep 17 00:00:00 2001 From: d0ngw Date: Fri, 27 Dec 2013 11:09:04 +0800 Subject: [PATCH] The SeleniumDownloader should call the setRawText --- .gitignore | 3 ++- .../webmagic/downloader/selenium/SeleniumDownloader.java | 1 + 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 8e88e25d..c0dc326c 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ -target/* +target *.iml out/ .idea + diff --git a/webmagic-selenium/src/main/java/us/codecraft/webmagic/downloader/selenium/SeleniumDownloader.java b/webmagic-selenium/src/main/java/us/codecraft/webmagic/downloader/selenium/SeleniumDownloader.java index 3d4fcdb8..50d332ba 100644 --- a/webmagic-selenium/src/main/java/us/codecraft/webmagic/downloader/selenium/SeleniumDownloader.java +++ b/webmagic-selenium/src/main/java/us/codecraft/webmagic/downloader/selenium/SeleniumDownloader.java @@ -84,6 +84,7 @@ public class SeleniumDownloader implements Downloader, Closeable { WebElement webElement = webDriver.findElement(By.xpath("/html")); String content = webElement.getAttribute("outerHTML"); Page page = new Page(); + page.setRawText(content); page.setHtml(new Html(UrlUtils.fixAllRelativeHrefs(content, request.getUrl()))); page.setUrl(new PlainText(request.getUrl())); page.setRequest(request);