|
|
@ -5,7 +5,6 @@ import org.openqa.selenium.By;
|
|
|
|
import org.openqa.selenium.Cookie;
|
|
|
|
import org.openqa.selenium.Cookie;
|
|
|
|
import org.openqa.selenium.WebDriver;
|
|
|
|
import org.openqa.selenium.WebDriver;
|
|
|
|
import org.openqa.selenium.WebElement;
|
|
|
|
import org.openqa.selenium.WebElement;
|
|
|
|
|
|
|
|
|
|
|
|
import us.codecraft.webmagic.Page;
|
|
|
|
import us.codecraft.webmagic.Page;
|
|
|
|
import us.codecraft.webmagic.Request;
|
|
|
|
import us.codecraft.webmagic.Request;
|
|
|
|
import us.codecraft.webmagic.Site;
|
|
|
|
import us.codecraft.webmagic.Site;
|
|
|
@ -13,7 +12,6 @@ import us.codecraft.webmagic.Task;
|
|
|
|
import us.codecraft.webmagic.downloader.Downloader;
|
|
|
|
import us.codecraft.webmagic.downloader.Downloader;
|
|
|
|
import us.codecraft.webmagic.selector.Html;
|
|
|
|
import us.codecraft.webmagic.selector.Html;
|
|
|
|
import us.codecraft.webmagic.selector.PlainText;
|
|
|
|
import us.codecraft.webmagic.selector.PlainText;
|
|
|
|
import us.codecraft.webmagic.utils.UrlUtils;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
import java.io.Closeable;
|
|
|
|
import java.io.Closeable;
|
|
|
|
import java.io.IOException;
|
|
|
|
import java.io.IOException;
|
|
|
@ -108,8 +106,7 @@ public class SeleniumDownloader implements Downloader, Closeable {
|
|
|
|
String content = webElement.getAttribute("outerHTML");
|
|
|
|
String content = webElement.getAttribute("outerHTML");
|
|
|
|
Page page = new Page();
|
|
|
|
Page page = new Page();
|
|
|
|
page.setRawText(content);
|
|
|
|
page.setRawText(content);
|
|
|
|
page.setHtml(new Html(UrlUtils.fixAllRelativeHrefs(content,
|
|
|
|
page.setHtml(new Html(content, request.getUrl()));
|
|
|
|
request.getUrl())));
|
|
|
|
|
|
|
|
page.setUrl(new PlainText(request.getUrl()));
|
|
|
|
page.setUrl(new PlainText(request.getUrl()));
|
|
|
|
page.setRequest(request);
|
|
|
|
page.setRequest(request);
|
|
|
|
webDriverPool.returnToPool(webDriver);
|
|
|
|
webDriverPool.returnToPool(webDriver);
|
|
|
|