ScienceDirectSearchPcoessor.java
1.24 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
package com.canrd.webmagic.processor;
import lombok.extern.slf4j.Slf4j;
import org.springframework.stereotype.Component;
import us.codecraft.webmagic.Page;
import us.codecraft.webmagic.Site;
import us.codecraft.webmagic.processor.PageProcessor;
import us.codecraft.webmagic.selector.Html;
/**
 * WebMagic {@link PageProcessor} that routes each downloaded ScienceDirect page to a
 * handler chosen purely from the page URL.
 *
 * <p>Only {@link #getMaxPage(Page)} currently does any work; the other two handlers are
 * empty placeholders.
 */
@Slf4j
@Component
public class ScienceDirectSearchPcoessor implements PageProcessor {

    /** Search URL (query "battery", publication "Nano Today") that must match exactly. */
    private static final String NANO_TODAY_SEARCH_URL =
            "https://www.sciencedirect.com/search?qs=battery&pub=Nano%20Today&cid=273494";

    /** Substring identifying search URLs that carry {@code show=100} and an {@code offset} parameter. */
    private static final String OFFSET_SEARCH_URL_FRAGMENT =
            "https://www.sciencedirect.com/search?qs=battery&show=100&offset=";

    /** Substring identifying {@code /science/article/abs/pii} article URLs. */
    private static final String ARTICLE_ABS_URL_FRAGMENT =
            "https://www.sciencedirect.com/science/article/abs/pii";

    /**
     * Dispatches the page to the handler matching its URL. The checks run in order and the
     * first match wins.
     *
     * @param page the downloaded page to process
     */
    @Override
    public void process(Page page) {
        final String currentUrl = page.getUrl().get();

        if (currentUrl.equals(NANO_TODAY_SEARCH_URL)) {
            getMaxPage(page);
            return;
        }
        if (currentUrl.contains(OFFSET_SEARCH_URL_FRAGMENT)) {
            everyPage(page);
            return;
        }
        if (currentUrl.contains(ARTICLE_ABS_URL_FRAGMENT)) {
            getPageDetail(page);
            return;
        }
        // No handler exists for any other URL, including the journal landing page
        // https://www.sciencedirect.com/journal/nano-today, so nothing is extracted here.
    }

    /**
     * Supplies the crawl configuration by delegating to the default implementation
     * declared on {@link PageProcessor}.
     *
     * @return whatever {@code PageProcessor}'s default {@code getSite()} returns
     */
    @Override
    public Site getSite() {
        return PageProcessor.super.getSite();
    }

    /**
     * Stores the page's HTML under the result field {@code "html"}.
     *
     * @param page the page matched by the exact search URL
     */
    void getMaxPage(Page page) {
        final Html document = page.getHtml();
        // NOTE(review): a "move-right" marker was left here; presumably the selector for the
        // pagination control that should be parsed next. Confirm before implementing.
        page.putField("html", document);
    }

    /**
     * Placeholder for pages whose URL contains the offset-based search fragment; currently a no-op.
     *
     * @param page the matched page (unused)
     */
    void everyPage(Page page) {
    }

    /**
     * Placeholder for article pages; currently a no-op.
     *
     * @param page the matched page (unused)
     */
    void getPageDetail(Page page) {
    }
}