Blame view

src/main/java/com/canrd/webmagic/controller/ScienceDirectController.java 1.67 KB
凌世锦 authored
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
package com.canrd.webmagic.controller;

import com.canrd.webmagic.common.constant.ServerResult;
import com.canrd.webmagic.processor.ScienceDirectSearchPcoessor;
import com.canrd.webmagic.processor.download.SeleniumDownloader;
import com.canrd.webmagic.processor.pipeline.ArticlePipeline;
import io.swagger.annotations.Api;
import io.swagger.annotations.ApiOperation;
import org.apache.logging.log4j.core.util.UuidUtil;
import org.springframework.web.bind.annotation.GetMapping;
import org.springframework.web.bind.annotation.RequestMapping;
import org.springframework.web.bind.annotation.RestController;
import us.codecraft.webmagic.Request;
import us.codecraft.webmagic.Spider;

import javax.annotation.Resource;

/**
 * REST entry point that launches the ScienceDirect search crawl.
 *
 * <p>All endpoints are mounted under {@code /sciencedirect/article}.
 */
@RestController
@RequestMapping("/sciencedirect/article")
@Api("Science-Direct")
public class ScienceDirectController {

    /** Seed search URL handed to the spider as its first request. */
    private static final String SEED_SEARCH_URL =
            "https://www.sciencedirect.com/search?qs=battery&pub=Nano%20Today&cid=273494";

    /** Number of worker threads configured on the spider. */
    private static final int CRAWLER_THREADS = 20;

    /** Page processor passed to {@link Spider#create}. */
    @Resource
    private ScienceDirectSearchPcoessor scienceDirectSearchPcoessor;

    /** Downloader installed on the spider in place of its default one. */
    @Resource
    private SeleniumDownloader seleniumDownloader;

    /** Injected but currently not attached to the spider (see the note in {@link #start()}). */
    @Resource
    private ArticlePipeline articlePipeline;

    /**
     * Builds a spider around the injected processor, seeds it with the fixed
     * search URL, and runs it with the Selenium downloader.
     *
     * <p>Each invocation assigns the spider a fresh time-based UUID.
     *
     * <p>Currently disabled alternatives, kept here for reference: seeding with
     * the broader query {@code https://www.sciencedirect.com/search?qs=battery},
     * using a {@code RedisScheduler} at {@code 127.0.0.1}, and attaching
     * {@code articlePipeline} as a pipeline.
     *
     * @return {@code ServerResult.success()} once {@code run()} has returned
     */
    @GetMapping("/start")
    @ApiOperation("start")
    public ServerResult start() {
        Spider crawler = Spider.create(scienceDirectSearchPcoessor);

        String crawlId = UuidUtil.getTimeBasedUuid().toString();
        crawler.setUUID(crawlId);

        Request seedRequest = new Request(SEED_SEARCH_URL);
        crawler.addRequest(seedRequest);

        crawler.setDownloader(seleniumDownloader);
        crawler.thread(CRAWLER_THREADS);

        // NOTE(review): run() is invoked directly on the request-handling thread,
        // so this endpoint presumably does not respond until the crawl stops —
        // confirm that is intended before relying on it for long crawls.
        crawler.run();

        return ServerResult.success();
    }
}