/reptile-core

HTML网页解析及特定内容获取工具。

Primary LanguageJavaGNU General Public License v3.0GPL-3.0

reptile-core

HTML网页解析及特定内容获取工具。

使用

Gradle

implementation("com.jiangyc:reptile-core:1.3.1")

Maven

<dependency>
    <groupId>com.jiangyc</groupId>
    <artifactId>reptile-core</artifactId>
    <version>1.3.1</version>
</dependency>

示例

import org.jsoup.nodes.Element;

public class ReptileTest {

    public static void main(String[] args) {
        Reptile reptile = new Reptile();

        // List<Map<String, String>> classifies = reptile.resolve("https://www.qidian.com", StandardCharsets.UTF_8, (doc) -> {
        new Reptile().resolve("https://www.qidian.com", (doc) ->
                reptile.selectAll(doc, "#classify-list>dl>dd>a", (ele) -> {
                    Map<String, String> classifyMap = new HashMap<>();

                    String id = reptile.attr(ele, "href", (it) ->
                            it.replaceAll("\\\\", "").replaceAll("/", ""));
                    classifyMap.put("id", id);

                    String name = reptile.selectOne(ele, "cite>span>i", Element::text);
                    classifyMap.put("name", name);

                    String count = reptile.selectOne(ele, "cite>span>b", Element::text);
                    classifyMap.put("count", count);

                    return classifyMap;
                })).forEach(System.out::println);
    }
}