mirror of
https://github.com/201206030/novel.git
synced 2025-04-27 07:30:50 +00:00
2.6.0发布,新增笔趣窝源
This commit is contained in:
parent
ef36527ed6
commit
05d9e22df9
@ -10,7 +10,7 @@
|
|||||||
</parent>
|
</parent>
|
||||||
<groupId>xyz.zinglizingli</groupId>
|
<groupId>xyz.zinglizingli</groupId>
|
||||||
<artifactId>novel-front</artifactId>
|
<artifactId>novel-front</artifactId>
|
||||||
<version>2.4.1.beta</version>
|
<version>2.5.0.beta</version>
|
||||||
<name>novel-front</name>
|
<name>novel-front</name>
|
||||||
<description>小说精品楼-前台web网站</description>
|
<description>小说精品楼-前台web网站</description>
|
||||||
|
|
||||||
|
@ -0,0 +1,27 @@
|
|||||||
|
package xyz.zinglizingli.books.core.config;
|
||||||
|
|
||||||
|
import lombok.extern.slf4j.Slf4j;
|
||||||
|
import org.springframework.boot.autoconfigure.condition.ConditionalOnProperty;
|
||||||
|
import org.springframework.boot.context.properties.ConfigurationProperties;
|
||||||
|
import org.springframework.context.annotation.Bean;
|
||||||
|
import org.springframework.context.annotation.Configuration;
|
||||||
|
import xyz.zinglizingli.books.core.crawl.BaseHtmlCrawlSource;
|
||||||
|
import xyz.zinglizingli.books.core.crawl.BiquCrawlSource;
|
||||||
|
|
||||||
|
/**
* Spring configuration that registers the crawl source bean for the "biquwo" site.
*
|
||||||
|
* @author 11797
|
||||||
|
*/
|
||||||
|
@Slf4j
|
||||||
|
@Configuration
|
||||||
|
public class CrawlBiquwoConfig {
|
||||||
|
|
||||||
|
|
||||||
|
/**
* Creates the crawl source used for the biquwo site.
*
* <p>The bean is registered only when the property {@code crawl.website.type} has the
* value {@code "6"}; properties under the {@code biquwo.crawlsource} prefix are bound
* onto the returned object.
*
* @return a new {@link BiquCrawlSource} instance
*/
@Bean
|
||||||
|
@ConfigurationProperties(prefix = "biquwo.crawlsource") // the prefix must match the prefix of the corresponding properties in application.yml
|
||||||
|
@ConditionalOnProperty(prefix = "crawl.website",name = "type",havingValue = "6")
|
||||||
|
public BaseHtmlCrawlSource biquwoCrawlSource() {
|
||||||
|
return new BiquCrawlSource();
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
}
|
@ -86,3 +86,20 @@ biquge:
|
|||||||
intro-pattern: class="review">([^/]+)</p>
|
intro-pattern: class="review">([^/]+)</p>
|
||||||
catalog-url-pattern: <a\s+href="(/ddk\d+/all.html)">查看完整目录</a>
|
catalog-url-pattern: <a\s+href="(/ddk\d+/all.html)">查看完整目录</a>
|
||||||
catalog-pattern: <dd>\s*<a\s+href="(\d+\.html)"\s+title="([^"]+)">([^<]+)</a>\s*</dd>
|
catalog-pattern: <dd>\s*<a\s+href="(\d+\.html)"\s+title="([^"]+)">([^<]+)</a>\s*</dd>
|
||||||
|
|
||||||
|
|
||||||
|
# Crawl-source settings for the biquwo site. These properties are bound via the
# "biquwo.crawlsource" prefix (see CrawlBiquwoConfig) and are used when
# crawl.website.type is 6.
# NOTE(review): {0} and {1} in list-page-url look like positional placeholders,
# presumably category and page number; confirm against the crawler code.
biquwo:
|
||||||
|
crawlsource:
|
||||||
|
index-url: http://m.biquwo.net
|
||||||
|
list-page-url: http://m.biquwo.net/sort{0}/0/{1}.html
|
||||||
|
book-url-pattern: href="/(dudu/\d+/\d+)/"
|
||||||
|
score-pattern: <div\s+class="score">(\d+\.\d+)分</div>
|
||||||
|
book-name-pattern: <p class="title">([^/]+)</p>
|
||||||
|
author-pattern: 作者:([^/]+)<
|
||||||
|
status-pattern: 状态:([^/]+)</li>
|
||||||
|
cat-pattern: 类别:([^/]+)</li>
|
||||||
|
update-time-pattern: 更新:(\d+-\d+-\d+\s\d+:\d+:\d+)</a>
|
||||||
|
pic-pattern: <img src="([^>]+)"\s+onerror="this.src=
|
||||||
|
intro-pattern: class="review">([^<]+)</p>
|
||||||
|
catalog-url-pattern: <a\s+href="(/dudu/\d+/\d+/all\.html)">查看完整目录</a>
|
||||||
|
catalog-pattern: <a\s+style=""\s+href="(/dudu/\d+/\d+/\d+\.html)">([^/]+)</a>
|
@ -86,10 +86,10 @@ books:
|
|||||||
#爬取小说数量
|
#爬取小说数量
|
||||||
maxNum: 300000
|
maxNum: 300000
|
||||||
|
|
||||||
#爬取的网站名称类型 1:笔趣岛 ,2:笔趣塔,3:顶点小说 ,4:百书斋 更多网站解析中,敬请期待
|
#爬取的网站名称类型 1:笔趣岛 ,2:笔趣塔,3:顶点小说 ,4:百书斋,6: 笔趣窝 更多网站解析中,敬请期待
|
||||||
crawl:
|
crawl:
|
||||||
website:
|
website:
|
||||||
type: 3
|
type: 6
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
@ -9,8 +9,8 @@ mybatis:
|
|||||||
mysql: {charset: utf8mb4}
|
mysql: {charset: utf8mb4}
|
||||||
books: {lowestScore: 6.0}
|
books: {lowestScore: 6.0}
|
||||||
crawl:
|
crawl:
|
||||||
patten: 3
|
patten: '1'
|
||||||
website: {type: 3}
|
website: {type: 6}
|
||||||
soft-novel: '1'
|
soft-novel: '0'
|
||||||
manhua: '1'
|
manhua: '0'
|
||||||
logging: {config: 'classpath:logback-boot.xml'}
|
logging: {config: 'classpath:logback-boot.xml'}
|
||||||
|
Binary file not shown.
Loading…
x
Reference in New Issue
Block a user