|
|
@@ -41,7 +41,6 @@ public class SpiderJob {
|
|
|
// List of source names bound from the Apollo config key "spider.filter.source.list".
// The text after the ':' in the placeholder is the JSON-array default that applies
// when the key is not configured.
// NOTE(review): presumably consulted by the spider job to filter ranked items by
// their source name; the usage is outside this view, so confirm before relying on it.
@ApolloJsonValue("${spider.filter.source.list:[\"知乎\",\"知乎日报\",\"果壳\",\"壹心理\",\"China Daily\",\"NASA \uD83C\uDF0D\",\"wikiHow 中文\"]}")
|
|
|
private List<String> filterSourceList;
|
|
|
|
|
|
-
|
|
|
@XxlJob("spiderTaskJob")
|
|
|
public ReturnT<String> spiderTaskJob(String param) {
|
|
|
int cursor = 1;
|
|
|
@@ -75,6 +74,7 @@ public class SpiderJob {
|
|
|
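// Filter: skip items whose title is blank, shorter than 8 or longer than 100 characters, or made up only of Latin letters, digits, whitespace and punctuation (i.e. English-only content)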
|
|
|
if (StringUtils.isBlank(rankListItem.getTitle())
|
|
|
|| rankListItem.getTitle().length() < 8
|
|
|
+ || rankListItem.getTitle().length() > 100
|
|
|
|| rankListItem.getTitle().matches("^[A-Za-z0-9\\s!\"#$%&'()*+,\\-./:;<=>?@\\[\\\\\\]^_`{|}~’‘“”]+$")) {
|
|
|
continue;
|
|
|
}
|