Clean xpath code

This commit is contained in:
FongMi 2023-02-15 23:49:00 +08:00
parent d2aa52b588
commit 57a4523cdb
3 changed files with 222 additions and 329 deletions

View File

@ -3,7 +3,9 @@ package com.github.catvod.spider;
import android.content.Context; import android.content.Context;
import android.text.TextUtils; import android.text.TextUtils;
import com.github.catvod.bean.Class;
import com.github.catvod.bean.Result; import com.github.catvod.bean.Result;
import com.github.catvod.bean.Vod;
import com.github.catvod.bean.xpath.Rule; import com.github.catvod.bean.xpath.Rule;
import com.github.catvod.crawler.Spider; import com.github.catvod.crawler.Spider;
import com.github.catvod.crawler.SpiderDebug; import com.github.catvod.crawler.SpiderDebug;
@ -23,6 +25,12 @@ import java.util.Set;
public class XPath extends Spider { public class XPath extends Spider {
private HashMap<String, String> getHeaders() {
HashMap<String, String> headers = new HashMap<>();
headers.put("User-Agent", rule.getUa().isEmpty() ? "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.54 Safari/537.36" : rule.getUa());
return headers;
}
@Override @Override
public void init(Context context) { public void init(Context context) {
super.init(context); super.init(context);
@ -35,97 +43,50 @@ public class XPath extends Spider {
@Override @Override
public String homeContent(boolean filter) { public String homeContent(boolean filter) {
try { fetchRule();
fetchRule(); List<Vod> list = new ArrayList<>();
JSONObject result = new JSONObject(); List<Class> classes = new ArrayList<>();
JSONArray classes = new JSONArray(); if (rule.getCateManual().size() > 0) {
if (rule.getCateManual().size() > 0) { Set<String> keys = rule.getCateManual().keySet();
Set<String> keys = rule.getCateManual().keySet(); for (String k : keys) {
for (String k : keys) { classes.add(new Class(rule.getCateManual().get(k), k));
JSONObject jsonObject = new JSONObject();
jsonObject.put("type_name", k);
jsonObject.put("type_id", rule.getCateManual().get(k));
classes.put(jsonObject);
}
} }
try { }
String webUrl = rule.getHomeUrl(); String webUrl = rule.getHomeUrl();
JXDocument doc = JXDocument.create(fetch(webUrl)); JXDocument doc = JXDocument.create(fetch(webUrl));
if (rule.getCateManual().size() == 0) { if (rule.getCateManual().size() == 0) {
List<JXNode> navNodes = doc.selN(rule.getCateNode()); List<JXNode> navNodes = doc.selN(rule.getCateNode());
for (int i = 0; i < navNodes.size(); i++) { for (int i = 0; i < navNodes.size(); i++) {
String name = navNodes.get(i).selOne(rule.getCateName()).asString().trim(); String name = navNodes.get(i).selOne(rule.getCateName()).asString().trim();
name = rule.getCateNameR(name); name = rule.getCateNameR(name);
String id = navNodes.get(i).selOne(rule.getCateId()).asString().trim(); String id = navNodes.get(i).selOne(rule.getCateId()).asString().trim();
id = rule.getCateIdR(id); id = rule.getCateIdR(id);
JSONObject jsonObject = new JSONObject(); classes.add(new Class(id, name));
jsonObject.put("type_id", id); }
jsonObject.put("type_name", name); }
classes.put(jsonObject); if (!rule.getHomeVodNode().isEmpty()) {
} List<JXNode> vodNodes = doc.selN(rule.getHomeVodNode());
} for (int i = 0; i < vodNodes.size(); i++) {
if (!rule.getHomeVodNode().isEmpty()) { String name = vodNodes.get(i).selOne(rule.getHomeVodName()).asString().trim();
name = rule.getHomeVodNameR(name);
String id = vodNodes.get(i).selOne(rule.getHomeVodId()).asString().trim();
id = rule.getHomeVodIdR(id);
String pic = vodNodes.get(i).selOne(rule.getHomeVodImg()).asString().trim();
pic = rule.getHomeVodImgR(pic);
pic = Utils.fixUrl(webUrl, pic);
String mark = "";
if (!rule.getHomeVodMark().isEmpty()) {
try { try {
JSONArray videos = new JSONArray(); mark = vodNodes.get(i).selOne(rule.getHomeVodMark()).asString().trim();
List<JXNode> vodNodes = doc.selN(rule.getHomeVodNode()); mark = rule.getHomeVodMarkR(mark);
for (int i = 0; i < vodNodes.size(); i++) {
String name = vodNodes.get(i).selOne(rule.getHomeVodName()).asString().trim();
name = rule.getHomeVodNameR(name);
String id = vodNodes.get(i).selOne(rule.getHomeVodId()).asString().trim();
id = rule.getHomeVodIdR(id);
String pic = vodNodes.get(i).selOne(rule.getHomeVodImg()).asString().trim();
pic = rule.getHomeVodImgR(pic);
pic = Utils.fixUrl(webUrl, pic);
String mark = "";
if (!rule.getHomeVodMark().isEmpty()) {
try {
mark = vodNodes.get(i).selOne(rule.getHomeVodMark()).asString().trim();
mark = rule.getHomeVodMarkR(mark);
} catch (Exception e) {
SpiderDebug.log(e);
}
}
JSONObject v = new JSONObject();
v.put("vod_id", id);
v.put("vod_name", name);
v.put("vod_pic", pic);
v.put("vod_remarks", mark);
videos.put(v);
}
result.put("list", videos);
} catch (Exception e) { } catch (Exception e) {
SpiderDebug.log(e); SpiderDebug.log(e);
} }
} }
} catch (Exception e) { list.add(new Vod(id, name, pic, mark));
SpiderDebug.log(e);
} }
result.put("class", classes);
if (filter && rule.getFilter() != null) {
result.put("filters", rule.getFilter());
}
return result.toString();
} catch (
Exception e) {
SpiderDebug.log(e);
} }
return ""; return Result.string(classes, list, rule.getFilter());
}
protected HashMap<String, String> getHeaders() {
HashMap<String, String> headers = new HashMap<>();
headers.put("User-Agent", rule.getUa().isEmpty() ? "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.54 Safari/537.36" : rule.getUa());
return headers;
}
@Override
public String homeVideoContent() {
try {
fetchRule();
} catch (Exception e) {
SpiderDebug.log(e);
}
return "";
} }
protected String categoryUrl(String tid, String pg, boolean filter, HashMap<String, String> extend) { protected String categoryUrl(String tid, String pg, boolean filter, HashMap<String, String> extend) {
@ -134,190 +95,154 @@ public class XPath extends Spider {
@Override @Override
public String categoryContent(String tid, String pg, boolean filter, HashMap<String, String> extend) { public String categoryContent(String tid, String pg, boolean filter, HashMap<String, String> extend) {
try { fetchRule();
fetchRule(); List<Vod> list = new ArrayList<>();
String webUrl = categoryUrl(tid, pg, filter, extend); String webUrl = categoryUrl(tid, pg, filter, extend);
JSONArray videos = new JSONArray(); JXDocument doc = JXDocument.create(fetch(webUrl));
JXDocument doc = JXDocument.create(fetch(webUrl)); List<JXNode> vodNodes = doc.selN(rule.getCateVodNode());
List<JXNode> vodNodes = doc.selN(rule.getCateVodNode()); for (int i = 0; i < vodNodes.size(); i++) {
for (int i = 0; i < vodNodes.size(); i++) { String name = vodNodes.get(i).selOne(rule.getCateVodName()).asString().trim();
String name = vodNodes.get(i).selOne(rule.getCateVodName()).asString().trim(); name = rule.getCateVodNameR(name);
name = rule.getCateVodNameR(name); String id = vodNodes.get(i).selOne(rule.getCateVodId()).asString().trim();
String id = vodNodes.get(i).selOne(rule.getCateVodId()).asString().trim(); id = rule.getCateVodIdR(id);
id = rule.getCateVodIdR(id); String pic = vodNodes.get(i).selOne(rule.getCateVodImg()).asString().trim();
String pic = vodNodes.get(i).selOne(rule.getCateVodImg()).asString().trim(); pic = rule.getCateVodImgR(pic);
pic = rule.getCateVodImgR(pic); pic = Utils.fixUrl(webUrl, pic);
pic = Utils.fixUrl(webUrl, pic); String mark = "";
String mark = ""; if (!rule.getCateVodMark().isEmpty()) {
if (!rule.getCateVodMark().isEmpty()) { try {
try { mark = vodNodes.get(i).selOne(rule.getCateVodMark()).asString().trim();
mark = vodNodes.get(i).selOne(rule.getCateVodMark()).asString().trim(); mark = rule.getCateVodMarkR(mark);
mark = rule.getCateVodMarkR(mark); } catch (Exception e) {
} catch (Exception e) { SpiderDebug.log(e);
SpiderDebug.log(e);
}
} }
JSONObject v = new JSONObject();
v.put("vod_id", id);
v.put("vod_name", name);
v.put("vod_pic", pic);
v.put("vod_remarks", mark);
videos.put(v);
} }
JSONObject result = new JSONObject(); list.add(new Vod(id, name, pic, mark));
result.put("page", pg);
result.put("pagecount", Integer.MAX_VALUE);
result.put("limit", 90);
result.put("total", Integer.MAX_VALUE);
result.put("list", videos);
return result.toString();
} catch (Exception e) {
SpiderDebug.log(e);
} }
return ""; return Result.string(list);
} }
@Override @Override
public String detailContent(List<String> ids) { public String detailContent(List<String> ids) {
try { fetchRule();
fetchRule(); String webUrl = rule.getDetailUrl().replace("{vid}", ids.get(0));
String webUrl = rule.getDetailUrl().replace("{vid}", ids.get(0)); String webContent = fetch(webUrl);
String webContent = fetch(webUrl); JXDocument doc = JXDocument.create(webContent);
JXDocument doc = JXDocument.create(webContent); JXNode vodNode = doc.selNOne(rule.getDetailNode());
JXNode vodNode = doc.selNOne(rule.getDetailNode()); String cover = "", title = "", desc = "", category = "", area = "", year = "", remark = "", director = "", actor = "";
title = vodNode.selOne(rule.getDetailName()).asString().trim();
String cover = "", title = "", desc = "", category = "", area = "", year = "", remark = "", director = "", actor = ""; title = rule.getDetailNameR(title);
cover = vodNode.selOne(rule.getDetailImg()).asString().trim();
title = vodNode.selOne(rule.getDetailName()).asString().trim(); cover = rule.getDetailImgR(cover);
title = rule.getDetailNameR(title); cover = Utils.fixUrl(webUrl, cover);
if (!rule.getDetailCate().isEmpty()) {
cover = vodNode.selOne(rule.getDetailImg()).asString().trim(); try {
cover = rule.getDetailImgR(cover); category = vodNode.selOne(rule.getDetailCate()).asString().trim();
cover = Utils.fixUrl(webUrl, cover); category = rule.getDetailCateR(category);
} catch (Exception e) {
if (!rule.getDetailCate().isEmpty()) { SpiderDebug.log(e);
try {
category = vodNode.selOne(rule.getDetailCate()).asString().trim();
category = rule.getDetailCateR(category);
} catch (Exception e) {
SpiderDebug.log(e);
}
} }
if (!rule.getDetailYear().isEmpty()) { }
try { if (!rule.getDetailYear().isEmpty()) {
year = vodNode.selOne(rule.getDetailYear()).asString().trim(); try {
year = rule.getDetailYearR(year); year = vodNode.selOne(rule.getDetailYear()).asString().trim();
} catch (Exception e) { year = rule.getDetailYearR(year);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
if (!rule.getDetailArea().isEmpty()) { }
try { if (!rule.getDetailArea().isEmpty()) {
area = vodNode.selOne(rule.getDetailArea()).asString().trim(); try {
area = rule.getDetailAreaR(area); area = vodNode.selOne(rule.getDetailArea()).asString().trim();
} catch (Exception e) { area = rule.getDetailAreaR(area);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
if (!rule.getDetailMark().isEmpty()) { }
try { if (!rule.getDetailMark().isEmpty()) {
remark = vodNode.selOne(rule.getDetailMark()).asString().trim(); try {
remark = rule.getDetailMarkR(remark); remark = vodNode.selOne(rule.getDetailMark()).asString().trim();
} catch (Exception e) { remark = rule.getDetailMarkR(remark);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
if (!rule.getDetailActor().isEmpty()) { }
try { if (!rule.getDetailActor().isEmpty()) {
actor = vodNode.selOne(rule.getDetailActor()).asString().trim(); try {
actor = rule.getDetailActorR(actor); actor = vodNode.selOne(rule.getDetailActor()).asString().trim();
} catch (Exception e) { actor = rule.getDetailActorR(actor);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
if (!rule.getDetailDirector().isEmpty()) { }
try { if (!rule.getDetailDirector().isEmpty()) {
director = vodNode.selOne(rule.getDetailDirector()).asString().trim(); try {
director = rule.getDetailDirectorR(director); director = vodNode.selOne(rule.getDetailDirector()).asString().trim();
} catch (Exception e) { director = rule.getDetailDirectorR(director);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
if (!rule.getDetailDesc().isEmpty()) { }
try { if (!rule.getDetailDesc().isEmpty()) {
desc = vodNode.selOne(rule.getDetailDesc()).asString().trim(); try {
desc = rule.getDetailDescR(desc); desc = vodNode.selOne(rule.getDetailDesc()).asString().trim();
} catch (Exception e) { desc = rule.getDetailDescR(desc);
SpiderDebug.log(e); } catch (Exception e) {
} SpiderDebug.log(e);
} }
}
JSONObject vod = new JSONObject(); Vod vod = new Vod();
vod.put("vod_id", ids.get(0)); vod.setVodId(ids.get(0));
vod.put("vod_name", title); vod.setVodName(title);
vod.put("vod_pic", cover); vod.setVodPic(cover);
vod.put("type_name", category); vod.setTypeName(category);
vod.put("vod_year", year); vod.setVodYear(year);
vod.put("vod_area", area); vod.setVodArea(area);
vod.put("vod_remarks", remark); vod.setVodRemarks(remark);
vod.put("vod_actor", actor); vod.setVodActor(actor);
vod.put("vod_director", director); vod.setVodDirector(director);
vod.put("vod_content", desc); vod.setVodContent(desc);
ArrayList<String> playFrom = new ArrayList<>(); ArrayList<String> playFrom = new ArrayList<>();
List<JXNode> fromNodes = doc.selN(rule.getDetailFromNode());
for (int i = 0; i < fromNodes.size(); i++) {
String name = fromNodes.get(i).selOne(rule.getDetailFromName()).asString().trim();
name = rule.getDetailFromNameR(name);
playFrom.add(name);
}
List<JXNode> fromNodes = doc.selN(rule.getDetailFromNode()); ArrayList<String> playList = new ArrayList<>();
for (int i = 0; i < fromNodes.size(); i++) { List<JXNode> urlListNodes = doc.selN(rule.getDetailUrlNode());
String name = fromNodes.get(i).selOne(rule.getDetailFromName()).asString().trim(); for (int i = 0; i < urlListNodes.size(); i++) {
name = rule.getDetailFromNameR(name); List<JXNode> urlNodes = urlListNodes.get(i).sel(rule.getDetailUrlSubNode());
playFrom.add(name); List<String> vodItems = new ArrayList<>();
} for (int j = 0; j < urlNodes.size(); j++) {
String name = urlNodes.get(j).selOne(rule.getDetailUrlName()).asString().trim();
ArrayList<String> playList = new ArrayList<>(); name = rule.getDetailUrlNameR(name);
List<JXNode> urlListNodes = doc.selN(rule.getDetailUrlNode()); String id = urlNodes.get(j).selOne(rule.getDetailUrlId()).asString().trim();
for (int i = 0; i < urlListNodes.size(); i++) { id = rule.getDetailUrlIdR(id);
List<JXNode> urlNodes = urlListNodes.get(i).sel(rule.getDetailUrlSubNode()); vodItems.add(name + "$" + id);
List<String> vodItems = new ArrayList<>();
for (int j = 0; j < urlNodes.size(); j++) {
String name = urlNodes.get(j).selOne(rule.getDetailUrlName()).asString().trim();
name = rule.getDetailUrlNameR(name);
String id = urlNodes.get(j).selOne(rule.getDetailUrlId()).asString().trim();
id = rule.getDetailUrlIdR(id);
vodItems.add(name + "$" + id);
}
// 排除播放列表為空的播放源
if (vodItems.size() == 0 && playFrom.size() > i) {
playFrom.set(i, "");
}
playList.add(TextUtils.join("#", vodItems));
} }
// 排除播放列表為空的播放源 // 排除播放列表為空的播放源
for (int i = playFrom.size() - 1; i >= 0; i--) { if (vodItems.size() == 0 && playFrom.size() > i) {
if (playFrom.get(i).isEmpty()) playFrom.set(i, "");
playFrom.remove(i);
} }
for (int i = playList.size() - 1; i >= 0; i--) { playList.add(TextUtils.join("#", vodItems));
if (playList.get(i).isEmpty())
playList.remove(i);
}
for (int i = playList.size() - 1; i >= 0; i--) {
if (i >= playFrom.size())
playList.remove(i);
}
String vod_play_from = TextUtils.join("$$$", playFrom);
String vod_play_url = TextUtils.join("$$$", playList);
vod.put("vod_play_from", vod_play_from);
vod.put("vod_play_url", vod_play_url);
JSONObject result = new JSONObject();
JSONArray list = new JSONArray();
list.put(vod);
result.put("list", list);
return result.toString();
} catch (Exception e) {
SpiderDebug.log(e);
} }
return ""; // 排除播放列表為空的播放源
for (int i = playFrom.size() - 1; i >= 0; i--) {
if (playFrom.get(i).isEmpty()) playFrom.remove(i);
}
for (int i = playList.size() - 1; i >= 0; i--) {
if (playList.get(i).isEmpty()) playList.remove(i);
}
for (int i = playList.size() - 1; i >= 0; i--) {
if (i >= playFrom.size()) playList.remove(i);
}
vod.setVodPlayFrom(TextUtils.join("$$$", playFrom));
vod.setVodPlayUrl(TextUtils.join("$$$", playList));
return Result.string(vod);
} }
@Override @Override
@ -332,79 +257,59 @@ public class XPath extends Spider {
} }
@Override @Override
public String searchContent(String key, boolean quick) { public String searchContent(String key, boolean quick) throws Exception {
try { fetchRule();
fetchRule(); if (rule.getSearchUrl().isEmpty()) return "";
if (rule.getSearchUrl().isEmpty()) { String webUrl = rule.getSearchUrl().replace("{wd}", URLEncoder.encode(key));
return ""; String webContent = fetch(webUrl);
} List<Vod> list = new ArrayList<>();
String webUrl = rule.getSearchUrl().replace("{wd}", URLEncoder.encode(key)); if (rule.getSearchVodNode().startsWith("json:")) {
String webContent = fetch(webUrl); String[] node = rule.getSearchVodNode().substring(5).split(">");
JSONObject result = new JSONObject(); JSONObject data = new JSONObject(webContent);
JSONArray videos = new JSONArray(); for (int i = 0; i < node.length; i++) {
if (rule.getSearchVodNode().startsWith("json:")) { if (i == node.length - 1) {
String[] node = rule.getSearchVodNode().substring(5).split(">"); JSONArray vodArray = data.getJSONArray(node[i]);
JSONObject data = new JSONObject(webContent); for (int j = 0; j < vodArray.length(); j++) {
for (int i = 0; i < node.length; i++) { JSONObject vod = vodArray.getJSONObject(j);
if (i == node.length - 1) { String name = vod.optString(rule.getSearchVodName()).trim();
JSONArray vodArray = data.getJSONArray(node[i]); name = rule.getSearchVodNameR(name);
for (int j = 0; j < vodArray.length(); j++) { String id = vod.optString(rule.getSearchVodId()).trim();
JSONObject vod = vodArray.getJSONObject(j); id = rule.getSearchVodIdR(id);
String name = vod.optString(rule.getSearchVodName()).trim(); String pic = vod.optString(rule.getSearchVodImg()).trim();
name = rule.getSearchVodNameR(name); pic = rule.getSearchVodImgR(pic);
String id = vod.optString(rule.getSearchVodId()).trim(); pic = Utils.fixUrl(webUrl, pic);
id = rule.getSearchVodIdR(id); String mark = vod.optString(rule.getSearchVodMark()).trim();
String pic = vod.optString(rule.getSearchVodImg()).trim(); mark = rule.getSearchVodMarkR(mark);
pic = rule.getSearchVodImgR(pic); list.add(new Vod(id, name, pic, mark));
pic = Utils.fixUrl(webUrl, pic);
String mark = vod.optString(rule.getSearchVodMark()).trim();
mark = rule.getSearchVodMarkR(mark);
JSONObject v = new JSONObject();
v.put("vod_id", id);
v.put("vod_name", name);
v.put("vod_pic", pic);
v.put("vod_remarks", mark);
videos.put(v);
}
} else {
data = data.getJSONObject(node[i]);
} }
} } else {
} else { data = data.getJSONObject(node[i]);
JXDocument doc = JXDocument.create(webContent);
List<JXNode> vodNodes = doc.selN(rule.getSearchVodNode());
for (int i = 0; i < vodNodes.size(); i++) {
String name = vodNodes.get(i).selOne(rule.getSearchVodName()).asString().trim();
name = rule.getSearchVodNameR(name);
String id = vodNodes.get(i).selOne(rule.getSearchVodId()).asString().trim();
id = rule.getSearchVodIdR(id);
String pic = vodNodes.get(i).selOne(rule.getSearchVodImg()).asString().trim();
pic = rule.getSearchVodImgR(pic);
pic = Utils.fixUrl(webUrl, pic);
String mark = "";
if (!rule.getCateVodMark().isEmpty()) {
try {
mark = vodNodes.get(i).selOne(rule.getSearchVodMark()).asString().trim();
mark = rule.getSearchVodMarkR(mark);
} catch (Exception e) {
SpiderDebug.log(e);
}
}
JSONObject v = new JSONObject();
v.put("vod_id", id);
v.put("vod_name", name);
v.put("vod_pic", pic);
v.put("vod_remarks", mark);
videos.put(v);
} }
} }
result.put("list", videos); } else {
return result.toString(); JXDocument doc = JXDocument.create(webContent);
} catch ( List<JXNode> vodNodes = doc.selN(rule.getSearchVodNode());
Exception e) { for (int i = 0; i < vodNodes.size(); i++) {
SpiderDebug.log(e); String name = vodNodes.get(i).selOne(rule.getSearchVodName()).asString().trim();
name = rule.getSearchVodNameR(name);
String id = vodNodes.get(i).selOne(rule.getSearchVodId()).asString().trim();
id = rule.getSearchVodIdR(id);
String pic = vodNodes.get(i).selOne(rule.getSearchVodImg()).asString().trim();
pic = rule.getSearchVodImgR(pic);
pic = Utils.fixUrl(webUrl, pic);
String mark = "";
if (!rule.getCateVodMark().isEmpty()) {
try {
mark = vodNodes.get(i).selOne(rule.getSearchVodMark()).asString().trim();
mark = rule.getSearchVodMarkR(mark);
} catch (Exception e) {
SpiderDebug.log(e);
}
}
list.add(new Vod(id, name, pic, mark));
}
} }
return ""; return Result.string(list);
} }
@Override @Override
@ -412,20 +317,9 @@ public class XPath extends Spider {
return false; return false;
} }
private final String[] videoFormatList = new String[]{".m3u8", ".mp4", ".mpeg", ".flv"};
@Override @Override
public boolean isVideoFormat(String url) { public boolean isVideoFormat(String url) {
url = url.toLowerCase(); return Utils.isVideoFormat(url);
if (url.contains("=http") || url.contains("=https") || url.contains("=https%3a%2f") || url.contains("=http%3a%2f")) {
return false;
}
for (String format : videoFormatList) {
if (url.contains(format)) {
return true;
}
}
return false;
} }
protected String ext = null; protected String ext = null;
@ -447,7 +341,6 @@ public class XPath extends Spider {
} }
protected void loadRuleExt(String json) { protected void loadRuleExt(String json) {
} }
protected String fetch(String webUrl) { protected String fetch(String webUrl) {

View File

@ -89,7 +89,6 @@ public class XPathMac extends XPath {
SpiderDebug.log(e); SpiderDebug.log(e);
} }
} }
// SpiderDebug.log(webContent);
} }
return result; return result;
} }

View File

@ -30,6 +30,7 @@ public class Utils {
} }
public static boolean isVideoFormat(String url) { public static boolean isVideoFormat(String url) {
if (url.contains("url=http") || url.contains(".js") || url.contains(".css") || url.contains(".html")) return false;
return Sniffer.RULE.matcher(url).find(); return Sniffer.RULE.matcher(url).find();
} }