|
@@ -1,44 +1,10 @@
|
|
|
package cn.reghao.bnt.browser;
|
|
package cn.reghao.bnt.browser;
|
|
|
|
|
|
|
|
-import cn.reghao.bnt.browser.parser.ChromeDataParser;
|
|
|
|
|
-import cn.reghao.bnt.browser.chrome.AbstractChrome;
|
|
|
|
|
-import cn.reghao.bnt.browser.chrome.ChromeBrowser;
|
|
|
|
|
-import cn.reghao.bnt.browser.chrome.ReqMatcher;
|
|
|
|
|
-import cn.reghao.bnt.spider.url.BodyDataType;
|
|
|
|
|
-import cn.reghao.bnt.spider.url.Site;
|
|
|
|
|
-
|
|
|
|
|
-import java.util.HashMap;
|
|
|
|
|
-import java.util.HashSet;
|
|
|
|
|
-import java.util.Map;
|
|
|
|
|
-import java.util.Set;
|
|
|
|
|
-
|
|
|
|
|
/**
|
|
/**
|
|
|
* @author reghao
|
|
* @author reghao
|
|
|
* @date 2023-09-10 02:24:50
|
|
* @date 2023-09-10 02:24:50
|
|
|
*/
|
|
*/
|
|
|
public class SpiderBrowser {
|
|
public class SpiderBrowser {
|
|
|
- public static Map<String, String> map = new HashMap<>();
|
|
|
|
|
- static ChromeDataParser chromeDataParser = new ChromeDataParser();
|
|
|
|
|
-
|
|
|
|
|
- static Set<ReqMatcher> reqMatchers() {
|
|
|
|
|
- Set<ReqMatcher> set = new HashSet<>();
|
|
|
|
|
- String pattern = "h5/mtop.taobao.rate.detaillist.get/6.0";
|
|
|
|
|
- String parser = "TmallCommentDataParser";
|
|
|
|
|
- map.put(pattern, parser);
|
|
|
|
|
- set.add(new ReqMatcher(Site.bilibili, pattern, BodyDataType.json, chromeDataParser));
|
|
|
|
|
-
|
|
|
|
|
- String pattern1 = "rate.taobao.com/feedRateList.htm";
|
|
|
|
|
- String parser1 = "TaobaoCommentDataParser";
|
|
|
|
|
- map.put(pattern1, parser1);
|
|
|
|
|
- set.add(new ReqMatcher(Site.bilibili, pattern1, BodyDataType.json, chromeDataParser));
|
|
|
|
|
- return set;
|
|
|
|
|
- }
|
|
|
|
|
-
|
|
|
|
|
public static void main(String[] args) {
|
|
public static void main(String[] args) {
|
|
|
- Set<ReqMatcher> set = reqMatchers();
|
|
|
|
|
-
|
|
|
|
|
- String url = "https://www.tmall.com/";
|
|
|
|
|
- AbstractChrome chrome = new ChromeBrowser(false, false);
|
|
|
|
|
- chrome.getAndHandleDynamicPage(url, set);
|
|
|
|
|
}
|
|
}
|
|
|
}
|
|
}
|