@@ -5,7 +5,7 @@ import XCrawl from '../../src'
5
5
import { IRequestConfig } from '../../src/types'
6
6
import { IAreaRoom , IBRecommend } from './types'
7
7
8
- // 1. 爬取 房间数据
8
+ // 1. 房间数据
9
9
// https://github.com/coder-hxl/airbnb-api
10
10
11
11
const roomXCrawl = new XCrawl ( {
@@ -46,66 +46,37 @@ function areaRoomData() {
46
46
}
47
47
// areaRoomData()
48
48
49
- // ==================================================
50
-
51
- // 2. 爬取 b站 数据
52
-
53
- // 2.1 JSON: b站首页推荐视频的封面图
54
- /*
55
- https://api.bilibili.com/x/web-interface/wbi/index/top/feed/rcmd?y_num=5&fresh_type=3&feed_version=V8&fresh_idx_1h=1&fetch_row=1&fresh_idx=1&brush=0&homepage_ver=1&ps=10&outside_trigger=&w_rid=921db33671365ec8b9f7cab1971a3834&wts=1674553870
56
- */
49
+ // 2 HTML: GitHub Docs
50
+ // 采用 jsdom 对 HTML String 解析
57
51
58
- const bilibiliXCrawl = new XCrawl ( {
52
+ const githubDocsXCrawl = new XCrawl ( {
59
53
timeout : 10000 ,
60
54
intervalTime : {
61
- max : 1500 ,
55
+ max : 3000 ,
62
56
min : 1000
63
57
}
64
58
} )
65
59
66
- async function bilibiliRecommendData ( ) {
67
- const recommend = await bilibiliXCrawl . fetch < IBRecommend > ( {
68
- requestConifg : {
69
- url : 'https://api.bilibili.com/x/web-interface/wbi/index/top/feed/rcmd' ,
70
- method : 'GET' ,
71
- params : {
72
- y_num : 5 ,
73
- fresh_type : 3 ,
74
- feed_version : 'V8' ,
75
- fresh_idx_1h : 1 ,
76
- fetch_row : 1 ,
77
- fresh_idx : 1 ,
78
- brush : 0 ,
79
- homepage_ver : 1 ,
80
- ps : 10 ,
81
- outside_trigger : '' ,
82
- w_rid : '2e4be8e9830ecd780c5b0ff2bef805c9' ,
83
- wts : 1674556002
84
- }
85
- }
86
- } )
87
-
88
- const pictureUrls : IRequestConfig [ ] = recommend . data . item . map ( ( item ) => ( {
89
- url : item . pic ,
90
- method : 'GET'
91
- } ) )
60
+ async function githubDocs ( ) {
61
+ const dom = await githubDocsXCrawl . fetchHTML ( 'https://docs.github.com/zh' )
92
62
93
- const storeFile = await bilibiliXCrawl . fetchFile ( {
94
- requestConifg : pictureUrls ,
95
- intervalTime : { max : 3000 , min : 2000 } ,
96
- fileConfig : { storeDir : path . resolve ( __dirname , './upload' ) }
97
- } )
98
-
99
- console . log ( storeFile )
63
+ console . log ( dom . window . document . querySelector ( 'title' ) ?. textContent )
100
64
}
101
- bilibiliRecommendData ( )
102
65
103
- // 2.2 HTML: b站首页标题
104
- // 采用 jsdom 对 HTML String 解析
66
+ // githubDocs()
67
+
68
+ // https://docs.github.com/assets/cb-262/images/octicons/search-16.svg
105
69
106
- function bilibiliHTMLData ( ) {
107
- bilibiliXCrawl . fetchHTML ( 'https://www.bilibili.com/' ) . then ( ( dom ) => {
108
- console . log ( dom . window . document . querySelector ( 'title' ) ?. textContent )
70
+ githubDocsXCrawl
71
+ . fetchFile ( {
72
+ requestConifg : {
73
+ url : 'https://docs.github.com/assets/cb-262/images/octicons/search-16.svg' ,
74
+ method : 'GET'
75
+ } ,
76
+ fileConfig : {
77
+ storeDir : path . resolve ( __dirname , './upload' )
78
+ }
79
+ } )
80
+ . then ( ( fileInfos ) => {
81
+ console . log ( fileInfos )
109
82
} )
110
- }
111
- // bilibiliHTMLData()
0 commit comments