@@ -84,7 +84,7 @@ interface ExtraFileConfig extends ExtraCommonConfig {
84
84
onCrawlItemComplete :
85
85
| ( ( crawlFileSingleRes : CrawlFileSingleRes ) => void )
86
86
| undefined
87
- onBeforeSaveFile :
87
+ onBeforeSaveItemFile :
88
88
| ( ( info : {
89
89
id : number
90
90
fileName : string
@@ -120,7 +120,7 @@ interface CrawlDataConfigOriginal {
120
120
interface CrawlFileConfigOriginal {
121
121
detailTargets : CrawlFileDetailTargetConfig [ ]
122
122
intervalTime : IntervalTime | undefined
123
- onBeforeSaveFile :
123
+ onBeforeSaveItemFile :
124
124
| ( ( info : {
125
125
id : number
126
126
fileName : string
@@ -195,27 +195,29 @@ function parsePageCookies(
195
195
return cookiesArr
196
196
}
197
197
198
/**
 * Normalizes a target description into an array of detail-target objects.
 *
 * Accepts either a single target or an array of targets. Any entry that
 * `isObject` does not recognise as an object (e.g. a plain URL string) is
 * wrapped as `{ url: entry }`; object entries are passed through untouched.
 *
 * The overloads keep the element type of the result aligned with the kind of
 * config (page / data / file) that was passed in.
 *
 * @param config A single target, or an array of targets, to normalize.
 * @returns An array with one detail-target object per input entry.
 */
function transformTargetToDetailTargets(
  config:
    | string
    | CrawlPageDetailTargetConfig
    | (string | CrawlPageDetailTargetConfig)[]
): CrawlPageDetailTargetConfig[]
function transformTargetToDetailTargets(
  config:
    | string
    | CrawlDataDetailTargetConfig
    | (string | CrawlDataDetailTargetConfig)[]
): CrawlDataDetailTargetConfig[]
function transformTargetToDetailTargets(
  config: (string | CrawlFileDetailTargetConfig)[]
): CrawlFileDetailTargetConfig[]
function transformTargetToDetailTargets(config: any) {
  // Wrap a non-object entry into the `{ url }` shape; leave objects as they are.
  const toDetailTarget = (target: any) =>
    isObject(target) ? target : { url: target }

  // Array input: convert every entry individually.
  if (isArray(config)) {
    return config.map((target: any) => toDetailTarget(target))
  }

  // Single input: always hand back a one-element array.
  return [toDetailTarget(config)]
}
218
218
219
+ /* Loader config */
220
+
219
221
function loaderCommonFingerprintToDetailTarget (
220
222
detail :
221
223
| CrawlPageDetailTargetConfig
@@ -434,7 +436,7 @@ function loaderCommonConfigToCrawlConfig(
434
436
crawlConfig . onCrawlItemComplete = advancedConfig . onCrawlItemComplete
435
437
}
436
438
437
- /* Create Config */
439
+ /* Create config */
438
440
/*
439
441
每个创建配置函数的返回值都是类似于进阶版配置
440
442
不同点:
@@ -461,10 +463,12 @@ function createCrawlPageConfig(
461
463
const { targets } = originalConfig as CrawlPageAdvancedConfig
462
464
advancedConfig = originalConfig as CrawlPageAdvancedConfig
463
465
464
- crawlPageConfig . detailTargets . push ( ...transformToDetailTargets ( targets ) )
466
+ crawlPageConfig . detailTargets . push (
467
+ ...transformTargetToDetailTargets ( targets )
468
+ )
465
469
} else {
466
470
// string | CrawlPageDetailTargetConfig | (string | CrawlPageDetailTargetConfig)[] 处理
467
- const detaileTargets = transformToDetailTargets (
471
+ const detaileTargets = transformTargetToDetailTargets (
468
472
originalConfig as
469
473
| string
470
474
| CrawlPageDetailTargetConfig
@@ -520,10 +524,12 @@ function createCrawlDataConfig<T>(
520
524
const { targets } = originalConfig as CrawlDataAdvancedConfig < T >
521
525
advancedConfig = originalConfig as CrawlDataAdvancedConfig < T >
522
526
523
- crawlDataConfig . detailTargets . push ( ...transformToDetailTargets ( targets ) )
527
+ crawlDataConfig . detailTargets . push (
528
+ ...transformTargetToDetailTargets ( targets )
529
+ )
524
530
} else {
525
531
// string | CrawlDataDetailTargetConfig | (string | CrawlDataDetailTargetConfig)[] 处理
526
- const detaileTargets = transformToDetailTargets (
532
+ const detaileTargets = transformTargetToDetailTargets (
527
533
originalConfig as
528
534
| string
529
535
| CrawlDataDetailTargetConfig
@@ -545,7 +551,7 @@ function createCrawlFileConfig(
545
551
const crawlFileConfig : CrawlFileConfigOriginal = {
546
552
detailTargets : [ ] ,
547
553
intervalTime : undefined ,
548
- onBeforeSaveFile : undefined ,
554
+ onBeforeSaveItemFile : undefined ,
549
555
onCrawlItemComplete : undefined
550
556
}
551
557
@@ -556,7 +562,9 @@ function createCrawlFileConfig(
556
562
const { targets } = originalConfig as CrawlFileAdvancedConfig
557
563
558
564
advancedConfig = originalConfig as CrawlFileAdvancedConfig
559
- crawlFileConfig . detailTargets . push ( ...transformToDetailTargets ( targets ) )
565
+ crawlFileConfig . detailTargets . push (
566
+ ...transformTargetToDetailTargets ( targets )
567
+ )
560
568
} else {
561
569
// CrawlFileDetailTargetConfig | CrawlFileDetailTargetConfig[] 处理
562
570
crawlFileConfig . detailTargets . push (
@@ -582,7 +590,7 @@ function createCrawlFileConfig(
582
590
}
583
591
} )
584
592
585
- crawlFileConfig . onBeforeSaveFile = advancedConfig . onBeforeSaveFile
593
+ crawlFileConfig . onBeforeSaveItemFile = advancedConfig . onBeforeSaveItemFile
586
594
587
595
return crawlFileConfig as CrawlFileConfig
588
596
}
@@ -697,7 +705,7 @@ function fileSingleResultHandle(
697
705
saveFilePendingQueue,
698
706
699
707
onCrawlItemComplete,
700
- onBeforeSaveFile
708
+ onBeforeSaveItemFile
701
709
} = extraConfig
702
710
703
711
const crawlFileSingleRes : AnyObject = detaileInfo
@@ -721,8 +729,8 @@ function fileSingleResultHandle(
721
729
// 在保存前的回调
722
730
const data = detailTargetRes . data
723
731
let dataPromise = Promise . resolve ( data )
724
- if ( onBeforeSaveFile ) {
725
- dataPromise = onBeforeSaveFile ( {
732
+ if ( onBeforeSaveItemFile ) {
733
+ dataPromise = onBeforeSaveItemFile ( {
726
734
id,
727
735
fileName,
728
736
filePath,
@@ -959,7 +967,7 @@ export function createCrawlFile(xCrawlConfig: LoaderXCrawlConfig) {
959
967
const {
960
968
detailTargets,
961
969
intervalTime,
962
- onBeforeSaveFile ,
970
+ onBeforeSaveItemFile ,
963
971
onCrawlItemComplete
964
972
} = createCrawlFileConfig ( xCrawlConfig , config )
965
973
@@ -969,7 +977,7 @@ export function createCrawlFile(xCrawlConfig: LoaderXCrawlConfig) {
969
977
970
978
intervalTime,
971
979
onCrawlItemComplete,
972
- onBeforeSaveFile
980
+ onBeforeSaveItemFile
973
981
}
974
982
975
983
const crawlResArr = ( await controller (
0 commit comments