@@ -20,65 +20,61 @@ export default class Source {
20
20
declare extra : any ;
21
21
private declare id : string ;
22
22
23
- constructor ( ) {
24
- }
25
-
26
23
/**
27
24
* Parse and store a source file contents to an array in memory
28
25
* @param source the source file
29
26
*/
30
27
static fileToSource ( source : any ) : Source {
31
- source . filename = source . filename ? source . filename : source . name ? source . name : '[ unknown filename] ' ;
28
+ source . filename = source . filename ? source . filename : source . name ? source . name : 'unknown filename' ;
32
29
33
30
let ret = new Source ( ) ;
34
31
35
32
// Source name
36
- if ( ! source . name || source . name . length < 3 )
37
- throw new Error ( `SourceException: ${ source . filename } : name: is not valid, must be type string with a least 3 characters .` ) ;
33
+ if ( source . name == null || source . name . length < 3 )
34
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field name is not valid, requirements( type = string, length >= 3) .` ) ;
38
35
ret . name = source . name ;
39
36
40
37
// Source tableName
41
- if ( source . tableName && ( typeof source . tableName !== 'string' || source . tableName . length < 3 ) )
42
- throw new Error ( `SourceException: ${ source . filename } : tableName: is not valid, must be type string with a least 3 characters.` ) ;
43
- if ( [ "saffron" , "config" , "workers" ] . includes ( source . tableName ) )
44
- throw new Error ( `SourceException: ${ source . filename } : tableName: is blacklisted.` ) ;
38
+ if ( source . tableName != null && ( typeof source . tableName !== 'string' || source . tableName . length < 3 || [ "saffron" , "config" , "workers" ] . includes ( source . tableName ) ) )
39
+ throw new Error ( `SourceException: [${ source . filename } ] Field tableName is not valid, requirements(type = string, length >= 3, != saffron, != workers, != config).` ) ;
45
40
ret . tableName = source . tableName ;
46
41
47
- if ( source . interval && ( typeof source . interval != 'number' || source . interval < 0 ) )
48
- throw new Error ( `SourceException: ${ source . filename } : interval: is not valid, must be a positive number.` ) ;
49
- ret . interval = source . interval ;
42
+ if ( source . interval != null && ( typeof source . interval != 'number' || source . interval < 0 ) )
43
+ throw new Error ( `SourceException: [${ source . filename } ] Field interval is not valid, requirements(type = number, positive or zero).` ) ;
44
+ ret . interval = source . interval ? source . interval : Config . getOption ( ConfigOptions . SCHEDULER_JOB_INT ) ;
45
+
46
+ if ( source . retryInterval != null && ( typeof source . retryInterval != 'number' || source . retryInterval < 0 ) )
47
+ throw new Error ( `SourceException: [${ source . filename } ] Field retryInterval is not valid, requirements(type = number, positive or zero).` ) ;
48
+ ret . retryInterval = source . retryInterval ? source . retryInterval : Config . getOption ( ConfigOptions . SCHEDULER_JOB_INT ) / 2 ;
50
49
51
- if ( source . retryInterval && ( typeof source . retryInterval != 'number' || source . retryInterval < 0 ) )
52
- throw new Error ( `SourceException: ${ source . filename } : retryInterval: is not valid, must be a positive number .` ) ;
53
- ret . retryInterval = source . retryInterval ;
50
+ if ( source . timeout != null && ( typeof source . timeout != 'number' || source . timeout < 0 ) )
51
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field timeout is not valid, requirements(type = number, positive or zero) .` ) ;
52
+ ret . timeout = source . timeout ? source . timeout : Config . getOption ( ConfigOptions . REQUEST_TIMEOUT ) ;
54
53
55
- if ( source . timeout && ( typeof source . timeout != 'number' || source . timeout < 0 ) )
56
- throw new Error ( `SourceException: ${ source . filename } : timeout: is not valid, must be a positive number.` ) ;
57
- ret . timeout = source . timeout ? source . timeout : Config . getOption ( ConfigOptions . REQUEST_TIMEOUT )
54
+ ret . extra = source . extra ;
58
55
59
- // If it is not one time scrape:
60
- ret . instructions = new Instructions ( )
61
- ret . instructions . source = { id : ret . getId ( ) }
56
+ const instructions = new Instructions ( ) ;
57
+ ret . instructions = instructions ;
58
+ instructions . source = { id : ret . getId ( ) }
62
59
63
- if ( source . amount && ( typeof source . amount != 'number' || source . amount <= 0 ) )
64
- throw new Error ( `SourceException: ${ source . filename } : amount: is not valid, must be a positive number .` ) ;
65
- ret . instructions . amount = source . amount ? source . amount : Config . getOption ( ConfigOptions . ARTICLE_AMOUNT )
60
+ if ( source . amount != null && ( typeof source . amount != 'number' || source . amount <= 0 ) )
61
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field amount is not valid, requirements(type = number, positive) .` ) ;
62
+ instructions . amount = source . amount ? source . amount : Config . getOption ( ConfigOptions . ARTICLE_AMOUNT ) ;
66
63
67
- if ( typeof source . ignoreCertificates !== 'undefined' && typeof source . ignoreCertificates !== 'boolean' )
68
- throw new Error ( `SourceException: ${ source . filename } : ignoreCertificates: is not valid, must be boolean.` ) ;
69
- ret . instructions . ignoreCertificates = source . ignoreCertificates ? source . ignoreCertificates : false ;
64
+ if ( source . ignoreCertificates != null && typeof source . ignoreCertificates !== 'boolean' )
65
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field ignoreCertificates is not valid, requirements(type = boolean) .` ) ;
66
+ instructions . ignoreCertificates = source . ignoreCertificates ? source . ignoreCertificates : false ;
70
67
71
- if ( typeof source . encoding !== 'undefined' && typeof source . encoding !== 'string' )
72
- throw new Error ( `SourceException: ${ source . filename } : encoding: is not valid, must be string value .` ) ;
73
- ret . instructions . textDecoder = source . encoding ? new TextDecoder ( `${ source . encoding } ` ) : new TextDecoder ( ) ;
68
+ if ( source . encoding != null && typeof source . encoding !== 'string' )
69
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field encoding is not valid requirements(type = string) .` ) ;
70
+ instructions . textDecoder = source . encoding ? new TextDecoder ( `${ source . encoding } ` ) : new TextDecoder ( ) ;
74
71
75
- ret . extra = source . extra ;
76
72
77
- ret . instructions . url = [ ] ;
73
+ instructions . url = [ ] ;
78
74
if ( typeof source . url === 'string' ) {
79
75
if ( source . url . length == 0 )
80
- throw new Error ( `SourceException: ${ source . filename } : url: is not valid, url cannot be empty.` ) ;
81
- ret . instructions . url . push ( { url : source . url , aliases : [ ] } ) ;
76
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field url is not valid, requirements(type = string, not empty) .` ) ;
77
+ instructions . url . push ( { url : source . url , aliases : [ ] } ) ;
82
78
} else if ( Array . isArray ( source . url ) ) {
83
79
for ( const pair of source . url ) {
84
80
if ( Array . isArray ( pair ) && pair . length >= 2 ) {
@@ -87,65 +83,62 @@ export default class Source {
87
83
88
84
aliases . forEach ( alias => {
89
85
if ( typeof alias !== 'string' || alias . trim ( ) === '' )
90
- throw new Error ( `SourceException: ${ source . filename } : url: is not valid, invalid alias ' ${ alias } ' .` ) ;
86
+ throw new Error ( `SourceException: [ ${ source . filename } ] At field url, field alias is not valid, requirements(type = string, not empty, not whitespace) .` ) ;
91
87
} ) ;
92
88
93
89
if ( typeof url !== 'string' || url . trim ( ) === '' )
94
- throw new Error ( `SourceException: ${ source . filename } : url: is not valid, invalid url ' ${ url } ' .` ) ;
90
+ throw new Error ( `SourceException: [ ${ source . filename } ] At field url, field url is not valid, requirements(type = string, not empty not whitespace) .` ) ;
95
91
96
- ret . instructions . url . push ( { url, aliases} ) ;
92
+ instructions . url . push ( { url, aliases} ) ;
97
93
} else if ( typeof pair === 'string' || ( ( Array . isArray ( pair ) && pair . length == 1 ) ) ) {
98
94
let url : any = pair ;
99
95
if ( Array . isArray ( pair ) ) url = pair [ 0 ] ;
100
96
101
- ret . instructions . url . push ( { url, aliases : [ ] } ) ;
102
- } else throw new Error ( `SourceException: ${ source . filename } : url: is not valid, error during parsing pair: ${ pair } .` ) ;
97
+ instructions . url . push ( { url, aliases : [ ] } ) ;
98
+ } else
99
+ throw new Error ( `SourceException: [${ source . filename } ] Field url is not valid, requirements(type = string[] | string[][]).` ) ;
103
100
}
104
101
} else
105
- throw new Error ( `SourceException: ${ source . filename } : url: is not valid, must be a string type or an array .` )
102
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field url is not valid, requirements(type = string | string[] | string[][]) .` ) ;
106
103
107
- let parserType = ParserType . getFromString ( source . type )
104
+ let parserType = ParserType . getFromString ( source . type ) ;
108
105
if ( parserType === ParserType . UNKNOWN )
109
- throw new Error ( `SourceException: ${ source . filename } : type: is not valid.` ) ;
110
- ret . instructions . parserType = parserType ;
106
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field type is not valid, requirements(equals html, rss, dynamic, wordpress-v1, wordpress-v2) .` ) ;
107
+ instructions . parserType = parserType ;
111
108
112
109
try {
113
110
ParserLoader . validateScrapeOptions ( parserType , source . scrape ) ;
114
111
} catch ( e : any ) {
115
- throw new Error ( `SourceException: ${ source . filename } : invalid scrape method , parser error: ${ e . message } ` ) ;
112
+ throw new Error ( `SourceException: [ ${ source . filename } ] Field scrape is not valid , parser error: ${ e . message } ` ) ;
116
113
}
117
114
118
115
ParserLoader . assignScrapeInstructions ( parserType , ret . instructions , source ) ;
119
116
120
- return ret
117
+ return ret ;
121
118
}
122
119
123
120
static pushSource ( source : Source ) {
124
121
this . _sources . push ( source ) ;
125
122
}
126
123
127
124
/**
128
- * Return a copy array of the sources
125
+ * Return an array of the parsed sources.
129
126
*/
130
127
static getSources ( ) : Source [ ] {
131
- return this . _sources
128
+ return this . _sources ;
132
129
}
133
130
134
131
/**
135
132
* Return the source class based on job, article or source id
136
133
* @param from
137
134
*/
138
- static getSourceFrom ( from : Job | Article | string ) : Source {
139
- if ( from instanceof Job )
140
- return this . _sources . find ( ( source : Source ) => {
141
- return source . getId ( ) === from . source ?. id
142
- } ) ! !
143
- else if ( from instanceof Article )
144
- return this . _sources . find ( ( source : Source ) => {
145
- return source . getId ( ) === from . source ?. id
146
- } ) ! !
147
-
148
- return this . _sources . find ( ( source : Source ) => source . getId ( ) === from ) ! !
135
+ static getSourceFrom ( from : Job | Article | Instructions | string ) : Source {
136
+ let id = '' ;
137
+ if ( from instanceof Job || from instanceof Article || from instanceof Instructions )
138
+ id = from . source ?. id ;
139
+ else id = from ;
140
+
141
+ return this . _sources . find ( source => source . getId ( ) === id ) ! ;
149
142
}
150
143
151
144
/**
0 commit comments