Skip to content

Commit 34d1dc9

Browse files
committedJul 4, 2022
Use utils.get instead of axios directly
1 parent b426ce1 commit 34d1dc9

File tree

5 files changed

+34
-59
lines changed

5 files changed

+34
-59
lines changed
 

‎src/components/AxiosConfig.ts

-10
This file was deleted.

‎src/modules/parsers/drivers/HTMLParser.ts

+11-21
Original file line numberDiff line numberDiff line change
@@ -2,13 +2,9 @@ import {ParserClass} from "../ParserClass";
22
import Instructions from "../../../components/instructions";
33
import Job from "../../../components/job";
44
import Article from "../../../components/articles";
5-
import https from "https";
6-
import axios, {AxiosRequestConfig, AxiosResponse} from "axios";
5+
import {AxiosResponse} from "axios";
76
import cheerio from "cheerio";
87
import Utils from "../Utils";
9-
import {AxiosConfig} from "../../../components/AxiosConfig";
10-
11-
const httpsAgent = new https.Agent({rejectUnauthorized: false})
128

139
interface ArticleImage {
1410
[key: string]: any
@@ -19,7 +15,7 @@ export class HTMLParser extends ParserClass {
1915
static async parse2(instructions: Instructions, utils: Utils): Promise<Article[]> {
2016
let parsedArticles: Article[] = [];
2117

22-
await HTMLParser.request(utils.url, instructions.getSource().timeout, instructions)
18+
await HTMLParser.request(utils)
2319
.then((response: AxiosResponse) => {
2420
const cheerioLoad: cheerio.Root = cheerio.load(instructions.textDecoder.decode(response.data));
2521

@@ -109,26 +105,20 @@ export class HTMLParser extends ParserClass {
109105
return parsedArticles
110106
}
111107

112-
private static async request(url: string, timeout: number, instructions: Instructions): Promise<AxiosResponse> {
108+
private static async request(utils: Utils): Promise<AxiosResponse> {
113109
return new Promise((resolve, reject) => {
114-
115-
let config: AxiosConfig = {
116-
method: 'get',
117-
url,
118-
timeout,
110+
utils.get(utils.url, {
111+
timeout: utils.instructions.getSource().timeout,
119112
responseType: 'arraybuffer',
113+
// @ts-ignore
120114
responseEncoding: 'binary'
121-
}
122-
123-
if (instructions["ignoreCertificates"]) config.httpsAgent = httpsAgent
124-
axios((config as AxiosRequestConfig)).then((result: AxiosResponse) => {
125-
resolve(result)
115+
}).then((result: AxiosResponse) => {
116+
resolve(result);
126117
}).catch((e: any) => {
127118
let message = `HTMLParserException error during request, original error ${e.message}`
128-
reject(new Error(message))
129-
})
130-
131-
})
119+
reject(new Error(message));
120+
});
121+
});
132122
}
133123

134124
/**

‎src/modules/parsers/drivers/wordpress/WordpressV2Parser.ts

+5-6
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@ import Article from "../../../../components/articles";
55
import axios, {AxiosRequestConfig} from "axios";
66
import Utils from "../../Utils";
77
import https from "https";
8-
import {AxiosConfig} from "../../../../components/AxiosConfig";
98

109
const httpsAgent = new https.Agent({rejectUnauthorized: false})
1110

@@ -90,16 +89,16 @@ export class WordpressV2Parser extends ParserClass {
9089
let categories: any
9190
, posts: any[];
9291

93-
let config: AxiosConfig & AxiosRequestConfig = {
94-
timeout: instructions.getSource().timeout,
92+
let config = {
93+
timeout: utils.instructions.getSource().timeout,
9594
responseType: 'arraybuffer',
95+
// @ts-ignore
9696
responseEncoding: 'binary'
9797
};
98-
if (instructions["ignoreCertificates"]) config.httpsAgent = httpsAgent;
9998

10099
try {
101-
categories = JSON.parse(instructions.textDecoder.decode((await axios.get(categoriesUrl, config))?.data))
102-
posts = JSON.parse(instructions.textDecoder.decode((await axios.get(postsUrl, config))?.data))
100+
categories = JSON.parse(instructions.textDecoder.decode((await utils.get(categoriesUrl, config as any))?.data))
101+
posts = JSON.parse(instructions.textDecoder.decode((await utils.get(postsUrl, config as any))?.data))
103102
} catch (e: any) {
104103
throw new Error(`WordpressParserException job failed for ${instructions.getSource().name}, original error: ${e.message}`);
105104
}

‎src/modules/workers/index.ts

+1
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@ export default class Worker {
3131
utils.aliases = pair.aliases;
3232
utils.isScrapeAfterError = job.attempts !== 0;
3333
utils.amount = job.getInstructions().amount;
34+
utils.instructions = job.getInstructions();
3435

3536
const newArticles = await parser.parse(job, utils);
3637
results.push({

‎test/index.js

+17-22
Original file line numberDiff line numberDiff line change
@@ -46,33 +46,28 @@ try {
4646
let errors = []
4747
const saffron = new Saffron();
4848

49-
try {
50-
await saffron.initialize(config)
51-
await saffron.start()
49+
saffron.on("workers.articles.found", (articles, src) => {
50+
console.log('articles.found', src, articles.length)
51+
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
52+
});
5253

53-
saffron.on("workers.articles.found", (articles, src) => {
54-
console.log('articles.found')
55-
console.log(src, articles.length)
56-
console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
57-
});
54+
saffron.on('workers.parsers.error', (e) => errors.push(e));
5855

59-
// saffron.on("workers.articles.new", (articles, src) => {
60-
// console.log('articles.new')
61-
// console.log(src, articles.length);
62-
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
63-
// });
56+
saffron.on("middleware.before", (articles) => {
57+
// console.log('middleware.before')
58+
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
59+
});
6460

65-
saffron.on("middleware.before", (articles) => {
66-
// console.log('middleware.before')
67-
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
68-
});
61+
saffron.on("middleware.after", (articles) => {
62+
// console.log('middleware.after')
63+
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
64+
});
6965

70-
saffron.on("middleware.after", (articles) => {
71-
// console.log('middleware.after')
72-
// console.log(util.inspect(articles, {showHidden: false, depth: null, colors: true}));
73-
});
66+
try {
67+
await saffron.initialize(config);
68+
await saffron.start();
7469
} catch (error) {
75-
errors.push(error)
70+
errors.push(error);
7671
}
7772

7873
if (process.env.NODE_ENV === "testing") setTimeout(() => {

0 commit comments

Comments
 (0)
Please sign in to comment.