forked from jef/streetmerchant
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathutil.ts
104 lines (89 loc) · 2.38 KB
/
util.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
import {Browser, Page, Response} from 'puppeteer';
import {StatusCodeRangeArray, Store} from './store/model';
import {config} from './config';
import {disableBlockerInPage} from './adblocker';
import {logger} from './logger';
import topUserAgents from 'top-user-agents';
export function getSleepTime(store: Store) {
const minSleep = store.minPageSleep as number;
return (
minSleep + Math.random() * ((store.maxPageSleep as number) - minSleep)
);
}
export async function delay(ms: number) {
return new Promise((resolve) => {
setTimeout(resolve, ms);
});
}
export function noop() {
// Do nothing
}
export function isStatusCodeInRange(
statusCode: number,
range: StatusCodeRangeArray
) {
for (const value of range) {
let min: number;
let max: number;
if (typeof value === 'number') {
min = value;
max = value;
} else {
[min, max] = value;
}
if (min <= statusCode && statusCode <= max) {
return true;
}
}
return false;
}
export async function usingResponse<T>(
browser: Browser,
url: string,
cb: (response: Response | null, page: Page, browser: Browser) => Promise<T>
): Promise<T> {
return usingPage(browser, async (page, browser) => {
const response = await page.goto(url, {waitUntil: 'domcontentloaded'});
return cb(response, page, browser);
});
}
export async function usingPage<T>(
browser: Browser,
cb: (page: Page, browser: Browser) => Promise<T>
): Promise<T> {
const page = await browser.newPage();
page.setDefaultNavigationTimeout(config.page.timeout);
await page.setUserAgent(await getRandomUserAgent());
try {
return await cb(page, browser);
} finally {
try {
await closePage(page);
} catch (error: unknown) {
logger.error('usingPage', error);
}
}
}
export async function closePage(page: Page) {
if (!config.browser.lowBandwidth) {
await disableBlockerInPage(page);
}
await page.close();
}
export async function getRandomUserAgent(): Promise<string> {
const deprecatedUserAgent = (process.env.USER_AGENT
? process.env.USER_AGENT.includes('\n')
? process.env.USER_AGENT.split('\n')
: process.env.USER_AGENT.split(',')
: []
).map((s) => s.trim());
if (deprecatedUserAgent.length > 0) {
return deprecatedUserAgent[
Math.floor(Math.random() * deprecatedUserAgent.length)
];
}
const userAgent =
topUserAgents[Math.floor(Math.random() * topUserAgents.length)];
logger.debug('user agent', {userAgent});
return userAgent;
}