forked from berstend/puppeteer-extra
-
Notifications
You must be signed in to change notification settings - Fork 0
/
index.js
155 lines (146 loc) · 4.82 KB
/
index.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
'use strict'
const { PuppeteerExtraPlugin } = require('puppeteer-extra-plugin')
/**
* Stealth mode: Applies various techniques to make detection of headless puppeteer harder. 💯
*
* ### Purpose
* There are a couple of ways the use of puppeteer can easily be detected by a target website.
* The addition of `HeadlessChrome` to the user-agent being only the most obvious one.
*
* The goal of this plugin is to be the definitive companion to puppeteer to avoid
* detection, applying new techniques as they surface.
*
* As this cat & mouse game is in its infancy and fast-paced, the plugin
* is kept as flexible as possible, to support quick testing and iterations.
*
* ### Modularity
* This plugin uses `puppeteer-extra`'s dependency system to only require
* code mods for evasions that have been enabled, to keep things modular and efficient.
*
* The `stealth` plugin is a convenience wrapper that requires multiple [evasion techniques](./evasions/)
* automatically and comes with defaults. You could also bypass the main module and require
* specific evasion plugins yourself, if you wish to do so (as they're standalone `puppeteer-extra` plugins):
*
* ```es6
* // bypass main module and require a specific stealth plugin directly:
* puppeteer.use(require('puppeteer-extra-plugin-stealth/evasions/console.debug')())
* ```
*
* ### Contributing
* PRs are welcome! If you want to add a new evasion technique, I suggest you
* look at the [template](./evasions/_template) to kickstart things.
*
* ### Kudos
* Thanks to [Evan Sangaline](https://intoli.com/blog/not-possible-to-block-chrome-headless/) and [Paul Irish](https://github.com/paulirish/headless-cat-n-mouse) for kickstarting the discussion!
*
* ---
*
* @todo
* - white-/blacklist with url globs (make this a generic plugin method?)
* - dynamic whitelist based on function evaluation
*
* @example
* const puppeteer = require('puppeteer-extra')
* // Enable stealth plugin with all evasions
* puppeteer.use(require('puppeteer-extra-plugin-stealth')())
*
*
* ;(async () => {
* // Launch the browser in headless mode and set up a page.
* const browser = await puppeteer.launch({ args: ['--no-sandbox'], headless: true })
* const page = await browser.newPage()
*
* // Navigate to the page that will perform the tests.
* const testUrl = 'https://intoli.com/blog/' +
* 'not-possible-to-block-chrome-headless/chrome-headless-test.html'
* await page.goto(testUrl)
*
* // Save a screenshot of the results.
* const screenshotPath = '/tmp/headless-test-result.png'
* await page.screenshot({path: screenshotPath})
* console.log('have a look at the screenshot:', screenshotPath)
*
* await browser.close()
* })()
*
* @param {Object} opts - Options
* @param {Set<string>} [opts.enabledEvasions] - Specify which evasions to use (by default all)
*
*/
class Plugin extends PuppeteerExtraPlugin {
  // `opts` falls back to an empty object before being handed to the base class.
  constructor (opts = {}) {
    super(opts)
  }

  /**
   * Name of this plugin. Also used as the prefix of the dependency
   * identifiers built in `dependencies`.
   */
  get name () {
    return 'stealth'
  }

  /**
   * Default options of the plugin.
   *
   * Every access builds new Set instances, and `enabledEvasions` is a
   * separate copy, so changing it does not affect `availableEvasions`.
   */
  get defaults () {
    const evasionNames = [
      'chrome.runtime',
      'console.debug',
      'navigator.languages',
      'navigator.permissions',
      'navigator.webdriver',
      'navigator.plugins',
      'iframe.contentWindow',
      'window.outerdimensions',
      'webgl.vendor',
      'user-agent'
    ]
    const availableEvasions = new Set(evasionNames)
    // All available evasions are enabled unless configured otherwise
    const enabledEvasions = new Set(availableEvasions)
    return { availableEvasions, enabledEvasions }
  }

  /**
   * Lists the evasion plugins to be required, based on configuration.
   *
   * Produces one identifier per enabled evasion, in the form
   * `<plugin name>/evasions/<evasion name>`.
   *
   * @private
   */
  get dependencies () {
    const required = new Set()
    for (const evasion of this.opts.enabledEvasions) {
      required.add(`${this.name}/evasions/${evasion}`)
    }
    return required
  }

  /**
   * All evasions this plugin knows about.
   *
   * The [evasions directory](./evasions/) holds the up to date list.
   * The value is taken from `defaults`, so each access yields a new Set.
   *
   * @type {Set<string>} - A Set of all available evasions.
   *
   * @example
   * const pluginStealth = require('puppeteer-extra-plugin-stealth')()
   * console.log(pluginStealth.availableEvasions) // => Set { 'user-agent', 'console.debug' }
   * puppeteer.use(pluginStealth)
   */
  get availableEvasions () {
    const { availableEvasions } = this.defaults
    return availableEvasions
  }

  /**
   * The evasions that are currently enabled.
   *
   * Configure them either by passing `opts` or by modifying this property.
   *
   * @type {Set<string>} - A Set of all enabled evasions.
   *
   * @example
   * // Remove specific evasion from enabled ones dynamically
   * const pluginStealth = require('puppeteer-extra-plugin-stealth')()
   * pluginStealth.enabledEvasions.delete('console.debug')
   * puppeteer.use(pluginStealth)
   */
  get enabledEvasions () {
    const { enabledEvasions } = this.opts
    return enabledEvasions
  }

  /**
   * Replaces the enabled evasions stored in `opts`.
   *
   * @private
   */
  set enabledEvasions (evasions) {
    this.opts.enabledEvasions = evasions
  }
}
module.exports = function (pluginConfig) {
return new Plugin(pluginConfig)
}