Files
go-extractor/stealth_test.go
Steve Dudenhoeffer 4772b153b8
All checks were successful
CI / build (pull_request) Successful in 30s
CI / vet (pull_request) Successful in 2m17s
CI / test (pull_request) Successful in 2m21s
fix: randomize hardware fingerprint values across browser sessions
Replace static stealthChromiumScripts and stealthFirefoxScripts slices
with builder functions that accept hardware profile structs. Each browser
session now randomly selects from a pool of 6 realistic profiles per
engine, and Chromium connection stats receive per-session jitter (±20ms
RTT, ±2 Mbps downlink). This prevents anti-bot systems from correlating
sessions via identical WebGL, connection, mozInnerScreen, and
hardwareConcurrency fingerprints.

Closes #71

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-24 01:38:14 +00:00

534 lines
16 KiB
Go

package extractor
import (
"strings"
"testing"
)
func TestMergeOptions_StealthDefault(t *testing.T) {
base := BrowserOptions{Stealth: Bool(true)}
got := mergeOptions(base, nil)
if got.Stealth == nil || !*got.Stealth {
t.Fatal("expected stealth to default to true")
}
}
// TestMergeOptions_StealthOverrideFalse checks that an override carrying
// Stealth=false replaces a base Stealth=true in the merged result.
func TestMergeOptions_StealthOverrideFalse(t *testing.T) {
	defaults := BrowserOptions{Stealth: Bool(true)}
	overrides := []BrowserOptions{{Stealth: Bool(false)}}

	merged := mergeOptions(defaults, overrides)
	if merged.Stealth != nil && !*merged.Stealth {
		return
	}
	t.Fatal("expected stealth to be overridden to false")
}
func TestMergeOptions_LaunchArgsAppend(t *testing.T) {
base := BrowserOptions{LaunchArgs: []string{"--arg1"}}
got := mergeOptions(base, []BrowserOptions{{LaunchArgs: []string{"--arg2", "--arg3"}}})
if len(got.LaunchArgs) != 3 {
t.Fatalf("expected 3 launch args, got %d", len(got.LaunchArgs))
}
if got.LaunchArgs[0] != "--arg1" || got.LaunchArgs[1] != "--arg2" || got.LaunchArgs[2] != "--arg3" {
t.Fatalf("unexpected launch args: %v", got.LaunchArgs)
}
}
func TestMergeOptions_InitScriptsAppend(t *testing.T) {
base := BrowserOptions{InitScripts: []string{"script1"}}
got := mergeOptions(base, []BrowserOptions{{InitScripts: []string{"script2"}}})
if len(got.InitScripts) != 2 {
t.Fatalf("expected 2 init scripts, got %d", len(got.InitScripts))
}
if got.InitScripts[0] != "script1" || got.InitScripts[1] != "script2" {
t.Fatalf("unexpected init scripts: %v", got.InitScripts)
}
}
// TestMergeOptions_StealthNilDoesNotOverride checks that an override whose
// Stealth pointer is nil leaves the base Stealth=true untouched.
func TestMergeOptions_StealthNilDoesNotOverride(t *testing.T) {
	defaults := BrowserOptions{Stealth: Bool(true)}
	overrides := []BrowserOptions{{Stealth: nil}}

	merged := mergeOptions(defaults, overrides)
	if stealth := merged.Stealth; stealth != nil && *stealth {
		return
	}
	t.Fatal("expected stealth to remain true when override is nil")
}
// TestStealthChromiumArgs checks that the Chromium stealth launch args are
// non-empty and include the flag disabling the AutomationControlled blink
// feature.
func TestStealthChromiumArgs(t *testing.T) {
	if len(stealthChromiumArgs) == 0 {
		t.Fatal("expected at least one chromium stealth arg")
	}
	for i := range stealthChromiumArgs {
		if stealthChromiumArgs[i] == "--disable-blink-features=AutomationControlled" {
			return
		}
	}
	t.Fatal("expected --disable-blink-features=AutomationControlled in stealth chromium args")
}
// --- Common scripts ---
// TestStealthCommonScripts_Count pins the number of engine-independent
// stealth scripts at exactly 4.
func TestStealthCommonScripts_Count(t *testing.T) {
	if n := len(stealthCommonScripts); n != 4 {
		t.Fatalf("expected 4 common stealth scripts, got %d", n)
	}
}
// TestStealthCommonScripts_WebdriverOverride checks that at least one common
// script mentions both "navigator" and "webdriver".
func TestStealthCommonScripts_WebdriverOverride(t *testing.T) {
	for _, js := range stealthCommonScripts {
		if strings.Contains(js, "navigator") && strings.Contains(js, "webdriver") {
			return
		}
	}
	t.Fatal("expected a common script that overrides navigator.webdriver")
}
// TestStealthCommonScripts_OuterDimensions checks that at least one common
// script mentions both "outerWidth" and "outerHeight".
func TestStealthCommonScripts_OuterDimensions(t *testing.T) {
	for _, js := range stealthCommonScripts {
		if strings.Contains(js, "outerWidth") && strings.Contains(js, "outerHeight") {
			return
		}
	}
	t.Fatal("expected a common script that fixes outerWidth/outerHeight")
}
// TestStealthCommonScripts_PermissionsQuery checks that at least one common
// script mentions both "permissions.query" and "notifications".
func TestStealthCommonScripts_PermissionsQuery(t *testing.T) {
	for _, js := range stealthCommonScripts {
		if strings.Contains(js, "permissions.query") && strings.Contains(js, "notifications") {
			return
		}
	}
	t.Fatal("expected a common script that overrides permissions.query for notifications")
}
// TestStealthCommonScripts_Notification checks that at least one common
// script mentions both "Notification" and "requestPermission".
func TestStealthCommonScripts_Notification(t *testing.T) {
	for _, js := range stealthCommonScripts {
		if strings.Contains(js, "Notification") && strings.Contains(js, "requestPermission") {
			return
		}
	}
	t.Fatal("expected a common script that stubs Notification constructor")
}
// --- Chromium scripts ---
// TestStealthChromiumScripts_Count pins the number of scripts built for the
// first Chromium hardware profile at exactly 8.
func TestStealthChromiumScripts_Count(t *testing.T) {
	if n := len(buildChromiumStealthScripts(chromiumHWProfiles[0])); n != 8 {
		t.Fatalf("expected 8 chromium stealth scripts, got %d", n)
	}
}
// TestStealthChromiumScripts_Plugins checks that a Chromium script mentions
// "Chrome PDF Plugin", "navigator" and "plugins" together.
func TestStealthChromiumScripts_Plugins(t *testing.T) {
	matches := func(js string) bool {
		return strings.Contains(js, "Chrome PDF Plugin") &&
			strings.Contains(js, "navigator") &&
			strings.Contains(js, "plugins")
	}
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if matches(js) {
			return
		}
	}
	t.Fatal("expected a chromium script that populates navigator.plugins with Chrome entries")
}
// TestStealthChromiumScripts_MimeTypes checks that a Chromium script mentions
// both "mimeTypes" and "application/pdf".
func TestStealthChromiumScripts_MimeTypes(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "mimeTypes") && strings.Contains(js, "application/pdf") {
			return
		}
	}
	t.Fatal("expected a chromium script that populates navigator.mimeTypes")
}
// TestStealthChromiumScripts_WindowChrome checks that a Chromium script
// mentions both "window.chrome" and "runtime".
func TestStealthChromiumScripts_WindowChrome(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "window.chrome") && strings.Contains(js, "runtime") {
			return
		}
	}
	t.Fatal("expected a chromium script that stubs window.chrome")
}
// TestStealthChromiumScripts_ChromeApp checks that a single Chromium script
// mentions "chrome.app", "chrome.csi" and "chrome.loadTimes".
func TestStealthChromiumScripts_ChromeApp(t *testing.T) {
	matches := func(js string) bool {
		return strings.Contains(js, "chrome.app") &&
			strings.Contains(js, "chrome.csi") &&
			strings.Contains(js, "chrome.loadTimes")
	}
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if matches(js) {
			return
		}
	}
	t.Fatal("expected a chromium script that stubs chrome.app, chrome.csi, and chrome.loadTimes")
}
// TestStealthChromiumScripts_WebGLSpoof checks that a Chromium script
// mentions both "37446" and "ANGLE".
func TestStealthChromiumScripts_WebGLSpoof(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "37446") && strings.Contains(js, "ANGLE") {
			return
		}
	}
	t.Fatal("expected a chromium script that spoofs WebGL renderer with ANGLE strings")
}
// TestStealthChromiumScripts_NavigatorConnection checks that a Chromium
// script mentions both "connection" and "effectiveType".
func TestStealthChromiumScripts_NavigatorConnection(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "connection") && strings.Contains(js, "effectiveType") {
			return
		}
	}
	t.Fatal("expected a chromium script that stubs navigator.connection")
}
// TestStealthChromiumScripts_CDPCleanup checks that a Chromium script
// mentions both "cdc_" and "delete".
func TestStealthChromiumScripts_CDPCleanup(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "cdc_") && strings.Contains(js, "delete") {
			return
		}
	}
	t.Fatal("expected a chromium script that cleans up CDP artifacts")
}
// TestStealthChromiumScripts_UserAgentStrip checks that a Chromium script
// mentions both "HeadlessChrome" and "userAgent".
func TestStealthChromiumScripts_UserAgentStrip(t *testing.T) {
	for _, js := range buildChromiumStealthScripts(chromiumHWProfiles[0]) {
		if strings.Contains(js, "HeadlessChrome") && strings.Contains(js, "userAgent") {
			return
		}
	}
	t.Fatal("expected a chromium script that strips HeadlessChrome from user agent")
}
// --- Firefox scripts ---
// TestStealthFirefoxScripts_Count pins the number of scripts built for the
// first Firefox hardware profile at exactly 5.
func TestStealthFirefoxScripts_Count(t *testing.T) {
	if n := len(buildFirefoxStealthScripts(firefoxHWProfiles[0])); n != 5 {
		t.Fatalf("expected 5 firefox stealth scripts, got %d", n)
	}
}
// TestStealthFirefoxScripts_WebdriverHardening checks that a Firefox script
// mentions both "getOwnPropertyDescriptor" and "webdriver".
func TestStealthFirefoxScripts_WebdriverHardening(t *testing.T) {
	for _, js := range buildFirefoxStealthScripts(firefoxHWProfiles[0]) {
		if strings.Contains(js, "getOwnPropertyDescriptor") && strings.Contains(js, "webdriver") {
			return
		}
	}
	t.Fatal("expected a firefox script that hardens navigator.webdriver via getOwnPropertyDescriptor")
}
// TestStealthFirefoxScripts_WebGLSpoof checks that a Firefox script mentions
// both "37446" and "Mesa DRI".
func TestStealthFirefoxScripts_WebGLSpoof(t *testing.T) {
	for _, js := range buildFirefoxStealthScripts(firefoxHWProfiles[0]) {
		if strings.Contains(js, "37446") && strings.Contains(js, "Mesa DRI") {
			return
		}
	}
	t.Fatal("expected a firefox script that spoofs WebGL renderer with Mesa strings")
}
// TestStealthFirefoxScripts_MozInnerScreen checks that a Firefox script
// mentions both "mozInnerScreenX" and "mozInnerScreenY".
func TestStealthFirefoxScripts_MozInnerScreen(t *testing.T) {
	for _, js := range buildFirefoxStealthScripts(firefoxHWProfiles[0]) {
		if strings.Contains(js, "mozInnerScreenX") && strings.Contains(js, "mozInnerScreenY") {
			return
		}
	}
	t.Fatal("expected a firefox script that spoofs mozInnerScreenX/mozInnerScreenY")
}
// TestStealthFirefoxScripts_HardwareConcurrency checks that a Firefox script
// mentions "hardwareConcurrency".
func TestStealthFirefoxScripts_HardwareConcurrency(t *testing.T) {
	for _, js := range buildFirefoxStealthScripts(firefoxHWProfiles[0]) {
		if strings.Contains(js, "hardwareConcurrency") {
			return
		}
	}
	t.Fatal("expected a firefox script that normalizes navigator.hardwareConcurrency")
}
// TestStealthFirefoxScripts_PDFjsPlugins checks that a Firefox script
// mentions both "PDF.js" and "plugins".
func TestStealthFirefoxScripts_PDFjsPlugins(t *testing.T) {
	for _, js := range buildFirefoxStealthScripts(firefoxHWProfiles[0]) {
		if strings.Contains(js, "PDF.js") && strings.Contains(js, "plugins") {
			return
		}
	}
	t.Fatal("expected a firefox script that provides PDF.js plugin entry")
}
// --- Cross-category validation ---
// TestStealthScripts_NoOverlap checks that no script text is shared between
// the common, Chromium and Firefox script sets (built from the first profile
// of each engine).
//
// Common scripts seed the ownership map; Chromium scripts are checked against
// it and then recorded; Firefox scripts are checked against it but are not
// themselves recorded.
func TestStealthScripts_NoOverlap(t *testing.T) {
	fromChromium := buildChromiumStealthScripts(chromiumHWProfiles[0])
	fromFirefox := buildFirefoxStealthScripts(firefoxHWProfiles[0])

	// owner maps script text to the category that first claimed it.
	owner := map[string]string{}
	for _, js := range stealthCommonScripts {
		owner[js] = "common"
	}

	for _, js := range fromChromium {
		if prev, dup := owner[js]; dup {
			t.Fatalf("chromium script also appears in %s category", prev)
		}
		owner[js] = "chromium"
	}

	for _, js := range fromFirefox {
		if prev, dup := owner[js]; dup {
			t.Fatalf("firefox script also appears in %s category", prev)
		}
	}
}
// TestStealthCommonScripts_NoChromiumMarkers fails if any common script
// contains one of the substrings this file treats as Chromium-specific.
func TestStealthCommonScripts_NoChromiumMarkers(t *testing.T) {
	forbidden := []string{
		"window.chrome",
		"chrome.app",
		"chrome.csi",
		"chrome.loadTimes",
		"HeadlessChrome",
		"cdc_",
		"Chrome PDF Plugin",
		"ANGLE",
	}
	for _, js := range stealthCommonScripts {
		for i := range forbidden {
			if strings.Contains(js, forbidden[i]) {
				t.Fatalf("common script contains Chromium-specific marker %q", forbidden[i])
			}
		}
	}
}
// TestStealthCommonScripts_NoFirefoxMarkers fails if any common script
// contains one of the substrings this file treats as Firefox-specific.
func TestStealthCommonScripts_NoFirefoxMarkers(t *testing.T) {
	forbidden := []string{
		"mozInnerScreen",
		"Mesa DRI",
		"PDF.js",
	}
	for _, js := range stealthCommonScripts {
		for i := range forbidden {
			if strings.Contains(js, forbidden[i]) {
				t.Fatalf("common script contains Firefox-specific marker %q", forbidden[i])
			}
		}
	}
}
// TestStealthChromiumScripts_NoFirefoxMarkers fails if any script built for
// the first Chromium profile contains one of the substrings this file treats
// as Firefox-specific.
func TestStealthChromiumScripts_NoFirefoxMarkers(t *testing.T) {
	built := buildChromiumStealthScripts(chromiumHWProfiles[0])
	forbidden := []string{
		"mozInnerScreen",
		"Mesa DRI",
		"PDF.js",
	}
	for _, js := range built {
		for i := range forbidden {
			if strings.Contains(js, forbidden[i]) {
				t.Fatalf("chromium script contains Firefox-specific marker %q", forbidden[i])
			}
		}
	}
}
// TestStealthFirefoxScripts_NoChromiumMarkers fails if any script built for
// the first Firefox profile contains one of the substrings this file treats
// as Chromium-specific.
func TestStealthFirefoxScripts_NoChromiumMarkers(t *testing.T) {
	built := buildFirefoxStealthScripts(firefoxHWProfiles[0])
	forbidden := []string{
		"window.chrome",
		"chrome.app",
		"chrome.csi",
		"chrome.loadTimes",
		"HeadlessChrome",
		"cdc_",
		"Chrome PDF Plugin",
		"ANGLE",
	}
	for _, js := range built {
		for i := range forbidden {
			if strings.Contains(js, forbidden[i]) {
				t.Fatalf("firefox script contains Chromium-specific marker %q", forbidden[i])
			}
		}
	}
}
// --- User-Agent constants ---
// TestDefaultUserAgent_BackwardCompat requires DefaultUserAgent to be equal
// to DefaultFirefoxUserAgent.
func TestDefaultUserAgent_BackwardCompat(t *testing.T) {
	if DefaultUserAgent == DefaultFirefoxUserAgent {
		return
	}
	t.Fatal("DefaultUserAgent must equal DefaultFirefoxUserAgent for backward compatibility")
}
// TestDefaultFirefoxUserAgent_Content requires the Firefox user agent to
// contain "Firefox" and not contain "Chrome".
func TestDefaultFirefoxUserAgent_Content(t *testing.T) {
	switch {
	case !strings.Contains(DefaultFirefoxUserAgent, "Firefox"):
		t.Fatal("DefaultFirefoxUserAgent must contain 'Firefox'")
	case strings.Contains(DefaultFirefoxUserAgent, "Chrome"):
		t.Fatal("DefaultFirefoxUserAgent must not contain 'Chrome'")
	}
}
// TestDefaultChromiumUserAgent_Content requires the Chromium user agent to
// contain "Chrome" and not contain "Firefox".
func TestDefaultChromiumUserAgent_Content(t *testing.T) {
	switch {
	case !strings.Contains(DefaultChromiumUserAgent, "Chrome"):
		t.Fatal("DefaultChromiumUserAgent must contain 'Chrome'")
	case strings.Contains(DefaultChromiumUserAgent, "Firefox"):
		t.Fatal("DefaultChromiumUserAgent must not contain 'Firefox'")
	}
}
// --- Viewport and UA defaults via mergeOptions ---
func TestMergeOptions_DefaultViewport(t *testing.T) {
base := BrowserOptions{
Dimensions: Size{Width: 1920, Height: 1080},
}
got := mergeOptions(base, nil)
if got.Dimensions.Width != 1920 || got.Dimensions.Height != 1080 {
t.Fatalf("expected default viewport 1920x1080, got %dx%d", got.Dimensions.Width, got.Dimensions.Height)
}
}
// TestMergeOptions_ViewportOverride checks that an override viewport of
// 1280x720 replaces a 1920x1080 base viewport.
func TestMergeOptions_ViewportOverride(t *testing.T) {
	defaults := BrowserOptions{Dimensions: Size{Width: 1920, Height: 1080}}
	overrides := []BrowserOptions{{Dimensions: Size{Width: 1280, Height: 720}}}

	merged := mergeOptions(defaults, overrides)

	w, h := merged.Dimensions.Width, merged.Dimensions.Height
	if w == 1280 && h == 720 {
		return
	}
	t.Fatalf("expected overridden viewport 1280x720, got %dx%d", w, h)
}
// TestMergeOptions_EmptyUANotOverridden checks that selecting Chromium in an
// override, without setting a user agent, leaves the merged UserAgent empty.
func TestMergeOptions_EmptyUANotOverridden(t *testing.T) {
	overrides := []BrowserOptions{{Browser: BrowserChromium}}

	merged := mergeOptions(BrowserOptions{}, overrides)
	if ua := merged.UserAgent; ua != "" {
		t.Fatalf("expected empty UserAgent after merge with no explicit UA, got %q", ua)
	}
}
func TestMergeOptions_ExplicitUAPreserved(t *testing.T) {
base := BrowserOptions{}
customUA := "MyCustomAgent/1.0"
got := mergeOptions(base, []BrowserOptions{{UserAgent: customUA}})
if got.UserAgent != customUA {
t.Fatalf("expected explicit UA %q preserved, got %q", customUA, got.UserAgent)
}
}
// --- Hardware profile pools ---
// TestChromiumHWProfiles_NotEmpty requires the Chromium hardware profile pool
// to hold at least 2 entries.
func TestChromiumHWProfiles_NotEmpty(t *testing.T) {
	if n := len(chromiumHWProfiles); n < 2 {
		t.Fatalf("expected at least 2 chromium hardware profiles, got %d", n)
	}
}
// TestFirefoxHWProfiles_NotEmpty requires the Firefox hardware profile pool
// to hold at least 2 entries.
func TestFirefoxHWProfiles_NotEmpty(t *testing.T) {
	if n := len(firefoxHWProfiles); n < 2 {
		t.Fatalf("expected at least 2 firefox hardware profiles, got %d", n)
	}
}
// TestBuildChromiumStealthScripts_ProfileValues checks that the WebGL vendor
// and renderer strings of the second Chromium hardware profile appear
// somewhere in the scripts built from that profile.
//
// The pool length is verified first so that a shortened pool produces an
// ordinary test failure rather than an index-out-of-range panic, which would
// abort every other test in the package.
func TestBuildChromiumStealthScripts_ProfileValues(t *testing.T) {
	if len(chromiumHWProfiles) < 2 {
		t.Fatalf("need at least 2 chromium hardware profiles for this test, got %d", len(chromiumHWProfiles))
	}
	p := chromiumHWProfiles[1] // NVIDIA profile
	scripts := buildChromiumStealthScripts(p)
	joined := strings.Join(scripts, "\n")
	if !strings.Contains(joined, p.WebGLVendor) {
		t.Fatalf("expected chromium scripts to contain vendor %q", p.WebGLVendor)
	}
	if !strings.Contains(joined, p.WebGLRenderer) {
		t.Fatalf("expected chromium scripts to contain renderer %q", p.WebGLRenderer)
	}
}
// TestBuildFirefoxStealthScripts_ProfileValues checks that the WebGL vendor
// and renderer strings of the third Firefox hardware profile appear somewhere
// in the scripts built from that profile.
//
// The pool length is verified first so that a pool with fewer than three
// entries produces an ordinary test failure rather than an
// index-out-of-range panic, which would abort every other test in the
// package.
func TestBuildFirefoxStealthScripts_ProfileValues(t *testing.T) {
	if len(firefoxHWProfiles) < 3 {
		t.Fatalf("need at least 3 firefox hardware profiles for this test, got %d", len(firefoxHWProfiles))
	}
	p := firefoxHWProfiles[2] // AMD profile
	scripts := buildFirefoxStealthScripts(p)
	joined := strings.Join(scripts, "\n")
	if !strings.Contains(joined, p.WebGLVendor) {
		t.Fatalf("expected firefox scripts to contain vendor %q", p.WebGLVendor)
	}
	if !strings.Contains(joined, p.WebGLRenderer) {
		t.Fatalf("expected firefox scripts to contain renderer %q", p.WebGLRenderer)
	}
}
// TestBuildChromiumStealthScripts_ConnectionJitter builds the Chromium
// stealth scripts 50 times from the same hardware profile and requires the
// navigator.connection script to differ between at least two of the builds.
//
// The connection script is located by content ("connection" and
// "effectiveType") instead of a fixed slice index, so reordering or
// shortening the script list yields a clear failure rather than a panic or a
// comparison of the wrong script.
func TestBuildChromiumStealthScripts_ConnectionJitter(t *testing.T) {
	p := chromiumHWProfiles[0]
	seen := make(map[string]bool)
	for range 50 {
		conn, ok := "", false
		for _, s := range buildChromiumStealthScripts(p) {
			if strings.Contains(s, "connection") && strings.Contains(s, "effectiveType") {
				conn, ok = s, true
				break
			}
		}
		if !ok {
			t.Fatal("expected a chromium script that stubs navigator.connection")
		}
		seen[conn] = true
	}
	if len(seen) < 2 {
		t.Fatal("expected connection script to vary across calls due to jitter, but all 50 were identical")
	}
}
// TestChromiumHWProfiles_NoSingleQuotes fails if any Chromium hardware
// profile has a single quote in its WebGL vendor or renderer string. Vendor
// is checked before renderer for each profile.
func TestChromiumHWProfiles_NoSingleQuotes(t *testing.T) {
	for idx := range chromiumHWProfiles {
		profile := chromiumHWProfiles[idx]
		switch {
		case strings.ContainsRune(profile.WebGLVendor, '\''):
			t.Fatalf("chromium profile %d vendor contains single quote (breaks JS)", idx)
		case strings.ContainsRune(profile.WebGLRenderer, '\''):
			t.Fatalf("chromium profile %d renderer contains single quote (breaks JS)", idx)
		}
	}
}
// TestFirefoxHWProfiles_NoSingleQuotes fails if any Firefox hardware profile
// has a single quote in its WebGL vendor or renderer string. Vendor is
// checked before renderer for each profile.
func TestFirefoxHWProfiles_NoSingleQuotes(t *testing.T) {
	for idx := range firefoxHWProfiles {
		profile := firefoxHWProfiles[idx]
		switch {
		case strings.ContainsRune(profile.WebGLVendor, '\''):
			t.Fatalf("firefox profile %d vendor contains single quote (breaks JS)", idx)
		case strings.ContainsRune(profile.WebGLRenderer, '\''):
			t.Fatalf("firefox profile %d renderer contains single quote (breaks JS)", idx)
		}
	}
}