Initial commit

This commit is contained in:
Z User
2026-06-06 05:21:10 +00:00
Unverified
commit 6664758a6d
493 changed files with 135653 additions and 0 deletions

View File

@@ -0,0 +1,153 @@
#!/usr/bin/env node
/**
* 使用 Playwright 获取 JS 渲染后的完整 DOM 和 WebGL 元数据
*
* Usage:
* node fetch-rendered-dom.mjs <URL> [outDir]
*
* 首次运行会自动安装 playwright 到 ~/.cache/playwright-runner/
*
* 输出到 outDir (默认 /tmp/rendered):
* dom.html — 完整渲染后 HTML
* canvas-info.json — 所有 canvas 元素的信息
* webgl-info.json — WebGL 上下文元数据
* console.log — 页面 console 输出
* screenshot.png — 页面截图
* network.json — 运行时加载的 JS/资源 URL
*/
import { execSync } from 'child_process';
import { existsSync, writeFileSync, mkdirSync } from 'fs';
import { join } from 'path';
import { homedir } from 'os';
const url = process.argv[2];
const outDir = process.argv[3] || '/tmp/rendered';
if (!url) {
console.error('Usage: node fetch-rendered-dom.mjs <URL> [outDir]');
process.exit(1);
}
// Auto-install playwright to a persistent cache directory
const runnerDir = join(homedir(), '.cache', 'playwright-runner');
const pwDir = join(runnerDir, 'node_modules', 'playwright');
const chromiumMarker = join(runnerDir, '.chromium-installed');
if (!existsSync(pwDir)) {
console.log('Installing playwright (one-time setup)...');
mkdirSync(runnerDir, { recursive: true });
writeFileSync(join(runnerDir, 'package.json'), '{"type":"module"}');
try {
execSync('npm install playwright', { cwd: runnerDir, stdio: 'inherit' });
} catch {
console.log('npm install failed, retrying with registry mirror...');
execSync('npm install playwright --registry=https://registry.npmmirror.com', { cwd: runnerDir, stdio: 'inherit' });
}
}
if (!existsSync(chromiumMarker)) {
console.log('Installing chromium browser...');
try {
execSync('npx playwright install chromium', { cwd: runnerDir, stdio: 'inherit' });
} catch {
console.log('Chromium download failed, retrying with mirror...');
execSync('PLAYWRIGHT_DOWNLOAD_HOST=https://npmmirror.com/mirrors/playwright npx playwright install chromium', { cwd: runnerDir, stdio: 'inherit' });
}
writeFileSync(chromiumMarker, new Date().toISOString());
}
// Dynamic import from the cached location
const pw = await import(join(pwDir, 'index.mjs'));
const { chromium } = pw;
mkdirSync(outDir, { recursive: true });
const consoleLogs = [];
const networkRequests = [];
const browser = await chromium.launch({ headless: true });
const context = await browser.newContext({
viewport: { width: 1920, height: 1080 },
deviceScaleFactor: 2,
});
const page = await context.newPage();
// Capture console
page.on('console', msg => {
consoleLogs.push(`[${msg.type()}] ${msg.text()}`);
});
// Capture network (JS, WASM, bin, glsl, image files)
page.on('response', async response => {
const reqUrl = response.url();
const type = response.headers()['content-type'] || '';
if (/\.(js|mjs|wasm|bin|glsl|frag|vert|svg)(\?|$)/.test(reqUrl) || type.includes('javascript')) {
networkRequests.push({
url: reqUrl,
status: response.status(),
type: type.split(';')[0],
size: parseInt(response.headers()['content-length'] || '0'),
});
}
});
console.log(`Navigating to ${url} ...`);
await page.goto(url, { waitUntil: 'networkidle', timeout: 30000 });
// Wait for WebGL initialization
await page.waitForTimeout(3000);
// 1. Full rendered DOM
const html = await page.content();
writeFileSync(join(outDir, 'dom.html'), html);
console.log(`dom.html — ${html.length} bytes`);
// 2. Canvas info
const canvasInfo = await page.evaluate(() => {
return Array.from(document.querySelectorAll('canvas')).map((c, i) => ({
index: i,
outerHTML: c.outerHTML.slice(0, 500),
width: c.width,
height: c.height,
clientWidth: c.clientWidth,
clientHeight: c.clientHeight,
dataEngine: c.dataset.engine || null,
id: c.id || null,
className: c.className || null,
parentTag: c.parentElement?.tagName || null,
parentClass: c.parentElement?.className?.slice(0, 100) || null,
}));
});
writeFileSync(join(outDir, 'canvas-info.json'), JSON.stringify(canvasInfo, null, 2));
console.log(`canvas-info.json — ${canvasInfo.length} canvas(es) found`);
// 3. WebGL info
const webglInfo = await page.evaluate(() => {
const canvas = document.querySelector('canvas');
if (!canvas) return { error: 'no canvas found' };
// Don't create new context, just report what we can
return {
found: true,
width: canvas.width,
height: canvas.height,
dataEngine: canvas.dataset.engine || null,
};
});
writeFileSync(join(outDir, 'webgl-info.json'), JSON.stringify(webglInfo, null, 2));
console.log(`webgl-info.json — ${JSON.stringify(webglInfo).slice(0, 100)}`);
// 4. Console logs
writeFileSync(join(outDir, 'console.log'), consoleLogs.join('\n'));
console.log(`console.log — ${consoleLogs.length} entries`);
// 5. Screenshot
await page.screenshot({ path: join(outDir, 'screenshot.png'), fullPage: false });
console.log(`screenshot.png — saved`);
// 6. Network requests
writeFileSync(join(outDir, 'network.json'), JSON.stringify(networkRequests, null, 2));
console.log(`network.json — ${networkRequests.length} JS/resource requests captured`);
await browser.close();
console.log(`\nDone. Files saved to ${outDir}`);

View File

@@ -0,0 +1,76 @@
#!/bin/bash
# Scan JS bundle(s) for WebGL/shader keywords and report tech stack
# Usage: scan-bundle.sh <file1.js> [file2.js ...]
# Output: keyword counts + tech stack guess
set -eu
if [ $# -eq 0 ]; then
echo "Usage: scan-bundle.sh <file1.js> [file2.js ...]"
echo "Scans JS files for WebGL/shader keywords and identifies tech stack."
exit 1
fi
FILES=("$@")
echo "=== SHADER/WEBGL KEYWORD SCAN ==="
echo ""
# Core GLSL keywords
echo "--- GLSL Keywords ---"
for kw in "gl_FragColor" "gl_Position" "gl_PointSize" "gl_PointCoord" \
"precision" "uniform" "varying" "attribute" \
"FRAGMENT_SHADER" "VERTEX_SHADER" "createShader" \
"sampler2D" "texture2D" "smoothstep" "discard"; do
count=$(grep -o "$kw" "${FILES[@]}" 2>/dev/null | wc -l | tr -d ' ')
[ "$count" -gt 0 ] && printf " %-25s %s\n" "$kw" "$count" || true
done
echo ""
echo "--- WebGL/Canvas Keywords ---"
for kw in "canvas" "webgl" "webgl2" "getContext" "shader" "glsl" \
"framebuffer" "renderbuffer" "drawArrays" "drawElements" \
"bufferData" "texImage2D" "POINTS"; do
count=$(grep -oi "$kw" "${FILES[@]}" 2>/dev/null | wc -l | tr -d ' ')
[ "$count" -gt 0 ] && printf " %-25s %s\n" "$kw" "$count" || true
done
echo ""
echo "--- Noise/Math Keywords ---"
for kw in "snoise" "simplex" "perlin" "noise" "PoissonDisk" "Poisson"; do
count=$(grep -o "$kw" "${FILES[@]}" 2>/dev/null | wc -l | tr -d ' ')
[ "$count" -gt 0 ] && printf " %-25s %s\n" "$kw" "$count" || true
done
echo ""
echo "=== TECH STACK DETECTION ==="
detect() {
local label="$1" pattern="$2"
local count
count=$(grep -oE "$pattern" "${FILES[@]}" 2>/dev/null | wc -l | tr -d ' ')
[ "$count" -gt 0 ] && printf " %-25s %s hits\n" "$label" "$count" || true
}
# Frameworks (patterns specific enough to avoid false positives)
detect "Three.js" "THREE\.|WebGLRenderer|ShaderMaterial|BufferGeometry|PerspectiveCamera|OrthographicCamera"
detect "Three.js (minified)" "setRenderTarget|DataTexture|setPixelRatio|setClearColor"
detect "PixiJS" "PIXI\.|pixi\.js|PixiJS"
detect "Babylon.js" "BABYLON\.|babylonjs"
detect "Raw WebGL" "gl\.bindBuffer|gl\.bindTexture|gl\.useProgram|gl\.attachShader|gl\.linkProgram"
detect "Regl" "regl\(|regl\.frame|regl\.texture"
detect "OGL" "ogl\.|ogl/"
# Patterns
detect "GPGPU" "setRenderTarget|RenderTarget|ping.pong|gpgpu|GPGPU"
detect "Particles" "gl_PointSize|gl_PointCoord|PointSize|particl"
detect "Post-processing" "EffectComposer|RenderPass|ShaderPass|postprocess"
detect "Ray marching" "rayMarch|sdSphere|sdBox|sdRoundBox"
detect "Instancing" "InstancedMesh|InstancedBufferGeometry|instanceMatrix"
echo ""
echo "=== FILE SIZES ==="
for f in "${FILES[@]}"; do
size=$(wc -c < "$f" | tr -d ' ')
echo " $(basename "$f"): ${size} bytes"
done