
501 lines
13 KiB
Raw Normal View History

2023-08-09 05:55:57 +00:00
import * as tf from '@tensorflow/tfjs';
import { setWasmPaths } from '@tensorflow/tfjs-backend-wasm';
import modelJSON from './model.json';
import ccl from './ccl';
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
const charset = [' ', '0', '2', '4', '5', '8', 'A', 'D', 'G', 'H', 'J', 'K', 'M', 'N', 'P', 'R', 'S', 'T', 'V', 'W', 'X', 'Y'];
let weightsData;
let model;
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Wraps raw WebAssembly bytes in a Blob and returns an object URL pointing at it.
 *
 * @param {BlobPart} wasm - binary contents of a .wasm file
 * @returns {string} an object URL (`blob:` scheme) for the wrapped bytes
 */
const wasmToUrl = wasm => {
  const blb = new Blob([wasm], { type: 'application/wasm' });
  return URL.createObjectURL(blb);
};
/**
 * Promise that settles once the model weights have been read into `weightsData`
 * and the TensorFlow.js WASM backend has been selected.
 *
 * Failures are logged and swallowed, so awaiting this promise never rejects.
 */
const backendloaded = (async () => {
  try {
    // dead code elimination should occur here
    // eslint-disable-next-line camelcase
    if (execution_mode === 'userscript' || execution_mode === 'test') {
      // Bundled build: weights and wasm binaries are imported and served via blob URLs.
      weightsData = (await import('./model.weights.bin')).default;
      const tfwasmthreadedsimd = (await import('./tfjs-backend-wasm-threaded-simd.wasm')).default;
      const tfwasmsimd = (await import('./tfjs-backend-wasm-simd.wasm')).default;
      const tfwasm = (await import('./tfjs-backend-wasm.wasm')).default;
      const args = {
        'tfjs-backend-wasm.wasm': wasmToUrl(tfwasm),
        'tfjs-backend-wasm-simd.wasm': wasmToUrl(tfwasmsimd),
        'tfjs-backend-wasm-threaded-simd.wasm': wasmToUrl(tfwasmthreadedsimd)
      };
      setWasmPaths(args);
    } else {
      // Extension build: everything is fetched from the extension's own URLs.
      weightsData = await (await fetch(chrome.runtime.getURL('./model.weights.bin'))).text();
      const args = {
        'tfjs-backend-wasm.wasm': chrome.runtime.getURL('tfjs-backend-wasm.wasm'),
        'tfjs-backend-wasm-simd.wasm': chrome.runtime.getURL('tfjs-backend-wasm-simd.wasm'),
        'tfjs-backend-wasm-threaded-simd.wasm': chrome.runtime.getURL('tfjs-backend-wasm-threaded-simd.wasm')
      };
      setWasmPaths(args);
    }
    const l = await tf.setBackend('wasm');
    console.log('tf backend loaded', l);
  } catch (err) {
    console.log('tf err', err);
  }
})();
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Shows or hides an element through its inline `display` style.
 *
 * @param {{style: {display: string}}} obj - element to show or hide
 * @param {*} v - truthy clears the inline display value, falsy sets it to 'none'
 */
function toggle(obj, v) {
  obj.style.display = v ? '' : 'none';
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Decodes a base64 string into raw bytes.
 *
 * @param {string} base64 - base64-encoded data
 * @returns {ArrayBuffer} buffer holding the decoded bytes
 */
function base64ToArray(base64) {
  const binaryString = window.atob(base64);
  const len = binaryString.length;
  const bytes = new Uint8Array(len);

  // atob yields one character per decoded byte, so each char code is the byte value.
  for (let i = 0; i < len; i++) {
    bytes[i] = binaryString.charCodeAt(i);
  }

  return bytes.buffer;
}
2022-08-03 02:20:38 +00:00
/**
 * Load handler passed to tf.loadLayersModel: builds the model artifacts from the
 * bundled model.json and the base64 weights held in `weightsData`.
 */
const iohander = {
  /**
   * @returns {Promise<object>} artifacts object with topology, weight specs, decoded
   *   weight bytes and the metadata fields copied from model.json
   */
  async load() {
    return {
      modelTopology: modelJSON.modelTopology,
      weightSpecs: modelJSON.weightsManifest[0].weights,
      weightData: base64ToArray(weightsData),
      format: modelJSON.format,
      generatedBy: modelJSON.generatedBy,
      convertedBy: modelJSON.convertedBy
    };
  }
};
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Loads the layers model through `iohander` and caches it in the module-level `model`.
 *
 * @returns {Promise<object>} the loaded model
 */
async function load() {
  model = await tf.loadLayersModel(iohander);
  return model;
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Tells whether a channel value counts as "black".
 *
 * @param {number} x - channel value
 * @returns {boolean} true when x is below 64
 */
function black(x) {
  return x < 64;
}
2022-08-03 02:20:38 +00:00
/**
 * Calculates "disorder" of the image. "Disorder" is the percentage of black pixels that have a
 * non-black pixel below them. Minimizing this seems to be good enough metric for solving the slider.
 *
 * Only black regions of at least 24 connected pixels are counted; smaller specks are ignored.
 * Only the first channel of each pixel is inspected.
 *
 * @param {{data: ArrayLike<number>, width: number, height: number}} imgdata - RGBA pixel data
 * @returns {number} vertical transitions divided by the number of counted black pixels
 *   (the divisor is 1 when no pixel is counted)
 */
function calculateDisorder(imgdata) {
  const a = imgdata.data;
  const w = imgdata.width;
  const h = imgdata.height;
  const size = w * h;

  const pic = new Uint8Array(size);
  const visited = new Uint8Array(size);

  for (let c = 0; c < size; c++) {
    if (visited[c]) continue;
    if (!black(a[c * 4])) continue;

    // Flood-fill the black region containing pixel c.
    const items = [];
    const toVisit = [c];

    while (toVisit.length > 0) {
      const cc = toVisit.pop();

      // Neighbours outside the pixel range can never be black; skip them.
      if (cc < 0 || cc >= size) continue;
      if (visited[cc]) continue;
      visited[cc] = 1;

      if (black(a[cc * 4])) {
        items.push(cc);
        // Neighbours are addressed by flat index, so +/-1 wraps across row edges.
        toVisit.push(cc + 1, cc - 1, cc + w, cc - w);
      }
    }

    // Keep only regions large enough to be part of the picture rather than noise.
    if (items.length >= 24) {
      for (const x of items) {
        pic[x] = 1;
      }
    }
  }

  let res = 0;
  let total = 0;

  // Compare every pixel with the one directly below it (the last row has none).
  for (let c = 0; c < size - w; c++) {
    if (pic[c] !== pic[c + w]) res += 1;
    if (pic[c]) total += 1;
  }

  return res / (total === 0 ? 1 : total);
}
2022-08-03 02:20:38 +00:00
// returns ImageData from captcha's background image, foreground image, and offset (ranging from 0 to -50)
2023-08-09 05:55:57 +00:00
// Renders the captcha onto an offscreen canvas and returns the canvas contents as ImageData.
//   img - foreground image; its width/height determine the scale factor
//   bg  - optional background image; when falsy only the foreground is drawn
//   off - background offset; when it is null/undefined and bg is present, offsets from
//         0 down to -50 are tried and the ImageData with the lowest calculateDisorder()
//         score is returned
function imageFromCanvas(img, bg, off) {
const h = img.height;
const w = img.width;
const th = 80;
// ph is not referenced in the visible code
const ph = 0;
const pw = 16;
const scale = th / h;
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
const canvas = document.createElement('canvas');
// canvas axes are swapped relative to the source: the width is th, the height is the
// scaled source width plus pw of padding on both ends
canvas.height = w * scale + pw * 2;
canvas.width = th;
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
const ctx = canvas.getContext('2d', { willReadFrequently: true });
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// start from a uniform light grey fill
ctx.fillStyle = 'rgb(238,238,238)';
ctx.fillRect(0, 0, canvas.width, canvas.height);
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// draw around the canvas centre, mirrored on x and rotated by 90 degrees
ctx.translate(canvas.width / 2, canvas.height / 2);
ctx.scale(-scale, scale);
ctx.rotate((90 * Math.PI) / 180);
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// adf is not referenced in the visible code
const adf = 1 / 3;
2023-08-09 00:23:24 +00:00
// draws the (optional) background at the given offset, then the foreground on top
const draw = function (off) {
2022-08-03 02:20:38 +00:00
if (bg) {
2023-08-09 05:55:57 +00:00
const border = 4;
2022-08-03 02:20:38 +00:00
// NOTE(review): the head of the background drawing call and some of its arguments appear
// to be missing from this copy; the lines below look like the remaining source/destination
// rectangle arguments — confirm against the real file
-off + border,
w - border * 2,
-w / 2 + border,
-h / 2,
w - border * 2,
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
ctx.drawImage(img, -w / 2, -h / 2, w, h);
2022-08-03 02:20:38 +00:00
// if off is not specified and background image is present, try to figure out
// the best offset automatically; select the offset that has smallest value of
// calculateDisorder for the resulting image
if (bg && off == null) {
2023-08-09 05:55:57 +00:00
let bestDisorder = 999;
let bestImagedata = null;
let bestOff = -1;
2022-08-03 02:20:38 +00:00
for (let off = 0; off >= -50; off--) {
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// NOTE(review): presumably the canvas is redrawn with the candidate offset before this
// read — that call is not visible here
let imgdata = ctx.getImageData(0, 0, canvas.width, canvas.height);
const disorder = calculateDisorder(imgdata);
2022-08-03 02:20:38 +00:00
if (disorder < bestDisorder) {
2023-08-09 05:55:57 +00:00
bestDisorder = disorder;
// reads the canvas a second time; nothing visible changes it since the read above
imgdata = ctx.getImageData(0, 0, canvas.width, canvas.height);
bestImagedata = imgdata;
bestOff = off;
2022-08-03 02:20:38 +00:00
// not the best idea to do this here
// mirrors the chosen offset into the page's slider and background elements, if both exist
setTimeout(function () {
2023-08-09 05:55:57 +00:00
const bg = document.getElementById('t-bg');
const slider = document.getElementById('t-slider');
if (!bg || !slider) return;
slider.value = -bestOff * 2;
bg.style.backgroundPositionX = bestOff + 'px';
}, 1);
return bestImagedata;
2022-08-03 02:20:38 +00:00
} else {
2023-08-09 05:55:57 +00:00
// offset supplied by the caller, or no background: return the canvas contents as drawn
return ctx.getImageData(0, 0, canvas.width, canvas.height);
2022-08-03 02:20:38 +00:00
// for debugging purposes
2023-08-09 05:55:57 +00:00
/**
 * Converts ImageData into an Image element by painting it on a temporary canvas and
 * using the canvas data URL as the image source.
 *
 * @param {ImageData} imagedata - pixels to convert
 * @returns {HTMLImageElement} image whose src is the data URL of the painted canvas
 */
function imagedataToImage(imagedata) {
  const canvas = document.createElement('canvas');
  const ctx = canvas.getContext('2d');
  canvas.width = imagedata.width;
  canvas.height = imagedata.height;
  ctx.putImageData(imagedata, 0, 0);

  const image = new Image();
  image.src = canvas.toDataURL();
  return image;
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Runs the model on a captcha and returns the per-position symbol candidates.
 *
 * The rendered image is split into connected components; only the eight largest
 * ones that span more than 20 rows are copied into the model input.
 *
 * @param {*} img - foreground image, forwarded to imageFromCanvas
 * @param {*} bg - background image or null, forwarded to imageFromCanvas
 * @param {?number} off - background offset or null, forwarded to imageFromCanvas
 * @returns {Promise<Array<Object<string, number>>>} result of createSequence
 */
async function predict(img, bg, off) {
  if (!model) {
    model = await load();
  }

  const image = imageFromCanvas(img, bg, off);
  const labels = ccl.connectedComponentLabeling(image.data.map(e => +(e > 128)), image.width, image.height);
  const props = ccl.computeBounds(labels, image.width, image.height);

  const sortedByArea = Object.entries(props).sort((a, b) => a[1].area - b[1].area);
  const eightBiggest = sortedByArea.slice(-8);
  // NOTE(review): the output stride of 300 is hard-coded — confirm it matches image.width.
  const filtered = new Float32Array(80 * 300);

  // TODO: maybe centering?
  for (const [label, region] of eightBiggest) {
    // NOTE(review): short regions are assumed to be noise and skipped — confirm.
    if ((region.maxRow - region.minRow) <= 20) {
      continue;
    }

    for (let y = region.minRow; y < region.maxRow; ++y) {
      for (let x = region.minCol; x < region.maxCol; ++x) {
        // Object.entries yields string keys, so compare labels as strings.
        if (String(labels[y * image.width + x]) === label) {
          filtered[y * 300 + x] = 1;
        }
      }
    }
  }

  const tensor = tf.tensor3d(filtered, [80, 300, 1], 'float32');
  const batched = tensor.expandDims(0);
  const output = model.predict(batched);
  try {
    const prediction = await output.data();
    return createSequence(prediction);
  } finally {
    // Tensors are not garbage collected; release them explicitly.
    tensor.dispose();
    batched.dispose();
    output.dispose();
  }
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Turns the flat model output into one candidate map per output position.
 *
 * The output is read in consecutive groups of `charset.length` values. Inside a
 * group every value is divided by the group's maximum, and values reaching 0.05
 * are kept.
 *
 * @param {ArrayLike<number>} prediction - flat model output (must support slice)
 * @returns {Array<Object<string, number>>} per position, a map from symbol to its
 *   normalized probability; the key '' is used when there is no charset entry
 */
function createSequence(prediction) {
  const csl = charset.length;
  const sequence = [];

  // for each prediction
  for (let pos = 0; pos < prediction.length; pos += csl) {
    // look at the probabilities for the token characters
    const preds = prediction.slice(pos, pos + csl);
    const max = Math.max(...preds);

    const seqElem = {};

    for (let i = 0; i < csl; i++) {
      const p = preds[i] / max; // normalize probability
      // class i maps to charset[i + 1]; the last class has no entry and is stored under ''
      const c = charset[i + 1];

      if (p >= 0.05) { // if it's probable enough
        seqElem[c || ''] = p; // save its probability, to give alternative solutions
      }
    }

    sequence.push(seqElem);
  }

  return sequence;
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Expands the per-position candidates into complete strings and ranks them.
 *
 * Every combination of candidates is enumerated. Inside a combination, a symbol
 * that repeats the last kept symbol within two positions of it is dropped. The
 * confidence of a string is the mean confidence of its kept symbols; when several
 * combinations give the same string the highest confidence wins.
 *
 * @param {Array<Object<string, number>>} sequence - output of createSequence
 * @param {Object<number, string>} [overrides] - symbols forced at given positions
 * @returns {Array<{seq: string, prob: number}>} candidates sorted by descending
 *   confidence; when any candidate is 5 or 6 characters long only those are returned
 */
function postprocess(sequence, overrides) {
  let possibilities = [{ sequence: [] }];

  sequence.forEach(function (e, i) {
    let additions;

    if (overrides && overrides[i] !== undefined) {
      additions = [{ sym: overrides[i], off: i, conf: 1 }];
    } else {
      additions = Object.keys(e).map(function (sym) {
        return { sym, off: i, conf: e[sym] };
      });
    }

    // A position whose only candidate is the empty symbol adds nothing.
    if (additions.length === 1 && additions[0].sym === '') return;

    const oldpos = possibilities;
    possibilities = [];

    oldpos.forEach(function (possibility) {
      additions.forEach(function (a) {
        const seq = [...possibility.sequence];
        if (a.sym !== '') seq.push([a.sym, a.off, a.conf]);

        possibilities.push({ sequence: seq });
      });
    });
  });

  // Best confidence seen for each resulting string.
  const best = new Map();

  possibilities.forEach(function (p) {
    let line = '';
    let lastSym;
    let lastOff = -1;
    let count = 0;
    let prob = 0;

    p.sequence.forEach(function ([sym, off, conf]) {
      // Same symbol again within two positions of the last kept one: treat as a repeat.
      if (sym === lastSym && lastOff + 2 >= off) {
        return;
      }

      line += sym;

      lastSym = sym;
      lastOff = off;
      prob += conf;
      count++;
    });

    if (count > 0) prob /= count;

    const previous = best.get(line);
    if (!previous || prob > previous) {
      best.set(line, prob);
    }
  });

  // The comparator must return a number; a boolean never yields a negative value.
  let keys = [...best.keys()].sort(function (a, b) {
    return best.get(b) - best.get(a);
  });

  const keysFitting = keys.filter(function (x) {
    return x.length === 5 || x.length === 6;
  });
  if (keysFitting.length > 0) keys = keysFitting;

  return keys.map(function (x) {
    return { seq: x, prob: best.get(x) };
  });
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Loads an image from a URI, accepting either a bare URI or a CSS `url("...")` value.
 *
 * Outside of test mode only `data:` URIs are loaded; anything else yields null.
 *
 * @param {string} uri - image URI, optionally wrapped in `url("` ... `")`
 * @returns {Promise<?HTMLImageElement>} the loaded image, or null when the URI is refused
 * @throws {Error} when the image fails to load
 */
async function imageFromUri(uri) {
  // Strip the leading `url("` and the trailing `")` of a CSS value.
  const src = uri.startsWith('url("') ? uri.slice(5, -2) : uri;

  // eslint-disable-next-line camelcase
  if (execution_mode !== 'test' && !src.startsWith('data:')) {
    return null;
  }

  const img = new Image();
  await new Promise((resolve, reject) => {
    // Attach handlers before assigning src so neither event can be missed.
    img.onload = resolve;
    img.onerror = () => reject(new Error('failed to load captcha image'));
    img.src = src;
  });
  return img;
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Loads the captcha images from their URIs and runs the prediction on them.
 *
 * @param {string} uri - foreground image URI
 * @param {?string} uribg - background image URI, or falsy when there is none
 * @param {?string} bgoff - background offset such as '-12px', or falsy to let the
 *   offset be searched for automatically
 * @returns {Promise<*>} result of predict
 */
async function predictUri(uri, uribg, bgoff) {
  const img = await imageFromUri(uri);
  const bg = uribg ? await imageFromUri(uribg) : null;

  // An unparsable offset is treated like a missing one instead of passing NaN along.
  const parsed = bgoff ? Number.parseInt(bgoff, 10) : null;
  const off = Number.isNaN(parsed) ? null : parsed;

  return predict(img, bg, off);
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// "Solve" button; solve() places it after the response field.
const solveButton = document.createElement('input');
solveButton.id = 't-auto-solve';
solveButton.value = 'Solve';
solveButton.type = 'button';
solveButton.style.fontSize = '11px';
solveButton.style.padding = '0 2px';
solveButton.style.margin = '0px 0px 0px 6px';
solveButton.style.height = '18px';
2022-08-03 02:20:38 +00:00
// NOTE(review): the body of this click handler is not visible in this copy; presumably it
// forces a new solve — confirm against the real file
solveButton.onclick = async function () {
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// Container for alternative solutions; solve() and showOpts() clear it.
const altsDiv = document.createElement('div');
altsDiv.id = 't-auto-options';
altsDiv.style.margin = '0';
altsDiv.style.padding = '0';
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// Original placeholder of the response field, saved by solve() before it is replaced.
let storedPalceholder;
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// Per-position symbol overrides; reset by solve() for each new captcha.
let overrides = {};
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Moves `elem` so that it directly follows `sibling`, unless both already share a parent.
 * The move is deferred by a 1 ms timer.
 *
 * @param {Element} elem - element to move
 * @param {Element} sibling - element after which `elem` is inserted
 */
function placeAfter(elem, sibling) {
  if (elem.parentElement === sibling.parentElement) return;

  setTimeout(function () {
    sibling.parentElement.insertBefore(elem, sibling.nextElementSibling);
  }, 1);
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
// Foreground image value of the captcha that was solved last.
let previousText = null;

/**
 * Solves the captcha currently shown on the page and fills in the best guess.
 *
 * Does nothing unless the response field, background, foreground and help elements
 * all exist. A captcha whose foreground image is unchanged since the previous call
 * is skipped unless `force` is set.
 *
 * @param {boolean} force - solve again even if the captcha is unchanged, using the
 *   background offset currently set on the page instead of searching for one
 * @returns {Promise<void>}
 */
async function solve(force) {
  const resp = document.getElementById('t-resp');
  if (!resp) return;

  const bg = document.getElementById('t-bg');
  if (!bg) return;

  const fg = document.getElementById('t-fg');
  if (!fg) return;

  const help = document.getElementById('t-help');
  if (!help) return;

  await backendloaded;

  placeAfter(solveButton, resp);
  placeAfter(altsDiv, help);

  // palememe
  setTimeout(function () {
    toggle(solveButton, bg.style.backgroundImage);
  }, 1);

  const text = fg.style.backgroundImage;

  if (!text) {
    altsDiv.innerHTML = '';
    return;
  }

  if (text === previousText && !force) return;
  previousText = text;

  altsDiv.innerHTML = '';
  if (!storedPalceholder) storedPalceholder = resp.placeholder;
  resp.placeholder = 'solving captcha...';

  overrides = {};

  let opts;
  try {
    const sequence = await predictUri(
      text,
      bg.style.backgroundImage,
      force ? bg.style.backgroundPositionX : null
    );
    opts = postprocess(sequence);
  } finally {
    // Restore the placeholder even when the prediction fails.
    resp.placeholder = storedPalceholder;
  }

  showOpts(opts);
}
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
2022-08-03 02:20:38 +00:00
2023-08-09 05:55:57 +00:00
/**
 * Writes the best candidate into the response field and clears the alternatives area.
 *
 * @param {Array<{seq: string, prob: number}>} opts - candidates, best first
 */
function showOpts(opts) {
  const resp = document.getElementById('t-resp');
  if (!resp) return;

  altsDiv.innerHTML = '';

  if (opts.length === 0) {
    resp.value = '';
    return;
  }

  resp.value = opts[0].seq;

  // for now don't display options since it seems more difficult to pick than type the whole thing
}
// Observer registered on document.body below.
// NOTE(review): the callback body is not visible in this copy; presumably it calls solve()
// whenever the page changes — confirm against the real file
const observer = new MutationObserver(async function (mutationsList, observer) {
2023-08-09 05:55:57 +00:00
// exposes solve on the window object
window.solve = solve;
2022-08-03 02:20:38 +00:00
// watch attribute and child-list changes on document.body and all of its descendants
observer.observe(document.body, {
attributes: true,
childList: true,
subtree: true
2023-08-09 05:55:57 +00:00