// ==UserScript==
// @name 流畅阅读
// @license GPL-3.0 license
// @namespace https://fr.unmeta.cn/
// @version 0.5
// @description 基于上下文语境的人工智能翻译引擎,为部分网站提供精准翻译,让所有人都能够拥有基于母语般的阅读体验。程序Github开源:https://github.com/Bistutu/FluentRead,欢迎 star。
// @author ThinkStu
// @match *://*/*
// @icon 
// @grant GM_setValue
// @grant GM_getValue
// @grant GM_listValues
// @grant GM_deleteValue
// @grant GM_xmlhttpRequest
// @connect fr.unmeta.cn
// @connect 127.0.0.1
// @run-at document-end
// ==/UserScript==
// region 常量与变量
// URL 相关
const POST = "POST";
const url = new URL(location.href.split('?')[0]);
// cacheKey 与 时间
const checkKey = "fluent_read_check";
const expiringTime = 86400000 / 4;
// 服务请求地址
// const source = "http://127.0.0.1"
const source = "https://fr.unmeta.cn"
const read = "%s/read".replace("%s", source), preread = "%s/preread".replace("%s", source);
// 预编译正则表达式
const timeRegex = /^(a|an|\d+)\s+(minute|hour|day|month|year)(s)?\s+ago$/; // "2 days ago"
const paginationRegex = /^(\d+)\s*-\s*(\d+)\s+of\s+([\d,]+)$/; // "10 - 20 of 300"
const lastReleaseRegex = /Last Release on (Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)\s(\d{1,2}),\s(\d{4})/; // "Last Release on Jul 4, 2022"
const dependencyRegex = /(Test|Provided|Compile) Dependencies \((\d+)\)/; // "Compile Dependencies (5)"
const rankRegex = /#(\d+) in\s*(.*)/; // "#3 in Algorithms"
const artifactsRegex = /^([\d,]+)\s+artifacts$/; // "1,024 artifacts"
const vulnerabilityRegex = /^(\d+)\s+vulnerabilit(y|ies)$/; // "3 vulnerabilities"
const repositoriesRegex = /Indexed (Repositories|Artifacts) \(([\d.]+)M?\)/; // Indexed Repositories (100)
const packagesRegex = /([\d,]+) indexed packages/; // 12,795,152 indexed packages
const joinedRegex = /Joined ((Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec).*\s\d{1,2},?\s\d{4}$)/; // Joined March 27, 2022
const moreRegex = /\+(\d+) more\.\.\./; // More 100
const commentsRegex = /(\d+)\sComments/; // 数字 Comments
const gamesRegex = /(\d{1,3}(?:,\d{3})*)( games| Collections)/;
const combinedDateRegex = /^(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec).*\s\d{1,2},?\s\d{4}$|^\d{1,2}\s(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec).*,?\s\d{4}$|^\d{1,2}\/\d{1,2}\/\d{4}$/i;
const emailRegex = /^Receive feedback emails \((.*)\)$/;
const verifyDomain = /To verify ownership of (.*), navigate to your DNS provider and add a TXT record with this value:/
const autoSavedRegex = /Auto-saved (\d{2}):(\d{2}):(\d{2})/;
// 特例适配
const maven = "mvnrepository.com";
const docker = "hub.docker.com";
const nexusmods = "www.nexusmods.com"
const openai = "openai.com"
const chatGPT = "chat.openai.com"
const coze = "www.coze.com"
// 文本类型
const textContent = 0
const placeholder = 1
const inputValue = 2
const ariaLabel = 3
// 适配器与剪枝 map
let adapterFnMap = new (Map);
let skipStringMap = new Map();
// DOM 防抖,单位毫秒
let throttleObserveDOM = throttle(observeDOM, 3000);
// 剪枝 set
let pruneSet = new Set();
// 其余常量
const typeMap = {'Test': '测试', 'Provided': '提供', 'Compile': '编译'};
// endregion
(function () {
'use strict';
// 初始化
init()
// 检查是否需要拉取数据
checkRun(function (shouldRun) {
// 如果 host 包含在 preread 中,shouldRun 为 true,则开始解析 DOM 树并设置监听器
if (shouldRun) {
// 1、添加监听器,使用 MutationObserver 监听 DOM 变化
const observer = new MutationObserver(function (mutations, obs) {
mutations.forEach(mutation => {
if (isEmpty(mutation.target)) return;
// console.log("原先变更记录:", mutation.target);
// 如果不包含下面节点,则处理
if (!["img", "noscript"].includes(mutation.target.tagName.toLowerCase())) {
handleDOMUpdate(mutation.target);
}
});
});
observer.observe(document.body, {childList: true, subtree: true});
// 2、手动开启一次解析 DOM 树
handleDOMUpdate(document.body);
}
});
// 快捷键 F2,清空所有缓存
document.addEventListener('keydown', function (event) {
if (event.key === 'F2') {
let listValues = GM_listValues();
listValues.forEach(e => {
GM_deleteValue(e)
})
console.log('Cache cleared!');
}
});
})();
// region read
// read:异步返回 callback,表示是否需要拉取数据
function checkRun(callback) {
// 1、检查缓存
let pageMapCache = GM_getValue(checkKey, false);
if (pageMapCache) {
pageMapCache[url.host] ? callback(true) : callback(false);
}
// 2、网络请求
const lastRun = GM_getValue("lastRun", undefined);
const now = new Date().getTime();
if (isEmpty(lastRun) || now - lastRun > expiringTime) {
console.log("开始更新 preread 缓存");
GM_xmlhttpRequest({
method: POST,
url: preread,
onload: function (response) {
// pagesMap 是新获取的数据,pageMapCache 是从缓存中获取的旧数据
let pagesMap = JSON.parse(response.responseText).Data;
pagesMap[url.host] ? callback(true) : callback(false);
// 将 fluent_read_check 设置为新的缓存
GM_setValue(checkKey, pagesMap);
// 检查 preread 名单判断是否需要更新对应 host 的 read 数据
const listValues = GM_listValues();
listValues.forEach(host => {
if (pageMapCache[host] !== pagesMap[host]) {
GM_deleteValue(host);
console.log("删除过期的缓存数据:", host);
}
});
GM_setValue("lastRun", now.toString()); // 请求成功后设置当前时间
},
onerror: (error) => console.error("请求失败: ", error)
});
}
}
// read:处理 DOM 更新
function handleDOMUpdate(node) {
// 如果数据存在则直接解析,否则发起网络请求
let cachedData = GM_getValue(url.host, undefined);
cachedData ? parseDfs(node, cachedData) : throttleObserveDOM();
}
// read:监听器配置
function observeDOM() {
GM_xmlhttpRequest({
method: POST,
url: read,
data: JSON.stringify({page: url.origin}), // 请求参数
onload: function (response) {
console.log("新的 read 请求:", url.host);
let respMap = JSON.parse(response.responseText).Data;
GM_setValue(url.host, respMap);
parseDfs(document.body, respMap);
},
onerror: function (error) {
console.error("请求失败: ", error);
}
});
}
// read:递归提取节点文本
function parseDfs(node, respMap) {
if (isEmpty(node)) return;
// console.log("当前节点:", node)
switch (node.nodeType) {
// 1、元素节点
case Node.ELEMENT_NODE:
// console.log("元素节点: ", node);
// 根据 host 获取 skip 函数,判断是否需要跳过
let skipFn = skipStringMap[url.host];
if (skipFn && skipFn(node)) return;
// aria 提示信息
if (node.hasAttribute("aria-label")) processNode(node, ariaLabel, respMap);
// 按钮与文本域节点
if (["input", "button", "textarea"].includes(node.tagName.toLowerCase())) {
if (node.placeholder) processNode(node, placeholder, respMap);
if (node.value && (node.tagName.toLowerCase() === "button" || ["submit", "button"].includes(node.type))) processNode(node, inputValue, respMap);
}
break;
// 2、文本节点
case Node.TEXT_NODE:
let fn = adapterFnMap[url.host]; // 根据 host 获取 adapter 函数,判断是否需要特殊处理
isEmpty(fn) ? processNode(node, textContent, respMap) : fn(node, respMap);
return; // 文本节点无子节点,return
}
let child = node.firstChild;
while (child) {
parseDfs(child, respMap);
child = child.nextSibling;
}
}
function processNode(node, attr, respMap) {
let text;
switch (attr) {
case textContent:
text = node.textContent;
break;
case placeholder:
text = node.placeholder;
break;
case inputValue:
text = node.value;
break;
case ariaLabel:
text = node.getAttribute('aria-label');
break;
}
if (shouldPrune(text)) return;
let formattedText = format(text);
if (formattedText && NotChinese(formattedText)) {
signature(url.host + formattedText).then(sign => respMap[sign] ? replaceText(attr, node, respMap[sign]) : null)
}
}
// endregion
// region 通用函数
// 计算SHA-1散列,取最后20个字符
async function signature(text) {
if (!text) return "";
const hashBuffer = await crypto.subtle.digest('SHA-1', new TextEncoder().encode(text));
const hashArray = Array.from(new Uint8Array(hashBuffer));
const hashHex = hashArray.map(b => b.toString(16).padStart(2, '0')).join('');
return hashHex.slice(-20);
}
// 防抖限流函数
function throttle(fn, interval) {
let last = 0; // 维护上次执行的时间
return function () {
const now = Date.now();
// 根据当前时间和上次执行时间的差值判断是否频繁
if (now - last >= interval) {
last = now;
fn();
}
};
}
// 判断是否为空元素
function isEmpty(node) {
return node ? false : true;
}
// 验证并解析日期格式,如果格式不正确则返回false
function parseDateOrFalse(dateString) {
// 正则表达式,用于检查常见的日期格式(如 YYYY-MM-DD)
if (!combinedDateRegex.test(dateString)) return false;
// 尝试解析日期,如果无效返回 false
const date = new Date(dateString);
return !isNaN(date.getTime()) ? date : false;
}
// 判断字符串是否不包含中文
function NotChinese(text) {
return !/[\u4e00-\u9fa5]/.test(text);
}
// 判断是否应该剪枝
function shouldPrune(text) {
let has = pruneSet.has(text);
if (has) console.log("已处理的节点,跳过:", text)
return has;
}
// 文本格式化
function format(text) {
return text.replace(/\u00A0/g, ' ').trim();
}
// 替换文本
function replaceText(type, node, value) {
switch (type) {
case textContent:
node.textContent = value;
break;
case placeholder:
node.placeholder = value;
break;
case inputValue:
node.value = value;
break;
case ariaLabel:
node.setAttribute('aria-label', value);
break;
}
pruneSet.add(value) // 剪枝
}
function init() {
// 填充适配器 map
adapterFnMap[maven] = procMaven
adapterFnMap[docker] = procDockerhub
adapterFnMap[nexusmods] = procNexusmods
adapterFnMap[openai] = procOpenai
adapterFnMap[chatGPT] = procChatGPT
adapterFnMap[coze] = procCoze
// 填充 skip map
skipStringMap[openai] = function (node) {
return node.hasAttribute("data-message-author-role") || node.hasAttribute("data-projection-id")
}
skipStringMap[nexusmods] = function (node) {
return node.classList.contains("desc") || node.classList.contains("material-icons") || node.classList.contains("material-icons-outlined")
}
skipStringMap[coze] = function (node) {
return node.classList.contains("auto-hide-last-sibling-br")
|| node.classList.contains("jwzzTyL0ME4eVCKuxpDL")
|| node.classList.contains("XnSvnXQFZ4QHrFiqJPSG")
|| node.classList.contains("NcsIaDLOKk0l8CjedpJc")
|| ["code"].includes(node.tagName.toLowerCase())
}
}
// endregion
// region 第三方特例
// 适配 coze
function procCoze(node, respMap) {
let text = format(node.textContent);
if (text && NotChinese(text)) {
// "Auto-saved 21:28:58"
let autoSavedMatch = text.match(autoSavedRegex);
if (autoSavedMatch) {
node.textContent = `自动保存于 ${autoSavedMatch[1]}:${autoSavedMatch[2]}:${autoSavedMatch[3]}`;
return;
}
processNode(node, textContent, respMap);
}
}
// 适配 nexusmods
function procNexusmods(node, respMap) {
let text = format(node.textContent)
if (text && NotChinese(text)) {
// 使用正则表达式匹配 text
let commentsMatch = text.match(commentsRegex);
if (commentsMatch) {
node.textContent = `${parseInt(commentsMatch[1], 10)} 条评论`;
return;
}
// TODO 翻译待修正
let gamesMatch = text.match(gamesRegex);
if (gamesMatch) {
let type = gamesMatch[2] === " games" ? "份游戏" : "个收藏"; // 判断是游戏还是收藏
node.textContent = `${gamesMatch[1]}${type}`;
return;
}
let dateOrFalse = parseDateOrFalse(text);
if (dateOrFalse) {
node.textContent = `${dateOrFalse.getFullYear()}-${String(dateOrFalse.getMonth() + 1).padStart(2, '0')}-${String(dateOrFalse.getDate()).padStart(2, '0')}`
}
processNode(node, textContent, respMap);
}
}
function procOpenai(node, respMap) {
let text = format(node.textContent);
if (text && NotChinese(text)) {
let dateOrFalse = parseDateOrFalse(text);
if (dateOrFalse) {
node.textContent = `${dateOrFalse.getFullYear()}-${dateOrFalse.getMonth() + 1}-${dateOrFalse.getDate()}`;
return;
}
processNode(node, textContent, respMap);
}
}
function procChatGPT(node, respMap) {
let text = format(node.textContent);
if (text && NotChinese(text)) {
// 提取电子邮件地址
let emailMatch = text.match(emailRegex);
if (emailMatch) {
node.textContent = `接收反馈邮件(${emailMatch[1]})`;
return;
}
// 验证域名
let verifyDomainMatch = text.match(verifyDomain);
if (verifyDomainMatch) {
node.textContent = `要验证 ${verifyDomainMatch[1]} 的所有权,请转到您的DNS提供商并添加一个带有以下值的TXT记录:`;
return;
}
// 处理日期格式
let dateOrFalse = parseDateOrFalse(text);
if (dateOrFalse) {
node.textContent = `${dateOrFalse.getFullYear()}-${String(dateOrFalse.getMonth() + 1).padStart(2, '0')}-${String(dateOrFalse.getDate()).padStart(2, '0')}`;
return;
}
processNode(node, textContent, respMap);
}
}
// 适配 maven
function procMaven(node, respMap) {
let text = format(node.textContent);
if (text && NotChinese(text)) {
// 处理 “Indexed Repositories (1936)” 与 “Indexed Artifacts (1.2M)” 的格式
let repositoriesMatch = text.match(repositoriesRegex);
if (repositoriesMatch) {
let count = parseInt(repositoriesMatch[2], 10);
node.textContent = repositoriesMatch[1] === "Repositories" ? `索引库数量(${count})` : `索引包数量(${count * 100}万)`;
return;
}
// 匹配并处理 "indexed packages" 的格式
let packagesMatch = text.match(packagesRegex);
if (packagesMatch) {
let count = parseInt(packagesMatch[1].replace(/,/g, ''), 10); // 移除数字中的逗号,然后转换为整数
node.textContent = `${count.toLocaleString()}个索引包`;
return;
}
// 处理“Last Release on”格式的日期
let lastReleaseMatch = text.match(lastReleaseRegex);
if (lastReleaseMatch) {
let date = new Date(`${lastReleaseMatch[1]} ${lastReleaseMatch[2]}, ${lastReleaseMatch[3]}`);
node.textContent = `最近更新 ${date.getFullYear()}年${date.getMonth() + 1}月${date.getDate()}日`;
return;
}
// 处理日期格式
let dateOrFalse = parseDateOrFalse(text);
if (dateOrFalse) {
node.textContent = `${dateOrFalse.getFullYear()}-${String(dateOrFalse.getMonth() + 1).padStart(2, '0')}-${String(dateOrFalse.getDate()).padStart(2, '0')}`;
return;
}
// 处理依赖类型
let dependencyMatch = text.match(dependencyRegex);
if (dependencyMatch) {
let [_, type, count] = dependencyMatch;
node.textContent = `${typeMap[type] || type}依赖 ${type} (${count})`;
return;
}
// 处理排名
let rankMatch = text.match(rankRegex);
if (rankMatch) {
node.textContent = `第 ${rankMatch[1]} 位 ${rankMatch[2]}`;
return;
}
// 处理 artifacts 被引用次数
let artifactsMatch = text.match(artifactsRegex);
if (artifactsMatch) {
node.textContent = `被引用 ${artifactsMatch[1]} 次`;
return;
}
// 处理漏洞数量
let vulnerabilityMatch = text.match(vulnerabilityRegex);
if (vulnerabilityMatch) {
node.textContent = `${vulnerabilityMatch[1]}个漏洞`;
return;
}
processNode(node, textContent, respMap);
}
}
function procDockerhub(node, respMap) {
let text = format(node.textContent);
if (text && NotChinese(text)) {
// 处理更新时间的翻译
let timeMatch = text.match(timeRegex);
if (timeMatch) {
let [_, quantity, unit, isPlural] = timeMatch;
quantity = (quantity === 'a' || quantity === 'an') ? ' 1' : ` ${quantity}`; // 将 'a' 或 'an' 转换为 '1'
const unitMap = {'minute': '分钟', 'hour': '小时', 'day': '天', 'month': '月',}; // 单位转换
unit = unitMap[unit] || unit;
node.textContent = `${quantity} ${unit}之前`;
return;
}
// 处理分页信息的翻译
let paginationMatch = text.match(paginationRegex);
if (paginationMatch) {
let [_, start, end, total] = paginationMatch;
total = total.replace(/,/g, ''); // 去除数字中的逗号
node.textContent = `当前第 ${start} - ${end} 项,共 ${total} `;
return;
}
// 处理 "Joined March 27, 2022"
let joinedMatch = text.match(joinedRegex);
if (joinedMatch) {
const date = new Date(joinedMatch[1]);
node.textContent = `加入时间:${date.getFullYear()}-${String(date.getMonth() + 1).padStart(2, '0')}-${String(date.getDate()).padStart(2, '0')}`;
return;
}
// 处理 "+5 more..."
let moreMatch = text.match(moreRegex);
if (moreMatch) {
node.textContent = `还有${parseInt(moreMatch[1], 10)}个更多...`;
return;
}
processNode(node, textContent, respMap);
}
}
// endregion