// ==UserScript==
// @name AI Image Description Generator Gimini
// @namespace http://tampermonkey.net/
// @version 2.0
// @description 使用AI生成网页图片描述
// @author AlphaCat
// @match *://*/*
// @grant GM_addStyle
// @grant GM_setValue
// @grant GM_getValue
// @grant GM_xmlhttpRequest
// @connect *
// @license MIT
// ==/UserScript==
(function () {
'use strict';
// 添加样式
GM_addStyle(`
.ai-config-modal {
position: fixed;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
background: white;
padding: 20px;
border-radius: 8px;
box-shadow: 0 2px 10px rgba(0,0,0,0.1);
z-index: 10000;
min-width: 500px;
height: auto;
}
.ai-config-modal h3 {
margin: 0 0 15px 0;
font-size: 14px;
font-weight: bold;
color: #333;
}
.ai-config-modal label {
display: inline-block;
font-size: 12px;
font-weight: bold;
color: #333;
margin: 0;
line-height: normal;
height: auto;
}
.ai-config-modal .input-wrapper {
position: relative;
display: flex;
align-items: center;
}
.ai-config-modal input {
display: block;
width: 100%;
padding: 2px 24px 2px 2px;
margin: 2px;
border: 1px solid #ddd;
border-radius: 4px;
font-size: 13px;
line-height: normal;
height: auto;
box-sizing: border-box;
}
.ai-config-modal .input-icon {
position: absolute;
right: 4px;
width: 16px;
height: 16px;
cursor: pointer;
display: flex;
align-items: center;
justify-content: center;
color: #666;
font-size: 12px;
user-select: none;
}
.ai-config-modal .clear-icon {
right: 24px;
}
.ai-config-modal .toggle-password {
right: 4px;
}
.ai-config-modal .input-icon:hover {
color: #333;
}
.ai-config-modal .input-group {
margin-bottom: 12px;
height: auto;
display: flex;
flex-direction: column;
}
.ai-config-modal .button-row {
display: flex;
gap: 10px;
align-items: center;
margin-top: 5px;
}
.ai-config-modal .check-button {
padding: 4px 8px;
border: none;
border-radius: 4px;
background: #007bff;
color: white;
cursor: pointer;
font-size: 12px;
}
.ai-config-modal .check-button:hover {
background: #0056b3;
}
.ai-config-modal .check-button:disabled {
background: #cccccc;
cursor: not-allowed;
}
.ai-config-modal select {
width: 100%;
padding: 4px;
border: 1px solid #ddd;
border-radius: 4px;
font-size: 13px;
margin-top: 2px;
}
.ai-config-modal .status-text {
font-size: 12px;
margin-left: 10px;
}
.ai-config-modal .status-success {
color: #28a745;
}
.ai-config-modal .status-error {
color: #dc3545;
}
.ai-config-modal button {
margin: 10px 5px;
padding: 8px 15px;
border: none;
border-radius: 4px;
cursor: pointer;
font-size: 14px;
}
.ai-config-modal button#ai-save-config {
background: #4CAF50;
color: white;
}
.ai-config-modal button#ai-cancel-config {
background: #dc3545;
color: white;
}
.ai-config-modal button:hover {
opacity: 0.9;
}
.ai-floating-btn {
position: fixed;
width: 32px;
height: 32px;
background: #4CAF50;
color: white;
border-radius: 50%;
cursor: move;
z-index: 9999;
box-shadow: 0 2px 5px rgba(0,0,0,0.2);
display: flex;
align-items: center;
justify-content: center;
user-select: none;
transition: background-color 0.3s;
}
.ai-floating-btn:hover {
background: #45a049;
}
.ai-floating-btn svg {
width: 20px;
height: 20px;
fill: white;
}
.ai-menu {
position: absolute;
background: white;
border-radius: 5px;
box-shadow: 0 2px 10px rgba(0,0,0,0.1);
padding: 8px;
z-index: 10000;
display: flex;
gap: 8px;
}
.ai-menu-item {
width: 32px;
height: 32px;
padding: 6px;
cursor: pointer;
border-radius: 50%;
display: flex;
align-items: center;
justify-content: center;
transition: background-color 0.3s;
}
.ai-menu-item:hover {
background: #f5f5f5;
}
.ai-menu-item svg {
width: 20px;
height: 20px;
fill: #666;
}
.ai-menu-item:hover svg {
fill: #4CAF50;
}
.ai-image-options {
display: flex;
flex-direction: column;
gap: 10px;
margin: 15px 0;
}
.ai-image-options button {
padding: 8px 15px;
border: none;
border-radius: 4px;
background: #4CAF50;
color: white;
cursor: pointer;
transition: background-color 0.3s;
font-size: 14px;
}
.ai-image-options button:hover {
background: #45a049;
}
#ai-cancel {
background: #dc3545;
color: white;
}
#ai-cancel:hover {
opacity: 0.9;
}
.ai-toast {
position: fixed;
top: 20px;
left: 50%;
transform: translateX(-50%);
padding: 10px 20px;
background: rgba(0, 0, 0, 0.8);
color: white;
border-radius: 4px;
font-size: 14px;
z-index: 10000;
animation: fadeInOut 3s ease;
pointer-events: none;
white-space: pre-line;
text-align: center;
max-width: 80%;
box-shadow: 0 2px 8px rgba(0, 0, 0, 0.2);
}
@keyframes fadeInOut {
0% { opacity: 0; transform: translate(-50%, 10px); }
10% { opacity: 1; transform: translate(-50%, 0); }
90% { opacity: 1; transform: translate(-50%, 0); }
100% { opacity: 0; transform: translate(-50%, -10px); }
}
.ai-config-modal .button-group {
display: flex;
justify-content: flex-end;
gap: 10px;
margin-top: 20px;
}
.ai-config-modal .button-group button {
padding: 6px 16px;
border: none;
border-radius: 4px;
cursor: pointer;
font-size: 14px;
transition: background-color 0.2s;
}
.ai-config-modal .save-button {
background: #007bff;
color: white;
}
.ai-config-modal .save-button:hover {
background: #0056b3;
}
.ai-config-modal .save-button:disabled {
background: #cccccc;
cursor: not-allowed;
}
.ai-config-modal .cancel-button {
background: #f8f9fa;
color: #333;
}
.ai-config-modal .cancel-button:hover {
background: #e2e6ea;
}
.ai-selecting-image {
cursor: crosshair !important;
}
.ai-selecting-image * {
cursor: crosshair !important;
}
.ai-image-description {
position: fixed;
background: rgba(0, 0, 0, 0.8);
color: white;
padding: 8px 12px;
border-radius: 4px;
font-size: 14px;
line-height: 1.4;
max-width: 300px;
text-align: center;
word-wrap: break-word;
z-index: 10000;
pointer-events: none;
animation: fadeIn 0.3s ease;
box-shadow: 0 2px 8px rgba(0, 0, 0, 0.2);
}
@keyframes fadeIn {
from { opacity: 0; }
to { opacity: 1; }
}
.ai-modal-overlay {
position: fixed;
top: 0;
left: 0;
width: 100%;
height: 100%;
background: rgba(0, 0, 0, 0.5);
display: flex;
justify-content: center;
align-items: center;
z-index: 9999;
}
.ai-result-modal {
background: white;
padding: 20px;
border-radius: 8px;
box-shadow: 0 2px 10px rgba(0,0,0,0.1);
position: relative;
min-width: 300px;
max-width: 1000px;
max-height: 540px;
overflow-y: auto;
width: 90%;
}
.ai-result-modal h3 {
margin: 0 0 10px 0;
font-size: 14px;
color: #333;
}
.ai-result-modal .description-code {
background: #1e1e1e;
color: #ffffff;
padding: 6px;
border-radius: 4px;
margin: 5px 0;
cursor: pointer;
white-space: pre-wrap;
word-wrap: break-word;
font-family: monospace;
border: 1px solid #333;
position: relative;
max-height: 500px;
overflow-y: auto;
font-size: 12px;
line-height: 1.4;
}
.ai-result-modal .description-code * {
color: #ffffff !important;
background: transparent !important;
}
.ai-result-modal .description-code code {
color: #ffffff;
display: block;
width: 100%;
background: transparent !important;
padding: 0;
}
.ai-result-modal .description-code:hover {
background: #2d2d2d;
}
.ai-result-modal .copy-hint {
font-size: 11px;
color: #666;
text-align: center;
margin: 2px 0;
}
.ai-result-modal .close-button {
position: absolute;
top: 8px;
right: 8px;
background: none;
border: none;
font-size: 18px;
cursor: pointer;
color: #666;
padding: 2px 6px;
line-height: 1;
}
.ai-result-modal .close-button:hover {
color: #333;
}
.ai-selection-overlay {
position: fixed;
top: 0;
left: 0;
right: 0;
bottom: 0;
background: rgba(0, 0, 0, 0.1);
z-index: 999999;
cursor: crosshair;
pointer-events: none;
}
.ai-selecting-image img {
position: relative;
z-index: 9999;
cursor: pointer !important;
transition: outline 0.2s ease;
}
.ai-selecting-image img:hover {
outline: 2px solid white;
outline-offset: 2px;
}
/* 移动端样式优化 */
@media (max-width: 768px) {
.ai-floating-btn {
width: 40px;
height: 40px;
touch-action: none;
}
.ai-floating-btn svg {
width: 24px;
height: 24px;
}
.ai-config-modal {
width: 90%;
min-width: auto;
max-width: 400px;
padding: 15px;
margin: 10px;
box-sizing: border-box;
}
.ai-config-modal .button-group {
margin-top: 15px;
flex-direction: row;
justify-content: space-between;
gap: 10px;
}
.ai-config-modal .button-group button {
flex: 1;
min-height: 44px;
font-size: 16px;
padding: 10px;
margin: 0;
}
.ai-result-modal {
width: 95%;
min-width: auto;
max-width: 90%;
margin: 10px;
padding: 15px;
}
.ai-modal-overlay {
padding: 10px;
box-sizing: border-box;
}
.ai-config-modal button,
.ai-config-modal .input-icon,
.ai-config-modal select,
.ai-config-modal input {
min-height: 44px;
padding: 10px;
font-size: 16px;
}
.ai-config-modal textarea {
min-height: 100px;
font-size: 16px;
padding: 10px;
}
.ai-config-modal .input-icon {
width: 44px;
height: 44px;
font-size: 20px;
}
.ai-config-modal {
max-height: 90vh;
overflow-y: auto;
-webkit-overflow-scrolling: touch;
}
}
.ai-selection-overlay img,
.ai-selection-overlay [style*="background-image"],
.ai-selection-overlay [class*="img"],
.ai-selection-overlay [class*="photo"],
.ai-selection-overlay [class*="image"],
.ai-selection-overlay [class*="thumb"],
.ai-selection-overlay [class*="avatar"] {
cursor: pointer !important;
transition: outline 0.2s;
pointer-events: auto;
}
.ai-selection-overlay img:hover,
.ai-selection-overlay [style*="background-image"]:hover,
.ai-selection-overlay [class*="img"]:hover,
.ai-selection-overlay [class*="photo"]:hover,
.ai-selection-overlay [class*="image"]:hover,
.ai-selection-overlay [class*="thumb"]:hover,
.ai-selection-overlay [class*="avatar"]:hover {
outline: 3px solid #4CAF50 !important;
outline-offset: 2px !important;
}
/* 结果框样式 */
.ai-result-modal {
position: fixed;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
background: white;
padding: 20px;
border-radius: 8px;
box-shadow: 0 2px 10px rgba(0, 0, 0, 0.1);
z-index: 1000000;
max-width: 80%;
max-height: 80vh;
overflow-y: auto;
}
.ai-result-modal .result-content {
position: relative;
}
.ai-result-modal .description-code {
background: #1e1e1e;
color: #ffffff;
padding: 6px;
border-radius: 4px;
margin: 5px 0;
cursor: pointer;
white-space: pre-wrap;
word-wrap: break-word;
font-family: monospace;
border: 1px solid #333;
position: relative;
max-height: 500px;
overflow-y: auto;
font-size: 12px;
line-height: 1.4;
}
.ai-result-modal .description-code * {
color: #ffffff !important;
background: transparent !important;
}
.ai-result-modal .description-code code {
color: #ffffff;
display: block;
width: 100%;
background: transparent !important;
padding: 0;
}
.ai-result-modal .description-code:hover {
background: #2d2d2d;
}
.ai-result-modal .copy-hint {
font-size: 12px;
color: #666;
text-align: center;
margin-top: 5px;
}
.ai-result-modal .close-button {
position: absolute;
top: -10px;
right: -10px;
width: 24px;
height: 24px;
border-radius: 50%;
background: #ff4444;
color: white;
border: none;
cursor: pointer;
display: flex;
align-items: center;
justify-content: center;
font-size: 16px;
line-height: 1;
padding: 0;
}
.ai-result-modal .close-button:hover {
background: #ff6666;
}
`);
// 全局变量
let isSelectionMode = false;
// 定义默认提示词
const DEFAULT_PROMPT = "I will give you a picture, help me describe the main content of the picture. If there are people in the picture, describe their clothing, posture, and expressions, and give a simple compliment. Answer in Chinese";
// 在全局变量部分添加
const DEFAULT_API_KEY = '';
const DEFAULT_API_ENDPOINT = 'https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash-exp:generateContent';
const DEFAULT_MODEL = 'gemini-2.0-flash-exp';
// 添加支持的图片格式
const SUPPORTED_MIME_TYPES = [
'image/png',
'image/jpeg',
'image/webp',
'image/heic',
'image/heif'
];
const MAX_FILE_SIZE = 7 * 1024 * 1024; // 7MB
const TARGET_FILE_SIZE = 1 * 1024 * 1024; // 1MB
// 添加日志函数
function log(message, data = null) {
const timestamp = new Date().toISOString();
if (data) {
console.log(`[Gemini] ${timestamp} ${message}:`, data);
} else {
console.log(`[Gemini] ${timestamp} ${message}`);
}
}
// 修改图片压缩函数
async function compressImage(base64Image, mimeType) {
log('开始压缩图片', { mimeType });
return new Promise((resolve, reject) => {
const img = new Image();
img.onload = () => {
let quality = 0.9;
let canvas = document.createElement('canvas');
let ctx = canvas.getContext('2d');
let width = img.width;
let height = img.height;
log('原始图片尺寸', { width, height });
const MAX_DIMENSION = 2048;
if (width > MAX_DIMENSION || height > MAX_DIMENSION) {
const ratio = Math.min(MAX_DIMENSION / width, MAX_DIMENSION / height);
width *= ratio;
height *= ratio;
log('调整后的图片尺寸', { width, height });
}
canvas.width = width;
canvas.height = height;
ctx.drawImage(img, 0, 0, width, height);
const compress = () => {
const base64 = canvas.toDataURL(mimeType, quality);
const size = Math.ceil((base64.length * 3) / 4);
log('当前压缩质量和大小', { quality, size: `${(size / 1024 / 1024).toFixed(2)}MB` });
if (size > TARGET_FILE_SIZE && quality > 0.1) {
quality -= 0.1;
compress();
} else {
log('压缩完成', { finalQuality: quality, finalSize: `${(size / 1024 / 1024).toFixed(2)}MB` });
resolve(base64.split(',')[1]);
}
};
compress();
};
img.onerror = (error) => {
log('图片加载失败', error);
reject(error);
};
img.src = `data:${mimeType};base64,${base64Image}`;
});
}
// 修改图片上传函数
async function uploadImageToGemini(base64Image, mimeType) {
try {
log('开始上传图片', { mimeType });
// 转换为二进制数据
const binaryData = atob(base64Image);
const bytes = new Uint8Array(binaryData.length);
for (let i = 0; i < binaryData.length; i++) {
bytes[i] = binaryData.charCodeAt(i);
}
const blob = new Blob([bytes], { type: mimeType });
log('准备上传的文件大小', `${(blob.size / 1024 / 1024).toFixed(2)}MB`);
// 获取 API Key
const apiKey = GM_getValue('apiKey', DEFAULT_API_KEY);
if (!apiKey) {
throw new Error('请先在配置中设置 API Key');
}
// 第一步:发起 resumable 上传请求
log('发起 resumable 上传请求');
const initResponse = await fetch(`https://generativelanguage.googleapis.com/upload/v1beta/files?key=${apiKey}`, {
method: 'POST',
headers: {
'X-Goog-Upload-Protocol': 'resumable',
'X-Goog-Upload-Command': 'start',
'X-Goog-Upload-Header-Content-Length': blob.size.toString(),
'X-Goog-Upload-Header-Content-Type': mimeType,
'Content-Type': 'application/json'
},
body: JSON.stringify({
file: {
display_name: `image_${Date.now()}.${mimeType.split('/')[1]}`
}
})
});
if (!initResponse.ok) {
const errorData = await initResponse.text();
throw new Error(`上传初始化失败: HTTP ${initResponse.status} - ${errorData}`);
}
// 从响应头中获取上传 URL
const uploadUrl = initResponse.headers.get('x-goog-upload-url');
if (!uploadUrl) {
throw new Error('未能获取上传 URL');
}
// 第二步:上传实际的图片数据
log('开��上传图片数据');
const uploadResponse = await fetch(uploadUrl, {
method: 'POST',
headers: {
'Content-Length': blob.size.toString(),
'X-Goog-Upload-Offset': '0',
'X-Goog-Upload-Command': 'upload, finalize'
},
body: blob
});
if (!uploadResponse.ok) {
const errorData = await uploadResponse.text();
throw new Error(`上传文件失败: HTTP ${uploadResponse.status} - ${errorData}`);
}
const data = await uploadResponse.json();
if (data.file && data.file.uri) {
return data.file.uri;
} else {
throw new Error(`文件上传失败: ${JSON.stringify(data)}`);
}
} catch (error) {
log('上传图片失败', error);
throw error;
}
}
// 修改 fetchImageAsBase64 函数
async function fetchImageAsBase64(url) {
try {
log('开始通过 fetch 获取图片', url);
// 直接使用 GM_xmlhttpRequest 获取图片
return await new Promise((resolve, reject) => {
GM_xmlhttpRequest({
method: 'GET',
url: url,
responseType: 'blob',
headers: {
'Accept': 'image/*'
},
onload: function(response) {
if (response.status === 200) {
const reader = new FileReader();
reader.onloadend = () => {
const base64 = reader.result.split(',')[1];
resolve({
base64,
mimeType: response.response.type || 'image/jpeg'
});
};
reader.onerror = reject;
reader.readAsDataURL(response.response);
} else {
reject(new Error(`HTTP ${response.status}`));
}
},
onerror: function(error) {
log('GM_xmlhttpRequest 失败', error);
reject(error);
}
});
});
} catch (error) {
log('获取图片失败', error);
// 如果直接获取失败,尝试使用代理
const proxyServices = [
// 使用 cors-anywhere 代理
`https://cors-anywhere.herokuapp.com/${url}`,
// 使用 allOrigins 代理
`https://api.allorigins.win/raw?url=${encodeURIComponent(url)}`,
// 使用 crossorigin.me 代理
`https://crossorigin.me/${url}`,
// 使用 cors.bridged.cc 代理
`https://cors.bridged.cc/${url}`
];
for (const proxyUrl of proxyServices) {
try {
log('尝试使用代理', proxyUrl);
return await new Promise((resolve, reject) => {
GM_xmlhttpRequest({
method: 'GET',
url: proxyUrl,
responseType: 'blob',
headers: {
'Accept': 'image/*'
},
onload: function(response) {
if (response.status === 200) {
const reader = new FileReader();
reader.onloadend = () => {
const base64 = reader.result.split(',')[1];
resolve({
base64,
mimeType: response.response.type || 'image/jpeg'
});
};
reader.onerror = reject;
reader.readAsDataURL(response.response);
} else {
reject(new Error(`HTTP ${response.status}`));
}
},
onerror: reject
});
});
} catch (proxyError) {
log(`代理 ${proxyUrl} 请求失败`, proxyError);
continue;
}
}
throw new Error('无法获取图片数据: ' + error.message);
}
}
// 修改 imageToBase64 函数,添加更多错误检查
async function imageToBase64(imgElement) {
return new Promise((resolve, reject) => {
try {
// 检查是否是效的图片元素
if (!(imgElement instanceof HTMLImageElement)) {
throw new Error('无效的图片元素');
}
// 检查图片是否已加载
if (!imgElement.complete || !imgElement.naturalWidth) {
// 如果图片未加载完成,等待加载
imgElement.onload = () => processImage();
imgElement.onerror = () => reject(new Error('图片加载失败'));
return;
}
processImage();
function processImage() {
try {
const canvas = document.createElement('canvas');
canvas.width = imgElement.naturalWidth;
canvas.height = imgElement.naturalHeight;
const ctx = canvas.getContext('2d');
// 检查画布上下文是否创建成功
if (!ctx) {
throw new Error('无法创建 Canvas 上下文');
}
// 绘制图片到 canvas
ctx.drawImage(imgElement, 0, 0);
// 获取图片的实际 MIME 类型
let mimeType = 'image/jpeg'; // 默认格式
const src = imgElement.src;
// 检查图片源
if (!src) {
throw new Error('图片源无效');
}
// 从 src 获取 MIME 类型
if (src.startsWith('data:')) {
const match = src.match(/^data:([^;]+);/);
if (match) {
mimeType = match[1];
}
} else {
// 从文件扩展名获取 MIME 类型
const extension = src.toLowerCase().match(/\.([^.]+)$/);
if (extension) {
const ext = extension[1];
const mimeMap = {
'jpg': 'image/jpeg',
'jpeg': 'image/jpeg',
'png': 'image/png',
'webp': 'image/webp',
'gif': 'image/gif'
};
mimeType = mimeMap[ext] || 'image/jpeg';
}
}
log('处理图片', {
width: imgElement.naturalWidth,
height: imgElement.naturalHeight,
src: src.substring(0, 100) + '...',
mimeType: mimeType
});
try {
// 尝试使用原始格式
const base64 = canvas.toDataURL(mimeType, 1.0).split(',')[1];
if (!base64) {
throw new Error('Base64 转换失败');
}
resolve({ base64, mimeType });
} catch (e) {
log('原始格式转换失败,尝试使用 JPEG', e);
try {
// 降级到 JPEG
const base64 = canvas.toDataURL('image/jpeg', 0.9).split(',')[1];
if (!base64) {
throw new Error('JPEG 转换也失败了');
}
resolve({ base64, mimeType: 'image/jpeg' });
} catch (jpegError) {
// 如果 Canvas 转换都失败了,尝试直接获取图片数据
log('Canvas 转换失败,尝试直接获取图片', jpegError);
if (src.startsWith('data:')) {
const [header, base64] = src.split(',');
const mimeType = header.split(':')[1].split(';')[0];
if (base64 && mimeType) {
resolve({ base64, mimeType });
} else {
throw new Error('无法从 data URL 提取数据');
}
} else {
// 最后尝试通过 fetch 获取
fetchImageAsBase64(src).then(resolve).catch(reject);
}
}
}
} catch (error) {
log('图片处理失败', error);
// 尝试通过 fetch 获取
fetchImageAsBase64(imgElement.src).then(resolve).catch(reject);
}
}
} catch (error) {
log('图片处理过程出错', error);
reject(error);
}
});
}
// 修改生成描述的函数
async function generateImageDescription(imageBase64, prompt, mimeType) {
try {
log('开始生成图片描述');
log('使用的提示词', prompt);
const fileUri = await uploadImageToGemini(imageBase64, mimeType);
log('开始调用生成接口');
// 完全按照 demo-gemini.sh 的请求格式修改
const requestBody = {
contents: [{
parts: [
{
text: prompt || DEFAULT_PROMPT
},
{
file_data: { // 注意这里是 file_data 而不是 fileData
mime_type: mimeType, // 使用下划线格式
file_uri: fileUri // 使用下划线格式
}
}
]
}]
};
log('请求参数', requestBody);
// 修改请求 URL,使用 v1beta 版本的 API
const apiKey = GM_getValue('apiKey', DEFAULT_API_KEY);
const response = await fetch(`https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash-exp:generateContent?key=${apiKey}`, {
method: 'POST',
headers: {
'Content-Type': 'application/json'
},
body: JSON.stringify(requestBody)
});
const data = await response.json();
log('生成接口响应', data);
// 解析响应数据
if (data.candidates && data.candidates[0] && data.candidates[0].content) {
const text = data.candidates[0].content.parts[0].text;
log('成功生成描述');
return text;
} else {
throw new Error(data.error?.message || '无法获取图片描述');
}
} catch (error) {
log('生成描述失��', error);
throw error;
}
}
// 修改 API 检测功能
async function checkApiKey(apiKey) {
try {
log('开始验证 API Key');
const response = await fetch(`https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash-exp`, {
headers: {
'x-goog-api-key': apiKey
}
});
const data = await response.json();
log('API 验证响应', data);
if (data.name && data.name.includes('gemini-2.0-flash-exp')) {
log('API Key 验证成功');
return [data];
}
throw new Error('无效的 API Key 或模型不可用');
} catch (error) {
log('API 验证失败', error);
throw new Error(`API 验证失败: ${error.message}`);
}
}
// 显示toast提示
function showToast(message, duration = 3000) {
const toast = document.createElement('div');
toast.className = 'ai-toast';
toast.textContent = message;
document.body.appendChild(toast);
setTimeout(() => {
toast.remove();
}, duration);
}
// 修改 findImage 函数,增强懒加载图片的检测
function findImage(target) {
let img = null;
let imgSrc = null;
// 检查是否为图片元素
if (target.nodeName === 'IMG') {
img = target;
// 优先获取 data-src(懒加载原图)
imgSrc = target.getAttribute('data-src') ||
target.getAttribute('data-original') ||
target.getAttribute('data-actualsrc') ||
target.getAttribute('data-url') ||
target.getAttribute('data-echo') ||
target.getAttribute('data-lazy-src') ||
target.getAttribute('data-original-src') ||
target.src; // 最后才使用 src 属性
}
// 检查背景图
else if (target.style && target.style.backgroundImage) {
let bgImg = target.style.backgroundImage.match(/url\(['"]?([^'"]+)['"]?\)/);
if (bgImg) {
imgSrc = bgImg[1];
img = target;
}
}
// 检查父元素的背景图
else {
let parent = target.parentElement;
if (parent && parent.style && parent.style.backgroundImage) {
let bgImg = parent.style.backgroundImage.match(/url\(['"]?([^'"]+)['"]?\)/);
if (bgImg) {
imgSrc = bgImg[1];
img = parent;
}
}
}
// 检查常见的图片容器
if (!img) {
// 检查父元素是否为图片容器
let imgWrapper = target.closest('[class*="img"],[class*="photo"],[class*="image"],[class*="thumb"],[class*="avatar"],[class*="masonry"]');
if (imgWrapper) {
// 在容器中查找图片元素
let possibleImg = imgWrapper.querySelector('img');
if (possibleImg) {
img = possibleImg;
// 同样优先获取懒加载原图
imgSrc = possibleImg.getAttribute('data-src') ||
possibleImg.getAttribute('data-original') ||
possibleImg.getAttribute('data-actualsrc') ||
possibleImg.getAttribute('data-url') ||
possibleImg.getAttribute('data-echo') ||
possibleImg.getAttribute('data-lazy-src') ||
possibleImg.getAttribute('data-original-src') ||
possibleImg.src;
} else {
// 检查容器的背景图
let bgImg = getComputedStyle(imgWrapper).backgroundImage.match(/url\(['"]?([^'"]+)['"]?\)/);
if (bgImg) {
imgSrc = bgImg[1];
img = imgWrapper;
}
}
}
}
// 检查特殊情况:某些网站使用自定义属性存储真实图片地址
if (img && !imgSrc) {
// 获取元素的所有属性
const attrs = img.attributes;
for (let i = 0; i < attrs.length; i++) {
const attr = attrs[i];
// 检查属性名中���否包含关键字
if (attr.name.toLowerCase().includes('src') ||
attr.name.toLowerCase().includes('url') ||
attr.name.toLowerCase().includes('img') ||
attr.name.toLowerCase().includes('thumb') ||
attr.name.toLowerCase().includes('original') ||
attr.name.toLowerCase().includes('data')) {
const value = attr.value;
if (value && /^https?:\/\//.test(value)) {
imgSrc = value;
break;
}
}
}
}
// 检查父级链接
if (img && !imgSrc) {
let parentLink = img.closest('a');
if (parentLink && parentLink.href) {
if (/\.(jpe?g|png|webp|gif)$/i.test(parentLink.href)) {
imgSrc = parentLink.href;
}
}
}
// 如果找到了图片但没有找到有效的 URL,记录日志
if (img && !imgSrc) {
log('找到图片元素但未找到有效的图片URL', {
element: img,
attributes: Array.from(img.attributes).map(attr => `${attr.name}="${attr.value}"`).join(', ')
});
}
return { img, imgSrc };
}
// 修改点击处理函数
function clickHandler(e) {
if (!isSelectionMode) return;
const { img, imgSrc } = findImage(e.target);
if (!img || !imgSrc) return;
e.preventDefault();
e.stopPropagation();
// 检查图片是否有效
if (img instanceof HTMLImageElement) {
if (!img.complete || !img.naturalWidth) {
showToast('图片未加载完成或无效');
return;
}
if (img.naturalWidth < 10 || img.naturalHeight < 10) {
showToast('图片太小,无法处理');
return;
}
}
processImage(img, imgSrc);
}
// 进入图片选择模式
function enterImageSelectionMode() {
if (isSelectionMode) return;
isSelectionMode = true;
const floatingBtn = document.querySelector('.ai-floating-btn');
if (floatingBtn) {
floatingBtn.style.display = 'none';
}
const overlay = document.createElement('div');
overlay.className = 'ai-selection-overlay';
document.body.appendChild(overlay);
document.body.classList.add('ai-selecting-image');
document.addEventListener('click', clickHandler, true);
const escHandler = (e) => {
if (e.key === 'Escape') {
exitImageSelectionMode();
}
};
document.addEventListener('keydown', escHandler);
window._imageSelectionHandlers = {
click: clickHandler,
keydown: escHandler
};
}
// 退出图片选择模式
function exitImageSelectionMode() {
isSelectionMode = false;
const floatingBtn = document.querySelector('.ai-floating-btn');
if (floatingBtn) {
floatingBtn.style.display = 'flex';
}
const overlay = document.querySelector('.ai-selection-overlay');
if (overlay) {
overlay.remove();
}
document.body.classList.remove('ai-selecting-image');
if (window._imageSelectionHandlers) {
document.removeEventListener('click', window._imageSelectionHandlers.click, true);
document.removeEventListener('keydown', window._imageSelectionHandlers.keydown);
window._imageSelectionHandlers = null;
}
}
// 修改配置界面创建函数
function createConfigUI() {
const existingModal = document.querySelector('.ai-modal-overlay');
if (existingModal) {
existingModal.remove();
}
const overlay = document.createElement('div');
overlay.className = 'ai-modal-overlay';
const modal = document.createElement('div');
modal.className = 'ai-config-modal';
modal.innerHTML = `
<h3>AI图像描述配置</h3>
<div class="input-group">
<label>API Endpoint:</label>
<div class="input-wrapper">
<input type="text" id="ai-endpoint" placeholder="https://api.openai.com" value="${DEFAULT_API_ENDPOINT}" readonly>
</div>
</div>
<div class="input-group">
<label>API Key:</label>
<div class="input-wrapper">
<input type="password" id="ai-apikey" placeholder="输入你的 API Key" value="${GM_getValue('apiKey', DEFAULT_API_KEY)}">
<span class="input-icon toggle-password" title="显示/隐藏">👁️</span>
</div>
</div>
<div class="input-group">
<label>使用模型:</label>
<select id="ai-model" disabled>
<option value="${DEFAULT_MODEL}">${DEFAULT_MODEL}</option>
</select>
</div>
<div class="input-group">
<label>提示词:</label>
<div class="input-wrapper">
<textarea id="ai-prompt" rows="4" style="width: 100%; resize: vertical;">${GM_getValue('customPrompt', DEFAULT_PROMPT)}</textarea>
<span class="input-icon clear-icon" title="重置为默认值">↺</span>
</div>
</div>
<div class="button-group">
<button type="button" class="cancel-button" id="ai-cancel-config">取消</button>
<button type="button" class="save-button" id="ai-save-config">保存</button>
</div>
`;
overlay.appendChild(modal);
document.body.appendChild(overlay);
// 添加密码显示/隐藏功能
const togglePassword = modal.querySelector('.toggle-password');
const apiKeyInput = modal.querySelector('#ai-apikey');
if (togglePassword && apiKeyInput) {
togglePassword.addEventListener('click', function() {
const type = apiKeyInput.type === 'password' ? 'text' : 'password';
apiKeyInput.type = type;
this.textContent = type === 'password' ? '👁️' : '👁️🗨️';
});
}
// 保留提示词的重置功能
const clearButtons = modal.querySelectorAll('.clear-icon');
clearButtons.forEach(button => {
button.addEventListener('click', function(e) {
const input = this.parentElement.querySelector('textarea');
if (input && input.id === 'ai-prompt') {
input.value = DEFAULT_PROMPT;
input.focus();
}
});
});
// 修改保存按钮事件
const saveButton = modal.querySelector('#ai-save-config');
if (saveButton) {
saveButton.addEventListener('click', function(e) {
e.preventDefault();
e.stopPropagation();
const apiKey = modal.querySelector('#ai-apikey').value.trim();
const customPrompt = modal.querySelector('#ai-prompt').value.trim();
// 保存配置
if (apiKey) {
GM_setValue('apiKey', apiKey);
}
if (customPrompt) {
GM_setValue('customPrompt', customPrompt);
}
showToast('配置已保存');
overlay.remove();
});
}
// 取消配置
const cancelButton = modal.querySelector('#ai-cancel-config');
if (cancelButton) {
cancelButton.addEventListener('click', function(e) {
e.preventDefault();
e.stopPropagation();
overlay.remove();
});
}
// 点击遮罩层关闭
overlay.addEventListener('click', function(e) {
if (e.target === overlay) {
overlay.remove();
}
});
// 阻止模态框内的点击事件冒泡
modal.addEventListener('click', function(e) {
e.stopPropagation();
});
}
// 创建悬浮按钮
function createFloatingButton() {
const btn = document.createElement('div');
btn.className = 'ai-floating-btn';
btn.innerHTML = `
<svg viewBox="0 0 24 24">
<path d="M12 2C6.48 2 2 6.48 2 12s4.48 10 10 10 10-4.48 10-10S17.52 2 12 2zm0 18c-4.42 0-8-3.58-8-8s3.58-8 8-8 8 3.58 8 8-3.58 8-8 8zm0-14c-3.31 0-6 2.69-6 6s2.69 6 6 6 6-2.69 6-6-2.69-6-6-6zm0 10c-2.21 0-4-1.79-4-4h2c0-1.1.9-2 2-2s2 .9 2 2c0 2-3 1.75-3 5h2c0-2.25 3-2.5 3-5 0-2.21-1.79-4-4-4z"/>
</svg>
`;
const savedPos = JSON.parse(GM_getValue('btnPosition', '{"x": 20, "y": 20}'));
btn.style.left = (savedPos.x || 20) + 'px';
btn.style.top = (savedPos.y || 20) + 'px';
btn.style.right = 'auto';
btn.style.bottom = 'auto';
let isDragging = false;
let hasMoved = false;
let startX, startY;
let initialLeft, initialTop;
let longPressTimer;
let touchStartTime;
// 触屏事件处理
btn.addEventListener('touchstart', function (e) {
e.preventDefault();
touchStartTime = Date.now();
longPressTimer = setTimeout(() => {
exitImageSelectionMode();
createConfigUI();
}, 500);
const touch = e.touches[0];
startX = touch.clientX;
startY = touch.clientY;
const rect = btn.getBoundingClientRect();
initialLeft = rect.left;
initialTop = rect.top;
});
btn.addEventListener('touchmove', function (e) {
e.preventDefault();
clearTimeout(longPressTimer);
const touch = e.touches[0];
const deltaX = touch.clientX - startX;
const deltaY = touch.clientY - startY;
if (Math.abs(deltaX) > 5 || Math.abs(deltaY) > 5) {
hasMoved = true;
}
const newLeft = Math.max(0, Math.min(window.innerWidth - btn.offsetWidth, initialLeft + deltaX));
const newTop = Math.max(0, Math.min(window.innerHeight - btn.offsetHeight, initialTop + deltaY));
btn.style.left = newLeft + 'px';
btn.style.top = newTop + 'px';
});
btn.addEventListener('touchend', function (e) {
e.preventDefault();
clearTimeout(longPressTimer);
const touchDuration = Date.now() - touchStartTime;
if (!hasMoved && touchDuration < 500) {
enterImageSelectionMode();
}
if (hasMoved) {
const rect = btn.getBoundingClientRect();
GM_setValue('btnPosition', JSON.stringify({
x: rect.left,
y: rect.top
}));
}
hasMoved = false;
});
// 鼠标事件处理
btn.addEventListener('click', function (e) {
if (e.button === 0 && !hasMoved) {
enterImageSelectionMode();
e.stopPropagation();
}
hasMoved = false;
});
btn.addEventListener('contextmenu', function (e) {
e.preventDefault();
exitImageSelectionMode();
createConfigUI();
});
// 拖拽相关事件
function dragStart(e) {
if (e.target === btn || btn.contains(e.target)) {
isDragging = true;
hasMoved = false;
const rect = btn.getBoundingClientRect();
startX = e.clientX;
startY = e.clientY;
initialLeft = rect.left;
initialTop = rect.top;
e.preventDefault();
}
}
function drag(e) {
if (isDragging) {
e.preventDefault();
const deltaX = e.clientX - startX;
const deltaY = e.clientY - startY;
if (Math.abs(deltaX) > 5 || Math.abs(deltaY) > 5) {
hasMoved = true;
}
const newLeft = Math.max(0, Math.min(window.innerWidth - btn.offsetWidth, initialLeft + deltaX));
const newTop = Math.max(0, Math.min(window.innerHeight - btn.offsetHeight, initialTop + deltaY));
btn.style.left = newLeft + 'px';
btn.style.top = newTop + 'px';
}
}
function dragEnd(e) {
if (isDragging) {
isDragging = false;
const rect = btn.getBoundingClientRect();
GM_setValue('btnPosition', JSON.stringify({
x: rect.left,
y: rect.top
}));
}
}
btn.addEventListener('mousedown', dragStart);
document.addEventListener('mousemove', drag);
document.addEventListener('mouseup', dragEnd);
document.body.appendChild(btn);
return btn;
}
// 添加 processImage 函数
async function processImage(img, imgSrc) {
try {
showToast('正在处理图片...');
// 获取图片数据
let imgData;
if (img instanceof HTMLImageElement) {
imgData = await imageToBase64(img);
} else {
// 对于背景图等情况,直接获取图片
imgData = await fetchImageAsBase64(imgSrc);
}
if (!imgData || !imgData.base64) {
throw new Error('无法获取图片数据');
}
log('获取到图片数据', {
mimeType: imgData.mimeType,
dataLength: imgData.base64.length,
source: imgSrc
});
// 获取用户设置的提示词
const customPrompt = GM_getValue('customPrompt', DEFAULT_PROMPT);
// 调用 Gemini API 获取描述
const description = await generateImageDescription(imgData.base64, customPrompt, imgData.mimeType);
// 显示结果
showResult(description);
// 处理完成后退出选择模式
exitImageSelectionMode();
} catch (error) {
log('处理图片失败', error);
showToast(`处理失败: ${error.message}`);
}
}
// 添加显示结果的函数
function showResult(description) {
// 移除已存在的结果框
const existingResult = document.querySelector('.ai-result-modal');
if (existingResult) {
existingResult.remove();
}
// 创建结果框
const resultModal = document.createElement('div');
resultModal.className = 'ai-result-modal';
resultModal.innerHTML = `
<div class="result-content">
<div class="description-code">
<code>${description}</code>
</div>
<div class="copy-hint">点击上方文本可复制</div>
<button class="close-button">×</button>
</div>
`;
// 添加复制功能
const codeBlock = resultModal.querySelector('.description-code');
codeBlock.addEventListener('click', () => {
const text = codeBlock.textContent;
GM_setClipboard(text);
showToast('已复制到剪贴板');
});
// 添加关闭功能
const closeButton = resultModal.querySelector('.close-button');
closeButton.addEventListener('click', () => {
resultModal.remove();
});
document.body.appendChild(resultModal);
}
// 初始化
function initialize() {
if (document.readyState === 'loading') {
document.addEventListener('DOMContentLoaded', () => {
createFloatingButton();
});
} else {
createFloatingButton();
}
}
// 启动脚本
initialize();
})();