douyin-user-data-download

下载抖音用户主页数据!

当前为 2024-06-20 提交的版本,查看 最新版本

  1. // ==UserScript==
  2. // @name douyin-user-data-download
  3. // @namespace http://tampermonkey.net/
  4. // @version 0.5.2
  5. // @description 下载抖音用户主页数据!
  6. // @author xxmdmst
  7. // @match https://www.douyin.com/*
  8. // @icon https://xxmdmst.oss-cn-beijing.aliyuncs.com/imgs/favicon.ico
  9. // @grant GM_registerMenuCommand
  10. // @grant GM_setValue
  11. // @grant GM_getValue
  12. // @require https://cdnjs.cloudflare.com/ajax/libs/jszip/3.6.0/jszip.min.js
  13. // @license MIT
  14. // ==/UserScript==
  15.  
  16. (function () {
  // Address of the local service that receives captured data (persisted via GM storage).
  let localDownloadUrl = GM_getValue("localDownloadUrl", 'http://localhost:8080/data');

  /**
   * Ask the user to confirm switching the local reporting channel on or off;
   * on confirmation the choice is persisted and the page is reloaded.
   * @param {boolean} start - true to enable the channel, false to disable it.
   */
  const startPipeline = (start) => {
    const question = start
      ? "是否开启本地下载通道?\n开启后会向本地服务发送数据,服务地址:\n" + localDownloadUrl
      : "是否关闭本地下载通道?";
    if (!confirm(question)) return;
    GM_setValue("localDownload", start);
    window.location.reload();
  };

  // Whether the local reporting channel is currently enabled.
  let localDownload = GM_getValue("localDownload", false);

  // Exactly one toggle entry is registered; it always offers the opposite of the current state.
  GM_registerMenuCommand(
    localDownload ? "✅关闭上报本地通道" : "⛔️开启上报本地通道",
    () => {
      startPipeline(!localDownload);
    }
  );
  35.  
  // Menu command: let the user change the address captured data is reported to.
  GM_registerMenuCommand("♐设置本地上报地址", () => {
    const defaultUrl = 'http://localhost:8080/data';
    // Re-read the stored value so the prompt shows what is actually persisted.
    localDownloadUrl = GM_getValue("localDownloadUrl", defaultUrl);
    const answer = prompt("请输入新的上报地址:", localDownloadUrl);
    // null means the prompt was cancelled: keep everything unchanged.
    if (answer === null) return;
    let newlocalDownloadUrl = answer.trim();
    if (!newlocalDownloadUrl) {
      // A blank answer restores the default address.
      newlocalDownloadUrl = defaultUrl;
      toast("设置了空白地址,已经恢复默认地址为:" + newlocalDownloadUrl);
    } else if (localDownloadUrl !== newlocalDownloadUrl) {
      toast("当前上报地址已经修改为:" + newlocalDownloadUrl);
    }
    // Persist once and update the in-memory copy used by sendLocalData().
    GM_setValue("localDownloadUrl", newlocalDownloadUrl);
    localDownloadUrl = newlocalDownloadUrl;
  });
  // Menu command: wipe the status text box.
  GM_registerMenuCommand("🔄清空信息内容", () => {
    // msg_pre only exists after createMsgBox() has run; ignore the command until then.
    if (msg_pre) msg_pre.textContent = "";
  });
  // Upper bound on how many author records are written to localStorage.
  let max_author_num = GM_getValue("max_author_num", 1000);
  // Menu command: let the user change that bound.
  GM_registerMenuCommand("👤设置最大缓存作者数", () => {
    const answer = prompt("设置最大缓存作者数:", max_author_num);
    // null means the prompt was cancelled.
    if (answer === null) return;
    const digits = answer.trim();
    const parsed = Number.parseInt(digits, 10);
    // Only plain decimal digits are accepted, and the value must be at least 1:
    // a limit of 0 would make the cache store nothing.
    if (!/^\d+$/.test(digits) || parsed < 1) {
      toast("请输入正整数!");
      return;
    }
    max_author_num = parsed;
    GM_setValue("max_author_num", max_author_num);
    toast("当前最大缓存作者数已经修改为:" + max_author_num);
  });
  // Lookup built on first use by initGbkTable(): index is a UTF-16 code unit,
  // value is the packed GBK byte pair (b2 << 8 | b1), or 0xFFFF when unmapped.
  let table;

  /**
   * Build `table` by enumerating two-byte GBK codes, decoding them all with
   * TextDecoder('gbk') and recording, for each decoded code unit, the code
   * that produced it.
   */
  function initGbkTable() {
    // https://en.wikipedia.org/wiki/GBK_(character_encoding)#Encoding
    // Each row is [b1 first, b1 last, b2 first, b2 last].
    const byteRanges = [
      [0xA1, 0xA9, 0xA1, 0xFE],
      [0xB0, 0xF7, 0xA1, 0xFE],
      [0x81, 0xA0, 0x40, 0xFE],
      [0xAA, 0xFE, 0x40, 0xA0],
      [0xA8, 0xA9, 0x40, 0xA0],
      [0xAA, 0xAF, 0xA1, 0xFE],
      [0xF8, 0xFE, 0xA1, 0xFE],
      [0xA1, 0xA7, 0x40, 0xA0],
    ];
    const packedCodes = new Uint16Array(23940);
    let count = 0;

    byteRanges.forEach(([b1First, b1Last, b2First, b2Last]) => {
      for (let second = b2First; second <= b2Last; second++) {
        // 0x7F is skipped as a second byte.
        if (second === 0x7F) continue;
        for (let first = b1First; first <= b1Last; first++) {
          packedCodes[count++] = second << 8 | first;
        }
      }
    });

    // Start with every entry marked "no mapping".
    table = new Uint16Array(65536);
    table.fill(0xFFFF);

    // The decoder reads the raw bytes of the Uint16Array; position k of the
    // decoded text is paired with packedCodes[k].
    const decoded = new TextDecoder('gbk').decode(packedCodes);
    for (let pos = 0; pos < decoded.length; pos++) {
      table[decoded.charCodeAt(pos)] = packedCodes[pos];
    }
  }
  98.  
  /**
   * Encode a string as GBK bytes using the lazily-built lookup `table`.
   * @param {string} str - text to encode.
   * @param {{onAlloc?: function(number): *, onError?: function(number, string): number}} [opt]
   *   onAlloc(len) supplies the output buffer; onError(index, str) supplies a
   *   replacement for a code unit with no mapping (-1 stops encoding, a value
   *   above 0xFF is written as two bytes, anything else as one byte).
   * @returns {*} `subarray(0, n)` of the buffer, where n is the number of bytes written.
   */
  function str2gbk(str, opt = {}) {
    if (!table) {
      initGbkTable();
    }
    // Use Buffer.allocUnsafe when a Buffer global exists, otherwise a plain Uint8Array.
    const nodeAlloc = typeof Buffer === 'function' && Buffer.allocUnsafe;
    const fallbackAlloc = nodeAlloc
      ? (len) => nodeAlloc(len)
      : (len) => new Uint8Array(len);
    // 63 is the character code of '?'.
    const fallbackOnError = () => 63;
    const allocate = opt.onAlloc || fallbackAlloc;
    const replaceUnmapped = opt.onError || fallbackOnError;

    // Worst case is two bytes per UTF-16 code unit.
    const out = allocate(str.length * 2);
    let written = 0;

    for (let pos = 0; pos < str.length; pos++) {
      const unit = str.charCodeAt(pos);
      if (unit < 0x80) {
        // Code units below 0x80 are copied through as a single byte.
        out[written++] = unit;
        continue;
      }
      const packed = table[unit];
      if (packed !== 0xFFFF) {
        // The low byte is stored first, then the high byte.
        out[written++] = packed;
        out[written++] = packed >> 8;
        continue;
      }
      if (unit === 8364) {
        // U+20AC (euro sign) is written as the single byte 0x80.
        out[written++] = 0x80;
        continue;
      }
      const replacement = replaceUnmapped(pos, str);
      if (replacement === -1) {
        break;
      }
      if (replacement > 0xFF) {
        out[written++] = replacement;
        out[written++] = replacement >> 8;
      } else {
        out[written++] = replacement;
      }
    }
    return out.subarray(0, written);
  }
  142.  
  /**
   * Show a transient message box fixed at the centre of the page.
   * @param {string} msg - text to display.
   * @param {number} [duration] - milliseconds before fading out; 3000 when not a number.
   */
  const toast = (msg, duration) => {
    const visibleMs = isNaN(duration) ? 3000 : duration;
    const fadeSeconds = 0.5;

    const toastDom = document.createElement('pre');
    toastDom.textContent = msg;
    toastDom.style.cssText = 'padding:2px 15px;min-height: 36px;line-height: 36px;text-align: center;transform: translate(-50%);border-radius: 4px;color: rgb(255, 255, 255);position: fixed;top: 50%;left: 50%;z-index: 9999999;background: rgb(0, 0, 0);font-size: 16px;'
    document.body.appendChild(toastDom);

    // Second stage: drop the element once the fade has had time to finish.
    const detach = () => {
      document.body.removeChild(toastDom);
    };
    // First stage: start the opacity transition.
    const fadeOut = () => {
      toastDom.style.transition = `transform ${fadeSeconds}s ease-in, opacity ${fadeSeconds}s ease-in`;
      toastDom.style.opacity = '0';
      setTimeout(detach, fadeSeconds * 1000);
    };
    setTimeout(fadeOut, visibleMs);
  };
  158.  
  /**
   * Render a duration in seconds as hours/minutes/seconds text, leaving out
   * every component that is not greater than zero.
   * @param {number} seconds - duration in seconds.
   * @returns {string} e.g. "1小时1分1秒"; empty string when no component is positive.
   */
  function formatSeconds(seconds) {
    const components = [
      [Math.floor(seconds / 3600), '小时'],
      [Math.floor((seconds % 3600) / 60), '分'],
      [seconds % 60, '秒'],
    ];
    let text = '';
    for (const [amount, unit] of components) {
      if (amount > 0) {
        text += amount + unit;
      }
    }
    return text;
  }
  168.  
  169. const timeFormat = (timestamp = null, fmt = 'yyyy-mm-dd') => {
  170. // 其他更多是格式化有如下:
  171. // yyyy:mm:dd|yyyy:mm|yyyy年mm月dd日|yyyy年mm月dd日 hh时MM分等,可自定义组合
  172. timestamp = parseInt(timestamp);
  173. // 如果为null,则格式化当前时间
  174. if (!timestamp) timestamp = Number(new Date());
  175. // 判断用户输入的时间戳是秒还是毫秒,一般前端js获取的时间戳是毫秒(13位),后端传过来的为秒(10位)
  176. if (timestamp.toString().length === 10) timestamp *= 1000;
  177. let date = new Date(timestamp);
  178. let ret;
  179. let opt = {
  180. "y{4,}": date.getFullYear().toString(), // 年
  181. "y+": date.getFullYear().toString().slice(2,), // 年
  182. "m+": (date.getMonth() + 1).toString(), // 月
  183. "d+": date.getDate().toString(), // 日
  184. "h+": date.getHours().toString(), // 时
  185. "M+": date.getMinutes().toString(), // 分
  186. "s+": date.getSeconds().toString() // 秒
  187. // 有其他格式化字符需求可以继续添加,必须转化成字符串
  188. };
  189. for (let k in opt) {
  190. ret = new RegExp("(" + k + ")").exec(fmt);
  191. if (ret) {
  192. fmt = fmt.replace(ret[1], (ret[1].length === 1) ? (opt[k]) : (opt[k].padStart(ret[1].length, "0")))
  193. }
  194. }
  195. return fmt
  196. };
  // Captured works keyed by aweme id, and captured authors keyed by uid.
  // Both are published on window.
  window.all_aweme_map = new Map();
  window.user_map = new Map();
  // Restore authors cached by an earlier session.
  const user_local_data = localStorage.getItem('user_local_data');
  if (user_local_data) {
    try {
      const cachedUsers = JSON.parse(user_local_data);
      if (Array.isArray(cachedUsers)) {
        cachedUsers.forEach((userInfo) => {
          // Skip null/primitive entries that cannot carry a uid.
          if (userInfo) user_map.set(userInfo.uid, userInfo);
        });
      }
    } catch (error) {
      // A corrupt cache must not stop the rest of the script from starting;
      // it is overwritten the next time an author profile is captured.
      console.log('本地缓存的作者数据无法解析,已忽略:', error);
    }
  }
  // uid of the author whose profile was captured most recently; null until one is seen.
  let current_user_id = null;
  // Author record field -> label used when copying author info.
  // The key order is the order the lines are emitted in.
  const user_key = {
    nickname: "昵称",
    following_count: "关注",
    mplatform_followers_count: "粉丝",
    total_favorited: "获赞",
    unique_id: "抖音号",
    ip_location: "IP属地",
    gender: "性别",
    city: "位置",
    signature: "签名",
    aweme_count: "作品数",
  };
  218.  
  /**
   * Copy text to the clipboard and report the outcome both on the given node
   * and through a toast; the node's label is restored two seconds after the call.
   * @param {string} text - text to copy.
   * @param {Node} node - element whose textContent temporarily shows the result.
   */
  function copyText(text, node) {
    const previousLabel = node.textContent;
    const onSuccess = () => {
      node.textContent = "复制成功";
      // Only the first 20 characters are echoed back to the user.
      const preview = text.slice(0, 20) + (text.length > 20 ? "..." : "");
      toast("复制成功\n" + preview, 2000);
    };
    const onFailure = () => {
      node.textContent = "复制失败";
      toast("复制失败", 2000);
    };
    navigator.clipboard.writeText(text).then(onSuccess).catch(onFailure);
    setTimeout(() => {
      node.textContent = previousLabel;
    }, 2000);
  }
  230.  
  /**
   * Copy the current author's profile to the clipboard as "label:value" lines,
   * one per field listed in user_key; fields with an empty value are left out.
   * @param {Node} node - element used by copyText() to show the result.
   */
  function copyUserData(node) {
    if (!current_user_id) {
      toast("还没有捕获到用户数据!");
      return;
    }
    const userInfo = user_map.get(current_user_id);
    const lines = [];
    Object.keys(user_key).forEach((field) => {
      const value = (userInfo[field] || "").toString().trim();
      if (value) {
        lines.push(user_key[field] + ":" + value);
      }
    });
    copyText(lines.join("\n"), node);
  }
  244.  
  /**
   * Create a half-transparent button absolutely positioned at the right edge
   * of its container.
   * @param {string} text - button label.
   * @param {string} top - CSS `top` value.
   * @param {function(): void} [func] - click action; when given, the click is
   *   also stopped from propagating and its default action is prevented.
   * @returns {HTMLButtonElement} the new, not yet attached button.
   */
  function createVideoButton(text, top, func) {
    const button = document.createElement("button");
    button.textContent = text;
    Object.assign(button.style, {
      position: "absolute",
      right: "0px",
      top: top,
      opacity: "0.5",
    });
    if (!func) return button;
    button.addEventListener("click", (event) => {
      event.preventDefault();
      event.stopPropagation();
      func();
    });
    return button;
  }
  261.  
  /**
   * Trigger a browser download of a blob through a temporary anchor element.
   * @param {Blob} blob - content to save.
   * @param {string|null} filename - base name; null selects the current
   *   author's nickname, or the page title when no author has been captured.
   * @param {string} ext - file extension without the dot.
   * @param {string} [prefix] - text put in front of the cleaned base name.
   */
  function createDownloadLink(blob, filename, ext, prefix = "") {
    let baseName = filename;
    if (baseName === null) {
      baseName = current_user_id ? user_map.get(current_user_id).nickname : document.title;
    }
    const objectUrl = URL.createObjectURL(blob);
    const anchor = document.createElement('a');
    anchor.href = objectUrl;
    // Remove the listed punctuation and all whitespace, then keep at most 40 characters.
    const cleaned = baseName.replace(/[\/:*?"<>|\s]/g, "").slice(0, 40);
    anchor.download = prefix + cleaned + "." + ext;
    anchor.click();
    URL.revokeObjectURL(objectUrl);
  }
  273.  
  /**
   * Save text (or a byte array) as a downloadable file.
   * @param {*} txt - content placed into the Blob.
   * @param {string|null} filename - base name, forwarded to createDownloadLink().
   * @param {string} ext - file extension without the dot.
   */
  function txt2file(txt, filename, ext) {
    const blob = new Blob([txt], {type: 'text/plain'});
    createDownloadLink(blob, filename, ext);
  }
  277.  
  /**
   * Derive a short name for a work, used for download and zip entry names.
   * The first non-empty value of item_title, caption, desc, awemeId is cleaned
   * and prefixed with the work's date when one is present.
   * @param {object} aweme - formatted work record.
   * @returns {string} "【yyyy-mm-dd】name", or just the name when there is no date.
   */
  function getAwemeName(aweme) {
    const rawName = aweme.item_title || aweme.caption || aweme.desc || aweme.awemeId;
    const datePrefix = aweme.date ? `【${aweme.date.slice(0, 10)}】` : "";
    // Remove the listed punctuation and whitespace, cap at 27 characters,
    // then drop a trailing ".<digits>" group.
    const cleaned = rawName
      .replace(/[\/:*?"<>|\s]+/g, "")
      .slice(0, 27)
      .replace(/\.\d+$/g, "");
    return datePrefix + cleaned;
  }
  283.  
  /**
   * Download a work's media through XHR and hand it to the browser as a file,
   * showing the progress percentage on the given node.
   * @param {object} aweme - formatted work record; its `url` is fetched.
   * @param {Node} node - element whose textContent shows the progress.
   */
  const downloadVideo = (aweme, node) => {
    // Without a record or URL there is nothing to fetch.
    if (!aweme || !aweme.url) {
      toast('未捕获到对应数据源!');
      return;
    }
    toast("准备就绪,等待视频下载完毕后弹出下载界面!");
    const originalLabel = node.textContent;
    // The label is restored two seconds after the request settles, on success or failure.
    const restoreLabel = () => setTimeout(() => node.textContent = originalLabel, 2000);
    const filename = getAwemeName(aweme);

    const xhr = new XMLHttpRequest();
    xhr.open('GET', aweme.url.replace("http://", "https://"), true);
    xhr.responseType = 'blob';
    xhr.onload = () => {
      if (xhr.status >= 200 && xhr.status < 300) {
        // Records that carry images are saved with an mp3 extension, all others as mp4.
        createDownloadLink(xhr.response, filename, (aweme.images ? "mp3" : "mp4"));
      } else {
        // An error response body must not be saved as if it were the media.
        toast("视频下载失败,状态码:" + xhr.status);
      }
      restoreLabel();
    };
    xhr.onerror = () => {
      toast("视频下载失败,请稍后重试!");
      restoreLabel();
    };
    xhr.onprogress = (event) => {
      if (event.lengthComputable) {
        node.textContent = "下载" + (event.loaded * 100 / event.total).toFixed(1) + '%';
      }
    };
    xhr.send();
  };
  /**
   * Download every image of one work, pack them into a zip and offer it as a
   * download, reporting progress on the given button.
   * @param {object} aweme - formatted work record with an `images` URL array.
   * @param {Node} downloadImageButton - element whose textContent shows the progress.
   */
  const downloadImage = (aweme, downloadImageButton) => {
    const zip = new JSZip();
    const originalLabel = downloadImageButton.textContent;
    downloadImageButton.textContent = "图片下载并打包中...";
    const promises = aweme.images.map((link, index) => {
      return fetch(link)
        .then((response) => {
          // An error page must not end up in the archive as an image.
          if (!response.ok) throw new Error("HTTP " + response.status + " " + link);
          return response.arrayBuffer();
        })
        .then((buffer) => {
          downloadImageButton.textContent = `图片已下载【${index + 1}/${aweme.images.length}】`;
          zip.file(`image_${index + 1}.jpg`, buffer);
        });
    });
    Promise.all(promises)
      .then(() => zip.generateAsync({type: "blob"}))
      .then((content) => {
        createDownloadLink(content, getAwemeName(aweme), "zip", "【图文】");
      })
      .catch((error) => {
        console.log("图片打包下载失败:", error);
        toast("图片下载失败,请稍后重试!");
      })
      .then(() => {
        // Runs after success and after failure, so the label never stays on a progress text.
        setTimeout(() => downloadImageButton.textContent = originalLabel, 2000);
      });
  };
  323.  
  /**
   * Attach the per-work tool buttons (copy description, open source, download
   * video, and for image works download images) to a work link.
   * Does nothing when the link was already processed, when its href holds no
   * video/note id, or when no data has been captured for that id yet.
   * @param {HTMLAnchorElement} aNode - link to a /video/<id> or /note/<id> page.
   */
  function createButtonGroup(aNode) {
    // dataset.vid marks links that already carry their buttons.
    if (aNode.dataset.vid) return;
    const match = aNode.href.match(/(?:video|note)\/(\d+)/);
    if (!match) return;
    const videoId = match[1];
    const aweme = all_aweme_map.get(videoId);
    // No data yet: leave the link unmarked so a later call can retry, instead
    // of failing half-way and stacking duplicate buttons on every attempt.
    if (!aweme) return;

    // Every action goes through createVideoButton's handler so the click never
    // reaches the surrounding link.
    const copyDescButton = createVideoButton("复制描述", "0px", () => copyText(aweme.desc, copyDescButton));
    aNode.appendChild(copyDescButton);
    aNode.appendChild(createVideoButton("打开视频源", "20px", () => window.open(aweme.url)));

    const downloadVideoButton = createVideoButton("下载视频", "40px", () => downloadVideo(aweme, downloadVideoButton));
    aNode.appendChild(downloadVideoButton);

    if (aweme.images) {
      const downloadImageButton = createVideoButton("图片打包下载", "60px", () => downloadImage(aweme, downloadImageButton));
      aNode.appendChild(downloadImageButton);
    }
    aNode.dataset.vid = videoId;
  }
  350.  
  /**
   * Refresh the counters on the header buttons and the status text from the
   * current contents of all_aweme_map and user_map.
   */
  function flush() {
    const awemeTotal = all_aweme_map.size;
    const authorTotal = user_map.size;
    // Count the works that carry an image list.
    let img_num = 0;
    for (const aweme of all_aweme_map.values()) {
      if (aweme.images) img_num += 1;
    }
    data_button.p2.textContent = `${awemeTotal}`;
    user_button.p2.textContent = `${authorTotal}`;
    img_button.p2.textContent = `${img_num}`;
    msg_pre.textContent = `已加载${awemeTotal}个作品,${img_num}个图文\n本地已缓存(${authorTotal}/${max_author_num})个作者\n激活上方头像可展开下载按钮`;
  }
  358.  
  /**
   * Flatten one raw work item from an API response into the record shape used
   * by the rest of the script. Statistics, video and author fields are only
   * added when the corresponding sub-object exists. The input is not modified.
   * @param {object} item - raw work object from a response.
   * @returns {object} flat record (awemeId, desc, date, url, images, ...).
   */
  const formatDouyinAwemeData = item => {
    // First URL of an address object; undefined when the address or its list is missing.
    const firstUrl = (addr) => (addr && addr.url_list ? addr.url_list[0] : undefined);
    // Last URL of an image row, read without removing it from the row.
    const lastUrl = (row) => (row && row.url_list ? row.url_list[row.url_list.length - 1] : undefined);

    return Object.assign(
      {
        "awemeId": item.aweme_id,
        "item_title": item.item_title,
        "caption": item.caption,
        "desc": item.desc,
        "tag": item.text_extra ? item.text_extra.map(tag => tag.hashtag_name).filter(tag => tag).join("#") : "",
        "video_tag": item.video_tag ? item.video_tag.map(tag => tag.tag_name).filter(tag => tag).join("->") : "",
        "date": timeFormat(item.create_time, "yyyy-mm-dd hh:MM:ss"),
        "create_time": item.create_time,
      },
      item.statistics ? {
        "diggCount": item.statistics.digg_count,
        "commentCount": item.statistics.comment_count,
        "collectCount": item.statistics.collect_count,
        "shareCount": item.statistics.share_count
      } : {},
      item.video ? {
        // duration is divided by 1000 and rounded before formatting as seconds.
        "duration": formatSeconds(Math.round(item.video.duration / 1000)),
        "url": firstUrl(item.video.play_addr),
        "cover": firstUrl(item.video.cover),
        "images": item.images ? item.images.map(lastUrl) : null,
      } : {},
      item.author ? {
        "uid": item.author.uid,
        "nickname": item.author.nickname
      } : {}
    );
  };
  387.  
  388.  
  /**
   * Format every work in a list-style response.
   * @param {object} json_data - parsed response; `aweme_list` holds the raw works.
   * @returns {object[]} formatted records; empty when `aweme_list` is missing or not an array.
   */
  function formatAwemeData(json_data) {
    const list = json_data ? json_data.aweme_list : null;
    if (!Array.isArray(list)) return [];
    return list.map(item => formatDouyinAwemeData(item));
  }
  392.  
  /**
   * Reduce a raw author object to the fields the script stores and exports.
   * Every falsy or missing field becomes "" and the input object is left untouched.
   * @param {object} userInfo - raw `user` object from a profile response.
   * @returns {object} author record; `create_time` is the capture time in milliseconds.
   */
  function formatUserData(userInfo) {
    // Read one field, collapsing missing, null, 0 and "" to "".
    const field = (key) => userInfo[key] || "";
    return {
      "uid": field("uid"),
      "nickname": field("nickname"),
      "following_count": field("following_count"),
      "mplatform_followers_count": field("mplatform_followers_count"),
      "total_favorited": field("total_favorited"),
      // Fall back to short_id when unique_id is empty.
      "unique_id": field("unique_id") || field("short_id"),
      "ip_location": String(field("ip_location")).replace("IP属地:", ""),
      // The gender code indexes into " 男女" (1 -> 男, 2 -> 女); any other code yields "".
      "gender": userInfo.gender ? " 男女".charAt(userInfo.gender).trim() : "",
      "city": [userInfo.province, userInfo.city, userInfo.district].filter(x => x).join("·"),
      "signature": field("signature"),
      "aweme_count": field("aweme_count"),
      "create_time": Date.now()
    };
  }
  412.  
  /**
   * POST captured records as JSON to the configured local service.
   * Does nothing unless the local reporting channel is enabled.
   * @param {*} jsonData - value serialised as the request body.
   */
  function sendLocalData(jsonData) {
    if (!localDownload) return;
    const request = {
      method: 'POST',
      headers: {'Content-Type': 'application/json'},
      body: JSON.stringify(jsonData),
    };
    fetch(localDownloadUrl, request)
      .then((response) => response.json())
      .then((responseData) => {
        console.log('成功:', responseData);
      })
      .catch(() => {
        console.log('上报失败,请检查本地程序是否已经启动!');
      });
  }
  430.  
  /**
   * Wrap XMLHttpRequest.prototype.send so that completed responses of the
   * /aweme/v1/web/ endpoints are parsed and their works/authors recorded.
   * The page's own onreadystatechange handler is always called afterwards,
   * even when parsing the response fails.
   */
  function interceptResponse() {
    // Endpoints whose payload carries the works in `aweme_list`.
    const awemeListPrefixes = [
      "/aweme/v1/web/aweme/post/",
      "/aweme/v1/web/aweme/related/",
      "/aweme/v1/web/aweme/favorite/",
      "/aweme/v1/web/mix/aweme/",
      "/aweme/v1/web/tab/feed/",
      "/aweme/v1/web/aweme/listcollection/",
      "/aweme/v1/web/history/read/"
    ];
    // Endpoints whose payload carries the works as `data[].aweme`.
    const feedPrefixes = [
      "/aweme/v1/web/follow/feed/",
      "/aweme/v1/web/familiar/feed/",
    ];
    const startsWithAny = (path, prefixes) => prefixes.some(prefix => path.startsWith(prefix));

    // Store the author from a profile response and refresh the localStorage cache.
    const recordAuthor = (data) => {
      const userInfo = formatUserData(data.user);
      user_map.set(userInfo.uid, userInfo);
      current_user_id = userInfo.uid;
      console.log("加载作者:", current_user_id);
      // Newest captures first, truncated to the configured maximum.
      const user_local_data = Array.from(user_map.values()).sort((a, b) => b.create_time - a.create_time);
      localStorage.setItem('user_local_data', JSON.stringify(user_local_data.slice(0, max_author_num)));
    };

    // Turn one parsed response into formatted work records; undefined when the endpoint carries none.
    const extractAwemes = (path, data) => {
      if (path.startsWith("/aweme/v1/web/user/profile/other")) {
        recordAuthor(data);
        return undefined;
      }
      if (startsWithAny(path, awemeListPrefixes)) {
        return formatAwemeData(data);
      }
      if (startsWithAny(path, feedPrefixes)) {
        return data.data.filter(item => item.aweme).map(item => formatDouyinAwemeData(item.aweme));
      }
      if (path.startsWith("/aweme/v1/web/general/search/single/")) {
        const found = [];
        for (const obj of data.data) {
          if (obj.aweme_info) found.push(formatDouyinAwemeData(obj.aweme_info));
          if (obj.user_list) {
            for (const user of obj.user_list) {
              user.items.forEach(aweme => found.push(formatDouyinAwemeData(aweme)));
            }
          }
        }
        return found;
      }
      if (path.startsWith("/aweme/v1/web/module/feed/")) {
        // Each card stores its work as a JSON string.
        return data.cards.map(item => formatDouyinAwemeData(JSON.parse(item.aweme)));
      }
      if (path.startsWith("/aweme/v1/web/aweme/detail/")) {
        return [formatDouyinAwemeData(data.aweme_detail)];
      }
      return undefined;
    };

    // Parse a finished request and record whatever it contains.
    const handleResponse = (xhr) => {
      // With a non-text responseType the body is already parsed.
      const data = typeof xhr.response === "string" ? JSON.parse(xhr.response) : xhr.response;
      let jsonData = extractAwemes(xhr.url, data);
      if (!jsonData) return;
      // Only records with both a media URL and an id are kept.
      jsonData = jsonData.filter(item => item.url && item.awemeId);
      sendLocalData(jsonData);
      jsonData.forEach(aweme => {
        all_aweme_map.set(aweme.awemeId, aweme);
      });
      if (domLoadedTimer === null) flush();
    };

    const originalSend = XMLHttpRequest.prototype.send;
    XMLHttpRequest.prototype.send = function () {
      originalSend.apply(this, arguments);
      // NOTE(review): _url is not set anywhere in this function; presumably an
      // open() hook elsewhere records it - confirm.
      if (!this._url) return;
      this.url = this._url;
      // Reduce absolute URLs to their path so the prefix checks work.
      if (this.url.startsWith("http"))
        this.url = new URL(this.url).pathname;
      if (!this.url.startsWith("/aweme/v1/web/")) return;
      const self = this;
      const func = this.onreadystatechange;
      this.onreadystatechange = (e) => {
        if (self.readyState === 4) {
          try {
            handleResponse(self);
          } catch (error) {
            // A failure here must never keep the page's own handler from running.
            console.log("解析响应数据失败:", self.url, error);
          }
        }
        // call(), not apply(): the event is the single argument, not an argument list.
        if (func) func.call(self, e);
      };
    };
  }
  496.  
  /**
   * Export every captured work as a CSV file, newest first.
   * @param {object} node - triggering button; its `disabled` flag guards against re-entry.
   * @param {string} encoding - "gbk" converts the text to GBK bytes; anything else keeps it as text.
   */
  function downloadData(node, encoding) {
    if (all_aweme_map.size === 0) {
      alert("还没有发现任何作品数据!");
      return;
    }
    if (node.disabled) {
      toast("下载正在处理中,请不要重复点击按钮!");
      return;
    }
    // Text of a value, with null/undefined rendered as empty.
    const asText = (value) => (value == null ? "" : String(value));
    // Always-quoted CSV field with embedded quotes doubled.
    const quoted = (value) => '"' + asText(value).replace(/"/g, '""') + '"';
    // Field quoted only when it contains a comma, a quote or a line break.
    const cell = (value) => (/[",\r\n]/.test(asText(value)) ? quoted(value) : asText(value));

    node.disabled = true;
    try {
      const header = "作者昵称,作品描述,作品链接,点赞数,评论数,收藏数,分享数,发布时间,时长,标签,分类,封面,下载链接\n";
      const user_aweme_list = Array.from(all_aweme_map.values()).sort((a, b) => b.create_time - a.create_time);
      const rows = user_aweme_list.map(aweme => [
        cell(aweme.nickname),
        quoted(aweme.desc),
        "https://www.douyin.com/video/" + aweme.awemeId,
        cell(aweme.diggCount), cell(aweme.commentCount),
        cell(aweme.collectCount), cell(aweme.shareCount), cell(aweme.date),
        cell(aweme.duration), cell(aweme.tag), cell(aweme.video_tag),
        cell(aweme.cover), quoted(aweme.url)
      ].join(",") + "\n");
      let text = header + rows.join("");
      if (encoding === "gbk") text = str2gbk(text);
      txt2file(text, "【" + timeFormat(Date.now(), "yyyy-mm-dd") + "】抖音当前已加载数据", "csv");
    } finally {
      node.disabled = false;
    }
  }
  525.  
  /**
   * Export every cached author as a CSV file.
   * @param {object} node - triggering button; its `disabled` flag guards against re-entry.
   * @param {string} encoding - "gbk" converts the text to GBK bytes; anything else keeps it as text.
   */
  function downloadUserData(node, encoding) {
    if (user_map.size === 0) {
      toast("还没有发现任何作者数据!请访问用户主页后再试!\n以https://www.douyin.com/user/开头的链接。");
      return;
    }
    if (node.disabled) {
      toast("下载正在处理中,请不要重复点击按钮!");
      return;
    }
    // Text of a value, with null/undefined rendered as empty.
    const asText = (value) => (value == null ? "" : String(value));
    // Always-quoted CSV field with embedded quotes doubled.
    const quoted = (value) => '"' + asText(value).replace(/"/g, '""') + '"';
    // Field quoted only when it contains a comma, a quote or a line break.
    const cell = (value) => (/[",\r\n]/.test(asText(value)) ? quoted(value) : asText(value));

    node.disabled = true;
    try {
      const header = "昵称,关注,粉丝,获赞,抖音号,IP属地,性别,位置,签名,作品数,主页\n";
      const rows = Array.from(user_map.values()).map(user_info => [
        cell(user_info.nickname), cell(user_info.following_count), cell(user_info.mplatform_followers_count),
        cell(user_info.total_favorited), cell(user_info.unique_id), cell(user_info.ip_location),
        cell(user_info.gender), cell(user_info.city),
        quoted(user_info.signature),
        cell(user_info.aweme_count), "https://www.douyin.com/user/" + user_info.uid
      ].join(",") + "\n");
      let text = header + rows.join("");
      if (encoding === "gbk") text = str2gbk(text);
      // A null filename lets createDownloadLink() pick the name.
      txt2file(text, null, "csv");
    } finally {
      node.disabled = false;
    }
  }
  551.  
  // UI handles shared across the script; the buttons are assigned in
  // createAllButton() and the status box in createMsgBox().
  let img_button;
  let data_button;
  let user_button;
  let msg_pre;

  /**
   * Create the semi-transparent status text box fixed near the top-right
   * corner of the page and store it in msg_pre.
   */
  function createMsgBox() {
    const box = document.createElement('pre');
    box.textContent = '等待上方头像加载完毕';
    Object.assign(box.style, {
      color: 'white',
      position: 'fixed',
      right: '5px',
      top: '60px',
      zIndex: '503',
      opacity: "0.5",
    });
    msg_pre = box;
    document.body.appendChild(box);
  }
  566.  
  /**
   * Turn a button into a toggle that keeps scrolling an author page to the
   * bottom until the list footer reports that there is nothing more to load.
   * @param {object} scroll_button - button created by createNewButton(); `p1` is its label node.
   */
  function scrollPageToBottom(scroll_button) {
    // Handle of the running timer; falsy while auto-scroll is off.
    let scrollInterval;

    function scrollLoop() {
      const endNode = document.querySelector("div[data-e2e='user-post-list'] > ul[data-e2e='scroll-list'] + div div");
      // The footer may not be rendered yet; in that case just keep scrolling.
      if (endNode && endNode.innerText.includes("没有更多了")) {
        clearInterval(scrollInterval);
        scrollInterval = null;
        scroll_button.p1.textContent = "已加载全部!";
      } else {
        scrollTo(0, document.body.scrollHeight);
      }
    }

    scroll_button.addEventListener('click', () => {
      if (scrollInterval) {
        // Second click: stop.
        clearInterval(scrollInterval);
        scrollInterval = null;
        scroll_button.p1.textContent = "开启自动下拉";
        return;
      }
      if (!location.href.startsWith("https://www.douyin.com/user/")) {
        toast("不支持非用户主页开启下拉!");
      } else if (!document.querySelector("div[data-e2e='user-post-list']")) {
        toast("没有找到用户作品列表!");
      } else {
        scrollInterval = setInterval(scrollLoop, 1200);
        scroll_button.p1.textContent = "停止自动下拉";
      }
    });
  }
  598.  
  /**
   * Create an element with the given attributes and optional text; clicks on
   * it are stopped from propagating to ancestors.
   * @param {string} tagName - element tag.
   * @param {object} [attrs] - attribute name -> value.
   * @param {string} [text] - textContent, applied only when non-empty.
   * @returns {Element} the new, not yet attached element.
   */
  function createCommonElement(tagName, attrs = {}, text = "") {
    const element = document.createElement(tagName);
    Object.keys(attrs).forEach((name) => {
      element.setAttribute(name, attrs[name]);
    });
    if (text) {
      element.textContent = text;
    }
    element.addEventListener('click', (event) => {
      event.stopPropagation();
    });
    return element;
  }
  608.  
  /**
   * Build the script's buttons by cloning the last link of the header menu,
   * and add a "copy author info" button next to the share button when the
   * page has one.
   */
  function createAllButton() {
    const dom = document.querySelector("#douyin-header-menuCt pace-island > div > div:nth-last-child(1) ul a:nth-last-child(1)");
    // Template: a copy of that link without navigation attributes or icon.
    const baseNode = dom.cloneNode(true);
    ["target", "rel", "href"].forEach((attr) => baseNode.removeAttribute(attr));
    const svgChild = baseNode.querySelector("svg");
    if (svgChild) baseNode.removeChild(svgChild);

    // Clone the template, fill its two <p> slots and insert it right after the original link.
    const createNewButton = (name, num = "0") => {
      const button = baseNode.cloneNode(true);
      button.p1 = button.querySelector("p:nth-child(1)");
      button.p2 = button.querySelector("p:nth-child(2)");
      button.p1.textContent = name;
      button.p2.textContent = num;
      dom.after(button);
      return button;
    };

    img_button = createNewButton("图文打包下载");
    img_button.addEventListener('click', () => downloadImg(img_button));

    const downloadCoverButton = createNewButton("封面打包下载", "");
    downloadCoverButton.addEventListener('click', () => downloadCover(downloadCoverButton));

    data_button = createNewButton("下载已加载的数据");
    data_button.p1.after(createCommonElement("label", {'for': 'gbk'}, 'gbk'));
    // The checkbox state is remembered in localStorage under "gbk".
    const checkbox = createCommonElement("input", {'type': 'checkbox', 'id': 'gbk'});
    checkbox.checked = localStorage.getItem("gbk") === "1";
    checkbox.onclick = (event) => {
      event.stopPropagation();
      localStorage.setItem("gbk", checkbox.checked ? "1" : "0");
    };
    data_button.p1.after(checkbox);
    // Both CSV exports follow the checkbox.
    const selectedEncoding = () => (checkbox.checked ? "gbk" : "utf-8");
    data_button.addEventListener('click', () => downloadData(data_button, selectedEncoding()));

    user_button = createNewButton("下载已游览的作者数据");
    user_button.addEventListener('click', () => downloadUserData(user_button, selectedEncoding()));

    scrollPageToBottom(createNewButton("开启自动下拉到底", ""));

    const share_button = document.querySelector("#frame-user-info-share-button");
    if (!share_button) return;
    const copyNode = share_button.cloneNode(true);
    copyNode.span = copyNode.querySelector("span");
    copyNode.span.innerHTML = "复制作者信息";
    copyNode.onclick = () => copyUserData(copyNode.span);
    share_button.after(copyNode);
  }
  659.  
  /**
   * Download the cover of every captured work, pack them into a zip and offer
   * it as a download. The button stays disabled until the whole job has
   * finished or failed.
   * @param {object} node - triggering button; its `disabled` flag guards against re-entry.
   * @returns {Promise<void>} settles when the job is done.
   */
  async function downloadCover(node) {
    if (all_aweme_map.size === 0) {
      toast("还没有发现任何作品数据!");
      return;
    }
    if (node.disabled) {
      toast("下载正在处理中,请不要重复点击按钮!");
      return;
    }
    node.disabled = true;
    try {
      const zip = new JSZip();
      msg_pre.textContent = `下载封面并打包中...`;
      const user_aweme_list = Array.from(all_aweme_map.values()).sort((a, b) => b.create_time - a.create_time);
      // All covers are fetched in parallel; awaiting keeps the guard active meanwhile.
      await Promise.all(user_aweme_list.map((aweme, index) => {
        const awemeName = getAwemeName(aweme) + ".jpg";
        return fetch(aweme.cover)
          .then(response => response.arrayBuffer())
          .then(buffer => zip.file(awemeName, buffer))
          .then(() => msg_pre.textContent = `${index + 1}/${user_aweme_list.length} ` + awemeName);
      }));
      const content = await zip.generateAsync({type: "blob"});
      // A null filename lets createDownloadLink() pick the name.
      createDownloadLink(content, null, "zip", "【封面】");
      msg_pre.textContent = "封面打包完成";
    } catch (error) {
      console.log("封面打包下载失败:", error);
      toast("封面下载失败,请稍后重试!");
    } finally {
      node.disabled = false;
    }
  }
  692.  
  /**
   * Download the images of every captured image work, one folder per work,
   * pack them into a zip and offer it as a download. The button stays
   * disabled until the whole job has finished or failed.
   * @param {object} node - triggering button; its `disabled` flag guards against re-entry.
   * @returns {Promise<void>} settles when the job is done.
   */
  async function downloadImg(node) {
    if (node.disabled) {
      toast("下载正在处理中,请不要重复点击按钮!");
      return;
    }
    node.disabled = true;
    try {
      const aweme_img_list = Array.from(all_aweme_map.values())
        .sort((a, b) => b.create_time - a.create_time)
        .filter(a => a.images);
      if (aweme_img_list.length === 0) {
        alert("当前页面未发现图文链接");
        return;
      }
      const zip = new JSZip();
      // Works are handled one after another; the images of one work are fetched in parallel.
      for (const [i, aweme] of aweme_img_list.entries()) {
        const awemeName = getAwemeName(aweme);
        msg_pre.textContent = `${i + 1}/${aweme_img_list.length} ` + awemeName;
        const folder = zip.folder(awemeName);
        await Promise.all(aweme.images.map((link, index) => {
          return fetch(link)
            .then((res) => res.arrayBuffer())
            .then((buffer) => {
              folder.file(`image_${index + 1}.jpg`, buffer);
            });
        }));
      }
      msg_pre.textContent = "图文打包中...";
      // Awaited so that the button is only re-enabled once the archive exists.
      const content = await zip.generateAsync({type: "blob"});
      createDownloadLink(content, null, "zip", "【图文】");
      msg_pre.textContent = "图文打包完成";
    } catch (error) {
      console.log("图文打包下载失败:", error);
      toast("图文下载失败,请稍后重试!");
    } finally {
      node.disabled = false;
    }
  }
  732.  
  733. function douyinVideoDownloader() {
  /**
   * Make sure the player toolbar carries the script's "工具" menu for the
   * given work. An existing menu is re-pointed at the new work id and its
   * image entry added or removed to match; otherwise a new menu is built,
   * but only when data for the work has been captured.
   * @param {Element} xgPlayer - toolbar container the menu is appended to.
   * @param {string} videoId - id of the work being played.
   * @param {Element} videoContainer - video element; tagged with the work id.
   */
  const clonePlayclarity2Download = (xgPlayer, videoId, videoContainer) => {
    let toolDom = xgPlayer.querySelector(`.xgplayer-playclarity-setting[data-vid]`);
    // Margins differ between the search result list and every other view.
    const adjustMargin = (virtualDom) => {
      if (location.href.includes('search') && !location.href.includes('modal_id')) {
        toolDom.style.marginTop = "0px";
        virtualDom.style.marginBottom = "37px";
      } else {
        toolDom.style.marginTop = "-68px";
        virtualDom.style.marginBottom = "0px";
      }
    };
    const attrs = {class: "item", style: "text-align:center;"};

    // Append the image-download entry and mark the menu as carrying it.
    // The handler looks the work up again on click because the menu may have
    // been re-pointed at another work since it was built.
    const appendImageEntry = (virtualDom) => {
      const downloadDom2 = createCommonElement("div", attrs, "图文下载");
      virtualDom.appendChild(downloadDom2);
      downloadDom2.onclick = () => {
        const current = all_aweme_map.get(toolDom.dataset.vid);
        if (!current) {
          toast('未捕获到对应数据源!');
        } else if (!current.images) {
          toast('捕获的数据源,不含图片信息!');
        } else {
          downloadImage(current, downloadDom2);
        }
      };
      virtualDom.dataset.image = videoId;
    };

    if (toolDom) {
      // Reuse path: the menu already exists, only its target changes.
      toolDom.dataset.vid = videoId;
      videoContainer.dataset.vid = videoId;
      const virtualDom = toolDom.querySelector('.virtual');
      if (!virtualDom) return;
      adjustMargin(virtualDom);
      const known = all_aweme_map.get(videoId);
      // A work without captured data is treated like one without images.
      const hasImages = Boolean(known && known.images);
      if (hasImages && !virtualDom.dataset.image) {
        appendImageEntry(virtualDom);
      } else if (!hasImages && virtualDom.dataset.image) {
        // The image entry is the last child whenever it is present.
        virtualDom.removeChild(virtualDom.lastElementChild);
        delete virtualDom.dataset.image;
      }
      return;
    }

    // Build path: nothing is shown for works without captured data.
    const aweme = all_aweme_map.get(videoId);
    if (!aweme) return;
    const parser = new DOMParser();
    const doc = parser.parseFromString('<xg-icon class="xgplayer-playclarity-setting" data-state="normal" data-index="7.6">' +
      '<div class="gear"><div class="virtual"></div><div class="btn">工具</div></div></xg-icon>', 'text/html');
    toolDom = doc.body.firstChild;

    toolDom.dataset.vid = videoId;
    toolDom.dataset.index = "7.6";
    videoContainer.dataset.vid = videoId;
    toolDom.style = 'margin-top:-68px;padding-top:100px;';

    const downloadText = toolDom.querySelector('.btn');
    if (!downloadText) return;
    downloadText.textContent = '工具';
    downloadText.style = 'font-size:14px;font-weight:600;';

    const virtualDom = toolDom.querySelector('.virtual');
    if (!virtualDom) return;
    adjustMargin(virtualDom);
    // The entry list is only visible while the pointer is over the menu.
    toolDom.onmouseover = () => virtualDom.style.display = 'block';
    toolDom.onmouseout = () => virtualDom.style.display = 'none';
    virtualDom.innerHTML = '';

    const copyDescDom = createCommonElement("div", attrs, "复制描述");
    virtualDom.appendChild(copyDescDom);
    copyDescDom.onclick = () => {
      console.log("复制对象:", toolDom.dataset.vid);
      const current = all_aweme_map.get(toolDom.dataset.vid);
      if (!current) {
        toast('未捕获到对应数据源!');
      } else if (!current.desc) {
        toast('捕获的数据源,不含描述信息!');
      } else {
        copyText(current.desc, copyDescDom);
      }
    };

    const toLinkDom = createCommonElement("div", attrs, "打开视频");
    virtualDom.appendChild(toLinkDom);
    toLinkDom.onclick = () => {
      const current = all_aweme_map.get(toolDom.dataset.vid);
      if (current && current.url) window.open(current.url);
      else toast('未捕获到对应数据源!');
    };

    const downloadDom = createCommonElement("div", attrs, "下载视频");
    virtualDom.appendChild(downloadDom);
    downloadDom.onclick = () => {
      const current = all_aweme_map.get(toolDom.dataset.vid);
      console.log('下载视频:', toolDom.dataset.vid, current);
      if (current && current.url) {
        downloadVideo(current, downloadDom);
      } else toast('未捕获到对应数据源!');
    };

    if (aweme.images) {
      appendImageEntry(virtualDom);
    }
    xgPlayer.appendChild(toolDom);
  };
  /**
   * Resolves the video id, the `.xg-right-grid` element and the <video>
   * element that belong to `node`, then passes them to
   * clonePlayclarity2Download. Does nothing when `node` is falsy or when any
   * of the three values cannot be resolved.
   *
   * @param {Element|null} node - element inside (or equal to) a player area.
   */
  const run = (node) => {
    if (!node) return;

    const feedItem = node.closest('div[data-e2e="feed-active-video"]');
    let videoId;
    let xgPlayer;
    let videoContainer;

    if (feedItem) {
      // Feed layout: everything is read from the active feed item itself.
      videoId = feedItem.getAttribute('data-e2e-vid');
      xgPlayer = feedItem.querySelector('.xg-right-grid');
      videoContainer = feedItem.querySelector("video");
    } else {
      // Outside the feed: pick among autoplaying <video> elements. The first
      // one is used when the URL mentions modal_id, otherwise the last one.
      const autoplaying = Array.from(document.querySelectorAll('video')).filter((video) => video.autoplay);
      const pickIndex = location.href.includes('modal_id') ? 0 : autoplaying.length - 1;
      videoContainer = autoplaying[pickIndex];
      xgPlayer = node.closest('.xg-right-grid');

      // Prefer the id on the detail-info element; fall back to ?modal_id=.
      const detailInfo = document.querySelector("[data-e2e='detail-video-info']");
      const detailId = detailInfo ? detailInfo.getAttribute('data-e2e-aweme-id') : null;
      videoId = detailId || new URLSearchParams(location.search).get('modal_id');
    }

    if (videoId && xgPlayer && videoContainer) {
      clonePlayclarity2Download(xgPlayer, videoId, videoContainer);
    }
  };
  // Watch the whole document for newly inserted player nodes and hand each
  // matching node to run(). A node matches when its className is exactly
  // "gear", when it is an "xgplayer-icon" whose data-e2e is
  // "video-player-auto-play", or when it carries the
  // "xgplayer-inner-autoplay" class.
  const rootObserver = new MutationObserver((mutations) => {
    for (const {addedNodes} of mutations) {
      for (const node of addedNodes) {
        const cls = node.className;
        const isPlayerNode = cls === "gear"
          || (cls === "xgplayer-icon" && node.dataset.e2e === "video-player-auto-play")
          || (node.classList && node.classList.contains("xgplayer-inner-autoplay"));
        if (isPlayerNode) {
          run(node);
        }
      }
    }
  });
  rootObserver.observe(document.body, {childList: true, subtree: true});

  // Independently of mutations, retry once per second against the currently
  // active feed video (run() ignores a null lookup result).
  setInterval(() => run(document.querySelector('div[data-e2e="feed-active-video"]')), 1000);
  890. }
  891.  
  /**
   * Attaches button groups to items that get added to a
   * `ul[data-e2e='scroll-list']` video list.
   *
   * Two observers cooperate:
   *  - `listObserver` watches the direct children of every observed list and
   *    calls createButtonGroup with the first <a> of each added element;
   *  - `rootObserver` watches document.body for subtrees that contain such a
   *    list (starts observing it) or that are removed together with one
   *    (disconnects `listObserver`).
   * The list already present under `div[data-e2e='user-detail']`, if any, is
   * observed immediately.
   */
  function userDetailObserver() {
    const LIST_SELECTOR = "ul[data-e2e='scroll-list']";

    const listObserver = new MutationObserver((mutationsList) => {
      for (const mutation of mutationsList) {
        if (mutation.type !== 'childList') continue;
        mutation.addedNodes.forEach((node) => {
          // Added nodes may be Text/Comment nodes, which have no
          // querySelector. Skip them so one stray node cannot throw and
          // abort the rest of the batch (same guard as rootObserver below).
          if (!node.querySelector) return;
          // The lookup result is passed through unchanged, so it may be null
          // when the item holds no link — presumably createButtonGroup
          // tolerates that; verify against its definition.
          createButtonGroup(node.querySelector("a"));
        });
      }
    });

    // Start watching one list's direct children; a missing list is ignored.
    const observeList = (scrollList) => {
      if (!scrollList) return;
      console.log('开始监听新创建的视频列表!');
      listObserver.observe(scrollList, {childList: true});
    };

    const rootObserver = new MutationObserver((mutationsList) => {
      for (const mutation of mutationsList) {
        if (mutation.type !== 'childList') continue;
        mutation.addedNodes.forEach((node) => {
          if (!node.querySelector) return;
          observeList(node.querySelector(LIST_SELECTOR));
        });
        mutation.removedNodes.forEach((node) => {
          if (node.querySelector && node.querySelector(LIST_SELECTOR)) {
            console.log('关闭了一个视频列表');
            // disconnect() stops observation of every list registered so far.
            listObserver.disconnect();
          }
        });
      }
    });

    rootObserver.observe(document.body, {childList: true, subtree: true});
    observeList(document.querySelector("div[data-e2e='user-detail'] ul[data-e2e='scroll-list']"));
  }
  924.  
  925. if (document.title === "验证码中间页") return;
  926. createMsgBox();
  927. interceptResponse();
  928. douyinVideoDownloader();
  929. userDetailObserver();
  930. let domLoadedTimer;
  931. const checkElementLoaded = () => {
  932. const element = document.querySelector('#douyin-header-menuCt pace-island > div > div:nth-last-child(1) ul a');
  933. if (element) {
  934. console.log('顶部栏加载完毕');
  935. msg_pre.textContent = "头像加载完成\n若需要下载用户数据,需进入目标用户主页\n若未捕获到数据,可以刷新重试";
  936. clearInterval(domLoadedTimer);
  937. domLoadedTimer = null;
  938. createAllButton();
  939. flush();
  940. }
  941. };
  942. document.window = window;
  943. window.onload = () => {
  944. domLoadedTimer = setInterval(checkElementLoaded, 700);
  945. }
  946. })();