Wordcat Downloader

可以将 PDF 解析成 Word。【❤️ 文档自动解析,体会拥有 VIP 的感觉 ❤️,适配 PC + 移动端】

  1. // ==UserScript==
  2. // @name Wordcat Downloader
  3. // @namespace http://tampermonkey.net/
  4. // @version 1.10.0
  5. // @description 可以对PDF进行解析成word。【❤️ 文档自动解析,体会拥有VIP的感觉❤️,适配PC+移动 】
  6. // @author xsunvip@qq.com
  7. // @match *://*.docin.com/p-*
  8. // @match *://docimg1.docin.com/?wk=true
  9. // @match *://ishare.iask.sina.com.cn/f/*
  10. // @match *://ishare.iask.com/f/*
  11. // @match *://swf.ishare.down.sina.com.cn/?path=*
  12. // @match *://swf.ishare.down.sina.com.cn/?wk=true
  13. // @match *://www.deliwenku.com/p-*
  14. // @match *://file.deliwenku.com/?num=*
  15. // @match *://file3.deliwenku.com/?num=*
  16. // @match *://www.doc88.com/p-*
  17. // @match *://www.360doc.com/content/*
  18. // @match *://doc.mbalib.com/view/*
  19. // @match *://www.dugen.com/p-*
  20. // @match *://max.book118.com/html/*
  21. // @match *://openapi.book118.com/?*
  22. // @match *://view-cache.book118.com/pptView.html?*
  23. // @match *://*.book118.com/?readpage=*
  24. // @match *://c.gb688.cn/bzgk/gb/showGb?*
  25. // @match *://www.safewk.com/p-*
  26. // @match *://www.renrendoc.com/paper/*
  27. // @match *://www.renrendoc.com/p-*
  28. // @match *://www.yunzhan365.com/basic/*
  29. // @match *://book.yunzhan365.com/*index.html*
  30. // @match *://wenku.so.com/d/*
  31. // @match *://jg.class.com.cn/cms/resourcedetail.htm?contentUid=*
  32. // @match *://preview.imm.aliyuncs.com/index.html?url=*/jgjyw/*
  33. // @match *://www.wenkub.com/p-*.html*
  34. // @match *://*/manuscripts/?*
  35. // @match *://gwfw.sdlib.com:8000/*
  36. // @match *://www.jinchutou.com/shtml/view-*
  37. // @match *://www.jinchutou.com/p-*
  38. // @match *://www.nrsis.org.cn/*/read/*
  39. // @match https://xianxiao.ssap.com.cn/index/rpdf/read/id/*/catalog_id/0.html?file=*
  40. // @require https://cdn.staticfile.org/jspdf/2.5.1/jspdf.umd.min.js
  41. // @require https://cdn.staticfile.org/html2canvas/1.4.1/html2canvas.min.js
  42. // @icon https://s2.loli.net/2022/01/12/wc9je8RX7HELbYQ.png
  43. // @icon64 https://s2.loli.net/2022/01/12/tmFeSKDf8UkNMjC.png
  44. // @grant none
  45. // @run-at document-idle
  46. // @license GPL-3.0-only
  47. // @create 2021-11-22
  48. // @note 1. 新增支持【先晓书院】
  49. // ==/UserScript==
  50. (function () {
  51. 'use strict';
  /**
   * Socket-like object that talks to another window via window.postMessage.
   *
   * Handshake: one side calls `connect(true)` (sends `{ ping: true }` and waits
   * for `{ pong: true }`), the other side calls `connect(false)` (waits for the
   * ping and answers with the pong).
   */
  class Socket {
    /**
     * Create a socket.
     * @param {Window} target window that messages are posted to
     * @throws {Error} when target is not a Window object
     */
    constructor(target) {
      // `?.` keeps null/undefined on the documented error path instead of
      // failing with an unrelated "cannot read properties of null" TypeError.
      if (!(target?.window && (target === target.window))) {
        console.log(target);
        throw new Error(`target is not a [Window Object]`);
      }
      this.target = target;
      this.connected = false;
      this.listeners = new Set();
    }

    get [Symbol.toStringTag]() { return "Socket"; }

    /**
     * Post a message to the target window.
     * @param {*} message
     * @throws {TypeError} when the socket has no target
     */
    talk(message) {
      if (!this.target) {
        throw new TypeError(
          `socket.target is not a window: ${this.target}`
        );
      }
      this.target.postMessage(message, "*");
    }

    /**
     * Add a capturing "message" listener on the current window.
     * @param {Function} listener (e: MessageEvent) => {...}
     * @param {boolean} once remove the listener after its first call; when
     *   true, a wrapper is registered instead of `listener` itself
     * @returns {Function} the listener that is actually registered (the
     *   wrapper when `once` is true); `listener` itself if it was already added
     */
    listen(listener, once=false) {
      if (this.listeners.has(listener)) {
        // Already registered: hand it back so callers always get a function.
        return listener;
      }
      let real_listener = listener;
      if (once) {
        const wrapped = (e) => {
          try {
            listener(e);
          } finally {
            // Detach even if the listener throws, so "once" stays once.
            this.notListen(wrapped);
          }
        };
        real_listener = wrapped;
      }
      this.listeners.add(real_listener);
      window.addEventListener("message", real_listener, true);
      return real_listener;
    }

    /**
     * Remove a capturing listener previously returned by `listen`.
     * @param {Function} listener (e: MessageEvent) => {...}
     */
    notListen(listener) {
      console.log(listener);
      console.log(
        "listener delete operation:",
        this.listeners.delete(listener)
      );
      window.removeEventListener("message", listener, true);
    }

    /**
     * Handle an incoming message while waiting for the pong reply.
     * @param {MessageEvent} e
     * @param {Function} resolve called with this socket once pong arrives
     */
    _on_pong(e, resolve) {
      // Other scripts may post null/primitive data; ignore those quietly.
      if (e.data?.pong) {
        this.connected = true;
        // Drop every listener that was flagged as a ping-phase listener.
        this.listeners.forEach(
          listener => listener.ping ? this.notListen(listener) : 0
        );
        console.log("Client: Connected!\n" + new Date());
        resolve(this);
      }
    }

    /**
     * Send a ping and wait (at most 5 minutes) for the pong.
     * @returns {Promise<Socket>}
     */
    _ping() {
      return new Promise((resolve, reject) => {
        let timer = null;
        const listener = this.listen(
          e => this._on_pong(e, socket => {
            // Connected: the timeout must not keep running in the background.
            clearTimeout(timer);
            resolve(socket);
          })
        );
        listener.ping = true;
        timer = setTimeout(() => {
          this.notListen(listener);
          reject(new Error(`Timeout Error during receiving pong (>5min)`));
        }, 5 * 60 * 1000);
        try {
          this.talk({ ping: true });
        } catch (error) {
          // Sending failed: release the timer and listener before rejecting.
          clearTimeout(timer);
          this.notListen(listener);
          reject(error);
        }
      });
    }

    /**
     * Handle an incoming message while waiting for a ping.
     * @param {MessageEvent} e
     * @param {Function} resolve called with this socket once ping arrives
     */
    _on_ping(e, resolve) {
      if (e.data?.ping) {
        // From now on, reply to whichever window sent the ping.
        this.target = e.source;
        this.connected = true;
        this.listeners.forEach(
          listener => listener.pong ? this.notListen(listener) : 0
        );
        console.log("Server: Connected!\n" + new Date());
        // Resolving does not stop execution; the pong is still sent below.
        resolve(this);
        this.talk({ pong: true });
      }
    }

    /**
     * Wait for a ping and answer it with a pong.
     * @returns {Promise<Socket>}
     */
    _pong() {
      return new Promise(resolve => {
        const listener = this.listen(
          e => this._on_ping(e, resolve)
        );
        listener.pong = true;
      });
    }

    /**
     * Connect to the target window.
     * @param {boolean} talk_first true: send the ping first; false: wait for
     *   the other side's ping
     * @returns {Promise<Socket>}
     */
    connect(talk_first) {
      if (talk_first) {
        return this._ping();
      }
      return this._pong();
    }
  }
  /**
   * Low-level helpers shared by the rest of the script.
   */
  const base = {
    Socket,

    /**
     * Build a GBK encoder. The lookup table is created lazily on first use.
     * @returns {Function} (str, onError=null) => Uint8Array
     */
    init_gbk_encoder() {
      let table;

      function initGbkTable() {
        // https://en.wikipedia.org/wiki/GBK_(character_encoding)#Encoding
        const ranges = [
          [0xA1, 0xA9, 0xA1, 0xFE],
          [0xB0, 0xF7, 0xA1, 0xFE],
          [0x81, 0xA0, 0x40, 0xFE],
          [0xAA, 0xFE, 0x40, 0xA0],
          [0xA8, 0xA9, 0x40, 0xA0],
          [0xAA, 0xAF, 0xA1, 0xFE],
          [0xF8, 0xFE, 0xA1, 0xFE],
          [0xA1, 0xA7, 0x40, 0xA0],
        ];
        const codes = new Uint16Array(23940);
        let i = 0;
        for (const [b1Begin, b1End, b2Begin, b2End] of ranges) {
          for (let b2 = b2Begin; b2 <= b2End; b2++) {
            if (b2 !== 0x7F) {
              for (let b1 = b1Begin; b1 <= b1End; b1++) {
                // first byte in the low half, second byte in the high half
                codes[i++] = b2 << 8 | b1;
              }
            }
          }
        }
        table = new Uint16Array(65536);
        table.fill(0xFFFF);
        // Decode every code once, then invert: UTF-16 code unit -> GBK code.
        const str = new TextDecoder('gbk').decode(codes);
        for (let i = 0; i < str.length; i++) {
          table[str.charCodeAt(i)] = codes[i];
        }
      }

      const defaultOnAlloc = (len) => new Uint8Array(len);
      const defaultOnError = () => 63;   // '?'

      /**
       * Encode a string to GBK bytes.
       * @param {string} str
       * @param {Function} onError (index, str) => replacement code for a
       *   character that cannot be encoded; return -1 to stop encoding.
       *   Defaults to a function returning 63 ('?').
       * @returns {Uint8Array}
       */
      return function(str, onError=null) {
        if (!table) {
          initGbkTable();
        }
        const onAlloc = defaultOnAlloc;
        onError = onError === null ? defaultOnError : onError;
        // worst case: two bytes per UTF-16 code unit
        const buf = onAlloc(str.length * 2);
        let n = 0;
        for (let i = 0; i < str.length; i++) {
          const code = str.charCodeAt(i);
          if (code < 0x80) {
            buf[n++] = code;
            continue;
          }
          const gbk = table[code];
          if (gbk !== 0xFFFF) {
            buf[n++] = gbk;
            buf[n++] = gbk >> 8;
          }
          else if (code === 8364) {
            // 8364 == '€'.charCodeAt(0)
            // Code Page 936 has a single-byte euro sign at 0x80
            buf[n++] = 0x80;
          }
          else {
            const ret = onError(i, str);
            if (ret === -1) {
              break;
            }
            if (ret > 0xFF) {
              buf[n++] = ret;
              buf[n++] = ret >> 8;
            } else {
              buf[n++] = ret;
            }
          }
        }
        return buf.subarray(0, n);
      };
    },

    /**
     * KMP prefix table: table[i] is the length of the longest proper prefix
     * of arr[0..i] that is also a suffix of it.
     * @param {Array<number>} arr
     * @returns {Array<number>} empty for empty input
     */
    longest_prefix: function(arr) {
      const table = new Array(arr.length);
      if (arr.length === 0) {
        // Writing table[0] here would turn the empty table into [0].
        return table;
      }
      let maxPrefix = 0;
      table[0] = 0;
      for (let i = 1; i < arr.length; i++) {
        // Mismatch: fall back to shorter candidate prefixes until one fits
        // or none is left.
        while (maxPrefix > 0 && arr[i] !== arr[maxPrefix]) {
          maxPrefix = table[maxPrefix - 1];
        }
        // Match: the prefix ending at i is one element longer.
        if (arr[maxPrefix] === arr[i]) {
          maxPrefix++;
        }
        table[i] = maxPrefix;
      }
      return table;
    },

    /**
     * Pull one value from every iterator in the list.
     * @param {Array<Iterator>} iterators
     * @returns {[boolean, Array]} [done, values]; done is true (with empty
     *   values) when the list is empty or any iterator is exhausted
     */
    getAllValus: function(iterators) {
      if (iterators.length === 0) {
        return [true, []];
      }
      const values = [];
      for (const iterator of iterators) {
        const {value, done} = iterator.next();
        if (done) {
          return [true, []];
        }
        values.push(value);
      }
      return [false, values];
    },

    /**
     * Copy text using the deprecated document.execCommand API.
     * @param {string} text
     */
    oldCopy: function(text) {
      const on_copy = (event) => {
        event.clipboardData.setData('text/plain', text);
        event.preventDefault();
      };
      // A temporary listener instead of overwriting document.oncopy: the
      // page's own handler survives and later user copies are not hijacked.
      document.addEventListener('copy', on_copy);
      try {
        document.execCommand('Copy', false, null);
      } finally {
        document.removeEventListener('copy', on_copy);
      }
    },

    /**
     * Map the char code of a base64 character to its 6-bit value.
     * @param {number} nChr char code
     * @returns {number} 0..63; 0 for any char outside the base64 alphabet
     */
    b64ToUint6: function(nChr) {
      if (nChr > 64 && nChr < 91) return nChr - 65;    // A-Z
      if (nChr > 96 && nChr < 123) return nChr - 71;   // a-z
      if (nChr > 47 && nChr < 58) return nChr + 4;     // 0-9
      if (nChr === 43) return 62;                      // +
      if (nChr === 47) return 63;                      // /
      return 0;
    },

    /**
     * Element selector. Searches inside `this` when it supports
     * querySelectorAll, otherwise inside document.
     * @param {string} selector
     * @returns {Array<HTMLElement>}
     */
    $: function(selector) {
      const self = this?.querySelectorAll ? this : document;
      return [...self.querySelectorAll(selector)];
    },

    /**
     * Waiting element selector: polls every 500 ms, up to 10 times (5 s).
     * @param {string} selector
     * @returns {Promise<Array<HTMLElement>>}
     * @throws {Error} when nothing matched within 5 s
     */
    $$: async function(selector) {
      const self = this?.querySelectorAll ? this : document;
      for (let i = 0; i < 10; i++) {
        const elems = [...self.querySelectorAll(selector)];
        if (elems.length > 0) {
          return elems;
        }
        await new Promise(r => setTimeout(r, 500));
      }
      throw new Error(`"${selector}" not found in 5s`);
    },

    /**
     * Collapse every run of 2+ blank characters (line breaks excluded) into
     * one space, and every run of 2+ newlines into one newline.
     * @param {string} text
     * @returns {string}
     */
    stripBlanks: function(text) {
      return text
        // [^\S\r\n] = whitespace that is not a line break, so newlines
        // survive this step as documented.
        .replace(/[^\S\r\n]{2,}/g, " ")
        // `g` so that all newline runs collapse, not just the first one.
        .replace(/\n{2,}/g, "\n");
    },

    /**
     * Copy own properties (accessors included, as descriptors) to target.
     * @param {Object} target
     * @param {...Object} sources
     * @returns {Object} target
     */
    superAssign: function(target, ...sources) {
      for (const source of sources) {
        Object.defineProperties(
          target, Object.getOwnPropertyDescriptors(source)
        );
      }
      return target;
    },

    /**
     * Build a CRC32 function backed by a precomputed 256-entry table.
     * @returns {Function} (str: string) => number (unsigned 32-bit)
     */
    makeCRC32: function() {
      function makeCRCTable() {
        const crcTable = [];
        for (let n = 0; n < 256; n++) {
          let c = n;
          for (let k = 0; k < 8; k++) {
            c = ((c & 1) ? (0xEDB88320 ^ (c >>> 1)) : (c >>> 1));
          }
          crcTable[n] = c;
        }
        return crcTable;
      }

      const crcTable = makeCRCTable();
      /**
       * @param {string} str only the low byte of each code unit is used
       * @returns {number}
       */
      return function(str) {
        let crc = 0 ^ (-1);
        for (let i = 0; i < str.length; i++) {
          crc = (crc >>> 8) ^ crcTable[(crc ^ str.charCodeAt(i)) & 0xFF];
        }
        return (crc ^ (-1)) >>> 0;
      };
    }
  };
  // HTML template of the floating button panel: a title, five buttons
  // (btn-1 .. btn-5) and the fold/unfold toggle (.wk-fold-btn).
  439. const box = `
  440. <div class="wk-box">
  441. <section class="btns-sec">
  442. <p class="logo_tit">Wenku Doc Downloader</p>
  443. <button class="btn-1">展开文档 😈</button>
  444. <button class="btn-2">空按钮 2</button>
  445. <button class="btn-3">空按钮 3</button>
  446. <button class="btn-4">空按钮 4</button>
  447. <button class="btn-5">空按钮 5</button>
  448. </section>
  449. <p class="wk-fold-btn unfold"></p>
  450. </div>
  451. `;
  // Stylesheet for the button panel (.wk-box) and the progress popup
  // (#wk-popup). The popup is shown through the :target pseudo-class.
  const style = `
  <style class="wk-style">
    .wk-fold-btn {
      position: fixed;
      left: 151px;
      top: 36%;
      user-select: none;
      font-size: large;
      z-index: 1001;
    }
    .wk-fold-btn::after {
      content: "🐵";
    }
    .wk-fold-btn.folded {
      left: 20px;
    }
    .wk-fold-btn.folded::after {
      content: "🙈";
    }
    .wk-box {
      position: fixed;
      width: 154px;
      left: 10px;
      top: 32%;
      z-index: 1000;
    }
    .btns-sec {
      background: #E7F1FF;
      border: 2px solid #1676FF;
      padding: 0px 0px 10px 0px;
      font-weight: 600;
      border-radius: 2px;
      font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', 'PingFang SC', 'Hiragino Sans GB',
        'Microsoft YaHei', 'Helvetica Neue', Helvetica, Arial, sans-serif, 'Apple Color Emoji',
        'Segoe UI Emoji', 'Segoe UI Symbol';
    }
    .btns-sec.folded {
      display: none;
    }
    .logo_tit {
      width: 100%;
      background: #1676FF;
      text-align: center;
      font-size: 12px;
      color: #E7F1FF;
      line-height: 40px;
      height: 40px;
      margin: 0 0 16px 0;
    }
    /* declarations shared by all five buttons */
    .btn-1, .btn-2, .btn-3, .btn-4, .btn-5 {
      width: 128px;
      height: 28px;
      border-radius: 4px;
      color: #fff;
      font-size: 12px;
      border: none;
      outline: none;
      margin: 8px auto;
      font-weight: bold;
      cursor: pointer;
      opacity: .9;
    }
    .btn-1 {
      display: block;
      background: linear-gradient(180deg, #00E7F7 0%, #FEB800 0.01%, #FF8700 100%);
    }
    .btn-2 {
      display: none;
      background: #07C160;
    }
    .btn-3 {
      display: none;
      background: #FA5151;
    }
    .btn-4 {
      display: none;
      background: #1676FF;
    }
    .btn-5 {
      display: none;
      background: #ff6600;
    }
    .btns-sec button:hover {
      opacity: 0.8;
    }
    .btns-sec button:active{
      opacity: 1;
    }
    .btns-sec button[disabled] {
      cursor: not-allowed;
      opacity: 1;
      filter: grayscale(1);
    }
    .wk-popup-container {
      height: 100vh;
      width: 100vw;
      display: flex;
      flex-direction: column;
      justify-content: space-around;
      z-index: 999;
      background: 0 0;
    }
    .wk-popup-head {
      font-size: 1.5em;
      margin-bottom: 12px
    }
    .wk-card {
      background: #fff;
      background-image: linear-gradient(48deg, #fff 0, #e5efe9 100%);
      border-top-right-radius: 16px;
      border-bottom-left-radius: 16px;
      box-shadow: -20px 20px 35px 1px rgba(10, 49, 86, .18);
      display: flex;
      flex-direction: column;
      padding: 32px;
      margin: 0;
      max-width: 400px;
      width: 100%
    }
    .content-wrapper {
      font-size: 1.1em;
      margin-bottom: 44px
    }
    .content-wrapper:last-child {
      margin-bottom: 0
    }
    .wk-button {
      align-items: center;
      background: #e5efe9;
      border: 1px solid #5a72b5;
      border-radius: 4px;
      color: #121943;
      cursor: pointer;
      display: flex;
      font-size: 1em;
      font-weight: 700;
      height: 40px;
      justify-content: center;
      width: 150px
    }
    .wk-button:focus {
      border: 2px solid transparent;
      box-shadow: 0 0 0 2px #121943;
      outline: solid 4px transparent
    }
    .link {
      color: #121943
    }
    .link:focus {
      box-shadow: 0 0 0 2px #121943
    }
    .input-wrapper {
      display: flex;
      flex-direction: column
    }
    .input-wrapper .label {
      align-items: baseline;
      display: flex;
      font-weight: 700;
      justify-content: space-between;
      margin-bottom: 8px
    }
    .input-wrapper .optional {
      color: #5a72b5;
      font-size: .9em
    }
    .input-wrapper .input {
      border: 1px solid #5a72b5;
      border-radius: 4px;
      height: 40px;
      padding: 8px
    }
    .modal-header {
      align-items: baseline;
      display: flex;
      justify-content: space-between
    }
    .close {
      background: 0 0;
      border: none;
      cursor: pointer;
      display: flex;
      height: 16px;
      text-decoration: none;
      width: 16px
    }
    .close svg {
      width: 16px
    }
    .modal-wrapper {
      background: rgba(0, 0, 0, .7);
    }
    #wk-popup {
      opacity: 0;
      transition: opacity .25s ease-in-out;
      display: none;
      flex-direction: row;
      justify-content: space-around;
    }
    #wk-popup:target {
      opacity: 1;
      display: flex;
    }
    #wk-popup:target .modal-body {
      opacity: 1;
      /* translateY() needs a length; the unitless "1" was invalid and left
         the card shifted by -3vh while open */
      transform: translateY(0);
    }
    #wk-popup .modal-body {
      max-width: 500px;
      opacity: 0;
      transform: translateY(-3vh);
      transition: opacity .25s ease-in-out;
      width: 100%;
      z-index: 1
    }
    .outside-trigger {
      bottom: 0;
      cursor: default;
      left: 0;
      position: fixed;
      right: 0;
      top: 0;
    }
  </style>
  `;
  // HTML template of the progress popup. It is shown when the URL fragment
  // targets #wk-popup; both links point to "#!" to clear the target again.
  const popup = `
  <div class="wk-popup-container">
    <div class='modal-wrapper' id='wk-popup'>
      <div class='modal-body wk-card'>
        <div class='modal-header'>
          <h2 class='wk-popup-head'>下载进度条</h2>
          <a href='#!' role='button' class='close' aria-label='close this modal'>
            <svg viewBox='0 0 24 24'>
              <path
                d='M24 20.188l-8.315-8.209 8.2-8.282-3.697-3.697-8.212 8.318-8.31-8.203-3.666 3.666 8.321 8.24-8.206 8.313 3.666 3.666 8.237-8.318 8.285 8.203z'>
              </path>
            </svg>
          </a>
        </div>
        <p class='wk-popup-body'>正在初始化内容...</p>
      </div>
      <a href='#!' class='outside-trigger'></a>
    </div>
  </div>
  `;
  // Expose the two selector helpers as globals (wk$ / wk$$).
  739. globalThis.wk$ = base.$;
  740. globalThis.wk$$ = base.$$;
  741. const utils = {
  742. Socket: base.Socket,
  743. PDF_LIB_URL: "https://cdn.staticfile.org/pdf-lib/1.17.1/pdf-lib.min.js",
  744. encode_to_gbk: base.init_gbk_encoder(),
  745. print: function(...args) {
  746. const time = new Date().toTimeString().slice(0, 8);
  747. console.info(`[wk ${time}]`, ...args);
  748. },
  749. /**
  750. * 字节串转b64字符串
  751. * @param {Uint8Array} bytes
  752. * @returns {Promise<string>}
  753. */
  754. bytes_to_b64: function(bytes) {
  755. return new Promise((resolve, reject) => {
  756. const reader = new FileReader();
  757. reader.onerror = () => reject(new Error("转换失败", { cause: bytes }));
  758. reader.onloadend = () => resolve(reader.result.split(",")[1]);
  759. reader.readAsDataURL(new Blob([bytes]));
  760. });
  761. },
  762. /**
  763. * 以指定原因弹窗提示并抛出错误
  764. * @param {string} reason
  765. */
  766. raise: function(reason) {
  767. alert(reason);
  768. throw new Error(reason);
  769. },
  770. /**
  771. * 将错误定位转为可读的字符串
  772. * @param {Error} err
  773. * @returns {string}
  774. */
  775. get_stack: function(err) {
  776. let stack = `${err.stack}`;
  777. const matches = stack.matchAll(/at .+?( [(].+[)])/g);
  778. for (const group of matches) {
  779. stack = stack.replace(group[1], "");
  780. }
  781. return stack.trim();
  782. },
  783. /**
  784. * 合并多个PDF
  785. * @param {Array<ArrayBuffer | Uint8Array>} pdfs
  786. * @param {Function} loop_fn
  787. * @param {Window} win
  788. * @returns {Promise<Uint8Array>}
  789. */
  790. join_pdfs: async function(pdfs, loop_fn=null, win=null) {
  791. const _win = win || window;
  792. if (!_win.PDFLib) {
  793. await this.load_web_script(this.PDF_LIB_URL);
  794. }
  795. const combined = await PDFLib.PDFDocument.create();
  796. for (const [i, buffer] of this.enumerate(pdfs)) {
  797. const pdf = await PDFLib.PDFDocument.load(buffer);
  798. const pages = await combined.copyPages(
  799. pdf, pdf.getPageIndices()
  800. );
  801. for (const page of pages) {
  802. combined.addPage(page);
  803. }
  804. if (loop_fn) {
  805. // 如有,则使用自定义钩子函数
  806. loop_fn();
  807. } else {
  808. // 否则使用旧版 popup
  809. this.update_popup(`已经合并 ${i + 1} 组`);
  810. }
  811. }
  812. return await combined.save();
  813. },
  814. /**
  815. * raise an error for status which is not in [200, 299]
  816. * @param {Response} response
  817. */
  818. raise_for_status(response) {
  819. if (!response.ok) {
  820. throw new Error(
  821. `Fetch Error with status code: ${response.status}`
  822. );
  823. }
  824. },
  825. /**
  826. * Compute the CRC32 digest of str, returned as a number.
  827. * @param {string} str
  828. * @returns {number}
  829. */
  830. crc32: base.makeCRC32(),
  831. /**
  832. * 返回函数参数定义
  833. * @param {Function} fn
  834. * @param {boolean} print 是否打印到控制台,默认 true
  835. * @returns {string | undefined}
  836. */
  837. help: function(fn, print=true) {
  838. if (!(fn instanceof Function))
  839. throw new Error(`fn must be a function`);
  840. const
  841. _fn = fn.__func__ || fn,
  842. ARROW_ARG = /^([^(]+?)=>/,
  843. FN_ARGS = /^[^(]*\(\s*([^)]*)\)/m,
  844. STRIP_COMMENTS = /((\/\/.*$)|(\/\*[\s\S]*?\*\/))/mg,
  845. fn_text = Function.prototype.toString.call(_fn).replace(STRIP_COMMENTS, ''),
  846. args = fn_text.match(ARROW_ARG) || fn_text.match(FN_ARGS),
  847. // 如果自带 doc,优先使用,否则使用源码
  848. doc = fn.__doc__ ? fn.__doc__ : args[0];
  849. if (!print) return base.stripBlanks(doc);
  850. const color = (window.matchMedia &&
  851. window.matchMedia('(prefers-color-scheme: dark)').matches
  852. ) ;
  853. console.log("%c" + doc, `color: ${color}; font: small italic`);
  854. },
  855. /**
  856. * 字节数组转十六进制字符串
  857. * @param {Uint8Array} arr
  858. * @returns {string}
  859. */
  860. hex_bytes: function(arr) {
  861. return Array.from(arr)
  862. .map(byte => byte.toString(16).padStart(2, "0"))
  863. .join("");
  864. },
  865. /**
  866. * 取得对象类型
  867. * @param {*} obj
  868. * @returns {string} class
  869. */
  870. classof: function(obj) {
  871. return Object
  872. .prototype
  873. .toString
  874. .call(obj)
  875. .slice(8, -1);
  876. },
  877. /**
  878. * 随机改变字体颜色、大小、粗细
  879. * @param {HTMLElement} elem
  880. */
  881. emphasize_text: function(elem) {
  882. const rand = Math.random;
  883. elem.style.cssText = `
  884. font-weight: ${200 + parseInt(700 * rand())};
  885. font-size: ${(1 + rand()).toFixed(1)}em;
  886. color: hsl(${parseInt(360 * rand())}, ${parseInt(40 + 60 * rand())}%, ${parseInt(60 * rand())}%);
  887. background-color: yellow;`;
  888. },
  889. /**
  890. * 等待直到 DOM 节点停止变化
  891. * @param {HTMLElement} elem 监听节点
  892. * @param {number} timeout 超时毫秒数
  893. * @returns {Promise<MutationObserver>} observer
  894. */
  895. until_stop: async function(elem, timeout=2000) {
  896. // 创建用于共享的监听器
  897. let observer;
  898. // 创建超时 Promise
  899. const timeout_promise = new Promise((_, reject) => {
  900. setTimeout(() => {
  901. // 停止监听、释放资源
  902. observer.disconnect();
  903. const error = new Error(
  904. `Timeout Error occured on listening DOM mutation (max ${timeout}ms)`,
  905. { cause: elem }
  906. );
  907. reject(error);
  908. }, timeout);
  909. });
  910. // 开始元素节点变动监听
  911. return Promise.race([
  912. new Promise(resolve => {
  913. // 创建监听器
  914. observer = new MutationObserver(
  915. (_, observer) => {
  916. // DOM 变动结束后终止监听、释放资源
  917. observer.disconnect();
  918. // 返回监听器
  919. resolve(observer);
  920. }
  921. );
  922. // 开始监听目标节点
  923. observer.observe(elem, {
  924. subtree: true,
  925. childList: true,
  926. attributes: true
  927. });
  928. }),
  929. timeout_promise,
  930. ])
  931. .catch(error => {
  932. if (`${error}`.includes("Timeout Error")) {
  933. return observer;
  934. }
  935. console.error(error);
  936. throw error;
  937. });
  938. },
  939. /**
  940. * Find all the patterns that matches in a given string `str`
  941. * this algorithm is based on the Knuth–Morris–Pratt algorithm. Its beauty consists in that it performs the matching in O(n)
  942. * @param {Array<number>} arr
  943. * @param {Array<number>} sub_arr
  944. * @returns {Array<number>}
  945. */
  946. kmp_matching: function(arr, sub_arr) {
  947. // find the prefix table in O(n)
  948. let prefixes = base.longest_prefix(sub_arr);
  949. let matches = [];
  950. // `j` is the index in `P`
  951. let j = 0;
  952. // `i` is the index in `S`
  953. let i = 0;
  954. while (i < arr.length) {
  955. // Case 1. S[i] == P[j] so we move to the next index in `S` and `P`
  956. if (arr[i] === sub_arr[j]) {
  957. i++;
  958. j++;
  959. }
  960. // Case 2. `j` is equal to the length of `P`
  961. // that means that we reached the end of `P` and thus we found a match
  962. if (j === sub_arr.length) {
  963. matches.push(i - j);
  964. // Next we have to update `j` because we want to save some time
  965. // instead of updating to j = 0 , we can jump to the last character of the longest prefix well known so far.
  966. // j-1 means the last character of `P` because j is actually `P.length`
  967. // e.g.
  968. // S = a b a b d e
  969. // P = `a b`a b
  970. // we will jump to `a b` and we will compare d and a in the next iteration
  971. // a b a b `d` e
  972. // a b `a` b
  973. j = prefixes[j - 1];
  974. }
  975. // Case 3.
  976. // S[i] != P[j] There's a mismatch!
  977. else if (arr[i] !== sub_arr[j]) {
  978. // if we have found at least a character in common, do the same thing as in case 2
  979. if (j !== 0) {
  980. j = prefixes[j - 1];
  981. } else {
  982. // otherwise, j = 0, and we can move to the next character S[i+1]
  983. i++;
  984. }
  985. }
  986. }
  987. return matches;
  988. },
  989. /**
  990. * 用文件头切断文件集合体
  991. * @param {Uint8Array} bytes
  992. * @param {Uint8Array} head 默认 null,即使用 data 前 8 字节
  993. * @returns {Array<Uint8Array>}
  994. */
  995. split_files_by_head: function(bytes, head=null) {
  996. const sub = bytes.subarray || bytes.slice;
  997. head = head || sub.call(bytes, 0, 8);
  998. const indexes = this.kmp_matching(bytes, head);
  999. const size = indexes.length;
  1000. indexes.push(bytes.length);
  1001. const parts = new Array(size);
  1002. for (let i = 0; i < size; i++) {
  1003. parts[i] = sub.call(bytes, indexes[i], indexes[i+1]);
  1004. }
  1005. // 返回结果数组
  1006. return parts;
  1007. },
  1008. /**
  1009. * 函数装饰器:仅执行一次 func
  1010. */
  1011. once: function(fn) {
  1012. let used = false;
  1013. return function() {
  1014. if (!used) {
  1015. used = true;
  1016. return fn();
  1017. }
  1018. }
  1019. },
  1020. /**
  1021. * 返回一个包含计数器的迭代器, 其每次迭代值为 [index, value]
  1022. * @param {Iterable} iterable
  1023. * @returns
  1024. */
  1025. enumerate: function* (iterable) {
  1026. let i = 0;
  1027. for (let value of iterable) {
  1028. yield [i, value];
  1029. i++;
  1030. }
  1031. },
  1032. /**
  1033. * 同步的迭代若干可迭代对象
  1034. * @param {...Iterable} iterables
  1035. * @returns
  1036. */
  1037. zip: function* (...iterables) {
  1038. // 强制转为迭代器
  1039. let iterators = iterables.map(
  1040. iterable => iterable[Symbol.iterator]()
  1041. );
  1042. // 逐次迭代
  1043. while (true) {
  1044. const [done, values] = base.getAllValus(iterators);
  1045. if (done) {
  1046. return;
  1047. }
  1048. if (values.length === 1) {
  1049. yield values[0];
  1050. } else {
  1051. yield values;
  1052. }
  1053. }
  1054. },
  1055. /**
  1056. * 返回指定范围整数生成器
  1057. * @param {number} end 如果只提供 end, 则返回 [0, end)
  1058. * @param {number} end2 如果同时提供 end2, 则返回 [end, end2)
  1059. * @param {number} step 步长, 可以为负数,不能为 0
  1060. * @returns
  1061. */
  1062. range: function*(end, end2=null, step=1) {
  1063. // 参数合法性校验
  1064. if (step === 0) {
  1065. throw new RangeError("step can't be zero");
  1066. }
  1067. const len = end2 - end;
  1068. if (end2 && len && step && (len * step < 0)) {
  1069. throw new RangeError(`[${end}, ${end2}) with step ${step} is invalid`);
  1070. }
  1071. // 生成范围
  1072. end2 = end2 === null ? 0 : end2;
  1073. let [small, big] = [end, end2].sort((a, b) => a - b);
  1074. // 开始迭代
  1075. if (step > 0) {
  1076. for (let i = small; i < big; i += step) {
  1077. yield i;
  1078. }
  1079. } else {
  1080. for (let i = big; i > small; i += step) {
  1081. yield i;
  1082. }
  1083. } },
  1084. /**
  1085. * 获取整个文档的全部css样式
  1086. * @returns {string} css text
  1087. */
  1088. get_all_styles: function() {
  1089. let styles = [];
  1090. for (let sheet of document.styleSheets) {
  1091. let rules;
  1092. try {
  1093. rules = sheet.cssRules;
  1094. } catch(e) {
  1095. if (!(e instanceof DOMException)) {
  1096. console.error(e);
  1097. }
  1098. continue;
  1099. }
  1100. for (let rule of rules) {
  1101. styles.push(rule.cssText);
  1102. }
  1103. }
  1104. return styles.join("\n\n");
  1105. },
  1106. /**
  1107. * 复制text到剪贴板
  1108. * @param {string} text
  1109. * @returns
  1110. */
  1111. copy_text: function(text) {
  1112. // 输出到控制台和剪贴板
  1113. console.log(
  1114. text.length > 20 ?
  1115. text.slice(0, 21) + "..." : text
  1116. );
  1117. if (!navigator.clipboard) {
  1118. base.oldCopy(text);
  1119. return;
  1120. }
  1121. navigator.clipboard
  1122. .writeText(text)
  1123. .catch(_ => base.oldCopy(text));
  1124. },
  1125. /**
  1126. * 复制媒体到剪贴板
  1127. * @param {Blob} blob
  1128. */
  1129. copy: async function(blob) {
  1130. const data = [new ClipboardItem({ [blob.type]: blob })];
  1131. try {
  1132. await navigator.clipboard.write(data);
  1133. console.log(`${blob.type} 成功复制到剪贴板`);
  1134. } catch (err) {
  1135. console.error(err.name, err.message);
  1136. }
  1137. },
  1138. /**
  1139. * 创建并下载文件
  1140. * @param {string} file_name 文件名
  1141. * @param {ArrayBuffer | ArrayBufferView | Blob | string} content 内容
  1142. * @param {string} type 媒体类型,需要符合 MIME 标准
  1143. */
  1144. save: function(file_name, content, type="") {
  1145. if (!type && (content instanceof Blob)) {
  1146. type = content.type;
  1147. }
  1148. let blob = null;
  1149. if (content instanceof Array) {
  1150. blob = new Blob(content, { type });
  1151. } else {
  1152. blob = new Blob([content], { type });
  1153. }
  1154. const size = parseInt((blob.size / 1024).toFixed(0)).toLocaleString();
  1155. console.log(`blob saved, size: ${size} KB, type: ${blob.type}`, blob);
  1156. const url = URL.createObjectURL(blob);
  1157. const a = document.createElement("a");
  1158. a.download = file_name || "未命名文件";
  1159. a.href = url;
  1160. a.click();
  1161. URL.revokeObjectURL(url);
  1162. },
  1163. /**
  1164. * 显示/隐藏按钮区
  1165. */
  1166. toggle_box: function() {
  1167. let sec = wk$(".wk-box")[0];
  1168. if (sec.style.display === "none") {
  1169. sec.style.display = "block";
  1170. return;
  1171. }
  1172. sec.style.display = "none";
  1173. },
  1174. /**
  1175. * 异步地睡眠 delay 毫秒, 可选 max_delay 控制波动范围
  1176. * @param {number} delay 等待毫秒
  1177. * @param {number} max_delay 最大等待毫秒, 默认为null
  1178. * @returns
  1179. */
  1180. sleep: async function(delay, max_delay=null) {
  1181. max_delay = max_delay === null ? delay : max_delay;
  1182. delay = delay + (max_delay - delay) * Math.random();
  1183. return new Promise(resolve => setTimeout(resolve, delay));
  1184. },
  1185. /**
  1186. * 允许打印页面
  1187. */
  1188. allow_print: function() {
  1189. const style = document.createElement("style");
  1190. style.innerHTML = `
  1191. @media print {
  1192. body { display: block; }
  1193. }`;
  1194. document.head.append(style);
  1195. },
  1196. /**
  1197. * 取得get参数key对应的value
  1198. * @param {string} key
  1199. * @returns {string} value
  1200. */
  1201. get_param: function(key) {
  1202. return new URL(location.href).searchParams.get(key);
  1203. },
  1204. /**
  1205. * 求main_set去除cut_set后的set
  1206. * @param {Iterable} main_set
  1207. * @param {Iterable} cut_set
  1208. * @returns 差集
  1209. */
  1210. diff: function(main_set, cut_set) {
  1211. const _diff = new Set(main_set);
  1212. for (let elem of cut_set) {
  1213. _diff.delete(elem);
  1214. }
  1215. return _diff;
  1216. },
  1217. /**
  1218. * 增强按钮(默认为蓝色按钮:展开文档)的点击效果
  1219. * @param {string} i 按钮序号
  1220. */
  1221. enhance_click: async function(i) {
  1222. let btn = this.btn(i);
  1223. const style = btn.getAttribute("style") || "";
  1224. // 变黑缩小
  1225. btn.setAttribute(
  1226. "style",
  1227. style + "color: black; font-weight: normal;"
  1228. );
  1229. await utils.sleep(500);
  1230. btn = this.btn(i);
  1231. // 复原加粗
  1232. btn.setAttribute("style", style);
  1233. },
  1234. /**
  1235. * 绑定事件处理函数到指定按钮,返回实际添加的事件处理函数
  1236. * @param {(event: PointerEvent) => Promise<void>} listener click监听器
  1237. * @param {number} i 按钮序号
  1238. * @param {string} new_text 按钮的新文本,为null则不替换
  1239. * @returns {Function} 事件处理函数
  1240. */
  1241. onclick: function(listener, i, new_text=null) {
  1242. const btn = this.btn(i);
  1243. // 如果需要,替换按钮内文本
  1244. if (new_text) {
  1245. btn.textContent = new_text;
  1246. }
  1247. // 绑定事件,添加到页面上
  1248. /**
  1249. * @param {PointerEvent} event
  1250. */
  1251. async function wrapped_listener(event) {
  1252. const btn = event.target;
  1253. const text = btn.textContent;
  1254. btn.disabled = true;
  1255. try {
  1256. await listener.call(btn, event);
  1257. } catch(err) {
  1258. console.error(err);
  1259. }
  1260. btn.disabled = false;
  1261. btn.textContent = text;
  1262. }
  1263. btn.onclick = wrapped_listener;
  1264. return wrapped_listener;
  1265. },
  1266. /**
  1267. * 返回第 index 个按钮引用
  1268. * @param {number} i
  1269. * @returns {HTMLButtonElement}
  1270. */
  1271. btn: function(i) {
  1272. return wk$(`.wk-box [class="btn-${i}"]`)[0];
  1273. },
  1274. /**
  1275. * 强制隐藏元素
  1276. * @param {string | Array<HTMLElement>} selector_or_elems
  1277. */
  1278. force_hide: function(selector_or_elems) {
  1279. const cls = "force-hide";
  1280. const elems = selector_or_elems instanceof Array ?
  1281. selector_or_elems : wk$(selector_or_elems);
  1282. elems.forEach(elem => {
  1283. elem.classList.add(cls);
  1284. });
  1285. // 判断css样式是否已经存在
  1286. let style = wk$(`style.${cls}`)[0];
  1287. // 如果已经存在,则无须重复创建
  1288. if (style) {
  1289. return;
  1290. }
  1291. // 否则创建
  1292. style = document.createElement("style");
  1293. style.innerHTML = `style.${cls} {
  1294. visibility: hidden !important;
  1295. display: none !important;
  1296. }`;
  1297. document.head.append(style);
  1298. },
  1299. /**
  1300. * 等待直到元素可见。最多等待5秒。
  1301. * @param {HTMLElement} elem 一个元素
  1302. * @returns {Promise<HTMLElement>} elem
  1303. */
  1304. until_visible: async function(elem) {
  1305. let [max, i] = [25, 0];
  1306. let style = getComputedStyle(elem);
  1307. // 如果不可见就等待0.2秒/轮
  1308. while (i <= max &&
  1309. (style.display === "none" ||
  1310. style.visibility !== "hidden")
  1311. ) {
  1312. i++;
  1313. style = getComputedStyle(elem);
  1314. await this.sleep(200);
  1315. }
  1316. return elem;
  1317. },
  1318. /**
  1319. * 等待直到函数返回true
  1320. * @param {Function} isReady 判断条件达成与否的函数
  1321. * @param {number} timeout 最大等待秒数, 默认5000毫秒
  1322. */
  1323. wait_until: async function(isReady, timeout=5000) {
  1324. const gap = 200;
  1325. let chances = parseInt(timeout / gap);
  1326. chances = chances < 1 ? 1 : chances;
  1327. while (! await isReady()) {
  1328. await this.sleep(200);
  1329. chances -= 1;
  1330. if (!chances) {
  1331. break;
  1332. }
  1333. }
  1334. },
  1335. /**
  1336. * 隐藏按钮,打印页面,显示按钮
  1337. */
  1338. print_page: function() {
  1339. // 隐藏按钮,然后打印页面
  1340. this.toggle_box();
  1341. setTimeout(window.print, 500);
  1342. setTimeout(this.toggle_box, 1000);
  1343. },
  1344. /**
  1345. * 切换按钮显示/隐藏状态
  1346. * @param {number} i 按钮序号
  1347. * @returns 按钮元素的引用
  1348. */
  1349. toggle_btn: function(i) {
  1350. const btn = this.btn(i);
  1351. const display = getComputedStyle(btn).display;
  1352. if (display === "none") {
  1353. btn.style.display = "block";
  1354. } else {
  1355. btn.style.display = "none";
  1356. }
  1357. return btn;
  1358. },
  1359. /**
  1360. * 用input框跳转到对应页码
  1361. * @param {HTMLInputElement} input 当前页码
  1362. * @param {string | number} page_num 目标页码
  1363. * @param {string} type 键盘事件类型:"keyup" | "keypress" | "keydown"
  1364. */
  1365. to_page: function(input, page_num, type) {
  1366. // 设置跳转页码为目标页码
  1367. input.value = `${page_num}`;
  1368. // 模拟回车事件来跳转
  1369. const enter = new KeyboardEvent(type, {
  1370. bubbles: true,
  1371. cancelable: true,
  1372. keyCode: 13
  1373. });
  1374. input.dispatchEvent(enter);
  1375. },
  1376. /**
  1377. * 判断给定的url是否与当前页面同源
  1378. * @param {string} url
  1379. * @returns {boolean}
  1380. */
  1381. is_same_origin: function(url) {
  1382. url = new URL(url);
  1383. if (url.protocol === "data:") {
  1384. return true;
  1385. }
  1386. if (location.protocol === url.protocol
  1387. && location.host === url.host
  1388. && location.port === url.port
  1389. ) {
  1390. return true;
  1391. }
  1392. return false;
  1393. },
  1394. /**
  1395. * 在新标签页打开链接,如果提供文件名则下载
  1396. * @param {string} url
  1397. * @param {string} fname 下载文件的名称,默认为空,代表不下载
  1398. */
  1399. open_in_new_tab: function(url, fname="") {
  1400. const a = document.createElement("a");
  1401. a.href = url;
  1402. a.target = "_blank";
  1403. if (fname && this.is_same_origin(url)) {
  1404. a.download = fname;
  1405. }
  1406. a.click();
  1407. },
  1408. /**
  1409. * 用try移除元素
  1410. * @param {HTMLElement | string} elem_or_selector
  1411. */
  1412. remove: function(elem_or_selector) {
  1413. try {
  1414. const cls = this.classof(elem_or_selector);
  1415. if (cls === "String") {
  1416. wk$(elem_or_selector).forEach(
  1417. elem => elem.remove()
  1418. );
  1419. }
  1420. else if (cls.endsWith("Element")) {
  1421. elem_or_selector.remove();
  1422. }
  1423. } catch (e) {
  1424. console.error(e);
  1425. }
  1426. },
  1427. /**
  1428. * 用try移除若干元素
  1429. * @param {Iterable<HTMLElement>} elements 要移除的元素列表
  1430. */
  1431. remove_multi: function(elements) {
  1432. for (const elem of elements) {
  1433. this.remove(elem);
  1434. }
  1435. },
  1436. /**
  1437. * 等待全部任务落定后返回值的列表
  1438. * @param {Array<Promise>} tasks
  1439. * @returns {Promise<Array>}
  1440. */
  1441. gather: async function(tasks) {
  1442. const results = await Promise.allSettled(tasks);
  1443. const values = [];
  1444. for (const result of results) {
  1445. // 期约成功解决且返回值不为空的才有效
  1446. if (result.status === "fulfilled"
  1447. && !([NaN, null, undefined].includes(result.value))) {
  1448. values.push(result.value);
  1449. }
  1450. }
  1451. return values;
  1452. },
  1453. /**
  1454. * html元素列表转为canvas列表
  1455. * @param {Array<HTMLElement>} elements
  1456. * @returns {Promise<Array<HTMLCanvasElement>>}
  1457. */
  1458. elems_to_canvases: async function(elements) {
  1459. if (!globalThis.html2canvas) {
  1460. await this.load_web_script(
  1461. "https://cdn.staticfile.org/html2canvas/1.4.1/html2canvas.min.js"
  1462. );
  1463. }
  1464. // 如果是空列表, 则抛出异常
  1465. if (elements.length === 0) {
  1466. throw new Error("htmlToCanvases 未得到任何html元素");
  1467. }
  1468. return this.gather(
  1469. elements.map(html2canvas)
  1470. );
  1471. },
  1472. /**
  1473. * 将html元素转为canvas再合并到pdf中,最后下载pdf
  1474. * @param {Array<HTMLElement>} elements 元素列表
  1475. * @param {string} title 文档标题
  1476. */
  1477. elems_to_pdf: async function(elements, title="文档") {
  1478. // 如果是空元素列表,终止函数
  1479. const canvases = await this.elems_to_canvases(elements);
  1480. // 控制台检查结果
  1481. console.log("生成的canvas元素如下:");
  1482. console.log(canvases);
  1483. // 合并为PDF
  1484. this.imgs_to_pdf(canvases, title);
  1485. },
  1486. /**
  1487. * 使用xhr异步GET请求目标url,返回响应体blob
  1488. * @param {string} url
  1489. * @returns {Promise<Blob>} blob
  1490. */
  1491. xhr_get_blob: async function(url) {
  1492. const xhr = new XMLHttpRequest();
  1493. xhr.open("GET", url);
  1494. xhr.responseType = "blob";
  1495. return new Promise((resolve, reject) => {
  1496. xhr.onload = () => {
  1497. const code = xhr.status;
  1498. if (code >= 200 && code <= 299) {
  1499. resolve(xhr.response);
  1500. }
  1501. else {
  1502. reject(new Error(`Network Error: ${code}`));
  1503. }
  1504. };
  1505. xhr.send();
  1506. });
  1507. },
  1508. /**
  1509. * 加载CDN脚本
  1510. * @param {string} url
  1511. */
  1512. load_web_script: async function(url) {
  1513. try {
  1514. const resp = await fetch(url);
  1515. const code = await resp.text();
  1516. Function(code)();
  1517. } catch(e) {
  1518. console.error(e);
  1519. // 嵌入<script>方式
  1520. return new Promise(resolve => {
  1521. const script = document.createElement("script");
  1522. script.src = url;
  1523. script.onload = resolve;
  1524. document.body.append(script);
  1525. });
  1526. }
  1527. },
  /**
   * Decode a base64 string into a Uint8Array.
   * Characters outside A-Z, a-z, 0-9, "+" and "/" (including "=" padding)
   * are stripped before decoding.
   * @param {string} sBase64 base64-encoded text
   * @param {number} nBlockSize output length is rounded up to a multiple
   *   of this value; a falsy value disables rounding
   * @returns {Uint8Array} decoded bytes
   */
  b64_to_bytes: function(sBase64, nBlockSize=1) {
      const
          // Cleaned input and its length; output length is (nInLen * 3 + 1) >>> 2,
          // optionally rounded up to a multiple of nBlockSize.
          sB64Enc = sBase64.replace(/[^A-Za-z0-9\+\/]/g, ""), nInLen = sB64Enc.length,
          nOutLen = nBlockSize ? Math.ceil((nInLen * 3 + 1 >>> 2) / nBlockSize) * nBlockSize : nInLen * 3 + 1 >>> 2, aBytes = new Uint8Array(nOutLen);
      for (var nMod3, nMod4, nUint24 = 0, nOutIdx = 0, nInIdx = 0; nInIdx < nInLen; nInIdx++) {
          // Position of this character inside its group of four.
          nMod4 = nInIdx & 3;
          // Pack the character's value into the 24-bit accumulator;
          // base.b64ToUint6 presumably maps a char code to its 6-bit value (defined elsewhere).
          nUint24 |= base.b64ToUint6(sB64Enc.charCodeAt(nInIdx)) << 18 - 6 * nMod4;
          // Flush after every fourth character, or at the last character.
          if (nMod4 === 3 || nInLen - nInIdx === 1) {
              for (nMod3 = 0; nMod3 < 3 && nOutIdx < nOutLen; nMod3++, nOutIdx++) {
                  // (16 >>> nMod3 & 24) evaluates to 16, 8, 0: high byte first.
                  aBytes[nOutIdx] = nUint24 >>> (16 >>> nMod3 & 24) & 255;
              }
              nUint24 = 0;
          }
      }
      return aBytes;
  },
  1550. /**
  1551. * canvas转blob
  1552. * @param {HTMLCanvasElement} canvas
  1553. * @param {string} type
  1554. * @returns {Promise<Blob>}
  1555. */
  1556. canvas_to_blob: function(canvas, type="image/png") {
  1557. return new Promise(
  1558. resolve => canvas.toBlob(resolve, type, 1)
  1559. );
  1560. },
  1561. /**
  1562. * 合并blobs到压缩包,然后下载
  1563. * @param {Iterable<Blob>} blobs
  1564. * @param {string} base_name 文件名通用部分,如 page-1.jpg 中的 page
  1565. * @param {string} ext 扩展名,如 jpg
  1566. * @param {string} zip_name 压缩包名称
  1567. * @param {boolean} download 是否下载,可选,默认true,如果不下载则返回压缩包对象
  1568. * @returns {"Promise<JSZip | null>"}
  1569. */
  1570. blobs_to_zip: async function(blobs, base_name, ext, zip_name, download=true) {
  1571. const zip = new window.JSZip();
  1572. // 归档
  1573. for (const [i, blob] of this.enumerate(blobs)) {
  1574. zip.file(`${base_name}-${i+1}.${ext}`, blob, { binary: true });
  1575. }
  1576. // 导出
  1577. if (!download) {
  1578. return zip;
  1579. }
  1580. const zip_blob = await zip.generateAsync({ type: "blob" });
  1581. console.log(zip_blob);
  1582. this.save(`${zip_name}.zip`, zip_blob);
  1583. return null;
  1584. },
  1585. /**
  1586. * 存储所有canvas图形为png到一个压缩包
  1587. * @param {Iterable<HTMLCanvasElement>} canvases canvas元素列表
  1588. * @param {string} title 文档标题
  1589. */
  1590. canvases_to_zip: async function(canvases, title) {
  1591. // canvas元素转为png图像
  1592. // 所有png合并为一个zip压缩包
  1593. const tasks = [];
  1594. for (let canvas of canvases) {
  1595. tasks.push(this.canvas_to_blob(canvas));
  1596. }
  1597. const blobs = await this.gather(tasks);
  1598. this.blobs_to_zip(blobs, "page", "png", title);
  1599. },
  1600. /**
  1601. * 合并图像并导出PDF
  1602. * @param {Iterable<HTMLCanvasElement | Uint8Array | HTMLImageElement>} imgs 图像元素列表
  1603. * @param {string} title 文档标题
  1604. * @param {number} width (可选)页面宽度 默认 0
  1605. * @param {number} height (可选)页面高度 默认 0
  1606. * @param {boolean} blob (可选)是否返回 blob 默认 false
  1607. */
  1608. imgs_to_pdf: async function(imgs, title, width = 0, height = 0, blob=false) {
  1609. imgs = Array.from(imgs);
  1610. if (imgs.length === 0) {
  1611. this.raise("没有任何图像用于合并为PDF");
  1612. }
  1613. // 先获取第一个canvas用于判断竖向还是横向,以及得到页面长宽
  1614. const first = imgs[0];
  1615. // 如果没有手动指定canvas的长宽,则自动检测
  1616. if (!width && !height) {
  1617. // 如果是字节数组
  1618. if (first instanceof Uint8Array) {
  1619. const cover = await createImageBitmap(
  1620. new Blob([first])
  1621. );
  1622. [width, height] = [cover.width, cover.height];
  1623. // 如果是画布或图像元素
  1624. } else if (
  1625. first instanceof HTMLCanvasElement ||
  1626. first instanceof HTMLImageElement
  1627. ) {
  1628. if (first.width && parseInt(first.width) && parseInt(first.height)) {
  1629. [width, height] = [first.width, first.height];
  1630. } else {
  1631. const
  1632. width_str = first.style.width.replace(/(px)|(rem)|(em)/, ""),
  1633. height_str = first.style.height.replace(/(px)|(rem)|(em)/, "");
  1634. width = parseInt(width_str);
  1635. height = parseInt(height_str);
  1636. }
  1637. } else {
  1638. // 其他未知类型
  1639. throw TypeError("不能处理的画布元素类型:" + this.classof(first));
  1640. }
  1641. }
  1642. console.log(`canvas数据:宽: ${width}px,高: ${height}px`);
  1643. // 如果文档第一页的宽比长更大,则landscape,否则portrait
  1644. const orientation = width > height ? 'l' : 'p';
  1645. // jsPDF的第三个参数为format,当自定义时,参数为数字数组。
  1646. const pdf = new jspdf.jsPDF(orientation, 'px', [height, width]);
  1647. const last = imgs.pop();
  1648. const self = this;
  1649. // 保存每一页文档到每一页pdf
  1650. imgs.forEach((canvas, i) => {
  1651. pdf.addImage(canvas, 'png', 0, 0, width, height);
  1652. pdf.addPage();
  1653. self?.update_popup(`PDF 已经绘制 ${i + 1} 页`);
  1654. });
  1655. // 添加尾页
  1656. pdf.addImage(last, 'png', 0, 0, width, height);
  1657. // 导出文件
  1658. if (blob) {
  1659. return pdf.output("blob");
  1660. }
  1661. pdf.save(`${title}.pdf`);
  1662. },
  1663. /**
  1664. * imageBitMap转canvas
  1665. * @param {ImageBitmap} bmp
  1666. * @returns {HTMLCanvasElement} canvas
  1667. */
  1668. bmp_to_canvas: function(bmp) {
  1669. const canvas = document.createElement("canvas");
  1670. canvas.height = bmp.height;
  1671. canvas.width = bmp.width;
  1672. const ctx = canvas.getContext("bitmaprenderer");
  1673. ctx.transferFromImageBitmap(bmp);
  1674. return canvas;
  1675. },
  1676. /**
  1677. * 导出图片链接
  1678. * @param {Iterable<string>} urls
  1679. */
  1680. save_urls: function(urls) {
  1681. const _urls = Array
  1682. .from(urls)
  1683. .map((url) => {
  1684. const _url = url.trim();
  1685. if (url.startsWith("//"))
  1686. return "https:" + _url;
  1687. return _url;
  1688. })
  1689. .filter(url => url);
  1690. this.save("urls.csv", _urls.join("\n"), "text/csv");
  1691. },
  1692. /**
  1693. * 图片blobs合并并导出为单个PDF
  1694. * @param {Array<Blob>} blobs
  1695. * @param {string} title (可选)文档名称, 不含后缀, 默认为"文档"
  1696. * @param {boolean} filter (可选)是否过滤 type 不以 "image/" 开头的 blob; 默认为 true
  1697. * @param {boolean} blob (可选)是否返回 blob,默认 false
  1698. */
  1699. img_blobs_to_pdf: async function(blobs, title="文档", filter=true, blob=false) {
  1700. // 格式转换:img blob -> bmp
  1701. let tasks = blobs;
  1702. if (filter) {
  1703. tasks = blobs.filter(
  1704. blob => blob.type.startsWith("image/")
  1705. );
  1706. }
  1707. tasks = await this.gather(
  1708. tasks.map(blob => blob.arrayBuffer())
  1709. );
  1710. tasks = tasks.map(buffer => new Uint8Array(buffer));
  1711. // 导出PDF
  1712. return this.imgs_to_pdf(tasks, title, 0, 0, blob);
  1713. },
  1714. /**
  1715. * 下载可以简单直接请求的图片,合并到 PDF 并导出
  1716. * @param {Iterable<string>} urls 图片链接列表
  1717. * @param {string} title 文档名称
  1718. * @param {number} min_num 如果成功获取的图片数量 < min_num, 则等待 2 秒后重试; 默认 0 不重试
  1719. * @param {boolean} clear 是否在请求完成后清理控制台输出,默认false
  1720. * @param {boolean} blobs 是否返回二进制图片列表,默认 false(即直接导出PDF)
  1721. */
  1722. img_urls_to_pdf: async function(urls, title, min_num=0, clear=false, blobs=false) {
  1723. // 强制转换为迭代器类型
  1724. urls = urls[Symbol.iterator]();
  1725. const first = urls.next().value;
  1726. // 如果不符合同源策略,在打开新标签页
  1727. if (!this.is_same_origin(first)) {
  1728. console.info("URL 不符合同源策略;转为新标签页打开目标网站");
  1729. this.open_in_new_tab((new URL(first)).origin);
  1730. return;
  1731. }
  1732. let tasks, img_blobs, i = 3;
  1733. // 根据请求成功数量判断是否循环
  1734. do {
  1735. i -= 1;
  1736. // 发起请求
  1737. tasks = [this.xhr_get_blob(first)]; // 初始化时加入第一个
  1738. // 然后加入剩余的
  1739. for (const [j, url] of this.enumerate(urls)) {
  1740. tasks.push(this.xhr_get_blob(url));
  1741. this.update_popup(`已经请求 ${j} 张图片`);
  1742. }
  1743. // 接收响应
  1744. img_blobs = (await this.gather(tasks)).filter(
  1745. blob => blob.type.startsWith("image/")
  1746. );
  1747. if (clear) {
  1748. console.clear();
  1749. }
  1750. if (
  1751. min_num
  1752. && img_blobs.length < min_num
  1753. && i
  1754. ) {
  1755. // 下轮行动前冷却
  1756. console.log(`打盹 2 秒`);
  1757. await utils.sleep(2000);
  1758. } else {
  1759. // 结束循环
  1760. break;
  1761. }
  1762. } while (true)
  1763. if (blobs) return img_blobs;
  1764. await this.img_blobs_to_pdf(img_blobs, title, false);
  1765. },
  1766. /**
  1767. * 返回子串个数
  1768. * @param {string} str
  1769. * @param {string} sub
  1770. */
  1771. count_sub_str: function(str, sub) {
  1772. return [...str.matchAll(sub)].length;
  1773. },
  1774. /**
  1775. * 返回按钮区引用
  1776. * @returns
  1777. */
  1778. sec: function() {
  1779. const sec = wk$(".wk-box .btns-sec")[0];
  1780. if (!sec) throw new Error("wk 按钮区找不到");
  1781. return sec;
  1782. },
  1783. _monkey: function() {
  1784. const mky = wk$(".wk-box .wk-fold-btn")[0];
  1785. if (!mky) throw new Error("wk 小猴子找不到");
  1786. return mky;
  1787. },
  1788. /**
  1789. * 折叠按钮区,返回是否转换了状态
  1790. */
  1791. fold_box: function() {
  1792. const sec = this.sec();
  1793. const mky = this._monkey();
  1794. const display = getComputedStyle(sec).display;
  1795. if (display !== "block") return false;
  1796. // 显示 -> 隐藏
  1797. [sec, mky].forEach(
  1798. elem => elem.classList.add("folded")
  1799. );
  1800. return true;
  1801. },
  1802. /**
  1803. * 展开按钮区,返回是否转换了状态
  1804. */
  1805. unfold_box: function() {
  1806. const sec = this.sec();
  1807. const mky = this._monkey();
  1808. const display = getComputedStyle(sec).display;
  1809. if (display === "block") return false;
  1810. // 隐藏 -> 显示
  1811. // 显示 -> 隐藏
  1812. [sec, mky].forEach(
  1813. elem => elem.classList.remove("folded")
  1814. );
  1815. return true;
  1816. },
  1817. /**
  1818. * 运行基于按钮的、显示进度条的函数
  1819. * @param {number} i 按钮序号
  1820. * @param {Function} task 需要等待的耗时函数
  1821. */
  1822. run_with_prog: async function(i, task) {
  1823. const btn = utils.btn(i);
  1824. let new_btn;
  1825. if (!wk$("#wk-popup")[0]) {
  1826. this.add_popup();
  1827. }
  1828. this.fold_box();
  1829. this.toID("wk-popup");
  1830. new_btn = btn.cloneNode(true);
  1831. btn.replaceWith(new_btn);
  1832. this.onclick(
  1833. () => utils.toID("wk-popup"), i, "显示进度"
  1834. );
  1835. try {
  1836. await task();
  1837. } catch(e) {
  1838. console.error(e);
  1839. }
  1840. this.toID("");
  1841. this.unfold_box();
  1842. this.remove_popup();
  1843. new_btn.replaceWith(btn);
  1844. },
  1845. /**
  1846. * 创建5个按钮:展开文档、导出图片、导出PDF、未设定4、未设定5;除第1个外默认均为隐藏
  1847. */
  1848. create_btns: function() {
  1849. // 添加样式
  1850. document.head.insertAdjacentHTML("beforeend", style);
  1851. // 添加按钮区
  1852. document.body.insertAdjacentHTML("beforeend", box);
  1853. // 绑定小猴子按钮回调
  1854. const monkey = wk$(".wk-fold-btn")[0];
  1855. // 隐藏【🙈】,展开【🐵】
  1856. monkey.onclick = () => this.fold_box() || this.unfold_box();
  1857. },
  1858. /**
  1859. * 添加弹窗到 body, 通过 utils.toID("wk-popup") 激发
  1860. */
  1861. add_popup: function() {
  1862. document.body.insertAdjacentHTML("beforeend", popup);
  1863. },
  1864. /**
  1865. * 设置弹窗正文
  1866. * @param {string} text
  1867. */
  1868. update_popup: function(text) {
  1869. const body = wk$(".wk-popup-body")[0];
  1870. if (!body) return;
  1871. body.textContent = text;
  1872. },
  1873. /**
  1874. * 移除弹窗
  1875. */
  1876. remove_popup: function() {
  1877. this.remove(wk$(".wk-popup-container")[0]);
  1878. },
  1879. /**
  1880. * 滚动页面到id位置的元素处
  1881. * @param {string} id
  1882. */
  1883. toID: function(id) {
  1884. location.hash = `#${id}`;
  1885. }
  1886. };
  1887. /**
  1888. * ---------------------------------------------------------------------
  1889. * 绑定使用 this 的函数到 utils,使其均成为绑定方法
  1890. * ---------------------------------------------------------------------
  1891. */
  /**
   * Decorator: return an async wrapper around func that loads an external
   * script first when its global object is not on window.
   * @param {string} global_obj_name property of window that signals the
   *   script is loaded
   * @param {string} cdn_url script URL given to utils.load_web_script
   * @param {Function} func the function to wrap
   * @returns {Function} async wrapper that resolves with func's result
   */
  function ensure_script_existed(global_obj_name, cdn_url, func) {
      const inner = async function inner(...args) {
          const is_loaded = Boolean(window[global_obj_name]);
          if (!is_loaded) {
              await utils.load_web_script(cdn_url);
          }
          return func(...args);
      };
      // Copy func's own members (e.g. its parameter docs) onto the wrapper.
      base.superAssign(inner, func);
      return inner;
  }
  /**
   * Post-process every member of utils, in this order:
   * 1. bind `this` to utils for members whose source text uses `this`;
   * 2. install an accumulating `__doc__` accessor;
   * 3. wrap `*_to_zip` / `*_to_pdf` members so their external library is
   *    loaded before the call.
   */
  for (const prop of Object.keys(utils)) {
      // Skip members that are not functions and whose string form does
      // not start with "class".
      if (
          !(typeof utils[prop] === "function")
          && !`${utils[prop]}`.startsWith("class")
      ) {
          continue;
      }
      // Bind only when the source text contains " this." or " this["
      // followed by a lowercase letter or underscore.
      if (/ this[.[][a-z_]/.test(`${utils[prop]}`)) {
          // Capture the help text before binding
          // (utils.help is defined elsewhere; presumably it derives the text from the function).
          const doc = utils.help(utils[prop], false);
          // Bind this permanently; __func__ gives access to the unbound original.
          const fn = utils[prop];
          utils[prop] = utils[prop].bind(utils);
          utils[prop].__func__ = fn;
          // Re-attach the help text to the bound function.
          utils[prop].__doc__ = doc;
      }
      // Replace __doc__ with an accessor: reading joins all stored texts
      // with newlines, assigning appends a text instead of overwriting.
      const doc_box = [
          utils.help(utils[prop], false)
      ];
      Object.defineProperty(utils[prop], "__doc__", {
          configurable: true,
          enumerable: true,
          get() { return doc_box.join("\n"); },
          set(new_doc) { doc_box.push(new_doc); },
      });
      // Wrap members that need an external library, chosen by name.
      let obj, url;
      const name = prop.toLowerCase();
      if (name.includes("_to_zip")) {
          obj = "JSZip";
          url = "https://cdn.staticfile.org/jszip/3.7.1/jszip.min.js";
      } else if (name.includes("_to_pdf")) {
          obj = "jspdf";
          url = "https://cdn.staticfile.org/jspdf/2.5.1/jspdf.umd.min.js";
      } else {
          continue;
      }
      utils[prop] = ensure_script_existed(obj, url, utils[prop]);
  }
  /**
   * ---------------------------------------------------------------------
   * Attach more detailed help texts to selected utils functions.
   * Each assignment goes through the __doc__ setter installed by the loop
   * above, which appends the text rather than replacing earlier ones.
   * ---------------------------------------------------------------------
   */
  utils.b64_to_bytes.__doc__ = `
/**
* b64编码字符串转Uint8Array
* @param {string} sBase64 b64编码的字符串
* @param {number} nBlockSize 字节数
* @returns {Uint8Array} arr
*/
`;
  utils.blobs_to_zip.__doc__ = `
/**
* 合并blobs到压缩包,然后下载
* @param {Iterable<Blob>} blobs
* @param {string} base_name 文件名通用部分,如 image-1.jpg 中的 image
* @param {string} ext 扩展名,如 jpg
* @param {string} zip_name 压缩包名称
*/
`;
  utils.imgs_to_pdf.__doc__ = `
/**
* 合并图像并导出PDF
* @param {Iterable<HTMLCanvasElement | Uint8Array | HTMLImageElement>} imgs 图像元素列表
* @param {string} title 文档标题
* @param {number} width (可选)页面宽度 默认 0
* @param {number} height (可选)页面高度 默认 0
* @param {boolean} blob (可选)是否返回 blob 默认 false
*/
`;
  utils.img_urls_to_pdf.__doc__ = `
/**
* 下载可以简单直接请求的图片,合并到 PDF 并导出
* @param {Iterable<string>} urls 图片链接列表
* @param {string} title 文档名称
* @param {number} min_num 如果成功获取的图片数量 < min_num, 则等待 2 秒后重试; 默认 0 不重试
* @param {boolean} clear 是否在请求完成后清理控制台输出,默认false
*/
`;
  utils.img_blobs_to_pdf.__doc__ = `
/**
* 图片blobs合并并导出为单个PDF
* @param {Array<Blob>} blobs
* @param {string} title (可选)文档名称, 不含后缀, 默认为"文档"
* @param {boolean} filter (可选)是否过滤 type 不以 "image/" 开头的 blob; 默认为 true
* @param {boolean} blob (可选)是否返回 blob
*/
`;
  /**
   * ---------------------------------------------------------------------
   * Copy the members of utils onto wk$ so they can be called from outside
   * the script (e.g. from the console) as wk$.<name>.
   * ---------------------------------------------------------------------
   */
  base.superAssign(wk$, utils);
  console.info("wk: `wk$` 已经挂载到全局");
  /**
   * Expand a doc88 document.
   * When the "continue reading" button exists, jump to the last page and
   * then back to page 1 one second later. Otherwise toggle the
   * visibility of buttons 1 to 5.
   */
  async function readAllDoc88() {
      const continue_btn = wk$("#continueButton")[0];

      // No "continue reading" button: the document is already expanded.
      if (!continue_btn) {
          for (const index of utils.range(1, 6)) {
              utils.toggle_btn(index);
          }
          return;
      }

      const page_input = wk$("#pageNumInput")[0];
      // The parent's text with " / " removed is used as the last page number.
      const last_page = page_input.parentElement.textContent.replace(" / ", "");
      utils.to_page(page_input, last_page, "keypress");
      await utils.sleep(1000);
      utils.to_page(page_input, "1", "keypress");
  }
  /**
   * Push the text-selection popup ("#left-menu") behind the page by
   * setting its z-index to -1 once utils.until_visible has finished
   * waiting for it.
   */
  async function hideSelectPopup() {
      const matches = await wk$$("#left-menu");
      const menu = await utils.until_visible(matches[0]);
      return menu.style.zIndex = -1;
  }
  /**
   * Initialisation for the doc88 copy feature.
   * 1. Record, in doc88JS._apis, every own property of the copy-API
   *    object whose name starts with "_" and whose value is currently "".
   * 2. Hide the text-selection popup.
   * Steps 3 (hide the search box) and 4 (remove the VIP copy popup) are
   * currently disabled.
   */
  async function initService() {
      console.log("正在执行初始化任务");

      const prop = getCopyAPIValue();
      const is_candidate = name => name.startsWith("_") && prop[name] === "";
      globalThis.doc88JS._apis = Object
          .getOwnPropertyNames(prop)
          .filter(is_candidate);

      await hideSelectPopup();
  }
  /**
   * Follow the property path stored in doc88JS.copy_api, starting from
   * globalThis, and return whatever it ends on.
   * @returns the value at the end of the path (globalThis for an empty path)
   */
  function getCopyAPIValue() {
      const path = globalThis.doc88JS.copy_api;
      return path.reduce((node, key) => node[key], globalThis);
  }
  /**
   * Return the currently selected text.
   * On the first call the copy-API path still has 3 segments, so the
   * final segment is discovered first: among the candidate names in
   * doc88JS._apis, the first whose value has become a non-empty string
   * that does not start with a digit is appended to doc88JS.copy_api.
   * @returns {string} the value at the end of the copy-API path
   */
  function getSelectedText() {
      if (globalThis.doc88JS.copy_api.length === 3) {
          // Still the containing object at this point, not the text itself.
          const prop = getCopyAPIValue();
          for (const name of globalThis.doc88JS._apis) {
              const value = prop[name];
              // Values such as '1-179-195' start with a digit and are
              // not the selection. Only the start is checked, so selected
              // text that merely contains digits is still recognised.
              if (typeof value === 'string'
                  && value.length > 0
                  && !/^\d/.test(value)
              ) {
                  globalThis.doc88JS.copy_api.push(name);
                  break;
              }
          }
      }
      return getCopyAPIValue();
  }
  /**
   * Copy the selected text to the clipboard and console.
   * The selection popup ("#left-menu") having computed display "none" is
   * taken to mean that nothing is selected.
   * @returns {boolean} true when a copy was attempted, false otherwise
   */
  function copySelected() {
      const menu = wk$("#left-menu")[0];
      const nothing_selected = getComputedStyle(menu).display === "none";
      if (nothing_selected) {
          console.log("尚未选中文字");
          return false;
      }
      utils.copy_text(getSelectedText());
      return true;
  }
  /**
   * Keyboard handler that turns Ctrl+C into a copy of the selected text.
   * A press within 500 ms of the previous one is ignored, but it still
   * refreshes the timestamp. An accepted press stops the event from
   * propagating further.
   * @param {KeyboardEvent} e
   * @returns
   */
  function onCtrlC(e) {
      const is_copy_combo = e.code === "KeyC" && e.ctrlKey === true;
      if (!is_copy_combo) {
          return;
      }

      const now = Date.now();
      const too_soon = now - doc88JS.last_copy_time < 500 * 1;
      // The timestamp is refreshed on every Ctrl+C, accepted or not.
      doc88JS.last_copy_time = now;
      if (too_soon) {
          return;
      }

      copySelected();
      e.stopImmediatePropagation();
      e.stopPropagation();
  }
  /**
   * Visit every page so that all of them get rendered.
   * The page container and the buttons are hidden while this runs, and
   * progress is written into the end-of-document hint. If a page element
   * cannot be found, the blocking window is closed, the function restarts
   * itself and the current run stops without restoring the display.
   */
  async function walkThrough$2() {
      // Document container, hidden while walking
      let container = wk$("#pageContainer")[0];
      container.style.display = "none";
      // Page-number input
      let page_num = wk$("#pageNumInput")[0];
      // End-of-document hint, reused as the progress line
      let tail = wk$("#readEndDiv > p")[0];
      let origin = tail.textContent;
      // Hide the buttons
      wk$('.btns_section > [class*="btn-"]').forEach(
          elem => elem.style.display = "none"
      );
      // Render page by page; Config.p_pagecount is a page-provided global
      let total = parseInt(Config.p_pagecount);
      try {
          for (let i = 1; i <= total; i++) {
              // Go to page i (GotoPage is a page-provided global)
              GotoPage(i);
              await utils.wait_until(async() => {
                  let page = wk$(`#page_${i}`)[0];
                  // A missing page element is taken to mean a popup window is open
                  if (!page) {
                      // Close the window, wait, then start over
                      wk$("#ym-window .DOC88Window_close")[0].click();
                      await utils.sleep(500);
                      // NOTE(review): the restarted run is not awaited
                      walkThrough$2();
                      // Thrown as an exit signal; caught by the outer try below
                      throw new Error("walkThrough 递归完成,终止函数");
                  }
                  // A canvas that has not been drawn yet has width 300
                  return page.width !== 300;
              });
              // Highlight the page number
              utils.emphasize_text(page_num);
              tail.textContent = `请勿反复点击按钮,耐心等待页面渲染:${i}/${total}`;
          }
      } catch(e) {
          // Exit signal (or any other error): log it and stop this run
          console.log(e);
          return;
      }
      // Restore the original display
      container.style.display = "";
      page_num.style = "";
      tail.textContent = origin;
      // Show the buttons again, except button 1
      wk$('.btns_section > [class*="btn-"]').forEach(
          elem => elem.style.display = "block"
      );
      wk$(".btns_section > .btn-1")[0].style.display = "none";
  }
  2203. /**
  2204. * 道客巴巴文档下载策略
  2205. */
  2206. async function doc88() {
  2207. // 全局对象
  2208. globalThis.doc88JS = {
  2209. last_copy_time: 0, // 上一次 ctrl + c 的时间戳(毫秒)
  2210. copy_api: ["Core", "Annotation", "api"]
  2211. };
  2212. // 创建脚本启动按钮1、2
  2213. utils.create_btns();
  2214. // 绑定主函数
  2215. let prepare = function() {
  2216. // 获取canvas元素列表
  2217. let node_list = wk$(".inner_page");
  2218. // 获取文档标题
  2219. let title;
  2220. if (wk$(".doctopic h1")[0]) {
  2221. title = wk$(".doctopic h1")[0].title;
  2222. } else {
  2223. title = "文档";
  2224. }
  2225. return [node_list, title];
  2226. };
  2227. // btn_1: 展开文档
  2228. utils.onclick(readAllDoc88, 1);
  2229. // // btn_2: 加载全部页面
  2230. utils.onclick(walkThrough$2, 2, "加载所有页面");
  2231. // btn_3: 导出PDF
  2232. function imgsToPDF() {
  2233. if (confirm("确定每页内容都加载完成了吗?")) {
  2234. utils.run_with_prog(
  2235. 3, () => utils.imgs_to_pdf(...prepare())
  2236. );
  2237. }
  2238. } utils.onclick(imgsToPDF, 3, "导出图片到PDF");
  2239. // btn_4: 导出ZIP
  2240. utils.onclick(() => {
  2241. if (confirm("确定每页内容都加载完成了吗?")) {
  2242. utils.canvases_to_zip(...prepare());
  2243. }
  2244. }, 4, "导出图片到ZIP");
  2245. // btn_5: 复制选中文字
  2246. utils.onclick(btn => {
  2247. if (!copySelected()) {
  2248. btn.textContent = "未选中文字";
  2249. } else {
  2250. btn.textContent = "复制成功!";
  2251. }
  2252. }, 5, "复制选中文字");
  2253. // 为 ctrl + c 添加响应
  2254. window.addEventListener("keydown", onCtrlC, true);
  2255. // 执行一次初始化任务
  2256. window.addEventListener(
  2257. "mousedown", initService, { once: true, capture: true }
  2258. );
  2259. }
  2260. function get_title$1() {
  2261. return document.title.slice(0,-6);
  2262. }
  2263. function save_canvases(type) {
  2264. return () => {
  2265. if (!wk$(".hkswf-content2 canvas").length) {
  2266. alert("当前页面不适用此按钮");
  2267. return;
  2268. }
  2269. if (confirm("页面加载完毕了吗?")) {
  2270. const title = get_title$1();
  2271. const canvases = wk$(".hkswf-content2 canvas");
  2272. let data_to;
  2273. switch (type) {
  2274. case "pdf":
  2275. data_to = utils.imgs_to_pdf;
  2276. break;
  2277. case "zip":
  2278. data_to = utils.canvases_to_zip;
  2279. break;
  2280. default:
  2281. data_to = () => utils.raise(`未知 type: ${type}`);
  2282. break;
  2283. }
  2284. data_to(canvases, title);
  2285. }
  2286. }
  2287. }
  2288. function get_base_url() {
  2289. // https://docimg1.docin.com/docinpic.jsp?file=2179420769&width=1000&sid=bZh4STs-f4NA88IA02INyapgA9Z5X3NN1sGo4WnpquIvk4CyflMk1Oxey1BsO1BG&pageno=2&pcimg=1
  2290. return `https://docimg1.docin.com/docinpic.jsp?` +
  2291. `file=` + location.pathname.match(/p-(\d+)[.]html/)[1] +
  2292. `&width=1000&sid=` + window.readerConfig.flash_param_hzq +
  2293. `&pcimg=1&pageno=`;
  2294. }
  2295. /**
  2296. * 返回总页码
  2297. * @returns {number}
  2298. */
  2299. function get_page_num() {
  2300. return parseInt(
  2301. wk$(".page_num")[0].textContent.slice(1)
  2302. );
  2303. }
  2304. function init_save_imgs() {
  2305. const iframe = document.createElement("iframe");
  2306. iframe.src = "https://docimg1.docin.com/?wk=true";
  2307. iframe.style.display = "none";
  2308. let sock;
  2309. /**
  2310. * @param {MessageEvent} event
  2311. */
  2312. function on_client_msg(event) {
  2313. if (event.data.author !== "wk"
  2314. || event.data.action !== "finish"
  2315. ) return;
  2316. sock.notListen(on_client_msg);
  2317. iframe.remove();
  2318. utils.toggle_btn(1);
  2319. utils.toggle_btn(3);
  2320. }
  2321. /**
  2322. * @param {string} type "pdf" | "zip"
  2323. */
  2324. return (type) => {
  2325. return async function() {
  2326. if (!wk$("[id*=img_] img").length) {
  2327. alert("当前页面不适用此按钮");
  2328. return;
  2329. }
  2330. utils.toggle_btn(1);
  2331. utils.toggle_btn(3);
  2332. document.body.append(iframe);
  2333. await utils.sleep(500);
  2334. sock = new utils.Socket(iframe.contentWindow);
  2335. await sock.connect(false);
  2336. sock.listen(on_client_msg);
  2337. sock.talk({
  2338. author: "wk",
  2339. type,
  2340. title: get_title$1(),
  2341. base_url: get_base_url(),
  2342. max: get_page_num()
  2343. });
  2344. }
  2345. }
  2346. }
  2347. const save_imgs = init_save_imgs();
  2348. async function walk_through() {
  2349. // 隐藏按钮
  2350. utils.toggle_btn(5);
  2351. // 隐藏文档页面
  2352. wk$("#contentcontainer")[0].setAttribute("style", "visibility: hidden;");
  2353. const total = get_page_num();
  2354. const input = wk$("#page_cur")[0];
  2355. for (let i = 1; i <= total; i++) {
  2356. utils.to_page(input, i, "keydown");
  2357. await utils.wait_until(
  2358. () => {
  2359. const page = wk$(`#page_${i}`)[0];
  2360. const contents = wk$.call(page, `.canvas_loaded, img`);
  2361. return contents.length > 0;
  2362. },
  2363. 5000
  2364. );
  2365. }
  2366. // 显示文档页面
  2367. wk$("#contentcontainer")[0].removeAttribute("style");
  2368. }
  2369. function main_page() {
  2370. // 创建脚本启动按钮
  2371. utils.create_btns();
  2372. utils.onclick(
  2373. save_imgs("pdf"), 1, "合并图片为PDF"
  2374. );
  2375. utils.onclick(
  2376. save_canvases("pdf"), 2, "合并画布为PDF"
  2377. );
  2378. utils.toggle_btn(2);
  2379. utils.onclick(
  2380. save_imgs("zip"), 3, "打包图片到ZIP"
  2381. );
  2382. utils.toggle_btn(3);
  2383. utils.onclick(
  2384. save_canvases("zip"), 4, "打包画布到ZIP"
  2385. );
  2386. utils.toggle_btn(4);
  2387. utils.onclick(
  2388. walk_through, 5, "自动浏览页面"
  2389. );
  2390. utils.toggle_btn(5);
  2391. }
  2392. function init_background() {
  2393. const sock = new utils.Socket(window.top);
  2394. /**
  2395. * @param {MessageEvent} event
  2396. */
  2397. async function on_server_msg(event) {
  2398. if (event.data.author !== "wk") return;
  2399. const { title, base_url, max, type } = event.data;
  2400. const urls = Array
  2401. .from(utils.range(1, max + 1))
  2402. .map(i => (base_url + i));
  2403. const imgs = await utils.img_urls_to_pdf(
  2404. urls, title, 0, false, true
  2405. );
  2406. switch (type) {
  2407. case "pdf":
  2408. await utils.img_blobs_to_pdf(imgs, title);
  2409. break;
  2410. case "zip":
  2411. const ext = imgs[0].type ? imgs[0].type.split("/")[1] : "png";
  2412. await utils.blobs_to_zip(
  2413. imgs, "page", ext, title
  2414. );
  2415. break;
  2416. default:
  2417. utils.raise(`未知 type: ${type}`);
  2418. break;
  2419. }
  2420. sock.talk({
  2421. author: "wk",
  2422. action: "finish"
  2423. });
  2424. sock.notListen(on_server_msg);
  2425. }
  2426. return async function() {
  2427. sock.listen(on_server_msg);
  2428. await sock.connect(true);
  2429. }
  2430. }
  2431. const background = init_background();
  2432. /**
  2433. * 豆丁文档下载策略
  2434. */
  2435. function docin() {
  2436. const host = location.hostname;
  2437. switch (host) {
  2438. case "jz.docin.com":
  2439. case "www.docin.com":
  2440. main_page();
  2441. break;
  2442. case "docimg1.docin.com":
  2443. background();
  2444. break;
  2445. default:
  2446. console.log(`未知域名: ${host}`);
  2447. break;
  2448. }
  2449. }
  2450. function jumpToHost() {
  2451. // https://swf.ishare.down.sina.com.cn/1DrH4Qt2cvKd.jpg?ssig=DUf5x%2BXnKU&Expires=1673867307&KID=sina,ishare&range={}-{}
  2452. let url = wk$(".data-detail img, .data-detail embed")[0].src;
  2453. if (!url) {
  2454. alert("找不到图片元素");
  2455. return;
  2456. }
  2457. let url_obj = new URL(url);
  2458. let path = url_obj.pathname.slice(1);
  2459. let query = url_obj.search.slice(1).split("&range")[0];
  2460. let title = document.title.split(" - ")[0];
  2461. let target = `${url_obj.protocol}//${url_obj.host}?path=${path}&fname=${title}&${query}`;
  2462. // https://swf.ishare.down.sina.com.cn/
  2463. globalThis.open(target, "hostage");
  2464. // 然后在跳板页面发起对图片的请求
  2465. }
  2466. /**
  2467. * 爱问文库下载跳转策略
  2468. */
  2469. function ishare() {
  2470. // 创建按钮区
  2471. utils.create_btns();
  2472. // btn_1: 识别文档类型 -> 导出PDF
  2473. utils.onclick(jumpToHost, 1, "到下载页面");
  2474. // btn_2: 不支持爱问办公
  2475. utils.onclick(() => null, 2, "不支持爱问办公");
  2476. // utils.toggleBtnStatus(4);
  2477. }
  2478. /**
  2479. * 返回包含对于数量svg元素的html元素
  2480. * @param {string} data
  2481. * @returns {HTMLDivElement} article
  2482. */
  2483. function _createDiv(data) {
  2484. let num = utils.count_sub_str(data, data.slice(0, 10));
  2485. let article = document.createElement("div");
  2486. article.id = "article";
  2487. article.innerHTML = `
  2488. <style class="wk-settings">
  2489. body {
  2490. margin: 0px;
  2491. width: 100%;
  2492. background-color: rgb(95,99,104);
  2493. }
  2494. #article {
  2495. width: 100%;
  2496. display: flex;
  2497. flex-direction: row;
  2498. justify-content: space-around;
  2499. }
  2500. #root-box {
  2501. display: flex;
  2502. flex-direction: column;
  2503. background-color: white;
  2504. padding: 0 2em;
  2505. }
  2506. .gap {
  2507. height: 50px;
  2508. width: 100%;
  2509. background-color: transparent;
  2510. }
  2511. </style>
  2512. <div id="root-box">
  2513. ${
  2514. `<object class="svg-box"></object>
  2515. <div class="gap"></div>`.repeat(num)
  2516. }
  2517. `;
  2518. // 移除最后一个多出的gap
  2519. Array.from(article.querySelectorAll(".gap")).at(-1).remove();
  2520. return article;
  2521. }
  2522. function setGap(height) {
  2523. let style = wk$(".wk-settings")[0].innerHTML;
  2524. wk$(".wk-settings")[0].innerHTML = style.replace(
  2525. /[.]gap.*?{.*?height:.+?;/s,
  2526. `.gap { height: ${parseInt(height)}px;`
  2527. );
  2528. }
  2529. function setGapGUI() {
  2530. let now = getComputedStyle(wk$(".gap")[0]).height;
  2531. let new_h = prompt(`当前间距:${now}\n请输入新间距:`);
  2532. if (new_h) {
  2533. setGap(new_h);
  2534. }
  2535. }
  2536. function getSVGtext(data) {
  2537. let div = document.createElement("div");
  2538. div.innerHTML = data;
  2539. return div.textContent;
  2540. }
  2541. function toDisplayMode1() {
  2542. let content = globalThis["ishareJS"].content_1;
  2543. if (!content) {
  2544. content = globalThis["ishareJS"].text
  2545. .replace(/\n{2,}/g, "<hr>")
  2546. .replace(/\n/g, "<br>")
  2547. .replace(/\s/g, "&nbsp;")
  2548. .replace(/([a-z])([A-Z])/g, "$1 $2"); // 英文简单分词
  2549. globalThis["ishareJS"].content_1 = content;
  2550. }
  2551. wk$("#root-box")[0].innerHTML = content;
  2552. }
  2553. function toDisplayMode2() {
  2554. let content = globalThis["ishareJS"].content_2;
  2555. if (!content) {
  2556. content = globalThis["ishareJS"].text
  2557. .replace(/\n{2,}/g, "<hr>")
  2558. .replace(/\n/g, "")
  2559. .replace(/\s/g, "&nbsp;")
  2560. .replace(/([a-z])([A-Z])/g, "$1 $2")
  2561. .split("<hr>")
  2562. .map(paragraph => `<p>${paragraph}</p>`)
  2563. .join("");
  2564. globalThis["ishareJS"].content_2 = content;
  2565. wk$(".wk-settings")[0].innerHTML += `
  2566. #root-box > p {
  2567. text-indent: 2em;
  2568. width: 40em;
  2569. word-break: break-word;
  2570. }
  2571. `;
  2572. }
  2573. wk$("#root-box")[0].innerHTML = content;
  2574. }
  2575. function changeDisplayModeWrapper() {
  2576. let flag = true;
  2577. function inner() {
  2578. if (flag) {
  2579. toDisplayMode1();
  2580. } else {
  2581. toDisplayMode2();
  2582. }
  2583. flag = !flag;
  2584. }
  2585. return inner;
  2586. }
  2587. function handleSVGtext() {
  2588. globalThis["ishareJS"].text = getSVGtext(
  2589. globalThis["ishareJS"].data
  2590. );
  2591. let change = changeDisplayModeWrapper();
  2592. utils.onclick(change, 4, "切换显示模式");
  2593. utils.toggle_btn(2);
  2594. utils.toggle_btn(3);
  2595. utils.toggle_btn(4);
  2596. change();
  2597. }
  2598. /**
  2599. * 处理svg的url
  2600. * @param {string} svg_url
  2601. */
  2602. async function handleSVGurl(svg_url) {
  2603. let resp = await fetch(svg_url);
  2604. let data = await resp.text();
  2605. globalThis["ishareJS"].data = data;
  2606. let sep = data.slice(0, 10);
  2607. let svg_texts = data
  2608. .split(sep)
  2609. .slice(1)
  2610. .map(svg_text => sep + svg_text);
  2611. console.log(`共 ${svg_texts.length} 张图片`);
  2612. let article = _createDiv(data);
  2613. let boxes = article.querySelectorAll(".svg-box");
  2614. boxes.forEach((obj, i) => {
  2615. let blob = new Blob([svg_texts[i]], {type: "image/svg+xml"});
  2616. let url = URL.createObjectURL(blob);
  2617. obj.data = url;
  2618. URL.revokeObjectURL(blob);
  2619. });
  2620. let body = wk$("body")[0];
  2621. body.innerHTML = "";
  2622. body.appendChild(article);
  2623. utils.create_btns();
  2624. utils.onclick(utils.print_page, 1, "打印页面到PDF");
  2625. utils.onclick(setGapGUI, 2, "重设页间距");
  2626. utils.onclick(handleSVGtext, 3, "显示空白点我");
  2627. utils.toggle_btn(2);
  2628. utils.toggle_btn(3);
  2629. }
  2630. /**
  2631. * 取得图片下载地址
  2632. * @param {string} fname
  2633. * @param {string} path
  2634. * @returns
  2635. */
  2636. function getImgUrl(fname, path) {
  2637. if (!fname) {
  2638. throw new Error("URL Param `fname` does not exist.");
  2639. }
  2640. return location.href
  2641. .replace(/[?].+?&ssig/, "?ssig")
  2642. .replace("?", path + "?");
  2643. }
  2644. /**
  2645. * 下载整个图片包
  2646. * @param {string} img_url
  2647. * @returns
  2648. */
  2649. async function getData(img_url) {
  2650. let resp = await fetch(img_url);
  2651. // window.data = await resp.blob();
  2652. // throw Error("stop");
  2653. let buffer = await resp.arrayBuffer();
  2654. return new Uint8Array(buffer);
  2655. }
  2656. /**
  2657. * 分切图片包为若干图片
  2658. * @param {Uint8Array} data 多张图片合集数据包
  2659. * @returns {Array<Uint8Array>} 图片列表
  2660. */
  2661. function parseData(data) {
  2662. // 判断图像类型/拿到文件头
  2663. let head = data.slice(0, 8);
  2664. return utils.split_files_by_head(data, head);
  2665. }
  2666. /**
  2667. * 图像Uint8数组列表合并然后导出PDF
  2668. * @param {string} fname
  2669. * @param {Array<Uint8Array>} img_data_list
  2670. */
  2671. async function imgDataArrsToPDF(fname, img_data_list) {
  2672. return utils.imgs_to_pdf(
  2673. img_data_list,
  2674. fname
  2675. );
  2676. }
  2677. /**
  2678. *
  2679. * @param {string} fname 文件名
  2680. * @param {Array<Uint8Array>} img_data_list 数据列表
  2681. */
  2682. async function saveAsZip(fname, img_data_list) {
  2683. await utils.blobs_to_zip(
  2684. img_data_list,
  2685. "page",
  2686. "png",
  2687. fname
  2688. );
  2689. }
  2690. /**
  2691. * 取得图片集合体并切分,如果是 SVG 则对应处理
  2692. * @returns {Array<Uint8Array>} imgs
  2693. */
  2694. async function getImgs() {
  2695. let [fname, path] = [
  2696. window.ishareJS.fname,
  2697. window.ishareJS.path
  2698. ];
  2699. let img_url = getImgUrl(fname, path);
  2700. // 处理svg
  2701. if (path.includes(".svg")) {
  2702. document.title = fname;
  2703. await handleSVGurl(img_url);
  2704. return;
  2705. }
  2706. // 处理常规图像
  2707. let data = await getData(img_url);
  2708. let img_data_list = parseData(data);
  2709. console.log(`共 ${img_data_list.length} 张图片`);
  2710. window.ishareJS.imgs = img_data_list;
  2711. // 下载完成,可以导出
  2712. utils.onclick(exportPDF$3, 2, "下载并导出PDF");
  2713. utils.toggle_btn(1);
  2714. utils.toggle_btn(2);
  2715. }
  2716. async function exportPDF$3() {
  2717. let args = [
  2718. window.ishareJS.fname,
  2719. window.ishareJS.imgs
  2720. ];
  2721. try {
  2722. await imgDataArrsToPDF(...args);
  2723. } catch(e) {
  2724. console.error(e);
  2725. // 因 jsPDF 字符串拼接溢出导致的 Error
  2726. if (`${e}`.includes("RangeError: Invalid string length")) {
  2727. // 提示失败
  2728. alert("图片合并为 PDF 时失败,请尝试下载图片压缩包");
  2729. // 备选方案:导出图片压缩包
  2730. utils.onclick(
  2731. () => saveAsZip(...args),
  2732. 3,
  2733. "导出ZIP"
  2734. );
  2735. utils.toggle_btn(3); // 显示导出ZIP按钮
  2736. utils.toggle_btn(2); // 隐藏导出PDF按钮
  2737. } else {
  2738. throw e;
  2739. }
  2740. }
  2741. }
  2742. function showHints() {
  2743. wk$("h1")[0].textContent = "wk 温馨提示";
  2744. wk$("p")[0].innerHTML = [
  2745. "下载 270 页的 PPT (70 MB) 需要约 30 秒",
  2746. "请耐心等待,无需反复点击按钮",
  2747. "如果很久没反应,请加 QQ 群反馈问题"
  2748. ].join("<br>");
  2749. wk$("hr")[0].nextSibling.textContent = "403 Page Hostaged By Wenku Doc Downloader";
  2750. }
  2751. /**
  2752. * 爱问文库下载策略
  2753. */
  2754. async function ishareData() {
  2755. // 全局对象
  2756. globalThis["ishareJS"] = {
  2757. data: "",
  2758. imgs: [],
  2759. text: "",
  2760. content_1: "",
  2761. content_2: "",
  2762. fname: utils.get_param("fname"),
  2763. path: utils.get_param("path")
  2764. };
  2765. // 显示提示
  2766. showHints();
  2767. // 创建按钮区
  2768. utils.create_btns();
  2769. // btn_1: 识别文档类型,处理SVG或下载数据
  2770. utils.onclick(getImgs, 1, "下载数据");
  2771. }
  2772. /**
  2773. * 提供提示信息
  2774. */
  2775. function showTips$1() {
  2776. const h2 = document.createElement("h2");
  2777. h2.id = "wk-tips";
  2778. document.body.append(h2);
  2779. }
  2780. /**
  2781. * 更新文字到 h2 元素
  2782. * @param {string} text
  2783. */
  2784. function update(text) {
  2785. wk$("#wk-tips")[0].textContent = text;
  2786. }
  2787. /**
  2788. * 被动连接,取出数据,请求并分割图片,导出PDF
  2789. */
  2790. function mainTask() {
  2791. const sock = new utils.Socket(opener);
  2792. sock.listen(async e => {
  2793. if (e.data.wk && e.data.action) {
  2794. update("图片下载中,请耐心等待...");
  2795. const url = e.data.img_url;
  2796. const resp = await fetch(url);
  2797. update("图片下载完成,正在解析...");
  2798. const buffer = await resp.arrayBuffer();
  2799. const whole_data = new Uint8Array(buffer);
  2800. update("图片解析完成,正在合并...");
  2801. await utils.imgs_to_pdf(
  2802. utils.split_files_by_head(whole_data),
  2803. e.data.title
  2804. );
  2805. update("图片合并完成,正在导出 PDF...");
  2806. }
  2807. });
  2808. sock.connect(true);
  2809. }
  2810. /**
  2811. * 爱问文库图片下载策略v2
  2812. * @returns
  2813. */
  2814. function ishareData2() {
  2815. showTips$1();
  2816. if (!(window.opener && window.opener.window)) {
  2817. update("wk: 抱歉,页面出错了");
  2818. return;
  2819. }
  2820. mainTask();
  2821. }
  2822. function getPageNum() {
  2823. // ' / 6 ' -> ' 6 '
  2824. return parseInt(
  2825. wk$("span.counts")[0].textContent.split("/")[1]
  2826. );
  2827. }
  2828. function jumpToHostage() {
  2829. const
  2830. // '/fileroot/2019-9/23/73598bfa-6b91-4cbe-a548-9996f46653a2/73598bfa-6b91-4cbe-a548-9996f46653a21.gif'
  2831. url = new URL(wk$("#pageflash_1 > img")[0].src),
  2832. num = getPageNum(),
  2833. // '七年级上册地理期末试卷精编.doc-得力文库'
  2834. fname = document.title.slice(0, -5),
  2835. path = url.pathname,
  2836. tail = "1.gif";
  2837. if (!path.endsWith(tail)) {
  2838. throw new Error(`url尾部不为【${tail}】!path:【${path}】`);
  2839. }
  2840. const base_path = path.slice(0, -5);
  2841. open(`${url.protocol}//${url.host}/?num=${num}&lmt=${lmt}&fname=${fname}&path=${base_path}`);
  2842. }
  2843. function deliwenku() {
  2844. utils.create_btns();
  2845. utils.onclick(jumpToHostage, 1, "到下载页面");
  2846. }
  2847. function showTips() {
  2848. const body = `
  2849. <style>
  2850. h1 { color: black; }
  2851. #main {
  2852. margin: 1vw 5%;
  2853. border-radius: 10%;
  2854. }
  2855. p { font-size: large; }
  2856. .info {
  2857. color: rgb(230,214,110);
  2858. background: rgb(39,40,34);
  2859. text-align: right;
  2860. font-size: medium;
  2861. padding: 1vw;
  2862. border-radius: 4px;
  2863. }
  2864. </style>
  2865. <div id="main">
  2866. <h1>wk: 跳板页面</h1>
  2867. <p>有时候点一次下载等半天没反应,就再试一次</p>
  2868. <p>如果试了 2 次还不行加 QQ 群反馈吧...</p>
  2869. <p>导出的 PDF 如果页面数量少于应有的,那么意味着免费页数就这么多,我也爱莫能助</p>
  2870. <p>短时间连续使用导出按钮会导致 IP 被封禁</p>
  2871. <hr>
  2872. <div class="info">
  2873. 文档名称:${deliJS.fname}<br>
  2874. 原始文档页数:${deliJS.num}<br>
  2875. 最大免费页数:${deliJS.lmt}<br>
  2876. </div>
  2877. </div>`;
  2878. document.title = utils.get_param("fname"); document.body.innerHTML = body;
  2879. }
  2880. /**
  2881. * url生成器
  2882. * @param {string} base_url
  2883. * @param {number} num
  2884. */
  2885. function* genURLs(base_url, num) {
  2886. for (let i=1; i<=num; i++) {
  2887. yield `${base_url}${i}.gif`;
  2888. }
  2889. }
  2890. function genBaseURL(path) {
  2891. return `${location.protocol}//${location.host}${path}`;
  2892. }
  2893. function parseParamsToDeliJS() {
  2894. const
  2895. base_url = genBaseURL(utils.get_param("path")),
  2896. fname = utils.get_param("fname"),
  2897. num = parseInt(utils.get_param("num"));
  2898. let lmt = parseInt(utils.get_param("lmt"));
  2899. lmt = lmt > 3 ? lmt : 20;
  2900. lmt = lmt > num ? num : lmt;
  2901. window.deliJS = {
  2902. base_url,
  2903. num,
  2904. fname,
  2905. lmt
  2906. };
  2907. }
  2908. async function exportPDF$2() {
  2909. utils.toggle_btn(1);
  2910. await utils.run_with_prog(
  2911. 1, () => utils.img_urls_to_pdf(
  2912. genURLs(deliJS.base_url, deliJS.num),
  2913. deliJS.fname,
  2914. deliJS.lmt,
  2915. true // 请求完成后清理控制台
  2916. )
  2917. );
  2918. utils.toggle_btn(1);
  2919. }
  2920. /**
  2921. * 得力文库跳板页面下载策略
  2922. */
  2923. async function deliFile() {
  2924. // 从URL解析文档参数
  2925. parseParamsToDeliJS();
  2926. // 显示提示
  2927. showTips();
  2928. // 创建按钮区
  2929. utils.create_btns();
  2930. // btn_1: 导出PDF
  2931. utils.onclick(exportPDF$2, 1, "导出PDF");
  2932. }
  2933. function readAll360Doc() {
  2934. // 展开文档
  2935. document.querySelector(".article_showall a").click();
  2936. // 隐藏按钮
  2937. utils.toggle_btn(1);
  2938. // 显示按钮
  2939. utils.toggle_btn(2);
  2940. utils.toggle_btn(3);
  2941. utils.toggle_btn(4);
  2942. }
  2943. function saveText_360Doc() {
  2944. // 捕获图片链接
  2945. let images = wk$("#artContent img");
  2946. let content = [];
  2947. for (let i = 0; i < images.length; i++) {
  2948. let src = images[i].src;
  2949. content.push(`图${i+1},链接:${src}`);
  2950. }
  2951. // 捕获文本
  2952. let text = wk$("#artContent")[0].textContent;
  2953. content.push(text);
  2954. // 保存纯文本文档
  2955. let title = wk$("#titiletext")[0].textContent;
  2956. utils.save(`${title}.txt`, content.join("\n"));
  2957. }
  2958. /**
  2959. * 使文档在页面上居中
  2960. * @param {string} selector 文档容器的css选择器
  2961. * @param {string} default_offset 文档部分向右偏移的百分比(0-59)
  2962. * @returns 偏移值是否合法
  2963. */
  2964. function centre(selector, default_offset) {
  2965. const elem = wk$(selector)[0];
  2966. const offset = prompt("请输入偏移百分位:", default_offset);
  2967. // 如果输入的数字不在 0-59 内,提醒用户重新设置
  2968. if (offset.length === 1 && offset.search(/[0-9]/) !== -1) {
  2969. elem.style.marginLeft = offset + "%";
  2970. return true;
  2971. }
  2972. if (offset.length === 2 && offset.search(/[1-5][0-9]/) !== -1) {
  2973. elem.style.marginLeft = offset + "%";
  2974. return true;
  2975. }
  2976. alert("请输入一个正整数,范围在0至59之间,用来使文档居中");
  2977. return false;
  2978. }
  2979. function printPage360Doc() {
  2980. if (!confirm("确定每页内容都加载完成了吗?")) {
  2981. return;
  2982. }
  2983. // # 清理并打印360doc的文档页
  2984. // ## 移除页面上无关的元素
  2985. let selector = ".fontsize_bgcolor_controler, .atfixednav, .header, .a_right, .article_data, .prev_next, .str_border, .youlike, .new_plbox, .str_border, .ul-similar, #goTop2, #divtort, #divresaveunder, .bottom_controler, .floatqrcode";
  2986. let elem_list = wk$(selector);
  2987. let under_doc_1, under_doc_2;
  2988. try {
  2989. under_doc_1 = wk$("#bgchange p.clearboth")[0].nextElementSibling;
  2990. under_doc_2 = wk$("#bgchange")[0].nextElementSibling.nextElementSibling;
  2991. } catch (e) {}
  2992. // 执行移除
  2993. for (let elem of elem_list) {
  2994. utils.remove(elem);
  2995. }
  2996. utils.remove(under_doc_1);
  2997. utils.remove(under_doc_2);
  2998. // 执行隐藏
  2999. wk$("a[title]")[0].style.display = "none";
  3000. // 使文档居中
  3001. alert("建议使用:\n偏移量: 20\n缩放: 默认\n");
  3002. if (!centre(".a_left", "20")) {
  3003. return; // 如果输入非法,终止函数调用
  3004. }
  3005. // 隐藏按钮,然后打印页面
  3006. utils.print_page();
  3007. }
  3008. /**
  3009. * 阻止监听器生效
  3010. * @param {Event} e
  3011. */
  3012. function stopSpread(e) {
  3013. e.stopImmediatePropagation();
  3014. e.stopPropagation();
  3015. }
  3016. /**
  3017. * 阻止捕获事件
  3018. */
  3019. function stopCapturing() {
  3020. ["click", "mouseup"].forEach(
  3021. type => {
  3022. document.body.addEventListener(type, stopSpread, true);
  3023. document["on" + type] = undefined;
  3024. }
  3025. );
  3026. ["keypress", "keydown"].forEach(
  3027. type => {
  3028. window.addEventListener(type, stopSpread, true);
  3029. window["on" + type] = undefined;
  3030. }
  3031. );
  3032. }
  3033. /**
  3034. * 重置图像链接和最大宽度
  3035. * @param {Document} doc
  3036. */
  3037. function resetImg(doc=document) {
  3038. wk$.call(doc, "img").forEach(
  3039. elem => {
  3040. elem.style.maxWidth = "100%";
  3041. for (let attr of elem.attributes) {
  3042. if (attr.name.endsWith("-src")) {
  3043. elem.setAttribute("src", attr.value);
  3044. break;
  3045. }
  3046. }
  3047. }
  3048. );
  3049. }
  3050. /**
  3051. * 仅保留全屏文档
  3052. */
  3053. function getFullScreen() {
  3054. FullScreenObj.init();
  3055. wk$("#artContent > p:nth-child(3)")[0]?.remove();
  3056. let data = wk$("#artfullscreen__box_scr > table")[0].outerHTML;
  3057. window.doc360JS = { data };
  3058. let html_str = `
  3059. <html><head></head><body style="display: flex; flex-direction: row; justify-content: space-around">
  3060. ${data}
  3061. </body><html>
  3062. `;
  3063. wk$("html")[0].replaceWith(wk$("html")[0].cloneNode());
  3064. wk$("html")[0].innerHTML = html_str;
  3065. resetImg();
  3066. }
  3067. function cleanPage() {
  3068. getFullScreen();
  3069. stopCapturing();
  3070. }
  3071. /**
  3072. * 360doc个人图书馆下载策略
  3073. */
  3074. function doc360() {
  3075. // 创建按钮区
  3076. utils.create_btns();
  3077. // btn_1: 展开文档
  3078. utils.onclick(readAll360Doc, 1);
  3079. // btn_2: 导出纯文本
  3080. utils.onclick(saveText_360Doc, 2, "导出纯文本");
  3081. // btn_3: 打印页面到PDF
  3082. utils.onclick(printPage360Doc, 3, "打印页面到PDF");
  3083. // btn_3: 清理页面
  3084. utils.onclick(cleanPage, 4, "清理页面(推荐)");
  3085. }
  3086. async function getPDF() {
  3087. if (!window.DEFAULT_URL) {
  3088. alert("当前文档无法解析,请加 QQ 群反馈");
  3089. return;
  3090. }
  3091. let title = document.title.split(" - ")[0] + ".pdf";
  3092. let blob = await utils.xhr_get_blob(DEFAULT_URL);
  3093. utils.save(title, blob);
  3094. }
  3095. function mbalib() {
  3096. utils.create_btns();
  3097. utils.onclick(getPDF, 1, "下载PDF");
  3098. }
  3099. /**
  3100. * 判断是否进入预览模式
  3101. * @returns Boolean
  3102. */
  3103. function isInPreview() {
  3104. let p_elem = wk$("#preview_tips")[0];
  3105. if (p_elem && p_elem.style && p_elem.style.display === "none") {
  3106. return true;
  3107. }
  3108. return false;
  3109. }
  3110. /**
  3111. * 确保进入预览模式
  3112. */
  3113. async function ensureInPreview() {
  3114. while (!isInPreview()) {
  3115. // 如果没有进入预览,则先进入
  3116. if (typeof window.preview !== "function") {
  3117. alert("脚本失效,请加 QQ 群反馈");
  3118. throw new Error("preview 全局函数不存在");
  3119. }
  3120. await utils.sleep(500);
  3121. preview();
  3122. }
  3123. }
  3124. /**
  3125. * 前往页码
  3126. * @param {number} page_num
  3127. */
  3128. function toPage(page_num) {
  3129. // 先尝试官方接口,不行再用模拟的
  3130. try {
  3131. Viewer._GotoPage(page_num);
  3132. } catch(e) {
  3133. console.error(e);
  3134. utils.to_page(
  3135. wk$("#pageNumInput")[0],
  3136. page_num,
  3137. "keydown"
  3138. );
  3139. }
  3140. }
  3141. /**
  3142. * 展开全文预览,当展开完成后再次调用时,返回true
  3143. * @returns
  3144. */
  3145. async function walkThrough$1() {
  3146. // 隐藏页面
  3147. wk$("#pageContainer")[0].style.display = "none";
  3148. // 逐页加载
  3149. let lmt = window.dugenJS.lmt;
  3150. for (let i of utils.range(1, lmt + 1)) {
  3151. toPage(i);
  3152. await utils.wait_until(
  3153. () => wk$(`#outer_page_${i}`)[0].style.width.endsWith("px")
  3154. );
  3155. }
  3156. // 恢复显示
  3157. wk$("#pageContainer")[0].style.display = "";
  3158. console.log(`共 ${lmt} 页加载完毕`);
  3159. }
  3160. /**
  3161. * 返回当前未加载页面的页码
  3162. * @returns not_loaded
  3163. */
  3164. function getNotloadedPages() {
  3165. // 已经取得的页码
  3166. let pages = document.querySelectorAll("[id*=pageflash_]");
  3167. let loaded = new Set();
  3168. pages.forEach((page) => {
  3169. let id = page.id.split("_")[1];
  3170. id = parseInt(id);
  3171. loaded.add(id);
  3172. });
  3173. // 未取得的页码
  3174. let not_loaded = [];
  3175. for (let i of utils.range(1, window.dugenJS.lmt + 1)) {
  3176. if (!loaded.has(i)) {
  3177. not_loaded.push(i);
  3178. }
  3179. }
  3180. return not_loaded;
  3181. }
  3182. /**
  3183. * 取得全部文档页面的链接,返回urls;如果有页面未加载,则返回null
  3184. * @returns
  3185. */
  3186. function getImgUrls() {
  3187. let pages = wk$("[id*=pageflash_]");
  3188. // 尚未浏览完全部页面,返回false
  3189. if (pages.length < window.dugenJS.lmt) {
  3190. let hints = [
  3191. "尚未加载完全部页面",
  3192. "以下页面需要浏览并加载:",
  3193. getNotloadedPages().join(",")
  3194. ];
  3195. alert(hints.join("\n"));
  3196. return [false, []];
  3197. }
  3198. // 浏览完全部页面,返回urls
  3199. return [true, pages.map(page => page.querySelector("img").src)];
  3200. }
  3201. function exportImgUrls() {
  3202. let [ok, urls] = getImgUrls();
  3203. if (!ok) {
  3204. return;
  3205. }
  3206. utils.save("urls.csv", urls.join("\n"));
  3207. }
  3208. function exportPDF$1() {
  3209. let [ok, urls] = getImgUrls();
  3210. if (!ok) {
  3211. return;
  3212. }
  3213. let title = document.title.split("-")[0];
  3214. return utils.run_with_prog(
  3215. 3, () => utils.img_urls_to_pdf(urls, title)
  3216. );
  3217. }
  3218. /**
  3219. * dugen文档下载策略
  3220. */
  3221. async function dugen() {
  3222. await ensureInPreview();
  3223. // 全局对象
  3224. window.dugenJS = {
  3225. lmt: window.lmt ? window.lmt : 20
  3226. };
  3227. // 创建按钮区
  3228. utils.create_btns();
  3229. // 绑定监听器
  3230. // 按钮1:展开文档
  3231. utils.onclick(walkThrough$1, 1, "加载可预览页面");
  3232. // 按钮2:导出图片链接
  3233. utils.onclick(exportImgUrls, 2, "导出图片链接");
  3234. utils.toggle_btn(2);
  3235. // 按钮3:导出PDF
  3236. utils.onclick(exportPDF$1, 3, "导出PDF");
  3237. utils.toggle_btn(3);
  3238. }
// Domain-level global constant
const img_tasks = [];
  3241. /**
  3242. * 取得文档类型
  3243. * @returns {String} 文档类型str
  3244. */
  3245. function getDocType() {
  3246. const
  3247. // ["icon", "icon-format", "icon-format-doc"]
  3248. elem = wk$(".title .icon.icon-format")[0],
  3249. // "icon-format-doc"
  3250. cls = elem.classList[2];
  3251. return cls.split("-")[2];
  3252. }
  3253. /**
  3254. * 判断文档类型是否为type_list其中之一
  3255. * @returns 是否为type
  3256. */
  3257. function isTypeof(type_list) {
  3258. const type = getDocType();
  3259. if (type_list.includes(type)) {
  3260. return true;
  3261. }
  3262. return false;
  3263. }
  3264. /**
  3265. * 判断文档类型是否为PPT
  3266. * @returns 是否为PPT
  3267. */
  3268. function is_ppt() {
  3269. return isTypeof(["ppt", "pptx"]);
  3270. }
  3271. /**
  3272. * 判断文档类型是否为Excel
  3273. * @returns 是否为Excel
  3274. */
  3275. function is_excel() {
  3276. return isTypeof(["xls", "xlsm", "xlsx"]);
  3277. }
  /**
   * List the page numbers whose image has not been loaded yet.
   *
   * A page counts as loaded when a `[data-id]` container holds an `<img>`
   * with a `src` attribute; everything else in 1..page_counts is reported.
   * @returns {Array} page numbers that are not loaded
   */
  function getNotLoaded() {
      const loaded = [];
      for (const img of wk$("[data-id] img[src]")) {
          const holder = img.closest("[data-id]");
          loaded.push(parseInt(holder.getAttribute("data-id")));
      }
      const all_pages = utils.range(1, window.book118JS.page_counts + 1);
      const missing = utils.diff(all_pages, loaded);
      return Array.from(missing);
  }
  /**
   * Collect the image urls of every loaded document page.
   * @returns {Array} `[all_loaded, urls, not_loaded_page_numbers]`; the third
   *   item is empty when the url count equals `book118JS.page_counts`
   */
  function getUrls() {
      const urls = wk$("[data-id] img[src]").map(({ src }) => src);
      const all_loaded = urls.length === book118JS.page_counts;
      return all_loaded
          ? [true, urls, []]
          : [false, urls, getNotLoaded()];
  }
  /**
   * Expand the whole document by jumping to every previewable page in turn.
   *
   * The button box is hidden while pages are being visited and is always
   * shown again afterwards, even when loading a page fails.
   * @returns {Promise<void>}
   */
  async function walkThrough() {
      // Hide the button area during the walk
      utils.toggle_box();
      try {
          // preview.getPage() looks like
          // {current: 10, actual: 38, preview: 38, remain: 14}
          const { preview: all } = preview.getPage();
          for (let i = 1; i <= all; i++) {
              preview.jump(i);
              // `?.` keeps the predicate falsy (instead of throwing)
              // while the <img> node has not been inserted yet
              await utils.wait_until(
                  () => wk$(`[data-id="${i}"] img`)[0]?.src, 1000
              );
          }
          console.log("遍历完成");
      } finally {
          // Restore the button area no matter how the walk ended
          utils.toggle_box();
      }
  }
  /**
   * Button 2: export the image links as "urls.csv".
   *
   * When some pages are not loaded yet the user is shown their page numbers
   * and asked whether to export anyway; declining aborts the export.
   */
  function wantUrls() {
      const [all_loaded, urls, missing] = getUrls();
      if (!all_loaded) {
          const hint =
              "仍有页面没有加载" + "\n" +
              "请浏览并加载如下页面" + "\n" +
              "是否继续导出图片链接?" + "\n" +
              `[${missing.join(",")}]`;
          const go_on = confirm(hint);
          if (!go_on) {
              return;
          }
      }
      utils.save("urls.csv", urls.join("\n"));
  }
  /**
   * Open the preview page of a PPT/Excel document in a new window.
   *
   * Clicks the first ".front a" link, waits for the preview iframe and opens
   * the iframe's url.
   * @returns {Promise<void>}
   */
  async function open_iframe() {
      const [entry] = wk$(".front a");
      entry.click();
      const [frame] = await wk$$("iframe.preview-iframe");
      window.open(frame.src);
  }
  /**
   * Read the largest previewable page number from the page's `preview` object.
   * @returns {number} `window.preview.getPage().preview`, or NaN when that
   *   value is unavailable or falsy
   */
  function getPageCounts$1() {
      const page_info = window?.preview?.getPage();
      return page_info?.preview || NaN;
  }
  /**
   * book118 strategy for ordinary documents (neither PPT nor Excel).
   *
   * Waits until the ".counts" element exists, publishes `window.book118JS`
   * and binds the "load all" and "export image links" buttons.
   * @returns {Promise<void>}
   */
  async function common_doc() {
      const counts_ready = () => Boolean(wk$(".counts")[0]);
      await utils.wait_until(counts_ready);

      // Page-level shared object read by the other book118 helpers
      const doc_type = getDocType();
      const page_counts = getPageCounts$1();
      window.book118JS = { doc_type, page_counts };

      utils.create_btns();
      // Button 1: load the full document
      utils.onclick(walkThrough, 1, "加载全文");
      // Button 2: export the image links
      utils.onclick(wantUrls, 2, "导出图片链接");
      utils.toggle_btn(2);
  }
  /**
   * Serialize every `<table>` on the page as tab-separated text.
   *
   * Tables with exactly one row or more than 1000 rows are skipped (the
   * original author treats them as empty / row-number tables). Skipped
   * tables are dropped entirely so they no longer leave dangling
   * "---" separators in the output.
   *
   * Cells containing an `<img>` are written as the image url; other cells
   * are written as trimmed text with newlines and tabs replaced by spaces.
   * @returns {string} the tables joined by a "\n\n---\n\n" separator
   */
  function table_to_tsv() {
      const is_exportable = (table) => {
          const len = table.rows.length;
          return !(len > 1000 || len === 1);
      };

      const cell_to_text = (cell) => {
          // A cell that stores a picture is represented by the picture's link
          const img = cell.querySelector("img");
          if (img) {
              return img.src;
          }
          return cell
              .textContent
              .trim()
              .replace(/\n/g, " ")
              .replace(/\t/g, " ");
      };

      const row_to_line = (row) => [...row.cells].map(cell_to_text).join("\t");

      return wk$("table")
          .filter(is_exportable)
          .map((table) => [...table.rows].map(row_to_line).join("\n").trim())
          .join("\n\n---\n\n");
  }
  /**
   * Download the tables of the current page as "原创力表格.tsv".
   *
   * The TSV text comes from table_to_tsv() and is passed through
   * utils.encode_to_gbk() before being saved.
   */
  function wantEXCEL() {
      const encoded = utils.encode_to_gbk(table_to_tsv());
      utils.save("原创力表格.tsv", encoded);
  }
  /**
   * Show usage hints for the Excel preview page in an alert box.
   */
  function help$1() {
      const lines = [];
      lines.push("【导出表格到TSV】只能导出当前 sheet");
      lines.push("如果有多张 sheet 请在每个 sheet 上用按钮分别导出 TSV");
      lines.push("TSV 文件请用记事本或 Excel 打开");
      lines.push("TSV 不能存储图片,所以用图片链接代替");
      lines.push("或使用此脚本复制表格到剪贴板:");
      lines.push("https://gf.qytechs.cn/zh-CN/scripts/469550");
      alert(lines.join("\n"));
  }
  /**
   * book118 strategy for Excel documents: an export button plus a help button.
   */
  function excel() {
      utils.create_btns();
      const bindings = [
          [wantEXCEL, 1, "导出表格到TSV"],
          [help$1, 2, "使用说明"],
      ];
      bindings.forEach(([handler, index, label]) => {
          utils.onclick(handler, index, label);
      });
      // Toggle the second button after both handlers are bound
      utils.toggle_btn(2);
  }
  3453. /**
  3454. * ------------------------------ PPT 策略 ---------------------------------
  3455. */
  /**
   * Read the current page number from the "#PageIndex" element.
   * @returns {number} the element's text parsed as an integer
   */
  function cur_page_num() {
      const [indicator] = wk$("#PageIndex");
      return parseInt(indicator.textContent);
  }
  /**
   * Queue a screenshot of the slide that is currently displayed.
   *
   * Clears the inline style of "#view", starts html2canvas on the
   * `#view<N-1>` element of the current page N and shows the number of
   * queued screenshots on button 1.
   */
  function add_page() {
      wk$("#view")[0].setAttribute("style", "");

      const index = cur_page_num() - 1;
      const slide = wk$(`#view${index}`)[0];
      const task = html2canvas(slide);
      img_tasks.push(task);

      const count = img_tasks.length;
      utils.btn(1).textContent = `截图: ${count}`;
  }
  /**
   * Drop every queued screenshot and reset the counter shown on button 1.
   */
  function reset_tasks() {
      // Empty the shared array in place so other references stay valid
      img_tasks.length = 0;
      utils.btn(1).textContent = "截图: 0";
  }
  /**
   * Single-argument wrapper around utils.canvas_to_blob, so it can be used
   * as an Array#map callback without forwarding the index and array.
   * @param {HTMLCanvasElement} canvas
   * @returns whatever utils.canvas_to_blob returns for the canvas
   */
  function canvas_to_blob(canvas) {
      const result = utils.canvas_to_blob(canvas);
      return result;
  }
  /**
   * Merge all queued screenshots into a PDF named "原创力幻灯片".
   *
   * Button 3 is toggled before and after the work. Errors are logged to the
   * console and not rethrown. When nothing was captured the user is told so.
   * @returns {Promise<void>}
   */
  async function export_imgs_as_pdf() {
      alert("正在合并截图,请耐心等待");
      utils.toggle_btn(3);
      try {
          const canvases = await utils.gather(img_tasks);
          const blobs = await utils.gather(canvases.map(canvas_to_blob));
          if (blobs.length) {
              await utils.img_blobs_to_pdf(blobs, "原创力幻灯片");
          } else {
              alert("你尚未截取任何页面!");
          }
      } catch (err) {
          console.error(err);
      }
      utils.toggle_btn(3);
  }
  /**
   * book118 strategy for the PPT preview page: screenshot, reset and merge buttons.
   */
  function ppt() {
      utils.create_btns();

      // Button 1 is wired by hand rather than through utils.onclick
      const capture_btn = utils.btn(1);
      capture_btn.onclick = add_page;
      capture_btn.textContent = "截图当前页面";

      utils.onclick(reset_tasks, 2, "清空截图");
      utils.onclick(export_imgs_as_pdf, 3, "合并为PDF");
      for (const index of [2, 3]) {
          utils.toggle_btn(index);
      }
  }
  /**
   * Entry point of the book118 download strategy.
   *
   * On max.book118.com it offers a link to the Excel/PPT preview, or runs
   * common_doc() for other types. On other hosts it detects the PPT preview
   * (top-level window only) or the Excel preview, and logs unknown hosts.
   */
  function book118() {
      const host = window.location.hostname;

      if (host === 'max.book118.com') {
          let label = null;
          if (is_excel()) {
              label = "访问EXCEL";
          } else if (is_ppt()) {
              label = "访问PPT";
          }
          if (label === null) {
              common_doc();
              return;
          }
          utils.create_btns();
          utils.onclick(open_iframe, 1, label);
          return;
      }

      if (wk$("#ppt")[0]) {
          // Only run in the top-level window, not inside a frame
          if (window.top === window) {
              ppt();
          }
          return;
      }

      if (wk$(`[src*="excel.min.js"]`)[0]) {
          excel();
          return;
      }

      console.log(`wk: Unknown host: ${host}`);
  }
  3534. // test url: https://openstd.samr.gov.cn/bzgk/gb/newGbInfo?hcno=E86BBCE32DA8E67F3DA04ED98F2465DB
  /**
   * Create a minimal blank bitmap, used as the page when a request fails.
   *
   * The canvas is 1x1 rather than 0x0: createImageBitmap() rejects with an
   * InvalidStateError for a source whose width or height is zero, which
   * would turn the fallback itself into a failure.
   * @returns {Promise<ImageBitmap>} blank_page
   */
  async function blankBMP() {
      const canvas = document.createElement("canvas");
      canvas.width = 1;
      canvas.height = 1;
      return createImageBitmap(canvas);
  }
  /**
   * Turn a pending page response (or an already decoded bitmap) into a bitmap.
   *
   * `gb688JS.pages_status` marks a url as busy (1) while one caller decodes
   * it; other callers poll until it is released (0) and then read the result
   * from `gb688JS.pages`. The busy flag is released in a `finally` block so
   * that a failed download or decode can no longer leave later callers
   * polling forever. A failed request stores and returns a blank page.
   * @param {string} page_url
   * @param {Promise<Response> | ImageBitmap} pms_or_bmp
   * @returns {Promise<ImageBitmap>} page
   */
  async function respToPage(page_url, pms_or_bmp) {
      const center = globalThis.gb688JS;

      // Already decoded
      if (pms_or_bmp instanceof ImageBitmap) {
          return pms_or_bmp;
      }

      // Nobody is handling this url yet: take ownership
      if (!center.pages_status.get(page_url)) {
          center.pages_status.set(page_url, 1);
          try {
              let resp;
              try {
                  resp = await pms_or_bmp;
              } catch (err) {
                  console.log("下载页面失败");
                  console.error(err);
                  // Cache the fallback so waiting callers receive a bitmap too
                  const blank = await blankBMP();
                  center.pages.set(page_url, blank);
                  return blank;
              }
              const page_blob = await resp.blob();
              const page = await createImageBitmap(page_blob);
              center.pages.set(page_url, page);
              return page;
          } finally {
              // Always release, whether decoding succeeded or not
              center.pages_status.set(page_url, 0);
          }
      }

      // Someone else is handling this url: wait for the release
      while (center.pages_status.get(page_url)) {
          await utils.sleep(500);
      }
      return center.pages.get(page_url);
  }
  /**
   * Get the page image behind `page_url`, reusing the cache when possible.
   *
   * `gb688JS.pages` holds either the pending fetch promise or the decoded
   * bitmap per url; both are handed to respToPage().
   * @param {string} page_url
   * @returns {Promise<ImageBitmap>} bmp
   */
  async function getPage(page_url) {
      const { pages } = globalThis.gb688JS;

      // Never requested before: start the download and remember the promise
      if (!pages.has(page_url)) {
          const headers = {
              "accept": "image/avif,image/webp,image/apng,image/svg+xml,image/*,*/*;q=0.8",
              "accept-language": "zh-CN,zh;q=0.9,en;q=0.8",
              "proxy-connection": "keep-alive"
          };
          const request = fetch(page_url, {
              "headers": headers,
              "referrer": location.href,
              "referrerPolicy": "strict-origin-when-cross-origin",
              "body": null,
              "method": "GET",
              "mode": "cors",
              "credentials": "include"
          });
          pages.set(page_url, request);
          return respToPage(page_url, request);
      }

      // Requested before: pass on whatever is cached
      return respToPage(page_url, pages.get(page_url));
  }
  /**
   * Compute where every tile of a page is cut from and pasted to.
   *
   * For each child span the paste position comes from its class name
   * ('pdfImg-3-8' -> [0.3, 0.8]) and the cut position from its
   * background-position ('-600px 0px' -> [600, 0]).
   * @param {HTMLDivElement} page_div document page element
   * @returns {Array<Array<number>>} positions `[[cut_x, cut_y, paste_x, paste_y], ...]`
   */
  function getPostions(page_div) {
      const tenth = (text) => parseInt(text) / 10;
      const magnitude = (text) => Math.abs(parseInt(text));

      return Array.from(page_div.children, (span) => {
          const paste_pos = span.className.split("-").slice(1).map((v) => tenth(v));
          const cut_pos = span.style.backgroundPosition.split(" ").map((v) => magnitude(v));
          return [...cut_pos, ...paste_pos];
      });
  }
  /**
   * Build the absolute image url of a document page.
   *
   * The relative url is the page's `bg` attribute or, when that is missing,
   * the quoted part of the first child's background-image, e.g.
   * 'url("viewGbImg?fileName=...")'. It is resolved against the directory
   * of the current location.
   * @param {HTMLDivElement} page_div
   * @returns {string} url
   */
  function getPageURL(page_div) {
      const dir = location.pathname.split("/").slice(0, -1).join("/");
      const prefix = `${location.origin}${dir}/`;

      const bg = page_div.getAttribute("bg");
      const relative = bg
          ? bg
          : page_div.children[0].style.backgroundImage.split('"')[1];
      return prefix + relative;
  }
  /**
   * Download the image of a page and redraw its tiles onto a fresh canvas.
   *
   * The canvas is 1190x1680, filled white; every position reported by
   * getPostions() copies a 120x169 tile from the source image to the
   * destination given as a fraction of the canvas size.
   * @param {number} i index of the page (starting at 0)
   * @param {HTMLDivElement} page_div
   * @returns {Promise<Array>} `[index, canvas]`
   */
  async function getAndDrawPage(i, page_div) {
      const PAGE_W = 1190;
      const PAGE_H = 1680;
      const TILE_W = 120;
      const TILE_H = 169;

      const page = await getPage(getPageURL(page_div));

      // The canvas size must be set explicitly, otherwise the default
      // (much smaller) drawing surface is used
      const bg = document.createElement("canvas");
      bg.width = PAGE_W;
      bg.height = PAGE_H;

      const ctx = bg.getContext("2d");
      ctx.fillStyle = "white";
      ctx.fillRect(0, 0, PAGE_W, PAGE_H);

      for (const [cut_x, cut_y, left, top] of getPostions(page_div)) {
          ctx.drawImage(
              page,
              cut_x, cut_y, TILE_W, TILE_H,
              left * PAGE_W, top * PAGE_H, TILE_W, TILE_H
          );
      }
      return [i, bg];
  }
  /**
   * Request, redraw and merge every page of the viewer into one PDF.
   *
   * The PDF title is the part of document.title after the "|",
   * e.g. '在线预览|GB 14023-2022'.
   * @returns whatever utils.imgs_to_pdf returns
   */
  async function turnPagesToPDF() {
      const page_divs = wk$("#viewer .page");
      const tasks = page_divs.map((page_div, index) => getAndDrawPage(index, page_div));

      // Results carry their page index; sort on it before merging
      const results = await utils.gather(tasks);
      results.sort(([a], [b]) => a - b);

      const canvases = results.map(([, canvas]) => canvas);
      const title = document.title.split("|")[1];
      return utils.imgs_to_pdf(canvases, title);
  }
  /**
   * Tell the user the estimated duration, then start the PDF export.
   *
   * The page count is read from "#numPages" (text like '/93'); the estimate
   * is one second per three pages, rounded up.
   */
  function hintThenDownload$1() {
      const counter_text = wk$("#numPages")[0].textContent;
      const page_num = parseInt(counter_text.slice(1));
      const estimate = Math.ceil(page_num / 3);
      alert(`页数: ${page_num},预计花费: ${estimate}秒;如遇网络异常可能更久\n请勿反复点击按钮;如果无法导出请 QQ 群反馈`);
      turnPagesToPDF();
  }
  /**
   * Download strategy for gb688 documents.
   *
   * Publishes `globalThis.gb688JS` with two maps keyed by page url
   * (`pages`: pending response or bitmap, `pages_status`: 0 released /
   * 1 busy) and binds the "export PDF" button.
   * @returns {Promise<void>}
   */
  async function gb688() {
      const pages = new Map();
      const pages_status = new Map();
      globalThis.gb688JS = { pages, pages_status };

      utils.create_btns();
      // Button 1: export the PDF
      utils.onclick(hintThenDownload$1, 1, "导出PDF");
  }
  /**
   * Read the page count from the ".counts" element (text like " / 39"),
   * capped at 20.
   * @returns {number} the parsed count, at most 20
   */
  function getPageCounts() {
      const [, counts_str] = wk$(".counts")[0].textContent.split("/");
      return Math.min(parseInt(counts_str), 20);
  }
  /**
   * Return the base path of the page images.
   * @returns {string} base_url, the value of the "#dp" element
   */
  function getImgBaseURL() {
      const [holder] = wk$("#dp");
      return holder.value;
  }
  /**
   * Yield the image url of every page: `<base_url><page>.gif`
   * for page 1 up to getPageCounts().
   * @returns {Generator<string, void, unknown>}
   */
  function* genImgURLs$1() {
      const counts = getPageCounts();
      const base_url = getImgBaseURL();
      let page = 0;
      while (++page <= counts) {
          yield `${base_url}${page}.gif`;
      }
  }
  /**
   * Download the page images and export them as one PDF.
   *
   * The title is the part of document.title before the first "_".
   * @returns whatever utils.img_urls_to_pdf returns
   */
  function fetchThenExportPDF() {
      const [title] = document.title.split("_");
      const urls = genImgURLs$1();
      return utils.img_urls_to_pdf(urls, title);
  }
  /**
   * Show the export hints, then run the PDF export through
   * utils.run_with_prog for button 1.
   * @returns whatever utils.run_with_prog returns
   */
  function hintThenDownload() {
      const hint =
          "只能导出可预览的页面(最多20页)" + "\n" +
          "请勿短时间反复点击按钮,导出用时大约不到 10 秒" + "\n" +
          "点完后很久没动静请至 QQ 群反馈";
      alert(hint);
      return utils.run_with_prog(1, fetchThenExportPDF);
  }
  /**
   * Download strategy for safewk documents: a single "export PDF" button.
   * @returns {Promise<void>}
   */
  async function safewk() {
      utils.create_btns();
      // Button 1: export the PDF
      const label = "导出PDF";
      utils.onclick(hintThenDownload, 1, label);
  }
  /**
   * Jump to a page through the site's `WebPreview.Page.jump` interface.
   * Logs an error when that interface is missing.
   * @param {string | number} num page number
   */
  function _to_page(num) {
      const has_jump = Boolean(window.WebPreview?.Page?.jump);
      if (!has_jump) {
          console.error("window.WebPreview.Page.jump doesn't exist");
          return;
      }
      WebPreview.Page.jump(parseInt(num));
  }
  /**
   * Ask the user for a page number and jump to it.
   * Anything other than a run of digits is logged and ignored.
   */
  function to_page() {
      const num = prompt("请输入要跳转的页码")?.trim();
      const is_integer = /^[0-9]+$/.test(num);
      if (!is_integer) {
          console.log(`输入值 [${num}] 不是合法整数`);
          return;
      }
      _to_page(num);
  }
  /**
   * Export the image links of the pages that were already previewed.
   *
   * Images are taken from "[data-id] img", falling back to "img[data-page]".
   * The link is `data-src` or `src`; protocol-relative links get "https:".
   * Images without a link are left out and their positions are reported.
   */
  function capture_urls() {
      const go_on = confirm("只能导出已经预览页面的链接,是否继续?");
      if (!go_on) return;

      let imgs = wk$("[data-id] img");
      if (imgs.length === 0) {
          imgs = wk$("img[data-page]");
      }
      console.log(imgs);

      const existed = [];
      const lacked = [];
      imgs.forEach((img, index) => {
          const src = img.dataset.src || img.src;
          if (!src) {
              // 1-based position of the image that has no link yet
              lacked.push(index + 1);
              return;
          }
          existed.push(src.startsWith("//") ? "https:" + src : src);
      });

      utils.save_urls(existed);
      alert(
          `已经浏览的页面中有 ${lacked.length} 页图片尚未加载,` +
          `已经从结果中剔除。\n它们的页码是:\n${lacked}`
      );
  }
  /**
   * Endlessly yield request urls for the renrendoc preview interface.
   *
   * Every url carries the fixed query fields, `encrypt` and `doc_id` from
   * `window.previewParams`, the current timestamp as `_`, and a `start`
   * value that begins at 1 and grows by 5 per url.
   * @returns {Generator<string, void, unknown>}
   * @throws {Error} on first iteration when `window.previewParams` is missing
   */
  function* genImgURLs() {
      const params = window?.previewParams;
      if (!params) throw new Error(
          "接口为空: window.previewParams"
      );

      const base = "https://openapi.renrendoc.com/preview/getPreview?";
      const { encrypt, doc_id } = params;

      for (let start = 1; ; start += 5) {
          const pairs = [
              ["temp_view", 0],
              ["jsoncallback", "a"],
              ["callback", "b"],
              ["encrypt", encrypt],
              ["doc_id", doc_id],
              ["_", Date.now()],
              ["start", start],
          ];
          yield base + pairs.map(([key, value]) => `${key}=${value}`).join("&");
      }
  }
  /**
   * Request the preview image links group by group and save all links.
   *
   * Requests stop when a response has no `data.preview_list`, or once the
   * responses have switched between "empty" and "non-empty" twice (starting
   * from "empty"). The saved list is the free-page links
   * (`<base><n>.gif` for n = 1..freepage, default 20) followed by the
   * requested links.
   * @returns {Promise<void>}
   */
  async function _fetch_preview_urls() {
      let was_empty = true;
      let switch_counts = 0;
      let previews = [];

      for (const [i, url] of utils.enumerate(genImgURLs())) {
          const resp = await fetch(url);
          utils.raise_for_status(resp);

          // Strip the 2-character prefix and 1-character suffix around the JSON
          const raw_data = await resp.text();
          const payload = JSON.parse(raw_data.slice(2, -1));
          const img_urls = payload
              .data
              ?.preview_list
              ?.map((pair) => pair.url);
          if (!img_urls) break;

          previews = previews.concat(...img_urls);
          utils.update_popup(`已经请求 ${i + 1} 组图片链接`);

          const now_empty = img_urls.length ? false : true;
          if (was_empty !== now_empty) {
              was_empty = now_empty;
              switch_counts++;
          }
          if (switch_counts === 2) break;

          await utils.sleep(1000);
      }

      const params = window.previewParams;
      const free = params.freepage || 20;
      const base = params.pre || wk$(".page img")[0].src.slice(0, -5);
      const free_urls = Array.from(utils.range(1, free + 1)).map(
          (n) => `${base}${n}.gif`
      );

      utils.save_urls(free_urls.concat(...previews));
  }
  /**
   * Run _fetch_preview_urls through utils.run_with_prog for button 3.
   * @returns whatever utils.run_with_prog returns
   */
  function fetch_preview_urls() {
      const btn_index = 3;
      return utils.run_with_prog(btn_index, _fetch_preview_urls);
  }
  /**
   * Explain the difference between "capturing" and "requesting" image links.
   */
  function help() {
      const lines = [
          "【捕获】和【请求】图片链接的区别:",
          " - 【捕获】是从当前已经加载的文档页中提取图片链接",
          " - 【请求】是使用官方接口直接下载图片链接",
          " - 【捕获】使用麻烦,但是稳定",
          " - 【请求】使用简单,速度快,但可能失效",
      ];
      alert(lines.join("\n"));
  }
  /**
   * Download strategy for renrendoc documents: four buttons, of which
   * buttons 2-4 are toggled after all handlers are bound.
   * @returns {Promise<void>}
   */
  async function renrendoc() {
      utils.create_btns();

      const bindings = [
          [to_page, "跳转到页码"],
          [capture_urls, "捕获图片链接"],
          [fetch_preview_urls, "请求图片链接"],
          [help, "使用说明"],
      ];
      bindings.forEach(([handler, label], position) => {
          utils.onclick(handler, position + 1, label);
      });

      for (let index = 2; index <= 4; index++) {
          utils.toggle_btn(index);
      }
  }
  /**
   * Build the links of every page resource and publish them as `window.img_urls`.
   *
   * When "#page1 img" has a src (picture documents), each page's file name
   * is placed under that picture's directory on the current origin and
   * duplicates are removed. Otherwise each page's name is resolved against
   * the directory of the first ".side-image img" and "/thumb/" is replaced
   * by "/content-page/".
   * @returns {Array<string>}
   */
  function get_img_urls() {
      const strip_query = (text) => text.split("?")[0];
      const first_src = wk$("#page1 img")[0]?.src;

      // Picture documents
      if (first_src) {
          const dir = strip_query(first_src).split("/").slice(3, -1).join("/");
          const { origin } = new URL(location.href);
          const all = window.htmlConfig.fliphtml5_pages.map((page) => {
              const fname = strip_query(page.n[0]).split("/").at(-1);
              return `${origin}/${dir}/${fname}`;
          });
          const unique = Array.from(new Set(all));
          window.img_urls = unique;
          return unique;
      }

      // Other documents; the thumbnail path looks like ../files/large/<name>
      const thumb_path = strip_query(wk$(".side-image img")[0].getAttribute("src"));
      const thumb_dir = thumb_path.split("/").slice(0, -1).join("/") + "/";
      const base = location.href;
      const urls = window.htmlConfig.fliphtml5_pages.map((page) => {
          const resolved = new URL(thumb_dir + strip_query(page.n[0]), base);
          return resolved.href.replace("/thumb/", "/content-page/");
      });
      window.img_urls = urls;
      return urls;
  }
  /**
   * Export all page pictures as one PDF named after the document title.
   * The export is started first; the hint is shown right afterwards.
   */
  function imgs_to_pdf() {
      const urls = get_img_urls();
      const { title } = document;
      utils.run_with_prog(1, () => utils.img_urls_to_pdf(urls, title));
      alert(
          "正在下载图片,请稍等,时长取决于图片数量\n" +
          "如果导出的文档只有一页空白页,说明当前文档不适用"
      );
  }
  /**
   * Describe runs of consecutive integers as text,
   * e.g. [1, 2, 3, 5] => "1 - 3, 5".
   *
   * An empty array yields an empty string (previously "undefined").
   * @param {number[]} nums integers in ascending order
   * @returns {string} description of the array
   */
  function describe_nums(nums) {
      if (nums.length === 0) {
          return "";
      }

      const format = (start, end) =>
          start === end ? `${start}` : `${start} - ${end}`;

      const parts = [];
      let start = nums[0];
      let end = nums[0];
      for (const num of nums.slice(1)) {
          if (num === end + 1) {
              // Still inside the current run
              end = num;
              continue;
          }
          parts.push(format(start, end));
          start = num;
          end = num;
      }
      parts.push(format(start, end));
      return parts.join(", ");
  }
  /**
   * Get the total page count as a string.
   *
   * Prefers `window.bookConfig.totalPageCount`; otherwise reads the part
   * after "/" from the "#tfPageIndex input" value.
   * @returns {string}
   */
  function get_total() {
      const configured = window?.bookConfig?.totalPageCount;
      if (!configured) {
          const [, after_slash] = wk$("#tfPageIndex input")[0].value.split("/");
          return after_slash.trim();
      }
      return String(configured);
  }
  /**
   * Pack captured PDF pages plus a password list into a zip and download it.
   *
   * `pdfs_data` is a sparse array indexed by page number - 1 whose items
   * should be `[pdf_blob, pwd_str]`. Items without a blob (for example the
   * empty placeholder created when a page merely started loading) are
   * skipped, instead of being archived as an undefined file with the
   * password "undefined".
   * @param {Array} pdfs_data
   * @returns {Promise<void>}
   */
  async function data_to_zip(pdfs_data) {
      // Per the original author's note this call imports JSZip;
      // `window.JSZip` is used right below
      await utils.blobs_to_zip([], "empty", "dat", "empty", false);

      // Page numbers (1-based) of the entries that really hold a blob
      const page_nums = Object.keys(pdfs_data)
          .filter(index => pdfs_data[index]?.[0])
          .map(index => parseInt(index) + 1);
      const len = page_nums.length;

      // First line of the password list is its header
      const pwds = new Array(len + 1);
      pwds[0] = "page-num,password";

      const zip = new window.JSZip();
      // Pad page numbers to the width of the total page count
      const digits = get_total().length;

      for (let i = 0; i < len; i++) {
          const page_no = page_nums[i];
          const page_no_str = page_no.toString().padStart(digits, "0");
          const [blob, pwd] = pdfs_data[page_no - 1];
          pwds[i + 1] = `${page_no_str},${pwd}`;
          zip.file(`page-${page_no_str}.pdf`, blob, { binary: true });
      }
      console.log("zip:", zip);

      // Add the password list
      const pwds_blob = new Blob([pwds.join("\n")], { type: "text/plain" });
      zip.file(`密码本.txt`, pwds_blob, { binary: true });

      console.info("正在合成压缩包并导出,请耐心等待几分钟......");
      const zip_blob = await zip.generateAsync({ type: "blob" });
      utils.save(`${document.title}.zip`, zip_blob, "application/zip");
  }
  /**
   * Download the captured PDF pages as one zip that includes a password list.
   *
   * The clicked button is hidden while the archive is built and is always
   * shown again afterwards, even when building the archive fails.
   * @param {PointerEvent} event
   * @returns {Promise<void>}
   */
  async function export_zip(event) {
      if (!window.pdfs_data) utils.raise(`pdfs_data 不存在!`);

      // Ask for confirmation, listing the captured page numbers
      const page_nums = Object.keys(pdfs_data)
          .map(index => parseInt(index) + 1);
      const donwload = confirm(
          `已经捕获 ${page_nums.length} 个页面,是否导出?\n` +
          `已捕获的页码:${describe_nums(page_nums)}\n` +
          `(如果某页缺失可以先多向后翻几页,然后翻回来,来重新加载它)`
      );
      if (!donwload) return;

      const btn = event.target;
      btn.style.display = "none";
      try {
          await data_to_zip(pdfs_data);
      } finally {
          // Never leave the button hidden after an error
          btn.style.display = "block";
      }
  }
  /**
   * Start capturing the per-page PDF data while the reader loads pages.
   *
   * Hooks `PdfLoadingTask.prototype.start` to learn which page is being
   * loaded and `window.getBlob` to fetch that page's blob and password into
   * `window.pdfs_data` (`[[pdf_blob, pwd_str], ...]`, indexed by page - 1).
   * The original functions are kept on `wk$._start` / `wk$._get_blob`.
   * Finally button 1 is rebound to export_zip.
   *
   * The page number is copied into a local and reset before the blob is
   * fetched, so a page that starts loading during that fetch can no longer
   * redirect the blob to its own slot.
   */
  function steal_pdf_when_page_loaded() {
      // Shared storage for captured pages
      window.pdfs_data = [];
      // Page currently being loaded; NaN means "nothing to capture"
      let page_no = NaN;

      // Hook PdfLoadingTask.prototype.start
      const _start = PdfLoadingTask.prototype.start;
      wk$._start = _start;
      PdfLoadingTask.prototype.start = function() {
          page_no = this.index;
          // Reserve a slot for a page that has not been seen before
          if (!pdfs_data[page_no - 1]) {
              pdfs_data[page_no - 1] = [];
          }
          return _start.call(this);
      };

      // Hook getBlob
      const _get_blob = getBlob;
      wk$._get_blob = _get_blob;
      window.getBlob = async function(param) {
          const result = await _get_blob.call(this, param);
          // Claim the pending page before awaiting anything else
          const target = page_no;
          if (target > 0) {
              page_no = NaN;
              const resp = await fetch(result.url);
              const blob = await resp.blob();
              pdfs_data[target - 1] = [blob, result.password];
          }
          return result;
      };

      utils.onclick(export_zip, 1, "导出PDF压缩包");
  }
  /**
   * Request `url` and turn the resource into `[pdf_blob, password_str]`.
   *
   * Layout as read by this code: 3 password bytes at offset 1080, the PDF
   * payload from offset 1083 up to 1003 bytes before the end, then 3 more
   * password bytes. The first 4000 payload bytes are stored inverted
   * (255 - byte) and are restored in place.
   *
   * The blob holds the restored payload exactly once; previously the part
   * after byte 4000 was appended a second time.
   * Also updates `window.downloaded_count` / `window.downloaded_size`.
   * @param {string} url
   * @returns {Promise<Array>} `[pdf_blob, password_str]`
   */
  async function url_to_item(url) {
      const resp = await fetch(url);
      const buffer = await resp.arrayBuffer();
      const bytes = new Uint8Array(buffer);
      const len = bytes.length;

      // Progress report
      window.downloaded_count++;
      window.downloaded_size += len;
      console.log(
          `已经下载了 ${downloaded_count} 页,\n` +
          `累计下载了 ${(downloaded_size / 1024 / 1024).toFixed(1)} MB`
      );

      // The password is split in two 3-byte halves around the payload
      const pwd = new Uint8Array(6);
      pwd.set(bytes.subarray(1080, 1083));
      pwd.set(bytes.subarray(-1003, -1000), 3);
      const pwd_str = new TextDecoder().decode(pwd);

      // `pdf` is a view on `bytes`, so the head is restored in place
      const pdf = bytes.subarray(1083, -1003);
      pdf.subarray(0, 4000).forEach((byte, i) => {
          pdf[i] = 255 - byte;
      });

      return [
          new Blob([pdf], { type: "application/pdf" }),
          pwd_str
      ];
  }
  /**
   * Download and decode the raw page data directly, then export a PDF zip.
   *
   * The clicked button is hidden while working and is always shown again
   * afterwards, even when a download or the zip export fails.
   * @param {PointerEvent} event
   * @returns {Promise<void>}
   */
  async function donwload_zip(event) {
      const btn = event.target;
      btn.style.display = "none";
      try {
          // Progress counters shared with url_to_item
          window.downloaded_count = 0;
          window.downloaded_size = 0;

          // Addresses of the page data
          const urls = get_img_urls()
              .map(url => url.replace("/thumb/", "/content-page/"));

          // Download everything, then archive it
          const item_tasks = urls.map(url_to_item);
          const items = await utils.gather(item_tasks);
          await data_to_zip(items);
      } finally {
          // Never leave the button hidden after an error
          btn.style.display = "block";
      }
  }
  /**
   * Bind the buttons that fit the kind of resource the reader uses.
   *
   * - pages stored as "zip" and the reader's PdfLoadingTask / getBlob
   *   present: capture and direct-download buttons
   * - "#page1 img" present: export the pictures as PDF
   * - otherwise: a button stating that the document is not supported
   *
   * The page list is read with optional chaining all the way down, so a
   * missing or empty `fliphtml5_pages` leads to the fallback branches
   * instead of a TypeError.
   */
  function judge_file_type() {
      // Extension of the first page resource, without its query string
      const ext = window
          ?.htmlConfig
          ?.fliphtml5_pages
          ?.[0]
          ?.n
          ?.[0]
          ?.split("?")[0]
          ?.split(".").at(-1);
      console.log("ext:", ext);

      if (["zip"].includes(ext)
          && window?.PdfLoadingTask
          && window?.getBlob) {
          utils.onclick(steal_pdf_when_page_loaded, 1, "开始捕获");
          utils.onclick(donwload_zip, 2, "下载PDF压缩包");
          utils.toggle_btn(2);
      }
      else if (wk$("#page1 img")[0]) {
          utils.onclick(imgs_to_pdf, 1, "导出PDF");
      }
      else {
          utils.onclick(() => null, 1, "此文档不适用");
      }
  }
  /**
   * Download strategy for yunzhan365 documents.
   * Pages whose path starts with "/basic" are left untouched.
   * @returns {Promise<void>}
   */
  async function yunzhan365() {
      const is_basic_page = location.pathname.startsWith("/basic");
      if (!is_basic_page) {
          utils.create_btns();
          judge_file_type();
      }
  }
  /**
   * Export the links of the pictures that are currently loaded.
   *
   * The total page count is taken from the first run of digits in the text
   * of the "[class*=total]" element. Previously the element itself was
   * passed to parseInt, which always gave NaN and silently disabled the
   * "not all pages were viewed" warning. When no number can be read the
   * warning is skipped, as before.
   */
  function exportURLs$1() {
      const total_text = wk$("[class*=total]")[0]?.textContent ?? "";
      const all = parseInt(total_text.match(/\d+/)?.[0], 10);

      const imgs = wk$("[class*=imgContainer] img");
      const got = imgs.length;

      if (got < all) {
          const go_on = confirm(
              `当前浏览页数:${got},总页数:${all}\n建议浏览剩余页面以导出全部链接\n是否继续导出链接?`
          );
          if (!go_on) {
              return;
          }
      }
      utils.save_urls(
          imgs.map(img => img.src)
      );
  }
  /**
   * Download strategy for 360 wenku documents: a single
   * "export image links" button.
   */
  function wenku360() {
      utils.create_btns();
      const label = "导出图片链接";
      utils.onclick(exportURLs$1, 1, label);
  }
  /**
   * Ask the resource API for the download url and title of the current file.
   *
   * The `contentUid` query parameter of the current page identifies the
   * file. The request body is produced with JSON.stringify, so a uid that
   * contains quotes or backslashes can no longer produce invalid JSON.
   * @returns {Promise<{url: string, fname: string, ext: string}>}
   * @throws {Error} when the API response carries no valid download url
   */
  async function getFileInfo() {
      const uid = new URL(location.href).searchParams.get("contentUid");
      const resp = await fetch("https://zyjy-resource.webtrn.cn/sdk/api/u/open/getResourceDetail", {
          "headers": {
              "accept": "application/json, text/javascript, */*; q=0.01",
              "content-type": "application/json",
          },
          "referrer": "https://jg.class.com.cn/",
          "body": JSON.stringify({ params: { contentUid: uid } }),
          "method": "POST",
      });
      const data = await resp.json();
      const url = data["data"]["downloadUrl"];
      const fname = data["data"]["title"];

      let ext;
      try {
          // Validates the url format and extracts the file extension
          ext = new URL(url).pathname.split(".").at(-1);
      } catch(e) {
          console.log(data);
          throw new Error("API changed, the script is invalid now.");
      }
      return { url, fname, ext };
  }
  /**
   * Download the file described by `info` and save it as `<fname>.<ext>`.
   * @param {{fname: string, url: string, ext: string}} info
   * @returns {Promise<void>}
   */
  async function saveFile(info) {
      const resp = await fetch(info.url);
      const blob = await resp.blob();
      const file_name = `${info.fname}.${info.ext}`;
      utils.save(file_name, blob);
  }
  /**
   * Keydown handler that replaces "save page" (Ctrl + S) with saving the file.
   * Other key combinations are left alone.
   * @param {KeyboardEvent} e
   */
  function onCtrlS(e) {
      const is_ctrl_s = e.code === "KeyS" && e.ctrlKey;
      if (!is_ctrl_s) return;

      console.log("ctrl + s is captured!!");
      getFileInfo().then((info) => saveFile(info));

      // Keep the browser and other listeners from handling the shortcut
      e.preventDefault();
      e.stopImmediatePropagation();
      e.stopPropagation();
  }
  /**
   * Strategy for the jg (技工教育网) resource page: listen for Ctrl + S
   * in the capture phase.
   */
  function jg() {
      const use_capture = true;
      window.addEventListener("keydown", onCtrlS, use_capture);
  }
  /**
   * Scroll to the last page, then ask the user to confirm the capture
   * after showing the estimated duration (1.1 seconds per page).
   *
   * The estimate is rounded to whole seconds; the raw product printed
   * floating point noise such as "3.3000000000000003".
   * @returns {Promise<boolean>} whether the user wants to continue
   */
  async function estimateTimeCost() {
      wk$(".w-page").at(-1).scrollIntoView();
      await utils.sleep(1000);

      // The text looks like "<current>/<total>"
      const total = parseInt(
          wk$("#pageNumber-text")[0].textContent.split("/")[1]
      );
      const seconds = Math.round(1.1 * total);

      return confirm([
          "注意,一旦开始截图就无法停止,除非刷新页面。",
          "浏览器窗口最小化会导致截图提前结束!",
          "建议将窗口最大化,这将【显著增大清晰度和文件体积】",
          `预计耗时 ${seconds} 秒,是否继续?`,
      ].join("\n"));
  }
  /**
   * Visit the pages one by one and capture each page's canvas.
   *
   * Compared with the previous version:
   * - while waiting (up to 1s) for the first ".w-page" the element is
   *   actually queried again, instead of re-checking a stale variable;
   * - the search for the next sibling that holds a canvas stops when the
   *   siblings run out, instead of querying a null element.
   * @returns {Promise<Array<Blob>>}
   * @throws {Error} when no page div exists or the siblings run out while
   *   looking for a canvas
   */
  async function collectAll() {
      const imgs = [];

      // Wait for the first page container
      let div = wk$(".w-page")[0];
      const anchor = Date.now();
      while (!div && (Date.now() - anchor < 1000)) {
          console.log(`retry on page 1`);
          await utils.sleep(200);
          div = wk$(".w-page")[0];
      }
      if (!div) throw new Error(
          `can not fetch <div>: page 0`
      );

      let i = 0;
      while (div) {
          // Bring the page into view and give it time to render
          div.scrollIntoView({ behavior: "smooth" });
          await utils.sleep(1000);

          // Find the canvas here or in one of the next (at most 100) siblings
          let canvas = wk$.call(div, "canvas")[0];
          let j = 0;
          while (!canvas && j < 100) {
              div = div.nextElementSibling;
              if (!div) break;
              canvas = wk$.call(div, "canvas")[0];
              j++;
          }
          if (!div) throw new Error(
              `can not fetch <div>: page ${i}*`
          );

          imgs.push(
              await utils.canvas_to_blob(canvas)
          );
          console.log(`canvas stored: ${++i}`);

          div = div.nextElementSibling;
      }
      console.log("done");
      return imgs;
  }
  /**
   * Zoom the document view in or out by clicking the matching button
   * ten times, pausing 500 ms after each click.
   * @param {boolean} up true to magnify, false to shrink
   * @returns {Promise<void>}
   */
  async function scale(up) {
      const selector = up ? "#magnifyBtn" : "#shrinkBtn";
      const [btn] = wk$(selector);
      for (const _ of utils.range(10)) {
          btn.click();
          await utils.sleep(500);
      }
  }
  /**
   * Capture every page canvas, then offer the export buttons.
   *
   * After the user confirms, button 1 is hidden and the view is magnified
   * while collectAll() runs. The view is shrunk again afterwards without
   * being waited for. When capturing fails, the error is logged, button 1
   * is toggled back and no export button is bound; previously the export
   * buttons were bound to `undefined` images.
   * @returns {Promise<void>}
   */
  async function prepare() {
      if (! await estimateTimeCost()) {
          return;
      }
      // Hide the capture button
      utils.toggle_btn(1);
      // Magnify the view before capturing
      await scale(true);

      let imgs;
      try {
          imgs = await collectAll();
      } catch(e) {
          console.error(e);
      } finally {
          // Shrink the view in the background; only log if that fails
          scale(false).catch(err => console.error(err));
      }

      if (!imgs) {
          // Nothing was captured: give the capture button back
          utils.toggle_btn(1);
          return;
      }

      // Show the export buttons
      const fname = "技工教育网文档";
      utils.onclick(
          () => utils.img_blobs_to_pdf(imgs, fname),
          2,
          "导出PDF"
      );
      utils.toggle_btn(2);

      utils.onclick(
          () => utils.blobs_to_zip(imgs, "page", "png", fname),
          3,
          "导出ZIP"
      );
      utils.toggle_btn(3);
  }
  /**
   * Strategy for the jg.class.com.cn document preview page:
   * create the button area and bind `prepare` to button 1.
   */
  function jgPreview() {
      utils.create_btns();
      const label = "截图文档";
      utils.onclick(prepare, 1, label);
  }
  /**
   * Document title: `document.title` without its last four characters
   * (presumably a site suffix — confirm against the page).
   * @returns {string}
   */
  function getTitle() {
      const { title } = document;
      const keep = Math.max(title.length - 4, 0);
      return title.substring(0, keep);
  }
  /**
   * Base URL for page images, read from the `value` of the "#dp" element.
   * @returns {string}
   */
  function getBaseURL$1() {
      const field = wk$("#dp")[0];
      return field.value;
  }
  /**
   * Total page count, parsed from the text after "/" in the third item
   * of the ".shop3" list.
   * @returns {number}
   */
  function getTotalPageNum() {
      const counter = wk$(".shop3 > li:nth-child(3)")[0];
      const [, totalText] = counter.textContent.split("/");
      return parseInt(totalText.trim());
  }
  /**
   * Lazily produce image URLs of the form `<base><n>.gif`, where n runs
   * over `utils.range(1, max + 1)`.
   * @param {string} base base image URL
   * @param {number} max highest page number
   * @returns {Generator<string, void, unknown>}
   */
  function* imgURLsMaker(base, max) {
      const pageNumbers = utils.range(1, max + 1);
      for (const pageNo of pageNumbers) {
          yield `${base}${pageNo}.gif`;
      }
  }
  /**
   * Image URL generator for the current document, built from the page's
   * base URL and total page count.
   * @returns {Generator<string, void, unknown>}
   */
  function getImgURLs() {
      return imgURLsMaker(getBaseURL$1(), getTotalPageNum());
  }
  /**
   * Turn all page images into a PDF named after the document title,
   * running the job through `utils.run_with_prog` on button 2.
   * @returns {*} whatever `utils.run_with_prog` returns
   */
  function exportPDF() {
      const pageURLs = getImgURLs();
      const docTitle = getTitle();
      const job = () => utils.img_urls_to_pdf(pageURLs, docTitle);
      return utils.run_with_prog(2, job);
  }
  /**
   * Hand the document's image URLs to `utils.save_urls`.
   */
  function exportURLs() {
      utils.save_urls(getImgURLs());
  }
  /**
   * Strategy for www.wenkub.com documents: button 1 exports the image
   * links, button 2 (toggled afterwards) exports a PDF.
   */
  function wenkub() {
      utils.create_btns();

      const bindings = [
          [exportURLs, 1, "导出图片链接"],
          [exportPDF, 2, "导出PDF(测试)"],
      ];
      for (const [handler, index, label] of bindings) {
          utils.onclick(handler, index, label);
      }

      utils.toggle_btn(2);
  }
  /**
   * Endless generator of `[index, url]` pairs for the PDF data groups of
   * the current book, starting at index 0.
   *
   * The book id comes from the "id" query parameter, else from the "id"
   * parameter of the "#pdfContent" element's `src`, else `utils.raise` is
   * called. When `window.wk_sklib_url` is set at start-up it is used as a
   * template ("{id}" and "{index}" placeholders); otherwise the URL is
   * `<origin><basePath>/data/<type>/<id>/<index>?random=null`.
   * @returns {Generator<[number, string], void, unknown>}
   */
  function* pageURLGen() {
      const here = new URL(location.href);
      const query = here.searchParams;
      const base = here.origin + (window.basePath || "/manuscripts/pdf");
      const type = query.get("type") || "pdf";
      const id = query.get("id")
          || new URL(wk$("#pdfContent")[0].src).searchParams.get("id")
          || utils.raise("书本ID未知");

      // The branch is chosen once; the custom template itself is re-read on every step
      const useCustom = Boolean(window.wk_sklib_url);
      if (useCustom) {
          console.log(`sklib 使用自定义 url: ${window.wk_sklib_url}`);
      }
      const makeURL = useCustom
          ? (index) => window.wk_sklib_url.replace("{id}", id).replace("{index}", `${index}`)
          : (index) => `${base}/data/${type}/${id}/${index}?random=null`;

      for (let index = 0; ; index++) {
          const target = makeURL(index);
          yield [index, target];
          // Logged only once the consumer asks for the next item
          console.log("wk: target:", target);
      }
  }
  /**
   * Fetch the catalog of the current book (id taken from the "id" URL
   * parameter) and return the `outline` field of its JSON-encoded `data`.
   * @returns {Promise<*>} the parsed outline
   */
  async function get_bookmarks() {
      const target = new URL(location.origin);
      target.pathname = `/manuscripts/pdf/catalog/pdf/${utils.get_param("id")}`;
      const payload = await fetch(target.href).then((resp) => resp.json());
      const { outline } = JSON.parse(payload.data);
      return outline;
  }
  /**
   * Download the book outline and save it as pretty-printed
   * "bookmarks.json" through `utils.save`.
   * @returns {Promise<void>}
   */
  async function save_bookmarks() {
      const outline = await get_bookmarks();
      utils.save(
          "bookmarks.json",
          JSON.stringify(outline, null, 2),
          { type: "application/json" }
      );
  }
  /**
   * Download every PDF data group of the book and return them as an array
   * of byte strings (results of `utils.b64_to_bytes`).
   *
   * The result is cached in `window.pdfs`; once `window.download_finished`
   * is true the cached array is returned without any request.
   * Downloading stops at the first empty response or when a response has
   * the same CRC32 digest as the previous one (the server keeps repeating
   * the last group).
   * @returns {Promise<Array<Uint8Array>>}
   */
  async function fetch_all_pdfs() {
      // Reuse the previous result when a download has already completed
      if (window.download_finished) {
          return window.pdfs;
      }
      // Button used as progress display
      const prog_btn = utils.btn(3);
      window.download_finished = false;

      const pdfs = [];
      let last_digest = NaN;
      // Pages per PDF group; stays NaN when the page does not tell us
      let size = NaN;
      if (window.loadPdfInfo) {
          try {
              const resp = await window.loadPdfInfo();
              const info = JSON.parse(resp.data);
              size = parseInt(info.size) || size;
          } catch(e) {
              console.error(e);
          }
      }

      for (const [i, url] of pageURLGen()) {
          const b64_data = await fetch(url).then(resp => resp.text());
          // An empty body means there is nothing left to fetch
          if (!b64_data.length) break;
          // A repeated digest means the last group was reached
          const digest = utils.crc32(b64_data);
          if (digest === last_digest) break;
          last_digest = digest;

          pdfs.push(
              utils.b64_to_bytes(b64_data)
          );

          const progress = `已经获取 ${i + 1} 组页面,每组`
              + (size ? ` ${size} 页` : '页数未知');
          console.info(progress);
          // `size` is the page count per group, not a total, and may be
          // unknown: never render it as "N / NaN"
          prog_btn.textContent = size
              ? `${i + 1} 组 × ${size} 页`
              : `${i + 1} 组`;
      }

      window.pdfs = pdfs;
      window.download_finished = true;
      return pdfs;
  }
  /**
   * Wrap an async function so that buttons 1 and 2 are toggled before it
   * starts and toggled back when it settles — also when it rejects, so a
   * failed download does not leave the buttons in the toggled state.
   * @param {Function} async_fn function to wrap
   * @returns {Function} async wrapper forwarding its arguments and
   *                     resolving to the result of `async_fn`
   */
  function toggle_dl_btn_wrapper(async_fn) {
      return async function(...args) {
          utils.toggle_btn(1);
          utils.toggle_btn(2);
          try {
              return await async_fn(...args);
          } finally {
              utils.toggle_btn(1);
              utils.toggle_btn(2);
          }
      };
  }
  /**
   * Download all PDF groups, merge them with `utils.join_pdfs` and save
   * the result as "<document.title>.pdf"; finally reset the text of
   * button 3.
   * @returns {Promise<void>}
   */
  async function download_pdf$1() {
      const notice = [
          "如果看不到进度条请使用开发者工具(F12)查看日志",
          "如果文档页数过多可能导致合并PDF失败",
          "此时请使用【下载PDF数据集】按钮",
      ].join("\n");
      alert(notice);

      const parts = await fetch_all_pdfs();
      const merged = await utils.join_pdfs(parts);
      utils.save(`${document.title}.pdf`, merged, "application/pdf");

      utils.btn(3).textContent = "进度条";
  }
  // Replace the binding with the button-toggling wrapper
  download_pdf$1 = toggle_dl_btn_wrapper(download_pdf$1);
  /**
   * Download all PDF groups and save them, concatenated in order, as a
   * single "<document.title>.dat" file through a temporary object URL.
   * @returns {Promise<void>}
   */
  async function download_data_bundle() {
      const notice = [
          "下载的是 <文档名称>.dat 数据集",
          "等价于若干 PDF 的文件顺序拼接",
          "请使用工具切割并合并为一份 PDF",
          "工具(pdfs-merger)链接在脚本主页",
      ].join("\n");
      alert(notice);

      const parts = await fetch_all_pdfs();
      const bundle = new Blob(parts, { type: "application/octet-stream" });
      const href = URL.createObjectURL(bundle);

      const link = Object.assign(document.createElement("a"), {
          download: `${document.title}.dat`,
          href,
      });
      link.click();
      URL.revokeObjectURL(href);

      console.log("pdf数据集", bundle);
  }
  // Replace the binding with the button-toggling wrapper
  download_data_bundle = toggle_dl_btn_wrapper(download_data_bundle);
  /**
   * Hook for gwfw.sdlib.com: prefix the base path with
   * `/https/<encrypted id>`, where the id is the third "/"-separated
   * segment of the current pathname, and store it in `window.basePath`.
   *
   * The current base path is taken from `window.basePath`, else from a
   * page-level `basePath` binding if one exists, else from the same
   * default `pageURLGen` uses, so a page without `basePath` no longer
   * raises a ReferenceError. Calling the hook again does not prefix twice.
   */
  function sdlib() {
      const { pathname } = new URL(location.href);
      const encrypted_id = pathname.split("/")[2];
      const prefix = `/https/${encrypted_id}`;

      const current = window.basePath
          // `typeof` keeps this safe when no such binding exists at all
          || (typeof basePath !== "undefined" ? basePath : "")
          || "/manuscripts/pdf";

      // Already rewritten by an earlier call
      if (current.startsWith(prefix)) return;

      window.basePath = `${prefix}${current}`;
  }
  /**
   * Run the site-specific hook registered for the current hostname, if
   * any, so individual sites can adjust things before the main strategy.
   */
  function load_hooks() {
      const hooks = {
          "gwfw.sdlib.com": sdlib,
      };
      const hook = hooks[location.hostname];
      // Hosts without a registered hook are simply ignored
      if (!hook) return;
      hook();
  }
  /**
   * Strategy for sklib-style document pages ("中国社会科学文库").
   *
   * Does nothing when the page contains an "iframe#pdfContent" element
   * (presumably the script runs again inside that iframe — confirm).
   * Otherwise runs the site hooks, creates the buttons, binds the four
   * actions and toggles buttons 2-4; button 3 only displays progress and
   * is made non-clickable.
   */
  function sklib() {
      if (wk$("iframe#pdfContent")[0]) return;

      // Site-specific adjustments
      load_hooks();

      utils.create_btns();

      const bindings = [
          [download_pdf$1, 1, "下载PDF"],
          [download_data_bundle, 2, "下载PDF数据集"],
          [() => false, 3, "进度条"],
          [save_bookmarks, 4, "下载书签"],
      ];
      for (const [handler, index, label] of bindings) {
          utils.onclick(handler, index, label);
      }

      for (const index of [2, 3, 4]) {
          utils.toggle_btn(index);
      }

      // The progress button must not react to the pointer
      utils.btn(3).style.pointerEvents = "none";
  }
  /**
   * Base image URL of the document: the `src` of the first page's image
   * ("#page_1 img") without its trailing "1.gif". Appending
   * "<page number>.gif" gives a full image URL.
   * @returns {string}
   * @throws {Error} when the image or its `src` is missing, or when the
   *                 `src` does not end with "1.gif" (an alert is shown first)
   */
  function getBaseURL() {
      const elem = wk$("#page_1 img")[0];
      // The image may not exist at all; treat that like an empty src
      const src = elem?.src;
      if (!src) {
          alert("当前页面不能解析!");
          // Throw instead of returning undefined, which the caller would
          // turn into bogus "undefined<n>.gif" links
          throw new Error("未找到第一页图片地址");
      }
      if (!src.endsWith("1.gif")) {
          alert("当前文档不能解析!");
          throw new Error("第一页图片不以 1.gif 结尾");
      }
      // Drop the 5 characters of "1.gif"
      return src.slice(0, -5);
  }
  /**
   * Lazily produce the image URL of every page: `<base><n>.gif` for n in
   * `utils.range(1, max + 1)`, where max is parsed from the text after
   * "/" in the ".counts" element (e.g. ' / 23 ').
   * @returns {Generator<string, void, unknown>}
   */
  function* imgURLGen() {
      const base = getBaseURL();
      const [, totalText] = wk$(".counts")[0].textContent.split("/");
      const max = parseInt(totalText);
      for (const pageNo of utils.range(1, max + 1)) {
          yield `${base}${pageNo}.gif`;
      }
  }
  /**
   * Hand the document's image URL generator to `utils.save_urls`.
   */
  function getURLs() {
      const urls = imgURLGen();
      utils.save_urls(urls);
  }
  /**
   * Strategy for www.jinchutou.com documents: button 1 exports the
   * image links.
   */
  function jinchutou() {
      utils.create_btns();
      const label = "导出图片链接";
      utils.onclick(getURLs, 1, label);
  }
  // Example page: http://www.nrsis.org.cn/mnr_kfs/file/read/55806d6159b7d8e19e633f05fa62fefa
  /**
   * Request every page of the document from the site's page endpoint and
   * return the decoded results.
   *
   * The page count comes from `window.Page.size`, the endpoint path from
   * the `url:'...'` literal inside the source text of `window.loadPdf`,
   * and the document code from the last segment of the pathname.
   * "?wk=true" is appended to the endpoint so these requests can be told
   * apart from the page's own.
   * @returns {*} result of `utils.gather` over one task per page
   *              (presumably a Promise of an array — confirm)
   * @throws via `utils.raise` when the page count or the path is unknown
   */
  function get_pdfs() {
      // e.g. 34; `Page` itself may be missing, so guard it rather than `window`
      const size = window.Page?.size;
      if (!size) utils.raise("无法确定总页码");

      // e.g. '/mnr_kfs/file/readPage'; both a missing function and a failed
      // match must end in the readable error below, not in a TypeError
      const path = window.loadPdf
          ?.toString()
          .match(/url:'(.+?)',/)
          ?.[1];
      if (!path) utils.raise("无法确定PDF路径");

      const code = location.pathname.split("/").at(-1);
      const tasks = [...utils.range(1, size + 1)].map(
          async i => {
              const resp = await fetch(path + "?wk=true", {
                  "headers": {
                      "content-type": "application/x-www-form-urlencoded; charset=UTF-8",
                  },
                  "body": `code=${code}&page=${i}`,
                  "method": "POST",
              });
              if (!resp.ok) utils.raise(`第 ${i} 页获取失败!`);
              utils.update_popup(`已经获取第 ${i} 页`);
              const b64_str = await resp.text();
              return utils.b64_to_bytes(b64_str);
          }
      );
      return utils.gather(tasks);
  }
  /**
   * Document title: `document.title` without its last five characters
   * (presumably a site suffix — confirm against the page).
   * @returns {string}
   */
  function get_title() {
      const { title } = document;
      const keep = Math.max(title.length - 5, 0);
      return title.substring(0, keep);
  }
  /**
   * Download all pages, merge them with `utils.join_pdfs` and save the
   * result as "<title>.pdf", running the job through
   * `utils.run_with_prog` on button 1.
   * @returns {*} whatever `utils.run_with_prog` returns, so callers can
   *              wait for completion
   */
  function download_pdf() {
      return utils.run_with_prog(1, async () => {
          const pdfs = await get_pdfs();
          const pdf = await utils.join_pdfs(pdfs);
          // Save with a ".pdf" extension, like the other PDF exporters do
          const title = get_title();
          const fname = title.toLowerCase().endsWith(".pdf")
              ? title
              : `${title}.pdf`;
          utils.save(
              fname, pdf, "application/pdf"
          );
      });
  }
  /**
   * Append a <style> element to the end of <body> that recolours and
   * re-animates the nprogress spinner icon carrying the "forbidden" class.
   */
  function add_style() {
      const lines = [
          "",
          "<style>",
          "#nprogress .nprogress-spinner-icon.forbidden {",
          "border-top-color: #b171ff;",
          "border-left-color: #bf8aff;",
          "animation: nprogress-spinner 2.4s linear infinite;",
          "}",
          "</style>",
          "",
      ];
      document.body.insertAdjacentHTML("beforeend", lines.join("\n"));
  }
  /**
   * Stop the page from loading PDF pages by itself: patch
   * `XMLHttpRequest.prototype.open` so that requests whose URL contains
   * "readPage" but not "wk=true" get a no-op `send`. All other requests
   * are passed to the original `open` unchanged.
   *
   * Also marks the nprogress spinner icon (when present) with the
   * "forbidden" class.
   * @returns {Function} `regain_open`, which reloads the page with
   *                     "intercept=0" in the query string
   */
  function init_forbid_origin_pdf_fetch() {
      console.log("hooked xhr.open");
      // Restyle the spinner; it may not exist yet, which must not abort the hook
      wk$(".nprogress-spinner-icon")[0]
          ?.classList.add("forbidden");

      const open = XMLHttpRequest.prototype.open;
      XMLHttpRequest.prototype.open = function(...args) {
          // The URL argument may be a URL object rather than a string
          const url = String(args[1]);
          const is_origin_pdf_request = url.includes("readPage")
              && !url.includes("wk=true");
          if (is_origin_pdf_request) {
              // Let the request be opened but never sent
              this.send = () => undefined;
          }
          // Always delegate: an XHR that was never opened throws on send()
          return open.apply(this, args);
      };

      return function regain_open() {
          const url = new URL(location.href);
          url.searchParams.set("intercept", "0");
          location.assign(url.toString());
      };
  }
  /**
   * Strategy for www.nrsis.org.cn documents: button 1 downloads the PDF.
   * Unless the URL carries a truthy "intercept" parameter, the page's own
   * PDF loading is blocked and button 2 is offered to restore it.
   */
  function nrsis() {
      utils.create_btns();
      utils.onclick(download_pdf, 1, "下载PDF");

      if (utils.get_param("intercept")) return;

      add_style();
      const restore = init_forbid_origin_pdf_fetch();
      utils.onclick(restore, 2, "恢复页面加载");
      utils.toggle_btn(2);
  }
  4779. // ==UserScript==
  4780. // @name 先晓书院PDF下载
  4781. // @namespace http://tampermonkey.net/
  4782. // @version 0.1
  4783. // @description 先晓书院PDF下载,仅对PDF预览有效
  4784. // @author 2690874578@qq.com
  4785. // @match https://xianxiao.ssap.com.cn/index/rpdf/read/id/*/catalog_id/0.html?file=*
  4786. // @require https://gf.qytechs.cn/scripts/445312-wk-full-cli/code/wk-full-cli.user.js
  4787. // @icon https://www.google.com/s2/favicons?sz=64&domain=xianxiao.ssap.com.cn
  4788. // @grant none
  4789. // @run-at document-idle
  4790. // @license GPL-3.0-only
  4791. // ==/UserScript==
  /**
   * Fetch the inclusive byte range [begin, end] of a file with an HTTP
   * Range request.
   * @param {string} url file URL
   * @param {number} begin first byte offset
   * @param {number} end last byte offset (inclusive)
   * @param {() => void} onload called once after the chunk body has been read
   * @returns {Promise<ArrayBuffer>}
   * @throws {Error} when the response status is not successful, so that an
   *                 error page is never spliced into the downloaded file
   */
  async function fetch_file_chunk(url, begin, end, onload) {
      const resp = await fetch(url, {
          headers: { "Range": `bytes=${begin}-${end}` }
      });
      if (!resp.ok) {
          throw new Error(
              `chunk ${begin}-${end} failed: HTTP ${resp.status}`
          );
      }
      const buffer = await resp.arrayBuffer();
      onload();
      return buffer;
  }
  /**
   * Document id: the path segment that follows "id/" in the current
   * pathname, parsed as an integer.
   * @returns {number}
   */
  function get_doc_id() {
      const [, afterMarker] = location.pathname.split("id/");
      const [idText] = afterMarker.split("/");
      return parseInt(idText);
  }
  /**
   * Determine the total size of a remote file by requesting its first two
   * bytes and reading the total from the "Content-Range" response header
   * ("bytes 0-1/<total>").
   * @param {string} url file URL
   * @returns {Promise<number>} total size in bytes
   * @throws {Error} when the header is missing or carries no numeric
   *                 total (e.g. the server ignored the Range request)
   */
  async function get_file_size(url) {
      const resp = await fetch(url, {
          headers: { "Range": `bytes=0-1` }
      });
      const content_range = resp.headers.get("content-range");
      const size = parseInt(content_range?.split("/")[1], 10);
      // Fail loudly instead of returning NaN or crashing on a null header
      if (!Number.isFinite(size)) {
          throw new Error(
              `无法确定文件大小: content-range = ${content_range}`
          );
      }
      return size;
  }
  /**
   * Download the current document's PDF in 64 KiB ranges and save it as
   * "<first '_'-separated part of top.document.title>.pdf".
   * The clicked button shows the downloaded amount while chunks arrive.
   * @param {PointerEvent} event click event of the download button
   * @returns {Promise<void>}
   */
  async function export_pdf(event) {
      const btn = event.target;

      // Prepare the requests
      const doc_id = get_doc_id();
      const url = `https://xianxiao.ssap.com.cn/rpdf/pdf/id/${doc_id}/catalog_id/0.pdf`;
      const size = await get_file_size(url);
      const chunk = 65536;

      // Progress display
      let finished = 0;
      let loaded_bytes = 0;
      const make_progress_updater = (length) => () => {
          finished++;
          // Count real bytes so the last, shorter chunk is not over-reported
          loaded_bytes += length;
          const loaded = (loaded_bytes / 1024 / 1024).toFixed(2);
          const text = `已下载 ${loaded} MB`;
          utils.print(`chunk<${finished}>:`, text);
          btn.textContent = text;
      };

      // Request every range. Deriving each range from `begin < size` means
      // a file whose size is an exact multiple of the chunk size gets no
      // empty (invalid) trailing range.
      const tasks = [];
      for (let begin = 0; begin < size; begin += chunk) {
          const end = Math.min(begin + chunk, size) - 1;
          tasks.push(fetch_file_chunk(
              url,
              begin,
              end,
              make_progress_updater(end - begin + 1),
          ));
      }

      // Wait for all chunks
      const buffers = await utils.gather(tasks);
      utils.print("--------全部下载完成--------");
      utils.print("全部数据分片:", { get data() { return buffers; } });

      // Export the PDF
      const blob = new Blob(buffers);
      const fname = top.document.title.split("_")[0] + ".pdf";
      utils.save(fname, blob, "application/pdf");
  }
  /**
   * Strategy for xianxiao.ssap.com.cn documents: button 1 downloads
   * the PDF.
   */
  function xianxiao() {
      const banner = "进入<先晓书院PDF下载>脚本";
      utils.print(banner);
      utils.create_btns();
      utils.onclick(export_pdf, 1, "下载PDF");
  }
  /**
   * Keep console logging usable: when both `window.console` and
   * `console.log` are still configurable, lock `window.console` and the
   * `log` / `info` / `warn` / `error` methods behind non-configurable
   * accessors whose setters only log the attempted replacement.
   */
  function hook_log() {
      const con = window.console;
      const { log, info, warn, error } = con;

      // Only hook when hooking is possible at all
      if (!Object.getOwnPropertyDescriptor(window, "console").configurable) return;
      if (!Object.getOwnPropertyDescriptor(con, "log").configurable) return;

      // window.console can no longer be replaced
      Object.defineProperty(window, "console", {
          get() { return con; },
          set(value) {
              log.call(con, "window.console 想改成", value, "?没门!");
          },
          enumerable: false,
          configurable: false,
      });

      // The logging functions can no longer be replaced either
      const originals = { log, info, warn, error };
      for (const [name, original] of Object.entries(originals)) {
          Object.defineProperty(con, name, {
              get() { return original; },
              set(value) {
                  log.call(con, `console.${name} 想改成`, value, "?没门!");
              },
              enumerable: false,
              configurable: false,
          });
      }
  }
  /**
   * Entry point: identify the current site and run its download strategy.
   * Routes are tried in order and the first match wins; an unknown site
   * only produces a log line.
   * @param {string|null} host hostname to dispatch on; defaults to
   *                           `location.hostname` when falsy
   */
  function main(host=null) {
      // Expose the entry point globally
      window.wk_main = main;

      const site = host || location.hostname;
      const url = new URL(location.href);
      const params = url.searchParams;
      const path = url.pathname;

      hook_log();
      console.log(`当前 host: ${site}\n当前 url: ${url.href}`);

      const is = (name) => site === name;
      const has = (part) => site.includes(part);

      // [predicate, strategy] pairs; strategies are wrapped so each name
      // is only looked up when its route is actually taken
      const routes = [
          [() => has("docin.com"), () => docin()],
          [
              () => is("swf.ishare.down.sina.com.cn"),
              () => (params.get("wk") === "true" ? ishareData2() : ishareData()),
          ],
          [() => has("ishare.iask"), () => ishare()],
          [() => is("www.deliwenku.com"), () => deliwenku()],
          [() => has("file") && has("deliwenku.com"), () => deliFile()],
          [() => is("www.doc88.com"), () => doc88()],
          [() => is("www.360doc.com"), () => doc360()],
          [() => is("doc.mbalib.com"), () => mbalib()],
          [() => is("www.dugen.com"), () => dugen()],
          [() => is("c.gb688.cn"), () => gb688()],
          [() => is("www.safewk.com"), () => safewk()],
          [() => has("book118.com"), () => book118()],
          [() => is("www.renrendoc.com"), () => renrendoc()],
          [() => has("yunzhan365.com"), () => yunzhan365()],
          [() => is("wenku.so.com"), () => wenku360()],
          [() => is("jg.class.com.cn"), () => jg()],
          [() => is("preview.imm.aliyuncs.com"), () => jgPreview()],
          [() => is("www.wenkub.com"), () => wenkub()],
          [
              () => (has("sklib") && path === "/manuscripts/") || is("gwfw.sdlib.com"),
              () => sklib(),
          ],
          [() => is("www.jinchutou.com"), () => jinchutou()],
          [() => is("www.nrsis.org.cn"), () => nrsis()],
          [() => is("xianxiao.ssap.com.cn"), () => xianxiao()],
      ];

      const route = routes.find(([matches]) => matches());
      if (route) {
          const [, strategy] = route;
          strategy();
      } else {
          console.log("匹配到了无效网页");
      }
  }
  4977. setTimeout(main, 1000);
  4978. })();

QingJ © 2025

镜像随时可能失效,请加Q群300939539或关注我们的公众号极客氢云获取最新地址