Wayback Machine Image Fixer

Attempts to fix broken images by replacing them with working timestamps based on JSON results

当前为 2016-01-04 提交的版本,查看 最新版本

  1. // ==UserScript==
  2. // @name Wayback Machine Image Fixer
  3. // @namespace DoomTay
  4. // @description Attempts to fix broken images by replacing them with working timestamps based on JSON results
  5. // @include http://web.archive.org/web/*
  6. // @include https://web.archive.org/web/*
  7. // @exclude /\*/
  8. // @exclude *.jpg
  9. // @exclude *.jpeg
  10. // @exclude *.png
  11. // @exclude *.gif
  12. // @exclude *.bmp
  13. // @version 1.4.0
  14. // @grant GM_xmlhttpRequest
  15.  
  16. // ==/UserScript==
  17.  
  // Every image element the document exposes through document.images.
  var pics = document.images;

  // Every element that carries a "background" attribute.
  var backgrounds = document.querySelectorAll("[background]");
  20.  
  /**
   * Builds the ordered list of candidate URLs to try for a broken image.
   *
   * Rules tagged "before" are placed ahead of the image's own URL, rules tagged
   * "after" behind it. A rule applies when its domain fragment occurs in the
   * image URL (or the domain is "*") and its optional condition is true. Rules
   * tagged "random" contribute a single randomly chosen replacement.
   *
   * @param {Object} pic - An image, or an element with a "background" attribute.
   * @returns {{replacements: string[], maxDimensions: ({width: number, height: number}|undefined)}}
   *   Candidate URLs in trial order, plus a size limit when a matching rule sets one.
   */
  function specialUses(pic)
  {
    var imgRef = pic.src || relativeToAbsolute(pic.background);

    // The rule table below is evaluated eagerly, so the parent's href has to be
    // read defensively: an 88x31 image that is not wrapped in a link (or has no
    // parent at all) used to throw here and abort the whole replacement.
    var parent = pic.parentNode;
    var parentHref = (parent && typeof parent.href === "string") ? parent.href : "";
    var isLinkButton = pic.width == 88 && pic.height == 31;

    // True when pic is an 88x31 button whose enclosing link mentions the given fragment.
    function buttonLinksTo(fragment)
    {
      return isLinkButton && parentHref.indexOf(fragment) > -1;
    }

    var specialCases = [
      {domain:"northarc.com/images/unsorted/",replacements:[imgRef.replace("thumb.","tn_"),imgRef.replace("thumb.","")],maxDimensions:{width:100,height:80},tags:"before"},
      {domain:"*",replacements:["data:image/gif;base64,R0lGODlhAQABAIAAAP///wAAACH5BAEAAAAALAAAAAABAAEAAAICRAEAOw=="],condition:imgRef.indexOf("spacer.gif") > -1 || imgRef.indexOf("blank.gif") > -1,tags:"after"},
      {domain:"tinypic.com/",replacements:[imgRef.replace("/i","/oi")],tags:"after"},
      {domain:"logitech.com",replacements:["http://www.logitech.com/logitech/new6-1.gif"],condition:imgRef.indexOf("home_header.gif") > -1,tags:"before"},
      {domain:"logitech.com",replacements:["http://www.logitech.com/logitech/new6-3.gif"],condition:imgRef.indexOf("home_footer.gif") > -1,tags:"before"},
      {domain:"logitech.com",replacements:["http://www.logitech.com/logitech/prod_row.gif"],condition:imgRef.indexOf("Images/main_navigator.gif") > -1,tags:"before"},
      {domain:"logitech.com",replacements:["http://www.logitech.com/logitech/al1.gif"],condition:imgRef.indexOf("Images/navigator.gif") > -1,tags:"before"},
      {domain:"logitech.com",replacements:["http://www.logitech.com/logitech/msensa.gif"],condition:imgRef.indexOf("Images/mmsensa.gif") > -1,tags:"before"},
      {domain:"*",replacements:["http://www.surpara.com/img/ban/sp.gif","http://www.surpara.com/img/ban/sp2.gif","http://www.surpara.com/img/ban/sp3.gif","http://www.surpara.com/img/ban/sp4.gif","http://www.surpara.com/img/ban/sp5.gif","http://www.surpara.com/img/ban/sp6.gif","http://www.surpara.com/img/ban/sp7.gif"],condition:buttonLinksTo("surpara"),tags:"random,after"},
      {domain:"*",replacements:["http://www.gameha.com/gameha_m.gif"],condition:buttonLinksTo("gameha.com"),tags:"after"},
      {domain:"*",replacements:["http://www.oekaki.net/img/bn2_1.gif","http://www.oekaki.net/img/bn2_2.gif","http://www.oekaki.net/img/bn2_3.gif","http://www.oekaki.net/img/bn2_4.gif","http://www.oekaki.net/img/bn2_5.gif","http://www.oekaki.net/img/bn2_6.gif"],condition:buttonLinksTo("oekaki.net"),tags:"random,after"},
      {domain:"*",replacements:["http://brandk.net/search/img2/s_bnr_11.jpg","http://brandk.net/search/img2/s_bnr_10.jpg","http://brandk.net/search/img2/s_bnr_08.jpg","http://brandk.net/search/img2/s_bnr_04.jpg","http://brandk.net/search/img2/s_bnr_01.jpg"],condition:buttonLinksTo("brandk.net"),tags:"random,after"},
      {domain:"*",replacements:["http://ragsearch.com/bana/banas.gif"],condition:buttonLinksTo("ragsearch.com"),tags:"after"},
      {domain:"*",replacements:["http://celest.pobox.ne.jp/links/imgs/bn88.gif"],condition:buttonLinksTo("celest.pobox.ne.jp"),tags:"after"},
      {domain:"*",replacements:["http://td9.sakura.ne.jp/links/banner_w+prinsess.gif"],condition:buttonLinksTo("http://blue.sakura.ne.jp/~real"),tags:"after"}
    ];

    var filteredCases = {replacements: []};
    var tagScan = ["before","between","after"];
    for(var t = 0; t < tagScan.length; t++)
    {
      // The "between" slot is the image's own URL, sandwiched between the two rule passes.
      if(tagScan[t] == "between")
      {
        filteredCases.replacements.push(imgRef);
        continue;
      }
      for(var c = 0; c < specialCases.length; c++)
      {
        var rule = specialCases[c];
        var domainMatches = rule.domain == "*" || imgRef.indexOf(rule.domain) > -1;
        var conditionHolds = rule.condition !== undefined ? rule.condition : true;
        if(!domainMatches || !conditionHolds || rule.tags.indexOf(tagScan[t]) == -1) continue;

        if(rule.tags.indexOf("random") > -1)
        {
          // Only one of the interchangeable banners is tried.
          filteredCases.replacements.push(rule.replacements[Math.floor(Math.random() * rule.replacements.length)]);
        }
        else filteredCases.replacements = filteredCases.replacements.concat(rule.replacements);

        if(rule.maxDimensions) filteredCases.maxDimensions = rule.maxDimensions;
      }
    }
    return filteredCases;
  }
  61.  
  // Digits (up to 14) that follow "web/" in the current page address; used as the
  // timestamp for availability lookups and rebuilt archive URLs.
  // Throws when the address carries no such digits.
  var timestamp = window.location.href.match(/web\/(\d{1,14})/)[1];
  63.  
  /**
   * Tries to swap a broken image (or background) for an archived copy that works.
   *
   * Candidate URLs come from altURLs when given, otherwise from specialUses(),
   * otherwise from the element's own URL. Each http candidate is looked up through
   * the Wayback availability API; the first candidate that resolves to a non-HTML
   * snapshot replaces the element's source. When nothing works, an empty-alt,
   * zero-width image inside a link is given a 25x25 box so the link stays clickable.
   *
   * @param {Object} target - The image, or element with a "background" attribute, to repair.
   * @param {string[]} [altURLs] - Candidate URLs that take priority over the built-in guesses.
   */
  function replaceImage(target, altURLs)
  {
    // Throttled (503) lookups are retried a bounded number of times with a growing
    // delay instead of being re-issued immediately and forever.
    var MAX_RETRIES = 5;
    var RETRY_DELAY_MS = 500;

    var possibleUses = specialUses(target);
    var URLGuesses = [];
    if(altURLs && altURLs.length > 0) URLGuesses = altURLs;
    else if(possibleUses.replacements.length > 0) URLGuesses = possibleUses.replacements;
    else URLGuesses = [target.src || relativeToAbsolute(target.background)];

    // Candidates that are neither http nor data URLs are skipped. push() keeps the
    // list dense; a sparse list would make Promise.all yield undefined entries that
    // then get mistaken for usable URLs.
    var testSet = [];
    for(var p = 0; p < URLGuesses.length; p++)
    {
      var guess = URLGuesses[p];
      if(typeof guess !== "string") continue;
      if(guess.indexOf("http") > -1) testSet.push(APITest(guess, 0));
      else if(guess.indexOf("data:") > -1)
      {
        // A data URI always "works", so nothing after it needs testing.
        testSet.push(Promise.resolve(guess));
        break;
      }
    }

    Promise.all(testSet).then(function(value) {
      for(var v = 0; v < value.length; v++)
      {
        if(value[v] === null || value[v] === undefined) continue;

        if(possibleUses.maxDimensions) switchWithResize(value[v], target, possibleUses.maxDimensions.width, possibleUses.maxDimensions.height);
        else changeImage(value[v], target);

        //There might have been an image map that had to be "patched" by one of my other scripts. The patch isn't needed anymore, so this will remove it
        var mapName = target.getAttribute("usemap");
        if(mapName)
        {
          var SVGPatch = document.body.querySelector("svg[class ~= " + mapName.substring(1) + "]");
          if(SVGPatch) SVGPatch.parentNode.removeChild(SVGPatch);
        }
        return;
      }
      //Try and "expose" image links that are unclickable due to the image not loading
      if(target.alt === "" && target.width === 0 && target.parentNode.nodeName === "A" && target.src)
      {
        target.width = 25;
        target.height = 25;
        //"Changing" the source is pretty hacky, but it's the only way I can think of to turn "invisible" image links into something clickable
        target.src = target.src;
      }
    });

    // True when the response headers announce an HTML document. Header names are
    // compared case-insensitively because their casing is not guaranteed.
    function isHTMLResponse(response)
    {
      return String(response.responseHeaders || "").toLowerCase().indexOf("content-type: text/html") > -1;
    }

    /**
     * Resolves to the closest archived snapshot URL for a candidate, or to null
     * when there is no snapshot, the snapshot is an HTML page, or a request fails.
     *
     * @param {string} replacement - Candidate URL; everything from its last "http" on is looked up.
     * @param {number} [attempt] - How many retries have already been made.
     * @returns {Promise<(string|null)>}
     */
    function APITest(replacement, attempt)
    {
      attempt = attempt || 0;
      return new Promise(function(resolve, reject) {
        var originalURL = replacement.substring(replacement.lastIndexOf("http"));
        GM_xmlhttpRequest({
          // The looked-up URL is encoded so its own "?" and "&" cannot corrupt the query.
          url: "http://archive.org/wayback/available?url=" + encodeURIComponent(originalURL) + "&timestamp=" + timestamp,
          method: "GET",
          headers: {"Accept": "application/json"},
          onload: function(response) {
            if(response.status == 503)
            {
              reject(response.statusText + " for " + originalURL);
              return;
            }
            var snapshot;
            try
            {
              snapshot = JSON.parse(response.responseText).archived_snapshots.closest;
            }
            catch(e)
            {
              // An unparsable or unexpected body means there is no usable answer.
              resolve(null);
              return;
            }
            if(!snapshot || !snapshot.url)
            {
              resolve(null);
              return;
            }
            //Evidently an additional layer of examination is needed to make absolutely sure we have an actual image
            GM_xmlhttpRequest({
              url: snapshot.url,
              method: "HEAD",
              onload: function(secondResp) {
                // The snapshot URL is taken from the captured variable rather than
                // from "this", which depends on how the callback is invoked.
                resolve(isHTMLResponse(secondResp) ? null : snapshot.url);
              },
              onerror: function() { resolve(null); },
              ontimeout: function() { resolve(null); }
            });
          },
          // Without these handlers a failed request would leave the promise pending forever.
          onerror: function() { resolve(null); },
          ontimeout: function() { resolve(null); }
        });
      }).catch(function() {
        if(attempt >= MAX_RETRIES) return null;
        return new Promise(function(retry) {
          setTimeout(retry, RETRY_DELAY_MS * (attempt + 1));
        }).then(function() {
          return APITest(replacement, attempt + 1);
        });
      });
    }

    /**
     * Swaps in the new URL and, once it has loaded, scales the image to the given
     * box while keeping its aspect ratio.
     */
    function switchWithResize(url, target, width, height)
    {
      var oldDimensions = {width:width, height: height};
      target.onload = function() {
        // Without natural dimensions the arithmetic below would produce NaN sizes.
        if(!target.naturalWidth || !target.naturalHeight) return;
        var aspectRatio = target.naturalWidth / target.naturalHeight;
        if(target.naturalWidth >= target.naturalHeight)
        {
          target.width = oldDimensions.width;
          target.height = oldDimensions.width / aspectRatio;
        }
        else
        {
          target.height = oldDimensions.height;
          target.width = oldDimensions.height * aspectRatio;
        }
      };
      changeImage(url, target);
    }

    // Writes the URL to whichever of src / background the element currently uses.
    function changeImage(url, target)
    {
      if(target.src) target.src = url;
      else if(target.background) target.background = url;
    }
  }
  158.  
  /**
   * Turns a possibly relative URL into the form an image element reports for it:
   * the value is written to the src of a fresh Image and read straight back.
   *
   * @param {string} bgURL - URL as written in a "background" attribute.
   * @returns {string} The src value the Image reports after the assignment.
   */
  function relativeToAbsolute(bgURL)
  {
    return Object.assign(new Image(), {src: bgURL}).src;
  }
  165.  
  /**
   * Checks whether an image (or background) actually loads as an image and hands
   * it to replaceImage() when the request comes back as an HTML page instead.
   *
   * @param {Object} pic - An image, or an element with a "background" attribute.
   */
  function evaluateImage(pic)
  {
    // Elements collected through their "background" attribute have no src, so the
    // URL is resolved from the attribute, the same way replaceImage() does it.
    var picURL = pic.src || (pic.background ? relativeToAbsolute(pic.background) : "");
    if(!picURL) return;

    // True when the response headers announce an HTML document. Header names are
    // compared case-insensitively because their casing is not guaranteed.
    function isHTMLResponse(response)
    {
      return String(response.responseHeaders || "").toLowerCase().indexOf("content-type: text/html") > -1;
    }

    GM_xmlhttpRequest({
      url: picURL,
      method: "GET",
      onload: function(response) {
        //Going off of response code is unreliable. Sometimes an image will return a status code of 200 even though it would redirect to an error page should you view the image directly, so we're looking at content type instead
        if(!isHTMLResponse(response)) return;

        //This might be a case where if you were visit the image directly, you would be redirected elsewhere. This attempts to catch that and replace the pic's src with where it would take you.
        var doc = document.implementation.createHTMLDocument("Possible Replacement");
        doc.documentElement.innerHTML = response.responseText;
        var notice = doc.getElementsByClassName("impatient")[0];
        // The notice's first child is expected to be the redirect link; if it is
        // missing or has no href, fall through to the ordinary replacement path.
        var redirectURL = notice && notice.firstChild && notice.firstChild.href;
        if(redirectURL)
        {
          GM_xmlhttpRequest({
            url: redirectURL,
            method: "HEAD",
            onload: function(redirectResponse) {
              // Same content-type test as above: only a non-HTML target is a usable image.
              if(isHTMLResponse(redirectResponse)) replaceImage(pic);
              else replaceImage(pic,[redirectURL]);
            }
          });
        }
        else if(response.status != 403)
        {
          replaceImage(pic);
        }
      }
    });
  }
  204.  
  // Check every image on the page.
  for(var i = 0; i < pics.length; i++)
  {
    //Skip over stuff related to the Wayback Machine toolbar and data URIs
    if((document.getElementById("wm-ipp") && document.getElementById("wm-ipp").contains(pics[i])) || pics[i].src.indexOf("data:") > -1) continue;
    // Repair sources whose scheme lost its leading "h" ("ttp://...") by pointing them
    // at the archive. The rebuilt URL starts with "//" so it names the archive host;
    // without a scheme or leading slashes the browser would treat it as a path
    // relative to the current page.
    if(pics[i].src.indexOf("ttp://") === 0) pics[i].src = "//web.archive.org/web/" + timestamp + "/h" + pics[i].src;
    evaluateImage(pics[i]);
  }

  // Then every element that carries a "background" attribute.
  for(var b = 0; b < backgrounds.length; b++)
  {
    evaluateImage(backgrounds[b]);
  }

QingJ © 2025

镜像随时可能失效,请加Q群300939539或关注我们的公众号极客氢云获取最新地址