Wayback Machine Small Bug Fixes

Fixes encoded ampersands on the Wayback Machine's captures graph, problems that arise when trailing slashes are missing in a URL, and other small issues universally present in all crawled sites.

Verze ze dne 21. 01. 2016. Zobrazit nejnovější verzi.

K instalaci tohoto skriptu si budete muset nainstalovat rozšíření jako Tampermonkey, Greasemonkey nebo Violentmonkey.

K instalaci tohoto skriptu si budete muset nainstalovat rozšíření jako Tampermonkey nebo Violentmonkey.

K instalaci tohoto skriptu si budete muset nainstalovat rozšíření jako Tampermonkey nebo Violentmonkey.

K instalaci tohoto skriptu si budete muset nainstalovat rozšíření jako Tampermonkey nebo Userscripts.

You will need to install an extension such as Tampermonkey to install this script.

K instalaci tohoto skriptu si budete muset nainstalovat manažer uživatelských skriptů.

(Už mám manažer uživatelských skriptů, nechte mě ho nainstalovat!)

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

(Už mám manažer uživatelských stylů, nechte mě ho nainstalovat!)

// ==UserScript==
// @name          Wayback Machine Small Bug Fixes
// @namespace     DoomTay
// @description   Fixes encoded ampersands on Wayback Machine's captures graph and problems that arise when trailing slashes are missing in an URL and other small issues universally present in all crawled sites
// @version       1.2.7
// @include       http://web.archive.org/web/*
// @include       http://wayback.archive.org/web/*
// @include       https://web.archive.org/web/*
// @include       https://wayback.archive.org/web/*
// @run-at        document-start
// @exclude       /\*/
// @grant         none

// ==/UserScript==

// Link behind the capture graph in the Wayback Machine toolbar; null when the element is not in the document yet.
var toolbarNav = document.getElementById("wm-graph-anchor");
// Address of the current page, read once and reused by the calculations below.
var pageURL = window.location.href;
// Everything after the final "/" of the address.
var lastFolder = pageURL.substring(pageURL.lastIndexOf("/") + 1);
var pics = document.images;
var backgrounds = document.querySelectorAll("[background]");
// Index just past the last "//" of the address (presumably where the archived site's host name starts).
var hostStart = pageURL.lastIndexOf("//") + 2;
// True when the last "." sits before the last "/" (or the text after the last "//" is the whole last segment) and that segment carries no "?".
var shouldHaveTrailingSlash = (pageURL.lastIndexOf(".") < pageURL.lastIndexOf("/") || pageURL.substring(hostStart) == lastFolder) && lastFolder.indexOf("?") == -1;
var hasTrailingSlash = pageURL.lastIndexOf("/") == pageURL.length - 1;
// Length of the host part: it ends at the first "/", "?" or "#" that follows hostStart.
var hostLength = pageURL.substring(hostStart).search(/[\/?#]/);
// Address up to the end of the host. When nothing follows the host the whole address is used:
// cutting at a "not found" index would leave an empty string, and fixURL would then build
// addresses that are missing the capture prefix.
var domain = hostLength === -1 ? pageURL : pageURL.substring(0, hostStart + hostLength);

/**
 * Turns every "&amp;" in the href of the capture graph link (toolbarNav) into a plain "&".
 * One occurrence is replaced per pass and the href is written back each time,
 * until no "&amp;" is left. Nothing is written when the href has none.
 */
function fixToolbar()
{
	var marker = "&amp;";
	for(var at = toolbarNav.href.indexOf(marker); at > -1; at = toolbarNav.href.indexOf(marker))
	{
		toolbarNav.href = toolbarNav.href.replace(marker,"&");
	}
}

//Decode "&amp;" in the capture graph link right away when that link was found at start-up
if(toolbarNav)
{
	fixToolbar();
}

//Give the page an explicit <base> when it has none, so relative addresses resolve as if the trailing slash were present
if(!document.getElementsByTagName("base")[0])
{
	var base = document.createElement("base");
	//Only an expected-but-missing trailing slash needs a corrected base; every other combination keeps the document's current base URI
	base.href = (shouldHaveTrailingSlash && !hasTrailingSlash) ? window.location.href + "/" : document.baseURI;
	//The script runs at document-start, when <head> may not exist yet; fall back to the root element.
	//If neither exists the <base> is skipped so the rest of the script can still run.
	var baseParent = document.head || document.documentElement;
	if(baseParent) baseParent.appendChild(base);
}
	

//Go through every image currently in the document and repair its address
var wmToolbar = document.getElementById("wm-ipp");
for(var i = 0; i < pics.length; i++)
{
	var pic = pics[i];
	//Leave Wayback Machine toolbar images and data URIs alone
	var inToolbar = wmToolbar && wmToolbar.contains(pic);
	if(inToolbar || pic.src.indexOf("data:") > -1) continue;
	//Re-assign the address so the image is refreshed in case the "base url" had to be modified
	pic.src = pic.src;
	//Some images point at Internet Archive's "main" servers instead of the crawled site; send those through fixURL
	var outsideCapture = pic.src.indexOf(document.domain + "/web") == -1;
	if(outsideCapture)
	{
		pic.src = fixURL(pic.src);
	}
}

//Repair the "background" attribute of every element that carries one.
//The toolbar lookup does not depend on the loop variable, so it is done once up front.
var bgToolbar = document.getElementById("wm-ipp");
for(var b = 0; b < backgrounds.length; b++)
{
	var bgNode = backgrounds[b];
	var bg = bgNode.background || bgNode.getAttribute("background");
	//Skip over stuff related to the Wayback Machine toolbar and data URIs
	if((bgToolbar && bgToolbar.contains(bgNode)) || bg.indexOf("data:") > -1) continue;
	//Refresh images in case the "base url" had to be modified.
	changeBackground(bgNode,bg);
	//Resolve the address a single time; every call to relativeToAbsolute creates a new Image
	var absoluteBG = relativeToAbsolute(bg);
	//For whatever reason, some images will point to within Internet Archive's "main" servers, instead of the crawled site. This attempts to fix that.
	if(absoluteBG.indexOf(document.domain + "/web") == -1)
	{
		changeBackground(bgNode,fixURL(absoluteBG));
	}
}

/**
 * Resolves an image address by assigning it to the src of a throwaway Image
 * and reading the src property back.
 * @param {string} bgURL Address to resolve; may be relative.
 * @returns {string} Whatever the Image reports as its src after the assignment.
 */
function relativeToAbsolute(bgURL)
{
	var resolver = new Image();
	resolver.src = bgURL;
	var resolved = resolver.src;
	return resolved;
}

/**
 * Rebuilds an address so that it starts with the capture prefix held in the global `domain`.
 *
 * When URL contains document.domain, only the part of URL starting at the first "/" after
 * its last "//" is kept and appended to `domain`.
 * Otherwise `domain` is cut just after the "/" that begins its first "/http", and URL is
 * appended from just after its own first "/http" (all of URL when it has none).
 * @param {string} URL Address to rebuild.
 * @returns {string} The rebuilt address.
 */
function fixURL(URL)
{
	var pointsAtArchive = URL.indexOf(document.domain) > -1;
	if(!pointsAtArchive)
	{
		var capturePrefix = domain.substring(0,domain.indexOf("/http") + 1);
		var originalStart = URL.indexOf("/http") + 1;
		return capturePrefix + URL.substring(originalStart);
	}
	var pathStart = URL.indexOf("/",URL.lastIndexOf("//") + 2);
	return domain + URL.substring(pathStart);
}

/**
 * Writes a new background address to a node through whichever channel currently holds one.
 * A truthy `background` property is overwritten; failing that, a truthy "background"
 * attribute is overwritten. A node with neither is left untouched.
 * @param {Element} node Element to update.
 * @param {string} newBackground Address to store.
 */
function changeBackground(node, newBackground)
{
	if(node.background)
	{
		node.background = newBackground;
		return;
	}
	var hasAttribute = node.getAttribute("background");
	if(hasAttribute)
	{
		node.setAttribute("background",newBackground);
	}
}

//Applies the toolbar and image fixes to whatever changes after the script has started
var observer = new MutationObserver(function(mutations) {
	for(var m = 0; m < mutations.length; m++)
	{
		var record = mutations[m];
		var changed = record.target;
		//Remember the capture graph link whenever a mutation targets it
		if(changed.id == "wm-graph-anchor") toolbarNav = changed;
		//An attribute change on that link may have brought "&amp;" back
		if(record.type == "attributes" && changed == toolbarNav) fixToolbar();
		//Only element nodes (nodeType 1) are checked
		if(changed.nodeType == 1) checkMutations(changed);
		var added = record.addedNodes;
		for(var i = 0; i < added.length; i++)
		{
			var fresh = added[i];
			if(fresh.nodeType == 1) checkMutations(fresh);
		}
	}
});

/**
 * Repairs one element reported by the MutationObserver.
 *
 * Elements inside the Wayback Machine toolbar ("wm-ipp") are ignored. For an IMG whose src
 * lies outside "<document.domain>/web", the src is replaced with fixURL(src). For an element
 * with a background (property or attribute), the value is resolved with relativeToAbsolute
 * and, when the resolved address lies outside "<document.domain>/web", replaced with the
 * fixURL result.
 *
 * Empty addresses and data URIs are left alone, matching the skip rule of the start-up loops:
 * fixURL would otherwise prepend the capture prefix to them.
 * @param {Element} node Element to inspect; callers pass only nodeType 1 nodes.
 */
function checkMutations(node)
{
	var wmToolbar = document.getElementById("wm-ipp");
	if(wmToolbar && wmToolbar.contains(node)) return;

	var archivePath = document.domain + "/web";

	if(node.nodeName == "IMG")
	{
		var src = node.src;
		if(src && src.indexOf("data:") == -1 && src.indexOf(archivePath) == -1)
		{
			node.src = fixURL(src);
		}
	}

	var bg = node.background || node.getAttribute("background");
	if(bg && bg.indexOf("data:") == -1)
	{
		//Test the resolved address, not the raw attribute: a relative value never contains
		//the archive host even when it already resolves inside the capture.
		var absoluteBG = relativeToAbsolute(bg);
		if(absoluteBG.indexOf(archivePath) == -1)
		{
			changeBackground(node,fixURL(absoluteBG));
		}
	}
}

//Watch attribute, child-list and character-data changes throughout the subtree
var config = {
	attributes: true,
	childList: true,
	characterData: true,
	subtree: true
};
//Start from document.body when it exists, otherwise from the document itself
observer.observe(document.body || document, config);