Link Untracker

Remove tracking elements from links

// ==UserScript==
// @name        Link Untracker
// @namespace   IzzySoft
// @description Remove tracking elements from links
// @license     CC BY-NC-SA
// @include     *
// @exclude     *phpmyadmin*
// @version     13
// @run-at      document-idle
// @grant       unsafeWindow
// @homepage    https://codeberg.org/izzy/userscripts
// ==/UserScript==

/* badp: we strip parameters starting with that. Some are taken from NetURL, see
   https://github.com/Smile4ever/firefoxaddons/tree/master/Neat%20URL-webext
   fb_: Facebook; ga_/_gl: Google; hmb_: HumbleBundle(?); utm_: Urchin Tracker; wt_: Webtrekk; WT.: Webtrends
*/
var badp = ['fb_','ga_','_ga','_gl','hmb_','utm_',
            'ei@google.','gws_rd@google.','sei@google.','ved@google.',
            'pd_rd_r@amazon.','pd_rd_w@amazon.','pd_rd_wg@amazon.','psc@amazon.','_encoding@amazon.',
            'wt_','WT.','yclid','referrer','clickfrom','pf_rd'
           ];
var anch = ''; /* variable to hold the "anchor part" of the URL, if any – i.e. "#anchor" */
var replace_semicolon = true; /* some sites use ";" to separate URL params;
                                 URLSearchParams can't deal with that and messes up.
                                 If those sites don't work with "&", either set this
                                 to "false" or add that site on the exclude list
                               */

function getRealLinkFromGoogleUrl(a) { /* adapted from https://github.com/Rob--W/dont-track-me-google at 2018-01-03 */
    if ((a.hostname === location.hostname || a.hostname === 'www.google.com') &&
        /^\/(local_)?url$/.test(a.pathname)) {
        // Google Maps / Dito (/local_url?q=<url>)
        // Mobile (/url?q=<url>)
        var url = /[?&](?:q|url)=((?:https?|ftp)[%:][^&]+)/.exec(a.search);
        if (url) {
            return decodeURIComponent(url[1]);
        }
        // Help pages, e.g. safe browsing (/url?...&q=%2Fsupport%2Fanswer...)
        url = /[?&](?:q|url)=((?:%2[Ff]|\/)[^&]+)/.exec(a.search);
        if (url) {
            return a.origin + decodeURIComponent(url[1]);
        }
    }
    return a.href;
}

class UrlParams { /* adapted from https://stackoverflow.com/a/45516670 as the built-in URLSearchParams messes up parameters without values */
  constructor(search) { /* extracts the query string by stripping the leading "?" and initializes properties */
    this.qs = (search || location.search).substr(1);
    this.params = {};
    this.parseQuerstring();
  }
  parseQuerstring() { /* walks the query string and extracts the parameters as key-value-pairs */
    this.qs.split('&').reduce((a, b) => {
      let [key, val] = b.split('=');
      a[key] = val;
      return a;
    }, this.params);
  }
  filterQuerystring(badparms) { /* eliminates all "bad parameters" (tracking parameters) from our key-value-pairs */
    var keysToDelete = [];
    for (var key of Object.keys(this.params)) {
      for (let p of badparms) {
        if (key.startsWith(p)) console.log('removing '+key+' from '+this.qs);
        if (key.startsWith(p)) { keysToDelete.push(key); break; }
      }
    }
    for(var key of keysToDelete) {
      delete this.params[key];
    }
  }
  getString() { /* concatenates all parameters and returns them as a single query string without the leading "?" */
    var str = '';
    for (var key of Object.keys(this.params)) {
      str = str + '&' + key;
      if (this.params[key] != undefined) str = str + '=' + this.params[key]; /* only add the "=value" part if the parameter has a value! */
    }
    return str.substring(1);
  }
}

// MetaGer.de uses different methods of obfuscation with tracking URLs. This is catching most of them (hopefully):
function metager1(elem) {
  if ( elem.hostname == 'api.smartredirect.de' ) {
    var purl = new UrlParams(elem.search);
    elem.href = decodeURIComponent(purl.params['url']);
  } else if ( elem.href.startsWith ('https://metager.de/partner/r')) {
    var purl = new UrlParams(elem.search);
    elem.href = decodeURIComponent(purl.params['link']);
  } else if ( elem.href.startsWith ('https://metager.de/r/metager')) {
    if (elem.text.trim().startsWith('http:') || elem.text.trim().startsWith('https:')) {
      elem.href = decodeURI(elem.text.trim());
    } else {
      elem.href = 'https://'+decodeURI(elem.text.trim());
    }
  }
}

function parseLinks(k) {
  for(var i = k; i < document.links.length; i++) { // for some reason stops at 100 loops
    if (i - k > 98) return i;
    var elem = document.links[i];
    if (window.location.hostname == 'metager.de' && elem.className.includes('result-link')) { metager1(elem); continue; }
    if (elem.search == '') continue;
    if (replace_semicolon) var purl = new UrlParams(elem.search.replace(new RegExp(';','g'),'&'));
    else var purl = new UrlParams(elem.search);
    purl.filterQuerystring(badp);
    if (elem.href.indexOf('#') > 0) anch = '#' + elem.href.split('#')[1];
    else anch = '';
    elem.href = elem.href.split('?')[0] + '?' + purl.getString() + anch;
    elem.href = getRealLinkFromGoogleUrl(elem);
  }
  return i;
}

console.log(document.links.length+' links to parse');
k = 0; while ( k < document.links.length) {
  console.log('parsing from '+k);
  k = parseLinks(k+1);
  console.log('returned '+k)
}
console.log('DONE');