Wikipedia Table to CSV

Extract tables from Wikipedia and save as CSV

You will need to install an extension such as Tampermonkey, Greasemonkey or Violentmonkey to install this script.

You will need to install an extension such as Tampermonkey to install this script.

You will need to install an extension such as Tampermonkey or Violentmonkey to install this script.

You will need to install an extension such as Tampermonkey or Userscripts to install this script.

You will need to install an extension such as Tampermonkey to install this script.

You will need to install a user script manager extension to install this script.

(I already have a user script manager, let me install it!)

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

(I already have a user style manager, let me install it!)

// ==UserScript==
// @name         Wikipedia Table to CSV
// @namespace    http://tampermonkey.net/
// @version      0.1
// @description  Extract tables from Wikipedia and save as CSV
// @author       Yofardev
// @match        *://*.wikipedia.org/wiki/*
// @license MIT
// @grant        none
// ==/UserScript==

(function () {
    'use strict';

    // Function to download data to a file
    function download(data, filename, type) {
        var file = new Blob([data], { type: type });
        if (window.navigator.msSaveOrOpenBlob) // IE10+
            window.navigator.msSaveOrOpenBlob(file, filename);
        else { // Others
            var a = document.createElement("a"),
                url = URL.createObjectURL(file);
            a.href = url;
            a.download = filename;
            document.body.appendChild(a);
            a.click();
            setTimeout(function () {
                document.body.removeChild(a);
                window.URL.revokeObjectURL(url);
            }, 0);
        }
    }

    // Get all tables
    let tables = document.getElementsByTagName('table');

    // Get the current Wikipedia page title
    let pageTitle = document.getElementById('firstHeading').innerText.replace(/ /g, '_');

    // Iterate over tables
    for (let table of tables) {
        // Create download button
        let button = document.createElement('button');
        button.innerText = 'Download as CSV';
        button.onclick = function () {
            let csv = '';

            // Get the table title
            let tableTitle = 'table';
            let prevNode = table.previousElementSibling;
            while (prevNode) {
                if (prevNode.nodeName.toLowerCase() === 'h3') {
                    tableTitle = prevNode.querySelector('.mw-headline').innerText.replace(/ /g, '_');
                    break;
                }
                prevNode = prevNode.previousElementSibling;
            }

            // Iterate over rows
            for (let row of table.rows) {
                let cells = Array.from(row.cells);
                csv += cells.map(cell => {
                    // Check if cell contains an image
                    let img = cell.querySelector('img');
                    if (img) {
                        // If so, return the image URL
                        return '"' + img.src.replace(/"/g, '""') + '"';
                    } else {
                        // Otherwise, return the cell text
                        return '"' + cell.innerText.replace(/"/g, '""') + '"';
                    }
                }).join(',') + '\n';
            }

            // Download the data
            download(csv, tableTitle + ' - ' + pageTitle + '.csv', 'text/csv');
        };

        // Add download button to the page
        table.parentNode.insertBefore(button, table);
    }
})();