// JakubMarcinkowski / Table copier (to clipboard)

// ==UserScript==
// @name         Table copier (to clipboard)
// @version      0.3.2
// @description  Choose from your userscripts addon menu. All tables are highlighted, click one to copy, elsewhere to cancel. Copy table and paste into spreadsheets like Excel, Google Sheets, LibreOffice Calc, OpenOffice Calc and others.
// @author       Jakub Marcinkowski <kuba.marcinkowski on g mail>
// @copyright    2024+, Jakub Marcinkowski <kuba.marcinkowski on g mail>
// @license      Zlib
// @namespace    Jakub Marcinkowski
// @homepageURL  https://gist.github.com/JakubMarcinkowski
// @homepageURL  https://github.com/JakubMarcinkowski
// @updateURL    https://openuserjs.org/meta/JakubMarcinkowski/Table_copier_(to_clipboard).meta.js
// @downloadURL  https://openuserjs.org/install/JakubMarcinkowski/Table_copier_(to_clipboard).user.js
// @icon         data:image/svg+xml;base64,PHN2ZyB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHZpZXdCb3g9IjAgMCAxNiAxNiIgY2xpcC1wYXRoPSJjaXJjbGUoKSI+PHJlY3QgZmlsbD0iIzZkOSIgd2lkdGg9IjE2IiBoZWlnaHQ9IjE2Ii8+PHBhdGggZD0iTTQsMFYxNk0xMCwwVjE2TTAsMkgxNk0wLDZIMTZNMCwxMEgxNk0wLDE0SDE2IiBzdHJva2U9IiM0NDUiLz48L3N2Zz4
// @match        *://*/*
// @noframes
// @grant        GM.registerMenuCommand
// @grant        GM.setClipboard
// ==/UserScript==

(function() {
  'use strict';

  // Do nothing at all when the GM object does not offer setClipboard:
  // every feature of this script ends in a GM.setClipboard call.
  if (!('setClipboard' in GM)) return;

  // Cleaning level chosen by the most recently used menu command:
  //   0 = full HTML, 1 = cleaned HTML,
  //   2 = cleaned, links replaced by their hrefs,
  //   3 = cleanest, links replaced by their hrefs.
  let cleaning = 1;
  // Tables collected by the current run().
  let tables = [];
  // Maps each highlighted table to the inline `border` value it had before highlighting.
  let tablesBorders = new Map();

  /**
   * Entry point of every menu command.
   *
   * - No table on the page: does nothing.
   * - Exactly one table: copies it immediately, scrolls it into view and
   *   flashes the highlight border for one second.
   * - Several tables: highlights all of them and waits for a click or
   *   context-menu click on one of them (takeElem); a click anywhere else
   *   cancels (stopAll).
   */
  function run() {
    // A previous selection may still be pending (menu command chosen again
    // without clicking). Cancel it first: otherwise borderHighlight would
    // record the green highlight as the "original" border and the table
    // could never be restored.
    end();

    tables = [...document.getElementsByTagName('table')];

    // Nothing to copy. Installing the document click handler here would only
    // swallow the user's next click on the page.
    if (tables.length === 0) return;

    if (tables.length === 1) {
      const [table] = tables;
      copyTable(table);
      table.scrollIntoView({behavior: "smooth", block: "nearest", inline: "nearest"});
      borderHighlight(table);
      setTimeout(borderNormal, 1000, table);
      return;
    }

    tables.forEach(elem => {
      borderHighlight(elem);
      // Capture phase, so the choice is made before handlers inside the table run.
      elem.addEventListener('click', takeElem, {capture: true});
      elem.addEventListener('contextmenu', takeElem, {capture: true});
    });
    document.addEventListener('click', stopAll);
  }

  /**
   * Leaves selection mode: restores the border of every collected table,
   * detaches the listeners installed by run() and resets the shared state.
   */
  function end() {
    const captureOption = {capture: true};
    for (const table of tables) {
      borderNormal(table);
      for (const eventType of ['click', 'contextmenu']) {
        table.removeEventListener(eventType, takeElem, captureOption);
      }
    }
    document.removeEventListener('click', stopAll);

    // Start the next run() from a clean slate.
    tables = [];
    tablesBorders = new Map();
  }

  /**
   * Event handler that cancels selection mode.
   * The triggering event is neutralised (no default action, no further
   * propagation) before the highlight and listeners are torn down.
   *
   * @param {Event} e - the click / contextmenu event being handled
   */
  function stopAll(e) {
    // Suppress the event itself first ...
    e.preventDefault();
    e.stopPropagation();

    // ... then leave selection mode.
    end();
  }

  /**
   * Event handler for a click / context-menu click on a highlighted table:
   * ends selection mode, then copies the table the event target belongs to
   * (the target itself when it is a table, otherwise its closest table ancestor).
   *
   * @param {Event} e - the click / contextmenu event being handled
   */
  function takeElem(e) {
    stopAll(e);

    const {target} = e;
    let chosen = target;
    if (target.tagName !== 'TABLE') {
      chosen = target.closest('table');
    }
    if (!chosen) return;

    copyTable(chosen);
  }

  /**
   * Marks an element with the selection border, remembering the inline
   * `border` value it had so that borderNormal can put it back.
   *
   * @param {HTMLElement} elem - element to highlight
   */
  function borderHighlight(elem) {
    const {style} = elem;
    tablesBorders.set(elem, style.border);
    style.border = '2px dashed green';
  }

  /**
   * Puts back the inline `border` value that borderHighlight recorded for
   * the element.
   *
   * @param {HTMLElement} elem - element whose highlight is removed
   */
  function borderNormal(elem) {
    const previousBorder = tablesBorders.get(elem);
    elem.style.border = previousBorder;
  }

  /**
   * Builds the copy of a table that is put on the clipboard. The table on the
   * page is never modified; all work happens on a deep clone.
   *
   * What is done depends on the current cleaning level:
   *   0 - link hrefs are made absolute, nothing else is touched;
   *   1 - as 0, plus br/wbr/hr/img/style are removed and block-like elements
   *       are turned into spans;
   *   2 - as 1, but links are replaced by their href text instead;
   *   3 - as 2, but every element that is not a span or a table part is
   *       turned into a span.
   *
   * @param {HTMLTableElement} table - table to copy
   * @returns {HTMLTableElement} the processed clone
   */
  function processTable(table) {
    const clone = table.cloneNode(true);

    // Wikipedia thing: links to the current page are rendered as
    // <a class="selflink"> without href. Give them the canonical URL, which is
    // looked up once and only when such links exist.
    const selfLinks = clone.querySelectorAll('a.selflink:not([href])');
    if (selfLinks.length > 0) {
      const canonical = document.querySelector('link[rel="canonical"]');
      if (canonical) selfLinks.forEach(link => setHref(link, canonical.href));
    }

    if (cleaning === 0 || cleaning === 1) {
      // Make hrefs absolute. Only anchors that really have an href are
      // touched: an anchor without one would otherwise gain href="" and
      // turn into a link.
      clone.querySelectorAll('a[href]').forEach(link => setHref(link, link.href));
    }
    if (cleaning === 0) return clone;

    // When pasting these tags (except style), Excel makes additional rows.
    clone.querySelectorAll('br, wbr, hr, img, style').forEach(elem => elem.remove());

    if (cleaning >= 2) {
      // Anchors without href are left alone; converting them would replace
      // their text with an empty string.
      clone.querySelectorAll('a[href]').forEach(linkToText);
    }

    if (cleaning === 3) {
      clone
          .querySelectorAll('*:not(span, tbody, thead, tfoot, tr, th, td, caption, colgroup, col, table)')
          .forEach(elemToSpan);
    } else {
      // When pasting these tags, Excel makes additional rows.
      clone.querySelectorAll('p, div, h1, h2, h3, h4, h5, h6, ul, li, ol, dl, dt, dd')
          .forEach(elemToSpan);
    }
    return clone;
  }

  /**
   * Swaps an element for a <span> that takes over its child nodes.
   * The element's attributes are carried over as well, except at cleaning
   * level 3, where the span stays bare.
   *
   * @param {Element} elem - element to replace
   */
  function elemToSpan(elem) {
    const replacement = document.createElement('span');
    const keepAttributes = cleaning !== 3;

    replacement.replaceChildren(...elem.childNodes);
    if (keepAttributes) {
      elem.getAttributeNames().forEach(name => {
        replacement.setAttribute(name, elem.getAttribute(name));
      });
    }
    elem.replaceWith(replacement);
  }

  /**
   * Replaces a link with a <span> whose text is the link's href, followed by
   * a single space that keeps neighbouring hrefs/texts apart.
   *
   * @param {HTMLAnchorElement} link - link to replace
   */
  function linkToText(link) {
    const hrefText = document.createElement('span');
    hrefText.textContent = link.href;
    // Insert the span and its trailing separator in one step.
    link.replaceWith(hrefText, ' ');
  }

  /**
   * Writes the given value into the element's `href` attribute.
   *
   * @param {Element} link - element to update
   * @param {string} href - new attribute value
   */
  function setHref(link, href) {
    const attributeName = 'href';
    link.setAttribute(attributeName, href);
  }

  /**
   * Processes a table (see processTable) and puts its HTML on the clipboard.
   *
   * The second argument given to GM.setClipboard depends on the script
   * manager reported by GM.info.scriptHandler: 'html' for Tampermonkey,
   * 'text/html' for Violentmonkey and Userscripts. For Greasemonkey and any
   * other manager only the HTML string is passed.
   *
   * @param {HTMLTableElement} table - table to copy
   */
  function copyTable(table) {
    const processedTable = processTable(table);

    const typeByHandler = new Map([
      ['Tampermonkey', 'html'],
      ['Violentmonkey', 'text/html'],
      ['Userscripts', 'text/html'],
    ]);
    const type = typeByHandler.get(GM.info.scriptHandler);

    const clipboardArgs = [processedTable.outerHTML];
    if (type) clipboardArgs.push(type);
    GM.setClipboard(...clipboardArgs);
  }

  // One menu command per cleaning level; a caption's position in this list
  // is the level (0-3) that the command selects before starting run().
  const menuCaptions = [
    'Copy table (full HTML)',
    'Copy table (cleaned HTML)',
    'Copy table (cleaned, links as hrefs)',
    'Copy table (cleanest, links as hrefs)',
  ];
  menuCaptions.forEach((caption, level) => {
    GM.registerMenuCommand(caption, () => {
      cleaning = level;
      run();
    });
  });
})();