浏览器插件:tampermonkey 油猴
JS脚本:nameldk 的《复制为Markdown格式》 0.3.1版本
基础上添加代码。
程序员做笔记最简洁的就是markdown了,html转存为markdown格式就好了,样式统一,编辑也方便。
上面的工具和脚本,转换代码块、图片、超链接文字都很好,支持标签区块识别(像是印象笔记或有道云笔记的网页剪辑那种),随选随转,十分方便。
唯一的缺点就是不支持table标签。
在原有脚本基础上修改,使其支持table标签转换。测试了几个想保存的页面,没什么问题。至于其他网页碰到再说,暂不确定兼容情况。
删掉顶部的// @require那句,将其引用的turndown.js内容完整复制,粘贴到在JS脚本头部,然后在其中添加table转换的部分。
-
- // // ==============================================================================
- // // 在turndown中添加的转换table部分(author:watfe)
- // // ==============================================================================
-
-
- rules.td = {
- filter: ['td'],
- replacement: function (content, node, options) {
- content = content.trim();
- content = content.replace(/\|/g,'/');
- content = content.replace(/\n+/g,' <br> ');
- content = '|'+content
- // console.log('td:'+content);
- return content
- }
- };
-
- rules.th = {
- filter: ['th'],
- replacement: function (content, node, options) {
- content = content.trim();
- content = content.replace(/\|/g,'/');
- content = content.replace(/\n+/g,' <br> ');
- content = '|#$&%th$#%&'+content
- if (node.getAttribute('colspan')!=null){ //如果表头存在合并单元格,对其进行处理
- content = content+repeatStringNumTimes('|', node.getAttribute('colspan'));
- }
- // console.log('th:'+content);
- return content
- }
- };
-
- rules.tr = {
- filter: ['tr'],
- replacement: function (content, node, options) {
- content = '|\n'+content.trim();
- // console.log('tr:'+content);
- return content
- }
- };
-
- function repeatStringNumTimes(str, num) { //字符串重复N次
- let repeatStr = '';
- for(let i = 0; i < num; i++){
- repeatStr += str;
- }
- return repeatStr;
- }
-
- rules.table = {
- filter: ['table'],
- replacement: function (content, node, options) {
- // 删首尾空,删除最前面多余的|,并在最后补全|
- //console.log('table1:'+content);
- content = content.trim();
- content = content.replace(/\n+/g, '\n');
- content = content.replace(/\n\|\n/g, '|\n');
- if (content.indexOf('|\n')===0){
- content = content.substring(1, content.length)+'|';
- }
- content = content.trim();
- // 如果表最前端包含<caption>表名标签的,通过下面代码优化让<caption>变成独立一行
- //console.log('table2:'+content);
- var captionLine = '';
- if (content.slice(0,1)!='|' && (content.slice(-1)!='|')){
- captionLine = content.slice(0,content.indexOf('|\n'));//captionn那行
- content = content.slice(content.indexOf('|\n')+2);
- content = content+'|'
- }
- // 检查表格包含几个|,数字减1就是列数,模拟出markdown表格中间的---:
- var verticalLineCount = 0;
- var strs = new Array();
- var thExist = false;
- strs = content.split('\n');
- for (let i=0; i<strs.length; i++ ){ // 计算最多列数
- if(strs[i].indexOf('|')>=0){
- let tempnum = strs[i].match(/\|/ig).length;
- if (tempnum>verticalLineCount){
- verticalLineCount = tempnum;
- }
- }
- }
- var buildTh = repeatStringNumTimes('| ',verticalLineCount).trim(); // 构造没有表头时候,markdown需要的表头 比如:| | | |
- var tableMDLine = '|'+repeatStringNumTimes('---|',verticalLineCount-1); // 构造markdown表中间的横线 比如:|---|---|---|
- // 检查是否包含表头
- //console.log('table3:'+content);
- if (content.indexOf('|#$&%th$#%&')>=0){
- content = content.replace(/\|#\$&%th\$#%&/g, '|');
- content = content.replace('\n','\n'+tableMDLine+'\n');
- }
- else{
- content = buildTh+'\n'+tableMDLine+'\n'+ content;
- }
- content = '\n'+captionLine+'\n\n'+content+'\n\n';
- //console.log('table4:'+content);
- return content
- }
- };
-
- // // ==============================================================================
- // // 添加完毕
- // // ==============================================================================
-
-
比如:h1用#而不是下划线,代码块用```等等。
在JS脚本建立TurndownService实例前,加入这些配置。
- // ==============================================================================
- // 根据turndown文档,调整一些参数,让转化出来的markdown格式,满足自己的需要
- // https://github.com/domchristie/turndown
- // ==============================================================================
- let options = {
- headingStyle: 'atx',
- bulletListMarker: '+',
- codeBlockStyle: 'fenced',
- emDelimiter: '*'
- };
- // ==============================================================================
- // 添加完毕
- // ==============================================================================
- let turndownService = new TurndownService(options);
-
.replace(/(<a.+?href=")(.*?")(.*?<\/a>)/gi, parseHref);修改为.replace(/(<a.+?href=")(.*?)(".*?<\/a>)/gi, parseHref);
原本的代码,因为这个错误会导致herf链接包含#号时出错
转换成功
使用方法:
tampermonkey中选"添加新脚本", 清空默认内容, 复制代码粘贴到文本框中, 然后点"文件", 点"保存"即可
- // ==UserScript==
- // @name Markdown
- // @name 网页转换为Markdown格式
- // @version 0.0.1
- // @description 复制网页内容为Markdown格式。点击右上角copy按钮开始选择内容,点击鼠标或按Enter进行复制。按Esc取消选择,上箭头选择父级,下箭头选择子级,左箭头选择前面的相邻元素,右箭头选择后面的相邻元素。按钮可以拖动。Ctrl+c+c激活。
- // @author nameldk
- // @author watfe基于nameldk的"复制为Markdown格式.js"和"https://unpkg.com/turndown/dist/turndown.js"的基础上修改
- // @match https://*/*
- // @match http://*/*
- // @match file:///*
- // @grant none
- // ==/UserScript==
-
-
- // ==============================================================
- // 直接导入turndown@6.0.0
- // https://unpkg.com/turndown/dist/turndown.js
- var TurndownService = (function () {
- 'use strict';
-
- function extend (destination) {
- for (var i = 1; i < arguments.length; i++) {
- var source = arguments[i];
- for (var key in source) {
- if (source.hasOwnProperty(key)) destination[key] = source[key];
- }
- }
- return destination
- }
-
- function repeat (character, count) {
- return Array(count + 1).join(character)
- }
-
- var blockElements = [
- 'address', 'article', 'aside', 'audio', 'blockquote', 'body', 'canvas',
- 'center', 'dd', 'dir', 'div', 'dl', 'dt', 'fieldset', 'figcaption',
- 'figure', 'footer', 'form', 'frameset', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6',
- 'header', 'hgroup', 'hr', 'html', 'isindex', 'li', 'main', 'menu', 'nav',
- 'noframes', 'noscript', 'ol', 'output', 'p', 'pre', 'section', 'table',
- 'tbody', 'td', 'tfoot', 'th', 'thead', 'tr',
- 'ul'
- ];
-
- function isBlock (node) {
- return blockElements.indexOf(node.nodeName.toLowerCase()) !== -1
- }
-
- var voidElements = [
- 'area', 'base', 'br', 'col', 'command', 'embed', 'hr', 'img', 'input',
- 'keygen', 'link', 'meta', 'param', 'source', 'track', 'wbr'
- ];
-
- function isVoid (node) {
- return voidElements.indexOf(node.nodeName.toLowerCase()) !== -1
- }
-
- var voidSelector = voidElements.join();
- function hasVoid (node) {
- return node.querySelector && node.querySelector(voidSelector)
- }
-
- var rules = {};
-
- rules.paragraph = {
- filter: 'p',
-
- replacement: function (content) {
- return '\n\n' + content + '\n\n'
- }
- };
-
- rules.lineBreak = {
- filter: 'br',
-
- replacement: function (content, node, options) {
- return options.br + '\n'
- }
- };
-
- rules.heading = {
- filter: ['h1', 'h2', 'h3', 'h4', 'h5', 'h6'],
-
- replacement: function (content, node, options) {
- var hLevel = Number(node.nodeName.charAt(1));
-
- if (options.headingStyle === 'setext' && hLevel < 3) {
- var underline = repeat((hLevel === 1 ? '=' : '-'), content.length);
- return (
- '\n\n' + content + '\n' + underline + '\n\n'
- )
- } else {
- return '\n\n' + repeat('#', hLevel) + ' ' + content + '\n\n'
- }
- }
- };
-
- // // ==============================================================================
- // // 转换table(自己写的,可能不太完善)
- // // ==============================================================================
-
- rules.td = {
- filter: ['td'],
- replacement: function (content, node, options) {
- content = content.trim();
- content = content.replace(/\|/g,'/');
- content = content.replace(/\n+/g,' <br> ');
- content = '|'+content
- // console.log('td:'+content);
- return content
- }
- };
-
- rules.th = {
- filter: ['th'],
- replacement: function (content, node, options) {
- content = content.trim();
- content = content.replace(/\|/g,'/');
- content = content.replace(/\n+/g,' <br> ');
- content = '|#$&%th$#%&'+content
- if (node.getAttribute('colspan')!=null){ //如果表头存在合并单元格,对其进行处理
- content = content+repeatStringNumTimes('|', node.getAttribute('colspan'));
- }
- // console.log('th:'+content);
- return content
- }
- };
-
- rules.tr = {
- filter: ['tr'],
- replacement: function (content, node, options) {
- content = '|\n'+content.trim();
- // console.log('tr:'+content);
- return content
- }
- };
-
- function repeatStringNumTimes(str, num) { //字符串重复N次
- let repeatStr = '';
- for(let i = 0; i < num; i++){
- repeatStr += str;
- }
- return repeatStr;
- }
-
- rules.table = {
- filter: ['table'],
- replacement: function (content, node, options) {
- // 删首尾空,删除最前面多余的|,并在最后补全|
- //console.log('table1:'+content);
- content = content.trim();
- content = content.replace(/\n+/g, '\n');
- content = content.replace(/\n\|\n/g, '|\n');
- if (content.indexOf('|\n')===0){
- content = content.substring(1, content.length)+'|';
- }
- content = content.trim();
- // 如果表最前端包含<caption>表名标签的,通过下面代码优化让<caption>变成独立一行
- //console.log('table2:'+content);
- var captionLine = '';
- if (content.slice(0,1)!='|' && (content.slice(-1)!='|')){
- captionLine = content.slice(0,content.indexOf('|\n'));//captionn那行
- content = content.slice(content.indexOf('|\n')+2);
- content = content+'|'
- }
- // 检查表格包含几个|,数字减1就是列数,模拟出markdown表格中间的---:
- var verticalLineCount = 0;
- var strs = new Array();
- var thExist = false;
- strs = content.split('\n');
- for (let i=0; i<strs.length; i++ ){ // 计算最多列数
- if(strs[i].indexOf('|')>=0){
- let tempnum = strs[i].match(/\|/ig).length;
- if (tempnum>verticalLineCount){
- verticalLineCount = tempnum;
- }
- }
- }
- var buildTh = repeatStringNumTimes('| ',verticalLineCount).trim(); // 构造没有表头时候,markdown需要的表头 比如:| | | |
- var tableMDLine = '|'+repeatStringNumTimes('---|',verticalLineCount-1); // 构造markdown表中间的横线 比如:|---|---|---|
- // 检查是否包含表头
- //console.log('table3:'+content);
- if (content.indexOf('|#$&%th$#%&')>=0){
- content = content.replace(/\|#\$&%th\$#%&/g, '|');
- content = content.replace('\n','\n'+tableMDLine+'\n');
- }
- else{
- content = buildTh+'\n'+tableMDLine+'\n'+ content;
- }
- content = '\n'+captionLine+'\n\n'+content+'\n\n';
- //console.log('table4:'+content);
- return content
- }
- };
- // // ==============================================================================
-
- rules.blockquote = {
- filter: 'blockquote',
-
- replacement: function (content) {
- content = content.replace(/^\n+|\n+$/g, '');
- content = content.replace(/^/gm, '> ');
- return '\n\n' + content + '\n\n'
- }
- };
-
- rules.list = {
- filter: ['ul', 'ol'],
-
- replacement: function (content, node) {
- var parent = node.parentNode;
- if (parent.nodeName === 'LI' && parent.lastElementChild === node) {
- return '\n' + content
- } else {
- return '\n\n' + content + '\n\n'
- }
- }
- };
-
- rules.listItem = {
- filter: 'li',
-
- replacement: function (content, node, options) {
- content = content
- .replace(/^\n+/, '') // remove leading newlines
- .replace(/\n+$/, '\n') // replace trailing newlines with just a single one
- .replace(/\n/gm, '\n '); // indent
- var prefix = options.bulletListMarker + ' ';
- var parent = node.parentNode;
- if (parent.nodeName === 'OL') {
- var start = parent.getAttribute('start');
- var index = Array.prototype.indexOf.call(parent.children, node);
- prefix = (start ? Number(start) + index : index + 1) + '. ';
- }
- return (
- prefix + content + (node.nextSibling && !/\n$/.test(content) ? '\n' : '')
- )
- }
- };
-
- rules.indentedCodeBlock = {
- filter: function (node, options) {
- return (
- options.codeBlockStyle === 'indented' &&
- node.nodeName === 'PRE' &&
- node.firstChild &&
- node.firstChild.nodeName === 'CODE'
- )
- },
-
- replacement: function (content, node, options) {
- return (
- '\n\n ' +
- node.firstChild.textContent.replace(/\n/g, '\n ') +
- '\n\n'
- )
- }
- };
-
- rules.fencedCodeBlock = {
- filter: function (node, options) {
- return (
- options.codeBlockStyle === 'fenced' &&
- node.nodeName === 'PRE' &&
- node.firstChild &&
- node.firstChild.nodeName === 'CODE'
- )
- },
-
- replacement: function (content, node, options) {
- var className = node.firstChild.className || '';
- var language = (className.match(/language-(\S+)/) || [null, ''])[1];
- var code = node.firstChild.textContent;
-
- var fenceChar = options.fence.charAt(0);
- var fenceSize = 3;
- var fenceInCodeRegex = new RegExp('^' + fenceChar + '{3,}', 'gm');
-
- var match;
- while ((match = fenceInCodeRegex.exec(code))) {
- if (match[0].length >= fenceSize) {
- fenceSize = match[0].length + 1;
- }
- }
-
- var fence = repeat(fenceChar, fenceSize);
-
- return (
- '\n\n' + fence + language + '\n' +
- code.replace(/\n$/, '') +
- '\n' + fence + '\n\n'
- )
- }
- };
-
- rules.horizontalRule = {
- filter: 'hr',
-
- replacement: function (content, node, options) {
- return '\n\n' + options.hr + '\n\n'
- }
- };
-
- rules.inlineLink = {
- filter: function (node, options) {
- return (
- options.linkStyle === 'inlined' &&
- node.nodeName === 'A' &&
- node.getAttribute('href')
- )
- },
- replacement: function (content, node) { //console.log('content:'+content); console.log('node:'+node);
- var href = node.getAttribute('href'); //console.log('href:'+href);
- var title = node.title ? ' "' + node.title + '"' : ''; //console.log('title:'+title);
- return '[' + content + '](' + href + title + ')'
- }
- };
-
- rules.referenceLink = {
- filter: function (node, options) {
- return (
- options.linkStyle === 'referenced' &&
- node.nodeName === 'A' &&
- node.getAttribute('href')
- )
- },
-
- replacement: function (content, node, options) {
- var href = node.getAttribute('href');
- var title = node.title ? ' "' + node.title + '"' : '';
- var replacement;
- var reference;
-
- switch (options.linkReferenceStyle) {
- case 'collapsed':
- replacement = '[' + content + '][]';
- reference = '[' + content + ']: ' + href + title;
- break
- case 'shortcut':
- replacement = '[' + content + ']';
- reference = '[' + content + ']: ' + href + title;
- break
- default:
- var id = this.references.length + 1;
- replacement = '[' + content + '][' + id + ']';
- reference = '[' + id + ']: ' + href + title;
- }
-
- this.references.push(reference);
- return replacement
- },
-
- references: [],
-
- append: function (options) {
- var references = '';
- if (this.references.length) {
- references = '\n\n' + this.references.join('\n') + '\n\n';
- this.references = []; // Reset references
- }
- return references
- }
- };
-
- rules.emphasis = {
- filter: ['em', 'i'],
-
- replacement: function (content, node, options) {
- if (!content.trim()) return ''
- return options.emDelimiter + content + options.emDelimiter
- }
- };
-
- rules.strong = {
- filter: ['strong', 'b'],
-
- replacement: function (content, node, options) {
- if (!content.trim()) return ''
- return options.strongDelimiter + content + options.strongDelimiter
- }
- };
-
- rules.code = {
- filter: function (node) {
- var hasSiblings = node.previousSibling || node.nextSibling;
- var isCodeBlock = node.parentNode.nodeName === 'PRE' && !hasSiblings;
-
- return node.nodeName === 'CODE' && !isCodeBlock
- },
-
- replacement: function (content) {
- if (!content.trim()) return ''
-
- var delimiter = '`';
- var leadingSpace = '';
- var trailingSpace = '';
- var matches = content.match(/`+/gm);
- if (matches) {
- if (/^`/.test(content)) leadingSpace = ' ';
- if (/`$/.test(content)) trailingSpace = ' ';
- while (matches.indexOf(delimiter) !== -1) delimiter = delimiter + '`';
- }
-
- return delimiter + leadingSpace + content + trailingSpace + delimiter
- }
- };
-
- rules.image = {
- filter: 'img',
-
- replacement: function (content, node) {
- var alt = node.alt || '';
- var src = node.getAttribute('src') || '';
- var title = node.title || '';
- var titlePart = title ? ' "' + title + '"' : '';
- return src ? '![' + alt + ']' + '(' + src + titlePart + ')' : ''
- }
- };
-
- /**
- * Manages a collection of rules used to convert HTML to Markdown
- */
-
- function Rules (options) {
- this.options = options;
- this._keep = [];
- this._remove = [];
-
- this.blankRule = {
- replacement: options.blankReplacement
- };
-
- this.keepReplacement = options.keepReplacement;
-
- this.defaultRule = {
- replacement: options.defaultReplacement
- };
-
- this.array = [];
- for (var key in options.rules) this.array.push(options.rules[key]);
- }
-
- Rules.prototype = {
- add: function (key, rule) {
- this.array.unshift(rule);
- },
-
- keep: function (filter) {
- this._keep.unshift({
- filter: filter,
- replacement: this.keepReplacement
- });
- },
-
- remove: function (filter) {
- this._remove.unshift({
- filter: filter,
- replacement: function () {
- return ''
- }
- });
- },
-
- forNode: function (node) {
- if (node.isBlank) return this.blankRule
- var rule;
-
- if ((rule = findRule(this.array, node, this.options))) return rule
- if ((rule = findRule(this._keep, node, this.options))) return rule
- if ((rule = findRule(this._remove, node, this.options))) return rule
-
- return this.defaultRule
- },
-
- forEach: function (fn) {
- for (var i = 0; i < this.array.length; i++) fn(this.array[i], i);
- }
- };
-
- function findRule (rules, node, options) {
- for (var i = 0; i < rules.length; i++) {
- var rule = rules[i];
- if (filterValue(rule, node, options)) return rule
- }
- return void 0
- }
-
- function filterValue (rule, node, options) {
- var filter = rule.filter;
- if (typeof filter === 'string') {
- if (filter === node.nodeName.toLowerCase()) return true
- } else if (Array.isArray(filter)) {
- if (filter.indexOf(node.nodeName.toLowerCase()) > -1) return true
- } else if (typeof filter === 'function') {
- if (filter.call(rule, node, options)) return true
- } else {
- throw new TypeError('`filter` needs to be a string, array, or function')
- }
- }
-
- /**
- * The collapseWhitespace function is adapted from collapse-whitespace
- * by Luc Thevenard.
- *
- * The MIT License (MIT)
- *
- * Copyright (c) 2014 Luc Thevenard <lucthevenard@gmail.com>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a copy
- * of this software and associated documentation files (the "Software"), to deal
- * in the Software without restriction, including without limitation the rights
- * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
- * copies of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
- * THE SOFTWARE.
- */
-
- /**
- * collapseWhitespace(options) removes extraneous whitespace from an the given element.
- *
- * @param {Object} options
- */
- function collapseWhitespace (options) {
- var element = options.element;
- var isBlock = options.isBlock;
- var isVoid = options.isVoid;
- var isPre = options.isPre || function (node) {
- return node.nodeName === 'PRE'
- };
-
- if (!element.firstChild || isPre(element)) return
-
- var prevText = null;
- var prevVoid = false;
-
- var prev = null;
- var node = next(prev, element, isPre);
-
- while (node !== element) {
- if (node.nodeType === 3 || node.nodeType === 4) { // Node.TEXT_NODE or Node.CDATA_SECTION_NODE
- var text = node.data.replace(/[ \r\n\t]+/g, ' ');
-
- if ((!prevText || / $/.test(prevText.data)) &&
- !prevVoid && text[0] === ' ') {
- text = text.substr(1);
- }
-
- // `text` might be empty at this point.
- if (!text) {
- node = remove(node);
- continue
- }
-
- node.data = text;
-
- prevText = node;
- } else if (node.nodeType === 1) { // Node.ELEMENT_NODE
- if (isBlock(node) || node.nodeName === 'BR') {
- if (prevText) {
- prevText.data = prevText.data.replace(/ $/, '');
- }
-
- prevText = null;
- prevVoid = false;
- } else if (isVoid(node)) {
- // Avoid trimming space around non-block, non-BR void elements.
- prevText = null;
- prevVoid = true;
- }
- } else {
- node = remove(node);
- continue
- }
-
- var nextNode = next(prev, node, isPre);
- prev = node;
- node = nextNode;
- }
-
- if (prevText) {
- prevText.data = prevText.data.replace(/ $/, '');
- if (!prevText.data) {
- remove(prevText);
- }
- }
- }
-
- /**
- * remove(node) removes the given node from the DOM and returns the
- * next node in the sequence.
- *
- * @param {Node} node
- * @return {Node} node
- */
- function remove (node) {
- var next = node.nextSibling || node.parentNode;
-
- node.parentNode.removeChild(node);
-
- return next
- }
-
- /**
- * next(prev, current, isPre) returns the next node in the sequence, given the
- * current and previous nodes.
- *
- * @param {Node} prev
- * @param {Node} current
- * @param {Function} isPre
- * @return {Node}
- */
- function next (prev, current, isPre) {
- if ((prev && prev.parentNode === current) || isPre(current)) {
- return current.nextSibling || current.parentNode
- }
-
- return current.firstChild || current.nextSibling || current.parentNode
- }
-
- /*
- * Set up window for Node.js
- */
-
- var root = (typeof window !== 'undefined' ? window : {});
-
- /*
- * Parsing HTML strings
- */
-
- function canParseHTMLNatively () {
- var Parser = root.DOMParser;
- var canParse = false;
-
- // Adapted from https://gist.github.com/1129031
- // Firefox/Opera/IE throw errors on unsupported types
- try {
- // WebKit returns null on unsupported types
- if (new Parser().parseFromString('', 'text/html')) {
- canParse = true;
- }
- } catch (e) {}
-
- return canParse
- }
-
- function createHTMLParser () {
- var Parser = function () {};
- if (shouldUseActiveX()) {
- Parser.prototype.parseFromString = function (string) {
- var doc = new window.ActiveXObject('htmlfile'); //console.log('createHTMLParser1:'+string);
- doc.designMode = 'on'; // disable on-page scripts
- doc.open();
- doc.write(string);
- doc.close();
- return doc
- };
- } else {
- Parser.prototype.parseFromString = function (string) {
- var doc = document.implementation.createHTMLDocument(''); //console.log('createHTMLParser2:'+string);
- doc.open();
- doc.write(string);
- doc.close();
- return doc
- };
- }
- return Parser
- }
-
- function shouldUseActiveX () {
- var useActiveX = false;
- try {
- document.implementation.createHTMLDocument('').open();
- } catch (e) {
- if (window.ActiveXObject) useActiveX = true;
- }
- return useActiveX
- }
-
- var HTMLParser = canParseHTMLNatively() ? root.DOMParser : createHTMLParser();
-
- function RootNode (input) {
- var root;
- if (typeof input === 'string') {
- var doc = htmlParser().parseFromString(
- // DOM parsers arrange elements in the <head> and <body>.
- // Wrapping in a custom element ensures elements are reliably arranged in
- // a single element.
- '<x-turndown id="turndown-root">' + input + '</x-turndown>',
- 'text/html'
- );
- root = doc.getElementById('turndown-root');
- } else {
- root = input.cloneNode(true);
- }
- collapseWhitespace({
- element: root,
- isBlock: isBlock,
- isVoid: isVoid
- });
-
- return root
- }
-
- var _htmlParser;
- function htmlParser () {
- _htmlParser = _htmlParser || new HTMLParser();
- return _htmlParser
- }
-
- function Node (node) {
- node.isBlock = isBlock(node);
- node.isCode = node.nodeName.toLowerCase() === 'code' || node.parentNode.isCode;
- node.isBlank = isBlank(node);
- node.flankingWhitespace = flankingWhitespace(node);
- return node
- }
-
- function isBlank (node) {
- return (
- ['A', 'TH', 'TD', 'IFRAME', 'SCRIPT', 'AUDIO', 'VIDEO'].indexOf(node.nodeName) === -1 &&
- /^\s*$/i.test(node.textContent) &&
- !isVoid(node) &&
- !hasVoid(node)
- )
- }
-
- function flankingWhitespace (node) {
- var leading = '';
- var trailing = '';
-
- if (!node.isBlock) {
- var hasLeading = /^\s/.test(node.textContent);
- var hasTrailing = /\s$/.test(node.textContent);
- var blankWithSpaces = node.isBlank && hasLeading && hasTrailing;
-
- if (hasLeading && !isFlankedByWhitespace('left', node)) {
- leading = ' ';
- }
-
- if (!blankWithSpaces && hasTrailing && !isFlankedByWhitespace('right', node)) {
- trailing = ' ';
- }
- }
-
- return { leading: leading, trailing: trailing }
- }
-
- function isFlankedByWhitespace (side, node) {
- var sibling;
- var regExp;
- var isFlanked;
-
- if (side === 'left') {
- sibling = node.previousSibling;
- regExp = / $/;
- } else {
- sibling = node.nextSibling;
- regExp = /^ /;
- }
-
- if (sibling) {
- if (sibling.nodeType === 3) {
- isFlanked = regExp.test(sibling.nodeValue);
- } else if (sibling.nodeType === 1 && !isBlock(sibling)) {
- isFlanked = regExp.test(sibling.textContent);
- }
- }
- return isFlanked
- }
-
- var reduce = Array.prototype.reduce;
- var leadingNewLinesRegExp = /^\n*/;
- var trailingNewLinesRegExp = /\n*$/;
- var escapes = [
- [/\\/g, '\\\\'],
- [/\*/g, '\\*'],
- [/^-/g, '\\-'],
- [/^\+ /g, '\\+ '],
- [/^(=+)/g, '\\$1'],
- [/^(#{1,6}) /g, '\\$1 '],
- [/`/g, '\\`'],
- [/^~~~/g, '\\~~~'],
- [/\[/g, '\\['],
- [/\]/g, '\\]'],
- [/^>/g, '\\>'],
- [/_/g, '\\_'],
- [/^(\d+)\. /g, '$1\\. ']
- ];
-
- function TurndownService (options) {
- if (!(this instanceof TurndownService)) return new TurndownService(options)
-
- var defaults = {
- rules: rules,
- headingStyle: 'setext',
- hr: '* * *',
- bulletListMarker: '*',
- codeBlockStyle: 'indented',
- fence: '```',
- emDelimiter: '_',
- strongDelimiter: '**',
- linkStyle: 'inlined',
- linkReferenceStyle: 'full',
- br: ' ',
- blankReplacement: function (content, node) {
- return node.isBlock ? '\n\n' : ''
- },
- keepReplacement: function (content, node) {
- return node.isBlock ? '\n\n' + node.outerHTML + '\n\n' : node.outerHTML
- },
- defaultReplacement: function (content, node) {
- return node.isBlock ? '\n\n' + content + '\n\n' : content
- }
- };
- this.options = extend({}, defaults, options);
- this.rules = new Rules(this.options);
- }
-
- TurndownService.prototype = {
- /**
- * The entry point for converting a string or DOM node to Markdown
- * @public
- * @param {String|HTMLElement} input The string or DOM node to convert
- * @returns A Markdown representation of the input
- * @type String
- */
-
- turndown: function (input) {
- //console.log(input);
- if (!canConvert(input)) { //copy点击后传入
- throw new TypeError(
- input + ' is not a string, or an element/document/fragment node.'
- )
- }
-
- if (input === '') return ''
-
- var output = process.call(this, new RootNode(input)); //处理完毕后返回内容
- return postProcess.call(this, output)
- },
-
- /**
- * Add one or more plugins
- * @public
- * @param {Function|Array} plugin The plugin or array of plugins to add
- * @returns The Turndown instance for chaining
- * @type Object
- */
-
- use: function (plugin) {
- if (Array.isArray(plugin)) {
- for (var i = 0; i < plugin.length; i++) this.use(plugin[i]);
- } else if (typeof plugin === 'function') {
- plugin(this);
- } else {
- throw new TypeError('plugin must be a Function or an Array of Functions')
- }
- return this
- },
-
- /**
- * Adds a rule
- * @public
- * @param {String} key The unique key of the rule
- * @param {Object} rule The rule
- * @returns The Turndown instance for chaining
- * @type Object
- */
-
- addRule: function (key, rule) {
- this.rules.add(key, rule);
- return this
- },
-
- /**
- * Keep a node (as HTML) that matches the filter
- * @public
- * @param {String|Array|Function} filter The unique key of the rule
- * @returns The Turndown instance for chaining
- * @type Object
- */
-
- keep: function (filter) {
- this.rules.keep(filter);
- return this
- },
-
- /**
- * Remove a node that matches the filter
- * @public
- * @param {String|Array|Function} filter The unique key of the rule
- * @returns The Turndown instance for chaining
- * @type Object
- */
-
- remove: function (filter) {
- this.rules.remove(filter);
- return this
- },
-
- /**
- * Escapes Markdown syntax
- * @public
- * @param {String} string The string to escape
- * @returns A string with Markdown syntax escaped
- * @type String
- */
-
- escape: function (string) {
- return escapes.reduce(function (accumulator, escape) {
- return accumulator.replace(escape[0], escape[1])
- }, string)
- }
- };
-
- /**
- * Reduces a DOM node down to its Markdown string equivalent
- * @private
- * @param {HTMLElement} parentNode The node to convert
- * @returns A Markdown representation of the node
- * @type String
- */
-
- function process (parentNode) {
- var self = this;
- return reduce.call(parentNode.childNodes, function (output, node) {
- node = new Node(node);
-
- var replacement = '';
- if (node.nodeType === 3) {
- replacement = node.isCode ? node.nodeValue : self.escape(node.nodeValue);
- } else if (node.nodeType === 1) {
- replacement = replacementForNode.call(self, node);
- }
-
- return join(output, replacement)
- }, '')
- }
-
- /**
- * Appends strings as each rule requires and trims the output
- * @private
- * @param {String} output The conversion output
- * @returns A trimmed version of the ouput
- * @type String
- */
-
- function postProcess (output) {
- var self = this;
- this.rules.forEach(function (rule) {
- if (typeof rule.append === 'function') {
- output = join(output, rule.append(self.options));
- }
- });
-
- return output.replace(/^[\t\r\n]+/, '').replace(/[\t\r\n\s]+$/, '')
- }
-
- /**
- * Converts an element node to its Markdown equivalent
- * @private
- * @param {HTMLElement} node The node to convert
- * @returns A Markdown representation of the node
- * @type String
- */
-
- function replacementForNode (node) {
- var rule = this.rules.forNode(node);
- var content = process.call(this, node);
- var whitespace = node.flankingWhitespace;
- if (whitespace.leading || whitespace.trailing) content = content.trim();
- return (
- whitespace.leading +
- rule.replacement(content, node, this.options) +
- whitespace.trailing
- )
- }
-
- /**
- * Determines the new lines between the current output and the replacement
- * @private
- * @param {String} output The current conversion output
- * @param {String} replacement The string to append to the output
- * @returns The whitespace to separate the current output and the replacement
- * @type String
- */
-
- function separatingNewlines (output, replacement) {
- var newlines = [
- output.match(trailingNewLinesRegExp)[0],
- replacement.match(leadingNewLinesRegExp)[0]
- ].sort();
- var maxNewlines = newlines[newlines.length - 1];
- return maxNewlines.length < 2 ? maxNewlines : '\n\n'
- }
-
- function join (string1, string2) {
- var separator = separatingNewlines(string1, string2);
-
- // Remove trailing/leading newlines and replace with separator
- string1 = string1.replace(trailingNewLinesRegExp, '');
- string2 = string2.replace(leadingNewLinesRegExp, '');
-
- return string1 + separator + string2
- }
-
- /**
- * Determines whether an input can be converted
- * @private
- * @param {String|HTMLElement} input Describe this parameter
- * @returns Describe what it returns
- * @type String|Object|Array|Boolean|Number
- */
-
- function canConvert (input) {
- return (
- input != null && (
- typeof input === 'string' ||
- (input.nodeType && (
- input.nodeType === 1 || input.nodeType === 9 || input.nodeType === 11
- ))
- )
- )
- }
-
- return TurndownService;
-
- }());
-
- // ==============================================================
-
-
-
- (function () {
- 'use strict';
-
- const CLASS_HINT = "_myhint_";
- let $curElement = null;
- let $btn = document.createElement("div");
- // ==============================================================================
- // 根据turndown文档,调整一些参数,让转化出来的markdown格式,满足自己的需要
- // https://github.com/domchristie/turndown
- // ==============================================================================
- let options = {
- headingStyle: 'atx',
- bulletListMarker: '+',
- codeBlockStyle: 'fenced',
- emDelimiter: '*'
- };
- // ==============================================================================
- let turndownService = new TurndownService(options);
- let isHold = 0,
- isDrag = 0;
-
- function addStyle(css) {
- let s = document.createElement("style");
- s.type = "text/css";
- s.textContent = css;
- document.body.prepend(s);
- }
-
- function showHint($this) {
- if ($this) {
- $this.classList.add(CLASS_HINT);
- }
- }
-
- function hideHint($this) {
- if ($this) {
- $this.classList.remove(CLASS_HINT);
- }
- }
-
- function handleMouseover(e) {
- hideHint($curElement);
- let $target = e.target;
- $curElement = $target;
- showHint($target);
- }
-
- function handleMouseout(e) {
- let $target = e.target;
- hideHint($target);
- }
-
- function handleKeyup(e) {
- function isValidNode(node) {
- return node && node.textContent && node.textContent.trim() !== "";
- }
- function findNextNode(node) {
- if (node) {
- var findNode = node.nextElementSibling;
- while(findNode) {
- if (isValidNode(findNode)) {
- return findNode;
- } else {
- if (findNode.nextElementSibling) {
- findNode = findNode.nextElementSibling;
- }
- }
- }
- }
- return null;
- }
-
- if (e.keyCode === 13) { // enter
- process(e);
- return false;
- } else if (e.keyCode === 27) { // esc
- disable();
- } else if (e.keyCode === 38) { // arrow up
- if ($curElement && isValidNode($curElement.parentElement)) {
- hideHint($curElement);
- $curElement = $curElement.parentElement;
- showHint($curElement);
- }
- } else if (e.keyCode === 37) { // arrow left
- if ($curElement && isValidNode($curElement.previousElementSibling)) {
- hideHint($curElement);
- $curElement = $curElement.previousElementSibling;
- showHint($curElement);
- }
- } else if (e.keyCode === 40) { // arrow down
- let nextNode = null;
- if ($curElement && (nextNode = findNextNode($curElement.firstElementChild))) {
- hideHint($curElement);
- $curElement = nextNode;
- showHint($curElement);
- }
- } else if (e.keyCode === 39) { // arrow right
- if ($curElement && isValidNode($curElement.nextElementSibling)) {
- hideHint($curElement);
- $curElement = $curElement.nextElementSibling;
- showHint($curElement);
- }
- }
- }
-
- function disableScroll(e) {
- if ([38, 40, 37, 39].indexOf(e.keyCode) > -1) {
- e.preventDefault();
- }
- }
-
- function handleClick(e) {
- process(e);
- return false;
- }
-
- function process(e) {
- if ($curElement) {
- e.preventDefault();
- copyIt($curElement);
- disable();
- showTips();
- }
- }
-
- function showTips() {
- let t = document.createElement("div");
- t.style.position = "fixed";
- t.style.width = "80px";
- t.style.height = "24px";
- t.style.lineHeight = "24px";
- t.style.top = "10px";
- t.style.right = "50%";
- t.style.background = "#68af02";
- t.style.fontSize = "14px";
- t.style.color = "#fff";
- t.style.textAlign = "center";
- t.style.borderRadius = "5px";
- t.style.marginLeft = "300px";
- t.style.zIndex = 10000;
- t.innerHTML = "复制成功";
-
- document.body.prepend(t);
- setTimeout(function () {
- document.body.removeChild(t);
- }, 1000);
- }
-
- function copyIt($curElement) {//复制内容,并进行处理得到结果,写到剪切板
- if ($curElement) {
- let html = $curElement.innerHTML;
- html = html.replace(/(<img.+\s?src=")(\/\/.+?")/gi, "$1" + document.location.protocol + "$2");
- html = html.replace(/(<img.+\s?src=")(\/.+?")/gi, "$1" + document.location.origin + "$2");
- html = html.replace(/(<img.+\s?src=")(?!http)(.+?")/gi, "$1" + document.location.origin +
- (document.location.pathname.substring(0, document.location.pathname.lastIndexOf('/'))) + "/$2");
- html = html.replace(/(<a.+?href=")(.*?)(".*?<\/a>)/gi, parseHref); //补全url链接,加上域名之类的
- let markdown = turndownService.turndown(html);
- markdown = markdown.replace(/<img.+?>/g, "");
- copyToClipboard(markdown);
- }
- }
-
- function parseHref(match, head, link, tail){ //对copyIt()中replace正则match到的匹配项head,link,tail,处理后返回,用于替换
- let linkFormat = '';
- var path = document.location.pathname.split('/');path.pop(); //domain
- if (link.substr(0, 4) === 'http') {
- //linkFormat = head + link.replace(/#.*/,"") + tail; //原本的这个替换不知道,为什么非要删除url#后的部分,这里改成不删
- linkFormat = head + link + tail;
- } else if (link[0] === '#' || link.substr(0, 10) === 'javascript' || link === '"') { // "#" "javascript:" ""
- linkFormat = head + '#"' + tail;
- } else if (link[0] === '.' && link[1] === '/'){ // "./xxx"
- linkFormat = head + document.location.origin + path.join('/') + link.substring(1) + tail;
- } else if (link[0] === '.' && link[1] === '.' && link[2] === '/') { // ../xxx
- var p2Arr = link.split('../'),
- tmpRes = [p2Arr.pop()];
- path.pop();
- while(p2Arr.length){
- var t = p2Arr.pop();
- if (t === ''){
- tmpRes.unshift(path.pop());
- }
- }
- linkFormat = head + document.location.origin + tmpRes.join('/') + tail;
- } else if (link.match(/^\/\/.*/)) { // //xxx.com
- linkFormat = head + document.location.protocol + link + tail;
- } else if (link.match(/^\/.*/)) { // /abc
- linkFormat = head + document.location.origin + link + tail;
- } else { // "abc/xxx"
- linkFormat = head + document.location.origin + path.join("/") + '/' + link + tail;
- }
- return linkFormat;
- }
-
- function copyToClipboard(text) {
- const input = document.createElement('textarea');
- input.style.position = 'fixed';
- input.style.opacity = 0;
- input.value = text;
- document.body.appendChild(input);
- input.select();
- let res = document.execCommand('Copy');
- document.body.removeChild(input);
- return res;
- }
-
- function enable() {
- document.addEventListener("mouseover", handleMouseover);
- document.addEventListener("mouseout", handleMouseout);
- document.addEventListener("click", handleClick);
- document.addEventListener("keyup", handleKeyup);
- window.addEventListener("keydown", disableScroll, false);
- }
-
- function disable() {
- if ($curElement) {
- hideHint($curElement);
- $curElement = null;
- }
-
- document.removeEventListener("mouseover", handleMouseover);
- document.removeEventListener("mouseout", handleMouseout);
- document.removeEventListener("click", handleClick);
- document.removeEventListener("keyup", handleKeyup);
- window.removeEventListener("keydown", disableScroll, false);
-
- $btn.style.display = "block";
- }
-
- function genDoublePressHandler(keyCode, callback, params) {
- var intval = 500;
- var lastKeypressTime = 0;
- var useCtrl = params && params.useCtrl;
- var pressCtrl = 0;
- if (useCtrl) {
- document.addEventListener('keydown', function(e) {
- if (useCtrl && e.keyCode === 17) {
- pressCtrl = 1;
- }
- }, false);
- document.addEventListener('keyup', function(e) {
- if (useCtrl && e.keyCode === 17) {
- pressCtrl = 0;
- }
- }, false);
- }
- return function(e) {
- var now = +new Date;
- if (e.keyCode === keyCode) {
- if ((now - lastKeypressTime <= intval) && (!useCtrl || useCtrl && pressCtrl)) {
- callback && callback(e);
- lastKeypressTime = 0;
- }
- }
- lastKeypressTime = now;
- };
- }
-
- function initBtn() {
- let topDiff = 0,
- leftDiff = 0;
-
- $btn.style.position = "fixed";
- $btn.style.width = "44px";
- $btn.style.height = "22px";
- $btn.style.lineHeight = "22px";
- $btn.style.top = "14%";
- $btn.style.right = "1%";
- $btn.style.background = "#0084ff";
- $btn.style.fontSize = "14px";
- $btn.style.color = "#fff";
- $btn.style.textAlign = "center";
- $btn.style.borderRadius = "6px";
- $btn.style.zIndex = 10000;
- $btn.style.cursor = "pointer";
- $btn.style.opacity = 0.1;
- $btn.innerHTML = "copy";
-
- $btn.addEventListener("click", function () {
- if (isDrag) {
- return false;
- }
- enable();
- this.style.display = "none";
- });
-
- $btn.addEventListener("mouseover", function (e) {
- this.style.opacity = 1;
- });
-
- $btn.addEventListener("mouseout", function () {
- this.style.opacity = 0.1;
- });
-
- $btn.addEventListener("mousedown", function (e) {
- isHold = 1;
- leftDiff = e.pageX - this.offsetLeft;
- topDiff = e.pageY - this.offsetTop;
-
- $btn.onmousemove = function (e) {
- if (isHold) {
- isDrag = 1;
- }
- if (isDrag) {
- this.style.top = (e.pageY - topDiff) + "px";
- this.style.left = (e.pageX - leftDiff) + "px";
- this.style.right = "auto";
- }
- };
- });
-
- document.addEventListener("mouseup", function () {
- setTimeout(function () {
- isHold = 0;
- isDrag = 0;
- $btn.onmousemove = null;
- }, 0);
- });
-
- // Ctrl+c+c
- document.addEventListener('keyup', genDoublePressHandler(67, function (e) {
- $btn.click();
- },{"useCtrl":1}), false);
-
- }
-
- function init() {
- if (!document.body) {
- console.warn("no body");
- return;
- }
- addStyle("." + CLASS_HINT + "{background-color: #fafafa; outline: 2px dashed #1976d2; opacity: .8; cursor: pointer; -webkit-transition: opacity .5s ease; transition: opacity .5s ease;}");
- document.body.prepend($btn);
- initBtn();
- }
-
- init();
- })();
- // @namespace http://tampermonkey.net/
- // @version 0.1
- // @description try to take over the world!
- // @author You
- // @match https://www.cnblogs.com/zhangxinqi/p/8418545.html
- // @grant none
- // ==/UserScript==
-
- (function() {
- 'use strict';
-
- // Your code here...
- })();
-