1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
| str = str
.replace(/
/g, '\n')
.replace(/ /g, '\t')
.replace(/<img[^>]*alt="([^"]+)"[^>]*>/ig, '$1')
.replace(/\n|\r/g, '')
.replace(/<br[^>]*>/ig, '\n')
.replace(/(?:<(?:div|p|ol|ul|li|pre|code|object)[^>]*>)+/ig, '<div>')
.replace(/(?:<\/(?:div|p|ol|ul|li|pre|code|object)>)+/ig, '</div>')
.replace(/\n<div><\/div>/ig, '\n')
.replace(/<div><\/div>\n/ig, '\n')
.replace(/(?:<div>)+<\/div>/ig, '\n')
.replace(/([^\n])<\/div><div>/ig, '$1\n')
.replace(/(?:<\/div>)+/ig, '</div>')
.replace(/([^\n])<\/div>([^\n])/ig, '$1\n$2')
.replace(/<\/div>/ig, '')
.replace(/([^\n])<div>/ig, '$1\n')
.replace(/\n<div>/ig, '\n')
.replace(/<div>\n/ig, '\n\n')
.replace(/<(?:[^>]+)?>/g, '')
.replace(new RegExp(invisibleChar, 'g'), '')
.replace(/ /g, ' ')
.replace(/</g, '<')
.replace(/>/g, '>')
.replace(/"/g, '"')
.replace(/'/g, "'")
.replace(/`/g, '`')
.replace(/</g, '<')
.replace(/>/g, '>')
.replace(/&/g, '&'); |