Created
April 28, 2011 00:07
-
-
Save j0shua/945522 to your computer and use it in GitHub Desktop.
readability js
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// | |
if(typeof(readability) === "undefined"){ | |
readability = {}; | |
} | |
(function (readability) { | |
readability.baseUrl = 'https://www.readability.com'; | |
readability.type = 'read'; | |
readability.frameId = 'readabilityIFrame-'+Math.random(); | |
readability.frameUrl = readability.baseUrl + '/articles/queue'; | |
readability.frameContainerId = 'readabilityFrameContainer-' + readability.type; | |
readability.frameContainer = null; | |
readability.docCompressed = null; | |
readability.extensionInfo = { | |
"type": (typeof window.readabilityExtensionType == "undefined" || window.readabilityExtensionType == "" ? 'bookmarklet' : window.readabilityExtensionType ), | |
"version": (typeof window.readabilityExtensionVersion == "undefined" || window.readabilityExtensionVersion == "" ? "1" : window.readabilityExtensionVersion ) | |
} | |
readability.frameContainerStyles = { | |
position: 'fixed', | |
display: 'block', | |
top: '0px', | |
left: '0px', | |
width: '100%', | |
height: '100%', | |
padding: '0', | |
margin: '0', | |
backgroundColor: "transparent", | |
zIndex: '2147483647' | |
}; | |
readability.frameStyles = ["width: 100%", "height: 100%", "display: block", "overflow: auto", // Proper iframe overflow in FF. Webkit uses the document body's CSS setting. | |
"margin: 0", "padding: 0", "border-width: 0"].join(';'); | |
/* A method so that if we change frameId we still get valid HTML */ | |
// Adds onload, which will allow us to hide the content behind the frame after we have the new content. | |
readability.getFrameHtml = function () { | |
return ['<iframe id="' + readability.frameId + '"', 'name="' + readability.frameId + '"', 'scrolling="auto"', 'frameborder="0"', 'style="' + readability.frameStyles + '"', 'onload="readability.frameLoaded(this)">', '</iframe>'].join(' '); | |
}; | |
readability.debug = function (s) { | |
if (typeof console !== "undefined") { | |
return console.log(s); | |
} | |
}; | |
readability.getExtensionDetails = function () { | |
if (typeof window.readabilityExtensionDetails !== null) { | |
return window.readabilityExtensionDetails; | |
} else { | |
return "bookmarklet"; | |
} | |
}; | |
readability.compress = function (doc_node) { | |
var i, il, html, preTags = doc_node.getElementsByTagName('pre'); | |
for (i = 0, il = preTags.length; i < il; i++) { | |
preTags[i].innerHTML = preTags[i].innerHTML.replace(/ /g, ' ').replace(/\t/g, ' ').replace(/\n/g, '--rdb-newline--'); | |
} | |
html = "<html>" + doc_node.innerHTML + "</html>"; | |
html = html.replace(/[\s\t\r\n]+/g, ' '); | |
html = html.replace(/<!--.*?-->/g, ''); | |
html = html.replace(/--rdb-newline--/g, "\n"); | |
return html; | |
}; | |
readability.hidePageElements = function () { | |
var child, i; | |
for (i = 0; i < document.body.childNodes.length; i++) { | |
child = document.body.childNodes[i]; | |
if (child.nodeType !== 1) { | |
continue; | |
} | |
display = child.currentStyle ? child.currentStyle.display : document.defaultView.getComputedStyle(child, null).getPropertyValue('display'); | |
if (child.id !== readability.frameContainerId) { | |
child.origDisplay = display; | |
child.style.display = 'none'; | |
} | |
} | |
}; | |
readability.removeDocumentScrolling = function () { | |
var child, display, i; | |
document.body.style.overflow = "hidden"; | |
}; | |
readability.addDocumentScrolling = function () { | |
var child, i; | |
for (i = 0; i < document.body.childNodes.length; i++) { | |
child = document.body.childNodes[i]; | |
if (child.nodeType !== 1) { | |
continue; | |
} | |
if (child.origDisplay) { | |
child.style.display = child.origDisplay; | |
} | |
} | |
document.body.style.overflow = "auto"; | |
}; | |
readability.isLocalPage = function () { | |
if (document.location.href.indexOf(readability.baseUrl) !== - 1) { | |
return true; | |
} | |
else { | |
return false; | |
} | |
}; | |
/* Cross-browser dispatchEvent - from http://www.cross-browser.com/forums/viewtopic.php?id=384 */ | |
readability.dispatchEvent = function (element, rawEvent) { | |
// Attempts to fire a raw DOM event on an element | |
// param name="element" type="Element" The element or its identifier to fire the event | |
// param name="rawEvent" type="Object" The raw DOM event object to fire | |
// returns type="Boolean" True if the event was successfully fired, otherwise false | |
try { | |
if (element.fireEvent) { | |
element.fireEvent("on" + rawEvent.type, rawEvent); | |
return true; | |
} | |
else if (element.dispatchEvent) { | |
element.dispatchEvent(rawEvent); | |
return true; | |
} | |
} catch (e) { | |
readability.debug('Error caught:'); | |
readability.debug(e); | |
} | |
return false; | |
}; | |
readability.checkDocLocation = function () { | |
if (document.location.href.indexOf(readability.baseUrl) !== - 1) { | |
if (document.getElementById('read-bar') !== null && document.getElementById('read-link') !== null) { | |
var clickEvent = document.createEvent('MouseEvent'); | |
clickEvent.initMouseEvent('click', true, true, document.defaultView, 1, 0, 0, 0, 0, false, false, false, false, 0, null); | |
readability.dispatchEvent(document.getElementById('read-link'), clickEvent); | |
return false; | |
} else { | |
document.location = readability.baseUrl; | |
return false; | |
} | |
} | |
}; | |
// Cross browser addEventListener from http://snipplr.com/view.php?codeview&id=3116 | |
readability.listen = function (evnt, elem, func) { | |
if (elem.addEventListener) { // W3C DOM | |
return elem.addEventListener(evnt, func, false); | |
} else if (elem.attachEvent) { // IE DOM | |
var r = elem.attachEvent("on" + evnt, func); | |
return r; | |
} else { | |
return false; | |
} | |
}; | |
// Receive cross-DOM js events | |
readability.receiveMessage = function (event) { | |
if (event.origin === readability.baseUrl && event.data) { | |
/** | |
* Special handling for set_token, otherwise just event handlers. | |
* TODO: Turn these all into json structures with a name rather than just strings. | |
**/ | |
if (event.data.indexOf('set_token') === 0) { | |
window.readabilityToken = event.data.replace('set_token=', ''); | |
readability.readabilityToken = window.readabilityToken; | |
} else { | |
try { | |
var event_method = event.data.replace('-', '_'); | |
if (typeof readability.event_handlers[event_method] !== "undefined") { | |
readability.event_handlers[event_method](event); | |
} | |
} catch (e) { | |
readability.debug('Error caught in receiveMessage:'); | |
readability.debug(e); | |
} | |
} | |
} | |
}; | |
// The handlers for cross-DOM events | |
readability.event_handlers = { | |
rdb_load_modal: function (event) { | |
var iframeContainer = readability.frameContainer, | |
styleKey, | |
iframeContainerStyles = {position: 'fixed', display: 'block', width: '100%', height: '100%', zIndex: '2147483647',background: "url('')"}; | |
for (styleKey in iframeContainerStyles) { | |
if (iframeContainerStyles.hasOwnProperty(styleKey)) { | |
iframeContainer.style[styleKey] = iframeContainerStyles[styleKey]; | |
} | |
} | |
}, | |
rdb_remove_frame: function (event) { | |
var frameContainer = readability.frameContainer; | |
if (frameContainer) { | |
frameContainer.parentNode.removeChild(frameContainer); | |
} | |
}, | |
rdb_load_bar: function (event) { | |
var messageBar = { | |
styles: { | |
position: 'fixed', | |
display: 'block', | |
top: '0px', | |
left: '0px', | |
width: '100%', | |
padding: '0', | |
margin: '0', | |
height: '43px', | |
background: 'black' | |
} | |
}; | |
readability.addStyle(readability.frameContainer, messageBar.styles); | |
}, | |
rdb_load_new_frame: function (event, obj) { | |
readability.closeFrame(); | |
readability.frameContainer = null; | |
readability.frameId = 'readabilityIFrame-' + Math.random(); | |
readability.init(true); // Force a reinit | |
}, | |
rdb_close: function (event) { | |
readability.closeFrame(); | |
}, | |
rdb_repost_form: function (event) { | |
readability.openFrame(); | |
} | |
}; | |
/** | |
* Removes script tags from the document. | |
* | |
* @param Element | |
**/ | |
readability.removeScripts = function (doc) { | |
var scripts = doc.getElementsByTagName('script'); | |
for(var i = scripts.length-1; i >= 0; i--) | |
{ | |
if(typeof(scripts[i].src) == "undefined" || (scripts[i].src.indexOf(readability.baseUrl) == -1 && scripts[i].src.indexOf('typekit') == -1)) | |
{ | |
scripts[i].nodeValue=""; | |
scripts[i].removeAttribute('src'); | |
if (scripts[i].parentNode) { | |
scripts[i].parentNode.removeChild(scripts[i]); | |
} | |
} | |
} | |
}; | |
readability.hideFlash = function () { | |
var i, il, embeds = document.getElementsByTagName('embed'), | |
objects = document.getElementsByTagName('object'), | |
iframes = document.getElementsByTagName('iframe'); | |
for (i = 0, il = embeds.length; i < il; i++) { | |
embeds[i].style.display = 'none'; | |
} | |
for (i = 0, il = objects.length; i < il; i++) { | |
objects[i].style.display = 'none'; | |
} | |
for (i = 0, il = iframes.length; i < il; i++) { | |
if (iframes[i].id !== readability.frameId) { | |
iframes[i].style.display = 'none'; | |
} | |
} | |
}; | |
readability.addStyle = function (elem, styles) { | |
var styleKey; | |
for (styleKey in styles) { | |
if (styles.hasOwnProperty(styleKey)) { | |
elem.style[styleKey] = styles[styleKey]; | |
} | |
} | |
}; | |
readability.getFrameContainer = function () { | |
if (readability.frameContainer === null) { | |
readability.frameContainer = document.createElement('div'); | |
readability.frameContainer.id = readability.frameContainerId; | |
readability.frameContainer.innerHTML = readability.getFrameHtml(); | |
readability.addStyle(readability.frameContainer, readability.frameContainerStyles); | |
} | |
return readability.frameContainer; | |
}; | |
readability.openFrame = function () { | |
var r = readability, | |
// shortcut | |
frameContent; | |
//Readability cannot parse framesets, so quit it. | |
if(document.body.nodeName == 'FRAMESET') { | |
alert("To read the content of a frame with Readability, right click on that content and select 'open this frame in new tab' and run Readability on the new tab."); | |
return; | |
} | |
readability.docCompressed = false; | |
if (readability.frameContainer === null) { | |
document.body.appendChild(r.getFrameContainer()); | |
} | |
r.listen("message", window, r.receiveMessage); | |
r.hideFlash(); | |
r.removeDocumentScrolling(); | |
try { | |
readability.docCompressed = readability.compress(document.documentElement); | |
} catch (e) {} | |
var load_text = (readability.type === 'read') ? '<div id="read-load">Converting...</div>' : '<div id="save-load">Saving...</div>'; | |
var charset = (document.characterSet ? document.characterSet : document.charset); | |
var hiddenInputs = { | |
"token": r.readabilityToken, | |
"extensionType": r.extensionInfo['type'], | |
"extensionVersion": r.extensionInfo['version'], | |
"legacyBookmarklet": (typeof window.readStyle !== "undefined" ? 1 : 0), | |
"read": (readability.type=='read' ? 1 : 0), | |
"archive": (readability.type=='support' ? 1 : 0), | |
"support": (readability.type=='support' ? 1 : 0), | |
"url": window.location.href, | |
"doc": readability.docCompressed, | |
"charset": charset | |
}; | |
/** | |
* Note: accept-charset is needed to be forced to the current character set because otherwise it appears Firefox will try to convert the data before the server gets a chance to work with it. | |
* By specifying the same character set no transforms are attempted on the client side, so we can handle it properly on the server side. | |
* Without accept-charset you will get bad characters on URLs like http://www.deseretnews.com/article/705369257/Parents-confused-upset-over-new-car-seat-guidelines.html | |
**/ | |
frameContent = [ | |
'<html>', | |
'<head>', | |
'<style type="text/css">', | |
'body { background-color: transparent; }', | |
'#wrapper { text-align: center; position:absolute;top:6em;left:50%;margin-left:-92.5px;}', | |
'#read-load, #save-load {text-align : center;color : #ffffff;padding-top: 10px; font:bold 1.2em Georgia; margin-left: 0.5em;}', | |
'#save-load.saved {padding-top: 4px;}', | |
'#spinner-box { background-color:#232323;height:107px;width:189px;margin:20px auto;padding:22px 0 0;-moz-border-radius:10px;-webkit-border-radius:10px;border-radius:10px;text-align: center;border-width:1px 0 0 1px;border-style:solid; border-color:#000;opacity: .85;-moz-opacity:.85;filter: alpha(opacity=85);}', | |
'</style>', | |
'</head>', | |
'<body>', | |
'<div id="wrapper">', | |
'<div id="spinner-box">', | |
'<img src="" />', | |
load_text, | |
'</div>', | |
'<form id="readabilityPostForm" accept-charset="', charset, '" enctype="application/x-www-form-urlencoded" style="display: none;" method="post" action="', r.frameUrl, '"></form>', | |
'</div>', | |
'</body>', | |
'</html>' | |
].join(''); | |
// Todo fix bug that occurs here: http://www.reddit.com/r/blog/comments/ddc0w/update_on_the_colbert_rally_time_to_show_our/ | |
var leframe = document.getElementById(r.frameId); | |
var ledocument = null; | |
if( leframe.contentDocument ) { | |
ledocument = leframe.contentDocument; | |
} else if ( leframe.contentWindow ) { //IE | |
ledocument = leframe.contentWindow.document; | |
} | |
ledocument.write(frameContent); | |
var postForm = ledocument.getElementById('readabilityPostForm'); | |
for (var inputKey in hiddenInputs) { | |
if(hiddenInputs.hasOwnProperty(inputKey)) { | |
var newInput = ledocument.createElement('input'); | |
newInput.type = "hidden"; | |
newInput.name = inputKey; | |
newInput.id = inputKey; | |
newInput.value = hiddenInputs[inputKey]; | |
postForm.appendChild(newInput); | |
} | |
} | |
ledocument.write(['<scr', 'ipt type="text/javascript">window.setTimeout(function() { document.getElementById("readabilityPostForm").submit(); }, 1);</scr', 'ipt>'].join('')); | |
}; | |
readability.frameLoaded = function (frame) { | |
try { | |
// Just try to access a restricted part of the document. If we can access it, that means we're not on the loaded doc yet. | |
x = window[readability.frameId].document; | |
} catch (e) { | |
// If we got caught, that means we've loaded the frame. Hide the backgrund elements. | |
readability.hidePageElements(); | |
} | |
}; | |
readability.url_is_valid = (function(){ | |
var invalid_list = [ | |
/file:/, | |
/about:blank/ | |
]; | |
return function(given_url){ | |
var url = given_url ? given_url.toLowerCase() : document.location.href.toLowerCase(), | |
i; | |
for(i = 0; i < invalid_list.length; i++){ | |
if(url.search(invalid_list[i]) !== -1){ | |
return false; | |
} | |
} | |
return true; | |
} | |
}()); | |
readability.site_in_blacklist = function (){ | |
var site_blacklist = 'www.youtube.com;mail.google.com'.toLowerCase().split(';'), | |
netloc, | |
i, | |
il; | |
try { | |
netloc = window.location.href.match(/^https?:\/\/([^\/]*)/)[1]; | |
} catch (e) { | |
return false; // Was a file:// URL or other non-http URL - gets caught by url_is_valid. | |
} | |
for (i = 0, il = site_blacklist.length; i < il; i++) { | |
if (site_blacklist[i] === netloc) { | |
return true; | |
} | |
} | |
return false; | |
}; | |
readability.closeFrame = function() { | |
var frameContainer = readability.frameContainer; | |
if (frameContainer) { | |
frameContainer.style.display = 'none'; | |
} | |
readability.addDocumentScrolling(); | |
}; | |
readability.init = function(force) { | |
if (!force && document.getElementById(readability.frameContainerId) !== null) { | |
readability.frameContainer = document.getElementById(readability.frameContainerId); | |
readability.frameContainer.style.display = 'block'; | |
readability.removeDocumentScrolling(); | |
return false; | |
} | |
/* If we're already on a parsed page */ | |
if (readability.isLocalPage() && document.getElementById('rdb-article') !== null ) { | |
return; | |
} | |
readability.removeScripts(document); | |
// If we are on our own page, bounce it to the homepage | |
if (readability.checkDocLocation()) { | |
readability.listen("message", window, readability.receiveMessage); | |
readability.openFrame(); | |
} | |
readability.readabilityToken = window.readabilityToken; | |
readability.openFrame(); | |
}; | |
} (readability)); | |
// First, check to see if we should even run Readability on this page | |
if( | |
readability.url_is_valid() && | |
!readability.isLocalPage() && // Make sure we aren't trying to run readability on itself | |
!readability.site_in_blacklist() // Don't run readability on blacklisted sites | |
){ | |
if(navigator.userAgent.indexOf('MSIE') !=-1) { | |
var queryParams = 'url=' + encodeURIComponent(window.top.location) + '&token=' + (typeof(window.readabilityToken) !== "undefined" ? encodeURIComponent(window.readabilityToken) : ""); | |
if(readability.type == "read") { | |
window.top.location = readability.baseUrl + '/pr?' + queryParams; | |
} else { | |
document.scrollTop = 0; | |
var wrap = document.createElement('div'); | |
wrap.innerHTML = '<iframe src="https://www.readability.com/prl?' + queryParams + '" width="500" height="200" frameBorder="0" allowTransparency="true" style="position: absolute; top: 0; left: 0; width: 100%; height: 100%; z-index: 281823498"></iframe>'; | |
document.body.appendChild(wrap); | |
readability.listen("message", window, function() { | |
if (event.origin === readability.baseUrl && event.data) { | |
if (event.data.indexOf('set_token') === 0) { | |
window.readabilityToken = event.data.replace('set_token=', ''); | |
readability.readabilityToken = window.readabilityToken; | |
} else if (event.data == "close_frame"){ | |
wrap.parentNode.removeChild(wrap); | |
} | |
} | |
}); | |
} | |
} else { | |
readability.init(); | |
} | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment