Skip to content

Instantly share code, notes, and snippets.

@j0shua
Created April 28, 2011 00:07
Show Gist options
  • Save j0shua/945522 to your computer and use it in GitHub Desktop.
Save j0shua/945522 to your computer and use it in GitHub Desktop.
readability js
//
if(typeof(readability) === "undefined"){
readability = {};
}
(function (readability) {
readability.baseUrl = 'https://www.readability.com';
readability.type = 'read';
readability.frameId = 'readabilityIFrame-'+Math.random();
readability.frameUrl = readability.baseUrl + '/articles/queue';
readability.frameContainerId = 'readabilityFrameContainer-' + readability.type;
readability.frameContainer = null;
readability.docCompressed = null;
readability.extensionInfo = {
"type": (typeof window.readabilityExtensionType == "undefined" || window.readabilityExtensionType == "" ? 'bookmarklet' : window.readabilityExtensionType ),
"version": (typeof window.readabilityExtensionVersion == "undefined" || window.readabilityExtensionVersion == "" ? "1" : window.readabilityExtensionVersion )
}
readability.frameContainerStyles = {
position: 'fixed',
display: 'block',
top: '0px',
left: '0px',
width: '100%',
height: '100%',
padding: '0',
margin: '0',
backgroundColor: "transparent",
zIndex: '2147483647'
};
readability.frameStyles = ["width: 100%", "height: 100%", "display: block", "overflow: auto", // Proper iframe overflow in FF. Webkit uses the document body's CSS setting.
"margin: 0", "padding: 0", "border-width: 0"].join(';');
/* A method so that if we change frameId we still get valid HTML */
// Adds onload, which will allow us to hide the content behind the frame after we have the new content.
readability.getFrameHtml = function () {
return ['<iframe id="' + readability.frameId + '"', 'name="' + readability.frameId + '"', 'scrolling="auto"', 'frameborder="0"', 'style="' + readability.frameStyles + '"', 'onload="readability.frameLoaded(this)">', '</iframe>'].join(' ');
};
readability.debug = function (s) {
if (typeof console !== "undefined") {
return console.log(s);
}
};
readability.getExtensionDetails = function () {
if (typeof window.readabilityExtensionDetails !== null) {
return window.readabilityExtensionDetails;
} else {
return "bookmarklet";
}
};
readability.compress = function (doc_node) {
var i, il, html, preTags = doc_node.getElementsByTagName('pre');
for (i = 0, il = preTags.length; i < il; i++) {
preTags[i].innerHTML = preTags[i].innerHTML.replace(/ /g, '&nbsp;').replace(/\t/g, '&nbsp;&nbsp;&nbsp;&nbsp;').replace(/\n/g, '--rdb-newline--');
}
html = "<html>" + doc_node.innerHTML + "</html>";
html = html.replace(/[\s\t\r\n]+/g, ' ');
html = html.replace(/<!--.*?-->/g, '');
html = html.replace(/--rdb-newline--/g, "\n");
return html;
};
readability.hidePageElements = function () {
var child, i;
for (i = 0; i < document.body.childNodes.length; i++) {
child = document.body.childNodes[i];
if (child.nodeType !== 1) {
continue;
}
display = child.currentStyle ? child.currentStyle.display : document.defaultView.getComputedStyle(child, null).getPropertyValue('display');
if (child.id !== readability.frameContainerId) {
child.origDisplay = display;
child.style.display = 'none';
}
}
};
readability.removeDocumentScrolling = function () {
var child, display, i;
document.body.style.overflow = "hidden";
};
readability.addDocumentScrolling = function () {
var child, i;
for (i = 0; i < document.body.childNodes.length; i++) {
child = document.body.childNodes[i];
if (child.nodeType !== 1) {
continue;
}
if (child.origDisplay) {
child.style.display = child.origDisplay;
}
}
document.body.style.overflow = "auto";
};
readability.isLocalPage = function () {
if (document.location.href.indexOf(readability.baseUrl) !== - 1) {
return true;
}
else {
return false;
}
};
/* Cross-browser dispatchEvent - from http://www.cross-browser.com/forums/viewtopic.php?id=384 */
readability.dispatchEvent = function (element, rawEvent) {
// Attempts to fire a raw DOM event on an element
// param name="element" type="Element" The element or its identifier to fire the event
// param name="rawEvent" type="Object" The raw DOM event object to fire
// returns type="Boolean" True if the event was successfully fired, otherwise false
try {
if (element.fireEvent) {
element.fireEvent("on" + rawEvent.type, rawEvent);
return true;
}
else if (element.dispatchEvent) {
element.dispatchEvent(rawEvent);
return true;
}
} catch (e) {
readability.debug('Error caught:');
readability.debug(e);
}
return false;
};
readability.checkDocLocation = function () {
if (document.location.href.indexOf(readability.baseUrl) !== - 1) {
if (document.getElementById('read-bar') !== null && document.getElementById('read-link') !== null) {
var clickEvent = document.createEvent('MouseEvent');
clickEvent.initMouseEvent('click', true, true, document.defaultView, 1, 0, 0, 0, 0, false, false, false, false, 0, null);
readability.dispatchEvent(document.getElementById('read-link'), clickEvent);
return false;
} else {
document.location = readability.baseUrl;
return false;
}
}
};
// Cross browser addEventListener from http://snipplr.com/view.php?codeview&id=3116
readability.listen = function (evnt, elem, func) {
if (elem.addEventListener) { // W3C DOM
return elem.addEventListener(evnt, func, false);
} else if (elem.attachEvent) { // IE DOM
var r = elem.attachEvent("on" + evnt, func);
return r;
} else {
return false;
}
};
// Receive cross-DOM js events
readability.receiveMessage = function (event) {
if (event.origin === readability.baseUrl && event.data) {
/**
* Special handling for set_token, otherwise just event handlers.
* TODO: Turn these all into json structures with a name rather than just strings.
**/
if (event.data.indexOf('set_token') === 0) {
window.readabilityToken = event.data.replace('set_token=', '');
readability.readabilityToken = window.readabilityToken;
} else {
try {
var event_method = event.data.replace('-', '_');
if (typeof readability.event_handlers[event_method] !== "undefined") {
readability.event_handlers[event_method](event);
}
} catch (e) {
readability.debug('Error caught in receiveMessage:');
readability.debug(e);
}
}
}
};
// The handlers for cross-DOM events
readability.event_handlers = {
rdb_load_modal: function (event) {
var iframeContainer = readability.frameContainer,
styleKey,
iframeContainerStyles = {position: 'fixed', display: 'block', width: '100%', height: '100%', zIndex: '2147483647',background: "url('')"};
for (styleKey in iframeContainerStyles) {
if (iframeContainerStyles.hasOwnProperty(styleKey)) {
iframeContainer.style[styleKey] = iframeContainerStyles[styleKey];
}
}
},
rdb_remove_frame: function (event) {
var frameContainer = readability.frameContainer;
if (frameContainer) {
frameContainer.parentNode.removeChild(frameContainer);
}
},
rdb_load_bar: function (event) {
var messageBar = {
styles: {
position: 'fixed',
display: 'block',
top: '0px',
left: '0px',
width: '100%',
padding: '0',
margin: '0',
height: '43px',
background: 'black'
}
};
readability.addStyle(readability.frameContainer, messageBar.styles);
},
rdb_load_new_frame: function (event, obj) {
readability.closeFrame();
readability.frameContainer = null;
readability.frameId = 'readabilityIFrame-' + Math.random();
readability.init(true); // Force a reinit
},
rdb_close: function (event) {
readability.closeFrame();
},
rdb_repost_form: function (event) {
readability.openFrame();
}
};
/**
* Removes script tags from the document.
*
* @param Element
**/
readability.removeScripts = function (doc) {
var scripts = doc.getElementsByTagName('script');
for(var i = scripts.length-1; i >= 0; i--)
{
if(typeof(scripts[i].src) == "undefined" || (scripts[i].src.indexOf(readability.baseUrl) == -1 && scripts[i].src.indexOf('typekit') == -1))
{
scripts[i].nodeValue="";
scripts[i].removeAttribute('src');
if (scripts[i].parentNode) {
scripts[i].parentNode.removeChild(scripts[i]);
}
}
}
};
readability.hideFlash = function () {
var i, il, embeds = document.getElementsByTagName('embed'),
objects = document.getElementsByTagName('object'),
iframes = document.getElementsByTagName('iframe');
for (i = 0, il = embeds.length; i < il; i++) {
embeds[i].style.display = 'none';
}
for (i = 0, il = objects.length; i < il; i++) {
objects[i].style.display = 'none';
}
for (i = 0, il = iframes.length; i < il; i++) {
if (iframes[i].id !== readability.frameId) {
iframes[i].style.display = 'none';
}
}
};
readability.addStyle = function (elem, styles) {
var styleKey;
for (styleKey in styles) {
if (styles.hasOwnProperty(styleKey)) {
elem.style[styleKey] = styles[styleKey];
}
}
};
readability.getFrameContainer = function () {
if (readability.frameContainer === null) {
readability.frameContainer = document.createElement('div');
readability.frameContainer.id = readability.frameContainerId;
readability.frameContainer.innerHTML = readability.getFrameHtml();
readability.addStyle(readability.frameContainer, readability.frameContainerStyles);
}
return readability.frameContainer;
};
readability.openFrame = function () {
var r = readability,
// shortcut
frameContent;
//Readability cannot parse framesets, so quit it.
if(document.body.nodeName == 'FRAMESET') {
alert("To read the content of a frame with Readability, right click on that content and select 'open this frame in new tab' and run Readability on the new tab.");
return;
}
readability.docCompressed = false;
if (readability.frameContainer === null) {
document.body.appendChild(r.getFrameContainer());
}
r.listen("message", window, r.receiveMessage);
r.hideFlash();
r.removeDocumentScrolling();
try {
readability.docCompressed = readability.compress(document.documentElement);
} catch (e) {}
var load_text = (readability.type === 'read') ? '<div id="read-load">Converting...</div>' : '<div id="save-load">Saving...</div>';
var charset = (document.characterSet ? document.characterSet : document.charset);
var hiddenInputs = {
"token": r.readabilityToken,
"extensionType": r.extensionInfo['type'],
"extensionVersion": r.extensionInfo['version'],
"legacyBookmarklet": (typeof window.readStyle !== "undefined" ? 1 : 0),
"read": (readability.type=='read' ? 1 : 0),
"archive": (readability.type=='support' ? 1 : 0),
"support": (readability.type=='support' ? 1 : 0),
"url": window.location.href,
"doc": readability.docCompressed,
"charset": charset
};
/**
* Note: accept-charset is needed to be forced to the current character set because otherwise it appears Firefox will try to convert the data before the server gets a chance to work with it.
* By specifying the same character set no transforms are attempted on the client side, so we can handle it properly on the server side.
* Without accept-charset you will get bad characters on URLs like http://www.deseretnews.com/article/705369257/Parents-confused-upset-over-new-car-seat-guidelines.html
**/
frameContent = [
'<html>',
'<head>',
'<style type="text/css">',
'body { background-color: transparent; }',
'#wrapper { text-align: center; position:absolute;top:6em;left:50%;margin-left:-92.5px;}',
'#read-load, #save-load {text-align : center;color : #ffffff;padding-top: 10px; font:bold 1.2em Georgia; margin-left: 0.5em;}',
'#save-load.saved {padding-top: 4px;}',
'#spinner-box { background-color:#232323;height:107px;width:189px;margin:20px auto;padding:22px 0 0;-moz-border-radius:10px;-webkit-border-radius:10px;border-radius:10px;text-align: center;border-width:1px 0 0 1px;border-style:solid; border-color:#000;opacity: .85;-moz-opacity:.85;filter: alpha(opacity=85);}',
'</style>',
'</head>',
'<body>',
'<div id="wrapper">',
'<div id="spinner-box">',
'<img src="" />',
load_text,
'</div>',
'<form id="readabilityPostForm" accept-charset="', charset, '" enctype="application/x-www-form-urlencoded" style="display: none;" method="post" action="', r.frameUrl, '"></form>',
'</div>',
'</body>',
'</html>'
].join('');
// Todo fix bug that occurs here: http://www.reddit.com/r/blog/comments/ddc0w/update_on_the_colbert_rally_time_to_show_our/
var leframe = document.getElementById(r.frameId);
var ledocument = null;
if( leframe.contentDocument ) {
ledocument = leframe.contentDocument;
} else if ( leframe.contentWindow ) { //IE
ledocument = leframe.contentWindow.document;
}
ledocument.write(frameContent);
var postForm = ledocument.getElementById('readabilityPostForm');
for (var inputKey in hiddenInputs) {
if(hiddenInputs.hasOwnProperty(inputKey)) {
var newInput = ledocument.createElement('input');
newInput.type = "hidden";
newInput.name = inputKey;
newInput.id = inputKey;
newInput.value = hiddenInputs[inputKey];
postForm.appendChild(newInput);
}
}
ledocument.write(['<scr', 'ipt type="text/javascript">window.setTimeout(function() { document.getElementById("readabilityPostForm").submit(); }, 1);</scr', 'ipt>'].join(''));
};
readability.frameLoaded = function (frame) {
try {
// Just try to access a restricted part of the document. If we can access it, that means we're not on the loaded doc yet.
x = window[readability.frameId].document;
} catch (e) {
// If we got caught, that means we've loaded the frame. Hide the backgrund elements.
readability.hidePageElements();
}
};
readability.url_is_valid = (function(){
var invalid_list = [
/file:/,
/about:blank/
];
return function(given_url){
var url = given_url ? given_url.toLowerCase() : document.location.href.toLowerCase(),
i;
for(i = 0; i < invalid_list.length; i++){
if(url.search(invalid_list[i]) !== -1){
return false;
}
}
return true;
}
}());
readability.site_in_blacklist = function (){
var site_blacklist = 'www.youtube.com;mail.google.com'.toLowerCase().split(';'),
netloc,
i,
il;
try {
netloc = window.location.href.match(/^https?:\/\/([^\/]*)/)[1];
} catch (e) {
return false; // Was a file:// URL or other non-http URL - gets caught by url_is_valid.
}
for (i = 0, il = site_blacklist.length; i < il; i++) {
if (site_blacklist[i] === netloc) {
return true;
}
}
return false;
};
readability.closeFrame = function() {
var frameContainer = readability.frameContainer;
if (frameContainer) {
frameContainer.style.display = 'none';
}
readability.addDocumentScrolling();
};
readability.init = function(force) {
if (!force && document.getElementById(readability.frameContainerId) !== null) {
readability.frameContainer = document.getElementById(readability.frameContainerId);
readability.frameContainer.style.display = 'block';
readability.removeDocumentScrolling();
return false;
}
/* If we're already on a parsed page */
if (readability.isLocalPage() && document.getElementById('rdb-article') !== null ) {
return;
}
readability.removeScripts(document);
// If we are on our own page, bounce it to the homepage
if (readability.checkDocLocation()) {
readability.listen("message", window, readability.receiveMessage);
readability.openFrame();
}
readability.readabilityToken = window.readabilityToken;
readability.openFrame();
};
} (readability));
// First, check to see if we should even run Readability on this page
if(
readability.url_is_valid() &&
!readability.isLocalPage() && // Make sure we aren't trying to run readability on itself
!readability.site_in_blacklist() // Don't run readability on blacklisted sites
){
if(navigator.userAgent.indexOf('MSIE') !=-1) {
var queryParams = 'url=' + encodeURIComponent(window.top.location) + '&token=' + (typeof(window.readabilityToken) !== "undefined" ? encodeURIComponent(window.readabilityToken) : "");
if(readability.type == "read") {
window.top.location = readability.baseUrl + '/pr?' + queryParams;
} else {
document.scrollTop = 0;
var wrap = document.createElement('div');
wrap.innerHTML = '<iframe src="https://www.readability.com/prl?' + queryParams + '" width="500" height="200" frameBorder="0" allowTransparency="true" style="position: absolute; top: 0; left: 0; width: 100%; height: 100%; z-index: 281823498"></iframe>';
document.body.appendChild(wrap);
readability.listen("message", window, function() {
if (event.origin === readability.baseUrl && event.data) {
if (event.data.indexOf('set_token') === 0) {
window.readabilityToken = event.data.replace('set_token=', '');
readability.readabilityToken = window.readabilityToken;
} else if (event.data == "close_frame"){
wrap.parentNode.removeChild(wrap);
}
}
});
}
} else {
readability.init();
}
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment