Skip to content

Instantly share code, notes, and snippets.

@rnjailamba
Last active January 2, 2025 14:00
Show Gist options
  • Save rnjailamba/25803d8c887702af14ca4aeed45e8554 to your computer and use it in GitHub Desktop.
Save rnjailamba/25803d8c887702af14ca4aeed45e8554 to your computer and use it in GitHub Desktop.
//twitter download bookmarks
var before_start, after_finished, before_loop, after_element_clicked;
before_start = 1000;
after_finished = before_start;
before_loop = 1200;
after_element_clicked = before_loop - 1000;
var scroll_count = 1200;
var startTime, endTime;
start();
var elementsToResize = [];//['body', 'html', 'div[id="react-root"]', 'div[id="react-root"] div', 'div[id="react-root"] div div', 'div[id="react-root"] div div div:nth-child(3)', 'div[aria-label="Timeline: Bookmarks"]', 'div[aria-label="Timeline: Bookmarks"] div', 'section[aria-labelledby="accessible-list-0"]', 'section[aria-labelledby="accessible-list-1"]', 'div[aria-label="Home timeline"]', 'div[aria-label="Home timeline"] div:nth-child(4)', 'div[data-testid="primaryColumn"]', 'main[role="main"]', 'main[role="main"] div', 'main[role="main"] div div', 'main[role="main"] div div div'];
for (var j = 0; j < elementsToResize.length; j++) {
var elementToResize = elementsToResize[j];
if(document.querySelector(elementToResize)){
document.querySelector(elementToResize).style.setProperty('max-height', '100%', 'important');
document.querySelector(elementToResize).style.setProperty('height', '100%', 'important');
//document.querySelector(elementToResize).style.setProperty('max-width', '100%', 'important');
document.querySelector(elementToResize).style.setProperty('width', '100%', 'important');
}
}
//document.querySelectorAll('header[role="banner"]').forEach(e => e.remove());
//var z = prompt('Set zoom level!');
//document.body.style.zoom = parseFloat(1);
var allBookmarks = [["Name", "Handle", "Date", "Bookmarked Tweet Text", "Quote Tweet Text", "Link"]];
var allBookmarksAsStringArray = [];
var previousBookmarksLength = [-1];
var twitterShortUrls = [];
var originalUrls = {};
setTimeout(function() {
var index = 0;
function loopThroughBookmarks() {
setTimeout(function() { // call a setTimeout when the loop is called
var divs = document.querySelectorAll('div[data-testid="cellInnerDiv"]');
//console.log('Number of bookmarks: ', divs.length);
for (var i = 0; i < divs.length; i++) {
var bookmark = [];
var divVariable = divs[i];
var tweetTexts = divVariable.querySelectorAll('div[data-testid="tweetText"]');
var links = divVariable.querySelectorAll('a');
var hrefValue = "";
for(var j = 0; j < links.length; j++){
var node = links[j];
if(node.toString().includes("t.co")){
//console.log(node);
var hrefMatch = node.outerHTML.match(/href="([^"]*)"/);
if (hrefMatch) {
twitterShortUrls.push(hrefMatch[1]);
hrefValue = hrefValue + " " + hrefMatch[1];
//console.log('href value:', hrefMatch[1]);
//console.log(twitterShortUrls);
}
}
}
var tweetURL = "";
for(var j = 0; j < links.length; j++){
var node = links[j];
if(node.toString().includes("/status/")){
//console.log(node);
var hrefMatch = node.outerHTML.match(/href="([^"]*)"/);
if (hrefMatch) {
tweetURL = hrefMatch[1];
//console.log('tweetURL value:', tweetURL);
break;
}
}
}
//console.log(i);
var retrySpans = document.evaluate("//span[contains(., 'Retry')]", document, null, XPathResult.ANY_TYPE, null );
var retrySpan = retrySpans.iterateNext();
if(retrySpan){
retrySpan.click();
}
//scroll to bottom
if(tweetTexts && tweetTexts.length > 0 && tweetTexts[0].innerText.length > 0 && tweetTexts[0].innerText != "Retry" && allBookmarksAsStringArray.indexOf(tweetTexts[0].innerText) === -1){
var bookmarkedTweetText = divVariable.innerText;
var quoteTweetText = "";
allBookmarksAsStringArray.push(tweetTexts[0].innerText);
// seperate and clean text
for(var j = 0; j < 4; j++){
if(bookmarkedTweetText.slice(-1) == 'K' || bookmarkedTweetText.slice(-1) == 'M' || bookmarkedTweetText.slice(-1) == 'B'){
bookmarkedTweetText = bookmarkedTweetText.substring(0, bookmarkedTweetText.length - 1);
}
if(bookmarkedTweetText.lastIndexOf("\n")>0) {
//console.log(bookmarkedTweetText.substring(bookmarkedTweetText.lastIndexOf("\n")));
if(!isNaN(bookmarkedTweetText.substring(bookmarkedTweetText.lastIndexOf("\n"))))
bookmarkedTweetText = bookmarkedTweetText.substring(0, bookmarkedTweetText.lastIndexOf("\n"));
}
}
if(tweetTexts.length > 1){
quoteTweetText = tweetTexts[1].innerText;
}
//console.log("last char " + bookmarkedTweetText.slice(-1));
if(bookmarkedTweetText.slice(-1) == '…'){
bookmarkedTweetText = bookmarkedTweetText.substring(0, bookmarkedTweetText.length - 1);
}
var name = bookmarkedTweetText.substr(0, bookmarkedTweetText.indexOf("\n"));
bookmarkedTweetText = bookmarkedTweetText.substr(bookmarkedTweetText.indexOf("\n")+1);
//console.log(name);
var handle = bookmarkedTweetText.substr(0, bookmarkedTweetText.indexOf("\n"));
bookmarkedTweetText = bookmarkedTweetText.substr(bookmarkedTweetText.indexOf("\n")+1);
//console.log(handle);
var third_line = bookmarkedTweetText.substr(0, bookmarkedTweetText.indexOf("\n"));
bookmarkedTweetText = bookmarkedTweetText.substr(bookmarkedTweetText.indexOf("\n")+1);
var date = bookmarkedTweetText.substr(0, bookmarkedTweetText.indexOf("\n"));
bookmarkedTweetText = bookmarkedTweetText.substr(bookmarkedTweetText.indexOf("\n")+1);
//console.log(date);
quoteTweetText = quoteTweetText.replaceAll('…', '');
bookmark.push(name);
bookmark.push("https://x.com/" + handle);
bookmark.push(date);
if(hrefValue)
hrefValue = "\nURLs:" + removeDuplicateWords(hrefValue);
bookmark.push(tweetTexts[0].innerText.replace(/(\r\n|\n|\r)@([a-zA-Z0-9_]+)/g, '@$2').replace(/@([a-zA-Z0-9_]+)(\r\n|\n|\r)/g, '@$1').replaceAll('…', '') + hrefValue);//was ' @$2' '@$1 '
bookmark.push(quoteTweetText);
//console.log("https://x.com" + tweetURL);
bookmark.push("https://x.com" + tweetURL);
allBookmarks.push(bookmark);
//console.table("BOOKMARKED MESSAGE(INFO) -> " + tweetTexts[0].innerText.replace(/(?<!\w)\n(?=@[a-zA-Z0-9_]+)/g, " ").replaceAll('…', ''));
//console.log("QUOTED BOOKMARKED MESSAGE(INFO) -> " + quoteTweetText);
}
else {
//console.log("This item already exists");
}
}
index++;
if (index < scroll_count) {
var allEqual = checkAllElementsEqual(previousBookmarksLength, allBookmarks.length);
console.log(previousBookmarksLength);
console.log(allBookmarks.length);
console.log(allEqual);// IMPORTANT: The moment this is true we're done in the ideal case of scrolling down to the end
if (allEqual && divs[divs.length - 1].outerHTML.indexOf('role="progressbar') === -1 && divs[divs.length - 1].innerText === ""){
console.log("Last element text:" + divs[divs.length - 1].innerText);
//console.log(divs);
//console.log(divs[divs.length - 1].outerHTML);
index = scroll_count;// go to the else in the next iteration and print csv, empty inner text means last element
}
previousBookmarksLength.push(allBookmarks.length);
previousBookmarksLength.splice(0, previousBookmarksLength.length - 20);//keep only last 20 elements
console.log('looping again ' + index + " " + allBookmarks.length);
//window.scrollTo(0, document.body.scrollHeight); //document.body.scrollHeight
window.scrollBy(0, 2*window.innerHeight);
loopThroughBookmarks();
}
else {
setTimeout(() => {
var shortUrls = twitterShortUrls;
var fetchPromises = shortUrls.map(url => {
return fetch(url)
.then(response => response.text())
.then(data => {
originalUrls[url] = findFirstUrl(data);
})
.catch(error => console.error('Error:', error));
});
Promise.all(fetchPromises)
.then(() => {
//console.log(originalUrls);
console.log("🟢🟢🟢🟢🟢===== CSV Data Start =====🟢🟢🟢🟢🟢");
console.log(arrayToCSV(allBookmarks));
console.log("🟢🟢🟢🟢🟢===== CSV Data End =====🟢🟢🟢🟢🟢");
console.log("🟢🟢🟢🟢🟢===== HTML Data Start =====🟢🟢🟢🟢🟢");
console.log(arrayToHTML(allBookmarks));
console.log("🟢🟢🟢🟢🟢===== HTML Data End =====🟢🟢🟢🟢🟢");
})
.catch(error => console.error('Error:', error));
function arrayToHTML(tableData) {
var table = document.createElement('table');
var tableBody = document.createElement('tbody');
tableData.forEach(function(rowData) {
var row = document.createElement('tr');
rowData.forEach(function(cellData) {
var cell = document.createElement('td');
cell.appendChild(document.createTextNode(cellData));
cell.innerHTML = replaceDomainUrlsWithMap(cell.innerHTML, "t.co", originalUrls);
cell.innerHTML = cell.innerHTML.replace(
/((http|https|ftp|ftps)\:\/\/[a-zA-Z0-9\-\.]+\.[a-zA-Z]{2,3}(\/\S*)?)/g,
'<a href="$1">$1</a>');
row.appendChild(cell);
});
tableBody.appendChild(row);
});
table.appendChild(tableBody);
//document.body.appendChild(table);
return `
<html>
<style>
a, span, tr { white-space: pre !important; }
table, th, td {
border: 1px solid !important;
border-collapse: collapse !important;
}
table { display: block !important; width: 100% !important; }
td {
word-break: break-word !important;
word-break: break-all !important;
word-wrap: break-word !important;
overflow-wrap: break-word !important;
white-space: pre-wrap !important;
-moz-white-space: pre-wrap !important;
min-width: 50px !important;
max-width: 500px !important;
}
</style>
<head>
<meta charset="utf-8">
<title>Twitter Bookmarks ${(/* @__PURE__ */ new Date()).toISOString()}</title>
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/[email protected]/dist/css/bootstrap.min.css">
</head>
<body>
${table.outerHTML}
</body>
</html>
`;
}
function arrayToCSV(data){
end();
return data.map(row =>
row
.map(String) // convert every value to String
.map(String => replaceDomainUrlsWithMap(String, "t.co", originalUrls))
.map(v => v.replaceAll('"', '""')) // escape double quotes
.map(v => `"${v}"`) // quote it
.join(',') // comma-separated
).join('\r\n'); // rows starting on new lines
}
}, after_finished);
}
}, before_loop)
}
loopThroughBookmarks();
}, before_start); // Adjust delay as needed
function checkAllElementsEqual(array, number) {
return array.every(element => element === number);
}
function removeDuplicateWords(text) {
var seenWords = new Set();
var uniqueWords = [];
for (var word of text.split(/\s+/)) {
if (!seenWords.has(word)) {
uniqueWords.push(word);
seenWords.add(word);
}
}
return uniqueWords.join(" ");
}
function replaceDomainUrlsWithMap(text, targetDomain, urlMap) {
const urlRegex = new RegExp(`https?:\/\/(www\.)?(\w+\.)?${targetDomain}([-a-zA-Z0-9@:%_\+.~#?&//=]*)`, 'gi');
return text.replace(urlRegex, (match) => {
return urlMap[match] || match; // Use mapped URL if available, otherwise keep original URL
});
}
function findFirstUrl(text) {
const urlRegex = /https?:\/\/(www\.)?[-a-zA-Z0-9@:%._\+~#=]{1,256}\.[a-zA-Z0-9()]{1,6}\b([-a-zA-Z0-9()@:%_\+.~#?&//=]*)/g;
const match = text.match(urlRegex);
return match ? match[0] : null; // Return the first URL or null if none found
}
function start() {
startTime = new Date();
};
function end() {
endTime = new Date();
var timeDiff = endTime - startTime; //in ms
// strip the ms
timeDiff /= 1000;
// get seconds
var seconds = Math.round(timeDiff);
console.log(seconds + " seconds");
}
window.onblur = null;
window.blurred = false;
window.document.hasFocus = function () {return true;};
window.document.onFocus = function () {return true;};
window.document.onBlur = function () {return false;};
Object.defineProperty(document, "hidden", { value : false});
Object.defineProperty(document, "mozHidden", { value : false});
Object.defineProperty(document, "msHidden", { value : false});
Object.defineProperty(document, "webkitHidden", { value : false});
Object.defineProperty(document, 'visibilityState', { get: function () { return "visible"; } });
window.document.onvisibilitychange = undefined;
for (event_name of ["visibilitychange",
"webkitvisibilitychange",
"focus",
"blur", // may cause issues on some websites
"mozvisibilitychange",
"msvisibilitychange"]) {
window.addEventListener(event_name, function(event) {
event.preventDefault();
event.stopImmediatePropagation();
event.stopPropagation();
}, true);
}
// Try to trick the site into thinking it's never hidden
Object.defineProperty(document, 'hidden', {value: false, writable: false});
Object.defineProperty(document, 'mozHidden', {value: false, writable: false});
Object.defineProperty(document, 'webkitHidden', {value: false, writable: false});
//Object.defineProperty(document, 'visibilityState', {value: 'visible', writable: false});
Object.defineProperty(document, 'webkitVisibilityState', {value: 'visible', writable: false});
document.dispatchEvent(new Event('visibilitychange'));
document.hasFocus = function () { return true; };
// visibilitychange events are captured and stopped
document.addEventListener('visibilitychange', function(e) {
e.stopImmediatePropagation();
}, true, true);
// Set the player quality to "Source"
window.localStorage.setItem('s-qs-ts', Math.floor(Date.now()));
window.localStorage.setItem('video-quality', '{"default":"chunked"}');
var checkVisibility = function() {
console.log(document.visibilityState);
};
setInterval(checkVisibility, 1);

Instructions:

  1. Open bookmarks page https://x.com/i/bookmarks
  2. Copy above script to console and click enter
  3. Wait and get both CSV and HTML formatted data in the end
  4. Copy the CSV data to any editor like sublime text and name the file xyz.csv and import it into google sheets.
  5. Copy the HTML data to any editor and name the file xyz.html and open it in chrome.

FAQ

  1. Not gauranteed to work perfectly, fails sometimes due to (a) twitter api requests failing, (b) bad internet, (c) not all bookmarks showing up in the output.
  2. You may need to run it few times as a result
  3. Relies on front end not on API calls, which would've been a better idea as retries would've been possible.
  4. Recommended free alternative is BookmarkPilot chrome extension, actually use it more but an issue is lack of full links which are important.

Features:

  1. Original full links (in addition to t.co short links)
  2. Original formatting
  3. Quote tweet text
  4. Auto scroll through 1000s of tweets
  5. Handle Retry errors due to slow internet/ rate limits
  6. Simple one page script
    • that does one thing without dependencies
    • that can be understood and fixed/ improved by others.

Features: Minimal CSV file that can be fed into GPT or saved in Google Sheets. Minimal HTML file if you want to upload to your webserver or view on local browser.

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment