lirantal · April 14, 2024 09:21
diff --git a/fetch-updates-snyk-io-website.js b/fetch-updates-snyk-io-website.js
 /**
  * Collects the published changelog entries from the current page.
  *
  * Every element matching `.changelogItem.published` yields one result object.
  * An entry that lacks one of the expected child elements no longer aborts the
  * whole extraction: the affected field falls back to `null` (title, date) or
  * to an empty string (content body) and the remaining entries are still read.
  *
  * @returns {Array<{title: (string|null), datePublished: (string|null), contentBody: string}>}
  *   One object per matched entry, in the order `querySelectorAll` returned them.
  */
 function extractNewsItems() {
    /**
     * Flattens the subtree below `contentElement` into a single string:
     * anchor elements are kept as HTML (their `outerHTML`), text nodes
     * contribute their text, and any other node is replaced by the
     * flattened result of its own children.
     *
     * @param {Node} contentElement - node whose `childNodes` are walked
     * @returns {string} the concatenated text and anchor markup
     */
    function processContent(contentElement) {
        let finalContent = '';
        for (const node of contentElement.childNodes) {
            if (node.nodeType === Node.ELEMENT_NODE && node.tagName === 'A') {
                // Anchors are the only markup that survives; their inner nodes are not walked again.
                finalContent += node.outerHTML;
            } else if (node.nodeType === Node.TEXT_NODE) {
                finalContent += node.nodeValue;
            } else {
                // Any other node: drop the wrapper itself, keep whatever its children produce.
                finalContent += processContent(node);
            }
        }
        return finalContent;
    }

    const newsItems = [];

    for (const item of document.querySelectorAll('.changelogItem.published')) {
        // querySelector returns null when nothing matches, so each lookup is
        // checked before it is dereferenced.
        const titleLink = item.querySelector('h2.title a');
        const timeElement = item.querySelector('.articleMeta time');
        const contentElement = item.querySelector('.content');

        newsItems.push({
            title: titleLink ? titleLink.textContent : null,
            datePublished: timeElement ? timeElement.getAttribute('datetime') : null,
            contentBody: contentElement ? processContent(contentElement) : ''
        });
    }

    return newsItems;
 }

 // Run the extraction against the current document and print the returned
 // array of news item objects to the console.
 console.log(extractNewsItems());
	// Reads every element matching ".changelogItem.published" in the current
	// document and returns one plain object per entry with three fields:
	//   title         - text of the "h2.title a" link, or null if the link is absent
	//   datePublished - "datetime" attribute of ".articleMeta time", or null if absent
	//   contentBody   - the ".content" subtree reduced to text plus anchor HTML,
	//                   or '' if the entry has no ".content" element
	// A missing child element only blanks its own field instead of throwing, so
	// one malformed entry cannot abort the extraction of the others.
	function extractNewsItems() {
		// Reduces the subtree under contentElement to a string: anchor elements
		// are emitted as their outerHTML, text nodes as their text, and every
		// other node is replaced by the reduction of its own children.
		function processContent(contentElement) {
			const pieces = [];
			for (const child of contentElement.childNodes) {
				if (child.nodeType === Node.TEXT_NODE) {
					pieces.push(child.nodeValue);
				} else if (child.nodeType === Node.ELEMENT_NODE && child.tagName === 'A') {
					// Keep the link markup as-is; its children are not visited separately.
					pieces.push(child.outerHTML);
				} else {
					// Wrapper node: discard the tag, keep what is inside it.
					pieces.push(processContent(child));
				}
			}
			return pieces.join('');
		}

		// Builds the result object for a single changelog entry. Each
		// querySelector result is null-checked because it returns null on no match.
		function toNewsItem(item) {
			const titleLink = item.querySelector('h2.title a');
			const timeElement = item.querySelector('.articleMeta time');
			const contentElement = item.querySelector('.content');

			return {
				title: titleLink === null ? null : titleLink.textContent,
				datePublished: timeElement === null ? null : timeElement.getAttribute('datetime'),
				contentBody: contentElement === null ? '' : processContent(contentElement)
			};
		}

		// Array.from turns the query result into a real array while mapping each entry.
		return Array.from(document.querySelectorAll('.changelogItem.published'), (item) => toNewsItem(item));
	}

	// Run the extraction against the current document and print the returned
	// array of news item objects to the console.
	console.log(extractNewsItems());
No results found