Skip to content

Instantly share code, notes, and snippets.

@pixelbrackets
Created March 28, 2025 10:35
Show Gist options
  • Save pixelbrackets/186d7955993d0f8c47a62c61fb5dd1c5 to your computer and use it in GitHub Desktop.
Save pixelbrackets/186d7955993d0f8c47a62c61fb5dd1c5 to your computer and use it in GitHub Desktop.
sitemap.xml XML to HTML visualisation
<?php
// composer require guzzlehttp/guzzle pixelbrackets/html5-mini-template
require 'vendor/autoload.php';
use GuzzleHttp\Client;
function fetchSitemapUrls(string $sitemapUrl, Client $client): array {
$response = $client->get($sitemapUrl);
$xml = simplexml_load_string($response->getBody()->getContents());
$urls = [];
if (isset($xml->sitemap)) {
foreach ($xml->sitemap as $sitemap) {
$urls = array_merge($urls, fetchSitemapUrls((string)$sitemap->loc, $client));
}
} elseif (isset($xml->url)) {
foreach ($xml->url as $url) {
$urls[] = (string)$url->loc;
}
}
return $urls;
}
function buildHierarchy(array $urls, int $maxLevel = 4): array {
$tree = [];
foreach ($urls as $url) {
$parts = parse_url($url);
$parts['path'] = isset($parts['path']) ? $parts['path'] : '';
$pathSegments = explode('/', trim($parts['path'], '/'));
// Only include up to maxLevel
$pathSegments = array_slice($pathSegments, 0, $maxLevel);
$current =& $tree;
foreach ($pathSegments as $segment) {
if (!isset($current[$segment])) {
$current[$segment] = [];
}
$current =& $current[$segment];
}
}
return $tree;
}
function generateHtml(array $tree, string $baseUrl, bool $skipShortlinks = true, string $path = ''): string {
$html = PHP_EOL . '<ul>';
foreach ($tree as $segment => $children) {
// Skip shortlinks (first-level item with no subpages)
if ($path === '' && empty($children)) {
continue;
}
// Guess the correct title
$formattedTitle = ucwords(str_replace('-', ' ', $segment));
$fullPath = $path . '/' . $segment;
$html .= PHP_EOL . ' <li><a href="' . $baseUrl . $fullPath . '">' . $formattedTitle . '</a><!--<span>/' . $segment . '</span>-->';
if (!empty($children)) {
$html .= generateHtml($children, $baseUrl, true, $fullPath);
}
$html .= '</li>';
}
$html .= PHP_EOL . '</ul>';
return $html;
}
$client = new Client();
$sitemapUrl = 'https://example.com/sitemap.xml';
$urls = fetchSitemapUrls($sitemapUrl, $client);
$hierarchy = buildHierarchy($urls, 3);
$baseUrl = parse_url($sitemapUrl, PHP_URL_SCHEME) . '://' . parse_url($sitemapUrl, PHP_URL_HOST);
$htmlOutput = generateHtml($hierarchy, $baseUrl);
$template = (new \Pixelbrackets\Html5MiniTemplate\Html5MiniTemplate())
->setStylesheet('https://raw.githubusercontent.com/astuteo/slickmap/refs/heads/master/slickmap.css')
->setTitle('Sitemap')
->setContent('<div class="sitemap"><nav class="primaryNav">' . $htmlOutput . '</nav></div>');
echo $template->getMarkup();
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment