Last active
April 2, 2022 19:59
-
-
Save anderseknert/a1f454d8fad9111fd11b2f464d770067 to your computer and use it in GitHub Desktop.
Crawling AWS docs for all CloudFormation resource types. Python vs. Rego!
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python3 | |
import requests | |
def main(): | |
base = "https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide" | |
resp = requests.get(f"{base}/toc-contents.json") | |
body = resp.json() | |
items = [] | |
for section in body["contents"]: | |
if section["href"] == "template-reference.html": | |
for contents in section["contents"]: | |
if "contents" in contents: | |
for item in contents["contents"]: | |
if "include_contents" in item: | |
items.append(item["include_contents"]) | |
resources = [] | |
for item in items: | |
r = requests.get(f"{base}/{item}") | |
contents = r.json() | |
for content in contents["contents"]: | |
if "contents" in content: | |
for item in content["contents"]: | |
if "title" in item: | |
resources.append(item["title"]) | |
print(resources) | |
if __name__ == "__main__": | |
main() |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
package aws.cloudformation | |
base := "https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide" | |
all_resource_types := [resource | page := pages[_]; resource := resources_on_page(page)[_]] { | |
resp := http.send({"method": "GET", "url": sprintf("%s/toc-contents.json", [base]), "force_json_decode": true}) | |
resp.body.contents[section].href == "template-reference.html" | |
pages := [page | page := resp.body.contents[section].contents[_].contents[_].include_contents] | |
} | |
resources_on_page(doc) = [title | title := resp.body.contents[section].contents[_].title] { | |
resp := http.send({"method": "GET", "url": sprintf("%s/%s", [base, doc]), "force_json_decode": true}) | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment