Created
April 8, 2022 15:00
-
-
Save Steboss89/9d1dc02c8c2dfa09588391f5f7cdf873 to your computer and use it in GitHub Desktop.
Subdivide books into Old and New Testament
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| import os | |
# Output directory, created up front if it is missing.
output = "books"
# exist_ok=True keeps this idempotent and avoids the race between an
# os.path.exists() check and the subsequent creation.
os.makedirs(output, exist_ok=True)
# Load the whole text as a list of lines (trailing newlines are kept).
# The context manager guarantees the file handle is closed after the read.
with open("cleaned_bible.txt", "r") as bible_file:
    lines = bible_file.readlines()
# Book names, in order of first appearance.
books = []
# Book name -> list of line indices into `lines`.
books_idx = {}
# Some books come in numbered parts (First of, Second of, ...). For those,
# the first token of a heading is only the ordinal, so the second token is
# needed to build the full name.
multinames = ["Kings", "Paralipomenon", "Esdras", "Machabees",
              "Corinthians", "Thessalonians", "Timothy", "Peter", "John"]
# Names of the Old Testament books, written the way the scan builds them
# (ordinal and name joined without a space, e.g. "1Kings").
# "Jonas" was previously misspelled "Joans", which could never match.
old_books = ["Genesis", "Exodus", "Leviticus", "Numbers", "Deuteronomy", "Josue",
             "Judges", "Ruth", "1Kings", "2Kings", "3Kings", "4Kings",
             "1Paralipomenon", "2Paralipomenon", "1Esdras", "2Esdras",
             "Tobias", "Judith", "Esther", "Job", "Psalms", "Proverbs",
             "Ecclesiastes", "Canticle", "Wisdom", "Ecclesiasticus", "Isaias",
             "Jeremias", "Lamentations", "Baruch", "Ezechiel",
             "Daniel", "Osee", "Joel", "Amos", "Abdias", "Jonas", "Micheas",
             "Nahum", "Habacuc", "Sophonias", "Aggeus", "Zacharias", "Malachias",
             "1Machabees", "2Machabees"]
# Scan the text for chapter headings. The first time a book name is seen,
# record the line index where it starts; that same index is also appended to
# the previously started book's entry, marking where that book stops.
# NOTE(review): the last book never gets a closing index inside this loop --
# confirm that whatever consumes books_idx accounts for that.
tmp_book = None  # most recently started book; None until the first heading
for i, val in enumerate(lines):
    # Retrieve all the chapters.
    if "Chapter" not in val:
        continue
    tokens = val.split()
    # Lines with fewer than two tokens cannot carry a book name plus the
    # word "Chapter"; indexing tokens[1] on them would raise IndexError.
    if len(tokens) < 2:
        continue
    book_name = tokens[0]
    possible_further_name = tokens[1]
    # For numbered books the first token is the ordinal and the second the
    # actual name, so the two are glued together (e.g. "1" + "Kings").
    if possible_further_name in multinames:
        current_book_name = book_name + possible_further_name
    else:
        current_book_name = book_name
    if current_book_name not in books:
        print(f"Adding {current_book_name} to books, starting idx {i}")
        # Close the previous book, if there is one. Checking for None
        # (instead of i == 0) avoids a NameError when the first heading is
        # not on the very first line of the file.
        if tmp_book is not None:
            books_idx[tmp_book].append(i)
        tmp_book = current_book_name
        books.append(current_book_name)
        books_idx[current_book_name] = [i]
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment