Created
          April 16, 2023 17:00 
        
      - 
      
- 
        Save p1-dta/2c49d5c3eb6bafdd9675bf0bb9001bf1 to your computer and use it in GitHub Desktop. 
    Count how many people are alive per year, based on their birthyear and deathyear, aims for simplicity.
  
        
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
  | import collections | |
| import random | |
| import timeit | |
| pop = [ | |
| (b := random.randint(1900, 2000), random.randint(b + 1, b + 100)) | |
| for _ in range(10000) | |
| ] | |
| # 5.049 s (with 10000 people [1,100] years old) | |
| def count_living_per_year(population: list[tuple[int, int]]) -> dict[int, int]: | |
| living_per_year = {} | |
| for birth, death in population: | |
| for year in range(birth, death): | |
| if year in living_per_year: | |
| living_per_year[year] += 1 | |
| else: | |
| living_per_year[year] = 1 | |
| return living_per_year | |
| print(sorted(tuple(count_living_per_year(pop).items()))) | |
| print( | |
| timeit.timeit( | |
| "count_living_per_year(pop)", | |
| globals=globals(), | |
| number=100, | |
| ) | |
| ) | |
| # 3.697 s (with 10000 people [1,100] years old) | |
| def count_living_per_year(population: list[tuple[int, int]]) -> dict[int, int]: | |
| living_per_year = {} | |
| for birth, death in population: | |
| for year in range(birth, death): | |
| living_per_year[year] = living_per_year.get(year, 0) + 1 | |
| return living_per_year | |
| print(sorted(tuple(count_living_per_year(pop).items()))) | |
| print( | |
| timeit.timeit( | |
| "count_living_per_year(pop)", | |
| globals=globals(), | |
| number=100, | |
| ) | |
| ) | |
| # 3.929 s (with 10000 people [1,100] years old) | |
| def count_living_per_year(population: list[tuple[int, int]]) -> dict[int, int]: | |
| living_per_year = collections.defaultdict(int) | |
| for birth, death in population: | |
| for year in range(birth, death): | |
| living_per_year[year] += 1 | |
| return living_per_year | |
| print(sorted(tuple(count_living_per_year(pop).items()))) | |
| print( | |
| timeit.timeit( | |
| "count_living_per_year(pop)", | |
| globals=globals(), | |
| number=100, | |
| ) | |
| ) | |
| # 4.084 s (with 10000 people [1,100] years old) | |
| def count_living_per_year(population: list[tuple[int, int]]) -> dict[int, int]: | |
| return collections.Counter( | |
| year for birth, death in population for year in range(birth, death) | |
| ) | |
| print(sorted(tuple(count_living_per_year(pop).items()))) | |
| print( | |
| timeit.timeit( | |
| "count_living_per_year(pop)", | |
| globals=globals(), | |
| number=100, | |
| ) | |
| ) | 
  
    Sign up for free
    to join this conversation on GitHub.
    Already have an account?
    Sign in to comment
  
            
ChatGPT helped speed it up a little more using
bincountinstead ofunique.:I looked at
bincountbut wasn't sure how to set theminlength- looks obvious now!