dshorthouse · February 16, 2023 04:03
diff --git a/open_alex_taxonomists_with_orcid.rb b/open_alex_taxonomists_with_orcid.rb
 #!/usr/bin/env ruby
 # encoding: utf-8

 require 'csv'
 require 'rest_client'
 require 'json'

 # OpenAlex "works" query with the page number left open: callers append it
 # to the trailing "page=" parameter. The filter restricts results to concept
 # C58642233 (presumably the taxonomy concept -- confirm against OpenAlex),
 # has_orcid:true and publication year 2023, at 50 results per page.
 # Frozen so the shared constant cannot be mutated in place by accident.
 BASE_URL = "https://api.openalex.org/works?filter=concepts.id:C58642233,has_orcid:true,publication_year:2023&per_page=50&page=".freeze

 # Walks the paged result set behind BASE_URL, starting at +page+, and appends
 # one row per author ORCID to "open_alex.csv" for every work whose title
 # contains "species" or "revision" (case-insensitive).
 #
 # Only the last path segment of each ORCID URL is written. Works without a
 # title and authors without an ORCID are skipped.
 #
 # @param page [Integer] 1-based page number to start from
 # @return [nil]
 #
 # NOTE(review): OpenAlex is believed to cap page-based paging at 10,000
 # results; cursor paging may be needed for larger sets -- confirm.
 def get_data(page:)
   # Open the output once and iterate. Recursing inside the CSV block kept one
   # extra file handle and stack frame alive per page, and let later pages be
   # flushed to disk before earlier ones.
   CSV.open("open_alex.csv", 'ab') do |csv|
     loop do
       response = RestClient.get(BASE_URL + page.to_s)
       data = JSON.parse(response, symbolize_names: true)
       count = data[:meta][:count].to_i
       per_page = data[:meta][:per_page].to_i
       results = Array(data[:results])

       results.each do |result|
         title = result[:title]
         next if title.nil?

         title = title.downcase
         next unless title.include?("species") || title.include?("revision")

         # authorships / author may be missing; treat them as "no ORCID".
         Array(result[:authorships]).each do |authorship|
           orcid = authorship.dig(:author, :orcid)
           csv << [orcid.split("/").last] if orcid
         end
       end

       # Pages 1..page cover per_page * page results, so stop once that
       # reaches the total; this avoids an extra empty request when the total
       # is an exact multiple of the page size. An empty page also ends the
       # walk so inconsistent metadata cannot cause an endless loop.
       break if results.empty? || per_page * page >= count

       page += 1
     end
   end
   nil
 end

 # Script entry point: start harvesting at the first page of results.
 get_data(page: 1)
	#!/usr/bin/env ruby
	# encoding: utf-8

	require 'csv'
	require 'rest_client'
	require 'json'

	# OpenAlex "works" query with the page number left open: callers append it
	# to the trailing "page=" parameter. The filter restricts results to concept
	# C58642233 (presumably the taxonomy concept -- confirm against OpenAlex),
	# has_orcid:true and publication year 2023, at 50 results per page.
	# Frozen so the shared constant cannot be mutated in place by accident.
	BASE_URL = "https://api.openalex.org/works?filter=concepts.id:C58642233,has_orcid:true,publication_year:2023&per_page=50&page=".freeze

	# Walks the paged result set behind BASE_URL, starting at +page+, and appends
	# one row per author ORCID to "open_alex.csv" for every work whose title
	# contains "species" or "revision" (case-insensitive).
	#
	# Only the last path segment of each ORCID URL is written. Works without a
	# title and authors without an ORCID are skipped.
	#
	# @param page [Integer] 1-based page number to start from
	# @return [nil]
	#
	# NOTE(review): OpenAlex is believed to cap page-based paging at 10,000
	# results; cursor paging may be needed for larger sets -- confirm.
	def get_data(page:)
	  # Open the output once and iterate. Recursing inside the CSV block kept one
	  # extra file handle and stack frame alive per page, and let later pages be
	  # flushed to disk before earlier ones.
	  CSV.open("open_alex.csv", 'ab') do |csv|
	    loop do
	      response = RestClient.get(BASE_URL + page.to_s)
	      data = JSON.parse(response, symbolize_names: true)
	      count = data[:meta][:count].to_i
	      per_page = data[:meta][:per_page].to_i
	      results = Array(data[:results])

	      results.each do |result|
	        title = result[:title]
	        next if title.nil?

	        title = title.downcase
	        next unless title.include?("species") || title.include?("revision")

	        # authorships / author may be missing; treat them as "no ORCID".
	        Array(result[:authorships]).each do |authorship|
	          orcid = authorship.dig(:author, :orcid)
	          csv << [orcid.split("/").last] if orcid
	        end
	      end

	      # Pages 1..page cover per_page * page results, so stop once that
	      # reaches the total; this avoids an extra empty request when the total
	      # is an exact multiple of the page size. An empty page also ends the
	      # walk so inconsistent metadata cannot cause an endless loop.
	      break if results.empty? || per_page * page >= count

	      page += 1
	    end
	  end
	  nil
	end

	# Script entry point: start harvesting at the first page of results.
	get_data(page: 1)