diff --git a/scripts/update_oai-pmh.rb b/scripts/update_oai-pmh.rb index d94a368c5269107ce684287fd8d1b40b3c3514bc..e98ab25267ec95548bfc86aeb6a0932b438b4f0f 100644 --- a/scripts/update_oai-pmh.rb +++ b/scripts/update_oai-pmh.rb @@ -17,12 +17,11 @@ class OaiPmhClient persistent_connection_adapter - headers {"User-Agent" => "LEAPS-WG3-client/0.1"} + headers 'User-Agent' => 'LEAPS-WG3-client/0.1' def initialize(oai_pmh_endpoint, from_id=nil) self.class.base_uri oai_pmh_endpoint - - # TODO add from_id support as 'From' request header + self.class.headers "From" => from_id if from_id # WORK_AROUND: The connection adapter is persistent across multiple # URLs (which is good), but the adapter+connection-caching somehow @@ -233,6 +232,27 @@ class SeriesStatistics end end +# Try to discover someone's email address by looking in various likely +# configuration files. Returns the email address if it's unambiguous. +def find_email_address + candidate_emails = [] + + # Look in Zoom + zoomConfig = File.expand_path("~/.config/zoomus.conf") + if File.file?(zoomConfig) + File.open( zoomConfig ).each do |line| + if line =~ /^userEmailAddress=(.*?)$/ + candidate_emails.append($1) + end + end + end + + # TODO Look in Thunderbird + #find ~.thunderbird -name prefs.js | xargs sed -n 's/user_pref."mail.identity.id1.useremail", "\([^"]*\)".*/\1/p' + + # Return email address if there is no ambiguity. + return candidate_emails.uniq.count == 1 ? candidate_emails[0] : nil +end def check_oai_pmh_endpoint(endpoint_url) queryIdentify_url = endpoint_url + "?verb=Identify" @@ -423,6 +443,13 @@ up_to_date = true file_path = '_data/facilities.yml' facilities = YAML.safe_load(File.read(file_path), permitted_classes: [Date]) +email_address = find_email_address +if email_address + puts "INFO: identifying OAI-PMH activity as from <#{email_address}>" +else + puts "WARNING: unable to discover your email address. Carrying on under a cloak of anonymity." +end + facilities.each do |facility| odr = facility['odr'] next unless odr && odr.key?('oai-pmh-endpoint') @@ -433,7 +460,7 @@ facilities.each do |facility| oai_pmh_endpoint = oai_pmh['link'] next unless oai_pmh_endpoint - $client = OaiPmhClient.new(oai_pmh_endpoint) + $client = OaiPmhClient.new(oai_pmh_endpoint, email_address) expected_status = oai_pmh['status']