Module: Bolognese::DoiUtils

Included in:
CLI, MetadataUtils
Defined in:
lib/bolognese/doi_utils.rb

Instance Method Summary collapse

Instance Method Details

#doi_api_url(doi, options = {}) ⇒ Object



20
21
22
23
# File 'lib/bolognese/doi_utils.rb', line 20

def doi_api_url(doi, options = {})
  sandbox = Array(/handle.test.datacite.org/.match(doi)).last
  sandbox.present? || options[:sandbox] ? "https://api.test.datacite.org/dois/" + doi_from_url(doi) : "https://api.datacite.org/dois/" + doi_from_url(doi)
end

#doi_as_url(doi) ⇒ Object



40
41
42
# File 'lib/bolognese/doi_utils.rb', line 40

def doi_as_url(doi)
  "https://doi.org/#{doi}" if doi.present?
end

#doi_from_url(url) ⇒ Object



33
34
35
36
37
38
# File 'lib/bolognese/doi_utils.rb', line 33

def doi_from_url(url)
  if /\A(?:(http|https):\/\/(dx\.)?(doi.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(url)
    uri = Addressable::URI.parse(url)
    uri.path.gsub(/^\//, '').downcase
  end
end

#doi_resolver(doi, options = {}) ⇒ Object



15
16
17
18
# File 'lib/bolognese/doi_utils.rb', line 15

def doi_resolver(doi, options = {})
  sandbox = Array(/handle.test.datacite.org/.match(doi)).last
  sandbox.present? || options[:sandbox] ? "https://handle.test.datacite.org/" : "https://doi.org/"
end

#get_doi_ra(doi) ⇒ Object

get DOI registration agency



45
46
47
48
49
50
51
52
53
# File 'lib/bolognese/doi_utils.rb', line 45

def get_doi_ra(doi)
  prefix = validate_prefix(doi)
  return nil if prefix.blank?

  url = "https://doi.org/ra/#{prefix}"
  result = Maremma.get(url)

  result.body.dig("data", 0, "RA")
end

#normalize_doi(doi, options = {}) ⇒ Object



25
26
27
28
29
30
31
# File 'lib/bolognese/doi_utils.rb', line 25

def normalize_doi(doi, options = {})
  doi_str = validate_doi(doi)
  return nil unless doi_str.present?

  # turn DOI into URL, escape unsafe characters
  doi_resolver(doi, options) + Addressable::URI.encode(doi_str)
end

#validate_doi(doi) ⇒ Object



5
6
7
8
9
# File 'lib/bolognese/doi_utils.rb', line 5

def validate_doi(doi)
  doi = Array(/\A(?:(http|https):\/(\/)?(dx\.)?(doi.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(doi)).last
  # remove non-printing whitespace and downcase
  doi.delete("\u200B").downcase if doi.present?
end

#validate_prefix(doi) ⇒ Object



11
12
13
# File 'lib/bolognese/doi_utils.rb', line 11

def validate_prefix(doi)
  Array(/\A(?:(http|https):\/(\/)?(dx\.)?(doi.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}).*\z/.match(doi)).last
end