Module: Bolognese::DoiUtils

Included in:
CLI, MetadataUtils
Defined in:
lib/bolognese/doi_utils.rb

Instance Method Summary collapse

Instance Method Details

#doi_api_url(doi, options = {}) ⇒ Object



30
31
32
33
# File 'lib/bolognese/doi_utils.rb', line 30

def doi_api_url(doi, options = {})
  sandbox = Array(/handle.stage.datacite.org/.match(doi)).last
  sandbox.present? || options[:sandbox] ? "https://api.stage.datacite.org/dois/#{doi_from_url(doi)}?include=media,client"  : "https://api.datacite.org/dois/#{doi_from_url(doi)}?include=media,client"
end

#doi_as_url(doi) ⇒ Object



50
51
52
# File 'lib/bolognese/doi_utils.rb', line 50

def doi_as_url(doi)
  "https://doi.org/#{doi}" if doi.present?
end

#doi_from_url(url) ⇒ Object



43
44
45
46
47
48
# File 'lib/bolognese/doi_utils.rb', line 43

def doi_from_url(url)
  if /\A(?:(http|https):\/\/(dx\.)?(doi.org|handle.stage.datacite.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(url)
    uri = Addressable::URI.parse(url)
    uri.path.gsub(/^\//, '').downcase
  end
end

#doi_resolver(doi, options = {}) ⇒ Object



25
26
27
28
# File 'lib/bolognese/doi_utils.rb', line 25

def doi_resolver(doi, options = {})
  sandbox = Array(/handle.stage.datacite.org/.match(doi)).last
  sandbox.present? || options[:sandbox] ? "https://handle.stage.datacite.org/" : "https://doi.org/"
end

#get_doi_ra(doi) ⇒ Object

get DOI registration agency



55
56
57
58
59
60
61
62
63
# File 'lib/bolognese/doi_utils.rb', line 55

def get_doi_ra(doi)
  prefix = validate_prefix(doi)
  return nil if prefix.blank?

  url = "https://doi.org/ra/#{prefix}"
  result = Maremma.get(url)

  result.body.dig("data", 0, "RA")
end

#normalize_doi(doi, options = {}) ⇒ Object



35
36
37
38
39
40
41
# File 'lib/bolognese/doi_utils.rb', line 35

def normalize_doi(doi, options = {})
  doi_str = validate_doi(doi)
  return nil unless doi_str.present?

  # turn DOI into URL, escape unsafe characters
  doi_resolver(doi, options) + Addressable::URI.encode(doi_str)
end

#validate_doi(doi) ⇒ Object



5
6
7
8
9
# File 'lib/bolognese/doi_utils.rb', line 5

def validate_doi(doi)
  doi = Array(/\A(?:(http|https):\/(\/)?(dx\.)?(doi.org|handle.stage.datacite.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(doi)).last
  # remove non-printing whitespace and downcase
  doi.delete("\u200B").downcase if doi.present?
end

#validate_funder_doi(doi) ⇒ Object



11
12
13
14
15
16
17
18
19
# File 'lib/bolognese/doi_utils.rb', line 11

def validate_funder_doi(doi)
  doi = Array(/\A(?:(http|https):\/(\/)?(dx\.)?(doi.org|handle.stage.datacite.org|handle.test.datacite.org)\/)?(doi:)?(10\.13039\/)?([1-9]\d+)\z/.match(doi)).last

  # remove non-printing whitespace and downcase
  if doi.present?
    doi.delete("\u200B").downcase
    "https://doi.org/10.13039/#{doi}"
  end
end

#validate_prefix(doi) ⇒ Object



21
22
23
# File 'lib/bolognese/doi_utils.rb', line 21

def validate_prefix(doi)
  Array(/\A(?:(http|https):\/(\/)?(dx\.)?(doi.org|handle.stage.datacite.org|handle.test.datacite.org)\/)?(doi:)?(10\.\d{4,5}).*\z/.match(doi)).last
end