diff --git a/Gemfile.lock b/Gemfile.lock index 9d844b19..c4e4d013 100644 --- a/Gemfile.lock +++ b/Gemfile.lock @@ -1,7 +1,7 @@ PATH remote: . specs: - bolognese (1.8.2) + bolognese (1.8.3) activesupport (>= 4.2.5) benchmark_methods (~> 0.7) bibtex-ruby (>= 5.1.0) @@ -58,7 +58,8 @@ GEM csl (~> 1.0) diff-lcs (1.4.4) docile (1.3.2) - ebnf (2.1.0) + ebnf (2.1.1) + htmlentities (~> 4.3) rdf (~> 3.1) scanf (~> 1.0) sxp (~> 1.1) @@ -120,7 +121,7 @@ GEM namae (1.0.1) nokogiri (1.10.10) mini_portile2 (~> 2.4.0) - oj (3.10.7) + oj (3.10.8) oj_mimic_json (1.0.1) optimist (3.0.1) postrank-uri (1.0.24) diff --git a/lib/bolognese/readers/crossref_reader.rb b/lib/bolognese/readers/crossref_reader.rb index 00a00e8b..7bc2c018 100644 --- a/lib/bolognese/readers/crossref_reader.rb +++ b/lib/bolognese/readers/crossref_reader.rb @@ -41,6 +41,7 @@ def read_crossref(string: nil, **options) journal_issue = {} journal_metadata = nil publisher = query.dig("crm_item", 0) + publisher = nil unless publisher.is_a?(String) case model when "book" @@ -69,7 +70,7 @@ def read_crossref(string: nil, **options) end when "posted_content" bibliographic_metadata = meta.dig("crossref", "posted_content").to_h - publisher = bibliographic_metadata.dig("institution", "institution_name") + publisher ||= bibliographic_metadata.dig("institution", "institution_name") when "sa_component" bibliographic_metadata = meta.dig("crossref", "sa_component", "component_list", "component").to_h related_identifier = Array.wrap(query.to_h["crm_item"]).find { |cr| cr["name"] == "relation" } diff --git a/lib/bolognese/version.rb b/lib/bolognese/version.rb index d9325f46..371a3062 100644 --- a/lib/bolognese/version.rb +++ b/lib/bolognese/version.rb @@ -1,3 +1,3 @@ module Bolognese - VERSION = "1.8.2" + VERSION = "1.8.3" end diff --git a/spec/fixtures/vcr_cassettes/Bolognese_Metadata/get_crossref_metadata/posted_content_copernicus.yml b/spec/fixtures/vcr_cassettes/Bolognese_Metadata/get_crossref_metadata/posted_content_copernicus.yml new file mode 100644 index 00000000..7c8fc1e6 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/Bolognese_Metadata/get_crossref_metadata/posted_content_copernicus.yml @@ -0,0 +1,94 @@ +--- +http_interactions: +- request: + method: get + uri: https://doi.org/ra/10.5194 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.7.1; mailto:info@datacite.org) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: '' + headers: + Date: + - Wed, 29 Jul 2020 06:09:32 GMT + Content-Type: + - application/json;charset=UTF-8 + Connection: + - keep-alive + Set-Cookie: + - __cfduid=d405b79b8c70ba4b495e3fcba1355b80c1596002972; expires=Fri, 28-Aug-20 + 06:09:32 GMT; path=/; domain=.doi.org; HttpOnly; SameSite=Lax; Secure + Cf-Cache-Status: + - DYNAMIC + Cf-Request-Id: + - 043ac9cad6000005bbc5b4f200000001 + Expect-Ct: + - max-age=604800, report-uri="https://report-uri.cloudflare.com/cdn-cgi/beacon/expect-ct" + Strict-Transport-Security: + - max-age=31536000; includeSubDomains; preload + Server: + - cloudflare + Cf-Ray: + - 5ba4abf15d0705bb-FRA + body: + encoding: ASCII-8BIT + string: |- + [ + { + "DOI": "10.5194", + "RA": "Crossref" + } + ] + http_version: + recorded_at: Wed, 29 Jul 2020 06:09:32 GMT +- request: + method: get + uri: https://api.crossref.org/works/10.5194/cp-2020-95/transform/application/vnd.crossref.unixsd+xml + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.7.1; mailto:info@datacite.org) + Accept: + - text/xml + response: + status: + code: 200 + message: OK + headers: + Link: + - ; rel="canonical", ; + rel="license", ; title="Jun Shao"; rel="author", + ; title="Laurie Menviel"; rel="author", + ; title="Mayhar Mohtadi"; rel="author" + Access-Control-Allow-Origin: + - "*" + Access-Control-Allow-Headers: + - X-Requested-With + Content-Length: + - '7366' + Server: + - http-kit + Date: + - Wed, 29 Jul 2020 06:09:33 GMT + X-Rate-Limit-Limit: + - '50' + X-Rate-Limit-Interval: + - 1s + Connection: + - close + body: + encoding: ASCII-8BIT + string: !binary |- + <?xml version="1.0" encoding="UTF-8"?>
<crossref_result xmlns="http://www.crossref.org/qrschema/3.0" version="3.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.crossref.org/qrschema/3.0 http://www.crossref.org/schemas/crossref_query_output3.0.xsd">
  <query_result>
    <head>
      <doi_batch_id>none</doi_batch_id>
    </head>
    <body>
      <query status="resolved">
        <doi type="posted_content">10.5194/cp-2020-95</doi>
        <crm-item name="publisher-name" type="string">Copernicus GmbH</crm-item>
        <crm-item name="prefix-name" type="string">Copernicus GmbH</crm-item>
        <crm-item name="member-id" type="number">3145</crm-item>
        <crm-item name="citation-id" type="number">118318151</crm-item>
        <crm-item name="book-id" type="number">3430342</crm-item>
        <crm-item name="deposit-timestamp" type="number">20200728073631</crm-item>
        <crm-item name="owner-prefix" type="string">10.5194</crm-item>
        <crm-item name="last-update" type="date">2020-07-28T09:16:11Z</crm-item>
        <crm-item name="created" type="date">2020-07-28T09:16:10Z</crm-item>
        <crm-item name="citedby-count" type="number">0</crm-item>
        <crm-item name="relation" type="doi" claim="isSupplementTo">10.5194/cp-2020-95-supplement</crm-item>
        <doi_record>
          <crossref xmlns="http://www.crossref.org/xschema/1.1" xsi:schemaLocation="http://www.crossref.org/xschema/1.1 http://doi.crossref.org/schemas/unixref1.1.xsd">
            <posted_content type="preprint">
              <group_title>Carbon Cycle/Modelling only/Millenial/D-O</group_title>
              <contributors>
                <person_name sequence="first" contributor_role="author">
                  <given_name>Jun</given_name>
                  <surname>Shao</surname>
                  <ORCID>https://orcid.org/0000-0001-6130-6474</ORCID>
                </person_name>
                <person_name sequence="additional" contributor_role="author">
                  <given_name>Lowell D</given_name>
                  <surname>Stott</surname>
                </person_name>
                <person_name sequence="additional" contributor_role="author">
                  <given_name>Laurie</given_name>
                  <surname>Menviel</surname>
                  <ORCID>https://orcid.org/0000-0002-5068-1591</ORCID>
                </person_name>
                <person_name sequence="additional" contributor_role="author">
                  <given_name>Andy</given_name>
                  <surname>Ridgwell</surname>
                </person_name>
                <person_name sequence="additional" contributor_role="author">
                  <given_name>Malin</given_name>
                  <surname>Ödalen</surname>
                </person_name>
                <person_name sequence="additional" contributor_role="author">
                  <given_name>Mayhar</given_name>
                  <surname>Mohtadi</surname>
                  <ORCID>https://orcid.org/0000-0003-3306-0969</ORCID>
                </person_name>
              </contributors>
              <titles>
                <title>The Atmospheric Bridge Communicated the δ&amp;lt;sup&amp;gt;13&amp;lt;/sup&amp;gt;C Declineduring the Last Deglaciation to the Global Upper Ocean</title>
              </titles>
              <posted_date>
                <month>7</month>
                <day>28</day>
                <year>2020</year>
              </posted_date>
              <jats:abstract xmlns:jats="http://www.ncbi.nlm.nih.gov/JATS1">
                <jats:p><![CDATA[Abstract. During the early last glacial termination (17.2–15 ka) atmospheric δ13C declined sharply by 0.3–0.4 ‰ as atmospheric pCO2 rose. This was the initial part of the atmospheric δ13C excursion that lasted for multiple thousand years. A similar δ13C decline has been documented in marine proxy records from both surface and thermocline-dwelling planktic foraminifera. The foraminiferal δ13C decline has previously been attributed to a flux of respired carbon from the deep ocean that was subsequently transported within the upper ocean (i.e. bottom up transport) to sites where the signal is recorded. Here, we provide modeling evidence that when respired carbon upwells in the Southern Ocean, negative δ13C anomalies in the global upper ocean were instead transferred from the atmosphere (i.e. top down transport). Due to this efficient atmospheric bridge, the pathway of δ13C transport was likely to be different from nutrient transport during the early deglaciation. This implies that the usage of planktic δ13C records for identifying the carbon source(s) responsible for the atmospheric pCO2 rise during the early deglaciation is limited. The model results also suggest that thermocline waters in upwelling systems like the eastern equatorial Pacific, and even upper deep waters above 2000 m, can be affected by this atmospheric bridge during the early deglaciation. Our results imply that caution must be applied when interpreting early deglacial marine δ13C records from depths that are potentially affected by the atmosphere.]]></jats:p>
              </jats:abstract>
              <fr:program xmlns:fr="http://www.crossref.org/fundref.xsd" name="fundref">
                <fr:assertion name="fundgroup">
                  <fr:assertion name="funder_name">
                    Division of Ocean Sciences
                    <fr:assertion name="funder_identifier">http://dx.doi.org/10.13039/100000141</fr:assertion>
                  </fr:assertion>
                  <fr:assertion name="award_number">1558990</fr:assertion>
                  <fr:assertion name="award_number">1736771</fr:assertion>
                </fr:assertion>
                <fr:assertion name="fundgroup">
                  <fr:assertion name="funder_name">
                    Australian Research Council
                    <fr:assertion name="funder_identifier">http://dx.doi.org/10.13039/501100000923</fr:assertion>
                  </fr:assertion>
                  <fr:assertion name="award_number">FT180100606</fr:assertion>
                  <fr:assertion name="award_number">DP180100048</fr:assertion>
                </fr:assertion>
              </fr:program>
              <ai:program xmlns:ai="http://www.crossref.org/AccessIndicators.xsd" name="AccessIndicators">
                <ai:license_ref>https://creativecommons.org/licenses/by/4.0/</ai:license_ref>
              </ai:program>
              <rel:program xmlns:rel="http://www.crossref.org/relations.xsd" name="relations">
                <rel:related_item>
                  <rel:description>Supplementary material</rel:description>
                  <rel:inter_work_relation identifier-type="doi" relationship-type="isSupplementedBy">10.5194/cp-2020-95-supplement</rel:inter_work_relation>
                </rel:related_item>
              </rel:program>
              <doi_data>
                <doi>10.5194/cp-2020-95</doi>
                <resource>https://cp.copernicus.org/preprints/cp-2020-95/</resource>
              </doi_data>
            </posted_content>
          </crossref>
        </doi_record>
      </query>
    </body>
  </query_result>
</crossref_result> + http_version: + recorded_at: Wed, 29 Jul 2020 06:09:33 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/readers/crossref_reader_spec.rb b/spec/readers/crossref_reader_spec.rb index c0a57554..06bf1963 100644 --- a/spec/readers/crossref_reader_spec.rb +++ b/spec/readers/crossref_reader_spec.rb @@ -175,7 +175,7 @@ expect(subject.descriptions.first["description"]).to start_with("This article presents a practical roadmap") expect(subject.dates).to include({"date"=>"2017-10-09", "dateType"=>"Issued"}) expect(subject.publication_year).to eq("2017") - expect(subject.publisher).to eq("bioRxiv") + expect(subject.publisher).to eq("Cold Spring Harbor Laboratory") expect(subject.agency).to eq("Crossref") end @@ -602,6 +602,27 @@ expect(subject.date_registered).to eq("2019-11-02T09:30:06Z") end + it "posted content copernicus" do + input = "https://doi.org/10.5194/CP-2020-95" + subject = Bolognese::Metadata.new(input: input) + expect(subject.valid?).to be true + expect(subject.url).to eq("https://cp.copernicus.org/preprints/cp-2020-95/") + expect(subject.types).to eq("bibtex"=>"article", "citeproc"=>"article-journal", "resourceType"=>"PostedContent", "resourceTypeGeneral"=>"Text", "ris"=>"JOUR", "schemaOrg"=>"ScholarlyArticle") + expect(subject.creators.count).to eq(6) + expect(subject.creators.first).to eq("nameType" => "Personal", "familyName" => "Shao", + "givenName" => "Jun", + "name" => "Shao, Jun", + "nameIdentifiers" => [{"nameIdentifier"=>"https://orcid.org/0000-0001-6130-6474", "nameIdentifierScheme"=>"ORCID", "schemeUri"=>"https://orcid.org"}]) + expect(subject.titles).to eq([{"title"=>"The Atmospheric Bridge Communicated the δ<sup>13</sup>C Declineduring the Last Deglaciation to the Global Upper Ocean"}]) + expect(subject.id).to eq("https://doi.org/10.5194/cp-2020-95") + expect(subject.identifiers).to be_empty + expect(subject.descriptions.first["description"]).to start_with("Abstract. During the early last glacial termination") + expect(subject.dates).to include({"date"=>"2020-07-28", "dateType"=>"Issued"}) + expect(subject.publication_year).to eq("2020") + expect(subject.publisher).to eq("Copernicus GmbH") + expect(subject.agency).to eq("Crossref") + end + it "journal issue" do input = "https://doi.org/10.6002/ect.2015.0371" subject = Bolognese::Metadata.new(input: input)