diff --git a/.gitignore b/.gitignore index 9fcfc5cca..ac2cc5770 100644 --- a/.gitignore +++ b/.gitignore @@ -35,8 +35,8 @@ capybara-*.html /tmp/* /data/* /db/*.sqlite3 -/public/system/* -public/assets +/public/* +!/public/.keep /coverage/ /spec/tmp/ /config/data_bags/* diff --git a/.travis.yml b/.travis.yml index dbe99ec55..826f7394a 100644 --- a/.travis.yml +++ b/.travis.yml @@ -52,11 +52,6 @@ after_success: docker push $REPO:$TRAVIS_TAG; echo "Pushed to" $REPO:$TRAVIS_TAG; AUTO_DEPLOY=true; - elif [ "$TRAVIS_PULL_REQUEST" == "true" ]; then - docker build -f Dockerfile -t $REPO:$TRAVIS_PULL_REQUEST_BRANCH .; - docker push $REPO:$TRAVIS_PULL_REQUEST_BRANCH; - echo "Pushed to" $REPO:$TRAVIS_PULL_REQUEST_BRANCH; - AUTO_DEPLOY=true; elif [ "$TRAVIS_BRANCH" == "master" ]; then docker build -f Dockerfile -t $REPO .; docker push $REPO; @@ -66,6 +61,7 @@ after_success: docker build -f Dockerfile -t $REPO:$TRAVIS_BRANCH .; docker push $REPO:$TRAVIS_BRANCH; echo "Pushed to" $REPO:$TRAVIS_BRANCH; + AUTO_DEPLOY=true; fi - if [ "$AUTO_DEPLOY" == "true" ]; then @@ -90,10 +86,6 @@ after_success: git add prod-eu-west/services/client-api/_lupo.auto.tfvars; git commit -m "Adding lupo git variables for commit tagged ${TRAVIS_TAG?}"; git push "https://${TRAVIS_SECURE_TOKEN}@github.com/datacite/mastino.git" master; - elif [ "$TRAVIS_PULL_REQUEST" == "true" ]; then - git add stage/services/client-api/_lupo.auto.tfvars; - git commit -m "Adding lupo git variables for pull request ${TRAVIS_PULL_REQUEST}"; - git push "https://${TRAVIS_SECURE_TOKEN}@github.com/datacite/mastino.git" ${TRAVIS_PULL_REQUEST_BRANCH}; else git add stage/services/client-api/_lupo.auto.tfvars; git commit -m "Adding lupo git variables for latest commit"; diff --git a/Dockerfile b/Dockerfile index 698ce7ac8..dc48bb109 100644 --- a/Dockerfile +++ b/Dockerfile @@ -16,7 +16,7 @@ RUN bash -lc 'rvm --default use ruby-2.4.4' # Update installed APT packages RUN apt-get update && apt-get upgrade -y -o Dpkg::Options::="--force-confold" && \ - apt-get install ntp wget tzdata -y && \ + apt-get install ntp wget tzdata pandoc -y && \ apt-get clean && rm -rf /var/lib/apt/lists/* /tmp/* /var/tmp/* # install dockerize @@ -53,12 +53,18 @@ RUN mkdir -p tmp/pids && \ chown -R app:app /home/app/webapp && \ chmod -R 755 /home/app/webapp +# Install Ruby gems for middleman +WORKDIR /home/app/webapp/vendor/middleman +RUN /sbin/setuser app bundle install + # Add Runit script for shoryuken workers +WORKDIR /home/app/webapp RUN mkdir /etc/service/shoryuken ADD vendor/docker/shoryuken.sh /etc/service/shoryuken/run # Run additional scripts during container startup (i.e. not at build time) RUN mkdir -p /etc/my_init.d +COPY vendor/docker/70_index_page.sh /etc/my_init.d/70_index_page.sh COPY vendor/docker/80_flush_cache.sh /etc/my_init.d/80_flush_cache.sh COPY vendor/docker/90_migrate.sh /etc/my_init.d/90_migrate.sh diff --git a/Gemfile b/Gemfile index c2444041e..43b13cef7 100644 --- a/Gemfile +++ b/Gemfile @@ -4,17 +4,19 @@ gem 'rails', '~> 5.2.0' gem 'bootsnap', '~> 1.2', '>= 1.2.1' gem 'mysql2', '~> 0.4.4' gem 'dotenv' +gem 'rake', '~> 12.0' gem 'multi_json' gem 'json', '~> 1.8', '>= 1.8.5' gem 'oj', '>= 2.8.3' gem 'jsonlint', '~> 0.2.0' gem 'equivalent-xml', '~> 0.6.0' gem 'nokogiri', '~> 1.8.1' +gem 'diffy', '~> 3.2', '>= 3.2.1' gem 'commonmarker', '~> 0.17.9' gem 'iso8601', '~> 0.9.0' gem 'patron', '~> 0.13.1', require: false gem 'maremma', '>= 4.1' -gem 'bolognese', '~> 0.9', '>= 0.10' +gem 'bolognese', '~> 1.0' gem 'dalli', '~> 2.7', '>= 2.7.6' gem 'lograge', '~> 0.10.0' gem 'logstash-event', '~> 1.2', '>= 1.2.02' @@ -32,9 +34,9 @@ gem 'api-pagination' gem 'cancancan', '~> 2.0' gem 'country_select', '~> 3.1' gem 'countries', '~> 2.1', '>= 2.1.2' -gem 'aasm', '~> 4.12', '>= 4.12.3' +gem 'aasm', '~> 5.0', '>= 5.0.1' gem "facets", require: false -gem 'shoryuken', '~> 3.2', '>= 3.2.2' +gem 'shoryuken', '~> 4.0' gem "aws-sdk-s3", require: false gem 'aws-sdk-sqs', '~> 1.3' gem 'bergamasco', '~> 0.3.10' @@ -52,6 +54,7 @@ gem 'elasticsearch-rails', '~> 5.0', '>= 5.0.2' gem 'faraday_middleware-aws-sigv4', '~> 0.2.4' gem 'rack-utf8_sanitizer', '~> 1.6' gem 'oj_mimic_json', '~> 1.0', '>= 1.0.1' +gem 'turnout', '~> 2.5' group :development, :test do gem 'rspec-rails', '~> 3.5', '>= 3.5.2' @@ -64,6 +67,7 @@ group :development do gem 'listen', '>= 3.0.5', '< 3.2' gem 'spring' gem 'spring-watcher-listen', '~> 2.0.0' + gem 'spring-commands-rspec' # gem 'httplog', '~> 1.0' end diff --git a/Gemfile.lock b/Gemfile.lock index 4be65ca64..994781cf0 100644 --- a/Gemfile.lock +++ b/Gemfile.lock @@ -1,50 +1,50 @@ GEM remote: https://rubygems.org/ specs: - aasm (4.12.3) + aasm (5.0.1) concurrent-ruby (~> 1.0) - actioncable (5.2.1) - actionpack (= 5.2.1) + actioncable (5.2.2) + actionpack (= 5.2.2) nio4r (~> 2.0) websocket-driver (>= 0.6.1) - actionmailer (5.2.1) - actionpack (= 5.2.1) - actionview (= 5.2.1) - activejob (= 5.2.1) + actionmailer (5.2.2) + actionpack (= 5.2.2) + actionview (= 5.2.2) + activejob (= 5.2.2) mail (~> 2.5, >= 2.5.4) rails-dom-testing (~> 2.0) - actionpack (5.2.1) - actionview (= 5.2.1) - activesupport (= 5.2.1) + actionpack (5.2.2) + actionview (= 5.2.2) + activesupport (= 5.2.2) rack (~> 2.0) rack-test (>= 0.6.3) rails-dom-testing (~> 2.0) rails-html-sanitizer (~> 1.0, >= 1.0.2) - actionview (5.2.1) - activesupport (= 5.2.1) + actionview (5.2.2) + activesupport (= 5.2.2) builder (~> 3.1) erubi (~> 1.4) rails-dom-testing (~> 2.0) rails-html-sanitizer (~> 1.0, >= 1.0.3) - active_model_serializers (0.10.7) + active_model_serializers (0.10.8) actionpack (>= 4.1, < 6) activemodel (>= 4.1, < 6) case_transform (>= 0.2) jsonapi-renderer (>= 0.1.1.beta1, < 0.3) - activejob (5.2.1) - activesupport (= 5.2.1) + activejob (5.2.2) + activesupport (= 5.2.2) globalid (>= 0.3.6) - activemodel (5.2.1) - activesupport (= 5.2.1) - activerecord (5.2.1) - activemodel (= 5.2.1) - activesupport (= 5.2.1) + activemodel (5.2.2) + activesupport (= 5.2.2) + activerecord (5.2.2) + activemodel (= 5.2.2) + activesupport (= 5.2.2) arel (>= 9.0) - activestorage (5.2.1) - actionpack (= 5.2.1) - activerecord (= 5.2.1) + activestorage (5.2.2) + actionpack (= 5.2.2) + activerecord (= 5.2.2) marcel (~> 0.3.1) - activesupport (5.2.1) + activesupport (5.2.2) concurrent-ruby (~> 1.0, >= 1.0.2) i18n (>= 0.7, < 2) minitest (~> 5.1) @@ -52,24 +52,24 @@ GEM addressable (2.5.2) public_suffix (>= 2.0.2, < 4.0) ansi (1.5.0) - api-pagination (4.8.1) + api-pagination (4.8.2) arel (9.0.0) aws-eventstream (1.0.1) - aws-partitions (1.105.0) - aws-sdk-core (3.30.0) + aws-partitions (1.125.0) + aws-sdk-core (3.44.0) aws-eventstream (~> 1.0) aws-partitions (~> 1.0) aws-sigv4 (~> 1.0) jmespath (~> 1.0) - aws-sdk-kms (1.9.0) - aws-sdk-core (~> 3, >= 3.26.0) + aws-sdk-kms (1.13.0) + aws-sdk-core (~> 3, >= 3.39.0) aws-sigv4 (~> 1.0) - aws-sdk-s3 (1.21.0) - aws-sdk-core (~> 3, >= 3.26.0) + aws-sdk-s3 (1.30.0) + aws-sdk-core (~> 3, >= 3.39.0) aws-sdk-kms (~> 1) aws-sigv4 (~> 1.0) - aws-sdk-sqs (1.7.0) - aws-sdk-core (~> 3, >= 3.26.0) + aws-sdk-sqs (1.10.0) + aws-sdk-core (~> 3, >= 3.39.0) aws-sigv4 (~> 1.0) aws-sigv4 (1.0.3) base32-url (0.5) @@ -93,13 +93,14 @@ GEM latex-decode (~> 0.0) binding_of_caller (0.8.0) debug_inspector (>= 0.0.1) - bolognese (0.15.6) + bolognese (1.0.32) activesupport (>= 4.2.5, < 6) benchmark_methods (~> 0.7) bibtex-ruby (~> 4.1) builder (~> 3.2, >= 3.2.2) citeproc-ruby (~> 1.1, >= 1.1.10) colorize (~> 0.8.1) + concurrent-ruby (~> 1.0.5) csl-styles (~> 1.0, >= 1.0.1.8) edtf (~> 3.0, >= 3.0.4) gender_detector (~> 0.1.2) @@ -117,18 +118,19 @@ GEM thor (~> 0.19) bootsnap (1.3.2) msgpack (~> 1.0) - bugsnag (6.8.0) + bugsnag (6.10.0) concurrent-ruby (~> 1.0) builder (3.2.3) byebug (10.0.2) cancancan (2.3.0) - capybara (3.9.0) + capybara (3.12.0) addressable mini_mime (>= 0.1.3) nokogiri (~> 1.8) rack (>= 1.6.0) rack-test (>= 0.6.3) - xpath (~> 3.1) + regexp_parser (~> 1.2) + xpath (~> 3.2) case_transform (0.2) activesupport citeproc (1.0.9) @@ -160,10 +162,11 @@ GEM csl (~> 1.0) css_parser (1.6.0) addressable - dalli (2.7.8) + dalli (2.7.9) database_cleaner (1.7.0) debug_inspector (0.0.3) diff-lcs (1.3) + diffy (3.2.1) docile (1.1.5) docopt (0.6.1) domain_name (0.5.20180417) @@ -202,7 +205,7 @@ GEM railties (>= 3.0.0) faker (1.9.1) i18n (>= 0.7) - faraday (0.15.3) + faraday (0.15.4) multipart-post (>= 1.2, < 3) faraday-encoding (0.0.5) faraday @@ -211,7 +214,7 @@ GEM faraday_middleware-aws-sigv4 (0.2.4) aws-sigv4 (~> 1.0) faraday (>= 0.9) - fast_jsonapi (1.4) + fast_jsonapi (1.5) activesupport (>= 4.2) ffi (1.9.25) flipper (0.16.0) @@ -232,7 +235,7 @@ GEM htmlentities (4.3.4) http-cookie (1.0.3) domain_name (~> 0.5) - i18n (1.1.0) + i18n (1.2.0) concurrent-ruby (~> 1.0) i18n_data (0.8.0) iso8601 (0.9.1) @@ -272,10 +275,10 @@ GEM logstash-event (1.2.02) logstash-logger (0.26.1) logstash-event (~> 1.2) - loofah (2.2.2) + loofah (2.2.3) crass (~> 1.0.2) nokogiri (>= 1.5.9) - mail (2.7.0) + mail (2.7.1) mini_mime (>= 0.1.1) mailgun-ruby (1.1.11) rest-client (~> 2.0.2) @@ -292,7 +295,7 @@ GEM multi_json (~> 1.12) nokogiri (~> 1.8.1) oj (>= 2.8.3) - method_source (0.9.0) + method_source (0.9.2) mime-types (3.2.2) mime-types-data (~> 3.2015) mime-types-data (3.2018.0812) @@ -301,7 +304,7 @@ GEM mini_mime (1.0.1) mini_portile2 (2.3.0) minitest (5.11.3) - money (6.13.0) + money (6.13.1) i18n (>= 0.6.4, <= 2) msgpack (1.2.4) multi_json (1.13.1) @@ -328,41 +331,43 @@ GEM pwqgen.rb (0.1.0) docopt (~> 0.5) sysrandom - rack (2.0.5) + rack (2.0.6) + rack-accept (0.4.5) + rack (>= 0.4) rack-cors (1.0.2) rack-test (1.1.0) rack (>= 1.0, < 3) rack-utf8_sanitizer (1.6.0) rack (>= 1.0, < 3.0) - rails (5.2.1) - actioncable (= 5.2.1) - actionmailer (= 5.2.1) - actionpack (= 5.2.1) - actionview (= 5.2.1) - activejob (= 5.2.1) - activemodel (= 5.2.1) - activerecord (= 5.2.1) - activestorage (= 5.2.1) - activesupport (= 5.2.1) + rails (5.2.2) + actioncable (= 5.2.2) + actionmailer (= 5.2.2) + actionpack (= 5.2.2) + actionview (= 5.2.2) + activejob (= 5.2.2) + activemodel (= 5.2.2) + activerecord (= 5.2.2) + activestorage (= 5.2.2) + activesupport (= 5.2.2) bundler (>= 1.3.0) - railties (= 5.2.1) + railties (= 5.2.2) sprockets-rails (>= 2.0.0) rails-dom-testing (2.0.3) activesupport (>= 4.2.0) nokogiri (>= 1.6) rails-html-sanitizer (1.0.4) loofah (~> 2.2, >= 2.2.2) - railties (5.2.1) - actionpack (= 5.2.1) - activesupport (= 5.2.1) + railties (5.2.2) + actionpack (= 5.2.2) + activesupport (= 5.2.2) method_source rake (>= 0.8.7) thor (>= 0.19.0, < 2.0) - rake (12.3.1) + rake (12.3.2) rb-fsevent (0.10.3) rb-inotify (0.9.10) ffi (>= 0.5.0, < 2) - rdf (3.0.4) + rdf (3.0.7) hamster (~> 3.0) link_header (~> 0.0, >= 0.0.8) rdf-aggregate-repo (2.2.1) @@ -383,6 +388,7 @@ GEM rdf (>= 2.2, < 4.0) rdf-xsd (3.0.1) rdf (~> 3.0) + regexp_parser (1.3.0) request_store (1.4.1) rack (>= 1.4) rest-client (2.0.2) @@ -397,7 +403,7 @@ GEM rspec-mocks (3.8.0) diff-lcs (>= 1.2.0, < 2.0) rspec-support (~> 3.8.0) - rspec-rails (3.8.0) + rspec-rails (3.8.1) actionpack (>= 3.0) activesupport (>= 3.0) railties (>= 3.0) @@ -410,7 +416,7 @@ GEM i18n ruby_dep (1.5.0) safe_yaml (1.0.4) - shoryuken (3.3.0) + shoryuken (4.0.2) aws-sdk-core (>= 2) concurrent-ruby thor @@ -428,6 +434,8 @@ GEM unicode_utils (>= 1.2.2) spring (2.0.2) activesupport (>= 4.2) + spring-commands-rspec (1.0.4) + spring (>= 0.9.1) spring-watcher-listen (2.0.1) listen (>= 2.7, < 4.0) spring (>= 1.2, < 3.0) @@ -444,10 +452,15 @@ GEM rdf (>= 2.2, < 4.0) sysrandom (1.0.5) temple (0.8.0) - thor (0.20.0) + thor (0.20.3) thread_safe (0.3.6) - tilt (2.0.8) + tilt (2.0.9) trollop (2.9.9) + turnout (2.5.0) + i18n (>= 0.7, < 2) + rack (>= 1.3, < 3) + rack-accept (~> 0.4) + tilt (>= 1.4, < 3) tzinfo (1.2.5) thread_safe (~> 0.1) unf (0.1.4) @@ -462,14 +475,14 @@ GEM websocket-driver (0.7.0) websocket-extensions (>= 0.1.0) websocket-extensions (0.1.3) - xpath (3.1.0) + xpath (3.2.0) nokogiri (~> 1.8) PLATFORMS ruby DEPENDENCIES - aasm (~> 4.12, >= 4.12.3) + aasm (~> 5.0, >= 5.0.1) active_model_serializers (~> 0.10.0) api-pagination aws-sdk-s3 @@ -479,7 +492,7 @@ DEPENDENCIES bergamasco (~> 0.3.10) better_errors binding_of_caller - bolognese (~> 0.9, >= 0.10) + bolognese (~> 1.0) bootsnap (~> 1.2, >= 1.2.1) bugsnag (~> 6.1, >= 6.1.1) byebug @@ -491,6 +504,7 @@ DEPENDENCIES country_select (~> 3.1) dalli (~> 2.7, >= 2.7.6) database_cleaner + diffy (~> 3.2, >= 3.2.1) dotenv elasticsearch-extensions (~> 0.0.29) elasticsearch-model (~> 5.0, >= 5.0.2) @@ -527,16 +541,19 @@ DEPENDENCIES rack-cors (~> 1.0, >= 1.0.2) rack-utf8_sanitizer (~> 1.6) rails (~> 5.2.0) + rake (~> 12.0) rspec-rails (~> 3.5, >= 3.5.2) - shoryuken (~> 3.2, >= 3.2.2) + shoryuken (~> 4.0) shoulda-matchers (~> 3.1) simple_command slack-notifier (~> 2.1) spring + spring-commands-rspec spring-watcher-listen (~> 2.0.0) strip_attributes (~> 1.8) + turnout (~> 2.5) vcr (~> 3.0.3) webmock (~> 3.1) BUNDLED WITH - 1.16.1 + 1.17.1 diff --git a/app/controllers/application_controller.rb b/app/controllers/application_controller.rb index 24e5349a9..5a5dc755a 100644 --- a/app/controllers/application_controller.rb +++ b/app/controllers/application_controller.rb @@ -73,7 +73,9 @@ def type_and_credentials_from_request_headers when "CanCan::AccessDenied" then 403 when "ActiveRecord::RecordNotFound", "AbstractController::ActionNotFound", "ActionController::RoutingError" then 404 when "ActionController::UnknownFormat" then 406 + when "ActiveRecord::RecordNotUnique" then 409 when "ActiveModel::ForbiddenAttributesError", "ActionController::ParameterMissing", "ActionController::UnpermittedParameters", "ActiveModelSerializers::Adapter::JsonApi::Deserialization::InvalidDocument" then 422 + when "SocketError" then 500 else 400 end @@ -88,6 +90,10 @@ def type_and_credentials_from_request_headers message = "The resource you are looking for doesn't exist." elsif status == 406 message = "The content type is not recognized." + elsif status == 409 + message = "The resource already exists." + elsif ["JSON::ParserError", "Nokogiri::XML::SyntaxError", "ActionDispatch::Http::Parameters::ParseError"].include?(exception.class.to_s) + message = exception.message else Bugsnag.notify(exception) diff --git a/app/controllers/client_prefixes_controller.rb b/app/controllers/client_prefixes_controller.rb index 1c50221c9..54d3175da 100644 --- a/app/controllers/client_prefixes_controller.rb +++ b/app/controllers/client_prefixes_controller.rb @@ -150,9 +150,9 @@ def set_client_prefix end def safe_params - puts params ActiveModelSerializers::Deserialization.jsonapi_parse!( - params, only: [:id, :client, :prefix, :provider_prefix] + params, only: [:id, :client, :prefix, :providerPrefix], + keys: { "providerPrefix" => :provider_prefix } ) end end diff --git a/app/controllers/clients_controller.rb b/app/controllers/clients_controller.rb index ee8645887..85bf650ff 100644 --- a/app/controllers/clients_controller.rb +++ b/app/controllers/clients_controller.rb @@ -31,13 +31,14 @@ def index elsif params[:ids].present? response = Client.find_by_ids(params[:ids], page: page, sort: sort) else - response = Client.query(params[:query], year: params[:year], provider_id: params[:provider_id], fields: params[:fields], page: page, sort: sort) + response = Client.query(params[:query], year: params[:year], provider_id: params[:provider_id], software: params[:software], query_fields: params[:query_fields], page: page, sort: sort) end total = response.results.total total_pages = page[:size] > 0 ? (total.to_f / page[:size]).ceil : 0 years = total > 0 ? facet_by_year(response.response.aggregations.years.buckets) : nil providers = total > 0 ? facet_by_provider(response.response.aggregations.providers.buckets) : nil + software = total > 0 ? facet_by_software(response.response.aggregations.software.buckets) : nil @clients = response.results.results @@ -47,7 +48,8 @@ def index "total-pages" => total_pages, page: page[:number], years: years, - providers: providers + providers: providers, + software: software }.compact options[:links] = { @@ -55,6 +57,7 @@ def index next: @clients.blank? ? nil : request.base_url + "/clients?" + { query: params[:query], "provider-id" => params[:provider_id], + software: params[:software], year: params[:year], fields: params[:fields], "page[number]" => page[:number] + 1, @@ -146,8 +149,8 @@ def set_client def safe_params fail JSON::ParserError, "You need to provide a payload following the JSONAPI spec" unless params[:data].present? ActiveModelSerializers::Deserialization.jsonapi_parse!( - params, only: [:symbol, :name, "contact-name", "contact-email", :domains, :provider, :url, :repository, "target-id", "is-active", "password-input"], - keys: { "contact-name" => :contact_name, "contact-email" => :contact_email, "target-id" => :target_id, "is-active" => :is_active, "password-input" => :password_input } + params, only: [:symbol, :name, "contactName", "contactEmail", :domains, :provider, :url, :repository, :description, :software, "targetId", "isActive", "passwordInput"], + keys: { "contactName" => :contact_name, "contactEmail" => :contact_email, "targetId" => :target_id, "isActive" => :is_active, "passwordInput" => :password_input } ) end end diff --git a/app/controllers/concerns/countable.rb b/app/controllers/concerns/countable.rb index 4e5ae65a3..52c9570cd 100644 --- a/app/controllers/concerns/countable.rb +++ b/app/controllers/concerns/countable.rb @@ -24,7 +24,7 @@ def client_count(provider_id: nil) response = Client.query(nil, include_deleted: true, page: { number: 1, size: 0 }) end - response.results.total > 0 ? facet_by_cumuative_year(response.response.aggregations.cumulative_years.buckets) : [] + response.results.total > 0 ? facet_by_cumulative_year(response.response.aggregations.cumulative_years.buckets) : [] end # show provider count for admin @@ -33,7 +33,7 @@ def provider_count(provider_id: nil) return nil if provider_id response = Provider.query(nil, include_deleted: true, page: { number: 1, size: 0 }) - response.results.total > 0 ? facet_by_cumuative_year(response.response.aggregations.cumulative_years.buckets) : [] + response.results.total > 0 ? facet_by_cumulative_year(response.response.aggregations.cumulative_years.buckets) : [] end end end diff --git a/app/controllers/concerns/facetable.rb b/app/controllers/concerns/facetable.rb index 0c661ebcb..623febd63 100644 --- a/app/controllers/concerns/facetable.rb +++ b/app/controllers/concerns/facetable.rb @@ -22,7 +22,7 @@ def facet_by_year(arr) end end - def facet_by_cumuative_year(arr) + def facet_by_cumulative_year(arr) arr.map do |hsh| { "id" => hsh["key"].to_s, "title" => hsh["key"].to_s, @@ -38,6 +38,14 @@ def facet_by_key(arr) end end + def facet_by_software(arr) + arr.map do |hsh| + { "id" => hsh["key"].downcase, + "title" => hsh["key"], + "count" => hsh["doc_count"] } + end + end + def facet_by_schema(arr) arr.map do |hsh| id = hsh["key"].split("-").last @@ -60,8 +68,8 @@ def facet_by_region(arr) def facet_by_resource_type(arr) arr.map do |hsh| - { "id" => hsh["key"], - "title" => hsh["key"].underscore.humanize, + { "id" => hsh["key"].underscore.dasherize, + "title" => hsh["key"], "count" => hsh["doc_count"] } end end diff --git a/app/controllers/data_centers_controller.rb b/app/controllers/data_centers_controller.rb index 684c6d846..c30780b02 100644 --- a/app/controllers/data_centers_controller.rb +++ b/app/controllers/data_centers_controller.rb @@ -59,6 +59,7 @@ def index }.compact options[:include] = @include options[:is_collection] = true + options[:links] = nil render json: DataCenterSerializer.new(@clients, options).serialized_json, status: :ok end @@ -75,8 +76,14 @@ def show def set_include if params[:include].present? - @include = params[:include].split(",").map { |i| i.downcase.underscore.to_sym } - @include = @include & [:provider, :repository] + include_keys = { + "member" => :provider + } + @include = params[:include].split(",").reduce([]) do |sum, i| + k = include_keys[i.downcase.underscore] + sum << k if k.present? + sum + end else @include = [] end diff --git a/app/controllers/dois_controller.rb b/app/controllers/dois_controller.rb index a739f90dd..3d4a916fd 100644 --- a/app/controllers/dois_controller.rb +++ b/app/controllers/dois_controller.rb @@ -1,6 +1,10 @@ require 'uri' +require 'base64' class DoisController < ApplicationController + include ActionController::MimeResponds + include Crosscitable + prepend_before_action :authenticate_user! before_action :set_doi, only: [:show, :destroy, :get_url] before_action :set_include, only: [:index, :show, :create, :update] @@ -80,17 +84,19 @@ def index render json: DoiSerializer.new(@dois, options).serialized_json, status: :ok else - sort = case params[:sort] when "name" then { "doi" => { order: 'asc' }} when "-name" then { "doi" => { order: 'desc' }} when "created" then { created: { order: 'asc' }} when "-created" then { created: { order: 'desc' }} + when "updated" then { updated: { order: 'asc' }} + when "-updated" then { updated: { order: 'desc' }} when "relevance" then { "_score": { "order": "desc" }} else { updated: { order: 'desc' }} end page = params[:page] || {} + if page[:size].present? page[:size] = [page[:size].to_i, 1000].min max_number = page[:size] > 0 ? 10000/page[:size] : 1 @@ -107,7 +113,6 @@ def index else response = Doi.query(params[:query], state: params[:state], - year: params[:year], created: params[:created], registered: params[:registered], provider_id: params[:provider_id], @@ -115,9 +120,15 @@ def index prefix: params[:prefix], person_id: params[:person_id], resource_type_id: params[:resource_type_id], - fields: params[:fields], + query_fields: params[:query_fields], schema_version: params[:schema_version], link_check_status: params[:link_check_status], + link_check_has_schema_org: params[:link_check_has_schema_org], + link_check_body_has_pid: params[:link_check_body_has_pid], + link_check_found_schema_org_id: params[:link_check_found_schema_org_id], + link_check_found_dc_identifier: params[:link_check_found_dc_identifier], + link_check_found_citation_doi: params[:link_check_found_citation_doi], + link_check_redirect_count_gte: params[:link_check_redirect_count_gte], source: params[:source], page: page, sort: sort) @@ -128,7 +139,6 @@ def index states = total > 0 ? facet_by_key(response.response.aggregations.states.buckets) : nil resource_types = total > 0 ? facet_by_resource_type(response.response.aggregations.resource_types.buckets) : nil - years = total > 0 ? facet_by_year(response.response.aggregations.years.buckets) : nil created = total > 0 ? facet_by_year(response.response.aggregations.created.buckets) : nil registered = total > 0 ? facet_by_year(response.response.aggregations.registered.buckets) : nil providers = total > 0 ? facet_by_provider(response.response.aggregations.providers.buckets) : nil @@ -136,75 +146,96 @@ def index prefixes = total > 0 ? facet_by_key(response.response.aggregations.prefixes.buckets) : nil schema_versions = total > 0 ? facet_by_schema(response.response.aggregations.schema_versions.buckets) : nil sources = total > 0 ? facet_by_key(response.response.aggregations.sources.buckets) : nil - link_checks = total > 0 ? facet_by_cumuative_year(response.response.aggregations.link_checks.buckets) : nil - - @dois = response.results.results - - options = {} - options[:meta] = { - total: total, - "total-pages" => total_pages, - page: page[:number], - states: states, - "resource-types" => resource_types, - years: years, - created: created, - registered: registered, - providers: providers, - clients: clients, - prefixes: prefixes, - "schema-versions" => schema_versions, - sources: sources, - "link-checks" => link_checks - }.compact - - options[:links] = { - self: request.original_url, - next: @dois.blank? ? nil : request.base_url + "/dois?" + { - query: params[:query], - "provider-id" => params[:provider_id], - "client-id" => params[:client_id], - year: params[:year], - fields: params[:fields], - "page[cursor]" => Array.wrap(@dois.last[:sort]).first, - "page[size]" => params.dig(:page, :size) }.compact.to_query - }.compact - options[:include] = @include - options[:is_collection] = true - options[:params] = { - :current_ability => current_ability, - } - - render json: DoiSerializer.new(@dois, options).serialized_json, status: :ok + link_checks_status = total > 0 ? facet_by_cumulative_year(response.response.aggregations.link_checks_status.buckets) : nil + links_with_schema_org = total > 0 ? facet_by_cumulative_year(response.response.aggregations.link_checks_has_schema_org.buckets) : nil + link_checks_schema_org_id = total > 0 ? response.response.aggregations.link_checks_schema_org_id.value : nil + link_checks_dc_identifier = total > 0 ? response.response.aggregations.link_checks_dc_identifier.value : nil + link_checks_citation_doi = total > 0 ? response.response.aggregations.link_checks_citation_doi.value : nil + links_checked = total > 0 ? response.response.aggregations.links_checked.value : nil + + respond_to do |format| + format.json do + @dois = response.results.results + options = {} + options[:meta] = { + total: total, + "total-pages" => total_pages, + page: page[:number], + states: states, + "resource-types" => resource_types, + created: created, + registered: registered, + providers: providers, + clients: clients, + prefixes: prefixes, + "schema-versions" => schema_versions, + sources: sources, + "link-checks-status" => link_checks_status, + "links-checked" => links_checked, + "links-with-schema-org" => links_with_schema_org, + "link-checks-schema-org-id" => link_checks_schema_org_id, + "link-checks-dc-identifier" => link_checks_dc_identifier, + "link-checks-citation-doi" => link_checks_citation_doi + }.compact + + options[:links] = { + self: request.original_url, + next: @dois.blank? ? nil : request.base_url + "/dois?" + { + query: params[:query], + "provider-id" => params[:provider_id], + "client-id" => params[:client_id], + fields: params[:fields], + "page[cursor]" => Array.wrap(@dois.last[:sort]).first, + "page[size]" => params.dig(:page, :size) }.compact.to_query + }.compact + options[:include] = @include + options[:is_collection] = true + options[:params] = { + :current_ability => current_ability, + } + + render json: DoiSerializer.new(@dois, options).serialized_json, status: :ok + end + format.citation do + # fetch formatted citations + render citation: response.records.to_a, style: params[:style] || "apa", locale: params[:locale] || "en-US" + end + format.any(:bibtex, :citeproc, :codemeta, :crosscite, :datacite, :datacite_json, :jats, :ris, :schema_org) { render request.format.to_sym => response.records.to_a } + end end end def show authorize! :read, @doi - options = {} - options[:include] = @include - options[:is_collection] = false - options[:params] = { - :current_ability => current_ability, - } - - render json: DoiSerializer.new(@doi, options).serialized_json, status: :ok + respond_to do |format| + format.json do + options = {} + options[:include] = @include + options[:is_collection] = false + options[:params] = { + current_ability: current_ability, + detail: true + } + + render json: DoiSerializer.new(@doi, options).serialized_json, status: :ok + end + format.citation do + # fetch formatted citation + render citation: @doi, style: params[:style] || "apa", locale: params[:locale] || "en-US" + end + format.any(:bibtex, :citeproc, :codemeta, :crosscite, :datacite, :datacite_json, :jats, :ris, :schema_org) { render request.format.to_sym => @doi } + end end def validate logger = Logger.new(STDOUT) # logger.info safe_params.inspect - @doi = Doi.new(safe_params) - authorize! :create, @doi - - if @doi.errors.present? - logger.info @doi.errors.inspect - render json: serialize(@doi.errors), status: :ok - elsif @doi.validation_errors? - logger.info @doi.validation_errors.inspect - render json: serialize(@doi.validation_errors), status: :ok - else + @doi = Doi.new(safe_params.merge(only_validate: true)) + + authorize! :validate, @doi + + if @doi.valid? options = {} options[:include] = @include options[:is_collection] = false @@ -213,27 +244,30 @@ def validate } render json: DoiSerializer.new(@doi, options).serialized_json, status: :ok + else + logger.info @doi.errors.messages + render json: serialize(@doi.errors.messages), status: :ok end end def create logger = Logger.new(STDOUT) # logger.info safe_params.inspect + @doi = Doi.new(safe_params) - authorize! :create, @doi # capture username and password for reuse in the handle system @doi.current_user = current_user - if safe_params[:xml] && safe_params[:event] && @doi.validation_errors? - logger.error @doi.validation_errors.inspect - render json: serialize(@doi.validation_errors), status: :unprocessable_entity - elsif @doi.save + authorize! :new, @doi + + if @doi.save options = {} options[:include] = @include options[:is_collection] = false options[:params] = { - :current_ability => current_ability, + current_ability: current_ability, + detail: true } render json: DoiSerializer.new(@doi, options).serialized_json, status: :created, location: @doi @@ -246,44 +280,47 @@ def create def update logger = Logger.new(STDOUT) # logger.info safe_params.inspect + @doi = Doi.where(doi: params[:id]).first exists = @doi.present? if exists - if params[:data][:attributes][:mode] == "transfer" + # capture username and password for reuse in the handle system + @doi.current_user = current_user + + if params.dig(:data, :attributes, :mode) == "transfer" + # only update client_id + authorize! :transfer, @doi + @doi.assign_attributes(safe_params.slice(:client_id)) else authorize! :update, @doi + @doi.assign_attributes(safe_params.except(:doi, :client_id)) end - - @doi.assign_attributes(safe_params.except(:doi)) else doi_id = validate_doi(params[:id]) fail ActiveRecord::RecordNotFound unless doi_id.present? @doi = Doi.new(safe_params.merge(doi: doi_id)) + # capture username and password for reuse in the handle system + @doi.current_user = current_user - authorize! :create, @doi + authorize! :new, @doi end - # capture username and password for reuse in the handle system - @doi.current_user = current_user - - if safe_params[:xml] && (safe_params[:event] || safe_params[:validate]) && @doi.validation_errors? - logger.error @doi.validation_errors.inspect - render json: serialize(@doi.validation_errors), status: :unprocessable_entity - elsif @doi.save + if @doi.save options = {} options[:include] = @include options[:is_collection] = false options[:params] = { - :current_ability => current_ability, + current_ability: current_ability, + detail: true } render json: DoiSerializer.new(@doi, options).serialized_json, status: exists ? :ok : :created else - logger.warn @doi.errors.inspect - render json: serialize(@doi.errors), include: @include, status: :unprocessable_entity + logger.warn @doi.errors.messages + render json: serialize(@doi.errors.messages), include: @include, status: :unprocessable_entity end end @@ -409,94 +446,139 @@ def set_include private def safe_params + logger = Logger.new(STDOUT) + fail JSON::ParserError, "You need to provide a payload following the JSONAPI spec" unless params[:data].present? + # default values for attributes stored as JSON + defaults = { data: { titles: [], descriptions: [], types: {}, dates: [], rightsList: [], creators: [], contributors: [] }} + attributes = [ :doi, - "confirm-doi", - :identifier, - :url, :title, + :confirmDoi, + :url, + :titles, + { titles: [:title, :titleType, :lang] }, :publisher, - :published, + :publicationYear, :created, :prefix, :suffix, - "resource-type-subtype", - "last-landing-page", - "last-landing-page-status", - "last-landing-page-status-check", + :types, + { types: [:resourceTypeGeneral, :resourceType, :schemaOrg, :bibtex, :citeproc, :ris] }, + :dates, + { dates: [:date, :dateType, :dateInformation] }, + :landingPage, { - "last-landing-page-status-result" => [ - "error", - "redirect-count", - { "redirect-urls" => [] }, - "download-latency", - "has-schema-org", - "schema-org-id", - { "schema-org-id" => ["@type", "value", "propertyID"] }, - "dc-identifier", - "citation-doi", - "body-has-pid" + landingPage: [ + :checked, + :url, + :status, + :contentType, + :error, + :redirectCount, + { redirectUrls: [] }, + :downloadLatency, + :hasSchemaOrg, + :schemaOrgId, + { schemaOrgId: ["@type", :value, :propertyID] }, + :dcIdentifier, + :citationDoi, + :bodyHasPid ] }, - "last-landing-page-content-type", - "content-url", - "content-size", - "content-format", - :description, - :license, + :contentUrl, + :size, + :format, + :descriptions, + { descriptions: [:description, :descriptionType, :lang] }, + :rightsList, + { rightsList: [:rights, :rightsUri] }, :xml, - :validate, + :regenerate, :source, :version, - "metadata-version", - "schema-version", - :state, "is-active", + :metadataVersion, + :schemaVersion, + :state, + :isActive, :reason, :registered, :updated, :mode, :event, :regenerate, + :should_validate, :client, - "resource_type", - author: [:type, :id, :name, "given-name", "family-name", "givenName", "familyName"] + :creators, + { creators: [:type, :id, :name, :givenName, :familyName, :affiliation] }, + :contributors, + { contributors: [:type, :id, :name, :givenName, :familyName, :affiliation, :contributorType] }, + :identifiers, + { identifiers: [:identifier, :identifierType] }, + :relatedIdentifiers, + { relatedIdentifiers: [:relatedIdentifier, :relatedIdentifierType, :relationType, :resourceTypeGeneral, :relatedMetadataScheme, :schemeUri, :schemeType] }, + :fundingReferences, + { fundingReferences: [:funderName, :funderIdentifier, :funderIdentifierType, :awardNumber, :awardUri, :awardTitle] }, + :geoLocations, + { geoLocations: [{ geolocationPoint: [:pointLongitude, :pointLatitude] }, { geolocationBox: [:westBoundLongitude, :eastBoundLongitude, :southBoundLatitude, :northBoundLatitude] }, :geoLocationPlace] } ] + relationships = [{ client: [data: [:type, :id]] }] + + p = params.require(:data).permit(:type, :id, attributes: attributes, relationships: relationships).reverse_merge(defaults) + client_id = p.dig("relationships", "client", "data", "id") || current_user.try(:client_id) + p = p.fetch("attributes").merge(client_id: client_id) + + # extract attributes from xml field and merge with attributes provided directly + xml = p[:xml].present? ? Base64.decode64(p[:xml]).force_encoding("UTF-8") : nil + + meta = xml.present? ? parse_xml(xml, doi: p[:doi]) : {} + xml = meta["string"] + + read_attrs = [p[:creators], p[:contributors], p[:titles], p[:publisher], + p[:publicationYear], p[:types], p[:descriptions], p[:container], p[:sizes], + p[:formats], p[:version], p[:language], p[:dates], p[:identifiers], + p[:relatedIdentifiers], p[:fundingReferences], p[:geoLocations], p[:rightsList], + p[:subjects], p[:contentUrl], p[:schemaVersion]].compact + + # replace DOI, but otherwise don't touch the XML + # use Array.wrap(read_attrs.first) as read_attrs may also be [[]] + if meta["from"] == "datacite" && Array.wrap(read_attrs.first).blank? + xml = replace_doi(xml, doi: p[:doi] || meta["doi"]) + elsif xml.present? || Array.wrap(read_attrs.first).present? + regenerate = true + end - relationships = [ - { client: [data: [:type, :id]] }, - { provider: [data: [:type, :id]] }, - { "resource-type" => [:data, data: [:type, :id]] } - ] - - p = params.require(:data).permit(:type, :id, attributes: attributes, relationships: relationships) - p = p.fetch("attributes").merge(client_id: p.dig("relationships", "client", "data", "id"), resource_type_general: camelize_str(p.dig("relationships", "resource-type", "data", "id"))) - p.merge( - additional_type: p["resource-type-subtype"], - schema_version: p["schema-version"], - last_landing_page: p["last-landing-page"], - last_landing_page_status: p["last-landing-page-status"], - last_landing_page_status_check: p["last-landing-page-status-check"], - last_landing_page_status_result: p["last-landing-page-status-result"], - last_landing_page_content_type: p["last-landing-page-content-type"] - ).except( - "confirm-doi", :identifier, :prefix, :suffix, "resource-type-subtype", - "metadata-version", "schema-version", :state, :mode, "is-active", - :created, :registered, :updated, "last-landing-page", - "last-landing-page-status", "last-landing-page-status-check", - "last-landing-page-status-result", "last-landing-page-content-type") - end - - def underscore_str(str) - return str unless str.present? + p.merge!(xml: xml) if xml.present? - str.underscore - end + read_attrs_keys = [:creators, :contributors, :titles, :publisher, + :publicationYear, :types, :descriptions, :container, :sizes, + :formats, :language, :dates, :identifiers, + :relatedIdentifiers, :fundingReferences, :geoLocations, :rightsList, + :subjects, :contentUrl, :schemaVersion] - def camelize_str(str) - return str unless str.present? + # merge attributes from xml into regular attributes + # make sure we don't accidentally set any attributes to nil + read_attrs_keys.each do |attr| + p.merge!(attr.to_s.underscore => p[attr].presence || meta[attr.to_s.underscore]) if p.has_key?(attr) || meta[attr.to_s.underscore].present? + end + p.merge!(version_info: p[:version] || meta["version_info"]) if p.has_key?(:version_info) || meta["version_info"].present? - str.underscore.camelize + p.merge( + regenerate: p[:regenerate] || regenerate, + landing_page: p[:landingPage], + last_landing_page: p[:lastLandingPage], + last_landing_page_status: p[:lastLandingPageStatus], + last_landing_page_status_check: p[:lastLandingPageStatusCheck], + last_landing_page_status_result: p[:lastLandingPageStatusResult], + last_landing_page_content_type: p[:lastLandingPageContentType] + ).except( + :confirmDoi, :prefix, :suffix, :publicationYear, + :rightsList, :identifiers, :relatedIdentifiers, :fundingReferences, :geoLocations, + :metadataVersion, :schemaVersion, :state, :mode, :isActive, :landingPage, + :created, :registered, :updated, :lastLandingPage, :version, + :lastLandingPageStatus, :lastLandingPageStatusCheck, + :lastLandingPageStatusResult, :lastLandingPageContentType) end def add_metadata_to_bugsnag(report) diff --git a/app/controllers/index_controller.rb b/app/controllers/index_controller.rb index 57175884a..1417139d6 100644 --- a/app/controllers/index_controller.rb +++ b/app/controllers/index_controller.rb @@ -5,34 +5,10 @@ class IndexController < ApplicationController before_action :set_doi, only: [:show] def index - authorize! :index, :Index render plain: ENV['SITE_TITLE'] end - # we support content negotiation in show action - def show - authorize! :show, @doi - - respond_to do |format| - format.citation do - # fetch formatted citation - @doi.style = params[:style] || "apa" - @doi.locale = params[:locale] || "en-US" - render citation: @doi - end - format.any(:bibtex, :citeproc, :codemeta, :crosscite, :datacite, :datacite_json, :jats, :ris, :schema_org) { render request.format.to_sym => @doi } - format.any { fail ActionController::UnknownFormat } - end - end - # def routing_error # fail ActionController::RoutingError # end - - protected - - def set_doi - @doi = Doi.where(doi: params[:id]).first - fail ActiveRecord::RecordNotFound unless @doi.present? - end end diff --git a/app/controllers/media_controller.rb b/app/controllers/media_controller.rb index b7fa3464c..957393af6 100644 --- a/app/controllers/media_controller.rb +++ b/app/controllers/media_controller.rb @@ -125,8 +125,8 @@ def set_include def safe_params fail JSON::ParserError, "You need to provide a payload following the JSONAPI spec" unless params[:data].present? ActiveModelSerializers::Deserialization.jsonapi_parse!( - params, only: ["media-type", :url], - keys: { "media-type" => :media_type } + params, only: ["mediaType", :url], + keys: { "mediaType" => :media_type } ) end end diff --git a/app/controllers/members_controller.rb b/app/controllers/members_controller.rb index 1457fb376..6b26f4abe 100644 --- a/app/controllers/members_controller.rb +++ b/app/controllers/members_controller.rb @@ -64,6 +64,7 @@ def index }.compact options[:include] = @include options[:is_collection] = true + options[:links] = nil render json: MemberSerializer.new(@members, options).serialized_json, status: :ok end diff --git a/app/controllers/providers_controller.rb b/app/controllers/providers_controller.rb index 7040beeab..3f60e76ed 100644 --- a/app/controllers/providers_controller.rb +++ b/app/controllers/providers_controller.rb @@ -30,7 +30,7 @@ def index elsif params[:ids].present? response = Provider.find_by_ids(params[:ids], page: page, sort: sort) else - response = Provider.query(params[:query], year: params[:year], region: params[:region], organization_type: params[:organization_type], focus_area: params[:focus_area], fields: params[:fields], page: page, sort: sort) + response = Provider.query(params[:query], year: params[:year], region: params[:region], organization_type: params[:organization_type], focus_area: params[:focus_area], query_fields: params[:query_fields], page: page, sort: sort) end total = response.results.total @@ -151,8 +151,8 @@ def set_provider def safe_params fail JSON::ParserError, "You need to provide a payload following the JSONAPI spec" unless params[:data].present? ActiveModelSerializers::Deserialization.jsonapi_parse!( - params, only: [:name, :symbol, :description, :website, :joined, "organization-type", "focus-area", :phone, "contact-name", "contact-email", "is_active", "password-input", :country], - keys: { "organization-type" => :organization_type, "focus-area" => :focus_area, "contact-name" => :contact_name, "contact-email" => :contact_email, :country => :country_code, "is-active" => :is_active, "password-input" => :password_input } + params, only: [:name, :symbol, :description, :website, :joined, "organizationType", "focusArea", :phone, "contactName", "contactEmail", "isActive", "passwordInput", :country], + keys: { "organizationType" => :organization_type, "focusArea" => :focus_area, "contactName" => :contact_name, "contactEmail" => :contact_email, :country => :country_code, "isActive" => :is_active, "passwordInput" => :password_input } ) end end diff --git a/app/controllers/works_controller.rb b/app/controllers/works_controller.rb new file mode 100644 index 000000000..568894575 --- /dev/null +++ b/app/controllers/works_controller.rb @@ -0,0 +1,136 @@ +class WorksController < ApplicationController + prepend_before_action :authenticate_user! + before_action :set_doi, only: [:show] + before_action :set_include, only: [:index, :show] + before_bugsnag_notify :add_metadata_to_bugsnag + + def index + authorize! :read, Doi + + sort = case params[:sort] + when "name" then { "doi" => { order: 'asc' }} + when "-name" then { "doi" => { order: 'desc' }} + when "created" then { created: { order: 'asc' }} + when "-created" then { created: { order: 'desc' }} + when "updated" then { updated: { order: 'asc' }} + when "-updated" then { updated: { order: 'desc' }} + when "relevance" then { "_score": { "order": "desc" }} + else { updated: { order: 'desc' }} + end + + page = params[:page] || {} + if page[:size].present? + page[:size] = [page[:size].to_i, 1000].min + max_number = page[:size] > 0 ? 10000/page[:size] : 1 + else + page[:size] = 25 + max_number = 10000/page[:size] + end + page[:number] = page[:number].to_i > 0 ? [page[:number].to_i, max_number].min : 1 + + if params[:id].present? + response = Doi.find_by_id(params[:id]) + elsif params[:ids].present? + response = Doi.find_by_ids(params[:ids], page: page, sort: sort) + else + response = Doi.query(params[:query], + state: "findable", + created: params[:created], + registered: params[:registered], + provider_id: params[:member_id], + client_id: params[:data_center_id], + prefix: params[:prefix], + person_id: params[:person_id], + resource_type_id: params[:resource_type_id], + schema_version: params[:schema_version], + page: page, + sort: sort) + end + + total = response.results.total + total_pages = page[:size] > 0 ? ([total.to_f, 10000].min / page[:size]).ceil : 0 + + resource_types = total > 0 ? facet_by_resource_type(response.response.aggregations.resource_types.buckets) : nil + registered = total > 0 ? facet_by_year(response.response.aggregations.registered.buckets) : nil + providers = total > 0 ? facet_by_provider(response.response.aggregations.providers.buckets) : nil + clients = total > 0 ? facet_by_client(response.response.aggregations.clients.buckets) : nil + + @dois = response.results.results + + options = {} + options[:meta] = { + "resource-types" => resource_types, + registered: registered, + "data-centers" => clients, + total: total, + "total-pages" => total_pages, + page: page[:number] + }.compact + + options[:links] = { + self: request.original_url, + next: @dois.blank? ? nil : request.base_url + "/dois?" + { + query: params[:query], + "member-id" => params[:provider_id], + "data-center-id" => params[:client_id], + "page[size]" => params.dig(:page, :size) }.compact.to_query + }.compact + options[:include] = @include + options[:is_collection] = true + options[:links] = nil + options[:params] = { + :current_ability => current_ability, + } + + render json: WorkSerializer.new(@dois, options).serialized_json, status: :ok + end + + def show + authorize! :read, @doi + + options = {} + options[:include] = @include + options[:is_collection] = false + options[:params] = { + current_ability: current_ability, + detail: true + } + + render json: WorkSerializer.new(@doi, options).serialized_json, status: :ok + end + + protected + + def set_doi + @doi = Doi.where(doi: params[:id]).first + fail ActiveRecord::RecordNotFound unless @doi.present? + + # capture username and password for reuse in the handle system + @doi.current_user = current_user + end + + def set_include + if params[:include].present? + include_keys = { + "data_center" => :client, + "member" => :provider, + "resource_type" => :resource_type + } + @include = params[:include].split(",").reduce([]) do |sum, i| + k = include_keys[i.downcase.underscore] + sum << k if k.present? + sum + end + else + @include = nil + end + end + + def add_metadata_to_bugsnag(report) + return nil unless params.dig(:data, :attributes, :xml).present? + + report.add_tab(:metadata, { + metadata: Base64.decode64(params.dig(:data, :attributes, :xml)) + }) + end +end diff --git a/app/jobs/doi_import_by_day_job.rb b/app/jobs/doi_import_by_day_job.rb new file mode 100644 index 000000000..43c938d2d --- /dev/null +++ b/app/jobs/doi_import_by_day_job.rb @@ -0,0 +1,7 @@ +class DoiImportByDayJob < ActiveJob::Base + queue_as :lupo_background + + def perform(options={}) + Doi.import_by_day(options) + end +end \ No newline at end of file diff --git a/app/jobs/index_job.rb b/app/jobs/index_job.rb index 8d24b7f7c..5687eba52 100644 --- a/app/jobs/index_job.rb +++ b/app/jobs/index_job.rb @@ -1,6 +1,11 @@ class IndexJob < ActiveJob::Base queue_as :lupo + rescue_from ActiveJob::DeserializationError do |error| + logger = Logger.new(STDOUT) + logger.error error.message + end + def perform(obj) obj.__elasticsearch__.index_document end diff --git a/app/models/ability.rb b/app/models/ability.rb index fbbccc6a8..012f1ac0f 100644 --- a/app/models/ability.rb +++ b/app/models/ability.rb @@ -7,49 +7,44 @@ def initialize(user) alias_action :create, :read, :update, :destroy, to: :crud user ||= User.new(nil) # Guest user - @user = user + # @user = user if user.role_id == "staff_admin" can :manage, :all - # can :manage, [Provider, ProviderPrefix, Client, ClientPrefix, Prefix, Phrase, User] - # can [:read, :transfer, :set_state, :set_minted, :set_url, :delete_test_dois], Doi cannot [:new, :create], Doi do |doi| doi.client.blank? || !doi.client.prefixes.where(prefix: doi.prefix).first end - can [:read_landing_page_results], Doi elsif user.role_id == "staff_user" can :read, :all - can [:read_landing_page_results], Doi elsif user.role_id == "provider_admin" && user.provider_id.present? can [:update, :read], Provider, :symbol => user.provider_id.upcase can [:manage], ProviderPrefix, :provider_id => user.provider_id can [:manage], Client,:provider_id => user.provider_id - can [:manage], ClientPrefix#, :client_id => user.provider_id + can [:manage], ClientPrefix #, :client_id => user.provider_id # if Flipper[:delete_doi].enabled?(user) # can [:manage], Doi, :provider_id => user.provider_id # else # can [:read, :update], Doi, :provider_id => user.provider_id # end - can [:read, :transfer], Doi, :provider_id => user.provider_id + + can [:read, :transfer, :read_landing_page_results], Doi, :provider_id => user.provider_id can [:read], Doi do |doi| doi.findable? end can [:read], User can [:read], Phrase - can [:read_landing_page_results], Doi, :provider_id => user.provider_id elsif user.role_id == "provider_user" && user.provider_id.present? can [:read], Provider, :symbol => user.provider_id.upcase can [:read], ProviderPrefix, :provider_id => user.provider_id can [:read], Client, :provider_id => user.provider_id can [:read], ClientPrefix#, :client_id => user.client_id - can [:read], Doi, :provider_id => user.provider_id + can [:read, :read_landing_page_results], Doi, :provider_id => user.provider_id can [:read], Doi do |doi| doi.findable? end can [:read], User can [:read], Phrase - can [:read_landing_page_results], Doi, :provider_id => user.provider_id elsif user.role_id == "client_admin" && user.client_id.present? can [:read, :update], Client, :symbol => user.client_id.upcase can [:read], ClientPrefix, :client_id => user.client_id @@ -59,26 +54,25 @@ def initialize(user) # else # can [:read, :update], Doi, :client_id => user.client_id # end - can [:read, :update, :destroy, :register_url, :get_url, :get_urls], Doi, :client_id => user.client_id - can [:new, :create], Doi do |doi| - doi.client_id == user.client_id && doi.client.prefixes.where(prefix: doi.prefix).first + + can [:read, :destroy, :update, :register_url, :validate, :get_url, :get_urls, :read_landing_page_results], Doi, :client_id => user.client_id + can [:new, :create], Doi do |doi| + doi.client.prefixes.where(prefix: doi.prefix).present? end can [:read], Doi do |doi| doi.findable? end can [:read], User can [:read], Phrase - can [:read_landing_page_results], Doi, :client_id => user.client_id elsif user.role_id == "client_user" && user.client_id.present? can [:read], Client, :symbol => user.client_id.upcase can [:read], ClientPrefix, :client_id => user.client_id - can [:read], Doi, :client_id => user.client_id + can [:read, :read_landing_page_results], Doi, :client_id => user.client_id can [:read], Doi do |doi| doi.findable? end can [:read], User can [:read], Phrase - can [:read_landing_page_results], Doi, :client_id => user.client_id elsif user.role_id == "user" can [:read, :update], Provider, :symbol => user.provider_id.upcase if user.provider_id.present? can [:read, :update], Client, :symbol => user.client_id.upcase if user.client_id.present? diff --git a/app/models/client.rb b/app/models/client.rb index 774d533e3..8334462af 100644 --- a/app/models/client.rb +++ b/app/models/client.rb @@ -62,7 +62,12 @@ class Client < ActiveRecord::Base analyzer: { string_lowercase: { tokenizer: 'keyword', filter: %w(lowercase ascii_folding) } }, - filter: { ascii_folding: { type: 'asciifolding', preserve_original: true } } + normalizer: { + keyword_lowercase: { type: "custom", filter: %w(lowercase) } + }, + filter: { + ascii_folding: { type: 'asciifolding', preserve_original: true } + } } } do mapping dynamic: 'false' do @@ -71,7 +76,8 @@ class Client < ActiveRecord::Base indexes :provider_id, type: :keyword indexes :repository_id, type: :keyword indexes :prefix_ids, type: :keyword - indexes :name, type: :text, fields: { keyword: { type: "keyword" }, raw: { type: "text", "analyzer": "string_lowercase", "fielddata": true }} + indexes :name, type: :text, fields: { keyword: { type: "keyword" }, raw: { type: "text", analyzer: "string_lowercase", "fielddata": true }} + indexes :description, type: :text indexes :contact_name, type: :text indexes :contact_email, type: :text, fields: { keyword: { type: "keyword" }} indexes :re3data, type: :keyword @@ -80,6 +86,7 @@ class Client < ActiveRecord::Base indexes :domains, type: :text indexes :year, type: :integer indexes :url, type: :text, fields: { keyword: { type: "keyword" }} + indexes :software, type: :text, fields: { keyword: { type: "keyword" }, raw: { type: "text", analyzer: "string_lowercase", "fielddata": true }} indexes :cache_key, type: :keyword indexes :created, type: :date indexes :updated, type: :date @@ -100,12 +107,14 @@ def as_indexed_json(options={}) "repository_id" => repository_id, "prefix_ids" => prefix_ids, "name" => name, + "description" => description, "symbol" => symbol, "year" => year, "contact_name" => contact_name, "contact_email" => contact_email, "domains" => domains, "url" => url, + "software" => software, "is_active" => is_active, "password" => password, "cache_key" => cache_key, @@ -119,14 +128,15 @@ def as_indexed_json(options={}) end def self.query_fields - ['symbol^10', 'name^10', 'contact_name^10', 'contact_email^10', 'domains', 'url', 'repository.software.name^3', 'repository.subjects.text^3', 'repository.certificates.text^3', '_all'] + ['symbol^10', 'name^10', 'description^10', 'contact_name^10', 'contact_email^10', 'domains', 'url', 'software^3', 'repository.subjects.text^3', 'repository.certificates.text^3', '_all'] end def self.query_aggregations { years: { date_histogram: { field: 'created', interval: 'year', min_doc_count: 1 } }, cumulative_years: { terms: { field: 'cumulative_years', min_doc_count: 1, order: { _count: "asc" } } }, - providers: { terms: { field: 'provider_id', size: 15, min_doc_count: 1 } } + providers: { terms: { field: 'provider_id', size: 15, min_doc_count: 1 } }, + software: { terms: { field: 'software.keyword', size: 15, min_doc_count: 1 } } } end @@ -247,7 +257,7 @@ def to_jsonapi "domains" => domains, "provider-id" => provider_id, "prefixes" => prefixes.map { |p| p.prefix }, - "is-active" => is_active == "\x01", + "is-active" => is_active.getbyte(0) == 1, "version" => version, "created" => created.iso8601, "updated" => updated.iso8601, diff --git a/app/models/concerns/cacheable.rb b/app/models/concerns/cacheable.rb index e55ed0a28..52e3dd80a 100644 --- a/app/models/concerns/cacheable.rb +++ b/app/models/concerns/cacheable.rb @@ -50,42 +50,8 @@ def cached_media_count(options={}) end end - def fetch_cached_meta - if updated.present? - Rails.cache.fetch("cached_meta/#{doi}-#{updated.iso8601}") do - if from.present? && string.present? - send("read_" + from, string: string, sandbox: sandbox) - else - read_datacite(string: fetch_cached_xml, sandbox: sandbox) - end - end - else - if from.present? && string.present? - send("read_" + from, string: string, sandbox: sandbox) - else - read_datacite(string: xml, sandbox: sandbox) - end - end - rescue ArgumentError, NoMethodError => e - logger = Logger.new(STDOUT) - logger.error "Error for " + doi + ": " + e.message - return {} - end - - def fetch_cached_xml - if updated.present? - Rails.cache.fetch("cached_xml/#{doi}-#{updated.iso8601}", raw: true) do - m = metadata.first - m.present? ? m.xml : nil - end - else - m = metadata.first - m.present? ? m.xml : nil - end - end - def fetch_cached_metadata_version - if updated.present? + if updated.present? && Rails.application.config.action_controller.perform_caching Rails.cache.fetch("cached_metadata_version/#{doi}-#{updated.iso8601}") do current_metadata ? current_metadata.metadata_version : 0 end @@ -95,19 +61,31 @@ def fetch_cached_metadata_version end def cached_client_response(id, options={}) - Rails.cache.fetch("client_response/#{id}", expires_in: 1.day) do + if Rails.application.config.action_controller.perform_caching + Rails.cache.fetch("client_response/#{id}", expires_in: 1.day) do + Client.where(symbol: id).first + end + else Client.where(symbol: id).first end end def cached_prefix_response(prefix, options={}) - Rails.cache.fetch("prefix_response/#{prefix}", expires_in: 7.days) do + if Rails.application.config.action_controller.perform_caching + Rails.cache.fetch("prefix_response/#{prefix}", expires_in: 7.days) do + Prefix.where(prefix: prefix).first + end + else Prefix.where(prefix: prefix).first end end def cached_provider_response(id, options={}) - Rails.cache.fetch("provider_response/#{id}", expires_in: 1.day) do + if Rails.application.config.action_controller.perform_caching + Rails.cache.fetch("provider_response/#{id}", expires_in: 1.day) do + Provider.where(symbol: id).first + end + else Provider.where(symbol: id).first end end diff --git a/app/models/concerns/checkable.rb b/app/models/concerns/checkable.rb index 74c5c9dff..35e3627ac 100644 --- a/app/models/concerns/checkable.rb +++ b/app/models/concerns/checkable.rb @@ -7,8 +7,8 @@ def get_landing_page_info(doi: nil, url: nil, keep: true) return { "status" => 404, "content-type" => nil, "checked" => Time.zone.now.utc.iso8601 } unless uri.present? - return { "status" => doi.last_landing_page_status, "content-type" => doi.last_landing_page_content_type, "checked" => doi.last_landing_page_status_check } if - doi.present? && keep && doi.last_landing_page_status_check.present? && doi.last_landing_page_status_check > (Time.zone.now - 7.days) + return { "status" => doi.landing_page['status'], "content-type" => doi.landing_page['content_type'], "checked" => doi.landing_page['checked'] } if + doi.present? && keep && doi.landing_page.present? && doi.landing_page['checked'].present? && doi.landing_page['checked'] > (Time.zone.now - 7.days) response = Maremma.head(uri, timeout: 5) if response.headers && response.headers["Content-Type"].present? diff --git a/app/models/concerns/crosscitable.rb b/app/models/concerns/crosscitable.rb index bdca5d828..aefc708b5 100644 --- a/app/models/concerns/crosscitable.rb +++ b/app/models/concerns/crosscitable.rb @@ -7,129 +7,84 @@ module Crosscitable included do include Bolognese::MetadataUtils - # track changes of virtual attributes + attr_accessor :issue, :volume, :style, :locale - def author=(value) - return @author if value.blank? || value == author - - attribute_will_change!(:author) - @author = value - end - - def title=(value) - return @title if value.nil? || value == title - - attribute_will_change!(:title) - @title = value - end - - def publisher=(value) - return @publisher if value.nil? || value == publisher - - attribute_will_change!(:publisher) - @publisher = value - end - - def date_published=(value) - return @date_published if value.nil? || value == date_published - - attribute_will_change!(:date_published) - @date_published = value - end - - def additional_type=(value) - return @additional_type if value.nil? || value == additional_type - - attribute_will_change!(:additional_type) - @additional_type = value - end - - def resource_type_general=(value) - return @resource_type_general if value.nil? || value == resource_type_general - - attribute_will_change!(:resource_type_general) - @resource_type_general = value + def sandbox + !Rails.env.production? end - def description=(value) - return @description if value.nil? || value == description - - attribute_will_change!(:description) - @description = value + def exists? + aasm_state != "not_found" end - def content_size=(value) - return @content_size if value.nil? || value == content_size - - attribute_will_change!(:content_size) - @content_size = value + def meta + @meta || {} end - def content_format=(value) - return @content_format if value.nil? || value == content_format - - attribute_will_change!(:content_format) - @content_format = value - end + def parse_xml(input, options={}) + return {} unless input.present? - # modified bolognese attributes + # check whether input is id and we need to fetch the content + id = normalize_id(input, sandbox: sandbox) - def sandbox - !Rails.env.production? - end + if id.present? + from = find_from_format(id: id) - # cache doi metadata - def meta - @meta ||= fetch_cached_meta - end + # generate name for method to call dynamically + hsh = from.present? ? send("get_" + from, id: id, sandbox: sandbox) : {} + input = hsh.fetch("string", nil) + else + from = find_from_format(string: input) + end - def exists? - meta.fetch("state", "not_found") != "not_found" - end + meta = from.present? ? send("read_" + from, { string: input, doi: options[:doi], sandbox: sandbox }).compact : {} + meta.merge("string" => input, "from" => from) + rescue NoMethodError, ArgumentError => exception + Bugsnag.notify(exception) + logger = Logger.new(STDOUT) + logger.error "Error " + exception.message + " for doi " + @doi + "." + logger.error exception - # default to DataCite schema 4 - def schema_version - @schema_version ||= meta.fetch("schema_version", nil) || "http://datacite.org/schema/kernel-4" + {} end - # cache xml - def xml - @xml || fetch_cached_xml + def replace_doi(input, options={}) + return input unless options[:doi].present? + + doc = Nokogiri::XML(input, nil, 'UTF-8', &:noblanks) + node = doc.at_css("identifier") + node.content = options[:doi].to_s.upcase if node.present? && options[:doi].present? + doc.to_xml.strip end - def xml=(value) - # check that input is well-formed if xml or json - input = well_formed_xml(value) - + def update_xml # check whether input is id and we need to fetch the content - id = normalize_id(input, sandbox: sandbox) + id = normalize_id(xml, sandbox: sandbox) if id.present? - @from = find_from_format(id: id) + from = find_from_format(id: id) # generate name for method to call dynamically - hsh = @from.present? ? send("get_" + @from, id: id, sandbox: sandbox) : {} - @string = hsh.fetch("string", nil) + hsh = from.present? ? send("get_" + from, id: id, sandbox: sandbox) : {} + xml = hsh.fetch("string", nil) else - @from = find_from_format(string: input) - @string = input + from = find_from_format(string: xml) end - attribute_will_change!(:xml) + # generate new xml if attributes have been set directly and/or from metadata that are not DataCite XML + read_attrs = %w(creators contributors titles publisher publication_year types descriptions container sizes formats version_info language dates identifiers related_identifiers funding_references geo_locations rights_list subjects content_url schema_version).map do |a| + [a.to_sym, send(a.to_s)] + end.to_h.compact - @meta = @from.present? ? send("read_" + @from, string: raw, sandbox: sandbox) : {} - @xml = (from == "datacite") ? raw : datacite_xml - rescue NoMethodError, ArgumentError => exception - Bugsnag.notify(exception) - logger = Logger.new(STDOUT) - logger.error "Error " + exception.message + " for doi " + doi + "." - @xml = nil + meta = from.present? ? send("read_" + from, { string: xml, doi: doi, sandbox: sandbox }.merge(read_attrs)) : {} + + xml = datacite_xml + + write_attribute(:xml, xml) end def well_formed_xml(string) - return '' unless string.present? - - string = Base64.decode64(string).force_encoding("UTF-8") + return nil unless string.present? from_xml(string) || from_json(string) @@ -139,20 +94,11 @@ def well_formed_xml(string) def from_xml(string) return nil unless string.start_with?(' e - line, column, level, text = e.message.split(":", 4) - message = text.strip + " at line #{line}, column #{column}" - errors.add(:xml, message) - - string + doc = Nokogiri::XML(string) { |config| config.strict.noblanks } + doc.to_xml.strip end def from_json(string) - return nil unless string.start_with?('[', '{') - linter = JsonLint::Linter.new errors_array = [] @@ -160,38 +106,20 @@ def from_json(string) valid &&= linter.send(:check_syntax_valid?, string, errors_array) valid &&= linter.send(:check_overlapping_keys?, string, errors_array) - errors_array.each { |e| errors.add(:xml, e.capitalize) } - errors_array.empty? ? nil : string - end + raise JSON::ParserError, errors_array.join("\n") if errors_array.present? - # validate against DataCite schema - def validation_errors - kernel = schema_version.split("/").last - filepath = Bundler.rubygems.find_name('bolognese').first.full_gem_path + "/resources/#{kernel}/metadata.xsd" - schema = Nokogiri::XML::Schema(open(filepath)) - - schema.validate(Nokogiri::XML(xml, nil, 'UTF-8')).reduce({}) do |sum, error| - location, level, source, text = error.message.split(": ", 4) - line, column = location.split(":", 2) - title = text.to_s.strip + " at line #{line}, column #{column}" if line.present? - source = source.split("}").last[0..-2] if line.present? - - errors.add(source.to_sym, title) + string + end - sum[source.to_sym] = Array(sum[source.to_sym]) + [title] + def get_content_type(string) + return "xml" if Nokogiri::XML(string).errors.empty? - sum + begin + JSON.parse(string) + return "json" + rescue + "string" end - rescue Nokogiri::XML::SyntaxError => e - line, column, level, text = e.message.split(":", 4) - message = text.strip + " at line #{line}, column #{column}" - errors.add(:xml, message) - - errors - end - - def validation_errors? - validation_errors.present? end end end diff --git a/app/models/concerns/dateable.rb b/app/models/concerns/dateable.rb index ce367ee0b..8a89b2f62 100644 --- a/app/models/concerns/dateable.rb +++ b/app/models/concerns/dateable.rb @@ -1,6 +1,26 @@ module Dateable extend ActiveSupport::Concern + included do + def get_date(dates, date_type) + dd = Array.wrap(dates).find { |d| d["dateType"] == date_type } || {} + dd.fetch("date", nil) + end + + def set_date(dates, date, date_type) + dd = Array.wrap(dates).find { |d| d["dateType"] == date_type } || { "dateType" => date_type } + dd["date"] = date + end + + def get_resource_type(types, type) + types[type] + end + + def set_resource_type(types, text, type) + types[type] = text + end + end + module ClassMethods def get_solr_date_range(from_date, until_date) from_date_string = get_datetime_from_input(from_date) || "*" diff --git a/app/models/concerns/indexable.rb b/app/models/concerns/indexable.rb index 495464e91..1ab3b95a3 100644 --- a/app/models/concerns/indexable.rb +++ b/app/models/concerns/indexable.rb @@ -8,11 +8,11 @@ module Indexable # use index_document instead of update_document to also update virtual attributes IndexJob.perform_later(self) if self.class.name == "Doi" - update_column(:indexed, Time.zone.now) + update_column(:indexed, Time.zone.now) send_import_message(self.to_jsonapi) if aasm_state == "findable" unless Rails.env.test? end end - + before_destroy do begin __elasticsearch__.delete_document @@ -29,7 +29,7 @@ def send_delete_message(data) def send_import_message(data) send_message(data, shoryuken_class: "DoiImportWorker") end - + # shoryuken_class is needed for the consumer to process the message # we use the AWS SQS client directly as there is no consumer in this app def send_message(body, options={}) @@ -85,7 +85,7 @@ def find_by_id_list(ids, options={}) def find_by_ids(ids, options={}) options[:sort] ||= { "_doc" => { order: 'asc' }} - + __elasticsearch__.search({ from: options[:page].present? ? (options.dig(:page, :number) - 1) * options.dig(:page, :size) : 0, size: options[:size] || 25, @@ -111,21 +111,27 @@ def query(query, options={}) sort = options[:sort] end - fields = options[:fields].presence || query_fields + fields = options[:query_fields].presence || query_fields must = [] must << { multi_match: { query: query, fields: fields, type: "phrase_prefix", slop: 3, max_expansions: 10 }} if query.present? must << { term: { aasm_state: options[:state] }} if options[:state].present? - must << { term: { resource_type_id: options[:resource_type_id] }} if options[:resource_type_id].present? + must << { term: { "types.resourceTypeGeneral": options[:resource_type_id].underscore.camelize }} if options[:resource_type_id].present? must << { terms: { provider_id: options[:provider_id].split(",") }} if options[:provider_id].present? must << { terms: { client_id: options[:client_id].split(",") }} if options[:client_id].present? must << { term: { prefix: options[:prefix] }} if options[:prefix].present? must << { term: { "author.id" => "https://orcid.org/#{options[:person_id]}" }} if options[:person_id].present? must << { range: { created: { gte: "#{options[:created].split(",").min}||/y", lte: "#{options[:created].split(",").max}||/y", format: "yyyy" }}} if options[:created].present? - must << { range: { registered: { gte: "#{options[:registered].split(",").min}||/y", lte: "#{options[:registered].split(",").max}||/y", format: "yyyy" }}} if options[:registered].present? must << { term: { schema_version: "http://datacite.org/schema/kernel-#{options[:schema_version]}" }} if options[:schema_version].present? must << { term: { source: options[:source] }} if options[:source].present? - must << { term: { last_landing_page_status: options[:link_check_status] }} if options[:link_check_status].present? + must << { term: { "landing_page.status": options[:link_check_status] }} if options[:link_check_status].present? + must << { exists: { field: "landing_page.checked" }} if options[:link_checked].present? + must << { term: { "landing_page.hasSchemaOrg": options[:link_check_has_schema_org] }} if options[:link_check_has_schema_org].present? + must << { term: { "landing_page.bodyHasPid": options[:link_check_body_has_pid] }} if options[:link_check_body_has_pid].present? + must << { exists: { field: "landing_page.schemaOrgId" }} if options[:link_check_found_schema_org_id].present? + must << { exists: { field: "landing_page.dcIdentifier" }} if options[:link_check_found_dc_identifier].present? + must << { exists: { field: "landing_page.citationDoi" }} if options[:link_check_found_citation_doi].present? + must << { range: { "landing_page.redirectCount": { "gte": options[:link_check_redirect_count_gte] } } } if options[:link_check_redirect_count_gte].present? must_not = [] @@ -139,9 +145,10 @@ def query(query, options={}) must_not << { exists: { field: "deleted_at" }} unless options[:include_deleted] elsif self.name == "Client" must << { range: { created: { gte: "#{options[:year].split(",").min}||/y", lte: "#{options[:year].split(",").max}||/y", format: "yyyy" }}} if options[:year].present? + must << { terms: { "software.raw" => options[:software].split(",") }} if options[:software].present? must_not << { exists: { field: "deleted_at" }} unless options[:include_deleted] elsif self.name == "Doi" - must << { range: { published: { gte: "#{options[:year].split(",").min}||/y", lte: "#{options[:year].split(",").max}||/y", format: "yyyy" }}} if options[:year].present? + must << { range: { registered: { gte: "#{options[:registered].split(",").min}||/y", lte: "#{options[:registered].split(",").max}||/y", format: "yyyy" }}} if options[:registered].present? end __elasticsearch__.search({ diff --git a/app/models/doi.rb b/app/models/doi.rb index f884a1935..2d13fc58a 100644 --- a/app/models/doi.rb +++ b/app/models/doi.rb @@ -4,6 +4,7 @@ class Doi < ActiveRecord::Base include Metadatable include Cacheable include Licensable + include Dateable # include helper module for generating random DOI suffixes include Helpable @@ -32,12 +33,12 @@ class Doi < ActiveRecord::Base event :register do # can't register test prefix - transitions :from => [:draft], :to => :registered, :unless => :is_test_prefix? + transitions :from => [:draft], :to => :registered, :if => [:registerable?] end event :publish do # can't index test prefix - transitions :from => [:draft], :to => :findable, :unless => :is_test_prefix? + transitions :from => [:draft], :to => :findable, :if => [:registerable?] transitions :from => :registered, :to => :findable end @@ -57,12 +58,15 @@ class Doi < ActiveRecord::Base self.table_name = "dataset" alias_attribute :created_at, :created alias_attribute :updated_at, :updated - alias_attribute :resource_type_subtype, :additional_type - alias_attribute :published, :date_published alias_attribute :registered, :minted + alias_attribute :state, :aasm_state attr_accessor :current_user - attr_accessor :validate + + attribute :regenerate, :boolean, default: false + attribute :only_validate, :boolean, default: false + attribute :should_validate, :boolean, default: false + attribute :agency, :string, default: "DataCite" belongs_to :client, foreign_key: :datacentre has_many :media, -> { order "created DESC" }, foreign_key: :dataset, dependent: :destroy @@ -76,19 +80,18 @@ class Doi < ActiveRecord::Base # from https://www.crossref.org/blog/dois-and-matching-regular-expressions/ but using uppercase validates_format_of :doi, :with => /\A10\.\d{4,5}\/[-\._;()\/:a-zA-Z0-9\*~\$\=]+\z/, :on => :create validates_format_of :url, :with => /\A(ftp|http|https):\/\/[\S]+/ , if: :url?, message: "URL is not valid" - validates_uniqueness_of :doi, message: "This DOI has already been taken" + validates_uniqueness_of :doi, message: "This DOI has already been taken", unless: :only_validate validates :last_landing_page_status, numericality: { only_integer: true }, if: :last_landing_page_status? - - # validate :validation_errors + validates :xml, presence: true, xml_schema: true, :if => Proc.new { |doi| doi.validatable? } after_commit :update_url, on: [:create, :update] after_commit :update_media, on: [:create, :update] - before_save :set_defaults, :update_metadata + before_validation :update_xml, if: :regenerate + before_save :set_defaults, :save_metadata before_create { self.created = Time.zone.now.utc.iso8601 } scope :q, ->(query) { where("dataset.doi = ?", query) } - scope :not_indexed, -> { where("updated > indexed") } # use different index for testing index_name Rails.env.test? ? "dois-test" : "dois" @@ -99,17 +102,42 @@ class Doi < ActiveRecord::Base indexes :doi, type: :keyword indexes :identifier, type: :keyword indexes :url, type: :text, fields: { keyword: { type: "keyword" }} - indexes :author_normalized, type: :object, properties: { - type: { type: :keyword }, - id: { type: :keyword }, + indexes :creators, type: :object, properties: { + nameType: { type: :keyword }, + nameIdentifiers: { type: :object, properties: { + nameIdentifier: { type: :keyword }, + nameIdentifierScheme: { type: :keyword } + }}, name: { type: :text }, - "given-name" => { type: :text }, - "family-name" => { type: :text } + givenName: { type: :text }, + familyName: { type: :text }, + affiliation: { type: :text } + } + indexes :contributors, type: :object, properties: { + nameType: { type: :keyword }, + nameIdentifiers: { type: :object, properties: { + nameIdentifier: { type: :keyword }, + nameIdentifierScheme: { type: :keyword } + }}, + name: { type: :text }, + givenName: { type: :text }, + familyName: { type: :text }, + affiliation: { type: :text }, + contributorType: { type: :keyword } + } + indexes :creator_names, type: :text + indexes :titles, type: :object, properties: { + title: { type: :keyword }, + titleType: { type: :keyword }, + lang: { type: :keyword } + } + indexes :descriptions, type: :object, properties: { + description: { type: :keyword }, + descriptionType: { type: :keyword }, + lang: { type: :keyword } } - indexes :author_names, type: :text - indexes :title_normalized, type: :text - indexes :description_normalized, type: :text indexes :publisher, type: :text, fields: { keyword: { type: "keyword" }} + indexes :publication_year, type: :date, format: "yyyy", ignore_malformed: true indexes :client_id, type: :keyword indexes :provider_id, type: :keyword indexes :resource_type_id, type: :keyword @@ -121,15 +149,71 @@ class Doi < ActiveRecord::Base url: { type: :text }, media_type: { type: :keyword }, version: { type: :keyword }, - created: { type: :date }, - updated: { type: :date } + created: { type: :date, ignore_malformed: true }, + updated: { type: :date, ignore_malformed: true } + } + indexes :identifiers, type: :object, properties: { + identifierType: { type: :keyword }, + identifier: { type: :keyword } } - indexes :alternate_identifier, type: :object, properties: { + indexes :related_identifiers, type: :object, properties: { + relatedIdentifierType: { type: :keyword }, + relatedIdentifier: { type: :keyword }, + relationType: { type: :keyword }, + resourceTypeGeneral: { type: :keyword } + } + indexes :types, type: :object, properties: { + resourceTypeGeneral: { type: :keyword }, + resourceType: { type: :keyword }, + schemaOrg: { type: :keyword }, + bibtex: { type: :keyword }, + citeproc: { type: :keyword }, + ris: { type: :keyword } + } + indexes :funding_references, type: :object, properties: { + funderName: { type: :keyword }, + funderIdentifier: { type: :keyword }, + funderIdentifierType: { type: :keyword }, + awardNumber: { type: :keyword }, + awardUri: { type: :keyword }, + awardTitle: { type: :keyword } + } + indexes :dates, type: :object, properties: { + date: { type: :date, format: "yyyy-MM-dd||yyyy-MM||yyyy", ignore_malformed: true }, + dateType: { type: :keyword } + } + indexes :geo_locations, type: :object, properties: { + geoLocationPoint: { type: :object }, + geoLocationBox: { type: :object }, + geoLocationPlace: { type: :keyword } + } + indexes :rights_list, type: :object, properties: { + rights: { type: :keyword }, + rightsUri: { type: :keyword } + } + indexes :subjects, type: :object, properties: { + subject: { type: :keyword }, + subjectScheme: { type: :keyword }, + schemeUri: { type: :keyword }, + valueUri: { type: :keyword } + } + indexes :container, type: :object, properties: { type: { type: :keyword }, - name: { type: :keyword } + identifier: { type: :keyword }, + identifierType: { type: :keyword }, + title: { type: :keyword }, + volume: { type: :keyword }, + issue: { type: :keyword }, + firstPage: { type: :keyword }, + lastPage: { type: :keyword } } - indexes :resource_type_subtype, type: :keyword - indexes :version, type: :integer + + indexes :xml, type: :text, index: "not_analyzed" + indexes :content_url, type: :keyword + indexes :version_info, type: :keyword + indexes :formats, type: :keyword + indexes :sizes, type: :keyword + indexes :language, type: :keyword indexes :is_active, type: :keyword indexes :aasm_state, type: :keyword indexes :schema_version, type: :keyword @@ -138,19 +222,30 @@ class Doi < ActiveRecord::Base indexes :prefix, type: :keyword indexes :suffix, type: :keyword indexes :reason, type: :text - indexes :xml, type: :text, index: "no" - indexes :last_landing_page_status, type: :integer - indexes :last_landing_page_status_check, type: :date - indexes :last_landing_page_content_type, type: :keyword + indexes :landing_page, type: :object, properties: { + checked: { type: :date, ignore_malformed: true }, + url: { type: :string }, + status: { type: :integer }, + contentType: { type: :string }, + error: { type: :keyword }, + redirectCount: { type: :integer }, + redirectUrls: { type: :keyword }, + downloadLatency: { type: :scaled_float, scaling_factor: 100 }, + hasSchemaOrg: { type: :boolean }, + schemaOrgId: { type: :keyword }, + dcIdentifier: { type: :keyword }, + citationDoi: { type: :keyword }, + bodyHasPid: { type: :boolean } + } indexes :cache_key, type: :keyword - indexes :published, type: :date, format: "yyyy-MM-dd||yyyy-MM||yyyy", ignore_malformed: true - indexes :registered, type: :date - indexes :created, type: :date - indexes :updated, type: :date + indexes :registered, type: :date, ignore_malformed: true + indexes :created, type: :date, ignore_malformed: true + indexes :updated, type: :date, ignore_malformed: true # include parent objects - indexes :client, type: :object - indexes :resource_type, type: :object + indexes :client, type: :object + indexes :provider, type: :object + indexes :resource_type, type: :object end def as_indexed_json(options={}) @@ -160,36 +255,47 @@ def as_indexed_json(options={}) "doi" => doi, "identifier" => identifier, "url" => url, - "author_normalized" => author_normalized, - "author_names" => author_names, - "title_normalized" => title_normalized, - "description_normalized" => description_normalized, + "creators" => creators, + "contributors" => contributors, + "creator_names" => creator_names, + "titles" => titles, + "descriptions" => descriptions, "publisher" => publisher, "client_id" => client_id, "provider_id" => provider_id, + "resource_type_id" => resource_type_id, "media_ids" => media_ids, "prefix" => prefix, "suffix" => suffix, - "resource_type_id" => resource_type_id, - "resource_type_subtype" => resource_type_subtype, - "alternate_identifier" => alternate_identifier, - "b_version" => b_version, + "types" => types, + "identifiers" => identifiers, + "related_identifiers" => related_identifiers, + "funding_references" => funding_references, + "publication_year" => publication_year, + "dates" => dates, + "geo_locations" => geo_locations, + "rights_list" => rights_list, + "container" => container, + "content_url" => content_url, + "version_info" => version_info, + "formats" => formats, + "sizes" => sizes, + "language" => language, + "subjects" => subjects, + "xml" => xml, "is_active" => is_active, - "last_landing_page_status" => last_landing_page_status, - "last_landing_page_status_check" => last_landing_page_status_check, - "last_landing_page_content_type" => last_landing_page_content_type, + "landing_page" => landing_page, "aasm_state" => aasm_state, "schema_version" => schema_version, "metadata_version" => metadata_version, "reason" => reason, - "xml_encoded" => xml_encoded, "source" => source, "cache_key" => cache_key, - "published" => published, "registered" => registered, "created" => created, "updated" => updated, "client" => client.as_indexed_json, + "provider" => provider.as_indexed_json, "resource_type" => resource_type.try(:as_indexed_json), "media" => media.map { |m| m.try(:as_indexed_json) } } @@ -197,22 +303,27 @@ def as_indexed_json(options={}) def self.query_aggregations { - resource_types: { terms: { field: 'resource_type_id', size: 15, min_doc_count: 1 } }, - states: { terms: { field: 'aasm_state', size: 10, min_doc_count: 1 } }, - years: { date_histogram: { field: 'published', interval: 'year', min_doc_count: 1 } }, + resource_types: { terms: { field: 'types.resourceTypeGeneral', size: 15, min_doc_count: 1 } }, + states: { terms: { field: 'aasm_state', size: 15, min_doc_count: 1 } }, + years: { date_histogram: { field: 'publication_year', interval: 'year', min_doc_count: 1 } }, created: { date_histogram: { field: 'created', interval: 'year', min_doc_count: 1 } }, registered: { date_histogram: { field: 'registered', interval: 'year', min_doc_count: 1 } }, - providers: { terms: { field: 'provider_id', size: 10, min_doc_count: 1 } }, - clients: { terms: { field: 'client_id', size: 50, min_doc_count: 1 } }, - prefixes: { terms: { field: 'prefix', size: 10, min_doc_count: 1 } }, - schema_versions: { terms: { field: 'schema_version', size: 10, min_doc_count: 1 } }, - link_checks: { terms: { field: 'last_landing_page_status', size: 10, min_doc_count: 1 } }, - sources: { terms: { field: 'source', size: 10, min_doc_count: 1 } } + providers: { terms: { field: 'provider_id', size: 15, min_doc_count: 1 } }, + clients: { terms: { field: 'client_id', size: 15, min_doc_count: 1 } }, + prefixes: { terms: { field: 'prefix', size: 15, min_doc_count: 1 } }, + schema_versions: { terms: { field: 'schema_version', size: 15, min_doc_count: 1 } }, + link_checks_status: { terms: { field: 'landing_page.status', size: 15, min_doc_count: 1 } }, + link_checks_has_schema_org: { terms: { field: 'landing_page.hasSchemaOrg', size: 2, min_doc_count: 1 } }, + link_checks_schema_org_id: { value_count: { field: "landing_page.schemaOrgId" } }, + link_checks_dc_identifier: { value_count: { field: "landing_page.dcIdentifier" } }, + link_checks_citation_doi: { value_count: { field: "landing_page.citationDoi" } }, + links_checked: { value_count: { field: "landing_page.checked" } }, + sources: { terms: { field: 'source', size: 15, min_doc_count: 1 } }, } end def self.query_fields - ['doi^10', 'title_normalized^10', 'author_names^10', 'author_normalized.name^10', 'author_normalized.id^10', 'publisher^10', 'description_normalized^10', 'resource_type_id^10', 'resource_type_subtype^10', 'alternate_identifier.name^10', '_all'] + ['doi^10', 'titles.title^10', 'creator_names^10', 'creators.name^10', 'creators.id^10', 'publisher^10', 'descriptions.description^10', 'types.resourceTypeGeneral^10', 'subjects.subject^10', 'identifiers.identifier^10', 'related_identifiers.relatedIdentifier^10', '_all'] end def self.find_by_id(id, options={}) @@ -228,39 +339,86 @@ def self.find_by_id(id, options={}) }) end + def self.import_all(options={}) + from_date = options[:from_date].present? ? Date.parse(options[:from_date]) : Date.current + until_date = options[:until_date].present? ? Date.parse(options[:until_date]) : Date.current + + # get every day between from_date and until_date + (from_date..until_date).each do |d| + DoiImportByDayJob.perform_later(from_date: d.strftime("%F")) + puts "Queued importing for DOIs created on #{d.strftime("%F")}." + end + end + + def self.import_by_day(options={}) + return nil unless options[:from_date].present? + from_date = Date.parse(options[:from_date]) + + count = 0 + + logger = Logger.new(STDOUT) + + Doi.where(created: from_date.midnight..from_date.end_of_day).find_each do |doi| + begin + string = doi.current_metadata.present? ? doi.current_metadata.xml : nil + meta = doi.read_datacite(string: string, sandbox: doi.sandbox) + attrs = %w(creators contributors titles publisher publication_year types descriptions container sizes formats language dates identifiers related_identifiers funding_references geo_locations rights_list subjects content_url).map do |a| + [a.to_sym, meta[a]] + end.to_h.merge(schema_version: meta["schema_version"] || "http://datacite.org/schema/kernel-4", version_info: meta["version"], xml: string) + + doi.update_columns(attrs) + rescue TypeError, NoMethodError => error + logger.error "[MySQL] Error importing metadata for " + doi.doi + ": " + error.message + else + count += 1 + end + end + + if count > 0 + logger.info "[MySQL] Imported metadata for #{count} DOIs created on #{options[:from_date]}." + end + end + def self.index(options={}) from_date = options[:from_date].present? ? Date.parse(options[:from_date]) : Date.current until_date = options[:until_date].present? ? Date.parse(options[:until_date]) : Date.current + index_time = options[:index_time].presence || Time.zone.now.utc.iso8601 # get every day between from_date and until_date (from_date..until_date).each do |d| - DoiIndexByDayJob.perform_later(from_date: d.strftime("%F")) + DoiIndexByDayJob.perform_later(from_date: d.strftime("%F"), index_time: index_time) puts "Queued indexing for DOIs created on #{d.strftime("%F")}." - end + end end def self.index_by_day(options={}) return nil unless options[:from_date].present? from_date = Date.parse(options[:from_date]) - + index_time = options[:index_time].presence || Time.zone.now.utc.iso8601 + errors = 0 count = 0 logger = Logger.new(STDOUT) - Doi.where(created: from_date.midnight..from_date.end_of_day).not_indexed.find_in_batches(batch_size: 500) do |dois| + Doi.where(created: from_date.midnight..from_date.end_of_day).where("indexed < ?", index_time).find_in_batches(batch_size: 500) do |dois| response = Doi.__elasticsearch__.client.bulk \ index: Doi.index_name, type: Doi.document_type, body: dois.map { |doi| { index: { _id: doi.id, data: doi.as_indexed_json } } } + # log errors errors += response['items'].map { |k, v| k.values.first['error'] }.compact.length - count += dois.length + response['items'].select { |k, v| k.values.first['error'].present? }.each do |err| + logger.error "[Elasticsearch] " + err.inspect + end + dois.each { |doi| doi.update_column(:indexed, Time.zone.now) } + count += dois.length end if errors > 1 - logger.info "[Elasticsearch] #{errors} errors indexing #{count} DOIs created on #{options[:from_date]}." + logger.error "[Elasticsearch] #{errors} errors indexing #{count} DOIs created on #{options[:from_date]}." elsif count > 1 logger.info "[Elasticsearch] Indexed #{count} DOIs created on #{options[:from_date]}." end @@ -269,12 +427,12 @@ def self.index_by_day(options={}) count = 0 - Doi.where(created: from_date.midnight..from_date.end_of_day).not_indexed.find_each do |doi| + Doi.where(created: from_date.midnight..from_date.end_of_day).where("indexed < ?", index_time).find_each do |doi| IndexJob.perform_later(doi) - doi.update_column(:indexed, Time.zone.now) + doi.update_column(:indexed, Time.zone.now) count += 1 end - + logger.info "[Elasticsearch] Indexed #{count} DOIs created on #{options[:from_date]}." end @@ -283,7 +441,7 @@ def uid end def resource_type_id - resource_type_general.underscore.dasherize if resource_type_general.present? + types["resourceTypeGeneral"].underscore.dasherize if types.to_h["resourceTypeGeneral"].present? end def media_ids @@ -292,26 +450,14 @@ def media_ids def xml_encoded Base64.strict_encode64(xml) if xml.present? - rescue ArgumentError => exception + rescue ArgumentError => exception nil end - - def title_normalized - parse_attributes(title, content: "text", first: true) - end - def description_normalized - parse_attributes(description, content: "text", first: true) - end - - def author_normalized - Array.wrap(author) - end - - # author name in natural order: "John Smith" instead of "Smith, John" - def author_names - Array.wrap(author).map do |a| - if a["familyName"].present? + # creator name in natural order: "John Smith" instead of "Smith, John" + def creator_names + Array.wrap(creators).map do |a| + if a["familyName"].present? [a["givenName"], a["familyName"]].join(" ") elsif a["name"].to_s.include?(", ") a["name"].split(", ", 2).reverse.join(" ") @@ -334,8 +480,9 @@ def client_id end def client_id=(value) - r = cached_client_response(value) - return @client_id unless r.present? + r = ::Client.where(symbol: value).first + #r = cached_client_response(value) + fail ActiveRecord::RecordNotFound unless r.present? write_attribute(:datacentre, r.id) end @@ -356,10 +503,22 @@ def is_test_prefix? prefix == "10.5072" end + def registerable? + prefix != "10.5072" && url.present? + end + + # def is_valid? + # valid? && url.present? + # end + def is_registered_or_findable? %w(registered findable).include?(aasm_state) end + def validatable? + %w(registered findable).include?(aasm_state) || should_validate || only_validate + end + # update URL in handle system for registered and findable state # providers europ and ethz do their own handle registration def update_url @@ -374,7 +533,7 @@ def update_media media.delete_all Array.wrap(content_url).each do |c| - media << Media.create(url: c, media_type: content_format) + media << Media.create(url: c, media_type: formats) end end @@ -402,7 +561,7 @@ def current_media end def resource_type - cached_resource_type_response(resource_type_general.underscore.dasherize.downcase) if resource_type_general.present? + cached_resource_type_response(types["resourceTypeGeneral"].underscore.dasherize.downcase) if types.to_h["resourceTypeGeneral"].present? end def date_registered @@ -422,13 +581,13 @@ def event=(value) self.send(value) if %w(register publish hide).include?(value) end - # update state for all DOIs in state "undetermined" starting from from_date + # update state for all DOIs in state "" starting from from_date def self.set_state(from_date: nil) from_date ||= Time.zone.now - 1.day Doi.where("updated >= ?", from_date).where(aasm_state: '').find_each do |doi| - if doi.is_test_prefix? || (doi.is_active == "\x00" && doi.minted.blank?) + if doi.is_test_prefix? || (doi.is_active.getbyte(0) == 0 && doi.minted.blank?) state = "draft" - elsif doi.is_active == "\x00" && doi.minted.present? + elsif doi.is_active.to_s.getbyte(0) == 0 && doi.minted.present? state = "registered" else state = "findable" @@ -479,24 +638,75 @@ def self.set_url(from_date: nil) "Queued storing missing URL in database for DOIs updated since #{from_date.strftime("%F")}." end - # update metadata when any virtual attribute has changed - def update_metadata - changed_virtual_attributes = changed & %w(author title publisher date_published additional_type resource_type_general description content_size content_format) - - if changed_virtual_attributes.present? - @xml = datacite_xml - doc = Nokogiri::XML(xml, nil, 'UTF-8', &:noblanks) - ns = doc.collect_namespaces.find { |k, v| v.start_with?("http://datacite.org/schema/kernel") } - @schema_version = Array.wrap(ns).last || "http://datacite.org/schema/kernel-4" - attribute_will_change!(:xml) - end - - metadata.build(doi: self, xml: xml, namespace: schema_version) if (changed & %w(xml)).present? + # save to metadata table when xml has changed + def save_metadata + metadata.build(doi: self, xml: xml, namespace: schema_version) if xml.present? && xml_changed? end def set_defaults self.is_active = (aasm_state == "findable") ? "\x01" : "\x00" - self.version = version.present? ? version + 1 : 0 + self.version = version.present? ? version + 1 : 1 self.updated = Time.zone.now.utc.iso8601 end + + def self.migrate_landing_page(options={}) + logger = Logger.new(STDOUT) + logger.info "Starting migration" + + # Handle camel casing first. + Doi.where.not('last_landing_page_status_result' => nil).find_each do |doi| + begin + # First we try and fix into camel casing + result = doi.last_landing_page_status_result + mappings = { + "body-has-pid" => "bodyHasPid", + "dc-identifier" => "dcIdentifier", + "citation-doi" => "citationDoi", + "redirect-urls" => "redirectUrls", + "schema-org-id" => "schemaOrgId", + "has-schema-org" => "hasSchemaOrg", + "redirect-count" => "redirectCount", + "download-latency" => "downloadLatency" + } + result = result.map {|k, v| [mappings[k] || k, v] }.to_h +# doi.update_columns("last_landing_page_status_result": result) + + # Do a fix of the stored download Latency + # Sometimes was floating point precision, we dont need this + download_latency = result['downloadLatency'] + download_latency = download_latency.nil? ? download_latency : download_latency.round + + # Try to put the checked date into ISO8601 + # If we dont have one (there was legacy reasons) then set to unix epoch + checked = doi.last_landing_page_status_check + checked = checked.nil? ? Time.at(0) : checked + checked = checked.iso8601 + + # Next we want to build a new landing_page result. + landing_page = { + "checked" => checked, + "status" => doi.last_landing_page_status, + "url" => doi.last_landing_page, + "contentType" => doi.last_landing_page_content_type, + "error" => result['error'], + "redirectCount" => result['redirectCount'], + "redirectUrls" => result['redirectUrls'], + "downloadLatency" => download_latency, + "hasSchemaOrg" => result['hasSchemaOrg'], + "schemaOrgId" => result['schemaOrgId'], + "dcIdentifier" => result['dcIdentifier'], + "citationDoi" => result['citationDoi'], + "bodyHasPid" => result['bodyHasPid'], + } + + doi.update_columns("landing_page": landing_page) + + logger.info "Updated " + doi.doi + + rescue TypeError, NoMethodError => error + logger.error "Error updating landing page " + doi.doi + ": " + error.message + end + end + end + end diff --git a/app/models/provider.rb b/app/models/provider.rb index ccb8cea59..db1a18a0b 100644 --- a/app/models/provider.rb +++ b/app/models/provider.rb @@ -36,8 +36,8 @@ class Provider < ActiveRecord::Base validates_format_of :contact_email, :with => /\A([^@\s]+)@((?:[-a-z0-9]+\.)+[a-z]{2,})\Z/i, message: "contact_email should be an email" validates_format_of :website, :with => /https?:\/\/[\S]+/ , if: :website?, message: "Website should be an url" validates_inclusion_of :role_name, :in => %w( ROLE_ALLOCATOR ROLE_MEMBER ROLE_ADMIN ROLE_DEV ), :message => "Role %s is not included in the list" - validates_inclusion_of :organization_type, :in => %w(national_institution national_library academic_institution academic_library research_institution government_agency publisher professional_society service_provider vendor), :message => "organization type %s is not included in the list", if: :organization_type? - validates_inclusion_of :focus_area, :in => %w(biomedical_and_health_sciences earth_sciences humanities mathematics_and_computer_science physical_sciences_and_engineering social_sciences general), :message => "focus area %s is not included in the list", if: :focus_area? + validates_inclusion_of :organization_type, :in => %w(nationalInstitution nationalLibrary academicInstitution academicLibrary researchInstitution governmentAgency publisher professionalSociety serviceProvider vendor), :message => "organization type %s is not included in the list", if: :organization_type? + validates_inclusion_of :focus_area, :in => %w(biomedicalAndHealthSciences earthSciences humanities mathematicsAndComputerScience physicalSciencesAndEngineering socialSciences general), :message => "focus area %s is not included in the list", if: :focus_area? validate :freeze_symbol, :on => :update before_validation :set_region diff --git a/app/models/user.rb b/app/models/user.rb index 1e3fef236..cdfb5b789 100644 --- a/app/models/user.rb +++ b/app/models/user.rb @@ -8,6 +8,9 @@ class User # include helper module for setting emails via Mailgun API include Mailable + # include helper module for caching infrequently changing resources + include Cacheable + attr_accessor :name, :uid, :email, :role_id, :jwt, :password, :provider_id, :client_id, :beta_tester, :errors def initialize(credentials, options={}) @@ -38,6 +41,8 @@ def initialize(credentials, options={}) alias_attribute :orcid, :uid alias_attribute :id, :uid alias_attribute :flipper_id, :uid + alias_attribute :provider, :allocator + alias_attribute :client, :datacentre # Helper method to check for admin user def is_admin? @@ -54,18 +59,16 @@ def is_beta_tester? beta_tester end - def allocator + def provider return nil unless provider_id.present? - p = Provider.where(symbol: provider_id).first - p.id if p.present? + cached_provider_response(provider_id) end - def datacentre + def client return nil unless client_id.present? - c = Client.where(symbol: client_id).first - c.id if c.present? + cached_client_response(client_id) end def self.reset(username) diff --git a/app/serializers/client_prefix_serializer.rb b/app/serializers/client_prefix_serializer.rb index 7bf3219e5..44677417a 100644 --- a/app/serializers/client_prefix_serializer.rb +++ b/app/serializers/client_prefix_serializer.rb @@ -1,6 +1,6 @@ class ClientPrefixSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type "client-prefixes" set_id :uid cache_options enabled: true, cache_length: 24.hours diff --git a/app/serializers/client_serializer.rb b/app/serializers/client_serializer.rb index 8788e2a65..96c9fbf72 100644 --- a/app/serializers/client_serializer.rb +++ b/app/serializers/client_serializer.rb @@ -1,6 +1,6 @@ class ClientSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type :clients set_id :uid @@ -11,7 +11,7 @@ class ClientSerializer has_many :prefixes, record_type: :prefixes attribute :is_active do |object| - object.is_active == "\u0001" ? true : false + object.is_active.getbyte(0) == 1 ? true : false end attribute :has_password do |object| diff --git a/app/serializers/data_center_serializer.rb b/app/serializers/data_center_serializer.rb index 2e6a73234..0a92f7e01 100644 --- a/app/serializers/data_center_serializer.rb +++ b/app/serializers/data_center_serializer.rb @@ -7,7 +7,7 @@ class DataCenterSerializer attributes :title, :other_names, :prefixes, :member_id, :year, :created, :updated - belongs_to :member, record_type: :members, id_method_name: :provider_id + belongs_to :provider, key: :member, record_type: :members, serializer: :Member attribute :title do |object| object.name diff --git a/app/serializers/doi_serializer.rb b/app/serializers/doi_serializer.rb index 880473178..e74824873 100644 --- a/app/serializers/doi_serializer.rb +++ b/app/serializers/doi_serializer.rb @@ -1,55 +1,36 @@ class DoiSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type :dois set_id :uid - attributes :doi, :identifier, :url, :prefix, :suffix, :author, :title, :publisher, :resource_type_subtype, :description, :version, :metadata_version, :schema_version, :reason, :source, :state, :is_active, :landing_page, :published, :created, :registered, :updated, :xml, :cache_key + attributes :doi, :prefix, :suffix, :identifiers, :creators, :titles, :publisher, :container, :publication_year, :subjects, :contributors, :dates, :language, :types, :related_identifiers, :sizes, :formats, :version, :rights_list, :descriptions, :geo_locations, :funding_references, :xml, :url, :content_url, :metadata_version, :schema_version, :source, :is_active, :state, :reason, :landing_page, :created, :registered, :updated + attributes :prefix, :suffix, if: Proc.new { |object, params| params && params[:detail] } belongs_to :client, record_type: :clients - belongs_to :resource_type, record_type: :resource_types has_many :media - attribute :doi do |object| - object.doi.downcase - end - - attribute :author do |object| - object.author_normalized - end - - attribute :title do |object| - object.title_normalized + attribute :xml, if: Proc.new { |object, params| params && params[:detail] } do |object| + object.xml_encoded end - attribute :description do |object| - object.description_normalized + attribute :doi do |object| + object.doi.downcase end attribute :state do |object| object.aasm_state end - attribute :is_active do |object| - object.is_active == "\u0001" ? true : false - end - attribute :version do |object| - object.b_version + object.version_info end - attribute :xml do |object| - object.xml_encoded + attribute :is_active do |object| + object.is_active.to_s.getbyte(0) == 1 ? true : false end - attribute :landing_page, if: Proc.new { - |object, params| - params[:current_ability] && params[:current_ability].can?(:read_landing_page_results, object) == true - } do |object| - { status: object.last_landing_page_status, - "content-type" => object.last_landing_page_content_type, - checked: object.last_landing_page_status_check, - "result" => object.try(:last_landing_page_status_result) } + attribute :landing_page, if: Proc.new { |object, params| params[:current_ability] && params[:current_ability].can?(:read_landing_page_results, object) == true } do |object| + object.landing_page end - end diff --git a/app/serializers/media_serializer.rb b/app/serializers/media_serializer.rb index d5e879b61..ec109448f 100644 --- a/app/serializers/media_serializer.rb +++ b/app/serializers/media_serializer.rb @@ -1,6 +1,6 @@ class MediaSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type "media" set_id :uid cache_options enabled: true, cache_length: 24.hours diff --git a/app/serializers/metadata_serializer.rb b/app/serializers/metadata_serializer.rb index 7bd18b2ef..7194650d9 100644 --- a/app/serializers/metadata_serializer.rb +++ b/app/serializers/metadata_serializer.rb @@ -1,6 +1,6 @@ class MetadataSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type "metadata" set_id :uid cache_options enabled: true, cache_length: 24.hours diff --git a/app/serializers/prefix_serializer.rb b/app/serializers/prefix_serializer.rb index f0b3e085e..b642c2f63 100644 --- a/app/serializers/prefix_serializer.rb +++ b/app/serializers/prefix_serializer.rb @@ -1,6 +1,6 @@ class PrefixSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type :prefixes set_id :prefix cache_options enabled: true, cache_length: 24.hours diff --git a/app/serializers/provider_prefix_serializer.rb b/app/serializers/provider_prefix_serializer.rb index 3774fb4b1..b89aaf335 100644 --- a/app/serializers/provider_prefix_serializer.rb +++ b/app/serializers/provider_prefix_serializer.rb @@ -1,6 +1,6 @@ class ProviderPrefixSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type "provider-prefixes" set_id :uid attributes :created, :updated diff --git a/app/serializers/provider_serializer.rb b/app/serializers/provider_serializer.rb index 3d8490242..65aad32aa 100644 --- a/app/serializers/provider_serializer.rb +++ b/app/serializers/provider_serializer.rb @@ -1,6 +1,6 @@ class ProviderSerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type :providers set_id :uid @@ -13,7 +13,7 @@ class ProviderSerializer end attribute :is_active do |object| - object.is_active == "\u0001" ? true : false + object.is_active.getbyte(0) == 1 ? true : false end attribute :has_password do |object| diff --git a/app/serializers/repository_serializer.rb b/app/serializers/repository_serializer.rb index d8c932e68..df441b0e2 100644 --- a/app/serializers/repository_serializer.rb +++ b/app/serializers/repository_serializer.rb @@ -1,6 +1,6 @@ class RepositorySerializer include FastJsonapi::ObjectSerializer - set_key_transform :dash + set_key_transform :camel_lower set_type :repositories cache_options enabled: true, cache_length: 24.hours diff --git a/app/serializers/resource_type_serializer.rb b/app/serializers/resource_type_serializer.rb index d1920131d..17c4be62e 100644 --- a/app/serializers/resource_type_serializer.rb +++ b/app/serializers/resource_type_serializer.rb @@ -5,4 +5,4 @@ class ResourceTypeSerializer cache_options enabled: true, cache_length: 24.hours attributes :title, :updated -end +end \ No newline at end of file diff --git a/app/serializers/work_serializer.rb b/app/serializers/work_serializer.rb new file mode 100644 index 000000000..f5a216793 --- /dev/null +++ b/app/serializers/work_serializer.rb @@ -0,0 +1,92 @@ +class WorkSerializer + include FastJsonapi::ObjectSerializer + set_key_transform :dash + set_type :works + set_id :identifier + + attributes :doi, :identifier, :url, :author, :title, :container_title, :description, :resource_type_subtype, :data_center_id, :member_id, :resource_type_id, :version, :license, :schema_version, :results, :related_identifiers, :published, :registered, :checked, :updated, :media, :xml + + belongs_to :client, key: "data-center", record_type: "data-centers", serializer: :DataCenter + belongs_to :provider, key: :member, record_type: :members, serializer: :Member + belongs_to :resource_type, record_type: "resource-types", serializer: :ResourceType + + attribute :author do |object| + Array.wrap(object.creators).map do |c| + if (c["givenName"].present? || c["familyName"].present?) + { "given" => c["givenName"], + "family" => c["familyName"] }.compact + else + { "literal" => c["name"] }.presence + end + end + end + + attribute :doi do |object| + object.doi.downcase + end + + attribute :title do |object| + Array.wrap(object.titles).first.to_h.fetch("title", nil) + end + + attribute :description do |object| + Array.wrap(object.descriptions).first.to_h.fetch("title", nil) + end + + attribute :container_title do |object| + object.publisher + end + + attribute :resource_type_subtype do |object| + object.types.to_h.fetch("resourceType", nil) + end + + attribute :resource_type_id do |object| + rt = object.types.to_h.fetch("resourceTypeGeneral", nil) + if rt + rt.downcase.dasherize + else + nil + end + end + + attribute :data_center_id do |object| + object.client_id + end + + attribute :member_id do |object| + object.provider_id + end + + attribute :version do |object| + object.version_info + end + + attribute :schema_version do |object| + object.schema_version.to_s.split("-", 2).last.presence + end + + attribute :license do |object| + Array.wrap(object.rights_list).first.to_h.fetch("rightsUri", nil) + end + + attribute :results do |object| + [] + end + + attribute :related_identifiers do |object| + [] + end + + attribute :published do |object| + object.publication_year.to_s.presence + end + + attribute :xml do |object| + Base64.strict_encode64(object.xml) if object.xml.present? + end + + attribute :checked do |object| + nil + end +end \ No newline at end of file diff --git a/bin/rspec b/bin/rspec new file mode 100755 index 000000000..6e6709219 --- /dev/null +++ b/bin/rspec @@ -0,0 +1,8 @@ +#!/usr/bin/env ruby +begin + load File.expand_path('../spring', __FILE__) +rescue LoadError => e + raise unless e.message.include?('spring') +end +require 'bundler/setup' +load Gem.bin_path('rspec-core', 'rspec') diff --git a/config/application.rb b/config/application.rb index 6ed5f7544..7e7eb0102 100644 --- a/config/application.rb +++ b/config/application.rb @@ -32,7 +32,7 @@ ENV['APPLICATION'] ||= "client-api" ENV['HOSTNAME'] ||= "lupo" ENV['MEMCACHE_SERVERS'] ||= "memcached:11211" -ENV['SITE_TITLE'] ||= "REST API" +ENV['SITE_TITLE'] ||= "DataCite REST API" ENV['LOG_LEVEL'] ||= "info" ENV['CONCURRENCY'] ||= "25" ENV['CDN_URL'] ||= "https://assets.datacite.org" @@ -60,7 +60,6 @@ class Application < Rails::Application # Initialize configuration defaults for originally generated Rails version. config.load_defaults 5.1 config.autoload_paths << Rails.root.join('lib') - config.autoload_paths << Rails.root.join("app", "models", "concerns") # Settings in config/environments/* take precedence over those specified here. # Application configuration should go into files in config/initializers diff --git a/config/initializers/constants.rb b/config/initializers/constants.rb index e4c5bb7d4..477f2578c 100644 --- a/config/initializers/constants.rb +++ b/config/initializers/constants.rb @@ -5,6 +5,12 @@ class IdentifierError < RuntimeError; end ActiveModelSerializers::Adapter::JsonApi::Deserialization::InvalidDocument, JWT::DecodeError, JWT::VerificationError, + JSON::ParserError, + Nokogiri::XML::SyntaxError, + NoMethodError, + SocketError, + ActionDispatch::Http::Parameters::ParseError, + ActiveRecord::RecordNotUnique, ActiveRecord::RecordNotFound, AbstractController::ActionNotFound, ActionController::UnknownFormat, diff --git a/config/initializers/mime_types.rb b/config/initializers/mime_types.rb index 0663c200d..f89abdec4 100644 --- a/config/initializers/mime_types.rb +++ b/config/initializers/mime_types.rb @@ -14,8 +14,6 @@ Mime::Type.register "application/vnd.datacite.datacite+xml", :datacite, %w( application/x-datacite+xml ) Mime::Type.register "application/vnd.datacite.datacite+json", :datacite_json Mime::Type.register "application/vnd.schemaorg.ld+json", :schema_org -Mime::Type.register "application/rdf+xml", :rdf_xml -Mime::Type.register "text/turtle", :turtle Mime::Type.register "application/vnd.jats+xml", :jats Mime::Type.register "application/vnd.citationstyles.csl+json", :citeproc, %w( application/citeproc+json ) Mime::Type.register "application/vnd.codemeta.ld+json", :codemeta @@ -26,68 +24,45 @@ # register renderers for these Mime types # :citation and :datacite is handled differently ActionController::Renderers.add :datacite do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.xml - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[:datacite], - disposition: "attachment; filename=#{filename}.xml" + Array.wrap(obj).map { |o| o.xml }.join("\n") end ActionController::Renderers.add :citation do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.citation - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[:citation], - disposition: "attachment; filename=#{filename}.txt" -end - -ActionController::Renderers.add :turtle do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.send(:turtle) - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[:turtle], - disposition: "attachment; filename=#{filename}.ttl" + begin + Array.wrap(obj).map do |o| + o.style = options[:style] || "apa" + o.locale = options[:locale] || "en-US" + o.citation + end.join("\n\n") + rescue CSL::ParseError # unknown style and/or location + Array.wrap(obj).map do |o| + o.style = "apa" + o.locale = "en-US" + o.citation + end.join("\n\n") + end end %w(datacite_json schema_org crosscite citeproc codemeta).each do |f| ActionController::Renderers.add f.to_sym do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.send(f) - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[f.to_sym], - disposition: "attachment; filename=#{filename}.json" + if obj.is_a?(Array) + "[\n" + Array.wrap(obj).map { |o| o.send(f) }.join(",\n") + "\n]" + else + obj.send(f) + end end end -%w(crossref rdf_xml jats).each do |f| +%w(jats).each do |f| ActionController::Renderers.add f.to_sym do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.send(f) - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[f.to_sym], - disposition: "attachment; filename=#{filename}.xml" + Array.wrap(obj).map { |o| o.send(f) }.join("\n") end end ActionController::Renderers.add :bibtex do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.send("bibtex") - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[:bibtex], - disposition: "attachment; filename=#{filename}.bib" + Array.wrap(obj).map { |o| o.send("bibtex") }.join("\n") end ActionController::Renderers.add :ris do |obj, options| - uri = Addressable::URI.parse(obj.identifier) - data = obj.send("ris") - - filename = uri.path.gsub(/[^0-9A-Za-z.\-]/, '_') - send_data data.to_s, type: Mime[:ris], - disposition: "attachment; filename=#{filename}.ris" + Array.wrap(obj).map { |o| o.send("ris") }.join("\n\n") end diff --git a/config/initializers/turnout.rb b/config/initializers/turnout.rb new file mode 100644 index 000000000..df4a6ca76 --- /dev/null +++ b/config/initializers/turnout.rb @@ -0,0 +1,4 @@ +Turnout.configure do |config| + config.default_maintenance_page = Turnout::MaintenancePage::JSON + config.default_reason = "The site is temporarily down for maintenance. Please check https://status.datacite.org for more information." +end \ No newline at end of file diff --git a/config/routes.rb b/config/routes.rb index a8a9cfe1d..0c3a6251a 100644 --- a/config/routes.rb +++ b/config/routes.rb @@ -7,6 +7,29 @@ # send reset link post 'reset', :to => 'sessions#reset' + # content negotiation + get '/dois/application/vnd.datacite.datacite+xml/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :datacite } + get '/dois/application/vnd.datacite.datacite+json/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :datacite_json } + get '/dois/application/vnd.crosscite.crosscite+json/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :crosscite } + get '/dois/application/vnd.schemaorg.ld+json/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :schema_org } + get '/dois/application/vnd.codemeta.ld+json/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :codemeta } + get '/dois/application/vnd.citationstyles.csl+json/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :citeproc } + get '/dois/application/vnd.jats+xml/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :jats } + get '/dois/application/x-bibtex/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :bibtex } + get '/dois/application/x-research-info-systems/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :ris } + get '/dois/text/x-bibliography/:id', :to => 'dois#show', constraints: { :id => /.+/ }, defaults: { format: :citation } + + get '/dois/application/vnd.datacite.datacite+xml', :to => 'dois#index', defaults: { format: :datacite } + get '/dois/application/vnd.datacite.datacite+json', :to => 'dois#index', defaults: { format: :datacite_json } + get '/dois/application/vnd.crosscite.crosscite+json', :to => 'dois#index', defaults: { format: :crosscite } + get '/dois/application/vnd.schemaorg.ld+json', :to => 'dois#index', defaults: { format: :schema_org } + get '/dois/application/vnd.codemeta.ld+json', :to => 'dois#index', defaults: { format: :codemeta } + get '/dois/application/vnd.citationstyles.csl+json', :to => 'dois#index', defaults: { format: :citeproc } + get '/dois/application/vnd.jats+xml', :to => 'dois#index', defaults: { format: :jats } + get '/dois/application/x-bibtex', :to => 'dois#index', defaults: { format: :bibtex } + get '/dois/application/x-research-info-systems', :to => 'dois#index', defaults: { format: :ris } + get '/dois/text/x-bibliography', :to => 'dois#index', defaults: { format: :citation } + # manage DOIs post 'dois/validate', :to => 'dois#validate' post 'dois/status', :to => 'dois#status' @@ -24,6 +47,7 @@ post 'provider-prefixes/set-created', :to => 'provider_prefixes#set_created' resources :heartbeat, only: [:index] + resources :index, only: [:index] resources :clients, constraints: { :id => /.+/ } do resources :prefixes, constraints: { :id => /.+/ } @@ -54,19 +78,7 @@ # support for legacy routes resources :members, only: [:show, :index] resources :data_centers, only: [:show, :index], constraints: { :id => /.+/ }, path: "/data-centers" - - # content negotiation - get '/application/vnd.datacite.datacite+xml/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :datacite } - get '/application/vnd.datacite.datacite+json/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :datacite_json } - get '/application/vnd.crosscite.crosscite+json/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :crosscite } - get '/application/vnd.schemaorg.ld+json/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :schema_org } - get '/application/vnd.codemeta.ld+json/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :codemeta } - get '/application/vnd.citationstyles.csl+json/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :citeproc } - get '/application/vnd.jats+xml/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :jats } - get '/application/x-bibtex/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :bibtex } - get '/application/x-research-info-systems/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :ris } - get '/text/x-bibliography/:id', :to => 'index#show', constraints: { :id => /.+/ }, defaults: { format: :citation } - resources :index, path: '/', constraints: { :id => /.+/ }, only: [:show, :index] + resources :works, only: [:show, :index], constraints: { :id => /.+/ } # rescue routing errors #match "*path", to: "index#routing_error", via: :all diff --git a/db/migrate/20181102094810_add_schema_attributes.rb b/db/migrate/20181102094810_add_schema_attributes.rb new file mode 100644 index 000000000..93ed12734 --- /dev/null +++ b/db/migrate/20181102094810_add_schema_attributes.rb @@ -0,0 +1,26 @@ +class AddSchemaAttributes < ActiveRecord::Migration[5.2] + def change + add_column :dataset, :creator, :json + add_column :dataset, :contributor, :json + add_column :dataset, :titles, :json + add_column :dataset, :publisher, :text + add_column :dataset, :publication_year, :integer + add_column :dataset, :types, :json + add_column :dataset, :descriptions, :json + add_column :dataset, :periodical, :json + add_column :dataset, :sizes, :json + add_column :dataset, :formats, :json + add_column :dataset, :version_info, :string, limit: 191 + add_column :dataset, :language, :string, limit: 191 + add_column :dataset, :dates, :json + add_column :dataset, :alternate_identifiers, :json + add_column :dataset, :related_identifiers, :json + add_column :dataset, :funding_references, :json + add_column :dataset, :geo_locations, :json + add_column :dataset, :rights_list, :json + add_column :dataset, :subjects, :json + add_column :dataset, :schema_version, :string, limit: 191 + add_column :dataset, :content_url, :json + add_column :dataset, :xml, :binary, limit: 16777215 + end +end diff --git a/db/migrate/20181124062253_add_software_field.rb b/db/migrate/20181124062253_add_software_field.rb new file mode 100644 index 000000000..001409c18 --- /dev/null +++ b/db/migrate/20181124062253_add_software_field.rb @@ -0,0 +1,6 @@ +class AddSoftwareField < ActiveRecord::Migration[5.2] + def change + add_column :datacentre, :software, :string, limit: 191 + add_column :datacentre, :description, :text + end +end \ No newline at end of file diff --git a/db/migrate/20181129100131_add_landing_page_to_dataset.rb b/db/migrate/20181129100131_add_landing_page_to_dataset.rb new file mode 100644 index 000000000..55584af06 --- /dev/null +++ b/db/migrate/20181129100131_add_landing_page_to_dataset.rb @@ -0,0 +1,5 @@ +class AddLandingPageToDataset < ActiveRecord::Migration[5.2] + def change + add_column :dataset, :landing_page, :json + end +end diff --git a/db/migrate/20181130182349_rename_creator_column.rb b/db/migrate/20181130182349_rename_creator_column.rb new file mode 100644 index 000000000..3cdfc0a9d --- /dev/null +++ b/db/migrate/20181130182349_rename_creator_column.rb @@ -0,0 +1,7 @@ +class RenameCreatorColumn < ActiveRecord::Migration[5.2] + def change + rename_column :dataset, :creator, :creators + rename_column :dataset, :contributor, :contributors + add_column :dataset, :agency, :string, limit: 191, default: "DataCite" + end +end diff --git a/db/migrate/20181209231736_rename_doi_columns.rb b/db/migrate/20181209231736_rename_doi_columns.rb new file mode 100644 index 000000000..751fb1009 --- /dev/null +++ b/db/migrate/20181209231736_rename_doi_columns.rb @@ -0,0 +1,6 @@ +class RenameDoiColumns < ActiveRecord::Migration[5.2] + def change + rename_column :dataset, :alternate_identifiers, :identifiers + rename_column :dataset, :periodical, :container + end +end diff --git a/db/schema.rb b/db/schema.rb index 1b1a15770..d67b517f8 100644 --- a/db/schema.rb +++ b/db/schema.rb @@ -10,7 +10,7 @@ # # It's strongly recommended that you check this file into your version control system. -ActiveRecord::Schema.define(version: 2018_10_23_235649) do +ActiveRecord::Schema.define(version: 2018_12_09_231736) do create_table "active_storage_attachments", options: "ENGINE=InnoDB DEFAULT CHARSET=latin1", force: :cascade do |t| t.string "name", limit: 191, null: false @@ -92,6 +92,8 @@ t.datetime "deleted_at" t.string "re3data" t.text "url" + t.string "software", limit: 191 + t.text "description" t.index ["allocator"], name: "FK6695D60546EBD781" t.index ["re3data"], name: "index_datacentre_on_re3data" t.index ["symbol"], name: "symbol", unique: true @@ -130,6 +132,30 @@ t.string "reason" t.string "source", limit: 191 t.datetime "indexed", precision: 3, default: "1970-01-01 00:00:00", null: false + t.json "creators" + t.json "contributors" + t.json "titles" + t.text "publisher" + t.integer "publication_year" + t.json "types" + t.json "descriptions" + t.json "container" + t.json "sizes" + t.json "formats" + t.string "version_info", limit: 191 + t.string "language", limit: 191 + t.json "dates" + t.json "identifiers" + t.json "related_identifiers" + t.json "funding_references" + t.json "geo_locations" + t.json "rights_list" + t.json "subjects" + t.string "schema_version", limit: 191 + t.json "content_url" + t.binary "xml", limit: 16777215 + t.string "agency", limit: 191, default: "DataCite" + t.json "landing_page" t.index ["aasm_state"], name: "index_dataset_on_aasm_state" t.index ["created", "indexed", "updated"], name: "index_dataset_on_created_indexed_updated" t.index ["datacentre"], name: "FK5605B47847B5F5FF" diff --git a/docker-compose.yml b/docker-compose.yml index f4543c10d..edd338905 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -5,6 +5,7 @@ services: env_file: .env environment: - ELASTIC_PASSWORD=changeme + build: . image: datacite/lupo ports: - "8065:80" @@ -45,6 +46,8 @@ services: ES_JAVA_OPTS: -Xmx256m -Xms256m ELASTIC_PASSWORD: changeme xpack.security.enabled: "false" + http.cors.enabled: "true" + http.cors.allow-origin: "*" networks: - public healthcheck: diff --git a/lib/tasks/doi.rake b/lib/tasks/doi.rake index a5748b394..fe0658fc4 100644 --- a/lib/tasks/doi.rake +++ b/lib/tasks/doi.rake @@ -6,6 +6,27 @@ namespace :doi do puts response end + desc 'Import all DOIs' + task :import_all => :environment do + if ENV['YEAR'].present? + from_date = "#{ENV['YEAR']}-01-01" + until_date = "#{ENV['YEAR']}-12-31" + else + from_date = ENV['FROM_DATE'] || Date.current.strftime("%F") + until_date = ENV['UNTIL_DATE'] || Date.current.strftime("%F") + end + + Doi.import_all(from_date: from_date, until_date: until_date) + end + + desc 'Import DOIs per day' + task :import_by_day => :environment do + from_date = ENV['FROM_DATE'] || Date.current.strftime("%F") + + Doi.import_by_day(from_date: from_date) + puts "DOIs created on #{from_date} imported." + end + desc 'Index all DOIs' task :index => :environment do if ENV['YEAR'].present? @@ -16,7 +37,9 @@ namespace :doi do until_date = ENV['UNTIL_DATE'] || Date.current.strftime("%F") end - Doi.index(from_date: from_date, until_date: until_date) + index_time = Time.zone.now.utc.iso8601 + + Doi.index(from_date: from_date, until_date: until_date, index_time: index_time) end desc 'Index DOIs per day' @@ -50,4 +73,9 @@ namespace :doi do from_date = ENV['FROM_DATE'] || Time.zone.now - 1.month Doi.delete_test_dois(from_date: from_date) end + + desc 'Migrates landing page data handling camelCase changes at same time' + task :migrate_landing_page => :environment do + Doi.migrate_landing_page + end end diff --git a/lib/xml_schema_validator.rb b/lib/xml_schema_validator.rb new file mode 100644 index 000000000..37272c68f --- /dev/null +++ b/lib/xml_schema_validator.rb @@ -0,0 +1,54 @@ +class XmlSchemaValidator < ActiveModel::EachValidator + # mapping of DataCite schema properties to database fields + def schema_attributes(el) + schema = { + "date" => "dates", + "publicationYear" => "publication_year", + "alternateIdentifiers" => "identifiers", + "relatedIdentifiers" => "related_identifiers", + "geoLocations" => "geo_locations", + "rightsList" => "rights_list", + "fundingReferences" => "funding_references", + "version" => "version_info", + "resource" => "xml" + } + + schema[el] || el + end + + def get_valid_kernel(sv) + kernels = { + "http://datacite.org/schema/kernel-2.1" => "kernel-2.1", + "http://datacite.org/schema/kernel-2.2" => "kernel-2.2", + "http://datacite.org/schema/kernel-3.0" => "kernel-3", + "http://datacite.org/schema/kernel-3.1" => "kernel-3", + "http://datacite.org/schema/kernel-3" => "kernel-3", + "http://datacite.org/schema/kernel-4.0" => "kernel-4", + "http://datacite.org/schema/kernel-4.1" => "kernel-4", + "http://datacite.org/schema/kernel-4" => "kernel-4" + } + + kernels[sv] + end + + def validate_each(record, attribute, value) + kernel = get_valid_kernel(record.schema_version) + return false unless kernel.present? + + filepath = Bundler.rubygems.find_name('bolognese').first.full_gem_path + "/resources/#{kernel}/metadata.xsd" + schema = Nokogiri::XML::Schema(open(filepath)) + + schema.validate(Nokogiri::XML(value, nil, 'UTF-8')).reduce({}) do |sum, error| + location, level, source, text = error.message.split(": ", 4) + line, column = location.split(":", 2) + title = text.to_s.strip + " at line #{line}, column #{column}" if line.present? + source = source.split("}").last[0..-2] if line.present? + source = schema_attributes(source) if source.present? + record.errors[source.to_sym] << title + end + rescue Nokogiri::XML::SyntaxError => e + line, column, level, text = e.message.split(":", 4) + message = text.strip + " at line #{line}, column #{column}" + record.errors[:xml] << message + end +end diff --git a/public/.keep b/public/.keep new file mode 100644 index 000000000..e69de29bb diff --git a/public/robots.txt b/public/robots.txt deleted file mode 100644 index 37b576a4a..000000000 --- a/public/robots.txt +++ /dev/null @@ -1 +0,0 @@ -# See http://www.robotstxt.org/robotstxt.html for documentation on how to use the robots.txt file diff --git a/spec/concerns/crosscitable_spec.rb b/spec/concerns/crosscitable_spec.rb index e0c5ac570..6ef5d94de 100644 --- a/spec/concerns/crosscitable_spec.rb +++ b/spec/concerns/crosscitable_spec.rb @@ -1,123 +1,429 @@ require 'rails_helper' describe Doi, vcr: true do - subject { create(:doi) } + let(:xml) { file_fixture('datacite.xml').read } + + subject { DoisController.new } context "from_xml" do it "from_xml" do string = file_fixture('datacite.xml').read - expect(subject.from_xml(string)).to be_nil - expect(subject.errors).to be_empty + expect(subject.from_xml(string)).to eq(string) end it "from_xml malformed" do string = file_fixture('datacite_malformed.xml').read - expect(subject.from_xml(string)).to eq(string) - expect(subject.errors.messages).to eq(xml: ["Premature end of data in tag resource line 2 at line 40, column 1"]) + expect { subject.from_xml(string) }.to raise_error(Nokogiri::XML::SyntaxError, "40:1: FATAL: Premature end of data in tag resource line 2") end end context "from_json" do it "from_json" do string = file_fixture('citeproc.json').read - expect(subject.from_json(string)).to be_nil - expect(subject.errors).to be_empty + expect(subject.from_json(string)).to eq(string) + end + + it "from_json starts with unexpected character" do + string = file_fixture('datacite.xml').read + expect { subject.from_json(string) }.to raise_error(JSON::ParserError, "unexpected character at line 1, column 1 [parse.c:671]") end it "from_json malformed" do string = file_fixture('citeproc_malformed.json').read - expect(subject.from_json(string)).to eq(string) - expect(subject.errors.messages).to eq(xml: ["Expected comma, not a string at line 4, column 9 [parse.c:381]"]) + expect { subject.from_json(string) }.to raise_error(JSON::ParserError, "expected comma, not a string at line 4, column 9 [parse.c:381]") end it "from_json duplicate keys" do string = file_fixture('citeproc_duplicate_keys.json').read - expect(subject.from_json(string)).to eq(string) - expect(subject.errors.messages).to eq(xml: ["The same key is defined more than once: id"]) + expect { subject.from_json(string) }.to raise_error(JSON::ParserError, "The same key is defined more than once: id") end end context "well_formed_xml" do it "from_xml" do - string = Base64.strict_encode64(file_fixture('datacite.xml').read) - expect(subject.well_formed_xml(string)).to eq(Base64.decode64(string)) - expect(subject.errors).to be_empty + string = file_fixture('datacite.xml').read + expect(subject.well_formed_xml(string)).to eq(string) end it "from_xml malformed" do - string = Base64.strict_encode64(file_fixture('datacite_malformed.xml').read) - expect(subject.well_formed_xml(string)).to eq(Base64.decode64(string)) - expect(subject.errors.messages).to eq(xml: ["Premature end of data in tag resource line 2 at line 40, column 1"]) + string = file_fixture('datacite_malformed.xml').read + expect { subject.well_formed_xml(string) }.to raise_error(Nokogiri::XML::SyntaxError, "40:1: FATAL: Premature end of data in tag resource line 2") end it "from_json" do - string = Base64.strict_encode64(file_fixture('citeproc.json').read) - expect(subject.well_formed_xml(string)).to eq(Base64.decode64(string)) - expect(subject.errors).to be_empty + string = file_fixture('citeproc.json').read + expect(subject.well_formed_xml(string)).to eq(string) + end + + it "from_json starts with unexpected character" do + string = 'abc' + expect { subject.well_formed_xml(string) }.to raise_error(JSON::ParserError, "unexpected character at line 1, column 1 [parse.c:671]") end it "from_json malformed" do - string = Base64.strict_encode64(file_fixture('citeproc_malformed.json').read) - expect(subject.well_formed_xml(string)).to eq(Base64.decode64(string)) - expect(subject.errors.messages).to eq(xml: ["Expected comma, not a string at line 4, column 9 [parse.c:381]"]) + string = file_fixture('citeproc_malformed.json').read + expect { subject.well_formed_xml(string) }.to raise_error(JSON::ParserError, "expected comma, not a string at line 4, column 9 [parse.c:381]") end it "from_json duplicate keys" do - string = Base64.strict_encode64(file_fixture('citeproc_duplicate_keys.json').read) - expect(subject.well_formed_xml(string)).to eq(Base64.decode64(string)) - expect(subject.errors.messages).to eq(xml: ["The same key is defined more than once: id"]) + string = file_fixture('citeproc_duplicate_keys.json').read + expect { subject.well_formed_xml(string) }.to raise_error(JSON::ParserError, "The same key is defined more than once: id") end end - context "get attributes" do - it "author" do - expect(subject.author).to eq("name"=>"D S") + context "get_content_type" do + it "datacite" do + string = file_fixture('datacite.xml').read + expect(subject.get_content_type(string)).to eq("xml") + end + + it "crossref" do + string = file_fixture('crossref.xml').read + expect(subject.get_content_type(string)).to eq("xml") + end + + it "crosscite" do + string = file_fixture('crosscite.json').read + expect(subject.get_content_type(string)).to eq("json") + end + + it "schema_org" do + string = file_fixture('schema_org.json').read + expect(subject.get_content_type(string)).to eq("json") + end + + it "codemeta" do + string = file_fixture('codemeta.json').read + expect(subject.get_content_type(string)).to eq("json") + end + + it "datacite_json" do + string = file_fixture('datacite.json').read + expect(subject.get_content_type(string)).to eq("json") + end + + it "bibtex" do + string = file_fixture('crossref.bib').read + expect(subject.get_content_type(string)).to eq("string") + end + + it "ris" do + string = file_fixture('crossref.ris').read + expect(subject.get_content_type(string)).to eq("string") + end + end + + context "parse_xml" do + it "from schema 4" do + string = file_fixture('datacite.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("datacite") + expect(meta["doi"]).to eq("10.14454/4k3m-nyvg") + expect(meta["creators"]).to eq([{"familyName"=>"Fenner", "givenName"=>"Martin","name"=>"Fenner, Martin", + "nameIdentifiers"=> + [{"nameIdentifier"=>"https://orcid.org/0000-0003-1419-2405", + "nameIdentifierScheme"=>"ORCID"}], + "nameType"=>"Personal"}]) + expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("DataCite") + end + + it "from schema 3" do + string = file_fixture('datacite_schema_3.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("datacite") + expect(meta["doi"]).to eq("10.5061/dryad.8515") + expect(meta["creators"].length).to eq(8) + expect(meta["creators"].first).to eq("familyName"=>"Ollomo", "givenName"=>"Benjamin", "name"=>"Ollomo, Benjamin", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) + expect(meta["publication_year"]).to eq("2011") + expect(meta["publisher"]).to eq("Dryad Digital Repository") + end + + it "from schema 2.2" do + string = file_fixture('datacite_schema_2.2.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("datacite") + expect(meta["doi"]).to eq("10.5072/testpub") + expect(meta["creators"]).to eq([{"familyName"=>"Smith", "givenName"=>"John", "name"=>"Smith, John", "nameType"=>"Personal"}, {"name"=>"つまらないものですが"}]) + expect(meta["titles"]).to eq([{"title"=>"Właściwości rzutowań podprzestrzeniowych"}, {"title"=>"Translation of Polish titles", "titleType"=>"TranslatedTitle"}]) + expect(meta["publication_year"]).to eq("2010") + expect(meta["publisher"]).to eq("Springer") end - it "title" do - expect(subject.title).to eq("Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]") + it "from schema 4 missing creators" do + string = file_fixture('datacite_missing_creator.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("datacite") + expect(meta["doi"]).to eq("10.5438/4k3m-nyvg") + expect(meta["creators"]).to be_empty + expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("DataCite") end - it "publisher" do - expect(subject.publisher).to eq("F1000 Research Limited") + it "from namespaced xml" do + string = file_fixture('ns0.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("datacite") + # TODO + # expect(meta["doi"]).to eq("10.5438/4k3m-nyvg") + # expect(meta["creators"]).to be_empty + # expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + # expect(meta["publication_year"]).to eq("2016") + # expect(meta["publisher"]).to eq("DataCite") end - it "date_published" do - expect(subject.date_published).to eq("2017") + it "from crossref" do + string = file_fixture('crossref.xml').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("crossref") + expect(meta["doi"]).to eq("10.1371/journal.pone.0000030") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Ralser", "givenName"=>"Markus", "name"=>"Ralser, Markus", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes"}]) + expect(meta["publication_year"]).to eq("2006") + expect(meta["publisher"]).to eq("(:unav)") + expect(meta["container"]).to eq("firstPage"=>"e30", "identifier"=>"1932-6203", "identifierType"=>"ISSN", "issue"=>"1", "title"=>"PLoS ONE", "type"=>"Journal", "volume"=>"1") end - it "resource_type_general" do - expect(subject.resource_type_general).to eq("Text") + it "from crossref url" do + string = "https://doi.org/10.7554/elife.01567" + meta = subject.parse_xml(string) + + expect(meta["from"]).to eq("crossref") + expect(meta["doi"]).to eq("10.7554/elife.01567") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Sankar", "givenName"=>"Martial", "name"=>"Sankar, Martial", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("(:unav)") + expect(meta["container"]).to eq("identifier"=>"2050-084X", "identifierType"=>"ISSN", "title"=>"eLife", "type"=>"Journal", "volume"=>"3") + expect(meta["agency"]).to eq("Crossref") + end + + it "from datacite url" do + string = "https://doi.org/10.7272/q6g15xs4" + meta = subject.parse_xml(string) + + expect(meta["from"]).to eq("datacite") + expect(meta["doi"]).to eq("10.7272/q6g15xs4") + expect(meta["creators"].length).to eq(2) + expect(meta["creators"].first).to eq("affiliation"=>"UC San Francisco", "familyName"=>"Rodriguez", "givenName"=>"Robert", "name"=>"Rodriguez, Robert", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"NEXUS Head CT"}]) + expect(meta["publication_year"]).to eq("2017") + expect(meta["publisher"]).to eq("UC San Francisco") + expect(meta["agency"]).to eq("DataCite") + end + + it "from bibtex" do + string = file_fixture('crossref.bib').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("bibtex") + expect(meta["doi"]).to eq("10.7554/elife.01567") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Sankar", "givenName"=>"Martial", "name"=>"Sankar, Martial", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("{eLife} Sciences Organisation, Ltd.") + expect(meta["container"]).to eq("identifier"=>"2050-084X", "identifierType"=>"ISSN", "title"=>"eLife", "type"=>"Journal", "volume"=>"3") + end + + it "from ris" do + string = file_fixture('crossref.ris').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("ris") + expect(meta["doi"]).to eq("10.7554/elife.01567") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Sankar", "givenName"=>"Martial", "name"=>"Sankar, Martial", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("(:unav)") + expect(meta["container"]).to eq("title"=>"eLife", "type"=>"Journal", "volume"=>"3") + end + + it "from codemeta" do + string = file_fixture('codemeta.json').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("codemeta") + expect(meta["doi"]).to eq("10.5063/f1m61h5x") + expect(meta["creators"].length).to eq(3) + expect(meta["creators"].first).to eq("affiliation" => "NCEAS", + "familyName" => "Jones", + "givenName" => "Matt", + "name" => "Jones, Matt", + "nameIdentifiers" => [{"nameIdentifier"=>"https://orcid.org/0000-0003-0077-4738", "nameIdentifierScheme"=>"ORCID"}], + "nameType" => "Personal") + expect(meta["titles"]).to eq([{"title"=>"R Interface to the DataONE REST API"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("https://cran.r-project.org") + end + + it "from schema_org" do + string = file_fixture('schema_org.json').read + meta = subject.parse_xml(string) + + expect(meta["string"]).to eq(string) + expect(meta["from"]).to eq("schema_org") + expect(meta["doi"]).to eq("10.5438/4k3m-nyvg") + expect(meta["creators"].length).to eq(1) + expect(meta["creators"].first).to eq("familyName"=>"Fenner", "givenName"=>"Martin", "name" => "Fenner, Martin", + "nameIdentifiers" => [{"nameIdentifier"=>"https://orcid.org/0000-0003-1419-2405", "nameIdentifierScheme"=>"ORCID"}], + "nameType" => "Personal") + expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("DataCite") + end + + it "from schema_org url" do + string = "https://doi.pangaea.de/10.1594/PANGAEA.836178" + meta = subject.parse_xml(string) + + expect(meta["string"]).to start_with("{\"@context\":\"http://schema.org") + expect(meta["from"]).to eq("schema_org") + expect(meta["doi"]).to eq("10.1594/pangaea.836178") + expect(meta["creators"].length).to eq(8) + expect(meta["creators"].first).to eq("familyName"=>"Johansson", "givenName"=>"Emma", "name"=>"Johansson, Emma", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("PANGAEA") end end - context "set attributes" do - it "author" do - author = { "name" => "Carberry, Josiah"} - subject.author = author - expect(subject.author).to eq(author) + context "update_xml" do + it "from schema 4" do + string = file_fixture('datacite.xml').read + subject = create(:doi, xml: string) + + # TODO + # expect(subject.doi).to eq("10.14454/4k3m-nyvg") + # expect(subject.creators).to eq([{"familyName"=>"Fenner", "givenName"=>"Martin", "id"=>"https://orcid.org/0000-0003-1419-2405", "name"=>"Fenner, Martin", "type"=>"Person"}]) + # expect(subject.titles).to eq([{"title"=>"Eating your own Dog Food"}]) + # expect(subject.publication).to eq("2016") + # expect(meta["publisher"]).to eq("DataCite") + end + + it "from schema 3" do + string = file_fixture('datacite_schema_3.xml').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.5061/dryad.8515") + expect(meta["creators"].length).to eq(8) + expect(meta["creators"].first).to eq("familyName"=>"Ollomo", "givenName"=>"Benjamin", "name"=>"Ollomo, Benjamin", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) + expect(meta["publication_year"]).to eq("2011") + expect(meta["publisher"]).to eq("Dryad Digital Repository") + end + + it "from schema 2.2" do + string = file_fixture('datacite_schema_2.2.xml').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.5072/testpub") + expect(meta["creators"]).to eq([{"familyName"=>"Smith", "givenName"=>"John", "name"=>"Smith, John", "nameType"=>"Personal"}, {"name"=>"つまらないものですが"}]) + expect(meta["titles"]).to eq([{"title"=>"Właściwości rzutowań podprzestrzeniowych"}, {"title"=>"Translation of Polish titles", "titleType"=>"TranslatedTitle"}]) + expect(meta["publication_year"]).to eq("2010") + expect(meta["publisher"]).to eq("Springer") end - it "title" do - title = "Referee report." - subject.title = title - expect(subject.title).to eq(title) + it "from schema 4 missing creators" do + string = file_fixture('datacite_missing_creator.xml').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.5438/4k3m-nyvg") + expect(meta["creators"]).to be_empty + expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("DataCite") + end + + it "from crossref" do + string = file_fixture('crossref.xml').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.1371/journal.pone.0000030") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Ralser", "givenName"=>"Markus", "name"=>"Ralser, Markus", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes"}]) + expect(meta["publication_year"]).to eq("2006") + expect(meta["publisher"]).to eq("(:unav)") + expect(meta["container"]).to eq("firstPage"=>"e30", "identifier"=>"1932-6203", "identifierType"=>"ISSN", "issue"=>"1", "title"=>"PLoS ONE", "type"=>"Journal", "volume"=>"1") + end + + it "from bibtex" do + string = file_fixture('crossref.bib').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.7554/elife.01567") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Sankar", "givenName"=>"Martial", "name"=>"Sankar, Martial", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("{eLife} Sciences Organisation, Ltd.") + expect(meta["container"]).to eq("identifier"=>"2050-084X", "identifierType"=>"ISSN", "title"=>"eLife", "type"=>"Journal", "volume"=>"3") end - it "publisher" do - publisher = "Zenodo" - subject.publisher = publisher - expect(subject.publisher).to eq(publisher) + it "from ris" do + string = file_fixture('crossref.ris').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.7554/elife.01567") + expect(meta["creators"].length).to eq(5) + expect(meta["creators"].first).to eq("familyName"=>"Sankar", "givenName"=>"Martial", "name"=>"Sankar, Martial", "nameType"=>"Personal") + expect(meta["titles"]).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(meta["publication_year"]).to eq("2014") + expect(meta["publisher"]).to eq("(:unav)") + expect(meta["container"]).to eq("title"=>"eLife", "type"=>"Journal", "volume"=>"3") end - it "date_published" do - expect(subject.date_published).to eq("2017") + it "from codemeta" do + string = file_fixture('codemeta.json').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.5063/f1m61h5x") + expect(meta["creators"].length).to eq(3) + expect(meta["creators"].first).to eq("affiliation" => "NCEAS", + "familyName" => "Jones", + "givenName" => "Matt", + "name" => "Jones, Matt", + "nameIdentifiers" => [{"nameIdentifier"=>"https://orcid.org/0000-0003-0077-4738", "nameIdentifierScheme"=>"ORCID"}], + "nameType" => "Personal") + expect(meta["titles"]).to eq([{"title"=>"R Interface to the DataONE REST API"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("https://cran.r-project.org") end - it "resource_type_general" do - resource_type_general = "Software" - subject.resource_type_general = resource_type_general - expect(subject.resource_type_general).to eq(resource_type_general) + it "from schema_org" do + string = file_fixture('schema_org.json').read + meta = subject.parse_xml(string) + + expect(meta["doi"]).to eq("10.5438/4k3m-nyvg") + expect(meta["creators"].length).to eq(1) + expect(meta["creators"].first).to eq("familyName"=>"Fenner", "givenName"=>"Martin", "name" => "Fenner, Martin", + "nameIdentifiers" => [{"nameIdentifier"=>"https://orcid.org/0000-0003-1419-2405", "nameIdentifierScheme"=>"ORCID"}], + "nameType" => "Personal") + expect(meta["titles"]).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(meta["publication_year"]).to eq("2016") + expect(meta["publisher"]).to eq("DataCite") end end end diff --git a/spec/factories/default.rb b/spec/factories/default.rb index c096458be..11d3bb357 100644 --- a/spec/factories/default.rb +++ b/spec/factories/default.rb @@ -26,9 +26,146 @@ doi { ("10.14454/" + Faker::Internet.password(8)).downcase } url { Faker::Internet.url } - is_active { true } - xml { "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiIHN0YW5kYWxvbmU9InllcyI/PjxyZXNvdXJjZSB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC0zIGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTMvbWV0YWRhdGEueHNkIiB4bWxucz0iaHR0cDovL2RhdGFjaXRlLm9yZy9zY2hlbWEva2VybmVsLTMiIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiPjxpZGVudGlmaWVyIGlkZW50aWZpZXJUeXBlPSJET0kiPjEwLjUyNTYvZjEwMDByZXNlYXJjaC44NTcwLnI2NDIwPC9pZGVudGlmaWVyPjxjcmVhdG9ycz48Y3JlYXRvcj48Y3JlYXRvck5hbWU+ZCBzPC9jcmVhdG9yTmFtZT48L2NyZWF0b3I+PC9jcmVhdG9ycz48dGl0bGVzPjx0aXRsZT5SZWZlcmVlIHJlcG9ydC4gRm9yOiBSRVNFQVJDSC0zNDgyIFt2ZXJzaW9uIDU7IHJlZmVyZWVzOiAxIGFwcHJvdmVkLCAxIGFwcHJvdmVkIHdpdGggcmVzZXJ2YXRpb25zXTwvdGl0bGU+PC90aXRsZXM+PHB1Ymxpc2hlcj5GMTAwMCBSZXNlYXJjaCBMaW1pdGVkPC9wdWJsaXNoZXI+PHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+PHJlc291cmNlVHlwZSByZXNvdXJjZVR5cGVHZW5lcmFsPSJUZXh0Ii8+PC9yZXNvdXJjZT4=" } - aasm_state { "draft" } + types { { + "resourceTypeGeneral": "Dataset", + "resourceType": "DataPackage", + "schemaOrg": "Dataset", + "citeproc": "dataset", + "bibtex": "misc", + "ris": "DATA" + }} + creators { [ + { + "type": "Person", + "name": "Benjamin Ollomo", + "givenName": "Benjamin", + "familyName": "Ollomo" + }, + { + "type": "Person", + "name": "Patrick Durand", + "givenName": "Patrick", + "familyName": "Durand" + }, + { + "type": "Person", + "name": "Franck Prugnolle", + "givenName": "Franck", + "familyName": "Prugnolle" + }, + { + "type": "Person", + "name": "Emmanuel J. P. Douzery", + "givenName": "Emmanuel J. P.", + "familyName": "Douzery" + }, + { + "type": "Person", + "name": "Céline Arnathau", + "givenName": "Céline", + "familyName": "Arnathau" + }, + { + "type": "Person", + "name": "Dieudonné Nkoghe", + "givenName": "Dieudonné", + "familyName": "Nkoghe" + }, + { + "type": "Person", + "name": "Eric Leroy", + "givenName": "Eric", + "familyName": "Leroy" + }, + { + "type": "Person", + "name": "François Renaud", + "givenName": "François", + "familyName": "Renaud" + } + ] } + titles {[ + { + "title": "Data from: A new malaria agent in African hominids." + }] } + publisher {"Dryad Digital Repository" } + subjects {[ + { + "subject": "Phylogeny" + }, + { + "subject": "Malaria" + }, + { + "subject": "Parasites" + }, + { + "subject": "Taxonomy" + }, + { + "subject": "Mitochondrial genome" + }, + { + "subject": "Africa" + }, + { + "subject": "Plasmodium" + } + ]} + dates { [ + { + "date": "2011", + "dateType": "Issued" + } + ]} + publication_year { 2011 } + identifiers { [ + { + "identifierType": "citation", + "identifier": "Ollomo B, Durand P, Prugnolle F, Douzery EJP, Arnathau C, Nkoghe D, Leroy E, Renaud F (2009) A new malaria agent in African hominids. PLoS Pathogens 5(5): e1000446." + } + ]} + version { "1" } + rights_list {[ + { + "rightsUri": "http://creativecommons.org/publicdomain/zero/1.0" + } + ]} + related_identifiers {[ + { + "relatedIdentifier": "10.5061/dryad.8515/1", + "relatedIdentifierType": "DOI", + "relationType": "HasPart" + }, + { + "relatedIdentifier": "10.5061/dryad.8515/2", + "relatedIdentifierType": "DOI", + "relationType": "HasPart" + }, + { + "relatedIdentifier": "10.1371/journal.ppat.1000446", + "relatedIdentifierType": "DOI", + "relationType": "IsReferencedBy" + }, + { + "relatedIdentifier": "10.1371/journal.ppat.1000446", + "relatedIdentifierType": "DOI", + "relationType": "IsSupplementTo" + }, + { + "relatedIdentifier": "19478877", + "relatedIdentifierType": "PMID", + "relationType": "IsReferencedBy" + }, + { + "relatedIdentifier": "19478877", + "relatedIdentifierType": "PMID", + "relationType": "IsSupplementTo" + } + ]} + schema_version { "http://datacite.org/schema/kernel-4" } + source { "test" } + regenerate { true } created { Faker::Time.backward(14, :evening) } minted { Faker::Time.backward(15, :evening) } updated { Faker::Time.backward(5, :evening) } diff --git a/spec/fixtures/files/crosscite.json b/spec/fixtures/files/crosscite.json index e724fd3f2..7447ae152 100644 --- a/spec/fixtures/files/crosscite.json +++ b/spec/fixtures/files/crosscite.json @@ -1,39 +1,62 @@ { "id": "https://doi.org/10.5281/zenodo.48440", "doi": "10.5281/zenodo.48440", - "type": "SoftwareSourceCode", - "additional_type": "Software", - "citeproc_type": "other", - "bibtex_type": "misc", - "ris_type": "COMP", - "resource_type_general": "Software", - "resource_type": "Software", - "author": { + "types":{ + "resourceTypeGeneral": "Software", + "resourceType": "Software", + "schemaOrg": "SoftwareSourceCode", + "citeproc": "other", + "bibtex": "misc", + "ris": "COMP" + }, + "creators": [{ "type": "Person", "name": "Kristian Garza", "givenName": "Kristian", "familyName": "Garza" - }, - "title": "Analysis Tools for Crossover Experiment of UI using Choice Architecture", + }], + "titles": [{ + "title": "Analysis Tools for Crossover Experiment of UI using Choice Architecture" + }], "publisher": "Zenodo", - "keywords": ["choice architecture", "crossover experiment", "hci"], - "date_published": "2016-03-27", - "alternate_name": { - "type": "URL", - "name": "http://zenodo.org/record/48440" + "subjects": [ + { + "subject": "choice architecture" + }, + { + "subject": "crossover experiment" + }, + { + "subject": "hci" + } + ], + "dates": { + "date": "2016-03-27", + "dateType": "Issued" }, - "license": [{ - "name": "Open Access" + "publication_year": "2016", + "identifiers": [ + { + "identifierType": "URL", + "identifier": "http://zenodo.org/record/48440" + }, + { + "identifierType": "DOI", + "identifier": "https://doi.org/10.5281/zenodo.48440" + } + ], + "rights_list": [{ + "rights": "Open Access" }, { - "id": "https://creativecommons.org/licenses/by-nc-sa/4.0", - "name": "Creative Commons Attribution-NonCommercial-ShareAlike" + "rightsUri": "https://creativecommons.org/licenses/by-nc-sa/4.0", + "rights": "Creative Commons Attribution-NonCommercial-ShareAlike" } ], - "description": { - "type": "Abstract", - "text": "This tools are used to analyse the data produced by the Crosssover Experiment I designed to test Choice Architecture techniques as UI interventions in a SEEk4Science data catalogue. It contains:\n\n- Data structures for the experimental data.
\n- Visualisation functions
\n- Analysis functions\n\n## Installation\n\n- R
\n- python
\n- ipython 4\n\nClone and use.\n\n## Usage\n\n
\n```python
\nsource('parallel_plot.r')
\nwith(z, parallelset(trt,response, freq=count, alpha=0.2))
\n```\n\n
\n## Contributing\n\n1. Fork it!
\n2. Create your feature branch: `git checkout -b my-new-feature`
\n3. Commit your changes: `git commit -am 'Add some feature'`
\n4. Push to the branch: `git push origin my-new-feature`
\n5. Submit a pull request :D\n\n
\n## License\n\nThis work supports my PhD Thesis at University of Manchester." - }, + "descriptions": [{ + "descriptionType": "Abstract", + "description": "This tools are used to analyse the data produced by the Crosssover Experiment I designed to test Choice Architecture techniques as UI interventions in a SEEk4Science data catalogue. It contains:\n\n- Data structures for the experimental data.
\n- Visualisation functions
\n- Analysis functions\n\n## Installation\n\n- R
\n- python
\n- ipython 4\n\nClone and use.\n\n## Usage\n\n
\n```python
\nsource('parallel_plot.r')
\nwith(z, parallelset(trt,response, freq=count, alpha=0.2))
\n```\n\n
\n## Contributing\n\n1. Fork it!
\n2. Create your feature branch: `git checkout -b my-new-feature`
\n3. Commit your changes: `git commit -am 'Add some feature'`
\n4. Push to the branch: `git push origin my-new-feature`
\n5. Submit a pull request :D\n\n
\n## License\n\nThis work supports my PhD Thesis at University of Manchester." + }], "schema_version": "http://datacite.org/schema/kernel-4", "provider": "DataCite", "state": "findable" diff --git a/spec/fixtures/files/datacite.json b/spec/fixtures/files/datacite.json new file mode 100644 index 000000000..cd97f822b --- /dev/null +++ b/spec/fixtures/files/datacite.json @@ -0,0 +1,79 @@ +{ + "id": "https://doi.org/10.5438/4k3m-nyvg", + "types": { + "resourceTypeGeneral": "Text", + "resourceType": "BlogPosting", + "schemaOrg": "ScholarlyArticle", + "citeproc": "article-journal", + "bibtex": "article", + "ris": "RPRT" + }, + "doi": "10.5438/4K3M-NYVG", + "creators": [{ + "type": "Person", + "id": "http://orcid.org/0000-0003-1419-2405", + "name": "Fenner, Martin", + "givenName": "Martin", + "familyName": "Fenner" + }], + "titles": [{ + "title": "Eating your own Dog Food" + }], + "publisher": "DataCite", + "publicationYear": "2016", + "subjects": [ + { + "subject": "datacite" + }, + { + "subject": "doi" + }, + { + "subject": "metadata" + } + ], + "dates": [ + { + "dateType": "Created", + "date": "2016-12-20" + }, + { + "dateType": "Issued", + "date": "2016-12-20" + }, + { + "dateType": "Updated", + "date": "2016-12-20" + } + ], + "alternateIdentifiers": [ + { + "alternateIdentifierType": "Local accession number", + "alternateIdentifier": "MS-49-3632-5083" + } + ], + "relatedIdentifiers": [ + { + "relatedIdentifier": "10.5438/0000-00ss", + "relatedIdentifierType": "DOI", + "relationType": "IsPartOf" + }, + { + "relatedIdentifier": "10.5438/0012", + "relatedIdentifierType": "DOI", + "relationType": "References" + }, + { + "relatedIdentifier": "10.5438/55e5-t5c0", + "relatedIdentifierType": "DOI", + "relationType": "References" + } + ], + "version": "1.0", + "descriptions": [{ + "descriptionType": "Abstract", + "description": "Eating your own dog food is a slang term to describe that an organization should itself use the products and services it provides. For DataCite this means that we should use DOIs with appropriate metadata and strategies for long-term preservation for..." + }], + "schemaVersion": "http://datacite.org/schema/kernel-4", + "provider": "DataCite" +} diff --git a/spec/fixtures/files/datacite.xml b/spec/fixtures/files/datacite.xml index df0eb65ac..459fe40e2 100644 --- a/spec/fixtures/files/datacite.xml +++ b/spec/fixtures/files/datacite.xml @@ -1,6 +1,6 @@ - 10.5438/4K3M-NYVG + 10.14454/4K3M-NYVG Fenner, Martin @@ -37,4 +37,4 @@ Eating your own dog food is a slang term to describe that an organization should itself use the products and services it provides. For DataCite this means that we should use DOIs with appropriate metadata and strategies for long-term preservation for... - + \ No newline at end of file diff --git a/spec/fixtures/files/datacite_89.json b/spec/fixtures/files/datacite_89.json index 6c348c930..a75d2fd63 100644 --- a/spec/fixtures/files/datacite_89.json +++ b/spec/fixtures/files/datacite_89.json @@ -2,21 +2,9 @@ { "type": "dois", "attributes": { - "doi": "10.24425/119496", + "doi": "10.14454/119496", "xml": "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz48cmVzb3VyY2UgeG1sbnM9Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IiB4bWxuczp4c2k9Imh0dHA6Ly93d3cudzMub3JnLzIwMDEvWE1MU2NoZW1hLWluc3RhbmNlIiB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTQuMS9tZXRhZGF0YS54c2QiPjxpZGVudGlmaWVyIGlkZW50aWZpZXJUeXBlPSJET0kiPjEwLjI0NDI1LzExOTQ5NjwvaWRlbnRpZmllcj48Y3JlYXRvcnM+PGNyZWF0b3I+PGNyZWF0b3JOYW1lPig6dW5hdik8L2NyZWF0b3JOYW1lPjwvY3JlYXRvcj48L2NyZWF0b3JzPjx0aXRsZXM+PHRpdGxlPjMyPC90aXRsZT48L3RpdGxlcz48cHVibGlzaGVyPkNvbW1pdHRlZSBmb3IgUHN5Y2hvbG9naWNhbCBTY2llbmNlIFBBUzwvcHVibGlzaGVyPjxwdWJsaWNhdGlvblllYXI+MjAxODwvcHVibGljYXRpb25ZZWFyPjxyZXNvdXJjZVR5cGUgcmVzb3VyY2VUeXBlR2VuZXJhbD0iVGV4dCI+QXJ0eWt1xYI8L3Jlc291cmNlVHlwZT48ZGF0ZXM+PGRhdGUgZGF0ZVR5cGU9Iklzc3VlZCI+MjAxODwvZGF0ZT48L2RhdGVzPjwvcmVzb3VyY2U+", - "validate": "true" - }, - "relationships": { - "client": { - "data": { - "type": "clients", - "id": "PSNC.PAN-CC" - } - } + "event": "register" } - }, - "controller": "dois", - "action": "update", - "id": "10.24425/119496", - "format": "jsonapi" + } } \ No newline at end of file diff --git a/spec/fixtures/files/datacite_f1000.xml b/spec/fixtures/files/datacite_f1000.xml new file mode 100644 index 000000000..cf83f9c4d --- /dev/null +++ b/spec/fixtures/files/datacite_f1000.xml @@ -0,0 +1 @@ +10.5256/f1000research.8570.r6420d sReferee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]F1000 Research Limited2017 \ No newline at end of file diff --git a/spec/fixtures/files/datacite_with_whitespace.xml b/spec/fixtures/files/datacite_with_whitespace.xml new file mode 100644 index 000000000..7718668e7 --- /dev/null +++ b/spec/fixtures/files/datacite_with_whitespace.xml @@ -0,0 +1,133 @@ + + + 10.20387/BONARES-R0P3-X8GN + + + Schucknecht, Anne + Anne + Schucknecht + Karlsruhe Institute für Technologie, Institut für Meteorologie und Klimafor-schung, IMK-IFU, Garmisch-Partenkirchen, Deutschland + + + Schneider, Katrin + Katrin + Schneider + Karlsruhe Institute für Technologie, Institut für Meteorologie und Klimafor-schung, IMK-IFU, Garmisch-Partenkirchen, Deutschland + + + Kiese, Ralf + Ralf + Kiese + Karlsruhe Institute für Technologie, Institut für Meteorologie und Klimafor-schung, IMK-IFU, Garmisch-Partenkirchen, Deutschland + + + Wiesmeier, Martin + Martin + Wiesmeier + Technische Universität München, Lehrstuhl für Bodenkunde, Freising, Deutschland; Bayrische Landesanstalt für Landwirtschaft, Institut für Ökologischen Landbau, Bodenkultur und Ressourcenschutz, Freising, Deutschland + + + Schloter, Michael + Michael + Schloter + Technische Universität München, Lehrstuhl für Bodenkunde, Freising, Deutschland; Helmholtz Zentrum München, Abteilung für vergleichende Mikrobiom-analysen, Neuherberg, Deutschland + + + Jentsch, Anke + Anke + Jentsch + Universität Bayreuth, Professur für Störungsökologie, Bayreuth, Deutschland + + + Köllner, Thomas + Thomas + Köllner + Universität Bayreuth, Professur für ökologische Dienstleistungen, Bayreuth, Deutschland + + + Dannenmann, Michael + Michael + Dannenmann + Karlsruher Institut für Technologie (KIT) – Campus Alpin Institut für Meteorologie und Klimaforschung, Atmosphärische Umweltforschung (IMK-IFU) + + + + SUSALPS Conference 2018 – Book of Abstracts: Montane and alpine grasslands under climate change – ways in a sustainable future + + BonaRes Centre for Soil Research + 2018 + + BonaRes + montane and alpine grasslands + soil organic matter + microbiome + plant diversity and productivity + biogeochemical cycles + remote sensing + ecosystem services + alpine farming + + + + Kiese, Ralf + Ralf + Kiese + Karlsruhe Institute für Technologie, Institut für Meteorologie und Klimafor-schung, IMK-IFU, Garmisch-Partenkirchen, Deutschland + + + + + + +2018-11-23 + + en + Document + + 1270 + + + PDF + + + Creative Commons Attribution 4.0 International + + + +From 18 to 20 September 2018, the SUSALPS Conference "Montane and alpine grasslands under climate change – ways in a sustainable future" was held in Garmisch-Partenkirchen, Germany. More than 60 participants from nine nations attended the conference. The event covered a broad scope and offered the opportunity to discuss both fundamental research and practical approaches in grassland management. At the conference's closing day, ex-cursions took place to the SUSALPS experimental areas in Fendt and on the Brunnenkopfalm. This publication provides the abstracts of all oral and poster presentations. + + + + German Federal Ministry of Education and Research + https://doi.org/10.13039/501100002347 + 031B0027A + Sustainable use of alpine and pre-alpine grassland soils in a changing climate - Subproject A + + + Federal Ministry of Education and Research + https://doi.org/10.13039/501100002347 + 031B0027B + Sustainable use of alpine and pre-alpine grassland soils in a changing climate - Subproject B + + + Federal Ministry of Education and Research + https://doi.org/10.13039/501100002347 + 031B0027C + Sustainable use of alpine and pre-alpine grassland soils in a changing climate - Subproject C + + + Federal Ministry of Education and Research + https://doi.org/10.13039/501100002347 + 031B0027D + Sustainable use of alpine and pre-alpine grassland soils in a changing climate - Subproject D + + + Federal Ministry of Education and Research + https://doi.org/10.13039/501100002347 + 031B0027E + Sustainable use of alpine and pre-alpine grassland soils in a changing climate - Subproject E + + + \ No newline at end of file diff --git a/spec/fixtures/files/schema_org_topmed.json b/spec/fixtures/files/schema_org_topmed.json index cfa6feb27..603cf85de 100644 --- a/spec/fixtures/files/schema_org_topmed.json +++ b/spec/fixtures/files/schema_org_topmed.json @@ -42,7 +42,7 @@ "@type": "Dataset", "@id": "https://doi.org/10.23725/2g4s-qv04" }, - "funding": { + "funder": { "@type": "Organization", "@id": "https://doi.org/10.13039/100000050", "name": "National Heart, Lung, and Blood Institute (NHLBI)" diff --git a/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_crossref_url.yml b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_crossref_url.yml new file mode 100644 index 000000000..d72b8bac2 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_crossref_url.yml @@ -0,0 +1,82 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7554 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Sat, 01 Dec 2018 14:44:43 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - 0bcab827-0d7e-44ab-abca-fe09a72ba2cf + Etag: + - W/"381993dc8a6b0f20960c96a3639c0284" + X-Runtime: + - '0.169950' + X-Powered-By: + - Phusion Passenger 5.3.7 + Server: + - nginx/1.14.0 + Phusion Passenger 5.3.7 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7554","type":"prefixes","attributes":{"registration-agency":"Crossref","created":null,"updated":"2016-09-21T21:07:27Z"},"relationships":{"clients":{"data":[]},"providers":{"data":[]}}},"included":[]}' + http_version: + recorded_at: Sat, 01 Dec 2018 14:44:43 GMT +- request: + method: get + uri: http://www.crossref.org/openurl/?format=unixref&id=doi:10.7554/elife.01567&noredirect=true&pid=tech@datacite.org + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/xml + response: + status: + code: 200 + message: OK + headers: + Server: + - Apache-Coyote/1.1 + Crossref-Deployment-Name: + - qs2-2 + Content-Type: + - text/xml;charset=UTF-8 + Content-Language: + - en-US + Date: + - Sat, 01 Dec 2018 14:44:43 GMT + Connection: + - close + body: + encoding: ASCII-8BIT + string: !binary |- + <?xml version="1.0" encoding="UTF-8"?>
<doi_records>
  <doi_record owner="10.7554" timestamp="2018-08-23 09:41:49">
    <crossref>
      <journal>
        <journal_metadata language="en">
          <full_title>eLife</full_title>
          <issn media_type="electronic">2050-084X</issn>
        </journal_metadata>
        <journal_issue>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <journal_volume>
            <volume>3</volume>
          </journal_volume>
        </journal_issue>
        <journal_article publication_type="full_text" reference_distribution_opts="any">
          <titles>
            <title>Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</title>
          </titles>
          <contributors>
            <person_name contributor_role="author" sequence="first">
              <given_name>Martial</given_name>
              <surname>Sankar</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Kaisa</given_name>
              <surname>Nieminen</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Laura</given_name>
              <surname>Ragni</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Ioannis</given_name>
              <surname>Xenarios</surname>
              <affiliation>Vital-IT, Swiss Institute of Bioinformatics, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Christian S</given_name>
              <surname>Hardtke</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
          </contributors>
          <abstract>
            <p>Among various advantages, their small size makes model organisms preferred subjects of investigation. Yet, even in model systems detailed analysis of numerous developmental processes at cellular level is severely hampered by their scale. For instance, secondary growth of Arabidopsis hypocotyls creates a radial pattern of highly specialized tissues that comprises several thousand cells starting from a few dozen. This dynamic process is difficult to follow because of its scale and because it can only be investigated invasively, precluding comprehensive understanding of the cell proliferation, differentiation, and patterning events involved. To overcome such limitation, we established an automated quantitative histology approach. We acquired hypocotyl cross-sections from tiled high-resolution images and extracted their information content using custom high-throughput image processing and segmentation. Coupled with automated cell type recognition through machine learning, we could establish a cellular resolution atlas that reveals vascular morphodynamics during secondary growth, for example equidistant phloem pole formation.</p>
          </abstract>
          <abstract abstract-type="executive-summary">
            <p>Our understanding of the living world has been advanced greatly by studies of ‘model organisms’, such as mice, zebrafish, and fruit flies. Studying these creatures has been crucial to uncovering the genes that control how our bodies develop and grow, and also to discover the genetic basis of diseases such as cancer.</p>
            <p>Thale cress—or Arabidopsis thaliana to give its formal name—is the model organism of choice for many plant biologists. This tiny weed has been widely studied because it can complete its lifecycle, from seed to seed, in about 6 weeks, and because its relatively small genome simplifies the search for genes that control specific traits. However, as with other much-studied model systems, understanding the changes that underpin the development of some of the more complex tissues in Arabidopsis has been severely hampered by the shear number of cells involved.</p>
            <p>After it has emerged from the seed, the plant’s first stem will develop from a few dozen cells in width to several thousand cells with highly specialized tissues arranged in a complex pattern of concentric circles. Although this stem thickening process represents a major developmental change in many plants—from Arabidopsis to oak trees—it has been under-researched. This is partly because it involves so many different cells, and also because it can only be observed in thin sections cut out of the plant’s stem.</p>
            <p>Now Sankar, Nieminen, Ragni et al. have developed a novel approach, termed ‘automated quantitative histology’, to overcome these problems. This strategy involves ‘teaching’ a computer to automatically recognize different plant cells and to measure their important features in high-resolution images of tissue sections. The resulting ‘map’ of the developing stem—which required over 800 hr of computing time to complete—reveals the changes to cells and tissues as they develop that allow the transport of water, sugars and nutrients between the above- and below-ground organs. Sankar, Nieminen, Ragni et al. suggest that their novel approach could, in the future, also be applied to study the development of other tissues and organisms, including animals.</p>
          </abstract>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <publisher_item>
            <item_number item_number_type="article_number">e01567</item_number>
            <identifier id_type="doi">10.7554/eLife.01567</identifier>
          </publisher_item>
          <program name="fundref">
            <assertion name="fundgroup">
              <assertion name="funder_name">SystemsX</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">EMBO longterm post-doctoral fellowships</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">Marie Heim-Voegtlin</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">
                University of Lausanne
                <assertion name="funder_identifier" provider="crossref">501100006390</assertion>
              </assertion>
            </assertion>
          </program>
          <program name="AccessIndicators">
            <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
          </program>
          <crossmark>
            <crossmark_version>1</crossmark_version>
            <crossmark_policy>eLifesciences</crossmark_policy>
            <crossmark_domains>
              <crossmark_domain>
                <domain>www.elifesciences.org</domain>
              </crossmark_domain>
            </crossmark_domains>
            <crossmark_domain_exclusive>false</crossmark_domain_exclusive>
            <custom_metadata>
              <assertion name="received" label="Received" group_name="publication_history" group_label="Publication History" order="0">2013-09-20</assertion>
              <assertion name="accepted" label="Accepted" group_name="publication_history" group_label="Publication History" order="1">2013-12-24</assertion>
              <assertion name="published" label="Published" group_name="publication_history" group_label="Publication History" order="2">2014-02-11</assertion>
              <program name="fundref">
                <assertion name="fundgroup">
                  <assertion name="funder_name">SystemsX</assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    EMBO
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100003043</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    Swiss National Science Foundation
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100001711</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    University of Lausanne
                    <assertion name="funder_identifier" provider="crossref">http://dx.doi.org/10.13039/501100006390</assertion>
                  </assertion>
                </assertion>
              </program>
              <program name="AccessIndicators">
                <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
              </program>
            </custom_metadata>
          </crossmark>
          <program>
            <related_item>
              <description>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</description>
              <inter_work_relation identifier-type="doi" relationship-type="isSupplementedBy">10.5061/dryad.b835k</inter_work_relation>
            </related_item>
          </program>
          <archive_locations>
            <archive name="CLOCKSS" />
          </archive_locations>
          <doi_data>
            <doi>10.7554/eLife.01567</doi>
            <resource>https://elifesciences.org/articles/01567</resource>
            <collection property="text-mining">
              <item>
                <resource mime_type="application/pdf">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.pdf</resource>
              </item>
              <item>
                <resource mime_type="application/xml">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.xml</resource>
              </item>
            </collection>
          </doi_data>
          <citation_list>
            <citation key="bib1">
              <journal_title>Nature</journal_title>
              <author>Bonke</author>
              <volume>426</volume>
              <first_page>181</first_page>
              <cYear>2003</cYear>
              <article_title>APL regulates vascular tissue identity in Arabidopsis</article_title>
              <doi>10.1038/nature02100</doi>
            </citation>
            <citation key="bib2">
              <journal_title>Genetics</journal_title>
              <author>Brenner</author>
              <volume>182</volume>
              <first_page>413</first_page>
              <cYear>2009</cYear>
              <article_title>In the beginning was the worm</article_title>
              <doi>10.1534/genetics.109.104976</doi>
            </citation>
            <citation key="bib3">
              <journal_title>Physiologia Plantarum</journal_title>
              <author>Chaffey</author>
              <volume>114</volume>
              <first_page>594</first_page>
              <cYear>2002</cYear>
              <article_title>Secondary xylem development in Arabidopsis: a model for wood formation</article_title>
              <doi>10.1034/j.1399-3054.2002.1140413.x</doi>
            </citation>
            <citation key="bib4">
              <journal_title>Neural computation</journal_title>
              <author>Chang</author>
              <volume>13</volume>
              <first_page>2119</first_page>
              <cYear>2001</cYear>
              <article_title>Training nu-support vector classifiers: theory and algorithms</article_title>
              <doi>10.1162/089976601750399335</doi>
            </citation>
            <citation key="bib5">
              <journal_title>Machine Learning</journal_title>
              <author>Cortes</author>
              <volume>20</volume>
              <first_page>273</first_page>
              <cYear>1995</cYear>
              <doi provider="crossref">10.1007/BF00994018</doi>
              <article_title>Support-vector Networks</article_title>
            </citation>
            <citation key="bib6">
              <journal_title>Development</journal_title>
              <author>Dolan</author>
              <volume>119</volume>
              <first_page>71</first_page>
              <cYear>1993</cYear>
              <article_title>Cellular organisation of the Arabidopsis thaliana root</article_title>
            </citation>
            <citation key="bib7">
              <journal_title>Seminars in Cell &amp; Developmental Biology</journal_title>
              <author>Elo</author>
              <volume>20</volume>
              <first_page>1097</first_page>
              <cYear>2009</cYear>
              <article_title>Stem cell function during plant vascular development</article_title>
              <doi>10.1016/j.semcdb.2009.09.009</doi>
            </citation>
            <citation key="bib8">
              <journal_title>Development</journal_title>
              <author>Etchells</author>
              <volume>140</volume>
              <first_page>2224</first_page>
              <cYear>2013</cYear>
              <article_title>WOX4 and WOX14 act downstream of the PXY receptor kinase to regulate plant vascular proliferation independently of any role in vascular organisation</article_title>
              <doi>10.1242/dev.091314</doi>
            </citation>
            <citation key="bib9">
              <journal_title>PLOS Genetics</journal_title>
              <author>Etchells</author>
              <volume>8</volume>
              <first_page>e1002997</first_page>
              <cYear>2012</cYear>
              <article_title>Plant vascular cell division is maintained by an interaction between PXY and ethylene signalling</article_title>
              <doi>10.1371/journal.pgen.1002997</doi>
            </citation>
            <citation key="bib10">
              <journal_title>Molecular Systems Biology</journal_title>
              <author>Fuchs</author>
              <volume>6</volume>
              <first_page>370</first_page>
              <cYear>2010</cYear>
              <article_title>Clustering phenotype populations by genome-wide RNAi and multiparametric imaging</article_title>
              <doi>10.1038/msb.2010.25</doi>
            </citation>
            <citation key="bib11">
              <journal_title>Bio Systems</journal_title>
              <author>Granqvist</author>
              <volume>110</volume>
              <first_page>60</first_page>
              <cYear>2012</cYear>
              <article_title>BaSAR-A tool in R for frequency detection</article_title>
              <doi>10.1016/j.biosystems.2012.07.004</doi>
            </citation>
            <citation key="bib12">
              <journal_title>Current Opinion in Plant Biology</journal_title>
              <author>Groover</author>
              <volume>9</volume>
              <first_page>55</first_page>
              <cYear>2006</cYear>
              <article_title>Developmental mechanisms regulating secondary growth in woody plants</article_title>
              <doi>10.1016/j.pbi.2005.11.013</doi>
            </citation>
            <citation key="bib13">
              <journal_title>Plant Cell</journal_title>
              <author>Hirakawa</author>
              <volume>22</volume>
              <first_page>2618</first_page>
              <cYear>2010</cYear>
              <article_title>TDIF peptide signaling regulates vascular stem cell proliferation via the WOX4 homeobox gene in Arabidopsis</article_title>
              <doi>10.1105/tpc.110.076083</doi>
            </citation>
            <citation key="bib14">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Hirakawa</author>
              <volume>105</volume>
              <first_page>15208</first_page>
              <cYear>2008</cYear>
              <article_title>Non-cell-autonomous control of vascular stem cell fate by a CLE peptide/receptor system</article_title>
              <doi>10.1073/pnas.0808444105</doi>
            </citation>
            <citation key="bib15">
              <journal_title>Cell</journal_title>
              <author>Meyerowitz</author>
              <volume>56</volume>
              <first_page>263</first_page>
              <cYear>1989</cYear>
              <article_title>Arabidopsis, a useful weed</article_title>
              <doi>10.1016/0092-8674(89)90900-8</doi>
            </citation>
            <citation key="bib16">
              <journal_title>Science</journal_title>
              <author>Meyerowitz</author>
              <volume>295</volume>
              <first_page>1482</first_page>
              <cYear>2002</cYear>
              <article_title>Plants compared to animals: the broadest comparative study of development</article_title>
              <doi>10.1126/science.1066609</doi>
            </citation>
            <citation key="bib17">
              <journal_title>Plant Physiol</journal_title>
              <author>Nieminen</author>
              <volume>135</volume>
              <first_page>653</first_page>
              <cYear>2004</cYear>
              <article_title>A weed for wood? Arabidopsis as a genetic model for xylem development</article_title>
              <doi>10.1104/pp.104.040212</doi>
            </citation>
            <citation key="bib18">
              <journal_title>Nature Biotechnology</journal_title>
              <author>Noble</author>
              <volume>24</volume>
              <first_page>1565</first_page>
              <cYear>2006</cYear>
              <article_title>What is a support vector machine?</article_title>
              <doi>10.1038/nbt1206-1565</doi>
            </citation>
            <citation key="bib19">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Olson</author>
              <volume>77</volume>
              <first_page>1516</first_page>
              <cYear>1980</cYear>
              <article_title>Classification of cultured mammalian cells by shape analysis and pattern recognition</article_title>
              <doi>10.1073/pnas.77.3.1516</doi>
            </citation>
            <citation key="bib20">
              <journal_title>Bioinformatics</journal_title>
              <author>Pau</author>
              <volume>26</volume>
              <first_page>979</first_page>
              <cYear>2010</cYear>
              <article_title>EBImage–an R package for image processing with applications to cellular phenotypes</article_title>
              <doi>10.1093/bioinformatics/btq046</doi>
            </citation>
            <citation key="bib21">
              <journal_title>Plant Cell</journal_title>
              <author>Ragni</author>
              <volume>23</volume>
              <first_page>1322</first_page>
              <cYear>2011</cYear>
              <article_title>Mobile gibberellin directly stimulates Arabidopsis hypocotyl xylem expansion</article_title>
              <doi>10.1105/tpc.111.084020</doi>
            </citation>
            <citation key="bib22">
              <journal_title>Dryad Digital Repository</journal_title>
              <author>Sankar</author>
              <cYear>2014</cYear>
              <article_title>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</article_title>
              <doi>10.5061/dryad.b835k</doi>
            </citation>
            <citation key="bib23">
              <journal_title>Current Biology</journal_title>
              <author>Sibout</author>
              <volume>18</volume>
              <first_page>458</first_page>
              <cYear>2008</cYear>
              <article_title>Flowering as a condition for xylem expansion in Arabidopsis hypocotyl and root</article_title>
              <doi>10.1016/j.cub.2008.02.070</doi>
            </citation>
            <citation key="bib24">
              <journal_title>The New Phytologist</journal_title>
              <author>Spicer</author>
              <volume>186</volume>
              <first_page>577</first_page>
              <cYear>2010</cYear>
              <article_title>Evolution of development of vascular cambia and secondary growth</article_title>
              <doi>10.1111/j.1469-8137.2010.03236.x</doi>
            </citation>
            <citation key="bib25">
              <journal_title>Machine Vision and Applications</journal_title>
              <author>Theriault</author>
              <volume>23</volume>
              <first_page>659</first_page>
              <cYear>2012</cYear>
              <article_title>Cell morphology classification and clutter mitigation in phase-contrast microscopy images using machine learning</article_title>
              <doi>10.1007/s00138-011-0345-9</doi>
            </citation>
            <citation key="bib26">
              <journal_title>Cell</journal_title>
              <author>Uyttewaal</author>
              <volume>149</volume>
              <first_page>439</first_page>
              <cYear>2012</cYear>
              <article_title>Mechanical stress acts via katanin to amplify differences in growth rate between adjacent cells in Arabidopsis</article_title>
              <doi>10.1016/j.cell.2012.02.048</doi>
            </citation>
            <citation key="bib27">
              <journal_title>Nature Cell Biology</journal_title>
              <author>Yin</author>
              <volume>15</volume>
              <first_page>860</first_page>
              <cYear>2013</cYear>
              <article_title>A screen for morphological complexity identifies regulators of switch-like transitions between discrete cell shapes</article_title>
              <doi>10.1038/ncb2764</doi>
            </citation>
          </citation_list>
          <component_list>
            <component parent_relation="isPartOf">
              <titles>
                <title>Abstract</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.001</doi>
                <resource>https://elifesciences.org/articles/01567#abstract</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>eLife digest</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.002</doi>
                <resource>https://elifesciences.org/articles/01567#digest</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 1. Cellular level analysis of Arabidopsis hypocotyl secondary growth.</title>
                <subtitle>(A) Light microscopy of cross sections obtained from Arabidopsis hypocotyls (organ position illustrated for a 9-day-old seedling, lower left) at 9 dag (upper left) and 35 dag (right). Size bars are 100 μm. Blue GUS staining due to the presence of an APL::GUS reporter gene in this Col-0 background line marks phloem bundles. (B) Overview of the developmental series (time points and distinct samples per genotype) analyzed in this study. (C) Example of a high-resolution hypocotyl section image assembled from 11 × 11 tiles. (D) The same image after pre-processing and binarization, and (E) subsequent segmentation using a watershed algorithm. (F) Number of mis-segmented cells as determined by careful visual inspection in 12 sections, plotted against the total number of cells per section (log scale).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.003</doi>
                <resource>https://elifesciences.org/articles/01567#fig1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2. The ‘Quantitative Histology’ approach.</title>
                <subtitle>(A) Overview of the computational pipeline from image acquisition to analysis. (B) ‘Phenoprints’ for the different genotypes and developmental stages.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.004</doi>
                <resource>https://elifesciences.org/articles/01567#fig2</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2—figure supplement 1. An example of classifier selection through V-fold cross validation.</title>
                <subtitle>The green arrow points out the selected feature combination according to the criteria of minimum number of features with the highest performance and the lowest variation (the radiusV feature was excluded due to its putative variation in tissue location).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.005</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig2s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 3. Progression of tissue proliferation.</title>
                <subtitle>(A) Principal component analysis (PCA) of the phenoprints shown in Figure 2B, performed with normalized values (Supplementary file 4). The inlay screeplot displays the proportion of total variation explained by each principal component. (B–E) Comparative plots of parameter progression in the two genotypes. In (D), xylem represents combined vessel, parenchyma, and fiber cells, phloem represents combined phloem parenchyma and bundle cells. Error bars indicate standard error.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.006</doi>
                <resource>https://elifesciences.org/articles/01567#fig3</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4. Bimodal distribution of incline angle according to position.</title>
                <subtitle>(A and B) Spatial distribution of cell incline angle illustrates the vascular organization in Ler (B) as compared to Col-0 (A) at later stages of development, for example 30 dag. The size of the disc increases with the area of the cell. Blue color indicates radial cell orientation, red orthoradial. (C and D) Violin plots of incline angle distribution, illustrating increasingly bimodal distribution coincident with refined vascular organization and different dynamics of the process in the two genotypes.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.007</doi>
                <resource>https://elifesciences.org/articles/01567#fig4</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4—figure supplement 1. An illustration of the incline angle.</title>
                <subtitle>The incline is the angle between the section radius through the center of an ellipse fit to a cell and the major axis of that ellipse extended towards the x axis.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.008</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig4s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5. Distinct local organization of incline angle during hypocotyl secondary growth progression.</title>
                <subtitle>(A–J) Density plots of cell incline angle vs radial position for the two genotypes at the indicated developmental stages, representing all cells across all sections for a given time point. The red lines represent the fit of these cloud distributions with locally weighted linear regression (i.e., lowess), revealing the essential data trends. All sections were normalized from 0.0 (the manually defined center) to 1.0 (the average radius in a set of sections as determined by the average distance of the outermost cells from the center for individual sections). Box plots indicate the quartiles of the radian distribution for each cell-type class and are placed at the average position of the cell type with respect to the y axis. Outliers are shown as circles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.009</doi>
                <resource>https://elifesciences.org/articles/01567#fig5</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5—figure supplement 1. Analysis of cell number in defined xylem regions of different size.</title>
                <subtitle>Cell number in a circle of 200–500 pixels around the section centers for Col-0. Cell count in a constant area of xylem over time across all averaged across all sections.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.010</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig5s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 6. Mapping of phloem pole patterning.</title>
                <subtitle>(A) Example of Gaussian kernel density estimate of the location of predicted phloem bundles cells in a 30 dag Col-0 section. High density represents phloem poles. (B) Example of an analysis of emerging phloem pole position in a 30 dag Col-0 section. The plot represents a pixel intensity map after noise reduction along a circular region of interest across the emerging phloem poles. Intensity peaks are due to GUS staining conferred to phloem bundles by an APL::GUS reporter construct. (C) Probability density function of the data shown in (B) obtained from an automated Bayesian model. The dominant single peak indicates a constant arc distance of ca. 62 pixel between the phloem poles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.011</doi>
                <resource>https://elifesciences.org/articles/01567#fig6</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 1.</title>
                <subtitle>(A) An explanation of the extracted parameters that describe the cellular features. (B) Summary information of the hand-labeled training set for supervised machine learning. (C) Definition of the classifiers selected for analysis. (D) Summary of the classifier parameters for supervised machine learning. (E) Overview of the cell type classes recognized by the supervised machine learning approach and their assignment codes used in Data Files 3 and 4.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.012</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD1-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 2.</title>
                <subtitle>Quality control files for the Col-0 sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.013</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD2-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 3.</title>
                <subtitle>Quality control files for the Ler sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.014</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD3-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 4.</title>
                <subtitle>The normalized values of the phenoprints (Figure 2B) used for PCA.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.015</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD4-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Decision letter</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.016</doi>
                <resource>https://elifesciences.org/articles/01567#SA1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Author response</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.017</doi>
                <resource>https://elifesciences.org/articles/01567#SA2</resource>
              </doi_data>
            </component>
          </component_list>
        </journal_article>
      </journal>
    </crossref>
  </doi_record>
</doi_records> + http_version: + recorded_at: Sat, 01 Dec 2018 14:44:44 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_datacite_url.yml b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_datacite_url.yml new file mode 100644 index 000000000..ff4904ed4 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_datacite_url.yml @@ -0,0 +1,99 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7272 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 12:23:35 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - 7ac3e7b6-6d0c-46fe-932d-5c0bce43449b + Etag: + - W/"434d63d02889e47275389a930375c569" + X-Runtime: + - '0.024104' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7272","type":"prefixes","attributes":{"registration-agency":"DataCite","created":"2012-03-15T09:47:35.000Z","updated":null},"relationships":{"clients":{"data":[{"id":"cdl.ucsfctsi","type":"clients"}]},"providers":{"data":[{"id":"cdl","type":"providers"}]}}},"included":[{"id":"cdl.ucsfctsi","type":"clients","attributes":{"name":"UCSF + Clinical & Translational Science Institute (CTSI)","symbol":"CDL.UCSFCTSI","year":2012,"contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","domains":"*","url":null,"created":"2012-07-10T20:59:53.000Z","updated":"2018-08-26T02:35:12.000Z","is-active":true,"has-password":true},"relationships":{"provider":{"data":{"id":"cdl","type":"providers"}},"prefixes":{"data":[{"id":"10.5072","type":"prefixes"},{"id":"10.7272","type":"prefixes"}]}}},{"id":"cdl","type":"providers","attributes":{"name":"California + Digital Library","symbol":"CDL","website":"http://ezid.cdlib.org","contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","phone":null,"description":"California + Digital Library (CDL) handles scholarly information at every stage of its + life. CDL provides technology and expertise to help the University of California + (UC) collect, publish, access, and preserve its full range of information + resources. CDL partners with organizations outside the UCs on far-reaching + problems.\n\nCDL offers DataCite DOIs to University of California scholars + and researchers via the EZID service. EZID is also available as a general + identifier service to help educational, non-profit, governmental and commercial + clients create and manage globally unique identifiers for data and other sources.","region":"AMER","country":"US","logo-url":"https://assets.datacite.org/images/members/cdl.png","organization-type":"academic_institution","focus-area":"general","is-active":true,"has-password":true,"joined":"2009-12-01","created":"2010-01-01T00:00:00.000Z","updated":"2018-10-24T20:47:51.000Z"},"relationships":{"prefixes":{"data":[{"id":"10.5062","type":"prefixes"},{"id":"10.5063","type":"prefixes"},{"id":"10.5065","type":"prefixes"},{"id":"10.5068","type":"prefixes"},{"id":"10.5069","type":"prefixes"},{"id":"10.5070","type":"prefixes"},{"id":"10.5072","type":"prefixes"},{"id":"10.6071","type":"prefixes"},{"id":"10.6072","type":"prefixes"},{"id":"10.6074","type":"prefixes"},{"id":"10.6075","type":"prefixes"},{"id":"10.6076","type":"prefixes"},{"id":"10.6078","type":"prefixes"},{"id":"10.6079","type":"prefixes"},{"id":"10.6080","type":"prefixes"},{"id":"10.6081","type":"prefixes"},{"id":"10.6085","type":"prefixes"},{"id":"10.6086","type":"prefixes"},{"id":"10.7265","type":"prefixes"},{"id":"10.7268","type":"prefixes"},{"id":"10.7269","type":"prefixes"},{"id":"10.7270","type":"prefixes"},{"id":"10.7271","type":"prefixes"},{"id":"10.7272","type":"prefixes"},{"id":"10.7276","type":"prefixes"},{"id":"10.7279","type":"prefixes"},{"id":"10.7280","type":"prefixes"},{"id":"10.7281","type":"prefixes"},{"id":"10.7282","type":"prefixes"},{"id":"10.7284","type":"prefixes"},{"id":"10.7285","type":"prefixes"},{"id":"10.7286","type":"prefixes"},{"id":"10.7288","type":"prefixes"},{"id":"10.7291","type":"prefixes"},{"id":"10.7292","type":"prefixes"},{"id":"10.7293","type":"prefixes"},{"id":"10.7295","type":"prefixes"},{"id":"10.7296","type":"prefixes"},{"id":"10.7297","type":"prefixes"},{"id":"10.7299","type":"prefixes"},{"id":"10.7300","type":"prefixes"},{"id":"10.4246","type":"prefixes"},{"id":"10.7908","type":"prefixes"},{"id":"10.7911","type":"prefixes"},{"id":"10.7913","type":"prefixes"},{"id":"10.7914","type":"prefixes"},{"id":"10.7916","type":"prefixes"},{"id":"10.7918","type":"prefixes"},{"id":"10.7919","type":"prefixes"},{"id":"10.7920","type":"prefixes"},{"id":"10.7921","type":"prefixes"},{"id":"10.7922","type":"prefixes"},{"id":"10.7925","type":"prefixes"},{"id":"10.7927","type":"prefixes"},{"id":"10.7928","type":"prefixes"},{"id":"10.7929","type":"prefixes"},{"id":"10.7932","type":"prefixes"},{"id":"10.7933","type":"prefixes"},{"id":"10.7934","type":"prefixes"},{"id":"10.7939","type":"prefixes"},{"id":"10.7940","type":"prefixes"},{"id":"10.7941","type":"prefixes"},{"id":"10.7942","type":"prefixes"},{"id":"10.7943","type":"prefixes"},{"id":"10.7944","type":"prefixes"},{"id":"10.7945","type":"prefixes"},{"id":"10.7946","type":"prefixes"},{"id":"10.13022","type":"prefixes"},{"id":"10.13026","type":"prefixes"},{"id":"10.13025","type":"prefixes"},{"id":"10.15147","type":"prefixes"},{"id":"10.15146","type":"prefixes"},{"id":"10.15142","type":"prefixes"},{"id":"10.15144","type":"prefixes"},{"id":"10.15145","type":"prefixes"},{"id":"10.15140","type":"prefixes"},{"id":"10.15141","type":"prefixes"},{"id":"10.15139","type":"prefixes"},{"id":"10.1184","type":"prefixes"},{"id":"10.15784","type":"prefixes"},{"id":"10.15779","type":"prefixes"},{"id":"10.15780","type":"prefixes"},{"id":"10.15781","type":"prefixes"},{"id":"10.15782","type":"prefixes"},{"id":"10.17612","type":"prefixes"},{"id":"10.17610","type":"prefixes"},{"id":"10.17611","type":"prefixes"},{"id":"10.17614","type":"prefixes"},{"id":"10.17615","type":"prefixes"},{"id":"10.17602","type":"prefixes"},{"id":"10.17603","type":"prefixes"},{"id":"10.17908","type":"prefixes"},{"id":"10.17916","type":"prefixes"},{"id":"10.17915","type":"prefixes"},{"id":"10.17918","type":"prefixes"},{"id":"10.17919","type":"prefixes"},{"id":"10.17911","type":"prefixes"},{"id":"10.17913","type":"prefixes"},{"id":"10.17920","type":"prefixes"},{"id":"10.18123","type":"prefixes"},{"id":"10.18119","type":"prefixes"},{"id":"10.18118","type":"prefixes"},{"id":"10.18117","type":"prefixes"},{"id":"10.18115","type":"prefixes"},{"id":"10.18431","type":"prefixes"},{"id":"10.18436","type":"prefixes"},{"id":"10.18437","type":"prefixes"},{"id":"10.18439","type":"prefixes"},{"id":"10.18737","type":"prefixes"},{"id":"10.18736","type":"prefixes"},{"id":"10.18739","type":"prefixes"},{"id":"10.18734","type":"prefixes"},{"id":"10.20353","type":"prefixes"},{"id":"10.20354","type":"prefixes"},{"id":"10.20352","type":"prefixes"},{"id":"10.20357","type":"prefixes"},{"id":"10.20358","type":"prefixes"},{"id":"10.20359","type":"prefixes"},{"id":"10.21228","type":"prefixes"},{"id":"10.21229","type":"prefixes"},{"id":"10.21224","type":"prefixes"},{"id":"10.21222","type":"prefixes"},{"id":"10.21223","type":"prefixes"},{"id":"10.21221","type":"prefixes"},{"id":"10.21237","type":"prefixes"},{"id":"10.21238","type":"prefixes"},{"id":"10.21239","type":"prefixes"},{"id":"10.21236","type":"prefixes"},{"id":"10.21430","type":"prefixes"},{"id":"10.21433","type":"prefixes"},{"id":"10.21431","type":"prefixes"},{"id":"10.21421","type":"prefixes"},{"id":"10.21422","type":"prefixes"},{"id":"10.21424","type":"prefixes"},{"id":"10.21425","type":"prefixes"},{"id":"10.21426","type":"prefixes"},{"id":"10.21427","type":"prefixes"},{"id":"10.21428","type":"prefixes"},{"id":"10.21418","type":"prefixes"},{"id":"10.21416","type":"prefixes"},{"id":"10.21414","type":"prefixes"},{"id":"10.21972","type":"prefixes"},{"id":"10.21973","type":"prefixes"},{"id":"10.21975","type":"prefixes"},{"id":"10.21976","type":"prefixes"},{"id":"10.21977","type":"prefixes"},{"id":"10.21978","type":"prefixes"},{"id":"10.21990","type":"prefixes"},{"id":"10.21983","type":"prefixes"},{"id":"10.21980","type":"prefixes"},{"id":"10.21986","type":"prefixes"},{"id":"10.5195","type":"prefixes"},{"id":"10.25334","type":"prefixes"},{"id":"10.25337","type":"prefixes"},{"id":"10.25338","type":"prefixes"},{"id":"10.25342","type":"prefixes"},{"id":"10.25349","type":"prefixes"},{"id":"10.25348","type":"prefixes"},{"id":"10.25347","type":"prefixes"},{"id":"10.25346","type":"prefixes"},{"id":"10.25345","type":"prefixes"},{"id":"10.25344","type":"prefixes"},{"id":"10.25352","type":"prefixes"},{"id":"10.25350","type":"prefixes"},{"id":"10.25351","type":"prefixes"},{"id":"10.26081","type":"prefixes"}]}}}]}' + http_version: + recorded_at: Fri, 07 Dec 2018 12:23:35 GMT +- request: + method: get + uri: https://search.test.datacite.org/api?fl=doi,url,xml,state,allocator_symbol,datacentre_symbol,media,minted,updated&q=doi:10.7272/q6g15xs4&wt=json + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 12:23:35 GMT + Content-Type: + - application/json;charset=UTF-8 + Connection: + - keep-alive + Server: + - nginx/1.10.3 (Ubuntu) + Access-Control-Allow-Origin: + - "*" + Access-Control-Allow-Methods: + - GET, POST, PUT, DELETE, OPTIONS + Access-Control-Allow-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + Access-Control-Expose-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + body: + encoding: ASCII-8BIT + string: '{"responseHeader":{"status":0,"QTime":0},"response":{"numFound":1,"start":0,"docs":[{"datacentre_symbol":"CDL.UCSFCTSI","url":"https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4","xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz4KPHJlc291cmNlIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC0zL21ldGFkYXRhLnhzZCI+CiAgPGlkZW50aWZpZXIgaWRlbnRpZmllclR5cGU9IkRPSSI+MTAuNzI3Mi9RNkcxNVhTNDwvaWRlbnRpZmllcj4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lPlJvZHJpZ3VleiwgUm9iZXJ0PC9jcmVhdG9yTmFtZT4KICAgICAgPGFmZmlsaWF0aW9uPlVDIFNhbiBGcmFuY2lzY288L2FmZmlsaWF0aW9uPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZT5Nb3dlciwgV2lsbGlhbTwvY3JlYXRvck5hbWU+CiAgICAgIDxhZmZpbGlhdGlvbj5VQ0xBPC9hZmZpbGlhdGlvbj4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+TkVYVVMgSGVhZCBDVDwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5VQyBTYW4gRnJhbmNpc2NvPC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+CiAgPGxhbmd1YWdlPmVuPC9sYW5ndWFnZT4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IkRhdGFzZXQiLz4KICA8c2l6ZXM+CiAgICA8c2l6ZT4xNDk1MjA0IGJ5dGVzPC9zaXplPgogIDwvc2l6ZXM+CiAgPHZlcnNpb24+MTwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwczovL2NyZWF0aXZlY29tbW9ucy5vcmcvbGljZW5zZXMvYnkvNC4wLyI+Q3JlYXRpdmUgQ29tbW9ucyBBdHRyaWJ1dGlvbiA0LjAgSW50ZXJuYXRpb25hbCAoQ0MgQlkgNC4wKTwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPgogICAgICBCYWNrZ3JvdW5kIENsaW5pY2lhbnMsIGFmcmFpZCBvZiBtaXNzaW5nIGludHJhY3JhbmlhbCBpbmp1cmllcywgbGliZXJhbGx5CiAgICAgIG9idGFpbiBjb21wdXRlZCB0b21vZ3JhcGhpYyAoQ1QpIGhlYWQgaW1hZ2luZyBpbiBibHVudCB0cmF1bWEgcGF0aWVudHMuCiAgICAgIFByaW9yIHdvcmsgc3VnZ2VzdHMgdGhhdCBjbGluaWNhbCBjcml0ZXJpYSAoTkVYVVMgSGVhZCBDVCBkZWNpc2lvbgogICAgICBpbnN0cnVtZW50KSBjYW4gcmVsaWFibHkgaWRlbnRpZnkgcGF0aWVudHMgd2l0aCBpbXBvcnRhbnQgaW5qdXJpZXMsIHdoaWxlCiAgICAgIGV4Y2x1ZGluZyBpbmp1cnksIGFuZCB0aGUgbmVlZCBmb3IgaW1hZ2luZyBpbiBtYW55IHBhdGllbnRzLiBNZXRob2RzIFdlCiAgICAgIGNvbmR1Y3RlZCBhIHByb3NwZWN0aXZlIG9ic2VydmF0aW9uYWwgc3R1ZHkgb2YgdGhlIE5FWFVTIEhlYWQgQ1QgZGVjaXNpb24KICAgICAgaW5zdHJ1bWVudCAoREkpIHRoYXQgcmVxdWlyZXMgcGF0aWVudHMgdG8gbWVldCBlaWdodCBjcml0ZXJpYSB0byBhY2hpZXZlCiAgICAgIOKAnGxvdy1yaXNr4oCdIGNsYXNzaWZpY2F0aW9uLiBXZSBleGFtaW5lZCB0aGUgaW5zdHJ1bWVudOKAmXMgcGVyZm9ybWFuY2UgaW4KICAgICAgaWRlbnRpZnlpbmcgcGF0aWVudHMgcmVxdWlyaW5nIG5ldXJvbG9naWNhbCBpbnRlcnZlbnRpb24gZnJvbSBhbW9uZyBhCiAgICAgIGNvaG9ydCBvZiAxMSw3NzAgYmx1bnQgaGVhZCBpbmp1cnkgcGF0aWVudHMuIFJlc3VsdHMgVGhlIE5FWFVTIEhlYWQgQ1QgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA0MjAgb2YgNDIwIHBhdGllbnRzIHJlcXVpcmluZyBuZXVyb2xvZ2ljYWwKICAgICAgaW50ZXJ2ZW50aW9uIChzZW5zaXRpdml0eSwgMTAwLjAlIFs5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBbQ0ldOiA5OS4xJSDigJMKICAgICAgMTAwLjAlXSkuIFRoZSBpbnN0cnVtZW50IGFzc2lnbmVkIGxvdy1yaXNrIHN0YXR1cyB0byAyLDgyMyBvZiAxMSwzNTAKICAgICAgcGF0aWVudHMgd2hvIGRpZCBub3QgcmVxdWlyZSBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChzcGVjaWZpY2l0eSwgMjQuOSUKICAgICAgWzk1JSBDSTogMjQuMSUgLSAyNS43JV0pLiBOb25lIG9mIHRoZSAyLDgyMyBsb3ctcmlzayBwYXRpZW50cyByZXF1aXJlZAogICAgICBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChOUFYsIDEwMC4wJSBbOTUlIENJOiA5OS45JSAtIDEwMC4wJV0pLiBUaGUgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA3NTkgb2YgNzY3IHBhdGllbnRzIHdpdGggc2lnbmlmaWNhbnQKICAgICAgaW50cmFjcmFuaWFsIGluanVyaWVzIChzZW5zaXRpdml0eSwgOTkuMCUgWzk1JSBDSTogOTguMCUgLSA5OS42JV0pLiBUaGUKICAgICAgaW5zdHJ1bWVudCBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgdG8gMiw4MTUgb2YgMTEsMDAzIHBhdGllbnRzIHdobyBkaWQKICAgICAgbm90IGhhdmUgc2lnbmlmaWNhbnQgaW5qdXJpZXMgKHNwZWNpZmljaXR5LCAyNS42JSBbOTUlIENJOiAyNC44JSAtCiAgICAgIDI2LjQlXSkuIFNpZ25pZmljYW50IGluanVyaWVzIHdlcmUgYWJzZW50IGluIDIsODE1IG9mIHRoZSAyLDgyMyBwYXRpZW50cwogICAgICBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgKE5QViwgOTkuNyUgWzk1JSBDSTogOTkuNCUgLSA5OS45JV0pLiBDb25jbHVzaW9ucwogICAgICBUaGUgTkVYVVMgSGVhZCBDVCBESSByZWxpYWJseSBpZGVudGlmaWVzIGJsdW50IHRyYXVtYSBwYXRpZW50cyB3aG8gcmVxdWlyZQogICAgICBoZWFkIENUIGltYWdpbmcsIGFuZCBjb3VsZCBzaWduaWZpY2FudGx5IHJlZHVjaW5nIHRoZSB1c2Ugb2YgQ1QgaW1hZ2luZy4KICAgIDwvZGVzY3JpcHRpb24+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJNZXRob2RzIj5Qcm9zcGVjdGl2ZSBtdWx0aWNlbnRlcjwvZGVzY3JpcHRpb24+CiAgPC9kZXNjcmlwdGlvbnM+CiAgPGdlb0xvY2F0aW9ucz4KICAgIDxnZW9Mb2NhdGlvbj4KICAgICAgPGdlb0xvY2F0aW9uUG9pbnQ+MzcuMjUwMjIgLTExOS43NTEyNjwvZ2VvTG9jYXRpb25Qb2ludD4KICAgICAgPGdlb0xvY2F0aW9uUGxhY2U+Q2FsaWZvcm5pYSwgVVNBPC9nZW9Mb2NhdGlvblBsYWNlPgogICAgPC9nZW9Mb2NhdGlvbj4KICA8L2dlb0xvY2F0aW9ucz4KPC9yZXNvdXJjZT4=","allocator_symbol":"CDL","minted":"2018-12-07T09:48:20Z","state":"findable","updated":"2018-12-07T09:48:20Z","doi":"10.7272/Q6G15XS4"}]}} + +' + http_version: + recorded_at: Fri, 07 Dec 2018 12:23:35 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_schema_org_url.yml b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_schema_org_url.yml new file mode 100644 index 000000000..f807ae151 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/Doi/parse_xml/from_schema_org_url.yml @@ -0,0 +1,92 @@ +--- +http_interactions: +- request: + method: get + uri: https://doi.pangaea.de/10.1594/PANGAEA.836178 + body: + encoding: US-ASCII + string: '' + headers: + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + User-Agent: + - Ruby + response: + status: + code: 200 + message: OK + headers: + Server: + - PANGAEA/1.0 + Date: + - Thu, 29 Nov 2018 12:17:36 GMT + Transfer-Encoding: + - chunked + Vary: + - Accept + - Accept-Encoding + Link: + - ;rel="cite-as", ;rel="describedby";type="application/ld+json", + ;rel="describedby";type="application/x-research-info-systems", + ;rel="describedby";type="application/x-bibtex", + ;rel="item";type="application/zip", + ;rel="author", ;rel="author" + Content-Type: + - text/html;charset=UTF-8 + X-Ua-Compatible: + - IE=Edge + X-Content-Type-Options: + - nosniff + Strict-Transport-Security: + - max-age=31536000 + body: + encoding: ASCII-8BIT + string: !binary |- + <!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1, minimum-scale=1, maximum-scale=1, user-scalable=no">
<link rel="stylesheet" href="//fonts.googleapis.com/css?family=Open+Sans:400,600,400italic,700,700italic,600italic,300,300italic,800,800italic">
<link rel="stylesheet" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/bootstrap-24col/css/bootstrap.min.css">
<link rel="stylesheet" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/css/pangaea.css">
<!--[if lte IE 9]>
<style>#topics-pulldown-wrapper label:after { display:none; }</style>
<![endif]-->
<link rel="shortcut icon" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/favicon.ico">
<link rel="icon" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/favicon.ico" type="image/vnd.microsoft.icon">
<link rel="image_src" type="image/png" href="https://www.pangaea.de/assets/social-icons/pangaea-share.png">
<meta property="og:image" content="https://www.pangaea.de/assets/social-icons/pangaea-share.png">
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery/1.12.4/jquery.min.js"></script>
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery.matchHeight/0.7.0/jquery.matchHeight-min.js"></script>
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery.appear/0.4.1/jquery.appear.min.js"></script>
<script type="text/javascript" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/bootstrap-24col/js/bootstrap.min.js"></script>
<script type="text/javascript" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/js/datacombo-min.js"></script>
<title>Johansson, E et al. (2014): Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland</title>
<meta name="title" content="Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland" />
<meta name="author" content="Johansson, Emma; Berglund, Sten; Lindborg, Tobias; Petrone, Johannes; van As, Dirk; Gustafsson, Lars-Göran; Näslund, Jens-Ove; Laudon, Hjalmar" />
<meta name="date" content="2014-09-25" />
<meta name="description" content="Johansson, Emma; Berglund, Sten; Lindborg, Tobias; Petrone, Johannes; van As, Dirk; Gustafsson, Lars-Göran; Näslund, Jens-Ove; Laudon, Hjalmar (2014): Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland. PANGAEA, https://doi.org/10.1594/PANGAEA.836178, Supplement to: Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. Earth System Science Data, 7(1), 93-108, https://doi.org/10.5194/essd-7-93-2015" />
<meta name="geo.position" content="67.125940;-50.180370" />
<meta name="ICBM" content="67.125940, -50.180370" />
<!--BEGIN: Dublin Core description-->
<link rel="schema.DC" href="http://purl.org/dc/elements/1.1/" />
<link rel="schema.DCTERMS" href="http://purl.org/dc/terms/" />
<meta name="DC.title" content="Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland" />
<meta name="DC.creator" content="Johansson, Emma" />
<meta name="DC.creator" content="Berglund, Sten" />
<meta name="DC.creator" content="Lindborg, Tobias" />
<meta name="DC.creator" content="Petrone, Johannes" />
<meta name="DC.creator" content="van As, Dirk" />
<meta name="DC.creator" content="Gustafsson, Lars-Göran" />
<meta name="DC.creator" content="Näslund, Jens-Ove" />
<meta name="DC.creator" content="Laudon, Hjalmar" />
<meta name="DC.publisher" content="PANGAEA" />
<meta name="DC.source" content="Supplement to: Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. Earth System Science Data, 7(1), 93-108, https://doi.org/10.5194/essd-7-93-2015" />
<meta name="DC.date" content="2014-09-25" scheme="DCTERMS.W3CDTF" />
<meta name="DC.type" content="Dataset" />
<meta name="DC.language" content="en" scheme="DCTERMS.RFC3066" />
<meta name="DCTERMS.license" scheme="DCTERMS.URI" content="https://creativecommons.org/licenses/by/3.0/" />
<meta name="DC.identifier" content="https://doi.org/10.1594/PANGAEA.836178" scheme="DCTERMS.URI" />
<meta name="DC.format" content="application/zip, 5663.0 kBytes" />
<meta name="DC.relation" content="Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites (URI: http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg)" />
<meta name="DC.relation" content="Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB) (URI: http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip)" />
<!--END: Dublin Core description-->
<script type="text/javascript" src="//maps.googleapis.com/maps/api/js?v=3&amp;language=en&amp;key=AIzaSyDSiVjPS5YvanZsEH4RvK0gEr46Uo-1rCQ"></script>
<script type="text/javascript">/*<![CDATA[*/jQuery(function($) { return initializeSmallDatasetGMap(836178,'hash=c66693cbbf6c492b10be83d449b9f475',new google.maps.LatLngBounds(new google.maps.LatLng(67.12594,-50.18037),new google.maps.LatLng(67.12594,-50.18037)),undefined); });/*]]>*/</script>
<script type="text/javascript" src="//d1bxh8uas1mnw7.cloudfront.net/assets/embed.js"></script>
<link rel="cite-as" href="https://doi.org/10.1594/PANGAEA.836178">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=metadata_jsonld" type="application/ld+json">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=citation_ris" type="application/x-research-info-systems">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=citation_bibtex" type="application/x-bibtex">
<link rel="item" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip" type="application/zip">
<link rel="author" href="https://orcid.org/0000-0002-6553-8982">
<link rel="author" href="https://orcid.org/0000-0001-6058-1466">
<script type="application/ld+json">{"@context":"http://schema.org/","@id":"https://doi.org/10.1594/PANGAEA.836178","@type":"Dataset","identifier":"https://doi.org/10.1594/PANGAEA.836178","url":"https://doi.pangaea.de/10.1594/PANGAEA.836178","creator":[{"@type":"Person","familyName":"Johansson","givenName":"Emma","email":"emma.johansson@skb.se"},{"@type":"Person","familyName":"Berglund","givenName":"Sten"},{"@type":"Person","familyName":"Lindborg","givenName":"Tobias","email":"tobias.lindborg@skb.se"},{"@type":"Person","familyName":"Petrone","givenName":"Johannes","email":"johannes.petrone@skb.se"},{"@id":"https://orcid.org/0000-0002-6553-8982","@type":"Person","familyName":"van As","givenName":"Dirk","identifier":"https://orcid.org/0000-0002-6553-8982"},{"@type":"Person","familyName":"Gustafsson","givenName":"Lars-Göran"},{"@type":"Person","familyName":"Näslund","givenName":"Jens-Ove"},{"@id":"https://orcid.org/0000-0001-6058-1466","@type":"Person","familyName":"Laudon","givenName":"Hjalmar","identifier":"https://orcid.org/0000-0001-6058-1466"}],"name":"Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland","publisher":{"@type":"Organization","name":"PANGAEA","disambiguatingDescription":"Data Publisher for Earth & Environmental Science","url":"https://www.pangaea.de/"},"includedInDataCatalog":{"@type":"DataCatalog","name":"PANGAEA","disambiguatingDescription":"Data Publisher for Earth & Environmental Science","url":"https://www.pangaea.de/"},"datePublished":"2014-09-25","citation":[{"@id":"https://doi.org/10.5194/essd-7-93-2015","@type":"PublicationIssue","identifier":"https://doi.org/10.5194/essd-7-93-2015","url":"https://doi.org/10.5194/essd-7-93-2015","creator":[{"@type":"Person","familyName":"Johansson","givenName":"Emma","email":"emma.johansson@skb.se"},{"@type":"Person","familyName":"Berglund","givenName":"Sten"},{"@type":"Person","familyName":"Lindborg","givenName":"Tobias","email":"tobias.lindborg@skb.se"},{"@type":"Person","familyName":"Petrone","givenName":"Johannes","email":"johannes.petrone@skb.se"},{"@id":"https://orcid.org/0000-0002-6553-8982","@type":"Person","familyName":"van As","givenName":"Dirk","identifier":"https://orcid.org/0000-0002-6553-8982"},{"@type":"Person","familyName":"Gustafsson","givenName":"Lars-Göran"},{"@type":"Person","familyName":"Näslund","givenName":"Jens-Ove"},{"@id":"https://orcid.org/0000-0001-6058-1466","@type":"Person","familyName":"Laudon","givenName":"Hjalmar","identifier":"https://orcid.org/0000-0001-6058-1466"}],"name":"Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set","datePublished":"2015","issueNumber":"7(1)","pagination":"93-108","isPartOf":{"@type":"CreativeWorkSeries","name":"Earth System Science Data"}},{"@id":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","@type":"WebPage","identifier":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","url":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","name":"Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites"},{"@id":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","@type":"WebPage","identifier":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","url":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","name":"Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB)"}],"description":"Few hydrological studies have been made in Greenland, other than on glacial hydrology associated with the ice sheet. Understanding permafrost hydrology and hydroclimatic change and variability, however, provides key information for understanding climate change effects and feedbacks in the Arctic landscape. This paper presents a new extensive and detailed hydrological and meteorological open access dataset, with high temporal resolution from a 1.56 km**2 permafrost catchment with a lake underlain by a through talik close to the ice sheet in the Kangerlussuaq region, western Greenland. The paper describes the hydrological site investigations and utilized equipment, as well as the data collection and processing. The investigations were performed between 2010 and 2013. The high spatial resolution, within the investigated area, of the dataset makes it highly suitable for various detailed hydrological and ecological studies on catchment scale.","spatialCoverage":{"@type":"Place","geo":{"@type":"GeoCoordinates","latitude":67.12594,"longitude":-50.18037}},"inLanguage":"en","license":"https://creativecommons.org/licenses/by/3.0/","distribution":{"@type":"DataDownload","fileFormat":"application/zip","contentUrl":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip"}}</script>
<script type="text/javascript">/*<![CDATA[*/
(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
ga('create', 'UA-30624150-1', 'pangaea.de');
ga('set', 'anonymizeIp', true);
ga('send', 'pageview');
/*]]>*/</script>
</head>
<body class="homepage-layout">
<div id="header-wrapper">
  <div class="container-fluid">
    <header class="row"><!-- volle Screen-Breite -->
      <div class="content-wrapper"><!-- max. Breite -->
        <div id="login-area-wrapper" class="hidden-print"><div id="login-area"><span id="user-name">Not logged in</span><a id="signup-button" class="glyphicon glyphicon-plus-sign self-referer-link" title="Sign Up / Create Account" aria-label="Sign up" target="_self" rel="nofollow" href="https://www.pangaea.de/user/signup.php?referer=https%3A%2F%2Fwww.pangaea.de%2F" data-template="https://www.pangaea.de/user/signup.php?referer=#u#"></a><a id="login-button" class="glyphicon glyphicon-log-in self-referer-link" title="Log In" aria-label="Log in" target="_self" rel="nofollow" href="https://www.pangaea.de/user/login.php?referer=https%3A%2F%2Fwww.pangaea.de%2F" data-template="https://www.pangaea.de/user/login.php?referer=#u#"></a></div></div>
        <div class="blindspalte header-block col-lg-3 col-md-4"></div>
        
        <div id="header-logo-block" class="header-block col-lg-3 col-md-4 col-sm-4 col-xs-8">
          <div id="pangaea-logo">
            <a title="PANGAEA home" href="//www.pangaea.de/" class="home-link"><img src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/layout-images/pangaea-logo.png" alt="PANGAEA home"></a>
          </div>
        </div>
        
        <div id="header-mid-block" class="header-block col-lg-12 col-md-9 col-sm-20 col-xs-16">
          <div id="pangaea-logo-headline">
            PANGAEA<span class="punkt">.</span>
          </div>
          <div id="pangaea-logo-slogan">
            <span>Data Publisher for Earth &amp; </span><span class="nowrap">Environmental Science</span>
          </div>
          <div id="search-area-header" class="row"></div>
        </div>
        
        <div id="header-main-menu-block" class="header-block hidden-print col-lg-6 col-md-7 col-sm-24 col-xs-24">
          <nav id="main-nav">
            <ul>
              <li id="menu-search">
                <!-- class on link is important, don't change!!! -->
                <a href="//www.pangaea.de/" class="home-link">Search</a>
              </li>
              <li id="menu-submit">
                <a href="//www.pangaea.de/submit/">Submit</a>
              </li>
              <li id="menu-about">
                <a href="//www.pangaea.de/about/">About</a>
              </li>
              <li id="menu-contact">
                <a href="//www.pangaea.de/contact/">Contact</a>
              </li>
            </ul>
          </nav>
          <div class="clearfix"></div>
        </div>
      </div>
    </header>
  </div>
</div>
<div id="flex-wrapper">
<div id="main-container" class="container-fluid">
<div id="main-row" class="row main-row">
<div id="main" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
<div id="dataset">
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24 hidden-xs hidden-sm"><div class="title citation invisible-top-border">Citation:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr top-border"><div id="gmap-dataset-wrapper" class="gmap-wrapper hidden-print hidden-xs hidden-sm col-lg-8 col-md-8 col-sm-24 col-xs-24"><div class="embed-responsive embed-responsive-4by3"><div id="gmap-dataset" class="embed-responsive-item"></div>
</div>
</div>
<h1 class="hanging citation"><strong><a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Johansson, Emma&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Johansson, Emma'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Johansson, Emma'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Aemma.johansson%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:emma.johansson@skb.se&quot;&gt;emma.johansson@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Johansson, Emma</a>; Berglund, Sten; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Lindborg, Tobias&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Lindborg, Tobias'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Lindborg, Tobias'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Atobias.lindborg%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:tobias.lindborg@skb.se&quot;&gt;tobias.lindborg@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Lindborg, Tobias</a>; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Petrone, Johannes&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Petrone, Johannes'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Petrone, Johannes'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Ajohannes.petrone%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:johannes.petrone@skb.se&quot;&gt;johannes.petrone@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Petrone, Johannes</a>; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;van As, Dirk&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'van As, Dirk'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'van As, Dirk'&quot; href=&quot;//www.pangaea.de/?q=author%3Aorcid%3A0000-0002-6553-8982&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;orcid-link text-nowrap wide-icon-link&quot; target=&quot;_blank&quot; href=&quot;https://orcid.org/0000-0002-6553-8982&quot;&gt;https://orcid.org/0000-0002-6553-8982&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">van As, Dirk</a>; Gustafsson, Lars-Göran; Näslund, Jens-Ove; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Laudon, Hjalmar&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Laudon, Hjalmar'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Laudon, Hjalmar'&quot; href=&quot;//www.pangaea.de/?q=author%3Aorcid%3A0000-0001-6058-1466&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;orcid-link text-nowrap wide-icon-link&quot; target=&quot;_blank&quot; href=&quot;https://orcid.org/0000-0001-6058-1466&quot;&gt;https://orcid.org/0000-0001-6058-1466&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Laudon, Hjalmar</a> (2014):</strong> Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland. <em>PANGAEA</em>, <a rel="nofollow bookmark" href="https://doi.org/10.1594/PANGAEA.836178" data-title="&lt;span&gt;Persistent DOI Name&lt;/span&gt;" data-content="&lt;div class=&quot;link-description&quot;&gt;&lt;p&gt;A &lt;a href=&quot;https://doi.org/&quot; class=&quot;doi-link&quot; target=&quot;_blank&quot;&gt;DOI name&lt;/a&gt; shall be used to cite and link PANGAEA datasets.&lt;/p&gt;&#10;&lt;p&gt;A &lt;b&gt;DOI name&lt;/b&gt; is guaranteed to never change, so you can use it to link permanently to datasets or documents. &lt;b&gt;If you want to cite this dataset, use the full citation and add this link as a persistent reference.&lt;/b&gt;&lt;/p&gt;&#10;&lt;div&gt;You may use your browser's &lt;code&gt;copy link location&lt;/code&gt; functionality to retrieve the link! You can also download the citation in several formats on this page.&lt;/div&gt;&#10;&lt;/div&gt;&#10;" class="text-linkwrap popover-link doi-link">https://doi.org/10.1594/PANGAEA.836178</a>,<hr class="spacer" aria-hidden="true" />
<em>Supplement to:</em> Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. <em>Earth System Science Data</em>, <strong>7(1)</strong>, 93-108, <a class="text-linkwrap doi-link" href="https://doi.org/10.5194/essd-7-93-2015" target="_blank">https://doi.org/10.5194/essd-7-93-2015</a></h1>
<p class="howtocite"><small><span class="glyphicon glyphicon-bullhorn"></span> <strong>Always quote above citation when using data!</strong> You can download the citation in several formats below.</small></p>
<p class="data-buttons"><a rel="nofollow describedby" title="Export citation to Reference Manager, EndNote, ProCite" href="?format=citation_ris" class="actionbuttonlink"><span class="actionbutton">RIS Citation</span></a><a rel="nofollow describedby" title="Export citation to BibTeX" href="?format=citation_bibtex" class="actionbuttonlink"><span class="actionbutton"><span style="font-variant:small-caps;">BibTeX</span> Citation</span></a><a rel="nofollow" title="Export citation as plain text" href="?format=citation_text" target="_blank" class="actionbuttonlink share-link"><span class="actionbutton">Text Citation</span></a><span class="separator"></span><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://www.facebook.com/sharer.php?u=#u#&amp;t=#t#" title="Share dataset on Facebook" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Facebook</span></a><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://twitter.com/intent/tweet?url=#u#&amp;text=#t#" title="Share dataset on Twitter" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Twitter</span></a><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://plus.google.com/share?url=#u#&amp;hl=en" title="Share dataset on Google+" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Google+</span></a><span class="separator"></span><a rel="nofollow" target="_blank" title="Display events in map" href="//www.pangaea.de/advanced/gmap-dataset.php?id=836178&amp;viewportBBOX=-50.18037,67.12594,-50.18037,67.12594" class="actionbuttonlink"><span class="actionbutton">Show Map</span></a><a rel="nofollow" title="Display events in Google Earth" href="?format=events_kml" class="actionbuttonlink"><span class="actionbutton">Google Earth</span></a><span class="separator"></span><span data-badge-type="1" data-doi="10.1594/PANGAEA.836178" data-badge-popover="right" data-hide-no-mentions="true" class="altmetric-embed"></span></p>
<div class="clearfix"></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Abstract:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="abstract">Few hydrological studies have been made in Greenland, other than on glacial hydrology associated with the ice sheet. Understanding permafrost hydrology and hydroclimatic change and variability, however, provides key information for understanding climate change effects and feedbacks in the Arctic landscape. This paper presents a new extensive and detailed hydrological and meteorological open access dataset, with high temporal resolution from a 1.56 km**2 permafrost catchment with a lake underlain by a through talik close to the ice sheet in the Kangerlussuaq region, western Greenland. The paper describes the hydrological site investigations and utilized equipment, as well as the data collection and processing. The investigations were performed between 2010 and 2013. The high spatial resolution, within the investigated area, of the dataset makes it highly suitable for various detailed hydrological and ecological studies on catchment scale.</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Further details:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><a target="_self" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg">Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites</a><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to this publication..." aria-label="Search PANGAEA for other datasets related to this publication" href="//www.pangaea.de/?q=%40ref65477"></a></div>
<div class="hanging"><a target="_self" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip">Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB)</a><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to this publication..." aria-label="Search PANGAEA for other datasets related to this publication" href="//www.pangaea.de/?q=%40ref65408"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Project(s):</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><strong><a target="_blank" href="https://www.researchgate.net/project/GReenland-Analogue-Surface-Project-GRASP">GReenland Analogue Surface Project</a></strong> (GRASP)<a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'GReenland Analogue Surface Project'..." aria-label="Search PANGAEA for other datasets related to 'GReenland Analogue Surface Project'" href="//www.pangaea.de/?q=project%3Alabel%3AGRASP"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Coverage:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging geo"><em class="unfarbe">Latitude: </em><span class="latitude">67.125940</span><em class="unfarbe"> * Longitude: </em><span class="longitude">-50.180370</span></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Event(s):</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging geo"><strong>TBL</strong><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'TBL'..." aria-label="Search PANGAEA for other datasets related to 'TBL'" href="//www.pangaea.de/?q=event%3Alabel%3ATBL"></a><em class="unfarbe"> * Latitude: </em><span class="latitude">67.125940</span><em class="unfarbe"> * Longitude: </em><span class="longitude">-50.180370</span><em class="unfarbe"> * Location: </em><span>Two Boat Lake, Kangerlussuaq, Greenland</span><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'Two Boat Lake, Kangerlussuaq, Greenland'..." aria-label="Search PANGAEA for other datasets related to 'Two Boat Lake, Kangerlussuaq, Greenland'" href="//www.pangaea.de/?q=location%3A%22Two+Boat+Lake%2C+Kangerlussuaq%2C+Greenland%22"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Comment:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="abstract">The dataset contains hydrological and meteorological data from a lake catchment in the Kangerlussuaq region, Western Greenland. The investigations were performed during 2010-2013 and the following parameters are included: Soil moisture, Soil temperature, Hydraulic properties of the active layer, meteorological parameters from a local weather station within the catchment, water levels and discharge, sublimation and evaportation measurments, snow depth and snow water content data and time lapse photos.</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">License:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><a href="https://creativecommons.org/licenses/by/3.0/" rel="license" target="_blank"><img src="//www.pangaea.de/shared/pics/licenses/CC-BY-3.0.png" style="vertical-align:baseline; border-width:0;" alt="CC-BY-3.0" /> Creative Commons Attribution 3.0 Unported</a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Size:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging">5663.0 kBytes</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-21 col-md-20 col-sm-24 col-xs-24 col-lg-offset-3 col-md-offset-4"><div class="text-block top-border">
<h2 id="download">Download Data</h2>
<p><a href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip" target="_self">Download dataset</a></p>
</div></div></div><div id="recommendations"></div>
</div>
</div>
</div>
</div>
</div>
<div id="footer-wrapper" class="top-border hidden-print">
  <div class="container-fluid">
    <footer class="row"><!-- volle Screen-Breite -->
      <div class="content-wrapper"><!-- max. Breite -->
        <div class="blindspalte col-lg-3 col-md-4 col-sm-4 col-xs-4"></div>
        <div id="footer-hosted-by-area" class="col-lg-18 col-md-9 col-sm-24 col-xs-24">
          <!--<div class="col-lg-24 col-md-24 col-sm-24 col-xs-24">-->
          <div class="col-lg-12 col-md-24 col-sm-24 col-xs-24">
            <div class="headline underlined">
              PANGAEA is hosted by
            </div>
            
            <div>
              <p>
                Alfred Wegener Institute, Helmholtz Center for Polar and Marine Research (AWI)<br/>
                Center for Marine Environmental Sciences, University of Bremen (MARUM)
              </p>
            </div>

            <div class="headline underlined">
              The System is supported by
            </div>
            
            <div>
              <p>
                The European Commission, Research<br/>
                Federal Ministry of Education and Research (BMBF)<br/>
                Deutsche Forschungsgemeinschaft (DFG)<br/>
                International Ocean Discovery Program (IODP)
              </p>
            </div>
          </div>

          <div class="col-lg-12 col-md-24 col-sm-24 col-xs-24">
            <div class="headline underlined">
              PANGAEA is member of
            </div>
            
            <div>
              <a href="//www.icsu-wds.org/" target="_blank" title="ICSU World Data System">
                <img class="col-lg-6 col-md-6 col-sm-6 col-xs-6" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/logos/logo-wds-block.png" alt="ICSU World Data System">
              </a>
              <a href="//www.wmo.int/" target="_blank" title="World Meteorological Organization">
                <img class="col-lg-6 col-md-6 col-sm-6 col-xs-6" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/logos/logo-wmo-block.png" alt="World Meteorological Organization">
              </a>
            </div>
          </div>
        </div>
        <div id="footer-social-area" class="col-lg-3 col-md-24 col-sm-24 col-xs-24">
          <div id="footer-social-area-wrapper" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
            <div class="blindspalte col-lg-0 col-md-4"></div>
            <div class="col-lg-24 col-md-5 col-md-5 col-xs-10">
              <div class="underlined">Share on...</div>
              <div class="social-icons">
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://www.facebook.com/sharer.php?u=#u#&amp;t=#t#" title="Share on Facebook" target="_blank">
                  <img id="facebook-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/facebook-icon.png" alt="Facebook Icon">
                </a>
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://twitter.com/intent/tweet?url=#u#&amp;text=#t#" title="Share on Twitter" target="_blank">
                  <img id="twitter-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/twitter-icon.png" alt="Twitter Icon">
                </a>
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://plus.google.com/share?url=#u#&amp;hl=en" title="Share on Google+" target="_blank">
                  <img id="gplus-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/gplus-icon.png" alt="Google+ Icon">
                </a>
              </div>
            </div>
            <div class="blindspalte colo-lg-0 col-md-18"></div>
          </div>
        </div>
                
        <div id="footer-menu-area" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
          <div class="blindspalte col-lg-3 col-md-4 col-sm-4 col-xs-4"></div>
          <div id="footer-menu-wrapper" class="col-lg-21 col-md-20 col-sm-24 col-xs-24">
            <nav id="footer-nav">
              <ul>
                <li id="about-legal-notice">
                  <a href="//www.pangaea.de/about/legal.php">Legal notice</a>
                </li>
                <li id="about-privacy-policy">
                  <a href="//www.pangaea.de/about/privacypolicy.php">Privacy policy</a>
                </li>
                <li id="about-cookies">
                  <a href="//www.pangaea.de/about/cookies.php">Cookies</a>
                </li>
                <li id="about-contact">
                  <a href="//www.pangaea.de/contact/">Contact</a>
                </li>
              </ul>
            </nav>
            <div class="clearfix"></div>
          </div>
        </div>
      </div>
    </footer>
  </div>
</div>
</body>
</html>
 + http_version: + recorded_at: Thu, 29 Nov 2018 12:17:36 GMT +- request: + method: get + uri: https://doi.pangaea.de/10.1594/PANGAEA.836178 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Server: + - PANGAEA/1.0 + Date: + - Thu, 29 Nov 2018 12:17:36 GMT + Vary: + - Accept + Link: + - ;rel="cite-as", ;rel="describedby";type="application/ld+json", + ;rel="describedby";type="application/x-research-info-systems", + ;rel="describedby";type="application/x-bibtex", + ;rel="item";type="application/zip", + ;rel="author", ;rel="author" + Content-Type: + - text/html;charset=UTF-8 + X-Ua-Compatible: + - IE=Edge + X-Content-Type-Options: + - nosniff + Strict-Transport-Security: + - max-age=31536000 + body: + encoding: ASCII-8BIT + string: !binary |- + <!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1, minimum-scale=1, maximum-scale=1, user-scalable=no">
<link rel="stylesheet" href="//fonts.googleapis.com/css?family=Open+Sans:400,600,400italic,700,700italic,600italic,300,300italic,800,800italic">
<link rel="stylesheet" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/bootstrap-24col/css/bootstrap.min.css">
<link rel="stylesheet" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/css/pangaea.css">
<!--[if lte IE 9]>
<style>#topics-pulldown-wrapper label:after { display:none; }</style>
<![endif]-->
<link rel="shortcut icon" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/favicon.ico">
<link rel="icon" href="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/favicon.ico" type="image/vnd.microsoft.icon">
<link rel="image_src" type="image/png" href="https://www.pangaea.de/assets/social-icons/pangaea-share.png">
<meta property="og:image" content="https://www.pangaea.de/assets/social-icons/pangaea-share.png">
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery/1.12.4/jquery.min.js"></script>
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery.matchHeight/0.7.0/jquery.matchHeight-min.js"></script>
<script type="text/javascript" src="//cdnjs.cloudflare.com/ajax/libs/jquery.appear/0.4.1/jquery.appear.min.js"></script>
<script type="text/javascript" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/bootstrap-24col/js/bootstrap.min.js"></script>
<script type="text/javascript" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/js/datacombo-min.js"></script>
<title>Johansson, E et al. (2014): Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland</title>
<meta name="title" content="Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland" />
<meta name="author" content="Johansson, Emma; Berglund, Sten; Lindborg, Tobias; Petrone, Johannes; van As, Dirk; Gustafsson, Lars-Göran; Näslund, Jens-Ove; Laudon, Hjalmar" />
<meta name="date" content="2014-09-25" />
<meta name="description" content="Johansson, Emma; Berglund, Sten; Lindborg, Tobias; Petrone, Johannes; van As, Dirk; Gustafsson, Lars-Göran; Näslund, Jens-Ove; Laudon, Hjalmar (2014): Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland. PANGAEA, https://doi.org/10.1594/PANGAEA.836178, Supplement to: Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. Earth System Science Data, 7(1), 93-108, https://doi.org/10.5194/essd-7-93-2015" />
<meta name="geo.position" content="67.125940;-50.180370" />
<meta name="ICBM" content="67.125940, -50.180370" />
<!--BEGIN: Dublin Core description-->
<link rel="schema.DC" href="http://purl.org/dc/elements/1.1/" />
<link rel="schema.DCTERMS" href="http://purl.org/dc/terms/" />
<meta name="DC.title" content="Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland" />
<meta name="DC.creator" content="Johansson, Emma" />
<meta name="DC.creator" content="Berglund, Sten" />
<meta name="DC.creator" content="Lindborg, Tobias" />
<meta name="DC.creator" content="Petrone, Johannes" />
<meta name="DC.creator" content="van As, Dirk" />
<meta name="DC.creator" content="Gustafsson, Lars-Göran" />
<meta name="DC.creator" content="Näslund, Jens-Ove" />
<meta name="DC.creator" content="Laudon, Hjalmar" />
<meta name="DC.publisher" content="PANGAEA" />
<meta name="DC.source" content="Supplement to: Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. Earth System Science Data, 7(1), 93-108, https://doi.org/10.5194/essd-7-93-2015" />
<meta name="DC.date" content="2014-09-25" scheme="DCTERMS.W3CDTF" />
<meta name="DC.type" content="Dataset" />
<meta name="DC.language" content="en" scheme="DCTERMS.RFC3066" />
<meta name="DCTERMS.license" scheme="DCTERMS.URI" content="https://creativecommons.org/licenses/by/3.0/" />
<meta name="DC.identifier" content="https://doi.org/10.1594/PANGAEA.836178" scheme="DCTERMS.URI" />
<meta name="DC.format" content="application/zip, 5663.0 kBytes" />
<meta name="DC.relation" content="Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites (URI: http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg)" />
<meta name="DC.relation" content="Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB) (URI: http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip)" />
<!--END: Dublin Core description-->
<script type="text/javascript" src="//maps.googleapis.com/maps/api/js?v=3&amp;language=en&amp;key=AIzaSyDSiVjPS5YvanZsEH4RvK0gEr46Uo-1rCQ"></script>
<script type="text/javascript">/*<![CDATA[*/jQuery(function($) { return initializeSmallDatasetGMap(836178,'hash=c66693cbbf6c492b10be83d449b9f475',new google.maps.LatLngBounds(new google.maps.LatLng(67.12594,-50.18037),new google.maps.LatLng(67.12594,-50.18037)),undefined); });/*]]>*/</script>
<script type="text/javascript" src="//d1bxh8uas1mnw7.cloudfront.net/assets/embed.js"></script>
<link rel="cite-as" href="https://doi.org/10.1594/PANGAEA.836178">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=metadata_jsonld" type="application/ld+json">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=citation_ris" type="application/x-research-info-systems">
<link rel="describedby" href="https://doi.pangaea.de/10.1594/PANGAEA.836178?format=citation_bibtex" type="application/x-bibtex">
<link rel="item" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip" type="application/zip">
<link rel="author" href="https://orcid.org/0000-0002-6553-8982">
<link rel="author" href="https://orcid.org/0000-0001-6058-1466">
<script type="application/ld+json">{"@context":"http://schema.org/","@id":"https://doi.org/10.1594/PANGAEA.836178","@type":"Dataset","identifier":"https://doi.org/10.1594/PANGAEA.836178","url":"https://doi.pangaea.de/10.1594/PANGAEA.836178","creator":[{"@type":"Person","familyName":"Johansson","givenName":"Emma","email":"emma.johansson@skb.se"},{"@type":"Person","familyName":"Berglund","givenName":"Sten"},{"@type":"Person","familyName":"Lindborg","givenName":"Tobias","email":"tobias.lindborg@skb.se"},{"@type":"Person","familyName":"Petrone","givenName":"Johannes","email":"johannes.petrone@skb.se"},{"@id":"https://orcid.org/0000-0002-6553-8982","@type":"Person","familyName":"van As","givenName":"Dirk","identifier":"https://orcid.org/0000-0002-6553-8982"},{"@type":"Person","familyName":"Gustafsson","givenName":"Lars-Göran"},{"@type":"Person","familyName":"Näslund","givenName":"Jens-Ove"},{"@id":"https://orcid.org/0000-0001-6058-1466","@type":"Person","familyName":"Laudon","givenName":"Hjalmar","identifier":"https://orcid.org/0000-0001-6058-1466"}],"name":"Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland","publisher":{"@type":"Organization","name":"PANGAEA","disambiguatingDescription":"Data Publisher for Earth & Environmental Science","url":"https://www.pangaea.de/"},"includedInDataCatalog":{"@type":"DataCatalog","name":"PANGAEA","disambiguatingDescription":"Data Publisher for Earth & Environmental Science","url":"https://www.pangaea.de/"},"datePublished":"2014-09-25","citation":[{"@id":"https://doi.org/10.5194/essd-7-93-2015","@type":"PublicationIssue","identifier":"https://doi.org/10.5194/essd-7-93-2015","url":"https://doi.org/10.5194/essd-7-93-2015","creator":[{"@type":"Person","familyName":"Johansson","givenName":"Emma","email":"emma.johansson@skb.se"},{"@type":"Person","familyName":"Berglund","givenName":"Sten"},{"@type":"Person","familyName":"Lindborg","givenName":"Tobias","email":"tobias.lindborg@skb.se"},{"@type":"Person","familyName":"Petrone","givenName":"Johannes","email":"johannes.petrone@skb.se"},{"@id":"https://orcid.org/0000-0002-6553-8982","@type":"Person","familyName":"van As","givenName":"Dirk","identifier":"https://orcid.org/0000-0002-6553-8982"},{"@type":"Person","familyName":"Gustafsson","givenName":"Lars-Göran"},{"@type":"Person","familyName":"Näslund","givenName":"Jens-Ove"},{"@id":"https://orcid.org/0000-0001-6058-1466","@type":"Person","familyName":"Laudon","givenName":"Hjalmar","identifier":"https://orcid.org/0000-0001-6058-1466"}],"name":"Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set","datePublished":"2015","issueNumber":"7(1)","pagination":"93-108","isPartOf":{"@type":"CreativeWorkSeries","name":"Earth System Science Data"}},{"@id":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","@type":"WebPage","identifier":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","url":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg","name":"Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites"},{"@id":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","@type":"WebPage","identifier":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","url":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip","name":"Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB)"}],"description":"Few hydrological studies have been made in Greenland, other than on glacial hydrology associated with the ice sheet. Understanding permafrost hydrology and hydroclimatic change and variability, however, provides key information for understanding climate change effects and feedbacks in the Arctic landscape. This paper presents a new extensive and detailed hydrological and meteorological open access dataset, with high temporal resolution from a 1.56 km**2 permafrost catchment with a lake underlain by a through talik close to the ice sheet in the Kangerlussuaq region, western Greenland. The paper describes the hydrological site investigations and utilized equipment, as well as the data collection and processing. The investigations were performed between 2010 and 2013. The high spatial resolution, within the investigated area, of the dataset makes it highly suitable for various detailed hydrological and ecological studies on catchment scale.","spatialCoverage":{"@type":"Place","geo":{"@type":"GeoCoordinates","latitude":67.12594,"longitude":-50.18037}},"inLanguage":"en","license":"https://creativecommons.org/licenses/by/3.0/","distribution":{"@type":"DataDownload","fileFormat":"application/zip","contentUrl":"http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip"}}</script>
<script type="text/javascript">/*<![CDATA[*/
(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
ga('create', 'UA-30624150-1', 'pangaea.de');
ga('set', 'anonymizeIp', true);
ga('send', 'pageview');
/*]]>*/</script>
</head>
<body class="homepage-layout">
<div id="header-wrapper">
  <div class="container-fluid">
    <header class="row"><!-- volle Screen-Breite -->
      <div class="content-wrapper"><!-- max. Breite -->
        <div id="login-area-wrapper" class="hidden-print"><div id="login-area"><span id="user-name">Not logged in</span><a id="signup-button" class="glyphicon glyphicon-plus-sign self-referer-link" title="Sign Up / Create Account" aria-label="Sign up" target="_self" rel="nofollow" href="https://www.pangaea.de/user/signup.php?referer=https%3A%2F%2Fwww.pangaea.de%2F" data-template="https://www.pangaea.de/user/signup.php?referer=#u#"></a><a id="login-button" class="glyphicon glyphicon-log-in self-referer-link" title="Log In" aria-label="Log in" target="_self" rel="nofollow" href="https://www.pangaea.de/user/login.php?referer=https%3A%2F%2Fwww.pangaea.de%2F" data-template="https://www.pangaea.de/user/login.php?referer=#u#"></a></div></div>
        <div class="blindspalte header-block col-lg-3 col-md-4"></div>
        
        <div id="header-logo-block" class="header-block col-lg-3 col-md-4 col-sm-4 col-xs-8">
          <div id="pangaea-logo">
            <a title="PANGAEA home" href="//www.pangaea.de/" class="home-link"><img src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/layout-images/pangaea-logo.png" alt="PANGAEA home"></a>
          </div>
        </div>
        
        <div id="header-mid-block" class="header-block col-lg-12 col-md-9 col-sm-20 col-xs-16">
          <div id="pangaea-logo-headline">
            PANGAEA<span class="punkt">.</span>
          </div>
          <div id="pangaea-logo-slogan">
            <span>Data Publisher for Earth &amp; </span><span class="nowrap">Environmental Science</span>
          </div>
          <div id="search-area-header" class="row"></div>
        </div>
        
        <div id="header-main-menu-block" class="header-block hidden-print col-lg-6 col-md-7 col-sm-24 col-xs-24">
          <nav id="main-nav">
            <ul>
              <li id="menu-search">
                <!-- class on link is important, don't change!!! -->
                <a href="//www.pangaea.de/" class="home-link">Search</a>
              </li>
              <li id="menu-submit">
                <a href="//www.pangaea.de/submit/">Submit</a>
              </li>
              <li id="menu-about">
                <a href="//www.pangaea.de/about/">About</a>
              </li>
              <li id="menu-contact">
                <a href="//www.pangaea.de/contact/">Contact</a>
              </li>
            </ul>
          </nav>
          <div class="clearfix"></div>
        </div>
      </div>
    </header>
  </div>
</div>
<div id="flex-wrapper">
<div id="main-container" class="container-fluid">
<div id="main-row" class="row main-row">
<div id="main" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
<div id="dataset">
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24 hidden-xs hidden-sm"><div class="title citation invisible-top-border">Citation:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr top-border"><div id="gmap-dataset-wrapper" class="gmap-wrapper hidden-print hidden-xs hidden-sm col-lg-8 col-md-8 col-sm-24 col-xs-24"><div class="embed-responsive embed-responsive-4by3"><div id="gmap-dataset" class="embed-responsive-item"></div>
</div>
</div>
<h1 class="hanging citation"><strong><a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Johansson, Emma&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Johansson, Emma'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Johansson, Emma'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Aemma.johansson%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:emma.johansson@skb.se&quot;&gt;emma.johansson@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Johansson, Emma</a>; Berglund, Sten; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Lindborg, Tobias&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Lindborg, Tobias'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Lindborg, Tobias'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Atobias.lindborg%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:tobias.lindborg@skb.se&quot;&gt;tobias.lindborg@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Lindborg, Tobias</a>; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Petrone, Johannes&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Petrone, Johannes'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Petrone, Johannes'&quot; href=&quot;//www.pangaea.de/?q=author%3Aemail%3Ajohannes.petrone%40skb.se&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;mail-link text-nowrap wide-icon-link&quot; href=&quot;mailto:johannes.petrone@skb.se&quot;&gt;johannes.petrone@skb.se&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Petrone, Johannes</a>; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;van As, Dirk&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'van As, Dirk'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'van As, Dirk'&quot; href=&quot;//www.pangaea.de/?q=author%3Aorcid%3A0000-0002-6553-8982&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;orcid-link text-nowrap wide-icon-link&quot; target=&quot;_blank&quot; href=&quot;https://orcid.org/0000-0002-6553-8982&quot;&gt;https://orcid.org/0000-0002-6553-8982&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">van As, Dirk</a>; Gustafsson, Lars-Göran; Näslund, Jens-Ove; <a class="popover-link link-unstyled" href="#" data-title="&lt;span&gt;Laudon, Hjalmar&lt;a class=&quot;searchlink glyphicon glyphicon-search&quot; target=&quot;_blank&quot; rel=&quot;nofollow&quot; title=&quot;Search PANGAEA for other datasets related to 'Laudon, Hjalmar'...&quot; aria-label=&quot;Search PANGAEA for other datasets related to 'Laudon, Hjalmar'&quot; href=&quot;//www.pangaea.de/?q=author%3Aorcid%3A0000-0001-6058-1466&quot;&gt;&lt;/a&gt;&lt;/span&gt;" data-content="&lt;div&gt;&lt;div&gt;&lt;a class=&quot;orcid-link text-nowrap wide-icon-link&quot; target=&quot;_blank&quot; href=&quot;https://orcid.org/0000-0001-6058-1466&quot;&gt;https://orcid.org/0000-0001-6058-1466&lt;/a&gt;&lt;/div&gt;&#10;&lt;/div&gt;&#10;">Laudon, Hjalmar</a> (2014):</strong> Hydrological and meteorological investigations in a lake near Kangerlussuaq, west Greenland. <em>PANGAEA</em>, <a rel="nofollow bookmark" href="https://doi.org/10.1594/PANGAEA.836178" data-title="&lt;span&gt;Persistent DOI Name&lt;/span&gt;" data-content="&lt;div class=&quot;link-description&quot;&gt;&lt;p&gt;A &lt;a href=&quot;https://doi.org/&quot; class=&quot;doi-link&quot; target=&quot;_blank&quot;&gt;DOI name&lt;/a&gt; shall be used to cite and link PANGAEA datasets.&lt;/p&gt;&#10;&lt;p&gt;A &lt;b&gt;DOI name&lt;/b&gt; is guaranteed to never change, so you can use it to link permanently to datasets or documents. &lt;b&gt;If you want to cite this dataset, use the full citation and add this link as a persistent reference.&lt;/b&gt;&lt;/p&gt;&#10;&lt;div&gt;You may use your browser's &lt;code&gt;copy link location&lt;/code&gt; functionality to retrieve the link! You can also download the citation in several formats on this page.&lt;/div&gt;&#10;&lt;/div&gt;&#10;" class="text-linkwrap popover-link doi-link">https://doi.org/10.1594/PANGAEA.836178</a>,<hr class="spacer" aria-hidden="true" />
<em>Supplement to:</em> Johansson, E et al. (2015): Hydrological and meteorological investigations in a periglacial lake catchment near Kangerlussuaq, west Greenland – presentation of a new multi-parameter data set. <em>Earth System Science Data</em>, <strong>7(1)</strong>, 93-108, <a class="text-linkwrap doi-link" href="https://doi.org/10.5194/essd-7-93-2015" target="_blank">https://doi.org/10.5194/essd-7-93-2015</a></h1>
<p class="howtocite"><small><span class="glyphicon glyphicon-bullhorn"></span> <strong>Always quote above citation when using data!</strong> You can download the citation in several formats below.</small></p>
<p class="data-buttons"><a rel="nofollow describedby" title="Export citation to Reference Manager, EndNote, ProCite" href="?format=citation_ris" class="actionbuttonlink"><span class="actionbutton">RIS Citation</span></a><a rel="nofollow describedby" title="Export citation to BibTeX" href="?format=citation_bibtex" class="actionbuttonlink"><span class="actionbutton"><span style="font-variant:small-caps;">BibTeX</span> Citation</span></a><a rel="nofollow" title="Export citation as plain text" href="?format=citation_text" target="_blank" class="actionbuttonlink share-link"><span class="actionbutton">Text Citation</span></a><span class="separator"></span><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://www.facebook.com/sharer.php?u=#u#&amp;t=#t#" title="Share dataset on Facebook" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Facebook</span></a><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://twitter.com/intent/tweet?url=#u#&amp;text=#t#" title="Share dataset on Twitter" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Twitter</span></a><a rel="nofollow" class="self-referer-link share-link actionbuttonlink" href="//www.pangaea.de/nojs.php" data-template="https://plus.google.com/share?url=#u#&amp;hl=en" title="Share dataset on Google+" target="_blank"><span class="actionbutton"><span class="glyphicon glyphicon-share"></span> Google+</span></a><span class="separator"></span><a rel="nofollow" target="_blank" title="Display events in map" href="//www.pangaea.de/advanced/gmap-dataset.php?id=836178&amp;viewportBBOX=-50.18037,67.12594,-50.18037,67.12594" class="actionbuttonlink"><span class="actionbutton">Show Map</span></a><a rel="nofollow" title="Display events in Google Earth" href="?format=events_kml" class="actionbuttonlink"><span class="actionbutton">Google Earth</span></a><span class="separator"></span><span data-badge-type="1" data-doi="10.1594/PANGAEA.836178" data-badge-popover="right" data-hide-no-mentions="true" class="altmetric-embed"></span></p>
<div class="clearfix"></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Abstract:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="abstract">Few hydrological studies have been made in Greenland, other than on glacial hydrology associated with the ice sheet. Understanding permafrost hydrology and hydroclimatic change and variability, however, provides key information for understanding climate change effects and feedbacks in the Arctic landscape. This paper presents a new extensive and detailed hydrological and meteorological open access dataset, with high temporal resolution from a 1.56 km**2 permafrost catchment with a lake underlain by a through talik close to the ice sheet in the Kangerlussuaq region, western Greenland. The paper describes the hydrological site investigations and utilized equipment, as well as the data collection and processing. The investigations were performed between 2010 and 2013. The high spatial resolution, within the investigated area, of the dataset makes it highly suitable for various detailed hydrological and ecological studies on catchment scale.</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Further details:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><a target="_self" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/twoboatlake_greenland.jpg">Map of Two Boat Lake in Greenland (jpg 13 MB) with position of sampling sites</a><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to this publication..." aria-label="Search PANGAEA for other datasets related to this publication" href="//www.pangaea.de/?q=%40ref65477"></a></div>
<div class="hanging"><a target="_self" href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/Timelapse_TBL.zip">Time laps photos of lake 2012-09-05 to 2013-08-14 (mov file, zipped 205 MB)</a><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to this publication..." aria-label="Search PANGAEA for other datasets related to this publication" href="//www.pangaea.de/?q=%40ref65408"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Project(s):</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><strong><a target="_blank" href="https://www.researchgate.net/project/GReenland-Analogue-Surface-Project-GRASP">GReenland Analogue Surface Project</a></strong> (GRASP)<a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'GReenland Analogue Surface Project'..." aria-label="Search PANGAEA for other datasets related to 'GReenland Analogue Surface Project'" href="//www.pangaea.de/?q=project%3Alabel%3AGRASP"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Coverage:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging geo"><em class="unfarbe">Latitude: </em><span class="latitude">67.125940</span><em class="unfarbe"> * Longitude: </em><span class="longitude">-50.180370</span></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Event(s):</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging geo"><strong>TBL</strong><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'TBL'..." aria-label="Search PANGAEA for other datasets related to 'TBL'" href="//www.pangaea.de/?q=event%3Alabel%3ATBL"></a><em class="unfarbe"> * Latitude: </em><span class="latitude">67.125940</span><em class="unfarbe"> * Longitude: </em><span class="longitude">-50.180370</span><em class="unfarbe"> * Location: </em><span>Two Boat Lake, Kangerlussuaq, Greenland</span><a class="searchlink glyphicon glyphicon-search" target="_blank" rel="nofollow" title="Search PANGAEA for other datasets related to 'Two Boat Lake, Kangerlussuaq, Greenland'..." aria-label="Search PANGAEA for other datasets related to 'Two Boat Lake, Kangerlussuaq, Greenland'" href="//www.pangaea.de/?q=location%3A%22Two+Boat+Lake%2C+Kangerlussuaq%2C+Greenland%22"></a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Comment:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="abstract">The dataset contains hydrological and meteorological data from a lake catchment in the Kangerlussuaq region, Western Greenland. The investigations were performed during 2010-2013 and the following parameters are included: Soil moisture, Soil temperature, Hydraulic properties of the active layer, meteorological parameters from a local weather station within the catchment, water levels and discharge, sublimation and evaportation measurments, snow depth and snow water content data and time lapse photos.</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">License:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging"><a href="https://creativecommons.org/licenses/by/3.0/" rel="license" target="_blank"><img src="//www.pangaea.de/shared/pics/licenses/CC-BY-3.0.png" style="vertical-align:baseline; border-width:0;" alt="CC-BY-3.0" /> Creative Commons Attribution 3.0 Unported</a></div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-3 col-md-4 col-sm-24 col-xs-24"><div class="title">Size:</div>
</div>
<div class="col-lg-21 col-md-20 col-sm-24 col-xs-24"><div class="descr"><div class="hanging">5663.0 kBytes</div>
</div>
</div>
</div>
<div class="row"><div class="col-lg-21 col-md-20 col-sm-24 col-xs-24 col-lg-offset-3 col-md-offset-4"><div class="text-block top-border">
<h2 id="download">Download Data</h2>
<p><a href="http://store.pangaea.de/Publications/JohanssonE_et_al_2014/johansson_etal-2014.zip" target="_self">Download dataset</a></p>
</div></div></div><div id="recommendations"></div>
</div>
</div>
</div>
</div>
</div>
<div id="footer-wrapper" class="top-border hidden-print">
  <div class="container-fluid">
    <footer class="row"><!-- volle Screen-Breite -->
      <div class="content-wrapper"><!-- max. Breite -->
        <div class="blindspalte col-lg-3 col-md-4 col-sm-4 col-xs-4"></div>
        <div id="footer-hosted-by-area" class="col-lg-18 col-md-9 col-sm-24 col-xs-24">
          <!--<div class="col-lg-24 col-md-24 col-sm-24 col-xs-24">-->
          <div class="col-lg-12 col-md-24 col-sm-24 col-xs-24">
            <div class="headline underlined">
              PANGAEA is hosted by
            </div>
            
            <div>
              <p>
                Alfred Wegener Institute, Helmholtz Center for Polar and Marine Research (AWI)<br/>
                Center for Marine Environmental Sciences, University of Bremen (MARUM)
              </p>
            </div>

            <div class="headline underlined">
              The System is supported by
            </div>
            
            <div>
              <p>
                The European Commission, Research<br/>
                Federal Ministry of Education and Research (BMBF)<br/>
                Deutsche Forschungsgemeinschaft (DFG)<br/>
                International Ocean Discovery Program (IODP)
              </p>
            </div>
          </div>

          <div class="col-lg-12 col-md-24 col-sm-24 col-xs-24">
            <div class="headline underlined">
              PANGAEA is member of
            </div>
            
            <div>
              <a href="//www.icsu-wds.org/" target="_blank" title="ICSU World Data System">
                <img class="col-lg-6 col-md-6 col-sm-6 col-xs-6" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/logos/logo-wds-block.png" alt="ICSU World Data System">
              </a>
              <a href="//www.wmo.int/" target="_blank" title="World Meteorological Organization">
                <img class="col-lg-6 col-md-6 col-sm-6 col-xs-6" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/logos/logo-wmo-block.png" alt="World Meteorological Organization">
              </a>
            </div>
          </div>
        </div>
        <div id="footer-social-area" class="col-lg-3 col-md-24 col-sm-24 col-xs-24">
          <div id="footer-social-area-wrapper" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
            <div class="blindspalte col-lg-0 col-md-4"></div>
            <div class="col-lg-24 col-md-5 col-md-5 col-xs-10">
              <div class="underlined">Share on...</div>
              <div class="social-icons">
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://www.facebook.com/sharer.php?u=#u#&amp;t=#t#" title="Share on Facebook" target="_blank">
                  <img id="facebook-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/facebook-icon.png" alt="Facebook Icon">
                </a>
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://twitter.com/intent/tweet?url=#u#&amp;text=#t#" title="Share on Twitter" target="_blank">
                  <img id="twitter-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/twitter-icon.png" alt="Twitter Icon">
                </a>
                <a rel="nofollow" class="self-referer-link share-link" href="//www.pangaea.de/nojs.php" data-template="https://plus.google.com/share?url=#u#&amp;hl=en" title="Share on Google+" target="_blank">
                  <img id="gplus-icon" class="col-lg-8 col-md-8 col-sm-8 col-xs-8" src="//www.pangaea.de/assets/v.8475a12d05411317f3d99359b017a263/social-icons/gplus-icon.png" alt="Google+ Icon">
                </a>
              </div>
            </div>
            <div class="blindspalte colo-lg-0 col-md-18"></div>
          </div>
        </div>
                
        <div id="footer-menu-area" class="col-lg-24 col-md-24 col-sm-24 col-xs-24">
          <div class="blindspalte col-lg-3 col-md-4 col-sm-4 col-xs-4"></div>
          <div id="footer-menu-wrapper" class="col-lg-21 col-md-20 col-sm-24 col-xs-24">
            <nav id="footer-nav">
              <ul>
                <li id="about-legal-notice">
                  <a href="//www.pangaea.de/about/legal.php">Legal notice</a>
                </li>
                <li id="about-privacy-policy">
                  <a href="//www.pangaea.de/about/privacypolicy.php">Privacy policy</a>
                </li>
                <li id="about-cookies">
                  <a href="//www.pangaea.de/about/cookies.php">Cookies</a>
                </li>
                <li id="about-contact">
                  <a href="//www.pangaea.de/contact/">Contact</a>
                </li>
              </ul>
            </nav>
            <div class="clearfix"></div>
          </div>
        </div>
      </div>
    </footer>
  </div>
</div>
</body>
</html>
 + http_version: + recorded_at: Thu, 29 Nov 2018 12:17:36 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_status_code_200.yml b/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_status_code_200.yml index 504510b00..0dcd94ce8 100644 --- a/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_status_code_200.yml +++ b/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_status_code_200.yml @@ -17,7 +17,7 @@ http_interactions: message: OK headers: Date: - - Wed, 26 Sep 2018 09:05:42 GMT + - Mon, 19 Nov 2018 13:19:28 GMT Content-Type: - application/json;charset=UTF-8 Connection: @@ -28,5 +28,5 @@ http_interactions: encoding: ASCII-8BIT string: '{"responseCode":1,"handle":"10.5438/FJ3W-0SHD","values":[{"index":1,"type":"URL","data":{"format":"string","value":"https://blog.datacite.org/data-driven-development/"},"ttl":86400,"timestamp":"2016-12-19T15:06:36Z"}]}' http_version: - recorded_at: Wed, 26 Sep 2018 09:05:42 GMT + recorded_at: Mon, 19 Nov 2018 13:19:28 GMT recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_url.yml b/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_url.yml index 504510b00..88d8baf59 100644 --- a/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_url.yml +++ b/spec/fixtures/vcr_cassettes/dois/GET_/dois/DOI/get-url/returns_url.yml @@ -17,7 +17,7 @@ http_interactions: message: OK headers: Date: - - Wed, 26 Sep 2018 09:05:42 GMT + - Mon, 19 Nov 2018 13:19:27 GMT Content-Type: - application/json;charset=UTF-8 Connection: @@ -28,5 +28,5 @@ http_interactions: encoding: ASCII-8BIT string: '{"responseCode":1,"handle":"10.5438/FJ3W-0SHD","values":[{"index":1,"type":"URL","data":{"format":"string","value":"https://blog.datacite.org/data-driven-development/"},"ttl":86400,"timestamp":"2016-12-19T15:06:36Z"}]}' http_version: - recorded_at: Wed, 26 Sep 2018 09:05:42 GMT + recorded_at: Mon, 19 Nov 2018 13:19:27 GMT recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/returns_status_code_201.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/returns_status_code_201.yml new file mode 100644 index 000000000..340b5d4ac --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/returns_status_code_201.yml @@ -0,0 +1,82 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7554 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 18:37:48 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - 6510584d-f399-4bbe-a1dd-1b4a8f1c07cc + Etag: + - W/"381993dc8a6b0f20960c96a3639c0284" + X-Runtime: + - '0.079075' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7554","type":"prefixes","attributes":{"registration-agency":"Crossref","created":null,"updated":"2016-09-21T21:07:27Z"},"relationships":{"clients":{"data":[]},"providers":{"data":[]}}},"included":[]}' + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:48 GMT +- request: + method: get + uri: http://www.crossref.org/openurl/?format=unixref&id=doi:10.7554/elife.01567&noredirect=true&pid=tech@datacite.org + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/xml + response: + status: + code: 200 + message: OK + headers: + Server: + - Apache-Coyote/1.1 + Crossref-Deployment-Name: + - qs4-1 + Content-Type: + - text/xml;charset=UTF-8 + Content-Language: + - en-US + Date: + - Fri, 07 Dec 2018 18:37:48 GMT + Connection: + - close + body: + encoding: ASCII-8BIT + string: !binary |- + <?xml version="1.0" encoding="UTF-8"?>
<doi_records>
  <doi_record owner="10.7554" timestamp="2018-08-23 09:41:49">
    <crossref>
      <journal>
        <journal_metadata language="en">
          <full_title>eLife</full_title>
          <issn media_type="electronic">2050-084X</issn>
        </journal_metadata>
        <journal_issue>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <journal_volume>
            <volume>3</volume>
          </journal_volume>
        </journal_issue>
        <journal_article publication_type="full_text" reference_distribution_opts="any">
          <titles>
            <title>Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</title>
          </titles>
          <contributors>
            <person_name contributor_role="author" sequence="first">
              <given_name>Martial</given_name>
              <surname>Sankar</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Kaisa</given_name>
              <surname>Nieminen</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Laura</given_name>
              <surname>Ragni</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Ioannis</given_name>
              <surname>Xenarios</surname>
              <affiliation>Vital-IT, Swiss Institute of Bioinformatics, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Christian S</given_name>
              <surname>Hardtke</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
          </contributors>
          <abstract>
            <p>Among various advantages, their small size makes model organisms preferred subjects of investigation. Yet, even in model systems detailed analysis of numerous developmental processes at cellular level is severely hampered by their scale. For instance, secondary growth of Arabidopsis hypocotyls creates a radial pattern of highly specialized tissues that comprises several thousand cells starting from a few dozen. This dynamic process is difficult to follow because of its scale and because it can only be investigated invasively, precluding comprehensive understanding of the cell proliferation, differentiation, and patterning events involved. To overcome such limitation, we established an automated quantitative histology approach. We acquired hypocotyl cross-sections from tiled high-resolution images and extracted their information content using custom high-throughput image processing and segmentation. Coupled with automated cell type recognition through machine learning, we could establish a cellular resolution atlas that reveals vascular morphodynamics during secondary growth, for example equidistant phloem pole formation.</p>
          </abstract>
          <abstract abstract-type="executive-summary">
            <p>Our understanding of the living world has been advanced greatly by studies of ‘model organisms’, such as mice, zebrafish, and fruit flies. Studying these creatures has been crucial to uncovering the genes that control how our bodies develop and grow, and also to discover the genetic basis of diseases such as cancer.</p>
            <p>Thale cress—or Arabidopsis thaliana to give its formal name—is the model organism of choice for many plant biologists. This tiny weed has been widely studied because it can complete its lifecycle, from seed to seed, in about 6 weeks, and because its relatively small genome simplifies the search for genes that control specific traits. However, as with other much-studied model systems, understanding the changes that underpin the development of some of the more complex tissues in Arabidopsis has been severely hampered by the shear number of cells involved.</p>
            <p>After it has emerged from the seed, the plant’s first stem will develop from a few dozen cells in width to several thousand cells with highly specialized tissues arranged in a complex pattern of concentric circles. Although this stem thickening process represents a major developmental change in many plants—from Arabidopsis to oak trees—it has been under-researched. This is partly because it involves so many different cells, and also because it can only be observed in thin sections cut out of the plant’s stem.</p>
            <p>Now Sankar, Nieminen, Ragni et al. have developed a novel approach, termed ‘automated quantitative histology’, to overcome these problems. This strategy involves ‘teaching’ a computer to automatically recognize different plant cells and to measure their important features in high-resolution images of tissue sections. The resulting ‘map’ of the developing stem—which required over 800 hr of computing time to complete—reveals the changes to cells and tissues as they develop that allow the transport of water, sugars and nutrients between the above- and below-ground organs. Sankar, Nieminen, Ragni et al. suggest that their novel approach could, in the future, also be applied to study the development of other tissues and organisms, including animals.</p>
          </abstract>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <publisher_item>
            <item_number item_number_type="article_number">e01567</item_number>
            <identifier id_type="doi">10.7554/eLife.01567</identifier>
          </publisher_item>
          <program name="fundref">
            <assertion name="fundgroup">
              <assertion name="funder_name">SystemsX</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">EMBO longterm post-doctoral fellowships</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">Marie Heim-Voegtlin</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">
                University of Lausanne
                <assertion name="funder_identifier" provider="crossref">501100006390</assertion>
              </assertion>
            </assertion>
          </program>
          <program name="AccessIndicators">
            <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
          </program>
          <crossmark>
            <crossmark_version>1</crossmark_version>
            <crossmark_policy>eLifesciences</crossmark_policy>
            <crossmark_domains>
              <crossmark_domain>
                <domain>www.elifesciences.org</domain>
              </crossmark_domain>
            </crossmark_domains>
            <crossmark_domain_exclusive>false</crossmark_domain_exclusive>
            <custom_metadata>
              <assertion name="received" label="Received" group_name="publication_history" group_label="Publication History" order="0">2013-09-20</assertion>
              <assertion name="accepted" label="Accepted" group_name="publication_history" group_label="Publication History" order="1">2013-12-24</assertion>
              <assertion name="published" label="Published" group_name="publication_history" group_label="Publication History" order="2">2014-02-11</assertion>
              <program name="fundref">
                <assertion name="fundgroup">
                  <assertion name="funder_name">SystemsX</assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    EMBO
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100003043</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    Swiss National Science Foundation
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100001711</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    University of Lausanne
                    <assertion name="funder_identifier" provider="crossref">http://dx.doi.org/10.13039/501100006390</assertion>
                  </assertion>
                </assertion>
              </program>
              <program name="AccessIndicators">
                <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
              </program>
            </custom_metadata>
          </crossmark>
          <program>
            <related_item>
              <description>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</description>
              <inter_work_relation identifier-type="doi" relationship-type="isSupplementedBy">10.5061/dryad.b835k</inter_work_relation>
            </related_item>
          </program>
          <archive_locations>
            <archive name="CLOCKSS" />
          </archive_locations>
          <doi_data>
            <doi>10.7554/eLife.01567</doi>
            <resource>https://elifesciences.org/articles/01567</resource>
            <collection property="text-mining">
              <item>
                <resource mime_type="application/pdf">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.pdf</resource>
              </item>
              <item>
                <resource mime_type="application/xml">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.xml</resource>
              </item>
            </collection>
          </doi_data>
          <citation_list>
            <citation key="bib1">
              <journal_title>Nature</journal_title>
              <author>Bonke</author>
              <volume>426</volume>
              <first_page>181</first_page>
              <cYear>2003</cYear>
              <article_title>APL regulates vascular tissue identity in Arabidopsis</article_title>
              <doi>10.1038/nature02100</doi>
            </citation>
            <citation key="bib2">
              <journal_title>Genetics</journal_title>
              <author>Brenner</author>
              <volume>182</volume>
              <first_page>413</first_page>
              <cYear>2009</cYear>
              <article_title>In the beginning was the worm</article_title>
              <doi>10.1534/genetics.109.104976</doi>
            </citation>
            <citation key="bib3">
              <journal_title>Physiologia Plantarum</journal_title>
              <author>Chaffey</author>
              <volume>114</volume>
              <first_page>594</first_page>
              <cYear>2002</cYear>
              <article_title>Secondary xylem development in Arabidopsis: a model for wood formation</article_title>
              <doi>10.1034/j.1399-3054.2002.1140413.x</doi>
            </citation>
            <citation key="bib4">
              <journal_title>Neural computation</journal_title>
              <author>Chang</author>
              <volume>13</volume>
              <first_page>2119</first_page>
              <cYear>2001</cYear>
              <article_title>Training nu-support vector classifiers: theory and algorithms</article_title>
              <doi>10.1162/089976601750399335</doi>
            </citation>
            <citation key="bib5">
              <journal_title>Machine Learning</journal_title>
              <author>Cortes</author>
              <volume>20</volume>
              <first_page>273</first_page>
              <cYear>1995</cYear>
              <doi provider="crossref">10.1007/BF00994018</doi>
              <article_title>Support-vector Networks</article_title>
            </citation>
            <citation key="bib6">
              <journal_title>Development</journal_title>
              <author>Dolan</author>
              <volume>119</volume>
              <first_page>71</first_page>
              <cYear>1993</cYear>
              <article_title>Cellular organisation of the Arabidopsis thaliana root</article_title>
            </citation>
            <citation key="bib7">
              <journal_title>Seminars in Cell &amp; Developmental Biology</journal_title>
              <author>Elo</author>
              <volume>20</volume>
              <first_page>1097</first_page>
              <cYear>2009</cYear>
              <article_title>Stem cell function during plant vascular development</article_title>
              <doi>10.1016/j.semcdb.2009.09.009</doi>
            </citation>
            <citation key="bib8">
              <journal_title>Development</journal_title>
              <author>Etchells</author>
              <volume>140</volume>
              <first_page>2224</first_page>
              <cYear>2013</cYear>
              <article_title>WOX4 and WOX14 act downstream of the PXY receptor kinase to regulate plant vascular proliferation independently of any role in vascular organisation</article_title>
              <doi>10.1242/dev.091314</doi>
            </citation>
            <citation key="bib9">
              <journal_title>PLOS Genetics</journal_title>
              <author>Etchells</author>
              <volume>8</volume>
              <first_page>e1002997</first_page>
              <cYear>2012</cYear>
              <article_title>Plant vascular cell division is maintained by an interaction between PXY and ethylene signalling</article_title>
              <doi>10.1371/journal.pgen.1002997</doi>
            </citation>
            <citation key="bib10">
              <journal_title>Molecular Systems Biology</journal_title>
              <author>Fuchs</author>
              <volume>6</volume>
              <first_page>370</first_page>
              <cYear>2010</cYear>
              <article_title>Clustering phenotype populations by genome-wide RNAi and multiparametric imaging</article_title>
              <doi>10.1038/msb.2010.25</doi>
            </citation>
            <citation key="bib11">
              <journal_title>Bio Systems</journal_title>
              <author>Granqvist</author>
              <volume>110</volume>
              <first_page>60</first_page>
              <cYear>2012</cYear>
              <article_title>BaSAR-A tool in R for frequency detection</article_title>
              <doi>10.1016/j.biosystems.2012.07.004</doi>
            </citation>
            <citation key="bib12">
              <journal_title>Current Opinion in Plant Biology</journal_title>
              <author>Groover</author>
              <volume>9</volume>
              <first_page>55</first_page>
              <cYear>2006</cYear>
              <article_title>Developmental mechanisms regulating secondary growth in woody plants</article_title>
              <doi>10.1016/j.pbi.2005.11.013</doi>
            </citation>
            <citation key="bib13">
              <journal_title>Plant Cell</journal_title>
              <author>Hirakawa</author>
              <volume>22</volume>
              <first_page>2618</first_page>
              <cYear>2010</cYear>
              <article_title>TDIF peptide signaling regulates vascular stem cell proliferation via the WOX4 homeobox gene in Arabidopsis</article_title>
              <doi>10.1105/tpc.110.076083</doi>
            </citation>
            <citation key="bib14">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Hirakawa</author>
              <volume>105</volume>
              <first_page>15208</first_page>
              <cYear>2008</cYear>
              <article_title>Non-cell-autonomous control of vascular stem cell fate by a CLE peptide/receptor system</article_title>
              <doi>10.1073/pnas.0808444105</doi>
            </citation>
            <citation key="bib15">
              <journal_title>Cell</journal_title>
              <author>Meyerowitz</author>
              <volume>56</volume>
              <first_page>263</first_page>
              <cYear>1989</cYear>
              <article_title>Arabidopsis, a useful weed</article_title>
              <doi>10.1016/0092-8674(89)90900-8</doi>
            </citation>
            <citation key="bib16">
              <journal_title>Science</journal_title>
              <author>Meyerowitz</author>
              <volume>295</volume>
              <first_page>1482</first_page>
              <cYear>2002</cYear>
              <article_title>Plants compared to animals: the broadest comparative study of development</article_title>
              <doi>10.1126/science.1066609</doi>
            </citation>
            <citation key="bib17">
              <journal_title>Plant Physiol</journal_title>
              <author>Nieminen</author>
              <volume>135</volume>
              <first_page>653</first_page>
              <cYear>2004</cYear>
              <article_title>A weed for wood? Arabidopsis as a genetic model for xylem development</article_title>
              <doi>10.1104/pp.104.040212</doi>
            </citation>
            <citation key="bib18">
              <journal_title>Nature Biotechnology</journal_title>
              <author>Noble</author>
              <volume>24</volume>
              <first_page>1565</first_page>
              <cYear>2006</cYear>
              <article_title>What is a support vector machine?</article_title>
              <doi>10.1038/nbt1206-1565</doi>
            </citation>
            <citation key="bib19">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Olson</author>
              <volume>77</volume>
              <first_page>1516</first_page>
              <cYear>1980</cYear>
              <article_title>Classification of cultured mammalian cells by shape analysis and pattern recognition</article_title>
              <doi>10.1073/pnas.77.3.1516</doi>
            </citation>
            <citation key="bib20">
              <journal_title>Bioinformatics</journal_title>
              <author>Pau</author>
              <volume>26</volume>
              <first_page>979</first_page>
              <cYear>2010</cYear>
              <article_title>EBImage–an R package for image processing with applications to cellular phenotypes</article_title>
              <doi>10.1093/bioinformatics/btq046</doi>
            </citation>
            <citation key="bib21">
              <journal_title>Plant Cell</journal_title>
              <author>Ragni</author>
              <volume>23</volume>
              <first_page>1322</first_page>
              <cYear>2011</cYear>
              <article_title>Mobile gibberellin directly stimulates Arabidopsis hypocotyl xylem expansion</article_title>
              <doi>10.1105/tpc.111.084020</doi>
            </citation>
            <citation key="bib22">
              <journal_title>Dryad Digital Repository</journal_title>
              <author>Sankar</author>
              <cYear>2014</cYear>
              <article_title>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</article_title>
              <doi>10.5061/dryad.b835k</doi>
            </citation>
            <citation key="bib23">
              <journal_title>Current Biology</journal_title>
              <author>Sibout</author>
              <volume>18</volume>
              <first_page>458</first_page>
              <cYear>2008</cYear>
              <article_title>Flowering as a condition for xylem expansion in Arabidopsis hypocotyl and root</article_title>
              <doi>10.1016/j.cub.2008.02.070</doi>
            </citation>
            <citation key="bib24">
              <journal_title>The New Phytologist</journal_title>
              <author>Spicer</author>
              <volume>186</volume>
              <first_page>577</first_page>
              <cYear>2010</cYear>
              <article_title>Evolution of development of vascular cambia and secondary growth</article_title>
              <doi>10.1111/j.1469-8137.2010.03236.x</doi>
            </citation>
            <citation key="bib25">
              <journal_title>Machine Vision and Applications</journal_title>
              <author>Theriault</author>
              <volume>23</volume>
              <first_page>659</first_page>
              <cYear>2012</cYear>
              <article_title>Cell morphology classification and clutter mitigation in phase-contrast microscopy images using machine learning</article_title>
              <doi>10.1007/s00138-011-0345-9</doi>
            </citation>
            <citation key="bib26">
              <journal_title>Cell</journal_title>
              <author>Uyttewaal</author>
              <volume>149</volume>
              <first_page>439</first_page>
              <cYear>2012</cYear>
              <article_title>Mechanical stress acts via katanin to amplify differences in growth rate between adjacent cells in Arabidopsis</article_title>
              <doi>10.1016/j.cell.2012.02.048</doi>
            </citation>
            <citation key="bib27">
              <journal_title>Nature Cell Biology</journal_title>
              <author>Yin</author>
              <volume>15</volume>
              <first_page>860</first_page>
              <cYear>2013</cYear>
              <article_title>A screen for morphological complexity identifies regulators of switch-like transitions between discrete cell shapes</article_title>
              <doi>10.1038/ncb2764</doi>
            </citation>
          </citation_list>
          <component_list>
            <component parent_relation="isPartOf">
              <titles>
                <title>Abstract</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.001</doi>
                <resource>https://elifesciences.org/articles/01567#abstract</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>eLife digest</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.002</doi>
                <resource>https://elifesciences.org/articles/01567#digest</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 1. Cellular level analysis of Arabidopsis hypocotyl secondary growth.</title>
                <subtitle>(A) Light microscopy of cross sections obtained from Arabidopsis hypocotyls (organ position illustrated for a 9-day-old seedling, lower left) at 9 dag (upper left) and 35 dag (right). Size bars are 100 μm. Blue GUS staining due to the presence of an APL::GUS reporter gene in this Col-0 background line marks phloem bundles. (B) Overview of the developmental series (time points and distinct samples per genotype) analyzed in this study. (C) Example of a high-resolution hypocotyl section image assembled from 11 × 11 tiles. (D) The same image after pre-processing and binarization, and (E) subsequent segmentation using a watershed algorithm. (F) Number of mis-segmented cells as determined by careful visual inspection in 12 sections, plotted against the total number of cells per section (log scale).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.003</doi>
                <resource>https://elifesciences.org/articles/01567#fig1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2. The ‘Quantitative Histology’ approach.</title>
                <subtitle>(A) Overview of the computational pipeline from image acquisition to analysis. (B) ‘Phenoprints’ for the different genotypes and developmental stages.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.004</doi>
                <resource>https://elifesciences.org/articles/01567#fig2</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2—figure supplement 1. An example of classifier selection through V-fold cross validation.</title>
                <subtitle>The green arrow points out the selected feature combination according to the criteria of minimum number of features with the highest performance and the lowest variation (the radiusV feature was excluded due to its putative variation in tissue location).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.005</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig2s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 3. Progression of tissue proliferation.</title>
                <subtitle>(A) Principal component analysis (PCA) of the phenoprints shown in Figure 2B, performed with normalized values (Supplementary file 4). The inlay screeplot displays the proportion of total variation explained by each principal component. (B–E) Comparative plots of parameter progression in the two genotypes. In (D), xylem represents combined vessel, parenchyma, and fiber cells, phloem represents combined phloem parenchyma and bundle cells. Error bars indicate standard error.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.006</doi>
                <resource>https://elifesciences.org/articles/01567#fig3</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4. Bimodal distribution of incline angle according to position.</title>
                <subtitle>(A and B) Spatial distribution of cell incline angle illustrates the vascular organization in Ler (B) as compared to Col-0 (A) at later stages of development, for example 30 dag. The size of the disc increases with the area of the cell. Blue color indicates radial cell orientation, red orthoradial. (C and D) Violin plots of incline angle distribution, illustrating increasingly bimodal distribution coincident with refined vascular organization and different dynamics of the process in the two genotypes.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.007</doi>
                <resource>https://elifesciences.org/articles/01567#fig4</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4—figure supplement 1. An illustration of the incline angle.</title>
                <subtitle>The incline is the angle between the section radius through the center of an ellipse fit to a cell and the major axis of that ellipse extended towards the x axis.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.008</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig4s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5. Distinct local organization of incline angle during hypocotyl secondary growth progression.</title>
                <subtitle>(A–J) Density plots of cell incline angle vs radial position for the two genotypes at the indicated developmental stages, representing all cells across all sections for a given time point. The red lines represent the fit of these cloud distributions with locally weighted linear regression (i.e., lowess), revealing the essential data trends. All sections were normalized from 0.0 (the manually defined center) to 1.0 (the average radius in a set of sections as determined by the average distance of the outermost cells from the center for individual sections). Box plots indicate the quartiles of the radian distribution for each cell-type class and are placed at the average position of the cell type with respect to the y axis. Outliers are shown as circles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.009</doi>
                <resource>https://elifesciences.org/articles/01567#fig5</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5—figure supplement 1. Analysis of cell number in defined xylem regions of different size.</title>
                <subtitle>Cell number in a circle of 200–500 pixels around the section centers for Col-0. Cell count in a constant area of xylem over time across all averaged across all sections.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.010</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig5s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 6. Mapping of phloem pole patterning.</title>
                <subtitle>(A) Example of Gaussian kernel density estimate of the location of predicted phloem bundles cells in a 30 dag Col-0 section. High density represents phloem poles. (B) Example of an analysis of emerging phloem pole position in a 30 dag Col-0 section. The plot represents a pixel intensity map after noise reduction along a circular region of interest across the emerging phloem poles. Intensity peaks are due to GUS staining conferred to phloem bundles by an APL::GUS reporter construct. (C) Probability density function of the data shown in (B) obtained from an automated Bayesian model. The dominant single peak indicates a constant arc distance of ca. 62 pixel between the phloem poles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.011</doi>
                <resource>https://elifesciences.org/articles/01567#fig6</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 1.</title>
                <subtitle>(A) An explanation of the extracted parameters that describe the cellular features. (B) Summary information of the hand-labeled training set for supervised machine learning. (C) Definition of the classifiers selected for analysis. (D) Summary of the classifier parameters for supervised machine learning. (E) Overview of the cell type classes recognized by the supervised machine learning approach and their assignment codes used in Data Files 3 and 4.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.012</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD1-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 2.</title>
                <subtitle>Quality control files for the Col-0 sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.013</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD2-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 3.</title>
                <subtitle>Quality control files for the Ler sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.014</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD3-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 4.</title>
                <subtitle>The normalized values of the phenoprints (Figure 2B) used for PCA.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.015</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD4-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Decision letter</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.016</doi>
                <resource>https://elifesciences.org/articles/01567#SA1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Author response</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.017</doi>
                <resource>https://elifesciences.org/articles/01567#SA2</resource>
              </doi_data>
            </component>
          </component_list>
        </journal_article>
      </journal>
    </crossref>
  </doi_record>
</doi_records> + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:48 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/sets_state_to_findable.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/sets_state_to_findable.yml new file mode 100644 index 000000000..cc5a91cf4 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/sets_state_to_findable.yml @@ -0,0 +1,82 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7554 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 18:37:49 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - dc53754b-5309-4e73-a1d0-35bfde3b29dc + Etag: + - W/"381993dc8a6b0f20960c96a3639c0284" + X-Runtime: + - '0.076738' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7554","type":"prefixes","attributes":{"registration-agency":"Crossref","created":null,"updated":"2016-09-21T21:07:27Z"},"relationships":{"clients":{"data":[]},"providers":{"data":[]}}},"included":[]}' + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:49 GMT +- request: + method: get + uri: http://www.crossref.org/openurl/?format=unixref&id=doi:10.7554/elife.01567&noredirect=true&pid=tech@datacite.org + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/xml + response: + status: + code: 200 + message: OK + headers: + Server: + - Apache-Coyote/1.1 + Crossref-Deployment-Name: + - qs4-1 + Content-Type: + - text/xml;charset=UTF-8 + Content-Language: + - en-US + Date: + - Fri, 07 Dec 2018 18:37:49 GMT + Connection: + - close + body: + encoding: ASCII-8BIT + string: !binary |- + <?xml version="1.0" encoding="UTF-8"?>
<doi_records>
  <doi_record owner="10.7554" timestamp="2018-08-23 09:41:49">
    <crossref>
      <journal>
        <journal_metadata language="en">
          <full_title>eLife</full_title>
          <issn media_type="electronic">2050-084X</issn>
        </journal_metadata>
        <journal_issue>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <journal_volume>
            <volume>3</volume>
          </journal_volume>
        </journal_issue>
        <journal_article publication_type="full_text" reference_distribution_opts="any">
          <titles>
            <title>Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</title>
          </titles>
          <contributors>
            <person_name contributor_role="author" sequence="first">
              <given_name>Martial</given_name>
              <surname>Sankar</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Kaisa</given_name>
              <surname>Nieminen</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Laura</given_name>
              <surname>Ragni</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Ioannis</given_name>
              <surname>Xenarios</surname>
              <affiliation>Vital-IT, Swiss Institute of Bioinformatics, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Christian S</given_name>
              <surname>Hardtke</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
          </contributors>
          <abstract>
            <p>Among various advantages, their small size makes model organisms preferred subjects of investigation. Yet, even in model systems detailed analysis of numerous developmental processes at cellular level is severely hampered by their scale. For instance, secondary growth of Arabidopsis hypocotyls creates a radial pattern of highly specialized tissues that comprises several thousand cells starting from a few dozen. This dynamic process is difficult to follow because of its scale and because it can only be investigated invasively, precluding comprehensive understanding of the cell proliferation, differentiation, and patterning events involved. To overcome such limitation, we established an automated quantitative histology approach. We acquired hypocotyl cross-sections from tiled high-resolution images and extracted their information content using custom high-throughput image processing and segmentation. Coupled with automated cell type recognition through machine learning, we could establish a cellular resolution atlas that reveals vascular morphodynamics during secondary growth, for example equidistant phloem pole formation.</p>
          </abstract>
          <abstract abstract-type="executive-summary">
            <p>Our understanding of the living world has been advanced greatly by studies of ‘model organisms’, such as mice, zebrafish, and fruit flies. Studying these creatures has been crucial to uncovering the genes that control how our bodies develop and grow, and also to discover the genetic basis of diseases such as cancer.</p>
            <p>Thale cress—or Arabidopsis thaliana to give its formal name—is the model organism of choice for many plant biologists. This tiny weed has been widely studied because it can complete its lifecycle, from seed to seed, in about 6 weeks, and because its relatively small genome simplifies the search for genes that control specific traits. However, as with other much-studied model systems, understanding the changes that underpin the development of some of the more complex tissues in Arabidopsis has been severely hampered by the shear number of cells involved.</p>
            <p>After it has emerged from the seed, the plant’s first stem will develop from a few dozen cells in width to several thousand cells with highly specialized tissues arranged in a complex pattern of concentric circles. Although this stem thickening process represents a major developmental change in many plants—from Arabidopsis to oak trees—it has been under-researched. This is partly because it involves so many different cells, and also because it can only be observed in thin sections cut out of the plant’s stem.</p>
            <p>Now Sankar, Nieminen, Ragni et al. have developed a novel approach, termed ‘automated quantitative histology’, to overcome these problems. This strategy involves ‘teaching’ a computer to automatically recognize different plant cells and to measure their important features in high-resolution images of tissue sections. The resulting ‘map’ of the developing stem—which required over 800 hr of computing time to complete—reveals the changes to cells and tissues as they develop that allow the transport of water, sugars and nutrients between the above- and below-ground organs. Sankar, Nieminen, Ragni et al. suggest that their novel approach could, in the future, also be applied to study the development of other tissues and organisms, including animals.</p>
          </abstract>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <publisher_item>
            <item_number item_number_type="article_number">e01567</item_number>
            <identifier id_type="doi">10.7554/eLife.01567</identifier>
          </publisher_item>
          <program name="fundref">
            <assertion name="fundgroup">
              <assertion name="funder_name">SystemsX</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">EMBO longterm post-doctoral fellowships</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">Marie Heim-Voegtlin</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">
                University of Lausanne
                <assertion name="funder_identifier" provider="crossref">501100006390</assertion>
              </assertion>
            </assertion>
          </program>
          <program name="AccessIndicators">
            <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
          </program>
          <crossmark>
            <crossmark_version>1</crossmark_version>
            <crossmark_policy>eLifesciences</crossmark_policy>
            <crossmark_domains>
              <crossmark_domain>
                <domain>www.elifesciences.org</domain>
              </crossmark_domain>
            </crossmark_domains>
            <crossmark_domain_exclusive>false</crossmark_domain_exclusive>
            <custom_metadata>
              <assertion name="received" label="Received" group_name="publication_history" group_label="Publication History" order="0">2013-09-20</assertion>
              <assertion name="accepted" label="Accepted" group_name="publication_history" group_label="Publication History" order="1">2013-12-24</assertion>
              <assertion name="published" label="Published" group_name="publication_history" group_label="Publication History" order="2">2014-02-11</assertion>
              <program name="fundref">
                <assertion name="fundgroup">
                  <assertion name="funder_name">SystemsX</assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    EMBO
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100003043</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    Swiss National Science Foundation
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100001711</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    University of Lausanne
                    <assertion name="funder_identifier" provider="crossref">http://dx.doi.org/10.13039/501100006390</assertion>
                  </assertion>
                </assertion>
              </program>
              <program name="AccessIndicators">
                <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
              </program>
            </custom_metadata>
          </crossmark>
          <program>
            <related_item>
              <description>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</description>
              <inter_work_relation identifier-type="doi" relationship-type="isSupplementedBy">10.5061/dryad.b835k</inter_work_relation>
            </related_item>
          </program>
          <archive_locations>
            <archive name="CLOCKSS" />
          </archive_locations>
          <doi_data>
            <doi>10.7554/eLife.01567</doi>
            <resource>https://elifesciences.org/articles/01567</resource>
            <collection property="text-mining">
              <item>
                <resource mime_type="application/pdf">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.pdf</resource>
              </item>
              <item>
                <resource mime_type="application/xml">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.xml</resource>
              </item>
            </collection>
          </doi_data>
          <citation_list>
            <citation key="bib1">
              <journal_title>Nature</journal_title>
              <author>Bonke</author>
              <volume>426</volume>
              <first_page>181</first_page>
              <cYear>2003</cYear>
              <article_title>APL regulates vascular tissue identity in Arabidopsis</article_title>
              <doi>10.1038/nature02100</doi>
            </citation>
            <citation key="bib2">
              <journal_title>Genetics</journal_title>
              <author>Brenner</author>
              <volume>182</volume>
              <first_page>413</first_page>
              <cYear>2009</cYear>
              <article_title>In the beginning was the worm</article_title>
              <doi>10.1534/genetics.109.104976</doi>
            </citation>
            <citation key="bib3">
              <journal_title>Physiologia Plantarum</journal_title>
              <author>Chaffey</author>
              <volume>114</volume>
              <first_page>594</first_page>
              <cYear>2002</cYear>
              <article_title>Secondary xylem development in Arabidopsis: a model for wood formation</article_title>
              <doi>10.1034/j.1399-3054.2002.1140413.x</doi>
            </citation>
            <citation key="bib4">
              <journal_title>Neural computation</journal_title>
              <author>Chang</author>
              <volume>13</volume>
              <first_page>2119</first_page>
              <cYear>2001</cYear>
              <article_title>Training nu-support vector classifiers: theory and algorithms</article_title>
              <doi>10.1162/089976601750399335</doi>
            </citation>
            <citation key="bib5">
              <journal_title>Machine Learning</journal_title>
              <author>Cortes</author>
              <volume>20</volume>
              <first_page>273</first_page>
              <cYear>1995</cYear>
              <doi provider="crossref">10.1007/BF00994018</doi>
              <article_title>Support-vector Networks</article_title>
            </citation>
            <citation key="bib6">
              <journal_title>Development</journal_title>
              <author>Dolan</author>
              <volume>119</volume>
              <first_page>71</first_page>
              <cYear>1993</cYear>
              <article_title>Cellular organisation of the Arabidopsis thaliana root</article_title>
            </citation>
            <citation key="bib7">
              <journal_title>Seminars in Cell &amp; Developmental Biology</journal_title>
              <author>Elo</author>
              <volume>20</volume>
              <first_page>1097</first_page>
              <cYear>2009</cYear>
              <article_title>Stem cell function during plant vascular development</article_title>
              <doi>10.1016/j.semcdb.2009.09.009</doi>
            </citation>
            <citation key="bib8">
              <journal_title>Development</journal_title>
              <author>Etchells</author>
              <volume>140</volume>
              <first_page>2224</first_page>
              <cYear>2013</cYear>
              <article_title>WOX4 and WOX14 act downstream of the PXY receptor kinase to regulate plant vascular proliferation independently of any role in vascular organisation</article_title>
              <doi>10.1242/dev.091314</doi>
            </citation>
            <citation key="bib9">
              <journal_title>PLOS Genetics</journal_title>
              <author>Etchells</author>
              <volume>8</volume>
              <first_page>e1002997</first_page>
              <cYear>2012</cYear>
              <article_title>Plant vascular cell division is maintained by an interaction between PXY and ethylene signalling</article_title>
              <doi>10.1371/journal.pgen.1002997</doi>
            </citation>
            <citation key="bib10">
              <journal_title>Molecular Systems Biology</journal_title>
              <author>Fuchs</author>
              <volume>6</volume>
              <first_page>370</first_page>
              <cYear>2010</cYear>
              <article_title>Clustering phenotype populations by genome-wide RNAi and multiparametric imaging</article_title>
              <doi>10.1038/msb.2010.25</doi>
            </citation>
            <citation key="bib11">
              <journal_title>Bio Systems</journal_title>
              <author>Granqvist</author>
              <volume>110</volume>
              <first_page>60</first_page>
              <cYear>2012</cYear>
              <article_title>BaSAR-A tool in R for frequency detection</article_title>
              <doi>10.1016/j.biosystems.2012.07.004</doi>
            </citation>
            <citation key="bib12">
              <journal_title>Current Opinion in Plant Biology</journal_title>
              <author>Groover</author>
              <volume>9</volume>
              <first_page>55</first_page>
              <cYear>2006</cYear>
              <article_title>Developmental mechanisms regulating secondary growth in woody plants</article_title>
              <doi>10.1016/j.pbi.2005.11.013</doi>
            </citation>
            <citation key="bib13">
              <journal_title>Plant Cell</journal_title>
              <author>Hirakawa</author>
              <volume>22</volume>
              <first_page>2618</first_page>
              <cYear>2010</cYear>
              <article_title>TDIF peptide signaling regulates vascular stem cell proliferation via the WOX4 homeobox gene in Arabidopsis</article_title>
              <doi>10.1105/tpc.110.076083</doi>
            </citation>
            <citation key="bib14">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Hirakawa</author>
              <volume>105</volume>
              <first_page>15208</first_page>
              <cYear>2008</cYear>
              <article_title>Non-cell-autonomous control of vascular stem cell fate by a CLE peptide/receptor system</article_title>
              <doi>10.1073/pnas.0808444105</doi>
            </citation>
            <citation key="bib15">
              <journal_title>Cell</journal_title>
              <author>Meyerowitz</author>
              <volume>56</volume>
              <first_page>263</first_page>
              <cYear>1989</cYear>
              <article_title>Arabidopsis, a useful weed</article_title>
              <doi>10.1016/0092-8674(89)90900-8</doi>
            </citation>
            <citation key="bib16">
              <journal_title>Science</journal_title>
              <author>Meyerowitz</author>
              <volume>295</volume>
              <first_page>1482</first_page>
              <cYear>2002</cYear>
              <article_title>Plants compared to animals: the broadest comparative study of development</article_title>
              <doi>10.1126/science.1066609</doi>
            </citation>
            <citation key="bib17">
              <journal_title>Plant Physiol</journal_title>
              <author>Nieminen</author>
              <volume>135</volume>
              <first_page>653</first_page>
              <cYear>2004</cYear>
              <article_title>A weed for wood? Arabidopsis as a genetic model for xylem development</article_title>
              <doi>10.1104/pp.104.040212</doi>
            </citation>
            <citation key="bib18">
              <journal_title>Nature Biotechnology</journal_title>
              <author>Noble</author>
              <volume>24</volume>
              <first_page>1565</first_page>
              <cYear>2006</cYear>
              <article_title>What is a support vector machine?</article_title>
              <doi>10.1038/nbt1206-1565</doi>
            </citation>
            <citation key="bib19">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Olson</author>
              <volume>77</volume>
              <first_page>1516</first_page>
              <cYear>1980</cYear>
              <article_title>Classification of cultured mammalian cells by shape analysis and pattern recognition</article_title>
              <doi>10.1073/pnas.77.3.1516</doi>
            </citation>
            <citation key="bib20">
              <journal_title>Bioinformatics</journal_title>
              <author>Pau</author>
              <volume>26</volume>
              <first_page>979</first_page>
              <cYear>2010</cYear>
              <article_title>EBImage–an R package for image processing with applications to cellular phenotypes</article_title>
              <doi>10.1093/bioinformatics/btq046</doi>
            </citation>
            <citation key="bib21">
              <journal_title>Plant Cell</journal_title>
              <author>Ragni</author>
              <volume>23</volume>
              <first_page>1322</first_page>
              <cYear>2011</cYear>
              <article_title>Mobile gibberellin directly stimulates Arabidopsis hypocotyl xylem expansion</article_title>
              <doi>10.1105/tpc.111.084020</doi>
            </citation>
            <citation key="bib22">
              <journal_title>Dryad Digital Repository</journal_title>
              <author>Sankar</author>
              <cYear>2014</cYear>
              <article_title>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</article_title>
              <doi>10.5061/dryad.b835k</doi>
            </citation>
            <citation key="bib23">
              <journal_title>Current Biology</journal_title>
              <author>Sibout</author>
              <volume>18</volume>
              <first_page>458</first_page>
              <cYear>2008</cYear>
              <article_title>Flowering as a condition for xylem expansion in Arabidopsis hypocotyl and root</article_title>
              <doi>10.1016/j.cub.2008.02.070</doi>
            </citation>
            <citation key="bib24">
              <journal_title>The New Phytologist</journal_title>
              <author>Spicer</author>
              <volume>186</volume>
              <first_page>577</first_page>
              <cYear>2010</cYear>
              <article_title>Evolution of development of vascular cambia and secondary growth</article_title>
              <doi>10.1111/j.1469-8137.2010.03236.x</doi>
            </citation>
            <citation key="bib25">
              <journal_title>Machine Vision and Applications</journal_title>
              <author>Theriault</author>
              <volume>23</volume>
              <first_page>659</first_page>
              <cYear>2012</cYear>
              <article_title>Cell morphology classification and clutter mitigation in phase-contrast microscopy images using machine learning</article_title>
              <doi>10.1007/s00138-011-0345-9</doi>
            </citation>
            <citation key="bib26">
              <journal_title>Cell</journal_title>
              <author>Uyttewaal</author>
              <volume>149</volume>
              <first_page>439</first_page>
              <cYear>2012</cYear>
              <article_title>Mechanical stress acts via katanin to amplify differences in growth rate between adjacent cells in Arabidopsis</article_title>
              <doi>10.1016/j.cell.2012.02.048</doi>
            </citation>
            <citation key="bib27">
              <journal_title>Nature Cell Biology</journal_title>
              <author>Yin</author>
              <volume>15</volume>
              <first_page>860</first_page>
              <cYear>2013</cYear>
              <article_title>A screen for morphological complexity identifies regulators of switch-like transitions between discrete cell shapes</article_title>
              <doi>10.1038/ncb2764</doi>
            </citation>
          </citation_list>
          <component_list>
            <component parent_relation="isPartOf">
              <titles>
                <title>Abstract</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.001</doi>
                <resource>https://elifesciences.org/articles/01567#abstract</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>eLife digest</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.002</doi>
                <resource>https://elifesciences.org/articles/01567#digest</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 1. Cellular level analysis of Arabidopsis hypocotyl secondary growth.</title>
                <subtitle>(A) Light microscopy of cross sections obtained from Arabidopsis hypocotyls (organ position illustrated for a 9-day-old seedling, lower left) at 9 dag (upper left) and 35 dag (right). Size bars are 100 μm. Blue GUS staining due to the presence of an APL::GUS reporter gene in this Col-0 background line marks phloem bundles. (B) Overview of the developmental series (time points and distinct samples per genotype) analyzed in this study. (C) Example of a high-resolution hypocotyl section image assembled from 11 × 11 tiles. (D) The same image after pre-processing and binarization, and (E) subsequent segmentation using a watershed algorithm. (F) Number of mis-segmented cells as determined by careful visual inspection in 12 sections, plotted against the total number of cells per section (log scale).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.003</doi>
                <resource>https://elifesciences.org/articles/01567#fig1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2. The ‘Quantitative Histology’ approach.</title>
                <subtitle>(A) Overview of the computational pipeline from image acquisition to analysis. (B) ‘Phenoprints’ for the different genotypes and developmental stages.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.004</doi>
                <resource>https://elifesciences.org/articles/01567#fig2</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2—figure supplement 1. An example of classifier selection through V-fold cross validation.</title>
                <subtitle>The green arrow points out the selected feature combination according to the criteria of minimum number of features with the highest performance and the lowest variation (the radiusV feature was excluded due to its putative variation in tissue location).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.005</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig2s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 3. Progression of tissue proliferation.</title>
                <subtitle>(A) Principal component analysis (PCA) of the phenoprints shown in Figure 2B, performed with normalized values (Supplementary file 4). The inlay screeplot displays the proportion of total variation explained by each principal component. (B–E) Comparative plots of parameter progression in the two genotypes. In (D), xylem represents combined vessel, parenchyma, and fiber cells, phloem represents combined phloem parenchyma and bundle cells. Error bars indicate standard error.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.006</doi>
                <resource>https://elifesciences.org/articles/01567#fig3</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4. Bimodal distribution of incline angle according to position.</title>
                <subtitle>(A and B) Spatial distribution of cell incline angle illustrates the vascular organization in Ler (B) as compared to Col-0 (A) at later stages of development, for example 30 dag. The size of the disc increases with the area of the cell. Blue color indicates radial cell orientation, red orthoradial. (C and D) Violin plots of incline angle distribution, illustrating increasingly bimodal distribution coincident with refined vascular organization and different dynamics of the process in the two genotypes.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.007</doi>
                <resource>https://elifesciences.org/articles/01567#fig4</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4—figure supplement 1. An illustration of the incline angle.</title>
                <subtitle>The incline is the angle between the section radius through the center of an ellipse fit to a cell and the major axis of that ellipse extended towards the x axis.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.008</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig4s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5. Distinct local organization of incline angle during hypocotyl secondary growth progression.</title>
                <subtitle>(A–J) Density plots of cell incline angle vs radial position for the two genotypes at the indicated developmental stages, representing all cells across all sections for a given time point. The red lines represent the fit of these cloud distributions with locally weighted linear regression (i.e., lowess), revealing the essential data trends. All sections were normalized from 0.0 (the manually defined center) to 1.0 (the average radius in a set of sections as determined by the average distance of the outermost cells from the center for individual sections). Box plots indicate the quartiles of the radian distribution for each cell-type class and are placed at the average position of the cell type with respect to the y axis. Outliers are shown as circles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.009</doi>
                <resource>https://elifesciences.org/articles/01567#fig5</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5—figure supplement 1. Analysis of cell number in defined xylem regions of different size.</title>
                <subtitle>Cell number in a circle of 200–500 pixels around the section centers for Col-0. Cell count in a constant area of xylem over time across all averaged across all sections.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.010</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig5s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 6. Mapping of phloem pole patterning.</title>
                <subtitle>(A) Example of Gaussian kernel density estimate of the location of predicted phloem bundles cells in a 30 dag Col-0 section. High density represents phloem poles. (B) Example of an analysis of emerging phloem pole position in a 30 dag Col-0 section. The plot represents a pixel intensity map after noise reduction along a circular region of interest across the emerging phloem poles. Intensity peaks are due to GUS staining conferred to phloem bundles by an APL::GUS reporter construct. (C) Probability density function of the data shown in (B) obtained from an automated Bayesian model. The dominant single peak indicates a constant arc distance of ca. 62 pixel between the phloem poles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.011</doi>
                <resource>https://elifesciences.org/articles/01567#fig6</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 1.</title>
                <subtitle>(A) An explanation of the extracted parameters that describe the cellular features. (B) Summary information of the hand-labeled training set for supervised machine learning. (C) Definition of the classifiers selected for analysis. (D) Summary of the classifier parameters for supervised machine learning. (E) Overview of the cell type classes recognized by the supervised machine learning approach and their assignment codes used in Data Files 3 and 4.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.012</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD1-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 2.</title>
                <subtitle>Quality control files for the Col-0 sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.013</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD2-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 3.</title>
                <subtitle>Quality control files for the Ler sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.014</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD3-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 4.</title>
                <subtitle>The normalized values of the phenoprints (Figure 2B) used for PCA.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.015</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD4-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Decision letter</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.016</doi>
                <resource>https://elifesciences.org/articles/01567#SA1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Author response</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.017</doi>
                <resource>https://elifesciences.org/articles/01567#SA2</resource>
              </doi_data>
            </component>
          </component_list>
        </journal_article>
      </journal>
    </crossref>
  </doi_record>
</doi_records> + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:49 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/updates_the_record.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/updates_the_record.yml new file mode 100644 index 000000000..8adeb834c --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/crossref_url/updates_the_record.yml @@ -0,0 +1,82 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7554 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 18:37:47 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - 40db2943-8f7f-4775-a41f-10509bc53c67 + Etag: + - W/"381993dc8a6b0f20960c96a3639c0284" + X-Runtime: + - '0.102270' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7554","type":"prefixes","attributes":{"registration-agency":"Crossref","created":null,"updated":"2016-09-21T21:07:27Z"},"relationships":{"clients":{"data":[]},"providers":{"data":[]}}},"included":[]}' + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:47 GMT +- request: + method: get + uri: http://www.crossref.org/openurl/?format=unixref&id=doi:10.7554/elife.01567&noredirect=true&pid=tech@datacite.org + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/xml + response: + status: + code: 200 + message: OK + headers: + Server: + - Apache-Coyote/1.1 + Crossref-Deployment-Name: + - cr6-1 + Content-Type: + - text/xml;charset=UTF-8 + Content-Language: + - en-US + Date: + - Fri, 07 Dec 2018 18:37:47 GMT + Connection: + - close + body: + encoding: ASCII-8BIT + string: !binary |- + <?xml version="1.0" encoding="UTF-8"?>
<doi_records>
  <doi_record owner="10.7554" timestamp="2018-08-23 09:41:49">
    <crossref>
      <journal>
        <journal_metadata language="en">
          <full_title>eLife</full_title>
          <issn media_type="electronic">2050-084X</issn>
        </journal_metadata>
        <journal_issue>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <journal_volume>
            <volume>3</volume>
          </journal_volume>
        </journal_issue>
        <journal_article publication_type="full_text" reference_distribution_opts="any">
          <titles>
            <title>Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</title>
          </titles>
          <contributors>
            <person_name contributor_role="author" sequence="first">
              <given_name>Martial</given_name>
              <surname>Sankar</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Kaisa</given_name>
              <surname>Nieminen</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Laura</given_name>
              <surname>Ragni</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Ioannis</given_name>
              <surname>Xenarios</surname>
              <affiliation>Vital-IT, Swiss Institute of Bioinformatics, Lausanne, Switzerland</affiliation>
            </person_name>
            <person_name contributor_role="author" sequence="additional">
              <given_name>Christian S</given_name>
              <surname>Hardtke</surname>
              <affiliation>Department of Plant Molecular Biology, University of Lausanne, Lausanne, Switzerland</affiliation>
            </person_name>
          </contributors>
          <abstract>
            <p>Among various advantages, their small size makes model organisms preferred subjects of investigation. Yet, even in model systems detailed analysis of numerous developmental processes at cellular level is severely hampered by their scale. For instance, secondary growth of Arabidopsis hypocotyls creates a radial pattern of highly specialized tissues that comprises several thousand cells starting from a few dozen. This dynamic process is difficult to follow because of its scale and because it can only be investigated invasively, precluding comprehensive understanding of the cell proliferation, differentiation, and patterning events involved. To overcome such limitation, we established an automated quantitative histology approach. We acquired hypocotyl cross-sections from tiled high-resolution images and extracted their information content using custom high-throughput image processing and segmentation. Coupled with automated cell type recognition through machine learning, we could establish a cellular resolution atlas that reveals vascular morphodynamics during secondary growth, for example equidistant phloem pole formation.</p>
          </abstract>
          <abstract abstract-type="executive-summary">
            <p>Our understanding of the living world has been advanced greatly by studies of ‘model organisms’, such as mice, zebrafish, and fruit flies. Studying these creatures has been crucial to uncovering the genes that control how our bodies develop and grow, and also to discover the genetic basis of diseases such as cancer.</p>
            <p>Thale cress—or Arabidopsis thaliana to give its formal name—is the model organism of choice for many plant biologists. This tiny weed has been widely studied because it can complete its lifecycle, from seed to seed, in about 6 weeks, and because its relatively small genome simplifies the search for genes that control specific traits. However, as with other much-studied model systems, understanding the changes that underpin the development of some of the more complex tissues in Arabidopsis has been severely hampered by the shear number of cells involved.</p>
            <p>After it has emerged from the seed, the plant’s first stem will develop from a few dozen cells in width to several thousand cells with highly specialized tissues arranged in a complex pattern of concentric circles. Although this stem thickening process represents a major developmental change in many plants—from Arabidopsis to oak trees—it has been under-researched. This is partly because it involves so many different cells, and also because it can only be observed in thin sections cut out of the plant’s stem.</p>
            <p>Now Sankar, Nieminen, Ragni et al. have developed a novel approach, termed ‘automated quantitative histology’, to overcome these problems. This strategy involves ‘teaching’ a computer to automatically recognize different plant cells and to measure their important features in high-resolution images of tissue sections. The resulting ‘map’ of the developing stem—which required over 800 hr of computing time to complete—reveals the changes to cells and tissues as they develop that allow the transport of water, sugars and nutrients between the above- and below-ground organs. Sankar, Nieminen, Ragni et al. suggest that their novel approach could, in the future, also be applied to study the development of other tissues and organisms, including animals.</p>
          </abstract>
          <publication_date media_type="online">
            <month>02</month>
            <day>11</day>
            <year>2014</year>
          </publication_date>
          <publisher_item>
            <item_number item_number_type="article_number">e01567</item_number>
            <identifier id_type="doi">10.7554/eLife.01567</identifier>
          </publisher_item>
          <program name="fundref">
            <assertion name="fundgroup">
              <assertion name="funder_name">SystemsX</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">EMBO longterm post-doctoral fellowships</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">Marie Heim-Voegtlin</assertion>
            </assertion>
            <assertion name="fundgroup">
              <assertion name="funder_name">
                University of Lausanne
                <assertion name="funder_identifier" provider="crossref">501100006390</assertion>
              </assertion>
            </assertion>
          </program>
          <program name="AccessIndicators">
            <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
            <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
          </program>
          <crossmark>
            <crossmark_version>1</crossmark_version>
            <crossmark_policy>eLifesciences</crossmark_policy>
            <crossmark_domains>
              <crossmark_domain>
                <domain>www.elifesciences.org</domain>
              </crossmark_domain>
            </crossmark_domains>
            <crossmark_domain_exclusive>false</crossmark_domain_exclusive>
            <custom_metadata>
              <assertion name="received" label="Received" group_name="publication_history" group_label="Publication History" order="0">2013-09-20</assertion>
              <assertion name="accepted" label="Accepted" group_name="publication_history" group_label="Publication History" order="1">2013-12-24</assertion>
              <assertion name="published" label="Published" group_name="publication_history" group_label="Publication History" order="2">2014-02-11</assertion>
              <program name="fundref">
                <assertion name="fundgroup">
                  <assertion name="funder_name">SystemsX</assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    EMBO
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100003043</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    Swiss National Science Foundation
                    <assertion name="funder_identifier">http://dx.doi.org/10.13039/501100001711</assertion>
                  </assertion>
                </assertion>
                <assertion name="fundgroup">
                  <assertion name="funder_name">
                    University of Lausanne
                    <assertion name="funder_identifier" provider="crossref">http://dx.doi.org/10.13039/501100006390</assertion>
                  </assertion>
                </assertion>
              </program>
              <program name="AccessIndicators">
                <license_ref applies_to="vor">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="am">http://creativecommons.org/licenses/by/3.0/</license_ref>
                <license_ref applies_to="tdm">http://creativecommons.org/licenses/by/3.0/</license_ref>
              </program>
            </custom_metadata>
          </crossmark>
          <program>
            <related_item>
              <description>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</description>
              <inter_work_relation identifier-type="doi" relationship-type="isSupplementedBy">10.5061/dryad.b835k</inter_work_relation>
            </related_item>
          </program>
          <archive_locations>
            <archive name="CLOCKSS" />
          </archive_locations>
          <doi_data>
            <doi>10.7554/eLife.01567</doi>
            <resource>https://elifesciences.org/articles/01567</resource>
            <collection property="text-mining">
              <item>
                <resource mime_type="application/pdf">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.pdf</resource>
              </item>
              <item>
                <resource mime_type="application/xml">https://cdn.elifesciences.org/articles/01567/elife-01567-v1.xml</resource>
              </item>
            </collection>
          </doi_data>
          <citation_list>
            <citation key="bib1">
              <journal_title>Nature</journal_title>
              <author>Bonke</author>
              <volume>426</volume>
              <first_page>181</first_page>
              <cYear>2003</cYear>
              <article_title>APL regulates vascular tissue identity in Arabidopsis</article_title>
              <doi>10.1038/nature02100</doi>
            </citation>
            <citation key="bib2">
              <journal_title>Genetics</journal_title>
              <author>Brenner</author>
              <volume>182</volume>
              <first_page>413</first_page>
              <cYear>2009</cYear>
              <article_title>In the beginning was the worm</article_title>
              <doi>10.1534/genetics.109.104976</doi>
            </citation>
            <citation key="bib3">
              <journal_title>Physiologia Plantarum</journal_title>
              <author>Chaffey</author>
              <volume>114</volume>
              <first_page>594</first_page>
              <cYear>2002</cYear>
              <article_title>Secondary xylem development in Arabidopsis: a model for wood formation</article_title>
              <doi>10.1034/j.1399-3054.2002.1140413.x</doi>
            </citation>
            <citation key="bib4">
              <journal_title>Neural computation</journal_title>
              <author>Chang</author>
              <volume>13</volume>
              <first_page>2119</first_page>
              <cYear>2001</cYear>
              <article_title>Training nu-support vector classifiers: theory and algorithms</article_title>
              <doi>10.1162/089976601750399335</doi>
            </citation>
            <citation key="bib5">
              <journal_title>Machine Learning</journal_title>
              <author>Cortes</author>
              <volume>20</volume>
              <first_page>273</first_page>
              <cYear>1995</cYear>
              <doi provider="crossref">10.1007/BF00994018</doi>
              <article_title>Support-vector Networks</article_title>
            </citation>
            <citation key="bib6">
              <journal_title>Development</journal_title>
              <author>Dolan</author>
              <volume>119</volume>
              <first_page>71</first_page>
              <cYear>1993</cYear>
              <article_title>Cellular organisation of the Arabidopsis thaliana root</article_title>
            </citation>
            <citation key="bib7">
              <journal_title>Seminars in Cell &amp; Developmental Biology</journal_title>
              <author>Elo</author>
              <volume>20</volume>
              <first_page>1097</first_page>
              <cYear>2009</cYear>
              <article_title>Stem cell function during plant vascular development</article_title>
              <doi>10.1016/j.semcdb.2009.09.009</doi>
            </citation>
            <citation key="bib8">
              <journal_title>Development</journal_title>
              <author>Etchells</author>
              <volume>140</volume>
              <first_page>2224</first_page>
              <cYear>2013</cYear>
              <article_title>WOX4 and WOX14 act downstream of the PXY receptor kinase to regulate plant vascular proliferation independently of any role in vascular organisation</article_title>
              <doi>10.1242/dev.091314</doi>
            </citation>
            <citation key="bib9">
              <journal_title>PLOS Genetics</journal_title>
              <author>Etchells</author>
              <volume>8</volume>
              <first_page>e1002997</first_page>
              <cYear>2012</cYear>
              <article_title>Plant vascular cell division is maintained by an interaction between PXY and ethylene signalling</article_title>
              <doi>10.1371/journal.pgen.1002997</doi>
            </citation>
            <citation key="bib10">
              <journal_title>Molecular Systems Biology</journal_title>
              <author>Fuchs</author>
              <volume>6</volume>
              <first_page>370</first_page>
              <cYear>2010</cYear>
              <article_title>Clustering phenotype populations by genome-wide RNAi and multiparametric imaging</article_title>
              <doi>10.1038/msb.2010.25</doi>
            </citation>
            <citation key="bib11">
              <journal_title>Bio Systems</journal_title>
              <author>Granqvist</author>
              <volume>110</volume>
              <first_page>60</first_page>
              <cYear>2012</cYear>
              <article_title>BaSAR-A tool in R for frequency detection</article_title>
              <doi>10.1016/j.biosystems.2012.07.004</doi>
            </citation>
            <citation key="bib12">
              <journal_title>Current Opinion in Plant Biology</journal_title>
              <author>Groover</author>
              <volume>9</volume>
              <first_page>55</first_page>
              <cYear>2006</cYear>
              <article_title>Developmental mechanisms regulating secondary growth in woody plants</article_title>
              <doi>10.1016/j.pbi.2005.11.013</doi>
            </citation>
            <citation key="bib13">
              <journal_title>Plant Cell</journal_title>
              <author>Hirakawa</author>
              <volume>22</volume>
              <first_page>2618</first_page>
              <cYear>2010</cYear>
              <article_title>TDIF peptide signaling regulates vascular stem cell proliferation via the WOX4 homeobox gene in Arabidopsis</article_title>
              <doi>10.1105/tpc.110.076083</doi>
            </citation>
            <citation key="bib14">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Hirakawa</author>
              <volume>105</volume>
              <first_page>15208</first_page>
              <cYear>2008</cYear>
              <article_title>Non-cell-autonomous control of vascular stem cell fate by a CLE peptide/receptor system</article_title>
              <doi>10.1073/pnas.0808444105</doi>
            </citation>
            <citation key="bib15">
              <journal_title>Cell</journal_title>
              <author>Meyerowitz</author>
              <volume>56</volume>
              <first_page>263</first_page>
              <cYear>1989</cYear>
              <article_title>Arabidopsis, a useful weed</article_title>
              <doi>10.1016/0092-8674(89)90900-8</doi>
            </citation>
            <citation key="bib16">
              <journal_title>Science</journal_title>
              <author>Meyerowitz</author>
              <volume>295</volume>
              <first_page>1482</first_page>
              <cYear>2002</cYear>
              <article_title>Plants compared to animals: the broadest comparative study of development</article_title>
              <doi>10.1126/science.1066609</doi>
            </citation>
            <citation key="bib17">
              <journal_title>Plant Physiol</journal_title>
              <author>Nieminen</author>
              <volume>135</volume>
              <first_page>653</first_page>
              <cYear>2004</cYear>
              <article_title>A weed for wood? Arabidopsis as a genetic model for xylem development</article_title>
              <doi>10.1104/pp.104.040212</doi>
            </citation>
            <citation key="bib18">
              <journal_title>Nature Biotechnology</journal_title>
              <author>Noble</author>
              <volume>24</volume>
              <first_page>1565</first_page>
              <cYear>2006</cYear>
              <article_title>What is a support vector machine?</article_title>
              <doi>10.1038/nbt1206-1565</doi>
            </citation>
            <citation key="bib19">
              <journal_title>Proceedings of the National Academy of Sciences of the United States of America</journal_title>
              <author>Olson</author>
              <volume>77</volume>
              <first_page>1516</first_page>
              <cYear>1980</cYear>
              <article_title>Classification of cultured mammalian cells by shape analysis and pattern recognition</article_title>
              <doi>10.1073/pnas.77.3.1516</doi>
            </citation>
            <citation key="bib20">
              <journal_title>Bioinformatics</journal_title>
              <author>Pau</author>
              <volume>26</volume>
              <first_page>979</first_page>
              <cYear>2010</cYear>
              <article_title>EBImage–an R package for image processing with applications to cellular phenotypes</article_title>
              <doi>10.1093/bioinformatics/btq046</doi>
            </citation>
            <citation key="bib21">
              <journal_title>Plant Cell</journal_title>
              <author>Ragni</author>
              <volume>23</volume>
              <first_page>1322</first_page>
              <cYear>2011</cYear>
              <article_title>Mobile gibberellin directly stimulates Arabidopsis hypocotyl xylem expansion</article_title>
              <doi>10.1105/tpc.111.084020</doi>
            </citation>
            <citation key="bib22">
              <journal_title>Dryad Digital Repository</journal_title>
              <author>Sankar</author>
              <cYear>2014</cYear>
              <article_title>Data from: Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth</article_title>
              <doi>10.5061/dryad.b835k</doi>
            </citation>
            <citation key="bib23">
              <journal_title>Current Biology</journal_title>
              <author>Sibout</author>
              <volume>18</volume>
              <first_page>458</first_page>
              <cYear>2008</cYear>
              <article_title>Flowering as a condition for xylem expansion in Arabidopsis hypocotyl and root</article_title>
              <doi>10.1016/j.cub.2008.02.070</doi>
            </citation>
            <citation key="bib24">
              <journal_title>The New Phytologist</journal_title>
              <author>Spicer</author>
              <volume>186</volume>
              <first_page>577</first_page>
              <cYear>2010</cYear>
              <article_title>Evolution of development of vascular cambia and secondary growth</article_title>
              <doi>10.1111/j.1469-8137.2010.03236.x</doi>
            </citation>
            <citation key="bib25">
              <journal_title>Machine Vision and Applications</journal_title>
              <author>Theriault</author>
              <volume>23</volume>
              <first_page>659</first_page>
              <cYear>2012</cYear>
              <article_title>Cell morphology classification and clutter mitigation in phase-contrast microscopy images using machine learning</article_title>
              <doi>10.1007/s00138-011-0345-9</doi>
            </citation>
            <citation key="bib26">
              <journal_title>Cell</journal_title>
              <author>Uyttewaal</author>
              <volume>149</volume>
              <first_page>439</first_page>
              <cYear>2012</cYear>
              <article_title>Mechanical stress acts via katanin to amplify differences in growth rate between adjacent cells in Arabidopsis</article_title>
              <doi>10.1016/j.cell.2012.02.048</doi>
            </citation>
            <citation key="bib27">
              <journal_title>Nature Cell Biology</journal_title>
              <author>Yin</author>
              <volume>15</volume>
              <first_page>860</first_page>
              <cYear>2013</cYear>
              <article_title>A screen for morphological complexity identifies regulators of switch-like transitions between discrete cell shapes</article_title>
              <doi>10.1038/ncb2764</doi>
            </citation>
          </citation_list>
          <component_list>
            <component parent_relation="isPartOf">
              <titles>
                <title>Abstract</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.001</doi>
                <resource>https://elifesciences.org/articles/01567#abstract</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>eLife digest</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.002</doi>
                <resource>https://elifesciences.org/articles/01567#digest</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 1. Cellular level analysis of Arabidopsis hypocotyl secondary growth.</title>
                <subtitle>(A) Light microscopy of cross sections obtained from Arabidopsis hypocotyls (organ position illustrated for a 9-day-old seedling, lower left) at 9 dag (upper left) and 35 dag (right). Size bars are 100 μm. Blue GUS staining due to the presence of an APL::GUS reporter gene in this Col-0 background line marks phloem bundles. (B) Overview of the developmental series (time points and distinct samples per genotype) analyzed in this study. (C) Example of a high-resolution hypocotyl section image assembled from 11 × 11 tiles. (D) The same image after pre-processing and binarization, and (E) subsequent segmentation using a watershed algorithm. (F) Number of mis-segmented cells as determined by careful visual inspection in 12 sections, plotted against the total number of cells per section (log scale).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.003</doi>
                <resource>https://elifesciences.org/articles/01567#fig1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2. The ‘Quantitative Histology’ approach.</title>
                <subtitle>(A) Overview of the computational pipeline from image acquisition to analysis. (B) ‘Phenoprints’ for the different genotypes and developmental stages.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.004</doi>
                <resource>https://elifesciences.org/articles/01567#fig2</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 2—figure supplement 1. An example of classifier selection through V-fold cross validation.</title>
                <subtitle>The green arrow points out the selected feature combination according to the criteria of minimum number of features with the highest performance and the lowest variation (the radiusV feature was excluded due to its putative variation in tissue location).</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.005</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig2s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 3. Progression of tissue proliferation.</title>
                <subtitle>(A) Principal component analysis (PCA) of the phenoprints shown in Figure 2B, performed with normalized values (Supplementary file 4). The inlay screeplot displays the proportion of total variation explained by each principal component. (B–E) Comparative plots of parameter progression in the two genotypes. In (D), xylem represents combined vessel, parenchyma, and fiber cells, phloem represents combined phloem parenchyma and bundle cells. Error bars indicate standard error.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.006</doi>
                <resource>https://elifesciences.org/articles/01567#fig3</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4. Bimodal distribution of incline angle according to position.</title>
                <subtitle>(A and B) Spatial distribution of cell incline angle illustrates the vascular organization in Ler (B) as compared to Col-0 (A) at later stages of development, for example 30 dag. The size of the disc increases with the area of the cell. Blue color indicates radial cell orientation, red orthoradial. (C and D) Violin plots of incline angle distribution, illustrating increasingly bimodal distribution coincident with refined vascular organization and different dynamics of the process in the two genotypes.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.007</doi>
                <resource>https://elifesciences.org/articles/01567#fig4</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 4—figure supplement 1. An illustration of the incline angle.</title>
                <subtitle>The incline is the angle between the section radius through the center of an ellipse fit to a cell and the major axis of that ellipse extended towards the x axis.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.008</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig4s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5. Distinct local organization of incline angle during hypocotyl secondary growth progression.</title>
                <subtitle>(A–J) Density plots of cell incline angle vs radial position for the two genotypes at the indicated developmental stages, representing all cells across all sections for a given time point. The red lines represent the fit of these cloud distributions with locally weighted linear regression (i.e., lowess), revealing the essential data trends. All sections were normalized from 0.0 (the manually defined center) to 1.0 (the average radius in a set of sections as determined by the average distance of the outermost cells from the center for individual sections). Box plots indicate the quartiles of the radian distribution for each cell-type class and are placed at the average position of the cell type with respect to the y axis. Outliers are shown as circles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.009</doi>
                <resource>https://elifesciences.org/articles/01567#fig5</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 5—figure supplement 1. Analysis of cell number in defined xylem regions of different size.</title>
                <subtitle>Cell number in a circle of 200–500 pixels around the section centers for Col-0. Cell count in a constant area of xylem over time across all averaged across all sections.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.010</doi>
                <resource>https://elifesciences.org/articles/01567/figures#fig5s1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Figure 6. Mapping of phloem pole patterning.</title>
                <subtitle>(A) Example of Gaussian kernel density estimate of the location of predicted phloem bundles cells in a 30 dag Col-0 section. High density represents phloem poles. (B) Example of an analysis of emerging phloem pole position in a 30 dag Col-0 section. The plot represents a pixel intensity map after noise reduction along a circular region of interest across the emerging phloem poles. Intensity peaks are due to GUS staining conferred to phloem bundles by an APL::GUS reporter construct. (C) Probability density function of the data shown in (B) obtained from an automated Bayesian model. The dominant single peak indicates a constant arc distance of ca. 62 pixel between the phloem poles.</subtitle>
              </titles>
              <format mime_type="image/tiff" />
              <doi_data>
                <doi>10.7554/eLife.01567.011</doi>
                <resource>https://elifesciences.org/articles/01567#fig6</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 1.</title>
                <subtitle>(A) An explanation of the extracted parameters that describe the cellular features. (B) Summary information of the hand-labeled training set for supervised machine learning. (C) Definition of the classifiers selected for analysis. (D) Summary of the classifier parameters for supervised machine learning. (E) Overview of the cell type classes recognized by the supervised machine learning approach and their assignment codes used in Data Files 3 and 4.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.012</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD1-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 2.</title>
                <subtitle>Quality control files for the Col-0 sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.013</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD2-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 3.</title>
                <subtitle>Quality control files for the Ler sections.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.014</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD3-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Supplementary file 4.</title>
                <subtitle>The normalized values of the phenoprints (Figure 2B) used for PCA.</subtitle>
              </titles>
              <format mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" />
              <doi_data>
                <doi>10.7554/eLife.01567.015</doi>
                <resource>https://elifesciences.org/articles/01567/figures#SD4-data</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Decision letter</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.016</doi>
                <resource>https://elifesciences.org/articles/01567#SA1</resource>
              </doi_data>
            </component>
            <component parent_relation="isPartOf">
              <titles>
                <title>Author response</title>
              </titles>
              <format mime_type="text/plain" />
              <doi_data>
                <doi>10.7554/eLife.01567.017</doi>
                <resource>https://elifesciences.org/articles/01567#SA2</resource>
              </doi_data>
            </component>
          </component_list>
        </journal_article>
      </journal>
    </crossref>
  </doi_record>
</doi_records> + http_version: + recorded_at: Fri, 07 Dec 2018 18:37:47 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/returns_status_code_201.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/returns_status_code_201.yml new file mode 100644 index 000000000..87116cfa3 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/returns_status_code_201.yml @@ -0,0 +1,99 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7272 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:13 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - 735adba6-fb5e-4444-be96-bb0a75401b71 + Etag: + - W/"434d63d02889e47275389a930375c569" + X-Runtime: + - '0.023537' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7272","type":"prefixes","attributes":{"registration-agency":"DataCite","created":"2012-03-15T09:47:35.000Z","updated":null},"relationships":{"clients":{"data":[{"id":"cdl.ucsfctsi","type":"clients"}]},"providers":{"data":[{"id":"cdl","type":"providers"}]}}},"included":[{"id":"cdl.ucsfctsi","type":"clients","attributes":{"name":"UCSF + Clinical & Translational Science Institute (CTSI)","symbol":"CDL.UCSFCTSI","year":2012,"contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","domains":"*","url":null,"created":"2012-07-10T20:59:53.000Z","updated":"2018-08-26T02:35:12.000Z","is-active":true,"has-password":true},"relationships":{"provider":{"data":{"id":"cdl","type":"providers"}},"prefixes":{"data":[{"id":"10.5072","type":"prefixes"},{"id":"10.7272","type":"prefixes"}]}}},{"id":"cdl","type":"providers","attributes":{"name":"California + Digital Library","symbol":"CDL","website":"http://ezid.cdlib.org","contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","phone":null,"description":"California + Digital Library (CDL) handles scholarly information at every stage of its + life. CDL provides technology and expertise to help the University of California + (UC) collect, publish, access, and preserve its full range of information + resources. CDL partners with organizations outside the UCs on far-reaching + problems.\n\nCDL offers DataCite DOIs to University of California scholars + and researchers via the EZID service. EZID is also available as a general + identifier service to help educational, non-profit, governmental and commercial + clients create and manage globally unique identifiers for data and other sources.","region":"AMER","country":"US","logo-url":"https://assets.datacite.org/images/members/cdl.png","organization-type":"academic_institution","focus-area":"general","is-active":true,"has-password":true,"joined":"2009-12-01","created":"2010-01-01T00:00:00.000Z","updated":"2018-10-24T20:47:51.000Z"},"relationships":{"prefixes":{"data":[{"id":"10.5062","type":"prefixes"},{"id":"10.5063","type":"prefixes"},{"id":"10.5065","type":"prefixes"},{"id":"10.5068","type":"prefixes"},{"id":"10.5069","type":"prefixes"},{"id":"10.5070","type":"prefixes"},{"id":"10.5072","type":"prefixes"},{"id":"10.6071","type":"prefixes"},{"id":"10.6072","type":"prefixes"},{"id":"10.6074","type":"prefixes"},{"id":"10.6075","type":"prefixes"},{"id":"10.6076","type":"prefixes"},{"id":"10.6078","type":"prefixes"},{"id":"10.6079","type":"prefixes"},{"id":"10.6080","type":"prefixes"},{"id":"10.6081","type":"prefixes"},{"id":"10.6085","type":"prefixes"},{"id":"10.6086","type":"prefixes"},{"id":"10.7265","type":"prefixes"},{"id":"10.7268","type":"prefixes"},{"id":"10.7269","type":"prefixes"},{"id":"10.7270","type":"prefixes"},{"id":"10.7271","type":"prefixes"},{"id":"10.7272","type":"prefixes"},{"id":"10.7276","type":"prefixes"},{"id":"10.7279","type":"prefixes"},{"id":"10.7280","type":"prefixes"},{"id":"10.7281","type":"prefixes"},{"id":"10.7282","type":"prefixes"},{"id":"10.7284","type":"prefixes"},{"id":"10.7285","type":"prefixes"},{"id":"10.7286","type":"prefixes"},{"id":"10.7288","type":"prefixes"},{"id":"10.7291","type":"prefixes"},{"id":"10.7292","type":"prefixes"},{"id":"10.7293","type":"prefixes"},{"id":"10.7295","type":"prefixes"},{"id":"10.7296","type":"prefixes"},{"id":"10.7297","type":"prefixes"},{"id":"10.7299","type":"prefixes"},{"id":"10.7300","type":"prefixes"},{"id":"10.4246","type":"prefixes"},{"id":"10.7908","type":"prefixes"},{"id":"10.7911","type":"prefixes"},{"id":"10.7913","type":"prefixes"},{"id":"10.7914","type":"prefixes"},{"id":"10.7916","type":"prefixes"},{"id":"10.7918","type":"prefixes"},{"id":"10.7919","type":"prefixes"},{"id":"10.7920","type":"prefixes"},{"id":"10.7921","type":"prefixes"},{"id":"10.7922","type":"prefixes"},{"id":"10.7925","type":"prefixes"},{"id":"10.7927","type":"prefixes"},{"id":"10.7928","type":"prefixes"},{"id":"10.7929","type":"prefixes"},{"id":"10.7932","type":"prefixes"},{"id":"10.7933","type":"prefixes"},{"id":"10.7934","type":"prefixes"},{"id":"10.7939","type":"prefixes"},{"id":"10.7940","type":"prefixes"},{"id":"10.7941","type":"prefixes"},{"id":"10.7942","type":"prefixes"},{"id":"10.7943","type":"prefixes"},{"id":"10.7944","type":"prefixes"},{"id":"10.7945","type":"prefixes"},{"id":"10.7946","type":"prefixes"},{"id":"10.13022","type":"prefixes"},{"id":"10.13026","type":"prefixes"},{"id":"10.13025","type":"prefixes"},{"id":"10.15147","type":"prefixes"},{"id":"10.15146","type":"prefixes"},{"id":"10.15142","type":"prefixes"},{"id":"10.15144","type":"prefixes"},{"id":"10.15145","type":"prefixes"},{"id":"10.15140","type":"prefixes"},{"id":"10.15141","type":"prefixes"},{"id":"10.15139","type":"prefixes"},{"id":"10.1184","type":"prefixes"},{"id":"10.15784","type":"prefixes"},{"id":"10.15779","type":"prefixes"},{"id":"10.15780","type":"prefixes"},{"id":"10.15781","type":"prefixes"},{"id":"10.15782","type":"prefixes"},{"id":"10.17612","type":"prefixes"},{"id":"10.17610","type":"prefixes"},{"id":"10.17611","type":"prefixes"},{"id":"10.17614","type":"prefixes"},{"id":"10.17615","type":"prefixes"},{"id":"10.17602","type":"prefixes"},{"id":"10.17603","type":"prefixes"},{"id":"10.17908","type":"prefixes"},{"id":"10.17916","type":"prefixes"},{"id":"10.17915","type":"prefixes"},{"id":"10.17918","type":"prefixes"},{"id":"10.17919","type":"prefixes"},{"id":"10.17911","type":"prefixes"},{"id":"10.17913","type":"prefixes"},{"id":"10.17920","type":"prefixes"},{"id":"10.18123","type":"prefixes"},{"id":"10.18119","type":"prefixes"},{"id":"10.18118","type":"prefixes"},{"id":"10.18117","type":"prefixes"},{"id":"10.18115","type":"prefixes"},{"id":"10.18431","type":"prefixes"},{"id":"10.18436","type":"prefixes"},{"id":"10.18437","type":"prefixes"},{"id":"10.18439","type":"prefixes"},{"id":"10.18737","type":"prefixes"},{"id":"10.18736","type":"prefixes"},{"id":"10.18739","type":"prefixes"},{"id":"10.18734","type":"prefixes"},{"id":"10.20353","type":"prefixes"},{"id":"10.20354","type":"prefixes"},{"id":"10.20352","type":"prefixes"},{"id":"10.20357","type":"prefixes"},{"id":"10.20358","type":"prefixes"},{"id":"10.20359","type":"prefixes"},{"id":"10.21228","type":"prefixes"},{"id":"10.21229","type":"prefixes"},{"id":"10.21224","type":"prefixes"},{"id":"10.21222","type":"prefixes"},{"id":"10.21223","type":"prefixes"},{"id":"10.21221","type":"prefixes"},{"id":"10.21237","type":"prefixes"},{"id":"10.21238","type":"prefixes"},{"id":"10.21239","type":"prefixes"},{"id":"10.21236","type":"prefixes"},{"id":"10.21430","type":"prefixes"},{"id":"10.21433","type":"prefixes"},{"id":"10.21431","type":"prefixes"},{"id":"10.21421","type":"prefixes"},{"id":"10.21422","type":"prefixes"},{"id":"10.21424","type":"prefixes"},{"id":"10.21425","type":"prefixes"},{"id":"10.21426","type":"prefixes"},{"id":"10.21427","type":"prefixes"},{"id":"10.21428","type":"prefixes"},{"id":"10.21418","type":"prefixes"},{"id":"10.21416","type":"prefixes"},{"id":"10.21414","type":"prefixes"},{"id":"10.21972","type":"prefixes"},{"id":"10.21973","type":"prefixes"},{"id":"10.21975","type":"prefixes"},{"id":"10.21976","type":"prefixes"},{"id":"10.21977","type":"prefixes"},{"id":"10.21978","type":"prefixes"},{"id":"10.21990","type":"prefixes"},{"id":"10.21983","type":"prefixes"},{"id":"10.21980","type":"prefixes"},{"id":"10.21986","type":"prefixes"},{"id":"10.5195","type":"prefixes"},{"id":"10.25334","type":"prefixes"},{"id":"10.25337","type":"prefixes"},{"id":"10.25338","type":"prefixes"},{"id":"10.25342","type":"prefixes"},{"id":"10.25349","type":"prefixes"},{"id":"10.25348","type":"prefixes"},{"id":"10.25347","type":"prefixes"},{"id":"10.25346","type":"prefixes"},{"id":"10.25345","type":"prefixes"},{"id":"10.25344","type":"prefixes"},{"id":"10.25352","type":"prefixes"},{"id":"10.25350","type":"prefixes"},{"id":"10.25351","type":"prefixes"},{"id":"10.26081","type":"prefixes"}]}}}]}' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:13 GMT +- request: + method: get + uri: https://search.test.datacite.org/api?fl=doi,url,xml,state,allocator_symbol,datacentre_symbol,media,minted,updated&q=doi:10.7272/q6g15xs4&wt=json + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:13 GMT + Content-Type: + - application/json;charset=UTF-8 + Connection: + - keep-alive + Server: + - nginx/1.10.3 (Ubuntu) + Access-Control-Allow-Origin: + - "*" + Access-Control-Allow-Methods: + - GET, POST, PUT, DELETE, OPTIONS + Access-Control-Allow-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + Access-Control-Expose-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + body: + encoding: ASCII-8BIT + string: '{"responseHeader":{"status":0,"QTime":0},"response":{"numFound":1,"start":0,"docs":[{"datacentre_symbol":"CDL.UCSFCTSI","url":"https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4","xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz4KPHJlc291cmNlIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC0zL21ldGFkYXRhLnhzZCI+CiAgPGlkZW50aWZpZXIgaWRlbnRpZmllclR5cGU9IkRPSSI+MTAuNzI3Mi9RNkcxNVhTNDwvaWRlbnRpZmllcj4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lPlJvZHJpZ3VleiwgUm9iZXJ0PC9jcmVhdG9yTmFtZT4KICAgICAgPGFmZmlsaWF0aW9uPlVDIFNhbiBGcmFuY2lzY288L2FmZmlsaWF0aW9uPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZT5Nb3dlciwgV2lsbGlhbTwvY3JlYXRvck5hbWU+CiAgICAgIDxhZmZpbGlhdGlvbj5VQ0xBPC9hZmZpbGlhdGlvbj4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+TkVYVVMgSGVhZCBDVDwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5VQyBTYW4gRnJhbmNpc2NvPC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+CiAgPGxhbmd1YWdlPmVuPC9sYW5ndWFnZT4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IkRhdGFzZXQiLz4KICA8c2l6ZXM+CiAgICA8c2l6ZT4xNDk1MjA0IGJ5dGVzPC9zaXplPgogIDwvc2l6ZXM+CiAgPHZlcnNpb24+MTwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwczovL2NyZWF0aXZlY29tbW9ucy5vcmcvbGljZW5zZXMvYnkvNC4wLyI+Q3JlYXRpdmUgQ29tbW9ucyBBdHRyaWJ1dGlvbiA0LjAgSW50ZXJuYXRpb25hbCAoQ0MgQlkgNC4wKTwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPgogICAgICBCYWNrZ3JvdW5kIENsaW5pY2lhbnMsIGFmcmFpZCBvZiBtaXNzaW5nIGludHJhY3JhbmlhbCBpbmp1cmllcywgbGliZXJhbGx5CiAgICAgIG9idGFpbiBjb21wdXRlZCB0b21vZ3JhcGhpYyAoQ1QpIGhlYWQgaW1hZ2luZyBpbiBibHVudCB0cmF1bWEgcGF0aWVudHMuCiAgICAgIFByaW9yIHdvcmsgc3VnZ2VzdHMgdGhhdCBjbGluaWNhbCBjcml0ZXJpYSAoTkVYVVMgSGVhZCBDVCBkZWNpc2lvbgogICAgICBpbnN0cnVtZW50KSBjYW4gcmVsaWFibHkgaWRlbnRpZnkgcGF0aWVudHMgd2l0aCBpbXBvcnRhbnQgaW5qdXJpZXMsIHdoaWxlCiAgICAgIGV4Y2x1ZGluZyBpbmp1cnksIGFuZCB0aGUgbmVlZCBmb3IgaW1hZ2luZyBpbiBtYW55IHBhdGllbnRzLiBNZXRob2RzIFdlCiAgICAgIGNvbmR1Y3RlZCBhIHByb3NwZWN0aXZlIG9ic2VydmF0aW9uYWwgc3R1ZHkgb2YgdGhlIE5FWFVTIEhlYWQgQ1QgZGVjaXNpb24KICAgICAgaW5zdHJ1bWVudCAoREkpIHRoYXQgcmVxdWlyZXMgcGF0aWVudHMgdG8gbWVldCBlaWdodCBjcml0ZXJpYSB0byBhY2hpZXZlCiAgICAgIOKAnGxvdy1yaXNr4oCdIGNsYXNzaWZpY2F0aW9uLiBXZSBleGFtaW5lZCB0aGUgaW5zdHJ1bWVudOKAmXMgcGVyZm9ybWFuY2UgaW4KICAgICAgaWRlbnRpZnlpbmcgcGF0aWVudHMgcmVxdWlyaW5nIG5ldXJvbG9naWNhbCBpbnRlcnZlbnRpb24gZnJvbSBhbW9uZyBhCiAgICAgIGNvaG9ydCBvZiAxMSw3NzAgYmx1bnQgaGVhZCBpbmp1cnkgcGF0aWVudHMuIFJlc3VsdHMgVGhlIE5FWFVTIEhlYWQgQ1QgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA0MjAgb2YgNDIwIHBhdGllbnRzIHJlcXVpcmluZyBuZXVyb2xvZ2ljYWwKICAgICAgaW50ZXJ2ZW50aW9uIChzZW5zaXRpdml0eSwgMTAwLjAlIFs5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBbQ0ldOiA5OS4xJSDigJMKICAgICAgMTAwLjAlXSkuIFRoZSBpbnN0cnVtZW50IGFzc2lnbmVkIGxvdy1yaXNrIHN0YXR1cyB0byAyLDgyMyBvZiAxMSwzNTAKICAgICAgcGF0aWVudHMgd2hvIGRpZCBub3QgcmVxdWlyZSBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChzcGVjaWZpY2l0eSwgMjQuOSUKICAgICAgWzk1JSBDSTogMjQuMSUgLSAyNS43JV0pLiBOb25lIG9mIHRoZSAyLDgyMyBsb3ctcmlzayBwYXRpZW50cyByZXF1aXJlZAogICAgICBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChOUFYsIDEwMC4wJSBbOTUlIENJOiA5OS45JSAtIDEwMC4wJV0pLiBUaGUgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA3NTkgb2YgNzY3IHBhdGllbnRzIHdpdGggc2lnbmlmaWNhbnQKICAgICAgaW50cmFjcmFuaWFsIGluanVyaWVzIChzZW5zaXRpdml0eSwgOTkuMCUgWzk1JSBDSTogOTguMCUgLSA5OS42JV0pLiBUaGUKICAgICAgaW5zdHJ1bWVudCBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgdG8gMiw4MTUgb2YgMTEsMDAzIHBhdGllbnRzIHdobyBkaWQKICAgICAgbm90IGhhdmUgc2lnbmlmaWNhbnQgaW5qdXJpZXMgKHNwZWNpZmljaXR5LCAyNS42JSBbOTUlIENJOiAyNC44JSAtCiAgICAgIDI2LjQlXSkuIFNpZ25pZmljYW50IGluanVyaWVzIHdlcmUgYWJzZW50IGluIDIsODE1IG9mIHRoZSAyLDgyMyBwYXRpZW50cwogICAgICBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgKE5QViwgOTkuNyUgWzk1JSBDSTogOTkuNCUgLSA5OS45JV0pLiBDb25jbHVzaW9ucwogICAgICBUaGUgTkVYVVMgSGVhZCBDVCBESSByZWxpYWJseSBpZGVudGlmaWVzIGJsdW50IHRyYXVtYSBwYXRpZW50cyB3aG8gcmVxdWlyZQogICAgICBoZWFkIENUIGltYWdpbmcsIGFuZCBjb3VsZCBzaWduaWZpY2FudGx5IHJlZHVjaW5nIHRoZSB1c2Ugb2YgQ1QgaW1hZ2luZy4KICAgIDwvZGVzY3JpcHRpb24+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJNZXRob2RzIj5Qcm9zcGVjdGl2ZSBtdWx0aWNlbnRlcjwvZGVzY3JpcHRpb24+CiAgPC9kZXNjcmlwdGlvbnM+CiAgPGdlb0xvY2F0aW9ucz4KICAgIDxnZW9Mb2NhdGlvbj4KICAgICAgPGdlb0xvY2F0aW9uUG9pbnQ+MzcuMjUwMjIgLTExOS43NTEyNjwvZ2VvTG9jYXRpb25Qb2ludD4KICAgICAgPGdlb0xvY2F0aW9uUGxhY2U+Q2FsaWZvcm5pYSwgVVNBPC9nZW9Mb2NhdGlvblBsYWNlPgogICAgPC9nZW9Mb2NhdGlvbj4KICA8L2dlb0xvY2F0aW9ucz4KPC9yZXNvdXJjZT4=","allocator_symbol":"CDL","minted":"2018-12-07T09:48:20Z","state":"findable","updated":"2018-12-07T09:48:20Z","doi":"10.7272/Q6G15XS4"}]}} + +' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:13 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/sets_state_to_findable.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/sets_state_to_findable.yml new file mode 100644 index 000000000..8b418f0df --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/sets_state_to_findable.yml @@ -0,0 +1,99 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7272 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:14 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - d905d5d4-58e6-437f-a962-591bdf5c46b1 + Etag: + - W/"434d63d02889e47275389a930375c569" + X-Runtime: + - '0.022882' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7272","type":"prefixes","attributes":{"registration-agency":"DataCite","created":"2012-03-15T09:47:35.000Z","updated":null},"relationships":{"clients":{"data":[{"id":"cdl.ucsfctsi","type":"clients"}]},"providers":{"data":[{"id":"cdl","type":"providers"}]}}},"included":[{"id":"cdl.ucsfctsi","type":"clients","attributes":{"name":"UCSF + Clinical & Translational Science Institute (CTSI)","symbol":"CDL.UCSFCTSI","year":2012,"contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","domains":"*","url":null,"created":"2012-07-10T20:59:53.000Z","updated":"2018-08-26T02:35:12.000Z","is-active":true,"has-password":true},"relationships":{"provider":{"data":{"id":"cdl","type":"providers"}},"prefixes":{"data":[{"id":"10.5072","type":"prefixes"},{"id":"10.7272","type":"prefixes"}]}}},{"id":"cdl","type":"providers","attributes":{"name":"California + Digital Library","symbol":"CDL","website":"http://ezid.cdlib.org","contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","phone":null,"description":"California + Digital Library (CDL) handles scholarly information at every stage of its + life. CDL provides technology and expertise to help the University of California + (UC) collect, publish, access, and preserve its full range of information + resources. CDL partners with organizations outside the UCs on far-reaching + problems.\n\nCDL offers DataCite DOIs to University of California scholars + and researchers via the EZID service. EZID is also available as a general + identifier service to help educational, non-profit, governmental and commercial + clients create and manage globally unique identifiers for data and other sources.","region":"AMER","country":"US","logo-url":"https://assets.datacite.org/images/members/cdl.png","organization-type":"academic_institution","focus-area":"general","is-active":true,"has-password":true,"joined":"2009-12-01","created":"2010-01-01T00:00:00.000Z","updated":"2018-10-24T20:47:51.000Z"},"relationships":{"prefixes":{"data":[{"id":"10.5062","type":"prefixes"},{"id":"10.5063","type":"prefixes"},{"id":"10.5065","type":"prefixes"},{"id":"10.5068","type":"prefixes"},{"id":"10.5069","type":"prefixes"},{"id":"10.5070","type":"prefixes"},{"id":"10.5072","type":"prefixes"},{"id":"10.6071","type":"prefixes"},{"id":"10.6072","type":"prefixes"},{"id":"10.6074","type":"prefixes"},{"id":"10.6075","type":"prefixes"},{"id":"10.6076","type":"prefixes"},{"id":"10.6078","type":"prefixes"},{"id":"10.6079","type":"prefixes"},{"id":"10.6080","type":"prefixes"},{"id":"10.6081","type":"prefixes"},{"id":"10.6085","type":"prefixes"},{"id":"10.6086","type":"prefixes"},{"id":"10.7265","type":"prefixes"},{"id":"10.7268","type":"prefixes"},{"id":"10.7269","type":"prefixes"},{"id":"10.7270","type":"prefixes"},{"id":"10.7271","type":"prefixes"},{"id":"10.7272","type":"prefixes"},{"id":"10.7276","type":"prefixes"},{"id":"10.7279","type":"prefixes"},{"id":"10.7280","type":"prefixes"},{"id":"10.7281","type":"prefixes"},{"id":"10.7282","type":"prefixes"},{"id":"10.7284","type":"prefixes"},{"id":"10.7285","type":"prefixes"},{"id":"10.7286","type":"prefixes"},{"id":"10.7288","type":"prefixes"},{"id":"10.7291","type":"prefixes"},{"id":"10.7292","type":"prefixes"},{"id":"10.7293","type":"prefixes"},{"id":"10.7295","type":"prefixes"},{"id":"10.7296","type":"prefixes"},{"id":"10.7297","type":"prefixes"},{"id":"10.7299","type":"prefixes"},{"id":"10.7300","type":"prefixes"},{"id":"10.4246","type":"prefixes"},{"id":"10.7908","type":"prefixes"},{"id":"10.7911","type":"prefixes"},{"id":"10.7913","type":"prefixes"},{"id":"10.7914","type":"prefixes"},{"id":"10.7916","type":"prefixes"},{"id":"10.7918","type":"prefixes"},{"id":"10.7919","type":"prefixes"},{"id":"10.7920","type":"prefixes"},{"id":"10.7921","type":"prefixes"},{"id":"10.7922","type":"prefixes"},{"id":"10.7925","type":"prefixes"},{"id":"10.7927","type":"prefixes"},{"id":"10.7928","type":"prefixes"},{"id":"10.7929","type":"prefixes"},{"id":"10.7932","type":"prefixes"},{"id":"10.7933","type":"prefixes"},{"id":"10.7934","type":"prefixes"},{"id":"10.7939","type":"prefixes"},{"id":"10.7940","type":"prefixes"},{"id":"10.7941","type":"prefixes"},{"id":"10.7942","type":"prefixes"},{"id":"10.7943","type":"prefixes"},{"id":"10.7944","type":"prefixes"},{"id":"10.7945","type":"prefixes"},{"id":"10.7946","type":"prefixes"},{"id":"10.13022","type":"prefixes"},{"id":"10.13026","type":"prefixes"},{"id":"10.13025","type":"prefixes"},{"id":"10.15147","type":"prefixes"},{"id":"10.15146","type":"prefixes"},{"id":"10.15142","type":"prefixes"},{"id":"10.15144","type":"prefixes"},{"id":"10.15145","type":"prefixes"},{"id":"10.15140","type":"prefixes"},{"id":"10.15141","type":"prefixes"},{"id":"10.15139","type":"prefixes"},{"id":"10.1184","type":"prefixes"},{"id":"10.15784","type":"prefixes"},{"id":"10.15779","type":"prefixes"},{"id":"10.15780","type":"prefixes"},{"id":"10.15781","type":"prefixes"},{"id":"10.15782","type":"prefixes"},{"id":"10.17612","type":"prefixes"},{"id":"10.17610","type":"prefixes"},{"id":"10.17611","type":"prefixes"},{"id":"10.17614","type":"prefixes"},{"id":"10.17615","type":"prefixes"},{"id":"10.17602","type":"prefixes"},{"id":"10.17603","type":"prefixes"},{"id":"10.17908","type":"prefixes"},{"id":"10.17916","type":"prefixes"},{"id":"10.17915","type":"prefixes"},{"id":"10.17918","type":"prefixes"},{"id":"10.17919","type":"prefixes"},{"id":"10.17911","type":"prefixes"},{"id":"10.17913","type":"prefixes"},{"id":"10.17920","type":"prefixes"},{"id":"10.18123","type":"prefixes"},{"id":"10.18119","type":"prefixes"},{"id":"10.18118","type":"prefixes"},{"id":"10.18117","type":"prefixes"},{"id":"10.18115","type":"prefixes"},{"id":"10.18431","type":"prefixes"},{"id":"10.18436","type":"prefixes"},{"id":"10.18437","type":"prefixes"},{"id":"10.18439","type":"prefixes"},{"id":"10.18737","type":"prefixes"},{"id":"10.18736","type":"prefixes"},{"id":"10.18739","type":"prefixes"},{"id":"10.18734","type":"prefixes"},{"id":"10.20353","type":"prefixes"},{"id":"10.20354","type":"prefixes"},{"id":"10.20352","type":"prefixes"},{"id":"10.20357","type":"prefixes"},{"id":"10.20358","type":"prefixes"},{"id":"10.20359","type":"prefixes"},{"id":"10.21228","type":"prefixes"},{"id":"10.21229","type":"prefixes"},{"id":"10.21224","type":"prefixes"},{"id":"10.21222","type":"prefixes"},{"id":"10.21223","type":"prefixes"},{"id":"10.21221","type":"prefixes"},{"id":"10.21237","type":"prefixes"},{"id":"10.21238","type":"prefixes"},{"id":"10.21239","type":"prefixes"},{"id":"10.21236","type":"prefixes"},{"id":"10.21430","type":"prefixes"},{"id":"10.21433","type":"prefixes"},{"id":"10.21431","type":"prefixes"},{"id":"10.21421","type":"prefixes"},{"id":"10.21422","type":"prefixes"},{"id":"10.21424","type":"prefixes"},{"id":"10.21425","type":"prefixes"},{"id":"10.21426","type":"prefixes"},{"id":"10.21427","type":"prefixes"},{"id":"10.21428","type":"prefixes"},{"id":"10.21418","type":"prefixes"},{"id":"10.21416","type":"prefixes"},{"id":"10.21414","type":"prefixes"},{"id":"10.21972","type":"prefixes"},{"id":"10.21973","type":"prefixes"},{"id":"10.21975","type":"prefixes"},{"id":"10.21976","type":"prefixes"},{"id":"10.21977","type":"prefixes"},{"id":"10.21978","type":"prefixes"},{"id":"10.21990","type":"prefixes"},{"id":"10.21983","type":"prefixes"},{"id":"10.21980","type":"prefixes"},{"id":"10.21986","type":"prefixes"},{"id":"10.5195","type":"prefixes"},{"id":"10.25334","type":"prefixes"},{"id":"10.25337","type":"prefixes"},{"id":"10.25338","type":"prefixes"},{"id":"10.25342","type":"prefixes"},{"id":"10.25349","type":"prefixes"},{"id":"10.25348","type":"prefixes"},{"id":"10.25347","type":"prefixes"},{"id":"10.25346","type":"prefixes"},{"id":"10.25345","type":"prefixes"},{"id":"10.25344","type":"prefixes"},{"id":"10.25352","type":"prefixes"},{"id":"10.25350","type":"prefixes"},{"id":"10.25351","type":"prefixes"},{"id":"10.26081","type":"prefixes"}]}}}]}' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:14 GMT +- request: + method: get + uri: https://search.test.datacite.org/api?fl=doi,url,xml,state,allocator_symbol,datacentre_symbol,media,minted,updated&q=doi:10.7272/q6g15xs4&wt=json + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:14 GMT + Content-Type: + - application/json;charset=UTF-8 + Connection: + - keep-alive + Server: + - nginx/1.10.3 (Ubuntu) + Access-Control-Allow-Origin: + - "*" + Access-Control-Allow-Methods: + - GET, POST, PUT, DELETE, OPTIONS + Access-Control-Allow-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + Access-Control-Expose-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + body: + encoding: ASCII-8BIT + string: '{"responseHeader":{"status":0,"QTime":0},"response":{"numFound":1,"start":0,"docs":[{"datacentre_symbol":"CDL.UCSFCTSI","url":"https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4","xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz4KPHJlc291cmNlIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC0zL21ldGFkYXRhLnhzZCI+CiAgPGlkZW50aWZpZXIgaWRlbnRpZmllclR5cGU9IkRPSSI+MTAuNzI3Mi9RNkcxNVhTNDwvaWRlbnRpZmllcj4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lPlJvZHJpZ3VleiwgUm9iZXJ0PC9jcmVhdG9yTmFtZT4KICAgICAgPGFmZmlsaWF0aW9uPlVDIFNhbiBGcmFuY2lzY288L2FmZmlsaWF0aW9uPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZT5Nb3dlciwgV2lsbGlhbTwvY3JlYXRvck5hbWU+CiAgICAgIDxhZmZpbGlhdGlvbj5VQ0xBPC9hZmZpbGlhdGlvbj4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+TkVYVVMgSGVhZCBDVDwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5VQyBTYW4gRnJhbmNpc2NvPC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+CiAgPGxhbmd1YWdlPmVuPC9sYW5ndWFnZT4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IkRhdGFzZXQiLz4KICA8c2l6ZXM+CiAgICA8c2l6ZT4xNDk1MjA0IGJ5dGVzPC9zaXplPgogIDwvc2l6ZXM+CiAgPHZlcnNpb24+MTwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwczovL2NyZWF0aXZlY29tbW9ucy5vcmcvbGljZW5zZXMvYnkvNC4wLyI+Q3JlYXRpdmUgQ29tbW9ucyBBdHRyaWJ1dGlvbiA0LjAgSW50ZXJuYXRpb25hbCAoQ0MgQlkgNC4wKTwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPgogICAgICBCYWNrZ3JvdW5kIENsaW5pY2lhbnMsIGFmcmFpZCBvZiBtaXNzaW5nIGludHJhY3JhbmlhbCBpbmp1cmllcywgbGliZXJhbGx5CiAgICAgIG9idGFpbiBjb21wdXRlZCB0b21vZ3JhcGhpYyAoQ1QpIGhlYWQgaW1hZ2luZyBpbiBibHVudCB0cmF1bWEgcGF0aWVudHMuCiAgICAgIFByaW9yIHdvcmsgc3VnZ2VzdHMgdGhhdCBjbGluaWNhbCBjcml0ZXJpYSAoTkVYVVMgSGVhZCBDVCBkZWNpc2lvbgogICAgICBpbnN0cnVtZW50KSBjYW4gcmVsaWFibHkgaWRlbnRpZnkgcGF0aWVudHMgd2l0aCBpbXBvcnRhbnQgaW5qdXJpZXMsIHdoaWxlCiAgICAgIGV4Y2x1ZGluZyBpbmp1cnksIGFuZCB0aGUgbmVlZCBmb3IgaW1hZ2luZyBpbiBtYW55IHBhdGllbnRzLiBNZXRob2RzIFdlCiAgICAgIGNvbmR1Y3RlZCBhIHByb3NwZWN0aXZlIG9ic2VydmF0aW9uYWwgc3R1ZHkgb2YgdGhlIE5FWFVTIEhlYWQgQ1QgZGVjaXNpb24KICAgICAgaW5zdHJ1bWVudCAoREkpIHRoYXQgcmVxdWlyZXMgcGF0aWVudHMgdG8gbWVldCBlaWdodCBjcml0ZXJpYSB0byBhY2hpZXZlCiAgICAgIOKAnGxvdy1yaXNr4oCdIGNsYXNzaWZpY2F0aW9uLiBXZSBleGFtaW5lZCB0aGUgaW5zdHJ1bWVudOKAmXMgcGVyZm9ybWFuY2UgaW4KICAgICAgaWRlbnRpZnlpbmcgcGF0aWVudHMgcmVxdWlyaW5nIG5ldXJvbG9naWNhbCBpbnRlcnZlbnRpb24gZnJvbSBhbW9uZyBhCiAgICAgIGNvaG9ydCBvZiAxMSw3NzAgYmx1bnQgaGVhZCBpbmp1cnkgcGF0aWVudHMuIFJlc3VsdHMgVGhlIE5FWFVTIEhlYWQgQ1QgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA0MjAgb2YgNDIwIHBhdGllbnRzIHJlcXVpcmluZyBuZXVyb2xvZ2ljYWwKICAgICAgaW50ZXJ2ZW50aW9uIChzZW5zaXRpdml0eSwgMTAwLjAlIFs5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBbQ0ldOiA5OS4xJSDigJMKICAgICAgMTAwLjAlXSkuIFRoZSBpbnN0cnVtZW50IGFzc2lnbmVkIGxvdy1yaXNrIHN0YXR1cyB0byAyLDgyMyBvZiAxMSwzNTAKICAgICAgcGF0aWVudHMgd2hvIGRpZCBub3QgcmVxdWlyZSBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChzcGVjaWZpY2l0eSwgMjQuOSUKICAgICAgWzk1JSBDSTogMjQuMSUgLSAyNS43JV0pLiBOb25lIG9mIHRoZSAyLDgyMyBsb3ctcmlzayBwYXRpZW50cyByZXF1aXJlZAogICAgICBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChOUFYsIDEwMC4wJSBbOTUlIENJOiA5OS45JSAtIDEwMC4wJV0pLiBUaGUgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA3NTkgb2YgNzY3IHBhdGllbnRzIHdpdGggc2lnbmlmaWNhbnQKICAgICAgaW50cmFjcmFuaWFsIGluanVyaWVzIChzZW5zaXRpdml0eSwgOTkuMCUgWzk1JSBDSTogOTguMCUgLSA5OS42JV0pLiBUaGUKICAgICAgaW5zdHJ1bWVudCBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgdG8gMiw4MTUgb2YgMTEsMDAzIHBhdGllbnRzIHdobyBkaWQKICAgICAgbm90IGhhdmUgc2lnbmlmaWNhbnQgaW5qdXJpZXMgKHNwZWNpZmljaXR5LCAyNS42JSBbOTUlIENJOiAyNC44JSAtCiAgICAgIDI2LjQlXSkuIFNpZ25pZmljYW50IGluanVyaWVzIHdlcmUgYWJzZW50IGluIDIsODE1IG9mIHRoZSAyLDgyMyBwYXRpZW50cwogICAgICBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgKE5QViwgOTkuNyUgWzk1JSBDSTogOTkuNCUgLSA5OS45JV0pLiBDb25jbHVzaW9ucwogICAgICBUaGUgTkVYVVMgSGVhZCBDVCBESSByZWxpYWJseSBpZGVudGlmaWVzIGJsdW50IHRyYXVtYSBwYXRpZW50cyB3aG8gcmVxdWlyZQogICAgICBoZWFkIENUIGltYWdpbmcsIGFuZCBjb3VsZCBzaWduaWZpY2FudGx5IHJlZHVjaW5nIHRoZSB1c2Ugb2YgQ1QgaW1hZ2luZy4KICAgIDwvZGVzY3JpcHRpb24+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJNZXRob2RzIj5Qcm9zcGVjdGl2ZSBtdWx0aWNlbnRlcjwvZGVzY3JpcHRpb24+CiAgPC9kZXNjcmlwdGlvbnM+CiAgPGdlb0xvY2F0aW9ucz4KICAgIDxnZW9Mb2NhdGlvbj4KICAgICAgPGdlb0xvY2F0aW9uUG9pbnQ+MzcuMjUwMjIgLTExOS43NTEyNjwvZ2VvTG9jYXRpb25Qb2ludD4KICAgICAgPGdlb0xvY2F0aW9uUGxhY2U+Q2FsaWZvcm5pYSwgVVNBPC9nZW9Mb2NhdGlvblBsYWNlPgogICAgPC9nZW9Mb2NhdGlvbj4KICA8L2dlb0xvY2F0aW9ucz4KPC9yZXNvdXJjZT4=","allocator_symbol":"CDL","minted":"2018-12-07T09:48:20Z","state":"findable","updated":"2018-12-07T09:48:20Z","doi":"10.7272/Q6G15XS4"}]}} + +' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:14 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/updates_the_record.yml b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/updates_the_record.yml new file mode 100644 index 000000000..fa03bd817 --- /dev/null +++ b/spec/fixtures/vcr_cassettes/dois/POST_/dois/datacite_url/updates_the_record.yml @@ -0,0 +1,99 @@ +--- +http_interactions: +- request: + method: get + uri: https://api.datacite.org/prefixes/10.7272 + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:12 GMT + Content-Type: + - application/json; charset=utf-8 + Connection: + - keep-alive + Status: + - 200 OK + X-Anonymous-Consumer: + - 'true' + Cache-Control: + - max-age=0, private, must-revalidate + Vary: + - Accept-Encoding, Origin + X-Request-Id: + - ba89f387-9fa1-4286-9203-b4e479c19dd0 + Etag: + - W/"434d63d02889e47275389a930375c569" + X-Runtime: + - '0.025620' + X-Powered-By: + - Phusion Passenger 6.0.0 + Server: + - nginx/1.15.7 + Phusion Passenger 6.0.0 + body: + encoding: ASCII-8BIT + string: '{"data":{"id":"10.7272","type":"prefixes","attributes":{"registration-agency":"DataCite","created":"2012-03-15T09:47:35.000Z","updated":null},"relationships":{"clients":{"data":[{"id":"cdl.ucsfctsi","type":"clients"}]},"providers":{"data":[{"id":"cdl","type":"providers"}]}}},"included":[{"id":"cdl.ucsfctsi","type":"clients","attributes":{"name":"UCSF + Clinical & Translational Science Institute (CTSI)","symbol":"CDL.UCSFCTSI","year":2012,"contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","domains":"*","url":null,"created":"2012-07-10T20:59:53.000Z","updated":"2018-08-26T02:35:12.000Z","is-active":true,"has-password":true},"relationships":{"provider":{"data":{"id":"cdl","type":"providers"}},"prefixes":{"data":[{"id":"10.5072","type":"prefixes"},{"id":"10.7272","type":"prefixes"}]}}},{"id":"cdl","type":"providers","attributes":{"name":"California + Digital Library","symbol":"CDL","website":"http://ezid.cdlib.org","contact-name":"EZID + Support Desk","contact-email":"ezid@ucop.edu","phone":null,"description":"California + Digital Library (CDL) handles scholarly information at every stage of its + life. CDL provides technology and expertise to help the University of California + (UC) collect, publish, access, and preserve its full range of information + resources. CDL partners with organizations outside the UCs on far-reaching + problems.\n\nCDL offers DataCite DOIs to University of California scholars + and researchers via the EZID service. EZID is also available as a general + identifier service to help educational, non-profit, governmental and commercial + clients create and manage globally unique identifiers for data and other sources.","region":"AMER","country":"US","logo-url":"https://assets.datacite.org/images/members/cdl.png","organization-type":"academic_institution","focus-area":"general","is-active":true,"has-password":true,"joined":"2009-12-01","created":"2010-01-01T00:00:00.000Z","updated":"2018-10-24T20:47:51.000Z"},"relationships":{"prefixes":{"data":[{"id":"10.5062","type":"prefixes"},{"id":"10.5063","type":"prefixes"},{"id":"10.5065","type":"prefixes"},{"id":"10.5068","type":"prefixes"},{"id":"10.5069","type":"prefixes"},{"id":"10.5070","type":"prefixes"},{"id":"10.5072","type":"prefixes"},{"id":"10.6071","type":"prefixes"},{"id":"10.6072","type":"prefixes"},{"id":"10.6074","type":"prefixes"},{"id":"10.6075","type":"prefixes"},{"id":"10.6076","type":"prefixes"},{"id":"10.6078","type":"prefixes"},{"id":"10.6079","type":"prefixes"},{"id":"10.6080","type":"prefixes"},{"id":"10.6081","type":"prefixes"},{"id":"10.6085","type":"prefixes"},{"id":"10.6086","type":"prefixes"},{"id":"10.7265","type":"prefixes"},{"id":"10.7268","type":"prefixes"},{"id":"10.7269","type":"prefixes"},{"id":"10.7270","type":"prefixes"},{"id":"10.7271","type":"prefixes"},{"id":"10.7272","type":"prefixes"},{"id":"10.7276","type":"prefixes"},{"id":"10.7279","type":"prefixes"},{"id":"10.7280","type":"prefixes"},{"id":"10.7281","type":"prefixes"},{"id":"10.7282","type":"prefixes"},{"id":"10.7284","type":"prefixes"},{"id":"10.7285","type":"prefixes"},{"id":"10.7286","type":"prefixes"},{"id":"10.7288","type":"prefixes"},{"id":"10.7291","type":"prefixes"},{"id":"10.7292","type":"prefixes"},{"id":"10.7293","type":"prefixes"},{"id":"10.7295","type":"prefixes"},{"id":"10.7296","type":"prefixes"},{"id":"10.7297","type":"prefixes"},{"id":"10.7299","type":"prefixes"},{"id":"10.7300","type":"prefixes"},{"id":"10.4246","type":"prefixes"},{"id":"10.7908","type":"prefixes"},{"id":"10.7911","type":"prefixes"},{"id":"10.7913","type":"prefixes"},{"id":"10.7914","type":"prefixes"},{"id":"10.7916","type":"prefixes"},{"id":"10.7918","type":"prefixes"},{"id":"10.7919","type":"prefixes"},{"id":"10.7920","type":"prefixes"},{"id":"10.7921","type":"prefixes"},{"id":"10.7922","type":"prefixes"},{"id":"10.7925","type":"prefixes"},{"id":"10.7927","type":"prefixes"},{"id":"10.7928","type":"prefixes"},{"id":"10.7929","type":"prefixes"},{"id":"10.7932","type":"prefixes"},{"id":"10.7933","type":"prefixes"},{"id":"10.7934","type":"prefixes"},{"id":"10.7939","type":"prefixes"},{"id":"10.7940","type":"prefixes"},{"id":"10.7941","type":"prefixes"},{"id":"10.7942","type":"prefixes"},{"id":"10.7943","type":"prefixes"},{"id":"10.7944","type":"prefixes"},{"id":"10.7945","type":"prefixes"},{"id":"10.7946","type":"prefixes"},{"id":"10.13022","type":"prefixes"},{"id":"10.13026","type":"prefixes"},{"id":"10.13025","type":"prefixes"},{"id":"10.15147","type":"prefixes"},{"id":"10.15146","type":"prefixes"},{"id":"10.15142","type":"prefixes"},{"id":"10.15144","type":"prefixes"},{"id":"10.15145","type":"prefixes"},{"id":"10.15140","type":"prefixes"},{"id":"10.15141","type":"prefixes"},{"id":"10.15139","type":"prefixes"},{"id":"10.1184","type":"prefixes"},{"id":"10.15784","type":"prefixes"},{"id":"10.15779","type":"prefixes"},{"id":"10.15780","type":"prefixes"},{"id":"10.15781","type":"prefixes"},{"id":"10.15782","type":"prefixes"},{"id":"10.17612","type":"prefixes"},{"id":"10.17610","type":"prefixes"},{"id":"10.17611","type":"prefixes"},{"id":"10.17614","type":"prefixes"},{"id":"10.17615","type":"prefixes"},{"id":"10.17602","type":"prefixes"},{"id":"10.17603","type":"prefixes"},{"id":"10.17908","type":"prefixes"},{"id":"10.17916","type":"prefixes"},{"id":"10.17915","type":"prefixes"},{"id":"10.17918","type":"prefixes"},{"id":"10.17919","type":"prefixes"},{"id":"10.17911","type":"prefixes"},{"id":"10.17913","type":"prefixes"},{"id":"10.17920","type":"prefixes"},{"id":"10.18123","type":"prefixes"},{"id":"10.18119","type":"prefixes"},{"id":"10.18118","type":"prefixes"},{"id":"10.18117","type":"prefixes"},{"id":"10.18115","type":"prefixes"},{"id":"10.18431","type":"prefixes"},{"id":"10.18436","type":"prefixes"},{"id":"10.18437","type":"prefixes"},{"id":"10.18439","type":"prefixes"},{"id":"10.18737","type":"prefixes"},{"id":"10.18736","type":"prefixes"},{"id":"10.18739","type":"prefixes"},{"id":"10.18734","type":"prefixes"},{"id":"10.20353","type":"prefixes"},{"id":"10.20354","type":"prefixes"},{"id":"10.20352","type":"prefixes"},{"id":"10.20357","type":"prefixes"},{"id":"10.20358","type":"prefixes"},{"id":"10.20359","type":"prefixes"},{"id":"10.21228","type":"prefixes"},{"id":"10.21229","type":"prefixes"},{"id":"10.21224","type":"prefixes"},{"id":"10.21222","type":"prefixes"},{"id":"10.21223","type":"prefixes"},{"id":"10.21221","type":"prefixes"},{"id":"10.21237","type":"prefixes"},{"id":"10.21238","type":"prefixes"},{"id":"10.21239","type":"prefixes"},{"id":"10.21236","type":"prefixes"},{"id":"10.21430","type":"prefixes"},{"id":"10.21433","type":"prefixes"},{"id":"10.21431","type":"prefixes"},{"id":"10.21421","type":"prefixes"},{"id":"10.21422","type":"prefixes"},{"id":"10.21424","type":"prefixes"},{"id":"10.21425","type":"prefixes"},{"id":"10.21426","type":"prefixes"},{"id":"10.21427","type":"prefixes"},{"id":"10.21428","type":"prefixes"},{"id":"10.21418","type":"prefixes"},{"id":"10.21416","type":"prefixes"},{"id":"10.21414","type":"prefixes"},{"id":"10.21972","type":"prefixes"},{"id":"10.21973","type":"prefixes"},{"id":"10.21975","type":"prefixes"},{"id":"10.21976","type":"prefixes"},{"id":"10.21977","type":"prefixes"},{"id":"10.21978","type":"prefixes"},{"id":"10.21990","type":"prefixes"},{"id":"10.21983","type":"prefixes"},{"id":"10.21980","type":"prefixes"},{"id":"10.21986","type":"prefixes"},{"id":"10.5195","type":"prefixes"},{"id":"10.25334","type":"prefixes"},{"id":"10.25337","type":"prefixes"},{"id":"10.25338","type":"prefixes"},{"id":"10.25342","type":"prefixes"},{"id":"10.25349","type":"prefixes"},{"id":"10.25348","type":"prefixes"},{"id":"10.25347","type":"prefixes"},{"id":"10.25346","type":"prefixes"},{"id":"10.25345","type":"prefixes"},{"id":"10.25344","type":"prefixes"},{"id":"10.25352","type":"prefixes"},{"id":"10.25350","type":"prefixes"},{"id":"10.25351","type":"prefixes"},{"id":"10.26081","type":"prefixes"}]}}}]}' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:12 GMT +- request: + method: get + uri: https://search.test.datacite.org/api?fl=doi,url,xml,state,allocator_symbol,datacentre_symbol,media,minted,updated&q=doi:10.7272/q6g15xs4&wt=json + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - Mozilla/5.0 (compatible; Maremma/4.1.1; +https://github.com/datacite/maremma) + Accept: + - text/html,application/json,application/xml;q=0.9, text/plain;q=0.8,image/png,*/*;q=0.5 + response: + status: + code: 200 + message: OK + headers: + Date: + - Fri, 07 Dec 2018 17:59:13 GMT + Content-Type: + - application/json;charset=UTF-8 + Connection: + - keep-alive + Server: + - nginx/1.10.3 (Ubuntu) + Access-Control-Allow-Origin: + - "*" + Access-Control-Allow-Methods: + - GET, POST, PUT, DELETE, OPTIONS + Access-Control-Allow-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + Access-Control-Expose-Headers: + - DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range,Authorization + body: + encoding: ASCII-8BIT + string: '{"responseHeader":{"status":0,"QTime":1},"response":{"numFound":1,"start":0,"docs":[{"datacentre_symbol":"CDL.UCSFCTSI","url":"https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4","xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz4KPHJlc291cmNlIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtMyBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC0zL21ldGFkYXRhLnhzZCI+CiAgPGlkZW50aWZpZXIgaWRlbnRpZmllclR5cGU9IkRPSSI+MTAuNzI3Mi9RNkcxNVhTNDwvaWRlbnRpZmllcj4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lPlJvZHJpZ3VleiwgUm9iZXJ0PC9jcmVhdG9yTmFtZT4KICAgICAgPGFmZmlsaWF0aW9uPlVDIFNhbiBGcmFuY2lzY288L2FmZmlsaWF0aW9uPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZT5Nb3dlciwgV2lsbGlhbTwvY3JlYXRvck5hbWU+CiAgICAgIDxhZmZpbGlhdGlvbj5VQ0xBPC9hZmZpbGlhdGlvbj4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+TkVYVVMgSGVhZCBDVDwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5VQyBTYW4gRnJhbmNpc2NvPC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+CiAgPGxhbmd1YWdlPmVuPC9sYW5ndWFnZT4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IkRhdGFzZXQiLz4KICA8c2l6ZXM+CiAgICA8c2l6ZT4xNDk1MjA0IGJ5dGVzPC9zaXplPgogIDwvc2l6ZXM+CiAgPHZlcnNpb24+MTwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwczovL2NyZWF0aXZlY29tbW9ucy5vcmcvbGljZW5zZXMvYnkvNC4wLyI+Q3JlYXRpdmUgQ29tbW9ucyBBdHRyaWJ1dGlvbiA0LjAgSW50ZXJuYXRpb25hbCAoQ0MgQlkgNC4wKTwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPgogICAgICBCYWNrZ3JvdW5kIENsaW5pY2lhbnMsIGFmcmFpZCBvZiBtaXNzaW5nIGludHJhY3JhbmlhbCBpbmp1cmllcywgbGliZXJhbGx5CiAgICAgIG9idGFpbiBjb21wdXRlZCB0b21vZ3JhcGhpYyAoQ1QpIGhlYWQgaW1hZ2luZyBpbiBibHVudCB0cmF1bWEgcGF0aWVudHMuCiAgICAgIFByaW9yIHdvcmsgc3VnZ2VzdHMgdGhhdCBjbGluaWNhbCBjcml0ZXJpYSAoTkVYVVMgSGVhZCBDVCBkZWNpc2lvbgogICAgICBpbnN0cnVtZW50KSBjYW4gcmVsaWFibHkgaWRlbnRpZnkgcGF0aWVudHMgd2l0aCBpbXBvcnRhbnQgaW5qdXJpZXMsIHdoaWxlCiAgICAgIGV4Y2x1ZGluZyBpbmp1cnksIGFuZCB0aGUgbmVlZCBmb3IgaW1hZ2luZyBpbiBtYW55IHBhdGllbnRzLiBNZXRob2RzIFdlCiAgICAgIGNvbmR1Y3RlZCBhIHByb3NwZWN0aXZlIG9ic2VydmF0aW9uYWwgc3R1ZHkgb2YgdGhlIE5FWFVTIEhlYWQgQ1QgZGVjaXNpb24KICAgICAgaW5zdHJ1bWVudCAoREkpIHRoYXQgcmVxdWlyZXMgcGF0aWVudHMgdG8gbWVldCBlaWdodCBjcml0ZXJpYSB0byBhY2hpZXZlCiAgICAgIOKAnGxvdy1yaXNr4oCdIGNsYXNzaWZpY2F0aW9uLiBXZSBleGFtaW5lZCB0aGUgaW5zdHJ1bWVudOKAmXMgcGVyZm9ybWFuY2UgaW4KICAgICAgaWRlbnRpZnlpbmcgcGF0aWVudHMgcmVxdWlyaW5nIG5ldXJvbG9naWNhbCBpbnRlcnZlbnRpb24gZnJvbSBhbW9uZyBhCiAgICAgIGNvaG9ydCBvZiAxMSw3NzAgYmx1bnQgaGVhZCBpbmp1cnkgcGF0aWVudHMuIFJlc3VsdHMgVGhlIE5FWFVTIEhlYWQgQ1QgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA0MjAgb2YgNDIwIHBhdGllbnRzIHJlcXVpcmluZyBuZXVyb2xvZ2ljYWwKICAgICAgaW50ZXJ2ZW50aW9uIChzZW5zaXRpdml0eSwgMTAwLjAlIFs5NSUgY29uZmlkZW5jZSBpbnRlcnZhbCBbQ0ldOiA5OS4xJSDigJMKICAgICAgMTAwLjAlXSkuIFRoZSBpbnN0cnVtZW50IGFzc2lnbmVkIGxvdy1yaXNrIHN0YXR1cyB0byAyLDgyMyBvZiAxMSwzNTAKICAgICAgcGF0aWVudHMgd2hvIGRpZCBub3QgcmVxdWlyZSBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChzcGVjaWZpY2l0eSwgMjQuOSUKICAgICAgWzk1JSBDSTogMjQuMSUgLSAyNS43JV0pLiBOb25lIG9mIHRoZSAyLDgyMyBsb3ctcmlzayBwYXRpZW50cyByZXF1aXJlZAogICAgICBuZXVyb2xvZ2ljYWwgaW50ZXJ2ZW50aW9uIChOUFYsIDEwMC4wJSBbOTUlIENJOiA5OS45JSAtIDEwMC4wJV0pLiBUaGUgREkKICAgICAgYXNzaWduZWQgaGlnaC1yaXNrIHN0YXR1cyB0byA3NTkgb2YgNzY3IHBhdGllbnRzIHdpdGggc2lnbmlmaWNhbnQKICAgICAgaW50cmFjcmFuaWFsIGluanVyaWVzIChzZW5zaXRpdml0eSwgOTkuMCUgWzk1JSBDSTogOTguMCUgLSA5OS42JV0pLiBUaGUKICAgICAgaW5zdHJ1bWVudCBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgdG8gMiw4MTUgb2YgMTEsMDAzIHBhdGllbnRzIHdobyBkaWQKICAgICAgbm90IGhhdmUgc2lnbmlmaWNhbnQgaW5qdXJpZXMgKHNwZWNpZmljaXR5LCAyNS42JSBbOTUlIENJOiAyNC44JSAtCiAgICAgIDI2LjQlXSkuIFNpZ25pZmljYW50IGluanVyaWVzIHdlcmUgYWJzZW50IGluIDIsODE1IG9mIHRoZSAyLDgyMyBwYXRpZW50cwogICAgICBhc3NpZ25lZCBsb3ctcmlzayBzdGF0dXMgKE5QViwgOTkuNyUgWzk1JSBDSTogOTkuNCUgLSA5OS45JV0pLiBDb25jbHVzaW9ucwogICAgICBUaGUgTkVYVVMgSGVhZCBDVCBESSByZWxpYWJseSBpZGVudGlmaWVzIGJsdW50IHRyYXVtYSBwYXRpZW50cyB3aG8gcmVxdWlyZQogICAgICBoZWFkIENUIGltYWdpbmcsIGFuZCBjb3VsZCBzaWduaWZpY2FudGx5IHJlZHVjaW5nIHRoZSB1c2Ugb2YgQ1QgaW1hZ2luZy4KICAgIDwvZGVzY3JpcHRpb24+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJNZXRob2RzIj5Qcm9zcGVjdGl2ZSBtdWx0aWNlbnRlcjwvZGVzY3JpcHRpb24+CiAgPC9kZXNjcmlwdGlvbnM+CiAgPGdlb0xvY2F0aW9ucz4KICAgIDxnZW9Mb2NhdGlvbj4KICAgICAgPGdlb0xvY2F0aW9uUG9pbnQ+MzcuMjUwMjIgLTExOS43NTEyNjwvZ2VvTG9jYXRpb25Qb2ludD4KICAgICAgPGdlb0xvY2F0aW9uUGxhY2U+Q2FsaWZvcm5pYSwgVVNBPC9nZW9Mb2NhdGlvblBsYWNlPgogICAgPC9nZW9Mb2NhdGlvbj4KICA8L2dlb0xvY2F0aW9ucz4KPC9yZXNvdXJjZT4=","allocator_symbol":"CDL","minted":"2018-12-07T09:48:20Z","state":"findable","updated":"2018-12-07T09:48:20Z","doi":"10.7272/Q6G15XS4"}]}} + +' + http_version: + recorded_at: Fri, 07 Dec 2018 17:59:13 GMT +recorded_with: VCR 3.0.3 diff --git a/spec/jobs/doi_import_by_day_job.rb b/spec/jobs/doi_import_by_day_job.rb new file mode 100644 index 000000000..3d9375455 --- /dev/null +++ b/spec/jobs/doi_import_by_day_job.rb @@ -0,0 +1,16 @@ +require 'rails_helper' + +describe DoiImportByDayJob, type: :job do + let(:doi) { create(:doi) } + subject(:job) { DoiImportByDayJob.perform_later(Time.zone.now.strftime("%F")) } + + it 'queues the job' do + expect { job }.to have_enqueued_job(DoiImportByDayJob) + .on_queue("test_lupo_background") + end + + after do + clear_enqueued_jobs + clear_performed_jobs + end +end \ No newline at end of file diff --git a/spec/models/doi_spec.rb b/spec/models/doi_spec.rb index cee8aaa33..48a6482ea 100644 --- a/spec/models/doi_spec.rb +++ b/spec/models/doi_spec.rb @@ -55,7 +55,7 @@ expect(subject).to have_state(:findable) end - it "can't register with test prefix" do + it "can't publish with test prefix" do subject = create(:doi, doi: "10.5072/x") subject.publish expect(subject).to have_state(:draft) @@ -64,7 +64,7 @@ describe "flagged" do it "can flag" do - subject.register + subject.publish subject.flag expect(subject).to have_state(:flagged) end @@ -77,7 +77,7 @@ describe "broken" do it "can link_check" do - subject.register + subject.publish subject.link_check expect(subject).to have_state(:broken) end @@ -227,49 +227,57 @@ end end - context "no url" do - let(:provider) { create(:provider, symbol: "ADMIN") } - let(:client) { create(:client, provider: provider) } - let(:url) { "https://www.example.org" } - subject { build(:doi, client: client, url: nil, current_user: current_user) } - - # it "don't update state change" do - # subject.publish - # expect { subject.save }.not_to have_enqueued_job(HandleJob) - # expect(subject).to have_state(:findable) - # end - - it "update url change" do - subject.publish - subject.url = url - expect { subject.save }.to have_enqueued_job(HandleJob) - end - end + # context "no url" do + # let(:provider) { create(:provider, symbol: "ADMIN") } + # let(:client) { create(:client, provider: provider) } + # let(:url) { "https://www.example.org" } + # subject { build(:doi, client: client, url: nil, current_user: current_user) } + + # it "don't update state change" do + # subject.publish + # expect { subject.save }.not_to have_enqueued_job(HandleJob) + # expect(subject).to have_state(:findable) + # end + + # it "update url change" do + # subject.publish + # subject.url = url + # expect { subject.save }.to have_enqueued_job(HandleJob) + # end + # end end describe "metadata" do - let(:xml) { "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiIHN0YW5kYWxvbmU9InllcyI/PjxyZXNvdXJjZSB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC0zIGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTMvbWV0YWRhdGEueHNkIiB4bWxucz0iaHR0cDovL2RhdGFjaXRlLm9yZy9zY2hlbWEva2VybmVsLTMiIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiPjxpZGVudGlmaWVyIGlkZW50aWZpZXJUeXBlPSJET0kiPjEwLjUyNTYvZjEwMDByZXNlYXJjaC44NTcwLnI2NDIwPC9pZGVudGlmaWVyPjxjcmVhdG9ycz48Y3JlYXRvcj48Y3JlYXRvck5hbWU+ZCBzPC9jcmVhdG9yTmFtZT48L2NyZWF0b3I+PC9jcmVhdG9ycz48dGl0bGVzPjx0aXRsZT5SZWZlcmVlIHJlcG9ydC4gRm9yOiBSRVNFQVJDSC0zNDgyIFt2ZXJzaW9uIDU7IHJlZmVyZWVzOiAxIGFwcHJvdmVkLCAxIGFwcHJvdmVkIHdpdGggcmVzZXJ2YXRpb25zXTwvdGl0bGU+PC90aXRsZXM+PHB1Ymxpc2hlcj5GMTAwMCBSZXNlYXJjaCBMaW1pdGVkPC9wdWJsaXNoZXI+PHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+PHJlc291cmNlVHlwZSByZXNvdXJjZVR5cGVHZW5lcmFsPSJUZXh0Ii8+PC9yZXNvdXJjZT4=" } + subject { create(:doi) } - subject { create(:doi, xml: xml) } + it "valid" do + expect(subject.valid?).to be true + end - it "title" do - expect(subject.title).to eq("Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]") + it "titles" do + expect(subject.titles).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) end - it "author" do - expect(subject.author).to eq("name"=>"D S") + it "creators" do + expect(subject.creators.length).to eq(8) + expect(subject.creators.first).to eq("familyName"=>"Ollomo", "givenName"=>"Benjamin", "name"=>"Benjamin Ollomo", "type"=>"Person") end - it "date_published" do - expect(subject.date_published).to eq("2017") + it "dates" do + expect(subject.get_date(subject.dates, "Issued")).to eq("2011") end it "publication_year" do - expect(subject.publication_year).to eq(2017) + expect(subject.publication_year).to eq(2011) end it "schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-3") + expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") + end + + it "xml" do + doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) + expect(doc.at_css("identifier").content).to eq(subject.doi) end it "metadata" do @@ -278,104 +286,84 @@ end it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-3") + expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") end end describe "change metadata" do - let(:xml) { "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiIHN0YW5kYWxvbmU9InllcyI/PjxyZXNvdXJjZSB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC0zIGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTMvbWV0YWRhdGEueHNkIiB4bWxucz0iaHR0cDovL2RhdGFjaXRlLm9yZy9zY2hlbWEva2VybmVsLTMiIHhtbG5zOnhzaT0iaHR0cDovL3d3dy53My5vcmcvMjAwMS9YTUxTY2hlbWEtaW5zdGFuY2UiPjxpZGVudGlmaWVyIGlkZW50aWZpZXJUeXBlPSJET0kiPjEwLjUyNTYvZjEwMDByZXNlYXJjaC44NTcwLnI2NDIwPC9pZGVudGlmaWVyPjxjcmVhdG9ycz48Y3JlYXRvcj48Y3JlYXRvck5hbWU+ZCBzPC9jcmVhdG9yTmFtZT48L2NyZWF0b3I+PC9jcmVhdG9ycz48dGl0bGVzPjx0aXRsZT5SZWZlcmVlIHJlcG9ydC4gRm9yOiBSRVNFQVJDSC0zNDgyIFt2ZXJzaW9uIDU7IHJlZmVyZWVzOiAxIGFwcHJvdmVkLCAxIGFwcHJvdmVkIHdpdGggcmVzZXJ2YXRpb25zXTwvdGl0bGU+PC90aXRsZXM+PHB1Ymxpc2hlcj5GMTAwMCBSZXNlYXJjaCBMaW1pdGVkPC9wdWJsaXNoZXI+PHB1YmxpY2F0aW9uWWVhcj4yMDE3PC9wdWJsaWNhdGlvblllYXI+PHJlc291cmNlVHlwZSByZXNvdXJjZVR5cGVHZW5lcmFsPSJUZXh0Ii8+PC9yZXNvdXJjZT4=" } - - subject { create(:doi, xml: xml) } - - it "title" do - title = "Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes" - subject.title = title - subject.save - - expect(subject.title).to eq(title) + let(:xml) { File.read(file_fixture('datacite_f1000.xml')) } + let(:title) { "Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes" } + let(:creators) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } + let(:publisher) { "Zenodo" } + let(:publication_year) { 2011 } + let(:types) { { "resourceTypeGeneral" => "Software", "resourceType" => "BlogPosting", "schemaOrg" => "BlogPosting" } } + let(:description) { "Eating your own dog food is a slang term to describe that an organization should itself use the products and services it provides. For DataCite this means that we should use DOIs with appropriate metadata and strategies for long-term preservation for..." } + + subject { create(:doi, + xml: xml, + titles: [{ "title" => title }], + creators: creators, + publisher: publisher, + publication_year: publication_year, + types: types, + descriptions: [{ "description" => description }], + event: "publish") + } + + it "titles" do + expect(subject.titles).to eq([{ "title" => title }]) xml = Maremma.from_xml(subject.xml).fetch("resource", {}) expect(xml.dig("titles", "title")).to eq(title) end - it "author" do - author = [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] - subject.author = author - subject.save - - expect(subject.author).to eq(author) + it "creators" do + expect(subject.creators).to eq(creators) xml = Maremma.from_xml(subject.xml).fetch("resource", {}) expect(xml.dig("creators", "creator")).to eq([{"creatorName"=>"Ollomi, Benjamin"}, {"creatorName"=>"Duran, Patrick"}]) end it "publisher" do - publisher = "Zenodo" - subject.publisher = publisher - subject.save - expect(subject.publisher).to eq(publisher) xml = Maremma.from_xml(subject.xml).fetch("resource", {}) expect(xml.dig("publisher")).to eq(publisher) end - it "date_published" do - date_published = "2011-05-26" - subject.date_published = date_published - subject.save - - expect(subject.date_published).to eq(date_published) + it "publication_year" do + expect(subject.publication_year).to eq(2011) xml = Maremma.from_xml(subject.xml).fetch("resource", {}) - expect(xml.dig("dates", "date")).to eq("dateType"=>"Issued", "__content__"=>date_published) expect(xml.dig("publicationYear")).to eq("2011") end - it "additional_type" do - additional_type = "BlogPosting" - subject.additional_type = additional_type - subject.save - - expect(subject.additional_type).to eq(additional_type) + it "resource_type" do + expect(subject.types["resourceType"]).to eq("BlogPosting") xml = Maremma.from_xml(subject.xml).fetch("resource", {}) - expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>"Text", "__content__"=>"BlogPosting") + expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>"Software", "__content__"=>"BlogPosting") end it "resource_type_general" do - resource_type_general = "Software" - subject.resource_type_general = resource_type_general - subject.save - - expect(subject.resource_type_general).to eq(resource_type_general) + expect(subject.types["resourceTypeGeneral"]).to eq("Software") xml = Maremma.from_xml(subject.xml).fetch("resource", {}) - expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>resource_type_general, "__content__"=>"ScholarlyArticle") + expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>"Software", "__content__"=>"BlogPosting") end - it "description" do - description = "Eating your own dog food is a slang term to describe that an organization should itself use the products and services it provides. For DataCite this means that we should use DOIs with appropriate metadata and strategies for long-term preservation for..." - subject.description = description - subject.save - - expect(subject.description).to eq(description) + it "descriptions" do + expect(subject.descriptions).to eq([{ "description" => description }]) xml = Maremma.from_xml(subject.xml).fetch("resource", {}) expect(xml.dig("descriptions", "description")).to eq("__content__" => "Eating your own dog food is a slang term to describe that an organization should itself use the products and services it provides. For DataCite this means that we should use DOIs with appropriate metadata and strategies for long-term preservation for...", "descriptionType" => "Abstract") end it "schema_version" do - title = "Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes" - subject.title = title - subject.save - - xml = Maremma.from_xml(subject.xml).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq(title) - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") + xml = Maremma.from_xml(subject.xml).fetch("resource", {}) expect(xml.dig("xmlns")).to eq("http://datacite.org/schema/kernel-4") - #expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") + expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") end end @@ -393,555 +381,11 @@ end end - context "parses Crossref xml" do - let(:xml) { Base64.strict_encode64(file_fixture('crossref.xml').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes") - end - - it "date_published" do - expect(subject.date_published).to eq("2006-12-20") - end - - it "publication_year" do - expect(subject.publication_year).to eq(2006) - end - - it "author" do - expect(subject.author.length).to eq(5) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"Markus Ralser", "givenName"=>"Markus", "familyName"=>"Ralser") - end - - it "schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses namespaced xml" do - let(:xml) { Base64.strict_encode64(file_fixture('ns0.xml').read) } - - subject { create(:doi, doi: "10.4231/D38G8FK8B", xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - doc.remove_namespaces! - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("LAMMPS Data-File Generator") - end - - it "date_published" do - expect(subject.date_published).to eq("2018") - end - - it "publication_year" do - expect(subject.publication_year).to eq(2018) - end - - it "author" do - expect(subject.author.length).to eq(5) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"Carlos PatiñO", "givenName"=>"Carlos", "familyName"=>"PatiñO") - end - - it "schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-2.2") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - doc.remove_namespaces! - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-2.2") - end - end - - context "parses schema" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Eating your own Dog Food") - end - - it "author" do - expect(subject.author).to eq("type"=>"Person", "id"=>"https://orcid.org/0000-0003-1419-2405", "name"=>"Fenner, Martin", "givenName"=>"Martin", "familyName"=>"Fenner") - end - - it "date_published" do - expect(subject.date_published).to eq("2016-12-20") - end - - it "publication_year" do - expect(subject.publication_year).to eq(2016) - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses schema 3" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_3.xml').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "title" do - expect(subject.title).to eq("Data from: A new malaria agent in African hominids.") - end - - it "author" do - expect(subject.author.length).to eq(8) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"Benjamin Ollomo", "givenName"=>"Benjamin", "familyName"=>"Ollomo") - end - - it "date_published" do - expect(subject.date_published).to eq("2011") - end - - it "publication_year" do - expect(subject.publication_year).to eq(2011) - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-3") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-3") - end - end - - context "parses schema 2.2" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_2.2.xml').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "title" do - expect(subject.title).to eq(["Właściwości rzutowań podprzestrzeniowych", {"title_type"=>"TranslatedTitle", "text"=>"Translation of Polish titles"}]) - end - - it "author" do - expect(subject.author.length).to eq(2) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"John Smith", "givenName"=>"John", "familyName"=>"Smith") - end - - it "date_published" do - expect(subject.date_published).to eq("2010") - end - - it "publication_year" do - expect(subject.publication_year).to eq(2010) - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-2.2") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-2.2") - end - end - - context "parses bibtex" do - let(:xml) { Base64.strict_encode64(file_fixture('crossref.bib').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") - end - - it "author" do - expect(subject.author.length).to eq(5) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"Martial Sankar", "givenName"=>"Martial", "familyName"=>"Sankar") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses ris" do - let(:xml) { ::Base64.strict_encode64(file_fixture('crossref.ris').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") - end - - it "author" do - expect(subject.author.length).to eq(5) - expect(subject.author.first).to eq("type"=>"Person", "name"=>"Martial Sankar", "givenName"=>"Martial", "familyName"=>"Sankar") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses citeproc" do - let(:xml) { ::Base64.strict_encode64(file_fixture('citeproc.json').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Eating your own Dog Food") - end - - it "author" do - expect(subject.author).to eq("type"=>"Person", "name"=>"Martin Fenner", "givenName"=>"Martin", "familyName"=>"Fenner") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses codemeta" do - let(:xml) { ::Base64.strict_encode64(file_fixture('codemeta.json').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("R Interface to the DataONE REST API") - end - - it "author" do - expect(subject.author.length).to eq(3) - expect(subject.author.first).to eq("type"=>"Person", "id"=>"http://orcid.org/0000-0003-0077-4738", "name"=>"Matt Jones", "givenName"=>"Matt", "familyName"=>"Jones") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses crosscite" do - let(:xml) { ::Base64.strict_encode64(file_fixture('crosscite.json').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Analysis Tools for Crossover Experiment of UI using Choice Architecture") - end - - it "author" do - expect(subject.author).to eq("type"=>"Person", "name"=>"Kristian Garza", "givenName"=>"Kristian", "familyName"=>"Garza") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses schema.org" do - let(:xml) { ::Base64.strict_encode64(file_fixture('schema_org.json').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("Eating your own Dog Food") - end - - it "author" do - expect(subject.author).to eq("type"=>"Person", "id"=>"http://orcid.org/0000-0003-1419-2405", "name"=>"Martin Fenner", "givenName"=>"Martin", "familyName"=>"Fenner") - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - end - - context "parses schema.org topmed" do - let(:xml) { ::Base64.strict_encode64(file_fixture('schema_org_topmed.json').read) } - - subject { create(:doi, xml: xml, event: "publish") } - - it "creates xml" do - doc = Nokogiri::XML(subject.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - expect(doc.at_css("relatedIdentifiers").content).to eq("10.23725/2g4s-qv04") - end - - it "valid model" do - expect(subject.valid?).to be true - end - - it "validates against schema" do - expect(subject.validation_errors).to be_empty - end - - it "title" do - expect(subject.title).to eq("NWD165827.recab.cram") - end - - it "author" do - expect(subject.author).to eq("name"=>"TOPMed IRC", "type"=>"Organization") - end - - it "content_url" do - expect(subject.content_url).to eq(["s3://cgp-commons-public/topmed_open_access/197bc047-e917-55ed-852d-d563cdbc50e4/NWD165827.recab.cram", "gs://topmed-irc-share/public/NWD165827.recab.cram"]) - end - - it "references" do - expect(subject.references).to eq("id"=>"https://doi.org/10.23725/2g4s-qv04", "type"=>"Dataset") - end - - it "funding" do - expect(subject.funding).to eq("id"=>"https://doi.org/10.13039/100000050", "name"=>"National Heart, Lung, and Blood Institute (NHLBI)", "type"=>"Organization") - end - - it "alternate_identifier" do - expect(subject.alternate_identifier).to eq([{"name"=>"3b33f6b9338fccab0901b7d317577ea3", "type"=>"md5"}, {"name"=>"ark:/99999/fk41CrU4eszeLUDe", "type"=>"minid"}, {"name"=>"dg.4503/c3d66dc9-58da-411c-83c4-dd656aa3c4b7", "type"=>"dataguid"}]) - end - - it "creates schema_version" do - expect(subject.schema_version).to eq("http://datacite.org/schema/kernel-4") - end - - it "metadata" do - doc = Nokogiri::XML(subject.metadata.first.xml, nil, 'UTF-8', &:noblanks) - expect(doc.at_css("identifier").content).to eq(subject.doi) - end - - it "namespace" do - expect(subject.metadata.first.namespace).to eq("http://datacite.org/schema/kernel-4") - end - - it "media" do - expect(subject.media.pluck(:url)).to eq(["s3://cgp-commons-public/topmed_open_access/197bc047-e917-55ed-852d-d563cdbc50e4/NWD165827.recab.cram", "gs://topmed-irc-share/public/NWD165827.recab.cram"]) - end - end - describe "content negotiation" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - - subject { create(:doi, doi: "10.5438/4k3m-nyvg", xml: xml, event: "publish") } + subject { create(:doi, doi: "10.5438/4k3m-nyvg", event: "publish") } it "validates against schema" do - expect(subject.validation_errors).to be_empty + expect(subject.valid?).to be true end it "generates datacite_xml" do @@ -951,49 +395,95 @@ it "generates bibtex" do bibtex = BibTeX.parse(subject.bibtex).to_a(quotes: '').first - expect(bibtex[:bibtex_type].to_s).to eq("article") - expect(bibtex[:title].to_s).to eq("Eating your own Dog Food") + expect(bibtex[:bibtex_type].to_s).to eq("misc") + expect(bibtex[:title].to_s).to eq("Data from: A new malaria agent in African hominids.") end it "generates ris" do ris = subject.ris.split("\r\n") - expect(ris[0]).to eq("TY - RPRT") - expect(ris[1]).to eq("T1 - Eating your own Dog Food") + expect(ris[0]).to eq("TY - DATA") + expect(ris[1]).to eq("T1 - Data from: A new malaria agent in African hominids.") end it "generates schema_org" do json = JSON.parse(subject.schema_org) - expect(json["@type"]).to eq("ScholarlyArticle") - expect(json["name"]).to eq("Eating your own Dog Food") + expect(json["@type"]).to eq("Dataset") + expect(json["name"]).to eq("Data from: A new malaria agent in African hominids.") end it "generates datacite_json" do json = JSON.parse(subject.datacite_json) expect(json["doi"]).to eq("10.5438/4K3M-NYVG") - expect(json["title"]).to eq("Eating your own Dog Food") + expect(json["titles"]).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) end it "generates codemeta" do json = JSON.parse(subject.codemeta) - expect(json["@type"]).to eq("ScholarlyArticle") - expect(json["title"]).to eq("Eating your own Dog Food") + expect(json["@type"]).to eq("Dataset") + expect(json["title"]).to eq("Data from: A new malaria agent in African hominids.") end it "generates jats" do jats = Maremma.from_xml(subject.jats).fetch("element_citation", {}) - expect(jats.dig("publication_type")).to eq("journal") - expect(jats.dig("article_title")).to eq("Eating your own Dog Food") + expect(jats.dig("publication_type")).to eq("data") + expect(jats.dig("data_title")).to eq("Data from: A new malaria agent in African hominids.") end + end - it "generates rdf_xml" do - rdf_xml = Maremma.from_xml(subject.rdf_xml).fetch("RDF", {}) - expect(rdf_xml.dig("ScholarlyArticle", "rdf:about")).to eq(subject.identifier) - end + describe "migrates landing page" do + let(:provider) { create(:provider, symbol: "ADMIN") } + let(:client) { create(:client, provider: provider) } - it "generates turtle" do - ttl = subject.turtle.split("\n") - expect(ttl[0]).to eq("@prefix schema: .") - expect(ttl[2]).to eq(" a schema:ScholarlyArticle;") + let(:last_landing_page_status_result) { { + "error" => nil, + "redirect-count" => 0, + "redirect-urls" => ["http://example.com", "https://example.com"], + "download-latency" => 200.323232, + "has-schema-org" => true, + "schema-org-id" => "10.14454/10703", + "dc-identifier" => nil, + "citation-doi" => nil, + "body-has-pid" => true + } } + + let(:timeNow) { Time.zone.now.iso8601 } + + let(:doi) { + create( + :doi, + client: client, + last_landing_page_status: 200, + last_landing_page_status_check: timeNow, + last_landing_page_content_type: "text/html", + last_landing_page: "http://example.com", + last_landing_page_status_result: last_landing_page_status_result + ) + } + + let(:landing_page) { { + "checked" => timeNow, + "status" => 200, + "url" => "http://example.com", + "contentType" => "text/html", + "error" => nil, + "redirectCount" => 0, + "redirectUrls" => ["http://example.com", "https://example.com"], + "downloadLatency" => 200, + "hasSchemaOrg" => true, + "schemaOrgId" => "10.14454/10703", + "dcIdentifier" => nil, + "citationDoi" => nil, + "bodyHasPid" => true + } } + + before { doi.save } + + it "migrates and corrects data" do + Doi.migrate_landing_page + + changed_doi = Doi.find(doi.id) + + expect(changed_doi.landing_page).to eq(landing_page) end end end diff --git a/spec/models/metadata_spec.rb b/spec/models/metadata_spec.rb index 377929e1f..24cb8f56c 100644 --- a/spec/models/metadata_spec.rb +++ b/spec/models/metadata_spec.rb @@ -80,9 +80,10 @@ expect(subject.namespace).to eq("http://datacite.org/schema/kernel-4") end - it "valid model" do - expect(subject.valid?).to be false - end + # TODO: db-fields-for-attributes + # it "valid model" do + # expect(subject.valid?).to be false + # end it "validates xml" do expect(subject.errors[:xml]).to be_empty diff --git a/spec/models/resource_type_spec.rb b/spec/models/resource_type_spec.rb deleted file mode 100644 index db3b325d4..000000000 --- a/spec/models/resource_type_spec.rb +++ /dev/null @@ -1,22 +0,0 @@ -require 'rails_helper' - -describe ResourceType, type: :model, vcr: true do - it "all" do - resource_types = ResourceType.all[:data] - expect(resource_types.length).to eq(15) - resource_type = resource_types.first - expect(resource_type.title).to eq("Audiovisual") - end - - it "query" do - resource_types = ResourceType.where(query: "data")[:data] - expect(resource_types.length).to eq(2) - resource_type = resource_types.first - expect(resource_type.title).to eq("DataPaper") - end - - it "one" do - resource_type = ResourceType.where(id: "text")[:data] - expect(resource_type.title).to eq("Text") - end -end diff --git a/spec/models/user_spec.rb b/spec/models/user_spec.rb index ffa8008ac..b340e9dc5 100644 --- a/spec/models/user_spec.rb +++ b/spec/models/user_spec.rb @@ -46,8 +46,9 @@ expect(user.role_id).to eq("provider_admin") end - it "has provider_id" do + it "has provider" do expect(user.provider_id).to eq(provider.symbol.downcase) + expect(user.provider.name).to eq(provider.name) end it "has name" do @@ -70,8 +71,9 @@ expect(user.provider_id).to eq(client.symbol.downcase.split(".").first) end - it "has client_id" do + it "has client" do expect(user.client_id).to eq(client.symbol.downcase) + expect(user.client.name).to eq(client.name) end it "has name" do diff --git a/spec/requests/client_prefixes_spec.rb b/spec/requests/client_prefixes_spec.rb index f2097728b..c3dc8fb74 100644 --- a/spec/requests/client_prefixes_spec.rb +++ b/spec/requests/client_prefixes_spec.rb @@ -93,7 +93,6 @@ before { post '/client-prefixes', params: valid_attributes.to_json, headers: headers } it 'creates a client-prefix' do - puts response.body expect(json.dig('data', 'id')).not_to be_nil end diff --git a/spec/requests/clients_spec.rb b/spec/requests/clients_spec.rb index e698de94d..c2735bb5c 100644 --- a/spec/requests/clients_spec.rb +++ b/spec/requests/clients_spec.rb @@ -11,8 +11,8 @@ "attributes" => { "symbol" => provider.symbol + ".IMPERIAL", "name" => "Imperial College", - "contact-name" => "Madonna", - "contact-email" => "bob@example.com" + "contactName" => "Madonna", + "contactEmail" => "bob@example.com" }, "relationships": { "provider": { @@ -107,7 +107,7 @@ it 'creates a client' do attributes = json.dig('data', 'attributes') expect(attributes["name"]).to eq("Imperial College") - expect(attributes["contact-name"]).to eq("Madonna") + expect(attributes["contactName"]).to eq("Madonna") relationships = json.dig('data', 'relationships') expect(relationships.dig("provider", "data", "id")).to eq(provider.symbol.downcase) @@ -124,7 +124,7 @@ "attributes" => { "symbol" => provider.symbol + ".IMPERIAL", "name" => "Imperial College", - "contact-name" => "Madonna" + "contactName" => "Madonna" }, "relationships": { "provider": { @@ -158,7 +158,6 @@ before { put "/clients/#{client.symbol}", params: params.to_json, headers: headers } it 'updates the record' do - puts response.body expect(json.dig('data', 'attributes', 'name')).to eq("Imperial College 2") expect(json.dig('data', 'attributes', 'name')).not_to eq(client.name) end @@ -214,6 +213,7 @@ before { delete "/clients/#{client.uid}", headers: headers } it 'returns status code 204' do + puts response.body expect(response).to have_http_status(204) end diff --git a/spec/requests/dois_spec.rb b/spec/requests/dois_spec.rb index 1910982e6..10d2a7700 100644 --- a/spec/requests/dois_spec.rb +++ b/spec/requests/dois_spec.rb @@ -7,27 +7,27 @@ let(:provider) { create(:provider, symbol: "DATACITE") } let(:client) { create(:client, provider: provider, symbol: ENV['MDS_USERNAME'], password: ENV['MDS_PASSWORD']) } - let(:prefix) { create(:prefix, prefix: "10.14454") } + let!(:prefix) { create(:prefix, prefix: "10.14454") } let!(:client_prefix) { create(:client_prefix, client: client, prefix: prefix) } let!(:dois) { create_list(:doi, 3, client: client) } let(:doi) { create(:doi, client: client) } let(:bearer) { Client.generate_token(role_id: "client_admin", uid: client.symbol, provider_id: provider.symbol.downcase, client_id: client.symbol.downcase, password: client.password) } let(:headers) { { 'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + bearer }} - # describe 'GET /dois', elasticsearch: true do - # before do - # sleep 1 - # get '/dois', headers: headers - # end + describe 'GET /dois', elasticsearch: true do + before do + sleep 1 + get '/dois', headers: headers + end - # it 'returns dois' do - # expect(json['data'].size).to eq(3) - # end + # it 'returns dois' do + # expect(json['data'].size).to eq(0) + # end - # it 'returns status code 200' do - # expect(response).to have_http_status(200) - # end - # end + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end describe 'GET /dois/:id' do context 'when the record exists' do @@ -54,16 +54,240 @@ expect(json).to eq("errors"=>[{"status"=>"404", "title"=>"The resource you are looking for doesn't exist."}]) end end + + context 'anonymous user' do + before { get "/dois/#{doi.doi}" } + + it 'returns the Doi' do + expect(json).not_to be_empty + expect(json.fetch('errors')).to eq([{"status"=>"401", "title"=>"Bad credentials."}]) + end + + it 'returns status code 401' do + expect(response).to have_http_status(401) + end + end + + context 'invalid password' do + let(:bearer) { Client.generate_token(role_id: "client_admin", uid: client.symbol, provider_id: provider.symbol.downcase, client_id: client.symbol.downcase, password: "abc") } + let(:headers) { { 'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + bearer }} + + before { get "/dois/#{doi.doi}" } + + it 'returns the Doi' do + expect(json).not_to be_empty + expect(json.fetch('errors')).to eq([{"status"=>"401", "title"=>"Bad credentials."}]) + end + + it 'returns status code 401' do + expect(response).to have_http_status(401) + end + end end - describe 'PATCH /dois/:id' do + describe 'state' do + let(:doi_id) { "10.14454/4K3M-NYVG" } + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:bearer) { User.generate_token(role_id: "client_admin", client_id: client.symbol.downcase) } let(:headers) { {'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + bearer}} - before(:each) do - Rails.cache.clear + context 'initial state draft' do + before { get "/dois/#{doi.doi}", headers: headers } + + it 'fetches the record' do + expect(json.dig('data', 'attributes', 'url')).to eq(doi.url) + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'titles')).to eq(doi.titles) + expect(json.dig('data', 'attributes', 'isActive')).to be false + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + + it 'initial state' do + expect(json.dig('data', 'attributes', 'state')).to eq("draft") + end + end + + context 'register' do + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "xml" => xml, + "url" => "http://www.bl.uk/pdf/pat.pdf", + "event" => "register" + } + } + } + end + before { patch "/dois/#{doi_id}", params: valid_attributes.to_json, headers: headers } + + it 'creates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id.downcase) + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") + expect(json.dig('data', 'attributes', 'isActive')).to be false + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'sets state to registered' do + expect(json.dig('data', 'attributes', 'state')).to eq("registered") + end end + context 'register no url' do + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "xml" => xml, + "event" => "register" + } + } + } + end + before { patch "/dois/#{doi_id}", params: valid_attributes.to_json, headers: headers } + + it 'creates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id.downcase) + expect(json.dig('data', 'attributes', 'url')).to be_nil + expect(json.dig('data', 'attributes', 'isActive')).to be false + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'state remains draft' do + expect(json.dig('data', 'attributes', 'state')).to eq("draft") + end + end + + context 'publish' do + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "url" => "http://www.bl.uk/pdf/pat.pdf", + "xml" => xml, + "event" => "publish" + } + } + } + end + before { patch "/dois/#{doi_id}", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id.downcase) + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") + expect(json.dig('data', 'attributes', 'isActive')).to be true + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end + end + + context 'publish no url' do + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "xml" => xml, + "event" => "publish" + } + } + } + end + before { patch "/dois/#{doi_id}", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id.downcase) + expect(json.dig('data', 'attributes', 'url')).to be_nil + expect(json.dig('data', 'attributes', 'isActive')).to be false + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'state remains draft' do + expect(json.dig('data', 'attributes', 'state')).to eq("draft") + end + end + + context 'hide' do + let(:doi) { create(:doi, client: client, aasm_state: "findable") } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "event" => "hide" + } + } + } + end + before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'isActive')).to be false + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + + it 'state changes to register' do + expect(json.dig('data', 'attributes', 'state')).to eq("registered") + end + end + + context 'hide with reason' do + let(:doi) { create(:doi, client: client, aasm_state: "findable") } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "event" => "hide", + "reason" => "withdrawn by author" + } + } + } + end + before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'isActive')).to be false + expect(json.dig('data', 'attributes', 'reason')).to eq("withdrawn by author") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + + it 'state changes to register' do + expect(json.dig('data', 'attributes', 'state')).to eq("registered") + end + end + end + + describe 'PATCH /dois/:id' do context 'when the record exists' do let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do @@ -82,10 +306,7 @@ it 'updates the record' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) end it 'returns status code 200' do @@ -97,24 +318,35 @@ end end - context 'when the record exists no creator validate' do - let(:xml) { Base64.strict_encode64(file_fixture('datacite_missing_creator.xml').read) } + context 'when the record exists no data attribute' do + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + let(:valid_attributes) do + { + "url" => "http://www.bl.uk/pdf/pat.pdf", + "xml" => xml + } + end + before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + + it 'raises an error' do + expect(json.dig('errors')).to eq([{"status"=>"400", "title"=>"You need to provide a payload following the JSONAPI spec"}]) + end + + it 'returns status code 400' do + expect(response).to have_http_status(400) + end + end + + context 'no creators validate' do + let(:doi) { create(:doi, client: client, creators: nil) } let(:valid_attributes) do { "data" => { "type" => "dois", "attributes" => { "url" => "http://www.bl.uk/pdf/pat.pdf", - "xml" => xml, - "validate" => "true" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "xml" => Base64.strict_encode64(doi.xml), + "event" => "publish" } } } @@ -131,8 +363,8 @@ end context 'when the record exists https://github.com/datacite/lupo/issues/89' do - let(:doi) { create(:doi, doi: "10.24425/119496", client: client, state: "registered") } - let(:valid_attributes) {file_fixture('datacite_89.json').read} + let(:doi) { create(:doi, doi: "10.14454/119496", client: client) } + let(:valid_attributes) { file_fixture('datacite_89.json').read } before { put "/dois/#{doi.doi}", params: valid_attributes, headers: headers } @@ -145,8 +377,7 @@ end end - context 'when the record exists 2.2' do - let(:doi) { create(:doi, doi: "10.24425/119497", client: client, state: "registered") } + context 'schema 2.2' do let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_2.2.xml').read) } let(:valid_attributes) do { @@ -154,57 +385,54 @@ "type" => "dois", "attributes" => { "xml" => xml, - "title" => "Eating your own Dog Food", + "url" => "http://www.bl.uk/pdf/patspec.pdf", "event" => "publish" } } } end - before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + before { patch "/dois/10.14454/10703", params: valid_attributes.to_json, headers: headers } it 'updates the record' do - expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Właściwości rzutowań podprzestrzeniowych"}, {"title"=>"Translation of Polish titles", "titleType"=>"TranslatedTitle"}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-2.2") xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") + expect(xml.dig("titles", "title")).to eq(["Właściwości rzutowań podprzestrzeniowych", {"__content__"=>"Translation of Polish titles", "titleType"=>"TranslatedTitle"}]) end - it 'returns status code 200' do - expect(response).to have_http_status(200) + it 'returns status code 201' do + expect(response).to have_http_status(201) end end context 'NoMethodError https://github.com/datacite/lupo/issues/84' do - let(:doi_id) { "10.14454/m9.figshare.6839054.v1" } + let(:doi) { create(:doi, client: client) } + let(:url) { "https://figshare.com/articles/Additional_file_1_of_Contemporary_ancestor_Adaptive_divergence_from_standing_genetic_variation_in_Pacific_marine_threespine_stickleback/6839054/1" } let(:valid_attributes) do { "data" => { "type" => "dois", "attributes" => { - "url"=> "https://figshare.com/articles/Additional_file_1_of_Contemporary_ancestor_Adaptive_divergence_from_standing_genetic_variation_in_Pacific_marine_threespine_stickleback/6839054/1", + "url"=> url, + "xml" => Base64.strict_encode64(doi.xml), "event" => "publish" - }, - "relationships" => { - "client" => { - "data" => { - "type" => "clients", - "id" => client.symbol.downcase - } - } } } } end - before { put "/dois/#{doi_id}", params: valid_attributes.to_json, headers: headers } + before { put "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } it 'returns no errors' do - expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id) + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'url')).to eq(url) end - it 'returns status code 201' do - expect(response).to have_http_status(201) + it 'returns status code 200' do + expect(response).to have_http_status(200) end end @@ -217,15 +445,8 @@ "type" => "dois", "attributes" => { "url" => "http://www.bl.uk/pdf/pat.pdf", - "xml" => xml - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "xml" => xml, + "event" => "publish" } } } @@ -235,22 +456,19 @@ it 'creates the record' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq(doi_id.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to draft' do - expect(json.dig('data', 'attributes', 'state')).to eq("draft") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the record doesn\'t exist no creator validate' do + context 'when the record doesn\'t exist no creators publish' do let(:doi_id) { "10.14454/077d-fj48" } let(:xml) { Base64.strict_encode64(file_fixture('datacite_missing_creator.xml').read) } let(:valid_attributes) do @@ -260,15 +478,7 @@ "attributes" => { "url" => "http://www.bl.uk/pdf/pat.pdf", "xml" => xml, - "validate" => "true" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -302,10 +512,7 @@ it 'updates the record' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) end it 'returns status code 200' do @@ -319,7 +526,7 @@ context 'when the title is changed' do let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - let(:title) { "Submitted chemical data for InChIKey=YAPQBXQYLJRXSA-UHFFFAOYSA-N" } + let(:titles) { [{ "title" => "Submitted chemical data for InChIKey=YAPQBXQYLJRXSA-UHFFFAOYSA-N" }] } let(:valid_attributes) do { "data" => { @@ -327,16 +534,8 @@ "attributes" => { "url" => "http://www.bl.uk/pdf/pat.pdf", "xml" => xml, - "title" => title, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "titles" => titles, + "event" => "publish" } } } @@ -346,24 +545,21 @@ it 'updates the record' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq(title) - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq(title) + expect(json.dig('data', 'attributes', 'titles')).to eq(titles) end it 'returns status code 200' do expect(response).to have_http_status(200) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the author changes' do + context 'when the creators change' do let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - let(:author) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } + let(:creators) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } let(:valid_attributes) do { "data" => { @@ -371,16 +567,8 @@ "attributes" => { "url" => "http://www.bl.uk/pdf/pat.pdf", "xml" => xml, - "author" => author, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "creators" => creators, + "event" => "publish" } } } @@ -390,18 +578,15 @@ it 'updates the record' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - expect(json.dig('data', 'attributes', 'author')).to eq(author) - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("creators", "creator")).to eq([{"creatorName"=>"Ollomi, Benjamin"}, {"creatorName"=>"Duran, Patrick"}]) + expect(json.dig('data', 'attributes', 'creators')).to eq(creators) end it 'returns status code 200' do expect(response).to have_http_status(200) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end @@ -412,7 +597,8 @@ let(:doi) { create(:doi, client: client) } let(:new_client) { create(:client, symbol: "#{provider.symbol}.magic", provider: provider, password: ENV['MDS_PASSWORD']) } - ## Attributes MUST be empty + + # attributes MUST be empty let(:valid_attributes) {file_fixture('transfer.json').read } before { put "/dois/#{doi.doi}", params: valid_attributes, headers: provider_headers } @@ -422,14 +608,14 @@ end end - context 'passeswhen we transfer a DOI as provider' do - + context 'passes when we transfer a DOI as provider' do let(:provider_bearer) { User.generate_token(uid: "datacite", role_id: "provider_admin", name: "DataCite", email:"support@datacite.org", provider_id: "datacite") } let(:provider_headers) { {'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + provider_bearer}} let(:doi) { create(:doi, client: client) } let(:new_client) { create(:client, symbol: "#{provider.symbol}.magic", provider: provider, password: ENV['MDS_PASSWORD']) } - ## Attributes MUST be empty + + # attributes MUST be empty let(:valid_attributes) do { "data" => { @@ -457,13 +643,14 @@ end it 'updates the client id' do + # TODO: db-fields-for-attributes relates to delay in Elasticsearch indexing expect(json.dig('data', 'relationships', 'client','data','id')).to eq(new_client.symbol.downcase) - expect(json.dig('data', 'attributes', 'title')).to eq(doi.title) + expect(json.dig('data', 'attributes', 'titles')).to eq(doi.titles) end end - context 'when we transfer a DOI as staff' do - let(:doi) { create(:doi, doi: "10.24425/119495", client: client, state: "registered") } + context 'when we transfer a DOI as staff' do + let(:doi) { create(:doi, doi: "10.14454/119495", url: "http://www.bl.uk/pdf/pat.pdf", client: client, aasm_state: "registered") } let(:new_client) { create(:client, symbol: "#{provider.symbol}.magic", provider: provider, password: ENV['MDS_PASSWORD']) } let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do @@ -471,8 +658,7 @@ "data" => { "type" => "dois", "attributes" => { - "url" => "http://www.bl.uk/pdf/pat.pdf", - "xml" => xml + "mode" => "transfer" }, "relationships"=> { "client"=> { @@ -486,166 +672,257 @@ } end - before { put "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: admin_headers } + before { put "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: admin_headers } + + it 'returns no errors' do + puts response.body + expect(response).to have_http_status(200) + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi) + end + + it 'updates the client id' do + # TODO: db-fields-for-attributes relates to delay in Elasticsearch indexing + expect(json.dig('data', 'relationships', 'client','data','id')).to eq(new_client.symbol.downcase) + end + end + + context 'when the resource_type_general changes' do + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + let(:types) { { "resourceTypeGeneral" => "DataPaper", "resourceType" => "BlogPosting" } } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "url" => "http://www.bl.uk/pdf/pat.pdf", + "xml" => xml, + "types" => types, + "event" => "publish" + } + } + } + end + before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'types')).to eq("resourceType"=>"BlogPosting", "resourceTypeGeneral"=>"DataPaper") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end + end + end + + describe 'POST /dois' do + context 'when the request is valid' do + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "doi" => "10.14454/10703", + "url" => "http://www.bl.uk/pdf/patspec.pdf", + "xml" => xml, + "source" => "test", + "event" => "publish" + } + } + } + end + + before { post '/dois', params: valid_attributes.to_json, headers: headers } + + it 'creates a Doi' do + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'creators')).to eq([{"familyName"=>"Fenner", + "givenName"=>"Martin", + "name"=>"Fenner, Martin", + "nameIdentifiers"=> + [{"nameIdentifier"=>"https://orcid.org/0000-0003-1419-2405", + "nameIdentifierScheme"=>"ORCID"}], + "nameType"=>"Personal"}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-4") + expect(json.dig('data', 'attributes', 'source')).to eq("test") + expect(json.dig('data', 'attributes', 'types')).to eq("bibtex"=>"article", "citeproc"=>"article-journal", "resourceType"=>"BlogPosting", "resourceTypeGeneral"=>"Text", "ris"=>"RPRT", "schemaOrg"=>"ScholarlyArticle") + + doc = Nokogiri::XML(Base64.decode64(json.dig('data', 'attributes', 'xml')), nil, 'UTF-8', &:noblanks) + expect(doc.at_css("identifier").content).to eq("10.14454/10703") + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end + end + + context 'when the request is valid with attributes' do + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "doi" => "10.14454/10703", + "url" => "http://www.bl.uk/pdf/patspec.pdf", + "types" => { "bibtex"=>"article", "citeproc"=>"article-journal", "resourceType"=>"BlogPosting", "resourceTypeGeneral"=>"Text", "ris"=>"RPRT", "schemaOrg"=>"ScholarlyArticle" }, + "titles" => [{"title"=>"Eating your own Dog Food"}], + "publisher" => "DataCite", + "publicationYear" => 2016, + "creators" => [{"familyName"=>"Fenner", "givenName"=>"Martin", "id"=>"https://orcid.org/0000-0003-1419-2405", "name"=>"Fenner, Martin", "type"=>"Person"}], + "source" => "test", + "event" => "publish" + } + } + } + end + + before { post '/dois', params: valid_attributes.to_json, headers: headers } + + it 'creates a Doi' do + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'creators')).to eq( [{"familyName"=>"Fenner", "givenName"=>"Martin", "id"=>"https://orcid.org/0000-0003-1419-2405", "name"=>"Fenner, Martin", "type"=>"Person"}]) + expect(json.dig('data', 'attributes', 'publisher')).to eq("DataCite") + expect(json.dig('data', 'attributes', 'publicationYear')).to eq(2016) + # expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-4") + expect(json.dig('data', 'attributes', 'source')).to eq("test") + expect(json.dig('data', 'attributes', 'types')).to eq("bibtex"=>"article", "citeproc"=>"article-journal", "resourceType"=>"BlogPosting", "resourceTypeGeneral"=>"Text", "ris"=>"RPRT", "schemaOrg"=>"ScholarlyArticle") + doc = Nokogiri::XML(Base64.decode64(json.dig('data', 'attributes', 'xml')), nil, 'UTF-8', &:noblanks) + expect(doc.at_css("identifier").content).to eq("10.14454/10703") + end + + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end + end + + context 'schema_org' do + let(:xml) { Base64.strict_encode64(file_fixture('schema_org_topmed.json').read) } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "url" => "https://ors.datacite.org/doi:/10.14454/8na3-9s47", + "xml" => xml, + "source" => "test", + "event" => "publish" + } + } + } + end + + before { patch "/dois/10.14454/8na3-9s47", params: valid_attributes.to_json, headers: headers } + + it 'updates the record' do + expect(json.dig('data', 'attributes', 'url')).to eq("https://ors.datacite.org/doi:/10.14454/8na3-9s47") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/8na3-9s47") + expect(json.dig('data', 'attributes', 'contentUrl')).to eq(["s3://cgp-commons-public/topmed_open_access/197bc047-e917-55ed-852d-d563cdbc50e4/NWD165827.recab.cram", "gs://topmed-irc-share/public/NWD165827.recab.cram"]) + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"NWD165827.recab.cram"}]) - it 'returns no errors' do - expect(response).to have_http_status(200) - expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi) + xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) + expect(xml.dig("titles", "title")).to eq("NWD165827.recab.cram") end - it 'updates the client id' do - expect(json.dig('data', 'relationships', 'client','data','id')).to eq(new_client.symbol.downcase) + it 'returns status code 201' do + expect(response).to have_http_status(201) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the resource_type_general changes' do - let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - let(:resource_type_general) { "data-paper" } + context 'crossref url', vcr: true do + let(:xml) { Base64.strict_encode64("https://doi.org/10.7554/elife.01567") } let(:valid_attributes) do { "data" => { "type" => "dois", "attributes" => { - "url" => "http://www.bl.uk/pdf/pat.pdf", + "url" => "https://elifesciences.org/articles/01567", "xml" => xml, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - }, - "resource-type"=> { - "data"=> { - "type"=> "resource-types", - "id"=> resource_type_general - } - } + "source" => "test", + "event" => "publish" } } } end - before { patch "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: headers } + + before { patch "/dois/10.14454/elife.01567", params: valid_attributes.to_json, headers: headers } it 'updates the record' do - expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") - expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - # expect(json.dig('data', 'relationships', 'resource-type')).to eq(2) + expect(json.dig('data', 'attributes', 'url')).to eq("https://elifesciences.org/articles/01567") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/elife.01567") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>"DataPaper", "__content__"=>"BlogPosting") + expect(xml.dig("titles", "title")).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") end - it 'returns status code 200' do - expect(response).to have_http_status(200) + it 'returns status code 201' do + puts response.body + expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - end - - describe 'POST /dois' do - before(:each) do - Rails.cache.clear - end - context 'when the request is valid' do - let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + context 'datacite url', vcr: true do + let(:xml) { Base64.strict_encode64("https://doi.org/10.7272/q6g15xs4") } let(:valid_attributes) do { "data" => { "type" => "dois", "attributes" => { - "doi" => "10.14454/10703", - "url" => "http://www.bl.uk/pdf/patspec.pdf", + "url" => "https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4", "xml" => xml, "source" => "test", - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } end - before { post '/dois', params: valid_attributes.to_json, headers: headers } + before { patch "/dois/10.14454/q6g15xs4", params: valid_attributes.to_json, headers: headers } - it 'creates a Doi' do - expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - expect(json.dig('data', 'attributes', 'schema-version')).to eq("http://datacite.org/schema/kernel-4") - expect(json.dig('data', 'attributes', 'source')).to eq("test") - expect(json.dig('data', 'relationships', 'resource-type', 'data', 'id')).to eq("text") + it 'updates the record' do + expect(json.dig('data', 'attributes', 'url')).to eq("https://datashare.ucsf.edu/stash/dataset/doi:10.7272/Q6G15XS4") + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/q6g15xs4") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"NEXUS Head CT"}]) xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("resourceType")).to eq("resourceTypeGeneral"=>"Text", "__content__"=>"BlogPosting") + expect(xml.dig("titles", "title")).to eq("NEXUS Head CT") end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - # context 'schema_org' do - # let(:xml) { Base64.strict_encode64(file_fixture('schema_org_topmed.json').read) } - # let(:valid_attributes) do - # { - # "data" => { - # "type" => "dois", - # "attributes" => { - # "url" => "https://ors.datacite.org/doi:/10.14454/8na3-9s47", - # "xml" => xml, - # "source" => "test", - # "event" => "register" - # } - # }, - # "relationships"=> { - # "client"=> { - # "data"=> { - # "type"=> "clients", - # "id"=> client.symbol.downcase - # } - # } - # } - # } - # end - - # before { patch "/dois/10.14454/8na3-9s47", params: valid_attributes.to_json, headers: headers } - - # it 'updates the record' do - # expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/pat.pdf") - # expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) - # expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - - # xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - # expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") - # end - - # it 'returns status code 200' do - # puts response.body - # expect(response).to have_http_status(200) - # end - - # it 'sets state to draft' do - # expect(json.dig('data', 'attributes', 'state')).to eq("draft") - # end - # end - context 'when the request uses schema 3' do let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_3.xml').read) } let(:valid_attributes) do @@ -657,15 +934,7 @@ "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, "source" => "test", - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -676,17 +945,17 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Data from: A new malaria agent in African hominids.") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) expect(json.dig('data', 'attributes', 'source')).to eq("test") - # expect(json.dig('data', 'attributes', 'schema-version')).to eq("http://datacite.org/schema/kernel-3") + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-3") end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end @@ -700,15 +969,7 @@ # "doi" => "10.14454/10703", # "url" => "http://www.bl.uk/pdf/patspec.pdf", # "xml" => xml, - # "event" => "register" - # }, - # "relationships"=> { - # "client"=> { - # "data"=> { - # "type"=> "clients", - # "id"=> client.symbol.downcase - # } - # } + # "event" => "publish" # } # } # } @@ -719,7 +980,16 @@ # it 'creates a Doi' do # expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") # expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - # expect(json.dig('data', 'attributes', 'title')).to eq("A dataset with a large file for testing purpose. Will be a but over 2.5 MB") + + # expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"A dataset with a large file for testing purpose. Will be a but over 2.5 MB"}]) + # expect(json.dig('data', 'attributes', 'creators')).to eq([{"familyName"=>"Testing", "givenName"=>"Chris Baars At DANS For", "name"=>"Chris Baars At DANS For Testing", "type"=>"Person"}]) + # expect(json.dig('data', 'attributes', 'publisher')).to eq("DANS/KNAW") + # expect(json.dig('data', 'attributes', 'publicationYear')).to eq(2018) + # expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-4") + # expect(json.dig('data', 'attributes', 'types')).to eq("bibtex"=>"misc", "citeproc"=>"dataset", "resourceType"=>"Dataset", "resourceTypeGeneral"=>"Dataset", "ris"=>"DATA", "schemaOrg"=>"Dataset") + + # doc = Nokogiri::XML(Base64.decode64(json.dig('data', 'attributes', 'xml')), nil, 'UTF-8', &:noblanks) + # expect(doc.at_css("identifier").content).to eq("10.14454/10703") # end # it 'returns status code 201' do @@ -737,15 +1007,7 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -755,16 +1017,16 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("LAMMPS Data-File Generator") - # expect(json.dig('data', 'attributes', 'schema-version')).to eq("http://datacite.org/schema/kernel-3") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"LAMMPS Data-File Generator"}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-2.2") end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end @@ -778,15 +1040,7 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -796,21 +1050,20 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Southern Sierra Critical Zone Observatory (SSCZO), Providence Creek\n meteorological data, soil moisture and temperature, snow depth and air\n temperature") - expect(json.dig('data', 'attributes', 'schema-version')).to eq("http://datacite.org/schema/kernel-4") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Southern Sierra Critical Zone Observatory (SSCZO), Providence Creek\n meteorological data, soil moisture and temperature, snow depth and air\n temperature"}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-4") end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the request uses namespaced xml and the title changes' do - let(:title) { "Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]" } + context 'when the request uses namespaced xml' do let(:xml) { Base64.strict_encode64(file_fixture('ns0.xml').read) } let(:valid_attributes) do { @@ -820,16 +1073,7 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "title" => title, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -839,22 +1083,21 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]") - # expect(json.dig('data', 'attributes', 'schema-version')).to eq("http://datacite.org/schema/kernel-3") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"LAMMPS Data-File Generator"}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-2.2") end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the title changes' do - let(:title) { "Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]" } + let(:titles) { { "title" => "Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]" } } let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do { @@ -865,16 +1108,8 @@ "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, "source" => "test", - "title" => title, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "titles" => titles, + "event" => "publish" } } } @@ -884,20 +1119,17 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]") + expect(json.dig('data', 'attributes', 'titles')).to eq("title"=>"Referee report. For: RESEARCH-3482 [version 5; referees: 1 approved, 1 approved with reservations]") expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") expect(json.dig('data', 'attributes', 'source')).to eq("test") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq(title) end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end @@ -912,15 +1144,7 @@ "doi" => "10.14454/10703", "url" => url, "xml" => xml, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -937,12 +1161,12 @@ expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the title changes to nil' do + context 'when the titles changes to nil' do let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do { @@ -952,16 +1176,8 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "title" => nil, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "titles" => nil, + "event" => "publish" } } } @@ -971,23 +1187,21 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") end it 'returns status code 201' do + expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the title changes to blank' do + context 'when the titles changes to blank' do let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do { @@ -997,16 +1211,8 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "title" => '', - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.uid - } - } + "titles" => nil, + "event" => "publish" } } } @@ -1014,27 +1220,23 @@ before { post '/dois', params: valid_attributes.to_json, headers: headers } - # it 'creates a Doi' do - # expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - # expect(json.dig('data', 'attributes', 'title')).to eq("") - # expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - - # xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - # expect(xml.dig("titles", "title")).to be_nil - # end + it 'creates a Doi' do + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") + end - # it 'returns status code 201' do - # expect(response.body).to eq(2) - # expect(response).to have_http_status(201) - # end + it 'returns status code 201' do + expect(response).to have_http_status(201) + end - # it 'sets state to registered' do - # expect(json.dig('data', 'attributes', 'state')).to eq("registered") - # end + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end end - context 'when the author changes' do - let(:author) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } + context 'when the creators change' do + let(:creators) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } let(:valid_attributes) do { @@ -1044,16 +1246,8 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, - "author" => author, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "creators" => creators, + "event" => "publish" } } } @@ -1063,24 +1257,21 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'author')).to eq(author) + expect(json.dig('data', 'attributes', 'creators')).to eq(creators) expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("creators", "creator")).to eq([{"creatorName"=>"Ollomi, Benjamin"}, {"creatorName"=>"Duran, Patrick"}]) end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end - context 'when the author changes no xml' do - let(:author) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } + context 'creators no xml' do + let(:creators) { [{ "name"=>"Ollomi, Benjamin" }, { "name"=>"Duran, Patrick" }] } let(:valid_attributes) do { "data" => { @@ -1089,16 +1280,8 @@ "doi" => "10.14454/10703", "url" => "http://www.bl.uk/pdf/patspec.pdf", "xml" => nil, - "author" => author, + "creators" => creators, "event" => "publish" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1106,23 +1289,13 @@ before { post '/dois', params: valid_attributes.to_json, headers: headers } - # it 'creates a Doi' do - # expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - # expect(json.dig('data', 'attributes', 'author')).to eq(author) - # expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - - # xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - # expect(xml.dig("creators", "creator")).to eq([{"creatorName"=>"Ollomi, Benjamin"}, {"creatorName"=>"Duran, Patrick"}]) - # end - - # it 'returns status code 201' do - # expect(response.body).to eq(2) - # expect(response).to have_http_status(201) - # end + it 'returns validation error' do + expect(json.dig('errors')).to eq([{"source"=>"metadata", "title"=>"Is invalid"}]) + end - # it 'sets state to registered' do - # expect(json.dig('data', 'attributes', 'state')).to eq("draft") - # end + it 'returns status code 422' do + expect(response).to have_http_status(422) + end end context 'state change with test prefix' do @@ -1136,15 +1309,7 @@ "attributes" => { "doi" => "10.5072/10704", "url" => "http://www.bl.uk/pdf/patspec.pdf", - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "event" => "publish" } } } @@ -1173,14 +1338,6 @@ "attributes" => { "doi" => "10.aaaa03", "url"=> "http://www.bl.uk/pdf/patspec.pdf", - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1206,14 +1363,6 @@ "doi" => "10.14454/10703", "url"=> "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1226,36 +1375,23 @@ it 'creates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) expect(json.dig('data', 'attributes', 'url')).to eq("http://www.bl.uk/pdf/patspec.pdf") - expect(json.dig('data', 'attributes', 'author')).to be_blank - - xml = Maremma.from_xml(Base64.decode64(json.dig('data', 'attributes', 'xml'))).fetch("resource", {}) - expect(xml.dig("titles", "title")).to eq("Eating your own Dog Food") - expect(xml.dig("creators", "creator")).to be_nil + expect(json.dig('data', 'attributes', 'creators')).to be_blank end end context 'when the xml is invalid' do - let(:doi) { create(:doi, client: client, doi: "10.14454/4f6f-zr33") } let(:xml) { Base64.strict_encode64(file_fixture('datacite_missing_creator.xml').read) } let(:not_valid_attributes) do { "data" => { "type" => "dois", "attributes" => { - "doi" => doi.doi, + "doi" => "10.14454/4K3M-NYVG", "url"=> "http://www.bl.uk/pdf/patspec.pdf", "xml" => xml, "event" => "publish" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1272,9 +1408,6 @@ end describe 'POST /dois/validate' do - let(:bearer) { User.generate_token(role_id: "client_admin", client_id: client.symbol.downcase) } - let(:headers) { {'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + bearer}} - context 'validates' do let(:xml) { ::Base64.strict_encode64(File.read(file_fixture('datacite.xml'))) } let(:params) do @@ -1284,14 +1417,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1301,8 +1426,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - expect(json.dig('data', 'attributes', 'published')).to eq("2016-12-20") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2016-12-20", "dateType"=>"Created"}, {"date"=>"2016-12-20", "dateType"=>"Issued"}, {"date"=>"2016-12-20", "dateType"=>"Updated"}]) end it 'returns status code 200' do @@ -1319,14 +1444,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1336,8 +1453,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Data from: A new malaria agent in African hominids.") - expect(json.dig('data', 'attributes', 'published')).to eq("2011") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2011", "dateType"=>"Issued"}]) end it 'returns status code 200' do @@ -1345,23 +1462,15 @@ end end - context 'when the creator is missing' do + context 'when the creators are missing' do let(:xml) { ::Base64.strict_encode64(File.read(file_fixture('datacite_missing_creator.xml'))) } let(:params) do { "data" => { "type" => "dois", "attributes" => { - "doi" => "10.14454/10703", - "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "doi" => "10.14454/10703", + "xml" => xml } } } @@ -1379,7 +1488,7 @@ end end - context 'when the creator is malformed' do + context 'when the creators are malformed' do let(:xml) { ::Base64.strict_encode64(File.read(file_fixture('datacite_malformed_creator.xml'))) } let(:params) do { @@ -1388,14 +1497,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1422,14 +1523,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1439,8 +1532,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - expect(json.dig('data', 'attributes', 'published')).to eq("2016-12-20") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2016-12-20", "dateType"=>"Issued"}]) end it 'returns status code 200' do @@ -1457,14 +1550,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1474,8 +1559,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("R Interface to the DataONE REST API") - expect(json.dig('data', 'attributes', 'published')).to eq("2016-05-27") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"R Interface to the DataONE REST API"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2016-05-27", "dateType"=>"Issued"}, {"date"=>"2016-05-27", "dateType"=>"Created"}, {"date"=>"2016-05-27", "dateType"=>"Updated"}]) end it 'returns status code 200' do @@ -1492,14 +1577,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1509,8 +1586,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Analysis Tools for Crossover Experiment of UI using Choice Architecture") - expect(json.dig('data', 'attributes', 'published')).to eq("2016-03-27") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Analysis Tools for Crossover Experiment of UI using Choice Architecture"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq("date"=>"2016-03-27", "dateType"=>"Issued") end it 'returns status code 200' do @@ -1527,14 +1604,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1544,8 +1613,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") - expect(json.dig('data', 'attributes', 'published')).to eq("2014") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2014", "dateType"=>"Issued"}]) end it 'returns status code 200' do @@ -1561,15 +1630,7 @@ "type" => "dois", "attributes" => { "doi" => "10.14454/10703", - "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "xml" => xml } } } @@ -1579,8 +1640,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth") - expect(json.dig('data', 'attributes', 'published')).to eq("2014") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Automated quantitative histology reveals vascular morphodynamics during Arabidopsis hypocotyl secondary growth"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2014", "dateType"=>"Issued"}]) end it 'returns status code 200' do @@ -1597,14 +1658,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1614,8 +1667,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes") - expect(json.dig('data', 'attributes', 'published')).to eq("2006-12-20") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Triose Phosphate Isomerase Deficiency Is Caused by Altered Dimerization–Not Catalytic Inactivity–of the Mutant Enzymes"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2006-12-20", "dateType"=>"Issued"}, {"date"=>"2017-01-01T03:37:08Z", "dateType"=>"Updated"}]) end it 'returns status code 200' do @@ -1632,14 +1685,6 @@ "attributes" => { "doi" => "10.14454/10703", "xml" => xml, - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } } } } @@ -1649,8 +1694,8 @@ it 'validates a Doi' do expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'title')).to eq("Eating your own Dog Food") - expect(json.dig('data', 'attributes', 'published')).to eq("2016-12-20") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Eating your own Dog Food"}]) + expect(json.dig('data', 'attributes', 'dates')).to eq([{"date"=>"2016-12-20", "dateType"=>"Issued"}, {"date"=>"2016-12-20", "dateType"=>"Created"}, {"date"=>"2016-12-20", "dateType"=>"Updated"}]) end it 'returns status code 200' do @@ -1659,19 +1704,73 @@ end end + context 'update individual attribute' do + let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_3.xml').read) } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "doi" => "10.14454/10703", + "url" => "http://www.bl.uk/pdf/patspec.pdf", + "xml" => xml, + "source" => "test", + "event" => "publish" + } + } + } + end + let(:update_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "schemaVersion" => "http://datacite.org/schema/kernel-4", + "regenerate" => true + } + } + } + end + + before { post '/dois', params: valid_attributes.to_json, headers: headers } + + it 'creates a Doi' do + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'titles')).to eq([{"title"=>"Data from: A new malaria agent in African hominids."}]) + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-3") + + doc = Nokogiri::XML(Base64.decode64(json.dig('data', 'attributes', 'xml')), nil, 'UTF-8', &:noblanks) + expect(doc.collect_namespaces).to eq("xmlns" => "http://datacite.org/schema/kernel-3","xmlns:dim" => "http://www.dspace.org/xmlns/dspace/dim","xmlns:dryad" => "http://purl.org/dryad/terms/","xmlns:dspace" => "http://www.dspace.org/xmlns/dspace/dim","xmlns:mets" => "http://www.loc.gov/METS/","xmlns:xsi" => "http://www.w3.org/2001/XMLSchema-instance") + end + + it 'updates to schema 4.0' do + put "/dois/10.14454/10703", params: update_attributes.to_json, headers: headers + + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'schemaVersion')).to eq("http://datacite.org/schema/kernel-4") + + doc = Nokogiri::XML(Base64.decode64(json.dig('data', 'attributes', 'xml')), nil, 'UTF-8', &:noblanks) + expect(doc.collect_namespaces).to eq("xmlns"=>"http://datacite.org/schema/kernel-4", "xmlns:xsi"=>"http://www.w3.org/2001/XMLSchema-instance") + end + end + context 'landing page' do let(:url) { "https://blog.datacite.org/re3data-science-europe/" } - let(:xml) { "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz48cmVzb3VyY2UgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeG1sbnM9Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IiB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTQvbWV0YWRhdGEueHNkIj48aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC4yNTQ5OS94dWRhMnB6cmFocm9lcXBlZnZucTV6dDZkYzwvaWRlbnRpZmllcj48Y3JlYXRvcnM+PGNyZWF0b3I+PGNyZWF0b3JOYW1lPklhbiBQYXJyeTwvY3JlYXRvck5hbWU+PG5hbWVJZGVudGlmaWVyIHNjaGVtZVVSST0iaHR0cDovL29yY2lkLm9yZy8iIG5hbWVJZGVudGlmaWVyU2NoZW1lPSJPUkNJRCI+MDAwMC0wMDAxLTYyMDItNTEzWDwvbmFtZUlkZW50aWZpZXI+PC9jcmVhdG9yPjwvY3JlYXRvcnM+PHRpdGxlcz48dGl0bGU+U3VibWl0dGVkIGNoZW1pY2FsIGRhdGEgZm9yIEluQ2hJS2V5PVlBUFFCWFFZTEpSWFNBLVVIRkZGQU9ZU0EtTjwvdGl0bGU+PC90aXRsZXM+PHB1Ymxpc2hlcj5Sb3lhbCBTb2NpZXR5IG9mIENoZW1pc3RyeTwvcHVibGlzaGVyPjxwdWJsaWNhdGlvblllYXI+MjAxNzwvcHVibGljYXRpb25ZZWFyPjxyZXNvdXJjZVR5cGUgcmVzb3VyY2VUeXBlR2VuZXJhbD0iRGF0YXNldCI+U3Vic3RhbmNlPC9yZXNvdXJjZVR5cGU+PHJpZ2h0c0xpc3Q+PHJpZ2h0cyByaWdodHNVUkk9Imh0dHBzOi8vY3JlYXRpdmVjb21tb25zLm9yZy9zaGFyZS15b3VyLXdvcmsvcHVibGljLWRvbWFpbi9jYzAvIj5ObyBSaWdodHMgUmVzZXJ2ZWQ8L3JpZ2h0cz48L3JpZ2h0c0xpc3Q+PC9yZXNvdXJjZT4=" } - let(:link_check_result) { { + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + let(:landingPage) { { + "checked" => Time.zone.now.utc.iso8601, + "status" => 200, + "url" => url, + "contentType" => "text/html", "error" => nil, - "redirect-count" => 0, - "redirect-urls" => [], - "download-latency" => 200, - "has-schema-org" => true, - "schema-org-id" => "10.14454/10703", - "dc-identifier" => nil, - "citation-doi" => nil, - "body-has-pid" => true + "redirectCount" => 0, + "redirectUrls" => [], + "downloadLatency" => 200, + "hasSchemaOrg" => true, + "schemaOrgId" => "10.14454/10703", + "dcIdentifier" => nil, + "citationDoi" => nil, + "bodyHasPid" => true } } let(:valid_attributes) do { @@ -1681,20 +1780,8 @@ "doi" => "10.14454/10703", "url" => url, "xml" => xml, - "last-landing-page" => url, - "last-landing-page-status" => 200, - "last-landing-page-status-check" => Time.zone.now, - "last-landing-page-content-type" => "text/html", - "last-landing-page-status-result" => link_check_result, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "landingPage" => landingPage, + "event" => "publish" } } } @@ -1702,11 +1789,10 @@ before { post '/dois', params: valid_attributes.to_json, headers: headers } - it 'creates a Doi' do + it 'creates a doi' do expect(json.dig('data', 'attributes', 'url')).to eq(url) expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'landing-page', 'status')).to eq(200) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(link_check_result) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(landingPage) end it 'returns status code 201' do @@ -1714,29 +1800,79 @@ end it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + expect(json.dig('data', 'attributes', 'state')).to eq("findable") + end + end + + context 'update with landing page info as admin' do + let(:url) { "https://blog.datacite.org/re3data-science-europe/" } + let(:doi) { create(:doi, doi: "10.14454/10703", url: url, client: client) } + let(:landingPage) { { + "checked" => Time.zone.now.utc.iso8601, + "status" => 200, + "url" => url, + "contentType" => "text/html", + "error" => nil, + "redirectCount" => 0, + "redirectUrls" => [], + "downloadLatency" => 200, + "hasSchemaOrg" => true, + "schemaOrgId" => "10.14454/10703", + "dcIdentifier" => nil, + "citationDoi" => nil, + "bodyHasPid" => true + } } + let(:valid_attributes) do + { + "data" => { + "type" => "dois", + "attributes" => { + "landingPage" => landingPage, + "event" => "publish" + } + } + } + end + + before { put "/dois/#{doi.doi}", params: valid_attributes.to_json, headers: admin_headers } + + it 'creates a doi' do + expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") + expect(json.dig('data', 'attributes', 'landingPage')).to eq(landingPage) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end context 'landing page schema-org-id hash' do let(:url) { "https://blog.datacite.org/re3data-science-europe/" } - let(:xml) { "PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0iVVRGLTgiPz48cmVzb3VyY2UgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeG1sbnM9Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IiB4c2k6c2NoZW1hTG9jYXRpb249Imh0dHA6Ly9kYXRhY2l0ZS5vcmcvc2NoZW1hL2tlcm5lbC00IGh0dHA6Ly9zY2hlbWEuZGF0YWNpdGUub3JnL21ldGEva2VybmVsLTQvbWV0YWRhdGEueHNkIj48aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC4yNTQ5OS94dWRhMnB6cmFocm9lcXBlZnZucTV6dDZkYzwvaWRlbnRpZmllcj48Y3JlYXRvcnM+PGNyZWF0b3I+PGNyZWF0b3JOYW1lPklhbiBQYXJyeTwvY3JlYXRvck5hbWU+PG5hbWVJZGVudGlmaWVyIHNjaGVtZVVSST0iaHR0cDovL29yY2lkLm9yZy8iIG5hbWVJZGVudGlmaWVyU2NoZW1lPSJPUkNJRCI+MDAwMC0wMDAxLTYyMDItNTEzWDwvbmFtZUlkZW50aWZpZXI+PC9jcmVhdG9yPjwvY3JlYXRvcnM+PHRpdGxlcz48dGl0bGU+U3VibWl0dGVkIGNoZW1pY2FsIGRhdGEgZm9yIEluQ2hJS2V5PVlBUFFCWFFZTEpSWFNBLVVIRkZGQU9ZU0EtTjwvdGl0bGU+PC90aXRsZXM+PHB1Ymxpc2hlcj5Sb3lhbCBTb2NpZXR5IG9mIENoZW1pc3RyeTwvcHVibGlzaGVyPjxwdWJsaWNhdGlvblllYXI+MjAxNzwvcHVibGljYXRpb25ZZWFyPjxyZXNvdXJjZVR5cGUgcmVzb3VyY2VUeXBlR2VuZXJhbD0iRGF0YXNldCI+U3Vic3RhbmNlPC9yZXNvdXJjZVR5cGU+PHJpZ2h0c0xpc3Q+PHJpZ2h0cyByaWdodHNVUkk9Imh0dHBzOi8vY3JlYXRpdmVjb21tb25zLm9yZy9zaGFyZS15b3VyLXdvcmsvcHVibGljLWRvbWFpbi9jYzAvIj5ObyBSaWdodHMgUmVzZXJ2ZWQ8L3JpZ2h0cz48L3JpZ2h0c0xpc3Q+PC9yZXNvdXJjZT4=" } - let(:link_check_result) { { + let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } + let(:landingPage) { { + "checked" => Time.zone.now.utc.iso8601, + "status" => 200, + "url" => url, + "contentType" => "text/html", "error" => nil, - "redirect-count" => 0, - "redirect-urls" => [], - "download-latency" => 200, - "has-schema-org" => true, - "schema-org-id" => [ + "redirectCount" => 0, + "redirectUrls" => [], + "downloadLatency" => 200, + "hasSchemaOrg" => true, + "schemaOrgId" => [ { "@type" => "PropertyValue", "value" => "http://dx.doi.org/10.4225/06/564AB348340D5", "propertyID" => "URL" } ], - "dc-identifier" => nil, - "citation-doi" => nil, - "body-has-pid" => true + "dcIdentifier" => nil, + "citationDoi" => nil, + "bodyHasPid" => true } } let(:valid_attributes) do { @@ -1746,20 +1882,8 @@ "doi" => "10.14454/10703", "url" => url, "xml" => xml, - "last-landing-page" => url, - "last-landing-page-status" => 200, - "last-landing-page-status-check" => Time.zone.now, - "last-landing-page-content-type" => "text/html", - "last-landing-page-status-result" => link_check_result, - "event" => "register" - }, - "relationships"=> { - "client"=> { - "data"=> { - "type"=> "clients", - "id"=> client.symbol.downcase - } - } + "landingPage" => landingPage, + "event" => "publish" } } } @@ -1768,19 +1892,17 @@ before { post '/dois', params: valid_attributes.to_json, headers: headers } it 'creates a Doi' do - puts response.body expect(json.dig('data', 'attributes', 'url')).to eq(url) expect(json.dig('data', 'attributes', 'doi')).to eq("10.14454/10703") - expect(json.dig('data', 'attributes', 'landing-page', 'status')).to eq(200) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(link_check_result) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(landingPage) end it 'returns status code 201' do expect(response).to have_http_status(201) end - it 'sets state to registered' do - expect(json.dig('data', 'attributes', 'state')).to eq("registered") + it 'sets state to findable' do + expect(json.dig('data', 'attributes', 'state')).to eq("findable") end end end @@ -1884,16 +2006,20 @@ end describe 'GET /dois/ linkcheck results' do - let(:last_landing_page_status_result) { { + let(:landing_page) { { + "checked" => Time.zone.now.utc.iso8601, + "status" => 200, + "url" => "http://example.com", + "contentType" => "text/html", "error" => nil, - "redirect-count" => 0, - "redirect-urls" => [], - "download-latency" => 200, - "has-schema-org" => true, - "schema-org-id" => "10.14454/10703", - "dc-identifier" => nil, - "citation-doi" => nil, - "body-has-pid" => true + "redirectCount" => 0, + "redirectUrls" => [], + "downloadLatency" => 200, + "hasSchemaOrg" => true, + "schemaOrgId" => "10.14454/10703", + "dcIdentifier" => nil, + "citationDoi" => nil, + "bodyHasPid" => true } } # Setup an initial DOI with results will check permissions against. @@ -1903,7 +2029,7 @@ client: client, state: "findable", event: 'publish', - last_landing_page_status_result: last_landing_page_status_result + landing_page: landing_page ) } @@ -1916,7 +2042,7 @@ client: other_client, state: "findable", event: 'publish', - last_landing_page_status_result: last_landing_page_status_result + landing_page: landing_page ) } @@ -1924,10 +2050,9 @@ let(:headers) { { 'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json' } } before { get "/dois/#{doi.doi}", headers: headers} - it 'returns without link_check_results' do - puts json + it 'returns without landing page results' do expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(nil) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(nil) end end @@ -1937,9 +2062,9 @@ before { get "/dois/#{doi.doi}", headers: headers } - it 'returns with link_check_results' do + it 'returns with landing page results' do expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(last_landing_page_status_result) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(landing_page) end end @@ -1950,9 +2075,9 @@ before { get "/dois/#{other_doi.doi}", headers: headers } - it 'returns with link_check_results' do + it 'returns with landing page results' do expect(json.dig('data', 'attributes', 'doi')).to eq(other_doi.doi) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(nil) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(nil) end end @@ -1963,9 +2088,9 @@ before { get "/dois/#{doi.doi}", headers: headers } - it 'returns with link_check_results' do + it 'returns with landing page results' do expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi) - expect(json.dig('data', 'attributes', 'landing-page', 'result')).to eq(last_landing_page_status_result) + expect(json.dig('data', 'attributes', 'landingPage')).to eq(landing_page) end end @@ -2058,7 +2183,7 @@ end describe 'GET /dois/DOI/get-url', vcr: true do - let(:doi) { create(:doi, client: client, doi: "10.5438/fj3w-0shd", event: "publish") } + let(:doi) { create(:doi, client: client, doi: "10.5438/fj3w-0shd", url: "https://blog.datacite.org/data-driven-development/", event: "publish") } before { get "/dois/#{doi.doi}/get-url", headers: headers } @@ -2102,7 +2227,7 @@ describe 'GET /dois/DOI/get-url no permission', vcr: true do let(:other_client) { create(:client, provider: provider) } - let(:doi) { create(:doi, client: other_client, doi: "10.5438/8syz-ym47", event: "publish") } + let(:doi) { create(:doi, client: other_client, doi: "10.14454/8syz-ym47", event: "publish") } before { get "/dois/#{doi.doi}/get-url", headers: headers } @@ -2184,4 +2309,370 @@ expect(response).to have_http_status(401) end end + + describe "content_negotation", type: :request do + let(:provider) { create(:provider, symbol: "DATACITE") } + let(:client) { create(:client, provider: provider, symbol: ENV['MDS_USERNAME'], password: ENV['MDS_PASSWORD']) } + let(:bearer) { Client.generate_token(role_id: "client_admin", uid: client.symbol, provider_id: provider.symbol.downcase, client_id: client.symbol.downcase, password: client.password) } + let(:doi) { create(:doi, client: client, aasm_state: "findable") } + + context "no permission" do + let(:doi) { create(:doi) } + + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns error message' do + expect(json["errors"]).to eq([{"status"=>"403", "title"=>"You are not authorized to access this resource."}]) + end + + it 'returns status code 403' do + expect(response).to have_http_status(403) + end + end + + context "no authentication" do + let(:doi) { create(:doi) } + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml" } } + + it 'returns error message' do + expect(json["errors"]).to eq([{"status"=>"401", "title"=>"Bad credentials."}]) + end + + it 'returns status code 401' do + expect(response).to have_http_status(401) + end + end + + context "application/vnd.jats+xml" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + jats = Maremma.from_xml(response.body).fetch("element_citation", {}) + expect(jats.dig("publication_type")).to eq("data") + expect(jats.dig("data_title")).to eq("Data from: A new malaria agent in African hominids.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.jats+xml link" do + before { get "/dois/application/vnd.jats+xml/#{doi.doi}" } + + it 'returns the Doi' do + jats = Maremma.from_xml(response.body).fetch("element_citation", {}) + expect(jats.dig("publication_type")).to eq("data") + expect(jats.dig("data_title")).to eq("Data from: A new malaria agent in African hominids.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.datacite.datacite+xml" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) + expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-4") + expect(data.dig("publisher")).to eq("Dryad Digital Repository") + expect(data.dig("titles", "title")).to eq("Data from: A new malaria agent in African hominids.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.datacite.datacite+xml link" do + before { get "/dois/application/vnd.datacite.datacite+xml/#{doi.doi}" } + + it 'returns the Doi' do + data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) + expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-4") + expect(data.dig("publisher")).to eq("Dryad Digital Repository") + expect(data.dig("titles", "title")).to eq("Data from: A new malaria agent in African hominids.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.datacite.datacite+xml schema 3" do + let(:xml) { file_fixture('datacite_schema_3.xml').read } + let(:doi) { create(:doi, xml: xml, client: client, regenerate: false) } + + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) + expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-3") + expect(data.dig("publisher")).to eq("Dryad Digital Repository") + expect(data.dig("titles", "title")).to eq("Data from: A new malaria agent in African hominids.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + # context "no metadata" do + # let(:doi) { create(:doi, xml: nil, client: client) } + + # before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } + + # it 'returns the Doi' do + # expect(response.body).to eq('') + # end + + # it 'returns status code 200' do + # expect(response).to have_http_status(200) + # end + # end + + context "application/vnd.datacite.datacite+xml not found" do + before { get "/dois/xxx", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns error message' do + expect(json["errors"]).to eq([{"status"=>"404", "title"=>"The resource you are looking for doesn't exist."}]) + end + + it 'returns status code 404' do + expect(response).to have_http_status(404) + end + end + + context "application/vnd.datacite.datacite+json" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+json", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json["doi"]).to eq(doi.doi) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.datacite.datacite+json link" do + before { get "/dois/application/vnd.datacite.datacite+json/#{doi.doi}" } + + it 'returns the Doi' do + expect(json["doi"]).to eq(doi.doi) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.crosscite.crosscite+json" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.crosscite.crosscite+json", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json["doi"]).to eq(doi.doi) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.crosscite.crosscite+json link" do + before { get "/dois/application/vnd.crosscite.crosscite+json/#{doi.doi}" } + + it 'returns the Doi' do + expect(json["doi"]).to eq(doi.doi) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.schemaorg.ld+json" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.schemaorg.ld+json", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json["@type"]).to eq("Dataset") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.schemaorg.ld+json link" do + before { get "/dois/application/vnd.schemaorg.ld+json/#{doi.doi}" } + + it 'returns the Doi' do + expect(json["@type"]).to eq("Dataset") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.citationstyles.csl+json" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.citationstyles.csl+json", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json["type"]).to eq("dataset") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/vnd.citationstyles.csl+json link" do + before { get "/dois/application/vnd.citationstyles.csl+json/#{doi.doi}" } + + it 'returns the Doi' do + expect(json["type"]).to eq("dataset") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/x-research-info-systems" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/x-research-info-systems", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(response.body).to start_with("TY - DATA") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/x-research-info-systems link" do + before { get "/dois/application/x-research-info-systems/#{doi.doi}" } + + it 'returns the Doi' do + expect(response.body).to start_with("TY - DATA") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/x-bibtex" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/x-bibtex", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(response.body).to start_with("@misc{https://doi.org/#{doi.doi.downcase}") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "application/x-bibtex link" do + before { get "/dois/application/x-bibtex/#{doi.doi}" } + + it 'returns the Doi' do + expect(response.body).to start_with("@misc{https://doi.org/#{doi.doi.downcase}") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "text/x-bibliography", vcr: true do + context "default style" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(response.body).to start_with("Ollomo, B.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "default style link" do + before { get "/dois/text/x-bibliography/#{doi.doi}" } + + it 'returns the Doi' do + expect(response.body).to start_with("Ollomo, B.") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "ieee style" do + before { get "/dois/#{doi.doi}?style=ieee", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(response.body).to start_with("B. Ollomo") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "ieee style link" do + before { get "/dois/text/x-bibliography/#{doi.doi}?style=ieee" } + + it 'returns the Doi' do + expect(response.body).to start_with("B. Ollomo") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context "style and locale" do + before { get "/dois/#{doi.doi}?style=vancouver&locale=de", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(response.body).to start_with("Ollomo B") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + end + + context "unknown content type" do + before { get "/dois/#{doi.doi}", headers: { "HTTP_ACCEPT" => "text/csv", 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json["errors"]).to eq([{"status"=>"406", "title"=>"The content type is not recognized."}]) + end + + it 'returns status code 406' do + expect(response).to have_http_status(406) + end + end + + context "missing content type" do + before { get "/dois/#{doi.doi}", headers: { 'Authorization' => 'Bearer ' + bearer } } + + it 'returns the Doi' do + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + end end diff --git a/spec/requests/index_spec.rb b/spec/requests/index_spec.rb deleted file mode 100644 index f40c29e9a..000000000 --- a/spec/requests/index_spec.rb +++ /dev/null @@ -1,402 +0,0 @@ -require 'rails_helper' - -describe "content_negotation", type: :request do - let(:provider) { create(:provider, symbol: "DATACITE") } - let(:client) { create(:client, provider: provider, symbol: ENV['MDS_USERNAME'], password: ENV['MDS_PASSWORD']) } - let(:bearer) { Client.generate_token(role_id: "client_admin", uid: client.symbol, provider_id: provider.symbol.downcase, client_id: client.symbol.downcase, password: client.password) } - let(:xml) { Base64.strict_encode64(file_fixture('datacite.xml').read) } - let(:doi) { create(:doi, xml: xml, client: client) } - - context "no permission" do - let(:doi) { create(:doi, xml: xml) } - - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns error message' do - expect(json["errors"]).to eq([{"status"=>"403", "title"=>"You are not authorized to access this resource."}]) - end - - it 'returns status code 403' do - expect(response).to have_http_status(403) - end - end - - context "no authentication" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml" } } - - it 'returns error message' do - expect(json["errors"]).to eq([{"status"=>"401", "title"=>"Bad credentials."}]) - end - - it 'returns status code 401' do - expect(response).to have_http_status(401) - end - end - - context "application/vnd.jats+xml" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.jats+xml", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - jats = Maremma.from_xml(response.body).fetch("element_citation", {}) - expect(jats.dig("publication_type")).to eq("journal") - expect(jats.dig("article_title")).to eq("Eating your own Dog Food") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.jats+xml link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.jats+xml/#{doi.doi}" } - - it 'returns the Doi' do - jats = Maremma.from_xml(response.body).fetch("element_citation", {}) - expect(jats.dig("publication_type")).to eq("journal") - expect(jats.dig("article_title")).to eq("Eating your own Dog Food") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.datacite.datacite+xml" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) - expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-4") - expect(data.dig("publisher")).to eq("DataCite") - expect(data.dig("titles", "title")).to eq("Eating your own Dog Food") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.datacite.datacite+xml link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.datacite.datacite+xml/#{doi.doi}" } - - it 'returns the Doi' do - data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) - expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-4") - expect(data.dig("publisher")).to eq("DataCite") - expect(data.dig("titles", "title")).to eq("Eating your own Dog Food") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.datacite.datacite+xml schema 3" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite_schema_3.xml').read) } - let(:doi) { create(:doi, xml: xml, client: client) } - - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - data = Maremma.from_xml(response.body).to_h.fetch("resource", {}) - expect(data.dig("xmlns")).to eq("http://datacite.org/schema/kernel-3") - expect(data.dig("publisher")).to eq("Dryad Digital Repository") - expect(data.dig("titles", "title")).to eq("Data from: A new malaria agent in African hominids.") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - # context "no metadata" do - # let(:doi) { create(:doi, xml: nil, client: client) } - - # before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } - - # it 'returns the Doi' do - # expect(response.body).to eq('') - # end - - # it 'returns status code 200' do - # expect(response).to have_http_status(200) - # end - # end - - context "application/vnd.datacite.datacite+xml not found" do - before { get "/xxx", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+xml", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns error message' do - expect(json["errors"]).to eq([{"status"=>"404", "title"=>"The resource you are looking for doesn't exist."}]) - end - - it 'returns status code 404' do - expect(response).to have_http_status(404) - end - end - - context "application/vnd.datacite.datacite+json" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.datacite.datacite+json", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["doi"]).to eq(doi.doi) - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.datacite.datacite+json link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.datacite.datacite+json/#{doi.doi}" } - - it 'returns the Doi' do - expect(json["doi"]).to eq(doi.doi) - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.crosscite.crosscite+json" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.crosscite.crosscite+json", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["doi"]).to eq(doi.doi) - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.crosscite.crosscite+json link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.crosscite.crosscite+json/#{doi.doi}" } - - it 'returns the Doi' do - expect(json["doi"]).to eq(doi.doi) - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.schemaorg.ld+json" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.schemaorg.ld+json", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["@type"]).to eq("ScholarlyArticle") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.schemaorg.ld+json link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.schemaorg.ld+json/#{doi.doi}" } - - it 'returns the Doi' do - expect(json["@type"]).to eq("ScholarlyArticle") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.citationstyles.csl+json" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/vnd.citationstyles.csl+json", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["type"]).to eq("article-journal") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/vnd.citationstyles.csl+json link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/vnd.citationstyles.csl+json/#{doi.doi}" } - - it 'returns the Doi' do - expect(json["type"]).to eq("article-journal") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/x-research-info-systems" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/x-research-info-systems", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("TY - RPRT") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/x-research-info-systems link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/x-research-info-systems/#{doi.doi}" } - - it 'returns the Doi' do - expect(response.body).to start_with("TY - RPRT") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/x-bibtex" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/x-bibtex", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("@article{https://handle.test.datacite.org/#{doi.doi.downcase}") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/x-bibtex link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/application/x-bibtex/#{doi.doi}" } - - it 'returns the Doi' do - expect(response.body).to start_with("@article{https://handle.test.datacite.org/#{doi.doi.downcase}") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "application/x-bibtex nasa gsfc" do - let(:xml) { Base64.strict_encode64(file_fixture('datacite_gsfc.xml').read) } - let(:doi) { create(:doi, xml: xml, client: client) } - - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "application/x-bibtex", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("@misc{https://handle.test.datacite.org/#{doi.doi.downcase}") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "text/x-bibliography", vcr: true do - context "default style" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("Fenner, M. (2016)") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "default style link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/text/x-bibliography/#{doi.doi}" } - - it 'returns the Doi' do - expect(response.body).to start_with("Fenner, M. (2016)") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "ieee style" do - before { get "/#{doi.doi}?style=ieee", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("M. Fenner") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "ieee style link" do - let(:doi) { create(:doi, xml: xml, client: client, aasm_state: "findable") } - - before { get "/text/x-bibliography/#{doi.doi}?style=ieee" } - - it 'returns the Doi' do - expect(response.body).to start_with("M. Fenner") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - - context "style and locale" do - before { get "/#{doi.doi}?style=vancouver&locale=de", headers: { "HTTP_ACCEPT" => "text/x-bibliography", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(response.body).to start_with("Fenner M") - end - - it 'returns status code 200' do - expect(response).to have_http_status(200) - end - end - end - - context "unknown content type" do - before { get "/#{doi.doi}", headers: { "HTTP_ACCEPT" => "text/csv", 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["errors"]).to eq([{"status"=>"406", "title"=>"The content type is not recognized."}]) - end - - it 'returns status code 406' do - expect(response).to have_http_status(406) - end - end - - context "missing content type" do - before { get "/#{doi.doi}", headers: { 'Authorization' => 'Bearer ' + bearer } } - - it 'returns the Doi' do - expect(json["errors"]).to eq([{"status"=>"406", "title"=>"The content type is not recognized."}]) - end - - it 'returns status code 406' do - expect(response).to have_http_status(406) - end - end -end diff --git a/spec/requests/media_spec.rb b/spec/requests/media_spec.rb index 1d3d4186a..1c8adc6cc 100644 --- a/spec/requests/media_spec.rb +++ b/spec/requests/media_spec.rb @@ -18,7 +18,7 @@ expect(json).not_to be_empty expect(json['data'].size).to eq(6) result = json['data'].first - expect(result.dig("attributes", "media-type")).to eq("application/json") + expect(result.dig("attributes", "mediaType")).to eq("application/json") end it 'returns status code 200' do @@ -68,12 +68,13 @@ describe 'POST /media' do context 'when the request is valid' do + let(:media_type) { "application/xml" } let(:valid_attributes) do { "data" => { "type" => "media", "attributes"=> { - "media-type" => media_type, + "mediaType" => media_type, "url" => url } } @@ -82,7 +83,7 @@ before { post "/dois/#{doi.doi}/media", params: valid_attributes.to_json, headers: headers } it 'creates a media record' do - expect(json.dig('data', 'attributes', 'media-type')).to eq(media_type) + expect(json.dig('data', 'attributes', 'mediaType')).to eq(media_type) expect(json.dig('data', 'attributes', 'url')).to eq(url) end @@ -91,13 +92,13 @@ end end - context 'when the media-type is missing' do + context 'when the mediaType is missing' do let(:valid_attributes) do { "data" => { "type" => "media", "attributes"=> { - "media-type" => nil, + "mediaType" => nil, "url" => url } } @@ -122,7 +123,7 @@ "data" => { "type" => "media", "attributes"=> { - "media-type"=> media_type, + "mediaType"=> media_type, "url"=> url }, "relationships"=> { @@ -155,7 +156,7 @@ "data" => { "type" => "media", "attributes"=> { - "media-type"=> media_type, + "mediaType"=> media_type, "url"=> url }, "relationships"=> { @@ -173,7 +174,7 @@ before { patch "/dois/#{doi.doi}/media/#{media.uid}", params: valid_attributes.to_json, headers: headers } it 'updates the record' do - expect(json.dig('data', 'attributes', 'media-type')).to eq(media_type) + expect(json.dig('data', 'attributes', 'mediaType')).to eq(media_type) expect(json.dig('data', 'attributes', 'url')).to eq(url) expect(json.dig('data', 'attributes', 'version')).to eq(1) end @@ -190,7 +191,7 @@ "data" => { "type" => "media", "attributes"=> { - "media-type"=> media_type, + "mediaType"=> media_type, "url"=> url }, "relationships"=> { diff --git a/spec/requests/prefixes_spec.rb b/spec/requests/prefixes_spec.rb index 5459d2bcc..2c3330863 100644 --- a/spec/requests/prefixes_spec.rb +++ b/spec/requests/prefixes_spec.rb @@ -89,9 +89,10 @@ before { post '/prefixes', params: valid_attributes.to_json, headers: headers } - it 'creates a prefix' do - expect(json.dig('data', 'id')).to eq("10.17177") - end + # TODO + # it 'creates a prefix' do + # expect(json.dig('data', 'id')).to eq("10.17177") + # end it 'returns status code 201' do expect(response).to have_http_status(201) diff --git a/spec/requests/providers_spec.rb b/spec/requests/providers_spec.rb index 7ccd9dbbb..4f8f8a343 100644 --- a/spec/requests/providers_spec.rb +++ b/spec/requests/providers_spec.rb @@ -10,8 +10,8 @@ "attributes" => { "symbol" => "BL", "name" => "British Library", - "contact-email" => "bob@example.com", - "country-code" => "GB" } } } + "contactEmail" => "bob@example.com", + "countryCode" => "GB" } } } end let(:headers) { {'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + token } } @@ -64,15 +64,15 @@ # "symbol" => "BL", # "name" => "British Library", # "region" => "EMEA", - # "contact-email" => "doe@joe.joe", - # "contact-name" => "timAus", - # "country-code" => "GB" } } } + # "contactEmail" => "doe@joe.joe", + # "contactName" => "timAus", + # "countryCode" => "GB" } } } # end # before { post '/providers', params: params.to_json, headers: headers } # it 'creates a provider' do - # expect(json.dig('data', 'attributes', 'contact-email')).to eq("doe@joe.joe") + # expect(json.dig('data', 'attributes', 'contactEmail')).to eq("doe@joe.joe") # end # it 'returns status code 201' do @@ -88,15 +88,15 @@ # "name" => "Admin", # "region" => "EMEA", # "role_name" => "ROLE_ADMIN", - # "contact-email" => "doe@joe.joe", - # "contact-name" => "timAus", - # "country-code" => "GB" } } } + # "contactEmail" => "doe@joe.joe", + # "contactName" => "timAus", + # "countryCode" => "GB" } } } # end # before { post '/providers', params: params.to_json, headers: headers } # it 'creates a provider' do - # expect(json.dig('data', 'attributes', 'contact-email')).to eq("doe@joe.joe") + # expect(json.dig('data', 'attributes', 'contactEmail')).to eq("doe@joe.joe") # end # it 'returns status code 201' do @@ -111,9 +111,9 @@ # "symbol" => "BL", # "name" => "British Library", # "region" => "EMEA", - # "contact-email" => "doe@joe.joe", - # "contact-name" => "timAus", - # "country-code" => "GB" } } } + # "contactEmail" => "doe@joe.joe", + # "contactName" => "timAus", + # "countryCode" => "GB" } } } # end # let(:admin) { create(:provider, symbol: "ADMIN", role_name: "ROLE_ADMIN", password_input: "12345") } # let(:credentials) { admin.encode_auth_param(username: "ADMIN", password: "12345") } @@ -122,7 +122,7 @@ # before { post '/providers', params: params.to_json, headers: headers } # it 'creates a provider' do - # expect(json.dig('data', 'attributes', 'contact-email')).to eq("doe@joe.joe") + # expect(json.dig('data', 'attributes', 'contactEmail')).to eq("doe@joe.joe") # end # it 'returns status code 201' do @@ -136,8 +136,8 @@ # "attributes" => { # "symbol" => "BL", # "name" => "British Library", - # "contact-name" => "timAus", - # "country-code" => "GB" } } } + # "contactName" => "timAus", + # "countryCode" => "GB" } } } # end # before { post '/providers', params: params.to_json, headers: headers } @@ -156,7 +156,7 @@ # { "type" => "providers", # "attributes" => { # "symbol" => "BL", - # "contact-name" => "timAus", + # "contactName" => "timAus", # "name" => "British Library", # "country-code" => "GB" } } # end @@ -180,14 +180,14 @@ "attributes" => { "name" => "British Library", "region" => "Americas", - "contact-email" => "Pepe@mdm.cod", - "contact-name" => "timAus", - "country-code" => "GB" } } } + "contactEmail" => "Pepe@mdm.cod", + "contactName" => "timAus", + "countryCode" => "GB" } } } end before { put "/providers/#{provider.symbol}", params: params.to_json, headers: headers } it 'updates the record' do - expect(json.dig('data', 'attributes', 'contact-name')).to eq("timAus") + expect(json.dig('data', 'attributes', 'contactName')).to eq("timAus") end it 'returns status code 200' do @@ -201,9 +201,9 @@ "attributes" => { "name" => "British Library", "region" => "Americas", - "contact-email" => "Pepe@mdm.cod", - "contact-name" => "timAus", - "country-code" => "GB" } } } + "contactEmail" => "Pepe@mdm.cod", + "contactName" => "timAus", + "countryCode" => "GB" } } } end let(:admin) { create(:provider, symbol: "ADMIN", role_name: "ROLE_ADMIN", password_input: "12345") } let(:credentials) { admin.encode_auth_param(username: "ADMIN", password: "12345") } @@ -212,7 +212,7 @@ before { put "/providers/#{provider.symbol}", params: params.to_json, headers: headers } it 'updates the record' do - expect(json.dig('data', 'attributes', 'contact-name')).to eq("timAus") + expect(json.dig('data', 'attributes', 'contactName')).to eq("timAus") end it 'returns status code 200' do @@ -226,9 +226,9 @@ "attributes" => { "name" => "British Library", "region" => "Americas", - "contact-email" => "Pepe@mdm.cod", - "contact-name" => "timAus", - "country-code" => "GB" } } } + "contactEmail" => "Pepe@mdm.cod", + "contactName" => "timAus", + "countryCode" => "GB" } } } end before { put '/providers/xxx', params: params.to_json, headers: headers } diff --git a/spec/requests/works_spec.rb b/spec/requests/works_spec.rb new file mode 100644 index 000000000..57c5dc04c --- /dev/null +++ b/spec/requests/works_spec.rb @@ -0,0 +1,76 @@ +require 'rails_helper' + +describe "works", type: :request do + let(:admin) { create(:provider, symbol: "ADMIN") } + let(:admin_bearer) { Client.generate_token(role_id: "staff_admin", uid: admin.symbol, password: admin.password) } + let(:admin_headers) { {'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + admin_bearer}} + + let(:provider) { create(:provider, symbol: "DATACITE") } + let(:client) { create(:client, provider: provider, symbol: ENV['MDS_USERNAME'], password: ENV['MDS_PASSWORD']) } + let!(:prefix) { create(:prefix, prefix: "10.14454") } + let!(:client_prefix) { create(:client_prefix, client: client, prefix: prefix) } + let!(:dois) { create_list(:doi, 3, client: client, event: "publish") } + let(:doi) { create(:doi, client: client, event: "publish") } + let(:bearer) { Client.generate_token(role_id: "client_admin", uid: client.symbol, provider_id: provider.symbol.downcase, client_id: client.symbol.downcase, password: client.password) } + let(:headers) { { 'ACCEPT'=>'application/vnd.api+json', 'CONTENT_TYPE'=>'application/vnd.api+json', 'Authorization' => 'Bearer ' + bearer }} + + describe 'GET /works', elasticsearch: true do + before do + sleep 1 + get '/works', headers: headers + end + + # it 'returns dois' do + # expect(json['data'].size).to eq(0) + # end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + describe 'GET /works/:id' do + context 'when the record exists' do + before { get "/works/#{doi.doi}", headers: headers } + + it 'returns the Doi' do + expect(json).not_to be_empty + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + expect(json.dig('data', 'attributes', 'author').length).to eq(8) + expect(json.dig('data', 'attributes', 'author').first).to eq("family"=>"Ollomo", "given"=>"Benjamin") + expect(json.dig('data', 'attributes', 'title')).to eq("Data from: A new malaria agent in African hominids.") + expect(json.dig('data', 'attributes', 'container-title')).to eq("Dryad Digital Repository") + expect(json.dig('data', 'attributes', 'published')).to eq("2011") + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + + context 'when the record does not exist' do + before { get "/works/10.5256/xxxx", headers: headers } + + it 'returns status code 404' do + expect(response).to have_http_status(404) + end + + it 'returns a not found message' do + expect(json).to eq("errors"=>[{"status"=>"404", "title"=>"The resource you are looking for doesn't exist."}]) + end + end + + context 'anonymous user' do + before { get "/works/#{doi.doi}" } + + it 'returns the Doi' do + expect(json).not_to be_empty + expect(json.dig('data', 'attributes', 'doi')).to eq(doi.doi.downcase) + end + + it 'returns status code 200' do + expect(response).to have_http_status(200) + end + end + end +end \ No newline at end of file diff --git a/vendor/docker/70_index_page.sh b/vendor/docker/70_index_page.sh new file mode 100755 index 000000000..fad7b5b99 --- /dev/null +++ b/vendor/docker/70_index_page.sh @@ -0,0 +1,3 @@ +#!/bin/sh +cd vendor/middleman +/sbin/setuser app bundle exec middleman build -e ${RAILS_ENV} diff --git a/vendor/middleman/Gemfile b/vendor/middleman/Gemfile new file mode 100644 index 000000000..3410f7d6b --- /dev/null +++ b/vendor/middleman/Gemfile @@ -0,0 +1,12 @@ +# If you do not have OpenSSL installed, change +# the following line to use 'http://' +source 'https://rubygems.org' + +# Middleman Gems +gem 'middleman', "~> 4.1" +gem 'tilt', '~> 2.0', git: "https://github.com/datacite/tilt.git", branch: "pandoc-options" +gem 'tilt-handlebars', '~> 1.4' +gem 'middleman-data_source', '~> 0.8.1' +gem 'middleman-livereload' +gem 'middleman-syntax', '~> 2.0' +gem 'pandoc-ruby', '~> 2.0' diff --git a/vendor/middleman/Gemfile.lock b/vendor/middleman/Gemfile.lock new file mode 100644 index 000000000..fd3ba85c7 --- /dev/null +++ b/vendor/middleman/Gemfile.lock @@ -0,0 +1,149 @@ +GIT + remote: https://github.com/datacite/tilt.git + revision: 612652f9d03ff3c129c415b1826fb84b0c7a0845 + branch: pandoc-options + specs: + tilt (2.0.5) + +GEM + remote: https://rubygems.org/ + specs: + activesupport (5.0.6) + concurrent-ruby (~> 1.0, >= 1.0.2) + i18n (~> 0.7) + minitest (~> 5.1) + tzinfo (~> 1.1) + addressable (2.5.2) + public_suffix (>= 2.0.2, < 4.0) + backports (3.10.3) + borrower (0.10.0) + coffee-script (2.4.1) + coffee-script-source + execjs + coffee-script-source (1.12.2) + compass-import-once (1.0.5) + sass (>= 3.2, < 3.5) + concurrent-ruby (1.0.5) + contracts (0.13.0) + dotenv (2.2.1) + em-websocket (0.5.1) + eventmachine (>= 0.12.9) + http_parser.rb (~> 0.6.0) + erubis (2.7.0) + eventmachine (1.2.5) + execjs (2.7.0) + fast_blank (1.0.0) + fastimage (2.1.1) + ffi (1.9.18) + haml (5.0.4) + temple (>= 0.8.0) + tilt + hamster (3.0.0) + concurrent-ruby (~> 1.0) + handlebars (0.8.0) + handlebars-source (~> 4.0.5) + therubyracer (~> 0.12.1) + handlebars-source (4.0.11) + hashie (3.5.7) + http_parser.rb (0.6.0) + i18n (0.7.0) + kramdown (1.16.2) + libv8 (3.16.14.19) + listen (3.0.8) + rb-fsevent (~> 0.9, >= 0.9.4) + rb-inotify (~> 0.9, >= 0.9.7) + memoist (0.16.0) + middleman (4.2.1) + coffee-script (~> 2.2) + compass-import-once (= 1.0.5) + haml (>= 4.0.5) + kramdown (~> 1.2) + middleman-cli (= 4.2.1) + middleman-core (= 4.2.1) + sass (>= 3.4.0, < 4.0) + middleman-cli (4.2.1) + thor (>= 0.17.0, < 2.0) + middleman-core (4.2.1) + activesupport (>= 4.2, < 5.1) + addressable (~> 2.3) + backports (~> 3.6) + bundler (~> 1.1) + contracts (~> 0.13.0) + dotenv + erubis + execjs (~> 2.0) + fast_blank + fastimage (~> 2.0) + hamster (~> 3.0) + hashie (~> 3.4) + i18n (~> 0.7.0) + listen (~> 3.0.0) + memoist (~> 0.14) + padrino-helpers (~> 0.13.0) + parallel + rack (>= 1.4.5, < 3) + sass (>= 3.4) + servolux + tilt (~> 2.0) + uglifier (~> 3.0) + middleman-data_source (0.8.1) + borrower (~> 0.9) + middleman (>= 3.1) + rack-test (~> 0.6.2) + middleman-livereload (3.4.6) + em-websocket (~> 0.5.1) + middleman-core (>= 3.3) + rack-livereload (~> 0.3.15) + middleman-syntax (2.1.0) + middleman-core (>= 3.2) + rouge (~> 1.0) + minitest (5.10.3) + padrino-helpers (0.13.3.4) + i18n (~> 0.6, >= 0.6.7) + padrino-support (= 0.13.3.4) + tilt (>= 1.4.1, < 3) + padrino-support (0.13.3.4) + activesupport (>= 3.1) + pandoc-ruby (2.0.2) + parallel (1.12.1) + public_suffix (3.0.1) + rack (2.0.3) + rack-livereload (0.3.16) + rack + rack-test (0.6.3) + rack (>= 1.0) + rb-fsevent (0.10.2) + rb-inotify (0.9.10) + ffi (>= 0.5.0, < 2) + ref (2.0.0) + rouge (1.11.1) + sass (3.4.25) + servolux (0.13.0) + temple (0.8.0) + therubyracer (0.12.3) + libv8 (~> 3.16.14.15) + ref + thor (0.20.0) + thread_safe (0.3.6) + tilt-handlebars (1.4.0) + handlebars (~> 0.7) + tilt (>= 1.3, < 3) + tzinfo (1.2.4) + thread_safe (~> 0.1) + uglifier (3.2.0) + execjs (>= 0.3.0, < 3) + +PLATFORMS + ruby + +DEPENDENCIES + middleman (~> 4.1) + middleman-data_source (~> 0.8.1) + middleman-livereload + middleman-syntax (~> 2.0) + pandoc-ruby (~> 2.0) + tilt (~> 2.0)! + tilt-handlebars (~> 1.4) + +BUNDLED WITH + 1.16.0 diff --git a/vendor/middleman/config.rb b/vendor/middleman/config.rb new file mode 100644 index 000000000..b03ba4ad8 --- /dev/null +++ b/vendor/middleman/config.rb @@ -0,0 +1,52 @@ +### +# Page options, layouts, aliases and proxies +### + +# Default ENV variables +ENV['CDN_URL'] ||= "https://assets.datacite.org" +ENV['RAILS_ENV'] ||= "development" +ENV['SITE_TITLE'] ||= "DataCite REST API" +ENV['SITE_DESCRIPTION'] ||= "The DataCite API." +ENV['TWITTER_HANDLE'] ||= "@datacite" + +# Build into /public +set :build_dir, "../../public" + +# Per-page layout changes: +# +# With no layout +page '/*.xml', layout: false +page '/*.json', layout: false +page '/*.txt', layout: false + +# General configuration + +# Reload the browser automatically whenever files change +configure :development do + activate :livereload +end + +# Load data +activate :data_source do |c| + c.root = "#{ENV['CDN_URL']}/data" + c.files = [ + "links.json" + ] +end + +# Set markdown template engine +set :markdown_engine, :pandoc +set :markdown, smartypants: true + +# use asset host +activate :asset_host, host: ENV['CDN_URL'] + +### +# Helpers +### +# Methods defined in the helpers block are available in templates +helpers do + def stage? + ENV['RAILS_ENV'] == "stage" + end +end diff --git a/vendor/middleman/config.ru b/vendor/middleman/config.ru new file mode 100644 index 000000000..ece6fda7e --- /dev/null +++ b/vendor/middleman/config.ru @@ -0,0 +1,11 @@ +require 'middleman-core/load_paths' +::Middleman.setup_load_paths + +require 'middleman-core' +require 'middleman-core/rack' + +require 'fileutils' + +app = ::Middleman::Application.new + +run ::Middleman::Rack.new(app).to_app diff --git a/public/favicon.ico b/vendor/middleman/source/favicon.ico old mode 100644 new mode 100755 similarity index 100% rename from public/favicon.ico rename to vendor/middleman/source/favicon.ico diff --git a/vendor/middleman/source/includes/_footer.html.hbs b/vendor/middleman/source/includes/_footer.html.hbs new file mode 100644 index 000000000..a10f67d10 --- /dev/null +++ b/vendor/middleman/source/includes/_footer.html.hbs @@ -0,0 +1,61 @@ + diff --git a/vendor/middleman/source/includes/_google_analytics.html.hbs b/vendor/middleman/source/includes/_google_analytics.html.hbs new file mode 100644 index 000000000..8b18f56af --- /dev/null +++ b/vendor/middleman/source/includes/_google_analytics.html.hbs @@ -0,0 +1,9 @@ + diff --git a/vendor/middleman/source/includes/_header.html.hbs b/vendor/middleman/source/includes/_header.html.hbs new file mode 100644 index 000000000..797adbfda --- /dev/null +++ b/vendor/middleman/source/includes/_header.html.hbs @@ -0,0 +1,20 @@ + diff --git a/vendor/middleman/source/includes/_javascripts.html.hbs b/vendor/middleman/source/includes/_javascripts.html.hbs new file mode 100644 index 000000000..afa75fdff --- /dev/null +++ b/vendor/middleman/source/includes/_javascripts.html.hbs @@ -0,0 +1,4 @@ + + + + diff --git a/vendor/middleman/source/index.html.md b/vendor/middleman/source/index.html.md new file mode 100644 index 000000000..bc3ad8183 --- /dev/null +++ b/vendor/middleman/source/index.html.md @@ -0,0 +1,11 @@ +--- +layout: index +title: DataCite REST API +description: The API to interact with all DataCite resources. +--- + +The DataCite REST API allows users to interact with DataCite resources such as dois, clients, providers and prefixes. Please use +[DOI Fabrica](https://doi.datacite.org) if you are looking for a web interface. The API follows the [JSONAPI](http://jsonapi.org/) +specification. The API requires authentication for some actions. + +You will find more information about the REST API in our [documentation portal](https://support.datacite.org/docs/api). diff --git a/vendor/middleman/source/layouts/index.erb b/vendor/middleman/source/layouts/index.erb new file mode 100644 index 000000000..e74de28c0 --- /dev/null +++ b/vendor/middleman/source/layouts/index.erb @@ -0,0 +1,23 @@ +<% wrap_layout :layout do %> +
+ +
+
+
+

<%= current_page.data.title %>

+

<%= current_page.data.description %>

+
+
+
+ +
+
+
+
+ <%= yield -%> +
+
+
+
+
+<% end %> diff --git a/vendor/middleman/source/layouts/layout.erb b/vendor/middleman/source/layouts/layout.erb new file mode 100644 index 000000000..877498a34 --- /dev/null +++ b/vendor/middleman/source/layouts/layout.erb @@ -0,0 +1,70 @@ + + + + + + + + + + <%= ENV['SITE_TITLE'] %> + + + + + + + + + + + + + + + + + <% if ENV['TWITTER_HANDLE'] %> + + + + + + <% end %> + + + + + + + + + + + + + <% if ENV['BUGSNAG_JS_KEY'] %> + + <% end -%> + + + <% header_links = development? ? data.links.development_links : (stage? ? data.links.stage_links : data.links.production_links) %> + <%= partial "includes/header.html.hbs", locals: + { site_title: ENV['SITE_TITLE'], + stage: stage?, + development: development?, + header_links: header_links } -%> + <%= yield -%> + <%= partial "includes/footer.html.hbs", locals: + { about_links: data.links.about_links, + services_links: data.links.services_links, + resources_links: data.links.resources_links, + community_links: data.links.community_links, + contact_links: data.links.contact_links } -%> + <%= partial "includes/javascripts.html.hbs", locals: { cdn_url: ENV['CDN_URL'] } -%> + <%= partial "includes/google_analytics.html.hbs", locals: { site_ga: ENV['SITE_GA'] } -%> + + diff --git a/vendor/middleman/source/robots.txt b/vendor/middleman/source/robots.txt new file mode 100644 index 000000000..64253dadd --- /dev/null +++ b/vendor/middleman/source/robots.txt @@ -0,0 +1,3 @@ +# See http://www.robotstxt.org/wc/norobots.html for documentation on how to use the robots.txt file +User-Agent: * +Disallow: /tmp/