From aa1ccb092a9485e17650aca3d5cfb566a679ce34 Mon Sep 17 00:00:00 2001 From: Max Kadel Date: Wed, 12 Jan 2022 08:27:44 -0500 Subject: [PATCH] HYC-1280: Create intermediate ingest object (#738) * Create object to store xml and parse jats xml Create intermediate object for parsing xml and translating to Hyrax objects - Move check for extra files in package - Do not map UNC affiliation until we can do so more reliably, put in "other affiliation" until then * Add and configure javascript driver for capybara, upgrade * Use ffaker for tests, do setup step once for feature, for faster run --- .rubocop.yml | 3 +- Gemfile | 5 +- Gemfile.lock | 28 +- README.md | 7 + app/models/jats_ingest_work.rb | 224 +++ .../workflow/pending_deletion_notification.rb | 2 +- app/services/tasks/sage_ingest_service.rb | 61 +- config/authorities/licenses.yml | 3 + db/schema.rb | 1 + spec/factories/user.rb | 6 +- .../features/edit_sage_ingested_works_spec.rb | 106 + .../sage/10.1177_2192568219888179.xml | 1715 +++++++++++++++++ .../10.1177_1073274820985792.xml | 2 +- spec/fixtures/sage/sage_config.yml | 2 +- spec/fixtures/sage/triple_package.zip | Bin 0 -> 584 bytes .../local/file_based_authority_spec.rb | 3 + spec/models/jats_ingest_work_spec.rb | 110 ++ spec/rails_helper.rb | 6 +- .../pending_deletion_notification_spec.rb | 29 +- .../tasks/sage_ingest_service_spec.rb | 99 +- spec/support/capybara.rb | 23 + 21 files changed, 2382 insertions(+), 53 deletions(-) create mode 100644 app/models/jats_ingest_work.rb create mode 100644 spec/features/edit_sage_ingested_works_spec.rb create mode 100644 spec/fixtures/sage/10.1177_2192568219888179.xml create mode 100644 spec/fixtures/sage/triple_package.zip create mode 100644 spec/models/jats_ingest_work_spec.rb create mode 100644 spec/support/capybara.rb diff --git a/.rubocop.yml b/.rubocop.yml index fd03c1b6d..d22f9b694 100644 --- a/.rubocop.yml +++ b/.rubocop.yml @@ -3,10 +3,9 @@ inherit_from: .rubocop_todo.yml AllCops: TargetRubyVersion: 2.6.7 NewCops: disable - -Metrics/BlockLength: Exclude: - 'db/schema.rb' + - 'vendor/**/*' # TODO: Enable this cop - temporarily disabled here because it is not being added to the auto-generated to-do list Lint/RedundantCopDisableDirective: diff --git a/Gemfile b/Gemfile index 3b0c0c3a8..bf2a7b8f7 100644 --- a/Gemfile +++ b/Gemfile @@ -81,10 +81,13 @@ group :development do end group :test do - gem 'capybara', '~> 2.17.0' + gem 'capybara', '~> 3.36' gem 'factory_bot_rails', '~> 6.1.0' + gem 'ffaker' gem 'rspec-mocks' + gem "selenium-webdriver" gem 'shoulda-matchers', '~> 5.0.0' gem 'simplecov', '~> 0.17.0' + gem "webdrivers" gem 'webmock', '~> 3.14.0' end diff --git a/Gemfile.lock b/Gemfile.lock index 99b2e4a2f..0610cb5c0 100644 --- a/Gemfile.lock +++ b/Gemfile.lock @@ -179,18 +179,21 @@ GEM simple_form byebug (9.1.0) cancancan (1.17.0) - capybara (2.17.0) + capybara (3.36.0) addressable + matrix mini_mime (>= 0.1.3) - nokogiri (>= 1.3.3) - rack (>= 1.0.0) - rack-test (>= 0.5.4) - xpath (>= 2.0, < 4.0) + nokogiri (~> 1.8) + rack (>= 1.6.0) + rack-test (>= 0.6.3) + regexp_parser (>= 1.5, < 3.0) + xpath (~> 3.2) carrierwave (1.3.2) activemodel (>= 4.0.0) activesupport (>= 4.0.0) mime-types (>= 1.16) ssrf_filter (~> 1.0) + childprocess (4.1.0) chronic_duration (0.10.6) numerizer (~> 0.1.1) clamav-client (3.2.0) @@ -313,6 +316,7 @@ GEM faraday (>= 0.7.4, < 1.0) fcrepo_wrapper (0.8.0) ruby-progressbar + ffaker (2.20.0) ffi (1.15.4) flipflop (2.6.0) activesupport (>= 4.0) @@ -588,6 +592,7 @@ GEM carrierwave (>= 0.5.8) rails (>= 5.0.0) marcel (1.0.1) + matrix (0.4.2) memoist (0.16.2) method_source (1.0.0) mime-types (3.3.1) @@ -846,6 +851,10 @@ GEM ffi (~> 1.9) scanf (1.0.0) select2-rails (3.5.11) + selenium-webdriver (4.1.0) + childprocess (>= 0.5, < 5.0) + rexml (~> 3.2, >= 3.2.5) + rubyzip (>= 1.2.2) shex (0.6.2) ebnf (~> 2.1) json-ld (~> 3.1) @@ -946,6 +955,10 @@ GEM activemodel (>= 5.0) bindex (>= 0.4.0) railties (>= 5.0) + webdrivers (5.0.0) + nokogiri (~> 1.6) + rubyzip (>= 1.3.0) + selenium-webdriver (~> 4.0) webmock (3.14.0) addressable (>= 2.8.0) crack (>= 0.3.2) @@ -969,7 +982,7 @@ DEPENDENCIES bootstrap-sass (~> 3.4.1) bulkrax (~> 1.0.0) byebug (~> 9.1.0) - capybara (~> 2.17.0) + capybara (~> 3.36) clamav-client coffee-rails (~> 4.2.2) devise (~> 4.8.0) @@ -978,6 +991,7 @@ DEPENDENCIES execjs (= 2.8.1) factory_bot_rails (~> 6.1.0) fcrepo_wrapper (~> 0.8.0) + ffaker httparty (~> 0.20.0) hydra-editor (= 5.0.1) hydra-role-management (~> 1.0) @@ -1008,6 +1022,7 @@ DEPENDENCIES rubocop-rails rubocop-rspec sass-rails (~> 5.0.6) + selenium-webdriver shoulda-matchers (~> 5.0.0) sidekiq (~> 5.2.9) sidekiq-limit_fetch (~> 3.4.0) @@ -1018,6 +1033,7 @@ DEPENDENCIES turbolinks (~> 5.0.1) uglifier (~> 4.2.0) web-console (~> 3.7.0) + webdrivers webmock (~> 3.14.0) willow_sword! diff --git a/README.md b/README.md index 16bb256a4..efb856c5a 100755 --- a/README.md +++ b/README.md @@ -55,6 +55,13 @@ bundle exec rake sage:ingest[/hyrax/spec/fixtures/sage/sage_config.yml] work.to_solr.deep_symbolize_keys! ``` * Copy the output of this to the sample_solr_documents file. Add a unique `:timestamp` value to the hash (e.g. `:timestamp => "2021-11-23T16:05:33.033Z"`) so that the `spec/requests/oai_pmh_endpoint_spec.rb` tests to continue to pass. + +#### Debugging Capybara feature and javascript tests +* Save a screenshot + * Put `page.save_screenshot('screenshot.png')` on the line before the failing test (you can use a different name for the file if that's helpful) + * The screenshot will be saved to `tmp/capybara`. + * See https://github.com/teamcapybara/capybara#debugging for more info + ##### Code Linter - Rubocop * Helpful Rubocop documentation - https://docs.rubocop.org/rubocop/usage/basic_usage.html diff --git a/app/models/jats_ingest_work.rb b/app/models/jats_ingest_work.rb new file mode 100644 index 000000000..e2d8c3b17 --- /dev/null +++ b/app/models/jats_ingest_work.rb @@ -0,0 +1,224 @@ +# For information on the JATS metadata standard, see https://jats.nlm.nih.gov/ +# Currently used for Sage ingest +class JatsIngestWork + include ActiveModel + attr_reader :xml_path + + def initialize(xml_path:) + @xml_path = xml_path + end + + def jats_xml + @jats_xml ||= File.read(xml_path) + end + + def document + @document ||= Nokogiri::XML(jats_xml) + end + + def article_metadata + @article_metadata ||= document.xpath('.//article-meta') + end + + def creators_metadata + @creators_metadata ||= document.xpath('.//contrib-group') + end + + def journal_metadata + @journal_metadata ||= document.xpath('.//journal-meta') + end + + def permissions + @permissions ||= article_metadata.xpath('.//permissions') + end + + def abstract + article_metadata.xpath('.//abstract').map(&:inner_text) + end + + def copyright_date + permissions.at('copyright-year').inner_text + end + + def creators + @creators ||= begin + creators_metadata.xpath('.//contrib').map.with_index do |contributor, index| + [index, contributor_to_hash(contributor, index)] + end.to_h + end + end + + # TODO: Map affiliation to UNC controlled vocabulary + def contributor_to_hash(contributor, index) + affiliation_ids = affiliation_ids(contributor) + first_affiliation = affiliation_map[affiliation_ids.first] + { + 'name' => "#{surname(contributor)}, #{given_names(contributor)}", + 'orcid' => orcid(contributor), + 'affiliation' => '', + # 'affiliation' => some_method, # Do not store affiliation until we can map it to the controlled vocabulary + 'other_affiliation' => first_affiliation, + 'index' => (index+1).to_s + } + end + + def affiliation_map + @affiliation_map ||= begin + document.xpath('//aff').map do |affil| + [affil.attributes["id"].value, affiliation_to_s(affil)] + end.to_h + end + end + + def affiliation_ids(elem) + references = elem.xpath('xref') + references.map do |ref| + reference_type = ref['ref-type'] + next unless reference_type=="aff" + + ref["rid"] + end.compact + end + + def affiliation_to_s(affil_elem) + affil_elem.children.map do |child| + # Don't include newlines or the order label + next if child.inner_text == "\n" || child.name == "label" + + # Only include the institution name proper from the institution-wrap, don't include the institution-id + if child.xpath(".//institution").present? + child.xpath(".//institution").inner_text + else + child.inner_text + end + end.join + end + + def date_of_publication + if publication_day && publication_month && publication_year + "#{publication_year}-#{publication_month}-#{publication_day}" + elsif publication_month && publication_year + "#{publication_year}-#{publication_month}" + else + publication_year + end + end + + def funder + article_metadata.xpath('.//funding-source/institution-wrap/institution').map(&:inner_text) + end + + # The Sage-assigned DOI + def identifier + article_metadata.xpath('.//article-id[@pub-id-type="doi"]').map(&:inner_text) + end + + def issn + journal_metadata.xpath(".//issn").map(&:inner_text) + end + + def journal_issue + article_metadata.at('issue')&.inner_text + end + + def journal_title + journal_metadata.xpath(".//journal-title-group/journal-title").inner_text + end + + def journal_volume + article_metadata.at('volume')&.inner_text + end + + def keyword + article_metadata.at('kwd-group').xpath("//kwd").map do |elem| + if elem.at('italic') + elem.at('italic').inner_text + else + elem.inner_text + end + end + end + + def license + permissions.xpath(".//license/@xlink:href").map do |elem| + CdrLicenseService.authority.find(elem&.inner_text)[:id] + end + end + + def license_label + license.map do |lic| + CdrLicenseService.label(lic) + end + end + + def page_end + article_metadata.at('lpage')&.inner_text + end + + def page_start + article_metadata.at('fpage')&.inner_text + end + + def publisher + journal_metadata.xpath('.//publisher/publisher-name').map(&:inner_text) + end + + def rights_holder + permissions.xpath('.//copyright-holder').map(&:inner_text) + end + + def title + article_metadata.xpath('.//title-group/article-title').map(&:inner_text) + end + + private + + def publication_year + year = publication_date_node_set.at('year')&.inner_text&.to_i + format('%04d', year) if year + end + + def publication_month + month = publication_date_node_set.at('month')&.inner_text&.to_i + format('%02d', month) if month + end + + def publication_day + day = publication_date_node_set.at('day')&.inner_text&.to_i + format('%02d', day) if day + end + + def publication_date_node_set + if physical_publication_date.present? + physical_publication_date + elsif electronic_and_physical_publication_date.present? + electronic_and_physical_publication_date + elsif electronic_publication_date.present? + electronic_publication_date + end + end + + def electronic_publication_date + article_metadata.xpath('.//pub-date[@pub-type="epub"]') + end + + def electronic_and_physical_publication_date + article_metadata.xpath('.//pub-date[@pub-type="epub-ppub"]') + end + + def physical_publication_date + article_metadata.xpath('.//pub-date[@pub-type="ppub"]') + end + + def surname(contributor) + contributor.xpath('name/surname').inner_text + end + + def given_names(contributor) + contributor.xpath('name/given-names').inner_text + end + + def orcid(contributor) + contributor.xpath('contrib-id').inner_text + end +end diff --git a/app/services/hyrax/workflow/pending_deletion_notification.rb b/app/services/hyrax/workflow/pending_deletion_notification.rb index 595db165a..3a6cc2bd6 100644 --- a/app/services/hyrax/workflow/pending_deletion_notification.rb +++ b/app/services/hyrax/workflow/pending_deletion_notification.rb @@ -20,7 +20,7 @@ def users_to_notify repo_admins.each do |u| users << u end - users.uniq + users.compact.uniq end end end diff --git a/app/services/tasks/sage_ingest_service.rb b/app/services/tasks/sage_ingest_service.rb index e29431476..ba159159f 100644 --- a/app/services/tasks/sage_ingest_service.rb +++ b/app/services/tasks/sage_ingest_service.rb @@ -1,11 +1,13 @@ module Tasks require 'tasks/migrate/services/progress_tracker' class SageIngestService - attr_reader :package_dir, :ingest_progress_log + attr_reader :package_dir, :ingest_progress_log, :admin_set def initialize(args) config = YAML.load_file(args[:configuration_file]) + @admin_set = ::AdminSet.where(title: config['admin_set']).first + @package_dir = config['package_dir'] @ingest_progress_log = Migrate::Services::ProgressTracker.new(config['ingest_progress_log']) end @@ -19,20 +21,57 @@ def process_packages orig_file_name = File.basename(package_path, '.zip') Dir.mktmpdir do |dir| file_names = extract_files(package_path, dir).keys - unless file_names.count == 2 - Rails.logger.tagged('Sage ingest') { Rails.logger.error("Unexpected package contents - more than two files extracted from #{package_path}") } - next - end - _pdf_file_name = file_names.first - _xml_file_name = file_names.last + next unless file_names.count == 2 + + _pdf_file_name = file_names.find { |name| name.match(/^(\S*).pdf/) } + xml_file_name = file_names.find { |name| name.match(/^(\S*).xml/) } # parse xml - # create object with xml and pdf + ingest_work = JatsIngestWork.new(xml_path: File.join(dir, xml_file_name)) + # Create Article with metadata and save + build_article(ingest_work) + # Add PDF file to Article (including FileSets) # save object + # set off background jobs for object? mark_done(orig_file_name) if package_ingest_complete?(dir, file_names) end end end + def build_article(ingest_work) + art = Article.new + art.admin_set = @admin_set + # required fields + art.title = ingest_work.title + art.creators_attributes = ingest_work.creators + art.abstract = ingest_work.abstract + art.date_issued = ingest_work.date_of_publication + # additional fields + art.copyright_date = ingest_work.copyright_date + art.dcmi_type = ['http://purl.org/dc/dcmitype/Text'] + art.funder = ingest_work.funder + art.identifier = ingest_work.identifier + art.issn = ingest_work.issn + art.journal_issue = ingest_work.journal_issue + art.journal_title = ingest_work.journal_title + art.journal_volume = ingest_work.journal_volume + art.keyword = ingest_work.keyword + art.license = ingest_work.license + art.license_label = ingest_work.license_label + art.page_end = ingest_work.page_end + art.page_start = ingest_work.page_start + art.publisher = ingest_work.publisher + art.resource_type = ['Article'] + art.rights_holder = ingest_work.rights_holder + art.rights_statement = 'http://rightsstatements.org/vocab/InC/1.0/' + # fields not normally edited via UI + art.date_uploaded = DateTime.current + art.date_modified = DateTime.current + + art.save! + # return the Article object + art + end + def mark_done(orig_file_name) Rails.logger.tagged('Sage ingest') { Rails.logger.info("Marked package ingest complete #{orig_file_name}") } @ingest_progress_log.add_entry(orig_file_name) @@ -48,12 +87,16 @@ def package_ingest_complete?(dir, file_names) def extract_files(package_path, temp_dir) begin - Zip::File.open(package_path) do |zip_file| + extracted_files = Zip::File.open(package_path) do |zip_file| zip_file.each do |file| file_path = File.join(temp_dir, file.name) zip_file.extract(file, file_path) end end + unless extracted_files.count == 2 + Rails.logger.tagged('Sage ingest') { Rails.logger.error("Unexpected package contents - more than two files extracted from #{package_path}") } + end + extracted_files rescue Zip::DestinationFileExistsError => e Rails.logger.tagged('Sage ingest') { Rails.logger.info("#{package_path}, zip file error: #{e.message}") } end diff --git a/config/authorities/licenses.yml b/config/authorities/licenses.yml index b0d6d4bbd..68ef414dc 100755 --- a/config/authorities/licenses.yml +++ b/config/authorities/licenses.yml @@ -17,6 +17,9 @@ terms: - id: http://creativecommons.org/licenses/by-nc-nd/3.0/us/ term: Attribution-NonCommercial-NoDerivs 3.0 United States active: all + - id: http://creativecommons.org/licenses/by-nc-nd/4.0/ + term: Attribution-NonCommercial-NoDerivatives 4.0 International + active: all - id: http://creativecommons.org/licenses/by-nc-sa/3.0/us/ term: Attribution-NonCommercial-ShareAlike 3.0 United States active: all diff --git a/db/schema.rb b/db/schema.rb index 3c79d584a..b0d6a233a 100644 --- a/db/schema.rb +++ b/db/schema.rb @@ -11,6 +11,7 @@ # It's strongly recommended that you check this file into your version control system. ActiveRecord::Schema.define(version: 2021_08_06_065737) do + # These are extensions that must be enabled in order to support this database enable_extension "plpgsql" diff --git a/spec/factories/user.rb b/spec/factories/user.rb index c53cc18d3..f63fbd636 100644 --- a/spec/factories/user.rb +++ b/spec/factories/user.rb @@ -1,8 +1,8 @@ FactoryBot.define do factory :user do - uid { 'test' } - display_name { 'test' } - email { 'test@test.edu' } + uid { FFaker::Internet.user_name } + display_name { FFaker::Name.name } + email { FFaker::Internet.email } transient do # Allow for custom groups when a user is instantiated. diff --git a/spec/features/edit_sage_ingested_works_spec.rb b/spec/features/edit_sage_ingested_works_spec.rb new file mode 100644 index 000000000..518f713da --- /dev/null +++ b/spec/features/edit_sage_ingested_works_spec.rb @@ -0,0 +1,106 @@ +require 'rails_helper' +require Rails.root.join('spec/support/capybara.rb') + +include Warden::Test::Helpers + +RSpec.feature 'Edit works created through the Sage ingest', js: false do + let(:ingest_progress_log_path) { File.join(fixture_path, "sage", "ingest_progress.log") } + + # empty the progress log + around do |example| + File.open(ingest_progress_log_path, 'w') {|file| file.truncate(0) } + example.run + File.open(ingest_progress_log_path, 'w') {|file| file.truncate(0) } + end + + before(:all) do + @admin_user = FactoryBot.create(:admin) + @admin_set = AdminSet.create(title: ['sage admin set'], + description: ['some description'], + edit_users: [@admin_user.user_key]) + @path_to_config = File.join(fixture_path, "sage", "sage_config.yml") + + @ingest_service = Tasks::SageIngestService.new(configuration_file: @path_to_config) + @ingest_service.process_packages + + @article_count = Article.count + @articles = Article.all + # We're not clearing out the database, Fedora, and Solr before this test, so to find the first work created in this + # test, we need to count backwards from the last work created. + @first_work = @articles[-4] + @first_work_id = @first_work.id + @third_work_id = @articles[-2].id + end + + it "can open the edit page" do + login_as @admin_user + visit "concern/articles/#{@first_work_id}" + expect(page).to have_content("Inequalities in Cervical Cancer Screening Uptake Between") + expect(page).to have_content('Smith, Jennifer S.') + expect(page).to have_content('sage admin set') + expect(page).to have_content('Attribution-NonCommercial 4.0 International') + click_link('Edit') + expect(page).to have_link("Work Deposit Form") + end + + it "has attached the file_set to the work" do + pending("Adding file sets to the Article object") + expect(@first_work.file_sets.first).to be_instance_of(FileSet) + end + + it "can render the pre-populated edit page" do + login_as @admin_user + visit "concern/articles/#{@first_work_id}/edit" + # These values are also tested in the spec/services/tasks/sage_ingest_service_spec.rb + # form order + expect(page).to have_field('Title', with: 'Inequalities in Cervical Cancer Screening Uptake Between Chinese Migrant Women and Local Women: A Cross-Sectional Study') + expect(page).to have_field('Creator #1', with: 'Holt, Hunter K.') + expect(page).to have_field('Additional affiliation (Creator #1)', with: 'Department of Family and Community Medicine, University of California, San Francisco, CA, USA') + expect(page).to have_field('ORCID (Creator #1)', with: 'https://orcid.org/0000-0001-6833-8372') + expect(page).to have_field('Abstract', with: /Efforts to increase education opportunities, provide insurance/) + click_link('Optional fields') + # alpha order below + expect(page).to have_field('Copyright date', with: '2021') + expect(page).to have_field('Date of publication', with: 'February 1, 2021') # aka date_issued + expect(page).to have_select('Dcmi type', with_selected: 'Text') + expect(page).to have_field('Funder', with: 'Fogarty International Center') + expect(page).to have_field('Identifier', with: '10.1177/1073274820985792') + expect(page).to have_field('ISSN', with: '1073-2748') + expect(page).to have_field('Journal issue', with: '') + expect(page).to have_field('Journal title', with: 'Cancer Control') + expect(page).to have_field('Journal volume', with: '28') + # keywords + expected_keywords = ['HPV', 'HPV knowledge and awareness', 'cervical cancer screening', 'migrant women', 'China', ''] + keyword_fields = page.all(:xpath, '/html/body/div[2]/div[2]/form/div/div[1]/div/div/div[1]/div[2]/div[2]/div[1]/ul/li/input') + keywords = keyword_fields.map(&:value) + expect(keyword_fields.count).to eq 6 + expect(keywords).to match_array(expected_keywords) + expect(page).to have_select('License', with_selected: 'Attribution-NonCommercial 4.0 International') + expect(page).to have_field('Publisher', with: 'SAGE Publications') + expect(page).to have_select('Resource type', with_selected: 'Article') + expect(page).to have_field('Rights holder', with: /SAGE Publications Inc, unless otherwise noted. Manuscript/) + expect(page).to have_select('Rights statement', with_selected: 'In Copyright') + end + + # creators after the first one need JS to render + it "can render the javascript-drawn fields", js: true do + login_as @admin_user + visit "concern/articles/#{@first_work_id}/edit" + expect(page).to have_field('Creator #2', with: 'Zhang, Xi') + end + + it "can render values only present on the second work" do + login_as @admin_user + visit "concern/articles/#{@third_work_id}/edit" + expect(page).to have_field('Title', with: /The Prevalence of Bacterial Infection in Patients Undergoing/) + expect(page).to have_field('Journal issue', with: '1') + expect(page).to have_field('Journal volume', with: '11') + keyword_fields = page.all(:xpath, '/html/body/div[2]/div[2]/form/div/div[1]/div/div/div[1]/div[2]/div[2]/div[1]/ul/li/input') + keywords = keyword_fields.map(&:value) + expect(keyword_fields.count).to eq 8 + expect(keywords).to include('Propionibacterium acnes') + expect(page).to have_select('License', with_selected: 'Attribution-NonCommercial-NoDerivatives 4.0 International') + expect(page).to have_field('Page end', with: '20') + expect(page).to have_field('Page start', with: '13') + end +end diff --git a/spec/fixtures/sage/10.1177_2192568219888179.xml b/spec/fixtures/sage/10.1177_2192568219888179.xml new file mode 100644 index 000000000..49dd63c4b --- /dev/null +++ b/spec/fixtures/sage/10.1177_2192568219888179.xml @@ -0,0 +1,1715 @@ +
+ + +GSJ +spgsj + +Global Spine Journal + +2192-5682 +2192-5690 + +SAGE Publications +Sage CA: Los Angeles, CA + + + +10.1177/2192568219888179 +10.1177_2192568219888179 + + +Original Articles + + + +The Prevalence of Bacterial Infection in Patients Undergoing Elective ACDF for Degenerative Cervical Spine Conditions: A Prospective Cohort Study With Contaminant Control + + + + +Bivona +Louis J. + +MD +1 + + + +Camacho +Jael E. + +MD +1 + + + +Usmani +Farooq + +MD, MSc +2 + + + +Nash +Alysa + +MD +3 + + + +Bruckner +Jacob J. + +MD +1 + + + +Hughes +Meghan + +MD +1 + + + +Bhandutia +Amit K. + +MD +1 + + + +Koh +Eugene Y. + +MD, PhD +1 + + + +Banagan +Kelley E. + +MD +1 + + +https://orcid.org/0000-0002-7263-6177 + +Gelb +Daniel E. + +MD +1 + + +https://orcid.org/0000-0002-3962-5724 + +Ludwig +Steven C. + +MD +1 + + + + +Department of Orthopaedics, 12264University of Maryland School of Medicine, Baltimore, MD, USA + +Department of General Surgery, 6040Eastern Virginia Medical School, Norfolk, VA, USA + +Department of Orthopaedics, 2331University of North Carolina at Chapel Hill, NC, USA + +Steven C. Ludwig, Department of Orthopaedics, University of Maryland, 110 South Paca Street, 6th Floor, Suite 300, Baltimore, MD 21201, USA. Email: sludwig@som.umaryland.edu + + + +1 +2021 + +11 +1 +13 +20 + +© The Author(s) 2019 +2019 +AO Spine, unless otherwise noted. Manuscript content on this site is licensed under Creative Commons Licenses + +This article is distributed under the terms of the Creative Commons Attribution-NonCommercial-NoDerivs 4.0 License (https://creativecommons.org/licenses/by-nc-nd/4.0/) which permits non-commercial use, reproduction and distribution of the work as published without adaptation or alteration, without further permission provided the original work is attributed as specified on the SAGE and Open Access pages (https://us.sagepub.com/en-us/nam/open-access-at-sage). + + + + +Study Design: +

Prospective cohort study.

+
+ +Objectives: +

To determine the prevalence of bacterial infection, with the use of a contaminant control, in patients undergoing anterior cervical discectomy and fusion (ACDF).

+
+ +Methods: +

After institutional review board approval, patients undergoing elective ACDF were prospectively enrolled. Samples of the longus colli muscle and disc tissue were obtained. The tissue was then homogenized, gram stained, and cultured in both aerobic and anaerobic medium. Patients were classified into 4 groups depending on culture results. Demographic, preoperative, and postoperative factors were evaluated.

+
+ +Results: +

Ninety-six patients were enrolled, 41.7% were males with an average age of 54 ± 11 years and a body mass index of 29.7 ± 5.9 kg/m2. Seventeen patients (17.7%) were considered true positives, having a negative control and positive disc culture. Otherwise, no significant differences in culture positivity was found between groups of patients. However, our results show that patients were more likely to have both control and disc negative than being a true positive (odds ratio = 6.2, 95% confidence interval = 2.5-14.6). Propionibacterium acnes was the most commonly identified bacteria. Two patients with disc positive cultures returned to the operating room secondary to pseudarthrosis; however, age, body mass index, prior spine surgery or injection, postoperative infection, and reoperations were not associated with culture results.

+
+ +Conclusion: +

In our cohort, the prevalence of subclinical bacterial infection in patients undergoing ACDF was 17.7%. While our rates exclude patients with positive contaminant control, the possibility of contamination of disc cultures could not be entirely rejected. Overall, culture results did not have any influence on postoperative outcomes.

+
+
+ +degenerative cervical conditions + +Propionibacterium acnes + +contaminant control +intervertebral disc infection +disc cultures +anterior cervical discectomy and fusion +revision surgery + + + +typesetter +ts3 + + +
+
+ + +Introduction +

Degenerative cervical spine conditions are a major cause of morbidity and disability, as they often lead to neck pain, radicular pain, and mechanical strain on adjacent structures. Common risk factors include age, hereditary and lifestyle factors, smoking, and history of mechanical trauma. +1,2 + Recently, there have been multiple studies implicating low-virulence bacterial infection as a possible cause of degenerative spine conditions, particularly disc disease. Stirling et al +3 + were the first to describe a possible association between patients with sciatica and disc cultures that were positive for Propionibacterium acnes. Despite an increasing number of reports supporting this theory, there remains considerable debate as to the validity of these findings. +4 +-6 + +

+

One concern regarding true subclinical infection in the disc space is the possible risk of contamination during sample collection intraoperatively. Many of the previous studies on P acnes infection lacked the use of a control tissue sample to exclude the possibility of contamination, which may ultimately overestimate the prevalence of subclinical infection. +7 +-9 + Additionally, the majority of studies regarding nonpyogenic subclinical infection are focused in the lumbar spine. +3,5,7,8,10 + Here, this study aims to determine the point prevalence of subclinical bacterial infection in cervical spine disc spaces using a contaminant control in patients undergoing anterior cervical discectomy and fusion (ACDF) for cervical spondylosis.

+
+ +Materials and Methods + +Study Design +

A prospective cohort study conducted at a single tertiary and academic institution.

+
+ +Patients and Participation Criteria +

After institutional review board approval, patients were prospectively enrolled between January 2017 and May 2018. All nonpregnant adults, aged 18 to 89 scheduled to undergo elective ACDF for any diagnosis other than infection, trauma, or malignancy were consented and enrolled. Exclusion criteria included patients with an active skin infection at the surgical site, active systemic infection, those on a long-term antibiotic regimen, and patients with a history of spondylodiscitis or vertebral osteomyelitis.

+
+ +Operative Procedure +

Patients were brought to the operating room and placed in the supine position. All patients received preoperative antibiotics, prior to the start of surgery: 88 patients (92%) received cephazolin 2 g intravenously (IV), 4 patients (4%) were given vancomycin 1 g IV, 3 patients (3%) received vancomycin 1 g plus gentamicin 80 mg IV, and 1 patient (1%) received clindamycin 900 mg IV. The skin overlying the surgical area was prepped in the usual sterile fashion (chlorhexidine gluconate 2% w/v and isopropyl alcohol 70% v/v) followed by a final scrub with Chloraprep. A transverse or a longitudinal incision was made depending on number of segments to be fused and to surgeon’s discretion. During anterior exposure and prior to discectomy, a sample of the longus colli muscle (control) was obtained with an unused, sterile instrument. On exposure of the appropriate level, samples of intervertebral disc tissue were obtained with an unused, sterile instrument. All specimens were immediately sent to the laboratory.

+
+ +Microbiology +

The samples were sent to the Department of Microbiology for aerobic and anaerobic cultures. A gram stain was performed on each tissue sample received. For aerobic cultures, the tissue was homogenized and plated on 5% Sheep Blood, Chocolate, MacConkey, and PEA agars and held for a maximum of 5 days. Anaerobic cultures were homogenized and plated on prereduced Brucella Blood, Brucella Laked Blood with Kanamycin and Vancomycin, Bacteroides Bile Esculin Agar, and Thioglycollate broth. The agar plates were held for a total of 7 days and the Thioglycollate Broth was held for 20 days at anaerobic atmosphere (anaerobic jars or bags) at 35°C to 37°C. Plates and broth were examined each day for growth. If growth was identified, subcultures and gram staining were made and later microbial identification was done using matrix-assisted laser desorption ionization-time of flight mass spectrometry (MALDI-TOF MS). +11 + +

+
+ +Outcomes Measures and Follow-up +

Patients were classified into 4 groups: control negative (CN)/disc negative (DN), control positive (CP)/DN, CP/disc positive (DP), and CN/DP. The latter being identified as our “true positive” as they had a negative control tissue culture. The prevalence of bacteria identified was calculated for each group. Patient age, sex, body mass index (BMI), preoperative diagnosis, and clinical symptoms were obtained and compared between groups. Prior history of cervical spine surgery, spinal injection, and diabetes was also retrieved from chart and compared statistically between groups. Spinal levels fused and postoperative outcomes were also compared. Postoperative outcomes included postoperative infections, reoperations, and radiographic outcomes (graft subsidence and screw loosening). Graft subsidence was evaluated by measuring distance between the superior endplate of the most cranial vertebrae and the most caudal vertebrae. A difference more than 2 mm was classified as graft subsidence. +12 + Screw loosening was classified as greater than 2 mm of radiolucency around any screw. +13 +-15 + Postoperative follow-up rate at 6 weeks, 6 months, and more than 1 year were also evaluated between groups. None of the patients with a positive result were treated with antibiotics postoperatively. This was due to lack of clinical and laboratory signs and symptoms of systemic infection on patient follow-up.

+
+ +Statistical Analysis +

All data was collected and audited in Microsoft Excel (Microsoft Office Professional Plus 2016, Microsoft Corporation, Redmond, WA). JMP Pro (Version 13.0.0, SAS Institute Inc, Cary, NC, 1987-2007) was used for descriptive statistics. All tests were 2-tailed, and the significance level was .05 unless otherwise stated. Continuous variables were tested for normality with the Shapiro-Wilk test. ANOVA was used for continuous variables that were normally distributed (age and BMI). Chi-square test and Fisher’s exact test were used for all nominal variables. To assess the relationship between control and disc cultures, McNemar’s test was used and odds ratio was reported as well.

+
+
+ +Results +

A total of 110 patients were enrolled for participation in the study. Fourteen patients were excluded because samples were either not obtained intraoperatively or the samples obtained were not adequate for culture. Of the 96 patients remaining in the study, 47 patients (49%) had a positive control tissue culture and 53 patients (55.2%) had a positive disc culture. Table 1 describes the distribution of patients by control and disc culture results. There were 17 patients (17.7%) in the CN/DP group. McNemar’s test did not show a statistically significant correlation between groups (P = 0.26), although cultures were more likely to turn negative for both control and disc (odds ratio [OR] = 6; 95% confidence interval [CI] = 2.5-14.6).

+ + + +

Distribution of Patient Culture Results Between Longus Colli Muscle (Control) and Intervertebral Disc Tissue (Disc).

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Tissue Culture ResultIntervertebral Disc (Disc)Total
PositiveNegative
Longus Colli Muscle (Control) Positive Negative +36 +11 +47
173249
Total534396
+
+
+

In the present study, 41.7% of patients were male with an average age of 54 ± 11 years and a BMI of 29.7 ± 5.9 kg/m2. There were more male patients in the CP/DP group (P < .0001). The majority of patients had no prior history cervical spine surgery (76%), preoperative spinal injections (60.4%), or diabetes (77.5%), and no association was seen between groups. A majority of patients in the CN/DP group had never smoked (P = .0077). There was no difference between preoperative diagnosis and culture results (P = .85). Apart from gender and smoking status, there was no other significant association established between patient demographics or clinical characteristics and culture result groups (Table 2). The average length of stay was 1 day, with the exception of 3 patients. One patient had respiratory failure and dysphagia with the need to be intubated that extended their stay to 11 days. One patient stayed 2 days. The last patient had a second planned thoracolumbar decompression and fusion surgery that extended their stay to 7 days.

+ + + +

Comparison of Patient Demographic and Clinical Characteristics Between Longus Colli Muscle (Control) and Intervertebral Disc (Disc) Culture Results.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Characteristics, n (%)AllCulture Results, n (%) +P +
CN/DNCP/DNCP/DPCN/DP
Number of patients9632113617 +
Age, years (mean ± SD)54 ± 1154 ± 858 ± 1353 ± 1253 ± 10.57
BMI, kg/m2 (mean ± SD)29.7 ± 5.930.7 ± 6.530.1 ± 6.929.8 ± 5.328.1 ± 5.4.57
Sex (male)40 (41.7)7 (21.9)2 (18.2)27 (75)4 (23.5)<.0001*
Previous C-spine surgery23 (24)7 (21.9)4 (36.4)8 (22.2)4 (23.5).78
Preoperative epidural injection38 (39.6)15 (46.9)6 (54.6)14 (38.9)3 (17.7).16
Diabetes12 (12.5)7 (21.9)1 (9.1)3 (8.3)1 (5.9).27
Diagnosis, n (%) + + + + +.85
 Cervical radiculopathy39 (40.6)16 (50)2 (18.2)15 (41.7)6 (35.3) +
 Cervical stenosis17 (17.7)4 (12.5)4 (36.4)6 (16.7)3 (17.7) +
 Cervical myelopathy16 (16.7)4 (12.5)3 (27.3)6 (16.7)3 (17.7) +
 Disc herniation15 (15.6)6 (18.8)1 (9.1)5 (13.9)3 (17.7) +
 Cervical spondylosis9 (9.4)2 (6.3)1 (9.1)4 (11.1)2 (11.8) +
Symptoms, n (%) + + + + + +
 Neck pain90 (93.8)30 (93.8)11 (100)32 (88.9)17 (100).34
 Arm/shoulder pain85 (88.5)26 (81.3)11 (100)32 (88.9)12 (88.5).3
Smoking status, n (%) + + + + +.0077*
 Never smoked52 (54.2)17 (53.1)4 (36.4)18 (50)13 (76.5) +
 Current smoker21 (21.9)12 (37.5)1 (9.1)6 (16.7)2 (11.8) +
 Former smoker23 (24.0)3 (9.4)6 (56.6)12 (33.3)2 (11.8) +
+
+ + +

Abbreviations: CN, control negative; DN, disc negative; CP, control positive; DP, disc positive; SD, standard deviation.

+
+ +

* Indicates statistically significant values with P < .05.

+
+
+
+

The most common microorganisms identified from positive cultures was P acnes, with a positive culture rate of 76.5% in the CN/DP group, followed by coagulase-negative Staphylococcus (CNS) with 29.4%, including samples with more than one organism detected in culture (Table 3). Polymicrobial samples were observed in 23.5% of samples in the CN/DP group with P acnes being present in all polymicrobial samples. A total of 165 discs were cultured, for an overall disc culture positive rate of 49.7% (n = 82). After excluding patients with positive control, 24 out of 83 discs (28.9%) had a positive culture. The median day to positivity in control and disc cultures was 7 days (range = 2-19 days). There were 34 patients who had 1-level ACDF, 54 had 2-level fusion, and 8 who had 3-level fusion. There were more 2-level fusions (82.4%) in the CN/DP group, although this trend did not reach statistical significance (P = .06). Of the 14 two-level fusions, 2 patients had both their cultures turn positive to P acnes, 6 patients had different bacteria, and 8 had only one positive disc (Table 4). There was only one patient with 3-level fusion that had 1 of the 3 discs turn positive to Kocuria rhizophila, but the patient did not have any complications postoperatively.

+ + + +

Distribution of Microorganism Identified in Positive Control and Disc Cultures.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+Control Positive/Disc NegativeControl Positive/Disc PositiveControl Negative/Disc Positive
Number of patients113617
Number of discs (positive/total)0/1658/6724/32
+P acnes, n (%)5 (45.5)34 (94.4)13 (76.5)
P acnes alone521 (58.3)9 (52.9)
P acnes + Staphylococcus sp8 (22.2)2 (11.8)
P acnes + Streptococcus sp4 (11.1)2 (11.8)
P acnes + mixed anaerobes1 (2.8)
Other, n (%) + + +
 Coagulase-negative Staphylococcus +3 (27.3)2 (5.6)3 (17.6)
Pseudomonas luteola +1 (9.1)
 Diphteroids1 (9.1)
Enterococcus faecium +1 (9.1)
Kocuria rhizophila +1 (5.6)
+
+ + +

Abbreviations: P acnes, Propionibacterium acnes; sp, species.

+
+
+
+ + + +

Disc Culture Results for Control Negative and Disc Positive Patients.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+Disc 1Disc 2Disc 3
DiscResultDiscResultDiscResult
1C3-4 +P acnes +C4-5 +P acnes +
2C3-4 +P acnes +C4-5Negative culture
3C3-4CNSC4-5Negative culture
4C4-5 +P acnes +C5-6 +Streptococcus viridans +
5C4-5 +P acnes +C5-6Negative culture
6C4-5 +P acnes +C5-6Negative culture
7C4-5 +P acnes +C5-6 +P acnes +
8C4-5Negative cultureC5-6 +Kocuria rhizophila +C6-7Negative culture
9C4-5CNSC5-6 +P acnes +
10C4-5CNSC5-6 +P acnes +
11C5-6 +P acnes +C6-7No sample
12C5-6 +P acnes + Streptococcus spC6-7 +P acnes +
13C5-6 +P acnes +C6-7Negative culture
14C5-6Negative cultureC6-7CNS
15C5-6Negative cultureC6-7 +P acnes +
16C5-6 +P acnes +
17C5-6CNS
+
+ + +

Abbreviations: CNS, coagulase-negative staphylococcus; P. acnes, Propionibacterium acnes; Sp, species.

+
+
+
+

In terms of postoperative outcomes, there was one patient from the CN/DN group who had a superficial wound infection treated with antibiotics and local wound care that resolved completely. No other patient had a postoperative infection. There were 2 reoperations: one patient in the CN/DP and the other in the CP/DP group. The patient in the CN/DP group underwent posterior cervical decompression and fusion 9 months after their initial ACDF (Figure 1A) due to signs of pseudarthrosis, graft subsidence (Figure 1B), and pain. This patient had 1 of 2 discs cultured positive, which was the same level showing radiographic signs of graft subsidence. The organism cultured was CNS and it was sensitive to preoperative antibiotic. After the index surgery, the patient did not show any signs or symptoms of systemic infection. The serological workup was unremarkable and continued to be after the revision surgery. Radiographic evaluation (Figure 1C) at 1-year follow-up post-revision surgery demonstrated proper alignment and fusion. The second patient who underwent reoperation after initial ACDF also developed pseudarthrosis, graft subsidence, and postoperative pain. This was a 1-level fusion and both the disc and control were positive. The patient did not show any signs or symptoms of systemic infection prior to his revision as well, and serologic workup was unremarkable throughout follow-up. Graft subsidence and screw loosening were also evaluated at long-term follow-up, but no significant difference was identified (Table 5).

+ + + +

Postoperative X-rays, showing patient with initial 2-level ACDF (A), who on follow-up started showing radiographic signs of pseudarthrosis and graft subsidence (B), and who, 9 months later, was submitted to revision posterior spinal fusion that demonstrated good proper alignment and fusion at 1-year post-revision surgery (C).

+ + +
+ + + +

Comparison of Patient Surgical Details and Postoperative Outcomes Between Longus Colli Muscle (Control) and Intervertebral Disc (Disc) Culture Results.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Characteristics, n (%)AllCulture Results, n (%) +P +
CN/DNCP/DNCP/DPCN/DP
Number of patients9632113617 +
Presurgical antibiotic (Cephazolin)88 (91.7)29 (90.6)10 (90.9)34 (94.5)15 (88.2).29
Cervical levels fused + + + + +.06
 One34 (35.4)16 (50)6 (54.6)10 (27.8)2 (11.8) +
 Two54 (56.3)14 (43.8)5 (45.5)21 (58.3)14 (82.4) +
 Three8 (8.3)2 (6.3)5 (13.9)1 (5.9) +
Postsurgical outcomes + + + + + +
 Postoperative infection1 (1)1 (3.1).57
 Reoperation2 (2.1)1 (2.8)1 (5.9).54
 Graft subsidence5 (5.3)4 (11.1)1 (5.9).13
 Screw loosening4 (4.2)2 (6.3)2 (5.6).63
Length of follow-upa + + + + + + +
 6 weeks84 (87.5)21 (65.6)11 (100)35 (97.2)17 (100)<.0001*
 3-6 months74 (77.1)21 (65.6)9 (81.2)32 (88.9)12 (70.6).12
 ≥12 months45 (46.9)11 (34.4)7 (63.6)20 (55.6)7 (41.2).21
+
+ + +

Abbreviations: CN, control negative; DN, disc negative; CP, control positive; DP, disc positive; SD, standard deviation.

+
+ +

+a Indicates the number of patients who presented for their follow-up visit.

+
+ +

* Indicates statistically significant values with P < .05.

+
+
+
+
+ +Discussion +

Recently, there have been several studies implicating subclinical infection as a possible cause of symptomatic degenerative spine conditions. +6 +-8 + This assertion, however, remains under contention. +4,16 + In our study, 17.7% of patients had a positive disc culture and a negative control. By excluding patients with a positive control, our disc positive rates decreased from 55.2% to 17.7%, thus obtaining a better estimation of the “true positive” culture rates in our patient cohort.

+

The main concern in our study, as well as other studies reporting positives disc cultures in literature, is the risk of contamination while obtaining and handling culture samples in the operating room and the laboratory. By using a contaminant control, we aimed to reduce potential bias and risk of overestimation of our disc positive rates. Given the proximity of the longus colli muscle to the intervertebral disc, we hypothesize that the presence of a positive culture in both control and disc were most likely due to contamination rather than infection.

+

When examining literature, our positive culture rates are in accordance with prior studies that have included the use of a contaminant control in their methodology. Chen et al +17 + obtained disc and sternocleidomastoid muscle cultures from 32 patients with cervical spondylosis or traumatic cervical spine injury. They found 8 patients (25%) and 9 discs (13.6%) had positive cultures, and 4 patients (12.5%) had a positive control, of which three had a negative disc culture. In the lumbar spine, Zhou et al +18 + utilized muscle tissue as contaminant control in patients having single-level lumbar disc removal as part of their surgical treatment. Of the 46 patients in the study, 9 patients (19.6%) had a positive disc culture and 3 (6.5%) had a positive control. In both studies, the reported disc infection rates excluded patients with a positive control. However, the reported pooled prevalence of disc infection is 36.2% (95% CI = 24.7% to 47.7%) in patients with symptomatic neck or back pain and/or radiculopathy. +6 + The variability in positive culture rates between studies can be explained by the differences in their methodology. Thus, despite these results, it is challenging to report an overall infection rate without considering risk of contamination and bias.

+

Historically. P acnes has been the most common bacteria identified in intervertebral disc of patients with degenerative spine conditions, and it is frequently responsible for infection in other areas of the body, particularly the shoulder. +19,20 + Its ubiquitous nature challenges the validity of results presented in prior studies. To evaluate the risk of contamination, Carricajo et al +4 + conducted a study with 54 patients undergoing surgery for lumbar disc herniation. As a control, they obtained samples from surrounding tissue (ligamentum flavum and muscle), air samples, and laminar flow samples. They found only 2 patients with a positive disc culture, for which control samples were also positive. Interestingly, they found cultures were positive from control ligamentum and muscle samples, laminar flow air swabs, and in patients who did not have a positive disc culture. Thus, authors proposed that prior studies’ positive findings may be a result of contamination.

+

Despite these findings, there are others who still argue that the methodological differences between studies translates to inconsistencies in reported positive and negative rates. +21 + Capoor et al +21 + argued that the possible formation of biofilm by P acnes and the lack of quantitative measures to help discriminate between truly infected and contaminated samples may lead to underestimation and overestimation of overall positive rates reported in literature. +7,8,10,16,21,22 + In their study, they homogenized disc tissue samples to reduce risk of biofilm formation, and performed quantitative cultures and real-time polymerase chain reaction (PCR)-based detection of P acnes genomes to accurately evaluate the prevalence of P acnes in intervertebral discs. They set a threshold for patients with abundant P acnes on culture (“true positives”) to 1000 colony forming units (CFU) per milliliter (>75th percentile) to reduce bias and overestimation of prevalence. Of the 115 samples with presence of P acnes, 39 (11%) had more than 1000 CFU/mL. The authors concluded that their methods of quantifications allowed them for a better estimation of the true prevalence of infection, and that their findings support the theory that P acnes was one of the possible causes of disc degeneration. However, the authors could not exclude the possibility of contamination during sample collection and laboratory handling.

+

The argument of contamination is supported by the commensal nature of bacteria identified in cultures, such as P acnes and CNS. In our study, these 2 microorganisms were present in all but one of our 17 patients in the CN/DP group. While P acnes has increasingly become of interest in the spine surgery, our findings seem to indicate that positive P acnes cultures are due to contamination rather than subclinical infection. +3 +-5,7,9,10,19 +-21,23,24 + Our study also shows that the presence of bacteria in intervertebral disc cultures is not associated with any complications related to infection on follow-up.

+

The incidence of postoperative outcomes did not identify any significant association between patient’s postoperative or radiographic outcomes and culture results. There was one superficial postoperative infection in a patient with both cultures negative. There were 2 patients who were taken back to the operating room for pseudarthrosis and both had a positive disc culture. These patients underwent posterior spinal fusion for their revision surgery; however, their anterior hardware was not removed and therefore was not cultured. Though no difference was observed in rates of postoperative outcomes between groups, the possibility of implant-associated infection or “aseptic” pseudarthrosis still exists. +9 + Studies have shown P acnes as one of the most commonly identified organisms in these cases; however, we were not able to confirm that association with our findings. +25 + +-28 + Additionally, when evaluating radiographic outcomes, no difference was observed either in rates of subsidence or screw loosening. Furthermore, we did not observe a significant association with preoperative spinal injections or previous spine surgery, as well as other demographics and preoperative and postoperative variables evaluated.

+
+ +Limitations +

This study is limited by the fact that no confirmatory molecular analysis was performed, such as PCR. However, detection through culturing methods or PCR have demonstrated similar rates. +6 + In using a contaminant control, we aimed to reduce the risk of overestimation of our disc positive rates by considering true positives as only those patients with a disc positive and control negative culture. However, potential risk of contamination in CN/DP patient disc samples is still present. P acnes has been shown the need to be cultured in for at least 7 days, and this was confirmed with our study. +29,30 + The integration of quantitative measures with the use of PCR may allow us for better interpretation of positive cultures, and with the addition of a contaminant control tissue, correlations studies between control and disc samples could be performed for a better estimation of disc positive rates. However, a validated method that reduces the risk of contamination, and evaluates long-term outcomes, will be ideal to investigate the relationship between presence of bacteria is disc culture and degenerative spine conditions.

+
+ +Conclusion +

The prevalence of bacterial infection, with the use of contaminant control, in patients undergoing ACDF for cervical degenerative conditions is 17.7%. P acnes was the most commonly identified organism. While our rates exclude patients with positive contaminant control, the possibility of contamination of intervertebral disc cultures could not be entirely rejected. Our findings also show that culture results did not have any influence in postoperative outcomes.

+
+ + + + + +

The views expressed in the article are our own and not an official position of the institution.

+
+ + +

The author(s) declared the following potential conflicts of interest with respect to the research, authorship, and/or publication of this article: Dr Gelb is a board member and fellowship committee chair for AOSpine NA. He receives payment for lectures and for development of educational presentations from AOSpine NA. He receives royalties from DePuy Synthes Spine and Globus Medical. He has stock in the American Society for Investigative Pathology. Dr Koh receives payment for consultancy from Biomet. His institution receives RO1 grant money from the National Institutes of Health. Dr Ludwig is a board member for Globus Medical, the American Board of Orthopaedic Surgery, the American Orthopaedic Association, the Cervical Spine Research Society, and the Society for Minimally Invasive Spine Surgery. He is a paid consultant for DePuy Synthes, K2M, and Globus Medical. He receives payment for lectures and travel accommodations from DePuy Synthes and K2M. He receives payment for patents and royalties from DePuy Synthes and Globus Medical. He has stock in Innovative Surgical Designs and the American Society for Investigative Pathology. He receives research support from AO Spine North America Spine Fellowship support, Pacira Pharmaceutical, and AOA Omega Grant. He is a board member of Maryland Development Corporation. He receives royalties from Thieme, Quality Medical Publishers. He is on the governing board of Journal of Spinal Disorders and Techniques, The Spine Journal, and Contemporary Spine Surgery. The authors have no further potential conflicts of interest to disclose.

+
+ + +

The author(s) received no financial support for the research, authorship, and/or publication of this article.

+
+ + +

Daniel E. Gelb, MD https://orcid.org/0000-0002-7263-6177 +

+

Steven C. Ludwig, MD https://orcid.org/0000-0002-3962-5724 +

+
+
+ +References + + + + + +Choi +YS + +. Pathophysiology of degenerative disc disease. Asian Spine J. 2009;3:3944. + + + + + + +Guiot +BH + + +Fessler +RG + +. Molecular biology of degenerative disc disease. Neurosurgery. 2000;47:10341040. + + + + + + +Stirling +A + + +Worthington +T + + +Rafiq +M + + +Lambert +PA + + +Elliott +TS + +. Association between sciatica and Propionibacterium acnes. Lancet. 2001;357:20242025. + + + + + + +Carricajo +A + + +Nuti +C + + +Aubert +E + +, et al. Propionibacterium acnes contamination in lumbar disc surgery. J Hosp Infect. 2007;66:275277. + + + + + + +Coscia +MF + + +Denys +GA + + +Wack +MF + +. Propionibacterium acnes, coagulase-negative Staphylococcus, and the “biofilm-like” intervertebral disc. Spine (Phila Pa 1976). 2016;41:18601865. + + + + + + +Ganko +R + + +Rao +PJ + + +Phan +K + + +Mobbs +RJ + +. Can bacterial infection by low virulent organisms be a plausible cause for symptomatic disc degeneration? A systematic review. Spine (Phila Pa 1976). 2015;40:E587E592. + + + + + + +Arndt +J + + +Charles +YP + + +Koebel +C + + +Bogorin +I + + +Steib +JP + +. Bacteriology of degenerated lumbar intervertebral disks. J Spinal Disord Tech. 2012;25:E211E216. + + + + + + +Rao +PJ + + +Phan +K + + +Reddy +R + + +Scherman +DB + + +Taylor +P + + +Mobbs +RJ + +. DISC (Degenerate-disc Infection Study with Contaminant Control): pilot study of Australian cohort of patients without the contaminant control. Spine (Phila Pa 1976). 2016;41:935939. + + + + + + +Khalil +JG + + +Gandhi +SD + + +Park +DK + + +Fischgrund +JS + +. Cutibacterium acnes in spine pathology: pathophysiology, diagnosis, and management. J Am Acad Orthop Surg. 2019;27:e633e640. + + + + + + +Agarwal +V + + +Golish +SR + + +Alamin +TF + +. Bacteriologic culture of excised intervertebral disc from immunocompetent patients undergoing single level primary lumbar microdiscectomy. J Spinal Disord Tech. 2011;24:397400. + + + + + + +Singhal +N + + +Kumar +M + + +Kanaujia +PK + + +Virdi +JS + +. MALDI-TOF mass spectrometry: an emerging technology for microbial identification and diagnosis. Front Microbiol. 2015;6:791. + + + + + + +Yang +JJ + + +Yu +CH + + +Chang +BS + + +Yeom +JS + + +Lee +JH + + +Lee +CK + +. Subsidence and nonunion after anterior cervical interbody fusion using a stand-alone polyetheretherketone (PEEK) cage. Clin Orthop Surg. 2011;3:1623. + + + + + + +Berquist +TH + +. Spinal instrumentation. In: + +Berquist +TH + +, ed. Imaging of Orthopedic Fixation Devices and Prostheses. Philadelphia, PA: Lippincott Williams and Wilkins; 2009:75152. + + + + + + +Kim +P + + +Zee +CS + +. Imaging of the postoperative spine: cages, prostheses, and instrumentation. In: + +Van Goethem +J + + +Van den Hauwe +L + + +Brizel +P + +, eds. Spinal Imaging: Diagnostic Imaging of the Spine and Spinal Cord. Berlin, Germany: Springer; 2007:397413. + + + + + + +Young +PM + + +Berquist +TH + + +Bancroft +LW + + +Peterson +JJ + +. Complications of spinal instrumentation. Radiographics. 2007;27:775789. + + + + + + +Rigal +J + + +Thelen +T + + +Byrne +F + +, et al. Prospective study using anterior approach did not show association between Modic 1 changes and low grade infection in lumbar spine. Eur Spine J. 2016;25:10001005. + + + + + + +Chen +Y + + +Wang +X + + +Zhang +X + +, et al. Low virulence bacterial infections in cervical intervertebral discs: a prospective case series. Eur Spine J. 2018;27:24962505. + + + + + + +Zhou +Z + + +Chen +Z + + +Zheng +Y + +, et al. Relationship between annular tear and presence of Propionibacterium acnes in lumbar intervertebral disc. Eur Spine J. 2015;24:24962502. + + + + + + +Dodson +CC + + +Craig +EV + + +Cordasco +FA + +, et al. Propionibacterium acnes infection after shoulder arthroplasty: a diagnostic challenge. J Shoulder Elbow Surg. 2010;19:303307. + + + + + + +Falconer +TM + + +Baba +M + + +Kruse +LM + +, et al. Contamination of the surgical field with Propionibacterium acnes in primary shoulder arthroplasty. J Bone Joint Surg Am. 2016;98:17221728. + + + + + + +Capoor +MN + + +Ruzicka +F + + +Machackova +T + +, et al. Prevalence of Propionibacterium acnes in intervertebral discs of patients undergoing lumbar microdiscectomy: a prospective cross-sectional study. PLoS One. 2016;11:e0161676. + + + + + + +Ben-Galim +P + + +Rand +N + + +Giladi +M + +, et al. Association between sciatica and microbial infection: true infection or culture contamination? Spine (Phila Pa 1976). 2006;31:25072509. + + + + + + +Albert +HB + + +Sorensen +JS + + +Christensen +BS + + +Manniche +C + +. Antibiotic treatment in patients with chronic low back pain and vertebral bone edema (Modic type 1 changes): a double-blind randomized clinical controlled trial of efficacy. Eur Spine J. 2013;22:697707. + + + + + + +McLorinan +GC + + +Glenn +JV + + +McMullan +MG + + +Patrick +S + +. Propionibacterium acnes wound contamination at the time of spinal surgery. Clin Orthop Relat Res. 2005;(437):6773. + + + + + + +LaGreca +J + + +Hotchkiss +M + + +Carry +P + +, et al. Bacteriology and risk factors for development of late (greater than one year) deep infection following spinal fusion with instrumentation. Spine Deform. 2014;2:186190. + + + + + + +Farley +FA + + +Li +Y + + +Gilsdorf +JR + +, et al. Postoperative spine and VEPTR infections in children: a case-control study. J Pediatr Orthop. 2014;34:1421. + + + + + + +Hahn +F + + +Zbinden +R + + +Min +K + +. Late implant infections caused by Propionibacterium acnes in scoliosis surgery. Eur Spine J. 2005;14:783788. + + + + + + +Shifflett +GD + + +Bjerke-Kroll +BT + + +Nwachukwu +BU + +, et al. Microbiologic profile of infections in presumed aseptic revision spine surgery. Eur Spine J. 2016;25:39023907. + + + + + + +Abdulmassih +R + + +Makadia +J + + +Como +J + + +Paulson +M + + +Min +Z + + +Bhanot +N + +. Propionibacterium acnes: time-to-positivity in standard bacterial culture from different anatomical sites. J Clin Med Res. 2016;8:916918. + + + + + + +Bossard +DA + + +Ledergerber +B + + +Zingg +PO + +, et al. Optimal length of cultivation time for isolation of Propionibacterium acnes in suspected bone and joint infections is more than 7 days. J Clin Microbiol. 2016;54:30433049. + + +
+
diff --git a/spec/fixtures/sage/CCX_2021_28_10.1177_1073274820985792/10.1177_1073274820985792.xml b/spec/fixtures/sage/CCX_2021_28_10.1177_1073274820985792/10.1177_1073274820985792.xml index 1c9cc5fe9..ceabd03d3 100644 --- a/spec/fixtures/sage/CCX_2021_28_10.1177_1073274820985792/10.1177_1073274820985792.xml +++ b/spec/fixtures/sage/CCX_2021_28_10.1177_1073274820985792/10.1177_1073274820985792.xml @@ -1769,4 +1769,4 @@ - \ No newline at end of file + diff --git a/spec/fixtures/sage/sage_config.yml b/spec/fixtures/sage/sage_config.yml index bc2cf2bd8..6f1c52e09 100644 --- a/spec/fixtures/sage/sage_config.yml +++ b/spec/fixtures/sage/sage_config.yml @@ -1,7 +1,7 @@ # Example configuration for Sage ingest package_dir: spec/fixtures/sage ingest_progress_log: spec/fixtures/sage/ingest_progress.log -# admin_set: sage admin set +admin_set: sage admin set # depositor_onyen: admin # deposit_title: Deposit by Sage Depositor via CDR Collector 1.0 # deposit_method: CDR Collector 1.0 diff --git a/spec/fixtures/sage/triple_package.zip b/spec/fixtures/sage/triple_package.zip new file mode 100644 index 0000000000000000000000000000000000000000..b002cc10c579b0920a608c0e811c8f73428f3377 GIT binary patch literal 584 zcmWIWW@Zs#-~hr(-x5NPw%&4IQ^BKr|7+BH>Vv!bB0p19+VPOL^8x%G$u%s~#VK&hrg={)3 hWMHPFx_lp!>BNOofHx}}$aTy>D8|UZAOpk<3;=8veFgvk literal 0 HcmV?d00001 diff --git a/spec/lib/qa/authorities/local/file_based_authority_spec.rb b/spec/lib/qa/authorities/local/file_based_authority_spec.rb index 09aa49479..fce1053a7 100644 --- a/spec/lib/qa/authorities/local/file_based_authority_spec.rb +++ b/spec/lib/qa/authorities/local/file_based_authority_spec.rb @@ -38,6 +38,9 @@ {"id"=>"http://creativecommons.org/licenses/by-nc-nd/3.0/us/", "label"=>"Attribution-NonCommercial-NoDerivs 3.0 United States", "active"=>"all"}, + {"id"=>"http://creativecommons.org/licenses/by-nc-nd/4.0/", + "label"=>"Attribution-NonCommercial-NoDerivatives 4.0 International", + "active"=>"all"}, {"id"=>"http://creativecommons.org/licenses/by-nc-sa/3.0/us/", "label"=>"Attribution-NonCommercial-ShareAlike 3.0 United States", "active"=>"all"}] diff --git a/spec/models/jats_ingest_work_spec.rb b/spec/models/jats_ingest_work_spec.rb new file mode 100644 index 000000000..7b47813af --- /dev/null +++ b/spec/models/jats_ingest_work_spec.rb @@ -0,0 +1,110 @@ +require 'rails_helper' + +RSpec.describe JatsIngestWork, type: :model do + let(:xml_file_path) { File.join(fixture_path, 'sage', 'CCX_2021_28_10.1177_1073274820985792', '10.1177_1073274820985792.xml') } + let(:work) { described_class.new(xml_path: xml_file_path) } + + it "can be initialized" do + expect(described_class.new(xml_path: xml_file_path)).to be_instance_of described_class + end + + it "has xml" do + expect(Nokogiri::XML(work.jats_xml)).to be_instance_of Nokogiri::XML::Document + end + + it "can create a properly constructed person object" do + expect(work.creators).to be_instance_of Hash + expect(work.creators.count).to eq 6 + expect(work.creators[0]).to be_instance_of Hash + expect(work.creators[0]).to include('name' => "Holt, Hunter K.") + expect(work.creators[0]).to include('orcid' => 'https://orcid.org/0000-0001-6833-8372') + expect(work.creators[2]).to include('name' => 'Hu, Shang-Ying') + expect(work.creators[2]).to include('index' => '3') + expect(work.creators[2]).to include('orcid' => '') + expect(work.creators[2]).to include('other_affiliation' => /Department of Cancer Epidemiology/) + expect(work.creators[0]).to include('affiliation' => '') + expect(work.creators[0]).to include('other_affiliation' => 'Department of Family and Community Medicine, University of California, San Francisco, CA, USA') + expect(work.creators[4]).to include('name' => 'Smith, Jennifer S.') + expect(work.creators[4]).to include('index' => '5') + expect(work.creators[4]).to include('other_affiliation' => 'Department of Epidemiology, UNC Gillings School of Global Public Health, Chapel Hill, NC, USA') + end + + it "can map UNC affiliations to the controlled vocabulary" do + pending("Mapping from Sage affiliations to UNC controlled vocabulary") + expect(work.creators[4]).to include('affiliation'=>'Gillings School of Global Public Health; Department of Epidemiology') + end + + it "can map affiliation ids to institution names" do + expect(work.affiliation_map).to be_instance_of Hash + expect(work.affiliation_map['aff1-1073274820985792']).to eq('Department of Family and Community Medicine, University of California, San Francisco, CA, USA') + end + + it "returns arrays for multi-valued fields and strings for single value fields" do + expect(work.abstract).to be_instance_of Array + expect(work.copyright_date).to be_instance_of String + expect(work.date_of_publication).to be_instance_of String + expect(work.funder).to be_instance_of Array + expect(work.identifier).to be_instance_of Array + expect(work.issn).to be_instance_of Array + expect(work.journal_issue).to be nil + expect(work.journal_title).to be_instance_of String + expect(work.journal_volume).to be_instance_of String + expect(work.keyword).to be_instance_of Array + expect(work.license).to be_instance_of Array + expect(work.license_label).to be_instance_of Array + expect(work.page_end).to be nil + expect(work.page_start).to be nil + expect(work.publisher).to be_instance_of Array + expect(work.rights_holder).to be_instance_of Array + expect(work.title).to be_instance_of Array + end + + it "can return metadata from the xml" do + expect(work.abstract.first).to include "provinces across China and administered a questionnaire" + expect(work.copyright_date).to eq '2021' + expect(work.date_of_publication).to eq '2021-02-01' + expect(work.funder).to eq ["Fogarty International Center"] + expect(work.identifier).to eq ["10.1177/1073274820985792"] + expect(work.issn).to eq ['1073-2748'] + expect(work.journal_issue).to be nil + expect(work.journal_title).to eq "Cancer Control" + expect(work.journal_volume).to eq '28' + expect(work.keyword).to match_array(['HPV', 'HPV knowledge and awareness', 'cervical cancer screening', 'migrant women', 'China']) + expect(work.license).to eq(['http://creativecommons.org/licenses/by-nc/4.0/']) + expect(work.page_end).to be nil + expect(work.page_start).to be nil + expect(work.publisher).to eq ["SAGE Publications"] + # expect(work.resource_type).to eq(['Article']) + expect(work.rights_holder).to eq(["SAGE Publications Inc, unless otherwise noted. Manuscript content on this site is licensed under Creative Common Licences"]) + expect(work.title).to eq(["Inequalities in Cervical Cancer Screening Uptake Between Chinese Migrant Women and Local Women: A Cross-Sectional Study"]) + end + + it "can map to the controlled license vocabulary" do + expect(work.license).to eq(['http://creativecommons.org/licenses/by-nc/4.0/']) + expect(work.license_label).to eq ['Attribution-NonCommercial 4.0 International'] + end + + context "with an article that has a physical print" do + let(:xml_file_path) { File.join(fixture_path, 'sage', '10.1177_2192568219888179.xml') } + + it "can return metadata from the xml" do + expect(work.abstract.first).to include "patients undergoing elective ACDF were prospectively enrolled" + expect(work.copyright_date).to eq '2019' + expect(work.date_of_publication).to eq '2021-01' + expect(work.funder).to eq [] + expect(work.identifier).to eq ["10.1177/2192568219888179"] + expect(work.issn).to eq ['2192-5682', '2192-5690'] + expect(work.journal_issue).to eq '1' + expect(work.journal_title).to eq 'Global Spine Journal' + expect(work.journal_volume).to eq '11' + expect(work.keyword).to match_array(['degenerative cervical conditions', 'Propionibacterium acnes', 'contaminant control', 'intervertebral disc infection', 'disc cultures', 'anterior cervical discectomy and fusion', 'revision surgery']) + expect(work.license).to eq(['http://creativecommons.org/licenses/by-nc-nd/4.0/']) + expect(work.license_label).to eq(['Attribution-NonCommercial-NoDerivatives 4.0 International']) + expect(work.page_end).to eq '20' + expect(work.page_start).to eq '13' + expect(work.publisher).to eq ["SAGE Publications"] + expect(work.rights_holder).to eq(["AO Spine, unless otherwise noted. Manuscript content on this site is licensed under Creative Commons Licenses"]) + expect(work.title).to eq(["The Prevalence of Bacterial Infection in Patients Undergoing Elective ACDF for Degenerative Cervical Spine Conditions: A Prospective Cohort Study With Contaminant Control"]) + end + end +end diff --git a/spec/rails_helper.rb b/spec/rails_helper.rb index ee2e84202..e39607b77 100755 --- a/spec/rails_helper.rb +++ b/spec/rails_helper.rb @@ -6,7 +6,11 @@ abort("The Rails environment is running in production mode!") if Rails.env.production? require 'rspec/rails' require 'webmock/rspec' -WebMock.disable_net_connect!(allow_localhost: true, allow: ['fcrepo:8080', 'solr:8983', 'opaquenamespace.org']) + +WebMock.disable_net_connect!(allow_localhost: true, allow: ['fcrepo:8080', 'solr:8983', 'opaquenamespace.org', 'chromedriver.storage.googleapis.com']) + +Capybara.default_normalize_ws = true + # Add additional requires below this line. Rails is not loaded until this point! # Requires supporting ruby files with custom matchers and macros, etc, in diff --git a/spec/services/hyrax/workflow/pending_deletion_notification_spec.rb b/spec/services/hyrax/workflow/pending_deletion_notification_spec.rb index 376c3e0a7..d67d1655a 100644 --- a/spec/services/hyrax/workflow/pending_deletion_notification_spec.rb +++ b/spec/services/hyrax/workflow/pending_deletion_notification_spec.rb @@ -1,9 +1,9 @@ require 'rails_helper' RSpec.describe Hyrax::Workflow::PendingDeletionNotification do - let(:admin) { User.find_by_user_key('admin') } - let(:depositor) { User.create(email: 'test@example.com', uid: 'test@example.com', password: 'password', password_confirmation: 'password') } - let(:cc_user) { User.create(email: 'test2@example.com', uid: 'test2@example.com', password: 'password', password_confirmation: 'password') } + let(:admin) { FactoryBot.create(:admin) } + let(:depositor) { FactoryBot.create(:user) } + let(:cc_user) { FactoryBot.create(:user) } let(:work) { Article.create(title: ['New Article'], depositor: depositor.email) } let(:admin_set) do AdminSet.create(title: ["article admin set"], @@ -21,18 +21,19 @@ let(:comment) { double("comment", comment: 'A pleasant read') } describe ".send_notification" do + before do + User.delete_all + end it 'sends a message to all users' do recipients = { 'to' => [depositor], 'cc' => [cc_user] } expect(depositor).to receive(:send_message) - .with(anything, - I18n.t('hyrax.notifications.workflow.deletion_pending.message', title: work.title[0], work_id: work.id, - document_path: "#{ENV['HYRAX_HOST']}/concern/articles/#{work.id}", user: depositor, comment: comment.comment), - anything).exactly(3).times.and_call_original - + .with(anything, I18n.t('hyrax.notifications.workflow.deletion_pending.message', title: work.title[0], + work_id: work.id, document_path: "#{ENV['HYRAX_HOST']}/concern/articles/#{work.id}", + user: depositor, comment: comment.comment), anything).exactly(3).times.and_call_original expect { described_class.send_notification(entity: entity, user: depositor, comment: comment, recipients: recipients) } - .to change { admin.mailbox.inbox.count }.by(1) - .and change { depositor.mailbox.inbox.count }.by(1) - .and change { cc_user.mailbox.inbox.count }.by(1) + .to change { admin.mailbox.inbox.count }.by(1) + .and change { depositor.mailbox.inbox.count }.by(1) + .and change { cc_user.mailbox.inbox.count }.by(1) end context 'without carbon-copied users' do @@ -40,9 +41,9 @@ recipients = { 'to' => [depositor], 'cc' => [] } expect(depositor).to receive(:send_message).exactly(2).times.and_call_original expect { described_class.send_notification(entity: entity, user: depositor, comment: comment, recipients: recipients) } - .to change { admin.mailbox.inbox.count }.by(1) - .and change { depositor.mailbox.inbox.count }.by(1) - .and change { cc_user.mailbox.inbox.count }.by(0) + .to change { admin.mailbox.inbox.count }.by(1) + .and change { depositor.mailbox.inbox.count }.by(1) + .and change { cc_user.mailbox.inbox.count }.by(0) end end end diff --git a/spec/services/tasks/sage_ingest_service_spec.rb b/spec/services/tasks/sage_ingest_service_spec.rb index 2f7e9992f..4af03bb96 100644 --- a/spec/services/tasks/sage_ingest_service_spec.rb +++ b/spec/services/tasks/sage_ingest_service_spec.rb @@ -4,22 +4,38 @@ RSpec.describe Tasks::SageIngestService do let(:service) { described_class.new(configuration_file: path_to_config) } - let(:path_to_config) { File.join(fixture_path, "sage", "sage_config.yml") } - let(:path_to_tmp) { File.join(fixture_path, "sage", "tmp") } + let(:sage_fixture_path) { File.join(fixture_path, "sage") } + let(:path_to_config) { File.join(sage_fixture_path, "sage_config.yml") } + let(:path_to_tmp) { File.join(sage_fixture_path, "tmp") } let(:first_package_identifier) { 'CCX_2021_28_10.1177_1073274820985792' } let(:first_zip_path) { "spec/fixtures/sage/#{first_package_identifier}.zip" } let(:first_dir_path) { "spec/fixtures/sage/tmp/#{first_package_identifier}" } let(:first_pdf_path) { "#{path_to_tmp}/10.1177_1073274820985792.pdf" } - let(:ingest_progress_log_path) { File.join(fixture_path, "sage", "ingest_progress.log") } + let(:first_xml_path) { "#{sage_fixture_path}/#{first_package_identifier}/10.1177_1073274820985792.xml" } + let(:ingest_progress_log_path) { File.join(sage_fixture_path, "ingest_progress.log") } + let(:admin) { FactoryBot.create(:admin) } - after do - # empty the progress log + let(:admin_set) do + AdminSet.create(title: ['sage admin set'], + description: ['some description']) + end + + before do + # instantiate the sage ingest admin_set + admin_set + end + + # empty the progress log + around do |example| + File.open(ingest_progress_log_path, 'w') {|file| file.truncate(0) } + example.run File.open(ingest_progress_log_path, 'w') {|file| file.truncate(0) } end describe '#initialize' do it "sets parameters from the configuration file" do expect(service.package_dir).to eq "spec/fixtures/sage" + expect(service.admin_set).to be_instance_of(AdminSet) end it 'creates a progress log for the ingest' do @@ -29,10 +45,68 @@ it 'can run a wrapper method' do expect(File.foreach(ingest_progress_log_path).count).to eq 0 - service.process_packages + expect do + service.process_packages + end.to change { Article.count }.by(4) expect(File.foreach(ingest_progress_log_path).count).to eq 4 end + context 'with an ingest work object' do + let(:ingest_work) { JatsIngestWork.new(xml_path: first_xml_path) } + let(:built_article) { service.build_article(ingest_work) } + let(:temp_dir) { Dir.mktmpdir } + + after do + FileUtils.remove_entry(temp_dir) + end + + it 'can create a valid article' do + expect do + service.build_article(ingest_work) + end.to change { Article.count }.by(1) + end + + it 'returns a valid article' do + expect(built_article).to be_instance_of Article + expect(built_article.persisted?).to be true + expect(built_article.valid?).to be true + # These values are also tested via the edit form in spec/features/edit_sage_ingested_works_spec.rb + expect(built_article.title).to eq(['Inequalities in Cervical Cancer Screening Uptake Between Chinese Migrant Women and Local Women: A Cross-Sectional Study']) + first_creator = built_article.creators.find { |creator| creator[:index] == ['1'] } + expect(first_creator.attributes['name']).to match_array(["Holt, Hunter K."]) + expect(first_creator.attributes['other_affiliation']).to match_array(['Department of Family and Community Medicine, University of California, San Francisco, CA, USA']) + expect(first_creator.attributes['orcid']).to match_array(['https://orcid.org/0000-0001-6833-8372']) + expect(built_article.abstract).to include(/Efforts to increase education opportunities, provide insurance/) + expect(built_article.date_issued).to eq('2021-02-01') + expect(built_article.copyright_date).to eq('2021') + expect(built_article.dcmi_type).to match_array(["http://purl.org/dc/dcmitype/Text"]) + expect(built_article.funder).to match_array(['Fogarty International Center']) + expect(built_article.identifier).to match_array(['10.1177/1073274820985792']) + expect(built_article.issn).to match_array(['1073-2748']) + expect(built_article.journal_issue).to be nil + expect(built_article.journal_title).to eq('Cancer Control') + expect(built_article.journal_volume).to eq('28') + expect(built_article.keyword).to match_array(['HPV', 'HPV knowledge and awareness', 'cervical cancer screening', 'migrant women', 'China']) + expect(built_article.license).to match_array(["http://creativecommons.org/licenses/by-nc/4.0/"]) + expect(built_article.license_label).to match_array(['Attribution-NonCommercial 4.0 International']) + expect(built_article.publisher).to match_array(['SAGE Publications']) + expect(built_article.resource_type).to match_array(['Article']) + expect(built_article.rights_holder).to include(/SAGE Publications Inc, unless otherwise noted. Manuscript/) + expect(built_article.rights_statement).to eq("http://rightsstatements.org/vocab/InC/1.0/") + end + + it 'puts the work in an admin_set' do + expect(built_article.admin_set).to be_instance_of(AdminSet) + expect(built_article.admin_set.title).to eq(admin_set.title) + end + + it 'attaches a file_set to the article' do + pending("Adding file sets to the Article object") + expect(built_article.file_sets).to be_instance_of(Array) + expect(built_article.file_sets.first).to be_instance_of(FileSet) + end + end + describe '#extract_files' do let(:temp_dir) { Dir.mktmpdir } after do @@ -45,10 +119,6 @@ end context "with a package already unzipped" do - before do - # empty the progress log - File.open(ingest_progress_log_path, 'w') {|file| file.truncate(0) } - end it 'can write to the progress log' do allow(service).to receive(:package_ingest_complete?).and_return(true) expect(File.size(ingest_progress_log_path)).to eq 0 @@ -74,12 +144,13 @@ end context "with unexpected contents in the package" do + let(:temp_dir) { Dir.mktmpdir } + let(:package_path) { File.join(fixture_path, "sage", "triple_package.zip") } + it "logs an error" do allow(Rails.logger).to receive(:error) - allow(service).to receive(:extract_files).and_return({"pdf_name" => "a", "xml_name" => "b"}) - allow(service).to receive(:extract_files).with(first_zip_path, any_args).and_return({"pdf_name" => "a", "xml_name" => "b", "unexpected_file_name"=> "c"}) - service.process_packages - expect(Rails.logger).to have_received(:error).with("Unexpected package contents - more than two files extracted from #{first_zip_path}") + service.extract_files(package_path, temp_dir) + expect(Rails.logger).to have_received(:error).with("Unexpected package contents - more than two files extracted from #{package_path}") end end end diff --git a/spec/support/capybara.rb b/spec/support/capybara.rb new file mode 100644 index 000000000..30cc6d4c7 --- /dev/null +++ b/spec/support/capybara.rb @@ -0,0 +1,23 @@ +# frozen_string_literal: true + +Webdrivers.cache_time = 3 + +# Setup chrome headless driver +Capybara.server = :webrick + +Capybara.register_driver :chrome_headless do |app| + client = Selenium::WebDriver::Remote::Http::Default.new + client.read_timeout = 120 + + options = ::Selenium::WebDriver::Chrome::Options.new + options.add_argument('--headless') + options.add_argument('--no-sandbox') + options.add_argument('--disable-dev-shm-usage') + options.add_argument('--window-size=1400,1400') + + capabilities = Selenium::WebDriver::Remote::Capabilities.chrome + + Capybara::Selenium::Driver.new(app, browser: :chrome, capabilities: [options, capabilities], http_client: client) +end + +Capybara.javascript_driver = :chrome_headless