4 changes: 3 additions & 1 deletion .env.build
Expand Up @@ -20,4 +20,6 @@ ZBMATH_RELATED_SOURCE_TOKEN=
ZBMATH_AUTHOR_SOURCE_TOKEN=
ZBMATH_IDENTIFIER_SOURCE_TOKEN=
EVENTDATA_TOKEN=
STAFF_ADMIN_TOKEN=
STAFF_ADMIN_TOKEN=
CROSSREF_SOURCE_ID=
CROSSREF_SOURCE_TOKEN=
4 changes: 3 additions & 1 deletion .env.example
Expand Up @@ -11,4 +11,6 @@ AWS_SECRET_ACCESS_KEY=
# Can not be staff admin JWT must be valid user account
STAFF_PROFILES_ADMIN_TOKEN=

STAFF_ADMIN_TOKEN=
STAFF_ADMIN_TOKEN=
CROSSREF_SOURCE_ID=
CROSSREF_SOURCE_TOKEN=
48 changes: 20 additions & 28 deletions app/models/crossref.rb
Expand Up @@ -29,23 +29,21 @@ def source_id

def get_query_url(options = {})
params = {
source: "crossref",
"from-collected-date" => options[:from_date],
"until-collected-date" => options[:until_date],
"from-created-date" => options[:from_date],
"until-created-date" => options[:until_date],
mailto: "info@datacite.org",
scholix: true,
rows: options[:rows],
cursor: options[:cursor],
page: options[:page],
}.compact

"#{ENV['CROSSREF_QUERY_URL']}/v1/events?#{URI.encode_www_form(params)}"
"#{ENV['CROSSREF_QUERY_URL']}/beta/datacitations?#{URI.encode_www_form(params)}"
end

def get_total(options = {})
query_url = get_query_url(options.merge(rows: 0))
result = Maremma.get(query_url, options)
message = result.body.dig("data", "message").to_h
[message["total-results"].to_i, message["next-cursor"]]
message["total-results"].to_i
end

def queue_jobs(options = {})
Expand All @@ -57,18 +55,18 @@ def queue_jobs(options = {})
options[:until_date].presence || Time.now.to_date.iso8601
options[:content_type] = "json"

total, cursor = get_total(options)
total = get_total(options)

if total.positive?
# walk through results paginated via cursor
# walk through results paginated via page
total_pages = (total.to_f / job_batch_size).ceil
error_total = 0

(0...total_pages).each do |page|
options[:offset] = page * job_batch_size
(0...total_pages).each do |page_num|
options[:offset] = page_num * job_batch_size
options[:total] = total
options[:cursor] = cursor
count, cursor = process_data(options)
options[:page] = page_num
process_data(options)
Comment on lines +65 to +69
⚠️ Potential issue | 🔴 Critical

🧩 Analysis chain

🌐 Web query:

Crossref beta datacitations API pagination parameters

💡 Result:

The Crossref beta Data Citations API, accessible at https://api.crossref.org/beta/datacitations/, supports pagination using the standard Crossref REST API parameters: rows (default 20, max 1000) to specify the number of results per page, and cursor (start with cursor=* for the first page, then use the next-cursor from the response) for efficient pagination through large result sets. Stop paginating when the number of returned items is less than the requested rows. Cursors expire after 5 minutes of inactivity. Include mailto parameter during beta for contact. Full details, including all parameters, are in the official Swagger documentation referenced in the API docs.
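As a concrete illustration of those parameters, here is a minimal sketch of the first request in a cursor walk. The endpoint path and the `rows`/`cursor`/`mailto` parameters come from the API description above; the date filter names mirror the diff, and the specific date values are placeholders.

```ruby
require "uri"

# Build the first-page URL for a cursor walk against the beta endpoint.
# "cursor=*" requests the first page; later requests substitute the
# "next-cursor" value returned in the previous response's message.
params = {
  "from-created-date" => "2024-01-01",   # placeholder dates
  "until-created-date" => "2024-01-31",
  "mailto" => "info@datacite.org",
  "rows" => 1000,                        # documented maximum per page
  "cursor" => "*",
}
url = "https://api.crossref.org/beta/datacitations?#{URI.encode_www_form(params)}"
```

Stopping when a response returns fewer than `rows` items avoids an extra empty-page request at the end of the walk.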

🏁 Script executed:

# Find the crossref.rb file and examine the pagination implementation
find . -name "crossref.rb" -type f | head -5

Repository: datacite/levriero



🏁 Script executed:

# Once located, read the file to understand the full context of pagination
cat -n app/models/crossref.rb | head -100



🏁 Script executed:

# Also search for the get_query_url method implementation
rg "def get_query_url" -A 20 app/models/



🏁 Script executed:

# Search for process_data method
rg "def process_data" -A 15 app/models/



Replace page-based pagination with cursor-based pagination for Crossref /beta/datacitations API.

The Crossref /beta/datacitations API uses cursor-based pagination (with cursor and next-cursor parameters), not page-based pagination. The current code at lines 65-69 generates sequential page numbers (0, 1, 2, ...) and passes them via the page parameter, which the API does not recognize for this endpoint. This causes incorrect or missing results.

The loop should instead:

  1. Start with cursor: "*" for the first request
  2. Extract next-cursor from the API response
  3. Use that cursor for the next request
  4. Stop when results returned < rows

Additionally, options[:offset] (line 66) is calculated but never used—remove it.
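The cursor loop described above can be sketched as follows. This is a self-contained illustration, not the merged code: `fetch_page` stands in for the real HTTP call (`Maremma.get` against `/beta/datacitations`), and the response shape assumed here is just the `items`/`next-cursor` structure the finding refers to.

```ruby
# Walk a cursor-paginated result set: start at "*", follow next-cursor,
# stop when a page comes back shorter than the requested rows.
def paginate_with_cursor(rows:, fetch_page:)
  cursor = "*"              # Crossref convention: "*" starts a cursor walk
  collected = []
  loop do
    message = fetch_page.call(cursor: cursor, rows: rows)
    items = Array(message["items"])
    collected.concat(items)
    cursor = message["next-cursor"]
    # a short page (or a missing cursor) signals the final batch
    break if items.length < rows || cursor.nil?
  end
  collected
end

# Stub backend for demonstration: 5 items served 2 per page, with the
# cursor encoding the next offset.
ITEMS = (1..5).to_a
fake_fetch = lambda do |cursor:, rows:|
  start = cursor == "*" ? 0 : cursor.to_i
  { "items" => ITEMS[start, rows] || [], "next-cursor" => (start + rows).to_s }
end

results = paginate_with_cursor(rows: 2, fetch_page: fake_fetch)
# results collects all five items across three requests
```

In the model itself, `process_data` would need to return (or yield) the response message so the loop can read `next-cursor` between iterations.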

🤖 Prompt for AI Agents
Verify each finding against the current code and only fix it if needed.

In `app/models/crossref.rb` around lines 65-69, the code uses page-based pagination, but Crossref /beta/datacitations requires cursor-based pagination. Replace the (0...total_pages) loop with a cursor loop: initialize options[:cursor] = "*" for the first request; remove options[:offset] and options[:page]; have process_data(options) return the API response (or modify it to yield the response); extract response['message']['next-cursor'] and set options[:cursor] to it for the next iteration; stop looping when the number of items returned is less than job_batch_size (rows). Ensure process_data uses options[:cursor] when making requests and propagates next-cursor back to the loop.

end
text = "Queued import for #{total} DOIs updated #{options[:from_date]} - #{options[:until_date]}."
else
Expand Down Expand Up @@ -99,34 +97,28 @@ def push_data(result, _options = {})
return result.body.fetch("errors") if result.body.fetch("errors",
nil).present?

items = result.body.dig("data", "message", "events")
items = result.body.dig("data", "message", "items")
# Rails.logger.info "Extracting related identifiers for #{items.size} DOIs updated from #{options[:from_date]} until #{options[:until_date]}."

Array.wrap(items).map do |item|
CrossrefImportJob.perform_later(item)
end

[items.length, result.body.dig("data", "message", "next-cursor")]
end

def self.push_item(item)
subj = cached_crossref_response(item["subj_id"])
obj = cached_datacite_response(item["obj_id"])
subj = cached_crossref_response(item["subject"]["id"])
obj = cached_datacite_response(item["object"]["id"])

data = {
"data" => {
"id" => item["id"],
"type" => "events",
"attributes" => {
"messageAction" => item["action"],
"subjId" => item["subj_id"],
"objId" => item["obj_id"],
"relationTypeId" => item["relation_type_id"].to_s.dasherize,
"sourceId" => item["source_id"].to_s.dasherize,
"sourceToken" => item["source_token"],
"occurredAt" => item["occurred_at"],
"subjId" => item["subject"]["id"],
"objId" => item["object"]["id"],
"relationTypeId" => item["relation"].to_s.dasherize,
"sourceId" => "crossref",
"sourceToken" => ENV["CROSSREF_SOURCE_TOKEN"],
"timestamp" => item["timestamp"],
"license" => item["license"],
"subj" => subj,
"obj" => obj,
},
Expand All @@ -135,6 +127,6 @@ def self.push_item(item)

send_event_import_message(data)

Rails.logger.info "[Event Data] #{item['subj_id']} #{item['relation_type_id']} #{item['obj_id']} sent to the events queue."
Rails.logger.info "[Event Data] #{item["subject"]["id"]} #{item["relation"]} #{item["object"]["id"]} sent to the events queue."
end
end
2 changes: 1 addition & 1 deletion config/application.rb
Expand Up @@ -40,7 +40,7 @@
ENV["LAGOTTINO_URL"] ||= "https://api.stage.datacite.org"
ENV["SASHIMI_QUERY_URL"] ||= "https://api.stage.datacite.org"
ENV["EVENTDATA_URL"] ||= "https://bus-staging.eventdata.crossref.org"
ENV["CROSSREF_QUERY_URL"] ||= "https://api.eventdata.crossref.org"
ENV["CROSSREF_QUERY_URL"] ||= "https://api.crossref.org"
ENV["TRUSTED_IP"] ||= "10.0.40.1"
ENV["SLACK_WEBHOOK_URL"] ||= ""
ENV["USER_AGENT"] ||= "Mozilla/5.0 (compatible; Maremma/#{Maremma::VERSION}; mailto:info@datacite.org)"
Expand Down

Large diffs are not rendered by default.

Large diffs are not rendered by default.

36 changes: 16 additions & 20 deletions spec/models/crossref_spec.rb
Expand Up @@ -60,28 +60,26 @@
it "returns a valid query URL with the given options" do
crossref = Crossref.new
query_url = crossref.get_query_url(from_date: from_date, until_date: until_date, rows: 10, cursor: "abc123")
expect(query_url).to include("source=crossref")
expect(query_url).to include("from-collected-date=#{from_date}")
expect(query_url).to include("until-collected-date=#{until_date}")
expect(query_url).to include("from-created-date=#{from_date}")
expect(query_url).to include("until-created-date=#{until_date}")
expect(query_url).to include("rows=10")
expect(query_url).to include("cursor=abc123")
end
end

describe "#queue_jobs" do
context "when there are DOIs to import" do
it "queues jobs and returns the total number of works queued" do
allow_any_instance_of(Crossref).to receive(:get_total).and_return([5, "next_cursor"])
allow_any_instance_of(Crossref).to receive(:process_data).and_return([5, "next_cursor"])
allow_any_instance_of(Crossref).to receive(:get_total).and_return(5)
allow_any_instance_of(Crossref).to receive(:process_data).and_return(5)

response = Crossref.new.queue_jobs(from_date: from_date, until_date: until_date)

expect(response).to eq(5)
end

it "sends a Slack notification when slack_webhook_url is present" do
allow_any_instance_of(Crossref).to receive(:get_total).and_return([1, "cursor"])
allow_any_instance_of(Crossref).to receive(:process_data).and_return([1, "cursor"])
allow_any_instance_of(Crossref).to receive(:get_total).and_return(1)
allow_any_instance_of(Crossref).to receive(:process_data).and_return(1)

allow(Rails.logger).to receive(:info)

Expand All @@ -96,7 +94,7 @@

context "when there are no DOIs to import" do
it "returns 0 and logs a message when there are no DOIs to import" do
allow_any_instance_of(Crossref).to receive(:get_total).and_return([0, nil])
allow_any_instance_of(Crossref).to receive(:get_total).and_return(0)

# Spy on Rails.logger
logger_spy = spy("logger")
Expand All @@ -119,22 +117,20 @@
allow(Rails.logger).to(receive(:info))

item = {
"id" => "example_id",
"action" => "example_action",
"subj_id" => "example_subj_id",
"obj_id" => "example_obj_id",
"relation_type_id" => "example_relation_type_id",
"source_id" => "example_source_id",
"source_token" => "example_source_token",
"occurred_at" => "2023-01-05T12:00:00Z",
"timestamp" => 1641379200,
"license" => "example_license",
"timestamp" => "2002-07-25T03:18:25Z",
"relation" => "example_relation_type",
"subject" => {
"id" => "example_subj_id"
},
"object" => {
"id" => "example_obj_id"
}
}

Crossref.push_item(item)

expect(Crossref).to(have_received(:send_event_import_message).once)
expect(Rails.logger).to(have_received(:info).with("[Event Data] example_subj_id example_relation_type_id example_obj_id sent to the events queue."))
expect(Rails.logger).to(have_received(:info).with("[Event Data] example_subj_id example_relation_type example_obj_id sent to the events queue."))
end
end
end
2 changes: 1 addition & 1 deletion spec/rails_helper.rb
Expand Up @@ -55,7 +55,7 @@ def fixture_path
c.filter_sensitive_data("<STAFF_ADMIN_TOKEN>") { ENV["STAFF_ADMIN_TOKEN"] }
c.filter_sensitive_data("<SLACK_WEBHOOK_URL>") { ENV["SLACK_WEBHOOK_URL"] }
c.configure_rspec_metadata!
c.default_cassette_options = { match_requests_on: %i[method uri] }
c.default_cassette_options = { record: vcr_mode, match_requests_on: %i[method uri] }
end

def capture_stdout
Expand Down