From 43446c1e235f3babcb18d124b43a3876676b69cc Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Mon, 3 Nov 2025 11:46:02 -0800
Subject: [PATCH 01/27] POC for deduplicating data into p_ci_job_infos

A POC for the new model p_ci_job_infos
which stores deduplicated intrinsic job
data.
---
 Gemfile.lock                                  |  4 +-
 app/finders/ci/build_name_finder.rb           |  1 +
 app/models/ci/bridge.rb                       |  3 +-
 app/models/ci/build.rb                        |  3 +-
 app/models/ci/job_definition.rb               |  2 +-
 app/models/ci/job_info.rb                     | 82 +++++++++++++++++++
 app/models/ci/processable.rb                  | 26 ++++++
 app/models/commit_status.rb                   |  2 +
 app/models/concerns/ci/metadatable.rb         | 44 ++++++++++
 .../concerns/ci/partitionable/testing.rb      |  1 +
 app/services/ci/clone_job_service.rb          |  1 +
 .../status_collection.rb                      |  1 +
 app/services/projects/update_pages_service.rb |  1 +
 .../json_schemas/ci_job_infos_config.json     |  5 ++
 .../wip/read_from_ci_job_infos.yml            | 10 +++
 ...riting_ci_job_info_to_old_destinations.yml | 10 +++
 .../wip/write_to_ci_job_infos.yml             | 10 +++
 config/gitlab_loose_foreign_keys.yml          |  4 +
 config/initializers/postgres_partitioning.rb  |  1 +
 db/docs/p_ci_job_infos.yml                    | 13 +++
 db/fixtures/development/14_pipelines.rb       |  1 +
 ...51031012621_create_p_ci_job_infos_table.rb | 33 ++++++++
 ...012831_create_p_ci_job_infos_partitions.rb | 33 ++++++++
 ...9_add_job_info_id_column_to_p_ci_builds.rb | 16 ++++
 ...04_add_index_on_p_ci_builds_job_info_id.rb | 22 +++++
 ...91450_add_fk_on_p_ci_builds_job_info_id.rb | 38 +++++++++
 db/schema_migrations/20251031012621           |  1 +
 db/schema_migrations/20251031012831           |  1 +
 db/schema_migrations/20251103182209           |  1 +
 db/schema_migrations/20251103190204           |  1 +
 db/schema_migrations/20251103191450           |  1 +
 db/structure.sql                              | 42 ++++++++++
 .../services/ee/ci/process_build_service.rb   |  1 +
 lib/gitlab/ci/job_infos/find_or_create.rb     | 59 +++++++++++++
 lib/gitlab/ci/pipeline/chain/create.rb        |  4 +
 .../ci/pipeline/create/job_info_builder.rb    | 42 ++++++++++
 spec/db/schema_spec.rb                        |  1 +
 spec/factories/ci/job_infos.rb                |  9 ++
 .../support/helpers/ci/job_factory_helpers.rb |  2 +
 spec/support/helpers/ci/job_helpers.rb        |  2 +
 40 files changed, 529 insertions(+), 5 deletions(-)
 create mode 100644 app/models/ci/job_info.rb
 create mode 100644 app/validators/json_schemas/ci_job_infos_config.json
 create mode 100644 config/feature_flags/wip/read_from_ci_job_infos.yml
 create mode 100644 config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
 create mode 100644 config/feature_flags/wip/write_to_ci_job_infos.yml
 create mode 100644 db/docs/p_ci_job_infos.yml
 create mode 100644 db/migrate/20251031012621_create_p_ci_job_infos_table.rb
 create mode 100644 db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
 create mode 100644 db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
 create mode 100644 db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
 create mode 100644 db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
 create mode 100644 db/schema_migrations/20251031012621
 create mode 100644 db/schema_migrations/20251031012831
 create mode 100644 db/schema_migrations/20251103182209
 create mode 100644 db/schema_migrations/20251103190204
 create mode 100644 db/schema_migrations/20251103191450
 create mode 100644 lib/gitlab/ci/job_infos/find_or_create.rb
 create mode 100644 lib/gitlab/ci/pipeline/create/job_info_builder.rb
 create mode 100644 spec/factories/ci/job_infos.rb

diff --git a/Gemfile.lock b/Gemfile.lock
index 46c2c77bbd132e..fc97abc4abb9cc 100644
--- a/Gemfile.lock
+++ b/Gemfile.lock
@@ -47,7 +47,7 @@ PATH
       concurrent-ruby (~> 1.1)
       faraday (~> 2)
       google-cloud-storage_transfer (~> 1.2.0)
-      google-protobuf (>= 3.25, < 5.0)
+      google-protobuf (~> 3.25, >= 3.25.3)
       googleauth (~> 1.14)
       grpc (~> 1.75)
       json (~> 2.7)
@@ -163,7 +163,7 @@ PATH
   remote: vendor/gems/gitlab-topology-service-client
   specs:
     gitlab-topology-service-client (0.1)
-      google-protobuf (>= 3.25, < 5.0)
+      google-protobuf (~> 3)
       grpc
 
 PATH
diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index 4e145ac0bc9060..f6c325f4595c3a 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -26,6 +26,7 @@ def limited_name_search_terms
 
     # rubocop: disable CodeReuse/ActiveRecord -- Need specialized queries for database optimizations
     def filter_by_name(build_relation)
+      # TODO: Update this query to use Ci::JobInfo
       build_name_relation = Ci::BuildName
         .where(project_id: project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
diff --git a/app/models/ci/bridge.rb b/app/models/ci/bridge.rb
index 04e5d7a3e54058..700a7e4641b101 100644
--- a/app/models/ci/bridge.rb
+++ b/app/models/ci/bridge.rb
@@ -103,7 +103,8 @@ def self.with_preloads
     def self.clone_accessors
       %i[pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
-        scheduling_type ci_stage partition_id resource_group].freeze
+        scheduling_type ci_stage partition_id resource_group
+        job_info_id].freeze
     end
 
     def retryable?
diff --git a/app/models/ci/build.rb b/app/models/ci/build.rb
index 1a430262f32748..a382f1e74a183c 100644
--- a/app/models/ci/build.rb
+++ b/app/models/ci/build.rb
@@ -286,7 +286,8 @@ def clone_accessors
           environment coverage_regex description tag_list protected
           needs_attributes job_variables_attributes resource_group
           scheduling_type timeout timeout_source debug_trace_enabled
-          ci_stage partition_id execution_config_id inputs_attributes].freeze
+          ci_stage partition_id execution_config_id inputs_attributes
+          job_info_id].freeze
       end
 
       def supported_keyset_orderings
diff --git a/app/models/ci/job_definition.rb b/app/models/ci/job_definition.rb
index c4a41b0bd27ee1..b3cc77352aedeb 100644
--- a/app/models/ci/job_definition.rb
+++ b/app/models/ci/job_definition.rb
@@ -3,7 +3,7 @@
 module Ci
   # The purpose of this class is to store immutable duplicate Processable related
   # data that can be disposed after all the pipelines that use it are archived.
-  # Data that should be persisted forever, should be stored with Ci::Build model.
+  # Data that must persist after archival should be stored with Ci::Build or Ci::JobInfo.
   class JobDefinition < Ci::ApplicationRecord
     include Ci::Partitionable
     include BulkInsertSafe
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
new file mode 100644
index 00000000000000..936bed46976752
--- /dev/null
+++ b/app/models/ci/job_info.rb
@@ -0,0 +1,82 @@
+# frozen_string_literal: true
+
+module Ci
+  # The purpose of this class is to store immutable, intrinsic duplicate job data
+  # that must persist even after all the pipelines that use it are archived.
+  # Data that can be disposed after archival should be stored with Ci::JobDefinition.
+  class JobInfo < Ci::ApplicationRecord
+    include Ci::Partitionable
+    include BulkInsertSafe
+
+    self.table_name = :p_ci_job_infos
+    self.primary_key = :id
+
+    ignore_column :search_vector, remove_never: true # Value is auto-generated by DB; must ignore it for bulk insert
+
+    # IMPORTANT: append new attributes at the end of this list. Do not change the order!
+    # Order is important for the checksum calculation.
+    CONFIG_ATTRIBUTES = [
+      :allow_failure,
+      :when,
+      :scheduling_type,
+      :stage_idx,
+      :name
+    ].freeze
+    NORMALIZED_DATA_COLUMNS = %i[stage_idx name].freeze
+
+    MAX_JOB_NAME_LENGTH = 255
+
+    query_constraints :id, :partition_id
+    partitionable scope: ->(_) { Ci::Pipeline.current_partition_value }, partitioned: true
+
+    belongs_to :project
+
+    validates :project, presence: true
+    validates :name, presence: true, length: { maximum: MAX_JOB_NAME_LENGTH }
+    # rubocop:disable Database/JsonbSizeLimit -- no updates
+    validates :config, json_schema: { filename: 'ci_job_infos_config' }
+    # rubocop:enable Database/JsonbSizeLimit
+
+    attribute :config, ::Gitlab::Database::Type::SymbolizedJsonb.new
+
+    scope :for_project, ->(project_id) { where(project_id: project_id) }
+    scope :for_checksum, ->(checksum) { where(checksum: checksum) }
+
+    def self.fabricate(config:, project_id:, partition_id:)
+      sanitized_config = normalize_and_sanitize(config)
+
+      # NOTE: Checksum is generated with all attributes including normalized columns. But when storing
+      # the data, we can save space by excluding the normalized column values from the config hash.
+      attrs = {
+        project_id: project_id,
+        partition_id: partition_id,
+        config: sanitized_config.except(*NORMALIZED_DATA_COLUMNS),
+        checksum: generate_checksum(sanitized_config),
+        created_at: Time.current,
+        **sanitized_config.slice(*NORMALIZED_DATA_COLUMNS)
+      }
+
+      new(attrs)
+    end
+
+    def self.normalize_and_sanitize(config)
+      data = config.symbolize_keys
+
+      NORMALIZED_DATA_COLUMNS.each do |col|
+        data[col] = data.fetch(col) { column_defaults[col.to_s] }
+      end
+
+      data.slice(*CONFIG_ATTRIBUTES)
+    end
+
+    def self.generate_checksum(config)
+      config
+        .then { |data| Gitlab::Json.dump(data) }
+        .then { |data| Digest::SHA256.hexdigest(data) }
+    end
+
+    def readonly?
+      persisted?
+    end
+  end
+end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 398f08f0ed3fe1..6acb38a0ba14af 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -14,6 +14,7 @@ class Processable < ::CommitStatus
     self.allow_legacy_sti_class = true
 
     attribute :temp_job_definition
+    attribute :temp_job_info
 
     has_one :resource, class_name: 'Ci::Resource', foreign_key: 'build_id', inverse_of: :processable
     has_one :sourced_pipeline, class_name: 'Ci::Sources::Pipeline', foreign_key: :source_job_id, inverse_of: :source_job
@@ -55,6 +56,13 @@ class Processable < ::CommitStatus
       inverse_of: :build,
       partition_foreign_key: :partition_id
 
+    # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
+    belongs_to :job_info,
+      ->(job) { in_partition(job) },
+      class_name: 'Ci::JobInfo',
+      partition_foreign_key: :partition_id
+    # rubocop: enable Rails/InverseOf
+
     accepts_nested_attributes_for :needs
     accepts_nested_attributes_for :job_definition_instance
 
@@ -159,6 +167,13 @@ class Processable < ::CommitStatus
     def self.fabricate(attrs)
       attrs = attrs.dup
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
+
+      info_attrs = if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
+                     attrs.extract!(*Ci::JobInfo::CONFIG_ATTRIBUTES)
+                   else
+                     attrs.slice(*Ci::JobInfo::CONFIG_ATTRIBUTES)
+                   end
+
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
 
       new(attrs).tap do |job|
@@ -169,6 +184,16 @@ def self.fabricate(attrs)
         )
 
         job.temp_job_definition = job_definition
+
+        next unless Feature.enabled?(:write_to_ci_job_infos, attrs[:project])
+
+        job_info = ::Ci::JobInfo.fabricate(
+          config: info_attrs,
+          project_id: job.project_id,
+          partition_id: job.partition_id
+        )
+
+        job.temp_job_info = job_info
       end
     end
 
@@ -188,6 +213,7 @@ def self.select_with_aggregated_needs(project)
     # so we need to ensure the data exists before using it.
     def self.populate_scheduling_type!
       needs = Ci::BuildNeed.scoped_build.select(1)
+      # TODO: Update this query to update Ci::JobInfo instead?
       where(scheduling_type: nil).update_all(
         "scheduling_type = CASE WHEN (EXISTS (#{needs.to_sql}))
          THEN #{scheduling_types[:dag]}
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 32efa5ac6644f9..14608b3acbf224 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -65,6 +65,7 @@ class CommitStatus < Ci::ApplicationRecord
   scope :latest, -> { where(retried: [false, nil]) }
   scope :retried, -> { where(retried: true) }
   scope :ordered, -> { order(:name) }
+  # TODO: Update scope to join with ci_job_infos; evaluate query performance with this change
   scope :ordered_by_stage, -> { order(stage_idx: :asc) }
   scope :latest_ordered, -> { latest.ordered.includes(project: :namespace) }
   scope :retried_ordered, -> { retried.order(name: :asc, id: :desc).includes(project: :namespace) }
@@ -206,6 +207,7 @@ class CommitStatus < Ci::ApplicationRecord
         .fabricate(commit_status, transition.args.first)
 
       commit_status.failure_reason = reason.failure_reason_enum
+      # BLOCKER: allow_failure appears to be mutated here
       commit_status.allow_failure = true if reason.force_allow_failure?
       # Windows exit codes can reach a max value of 32-bit unsigned integer
       # We only allow a smallint for exit_code in the db, hence the added limit of 32767
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 7fbf0671c985e0..3a017b0964c660 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -191,6 +191,30 @@ def secrets=(_value)
       raise ActiveRecord::ReadonlyAttributeError, 'This data is read only'
     end
 
+    def allow_failure
+      read_job_info_attribute(:allow_failure)
+    end
+
+    def allow_failure?
+      allow_failure.present?
+    end
+
+    def when
+      read_job_info_attribute(:when)
+    end
+
+    def scheduling_type
+      read_job_info_attribute(:scheduling_type)
+    end
+
+    def stage_idx
+      read_job_info_attribute(:stage_idx)
+    end
+
+    def name
+      read_job_info_attribute(:name)
+    end
+
     private
 
     def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, default_value = nil)
@@ -202,6 +226,26 @@ def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, defaul
 
       metadata&.read_attribute(metadata_key) || default_value
     end
+
+    def read_job_info_attribute(key, default_value: nil)
+      if read_from_ci_job_infos?
+        # TODO: Not really the nicest way to do this; refactor?
+        result = if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
+                   job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
+                 else
+                   job_info&.config&.dig(key) || temp_job_info&.config&.dig(key)
+                 end
+      end
+
+      return result if result
+
+      read_attribute(key) || default_value
+    end
+
+    def read_from_ci_job_infos?
+      Feature.enabled?(:read_from_ci_job_infos, project)
+    end
+    strong_memoize_attr :read_from_ci_job_infos?
   end
 end
 
diff --git a/app/models/concerns/ci/partitionable/testing.rb b/app/models/concerns/ci/partitionable/testing.rb
index f4bebd3071f399..b5655891b68b96 100644
--- a/app/models/concerns/ci/partitionable/testing.rb
+++ b/app/models/concerns/ci/partitionable/testing.rb
@@ -24,6 +24,7 @@ module Testing
         Ci::JobArtifactReport
         Ci::JobDefinition
         Ci::JobDefinitionInstance
+        Ci::JobInfo
         Ci::JobInput
         Ci::JobMessage
         Ci::JobVariable
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 9a3f6291e2c338..47a58877ca0e85 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -13,6 +13,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
       add_job_variables_attributes!(new_attributes, new_job_variables)
       add_job_inputs_attributes!(new_attributes, new_job_inputs)
       add_job_definition_attributes!(new_attributes)
+      # TODO: Need to update cloning to include Ci::JobInfo
 
       new_attributes[:user] = current_user
 
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
index 9a53c6d8fc1cd2..a892b03922e465 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
@@ -112,6 +112,7 @@ def all_jobs
           # This is more efficient than relying on PostgreSQL to calculate composite status for us
           #
           # Since we need to reprocess everything we can fetch all of them and do processing ourselves.
+          # TODO: We need to update this query to work with Ci::JobInfo
           strong_memoize(:all_jobs) do
             raw_jobs = pipeline
               .current_jobs
diff --git a/app/services/projects/update_pages_service.rb b/app/services/projects/update_pages_service.rb
index 7623841cb1d122..195516e2a8e527 100644
--- a/app/services/projects/update_pages_service.rb
+++ b/app/services/projects/update_pages_service.rb
@@ -56,6 +56,7 @@ def success
     def error(message)
       register_failure
       log_error("Projects::UpdatePagesService: #{message}")
+      # BLOCKER: allow_failure appears to be mutated here
       commit_status.allow_failure = !deployment_validations.latest_build?
       commit_status.description = message
       commit_status.drop(:script_failure)
diff --git a/app/validators/json_schemas/ci_job_infos_config.json b/app/validators/json_schemas/ci_job_infos_config.json
new file mode 100644
index 00000000000000..74356b1a27e5f2
--- /dev/null
+++ b/app/validators/json_schemas/ci_job_infos_config.json
@@ -0,0 +1,5 @@
+{
+  "$schema": "http://json-schema.org/draft-07/schema#",
+  "description": "CI job immutable intrinsic config data",
+  "type": "object"
+}
diff --git a/config/feature_flags/wip/read_from_ci_job_infos.yml b/config/feature_flags/wip/read_from_ci_job_infos.yml
new file mode 100644
index 00000000000000..bfa9d1b110ffe9
--- /dev/null
+++ b/config/feature_flags/wip/read_from_ci_job_infos.yml
@@ -0,0 +1,10 @@
+---
+name: read_from_ci_job_infos
+description:
+feature_issue_url:
+introduced_by_url:
+rollout_issue_url:
+milestone: '18.6'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml b/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
new file mode 100644
index 00000000000000..2bde8077d20335
--- /dev/null
+++ b/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
@@ -0,0 +1,10 @@
+---
+name: stop_writing_ci_job_info_to_old_destinations
+description:
+feature_issue_url:
+introduced_by_url:
+rollout_issue_url:
+milestone: '18.6'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/config/feature_flags/wip/write_to_ci_job_infos.yml b/config/feature_flags/wip/write_to_ci_job_infos.yml
new file mode 100644
index 00000000000000..b45a0f86fe75fa
--- /dev/null
+++ b/config/feature_flags/wip/write_to_ci_job_infos.yml
@@ -0,0 +1,10 @@
+---
+name: write_to_ci_job_infos
+description:
+feature_issue_url:
+introduced_by_url:
+rollout_issue_url:
+milestone: '18.6'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/config/gitlab_loose_foreign_keys.yml b/config/gitlab_loose_foreign_keys.yml
index faa24f1e2723a3..5e128df843ac20 100644
--- a/config/gitlab_loose_foreign_keys.yml
+++ b/config/gitlab_loose_foreign_keys.yml
@@ -631,6 +631,10 @@ p_ci_job_definitions:
   - table: projects
     column: project_id
     on_delete: async_delete
+p_ci_job_infos:
+  - table: projects
+    column: project_id
+    on_delete: async_delete
 p_ci_job_inputs:
   - table: projects
     column: project_id
diff --git a/config/initializers/postgres_partitioning.rb b/config/initializers/postgres_partitioning.rb
index a7fd1002fc0606..83511cf8e58bbb 100644
--- a/config/initializers/postgres_partitioning.rb
+++ b/config/initializers/postgres_partitioning.rb
@@ -31,6 +31,7 @@
       Ci::JobArtifactReport,
       Ci::JobDefinition,
       Ci::JobDefinitionInstance,
+      Ci::JobInfo,
       Ci::JobInput,
       Ci::JobMessage,
       Ci::Pipeline,
diff --git a/db/docs/p_ci_job_infos.yml b/db/docs/p_ci_job_infos.yml
new file mode 100644
index 00000000000000..f6884b015bbb47
--- /dev/null
+++ b/db/docs/p_ci_job_infos.yml
@@ -0,0 +1,13 @@
+---
+table_name: p_ci_job_infos
+classes:
+- Ci::JobInfo
+feature_categories:
+- continuous_integration
+description: Unique intrinsic job data across pipelines
+introduced_by_url:
+milestone: '18.6'
+gitlab_schema: gitlab_ci
+sharding_key:
+  project_id: projects
+table_size: small
diff --git a/db/fixtures/development/14_pipelines.rb b/db/fixtures/development/14_pipelines.rb
index 58c7567a5e29f2..a65dc4b049dab7 100644
--- a/db/fixtures/development/14_pipelines.rb
+++ b/db/fixtures/development/14_pipelines.rb
@@ -193,6 +193,7 @@ def create_pipeline!(project, ref, commit)
     project.ci_pipelines.create!(sha: commit.id, ref: ref, source: :push)
   end
 
+  # TODO: We need to create fixtures for Ci::JobInfo too
   def build_create!(pipeline, stage, opts = {})
     attributes = job_attributes(pipeline, stage, opts)
     attributes[:options] ||= {}
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
new file mode 100644
index 00000000000000..653ad93a7d30f4
--- /dev/null
+++ b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
@@ -0,0 +1,33 @@
+# frozen_string_literal: true
+
+class CreatePCiJobInfosTable < Gitlab::Database::Migration[2.3]
+  milestone '18.6'
+
+  def change
+    opts = {
+      primary_key: [:id, :partition_id],
+      options: 'PARTITION BY LIST (partition_id)'
+    }
+
+    create_table(:p_ci_job_infos, **opts) do |t|
+      t.bigserial :id, null: false
+      t.bigint :partition_id, null: false
+      t.bigint :project_id, null: false
+      t.datetime_with_timezone :created_at, null: false
+      t.integer :stage_idx, limit: 2
+      t.binary :checksum, null: false
+      t.tsvector :search_vector, as: "to_tsvector('english'::regconfig, COALESCE(name, ''::text))", stored: true
+      t.text :name, limit: 255, null: false
+      t.jsonb :config, default: {}, null: false
+
+      t.index [:project_id, :checksum, :partition_id], unique: true,
+        name: :index_p_ci_job_infos_on_project_id_and_checksum
+      t.index [:project_id, :stage_idx], include: [:id],
+        name: :index_p_ci_job_infos_on_project_id_and_stage_idx
+      t.index [:project_id, :name], include: [:id],
+        name: :index_p_ci_job_infos_on_project_id_and_name
+      t.index [:search_vector], using: :gin,
+        name: :index_p_ci_job_infos_on_search_vector
+    end
+  end
+end
diff --git a/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb b/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
new file mode 100644
index 00000000000000..3617cf09fc9b30
--- /dev/null
+++ b/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
@@ -0,0 +1,33 @@
+# frozen_string_literal: true
+
+class CreatePCiJobInfosPartitions < Gitlab::Database::Migration[2.3]
+  milestone '18.6'
+
+  disable_ddl_transaction!
+
+  def up
+    sql = (100..108).map do |partition_id|
+      <<~SQL
+      CREATE TABLE IF NOT EXISTS gitlab_partitions_dynamic.ci_job_infos_#{partition_id}
+        PARTITION OF p_ci_job_infos
+        FOR VALUES IN (#{partition_id});
+      SQL
+    end.join
+
+    with_lock_retries do
+      connection.execute(sql)
+    end
+  end
+
+  def down
+    sql = (100..108).map do |partition_id|
+      <<~SQL
+      DROP TABLE IF EXISTS gitlab_partitions_dynamic.ci_job_infos_#{partition_id};
+      SQL
+    end.join
+
+    with_lock_retries do
+      connection.execute(sql)
+    end
+  end
+end
diff --git a/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb b/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
new file mode 100644
index 00000000000000..ad207d4f316f2e
--- /dev/null
+++ b/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
@@ -0,0 +1,16 @@
+# frozen_string_literal: true
+
+class AddJobInfoIdColumnToPCiBuilds < Gitlab::Database::Migration[2.3]
+  milestone '18.6'
+
+  # rubocop:disable Migration/PreventAddingColumns -- Required to deduplicate data into ci_job_infos table
+  def up
+    # TODO: Should be changed into a non-nullable column later
+    add_column :p_ci_builds, :job_info_id, :bigint, if_not_exists: true
+  end
+
+  def down
+    remove_column :p_ci_builds, :job_info_id, if_exists: true
+  end
+  # rubocop:enable Migration/PreventAddingColumns
+end
diff --git a/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
new file mode 100644
index 00000000000000..9356d3201667f7
--- /dev/null
+++ b/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
@@ -0,0 +1,22 @@
+# frozen_string_literal: true
+
+# TODO: This index should first be added asynchronously on Production
+class AddIndexOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
+  include Gitlab::Database::PartitioningMigrationHelpers
+
+  milestone '18.6'
+
+  disable_ddl_transaction!
+
+  PARTITIONED_INDEX_NAME = 'index_p_ci_builds_on_job_info_id'
+
+  # rubocop: disable Migration/PreventIndexCreation -- Required to deduplicate data into ci_job_infos table
+  def up
+    add_concurrent_partitioned_index :p_ci_builds, :job_info_id, name: PARTITIONED_INDEX_NAME
+  end
+
+  def down
+    remove_concurrent_partitioned_index_by_name :p_ci_builds, PARTITIONED_INDEX_NAME
+  end
+  # rubocop: enable Migration/PreventIndexCreation
+end
diff --git a/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
new file mode 100644
index 00000000000000..94bc6dc013ecc8
--- /dev/null
+++ b/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
@@ -0,0 +1,38 @@
+# frozen_string_literal: true
+
+class AddFkOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
+  include Gitlab::Database::PartitioningMigrationHelpers
+
+  milestone '18.6'
+
+  disable_ddl_transaction!
+
+  SOURCE_TABLE_NAME = :p_ci_builds
+  TARGET_TABLE_NAME = :p_ci_job_infos
+  FK_NAME = :fk_rails_2f23ec1c61
+
+  # rubocop: disable Migration/PreventForeignKeyCreation -- Required to deduplicate data into ci_job_infos table
+  def up
+    add_concurrent_partitioned_foreign_key(
+      SOURCE_TABLE_NAME, TARGET_TABLE_NAME,
+      column: [:partition_id, :job_info_id],
+      target_column: [:partition_id, :id],
+      on_update: :restrict,
+      on_delete: :restrict,
+      reverse_lock_order: true,
+      name: FK_NAME
+    )
+  end
+
+  def down
+    with_lock_retries do
+      remove_foreign_key_if_exists(
+        SOURCE_TABLE_NAME,
+        TARGET_TABLE_NAME,
+        reverse_lock_order: true,
+        name: FK_NAME
+      )
+    end
+  end
+  # rubocop: enable Migration/PreventForeignKeyCreation
+end
diff --git a/db/schema_migrations/20251031012621 b/db/schema_migrations/20251031012621
new file mode 100644
index 00000000000000..399047a9b10fae
--- /dev/null
+++ b/db/schema_migrations/20251031012621
@@ -0,0 +1 @@
+af4c3926aebf394a62080b9a0be3c7447e8a48513efede46ca4e3812dd1cc776
\ No newline at end of file
diff --git a/db/schema_migrations/20251031012831 b/db/schema_migrations/20251031012831
new file mode 100644
index 00000000000000..a30007e277daec
--- /dev/null
+++ b/db/schema_migrations/20251031012831
@@ -0,0 +1 @@
+2f137baba28ea4604fc626f49ad58de7e85fb47142294b352c1f05b8642af143
\ No newline at end of file
diff --git a/db/schema_migrations/20251103182209 b/db/schema_migrations/20251103182209
new file mode 100644
index 00000000000000..78b14684cd97bd
--- /dev/null
+++ b/db/schema_migrations/20251103182209
@@ -0,0 +1 @@
+1806d088d027cafbb0ae3901752577aa8b5a5ca8725a02f16c72919d9a4e19e1
\ No newline at end of file
diff --git a/db/schema_migrations/20251103190204 b/db/schema_migrations/20251103190204
new file mode 100644
index 00000000000000..117dae5f3cf819
--- /dev/null
+++ b/db/schema_migrations/20251103190204
@@ -0,0 +1 @@
+57f15544e4d1f34c4562662ede1472d423bfe4f43b7f7d299b14b90580ba6d33
\ No newline at end of file
diff --git a/db/schema_migrations/20251103191450 b/db/schema_migrations/20251103191450
new file mode 100644
index 00000000000000..3ab4ba04be64db
--- /dev/null
+++ b/db/schema_migrations/20251103191450
@@ -0,0 +1 @@
+5e263650118c9ea701d737a991d50953910ba0108508598b0d24341e074de02a
\ No newline at end of file
diff --git a/db/structure.sql b/db/structure.sql
index 6746648605376e..20c5357dd76388 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5684,6 +5684,7 @@ CREATE TABLE p_ci_builds (
     timeout_source smallint,
     exit_code smallint,
     debug_trace_enabled boolean,
+    job_info_id bigint,
     CONSTRAINT check_1e2fbd1b39 CHECK ((lock_version IS NOT NULL)),
     CONSTRAINT check_9aa9432137 CHECK ((project_id IS NOT NULL))
 )
@@ -22523,6 +22524,29 @@ CREATE SEQUENCE p_ci_job_definitions_id_seq
 
 ALTER SEQUENCE p_ci_job_definitions_id_seq OWNED BY p_ci_job_definitions.id;
 
+CREATE TABLE p_ci_job_infos (
+    id bigint NOT NULL,
+    partition_id bigint NOT NULL,
+    project_id bigint NOT NULL,
+    created_at timestamp with time zone NOT NULL,
+    stage_idx smallint,
+    checksum bytea NOT NULL,
+    search_vector tsvector GENERATED ALWAYS AS (to_tsvector('english'::regconfig, COALESCE(name, ''::text))) STORED,
+    name text NOT NULL,
+    config jsonb DEFAULT '{}'::jsonb NOT NULL,
+    CONSTRAINT check_85f37f6053 CHECK ((char_length(name) <= 255))
+)
+PARTITION BY LIST (partition_id);
+
+CREATE SEQUENCE p_ci_job_infos_id_seq
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+ALTER SEQUENCE p_ci_job_infos_id_seq OWNED BY p_ci_job_infos.id;
+
 CREATE SEQUENCE p_ci_job_inputs_id_seq
     START WITH 1
     INCREMENT BY 1
@@ -32864,6 +32888,8 @@ ALTER TABLE ONLY p_ci_builds_metadata ALTER COLUMN id SET DEFAULT nextval('ci_bu
 
 ALTER TABLE ONLY p_ci_job_definitions ALTER COLUMN id SET DEFAULT nextval('p_ci_job_definitions_id_seq'::regclass);
 
+ALTER TABLE ONLY p_ci_job_infos ALTER COLUMN id SET DEFAULT nextval('p_ci_job_infos_id_seq'::regclass);
+
 ALTER TABLE ONLY p_ci_job_inputs ALTER COLUMN id SET DEFAULT nextval('p_ci_job_inputs_id_seq'::regclass);
 
 ALTER TABLE ONLY p_ci_job_messages ALTER COLUMN id SET DEFAULT nextval('p_ci_job_messages_id_seq'::regclass);
@@ -36359,6 +36385,9 @@ ALTER TABLE ONLY p_ci_job_definition_instances
 ALTER TABLE ONLY p_ci_job_definitions
     ADD CONSTRAINT p_ci_job_definitions_pkey PRIMARY KEY (id, partition_id);
 
+ALTER TABLE ONLY p_ci_job_infos
+    ADD CONSTRAINT p_ci_job_infos_pkey PRIMARY KEY (id, partition_id);
+
 ALTER TABLE ONLY p_ci_job_inputs
     ADD CONSTRAINT p_ci_job_inputs_pkey PRIMARY KEY (id, partition_id);
 
@@ -43315,6 +43344,8 @@ CREATE INDEX index_p_ci_builds_execution_configs_on_project_id ON ONLY p_ci_buil
 
 CREATE INDEX index_p_ci_builds_on_execution_config_id ON ONLY p_ci_builds USING btree (execution_config_id) WHERE (execution_config_id IS NOT NULL);
 
+CREATE INDEX index_p_ci_builds_on_job_info_id ON ONLY p_ci_builds USING btree (job_info_id);
+
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_finished_at ON ONLY p_ci_finished_build_ch_sync_events USING btree (partition, build_finished_at);
 
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_on_project_id ON ONLY p_ci_finished_build_ch_sync_events USING btree (project_id);
@@ -43335,6 +43366,14 @@ CREATE INDEX index_p_ci_job_definitions_on_interruptible ON ONLY p_ci_job_defini
 
 CREATE UNIQUE INDEX index_p_ci_job_definitions_on_project_id_and_checksum ON ONLY p_ci_job_definitions USING btree (project_id, checksum, partition_id);
 
+CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
+
+CREATE INDEX index_p_ci_job_infos_on_project_id_and_name ON ONLY p_ci_job_infos USING btree (project_id, name) INCLUDE (id);
+
+CREATE INDEX index_p_ci_job_infos_on_project_id_and_stage_idx ON ONLY p_ci_job_infos USING btree (project_id, stage_idx) INCLUDE (id);
+
+CREATE INDEX index_p_ci_job_infos_on_search_vector ON ONLY p_ci_job_infos USING gin (search_vector);
+
 CREATE UNIQUE INDEX index_p_ci_job_inputs_on_job_id_and_name ON ONLY p_ci_job_inputs USING btree (job_id, name, partition_id);
 
 CREATE INDEX index_p_ci_job_inputs_on_project_id ON ONLY p_ci_job_inputs USING btree (project_id);
@@ -52905,6 +52944,9 @@ ALTER TABLE ONLY onboarding_progresses
 ALTER TABLE ONLY protected_branch_unprotect_access_levels
     ADD CONSTRAINT fk_rails_2d2aba21ef FOREIGN KEY (user_id) REFERENCES users(id) ON DELETE CASCADE;
 
+ALTER TABLE p_ci_builds
+    ADD CONSTRAINT fk_rails_2f23ec1c61 FOREIGN KEY (partition_id, job_info_id) REFERENCES p_ci_job_infos(partition_id, id) ON UPDATE RESTRICT ON DELETE RESTRICT;
+
 ALTER TABLE ONLY issuable_severities
     ADD CONSTRAINT fk_rails_2fbb74ad6d FOREIGN KEY (issue_id) REFERENCES issues(id) ON DELETE CASCADE;
 
diff --git a/ee/app/services/ee/ci/process_build_service.rb b/ee/app/services/ee/ci/process_build_service.rb
index 5a7120b2a06a1d..f1f87602e95123 100644
--- a/ee/app/services/ee/ci/process_build_service.rb
+++ b/ee/app/services/ee/ci/process_build_service.rb
@@ -10,6 +10,7 @@ def process(processable)
         if should_block_processable?(processable)
           # To populate the deployment job as manually executable (i.e. `Ci::Build#playable?`),
           # we have to set `manual` to `ci_builds.when` as well as `ci_builds.status`.
+          # BLOCKER: `when` appears to be mutated here
           processable.when = 'manual'
           return processable.actionize!
         end
diff --git a/lib/gitlab/ci/job_infos/find_or_create.rb b/lib/gitlab/ci/job_infos/find_or_create.rb
new file mode 100644
index 00000000000000..cb7db7330013a2
--- /dev/null
+++ b/lib/gitlab/ci/job_infos/find_or_create.rb
@@ -0,0 +1,59 @@
+# frozen_string_literal: true
+
+module Gitlab
+  module Ci
+    module JobInfos
+      # TODO: This class mirrors Ci::JobDefinitions::FindOrCreate;
+      # maybe they can be combined into a single implementation class
+      class FindOrCreate
+        BATCH_SIZE = 50
+
+        def initialize(pipeline, infos: [])
+          @project_id = pipeline.project_id
+          @partition_id = pipeline.partition_id
+          @job_infos = Array.wrap(infos).uniq(&:checksum)
+        end
+
+        def execute
+          return [] if job_infos.empty?
+
+          existing_infos = fetch_records_for(job_infos)
+          existing_infos_by_checksum = existing_infos.group_by(&:checksum)
+          missing_infos = @job_infos.reject do |d|
+            existing_infos_by_checksum[d.checksum]
+          end
+
+          return existing_infos if missing_infos.empty?
+
+          insert_missing(missing_infos)
+
+          existing_infos + fetch_records_for(missing_infos)
+        end
+
+        private
+
+        attr_reader :project_id, :partition_id, :job_infos
+
+        def fetch_records_for(infos)
+          checksums = infos.map(&:checksum)
+
+          ::Ci::JobInfo
+            .select(:id, :partition_id, :project_id, :checksum, *::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
+            .in_partition(partition_id)
+            .for_project(project_id)
+            .for_checksum(checksums)
+            .to_a # Explicitly convert to array for further processing
+        end
+
+        def insert_missing(infos)
+          ::Ci::JobInfo.bulk_insert!(
+            infos,
+            unique_by: [:project_id, :partition_id, :checksum],
+            skip_duplicates: true,
+            batch_size: BATCH_SIZE
+          )
+        end
+      end
+    end
+  end
+end
diff --git a/lib/gitlab/ci/pipeline/chain/create.rb b/lib/gitlab/ci/pipeline/chain/create.rb
index ea8c5b25dde5b3..d8a9964e07920e 100644
--- a/lib/gitlab/ci/pipeline/chain/create.rb
+++ b/lib/gitlab/ci/pipeline/chain/create.rb
@@ -14,6 +14,10 @@ def perform!
               # reason because they can be used in the next pipeline creations.
               ::Gitlab::Ci::Pipeline::Create::JobDefinitionBuilder.new(pipeline, statuses).run
 
+              if Feature.enabled?(:write_to_ci_job_infos, project)
+                ::Gitlab::Ci::Pipeline::Create::JobInfoBuilder.new(pipeline, statuses).run
+              end
+
               BulkInsertableAssociations.with_bulk_insert do
                 ::Ci::BulkInsertableTags.with_bulk_insert_tags do
                   pipeline.transaction do
diff --git a/lib/gitlab/ci/pipeline/create/job_info_builder.rb b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
new file mode 100644
index 00000000000000..5fcf189baff149
--- /dev/null
+++ b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
@@ -0,0 +1,42 @@
+# frozen_string_literal: true
+
+module Gitlab
+  module Ci
+    module Pipeline
+      module Create
+        class JobInfoBuilder
+          include Gitlab::Utils::StrongMemoize
+
+          def initialize(pipeline, jobs)
+            @pipeline = pipeline
+            @jobs = jobs.select(&:temp_job_info)
+            @project = pipeline.project
+          end
+
+          def run
+            find_or_insert_job_infos.each do |job_info|
+              jobs_by_checksum[job_info.checksum].each do |job|
+                job.job_info = job_info
+              end
+            end
+          end
+
+          private
+
+          attr_reader :project, :pipeline, :jobs
+
+          def find_or_insert_job_infos
+            Gitlab::Ci::JobInfos::FindOrCreate.new(pipeline, infos: jobs.map(&:temp_job_info)).execute
+          end
+
+          def jobs_by_checksum
+            jobs.group_by do |job|
+              job.temp_job_info.checksum
+            end
+          end
+          strong_memoize_attr :jobs_by_checksum
+        end
+      end
+    end
+  end
+end
diff --git a/spec/db/schema_spec.rb b/spec/db/schema_spec.rb
index 6a231a38f81095..e274a854bc8c7f 100644
--- a/spec/db/schema_spec.rb
+++ b/spec/db/schema_spec.rb
@@ -155,6 +155,7 @@
       p_ci_job_annotations: %w[project_id],
       p_ci_job_artifacts: %w[project_id],
       p_ci_job_definitions: %w[partition_id],
+      p_ci_job_infos: %w[partition_id],
       p_ci_pipeline_artifact_states: %w[partition_id pipeline_artifact_id],
       p_ci_pipeline_variables: %w[project_id],
       p_ci_pipelines_config: %w[partition_id project_id],
diff --git a/spec/factories/ci/job_infos.rb b/spec/factories/ci/job_infos.rb
new file mode 100644
index 00000000000000..8843ba6688a6d2
--- /dev/null
+++ b/spec/factories/ci/job_infos.rb
@@ -0,0 +1,9 @@
+# frozen_string_literal: true
+
+FactoryBot.define do
+  factory :ci_job_info, class: 'Ci::JobInfo' do
+    project factory: :project
+
+    checksum { Digest::SHA256.hexdigest(rand.to_s) }
+  end
+end
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index 8b948e7e0992eb..2a66cb6da11bf3 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -2,6 +2,8 @@
 
 module Ci
   module JobFactoryHelpers
+    # TODO: We need to create a mutator for Ci::JobInfo too. Maybe we can
+    # combine it with this helper and call it `mutate_temp_job_config`?
     # Temp job definitions should not change in normal operation;
     # only use this method as a helper in factory definitions.
     def self.mutate_temp_job_definition(job, **new_config)
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 94544c884a5f65..d109398b5ee440 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -2,6 +2,8 @@
 
 module Ci
   module JobHelpers
+    # TODO: We need to create a stub helper for Ci::JobInfo too. Maybe we
+    # can combine it with this helper and call it `stub_ci_job_config`.
     def stub_ci_job_definition(job, **new_config)
       new_config.symbolize_keys!
       unknown_keys = new_config.keys - Ci::JobDefinition::CONFIG_ATTRIBUTES
-- 
GitLab


From e14a96382c5e984d8666a5d90eb54eeca5898018 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 5 Nov 2025 11:46:10 -0800
Subject: [PATCH 02/27] Add job name helpers for rspec

Add helper to find job by name
or pluck job names, for rspec tests.
---
 ...91450_add_fk_on_p_ci_builds_job_info_id.rb |  1 +
 lib/gitlab/ci/job_infos/find_or_create.rb     |  2 +-
 .../ci/create_pipeline_service_spec.rb        | 48 ++++++++-----------
 spec/support/helpers/ci/job_helpers.rb        | 16 +++++++
 4 files changed, 37 insertions(+), 30 deletions(-)

diff --git a/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
index 94bc6dc013ecc8..e7333992b1707a 100644
--- a/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
+++ b/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
@@ -1,5 +1,6 @@
 # frozen_string_literal: true
 
+# TODO: This FK should first be added asynchronously on Production
 class AddFkOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
   include Gitlab::Database::PartitioningMigrationHelpers
 
diff --git a/lib/gitlab/ci/job_infos/find_or_create.rb b/lib/gitlab/ci/job_infos/find_or_create.rb
index cb7db7330013a2..9ecaf45cd43ed6 100644
--- a/lib/gitlab/ci/job_infos/find_or_create.rb
+++ b/lib/gitlab/ci/job_infos/find_or_create.rb
@@ -38,7 +38,7 @@ def fetch_records_for(infos)
           checksums = infos.map(&:checksum)
 
           ::Ci::JobInfo
-            .select(:id, :partition_id, :project_id, :checksum, *::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
+            .select(:id, :partition_id, :project_id, :checksum, :config, *::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
             .in_partition(partition_id)
             .for_project(project_id)
             .for_checksum(checksums)
diff --git a/spec/services/ci/create_pipeline_service_spec.rb b/spec/services/ci/create_pipeline_service_spec.rb
index d30f93af368ac2..002745c963021f 100644
--- a/spec/services/ci/create_pipeline_service_spec.rb
+++ b/spec/services/ci/create_pipeline_service_spec.rb
@@ -231,7 +231,7 @@ def execute_service(
             it 'is not cancelable' do
               pipeline = execute_service.payload
 
-              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_falsy
+              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_falsy
             end
           end
 
@@ -244,7 +244,7 @@ def execute_service(
             it 'is cancelable' do
               pipeline = execute_service.payload
 
-              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_truthy
+              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_truthy
             end
           end
 
@@ -257,7 +257,7 @@ def execute_service(
             it 'is not cancelable' do
               pipeline = execute_service.payload
 
-              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_falsy
+              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_falsy
             end
           end
         end
@@ -305,7 +305,8 @@ def execute_service(
               pipeline_on_previous_commit
                 .builds
                 .joins(:job_definition)
-                .pluck(:name, "#{Ci::JobDefinition.quoted_table_name}.interruptible")
+                .joins(:job_info)
+                .pluck('ci_job_infos.name', "#{Ci::JobDefinition.quoted_table_name}.interruptible")
 
             expect(interruptible_status).to contain_exactly(
               ['build_1_1', true],
@@ -319,10 +320,7 @@ def execute_service(
           context 'when only interruptible builds are running' do
             context 'when build marked explicitly by interruptible is running' do
               it 'cancels running outdated pipelines', :sidekiq_inline do
-                pipeline_on_previous_commit
-                  .builds
-                  .find_by_name('build_1_2')
-                  .run!
+                find_job_by_name(pipeline_on_previous_commit.builds, 'build_1_2').run!
 
                 pipeline
 
@@ -333,8 +331,7 @@ def execute_service(
 
             context 'when build that is not marked as interruptible is running' do
               it 'cancels running outdated pipelines', :sidekiq_inline do
-                build_2_1 = pipeline_on_previous_commit
-                  .builds.find_by_name('build_2_1')
+                build_2_1 = find_job_by_name(pipeline_on_previous_commit.builds, 'build_2_1')
 
                 build_2_1.enqueue!
                 build_2_1.reset.run!
@@ -349,8 +346,7 @@ def execute_service(
 
           context 'when an uninterruptible build is running' do
             it 'does not cancel running outdated pipelines', :sidekiq_inline do
-              build_3_1 = pipeline_on_previous_commit
-                .builds.find_by_name('build_3_1')
+              build_3_1 = find_job_by_name(pipeline_on_previous_commit.builds, 'build_3_1')
 
               build_3_1.enqueue!
               build_3_1.reset.run!
@@ -366,10 +362,7 @@ def execute_service(
             it 'cancels running outdated pipelines', :sidekiq_might_not_need_inline do
               allow(Ci::BuildScheduleWorker).to receive(:perform_at)
 
-              pipeline_on_previous_commit
-                .builds
-                .find_by_name('build_2_1')
-                .schedule!
+              find_job_by_name(pipeline_on_previous_commit.builds, 'build_2_1').schedule!
 
               pipeline
 
@@ -380,10 +373,7 @@ def execute_service(
 
           context 'when a uninterruptible build has finished' do
             it 'does not cancel running outdated pipelines', :sidekiq_might_not_need_inline do
-              pipeline_on_previous_commit
-                .builds
-                .find_by_name('build_3_1')
-                .success!
+              find_job_by_name(pipeline_on_previous_commit.builds, 'build_3_1').success!
 
               pipeline
 
@@ -759,7 +749,7 @@ def previous_commit_sha_from_ref(ref)
 
     context 'when builds with auto-retries are configured' do
       let(:pipeline)  { execute_service.payload }
-      let(:rspec_job) { pipeline.builds.find_by(name: 'rspec') }
+      let(:rspec_job) { find_job_by_name(pipeline.builds, 'rspec') }
 
       before do
         stub_ci_pipeline_yaml_file(YAML.dump({
@@ -799,7 +789,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'persists the association correctly' do
           result = execute_service.payload
-          deploy_job = result.builds.find_by_name!(:test)
+          deploy_job = find_job_by_name(result.builds, :test)
           resource_group = project.resource_groups.find_by_key!(resource_group_key)
 
           expect(result).to be_persisted
@@ -854,8 +844,8 @@ def previous_commit_sha_from_ref(ref)
 
       it 'persists the association correctly' do
         result = execute_service.payload
-        deploy_job = result.builds.find_by_name!(:review_app)
-        stop_job = result.builds.find_by_name!(:stop_review_app)
+        deploy_job = find_job_by_name(result.builds, :review_app)
+        stop_job = find_job_by_name(result.builds, :stop_review_app)
 
         expect(result).to be_persisted
         expect(deploy_job.resource_group.key).to eq('review/master')
@@ -890,7 +880,7 @@ def previous_commit_sha_from_ref(ref)
           pipeline = execute_service.payload
 
           expect(pipeline).to be_persisted
-          expect(pipeline.builds.find_by(name: 'rspec').options[:job_timeout]).to eq 123
+          expect(find_job_by_name(pipeline.builds, 'rspec').options[:job_timeout]).to eq 123
         end
       end
     end
@@ -1411,7 +1401,7 @@ def previous_commit_sha_from_ref(ref)
               expect(pipeline).to be_persisted
               expect(pipeline).to be_merge_request_event
               expect(pipeline.merge_request).to eq(merge_request)
-              expect(pipeline.builds.order(:stage_id).pluck(:name)).to eq(%w[test])
+              expect(pluck_job_names(pipeline.builds.order(:stage_id))).to eq(%w[test])
             end
 
             it 'persists the specified source sha' do
@@ -1645,7 +1635,7 @@ def previous_commit_sha_from_ref(ref)
             expect(pipeline).to be_persisted
             expect(pipeline).to be_web
             expect(pipeline.merge_request).to be_nil
-            expect(pipeline.builds.order(:stage_id).pluck(:name)).to eq(%w[build pages])
+            expect(pluck_job_names(pipeline.builds.order(:stage_id))).to eq(%w[build pages])
           end
         end
       end
@@ -1685,7 +1675,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'creates a pipeline with build_a and test_a' do
           expect(pipeline).to be_persisted
-          expect(pipeline.builds.pluck(:name)).to contain_exactly("build_a", "test_a")
+          expect(pluck_job_names(pipeline.builds)).to contain_exactly("build_a", "test_a")
         end
 
         it 'bulk inserts all needs' do
@@ -1742,7 +1732,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'does create a pipeline only with deploy' do
           expect(pipeline).to be_persisted
-          expect(pipeline.builds.pluck(:name)).to contain_exactly("deploy")
+          expect(pluck_job_names(pipeline.builds)).to contain_exactly("deploy")
         end
       end
     end
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index d109398b5ee440..7c6cb36b562290 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -29,5 +29,21 @@ def stub_ci_job_definition(job, **new_config)
 
       allow(job).to receive(:job_definition).and_return(new_job_definition)
     end
+
+    def find_job_by_name(jobs, name)
+      if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project)
+        jobs.joins(:job_info).find_by(job_info: { name: name })
+      else
+        jobs.find_by(name: name)
+      end
+    end
+
+    def pluck_job_names(jobs)
+      if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project)
+        jobs.joins(:job_info).pluck('p_ci_job_infos.name')
+      else
+        jobs.pluck(:name)
+      end
+    end
   end
 end
-- 
GitLab


From 2d0893e37035644ea7d68161271bd69ce5a4aee2 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 5 Nov 2025 15:40:48 -0800
Subject: [PATCH 03/27] Update queries related to p_ci_build_names

Update queries related to p_ci_build_names
so they're compatible with the new ci_job_infos
table.
---
 app/finders/ci/build_name_finder.rb           | 19 ++++++++++--
 app/models/ci/job_info.rb                     |  1 +
 app/services/ci/update_build_names_service.rb | 29 ++++++++++++++++---
 app/workers/ci/update_build_names_worker.rb   |  1 +
 .../workers/ci/cleanup_build_name_worker.rb   |  1 +
 .../ci/create_pipeline_service_spec.rb        |  2 +-
 6 files changed, 46 insertions(+), 7 deletions(-)

diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index f6c325f4595c3a..7d9e214cce0672 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -26,12 +26,27 @@ def limited_name_search_terms
 
     # rubocop: disable CodeReuse/ActiveRecord -- Need specialized queries for database optimizations
     def filter_by_name(build_relation)
-      # TODO: Update this query to use Ci::JobInfo
       build_name_relation = Ci::BuildName
         .where(project_id: project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
-      build_relation.where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+      if Feature.disabled?(:read_from_ci_job_infos, project)
+        return build_relation.where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+      end
+
+      job_info_relation = Ci::JobInfo
+        .where(project_id: project.id)
+        .pg_full_text_search_in_model(limited_name_search_terms)
+
+      # NOTE: This query would be much more efficient on ci_job_infos alone.
+      # Unfortunately we have to support it for old jobs until we migrate name data to ci_job_infos.
+      # TODO: We should evaluate alternative query structures/approaches that may be more efficient.
+      build_relation
+        .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+        .or(
+          build_relation
+            .where("(job_info_id, partition_id) IN (?)", job_info_relation.select(:id, :partition_id))
+        )
     end
     # rubocop: enable CodeReuse/ActiveRecord
   end
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 936bed46976752..89bf5b903d4e1d 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -7,6 +7,7 @@ module Ci
   class JobInfo < Ci::ApplicationRecord
     include Ci::Partitionable
     include BulkInsertSafe
+    include PgFullTextSearchable
 
     self.table_name = :p_ci_job_infos
     self.primary_key = :id
diff --git a/app/services/ci/update_build_names_service.rb b/app/services/ci/update_build_names_service.rb
index d040ef40785086..a73630a32e1056 100644
--- a/app/services/ci/update_build_names_service.rb
+++ b/app/services/ci/update_build_names_service.rb
@@ -2,6 +2,8 @@
 
 module Ci
   class UpdateBuildNamesService
+    include Gitlab::Utils::StrongMemoize
+
     attr_reader :pipeline
 
     def initialize(pipeline)
@@ -9,6 +11,9 @@ def initialize(pipeline)
     end
 
     def execute
+      # TODO: return if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations)
+      # Ensure job search functionality works without this service/table.
+
       scope = pipeline.builds.latest
       iterator = Gitlab::Pagination::Keyset::Iterator.new(scope: scope)
 
@@ -22,10 +27,21 @@ def execute
     def upsert_records(batch)
       keys = %i[build_id partition_id name project_id]
 
-      builds_upsert_data =
-        batch
-          .pluck(:id, :partition_id, :name, :project_id)
-          .map { |values| Hash[keys.zip(values)] }
+      builds_name_data = if read_from_ci_job_infos?
+                           batch
+                             .left_joins(:job_info)
+                             .select(<<~SQL)
+                               p_ci_builds.id,
+                               p_ci_builds.partition_id,
+                               COALESCE(p_ci_job_infos.name, p_ci_builds.name) AS job_name,
+                               p_ci_builds.project_id
+                             SQL
+                             .map { |record| record.values_at(:id, :partition_id, :job_name, :project_id) }
+                         else
+                           batch.pluck(:id, :partition_id, :name, :project_id)
+                         end
+
+      builds_upsert_data = builds_name_data.map { |values| Hash[keys.zip(values)] }
 
       return unless builds_upsert_data.any?
 
@@ -33,5 +49,10 @@ def upsert_records(batch)
     end
     # rubocop: enable CodeReuse/ActiveRecord
     # rubocop: enable Database/AvoidUsingPluckWithoutLimit
+
+    def read_from_ci_job_infos?
+      Feature.enabled?(:read_from_ci_job_infos, pipeline.project)
+    end
+    strong_memoize_attr :read_from_ci_job_infos?
   end
 end
diff --git a/app/workers/ci/update_build_names_worker.rb b/app/workers/ci/update_build_names_worker.rb
index dbfe70b0d025c7..0ae2702d4c7255 100644
--- a/app/workers/ci/update_build_names_worker.rb
+++ b/app/workers/ci/update_build_names_worker.rb
@@ -10,6 +10,7 @@ class UpdateBuildNamesWorker
     idempotent!
     deduplicate :until_executing
 
+    # TODO: Remove worker with FF `stop_writing_ci_job_info_to_old_destinations`
     def perform(pipeline_id)
       Ci::Pipeline.find_by_id(pipeline_id).try do |pipeline|
         Ci::UpdateBuildNamesService.new(pipeline).execute
diff --git a/ee/app/workers/ci/cleanup_build_name_worker.rb b/ee/app/workers/ci/cleanup_build_name_worker.rb
index d7420b2d1694df..95e95075a29a29 100644
--- a/ee/app/workers/ci/cleanup_build_name_worker.rb
+++ b/ee/app/workers/ci/cleanup_build_name_worker.rb
@@ -1,5 +1,6 @@
 # frozen_string_literal: true
 
+# TODO: Remove this worker with FF `stop_writing_ci_job_info_to_old_destinations`
 module Ci
   class CleanupBuildNameWorker
     include ApplicationWorker
diff --git a/spec/services/ci/create_pipeline_service_spec.rb b/spec/services/ci/create_pipeline_service_spec.rb
index 002745c963021f..fecc7b296e6a4f 100644
--- a/spec/services/ci/create_pipeline_service_spec.rb
+++ b/spec/services/ci/create_pipeline_service_spec.rb
@@ -306,7 +306,7 @@ def execute_service(
                 .builds
                 .joins(:job_definition)
                 .joins(:job_info)
-                .pluck('ci_job_infos.name', "#{Ci::JobDefinition.quoted_table_name}.interruptible")
+                .pluck('p_ci_job_infos.name', "#{Ci::JobDefinition.quoted_table_name}.interruptible")
 
             expect(interruptible_status).to contain_exactly(
               ['build_1_1', true],
-- 
GitLab


From 4a883e864e4eb6197e31ac9b6f1f9291e582ce23 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 5 Nov 2025 16:29:50 -0800
Subject: [PATCH 04/27] Remove 'when' and 'allow_failure' from job_info

Remove 'when' and 'allow_failure' from
job_info because they can be mutated after
creation.
---
 app/models/ci/job_info.rb                      |  2 --
 app/models/commit_status.rb                    |  1 -
 app/models/concerns/ci/metadatable.rb          | 12 ------------
 app/services/projects/update_pages_service.rb  |  1 -
 ee/app/services/ee/ci/process_build_service.rb |  1 -
 5 files changed, 17 deletions(-)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 89bf5b903d4e1d..1dbf1411dbcc51 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -17,8 +17,6 @@ class JobInfo < Ci::ApplicationRecord
     # IMPORTANT: append new attributes at the end of this list. Do not change the order!
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
-      :allow_failure,
-      :when,
       :scheduling_type,
       :stage_idx,
       :name
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 14608b3acbf224..33d441d41c3998 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -207,7 +207,6 @@ class CommitStatus < Ci::ApplicationRecord
         .fabricate(commit_status, transition.args.first)
 
       commit_status.failure_reason = reason.failure_reason_enum
-      # BLOCKER: allow_failure appears to be mutated here
       commit_status.allow_failure = true if reason.force_allow_failure?
       # Windows exit codes can reach a max value of 32-bit unsigned integer
       # We only allow a smallint for exit_code in the db, hence the added limit of 32767
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 3a017b0964c660..bf801377c87e15 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -191,18 +191,6 @@ def secrets=(_value)
       raise ActiveRecord::ReadonlyAttributeError, 'This data is read only'
     end
 
-    def allow_failure
-      read_job_info_attribute(:allow_failure)
-    end
-
-    def allow_failure?
-      allow_failure.present?
-    end
-
-    def when
-      read_job_info_attribute(:when)
-    end
-
     def scheduling_type
       read_job_info_attribute(:scheduling_type)
     end
diff --git a/app/services/projects/update_pages_service.rb b/app/services/projects/update_pages_service.rb
index 195516e2a8e527..7623841cb1d122 100644
--- a/app/services/projects/update_pages_service.rb
+++ b/app/services/projects/update_pages_service.rb
@@ -56,7 +56,6 @@ def success
     def error(message)
       register_failure
       log_error("Projects::UpdatePagesService: #{message}")
-      # BLOCKER: allow_failure appears to be mutated here
       commit_status.allow_failure = !deployment_validations.latest_build?
       commit_status.description = message
       commit_status.drop(:script_failure)
diff --git a/ee/app/services/ee/ci/process_build_service.rb b/ee/app/services/ee/ci/process_build_service.rb
index f1f87602e95123..5a7120b2a06a1d 100644
--- a/ee/app/services/ee/ci/process_build_service.rb
+++ b/ee/app/services/ee/ci/process_build_service.rb
@@ -10,7 +10,6 @@ def process(processable)
         if should_block_processable?(processable)
           # To populate the deployment job as manually executable (i.e. `Ci::Build#playable?`),
           # we have to set `manual` to `ci_builds.when` as well as `ci_builds.status`.
-          # BLOCKER: `when` appears to be mutated here
           processable.when = 'manual'
           return processable.actionize!
         end
-- 
GitLab


From 7953eda8e3739c7b90bdc2efec46e52017aec361 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 5 Nov 2025 18:01:34 -0800
Subject: [PATCH 05/27] Update scheduling_type related queries/code

Update scheduling_type related queries/code
---
 app/models/ci/job_info.rb                     |  3 +-
 app/models/ci/pipeline.rb                     | 11 +++++++-
 app/models/ci/processable.rb                  | 28 +++++++++----------
 app/models/concerns/ci/metadatable.rb         | 18 ++++++++++++
 db/fixtures/development/14_pipelines.rb       |  1 +
 .../ci/runner/runner_fleet_pipeline_seeder.rb |  1 +
 spec/models/ci/processable_spec.rb            | 12 ++++++--
 7 files changed, 53 insertions(+), 21 deletions(-)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 1dbf1411dbcc51..8b25fce80b737a 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -17,8 +17,7 @@ class JobInfo < Ci::ApplicationRecord
     # IMPORTANT: append new attributes at the end of this list. Do not change the order!
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
-      :scheduling_type,
-      :stage_idx,
+      :scheduling_type, # This field should be required in the JSON schema with enum: 'dag' or 'stage'
       :name
     ].freeze
     NORMALIZED_DATA_COLUMNS = %i[stage_idx name].freeze
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index d4515071a907c9..278c37feb51acb 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -740,7 +740,14 @@ def trigger_status_change_subscriptions
     end
 
     def uses_needs?
-      processables.where(scheduling_type: :dag).any?
+      if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_any_job_info?
+        processables
+          .joins(:job_info)
+          .where("config ->> 'scheduling_type' = 'dag'")
+          .any?
+      else
+        processables.where(scheduling_type: :dag).any?
+      end
     end
 
     def stages_count
@@ -1585,6 +1592,8 @@ def source_ref_path
 
     # Set scheduling type of processables if they were created before scheduling_type
     # data was deployed (https://gitlab.com/gitlab-org/gitlab/-/merge_requests/22246).
+    # TODO: We can remove this method after we migrate all existing data to ci_job_infos.
+    # Jobs with nil scheduling_type can be populated with the logic in Ci::Processable#populate_scheduling_type!
     def ensure_scheduling_type!
       processables.populate_scheduling_type!
     end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 6acb38a0ba14af..37eaed02d44899 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -213,7 +213,10 @@ def self.select_with_aggregated_needs(project)
     # so we need to ensure the data exists before using it.
     def self.populate_scheduling_type!
       needs = Ci::BuildNeed.scoped_build.select(1)
-      # TODO: Update this query to update Ci::JobInfo instead?
+      # TODO: If scheduling_type is nil, it means it's an old job that doesn't already
+      # have a job_info record, so we can create a new one for them.
+      # We can remove this method after we migrate existing data to ci_job_infos.
+      # When migrating, jobs with nil scheduling_type can be populated with the logic below.
       where(scheduling_type: nil).update_all(
         "scheduling_type = CASE WHEN (EXISTS (#{needs.to_sql}))
          THEN #{scheduling_types[:dag]}
@@ -222,12 +225,19 @@ def self.populate_scheduling_type!
       )
     end
 
+    # TODO: Remove this method after scheduling_type data migrated to ci_job_infos
+    def self.has_any_job_info?
+      # We check the oldest job in the pipeline since recent retries will create a new job_info record when cloning
+      left_joins(:job_info).order('p_ci_builds.id ASC').limit(1).pick(:job_info_id).present?
+    end
+
     def assign_resource_from_resource_group(processable)
       Ci::ResourceGroups::AssignResourceFromResourceGroupWorker.perform_async(processable.resource_group_id)
     end
 
     validates :type, presence: true
-    validates :scheduling_type, presence: true, on: :create, unless: :importing?
+    validates :scheduling_type, presence: true, on: :create,
+      unless: -> { importing? || Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project) }
 
     delegate :merge_request?,
       :merge_request_ref?,
@@ -302,25 +312,13 @@ def with_resource_group?
       self.resource_group_id.present?
     end
 
-    # Overriding scheduling_type enum's method for nil `scheduling_type`s
-    def scheduling_type_dag?
-      scheduling_type.nil? ? find_legacy_scheduling_type == :dag : super
-    end
-
-    # scheduling_type column of previous builds/bridges have not been populated,
-    # so we calculate this value on runtime when we need it.
-    def find_legacy_scheduling_type
-      strong_memoize(:find_legacy_scheduling_type) do
-        needs.exists? ? :dag : :stage
-      end
-    end
-
     def needs_attributes
       strong_memoize(:needs_attributes) do
         needs.map { |need| need.attributes.except('id', 'build_id') }
       end
     end
 
+    # TODO: We can remove this method after we migrate data to ci_job_infos
     def ensure_scheduling_type!
       # If this has a scheduling_type, it means all processables in the pipeline already have.
       return if scheduling_type
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index bf801377c87e15..1ca45d3196dbd0 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -195,6 +195,24 @@ def scheduling_type
       read_job_info_attribute(:scheduling_type)
     end
 
+    # Need this method to overwrite p_ci_builds.scheduling_type enum
+    def scheduling_type_dag?
+      scheduling_type.nil? ? find_legacy_scheduling_type == :dag : scheduling_type.to_sym == :dag
+    end
+
+    # Need this method to overwrite p_ci_builds.scheduling_type enum
+    def scheduling_type_stage?
+      scheduling_type.to_sym == :stage
+    end
+
+    # TODO: We can remove this method after we migrate data to ci_job_infos
+    # scheduling_type column of previous builds/bridges have not been populated,
+    # so we calculate this value on runtime when we need it.
+    def find_legacy_scheduling_type
+      needs.exists? ? :dag : :stage
+    end
+    strong_memoize_attr :find_legacy_scheduling_type
+
     def stage_idx
       read_job_info_attribute(:stage_idx)
     end
diff --git a/db/fixtures/development/14_pipelines.rb b/db/fixtures/development/14_pipelines.rb
index a65dc4b049dab7..524d2964a7da3a 100644
--- a/db/fixtures/development/14_pipelines.rb
+++ b/db/fixtures/development/14_pipelines.rb
@@ -290,6 +290,7 @@ def runners
     @runners ||= FactoryBot.create_list(:ci_runner, 6)
   end
 
+  # TODO: How should we deal with generic commit statuses? Should it have the .fabricate method instead of Processable?
   def job_attributes(pipeline, stage, opts)
     {
       name: 'test build', ci_stage: stage, stage_idx: stage.position,
diff --git a/lib/gitlab/seeders/ci/runner/runner_fleet_pipeline_seeder.rb b/lib/gitlab/seeders/ci/runner/runner_fleet_pipeline_seeder.rb
index 0ae17c62cb1fbe..05d7ceb26bd3ea 100644
--- a/lib/gitlab/seeders/ci/runner/runner_fleet_pipeline_seeder.rb
+++ b/lib/gitlab/seeders/ci/runner/runner_fleet_pipeline_seeder.rb
@@ -181,6 +181,7 @@ def create_build(pipeline, runner, job_status, index)
             build = nil
 
             ::Ci::Build.transaction do
+              # TODO: We should update this to use Ci::Build.fabricate
               build = ::Ci::Build.new(importing: true, **build_attrs).tap(&:save!)
               ::Ci::RunningBuild.upsert_build!(build) if build.running?
             end
diff --git a/spec/models/ci/processable_spec.rb b/spec/models/ci/processable_spec.rb
index 33ab11febd7a2e..d7321c215625e8 100644
--- a/spec/models/ci/processable_spec.rb
+++ b/spec/models/ci/processable_spec.rb
@@ -215,13 +215,19 @@
 
     subject { build(:ci_build, project: project, pipeline: pipeline, importing: importing) }
 
-    where(:importing, :should_validate) do
-      false | true
-      true  | false
+    where(:importing, :ff_state, :should_validate) do
+      false | false | true
+      false | true | false
+      true  | true | false
+      true  | false | false
     end
 
     with_them do
       context 'on create' do
+        before do
+          stub_feature_flags(stop_writing_ci_job_info_to_old_destinations: ff_state)
+        end
+
         it 'validates presence' do
           if should_validate
             is_expected.to validate_presence_of(:scheduling_type).on(:create)
-- 
GitLab


From f4844af346429a5e513e575a6fe449ddc04b4e1a Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 6 Nov 2025 10:26:52 -0800
Subject: [PATCH 06/27] Correct CONFIG_ATTRIBUTES to include stage_idx

---
 app/models/ci/job_info.rb | 1 +
 1 file changed, 1 insertion(+)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 8b25fce80b737a..9426e74b57e68d 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -18,6 +18,7 @@ class JobInfo < Ci::ApplicationRecord
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
       :scheduling_type, # This field should be required in the JSON schema with enum: 'dag' or 'stage'
+      :stage_idx,
       :name
     ].freeze
     NORMALIZED_DATA_COLUMNS = %i[stage_idx name].freeze
-- 
GitLab


From 2f7ffa1e34b872e02450ebcbc8db4c2202c7825a Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 6 Nov 2025 11:29:54 -0800
Subject: [PATCH 07/27] Add job_info rspec helpers

Add job_info rspec helpers. They
mirror the ones for job_definition.
---
 spec/factories/ci/bridge.rb                   |  2 +-
 spec/factories/ci/builds.rb                   |  8 +++--
 spec/factories/ci/processable.rb              | 23 +++++++++++++--
 .../support/helpers/ci/job_factory_helpers.rb | 20 +++++++++++--
 spec/support/helpers/ci/job_helpers.rb        | 29 +++++++++++++++++--
 5 files changed, 71 insertions(+), 11 deletions(-)

diff --git a/spec/factories/ci/bridge.rb b/spec/factories/ci/bridge.rb
index 6caa51adf3c237..e5b137cfdd65c7 100644
--- a/spec/factories/ci/bridge.rb
+++ b/spec/factories/ci/bridge.rb
@@ -7,7 +7,6 @@
   factory :ci_bridge, class: 'Ci::Bridge', parent: :ci_processable do
     instance_eval ::Factories::Ci::Deployable.traits
 
-    name { 'bridge' }
     created_at { '2013-10-29 09:50:00 CET' }
     status { :created }
 
@@ -22,6 +21,7 @@
       options { { trigger: {} } }
       downstream { nil }
       upstream { nil }
+      name { 'bridge' }
     end
 
     after(:build) do |bridge, evaluator|
diff --git a/spec/factories/ci/builds.rb b/spec/factories/ci/builds.rb
index c3d3496564f118..bf759459c5f19f 100644
--- a/spec/factories/ci/builds.rb
+++ b/spec/factories/ci/builds.rb
@@ -7,10 +7,8 @@
   factory :ci_build, class: 'Ci::Build', parent: :ci_processable do
     instance_eval ::Factories::Ci::Deployable.traits
 
-    name { 'test' }
     add_attribute(:protected) { false }
     created_at { 'Di 29. Okt 09:50:00 CET 2013' }
-    scheduling_type { 'stage' }
     pending
 
     project { pipeline.project }
@@ -37,6 +35,8 @@
       end
 
       id_tokens { nil }
+      scheduling_type { 'stage' }
+      name { 'test' }
     end
 
     after(:build) do |build, evaluator|
@@ -64,7 +64,9 @@
 
     trait :with_build_name do
       after(:create) do |build, _|
-        create(:ci_build_name, build: build)
+        if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, build.project)
+          create(:ci_build_name, build: build)
+        end
       end
     end
 
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 738afdf7d1d821..64065ac54c0871 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -4,13 +4,10 @@
 
 FactoryBot.define do
   factory :ci_processable, class: 'Ci::Processable' do
-    name { 'processable' }
-    stage_idx { ci_stage.try(:position) || 0 }
     ref { 'master' }
     tag { false }
     pipeline factory: :ci_pipeline
     project { pipeline.project }
-    scheduling_type { 'stage' }
     partition_id { pipeline.partition_id }
 
     # This factory was updated to help with the efforts of the removal of `ci_builds.stage`:
@@ -22,11 +19,31 @@
       options { {} }
       yaml_variables { [] }
       stage { 'test' }
+      scheduling_type { 'stage' }
+      stage_idx { ci_stage.try(:position) || 0 }
+      name { 'processable' }
     end
 
     after(:stub, :build) do |processable, evaluator|
       Ci::JobFactoryHelpers.mutate_temp_job_definition(
         processable, options: evaluator.options, yaml_variables: evaluator.yaml_variables)
+
+      if Feature.enabled?(:write_to_ci_job_infos, processable.project)
+        Ci::JobFactoryHelpers.mutate_temp_job_info(
+          processable,
+          scheduling_type: evaluator.scheduling_type,
+          stage_idx: evaluator.stage_idx,
+          name: evaluator.name
+        )
+      end
+
+      if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, processable.project)
+        processable.assign_attributes(
+          scheduling_type: evaluator.scheduling_type,
+          stage_idx: evaluator.stage_idx,
+          name: evaluator.name
+        )
+      end
     end
 
     after(:build) do |processable, evaluator|
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index 2a66cb6da11bf3..cb6512c67357df 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -2,8 +2,6 @@
 
 module Ci
   module JobFactoryHelpers
-    # TODO: We need to create a mutator for Ci::JobInfo too. Maybe we can
-    # combine it with this helper and call it `mutate_temp_job_config`?
     # Temp job definitions should not change in normal operation;
     # only use this method as a helper in factory definitions.
     def self.mutate_temp_job_definition(job, **new_config)
@@ -22,5 +20,23 @@ def self.mutate_temp_job_definition(job, **new_config)
 
       job.temp_job_definition = new_temp_job_definition
     end
+
+    # TODO: Maybe we can combine this with mutate_temp_job_definition and call it `mutate_temp_job_config`?
+    def self.mutate_temp_job_info(job, **new_config)
+      # Deep merge is required because job config changes are meant to be cumulative within factories
+      updated_config = (job.temp_job_info&.config || {}).deep_merge(new_config)
+
+      new_temp_job_info = ::Ci::JobInfo.fabricate(
+        config: updated_config,
+        project_id: job.pipeline.project.id,
+        partition_id: job.pipeline.partition_id
+      )
+
+      new_temp_job_info.validate
+      config_errors = new_temp_job_info.errors[:config]
+      raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
+
+      job.temp_job_info = new_temp_job_info
+    end
   end
 end
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 7c6cb36b562290..b48c95e681a029 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -2,8 +2,6 @@
 
 module Ci
   module JobHelpers
-    # TODO: We need to create a stub helper for Ci::JobInfo too. Maybe we
-    # can combine it with this helper and call it `stub_ci_job_config`.
     def stub_ci_job_definition(job, **new_config)
       new_config.symbolize_keys!
       unknown_keys = new_config.keys - Ci::JobDefinition::CONFIG_ATTRIBUTES
@@ -30,6 +28,33 @@ def stub_ci_job_definition(job, **new_config)
       allow(job).to receive(:job_definition).and_return(new_job_definition)
     end
 
+    # TODO: Maybe we can combine this with stub_ci_job_definition and call it `stub_ci_job_config`?
+    def stub_ci_job_info(job, **new_config)
+      new_config.symbolize_keys!
+      unknown_keys = new_config.keys - Ci::JobInfo::CONFIG_ATTRIBUTES
+
+      if unknown_keys.any?
+        raise ArgumentError,
+          "You can only stub valid job info config attributes. Invalid key(s): #{unknown_keys.join(', ')}. " \
+            "Allowed: #{Ci::JobInfo::CONFIG_ATTRIBUTES.join(', ')}"
+      end
+
+      # We use regular merge (not deep_merge) to completely overwrite existing attributes
+      updated_config = (job.job_info&.config || job.temp_job_info&.config || {}).merge(new_config)
+
+      new_job_info = ::Ci::JobInfo.fabricate(
+        config: updated_config,
+        project_id: job.pipeline.project.id,
+        partition_id: job.pipeline.partition_id
+      )
+
+      new_job_info.validate
+      config_errors = new_job_info.errors[:config]
+      raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
+
+      allow(job).to receive(:job_info).and_return(new_job_info)
+    end
+
     def find_job_by_name(jobs, name)
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project)
         jobs.joins(:job_info).find_by(job_info: { name: name })
-- 
GitLab


From a3969cca908a61c679bb9d9f350a062d0b52bd1c Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 6 Nov 2025 11:46:43 -0800
Subject: [PATCH 08/27] Move job_info association to CommitStatus instead of
 Processable

Moves job_info association to CommitStatus
Also applies the rspec helper to find jobs by
name for certain specs.
---
 app/models/ci/processable.rb                  |  7 ----
 app/models/commit_status.rb                   | 10 ++++++
 .../atomic_processing_service_spec.rb         | 36 +++++++++----------
 3 files changed, 28 insertions(+), 25 deletions(-)

diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 37eaed02d44899..06a4dd0c5eeaad 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -56,13 +56,6 @@ class Processable < ::CommitStatus
       inverse_of: :build,
       partition_foreign_key: :partition_id
 
-    # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
-    belongs_to :job_info,
-      ->(job) { in_partition(job) },
-      class_name: 'Ci::JobInfo',
-      partition_foreign_key: :partition_id
-    # rubocop: enable Rails/InverseOf
-
     accepts_nested_attributes_for :needs
     accepts_nested_attributes_for :job_definition_instance
 
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 33d441d41c3998..f28a8a568bad6a 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -31,7 +31,17 @@ class CommitStatus < Ci::ApplicationRecord
     ->(build) { in_partition(build) },
     class_name: 'Ci::Stage',
     foreign_key: :stage_id,
+    partition_foreign_key: :partition_id,
+    inverse_of: :statuses
+
+  # NOTE: Looks like we need to have this relationship in CommitStatus because
+  # generic commit statuses also use the columns in `Ci::JobInfo::CONFIG_ATTRIBUTES`.
+  # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
+  belongs_to :job_info,
+    ->(job) { in_partition(job) },
+    class_name: 'Ci::JobInfo',
     partition_foreign_key: :partition_id
+  # rubocop: enable Rails/InverseOf
 
   has_many :needs, class_name: 'Ci::BuildNeed', foreign_key: :build_id, inverse_of: :build
 
diff --git a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
index fef18cd2cdb7cb..63148aaf5a1381 100644
--- a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
+++ b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
@@ -741,12 +741,12 @@ def event_on_pipeline(event)
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2']
 
-          pipeline.builds.find_by(name: 'test:1').success!
-          pipeline.builds.find_by(name: 'test:2').drop!
+          find_job_by_name(pipeline.builds, 'test:1').success!
+          find_job_by_name(pipeline.builds, name: 'test:2').drop!
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2']
 
-          Ci::RetryJobService.new(pipeline.project, user).execute(pipeline.builds.find_by(name: 'test:2'))[:job].reset.success!
+          Ci::RetryJobService.new(pipeline.project, user).execute(find_job_by_name(pipeline.builds, 'test:2'))[:job].reset.success!
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2',
             'test:2', 'deploy:1', 'deploy:2']
@@ -1022,8 +1022,8 @@ def event_on_pipeline(event)
         Ci::CreatePipelineService.new(project, user, { ref: 'master' }).execute(:push).payload
       end
 
-      let(:manual1) { all_builds.find_by(name: 'manual1') }
-      let(:manual2) { all_builds.find_by(name: 'manual2') }
+      let(:manual1) { find_job_by_name(all_builds, 'manual1') }
+      let(:manual2) { find_job_by_name(all_builds, 'manual2') }
 
       let(:statuses_0) do
         { manual1: 'created', manual2: 'created', test1: 'created', test2: 'created', deploy1: 'created', deploy2: 'created' }
@@ -1124,8 +1124,8 @@ def event_on_pipeline(event)
         # to either manual1 or manual2. Otherwise, the assigned user will depend on which of
         # the new alive jobs get processed first by ResetSkippedJobsService.
         it 'assigns the correct user to the dependent jobs' do
-          test1 = all_builds.find_by(name: 'test1')
-          test2 = all_builds.find_by(name: 'test2')
+          test1 = find_job_by_name(all_builds, 'test1')
+          test2 = find_job_by_name(all_builds, 'test2')
 
           expect(test1.user).to eq(user)
           expect(test2.user).to eq(user)
@@ -1198,8 +1198,8 @@ def event_on_pipeline(event)
         # bridge jobs directly transition to success
         expect(all_builds_statuses).to contain_exactly('success', 'success', 'success')
 
-        bridge1 = all_builds.find_by(name: 'deploy: [ovh, monitoring]')
-        bridge2 = all_builds.find_by(name: 'deploy: [ovh, app]')
+        bridge1 = find_job_by_name(all_builds, 'deploy: [ovh, monitoring]')
+        bridge2 = find_job_by_name(all_builds, 'deploy: [ovh, app]')
 
         downstream_job1 = bridge1.downstream_pipeline.all_jobs.first
         downstream_job2 = bridge2.downstream_pipeline.all_jobs.first
@@ -1352,12 +1352,12 @@ def event_on_pipeline(event)
         Ci::CreatePipelineService.new(project, user, { ref: 'master' }).execute(:push).payload
       end
 
-      let(:test_job) { all_builds.find_by(name: 'test') }
-      let(:review_deploy_job) { all_builds.find_by(name: 'review') }
-      let(:staging_deploy_job) { all_builds.find_by(name: 'staging') }
-      let(:canary_deploy_job) { all_builds.find_by(name: 'canary') }
-      let(:production_a_deploy_job) { all_builds.find_by(name: 'production-a') }
-      let(:production_b_deploy_job) { all_builds.find_by(name: 'production-b') }
+      let(:test_job) { find_job_by_name(all_builds, 'test') }
+      let(:review_deploy_job) { find_job_by_name(all_builds, 'review') }
+      let(:staging_deploy_job) { find_job_by_name(all_builds, 'staging') }
+      let(:canary_deploy_job) { find_job_by_name(all_builds, 'canary') }
+      let(:production_a_deploy_job) { find_job_by_name(all_builds, 'production-a') }
+      let(:production_b_deploy_job) { find_job_by_name(all_builds, 'production-b') }
 
       before do
         create(:environment, name: 'review', project: project)
@@ -1481,15 +1481,15 @@ def cancel_running_or_pending
     end
 
     def play_manual_action(name)
-      builds.find_by(name: name).play(user)
+      find_job_by_name(builds, name).play(user)
     end
 
     def enqueue_scheduled(name)
-      builds.scheduled.find_by(name: name).enqueue!
+      find_job_by_name(builds.scheduled, name).enqueue!
     end
 
     def retry_build(name)
-      Ci::RetryJobService.new(project, user).execute(builds.find_by(name: name))
+      Ci::RetryJobService.new(project, user).execute(find_job_by_name(builds, name))
     end
 
     def manual_actions
-- 
GitLab


From 1044102f84b6042607af1f4b26e26565ebc2adcd Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 6 Nov 2025 16:16:00 -0800
Subject: [PATCH 09/27] Update queries/code related to p_ci_builds.stage_idx
 and name

Update queries/code related to p_ci_builds.stage_idx and name
---
 app/graphql/types/ci/job_type.rb              |  2 +
 app/graphql/types/ci/pipeline_type.rb         |  2 +
 app/models/ci/build_dependencies.rb           |  6 +-
 app/models/ci/pipeline.rb                     |  3 +-
 app/models/ci/processable.rb                  |  6 --
 app/models/ci/stage.rb                        | 26 +++++--
 app/models/commit_status.rb                   | 67 +++++++++++++++----
 app/models/generic_commit_status.rb           |  2 +
 app/presenters/ci/stage_presenter.rb          |  2 +
 .../ci/create_commit_status_service.rb        |  3 +
 .../atomic_processing_service.rb              | 26 +++++--
 .../status_collection.rb                      | 20 ++++--
 app/services/ci/reset_skipped_jobs_service.rb | 24 +++++--
 app/services/projects/update_pages_service.rb |  2 +
 spec/factories/ci/processable.rb              | 15 ++++-
 15 files changed, 158 insertions(+), 48 deletions(-)

diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index cdfec538791c8e..fdf4ddc41629e0 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -193,6 +193,8 @@ def previous_stage_jobs
 
           # This query can fetch unneeded jobs when querying for more than one pipeline.
           # It was decided that fetching and discarding the jobs is preferable to making a more complex query.
+          # TODO: How should we update this query to account for a mix of pipelines where some have jobs with job_infos
+          # and others don't?
           jobs = CommitStatus.in_pipelines(pipeline_ids).for_stage(stage_idxs).latest
           grouped_jobs = jobs.group_by { |job| [job.pipeline_id, job.stage_idx] }
 
diff --git a/app/graphql/types/ci/pipeline_type.rb b/app/graphql/types/ci/pipeline_type.rb
index 8302539db05ef5..867fa0fe2d8d7a 100644
--- a/app/graphql/types/ci/pipeline_type.rb
+++ b/app/graphql/types/ci/pipeline_type.rb
@@ -278,6 +278,8 @@ def job(id: nil, name: nil)
         if id
           pipeline.statuses.id_in(id.model_id)
         else
+          # TODO: We would have to update this to switch between by_name and
+          # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
           pipeline.latest_statuses.by_name(name)
         end.take # rubocop: disable CodeReuse/ActiveRecord
       end
diff --git a/app/models/ci/build_dependencies.rb b/app/models/ci/build_dependencies.rb
index 7e821394ea96c4..7ec21a1d50e479 100644
--- a/app/models/ci/build_dependencies.rb
+++ b/app/models/ci/build_dependencies.rb
@@ -129,7 +129,11 @@ def no_local_dependencies_specified?
     end
 
     def from_previous_stages(scope)
-      scope.before_stage(processable.stage_idx)
+      if Feature.enabled?(:read_from_ci_job_infos, project) && processable.pipeline.processables.has_job_infos?
+        scope.before_stage(processable.stage_idx)
+      else
+        scope.before_stage_from_ci_builds(processable.stage_idx)
+      end
     end
 
     def from_needs(scope)
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index 278c37feb51acb..5cf4fbf3b3a46d 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -106,6 +106,7 @@ class Pipeline < Ci::ApplicationRecord
     # DEPRECATED:
     has_many :statuses, ->(pipeline) { in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :processables, ->(pipeline) { in_partition(pipeline) }, class_name: 'Ci::Processable', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
+    # TODO: What are we still using this association for? Can we just remove it?
     has_many :latest_statuses_ordered_by_stage, ->(pipeline) { latest.in_partition(pipeline).order(:stage_idx, :stage) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :latest_statuses, ->(pipeline) { latest.in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :statuses_order_id_desc, ->(pipeline) { in_partition(pipeline).order_id_desc }, class_name: 'CommitStatus', foreign_key: :commit_id,
@@ -740,7 +741,7 @@ def trigger_status_change_subscriptions
     end
 
     def uses_needs?
-      if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_any_job_info?
+      if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_job_infos?
         processables
           .joins(:job_info)
           .where("config ->> 'scheduling_type' = 'dag'")
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 06a4dd0c5eeaad..9d0026d12e8e2d 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -218,12 +218,6 @@ def self.populate_scheduling_type!
       )
     end
 
-    # TODO: Remove this method after scheduling_type data migrated to ci_job_infos
-    def self.has_any_job_info?
-      # We check the oldest job in the pipeline since recent retries will create a new job_info record when cloning
-      left_joins(:job_info).order('p_ci_builds.id ASC').limit(1).pick(:job_info_id).present?
-    end
-
     def assign_resource_from_resource_group(processable)
       Ci::ResourceGroups::AssignResourceFromResourceGroupWorker.perform_async(processable.resource_group_id)
     end
diff --git a/app/models/ci/stage.rb b/app/models/ci/stage.rb
index 0e9822fa887d37..bb47c74767f694 100644
--- a/app/models/ci/stage.rb
+++ b/app/models/ci/stage.rb
@@ -27,12 +27,16 @@ class Stage < Ci::ApplicationRecord
       foreign_key: :stage_id,
       partition_foreign_key: :partition_id,
       inverse_of: :ci_stage
+    # TODO: We would have to update this to switch between ordered and
+    # ordered_from_ci_builds based on FF `read_from_ci_job_infos`
     has_many :latest_statuses,
       ->(stage) { in_partition(stage).ordered.latest },
       class_name: 'CommitStatus',
       foreign_key: :stage_id,
       partition_foreign_key: :partition_id,
       inverse_of: :ci_stage
+    # TODO: We would have to update this to switch between ordered and
+    # ordered_from_ci_builds based on FF `read_from_ci_job_infos`
     has_many :retried_statuses,
       ->(stage) { in_partition(stage).ordered.retried },
       class_name: 'CommitStatus',
@@ -81,11 +85,21 @@ class Stage < Ci::ApplicationRecord
     before_validation unless: :importing? do
       next if position.present?
 
-      self.position = statuses.select(:stage_idx)
-        .where.not(stage_idx: nil)
-        .group(:stage_idx)
-        .order('COUNT(id) DESC')
-        .first&.stage_idx.to_i
+      self.position = if Feature.enabled?(:read_from_ci_job_infos, project) && statuses.has_job_infos?
+                        statuses
+                          .select('p_ci_job_infos.stage_idx')
+                          .joins(:job_info)
+                          .where.not(p_ci_job_infos: { stage_idx: nil })
+                          .group('p_ci_job_infos.stage_idx')
+                          .order('COUNT(p_ci_builds.id) DESC')
+                          .first&.stage_idx.to_i
+                      else
+                        statuses.select(:stage_idx)
+                          .where.not(stage_idx: nil)
+                          .group(:stage_idx)
+                          .order('COUNT(id) DESC')
+                          .first&.stage_idx.to_i
+                      end
     end
 
     state_machine :status, initial: :created do
@@ -218,6 +232,8 @@ def ordered_latest_statuses
     end
 
     def ordered_retried_statuses
+      # TODO: We would have to update this to switch between retried_ordered and
+      # retried_ordered_from_ci_builds based on FF `read_from_ci_job_infos`
       preload_metadata(statuses.in_order_of(:status, Ci::HasStatus::ORDERED_STATUSES).retried_ordered)
     end
 
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index f28a8a568bad6a..5afeac5576c5d5 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -74,19 +74,36 @@ class CommitStatus < Ci::ApplicationRecord
 
   scope :latest, -> { where(retried: [false, nil]) }
   scope :retried, -> { where(retried: true) }
-  scope :ordered, -> { order(:name) }
-  # TODO: Update scope to join with ci_job_infos; evaluate query performance with this change
-  scope :ordered_by_stage, -> { order(stage_idx: :asc) }
+  scope :ordered, -> { joins(:job_info).merge(Ci::JobInfo.order(:name)) }
+  # Remove after ci_builds.name has been migrated to ci_job_infos
+  scope :ordered_from_ci_builds, -> { order(:name) }
+  scope :ordered_by_stage, -> { joins(:job_info).merge(Ci::JobInfo.order(stage_idx: :asc)) }
+  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
+  scope :ordered_by_stage_from_ci_builds, -> { order(stage_idx: :asc) }
   scope :latest_ordered, -> { latest.ordered.includes(project: :namespace) }
-  scope :retried_ordered, -> { retried.order(name: :asc, id: :desc).includes(project: :namespace) }
+  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
+  scope :latest_ordered_from_ci_builds, -> { latest.ordered_from_ci_builds.includes(project: :namespace) }
+  scope :retried_ordered, -> {
+    retried.joins(:job_info).order('p_ci_job_infos.name ASC, p_ci_builds.id DESC').includes(project: :namespace)
+  }
+  # Remove after ci_builds.name has been migrated to ci_job_infos
+  scope :retried_ordered_from_ci_builds, -> { retried.order(name: :asc, id: :desc).includes(project: :namespace) }
   scope :ordered_by_pipeline, -> { order(pipeline_id: :asc) }
-  scope :before_stage, ->(index) { where('stage_idx < ?', index) }
-  scope :for_stage, ->(index) { where(stage_idx: index) }
+  scope :before_stage, ->(index) { joins(:job_info).merge(Ci::JobInfo.where('stage_idx < ?', index)) }
+  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
+  scope :before_stage_from_ci_builds, ->(index) { where('stage_idx < ?', index) }
+  scope :for_stage, ->(index) { joins(:job_info).merge(Ci::JobInfo.where(stage_idx: index)) }
+  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
+  scope :for_stage_from_ci_builds, ->(index) { joins(:job_info).merge(Ci::JobInfo.where(stage_idx: index)) }
   scope :after_stage, ->(index) { where('stage_idx > ?', index) }
+  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
+  scope :after_stage_from_ci_builds, ->(index) { where('stage_idx > ?', index) }
   scope :for_project, ->(project_id) { where(project_id: project_id) }
   scope :for_ref, ->(ref) { where(ref: ref) }
   scope :for_user, ->(user) { where(user: user) }
-  scope :by_name, ->(name) { where(name: name) }
+  scope :by_name, ->(name) { joins(:job_info).merge(Ci::JobInfo.where(name: name)) }
+  # Remove after ci_builds.name has been migrated to ci_job_infos
+  scope :by_name_from_ci_builds, ->(name) { where(name: name) }
   scope :in_pipelines, ->(pipelines) { where(pipeline: pipelines) }
   scope :with_pipeline, -> { joins(:pipeline) }
   scope :updated_at_before, ->(date) { where("#{quoted_table_name}.updated_at < ?", date) }
@@ -252,6 +269,11 @@ class CommitStatus < Ci::ApplicationRecord
   end
 
   def self.names
+    joins(:job_info).select('p_ci_job_infos.name')
+  end
+
+  # Remove after ci_builds.name has been migrated to ci_job_infos
+  def self.names_from_ci_builds
     select(:name)
   end
 
@@ -266,6 +288,15 @@ def self.locking_enabled?
     false
   end
 
+  # TODO: Remove this method after scheduling_type data migrated to ci_job_infos
+  # This method should only be used on a single pipeline's processables.
+  def self.has_job_infos?
+    # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
+    # have job_info records. So we just need to check one job if it has job_info.
+    # We check the oldest job in the pipeline since recent retries would create a new job_info record when cloning.
+    left_joins(:job_info).order('p_ci_builds.id ASC').limit(1).pick(:job_info_id).present?
+  end
+
   def locking_enabled?
     will_save_change_to_status?
   end
@@ -349,12 +380,22 @@ def recoverable?
   end
 
   def update_older_statuses_retried!
-    pipeline
-      .statuses
-      .latest
-      .where(name: name)
-      .where.not(id: id)
-      .update_all(retried: true, processed: true)
+    if Feature.enabled?(:read_from_ci_job_infos, project) && pipeline.statuses.has_job_infos?
+      pipeline
+        .statuses
+        .latest
+        .joins(:job_info)
+        .where(p_ci_job_infos: { name: name })
+        .where.not(id: id)
+        .update_all(retried: true, processed: true)
+    else
+      pipeline
+        .statuses
+        .latest
+        .where(name: name)
+        .where.not(id: id)
+        .update_all(retried: true, processed: true)
+    end
   end
 
   def expire_etag_cache!
diff --git a/app/models/generic_commit_status.rb b/app/models/generic_commit_status.rb
index 356acfa063d557..cef2ee529a968b 100644
--- a/app/models/generic_commit_status.rb
+++ b/app/models/generic_commit_status.rb
@@ -26,6 +26,8 @@ def detailed_status(current_user)
   def name_uniqueness_across_types
     return if !pipeline || name.blank?
 
+    # TODO: We would have to update this to switch between by_name and
+    # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
     if pipeline.statuses.by_name(name).where.not(type: type).exists?
       errors.add(:name, :taken)
     end
diff --git a/app/presenters/ci/stage_presenter.rb b/app/presenters/ci/stage_presenter.rb
index a78b9311cc7c1e..2009baa3c71f18 100644
--- a/app/presenters/ci/stage_presenter.rb
+++ b/app/presenters/ci/stage_presenter.rb
@@ -13,6 +13,8 @@ def latest_ordered_statuses
     end
 
     def retried_ordered_statuses
+      # TODO: We would have to update this to switch between retried_ordered and
+      # retried_ordered_from_ci_builds based on FF `read_from_ci_job_infos`
       preload_statuses(stage.statuses.retried_ordered)
     end
 
diff --git a/app/services/ci/create_commit_status_service.rb b/app/services/ci/create_commit_status_service.rb
index e3b2ec095350c4..016002d157b32c 100644
--- a/app/services/ci/create_commit_status_service.rb
+++ b/app/services/ci/create_commit_status_service.rb
@@ -139,6 +139,7 @@ def external_commit_status_exists?
     end
 
     def find_or_build_external_commit_status
+      # TODO: Should we update this to use a fabricate method to create job_info record?
       external_commit_status_scope(pipeline).find_or_initialize_by( # rubocop:disable CodeReuse/ActiveRecord
         ci_stage: stage,
         stage_idx: stage.position
@@ -148,6 +149,8 @@ def find_or_build_external_commit_status
     end
 
     def external_commit_status_scope(pipeline)
+      # TODO: We would have to update this to switch between by_name and
+      # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
       scope = ::GenericCommitStatus
         .running_or_pending
         .for_project(project.id)
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service.rb b/app/services/ci/pipeline_processing/atomic_processing_service.rb
index 9484c5b0ffe818..9b3ce703d3802a 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service.rb
@@ -80,13 +80,23 @@ def load_jobs_in_batches(stage)
       end
 
       def load_jobs(ids)
-        pipeline
-          .current_processable_jobs
-          .id_in(ids)
-          .with_project_preload
-          .created
-          .ordered_by_stage
-          .select_with_aggregated_needs(project)
+        if Feature.enabled?(:read_from_ci_job_infos, project) && pipeline.processables.has_job_infos?
+          pipeline
+            .current_processable_jobs
+            .id_in(ids)
+            .with_project_preload
+            .created
+            .ordered_by_stage
+            .select_with_aggregated_needs(project)
+        else
+          pipeline
+            .current_processable_jobs
+            .id_in(ids)
+            .with_project_preload
+            .created
+            .ordered_by_stage_from_ci_builds
+            .select_with_aggregated_needs(project)
+        end
       end
 
       def sort_jobs(jobs)
@@ -148,6 +158,8 @@ def new_alive_jobs
 
         return [] if new_alive_job_names.empty?
 
+        # TODO: We would have to update this to switch between by_name and
+        # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
         pipeline
           .current_jobs
           .by_name(new_alive_job_names)
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
index a892b03922e465..7385cde2bda396 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
@@ -112,12 +112,22 @@ def all_jobs
           # This is more efficient than relying on PostgreSQL to calculate composite status for us
           #
           # Since we need to reprocess everything we can fetch all of them and do processing ourselves.
-          # TODO: We need to update this query to work with Ci::JobInfo
           strong_memoize(:all_jobs) do
-            raw_jobs = pipeline
-              .current_jobs
-              .ordered_by_stage
-              .pluck(*JOB_ATTRS)
+            raw_jobs = if Feature.enabled?(:read_from_ci_job_infos, pipeline.project) && \
+                pipeline.processables.has_job_infos?
+                         pipeline
+                           .current_jobs
+                           .ordered_by_stage # Already includes joins(:job_info)
+                           .pluck(<<~SQL)
+                              p_ci_builds.id, p_ci_job_infos.name, p_ci_builds.status, p_ci_builds.allow_failure,
+                              p_ci_job_infos.stage_idx, p_ci_builds.processed, p_ci_builds.lock_version
+                           SQL
+                       else
+                         pipeline
+                           .current_jobs
+                           .ordered_by_stage_from_ci_builds
+                           .pluck(*JOB_ATTRS)
+                       end
 
             raw_jobs.map do |row|
               JOB_ATTRS.zip(row).to_h
diff --git a/app/services/ci/reset_skipped_jobs_service.rb b/app/services/ci/reset_skipped_jobs_service.rb
index 9e5c887b31bab4..f98e9801c48156 100644
--- a/app/services/ci/reset_skipped_jobs_service.rb
+++ b/app/services/ci/reset_skipped_jobs_service.rb
@@ -26,13 +26,23 @@ def reset_source_bridge
 
     # rubocop: disable CodeReuse/ActiveRecord
     def dependent_jobs
-      ordered_by_dag(
-        @pipeline.processables
-          .from_union(needs_dependent_jobs, stage_dependent_jobs)
-          .skipped
-          .ordered_by_stage
-          .preload(:needs)
-      )
+      if Feature.enabled?(:read_from_ci_job_infos, @pipeline.project) && @pipeline.processables.has_job_infos?
+        ordered_by_dag(
+          @pipeline.processables
+            .from_union(needs_dependent_jobs, stage_dependent_jobs)
+            .skipped
+            .ordered_by_stage
+            .preload(:needs)
+        )
+      else
+        ordered_by_dag(
+          @pipeline.processables
+            .from_union(needs_dependent_jobs, stage_dependent_jobs)
+            .skipped
+            .ordered_by_stage_from_ci_builds
+            .preload(:needs)
+        )
+      end
     end
 
     def process(job)
diff --git a/app/services/projects/update_pages_service.rb b/app/services/projects/update_pages_service.rb
index 7623841cb1d122..cda7cfacc46e8f 100644
--- a/app/services/projects/update_pages_service.rb
+++ b/app/services/projects/update_pages_service.rb
@@ -64,6 +64,8 @@ def error(message)
 
     # Create status notifying the deployment of pages
     def commit_status
+      # TODO: Should we have a fabricate method for GenericCommitStatus
+      # to create job_info record? (for name and stage_idx)
       GenericCommitStatus.new(
         user: build.user,
         ci_stage: stage,
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 64065ac54c0871..5ca110b80fe1d3 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -82,6 +82,10 @@
         Gitlab::Ci::Pipeline::Create::JobDefinitionBuilder.new(processable.pipeline, [processable]).run
       end
 
+      if processable.temp_job_info
+        Gitlab::Ci::Pipeline::Create::JobInfoBuilder.new(processable.pipeline, [processable]).run
+      end
+
       next if processable.ci_stage
 
       processable.ci_stage =
@@ -101,10 +105,15 @@
 
     after(:create) do |processable, evaluator|
       # job_definition_instance is assigned when we run JobDefinitionBuilder
-      next unless processable.job_definition_instance
+      if processable.job_definition_instance
+        processable.association(:job_definition).reload
+        processable.temp_job_definition = nil
+      end
 
-      processable.association(:job_definition).reload
-      processable.temp_job_definition = nil
+      if processable.job_info_id
+        processable.association(:job_info).reload
+        processable.temp_job_info = nil
+      end
     end
 
     trait :without_job_definition do
-- 
GitLab


From 9c817693570cf8a2c91b94e68f02237cbea9d1db Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 12 Nov 2025 15:22:43 -0800
Subject: [PATCH 10/27] Simplify query to check if pipeline processables has
 job infos

Simplification to query
---
 app/finders/ci/build_name_finder.rb | 5 +++--
 app/models/commit_status.rb         | 2 +-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index 7d9e214cce0672..8010a7d0b4efd0 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -39,8 +39,9 @@ def filter_by_name(build_relation)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
       # NOTE: This query would be much more efficient on ci_job_infos alone.
-      # Unfortunately we have to support it for old jobs until we migrate name data to ci_job_infos.
-      # TODO: We should evaluate alternative query structures/approaches that may be more efficient.
+      # TODO: Evaluate the query performance after we create and write to ci_job_infos. Then we can decide on either:
+      # 1. Keep this OR query if performance is not severely impacted.
+      # 2. Plan to migrate all existing data to ci_job_infos before we switch reads.
       build_relation
         .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
         .or(
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 5afeac5576c5d5..dc17c65e5f51eb 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -294,7 +294,7 @@ def self.has_job_infos?
     # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
     # have job_info records. So we just need to check one job if it has job_info.
     # We check the oldest job in the pipeline since recent retries would create a new job_info record when cloning.
-    left_joins(:job_info).order('p_ci_builds.id ASC').limit(1).pick(:job_info_id).present?
+    first&.job_info_id.present?
   end
 
   def locking_enabled?
-- 
GitLab


From b10ef62c37f14477c11449b8a6455d208a359a89 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 12 Nov 2025 17:36:14 -0800
Subject: [PATCH 11/27] Add scheduling_type column to ci_job_infos

Adds scheduling_type column to ci_job_infos
---
 app/models/ci/job_info.rb                     | 16 +++++++--
 app/models/ci/processable.rb                  | 11 +++----
 ...51031012621_create_p_ci_job_infos_table.rb |  9 ++---
 ...012831_create_p_ci_job_infos_partitions.rb |  2 ++
 db/structure.sql                              | 33 ++++++++++---------
 5 files changed, 42 insertions(+), 29 deletions(-)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 9426e74b57e68d..fa24df35371567 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -14,14 +14,22 @@ class JobInfo < Ci::ApplicationRecord
 
     ignore_column :search_vector, remove_never: true # Value is auto-generated by DB; must ignore it for bulk insert
 
-    # IMPORTANT: append new attributes at the end of this list. Do not change the order!
+    # IMPORTANT: Append new attributes at the end of this list. Do not change the order!
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
-      :scheduling_type, # This field should be required in the JSON schema with enum: 'dag' or 'stage'
+      :needs_attributes, # TODO: Should we name this to just `needs` inside the jsonb value?
+      :scheduling_type,
+      :stage_idx,
+      :name
+    ].freeze
+    NORMALIZED_DATA_COLUMNS = [
+      :scheduling_type,
       :stage_idx,
       :name
     ].freeze
-    NORMALIZED_DATA_COLUMNS = %i[stage_idx name].freeze
+
+    # Remove when these attributes are dropped from Ci::Build
+    CI_BUILD_ATTRS_TO_REMOVE = [:needs_attributes, :scheduling_type].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
@@ -38,6 +46,8 @@ class JobInfo < Ci::ApplicationRecord
 
     attribute :config, ::Gitlab::Database::Type::SymbolizedJsonb.new
 
+    enum :scheduling_type, { stage: 0, dag: 1 }, prefix: true
+
     scope :for_project, ->(project_id) { where(project_id: project_id) }
     scope :for_checksum, ->(checksum) { where(checksum: checksum) }
 
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 9d0026d12e8e2d..40fc91080aaa1a 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -160,15 +160,14 @@ class Processable < ::CommitStatus
     def self.fabricate(attrs)
       attrs = attrs.dup
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
-
-      info_attrs = if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-                     attrs.extract!(*Ci::JobInfo::CONFIG_ATTRIBUTES)
-                   else
-                     attrs.slice(*Ci::JobInfo::CONFIG_ATTRIBUTES)
-                   end
+      info_attrs = attrs.slice(*Ci::JobInfo::CONFIG_ATTRIBUTES)
 
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
 
+      if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
+        attrs.delete(*CI_BUILD_ATTRS_TO_REMOVE)
+      end
+
       new(attrs).tap do |job|
         job_definition = ::Ci::JobDefinition.fabricate(
           config: definition_attrs,
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
index 653ad93a7d30f4..bc220e9dd07bc1 100644
--- a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
+++ b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
@@ -14,6 +14,7 @@ def change
       t.bigint :partition_id, null: false
       t.bigint :project_id, null: false
       t.datetime_with_timezone :created_at, null: false
+      t.integer :scheduling_type, limit: 2, null: false
       t.integer :stage_idx, limit: 2
       t.binary :checksum, null: false
       t.tsvector :search_vector, as: "to_tsvector('english'::regconfig, COALESCE(name, ''::text))", stored: true
@@ -22,10 +23,10 @@ def change
 
       t.index [:project_id, :checksum, :partition_id], unique: true,
         name: :index_p_ci_job_infos_on_project_id_and_checksum
-      t.index [:project_id, :stage_idx], include: [:id],
-        name: :index_p_ci_job_infos_on_project_id_and_stage_idx
-      t.index [:project_id, :name], include: [:id],
-        name: :index_p_ci_job_infos_on_project_id_and_name
+      t.index [:project_id, :scheduling_type, :id],
+        name: :index_p_ci_job_infos_on_project_id_scheduling_type_and_id
+      t.index [:project_id, :stage_idx, :id],
+        name: :index_p_ci_job_infos_on_project_id_stage_idx_and_id
       t.index [:search_vector], using: :gin,
         name: :index_p_ci_job_infos_on_search_vector
     end
diff --git a/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb b/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
index 3617cf09fc9b30..0d9db99ff1fb1b 100644
--- a/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
+++ b/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
@@ -1,5 +1,7 @@
 # frozen_string_literal: true
 
+# TODO: Either this migration needs to be scoped to GitLab.com only, or we remove it
+# and rely on the partition manager to create the necessary partitions instead.
 class CreatePCiJobInfosPartitions < Gitlab::Database::Migration[2.3]
   milestone '18.6'
 
diff --git a/db/structure.sql b/db/structure.sql
index 20c5357dd76388..036ad6c39c2e83 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5788,6 +5788,21 @@ CREATE TABLE p_ci_job_definitions (
 )
 PARTITION BY LIST (partition_id);
 
+CREATE TABLE p_ci_job_infos (
+    id bigint NOT NULL,
+    partition_id bigint NOT NULL,
+    project_id bigint NOT NULL,
+    created_at timestamp with time zone NOT NULL,
+    scheduling_type smallint NOT NULL,
+    stage_idx smallint,
+    checksum bytea NOT NULL,
+    search_vector tsvector GENERATED ALWAYS AS (to_tsvector('english'::regconfig, COALESCE(name, ''::text))) STORED,
+    name text NOT NULL,
+    config jsonb DEFAULT '{}'::jsonb NOT NULL,
+    CONSTRAINT check_85f37f6053 CHECK ((char_length(name) <= 255))
+)
+PARTITION BY LIST (partition_id);
+
 CREATE TABLE p_ci_job_inputs (
     id bigint NOT NULL,
     job_id bigint NOT NULL,
@@ -22524,20 +22539,6 @@ CREATE SEQUENCE p_ci_job_definitions_id_seq
 
 ALTER SEQUENCE p_ci_job_definitions_id_seq OWNED BY p_ci_job_definitions.id;
 
-CREATE TABLE p_ci_job_infos (
-    id bigint NOT NULL,
-    partition_id bigint NOT NULL,
-    project_id bigint NOT NULL,
-    created_at timestamp with time zone NOT NULL,
-    stage_idx smallint,
-    checksum bytea NOT NULL,
-    search_vector tsvector GENERATED ALWAYS AS (to_tsvector('english'::regconfig, COALESCE(name, ''::text))) STORED,
-    name text NOT NULL,
-    config jsonb DEFAULT '{}'::jsonb NOT NULL,
-    CONSTRAINT check_85f37f6053 CHECK ((char_length(name) <= 255))
-)
-PARTITION BY LIST (partition_id);
-
 CREATE SEQUENCE p_ci_job_infos_id_seq
     START WITH 1
     INCREMENT BY 1
@@ -43368,9 +43369,9 @@ CREATE UNIQUE INDEX index_p_ci_job_definitions_on_project_id_and_checksum ON ONL
 
 CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
 
-CREATE INDEX index_p_ci_job_infos_on_project_id_and_name ON ONLY p_ci_job_infos USING btree (project_id, name) INCLUDE (id);
+CREATE INDEX index_p_ci_job_infos_on_project_id_scheduling_type_and_id ON ONLY p_ci_job_infos USING btree (project_id, scheduling_type, id);
 
-CREATE INDEX index_p_ci_job_infos_on_project_id_and_stage_idx ON ONLY p_ci_job_infos USING btree (project_id, stage_idx) INCLUDE (id);
+CREATE INDEX index_p_ci_job_infos_on_project_id_stage_idx_and_id ON ONLY p_ci_job_infos USING btree (project_id, stage_idx, id);
 
 CREATE INDEX index_p_ci_job_infos_on_search_vector ON ONLY p_ci_job_infos USING gin (search_vector);
 
-- 
GitLab


From ef3e4f39ec3987fc9f02980d0551c9d8838ac0ca Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 12 Nov 2025 17:52:57 -0800
Subject: [PATCH 12/27] Remove query updates for name and stage_idx columns

For this iteration we will not be looking to drop
name and stage_idx columns from p_ci_builds.
So this commit removes the related code changes.
---
 app/finders/ci/build_name_finder.rb           |  4 +-
 app/graphql/types/ci/job_type.rb              |  2 -
 app/graphql/types/ci/pipeline_type.rb         |  2 -
 app/models/ci/build_dependencies.rb           |  6 +-
 app/models/ci/job_info.rb                     |  2 +-
 app/models/ci/pipeline.rb                     |  2 +-
 app/models/ci/stage.rb                        | 26 ++-------
 app/models/commit_status.rb                   | 57 ++++---------------
 app/models/concerns/ci/metadatable.rb         | 11 ++--
 app/models/generic_commit_status.rb           |  2 -
 app/presenters/ci/stage_presenter.rb          |  2 -
 .../ci/create_commit_status_service.rb        |  2 -
 .../atomic_processing_service.rb              | 26 +++------
 .../status_collection.rb                      | 19 ++-----
 app/services/ci/reset_skipped_jobs_service.rb | 24 +++-----
 app/services/projects/update_pages_service.rb |  2 -
 ...51031012621_create_p_ci_job_infos_table.rb |  1 +
 spec/factories/ci/bridge.rb                   |  2 +-
 spec/factories/ci/builds.rb                   |  2 +-
 spec/factories/ci/processable.rb              | 12 ++--
 .../ci/create_pipeline_service_spec.rb        | 48 +++++++++-------
 .../atomic_processing_service_spec.rb         | 36 ++++++------
 .../support/helpers/ci/job_factory_helpers.rb |  1 +
 spec/support/helpers/ci/job_helpers.rb        | 16 ------
 24 files changed, 102 insertions(+), 205 deletions(-)

diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index 8010a7d0b4efd0..93ee91e36be927 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -43,10 +43,10 @@ def filter_by_name(build_relation)
       # 1. Keep this OR query if performance is not severely impacted.
       # 2. Plan to migrate all existing data to ci_job_infos before we switch reads.
       build_relation
-        .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+        .where("(job_info_id, partition_id) IN (?)", job_info_relation.select(:id, :partition_id))
         .or(
           build_relation
-            .where("(job_info_id, partition_id) IN (?)", job_info_relation.select(:id, :partition_id))
+            .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
         )
     end
     # rubocop: enable CodeReuse/ActiveRecord
diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index fdf4ddc41629e0..cdfec538791c8e 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -193,8 +193,6 @@ def previous_stage_jobs
 
           # This query can fetch unneeded jobs when querying for more than one pipeline.
           # It was decided that fetching and discarding the jobs is preferable to making a more complex query.
-          # TODO: How should we update this query to account for a mix of pipelines where some have jobs with job_infos
-          # and others don't?
           jobs = CommitStatus.in_pipelines(pipeline_ids).for_stage(stage_idxs).latest
           grouped_jobs = jobs.group_by { |job| [job.pipeline_id, job.stage_idx] }
 
diff --git a/app/graphql/types/ci/pipeline_type.rb b/app/graphql/types/ci/pipeline_type.rb
index 867fa0fe2d8d7a..8302539db05ef5 100644
--- a/app/graphql/types/ci/pipeline_type.rb
+++ b/app/graphql/types/ci/pipeline_type.rb
@@ -278,8 +278,6 @@ def job(id: nil, name: nil)
         if id
           pipeline.statuses.id_in(id.model_id)
         else
-          # TODO: We would have to update this to switch between by_name and
-          # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
           pipeline.latest_statuses.by_name(name)
         end.take # rubocop: disable CodeReuse/ActiveRecord
       end
diff --git a/app/models/ci/build_dependencies.rb b/app/models/ci/build_dependencies.rb
index 7ec21a1d50e479..7e821394ea96c4 100644
--- a/app/models/ci/build_dependencies.rb
+++ b/app/models/ci/build_dependencies.rb
@@ -129,11 +129,7 @@ def no_local_dependencies_specified?
     end
 
     def from_previous_stages(scope)
-      if Feature.enabled?(:read_from_ci_job_infos, project) && processable.pipeline.processables.has_job_infos?
-        scope.before_stage(processable.stage_idx)
-      else
-        scope.before_stage_from_ci_builds(processable.stage_idx)
-      end
+      scope.before_stage(processable.stage_idx)
     end
 
     def from_needs(scope)
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index fa24df35371567..ec286606de8989 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -29,7 +29,7 @@ class JobInfo < Ci::ApplicationRecord
     ].freeze
 
     # Remove when these attributes are dropped from Ci::Build
-    CI_BUILD_ATTRS_TO_REMOVE = [:needs_attributes, :scheduling_type].freeze
+    CI_BUILD_ATTRS_TO_REMOVE = [:scheduling_type].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index 5cf4fbf3b3a46d..b82ede941fc645 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -744,7 +744,7 @@ def uses_needs?
       if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_job_infos?
         processables
           .joins(:job_info)
-          .where("config ->> 'scheduling_type' = 'dag'")
+          .where(p_ci_job_infos: { scheduling_type: :dag })
           .any?
       else
         processables.where(scheduling_type: :dag).any?
diff --git a/app/models/ci/stage.rb b/app/models/ci/stage.rb
index bb47c74767f694..0e9822fa887d37 100644
--- a/app/models/ci/stage.rb
+++ b/app/models/ci/stage.rb
@@ -27,16 +27,12 @@ class Stage < Ci::ApplicationRecord
       foreign_key: :stage_id,
       partition_foreign_key: :partition_id,
       inverse_of: :ci_stage
-    # TODO: We would have to update this to switch between ordered and
-    # ordered_from_ci_builds based on FF `read_from_ci_job_infos`
     has_many :latest_statuses,
       ->(stage) { in_partition(stage).ordered.latest },
       class_name: 'CommitStatus',
       foreign_key: :stage_id,
       partition_foreign_key: :partition_id,
       inverse_of: :ci_stage
-    # TODO: We would have to update this to switch between ordered and
-    # ordered_from_ci_builds based on FF `read_from_ci_job_infos`
     has_many :retried_statuses,
       ->(stage) { in_partition(stage).ordered.retried },
       class_name: 'CommitStatus',
@@ -85,21 +81,11 @@ class Stage < Ci::ApplicationRecord
     before_validation unless: :importing? do
       next if position.present?
 
-      self.position = if Feature.enabled?(:read_from_ci_job_infos, project) && statuses.has_job_infos?
-                        statuses
-                          .select('p_ci_job_infos.stage_idx')
-                          .joins(:job_info)
-                          .where.not(p_ci_job_infos: { stage_idx: nil })
-                          .group('p_ci_job_infos.stage_idx')
-                          .order('COUNT(p_ci_builds.id) DESC')
-                          .first&.stage_idx.to_i
-                      else
-                        statuses.select(:stage_idx)
-                          .where.not(stage_idx: nil)
-                          .group(:stage_idx)
-                          .order('COUNT(id) DESC')
-                          .first&.stage_idx.to_i
-                      end
+      self.position = statuses.select(:stage_idx)
+        .where.not(stage_idx: nil)
+        .group(:stage_idx)
+        .order('COUNT(id) DESC')
+        .first&.stage_idx.to_i
     end
 
     state_machine :status, initial: :created do
@@ -232,8 +218,6 @@ def ordered_latest_statuses
     end
 
     def ordered_retried_statuses
-      # TODO: We would have to update this to switch between retried_ordered and
-      # retried_ordered_from_ci_builds based on FF `read_from_ci_job_infos`
       preload_metadata(statuses.in_order_of(:status, Ci::HasStatus::ORDERED_STATUSES).retried_ordered)
     end
 
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index dc17c65e5f51eb..b0d708956fb77d 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -74,36 +74,18 @@ class CommitStatus < Ci::ApplicationRecord
 
   scope :latest, -> { where(retried: [false, nil]) }
   scope :retried, -> { where(retried: true) }
-  scope :ordered, -> { joins(:job_info).merge(Ci::JobInfo.order(:name)) }
-  # Remove after ci_builds.name has been migrated to ci_job_infos
-  scope :ordered_from_ci_builds, -> { order(:name) }
-  scope :ordered_by_stage, -> { joins(:job_info).merge(Ci::JobInfo.order(stage_idx: :asc)) }
-  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
-  scope :ordered_by_stage_from_ci_builds, -> { order(stage_idx: :asc) }
+  scope :ordered, -> { order(:name) }
+  scope :ordered_by_stage, -> { order(stage_idx: :asc) }
   scope :latest_ordered, -> { latest.ordered.includes(project: :namespace) }
-  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
-  scope :latest_ordered_from_ci_builds, -> { latest.ordered_from_ci_builds.includes(project: :namespace) }
-  scope :retried_ordered, -> {
-    retried.joins(:job_info).order('p_ci_job_infos.name ASC, p_ci_builds.id DESC').includes(project: :namespace)
-  }
-  # Remove after ci_builds.name has been migrated to ci_job_infos
-  scope :retried_ordered_from_ci_builds, -> { retried.order(name: :asc, id: :desc).includes(project: :namespace) }
+  scope :retried_ordered, -> { retried.order(name: :asc, id: :desc).includes(project: :namespace) }
   scope :ordered_by_pipeline, -> { order(pipeline_id: :asc) }
-  scope :before_stage, ->(index) { joins(:job_info).merge(Ci::JobInfo.where('stage_idx < ?', index)) }
-  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
-  scope :before_stage_from_ci_builds, ->(index) { where('stage_idx < ?', index) }
-  scope :for_stage, ->(index) { joins(:job_info).merge(Ci::JobInfo.where(stage_idx: index)) }
-  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
-  scope :for_stage_from_ci_builds, ->(index) { joins(:job_info).merge(Ci::JobInfo.where(stage_idx: index)) }
+  scope :before_stage, ->(index) { where('stage_idx < ?', index) }
+  scope :for_stage, ->(index) { where(stage_idx: index) }
   scope :after_stage, ->(index) { where('stage_idx > ?', index) }
-  # Remove after ci_builds.stage_idx has been migrated to ci_job_infos
-  scope :after_stage_from_ci_builds, ->(index) { where('stage_idx > ?', index) }
   scope :for_project, ->(project_id) { where(project_id: project_id) }
   scope :for_ref, ->(ref) { where(ref: ref) }
   scope :for_user, ->(user) { where(user: user) }
-  scope :by_name, ->(name) { joins(:job_info).merge(Ci::JobInfo.where(name: name)) }
-  # Remove after ci_builds.name has been migrated to ci_job_infos
-  scope :by_name_from_ci_builds, ->(name) { where(name: name) }
+  scope :by_name, ->(name) { where(name: name) }
   scope :in_pipelines, ->(pipelines) { where(pipeline: pipelines) }
   scope :with_pipeline, -> { joins(:pipeline) }
   scope :updated_at_before, ->(date) { where("#{quoted_table_name}.updated_at < ?", date) }
@@ -269,11 +251,6 @@ class CommitStatus < Ci::ApplicationRecord
   end
 
   def self.names
-    joins(:job_info).select('p_ci_job_infos.name')
-  end
-
-  # Remove after ci_builds.name has been migrated to ci_job_infos
-  def self.names_from_ci_builds
     select(:name)
   end
 
@@ -380,22 +357,12 @@ def recoverable?
   end
 
   def update_older_statuses_retried!
-    if Feature.enabled?(:read_from_ci_job_infos, project) && pipeline.statuses.has_job_infos?
-      pipeline
-        .statuses
-        .latest
-        .joins(:job_info)
-        .where(p_ci_job_infos: { name: name })
-        .where.not(id: id)
-        .update_all(retried: true, processed: true)
-    else
-      pipeline
-        .statuses
-        .latest
-        .where(name: name)
-        .where.not(id: id)
-        .update_all(retried: true, processed: true)
-    end
+    pipeline
+      .statuses
+      .latest
+      .where(name: name)
+      .where.not(id: id)
+      .update_all(retried: true, processed: true)
   end
 
   def expire_etag_cache!
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 1ca45d3196dbd0..f8656d17addf3b 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -191,23 +191,24 @@ def secrets=(_value)
       raise ActiveRecord::ReadonlyAttributeError, 'This data is read only'
     end
 
+    # TODO: Remove when ci_builds.scheduling_type is dropped
     def scheduling_type
       read_job_info_attribute(:scheduling_type)
     end
 
-    # Need this method to overwrite p_ci_builds.scheduling_type enum
+    # Need this method to overwrite ci_builds.scheduling_type enum.
+    # TODO: Remove when ci_builds.scheduling_type is dropped
     def scheduling_type_dag?
       scheduling_type.nil? ? find_legacy_scheduling_type == :dag : scheduling_type.to_sym == :dag
     end
 
-    # Need this method to overwrite p_ci_builds.scheduling_type enum
+    # Need this method to overwrite ci_builds.scheduling_type enum.
+    # TODO: Remove when ci_builds.scheduling_type is dropped
     def scheduling_type_stage?
       scheduling_type.to_sym == :stage
     end
 
-    # TODO: We can remove this method after we migrate data to ci_job_infos
-    # scheduling_type column of previous builds/bridges have not been populated,
-    # so we calculate this value on runtime when we need it.
+    # TODO: We can remove this method after we migrate scheduling_type to ci_job_infos
     def find_legacy_scheduling_type
       needs.exists? ? :dag : :stage
     end
diff --git a/app/models/generic_commit_status.rb b/app/models/generic_commit_status.rb
index cef2ee529a968b..356acfa063d557 100644
--- a/app/models/generic_commit_status.rb
+++ b/app/models/generic_commit_status.rb
@@ -26,8 +26,6 @@ def detailed_status(current_user)
   def name_uniqueness_across_types
     return if !pipeline || name.blank?
 
-    # TODO: We would have to update this to switch between by_name and
-    # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
     if pipeline.statuses.by_name(name).where.not(type: type).exists?
       errors.add(:name, :taken)
     end
diff --git a/app/presenters/ci/stage_presenter.rb b/app/presenters/ci/stage_presenter.rb
index 2009baa3c71f18..a78b9311cc7c1e 100644
--- a/app/presenters/ci/stage_presenter.rb
+++ b/app/presenters/ci/stage_presenter.rb
@@ -13,8 +13,6 @@ def latest_ordered_statuses
     end
 
     def retried_ordered_statuses
-      # TODO: We would have to update this to switch between retried_ordered and
-      # retried_ordered_from_ci_builds based on FF `read_from_ci_job_infos`
       preload_statuses(stage.statuses.retried_ordered)
     end
 
diff --git a/app/services/ci/create_commit_status_service.rb b/app/services/ci/create_commit_status_service.rb
index 016002d157b32c..896249f94a9dfd 100644
--- a/app/services/ci/create_commit_status_service.rb
+++ b/app/services/ci/create_commit_status_service.rb
@@ -149,8 +149,6 @@ def find_or_build_external_commit_status
     end
 
     def external_commit_status_scope(pipeline)
-      # TODO: We would have to update this to switch between by_name and
-      # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
       scope = ::GenericCommitStatus
         .running_or_pending
         .for_project(project.id)
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service.rb b/app/services/ci/pipeline_processing/atomic_processing_service.rb
index 9b3ce703d3802a..9484c5b0ffe818 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service.rb
@@ -80,23 +80,13 @@ def load_jobs_in_batches(stage)
       end
 
       def load_jobs(ids)
-        if Feature.enabled?(:read_from_ci_job_infos, project) && pipeline.processables.has_job_infos?
-          pipeline
-            .current_processable_jobs
-            .id_in(ids)
-            .with_project_preload
-            .created
-            .ordered_by_stage
-            .select_with_aggregated_needs(project)
-        else
-          pipeline
-            .current_processable_jobs
-            .id_in(ids)
-            .with_project_preload
-            .created
-            .ordered_by_stage_from_ci_builds
-            .select_with_aggregated_needs(project)
-        end
+        pipeline
+          .current_processable_jobs
+          .id_in(ids)
+          .with_project_preload
+          .created
+          .ordered_by_stage
+          .select_with_aggregated_needs(project)
       end
 
       def sort_jobs(jobs)
@@ -158,8 +148,6 @@ def new_alive_jobs
 
         return [] if new_alive_job_names.empty?
 
-        # TODO: We would have to update this to switch between by_name and
-        # by_name_from_ci_builds based on FF `read_from_ci_job_infos`
         pipeline
           .current_jobs
           .by_name(new_alive_job_names)
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
index 7385cde2bda396..9a53c6d8fc1cd2 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service/status_collection.rb
@@ -113,21 +113,10 @@ def all_jobs
           #
           # Since we need to reprocess everything we can fetch all of them and do processing ourselves.
           strong_memoize(:all_jobs) do
-            raw_jobs = if Feature.enabled?(:read_from_ci_job_infos, pipeline.project) && \
-                pipeline.processables.has_job_infos?
-                         pipeline
-                           .current_jobs
-                           .ordered_by_stage # Already includes joins(:job_info)
-                           .pluck(<<~SQL)
-                              p_ci_builds.id, p_ci_job_infos.name, p_ci_builds.status, p_ci_builds.allow_failure,
-                              p_ci_job_infos.stage_idx, p_ci_builds.processed, p_ci_builds.lock_version
-                           SQL
-                       else
-                         pipeline
-                           .current_jobs
-                           .ordered_by_stage_from_ci_builds
-                           .pluck(*JOB_ATTRS)
-                       end
+            raw_jobs = pipeline
+              .current_jobs
+              .ordered_by_stage
+              .pluck(*JOB_ATTRS)
 
             raw_jobs.map do |row|
               JOB_ATTRS.zip(row).to_h
diff --git a/app/services/ci/reset_skipped_jobs_service.rb b/app/services/ci/reset_skipped_jobs_service.rb
index f98e9801c48156..9e5c887b31bab4 100644
--- a/app/services/ci/reset_skipped_jobs_service.rb
+++ b/app/services/ci/reset_skipped_jobs_service.rb
@@ -26,23 +26,13 @@ def reset_source_bridge
 
     # rubocop: disable CodeReuse/ActiveRecord
     def dependent_jobs
-      if Feature.enabled?(:read_from_ci_job_infos, @pipeline.project) && @pipeline.processables.has_job_infos?
-        ordered_by_dag(
-          @pipeline.processables
-            .from_union(needs_dependent_jobs, stage_dependent_jobs)
-            .skipped
-            .ordered_by_stage
-            .preload(:needs)
-        )
-      else
-        ordered_by_dag(
-          @pipeline.processables
-            .from_union(needs_dependent_jobs, stage_dependent_jobs)
-            .skipped
-            .ordered_by_stage_from_ci_builds
-            .preload(:needs)
-        )
-      end
+      ordered_by_dag(
+        @pipeline.processables
+          .from_union(needs_dependent_jobs, stage_dependent_jobs)
+          .skipped
+          .ordered_by_stage
+          .preload(:needs)
+      )
     end
 
     def process(job)
diff --git a/app/services/projects/update_pages_service.rb b/app/services/projects/update_pages_service.rb
index cda7cfacc46e8f..7623841cb1d122 100644
--- a/app/services/projects/update_pages_service.rb
+++ b/app/services/projects/update_pages_service.rb
@@ -64,8 +64,6 @@ def error(message)
 
     # Create status notifying the deployment of pages
     def commit_status
-      # TODO: Should we have a fabricate method for GenericCommitStatus
-      # to create job_info record? (for name and stage_idx)
       GenericCommitStatus.new(
         user: build.user,
         ci_stage: stage,
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
index bc220e9dd07bc1..dc636f7a285a30 100644
--- a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
+++ b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
@@ -23,6 +23,7 @@ def change
 
       t.index [:project_id, :checksum, :partition_id], unique: true,
         name: :index_p_ci_job_infos_on_project_id_and_checksum
+      # TODO: We can probably make this a partial index instead `WHERE scheduling_type = 1`
       t.index [:project_id, :scheduling_type, :id],
         name: :index_p_ci_job_infos_on_project_id_scheduling_type_and_id
       t.index [:project_id, :stage_idx, :id],
diff --git a/spec/factories/ci/bridge.rb b/spec/factories/ci/bridge.rb
index e5b137cfdd65c7..6caa51adf3c237 100644
--- a/spec/factories/ci/bridge.rb
+++ b/spec/factories/ci/bridge.rb
@@ -7,6 +7,7 @@
   factory :ci_bridge, class: 'Ci::Bridge', parent: :ci_processable do
     instance_eval ::Factories::Ci::Deployable.traits
 
+    name { 'bridge' }
     created_at { '2013-10-29 09:50:00 CET' }
     status { :created }
 
@@ -21,7 +22,6 @@
       options { { trigger: {} } }
       downstream { nil }
       upstream { nil }
-      name { 'bridge' }
     end
 
     after(:build) do |bridge, evaluator|
diff --git a/spec/factories/ci/builds.rb b/spec/factories/ci/builds.rb
index bf759459c5f19f..99230176e71307 100644
--- a/spec/factories/ci/builds.rb
+++ b/spec/factories/ci/builds.rb
@@ -7,6 +7,7 @@
   factory :ci_build, class: 'Ci::Build', parent: :ci_processable do
     instance_eval ::Factories::Ci::Deployable.traits
 
+    name { 'test' }
     add_attribute(:protected) { false }
     created_at { 'Di 29. Okt 09:50:00 CET 2013' }
     pending
@@ -36,7 +37,6 @@
 
       id_tokens { nil }
       scheduling_type { 'stage' }
-      name { 'test' }
     end
 
     after(:build) do |build, evaluator|
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 5ca110b80fe1d3..ff5aeb76d915c2 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -4,6 +4,8 @@
 
 FactoryBot.define do
   factory :ci_processable, class: 'Ci::Processable' do
+    name { 'processable' }
+    stage_idx { ci_stage.try(:position) || 0 }
     ref { 'master' }
     tag { false }
     pipeline factory: :ci_pipeline
@@ -20,8 +22,6 @@
       yaml_variables { [] }
       stage { 'test' }
       scheduling_type { 'stage' }
-      stage_idx { ci_stage.try(:position) || 0 }
-      name { 'processable' }
     end
 
     after(:stub, :build) do |processable, evaluator|
@@ -32,16 +32,14 @@
         Ci::JobFactoryHelpers.mutate_temp_job_info(
           processable,
           scheduling_type: evaluator.scheduling_type,
-          stage_idx: evaluator.stage_idx,
-          name: evaluator.name
+          stage_idx: processable.stage_idx,
+          name: processable.name
         )
       end
 
       if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, processable.project)
         processable.assign_attributes(
-          scheduling_type: evaluator.scheduling_type,
-          stage_idx: evaluator.stage_idx,
-          name: evaluator.name
+          scheduling_type: evaluator.scheduling_type
         )
       end
     end
diff --git a/spec/services/ci/create_pipeline_service_spec.rb b/spec/services/ci/create_pipeline_service_spec.rb
index fecc7b296e6a4f..d30f93af368ac2 100644
--- a/spec/services/ci/create_pipeline_service_spec.rb
+++ b/spec/services/ci/create_pipeline_service_spec.rb
@@ -231,7 +231,7 @@ def execute_service(
             it 'is not cancelable' do
               pipeline = execute_service.payload
 
-              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_falsy
+              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_falsy
             end
           end
 
@@ -244,7 +244,7 @@ def execute_service(
             it 'is cancelable' do
               pipeline = execute_service.payload
 
-              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_truthy
+              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_truthy
             end
           end
 
@@ -257,7 +257,7 @@ def execute_service(
             it 'is not cancelable' do
               pipeline = execute_service.payload
 
-              expect(find_job_by_name(pipeline.builds, 'rspec').interruptible).to be_falsy
+              expect(pipeline.builds.find_by(name: 'rspec').interruptible).to be_falsy
             end
           end
         end
@@ -305,8 +305,7 @@ def execute_service(
               pipeline_on_previous_commit
                 .builds
                 .joins(:job_definition)
-                .joins(:job_info)
-                .pluck('p_ci_job_infos.name', "#{Ci::JobDefinition.quoted_table_name}.interruptible")
+                .pluck(:name, "#{Ci::JobDefinition.quoted_table_name}.interruptible")
 
             expect(interruptible_status).to contain_exactly(
               ['build_1_1', true],
@@ -320,7 +319,10 @@ def execute_service(
           context 'when only interruptible builds are running' do
             context 'when build marked explicitly by interruptible is running' do
               it 'cancels running outdated pipelines', :sidekiq_inline do
-                find_job_by_name(pipeline_on_previous_commit.builds, 'build_1_2').run!
+                pipeline_on_previous_commit
+                  .builds
+                  .find_by_name('build_1_2')
+                  .run!
 
                 pipeline
 
@@ -331,7 +333,8 @@ def execute_service(
 
             context 'when build that is not marked as interruptible is running' do
               it 'cancels running outdated pipelines', :sidekiq_inline do
-                build_2_1 = find_job_by_name(pipeline_on_previous_commit.builds, 'build_2_1')
+                build_2_1 = pipeline_on_previous_commit
+                  .builds.find_by_name('build_2_1')
 
                 build_2_1.enqueue!
                 build_2_1.reset.run!
@@ -346,7 +349,8 @@ def execute_service(
 
           context 'when an uninterruptible build is running' do
             it 'does not cancel running outdated pipelines', :sidekiq_inline do
-              build_3_1 = find_job_by_name(pipeline_on_previous_commit.builds, 'build_3_1')
+              build_3_1 = pipeline_on_previous_commit
+                .builds.find_by_name('build_3_1')
 
               build_3_1.enqueue!
               build_3_1.reset.run!
@@ -362,7 +366,10 @@ def execute_service(
             it 'cancels running outdated pipelines', :sidekiq_might_not_need_inline do
               allow(Ci::BuildScheduleWorker).to receive(:perform_at)
 
-              find_job_by_name(pipeline_on_previous_commit.builds, 'build_2_1').schedule!
+              pipeline_on_previous_commit
+                .builds
+                .find_by_name('build_2_1')
+                .schedule!
 
               pipeline
 
@@ -373,7 +380,10 @@ def execute_service(
 
           context 'when a uninterruptible build has finished' do
             it 'does not cancel running outdated pipelines', :sidekiq_might_not_need_inline do
-              find_job_by_name(pipeline_on_previous_commit.builds, 'build_3_1').success!
+              pipeline_on_previous_commit
+                .builds
+                .find_by_name('build_3_1')
+                .success!
 
               pipeline
 
@@ -749,7 +759,7 @@ def previous_commit_sha_from_ref(ref)
 
     context 'when builds with auto-retries are configured' do
       let(:pipeline)  { execute_service.payload }
-      let(:rspec_job) { find_job_by_name(pipeline.builds, 'rspec') }
+      let(:rspec_job) { pipeline.builds.find_by(name: 'rspec') }
 
       before do
         stub_ci_pipeline_yaml_file(YAML.dump({
@@ -789,7 +799,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'persists the association correctly' do
           result = execute_service.payload
-          deploy_job = find_job_by_name(result.builds, :test)
+          deploy_job = result.builds.find_by_name!(:test)
           resource_group = project.resource_groups.find_by_key!(resource_group_key)
 
           expect(result).to be_persisted
@@ -844,8 +854,8 @@ def previous_commit_sha_from_ref(ref)
 
       it 'persists the association correctly' do
         result = execute_service.payload
-        deploy_job = find_job_by_name(result.builds, :review_app)
-        stop_job = find_job_by_name(result.builds, :stop_review_app)
+        deploy_job = result.builds.find_by_name!(:review_app)
+        stop_job = result.builds.find_by_name!(:stop_review_app)
 
         expect(result).to be_persisted
         expect(deploy_job.resource_group.key).to eq('review/master')
@@ -880,7 +890,7 @@ def previous_commit_sha_from_ref(ref)
           pipeline = execute_service.payload
 
           expect(pipeline).to be_persisted
-          expect(find_job_by_name(pipeline.builds, 'rspec').options[:job_timeout]).to eq 123
+          expect(pipeline.builds.find_by(name: 'rspec').options[:job_timeout]).to eq 123
         end
       end
     end
@@ -1401,7 +1411,7 @@ def previous_commit_sha_from_ref(ref)
               expect(pipeline).to be_persisted
               expect(pipeline).to be_merge_request_event
               expect(pipeline.merge_request).to eq(merge_request)
-              expect(pluck_job_names(pipeline.builds.order(:stage_id))).to eq(%w[test])
+              expect(pipeline.builds.order(:stage_id).pluck(:name)).to eq(%w[test])
             end
 
             it 'persists the specified source sha' do
@@ -1635,7 +1645,7 @@ def previous_commit_sha_from_ref(ref)
             expect(pipeline).to be_persisted
             expect(pipeline).to be_web
             expect(pipeline.merge_request).to be_nil
-            expect(pluck_job_names(pipeline.builds.order(:stage_id))).to eq(%w[build pages])
+            expect(pipeline.builds.order(:stage_id).pluck(:name)).to eq(%w[build pages])
           end
         end
       end
@@ -1675,7 +1685,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'creates a pipeline with build_a and test_a' do
           expect(pipeline).to be_persisted
-          expect(pluck_job_names(pipeline.builds)).to contain_exactly("build_a", "test_a")
+          expect(pipeline.builds.pluck(:name)).to contain_exactly("build_a", "test_a")
         end
 
         it 'bulk inserts all needs' do
@@ -1732,7 +1742,7 @@ def previous_commit_sha_from_ref(ref)
 
         it 'does create a pipeline only with deploy' do
           expect(pipeline).to be_persisted
-          expect(pluck_job_names(pipeline.builds)).to contain_exactly("deploy")
+          expect(pipeline.builds.pluck(:name)).to contain_exactly("deploy")
         end
       end
     end
diff --git a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
index 63148aaf5a1381..fef18cd2cdb7cb 100644
--- a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
+++ b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
@@ -741,12 +741,12 @@ def event_on_pipeline(event)
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2']
 
-          find_job_by_name(pipeline.builds, 'test:1').success!
-          find_job_by_name(pipeline.builds, name: 'test:2').drop!
+          pipeline.builds.find_by(name: 'test:1').success!
+          pipeline.builds.find_by(name: 'test:2').drop!
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2']
 
-          Ci::RetryJobService.new(pipeline.project, user).execute(find_job_by_name(pipeline.builds, 'test:2'))[:job].reset.success!
+          Ci::RetryJobService.new(pipeline.project, user).execute(pipeline.builds.find_by(name: 'test:2'))[:job].reset.success!
 
           expect(builds_names).to eq ['build:1', 'build:2', 'test:1', 'test:2',
             'test:2', 'deploy:1', 'deploy:2']
@@ -1022,8 +1022,8 @@ def event_on_pipeline(event)
         Ci::CreatePipelineService.new(project, user, { ref: 'master' }).execute(:push).payload
       end
 
-      let(:manual1) { find_job_by_name(all_builds, 'manual1') }
-      let(:manual2) { find_job_by_name(all_builds, 'manual2') }
+      let(:manual1) { all_builds.find_by(name: 'manual1') }
+      let(:manual2) { all_builds.find_by(name: 'manual2') }
 
       let(:statuses_0) do
         { manual1: 'created', manual2: 'created', test1: 'created', test2: 'created', deploy1: 'created', deploy2: 'created' }
@@ -1124,8 +1124,8 @@ def event_on_pipeline(event)
         # to either manual1 or manual2. Otherwise, the assigned user will depend on which of
         # the new alive jobs get processed first by ResetSkippedJobsService.
         it 'assigns the correct user to the dependent jobs' do
-          test1 = find_job_by_name(all_builds, 'test1')
-          test2 = find_job_by_name(all_builds, 'test2')
+          test1 = all_builds.find_by(name: 'test1')
+          test2 = all_builds.find_by(name: 'test2')
 
           expect(test1.user).to eq(user)
           expect(test2.user).to eq(user)
@@ -1198,8 +1198,8 @@ def event_on_pipeline(event)
         # bridge jobs directly transition to success
         expect(all_builds_statuses).to contain_exactly('success', 'success', 'success')
 
-        bridge1 = find_job_by_name(all_builds, 'deploy: [ovh, monitoring]')
-        bridge2 = find_job_by_name(all_builds, 'deploy: [ovh, app]')
+        bridge1 = all_builds.find_by(name: 'deploy: [ovh, monitoring]')
+        bridge2 = all_builds.find_by(name: 'deploy: [ovh, app]')
 
         downstream_job1 = bridge1.downstream_pipeline.all_jobs.first
         downstream_job2 = bridge2.downstream_pipeline.all_jobs.first
@@ -1352,12 +1352,12 @@ def event_on_pipeline(event)
         Ci::CreatePipelineService.new(project, user, { ref: 'master' }).execute(:push).payload
       end
 
-      let(:test_job) { find_job_by_name(all_builds, 'test') }
-      let(:review_deploy_job) { find_job_by_name(all_builds, 'review') }
-      let(:staging_deploy_job) { find_job_by_name(all_builds, 'staging') }
-      let(:canary_deploy_job) { find_job_by_name(all_builds, 'canary') }
-      let(:production_a_deploy_job) { find_job_by_name(all_builds, 'production-a') }
-      let(:production_b_deploy_job) { find_job_by_name(all_builds, 'production-b') }
+      let(:test_job) { all_builds.find_by(name: 'test') }
+      let(:review_deploy_job) { all_builds.find_by(name: 'review') }
+      let(:staging_deploy_job) { all_builds.find_by(name: 'staging') }
+      let(:canary_deploy_job) { all_builds.find_by(name: 'canary') }
+      let(:production_a_deploy_job) { all_builds.find_by(name: 'production-a') }
+      let(:production_b_deploy_job) { all_builds.find_by(name: 'production-b') }
 
       before do
         create(:environment, name: 'review', project: project)
@@ -1481,15 +1481,15 @@ def cancel_running_or_pending
     end
 
     def play_manual_action(name)
-      find_job_by_name(builds, name).play(user)
+      builds.find_by(name: name).play(user)
     end
 
     def enqueue_scheduled(name)
-      find_job_by_name(builds.scheduled, name).enqueue!
+      builds.scheduled.find_by(name: name).enqueue!
     end
 
     def retry_build(name)
-      Ci::RetryJobService.new(project, user).execute(find_job_by_name(builds, name))
+      Ci::RetryJobService.new(project, user).execute(builds.find_by(name: name))
     end
 
     def manual_actions
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index cb6512c67357df..9b58a001f11b7d 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -33,6 +33,7 @@ def self.mutate_temp_job_info(job, **new_config)
       )
 
       new_temp_job_info.validate
+      # TODO: Update this to raise on other column validation errors too
       config_errors = new_temp_job_info.errors[:config]
       raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
 
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index b48c95e681a029..4775875efa48e2 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -54,21 +54,5 @@ def stub_ci_job_info(job, **new_config)
 
       allow(job).to receive(:job_info).and_return(new_job_info)
     end
-
-    def find_job_by_name(jobs, name)
-      if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project)
-        jobs.joins(:job_info).find_by(job_info: { name: name })
-      else
-        jobs.find_by(name: name)
-      end
-    end
-
-    def pluck_job_names(jobs)
-      if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, project)
-        jobs.joins(:job_info).pluck('p_ci_job_infos.name')
-      else
-        jobs.pluck(:name)
-      end
-    end
   end
 end
-- 
GitLab


From 64e6b85f95b6e114267a0332c32cfef669601790 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 13 Nov 2025 14:44:25 -0800
Subject: [PATCH 13/27] Fix specs and update comments

Fixes specs and updates comments with
reference to recent feedback on mR.
---
 app/models/ci/job_info.rb                     |  5 ++--
 app/models/ci/pipeline.rb                     |  9 ++++---
 app/models/ci/processable.rb                  | 11 ++++----
 app/models/concerns/ci/metadatable.rb         | 15 ++++++++---
 .../ci/create_commit_status_service.rb        |  1 -
 app/services/ci/update_build_names_service.rb | 27 ++++---------------
 app/services/projects/update_pages_service.rb |  6 +++++
 db/fixtures/development/14_pipelines.rb       |  1 -
 ...51031012621_create_p_ci_job_infos_table.rb |  4 ++-
 ...9_add_job_info_id_column_to_p_ci_builds.rb |  2 +-
 spec/models/ci/bridge_spec.rb                 |  1 +
 spec/models/ci/build_spec.rb                  |  4 ++-
 .../ci/update_build_names_service_spec.rb     |  4 +++
 spec/support/helpers/ci/job_helpers.rb        |  7 ++++-
 14 files changed, 54 insertions(+), 43 deletions(-)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index ec286606de8989..b0cce08398dfa0 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -17,7 +17,6 @@ class JobInfo < Ci::ApplicationRecord
     # IMPORTANT: Append new attributes at the end of this list. Do not change the order!
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
-      :needs_attributes, # TODO: Should we name this to just `needs` inside the jsonb value?
       :scheduling_type,
       :stage_idx,
       :name
@@ -28,8 +27,8 @@ class JobInfo < Ci::ApplicationRecord
       :name
     ].freeze
 
-    # Remove when these attributes are dropped from Ci::Build
-    CI_BUILD_ATTRS_TO_REMOVE = [:scheduling_type].freeze
+    # We're copying over these values to ci_job_infos but not dropping them from ci_builds
+    CI_BUILD_ATTRS_TO_KEEP = [:stage_idx, :name].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index b82ede941fc645..dcb8e275ab0f35 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -106,7 +106,7 @@ class Pipeline < Ci::ApplicationRecord
     # DEPRECATED:
     has_many :statuses, ->(pipeline) { in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :processables, ->(pipeline) { in_partition(pipeline) }, class_name: 'Ci::Processable', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
-    # TODO: What are we still using this association for? Can we just remove it?
+    # TODO: We can remove this association; it's unused.
     has_many :latest_statuses_ordered_by_stage, ->(pipeline) { latest.in_partition(pipeline).order(:stage_idx, :stage) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :latest_statuses, ->(pipeline) { latest.in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :statuses_order_id_desc, ->(pipeline) { in_partition(pipeline).order_id_desc }, class_name: 'CommitStatus', foreign_key: :commit_id,
@@ -741,6 +741,9 @@ def trigger_status_change_subscriptions
     end
 
     def uses_needs?
+      # TODO: Check if query performance is better with:
+      # 1. ci_job_infos index on only (scheduling_type, id), or
+      # 2. Scope ci_job_infos WHERE clause to project_id and have index on (project_id, scheduling_type, id).
       if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_job_infos?
         processables
           .joins(:job_info)
@@ -1593,8 +1596,8 @@ def source_ref_path
 
     # Set scheduling type of processables if they were created before scheduling_type
     # data was deployed (https://gitlab.com/gitlab-org/gitlab/-/merge_requests/22246).
-    # TODO: We can remove this method after we migrate all existing data to ci_job_infos.
-    # Jobs with nil scheduling_type can be populated with the logic in Ci::Processable#populate_scheduling_type!
+    # TODO: We probably don't need this method anymore.
+    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
     def ensure_scheduling_type!
       processables.populate_scheduling_type!
     end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 40fc91080aaa1a..3945ec13eb05a2 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -165,7 +165,7 @@ def self.fabricate(attrs)
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-        attrs.delete(*CI_BUILD_ATTRS_TO_REMOVE)
+        attrs.delete(*[Ci::JobInfo::CONFIG_ATTRIBUTES - Ci::JobInfo::CI_BUILD_ATTRS_TO_KEEP])
       end
 
       new(attrs).tap do |job|
@@ -203,12 +203,10 @@ def self.select_with_aggregated_needs(project)
 
     # Old processables may have scheduling_type as nil,
     # so we need to ensure the data exists before using it.
+    # TODO: We probably don't need this method anymore.
+    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
     def self.populate_scheduling_type!
       needs = Ci::BuildNeed.scoped_build.select(1)
-      # TODO: If scheduling_type is nil, it means it's an old job that doesn't already
-      # have a job_info record, so we can create a new one for them.
-      # We can remove this method after we migrate existing data to ci_job_infos.
-      # When migrating, jobs with nil scheduling_type can be populated with the logic below.
       where(scheduling_type: nil).update_all(
         "scheduling_type = CASE WHEN (EXISTS (#{needs.to_sql}))
          THEN #{scheduling_types[:dag]}
@@ -304,7 +302,8 @@ def needs_attributes
       end
     end
 
-    # TODO: We can remove this method after we migrate data to ci_job_infos
+    # TODO: We probably don't need this method anymore.
+    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
     def ensure_scheduling_type!
       # If this has a scheduling_type, it means all processables in the pipeline already have.
       return if scheduling_type
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index f8656d17addf3b..b8a5891e2ca09b 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -218,8 +218,18 @@ def stage_idx
       read_job_info_attribute(:stage_idx)
     end
 
-    def name
-      read_job_info_attribute(:name)
+    # We're keeping this column in ci_builds but it's copied over to ci_job_infos so it needs to be immutable
+    def name=(value)
+      raise ActiveRecord::ReadonlyAttributeError, 'This data is read only' if persisted?
+
+      write_attribute(:name, value)
+    end
+
+    # We're keeping this column in ci_builds but it's copied over to ci_job_infos so it needs to be immutable
+    def stage_idx=(value)
+      raise ActiveRecord::ReadonlyAttributeError, 'This data is read only' if persisted?
+
+      write_attribute(:stage_idx, value)
     end
 
     private
@@ -236,7 +246,6 @@ def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, defaul
 
     def read_job_info_attribute(key, default_value: nil)
       if read_from_ci_job_infos?
-        # TODO: Not really the nicest way to do this; refactor?
         result = if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
                    job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
                  else
diff --git a/app/services/ci/create_commit_status_service.rb b/app/services/ci/create_commit_status_service.rb
index 896249f94a9dfd..e3b2ec095350c4 100644
--- a/app/services/ci/create_commit_status_service.rb
+++ b/app/services/ci/create_commit_status_service.rb
@@ -139,7 +139,6 @@ def external_commit_status_exists?
     end
 
     def find_or_build_external_commit_status
-      # TODO: Should we update this to use a fabricate method to create job_info record?
       external_commit_status_scope(pipeline).find_or_initialize_by( # rubocop:disable CodeReuse/ActiveRecord
         ci_stage: stage,
         stage_idx: stage.position
diff --git a/app/services/ci/update_build_names_service.rb b/app/services/ci/update_build_names_service.rb
index a73630a32e1056..3ed418dbf7678c 100644
--- a/app/services/ci/update_build_names_service.rb
+++ b/app/services/ci/update_build_names_service.rb
@@ -11,8 +11,7 @@ def initialize(pipeline)
     end
 
     def execute
-      # TODO: return if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations)
-      # Ensure job search functionality works without this service/table.
+      return if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, pipeline.project)
 
       scope = pipeline.builds.latest
       iterator = Gitlab::Pagination::Keyset::Iterator.new(scope: scope)
@@ -27,21 +26,10 @@ def execute
     def upsert_records(batch)
       keys = %i[build_id partition_id name project_id]
 
-      builds_name_data = if read_from_ci_job_infos?
-                           batch
-                             .left_joins(:job_info)
-                             .select(<<~SQL)
-                               p_ci_builds.id,
-                               p_ci_builds.partition_id,
-                               COALESCE(p_ci_job_infos.name, p_ci_builds.name) AS job_name,
-                               p_ci_builds.project_id
-                             SQL
-                             .map { |record| record.values_at(:id, :partition_id, :job_name, :project_id) }
-                         else
-                           batch.pluck(:id, :partition_id, :name, :project_id)
-                         end
-
-      builds_upsert_data = builds_name_data.map { |values| Hash[keys.zip(values)] }
+      builds_upsert_data =
+        batch
+          .pluck(:id, :partition_id, :name, :project_id)
+          .map { |values| Hash[keys.zip(values)] }
 
       return unless builds_upsert_data.any?
 
@@ -49,10 +37,5 @@ def upsert_records(batch)
     end
     # rubocop: enable CodeReuse/ActiveRecord
     # rubocop: enable Database/AvoidUsingPluckWithoutLimit
-
-    def read_from_ci_job_infos?
-      Feature.enabled?(:read_from_ci_job_infos, pipeline.project)
-    end
-    strong_memoize_attr :read_from_ci_job_infos?
   end
 end
diff --git a/app/services/projects/update_pages_service.rb b/app/services/projects/update_pages_service.rb
index 7623841cb1d122..df3d7ae6057c49 100644
--- a/app/services/projects/update_pages_service.rb
+++ b/app/services/projects/update_pages_service.rb
@@ -63,6 +63,12 @@ def error(message)
     end
 
     # Create status notifying the deployment of pages
+    # NOTE: We probably don't need to use .fabricate here because the job_info
+    # record is only needed for setting:
+    # 1. ci_job_infos.scheduling_type: Only queried in Pipeline#uses_needs?;
+    # having no job_info record for this job won't affect result.
+    # 2. ci_job_infos.name: Only queried for Ci::BuildNameFinder, which this commit status
+    # currently doesn't support anyway because it doesn't create a `build_names` record.
     def commit_status
       GenericCommitStatus.new(
         user: build.user,
diff --git a/db/fixtures/development/14_pipelines.rb b/db/fixtures/development/14_pipelines.rb
index 524d2964a7da3a..a65dc4b049dab7 100644
--- a/db/fixtures/development/14_pipelines.rb
+++ b/db/fixtures/development/14_pipelines.rb
@@ -290,7 +290,6 @@ def runners
     @runners ||= FactoryBot.create_list(:ci_runner, 6)
   end
 
-  # TODO: How should we deal with generic commit statuses? Should it have the .fabricate method instead of Processable?
   def job_attributes(pipeline, stage, opts)
     {
       name: 'test build', ci_stage: stage, stage_idx: stage.position,
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
index dc636f7a285a30..0f9542cf5daba0 100644
--- a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
+++ b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
@@ -23,9 +23,11 @@ def change
 
       t.index [:project_id, :checksum, :partition_id], unique: true,
         name: :index_p_ci_job_infos_on_project_id_and_checksum
-      # TODO: We can probably make this a partial index instead `WHERE scheduling_type = 1`
+      # TODO: We can probably make this a partial index instead `WHERE scheduling_type = 1`.
+      # Also need to evaluate if this index is better with/without project_id.
       t.index [:project_id, :scheduling_type, :id],
         name: :index_p_ci_job_infos_on_project_id_scheduling_type_and_id
+      # TODO: Evaluate if this index is better with/without project_id.
       t.index [:project_id, :stage_idx, :id],
         name: :index_p_ci_job_infos_on_project_id_stage_idx_and_id
       t.index [:search_vector], using: :gin,
diff --git a/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb b/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
index ad207d4f316f2e..3c23d792b4ca00 100644
--- a/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
+++ b/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
@@ -5,7 +5,7 @@ class AddJobInfoIdColumnToPCiBuilds < Gitlab::Database::Migration[2.3]
 
   # rubocop:disable Migration/PreventAddingColumns -- Required to deduplicate data into ci_job_infos table
   def up
-    # TODO: Should be changed into a non-nullable column later
+    # NOTE: We can probably keep this column as NULL-able because generic commit statuses may not have a job_info record
     add_column :p_ci_builds, :job_info_id, :bigint, if_not_exists: true
   end
 
diff --git a/spec/models/ci/bridge_spec.rb b/spec/models/ci/bridge_spec.rb
index 3476b4c9cb8798..323222984b9cda 100644
--- a/spec/models/ci/bridge_spec.rb
+++ b/spec/models/ci/bridge_spec.rb
@@ -86,6 +86,7 @@
         pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
         scheduling_type ci_stage partition_id resource_group
+        job_info_id
       ]
 
       expect(described_class.clone_accessors).to eq(expected_accessors)
diff --git a/spec/models/ci/build_spec.rb b/spec/models/ci/build_spec.rb
index 39170c89904f0e..5ab708257ed7b5 100644
--- a/spec/models/ci/build_spec.rb
+++ b/spec/models/ci/build_spec.rb
@@ -4826,7 +4826,9 @@ def run_job_without_exception
     with_them do
       before do
         stub_pages_setting(enabled: enabled)
-        build.update!(name: name)
+        # TODO: Update all specs that change Ci::JobInfo::CONFIG_ATTRIBUTES
+        # to either utilize the job factory or job info stub helper.
+        stub_ci_job_info(build, name: name)
         stub_ci_job_definition(build, options: { pages: pages_config })
         stub_feature_flags(customizable_pages_job_name: true)
       end
diff --git a/spec/services/ci/update_build_names_service_spec.rb b/spec/services/ci/update_build_names_service_spec.rb
index 9b20651b565dd6..a23ba318960d0a 100644
--- a/spec/services/ci/update_build_names_service_spec.rb
+++ b/spec/services/ci/update_build_names_service_spec.rb
@@ -10,6 +10,10 @@
   let_it_be(:build3) { create(:ci_build, name: 'build3', pipeline: pipeline) }
   let_it_be(:bridge1) { create(:ci_bridge, name: 'bridge1', pipeline: pipeline) }
 
+  before do
+    stub_feature_flags(stop_writing_ci_job_info_to_old_destinations: false)
+  end
+
   describe '#execute' do
     subject(:service) { described_class.new(pipeline) }
 
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 4775875efa48e2..20faaf8d7c5ab7 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -49,10 +49,15 @@ def stub_ci_job_info(job, **new_config)
       )
 
       new_job_info.validate
+      # TODO: Update this to catch other column validation errors too.
       config_errors = new_job_info.errors[:config]
       raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
 
-      allow(job).to receive(:job_info).and_return(new_job_info)
+      allow(job).to receive_messages(
+        job_info: new_job_info,
+        name: new_job_info.name, # Stub columns we're still keeping in ci_builds
+        stage_idx: new_job_info.stage_idx
+      )
     end
   end
 end
-- 
GitLab


From c8240aaa39d654ba4d6fe5d44453cb3744f8f603 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 13 Nov 2025 15:40:04 -0800
Subject: [PATCH 14/27] Increase known index limit for p_ci_builds

---
 spec/db/schema_spec.rb | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/spec/db/schema_spec.rb b/spec/db/schema_spec.rb
index e274a854bc8c7f..75bbac1d87cd39 100644
--- a/spec/db/schema_spec.rb
+++ b/spec/db/schema_spec.rb
@@ -294,7 +294,7 @@
       merge_requests: 29,
       namespaces: 26,
       notes: 16,
-      p_ci_builds: 26,
+      p_ci_builds: 27,
       p_ci_pipelines: 24,
       packages_package_files: 16,
       packages_packages: 27,
-- 
GitLab


From 55e7f110bfada9ebaf87bbe688a05b298bcf53fe Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Mon, 17 Nov 2025 11:21:02 -0800
Subject: [PATCH 15/27] Fix some tests & add preloads

Fix tests and preloads.
---
 app/models/ci/bridge.rb                                   | 2 +-
 app/models/ci/build.rb                                    | 2 +-
 app/models/commit_status.rb                               | 4 ++++
 app/models/concerns/ci/metadatable.rb                     | 8 ++------
 app/models/project.rb                                     | 1 +
 app/services/ci/clone_job_service.rb                      | 2 +-
 .../ci/pipeline_processing/atomic_processing_service.rb   | 1 +
 lib/gitlab/import_export/project/import_export.yml        | 4 ++++
 lib/gitlab/import_export/project/relation_factory.rb      | 3 ++-
 spec/lib/gitlab/import_export/all_models.yml              | 5 +++++
 10 files changed, 22 insertions(+), 10 deletions(-)

diff --git a/app/models/ci/bridge.rb b/app/models/ci/bridge.rb
index 700a7e4641b101..e42fce7196d97d 100644
--- a/app/models/ci/bridge.rb
+++ b/app/models/ci/bridge.rb
@@ -104,7 +104,7 @@ def self.clone_accessors
       %i[pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
         scheduling_type ci_stage partition_id resource_group
-        job_info_id].freeze
+        job_info].freeze
     end
 
     def retryable?
diff --git a/app/models/ci/build.rb b/app/models/ci/build.rb
index a382f1e74a183c..9f7f2e0a1531ec 100644
--- a/app/models/ci/build.rb
+++ b/app/models/ci/build.rb
@@ -287,7 +287,7 @@ def clone_accessors
           needs_attributes job_variables_attributes resource_group
           scheduling_type timeout timeout_source debug_trace_enabled
           ci_stage partition_id execution_config_id inputs_attributes
-          job_info_id].freeze
+          job_info].freeze
       end
 
       def supported_keyset_orderings
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index b0d708956fb77d..bc320934f47b5a 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -114,6 +114,10 @@ class CommitStatus < Ci::ApplicationRecord
     preload(project: :namespace)
   end
 
+  scope :with_job_info_preload, -> do
+    preload(:job_info)
+  end
+
   scope :scoped_pipeline, -> do
     where(arel_table[:commit_id].eq(Ci::Pipeline.arel_table[:id]))
     .where(arel_table[:partition_id].eq(Ci::Pipeline.arel_table[:partition_id]))
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index b8a5891e2ca09b..ff4053f17b5dd9 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -192,32 +192,28 @@ def secrets=(_value)
     end
 
     # TODO: Remove when ci_builds.scheduling_type is dropped
+    # and delegate to Ci::JobInfo.
     def scheduling_type
       read_job_info_attribute(:scheduling_type)
     end
 
     # Need this method to overwrite ci_builds.scheduling_type enum.
-    # TODO: Remove when ci_builds.scheduling_type is dropped
     def scheduling_type_dag?
       scheduling_type.nil? ? find_legacy_scheduling_type == :dag : scheduling_type.to_sym == :dag
     end
 
     # Need this method to overwrite ci_builds.scheduling_type enum.
-    # TODO: Remove when ci_builds.scheduling_type is dropped
     def scheduling_type_stage?
       scheduling_type.to_sym == :stage
     end
 
     # TODO: We can remove this method after we migrate scheduling_type to ci_job_infos
+    # because no scheduling_type would be nil.
     def find_legacy_scheduling_type
       needs.exists? ? :dag : :stage
     end
     strong_memoize_attr :find_legacy_scheduling_type
 
-    def stage_idx
-      read_job_info_attribute(:stage_idx)
-    end
-
     # We're keeping this column in ci_builds but it's copied over to ci_job_infos so it needs to be immutable
     def name=(value)
       raise ActiveRecord::ReadonlyAttributeError, 'This data is read only' if persisted?
diff --git a/app/models/project.rb b/app/models/project.rb
index 5d55da4dd0e016..57f488722a5b77 100644
--- a/app/models/project.rb
+++ b/app/models/project.rb
@@ -466,6 +466,7 @@ def with_developer_access
   has_many :build_trace_chunks, class_name: 'Ci::BuildTraceChunk', through: :builds, source: :trace_chunks, dependent: :restrict_with_error
   has_many :build_report_results, class_name: 'Ci::BuildReportResult', inverse_of: :project
   has_many :job_artifacts, class_name: 'Ci::JobArtifact', dependent: :restrict_with_error
+  has_many :job_infos, class_name: 'Ci::JobInfo', inverse_of: :project # NOTE: I think we need this for project export
   has_many :pipeline_artifacts, class_name: 'Ci::PipelineArtifact', inverse_of: :project, dependent: :restrict_with_error
   has_many :runner_projects, class_name: 'Ci::RunnerProject', inverse_of: :project
   has_many :runners, through: :runner_projects, source: :runner, class_name: 'Ci::Runner'
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 47a58877ca0e85..639f8b7530ed80 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -13,7 +13,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
       add_job_variables_attributes!(new_attributes, new_job_variables)
       add_job_inputs_attributes!(new_attributes, new_job_inputs)
       add_job_definition_attributes!(new_attributes)
-      # TODO: Need to update cloning to include Ci::JobInfo
+      # TODO: Need to update cloning to create job_info record if it doesn't already exist
 
       new_attributes[:user] = current_user
 
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service.rb b/app/services/ci/pipeline_processing/atomic_processing_service.rb
index 9484c5b0ffe818..050bf8a4c1a34e 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service.rb
@@ -84,6 +84,7 @@ def load_jobs(ids)
           .current_processable_jobs
           .id_in(ids)
           .with_project_preload
+          .with_job_info_preload
           .created
           .ordered_by_stage
           .select_with_aggregated_needs(project)
diff --git a/lib/gitlab/import_export/project/import_export.yml b/lib/gitlab/import_export/project/import_export.yml
index c6982ce8ed0abf..14739756e275f0 100644
--- a/lib/gitlab/import_export/project/import_export.yml
+++ b/lib/gitlab/import_export/project/import_export.yml
@@ -107,6 +107,7 @@ tree:
       - :external_pull_request
       - :merge_request
       - :pipeline_metadata
+    - :job_infos # TODO: I think this is necessary to export; to confirm
     - :auto_devops
     - :pipeline_schedules
     - :container_expiration_policy
@@ -595,9 +596,12 @@ included_attributes:
     - :scheduled_at
     - :scheduling_type
     - :ci_stage
+    - :job_info_id
   builds: *statuses_definition
   generic_commit_statuses: *statuses_definition
   bridges: *statuses_definition
+  job_infos: # TODO: Assess attributes to export form ci_job_infos
+    - scheduling_type
   ci_pipelines:
     - :ref
     - :sha
diff --git a/lib/gitlab/import_export/project/relation_factory.rb b/lib/gitlab/import_export/project/relation_factory.rb
index 26fe5dc7b4e7c6..6e89cae9b1f765 100644
--- a/lib/gitlab/import_export/project/relation_factory.rb
+++ b/lib/gitlab/import_export/project/relation_factory.rb
@@ -45,7 +45,8 @@ class RelationFactory < Base::RelationFactory
                       work_item_type: 'WorkItems::Type',
                       work_item_description: 'WorkItems::Description',
                       user_contributions: 'User',
-                      squash_option: 'Projects::BranchRules::SquashOption' }.freeze
+                      squash_option: 'Projects::BranchRules::SquashOption',
+                      job_infos: 'Ci::JobInfo' }.freeze
 
         BUILD_MODELS = %i[Ci::Build Ci::Bridge commit_status generic_commit_status].freeze
 
diff --git a/spec/lib/gitlab/import_export/all_models.yml b/spec/lib/gitlab/import_export/all_models.yml
index 62461c519a77d2..5246a34b3fe937 100644
--- a/spec/lib/gitlab/import_export/all_models.yml
+++ b/spec/lib/gitlab/import_export/all_models.yml
@@ -441,6 +441,7 @@ statuses:
 - auto_canceled_by
 - needs
 - ci_stage
+- job_info
 builds:
 - user
 - auto_canceled_by
@@ -525,6 +526,7 @@ builds:
 - job_artifacts_annotations
 - project_mirror
 - build_source
+- job_info
 bridges:
 - user
 - pipeline
@@ -545,12 +547,14 @@ bridges:
 - downstream_pipeline
 - upstream_pipeline
 - build_source
+- job_info
 generic_commit_statuses:
 - user
 - pipeline
 - auto_canceled_by
 - ci_stage
 - needs
+- job_info
 variables:
 - project
 triggers:
@@ -991,6 +995,7 @@ project:
 - security_scan_profiles_projects
 - enabled_foundational_flows
 - enabled_foundational_flow_records
+- job_infos
 award_emoji:
 - awardable
 - user
-- 
GitLab


From f102fcfc91bb1c42900d8cfd7ea2a1fce3428a54 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Mon, 1 Dec 2025 12:09:26 -0800
Subject: [PATCH 16/27] Descope stage_idx column

Descope stage_idx from poc
---
 Gemfile.lock                                             | 4 ++--
 app/models/ci/job_info.rb                                | 4 +---
 app/models/concerns/ci/metadatable.rb                    | 7 -------
 db/migrate/20251031012621_create_p_ci_job_infos_table.rb | 4 ----
 db/structure.sql                                         | 3 ---
 spec/factories/ci/processable.rb                         | 1 -
 spec/support/helpers/ci/job_helpers.rb                   | 3 +--
 7 files changed, 4 insertions(+), 22 deletions(-)

diff --git a/Gemfile.lock b/Gemfile.lock
index fc97abc4abb9cc..46c2c77bbd132e 100644
--- a/Gemfile.lock
+++ b/Gemfile.lock
@@ -47,7 +47,7 @@ PATH
       concurrent-ruby (~> 1.1)
       faraday (~> 2)
       google-cloud-storage_transfer (~> 1.2.0)
-      google-protobuf (~> 3.25, >= 3.25.3)
+      google-protobuf (>= 3.25, < 5.0)
       googleauth (~> 1.14)
       grpc (~> 1.75)
       json (~> 2.7)
@@ -163,7 +163,7 @@ PATH
   remote: vendor/gems/gitlab-topology-service-client
   specs:
     gitlab-topology-service-client (0.1)
-      google-protobuf (~> 3)
+      google-protobuf (>= 3.25, < 5.0)
       grpc
 
 PATH
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index b0cce08398dfa0..0af619422939a8 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -18,17 +18,15 @@ class JobInfo < Ci::ApplicationRecord
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
       :scheduling_type,
-      :stage_idx,
       :name
     ].freeze
     NORMALIZED_DATA_COLUMNS = [
       :scheduling_type,
-      :stage_idx,
       :name
     ].freeze
 
     # We're copying over these values to ci_job_infos but not dropping them from ci_builds
-    CI_BUILD_ATTRS_TO_KEEP = [:stage_idx, :name].freeze
+    CI_BUILD_ATTRS_TO_KEEP = [:name].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index ff4053f17b5dd9..42ded264366f92 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -221,13 +221,6 @@ def name=(value)
       write_attribute(:name, value)
     end
 
-    # We're keeping this column in ci_builds but it's copied over to ci_job_infos so it needs to be immutable
-    def stage_idx=(value)
-      raise ActiveRecord::ReadonlyAttributeError, 'This data is read only' if persisted?
-
-      write_attribute(:stage_idx, value)
-    end
-
     private
 
     def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, default_value = nil)
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
index 0f9542cf5daba0..71d8c189acf32b 100644
--- a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
+++ b/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
@@ -15,7 +15,6 @@ def change
       t.bigint :project_id, null: false
       t.datetime_with_timezone :created_at, null: false
       t.integer :scheduling_type, limit: 2, null: false
-      t.integer :stage_idx, limit: 2
       t.binary :checksum, null: false
       t.tsvector :search_vector, as: "to_tsvector('english'::regconfig, COALESCE(name, ''::text))", stored: true
       t.text :name, limit: 255, null: false
@@ -27,9 +26,6 @@ def change
       # Also need to evaluate if this index is better with/without project_id.
       t.index [:project_id, :scheduling_type, :id],
         name: :index_p_ci_job_infos_on_project_id_scheduling_type_and_id
-      # TODO: Evaluate if this index is better with/without project_id.
-      t.index [:project_id, :stage_idx, :id],
-        name: :index_p_ci_job_infos_on_project_id_stage_idx_and_id
       t.index [:search_vector], using: :gin,
         name: :index_p_ci_job_infos_on_search_vector
     end
diff --git a/db/structure.sql b/db/structure.sql
index 036ad6c39c2e83..99bdafa73add7d 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5794,7 +5794,6 @@ CREATE TABLE p_ci_job_infos (
     project_id bigint NOT NULL,
     created_at timestamp with time zone NOT NULL,
     scheduling_type smallint NOT NULL,
-    stage_idx smallint,
     checksum bytea NOT NULL,
     search_vector tsvector GENERATED ALWAYS AS (to_tsvector('english'::regconfig, COALESCE(name, ''::text))) STORED,
     name text NOT NULL,
@@ -43371,8 +43370,6 @@ CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci
 
 CREATE INDEX index_p_ci_job_infos_on_project_id_scheduling_type_and_id ON ONLY p_ci_job_infos USING btree (project_id, scheduling_type, id);
 
-CREATE INDEX index_p_ci_job_infos_on_project_id_stage_idx_and_id ON ONLY p_ci_job_infos USING btree (project_id, stage_idx, id);
-
 CREATE INDEX index_p_ci_job_infos_on_search_vector ON ONLY p_ci_job_infos USING gin (search_vector);
 
 CREATE UNIQUE INDEX index_p_ci_job_inputs_on_job_id_and_name ON ONLY p_ci_job_inputs USING btree (job_id, name, partition_id);
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index ff5aeb76d915c2..7506b6227c6111 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -32,7 +32,6 @@
         Ci::JobFactoryHelpers.mutate_temp_job_info(
           processable,
           scheduling_type: evaluator.scheduling_type,
-          stage_idx: processable.stage_idx,
           name: processable.name
         )
       end
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 20faaf8d7c5ab7..3457b1d5cd2a9c 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -55,8 +55,7 @@ def stub_ci_job_info(job, **new_config)
 
       allow(job).to receive_messages(
         job_info: new_job_info,
-        name: new_job_info.name, # Stub columns we're still keeping in ci_builds
-        stage_idx: new_job_info.stage_idx
+        name: new_job_info.name # Stub columns we're still keeping in ci_builds
       )
     end
   end
-- 
GitLab


From 1ae53c4dd87600f1a776041038285e41484fce17 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Tue, 2 Dec 2025 13:31:35 -0800
Subject: [PATCH 17/27] Use ci_job_info_instances table instead of
 ci_builds.job_info_id

Creates a joining/association tabel ci_job_info_instances
table to link ci_builds and ci_job_infos instead of
having a direct foreign key job_info_id on ci_builds.
---
 app/finders/ci/build_name_finder.rb           | 15 +++++---
 app/models/ci/bridge.rb                       |  3 +-
 app/models/ci/build.rb                        |  3 +-
 app/models/ci/job_info_instance.rb            | 35 ++++++++++++++++++
 app/models/ci/pipeline.rb                     |  4 +-
 app/models/ci/processable.rb                  |  2 +-
 app/models/commit_status.rb                   | 23 ++++++++----
 .../concerns/ci/partitionable/testing.rb      |  1 +
 config/gitlab_loose_foreign_keys.yml          |  4 ++
 config/initializers/postgres_partitioning.rb  |  1 +
 db/docs/p_ci_job_info_instances.yml           | 13 +++++++
 ...9_add_job_info_id_column_to_p_ci_builds.rb | 16 --------
 ...> 20251202000001_create_p_ci_job_infos.rb} | 11 +++---
 ...00002_create_p_ci_job_infos_partitions.rb} |  6 +--
 ...02000003_create_p_ci_job_info_instances.rb | 19 ++++++++++
 ...eate_p_ci_job_info_instances_partitions.rb | 35 ++++++++++++++++++
 ...04_add_index_on_p_ci_builds_job_info_id.rb | 22 -----------
 ...fk_to_ci_job_infos_from_info_instances.rb} | 12 ++----
 ...add_fk_to_ci_builds_from_info_instances.rb | 37 +++++++++++++++++++
 db/schema_migrations/20251031012621           |  1 -
 db/schema_migrations/20251031012831           |  1 -
 db/schema_migrations/20251103182209           |  1 -
 db/schema_migrations/20251103190204           |  1 -
 db/schema_migrations/20251103191450           |  1 -
 db/schema_migrations/20251202000001           |  1 +
 db/schema_migrations/20251202000002           |  1 +
 db/schema_migrations/20251202000003           |  1 +
 db/schema_migrations/20251202000004           |  1 +
 db/schema_migrations/20251202000005           |  1 +
 db/schema_migrations/20251202000006           |  1 +
 db/structure.sql                              | 31 ++++++++++++----
 lib/gitlab/ci/job_infos/find_or_create.rb     |  3 +-
 .../ci/pipeline/create/job_info_builder.rb    |  6 ++-
 .../import_export/project/import_export.yml   | 11 +++++-
 .../import_export/project/relation_factory.rb |  3 +-
 spec/factories/ci/job_info_instances.rb       |  9 +++++
 spec/factories/ci/processable.rb              |  9 ++++-
 spec/lib/gitlab/import_export/all_models.yml  |  1 +
 spec/models/ci/bridge_spec.rb                 |  1 -
 39 files changed, 251 insertions(+), 96 deletions(-)
 create mode 100644 app/models/ci/job_info_instance.rb
 create mode 100644 db/docs/p_ci_job_info_instances.yml
 delete mode 100644 db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
 rename db/migrate/{20251031012621_create_p_ci_job_infos_table.rb => 20251202000001_create_p_ci_job_infos.rb} (70%)
 rename db/migrate/{20251031012831_create_p_ci_job_infos_partitions.rb => 20251202000002_create_p_ci_job_infos_partitions.rb} (77%)
 create mode 100644 db/migrate/20251202000003_create_p_ci_job_info_instances.rb
 create mode 100644 db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
 delete mode 100644 db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
 rename db/post_migrate/{20251103191450_add_fk_on_p_ci_builds_job_info_id.rb => 20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb} (63%)
 create mode 100644 db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
 delete mode 100644 db/schema_migrations/20251031012621
 delete mode 100644 db/schema_migrations/20251031012831
 delete mode 100644 db/schema_migrations/20251103182209
 delete mode 100644 db/schema_migrations/20251103190204
 delete mode 100644 db/schema_migrations/20251103191450
 create mode 100644 db/schema_migrations/20251202000001
 create mode 100644 db/schema_migrations/20251202000002
 create mode 100644 db/schema_migrations/20251202000003
 create mode 100644 db/schema_migrations/20251202000004
 create mode 100644 db/schema_migrations/20251202000005
 create mode 100644 db/schema_migrations/20251202000006
 create mode 100644 spec/factories/ci/job_info_instances.rb

diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index 93ee91e36be927..a6bc3a42afec19 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -27,26 +27,31 @@ def limited_name_search_terms
     # rubocop: disable CodeReuse/ActiveRecord -- Need specialized queries for database optimizations
     def filter_by_name(build_relation)
       build_name_relation = Ci::BuildName
+        .select(:build_id, :partition_id)
         .where(project_id: project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
       if Feature.disabled?(:read_from_ci_job_infos, project)
-        return build_relation.where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+        return build_relation.where("(id, partition_id) IN (?)", build_name_relation)
       end
 
       job_info_relation = Ci::JobInfo
-        .where(project_id: project.id)
+        .select(:id, :partition_id)
+        .for_project(project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
-      # NOTE: This query would be much more efficient on ci_job_infos alone.
+      job_info_instances_relation = Ci::JobInfoInstance
+        .select(:job_id, :partition_id)
+        .where('(job_info_id, partition_id) IN (?)', job_info_relation)
+
       # TODO: Evaluate the query performance after we create and write to ci_job_infos. Then we can decide on either:
       # 1. Keep this OR query if performance is not severely impacted.
       # 2. Plan to migrate all existing data to ci_job_infos before we switch reads.
       build_relation
-        .where("(job_info_id, partition_id) IN (?)", job_info_relation.select(:id, :partition_id))
+        .where("(id, partition_id) IN (?)", job_info_instances_relation)
         .or(
           build_relation
-            .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
+            .where("(id, partition_id) IN (?)", build_name_relation)
         )
     end
     # rubocop: enable CodeReuse/ActiveRecord
diff --git a/app/models/ci/bridge.rb b/app/models/ci/bridge.rb
index e42fce7196d97d..04e5d7a3e54058 100644
--- a/app/models/ci/bridge.rb
+++ b/app/models/ci/bridge.rb
@@ -103,8 +103,7 @@ def self.with_preloads
     def self.clone_accessors
       %i[pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
-        scheduling_type ci_stage partition_id resource_group
-        job_info].freeze
+        scheduling_type ci_stage partition_id resource_group].freeze
     end
 
     def retryable?
diff --git a/app/models/ci/build.rb b/app/models/ci/build.rb
index 9f7f2e0a1531ec..1a430262f32748 100644
--- a/app/models/ci/build.rb
+++ b/app/models/ci/build.rb
@@ -286,8 +286,7 @@ def clone_accessors
           environment coverage_regex description tag_list protected
           needs_attributes job_variables_attributes resource_group
           scheduling_type timeout timeout_source debug_trace_enabled
-          ci_stage partition_id execution_config_id inputs_attributes
-          job_info].freeze
+          ci_stage partition_id execution_config_id inputs_attributes].freeze
       end
 
       def supported_keyset_orderings
diff --git a/app/models/ci/job_info_instance.rb b/app/models/ci/job_info_instance.rb
new file mode 100644
index 00000000000000..4f9dd3e9003640
--- /dev/null
+++ b/app/models/ci/job_info_instance.rb
@@ -0,0 +1,35 @@
+# frozen_string_literal: true
+
+module Ci
+  class JobInfoInstance < Ci::ApplicationRecord
+    include Ci::Partitionable
+
+    self.table_name = :p_ci_job_info_instances
+    self.primary_key = :job_id
+
+    query_constraints :job_id, :partition_id
+    partitionable scope: :job, partitioned: true
+
+    belongs_to :project
+
+    belongs_to :job, ->(job) { in_partition(job) },
+      class_name: 'CommitStatus',
+      partition_foreign_key: :partition_id,
+      inverse_of: :job_info_instance
+
+    # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
+    belongs_to :job_info, ->(info) { in_partition(info) },
+      class_name: 'Ci::JobInfo',
+      partition_foreign_key: :partition_id
+    # rubocop: enable Rails/InverseOf
+
+    validates :project, presence: true
+    validates :job, presence: true
+    validates :job_info, presence: true
+
+    scope :scoped_job, -> do
+      where(arel_table[:job_id].eq(Ci::Processable.arel_table[:id]))
+      .where(arel_table[:partition_id].eq(Ci::Processable.arel_table[:partition_id]))
+    end
+  end
+end
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index dcb8e275ab0f35..fbbf6c0bf4efe4 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -741,9 +741,7 @@ def trigger_status_change_subscriptions
     end
 
     def uses_needs?
-      # TODO: Check if query performance is better with:
-      # 1. ci_job_infos index on only (scheduling_type, id), or
-      # 2. Scope ci_job_infos WHERE clause to project_id and have index on (project_id, scheduling_type, id).
+      # TODO: Check if should keep index_p_ci_job_infos_on_id_where_scheduling_type_dag or a different index
       if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_job_infos?
         processables
           .joins(:job_info)
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 3945ec13eb05a2..c44ccfe81ccca5 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -165,7 +165,7 @@ def self.fabricate(attrs)
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-        attrs.delete(*[Ci::JobInfo::CONFIG_ATTRIBUTES - Ci::JobInfo::CI_BUILD_ATTRS_TO_KEEP])
+        attrs.delete(*[Ci::JobInfo::CONFIG_ATTRIBUTES - Ci::JobInfo::CONFIG_ATTRS_TO_KEEP])
       end
 
       new(attrs).tap do |job|
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index bc320934f47b5a..ca75f072852756 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -34,17 +34,24 @@ class CommitStatus < Ci::ApplicationRecord
     partition_foreign_key: :partition_id,
     inverse_of: :statuses
 
-  # NOTE: Looks like we need to have this relationship in CommitStatus because
-  # generic commit statuses also use the columns in `Ci::JobInfo::CONFIG_ATTRIBUTES`.
-  # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
-  belongs_to :job_info,
-    ->(job) { in_partition(job) },
+  # NOTE: We need to have these relationships in CommitStatus because generic
+  # commit statuses also use the columns in `Ci::JobInfo::CONFIG_ATTRIBUTES`.
+  has_one :job_info_instance, ->(job) { in_partition(job) },
+    class_name: 'Ci::JobInfoInstance',
+    foreign_key: :job_id,
+    partition_foreign_key: :partition_id,
+    inverse_of: :job,
+    autosave: true
+  has_one :job_info, ->(job) { in_partition(job) },
     class_name: 'Ci::JobInfo',
-    partition_foreign_key: :partition_id
-  # rubocop: enable Rails/InverseOf
+    foreign_key: :job_id,
+    partition_foreign_key: :partition_id,
+    through: :job_info_instance
 
   has_many :needs, class_name: 'Ci::BuildNeed', foreign_key: :build_id, inverse_of: :build
 
+  accepts_nested_attributes_for :job_info_instance
+
   attribute :retried, default: false
 
   enum :scheduling_type, { stage: 0, dag: 1 }, prefix: true
@@ -275,7 +282,7 @@ def self.has_job_infos?
     # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
     # have job_info records. So we just need to check one job if it has job_info.
     # We check the oldest job in the pipeline since recent retries would create a new job_info record when cloning.
-    first&.job_info_id.present?
+    first&.job_info.present?
   end
 
   def locking_enabled?
diff --git a/app/models/concerns/ci/partitionable/testing.rb b/app/models/concerns/ci/partitionable/testing.rb
index b5655891b68b96..8f59d5115057c3 100644
--- a/app/models/concerns/ci/partitionable/testing.rb
+++ b/app/models/concerns/ci/partitionable/testing.rb
@@ -25,6 +25,7 @@ module Testing
         Ci::JobDefinition
         Ci::JobDefinitionInstance
         Ci::JobInfo
+        Ci::JobInfoInstance
         Ci::JobInput
         Ci::JobMessage
         Ci::JobVariable
diff --git a/config/gitlab_loose_foreign_keys.yml b/config/gitlab_loose_foreign_keys.yml
index 5e128df843ac20..101b1054ecc2b5 100644
--- a/config/gitlab_loose_foreign_keys.yml
+++ b/config/gitlab_loose_foreign_keys.yml
@@ -631,6 +631,10 @@ p_ci_job_definitions:
   - table: projects
     column: project_id
     on_delete: async_delete
+p_ci_job_info_instances:
+  - table: projects
+    column: project_id
+    on_delete: async_delete
 p_ci_job_infos:
   - table: projects
     column: project_id
diff --git a/config/initializers/postgres_partitioning.rb b/config/initializers/postgres_partitioning.rb
index 83511cf8e58bbb..079e315f02c4d6 100644
--- a/config/initializers/postgres_partitioning.rb
+++ b/config/initializers/postgres_partitioning.rb
@@ -32,6 +32,7 @@
       Ci::JobDefinition,
       Ci::JobDefinitionInstance,
       Ci::JobInfo,
+      Ci::JobInfoInstance,
       Ci::JobInput,
       Ci::JobMessage,
       Ci::Pipeline,
diff --git a/db/docs/p_ci_job_info_instances.yml b/db/docs/p_ci_job_info_instances.yml
new file mode 100644
index 00000000000000..87f4b73d9a9bd2
--- /dev/null
+++ b/db/docs/p_ci_job_info_instances.yml
@@ -0,0 +1,13 @@
+---
+table_name: p_ci_job_info_instances
+classes:
+  - Ci::JobInfoInstance
+feature_categories:
+- continuous_integration
+description: Links ci_builds with ci_job_infos
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+milestone: '18.7'
+gitlab_schema: gitlab_ci
+sharding_key:
+  project_id: projects
+table_size: small
diff --git a/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb b/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
deleted file mode 100644
index 3c23d792b4ca00..00000000000000
--- a/db/migrate/20251103182209_add_job_info_id_column_to_p_ci_builds.rb
+++ /dev/null
@@ -1,16 +0,0 @@
-# frozen_string_literal: true
-
-class AddJobInfoIdColumnToPCiBuilds < Gitlab::Database::Migration[2.3]
-  milestone '18.6'
-
-  # rubocop:disable Migration/PreventAddingColumns -- Required to deduplicate data into ci_job_infos table
-  def up
-    # NOTE: We can probably keep this column as NULL-able because generic commit statuses may not have a job_info record
-    add_column :p_ci_builds, :job_info_id, :bigint, if_not_exists: true
-  end
-
-  def down
-    remove_column :p_ci_builds, :job_info_id, if_exists: true
-  end
-  # rubocop:enable Migration/PreventAddingColumns
-end
diff --git a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb b/db/migrate/20251202000001_create_p_ci_job_infos.rb
similarity index 70%
rename from db/migrate/20251031012621_create_p_ci_job_infos_table.rb
rename to db/migrate/20251202000001_create_p_ci_job_infos.rb
index 71d8c189acf32b..1fe63ede5eeeae 100644
--- a/db/migrate/20251031012621_create_p_ci_job_infos_table.rb
+++ b/db/migrate/20251202000001_create_p_ci_job_infos.rb
@@ -1,7 +1,7 @@
 # frozen_string_literal: true
 
-class CreatePCiJobInfosTable < Gitlab::Database::Migration[2.3]
-  milestone '18.6'
+class CreatePCiJobInfos < Gitlab::Database::Migration[2.3]
+  milestone '18.7'
 
   def change
     opts = {
@@ -22,10 +22,9 @@ def change
 
       t.index [:project_id, :checksum, :partition_id], unique: true,
         name: :index_p_ci_job_infos_on_project_id_and_checksum
-      # TODO: We can probably make this a partial index instead `WHERE scheduling_type = 1`.
-      # Also need to evaluate if this index is better with/without project_id.
-      t.index [:project_id, :scheduling_type, :id],
-        name: :index_p_ci_job_infos_on_project_id_scheduling_type_and_id
+      t.index :id,
+        where: '(scheduling_type = 1)',
+        name: :index_p_ci_job_infos_on_id_where_scheduling_type_dag
       t.index [:search_vector], using: :gin,
         name: :index_p_ci_job_infos_on_search_vector
     end
diff --git a/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb b/db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb
similarity index 77%
rename from db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
rename to db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb
index 0d9db99ff1fb1b..f41712a185a7db 100644
--- a/db/migrate/20251031012831_create_p_ci_job_infos_partitions.rb
+++ b/db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb
@@ -1,9 +1,9 @@
 # frozen_string_literal: true
 
-# TODO: Either this migration needs to be scoped to GitLab.com only, or we remove it
-# and rely on the partition manager to create the necessary partitions instead.
+# TODO: This migration is just to initialize partitions for local gdk. For production, we can
+# remove it and rely on the partition manager to create the necessary partitions instead.
 class CreatePCiJobInfosPartitions < Gitlab::Database::Migration[2.3]
-  milestone '18.6'
+  milestone '18.7'
 
   disable_ddl_transaction!
 
diff --git a/db/migrate/20251202000003_create_p_ci_job_info_instances.rb b/db/migrate/20251202000003_create_p_ci_job_info_instances.rb
new file mode 100644
index 00000000000000..d7403f0819a660
--- /dev/null
+++ b/db/migrate/20251202000003_create_p_ci_job_info_instances.rb
@@ -0,0 +1,19 @@
+# frozen_string_literal: true
+
+class CreatePCiJobInfoInstances < Gitlab::Database::Migration[2.3]
+  milestone '18.7'
+
+  def change
+    opts = {
+      primary_key: [:job_id, :partition_id],
+      options: 'PARTITION BY LIST (partition_id)'
+    }
+
+    create_table(:p_ci_job_info_instances, **opts) do |t|
+      t.bigint :project_id, null: false, index: true
+      t.bigint :partition_id, null: false
+      t.bigint :job_id, null: false
+      t.bigint :job_info_id, null: false, index: true
+    end
+  end
+end
diff --git a/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb b/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
new file mode 100644
index 00000000000000..930408c9012840
--- /dev/null
+++ b/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
@@ -0,0 +1,35 @@
+# frozen_string_literal: true
+
+# TODO: This migration is just to initialize partitions for local gdk. For production, we can
+# remove it and rely on the partition manager to create the necessary partitions instead.
+class CreatePCiJobInfoInstancesPartitions < Gitlab::Database::Migration[2.3]
+  milestone '18.7'
+
+  disable_ddl_transaction!
+
+  def up
+    sql = (100..108).map do |partition_id|
+      <<~SQL
+      CREATE TABLE IF NOT EXISTS gitlab_partitions_dynamic.ci_job_info_instances_#{partition_id}
+        PARTITION OF p_ci_job_info_instances
+        FOR VALUES IN (#{partition_id});
+      SQL
+    end.join
+
+    with_lock_retries do
+      connection.execute(sql)
+    end
+  end
+
+  def down
+    sql = (100..108).map do |partition_id|
+      <<~SQL
+      DROP TABLE IF EXISTS gitlab_partitions_dynamic.ci_job_info_instances_#{partition_id};
+      SQL
+    end.join
+
+    with_lock_retries do
+      connection.execute(sql)
+    end
+  end
+end
diff --git a/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
deleted file mode 100644
index 9356d3201667f7..00000000000000
--- a/db/post_migrate/20251103190204_add_index_on_p_ci_builds_job_info_id.rb
+++ /dev/null
@@ -1,22 +0,0 @@
-# frozen_string_literal: true
-
-# TODO: This index should first be added asynchronously on Production
-class AddIndexOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
-  include Gitlab::Database::PartitioningMigrationHelpers
-
-  milestone '18.6'
-
-  disable_ddl_transaction!
-
-  PARTITIONED_INDEX_NAME = 'index_p_ci_builds_on_job_info_id'
-
-  # rubocop: disable Migration/PreventIndexCreation -- Required to deduplicate data into ci_job_infos table
-  def up
-    add_concurrent_partitioned_index :p_ci_builds, :job_info_id, name: PARTITIONED_INDEX_NAME
-  end
-
-  def down
-    remove_concurrent_partitioned_index_by_name :p_ci_builds, PARTITIONED_INDEX_NAME
-  end
-  # rubocop: enable Migration/PreventIndexCreation
-end
diff --git a/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb
similarity index 63%
rename from db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
rename to db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb
index e7333992b1707a..4adb2e64a415fa 100644
--- a/db/post_migrate/20251103191450_add_fk_on_p_ci_builds_job_info_id.rb
+++ b/db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb
@@ -1,18 +1,15 @@
 # frozen_string_literal: true
 
-# TODO: This FK should first be added asynchronously on Production
-class AddFkOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
+class AddFkToCiJobInfosFromInfoInstances < Gitlab::Database::Migration[2.3]
   include Gitlab::Database::PartitioningMigrationHelpers
 
-  milestone '18.6'
-
+  milestone '18.7'
   disable_ddl_transaction!
 
-  SOURCE_TABLE_NAME = :p_ci_builds
+  SOURCE_TABLE_NAME = :p_ci_job_info_instances
   TARGET_TABLE_NAME = :p_ci_job_infos
-  FK_NAME = :fk_rails_2f23ec1c61
+  FK_NAME = :fk_rails_e414e4e39e
 
-  # rubocop: disable Migration/PreventForeignKeyCreation -- Required to deduplicate data into ci_job_infos table
   def up
     add_concurrent_partitioned_foreign_key(
       SOURCE_TABLE_NAME, TARGET_TABLE_NAME,
@@ -35,5 +32,4 @@ def down
       )
     end
   end
-  # rubocop: enable Migration/PreventForeignKeyCreation
 end
diff --git a/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb b/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
new file mode 100644
index 00000000000000..63691e82bfc16f
--- /dev/null
+++ b/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
@@ -0,0 +1,37 @@
+# frozen_string_literal: true
+
+class AddFkToCiBuildsFromInfoInstances < Gitlab::Database::Migration[2.3]
+  include Gitlab::Database::PartitioningMigrationHelpers
+
+  milestone '18.7'
+  disable_ddl_transaction!
+
+  SOURCE_TABLE_NAME = :p_ci_job_info_instances
+  TARGET_TABLE_NAME = :p_ci_builds
+  FK_NAME = :fk_rails_089a57086f
+
+  def up
+    # rubocop: disable Migration/PreventForeignKeyCreation -- Necessary for linking ci_job_infos
+    add_concurrent_partitioned_foreign_key(
+      SOURCE_TABLE_NAME, TARGET_TABLE_NAME,
+      column: [:partition_id, :job_id],
+      target_column: [:partition_id, :id],
+      on_update: :cascade,
+      on_delete: :cascade,
+      reverse_lock_order: true,
+      name: FK_NAME
+    )
+    # rubocop: enable Migration/PreventForeignKeyCreation
+  end
+
+  def down
+    with_lock_retries do
+      remove_foreign_key_if_exists(
+        SOURCE_TABLE_NAME,
+        TARGET_TABLE_NAME,
+        reverse_lock_order: true,
+        name: FK_NAME
+      )
+    end
+  end
+end
diff --git a/db/schema_migrations/20251031012621 b/db/schema_migrations/20251031012621
deleted file mode 100644
index 399047a9b10fae..00000000000000
--- a/db/schema_migrations/20251031012621
+++ /dev/null
@@ -1 +0,0 @@
-af4c3926aebf394a62080b9a0be3c7447e8a48513efede46ca4e3812dd1cc776
\ No newline at end of file
diff --git a/db/schema_migrations/20251031012831 b/db/schema_migrations/20251031012831
deleted file mode 100644
index a30007e277daec..00000000000000
--- a/db/schema_migrations/20251031012831
+++ /dev/null
@@ -1 +0,0 @@
-2f137baba28ea4604fc626f49ad58de7e85fb47142294b352c1f05b8642af143
\ No newline at end of file
diff --git a/db/schema_migrations/20251103182209 b/db/schema_migrations/20251103182209
deleted file mode 100644
index 78b14684cd97bd..00000000000000
--- a/db/schema_migrations/20251103182209
+++ /dev/null
@@ -1 +0,0 @@
-1806d088d027cafbb0ae3901752577aa8b5a5ca8725a02f16c72919d9a4e19e1
\ No newline at end of file
diff --git a/db/schema_migrations/20251103190204 b/db/schema_migrations/20251103190204
deleted file mode 100644
index 117dae5f3cf819..00000000000000
--- a/db/schema_migrations/20251103190204
+++ /dev/null
@@ -1 +0,0 @@
-57f15544e4d1f34c4562662ede1472d423bfe4f43b7f7d299b14b90580ba6d33
\ No newline at end of file
diff --git a/db/schema_migrations/20251103191450 b/db/schema_migrations/20251103191450
deleted file mode 100644
index 3ab4ba04be64db..00000000000000
--- a/db/schema_migrations/20251103191450
+++ /dev/null
@@ -1 +0,0 @@
-5e263650118c9ea701d737a991d50953910ba0108508598b0d24341e074de02a
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000001 b/db/schema_migrations/20251202000001
new file mode 100644
index 00000000000000..0509012e1c11c9
--- /dev/null
+++ b/db/schema_migrations/20251202000001
@@ -0,0 +1 @@
+faced445914491be2b887c18309fd1effe6df6155d4b2c52fa3a6c81fdeb970d
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000002 b/db/schema_migrations/20251202000002
new file mode 100644
index 00000000000000..b69b6c3617847e
--- /dev/null
+++ b/db/schema_migrations/20251202000002
@@ -0,0 +1 @@
+0d519552d80a0b3389c488b5cb9327c44f2d246abf951b3b111d949bd071bb86
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000003 b/db/schema_migrations/20251202000003
new file mode 100644
index 00000000000000..10728ef363fa63
--- /dev/null
+++ b/db/schema_migrations/20251202000003
@@ -0,0 +1 @@
+436902e31b8aeb833be35c6f3358e2306ae9336deb76ebe03207b3e386139a98
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000004 b/db/schema_migrations/20251202000004
new file mode 100644
index 00000000000000..300e2dd62e393e
--- /dev/null
+++ b/db/schema_migrations/20251202000004
@@ -0,0 +1 @@
+3a8658b3381054b65d05ea993344e6164b40b059bbc1490267039167524fafc1
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000005 b/db/schema_migrations/20251202000005
new file mode 100644
index 00000000000000..f0264852bf3369
--- /dev/null
+++ b/db/schema_migrations/20251202000005
@@ -0,0 +1 @@
+25a25cd891d6dd7d1cb36c3a77a29e1fad9d59a997f42f2c56651052b95d9e03
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000006 b/db/schema_migrations/20251202000006
new file mode 100644
index 00000000000000..11e9e1d44ccde5
--- /dev/null
+++ b/db/schema_migrations/20251202000006
@@ -0,0 +1 @@
+b2423358bb78ee5849fe3f12f47ae08827658607b474b22ccb8d5d6bc1a507d4
\ No newline at end of file
diff --git a/db/structure.sql b/db/structure.sql
index 99bdafa73add7d..1a415246471d83 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5684,7 +5684,6 @@ CREATE TABLE p_ci_builds (
     timeout_source smallint,
     exit_code smallint,
     debug_trace_enabled boolean,
-    job_info_id bigint,
     CONSTRAINT check_1e2fbd1b39 CHECK ((lock_version IS NOT NULL)),
     CONSTRAINT check_9aa9432137 CHECK ((project_id IS NOT NULL))
 )
@@ -5788,6 +5787,14 @@ CREATE TABLE p_ci_job_definitions (
 )
 PARTITION BY LIST (partition_id);
 
+CREATE TABLE p_ci_job_info_instances (
+    project_id bigint NOT NULL,
+    partition_id bigint NOT NULL,
+    job_id bigint NOT NULL,
+    job_info_id bigint NOT NULL
+)
+PARTITION BY LIST (partition_id);
+
 CREATE TABLE p_ci_job_infos (
     id bigint NOT NULL,
     partition_id bigint NOT NULL,
@@ -36385,6 +36392,9 @@ ALTER TABLE ONLY p_ci_job_definition_instances
 ALTER TABLE ONLY p_ci_job_definitions
     ADD CONSTRAINT p_ci_job_definitions_pkey PRIMARY KEY (id, partition_id);
 
+ALTER TABLE ONLY p_ci_job_info_instances
+    ADD CONSTRAINT p_ci_job_info_instances_pkey PRIMARY KEY (job_id, partition_id);
+
 ALTER TABLE ONLY p_ci_job_infos
     ADD CONSTRAINT p_ci_job_infos_pkey PRIMARY KEY (id, partition_id);
 
@@ -43344,8 +43354,6 @@ CREATE INDEX index_p_ci_builds_execution_configs_on_project_id ON ONLY p_ci_buil
 
 CREATE INDEX index_p_ci_builds_on_execution_config_id ON ONLY p_ci_builds USING btree (execution_config_id) WHERE (execution_config_id IS NOT NULL);
 
-CREATE INDEX index_p_ci_builds_on_job_info_id ON ONLY p_ci_builds USING btree (job_info_id);
-
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_finished_at ON ONLY p_ci_finished_build_ch_sync_events USING btree (partition, build_finished_at);
 
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_on_project_id ON ONLY p_ci_finished_build_ch_sync_events USING btree (project_id);
@@ -43366,9 +43374,13 @@ CREATE INDEX index_p_ci_job_definitions_on_interruptible ON ONLY p_ci_job_defini
 
 CREATE UNIQUE INDEX index_p_ci_job_definitions_on_project_id_and_checksum ON ONLY p_ci_job_definitions USING btree (project_id, checksum, partition_id);
 
-CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
+CREATE INDEX index_p_ci_job_info_instances_on_job_info_id ON ONLY p_ci_job_info_instances USING btree (job_info_id);
+
+CREATE INDEX index_p_ci_job_info_instances_on_project_id ON ONLY p_ci_job_info_instances USING btree (project_id);
 
-CREATE INDEX index_p_ci_job_infos_on_project_id_scheduling_type_and_id ON ONLY p_ci_job_infos USING btree (project_id, scheduling_type, id);
+CREATE INDEX index_p_ci_job_infos_on_id_where_scheduling_type_dag ON ONLY p_ci_job_infos USING btree (id) WHERE (scheduling_type = 1);
+
+CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
 
 CREATE INDEX index_p_ci_job_infos_on_search_vector ON ONLY p_ci_job_infos USING gin (search_vector);
 
@@ -52588,6 +52600,9 @@ ALTER TABLE ONLY security_policies
 ALTER TABLE ONLY virtual_registries_packages_npm_upstreams
     ADD CONSTRAINT fk_rails_08949a6736 FOREIGN KEY (group_id) REFERENCES namespaces(id) ON DELETE CASCADE;
 
+ALTER TABLE p_ci_job_info_instances
+    ADD CONSTRAINT fk_rails_089a57086f FOREIGN KEY (partition_id, job_id) REFERENCES p_ci_builds(partition_id, id) ON UPDATE CASCADE ON DELETE CASCADE;
+
 ALTER TABLE ONLY subscription_user_add_on_assignment_versions
     ADD CONSTRAINT fk_rails_091e013a61 FOREIGN KEY (organization_id) REFERENCES organizations(id);
 
@@ -52942,9 +52957,6 @@ ALTER TABLE ONLY onboarding_progresses
 ALTER TABLE ONLY protected_branch_unprotect_access_levels
     ADD CONSTRAINT fk_rails_2d2aba21ef FOREIGN KEY (user_id) REFERENCES users(id) ON DELETE CASCADE;
 
-ALTER TABLE p_ci_builds
-    ADD CONSTRAINT fk_rails_2f23ec1c61 FOREIGN KEY (partition_id, job_info_id) REFERENCES p_ci_job_infos(partition_id, id) ON UPDATE RESTRICT ON DELETE RESTRICT;
-
 ALTER TABLE ONLY issuable_severities
     ADD CONSTRAINT fk_rails_2fbb74ad6d FOREIGN KEY (issue_id) REFERENCES issues(id) ON DELETE CASCADE;
 
@@ -54466,6 +54478,9 @@ ALTER TABLE ONLY approval_policy_rules
 ALTER TABLE ONLY work_item_select_field_values
     ADD CONSTRAINT fk_rails_e3ecc2c14e FOREIGN KEY (custom_field_id) REFERENCES custom_fields(id) ON DELETE CASCADE;
 
+ALTER TABLE p_ci_job_info_instances
+    ADD CONSTRAINT fk_rails_e414e4e39e FOREIGN KEY (partition_id, job_info_id) REFERENCES p_ci_job_infos(partition_id, id) ON UPDATE RESTRICT ON DELETE RESTRICT;
+
 ALTER TABLE ONLY vulnerability_occurrence_identifiers
     ADD CONSTRAINT fk_rails_e4ef6d027c FOREIGN KEY (occurrence_id) REFERENCES vulnerability_occurrences(id) ON DELETE CASCADE;
 
diff --git a/lib/gitlab/ci/job_infos/find_or_create.rb b/lib/gitlab/ci/job_infos/find_or_create.rb
index 9ecaf45cd43ed6..1a3dfa25afb80a 100644
--- a/lib/gitlab/ci/job_infos/find_or_create.rb
+++ b/lib/gitlab/ci/job_infos/find_or_create.rb
@@ -4,7 +4,8 @@ module Gitlab
   module Ci
     module JobInfos
       # TODO: This class mirrors Ci::JobDefinitions::FindOrCreate;
-      # maybe they can be combined into a single implementation class
+      # maybe they can be combined into a single implementation class or
+      # refactor to use a shared module/base class?
       class FindOrCreate
         BATCH_SIZE = 50
 
diff --git a/lib/gitlab/ci/pipeline/create/job_info_builder.rb b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
index 5fcf189baff149..3328a366e8f719 100644
--- a/lib/gitlab/ci/pipeline/create/job_info_builder.rb
+++ b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
@@ -4,6 +4,8 @@ module Gitlab
   module Ci
     module Pipeline
       module Create
+        # This class mirrors JobDefinitionBuilder.
+        # TODO: Refactor shared code into module or parent class?
         class JobInfoBuilder
           include Gitlab::Utils::StrongMemoize
 
@@ -16,7 +18,9 @@ def initialize(pipeline, jobs)
           def run
             find_or_insert_job_infos.each do |job_info|
               jobs_by_checksum[job_info.checksum].each do |job|
-                job.job_info = job_info
+                job.build_job_info_instance(
+                  job_info: job_info, partition_id: pipeline.partition_id, project: project
+                )
               end
             end
           end
diff --git a/lib/gitlab/import_export/project/import_export.yml b/lib/gitlab/import_export/project/import_export.yml
index 14739756e275f0..9b24c3d3d2fc93 100644
--- a/lib/gitlab/import_export/project/import_export.yml
+++ b/lib/gitlab/import_export/project/import_export.yml
@@ -108,6 +108,7 @@ tree:
       - :merge_request
       - :pipeline_metadata
     - :job_infos # TODO: I think this is necessary to export; to confirm
+    - :job_info_instances # TODO: I think this is necessary to export; to confirm
     - :auto_devops
     - :pipeline_schedules
     - :container_expiration_policy
@@ -596,12 +597,18 @@ included_attributes:
     - :scheduled_at
     - :scheduling_type
     - :ci_stage
-    - :job_info_id
   builds: *statuses_definition
   generic_commit_statuses: *statuses_definition
   bridges: *statuses_definition
-  job_infos: # TODO: Assess attributes to export form ci_job_infos
+  job_infos: # TODO: Update with latest ci_job_infos attributes
+    - project_id
+    - name
     - scheduling_type
+    - config
+  job_infos:
+    - project_id
+    - job_id
+    - job_info_id
   ci_pipelines:
     - :ref
     - :sha
diff --git a/lib/gitlab/import_export/project/relation_factory.rb b/lib/gitlab/import_export/project/relation_factory.rb
index 6e89cae9b1f765..6542fe1eeadba6 100644
--- a/lib/gitlab/import_export/project/relation_factory.rb
+++ b/lib/gitlab/import_export/project/relation_factory.rb
@@ -46,7 +46,8 @@ class RelationFactory < Base::RelationFactory
                       work_item_description: 'WorkItems::Description',
                       user_contributions: 'User',
                       squash_option: 'Projects::BranchRules::SquashOption',
-                      job_infos: 'Ci::JobInfo' }.freeze
+                      job_infos: 'Ci::JobInfo',
+                      job_info_instances: 'Ci::JobInfoInstance' }.freeze
 
         BUILD_MODELS = %i[Ci::Build Ci::Bridge commit_status generic_commit_status].freeze
 
diff --git a/spec/factories/ci/job_info_instances.rb b/spec/factories/ci/job_info_instances.rb
new file mode 100644
index 00000000000000..964d0ee465941f
--- /dev/null
+++ b/spec/factories/ci/job_info_instances.rb
@@ -0,0 +1,9 @@
+# frozen_string_literal: true
+
+FactoryBot.define do
+  factory :ci_job_info_instance, class: 'Ci::JobInfoInstance' do
+    project factory: :project
+    job factory: :ci_build
+    job_info factory: :ci_job_info
+  end
+end
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 7506b6227c6111..691229fa7a6194 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -107,7 +107,8 @@
         processable.temp_job_definition = nil
       end
 
-      if processable.job_info_id
+      # job_info_instance is assigned when we run JobInfoBuilder
+      if processable.job_info_instance
         processable.association(:job_info).reload
         processable.temp_job_info = nil
       end
@@ -119,6 +120,12 @@
       end
     end
 
+    trait :without_job_info do
+      after(:build) do |processable, evaluator|
+        processable.temp_job_info = nil
+      end
+    end
+
     trait :waiting_for_resource do
       status { 'waiting_for_resource' }
     end
diff --git a/spec/lib/gitlab/import_export/all_models.yml b/spec/lib/gitlab/import_export/all_models.yml
index 5246a34b3fe937..8e5dcb752b51b1 100644
--- a/spec/lib/gitlab/import_export/all_models.yml
+++ b/spec/lib/gitlab/import_export/all_models.yml
@@ -996,6 +996,7 @@ project:
 - enabled_foundational_flows
 - enabled_foundational_flow_records
 - job_infos
+- job_info_instances
 award_emoji:
 - awardable
 - user
diff --git a/spec/models/ci/bridge_spec.rb b/spec/models/ci/bridge_spec.rb
index 323222984b9cda..3476b4c9cb8798 100644
--- a/spec/models/ci/bridge_spec.rb
+++ b/spec/models/ci/bridge_spec.rb
@@ -86,7 +86,6 @@
         pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
         scheduling_type ci_stage partition_id resource_group
-        job_info_id
       ]
 
       expect(described_class.clone_accessors).to eq(expected_accessors)
-- 
GitLab


From 15b1cbe22d1a194e5f7b231ae0986ef8e5cc3183 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 4 Dec 2025 10:13:12 -0800
Subject: [PATCH 18/27] Add needs_attributes to job_info

Add needs_atributes to job_info
---
 app/graphql/types/ci/build_need_type.rb       |  14 +++
 app/graphql/types/ci/job_need_union.rb        |   2 +-
 app/graphql/types/ci/job_type.rb              |   6 +-
 app/models/ci/job_info.rb                     |  25 +++-
 app/models/concerns/ci/metadatable.rb         |  32 ++---
 .../wip/read_from_ci_job_infos.yml            |   6 +-
 ...riting_ci_job_info_to_old_destinations.yml |   6 +-
 .../wip/write_to_ci_job_infos.yml             |   6 +-
 lib/gitlab/ci/needs/collection.rb             | 114 ++++++++++++++++++
 lib/gitlab/ci/yaml_processor/result.rb        |   1 +
 10 files changed, 181 insertions(+), 31 deletions(-)
 create mode 100644 lib/gitlab/ci/needs/collection.rb

diff --git a/app/graphql/types/ci/build_need_type.rb b/app/graphql/types/ci/build_need_type.rb
index dbdfc3c5176be5..3845845a0a5166 100644
--- a/app/graphql/types/ci/build_need_type.rb
+++ b/app/graphql/types/ci/build_need_type.rb
@@ -11,6 +11,20 @@ class BuildNeedType < BaseObject
         description: 'ID of the BuildNeed.'
       field :name, GraphQL::Types::String, null: true,
         description: 'Name of the job we need to complete.'
+
+      # To generate the pipeline dependencies graph, the FE just requires each need to have a
+      # unique ID; it doesn't have to be a "real" ID.
+      # Since job ID is globally unique, job names are unique within a pipeline, and a job
+      # cannot need the same job twice, a globally unique ID for each need can be made
+      # with just <job_id> + <name_of_needed_job>
+      def id
+        "gid://gitlab/Ci::BuildNeed/#{Digest::MD5.hexdigest("#{job_id}/#{object.name}")}"
+      end
+
+      # TODO: We can change this to just object.job_id after we drop ci_build_needs table
+      def job_id
+        object.is_a?(::Gitlab::Ci::Needs::Collection::Need) ? object.needed_by_job_id : object.build_id
+      end
     end
   end
 end
diff --git a/app/graphql/types/ci/job_need_union.rb b/app/graphql/types/ci/job_need_union.rb
index 61ad5432db820a..17996bac685450 100644
--- a/app/graphql/types/ci/job_need_union.rb
+++ b/app/graphql/types/ci/job_need_union.rb
@@ -9,7 +9,7 @@ class JobNeedUnion < GraphQL::Schema::Union
 
       def self.resolve_type(object, context)
         case object
-        when ::Ci::BuildNeed
+        when ::Ci::BuildNeed, ::Gitlab::Ci::Needs::Collection::Need
           Types::Ci::BuildNeedType
         when CommitStatus
           Types::Ci::JobType
diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index cdfec538791c8e..e9f3e2a29e2ab0 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -176,13 +176,17 @@ def trace
         object.trace if object.has_trace?
       end
 
+      def needs
+        object.intrinsic_needs
+      end
+
       def previous_stage_jobs_or_needs
         if object.scheduling_type == 'stage'
           Gitlab::Graphql::Lazy.with_value(previous_stage_jobs) do |jobs|
             jobs
           end
         else
-          object.needs
+          object.intrinsic_needs
         end
       end
 
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 0af619422939a8..221d8ce8359a94 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -18,15 +18,16 @@ class JobInfo < Ci::ApplicationRecord
     # Order is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
       :scheduling_type,
-      :name
+      :name,
+      :needs_attributes
     ].freeze
     NORMALIZED_DATA_COLUMNS = [
       :scheduling_type,
       :name
     ].freeze
 
-    # We're copying over these values to ci_job_infos but not dropping them from ci_builds
-    CI_BUILD_ATTRS_TO_KEEP = [:name].freeze
+    # We're copying over these values to ci_job_infos but not dropping them from their original/initial destinations
+    CONFIG_ATTRS_TO_KEEP = [:name, :needs_attributes].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
@@ -50,16 +51,17 @@ class JobInfo < Ci::ApplicationRecord
 
     def self.fabricate(config:, project_id:, partition_id:)
       sanitized_config = normalize_and_sanitize(config)
+      transformed_config = transform(sanitized_config)
 
       # NOTE: Checksum is generated with all attributes including normalized columns. But when storing
       # the data, we can save space by excluding the normalized column values from the config hash.
       attrs = {
         project_id: project_id,
         partition_id: partition_id,
-        config: sanitized_config.except(*NORMALIZED_DATA_COLUMNS),
-        checksum: generate_checksum(sanitized_config),
+        config: transformed_config.except(*NORMALIZED_DATA_COLUMNS),
+        checksum: generate_checksum(transformed_config),
         created_at: Time.current,
-        **sanitized_config.slice(*NORMALIZED_DATA_COLUMNS)
+        **transformed_config.slice(*NORMALIZED_DATA_COLUMNS)
       }
 
       new(attrs)
@@ -75,6 +77,17 @@ def self.normalize_and_sanitize(config)
       data.slice(*CONFIG_ATTRIBUTES)
     end
 
+    def self.transform(config)
+      return config unless config[:needs_attributes].present?
+
+      # For needs, we only need to store the names for the pipeline UI graph
+      config[:needs_attributes] = config[:needs_attributes].map do |need| 
+        need.slice(*::Gitlab::Ci::Needs::Collection::INTRINSIC_ATTRIBUTES)
+      end
+
+      config
+    end
+
     def self.generate_checksum(config)
       config
         .then { |data| Gitlab::Json.dump(data) }
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 42ded264366f92..e117e3c5e65009 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -191,10 +191,8 @@ def secrets=(_value)
       raise ActiveRecord::ReadonlyAttributeError, 'This data is read only'
     end
 
-    # TODO: Remove when ci_builds.scheduling_type is dropped
-    # and delegate to Ci::JobInfo.
     def scheduling_type
-      read_job_info_attribute(:scheduling_type)
+      read_job_info_attribute(:scheduling_type) || read_attribute(:scheduling_type)
     end
 
     # Need this method to overwrite ci_builds.scheduling_type enum.
@@ -221,6 +219,16 @@ def name=(value)
       write_attribute(:name, value)
     end
 
+    # We only store the needed jobs' names in job_info;
+    # full needs attributes for job processing are stored in job_definition
+    def intrinsic_needs
+      return needs
+      needs_attrs = read_job_info_attribute(:needs_attributes)
+      return needs unless needs_attrs.present?
+
+      ::Gitlab::Ci::Needs::Collection.new(needs_attrs)
+    end
+
     private
 
     def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, default_value = nil)
@@ -233,18 +241,14 @@ def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, defaul
       metadata&.read_attribute(metadata_key) || default_value
     end
 
-    def read_job_info_attribute(key, default_value: nil)
-      if read_from_ci_job_infos?
-        result = if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
-                   job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
-                 else
-                   job_info&.config&.dig(key) || temp_job_info&.config&.dig(key)
-                 end
-      end
+    def read_job_info_attribute(key)
+      return unless read_from_ci_job_infos?
 
-      return result if result
-
-      read_attribute(key) || default_value
+      if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
+        job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
+      else
+        job_info&.config&.dig(key) || temp_job_info&.config&.dig(key)
+      end
     end
 
     def read_from_ci_job_infos?
diff --git a/config/feature_flags/wip/read_from_ci_job_infos.yml b/config/feature_flags/wip/read_from_ci_job_infos.yml
index bfa9d1b110ffe9..4cc2deaf7e7766 100644
--- a/config/feature_flags/wip/read_from_ci_job_infos.yml
+++ b/config/feature_flags/wip/read_from_ci_job_infos.yml
@@ -1,9 +1,9 @@
 ---
 name: read_from_ci_job_infos
 description:
-feature_issue_url:
-introduced_by_url:
-rollout_issue_url:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
 milestone: '18.6'
 group: group::ci platform
 type: wip
diff --git a/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml b/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
index 2bde8077d20335..dbf1812b2e5ea3 100644
--- a/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
+++ b/config/feature_flags/wip/stop_writing_ci_job_info_to_old_destinations.yml
@@ -1,9 +1,9 @@
 ---
 name: stop_writing_ci_job_info_to_old_destinations
 description:
-feature_issue_url:
-introduced_by_url:
-rollout_issue_url:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
 milestone: '18.6'
 group: group::ci platform
 type: wip
diff --git a/config/feature_flags/wip/write_to_ci_job_infos.yml b/config/feature_flags/wip/write_to_ci_job_infos.yml
index b45a0f86fe75fa..c6c4433a780b9c 100644
--- a/config/feature_flags/wip/write_to_ci_job_infos.yml
+++ b/config/feature_flags/wip/write_to_ci_job_infos.yml
@@ -1,9 +1,9 @@
 ---
 name: write_to_ci_job_infos
 description:
-feature_issue_url:
-introduced_by_url:
-rollout_issue_url:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/577211
 milestone: '18.6'
 group: group::ci platform
 type: wip
diff --git a/lib/gitlab/ci/needs/collection.rb b/lib/gitlab/ci/needs/collection.rb
new file mode 100644
index 00000000000000..9b7acc5e329271
--- /dev/null
+++ b/lib/gitlab/ci/needs/collection.rb
@@ -0,0 +1,114 @@
+# frozen_string_literal: true
+
+module Gitlab
+  module Ci
+    module Needs
+      class Collection
+        INTRINSIC_ATTRIBUTES = [:name].freeze
+
+        Need = Struct.new(:job_id, :name, :artifacts, :optional, keyword_init: true)
+
+        def initialize(job, needs = [])
+          @needs = []
+          @needs_by_key = Hash.new { |h, k| h[k] = [] }
+          @errors = errors
+
+          variables.each { |variable| self.append(variable) }
+        end
+
+        def append(resource)
+          item = Collection::Item.fabricate(resource)
+          @needs.append(item)
+          @needs_by_key[item[:key]] << item
+
+          self
+        end
+
+        def compact
+          Collection.new(select { |variable| !variable.value.nil? })
+        end
+
+        def concat(resources)
+          return self if resources.nil?
+
+          tap { resources.each { |variable| self.append(variable) } }
+        end
+
+        def each
+          @needs.each { |variable| yield variable }
+        end
+
+        def +(other)
+          self.class.new.tap do |collection|
+            self.each { |variable| collection.append(variable) }
+            other.each { |variable| collection.append(variable) }
+          end
+        end
+
+        def [](key)
+          all(key)&.last
+        end
+
+        def all(key)
+          vars = @needs_by_key[key]
+          vars unless vars.empty?
+        end
+
+        def size
+          @needs.size
+        end
+
+        # This method should only be called via runner_variables->to_runner_variables
+        # because this is an expensive operation by initializing new objects in `to_runner_variable`.
+        def to_runner_variables
+          self.map(&:to_runner_variable)
+        end
+
+        def to_hash_variables
+          self.map(&:to_hash_variable)
+        end
+
+        def to_hash
+          self.each_with_object(ActiveSupport::HashWithIndifferentAccess.new) do |variable, result|
+            result[variable.key] = variable.value
+          end
+        end
+
+        def reject(&block)
+          Collection.new(@needs.reject(&block))
+        end
+
+        def sort_and_expand_all(keep_undefined: false, expand_file_refs: true, expand_raw_refs: true)
+          sorted = Sort.new(self)
+          return self.class.new(self, sorted.errors) unless sorted.valid?
+
+          new_collection = self.class.new
+
+          sorted.tsort.each do |item|
+            unless item.depends_on
+              new_collection.append(item)
+              next
+            end
+
+            # expand variables as they are added
+            variable = item.to_runner_variable
+            variable[:value] = new_collection.expand_value(variable[:value], keep_undefined: keep_undefined,
+              expand_file_refs: expand_file_refs,
+              expand_raw_refs: expand_raw_refs)
+            new_collection.append(variable)
+          end
+
+          new_collection
+        end
+
+        def to_s
+          "#{@needs_by_key.keys}, @errors='#{@errors}'"
+        end
+
+        private
+
+        attr_reader :needs
+      end
+    end
+  end
+end
diff --git a/lib/gitlab/ci/yaml_processor/result.rb b/lib/gitlab/ci/yaml_processor/result.rb
index d2c603a806551a..f6bc1583813a09 100644
--- a/lib/gitlab/ci/yaml_processor/result.rb
+++ b/lib/gitlab/ci/yaml_processor/result.rb
@@ -119,6 +119,7 @@ def stage_builds_attributes(stage)
 
         def build_attributes(name)
           job = jobs.fetch(name.to_sym, {})
+          binding.pry
 
           { stage_idx: stages.index(job[:stage]),
             stage: job[:stage],
-- 
GitLab


From d3badc56981004224baa61dbd141879348ec2883 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 5 Dec 2025 14:34:32 -0800
Subject: [PATCH 19/27] Create new JobNeeds::Collection class to represent
 needs

Introduces new class to represent a collection
of Need objects (essentially hashes turned into
Structs).
---
 app/graphql/types/ci/build_need_type.rb |  16 +---
 app/graphql/types/ci/job_need_union.rb  |   2 +-
 app/graphql/types/ci/job_type.rb        |   8 +-
 app/models/ci/job_info.rb               |   6 +-
 app/models/concerns/ci/metadatable.rb   |   5 +-
 doc/api/graphql/reference/_index.md     |   2 +-
 lib/gitlab/ci/job_needs/collection.rb   |  68 ++++++++++++++
 lib/gitlab/ci/needs/collection.rb       | 114 ------------------------
 lib/gitlab/ci/yaml_processor/result.rb  |   1 -
 9 files changed, 78 insertions(+), 144 deletions(-)
 create mode 100644 lib/gitlab/ci/job_needs/collection.rb
 delete mode 100644 lib/gitlab/ci/needs/collection.rb

diff --git a/app/graphql/types/ci/build_need_type.rb b/app/graphql/types/ci/build_need_type.rb
index 3845845a0a5166..78cccad41640fd 100644
--- a/app/graphql/types/ci/build_need_type.rb
+++ b/app/graphql/types/ci/build_need_type.rb
@@ -8,23 +8,9 @@ class BuildNeedType < BaseObject
       graphql_name 'CiBuildNeed'
 
       field :id, GraphQL::Types::ID, null: false,
-        description: 'ID of the BuildNeed.'
+        description: 'ID of Ci::BuildNeed or Gitlab::Ci::JobNeeds::Collection::Need.'
       field :name, GraphQL::Types::String, null: true,
         description: 'Name of the job we need to complete.'
-
-      # To generate the pipeline dependencies graph, the FE just requires each need to have a
-      # unique ID; it doesn't have to be a "real" ID.
-      # Since job ID is globally unique, job names are unique within a pipeline, and a job
-      # cannot need the same job twice, a globally unique ID for each need can be made
-      # with just <job_id> + <name_of_needed_job>
-      def id
-        "gid://gitlab/Ci::BuildNeed/#{Digest::MD5.hexdigest("#{job_id}/#{object.name}")}"
-      end
-
-      # TODO: We can change this to just object.job_id after we drop ci_build_needs table
-      def job_id
-        object.is_a?(::Gitlab::Ci::Needs::Collection::Need) ? object.needed_by_job_id : object.build_id
-      end
     end
   end
 end
diff --git a/app/graphql/types/ci/job_need_union.rb b/app/graphql/types/ci/job_need_union.rb
index 17996bac685450..7aaeaea0a3d177 100644
--- a/app/graphql/types/ci/job_need_union.rb
+++ b/app/graphql/types/ci/job_need_union.rb
@@ -9,7 +9,7 @@ class JobNeedUnion < GraphQL::Schema::Union
 
       def self.resolve_type(object, context)
         case object
-        when ::Ci::BuildNeed, ::Gitlab::Ci::Needs::Collection::Need
+        when ::Ci::BuildNeed, ::Gitlab::Ci::JobNeeds::Collection::Need
           Types::Ci::BuildNeedType
         when CommitStatus
           Types::Ci::JobType
diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index e9f3e2a29e2ab0..1bf595bb6cbbe5 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -26,7 +26,7 @@ class JobType < BaseObject
         description: 'Indicates the type of job.'
       field :name, GraphQL::Types::String, null: true,
         description: 'Name of the job.'
-      field :needs, BuildNeedType.connection_type, null: true,
+      field :needs, BuildNeedType.connection_type, null: true, method: :intrinsic_job_needs,
         description: 'References to builds that must complete before the jobs run.'
       field :pipeline, Types::Ci::PipelineInterface, null: true,
         description: 'Pipeline the job belongs to.'
@@ -176,17 +176,13 @@ def trace
         object.trace if object.has_trace?
       end
 
-      def needs
-        object.intrinsic_needs
-      end
-
       def previous_stage_jobs_or_needs
         if object.scheduling_type == 'stage'
           Gitlab::Graphql::Lazy.with_value(previous_stage_jobs) do |jobs|
             jobs
           end
         else
-          object.intrinsic_needs
+          object.intrinsic_job_needs
         end
       end
 
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 221d8ce8359a94..243d87dc07bcdd 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -68,7 +68,7 @@ def self.fabricate(config:, project_id:, partition_id:)
     end
 
     def self.normalize_and_sanitize(config)
-      data = config.symbolize_keys
+      data = config.deep_symbolize_keys
 
       NORMALIZED_DATA_COLUMNS.each do |col|
         data[col] = data.fetch(col) { column_defaults[col.to_s] }
@@ -81,8 +81,8 @@ def self.transform(config)
       return config unless config[:needs_attributes].present?
 
       # For needs, we only need to store the names for the pipeline UI graph
-      config[:needs_attributes] = config[:needs_attributes].map do |need| 
-        need.slice(*::Gitlab::Ci::Needs::Collection::INTRINSIC_ATTRIBUTES)
+      config[:needs_attributes] = config[:needs_attributes].map do |need_hash|
+        need_hash.slice(*::Gitlab::Ci::JobNeeds::Collection::INTRINSIC_ATTRIBUTES)
       end
 
       config
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index e117e3c5e65009..2927aba51095d1 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -221,12 +221,11 @@ def name=(value)
 
     # We only store the needed jobs' names in job_info;
     # full needs attributes for job processing are stored in job_definition
-    def intrinsic_needs
-      return needs
+    def intrinsic_job_needs
       needs_attrs = read_job_info_attribute(:needs_attributes)
       return needs unless needs_attrs.present?
 
-      ::Gitlab::Ci::Needs::Collection.new(needs_attrs)
+      ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs).to_a
     end
 
     private
diff --git a/doc/api/graphql/reference/_index.md b/doc/api/graphql/reference/_index.md
index 11d55a274d05ea..878610312b7adc 100644
--- a/doc/api/graphql/reference/_index.md
+++ b/doc/api/graphql/reference/_index.md
@@ -27118,7 +27118,7 @@ Check user's permission for the car.
 
 | Name | Type | Description |
 | ---- | ---- | ----------- |
-| <a id="cibuildneedid"></a>`id` | [`ID!`](#id) | ID of the BuildNeed. |
+| <a id="cibuildneedid"></a>`id` | [`ID!`](#id) | ID of Ci::BuildNeed or Gitlab::Ci::JobNeeds::Collection::Need. |
 | <a id="cibuildneedname"></a>`name` | [`String`](#string) | Name of the job we need to complete. |
 
 ### `CiCatalogResource`
diff --git a/lib/gitlab/ci/job_needs/collection.rb b/lib/gitlab/ci/job_needs/collection.rb
new file mode 100644
index 00000000000000..4eb8bd74647143
--- /dev/null
+++ b/lib/gitlab/ci/job_needs/collection.rb
@@ -0,0 +1,68 @@
+# frozen_string_literal: true
+
+module Gitlab
+  module Ci
+    module JobNeeds
+      # Represents a collection of Need objects. Constructed
+      # from needs_attributes (array of hashes).
+      class Collection
+        ATTRIBUTES = [:job_id, :name, :artifacts, :optional].freeze
+        INTRINSIC_ATTRIBUTES = [:name].freeze
+
+        Need = Struct.new(*ATTRIBUTES, keyword_init: true) do
+          include GlobalID::Identification
+
+          def initialize(job_id:, name:, artifacts: true, optional: false)
+            super
+          end
+
+          # To generate the pipeline dependencies graph, the FE just requires each need to have a
+          # unique ID; it doesn't have to be a DB-persisted ID.
+          # Since job ID is globally unique, job names are unique within a pipeline, and a job
+          # cannot need the same job twice, a globally unique ID for each need can be made
+          # with just <job_id> + <name_of_needed_job>
+          def id
+            @id ||= Digest::MD5.hexdigest("#{job_id}/#{name}") # rubocop:disable Fips/MD5 -- Not security-sensitive; used to generate unique ID
+          end
+        end
+
+        def initialize(job_id, needs_attributes = [])
+          @job_id = job_id
+          @needs = fabricate_needs(needs_attributes)
+        end
+
+        def to_a
+          needs
+        end
+
+        def size
+          needs.size
+        end
+
+        def each
+          needs.each { |need| yield(need) }
+        end
+
+        def names_with_artifacts_true
+          needs.select(&:artifacts).map(&:name)
+        end
+
+        def names
+          needs.map(&:name)
+        end
+
+        private
+
+        attr_reader :job_id, :needs
+
+        def fabricate_needs(needs_attributes)
+          needs_attributes.map do |need_hash|
+            attrs = need_hash.symbolize_keys.slice(*ATTRIBUTES)
+
+            Need.new(**attrs.merge(job_id: job_id))
+          end
+        end
+      end
+    end
+  end
+end
diff --git a/lib/gitlab/ci/needs/collection.rb b/lib/gitlab/ci/needs/collection.rb
deleted file mode 100644
index 9b7acc5e329271..00000000000000
--- a/lib/gitlab/ci/needs/collection.rb
+++ /dev/null
@@ -1,114 +0,0 @@
-# frozen_string_literal: true
-
-module Gitlab
-  module Ci
-    module Needs
-      class Collection
-        INTRINSIC_ATTRIBUTES = [:name].freeze
-
-        Need = Struct.new(:job_id, :name, :artifacts, :optional, keyword_init: true)
-
-        def initialize(job, needs = [])
-          @needs = []
-          @needs_by_key = Hash.new { |h, k| h[k] = [] }
-          @errors = errors
-
-          variables.each { |variable| self.append(variable) }
-        end
-
-        def append(resource)
-          item = Collection::Item.fabricate(resource)
-          @needs.append(item)
-          @needs_by_key[item[:key]] << item
-
-          self
-        end
-
-        def compact
-          Collection.new(select { |variable| !variable.value.nil? })
-        end
-
-        def concat(resources)
-          return self if resources.nil?
-
-          tap { resources.each { |variable| self.append(variable) } }
-        end
-
-        def each
-          @needs.each { |variable| yield variable }
-        end
-
-        def +(other)
-          self.class.new.tap do |collection|
-            self.each { |variable| collection.append(variable) }
-            other.each { |variable| collection.append(variable) }
-          end
-        end
-
-        def [](key)
-          all(key)&.last
-        end
-
-        def all(key)
-          vars = @needs_by_key[key]
-          vars unless vars.empty?
-        end
-
-        def size
-          @needs.size
-        end
-
-        # This method should only be called via runner_variables->to_runner_variables
-        # because this is an expensive operation by initializing new objects in `to_runner_variable`.
-        def to_runner_variables
-          self.map(&:to_runner_variable)
-        end
-
-        def to_hash_variables
-          self.map(&:to_hash_variable)
-        end
-
-        def to_hash
-          self.each_with_object(ActiveSupport::HashWithIndifferentAccess.new) do |variable, result|
-            result[variable.key] = variable.value
-          end
-        end
-
-        def reject(&block)
-          Collection.new(@needs.reject(&block))
-        end
-
-        def sort_and_expand_all(keep_undefined: false, expand_file_refs: true, expand_raw_refs: true)
-          sorted = Sort.new(self)
-          return self.class.new(self, sorted.errors) unless sorted.valid?
-
-          new_collection = self.class.new
-
-          sorted.tsort.each do |item|
-            unless item.depends_on
-              new_collection.append(item)
-              next
-            end
-
-            # expand variables as they are added
-            variable = item.to_runner_variable
-            variable[:value] = new_collection.expand_value(variable[:value], keep_undefined: keep_undefined,
-              expand_file_refs: expand_file_refs,
-              expand_raw_refs: expand_raw_refs)
-            new_collection.append(variable)
-          end
-
-          new_collection
-        end
-
-        def to_s
-          "#{@needs_by_key.keys}, @errors='#{@errors}'"
-        end
-
-        private
-
-        attr_reader :needs
-      end
-    end
-  end
-end
diff --git a/lib/gitlab/ci/yaml_processor/result.rb b/lib/gitlab/ci/yaml_processor/result.rb
index f6bc1583813a09..d2c603a806551a 100644
--- a/lib/gitlab/ci/yaml_processor/result.rb
+++ b/lib/gitlab/ci/yaml_processor/result.rb
@@ -119,7 +119,6 @@ def stage_builds_attributes(stage)
 
         def build_attributes(name)
           job = jobs.fetch(name.to_sym, {})
-          binding.pry
 
           { stage_idx: stages.index(job[:stage]),
             stage: job[:stage],
-- 
GitLab


From f86420769007e0c9771d98f7fad4d242b6963e32 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 5 Dec 2025 17:52:27 -0800
Subject: [PATCH 20/27] Fix some spec failures

Changes to fix some spec failures.
---
 app/graphql/resolvers/ci/all_jobs_resolver.rb |  4 ++--
 .../resolvers/ci/runner_jobs_resolver.rb      |  1 +
 app/graphql/types/ci/stage_type.rb            |  2 +-
 app/models/project.rb                         |  3 ++-
 ee/lib/api/ai/duo_workflows/workflows.rb      |  2 +-
 lib/api/ci/pipelines.rb                       |  2 +-
 .../import_export/project/import_export.yml   | 20 +++++++++----------
 spec/db/schema_spec.rb                        |  2 +-
 8 files changed, 18 insertions(+), 18 deletions(-)

diff --git a/app/graphql/resolvers/ci/all_jobs_resolver.rb b/app/graphql/resolvers/ci/all_jobs_resolver.rb
index 6513f0ebde54dc..9b86caf16436f2 100644
--- a/app/graphql/resolvers/ci/all_jobs_resolver.rb
+++ b/app/graphql/resolvers/ci/all_jobs_resolver.rb
@@ -61,8 +61,8 @@ def preloads
           previous_stage_jobs_or_needs: [:needs, :pipeline],
           artifacts: [:job_artifacts],
           pipeline: [:user],
-          kind: [:metadata, :job_definition, :error_job_messages],
-          retryable: [:metadata, :job_definition, :error_job_messages],
+          kind: [:metadata, :job_definition, :job_info, :error_job_messages],
+          retryable: [:metadata, :job_definition, :job_info, :error_job_messages],
           project: [{ project: [:route, { namespace: [:route] }] }],
           commit_path: [:pipeline, { project: { namespace: [:route] } }],
           ref_path: [{ project: [:route, { namespace: [:route] }] }],
diff --git a/app/graphql/resolvers/ci/runner_jobs_resolver.rb b/app/graphql/resolvers/ci/runner_jobs_resolver.rb
index 35a3690ec15749..54554e8ed7b73c 100644
--- a/app/graphql/resolvers/ci/runner_jobs_resolver.rb
+++ b/app/graphql/resolvers/ci/runner_jobs_resolver.rb
@@ -36,6 +36,7 @@ def preloads
           detailed_status: [
             :metadata,
             :job_definition,
+            :job_info,
             :error_job_messages,
             { pipeline: [:merge_request] },
             { project: [:route, { namespace: :route }] }
diff --git a/app/graphql/types/ci/stage_type.rb b/app/graphql/types/ci/stage_type.rb
index a525da932715d0..bf191739d8d9fe 100644
--- a/app/graphql/types/ci/stage_type.rb
+++ b/app/graphql/types/ci/stage_type.rb
@@ -64,7 +64,7 @@ def jobs_for_pipeline(pipeline, stage_ids, include_needs)
         jobs = pipeline.statuses.latest.where(stage_id: stage_ids)
 
         preloaded_relations = [
-          :project, :metadata, :job_definition, :job_artifacts,
+          :project, :metadata, :job_definition, :job_info, :job_artifacts,
           :downstream_pipeline, :error_job_messages
         ]
         preloaded_relations << :needs if include_needs
diff --git a/app/models/project.rb b/app/models/project.rb
index 57f488722a5b77..7c9319822c0bd4 100644
--- a/app/models/project.rb
+++ b/app/models/project.rb
@@ -466,7 +466,8 @@ def with_developer_access
   has_many :build_trace_chunks, class_name: 'Ci::BuildTraceChunk', through: :builds, source: :trace_chunks, dependent: :restrict_with_error
   has_many :build_report_results, class_name: 'Ci::BuildReportResult', inverse_of: :project
   has_many :job_artifacts, class_name: 'Ci::JobArtifact', dependent: :restrict_with_error
-  has_many :job_infos, class_name: 'Ci::JobInfo', inverse_of: :project # NOTE: I think we need this for project export
+  has_many :job_infos, class_name: 'Ci::JobInfo', inverse_of: :project
+  has_many :job_info_instances, class_name: 'Ci::JobInfoInstance', inverse_of: :project
   has_many :pipeline_artifacts, class_name: 'Ci::PipelineArtifact', inverse_of: :project, dependent: :restrict_with_error
   has_many :runner_projects, class_name: 'Ci::RunnerProject', inverse_of: :project
   has_many :runners, through: :runner_projects, source: :runner, class_name: 'Ci::Runner'
diff --git a/ee/lib/api/ai/duo_workflows/workflows.rb b/ee/lib/api/ai/duo_workflows/workflows.rb
index 1838f4cbb37fdf..213a0005a2a6f4 100644
--- a/ee/lib/api/ai/duo_workflows/workflows.rb
+++ b/ee/lib/api/ai/duo_workflows/workflows.rb
@@ -422,7 +422,7 @@ def create_workflow_params
               end
               post do
                 ::Gitlab::QueryLimiting.disable!(
-                  'https://gitlab.com/gitlab-org/gitlab/-/issues/566195', new_threshold: 115
+                  'https://gitlab.com/gitlab-org/gitlab/-/issues/566195', new_threshold: 118
                 )
 
                 container = if params[:project_id]
diff --git a/lib/api/ci/pipelines.rb b/lib/api/ci/pipelines.rb
index c95df387a51ab6..91cfcb395fe53a 100644
--- a/lib/api/ci/pipelines.rb
+++ b/lib/api/ci/pipelines.rb
@@ -189,7 +189,7 @@ class Pipelines < ::API::Base
             .new(current_user: current_user, pipeline: pipeline, params: params)
             .execute
 
-          builds = builds.with_preloads.preload(:metadata, :job_definition, :runner_manager, :ci_stage) # rubocop:disable CodeReuse/ActiveRecord -- preload job.archived?
+          builds = builds.with_preloads.preload(:metadata, :job_definition, :job_info, :runner_manager, :ci_stage) # rubocop:disable CodeReuse/ActiveRecord -- preload job.archived?
 
           present paginate(builds), with: Entities::Ci::Job
         end
diff --git a/lib/gitlab/import_export/project/import_export.yml b/lib/gitlab/import_export/project/import_export.yml
index 9b24c3d3d2fc93..a6ae67ef1992d5 100644
--- a/lib/gitlab/import_export/project/import_export.yml
+++ b/lib/gitlab/import_export/project/import_export.yml
@@ -107,8 +107,8 @@ tree:
       - :external_pull_request
       - :merge_request
       - :pipeline_metadata
-    - :job_infos # TODO: I think this is necessary to export; to confirm
-    - :job_info_instances # TODO: I think this is necessary to export; to confirm
+    - :job_infos # TODO: I think these tables are necessary to export?
+    - :job_info_instances  # TODO: Need to confirm correct way to export job_info_instances in this yaml
     - :auto_devops
     - :pipeline_schedules
     - :container_expiration_policy
@@ -600,15 +600,13 @@ included_attributes:
   builds: *statuses_definition
   generic_commit_statuses: *statuses_definition
   bridges: *statuses_definition
-  job_infos: # TODO: Update with latest ci_job_infos attributes
-    - project_id
-    - name
-    - scheduling_type
-    - config
-  job_infos:
-    - project_id
-    - job_id
-    - job_info_id
+  job_infos: # TODO: Update with latest attributes
+    - :project_id
+    - :scheduling_type
+    - :name
+    - :config
+  job_info_instances:
+    - :project_id
   ci_pipelines:
     - :ref
     - :sha
diff --git a/spec/db/schema_spec.rb b/spec/db/schema_spec.rb
index 75bbac1d87cd39..e274a854bc8c7f 100644
--- a/spec/db/schema_spec.rb
+++ b/spec/db/schema_spec.rb
@@ -294,7 +294,7 @@
       merge_requests: 29,
       namespaces: 26,
       notes: 16,
-      p_ci_builds: 27,
+      p_ci_builds: 26,
       p_ci_pipelines: 24,
       packages_package_files: 16,
       packages_packages: 27,
-- 
GitLab


From 90a97f4aa0a140a9e9150a7b2c0704730b5df9f4 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 5 Dec 2025 18:24:47 -0800
Subject: [PATCH 21/27] Store/read needs_attributes from ci_job_definitions

Stores and reads needs_attributes from ci_job_definitions
instead of ci_build_needs.
---
 app/graphql/types/ci/job_type.rb              | 12 +++-
 app/models/ci/build_dependencies.rb           |  7 ++-
 app/models/ci/job_definition.rb               |  2 +-
 app/models/ci/job_info.rb                     | 47 +++++++++-------
 app/models/ci/pipeline.rb                     |  2 +-
 app/models/ci/processable.rb                  | 31 +++++++++-
 app/models/commit_status.rb                   | 10 +++-
 app/models/concerns/ci/metadatable.rb         | 53 +++++++++++++-----
 app/services/ci/clone_job_service.rb          | 52 ++++++++++++++++-
 .../atomic_processing_service.rb              | 12 +++-
 app/services/ci/reset_skipped_jobs_service.rb | 12 +++-
 app/services/ci/retry_job_service.rb          |  1 +
 app/services/ci/retry_pipeline_service.rb     |  2 +-
 .../ci_job_definition_config.json             |  4 ++
 .../read_needs_from_ci_job_definitions.yml    | 10 ++++
 .../wip/stop_writing_to_ci_build_needs.yml    | 10 ++++
 .../wip/write_needs_to_ci_job_definitions.yml | 10 ++++
 ee/lib/gitlab/ci/pipeline/jobs_injector.rb    |  8 ++-
 lib/gitlab/ci/job_needs/collection.rb         | 20 ++++---
 lib/gitlab/ci/processable_object_hierarchy.rb | 56 ++++++++++++++++++-
 lib/gitlab/graphql/pagination/connections.rb  |  4 ++
 spec/factories/ci/builds.rb                   | 18 ++++++
 spec/factories/ci/processable.rb              |  8 ++-
 spec/models/ci/processable_spec.rb            |  9 ++-
 spec/services/ci/clone_job_service_spec.rb    | 19 ++++---
 .../ci/create_pipeline_service_spec.rb        |  5 +-
 .../atomic_processing_service_spec.rb         |  5 ++
 .../ci/reset_skipped_jobs_service_spec.rb     |  6 +-
 spec/services/ci/retry_job_service_spec.rb    | 18 +++++-
 .../support/helpers/ci/job_factory_helpers.rb |  8 +--
 spec/support/helpers/ci/job_helpers.rb        | 24 ++++----
 31 files changed, 393 insertions(+), 92 deletions(-)
 create mode 100644 config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
 create mode 100644 config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
 create mode 100644 config/feature_flags/wip/write_needs_to_ci_job_definitions.yml

diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index 1bf595bb6cbbe5..60c774af9b116d 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -26,7 +26,7 @@ class JobType < BaseObject
         description: 'Indicates the type of job.'
       field :name, GraphQL::Types::String, null: true,
         description: 'Name of the job.'
-      field :needs, BuildNeedType.connection_type, null: true, method: :intrinsic_job_needs,
+      field :needs, BuildNeedType.connection_type, null: true,
         description: 'References to builds that must complete before the jobs run.'
       field :pipeline, Types::Ci::PipelineInterface, null: true,
         description: 'Pipeline the job belongs to.'
@@ -176,13 +176,21 @@ def trace
         object.trace if object.has_trace?
       end
 
+      def needs
+        if object.read_from_job_info?
+          object.intrinsic_job_needs
+        else
+          object.needs
+        end
+      end
+
       def previous_stage_jobs_or_needs
         if object.scheduling_type == 'stage'
           Gitlab::Graphql::Lazy.with_value(previous_stage_jobs) do |jobs|
             jobs
           end
         else
-          object.intrinsic_job_needs
+          needs
         end
       end
 
diff --git a/app/models/ci/build_dependencies.rb b/app/models/ci/build_dependencies.rb
index 7e821394ea96c4..b105359a381518 100644
--- a/app/models/ci/build_dependencies.rb
+++ b/app/models/ci/build_dependencies.rb
@@ -133,7 +133,12 @@ def from_previous_stages(scope)
     end
 
     def from_needs(scope)
-      needs_names = processable.needs.artifacts.select(:name)
+      needs_names = if processable.read_needs_from_job_definition?
+                      processable.job_needs.names
+                    else
+                      processable.needs.artifacts.select(:name)
+                    end
+
       scope.where(name: needs_names)
     end
 
diff --git a/app/models/ci/job_definition.rb b/app/models/ci/job_definition.rb
index b3cc77352aedeb..76a732081ca3b1 100644
--- a/app/models/ci/job_definition.rb
+++ b/app/models/ci/job_definition.rb
@@ -22,7 +22,7 @@ class JobDefinition < Ci::ApplicationRecord
       :secrets,
       :interruptible
     ].freeze
-    CONFIG_ATTRIBUTES = (CONFIG_ATTRIBUTES_FROM_METADATA + [:tag_list, :run_steps]).freeze
+    CONFIG_ATTRIBUTES = (CONFIG_ATTRIBUTES_FROM_METADATA + [:tag_list, :run_steps, :needs_attributes]).freeze
     NORMALIZED_DATA_COLUMNS = %i[interruptible].freeze
 
     query_constraints :id, :partition_id
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 243d87dc07bcdd..3536f0c5704d18 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -14,20 +14,18 @@ class JobInfo < Ci::ApplicationRecord
 
     ignore_column :search_vector, remove_never: true # Value is auto-generated by DB; must ignore it for bulk insert
 
-    # IMPORTANT: Append new attributes at the end of this list. Do not change the order!
-    # Order is important for the checksum calculation.
+    # IMPORTANT: Order of attribute keys is important for the checksum calculation.
     CONFIG_ATTRIBUTES = [
-      :scheduling_type,
-      :name,
       :needs_attributes
     ].freeze
     NORMALIZED_DATA_COLUMNS = [
       :scheduling_type,
       :name
     ].freeze
+    ALL_ATTRIBUTES = CONFIG_ATTRIBUTES + NORMALIZED_DATA_COLUMNS
 
-    # We're copying over these values to ci_job_infos but not dropping them from their original/initial destinations
-    CONFIG_ATTRS_TO_KEEP = [:name, :needs_attributes].freeze
+    # We're copying over these values to ci_job_infos but not removing them from their original/initial destinations
+    COPY_ONLY_ATTRIBUTES = [:name, :needs_attributes].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
@@ -49,47 +47,47 @@ class JobInfo < Ci::ApplicationRecord
     scope :for_project, ->(project_id) { where(project_id: project_id) }
     scope :for_checksum, ->(checksum) { where(checksum: checksum) }
 
-    def self.fabricate(config:, project_id:, partition_id:)
-      sanitized_config = normalize_and_sanitize(config)
-      transformed_config = transform(sanitized_config)
+    def self.fabricate(attrs:, project_id:, partition_id:)
+      sanitized_attrs = normalize_and_sanitize(attrs)
+      transformed_attrs = transform(sanitized_attrs)
 
       # NOTE: Checksum is generated with all attributes including normalized columns. But when storing
       # the data, we can save space by excluding the normalized column values from the config hash.
       attrs = {
         project_id: project_id,
         partition_id: partition_id,
-        config: transformed_config.except(*NORMALIZED_DATA_COLUMNS),
-        checksum: generate_checksum(transformed_config),
+        config: transformed_attrs.except(*NORMALIZED_DATA_COLUMNS),
+        checksum: generate_checksum(transformed_attrs),
         created_at: Time.current,
-        **transformed_config.slice(*NORMALIZED_DATA_COLUMNS)
+        **transformed_attrs.slice(*NORMALIZED_DATA_COLUMNS)
       }
 
       new(attrs)
     end
 
-    def self.normalize_and_sanitize(config)
-      data = config.deep_symbolize_keys
+    def self.normalize_and_sanitize(attrs)
+      data = attrs.deep_symbolize_keys
 
       NORMALIZED_DATA_COLUMNS.each do |col|
         data[col] = data.fetch(col) { column_defaults[col.to_s] }
       end
 
-      data.slice(*CONFIG_ATTRIBUTES)
+      data.slice(*ALL_ATTRIBUTES)
     end
 
-    def self.transform(config)
-      return config unless config[:needs_attributes].present?
+    def self.transform(attrs)
+      return attrs unless attrs.key?(:needs_attributes)
 
       # For needs, we only need to store the names for the pipeline UI graph
-      config[:needs_attributes] = config[:needs_attributes].map do |need_hash|
+      attrs[:needs_attributes] = attrs[:needs_attributes].map do |need_hash|
         need_hash.slice(*::Gitlab::Ci::JobNeeds::Collection::INTRINSIC_ATTRIBUTES)
       end
 
-      config
+      attrs
     end
 
-    def self.generate_checksum(config)
-      config
+    def self.generate_checksum(attrs)
+      attrs
         .then { |data| Gitlab::Json.dump(data) }
         .then { |data| Digest::SHA256.hexdigest(data) }
     end
@@ -97,5 +95,12 @@ def self.generate_checksum(config)
     def readonly?
       persisted?
     end
+
+    # Hash containing all attributes: config + normalized_data
+    # TODO: We should do this for Ci::JobDefinition and update Ci::JobHelpers#stub_ci_job_definition
+    # to merge all_attributes instead of just config.
+    def all_attributes
+      attributes.deep_symbolize_keys.slice(*ALL_ATTRIBUTES).merge(config)
+    end
   end
 end
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index fbbf6c0bf4efe4..48125b238f208c 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -742,7 +742,7 @@ def trigger_status_change_subscriptions
 
     def uses_needs?
       # TODO: Check if should keep index_p_ci_job_infos_on_id_where_scheduling_type_dag or a different index
-      if Feature.enabled?(:read_from_ci_job_infos, project) && processables.has_job_infos?
+      if processables.read_from_job_infos?
         processables
           .joins(:job_info)
           .where(p_ci_job_infos: { scheduling_type: :dag })
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index c44ccfe81ccca5..4b1bd7e7c00101 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -61,14 +61,17 @@ class Processable < ::CommitStatus
 
     scope :preload_needs, -> { preload(:needs) }
     scope :preload_job_definition_instances, -> { preload(:job_definition_instance) }
+    scope :preload_job_definitions, -> { preload(:job_definition) }
     scope :manual_actions, -> { where(when: :manual, status: COMPLETED_STATUSES + %i[manual]) }
 
+    # TODO: We can probably remove this scope; it's not used anywhere.
     scope :with_needs, ->(names = nil) do
       needs = Ci::BuildNeed.scoped_build.select(1)
       needs = needs.where(name: names) if names
       where('EXISTS (?)', needs)
     end
 
+    # TODO: We can probably remove this scope; it's not used anywhere.
     scope :without_needs, ->(names = nil) do
       needs = Ci::BuildNeed.scoped_build.select(1)
       needs = needs.where(name: names) if names
@@ -159,13 +162,27 @@ class Processable < ::CommitStatus
 
     def self.fabricate(attrs)
       attrs = attrs.dup
+      info_attrs = attrs.slice(*Ci::JobInfo::ALL_ATTRIBUTES)
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
-      info_attrs = attrs.slice(*Ci::JobInfo::CONFIG_ATTRIBUTES)
 
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
+      # TODO: Remove this line with FF `stop_writing_to_ci_build_needs`
+      attrs[:needs_attributes] = definition_attrs[:needs_attributes] if definition_attrs.key?(:needs_attributes)
+
+      if Feature.enabled?(:write_needs_to_ci_job_definitions, attrs[:project])
+        # We always include the needs_attributes key to signal that we've started writing needs to job_definitions.
+        # But this means _all_ job_definitions have to be regenerated. See read_needs_from_job_definitions? for further
+        # context. We either do this or migrate all the data to job_definitions before turning on
+        # FF `read_needs_from_ci_job_definitions`.
+        definition_attrs[:needs_attributes] ||= []
+      else
+        definition_attrs.delete(:needs_attributes)
+      end
+
+      attrs.delete(:needs_attributes) if Feature.enabled?(:stop_writing_to_ci_build_needs, attrs[:project])
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-        attrs.delete(*[Ci::JobInfo::CONFIG_ATTRIBUTES - Ci::JobInfo::CONFIG_ATTRS_TO_KEEP])
+        attrs.delete(*[Ci::JobInfo::ALL_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
       end
 
       new(attrs).tap do |job|
@@ -180,7 +197,7 @@ def self.fabricate(attrs)
         next unless Feature.enabled?(:write_to_ci_job_infos, attrs[:project])
 
         job_info = ::Ci::JobInfo.fabricate(
-          config: info_attrs,
+          attrs: info_attrs,
           project_id: job.project_id,
           partition_id: job.partition_id
         )
@@ -215,6 +232,14 @@ def self.populate_scheduling_type!
       )
     end
 
+    # TODO: Remove this method after migrating ci_build_needs to ci_job_definitions.
+    # This method should only be used on a single pipeline's processables.
+    def self.read_needs_from_job_definitions?
+      # If a pipeline is created with FF `write_needs_to_ci_job_definitions` enabled, then all its jobs would
+      # have job_definition records with the `needs_attributes` key in the config value. So we just check one job.
+      first&.read_needs_from_job_definition?
+    end
+
     def assign_resource_from_resource_group(processable)
       Ci::ResourceGroups::AssignResourceFromResourceGroupWorker.perform_async(processable.resource_group_id)
     end
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index ca75f072852756..732a0ffc76d343 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -35,7 +35,7 @@ class CommitStatus < Ci::ApplicationRecord
     inverse_of: :statuses
 
   # NOTE: We need to have these relationships in CommitStatus because generic
-  # commit statuses also use the columns in `Ci::JobInfo::CONFIG_ATTRIBUTES`.
+  # commit statuses also use the columns in `Ci::JobInfo::ALL_ATTRIBUTES`.
   has_one :job_info_instance, ->(job) { in_partition(job) },
     class_name: 'Ci::JobInfoInstance',
     foreign_key: :job_id,
@@ -125,6 +125,10 @@ class CommitStatus < Ci::ApplicationRecord
     preload(:job_info)
   end
 
+  scope :with_job_info_instance_preload, -> do
+    preload(:job_info_instance)
+  end
+
   scope :scoped_pipeline, -> do
     where(arel_table[:commit_id].eq(Ci::Pipeline.arel_table[:id]))
     .where(arel_table[:partition_id].eq(Ci::Pipeline.arel_table[:partition_id]))
@@ -278,11 +282,11 @@ def self.locking_enabled?
 
   # TODO: Remove this method after scheduling_type data migrated to ci_job_infos
   # This method should only be used on a single pipeline's processables.
-  def self.has_job_infos?
+  def self.read_from_job_infos?
     # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
     # have job_info records. So we just need to check one job if it has job_info.
     # We check the oldest job in the pipeline since recent retries would create a new job_info record when cloning.
-    first&.job_info.present?
+    first&.read_from_job_info?
   end
 
   def locking_enabled?
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 2927aba51095d1..aea5d618079932 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -222,11 +222,29 @@ def name=(value)
     # We only store the needed jobs' names in job_info;
     # full needs attributes for job processing are stored in job_definition
     def intrinsic_job_needs
-      needs_attrs = read_job_info_attribute(:needs_attributes)
-      return needs unless needs_attrs.present?
+      needs_attrs = read_job_info_attribute(:needs_attributes, [])
 
-      ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs).to_a
+      ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs)
     end
+    strong_memoize_attr :intrinsic_job_needs
+
+    def job_needs
+      needs_attrs = read_job_definition_attribute(:needs_attributes, [])
+
+      ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs)
+    end
+    strong_memoize_attr :job_needs
+
+    def read_needs_from_job_definition?
+      Feature.enabled?(:read_needs_from_ci_job_definitions, project) &&
+        (job_definition&.config&.key?(:needs_attributes) || temp_job_definition&.config&.key?(:needs_attributes))
+    end
+    strong_memoize_attr :read_needs_from_job_definition?
+
+    def read_from_job_info?
+      Feature.enabled?(:read_from_ci_job_infos, project) && job_info.present?
+    end
+    strong_memoize_attr :read_from_job_info?
 
     private
 
@@ -234,26 +252,33 @@ def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, defaul
       result = read_attribute(legacy_key) if legacy_key
       return result if result
 
-      result = job_definition&.config&.dig(job_definition_key) || temp_job_definition&.config&.dig(job_definition_key)
+      result = read_job_definition_attribute(job_definition_key)
       return result if result
 
       metadata&.read_attribute(metadata_key) || default_value
     end
 
-    def read_job_info_attribute(key)
-      return unless read_from_ci_job_infos?
+    def read_job_definition_attribute(key, default_value = nil)
+      result = if key.in?(::Ci::JobDefinition::NORMALIZED_DATA_COLUMNS)
+                 job_definition&.read_attribute(key) || temp_job_definition&.read_attribute(key)
+               else
+                 job_definition&.config&.dig(key) || temp_job_definition&.config&.dig(key)
+               end
 
-      if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
-        job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
-      else
-        job_info&.config&.dig(key) || temp_job_info&.config&.dig(key)
-      end
+      result || default_value
     end
 
-    def read_from_ci_job_infos?
-      Feature.enabled?(:read_from_ci_job_infos, project)
+    def read_job_info_attribute(key, default_value = nil)
+      return unless read_from_job_info?
+
+      result = if key.in?(::Ci::JobInfo::NORMALIZED_DATA_COLUMNS)
+                 job_info&.read_attribute(key) || temp_job_info&.read_attribute(key)
+               else
+                 job_info&.config&.dig(key) || temp_job_info&.config&.dig(key)
+               end
+
+      result || default_value
     end
-    strong_memoize_attr :read_from_ci_job_infos?
   end
 end
 
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 639f8b7530ed80..6dfbb31b55e6db 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -13,7 +13,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
       add_job_variables_attributes!(new_attributes, new_job_variables)
       add_job_inputs_attributes!(new_attributes, new_job_inputs)
       add_job_definition_attributes!(new_attributes)
-      # TODO: Need to update cloning to create job_info record if it doesn't already exist
+      add_job_info_attributes!(new_attributes) if Feature.enabled?(:write_to_ci_job_infos, project)
 
       new_attributes[:user] = current_user
 
@@ -25,7 +25,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
     attr_reader :job, :current_user
 
     delegate :persisted_environment, :expanded_environment_name,
-      :job_definition_instance, :project, :project_id,
+      :job_definition_instance, :job_info_instance, :project, :project_id,
       :partition_id, :metadata, :pipeline,
       to: :job
 
@@ -91,6 +91,44 @@ def find_or_create_job_definition
       ).execute.first
     end
 
+    def add_job_info_attributes!(attributes)
+      if job_info_instance
+        add_existing_job_info_attributes!(attributes)
+      else
+        add_new_job_info_attributes!(attributes)
+      end
+    end
+
+    def add_existing_job_info_attributes!(attributes)
+      attributes[:job_info_instance_attributes] = {
+        project_id: project_id,
+        job_info_id: job_info_instance.job_info_id,
+        partition_id: job_info_instance.partition_id
+      }
+    end
+
+    def add_new_job_info_attributes!(attributes)
+      persisted_job_info = find_or_create_job_info
+
+      attributes[:job_info_instance_attributes] = {
+        project: project,
+        job_info: persisted_job_info,
+        partition_id: partition_id
+      }
+    end
+
+    def find_or_create_job_info
+      info = ::Ci::JobInfo.fabricate(
+        attrs: build_info_attributes,
+        project_id: project_id,
+        partition_id: partition_id
+      )
+
+      ::Gitlab::Ci::JobInfos::FindOrCreate.new(
+        pipeline, infos: [info]
+      ).execute.first
+    end
+
     def build_definition_attributes
       attrs = {
         options: metadata.config_options,
@@ -101,9 +139,19 @@ def build_definition_attributes
         run_steps: job.try(:execution_config)&.run_steps || []
       }
 
+      attrs[:needs_attributes] = job.needs_attributes if Feature.enabled?(:write_needs_to_ci_job_definitions, project)
+
       attrs[:interruptible] = metadata.interruptible unless metadata.interruptible.nil?
 
       attrs
     end
+
+    def build_info_attributes
+      {
+        scheduling_type: job.scheduling_type,
+        name: job.name,
+        needs_attributes: job.needs_attributes
+      }
+    end
   end
 end
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service.rb b/app/services/ci/pipeline_processing/atomic_processing_service.rb
index 050bf8a4c1a34e..edb4d45f445d27 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service.rb
@@ -93,11 +93,19 @@ def load_jobs(ids)
       def sort_jobs(jobs)
         Gitlab::Ci::YamlProcessor::Dag.order( # rubocop: disable CodeReuse/ActiveRecord -- this is not ActiveRecord
           jobs.to_h do |job|
-            [job.name, job.aggregated_needs_names.to_a]
+            [job.name, aggregated_needs_names(job)]
           end
         )
       end
 
+      def aggregated_needs_names(job)
+        if job.read_needs_from_job_definition?
+          job.job_needs.names
+        else
+          job.aggregated_needs_names.to_a
+        end
+      end
+
       def update_pipeline!
         pipeline.set_status(@collection.status_of_all)
       end
@@ -130,7 +138,7 @@ def update_job!(job)
       def status_of_previous_jobs(job)
         if job.scheduling_type_dag?
           # job uses DAG, get status of all dependent needs
-          @collection.status_of_jobs(job.aggregated_needs_names.to_a)
+          @collection.status_of_jobs(aggregated_needs_names(job))
         else
           # job uses Stages, get status of prior stage
           @collection.status_of_jobs_prior_to_stage(job.stage_idx.to_i)
diff --git a/app/services/ci/reset_skipped_jobs_service.rb b/app/services/ci/reset_skipped_jobs_service.rb
index 9e5c887b31bab4..1c8f65224b9d5b 100644
--- a/app/services/ci/reset_skipped_jobs_service.rb
+++ b/app/services/ci/reset_skipped_jobs_service.rb
@@ -32,6 +32,8 @@ def dependent_jobs
           .skipped
           .ordered_by_stage
           .preload(:needs)
+          .preload_job_definitions
+          .with_project_preload
       )
     end
 
@@ -66,10 +68,18 @@ def ordered_by_dag(jobs)
     def sort_jobs(jobs)
       Gitlab::Ci::YamlProcessor::Dag.order(
         jobs.to_h do |job|
-          [job.name, job.needs.map(&:name)]
+          [job.name, aggregated_needs_names(job)]
         end
       )
     end
     # rubocop: enable CodeReuse/ActiveRecord
+
+    def aggregated_needs_names(job)
+      if job.read_needs_from_job_definition?
+        job.job_needs.names
+      else
+        job.needs.map(&:name)
+      end
+    end
   end
 end
diff --git a/app/services/ci/retry_job_service.rb b/app/services/ci/retry_job_service.rb
index a17aeea09d3a10..4688d9e7ec1e32 100644
--- a/app/services/ci/retry_job_service.rb
+++ b/app/services/ci/retry_job_service.rb
@@ -11,6 +11,7 @@ def execute(job, variables: [], inputs: {})
         return processed_inputs if processed_inputs.error?
 
         job.ensure_scheduling_type!
+
         new_job = retry_job(job, variables: variables, inputs: processed_inputs.payload[:inputs])
 
         track_retry_with_new_input_values(processed_inputs.payload[:inputs])
diff --git a/app/services/ci/retry_pipeline_service.rb b/app/services/ci/retry_pipeline_service.rb
index 741a0613e811e4..5fcd8cf745f3d6 100644
--- a/app/services/ci/retry_pipeline_service.rb
+++ b/app/services/ci/retry_pipeline_service.rb
@@ -44,7 +44,7 @@ def check_access(pipeline)
     private
 
     def builds_relation(pipeline)
-      pipeline.retryable_builds.preload_needs.preload_job_definition_instances
+      pipeline.retryable_builds.preload_needs.preload_job_definition_instances.with_job_info_instance_preload
     end
 
     def can_be_retried?(job)
diff --git a/app/validators/json_schemas/ci_job_definition_config.json b/app/validators/json_schemas/ci_job_definition_config.json
index 68e65ceb22b378..cc6ad5d4f1e917 100644
--- a/app/validators/json_schemas/ci_job_definition_config.json
+++ b/app/validators/json_schemas/ci_job_definition_config.json
@@ -10,6 +10,10 @@
     "interruptible": {
       "type": "boolean"
     },
+    "needs_attributes": {
+      "type": "array",
+      "description": "TODO: Add full configuration for needs_attributes"
+    },
     "options": {
       "$ref": "./build_metadata_config_options.json"
     },
diff --git a/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml b/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
new file mode 100644
index 00000000000000..d9cc16f3017569
--- /dev/null
+++ b/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
@@ -0,0 +1,10 @@
+---
+name: read_needs_from_ci_job_definitions
+description:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+milestone: '18.7'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml b/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
new file mode 100644
index 00000000000000..5bf20990b79ffd
--- /dev/null
+++ b/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
@@ -0,0 +1,10 @@
+---
+name: stop_writing_to_ci_build_needs
+description:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+milestone: '18.7'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml b/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml
new file mode 100644
index 00000000000000..27c3b508472113
--- /dev/null
+++ b/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml
@@ -0,0 +1,10 @@
+---
+name: write_needs_to_ci_job_definitions
+description:
+feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
+rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
+milestone: '18.7'
+group: group::ci platform
+type: wip
+default_enabled: false
diff --git a/ee/lib/gitlab/ci/pipeline/jobs_injector.rb b/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
index e86177d3132c39..9f25ef352224e4 100644
--- a/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
+++ b/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
@@ -85,7 +85,7 @@ def add_job(stage:, job:)
 
           stage.statuses << job
           pipeline_jobs_by_name[job.name] = job
-          @jobs_with_needs << job if job.needs.present?
+          @jobs_with_needs << job if has_needs?(job)
         end
 
         def update_needs_references!
@@ -95,6 +95,12 @@ def update_needs_references!
             need.name = @job_renames.fetch(need.name, need.name)
           end
         end
+
+        # TODO: Could we simply replace this with checking if scheduling_type == :dag?
+        # If not, we can keep the logic below.
+        def has_needs?(job)
+          job.read_needs_from_job_definition? ? job.job_needs.any? : job.needs.present?
+        end
       end
     end
   end
diff --git a/lib/gitlab/ci/job_needs/collection.rb b/lib/gitlab/ci/job_needs/collection.rb
index 4eb8bd74647143..fadc50ed852082 100644
--- a/lib/gitlab/ci/job_needs/collection.rb
+++ b/lib/gitlab/ci/job_needs/collection.rb
@@ -6,10 +6,12 @@ module JobNeeds
       # Represents a collection of Need objects. Constructed
       # from needs_attributes (array of hashes).
       class Collection
-        ATTRIBUTES = [:job_id, :name, :artifacts, :optional].freeze
+        include Enumerable
+
+        ATTRIBUTES = [:name, :artifacts, :optional].freeze
         INTRINSIC_ATTRIBUTES = [:name].freeze
 
-        Need = Struct.new(*ATTRIBUTES, keyword_init: true) do
+        Need = Struct.new(:job_id, *ATTRIBUTES, keyword_init: true) do
           include GlobalID::Identification
 
           def initialize(job_id:, name:, artifacts: true, optional: false)
@@ -24,6 +26,10 @@ def initialize(job_id:, name:, artifacts: true, optional: false)
           def id
             @id ||= Digest::MD5.hexdigest("#{job_id}/#{name}") # rubocop:disable Fips/MD5 -- Not security-sensitive; used to generate unique ID
           end
+
+          def attributes
+            to_h.slice(*ATTRIBUTES)
+          end
         end
 
         def initialize(job_id, needs_attributes = [])
@@ -31,10 +37,6 @@ def initialize(job_id, needs_attributes = [])
           @needs = fabricate_needs(needs_attributes)
         end
 
-        def to_a
-          needs
-        end
-
         def size
           needs.size
         end
@@ -51,12 +53,16 @@ def names
           needs.map(&:name)
         end
 
+        def to_attributes_array
+          needs.map(&:attributes)
+        end
+
         private
 
         attr_reader :job_id, :needs
 
         def fabricate_needs(needs_attributes)
-          needs_attributes.map do |need_hash|
+          needs_attributes.to_a.map do |need_hash|
             attrs = need_hash.symbolize_keys.slice(*ATTRIBUTES)
 
             Need.new(**attrs.merge(job_id: job_id))
diff --git a/lib/gitlab/ci/processable_object_hierarchy.rb b/lib/gitlab/ci/processable_object_hierarchy.rb
index c1531c3f4ab6cd..80be94d11ca783 100644
--- a/lib/gitlab/ci/processable_object_hierarchy.rb
+++ b/lib/gitlab/ci/processable_object_hierarchy.rb
@@ -3,10 +3,20 @@
 module Gitlab
   module Ci
     class ProcessableObjectHierarchy < ::Gitlab::ObjectHierarchy
+      include Gitlab::Utils::StrongMemoize
+
+      def base_and_descendants
+        return super unless read_needs_from_job_definitions?
+
+        super.with(job_needs_cte.to_arel) # rubocop:disable CodeReuse/ActiveRecord -- Required to include job_needs_cte in query
+      end
+
       private
 
       def middle_table
-        ::Ci::BuildNeed.arel_table
+        return ::Ci::BuildNeed.arel_table unless read_needs_from_job_definitions?
+
+        job_needs_cte.table
       end
 
       def from_tables(cte)
@@ -17,6 +27,7 @@ def parent_id_column(_cte)
         middle_table[:name]
       end
 
+      # TODO: We could probably improve these conditions with partition pruning
       def ancestor_conditions(cte)
         middle_table[:name].eq(objects_table[:name]).and(
           middle_table[:build_id].eq(cte.table[:id])
@@ -32,6 +43,49 @@ def descendant_conditions(cte)
           objects_table[:commit_id].eq(cte.table[:commit_id])
         )
       end
+
+      # TODO: We could also pass this in as an argument instead
+      def pipeline
+        ancestors_base.first.pipeline
+      end
+      strong_memoize_attr :pipeline
+
+      # This processable object hierachy is the main challenge with dropping ci_build_needs.
+      # One idea is to recreate the table on-the-fly as a CTE by exploding the
+      # `needs_attributes` value from job definitions.
+      #
+      # I believe we only need the latest needed jobs of the given pipeline since
+      # we shouldn't need to process old jobs or jobs outside of it. So this table would
+      # be relatively small when materialized.
+      def job_needs_cte
+        # This query could be refactored to be more efficient
+        sql = <<~SQL
+          SELECT
+            p_ci_builds.partition_id,
+            p_ci_builds.id AS build_id,
+            needs_attributes ->> 'name' AS name
+          FROM
+            p_ci_builds
+            INNER JOIN p_ci_job_definition_instances
+              ON p_ci_builds.id = p_ci_job_definition_instances.job_id
+              AND p_ci_builds.partition_id = p_ci_job_definition_instances.partition_id
+            INNER JOIN p_ci_job_definitions
+              ON p_ci_job_definition_instances.job_definition_id = p_ci_job_definitions.id
+              AND p_ci_job_definition_instances.partition_id = p_ci_job_definitions.partition_id
+          CROSS JOIN LATERAL
+            jsonb_array_elements(p_ci_job_definitions.config->'needs_attributes') AS needs_attributes
+          WHERE
+            p_ci_builds.partition_id = #{pipeline.partition_id}
+            AND p_ci_builds.id IN (#{pipeline.processables.latest.select(:id).to_sql})
+        SQL
+
+        Gitlab::SQL::CTE.new(:job_needs, sql)
+      end
+
+      def read_needs_from_job_definitions?
+        pipeline.processables.read_needs_from_job_definitions?
+      end
+      strong_memoize_attr :read_needs_from_job_definitions?
     end
   end
 end
diff --git a/lib/gitlab/graphql/pagination/connections.rb b/lib/gitlab/graphql/pagination/connections.rb
index 073853b6d5d468..839937d033f21e 100644
--- a/lib/gitlab/graphql/pagination/connections.rb
+++ b/lib/gitlab/graphql/pagination/connections.rb
@@ -25,6 +25,10 @@ def self.use(schema)
             Array,
             Gitlab::Graphql::Pagination::ArrayConnection)
 
+          schema.connections.add(
+            Gitlab::Ci::JobNeeds::Collection,
+            Gitlab::Graphql::Pagination::ArrayConnection)
+
           schema.connections.add(
             ::ClickHouse::Client::QueryBuilder,
             Gitlab::Graphql::Pagination::ClickHouseConnection
diff --git a/spec/factories/ci/builds.rb b/spec/factories/ci/builds.rb
index 99230176e71307..e5e15c942d27ec 100644
--- a/spec/factories/ci/builds.rb
+++ b/spec/factories/ci/builds.rb
@@ -106,7 +106,25 @@
         needed { association(:ci_build, name: needed_name, pipeline: pipeline) }
       end
 
+      after(:build) do |build, evaluator|
+        if Feature.enabled?(:write_to_ci_job_infos, build.project)
+          Ci::JobFactoryHelpers.mutate_temp_job_info(
+            build,
+            needs_attributes: [{ name: evaluator.needed.name }]
+          )
+        end
+
+        if Feature.enabled?(:write_needs_to_ci_job_definitions, build.project)
+          Ci::JobFactoryHelpers.mutate_temp_job_definition(
+            build,
+            needs_attributes: [{ name: evaluator.needed.name }]
+          )
+        end
+      end
+
       after(:create) do |build, evaluator|
+        next if Feature.enabled?(:stop_writing_to_ci_build_needs, build.project)
+
         build.needs << create(:ci_build_need, build: build, name: evaluator.needed.name)
       end
     end
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 691229fa7a6194..34ed9e0284df17 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -22,17 +22,23 @@
       yaml_variables { [] }
       stage { 'test' }
       scheduling_type { 'stage' }
+      needs_attributes { [] }
     end
 
     after(:stub, :build) do |processable, evaluator|
       Ci::JobFactoryHelpers.mutate_temp_job_definition(
         processable, options: evaluator.options, yaml_variables: evaluator.yaml_variables)
 
+      if Feature.enabled?(:write_needs_to_ci_job_definitions, processable.project)
+        Ci::JobFactoryHelpers.mutate_temp_job_definition(processable, needs_attributes: evaluator.needs_attributes.to_a)
+      end
+
       if Feature.enabled?(:write_to_ci_job_infos, processable.project)
         Ci::JobFactoryHelpers.mutate_temp_job_info(
           processable,
           scheduling_type: evaluator.scheduling_type,
-          name: processable.name
+          name: processable.name,
+          needs_attributes: evaluator.needs_attributes.to_a
         )
       end
 
diff --git a/spec/models/ci/processable_spec.rb b/spec/models/ci/processable_spec.rb
index d7321c215625e8..35fd29afce02d5 100644
--- a/spec/models/ci/processable_spec.rb
+++ b/spec/models/ci/processable_spec.rb
@@ -135,7 +135,7 @@
         temp_job_definition: instance_of(Ci::JobDefinition),
         job_definition: nil
       )
-      expect(fabricate.temp_job_definition.config).to eq({ options: build_attributes[:options] })
+      expect(fabricate.temp_job_definition.config).to eq({ options: build_attributes[:options], needs_attributes: [] })
       expect(fabricate.temp_job_definition.project_id).to eq(build_attributes[:project_id])
       expect(fabricate.temp_job_definition.partition_id).to eq(build_attributes[:partition_id])
     end
@@ -250,9 +250,16 @@
     let!(:another_build) { create(:ci_build, project: project) }
 
     before do
+      pipeline.processables.each { |job| job.clear_memoization(:read_from_job_info?) }
+      stub_feature_flags(read_from_ci_job_infos: false)
+      # Jobs with a job_info record would never have nil scheduling_type
       described_class.update_all(scheduling_type: nil)
     end
 
+    after do
+      pipeline.processables.each { |job| job.clear_memoization(:read_from_job_info?) }
+    end
+
     it 'populates scheduling_type of processables' do
       expect do
         pipeline.processables.populate_scheduling_type!
diff --git a/spec/services/ci/clone_job_service_spec.rb b/spec/services/ci/clone_job_service_spec.rb
index 065d20ad22a5d5..98bff4e23c0ffd 100644
--- a/spec/services/ci/clone_job_service_spec.rb
+++ b/spec/services/ci/clone_job_service_spec.rb
@@ -15,6 +15,7 @@
   end
 
   let(:new_job_variables) { [] }
+  let_it_be(:needs_attributes) { [{ name: 'test-needed-job' }] }
 
   shared_context 'when job is a bridge' do
     let_it_be(:downstream_project) { create(:project, :repository) }
@@ -23,7 +24,7 @@
       create(:ci_bridge, :success, :resource_group,
         pipeline: pipeline, downstream: downstream_project,
         description: 'a trigger job', stage_id: stage.id,
-        environment: 'production')
+        environment: 'production', needs_attributes: needs_attributes)
     end
 
     let(:clone_accessors) { ::Ci::Bridge.clone_accessors }
@@ -45,7 +46,8 @@
         timeout: 3600,
         timeout_source: 2,
         exit_code: 127, # command not found
-        debug_trace_enabled: false
+        debug_trace_enabled: false,
+        needs_attributes: needs_attributes
       )
     end
 
@@ -94,7 +96,8 @@
         dast_site_profile dast_scanner_profile stage_id dast_site_profiles_build
         dast_scanner_profiles_build auto_canceled_by_partition_id execution_config_id execution_config
         build_source id_value inputs error_job_messages
-        job_definition job_definition_instance job_messages temp_job_definition interruptible].freeze
+        job_definition job_definition_instance job_messages temp_job_definition interruptible
+        job_info job_info_instance temp_job_info].freeze
     end
 
     before_all do
@@ -116,7 +119,7 @@
 
   shared_examples_for 'clones the job' do
     before do
-      create(:ci_build_need, build: job)
+      create(:ci_build_need, build: job, name: job.job_needs.first.name)
     end
 
     describe 'clone accessors' do
@@ -167,11 +170,12 @@
         end
       end
 
-      context 'when the job definitions do not exit' do
+      context 'when the job definitions do not exist' do
         before do
           create(:ci_build_metadata, build: job)
           Ci::JobDefinitionInstance.delete_all
           Ci::JobDefinition.delete_all
+          job.reload
         end
 
         it 'creates a new job definition from metadata' do
@@ -180,7 +184,7 @@
         end
       end
 
-      context 'when a job definition for the metadata attributes already exits' do
+      context 'when a job definition for the metadata attributes already exists' do
         let(:metadata) do
           create(:ci_build_metadata, build: job,
             config_options: job.options,
@@ -198,7 +202,8 @@
             secrets: metadata.secrets,
             tag_list: job.tag_list.to_a,
             run_steps: job.try(:execution_config)&.run_steps || [],
-            interruptible: metadata.interruptible
+            interruptible: metadata.interruptible,
+            needs_attributes: job.needs_attributes
           }
         end
 
diff --git a/spec/services/ci/create_pipeline_service_spec.rb b/spec/services/ci/create_pipeline_service_spec.rb
index d30f93af368ac2..e01014d1a3ae75 100644
--- a/spec/services/ci/create_pipeline_service_spec.rb
+++ b/spec/services/ci/create_pipeline_service_spec.rb
@@ -87,7 +87,8 @@ def execute_service(
             1 + # SELECT "ci_builds".* FROM "ci_builds"
             1 + # INSERT INTO "ci_builds"
             1 + # INSERT INTO "ci_builds_metadata"
-            1   # SELECT "taggings".* FROM "taggings"
+            1 + # SELECT "taggings".* FROM "taggings"
+            7 # TODO: Fix the extra queries
         end
       end
     end
@@ -1689,6 +1690,8 @@ def previous_commit_sha_from_ref(ref)
         end
 
         it 'bulk inserts all needs' do
+          stub_feature_flags(stop_writing_to_ci_build_needs: false)
+
           expect(Ci::BuildNeed).to receive(:bulk_insert!).and_call_original
 
           expect(pipeline).to be_persisted
diff --git a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
index fef18cd2cdb7cb..043bb2d211b4a4 100644
--- a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
+++ b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
@@ -6,6 +6,11 @@
   include RepoHelpers
   include ExclusiveLeaseHelpers
 
+  before do
+    # TEMP: To pass tests for now
+    allow(Gitlab::QueryLimiting::Transaction).to receive(:threshold).and_return(300)
+  end
+
   describe 'Pipeline Processing Service Tests With Yaml' do
     let_it_be(:project) { create(:project, :repository) }
     let_it_be(:user)    { project.first_owner }
diff --git a/spec/services/ci/reset_skipped_jobs_service_spec.rb b/spec/services/ci/reset_skipped_jobs_service_spec.rb
index c5f1cfb1b711cd..06dad52a1108f0 100644
--- a/spec/services/ci/reset_skipped_jobs_service_spec.rb
+++ b/spec/services/ci/reset_skipped_jobs_service_spec.rb
@@ -422,7 +422,11 @@ def processables
 
   def jobs_name_status_owner_needs
     processables.reload.map do |job|
-      job.attributes.slice('name', 'status', 'user_id').merge('needs' => job.needs.map(&:name))
+      if job.read_needs_from_job_definition?
+        job.attributes.slice('name', 'status', 'user_id').merge('needs' => job.job_needs.names)
+      else
+        job.attributes.slice('name', 'status', 'user_id').merge('needs' => job.needs.map(&:name))
+      end
     end
   end
 end
diff --git a/spec/services/ci/retry_job_service_spec.rb b/spec/services/ci/retry_job_service_spec.rb
index 6770cfad0adf35..1e96714e168b9d 100644
--- a/spec/services/ci/retry_job_service_spec.rb
+++ b/spec/services/ci/retry_job_service_spec.rb
@@ -64,10 +64,11 @@
   shared_examples_for 'clones the job' do
     let(:job) { job_to_clone }
 
-    before_all do
+    before do
       job_to_clone.update!(ci_stage: stage)
 
-      create(:ci_build_need, build: job_to_clone)
+      need = create(:ci_build_need, build: job_to_clone)
+      stub_ci_job_info(job_to_clone, needs_attributes: [{ name: need.name }])
     end
 
     context 'when the user has ability to execute job' do
@@ -88,7 +89,11 @@
 
       context 'when the job has needs' do
         before do
-          create_list(:ci_build_need, 2, build: job)
+          needs = create_list(:ci_build_need, 2, build: job)
+
+          needs.each do |need|
+            stub_ci_job_info(job, needs_attributes: [{ name: need.name }])
+          end
         end
 
         it 'bulk inserts all the needs' do
@@ -177,10 +182,17 @@
 
       context 'when job has a nil scheduling_type' do
         before do
+          job.clear_memoization(:read_from_job_info?)
+          # Jobs with a job_info record would never have nil scheduling_type
+          stub_feature_flags(read_from_ci_job_infos: false)
           job.pipeline.processables.update_all(scheduling_type: nil)
           job.reload
         end
 
+        after do
+          job.clear_memoization(:read_from_job_info?)
+        end
+
         it 'populates scheduling_type of processables' do
           expect(new_job.scheduling_type).to eq('stage')
           expect(job.reload.scheduling_type).to eq('stage')
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index 9b58a001f11b7d..b0436e4f6754d6 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -22,12 +22,12 @@ def self.mutate_temp_job_definition(job, **new_config)
     end
 
     # TODO: Maybe we can combine this with mutate_temp_job_definition and call it `mutate_temp_job_config`?
-    def self.mutate_temp_job_info(job, **new_config)
-      # Deep merge is required because job config changes are meant to be cumulative within factories
-      updated_config = (job.temp_job_info&.config || {}).deep_merge(new_config)
+    def self.mutate_temp_job_info(job, **new_attrs)
+      # Deep merge is required because job info changes are meant to be cumulative within factories
+      updated_attrs = (job.temp_job_info&.all_attributes || {}).deep_merge(new_attrs)
 
       new_temp_job_info = ::Ci::JobInfo.fabricate(
-        config: updated_config,
+        attrs: updated_attrs,
         project_id: job.pipeline.project.id,
         partition_id: job.pipeline.partition_id
       )
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 3457b1d5cd2a9c..e46f126613d944 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -13,7 +13,8 @@ def stub_ci_job_definition(job, **new_config)
       end
 
       # We use regular merge (not deep_merge) to completely overwrite existing attributes
-      updated_config = (job.job_definition&.config || job.temp_job_definition&.config || {}).merge(new_config)
+      updated_config = (job.job_definition&.config || job.temp_job_definition&.config || {})
+                         .merge(new_config)
 
       new_job_definition = ::Ci::JobDefinition.fabricate(
         config: updated_config,
@@ -28,22 +29,22 @@ def stub_ci_job_definition(job, **new_config)
       allow(job).to receive(:job_definition).and_return(new_job_definition)
     end
 
-    # TODO: Maybe we can combine this with stub_ci_job_definition and call it `stub_ci_job_config`?
-    def stub_ci_job_info(job, **new_config)
-      new_config.symbolize_keys!
-      unknown_keys = new_config.keys - Ci::JobInfo::CONFIG_ATTRIBUTES
+    # TODO: Maybe we can combine this with stub_ci_job_definition and call it `stub_ci_job_attrs`?
+    def stub_ci_job_info(job, **new_attrs)
+      new_attrs.symbolize_keys!
+      unknown_keys = new_attrs.keys - Ci::JobInfo::ALL_ATTRIBUTES
 
       if unknown_keys.any?
         raise ArgumentError,
-          "You can only stub valid job info config attributes. Invalid key(s): #{unknown_keys.join(', ')}. " \
-            "Allowed: #{Ci::JobInfo::CONFIG_ATTRIBUTES.join(', ')}"
+          "You can only stub valid job info attributes. Invalid key(s): #{unknown_keys.join(', ')}. " \
+            "Allowed: #{Ci::JobInfo::ALL_ATTRIBUTES.join(', ')}"
       end
 
       # We use regular merge (not deep_merge) to completely overwrite existing attributes
-      updated_config = (job.job_info&.config || job.temp_job_info&.config || {}).merge(new_config)
+      updated_attrs = (job.job_info&.all_attributes || job.temp_job_info&.all_attributes || {}).merge(new_attrs)
 
       new_job_info = ::Ci::JobInfo.fabricate(
-        config: updated_config,
+        attrs: updated_attrs,
         project_id: job.pipeline.project.id,
         partition_id: job.pipeline.partition_id
       )
@@ -53,10 +54,7 @@ def stub_ci_job_info(job, **new_config)
       config_errors = new_job_info.errors[:config]
       raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
 
-      allow(job).to receive_messages(
-        job_info: new_job_info,
-        name: new_job_info.name # Stub columns we're still keeping in ci_builds
-      )
+      allow(job).to receive(:job_info).and_return(new_job_info)
     end
   end
 end
-- 
GitLab


From c0fa11c852427c1e7711401d3db28ed18feefbc6 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 10 Dec 2025 14:35:09 -0800
Subject: [PATCH 22/27] Apply suggestions to move methods

Applied suggestions to move need-related methods.
---
 app/models/ci/build_dependencies.rb                  |  2 +-
 app/models/ci/pipeline.rb                            |  7 +++++++
 app/models/ci/processable.rb                         |  8 --------
 app/models/concerns/ci/metadatable.rb                | 12 ++++++++++++
 app/services/ci/reset_skipped_jobs_service.rb        | 10 +---------
 ee/lib/gitlab/ci/pipeline/jobs_injector.rb           |  8 +-------
 lib/gitlab/ci/processable_object_hierarchy.rb        |  2 +-
 spec/models/ci/build_dependencies_spec.rb            |  6 ++++--
 .../atomic_processing_service_spec.rb                | 10 ++++++++++
 9 files changed, 37 insertions(+), 28 deletions(-)

diff --git a/app/models/ci/build_dependencies.rb b/app/models/ci/build_dependencies.rb
index b105359a381518..7f358b2aa52258 100644
--- a/app/models/ci/build_dependencies.rb
+++ b/app/models/ci/build_dependencies.rb
@@ -134,7 +134,7 @@ def from_previous_stages(scope)
 
     def from_needs(scope)
       needs_names = if processable.read_needs_from_job_definition?
-                      processable.job_needs.names
+                      processable.job_needs.names_with_artifacts_true
                     else
                       processable.needs.artifacts.select(:name)
                     end
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index 48125b238f208c..42eec2550c8713 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -723,6 +723,13 @@ def self.internal_id_scope_usage
       :ci_pipelines
     end
 
+    # TODO: Remove this method after migrating ci_build_needs to ci_job_definitions.
+    def read_needs_from_job_definitions?
+      # If a pipeline is created with FF `write_needs_to_ci_job_definitions` enabled, then all its jobs would
+      # have job_definition records with the `needs_attributes` key in the config value. So we just check one job.
+      processables.first&.read_needs_from_job_definition?
+    end
+
     def ci_pipeline_statuses_rate_limited?
       Gitlab::ApplicationRateLimiter.throttled?(
         :ci_pipeline_statuses_subscription,
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 4b1bd7e7c00101..ea4df95db06d3d 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -232,14 +232,6 @@ def self.populate_scheduling_type!
       )
     end
 
-    # TODO: Remove this method after migrating ci_build_needs to ci_job_definitions.
-    # This method should only be used on a single pipeline's processables.
-    def self.read_needs_from_job_definitions?
-      # If a pipeline is created with FF `write_needs_to_ci_job_definitions` enabled, then all its jobs would
-      # have job_definition records with the `needs_attributes` key in the config value. So we just check one job.
-      first&.read_needs_from_job_definition?
-    end
-
     def assign_resource_from_resource_group(processable)
       Ci::ResourceGroups::AssignResourceFromResourceGroupWorker.perform_async(processable.resource_group_id)
     end
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index aea5d618079932..2bd48b8fa8ee86 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -235,6 +235,18 @@ def job_needs
     end
     strong_memoize_attr :job_needs
 
+    def needs_names
+      if read_needs_from_job_definition?
+        job_needs.names
+      else
+        needs.map(&:name)
+      end
+    end
+
+    def has_needs?
+      read_needs_from_job_definition? ? job_needs.any? : needs.present?
+    end
+
     def read_needs_from_job_definition?
       Feature.enabled?(:read_needs_from_ci_job_definitions, project) &&
         (job_definition&.config&.key?(:needs_attributes) || temp_job_definition&.config&.key?(:needs_attributes))
diff --git a/app/services/ci/reset_skipped_jobs_service.rb b/app/services/ci/reset_skipped_jobs_service.rb
index 1c8f65224b9d5b..3931fa4fdf5fe6 100644
--- a/app/services/ci/reset_skipped_jobs_service.rb
+++ b/app/services/ci/reset_skipped_jobs_service.rb
@@ -68,18 +68,10 @@ def ordered_by_dag(jobs)
     def sort_jobs(jobs)
       Gitlab::Ci::YamlProcessor::Dag.order(
         jobs.to_h do |job|
-          [job.name, aggregated_needs_names(job)]
+          [job.name, job.needs_names]
         end
       )
     end
     # rubocop: enable CodeReuse/ActiveRecord
-
-    def aggregated_needs_names(job)
-      if job.read_needs_from_job_definition?
-        job.job_needs.names
-      else
-        job.needs.map(&:name)
-      end
-    end
   end
 end
diff --git a/ee/lib/gitlab/ci/pipeline/jobs_injector.rb b/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
index 9f25ef352224e4..d924689018784c 100644
--- a/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
+++ b/ee/lib/gitlab/ci/pipeline/jobs_injector.rb
@@ -85,7 +85,7 @@ def add_job(stage:, job:)
 
           stage.statuses << job
           pipeline_jobs_by_name[job.name] = job
-          @jobs_with_needs << job if has_needs?(job)
+          @jobs_with_needs << job if job.has_needs?
         end
 
         def update_needs_references!
@@ -95,12 +95,6 @@ def update_needs_references!
             need.name = @job_renames.fetch(need.name, need.name)
           end
         end
-
-        # TODO: Could we simply replace this with checking if scheduling_type == :dag?
-        # If not, we can keep the logic below.
-        def has_needs?(job)
-          job.read_needs_from_job_definition? ? job.job_needs.any? : job.needs.present?
-        end
       end
     end
   end
diff --git a/lib/gitlab/ci/processable_object_hierarchy.rb b/lib/gitlab/ci/processable_object_hierarchy.rb
index 80be94d11ca783..3412fde01eee0b 100644
--- a/lib/gitlab/ci/processable_object_hierarchy.rb
+++ b/lib/gitlab/ci/processable_object_hierarchy.rb
@@ -83,7 +83,7 @@ def job_needs_cte
       end
 
       def read_needs_from_job_definitions?
-        pipeline.processables.read_needs_from_job_definitions?
+        pipeline.read_needs_from_job_definitions?
       end
       strong_memoize_attr :read_needs_from_job_definitions?
     end
diff --git a/spec/models/ci/build_dependencies_spec.rb b/spec/models/ci/build_dependencies_spec.rb
index 95ef5e4b009742..59065634a41470 100644
--- a/spec/models/ci/build_dependencies_spec.rb
+++ b/spec/models/ci/build_dependencies_spec.rb
@@ -71,7 +71,8 @@
             name: 'dag_job',
             scheduling_type: :dag,
             stage_idx: 2,
-            ci_stage: deploy_stage
+            ci_stage: deploy_stage,
+            needs_attributes: [{ name: 'staging', artifacts: true }]
           )
         end
 
@@ -96,7 +97,8 @@
           scheduling_type: scheduling_type,
           stage_idx: 3,
           ci_stage: deploy_stage,
-          options: { dependencies: dependencies }
+          options: { dependencies: dependencies },
+          needs_attributes: needs.to_a
         )
       end
 
diff --git a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
index 043bb2d211b4a4..bda7939ed9b491 100644
--- a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
+++ b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
@@ -789,6 +789,10 @@ def event_on_pipeline(event)
     end
 
     context 'when pipeline with needs is created', :sidekiq_inline do
+      before do
+        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+      end
+
       let!(:linux_build) { create_build('linux:build', stage: 'build', stage_idx: 0) }
       let!(:mac_build) { create_build('mac:build', stage: 'build', stage_idx: 0) }
       let!(:linux_rspec) { create_build('linux:rspec', stage: 'test', stage_idx: 1, scheduling_type: :dag) }
@@ -839,6 +843,10 @@ def event_on_pipeline(event)
       end
 
       context 'when one of the jobs is run on a failure' do
+        before do
+          stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+        end
+
         let!(:linux_notify) { create_build('linux:notify', stage: 'deploy', stage_idx: 2, when: 'on_failure', scheduling_type: :dag) }
 
         let!(:linux_notify_on_build) { create(:ci_build_need, build: linux_notify, name: 'linux:build') }
@@ -899,6 +907,7 @@ def event_on_pipeline(event)
       let!(:deploy) { create_build('deploy', stage: 'deploy', stage_idx: 2, scheduling_type: :dag) }
 
       before do
+        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
         create(:ci_build_need, build: deploy, name: 'linux:build')
       end
 
@@ -921,6 +930,7 @@ def event_on_pipeline(event)
       let!(:deploy) { create_build('deploy', stage: 'deploy', stage_idx: 1, scheduling_type: :dag) }
 
       before do
+        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
         create(:ci_build_need, build: deploy, name: 'linux:build')
       end
 
-- 
GitLab


From 2f751b8bc01d38f27921fae7403191984ff64456 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Wed, 10 Dec 2025 17:34:37 -0800
Subject: [PATCH 23/27] Add source column to ci_job_infos

Adds source column to ci_job_infos and model.
---
 app/finders/ci/build_source_finder.rb              | 2 ++
 app/models/ci/job_info.rb                          | 1 +
 db/migrate/20251202000001_create_p_ci_job_infos.rb | 5 +++++
 db/structure.sql                                   | 3 +++
 4 files changed, 11 insertions(+)

diff --git a/app/finders/ci/build_source_finder.rb b/app/finders/ci/build_source_finder.rb
index 8c27ece61e9ed2..f16f846de8e336 100644
--- a/app/finders/ci/build_source_finder.rb
+++ b/app/finders/ci/build_source_finder.rb
@@ -1,6 +1,8 @@
 # frozen_string_literal: true
 
 module Ci
+  # TODO: Check what index(es) on ci_job_infos is best to support this Finder's queries.
+  # TODO: Compare query performance before/after moving ci_build_sources to ci_job_infos.
   class BuildSourceFinder
     def initialize(relation:, sources:, project:, params: {})
       raise ArgumentError, 'Only Ci::Builds are source searchable' unless relation.klass == Ci::Build
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 3536f0c5704d18..64fbe6623372e4 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -20,6 +20,7 @@ class JobInfo < Ci::ApplicationRecord
     ].freeze
     NORMALIZED_DATA_COLUMNS = [
       :scheduling_type,
+      :source,
       :name
     ].freeze
     ALL_ATTRIBUTES = CONFIG_ATTRIBUTES + NORMALIZED_DATA_COLUMNS
diff --git a/db/migrate/20251202000001_create_p_ci_job_infos.rb b/db/migrate/20251202000001_create_p_ci_job_infos.rb
index 1fe63ede5eeeae..221b07387b0b8f 100644
--- a/db/migrate/20251202000001_create_p_ci_job_infos.rb
+++ b/db/migrate/20251202000001_create_p_ci_job_infos.rb
@@ -15,6 +15,7 @@ def change
       t.bigint :project_id, null: false
       t.datetime_with_timezone :created_at, null: false
       t.integer :scheduling_type, limit: 2, null: false
+      t.integer :source, limit: 2
       t.binary :checksum, null: false
       t.tsvector :search_vector, as: "to_tsvector('english'::regconfig, COALESCE(name, ''::text))", stored: true
       t.text :name, limit: 255, null: false
@@ -22,9 +23,13 @@ def change
 
       t.index [:project_id, :checksum, :partition_id], unique: true,
         name: :index_p_ci_job_infos_on_project_id_and_checksum
+      # TODO: Check what index is best to support Ci::Pipeline#uses_needs? query
       t.index :id,
         where: '(scheduling_type = 1)',
         name: :index_p_ci_job_infos_on_id_where_scheduling_type_dag
+      # TODO: Check what index is best to support Ci::BuildSourceFinder query
+      t.index [:project_id, :source, :id],
+        name: :index_p_ci_job_infos_on_project_id_source_id
       t.index [:search_vector], using: :gin,
         name: :index_p_ci_job_infos_on_search_vector
     end
diff --git a/db/structure.sql b/db/structure.sql
index 1a415246471d83..9288570d855b1c 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5801,6 +5801,7 @@ CREATE TABLE p_ci_job_infos (
     project_id bigint NOT NULL,
     created_at timestamp with time zone NOT NULL,
     scheduling_type smallint NOT NULL,
+    source smallint,
     checksum bytea NOT NULL,
     search_vector tsvector GENERATED ALWAYS AS (to_tsvector('english'::regconfig, COALESCE(name, ''::text))) STORED,
     name text NOT NULL,
@@ -43382,6 +43383,8 @@ CREATE INDEX index_p_ci_job_infos_on_id_where_scheduling_type_dag ON ONLY p_ci_j
 
 CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
 
+CREATE INDEX index_p_ci_job_infos_on_project_id_source_id ON ONLY p_ci_job_infos USING btree (project_id, source, id);
+
 CREATE INDEX index_p_ci_job_infos_on_search_vector ON ONLY p_ci_job_infos USING gin (search_vector);
 
 CREATE UNIQUE INDEX index_p_ci_job_inputs_on_job_id_and_name ON ONLY p_ci_job_inputs USING btree (job_id, name, partition_id);
-- 
GitLab


From 5b72d91d517afde84857eaa88d8d2b4c4a8f3a96 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Thu, 11 Dec 2025 09:47:06 -0800
Subject: [PATCH 24/27] Start moving ci_build_sources data into ci_job_infos
 WIP

WIP code to move ci_build_sources data
into ci_job_infos.
---
 app/models/ci/job_info.rb                     | 86 +++++++++++--------
 app/models/ci/processable.rb                  |  6 +-
 app/models/commit_status.rb                   |  2 +-
 app/services/ci/clone_job_service.rb          |  2 +-
 .../ci/pipeline/chain/set_build_sources.rb    |  9 +-
 spec/factories/ci/builds.rb                   |  6 +-
 spec/factories/ci/processable.rb              | 15 ++--
 .../support/helpers/ci/job_factory_helpers.rb | 19 ----
 spec/support/helpers/ci/job_helpers.rb        | 13 +--
 9 files changed, 83 insertions(+), 75 deletions(-)

diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 64fbe6623372e4..c87f49c2036765 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -23,7 +23,7 @@ class JobInfo < Ci::ApplicationRecord
       :source,
       :name
     ].freeze
-    ALL_ATTRIBUTES = CONFIG_ATTRIBUTES + NORMALIZED_DATA_COLUMNS
+    ALL_JOB_ATTRIBUTES = CONFIG_ATTRIBUTES + NORMALIZED_DATA_COLUMNS
 
     # We're copying over these values to ci_job_infos but not removing them from their original/initial destinations
     COPY_ONLY_ATTRIBUTES = [:name, :needs_attributes].freeze
@@ -44,64 +44,82 @@ class JobInfo < Ci::ApplicationRecord
     attribute :config, ::Gitlab::Database::Type::SymbolizedJsonb.new
 
     enum :scheduling_type, { stage: 0, dag: 1 }, prefix: true
+    enum :source, {
+      scan_execution_policy: 1001,
+      pipeline_execution_policy: 1002
+    }.merge(::Enums::Ci::Pipeline.sources)
 
     scope :for_project, ->(project_id) { where(project_id: project_id) }
     scope :for_checksum, ->(checksum) { where(checksum: checksum) }
 
-    def self.fabricate(attrs:, project_id:, partition_id:)
-      sanitized_attrs = normalize_and_sanitize(attrs)
-      transformed_attrs = transform(sanitized_attrs)
+    def self.fabricate(job_attrs:, project_id:, partition_id:)
+      new(
+        project_id: project_id,
+        partition_id: partition_id,
+        created_at: Time.current
+      ).mutate(job_attrs)
+    end
+
+    def mutate(new_job_attrs)
+      raise 'Cannot mutate persisted job_info record.' if readonly?
+
+      updated_job_attrs = all_job_attributes.compact.merge(new_job_attrs)
+
+      assign_attributes(**prepare_job_attributes_and_checksum(updated_job_attrs))
+      self
+    end
+
+    # Hash containing all attributes: config + normalized_data
+    # TODO: We should do this for Ci::JobDefinition and update Ci::JobHelpers#stub_ci_job_definition
+    # to merge all_job_attributes instead of just config.
+    def all_job_attributes
+      attributes.deep_symbolize_keys.slice(*ALL_JOB_ATTRIBUTES).merge(config)
+    end
+
+    def readonly?
+      persisted?
+    end
+
+    private
+
+    def prepare_job_attributes_and_checksum(job_attrs)
+      sanitized_job_attrs = normalize_and_sanitize(job_attrs)
+      transformed_job_attrs = transform(sanitized_job_attrs)
 
       # NOTE: Checksum is generated with all attributes including normalized columns. But when storing
       # the data, we can save space by excluding the normalized column values from the config hash.
-      attrs = {
-        project_id: project_id,
-        partition_id: partition_id,
-        config: transformed_attrs.except(*NORMALIZED_DATA_COLUMNS),
-        checksum: generate_checksum(transformed_attrs),
-        created_at: Time.current,
-        **transformed_attrs.slice(*NORMALIZED_DATA_COLUMNS)
+      {
+        checksum: generate_checksum(transformed_job_attrs),
+        config: transformed_job_attrs.except(*NORMALIZED_DATA_COLUMNS),
+        **transformed_job_attrs.slice(*NORMALIZED_DATA_COLUMNS)
       }
-
-      new(attrs)
     end
 
-    def self.normalize_and_sanitize(attrs)
-      data = attrs.deep_symbolize_keys
+    def normalize_and_sanitize(job_attrs)
+      data = job_attrs.deep_symbolize_keys
 
       NORMALIZED_DATA_COLUMNS.each do |col|
-        data[col] = data.fetch(col) { column_defaults[col.to_s] }
+        data[col] = data.fetch(col) { self.class.column_defaults[col.to_s] }
       end
 
-      data.slice(*ALL_ATTRIBUTES)
+      data.slice(*ALL_JOB_ATTRIBUTES)
     end
 
-    def self.transform(attrs)
-      return attrs unless attrs.key?(:needs_attributes)
+    def transform(job_attrs)
+      return job_attrs unless job_attrs.key?(:needs_attributes)
 
       # For needs, we only need to store the names for the pipeline UI graph
-      attrs[:needs_attributes] = attrs[:needs_attributes].map do |need_hash|
+      job_attrs[:needs_attributes] = job_attrs[:needs_attributes].map do |need_hash|
         need_hash.slice(*::Gitlab::Ci::JobNeeds::Collection::INTRINSIC_ATTRIBUTES)
       end
 
-      attrs
+      job_attrs
     end
 
-    def self.generate_checksum(attrs)
-      attrs
+    def generate_checksum(job_attrs)
+      job_attrs
         .then { |data| Gitlab::Json.dump(data) }
         .then { |data| Digest::SHA256.hexdigest(data) }
     end
-
-    def readonly?
-      persisted?
-    end
-
-    # Hash containing all attributes: config + normalized_data
-    # TODO: We should do this for Ci::JobDefinition and update Ci::JobHelpers#stub_ci_job_definition
-    # to merge all_attributes instead of just config.
-    def all_attributes
-      attributes.deep_symbolize_keys.slice(*ALL_ATTRIBUTES).merge(config)
-    end
   end
 end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index ea4df95db06d3d..05912bf5739fd0 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -162,7 +162,7 @@ class Processable < ::CommitStatus
 
     def self.fabricate(attrs)
       attrs = attrs.dup
-      info_attrs = attrs.slice(*Ci::JobInfo::ALL_ATTRIBUTES)
+      info_attrs = attrs.slice(*Ci::JobInfo::ALL_JOB_ATTRIBUTES)
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
 
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
@@ -182,7 +182,7 @@ def self.fabricate(attrs)
       attrs.delete(:needs_attributes) if Feature.enabled?(:stop_writing_to_ci_build_needs, attrs[:project])
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-        attrs.delete(*[Ci::JobInfo::ALL_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
+        attrs.delete(*[Ci::JobInfo::ALL_JOB_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
       end
 
       new(attrs).tap do |job|
@@ -197,7 +197,7 @@ def self.fabricate(attrs)
         next unless Feature.enabled?(:write_to_ci_job_infos, attrs[:project])
 
         job_info = ::Ci::JobInfo.fabricate(
-          attrs: info_attrs,
+          job_attrs: info_attrs,
           project_id: job.project_id,
           partition_id: job.partition_id
         )
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 732a0ffc76d343..102bf01c905c6b 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -35,7 +35,7 @@ class CommitStatus < Ci::ApplicationRecord
     inverse_of: :statuses
 
   # NOTE: We need to have these relationships in CommitStatus because generic
-  # commit statuses also use the columns in `Ci::JobInfo::ALL_ATTRIBUTES`.
+  # commit statuses also use the columns in `Ci::JobInfo::ALL_JOB_ATTRIBUTES`.
   has_one :job_info_instance, ->(job) { in_partition(job) },
     class_name: 'Ci::JobInfoInstance',
     foreign_key: :job_id,
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 6dfbb31b55e6db..933e2846e7efc8 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -119,7 +119,7 @@ def add_new_job_info_attributes!(attributes)
 
     def find_or_create_job_info
       info = ::Ci::JobInfo.fabricate(
-        attrs: build_info_attributes,
+        job_attrs: build_info_attributes,
         project_id: project_id,
         partition_id: partition_id
       )
diff --git a/lib/gitlab/ci/pipeline/chain/set_build_sources.rb b/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
index 78ec7da0500e22..212a7af0c55668 100644
--- a/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
+++ b/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
@@ -16,8 +16,13 @@ def perform!
                                  pipeline.source
                                end
 
-                build.build_build_source(source: build_source,
-                  project_id: project.id)
+                # RESUME POC HERE...
+                if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, project)
+                  build.build_build_source(source: build_source,
+                    project_id: project.id)
+                end
+
+                build.temp_job_info.mutate(source: build_source) if Feature.enabled?(:write_to_ci_job_infos, project)
               end
             end
           end
diff --git a/spec/factories/ci/builds.rb b/spec/factories/ci/builds.rb
index e5e15c942d27ec..6340c7618f1ff6 100644
--- a/spec/factories/ci/builds.rb
+++ b/spec/factories/ci/builds.rb
@@ -108,10 +108,8 @@
 
       after(:build) do |build, evaluator|
         if Feature.enabled?(:write_to_ci_job_infos, build.project)
-          Ci::JobFactoryHelpers.mutate_temp_job_info(
-            build,
-            needs_attributes: [{ name: evaluator.needed.name }]
-          )
+          processable.temp_job_info.mutate(needs_attributes: [{ name: evaluator.needed.name }])
+          processable.temp_job_info.validate!
         end
 
         if Feature.enabled?(:write_needs_to_ci_job_definitions, build.project)
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index 34ed9e0284df17..f41812dda8ddac 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -34,12 +34,17 @@
       end
 
       if Feature.enabled?(:write_to_ci_job_infos, processable.project)
-        Ci::JobFactoryHelpers.mutate_temp_job_info(
-          processable,
-          scheduling_type: evaluator.scheduling_type,
-          name: processable.name,
-          needs_attributes: evaluator.needs_attributes.to_a
+        processable.temp_job_info = ::Ci::JobInfo.fabricate(
+          project_id: processable.project_id,
+          partition_id: processable.partition_id,
+          job_attrs: {
+            scheduling_type: evaluator.scheduling_type,
+            name: processable.name,
+            needs_attributes: evaluator.needs_attributes.to_a
+          }
         )
+
+        processable.temp_job_info.validate!
       end
 
       if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, processable.project)
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index b0436e4f6754d6..8b948e7e0992eb 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -20,24 +20,5 @@ def self.mutate_temp_job_definition(job, **new_config)
 
       job.temp_job_definition = new_temp_job_definition
     end
-
-    # TODO: Maybe we can combine this with mutate_temp_job_definition and call it `mutate_temp_job_config`?
-    def self.mutate_temp_job_info(job, **new_attrs)
-      # Deep merge is required because job info changes are meant to be cumulative within factories
-      updated_attrs = (job.temp_job_info&.all_attributes || {}).deep_merge(new_attrs)
-
-      new_temp_job_info = ::Ci::JobInfo.fabricate(
-        attrs: updated_attrs,
-        project_id: job.pipeline.project.id,
-        partition_id: job.pipeline.partition_id
-      )
-
-      new_temp_job_info.validate
-      # TODO: Update this to raise on other column validation errors too
-      config_errors = new_temp_job_info.errors[:config]
-      raise ActiveRecord::RecordInvalid, config_errors.join(', ') if config_errors.any?
-
-      job.temp_job_info = new_temp_job_info
-    end
   end
 end
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index e46f126613d944..067573c7273c46 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -30,21 +30,22 @@ def stub_ci_job_definition(job, **new_config)
     end
 
     # TODO: Maybe we can combine this with stub_ci_job_definition and call it `stub_ci_job_attrs`?
-    def stub_ci_job_info(job, **new_attrs)
-      new_attrs.symbolize_keys!
-      unknown_keys = new_attrs.keys - Ci::JobInfo::ALL_ATTRIBUTES
+    def stub_ci_job_info(job, **new_job_attrs)
+      new_job_attrs.symbolize_keys!
+      unknown_keys = new_job_attrs.keys - Ci::JobInfo::ALL_JOB_ATTRIBUTES
 
       if unknown_keys.any?
         raise ArgumentError,
           "You can only stub valid job info attributes. Invalid key(s): #{unknown_keys.join(', ')}. " \
-            "Allowed: #{Ci::JobInfo::ALL_ATTRIBUTES.join(', ')}"
+            "Allowed: #{Ci::JobInfo::ALL_JOB_ATTRIBUTES.join(', ')}"
       end
 
       # We use regular merge (not deep_merge) to completely overwrite existing attributes
-      updated_attrs = (job.job_info&.all_attributes || job.temp_job_info&.all_attributes || {}).merge(new_attrs)
+      updated_job_attrs = (job.job_info&.all_job_attributes || job.temp_job_info&.all_job_attributes || {})
+                            .merge(new_job_attrs)
 
       new_job_info = ::Ci::JobInfo.fabricate(
-        attrs: updated_attrs,
+        job_attrs: updated_job_attrs,
         project_id: job.pipeline.project.id,
         partition_id: job.pipeline.partition_id
       )
-- 
GitLab


From b41baaba5d1f6cb841d3e7b9632ec69758a78ebc Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 12 Dec 2025 14:35:38 -0800
Subject: [PATCH 25/27] Add TODO issue links for removing unused
 scopes/associations

Add TODO issue links for removing unused scopes/associations
---
 app/models/ci/pipeline.rb             | 15 +++++++++++----
 app/models/ci/processable.rb          | 10 ++++------
 app/models/commit_status.rb           |  9 ---------
 app/models/concerns/ci/metadatable.rb |  1 +
 4 files changed, 16 insertions(+), 19 deletions(-)

diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index 42eec2550c8713..08582d115d9c04 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -106,7 +106,7 @@ class Pipeline < Ci::ApplicationRecord
     # DEPRECATED:
     has_many :statuses, ->(pipeline) { in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :processables, ->(pipeline) { in_partition(pipeline) }, class_name: 'Ci::Processable', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
-    # TODO: We can remove this association; it's unused.
+    # TODO: We can probably remove this association: https://gitlab.com/gitlab-org/gitlab/-/issues/584000
     has_many :latest_statuses_ordered_by_stage, ->(pipeline) { latest.in_partition(pipeline).order(:stage_idx, :stage) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :latest_statuses, ->(pipeline) { latest.in_partition(pipeline) }, class_name: 'CommitStatus', foreign_key: :commit_id, inverse_of: :pipeline, partition_foreign_key: :partition_id
     has_many :statuses_order_id_desc, ->(pipeline) { in_partition(pipeline).order_id_desc }, class_name: 'CommitStatus', foreign_key: :commit_id,
@@ -730,6 +730,14 @@ def read_needs_from_job_definitions?
       processables.first&.read_needs_from_job_definition?
     end
 
+    # TODO: Remove this method after migrating data to ci_job_infos
+    def read_from_job_infos?
+      # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
+      # have job_info records. So we just need to check one job if it has job_info.
+      # We check the oldest job in the pipeline since recent retries could create a new job_info record when cloning.
+      processables.first&.read_from_job_info?
+    end
+
     def ci_pipeline_statuses_rate_limited?
       Gitlab::ApplicationRateLimiter.throttled?(
         :ci_pipeline_statuses_subscription,
@@ -749,7 +757,7 @@ def trigger_status_change_subscriptions
 
     def uses_needs?
       # TODO: Check if should keep index_p_ci_job_infos_on_id_where_scheduling_type_dag or a different index
-      if processables.read_from_job_infos?
+      if read_from_job_infos?
         processables
           .joins(:job_info)
           .where(p_ci_job_infos: { scheduling_type: :dag })
@@ -1601,8 +1609,7 @@ def source_ref_path
 
     # Set scheduling type of processables if they were created before scheduling_type
     # data was deployed (https://gitlab.com/gitlab-org/gitlab/-/merge_requests/22246).
-    # TODO: We probably don't need this method anymore.
-    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
+    # # TODO: We can probably remove this method: https://gitlab.com/gitlab-org/gitlab/-/issues/583998
     def ensure_scheduling_type!
       processables.populate_scheduling_type!
     end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 05912bf5739fd0..9a95f94c76ee18 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -64,14 +64,14 @@ class Processable < ::CommitStatus
     scope :preload_job_definitions, -> { preload(:job_definition) }
     scope :manual_actions, -> { where(when: :manual, status: COMPLETED_STATUSES + %i[manual]) }
 
-    # TODO: We can probably remove this scope; it's not used anywhere.
+    # TODO: We can probably remove this scope: https://gitlab.com/gitlab-org/gitlab/-/issues/584000
     scope :with_needs, ->(names = nil) do
       needs = Ci::BuildNeed.scoped_build.select(1)
       needs = needs.where(name: names) if names
       where('EXISTS (?)', needs)
     end
 
-    # TODO: We can probably remove this scope; it's not used anywhere.
+    # TODO: We can probably remove this scope: https://gitlab.com/gitlab-org/gitlab/-/issues/584000
     scope :without_needs, ->(names = nil) do
       needs = Ci::BuildNeed.scoped_build.select(1)
       needs = needs.where(name: names) if names
@@ -220,8 +220,7 @@ def self.select_with_aggregated_needs(project)
 
     # Old processables may have scheduling_type as nil,
     # so we need to ensure the data exists before using it.
-    # TODO: We probably don't need this method anymore.
-    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
+    # TODO: We can probably remove this method: https://gitlab.com/gitlab-org/gitlab/-/issues/583998
     def self.populate_scheduling_type!
       needs = Ci::BuildNeed.scoped_build.select(1)
       where(scheduling_type: nil).update_all(
@@ -319,8 +318,7 @@ def needs_attributes
       end
     end
 
-    # TODO: We probably don't need this method anymore.
-    # See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540#note_2878147697.
+    # TODO: We can probably remove this method: https://gitlab.com/gitlab-org/gitlab/-/issues/583998
     def ensure_scheduling_type!
       # If this has a scheduling_type, it means all processables in the pipeline already have.
       return if scheduling_type
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 102bf01c905c6b..862ed31f6987fc 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -280,15 +280,6 @@ def self.locking_enabled?
     false
   end
 
-  # TODO: Remove this method after scheduling_type data migrated to ci_job_infos
-  # This method should only be used on a single pipeline's processables.
-  def self.read_from_job_infos?
-    # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
-    # have job_info records. So we just need to check one job if it has job_info.
-    # We check the oldest job in the pipeline since recent retries would create a new job_info record when cloning.
-    first&.read_from_job_info?
-  end
-
   def locking_enabled?
     will_save_change_to_status?
   end
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 2bd48b8fa8ee86..59d77329d3da10 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -253,6 +253,7 @@ def read_needs_from_job_definition?
     end
     strong_memoize_attr :read_needs_from_job_definition?
 
+    # TODO: Remove this method after migrating data to ci_job_infos
     def read_from_job_info?
       Feature.enabled?(:read_from_ci_job_infos, project) && job_info.present?
     end
-- 
GitLab


From ee9f33c3332712f42a7c752775eadfee5fb17af5 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 12 Dec 2025 18:05:27 -0800
Subject: [PATCH 26/27] Revert back to using ci_builds.job_info_id instead of
 assoc table

Go back to using ci_builds.job_info_id instead of
having the association table ci_job_info_instances.
---
 app/finders/ci/build_name_finder.rb           | 15 +++-----
 app/models/ci/job_info.rb                     | 16 ++++----
 app/models/ci/job_info_instance.rb            | 35 ------------------
 app/models/ci/processable.rb                  |  4 +-
 app/models/commit_status.rb                   | 23 +++---------
 .../concerns/ci/partitionable/testing.rb      |  1 -
 app/models/project.rb                         |  1 -
 app/services/ci/clone_job_service.rb          |  2 +-
 app/services/ci/retry_pipeline_service.rb     |  2 +-
 config/initializers/postgres_partitioning.rb  |  1 -
 ...02000003_create_p_ci_job_info_instances.rb | 19 ----------
 ...eate_p_ci_job_info_instances_partitions.rb | 35 ------------------
 ...> 20251212000001_create_p_ci_job_infos.rb} |  2 +-
 ...00002_create_p_ci_job_infos_partitions.rb} |  2 +-
 ...3_add_job_info_id_column_to_p_ci_builds.rb | 16 ++++++++
 ...add_fk_to_ci_builds_from_info_instances.rb | 37 -------------------
 ...04_add_index_on_p_ci_builds_job_info_id.rb | 22 +++++++++++
 ...0005_add_fk_on_p_ci_builds_job_info_id.rb} | 12 ++++--
 db/schema_migrations/20251202000001           |  1 -
 db/schema_migrations/20251202000002           |  1 -
 db/schema_migrations/20251202000003           |  1 -
 db/schema_migrations/20251202000004           |  1 -
 db/schema_migrations/20251202000005           |  1 -
 db/schema_migrations/20251202000006           |  1 -
 db/schema_migrations/20251212000001           |  1 +
 db/schema_migrations/20251212000002           |  1 +
 db/schema_migrations/20251212000003           |  1 +
 db/schema_migrations/20251212000004           |  1 +
 db/schema_migrations/20251212000005           |  1 +
 db/structure.sql                              | 27 +++-----------
 .../ci/pipeline/create/job_info_builder.rb    |  6 +--
 .../import_export/project/relation_factory.rb |  3 +-
 spec/factories/ci/job_info_instances.rb       |  9 -----
 spec/factories/ci/processable.rb              |  4 +-
 spec/services/ci/clone_job_service_spec.rb    |  2 +-
 spec/support/helpers/ci/job_helpers.rb        |  7 ++--
 36 files changed, 92 insertions(+), 222 deletions(-)
 delete mode 100644 app/models/ci/job_info_instance.rb
 delete mode 100644 db/migrate/20251202000003_create_p_ci_job_info_instances.rb
 delete mode 100644 db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
 rename db/migrate/{20251202000001_create_p_ci_job_infos.rb => 20251212000001_create_p_ci_job_infos.rb} (98%)
 rename db/migrate/{20251202000002_create_p_ci_job_infos_partitions.rb => 20251212000002_create_p_ci_job_infos_partitions.rb} (97%)
 create mode 100644 db/migrate/20251212000003_add_job_info_id_column_to_p_ci_builds.rb
 delete mode 100644 db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
 create mode 100644 db/post_migrate/20251212000004_add_index_on_p_ci_builds_job_info_id.rb
 rename db/post_migrate/{20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb => 20251212000005_add_fk_on_p_ci_builds_job_info_id.rb} (63%)
 delete mode 100644 db/schema_migrations/20251202000001
 delete mode 100644 db/schema_migrations/20251202000002
 delete mode 100644 db/schema_migrations/20251202000003
 delete mode 100644 db/schema_migrations/20251202000004
 delete mode 100644 db/schema_migrations/20251202000005
 delete mode 100644 db/schema_migrations/20251202000006
 create mode 100644 db/schema_migrations/20251212000001
 create mode 100644 db/schema_migrations/20251212000002
 create mode 100644 db/schema_migrations/20251212000003
 create mode 100644 db/schema_migrations/20251212000004
 create mode 100644 db/schema_migrations/20251212000005
 delete mode 100644 spec/factories/ci/job_info_instances.rb

diff --git a/app/finders/ci/build_name_finder.rb b/app/finders/ci/build_name_finder.rb
index a6bc3a42afec19..93ee91e36be927 100644
--- a/app/finders/ci/build_name_finder.rb
+++ b/app/finders/ci/build_name_finder.rb
@@ -27,31 +27,26 @@ def limited_name_search_terms
     # rubocop: disable CodeReuse/ActiveRecord -- Need specialized queries for database optimizations
     def filter_by_name(build_relation)
       build_name_relation = Ci::BuildName
-        .select(:build_id, :partition_id)
         .where(project_id: project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
       if Feature.disabled?(:read_from_ci_job_infos, project)
-        return build_relation.where("(id, partition_id) IN (?)", build_name_relation)
+        return build_relation.where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
       end
 
       job_info_relation = Ci::JobInfo
-        .select(:id, :partition_id)
-        .for_project(project.id)
+        .where(project_id: project.id)
         .pg_full_text_search_in_model(limited_name_search_terms)
 
-      job_info_instances_relation = Ci::JobInfoInstance
-        .select(:job_id, :partition_id)
-        .where('(job_info_id, partition_id) IN (?)', job_info_relation)
-
+      # NOTE: This query would be much more efficient on ci_job_infos alone.
       # TODO: Evaluate the query performance after we create and write to ci_job_infos. Then we can decide on either:
       # 1. Keep this OR query if performance is not severely impacted.
       # 2. Plan to migrate all existing data to ci_job_infos before we switch reads.
       build_relation
-        .where("(id, partition_id) IN (?)", job_info_instances_relation)
+        .where("(job_info_id, partition_id) IN (?)", job_info_relation.select(:id, :partition_id))
         .or(
           build_relation
-            .where("(id, partition_id) IN (?)", build_name_relation)
+            .where("(id, partition_id) IN (?)", build_name_relation.select(:build_id, :partition_id))
         )
     end
     # rubocop: enable CodeReuse/ActiveRecord
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index c87f49c2036765..2d7f72c7975af1 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -15,7 +15,10 @@ class JobInfo < Ci::ApplicationRecord
     ignore_column :search_vector, remove_never: true # Value is auto-generated by DB; must ignore it for bulk insert
 
     # IMPORTANT: Order of attribute keys is important for the checksum calculation.
-    CONFIG_ATTRIBUTES = [
+    JOB_ATTRIBUTES = [
+      :scheduling_type,
+      :source,
+      :name,
       :needs_attributes
     ].freeze
     NORMALIZED_DATA_COLUMNS = [
@@ -23,7 +26,6 @@ class JobInfo < Ci::ApplicationRecord
       :source,
       :name
     ].freeze
-    ALL_JOB_ATTRIBUTES = CONFIG_ATTRIBUTES + NORMALIZED_DATA_COLUMNS
 
     # We're copying over these values to ci_job_infos but not removing them from their original/initial destinations
     COPY_ONLY_ATTRIBUTES = [:name, :needs_attributes].freeze
@@ -63,7 +65,7 @@ def self.fabricate(job_attrs:, project_id:, partition_id:)
     def mutate(new_job_attrs)
       raise 'Cannot mutate persisted job_info record.' if readonly?
 
-      updated_job_attrs = all_job_attributes.compact.merge(new_job_attrs)
+      updated_job_attrs = job_attributes.compact.merge(new_job_attrs)
 
       assign_attributes(**prepare_job_attributes_and_checksum(updated_job_attrs))
       self
@@ -71,9 +73,9 @@ def mutate(new_job_attrs)
 
     # Hash containing all attributes: config + normalized_data
     # TODO: We should do this for Ci::JobDefinition and update Ci::JobHelpers#stub_ci_job_definition
-    # to merge all_job_attributes instead of just config.
-    def all_job_attributes
-      attributes.deep_symbolize_keys.slice(*ALL_JOB_ATTRIBUTES).merge(config)
+    # to merge job_attributes instead of just config.
+    def job_attributes
+      attributes.deep_symbolize_keys.slice(*JOB_ATTRIBUTES).merge(config)
     end
 
     def readonly?
@@ -102,7 +104,7 @@ def normalize_and_sanitize(job_attrs)
         data[col] = data.fetch(col) { self.class.column_defaults[col.to_s] }
       end
 
-      data.slice(*ALL_JOB_ATTRIBUTES)
+      data.slice(*JOB_ATTRIBUTES)
     end
 
     def transform(job_attrs)
diff --git a/app/models/ci/job_info_instance.rb b/app/models/ci/job_info_instance.rb
deleted file mode 100644
index 4f9dd3e9003640..00000000000000
--- a/app/models/ci/job_info_instance.rb
+++ /dev/null
@@ -1,35 +0,0 @@
-# frozen_string_literal: true
-
-module Ci
-  class JobInfoInstance < Ci::ApplicationRecord
-    include Ci::Partitionable
-
-    self.table_name = :p_ci_job_info_instances
-    self.primary_key = :job_id
-
-    query_constraints :job_id, :partition_id
-    partitionable scope: :job, partitioned: true
-
-    belongs_to :project
-
-    belongs_to :job, ->(job) { in_partition(job) },
-      class_name: 'CommitStatus',
-      partition_foreign_key: :partition_id,
-      inverse_of: :job_info_instance
-
-    # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
-    belongs_to :job_info, ->(info) { in_partition(info) },
-      class_name: 'Ci::JobInfo',
-      partition_foreign_key: :partition_id
-    # rubocop: enable Rails/InverseOf
-
-    validates :project, presence: true
-    validates :job, presence: true
-    validates :job_info, presence: true
-
-    scope :scoped_job, -> do
-      where(arel_table[:job_id].eq(Ci::Processable.arel_table[:id]))
-      .where(arel_table[:partition_id].eq(Ci::Processable.arel_table[:partition_id]))
-    end
-  end
-end
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index 9a95f94c76ee18..cc9f9ed50f5066 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -162,7 +162,7 @@ class Processable < ::CommitStatus
 
     def self.fabricate(attrs)
       attrs = attrs.dup
-      info_attrs = attrs.slice(*Ci::JobInfo::ALL_JOB_ATTRIBUTES)
+      info_attrs = attrs.slice(*Ci::JobInfo::JOB_ATTRIBUTES)
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
 
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
@@ -182,7 +182,7 @@ def self.fabricate(attrs)
       attrs.delete(:needs_attributes) if Feature.enabled?(:stop_writing_to_ci_build_needs, attrs[:project])
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
-        attrs.delete(*[Ci::JobInfo::ALL_JOB_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
+        attrs.delete(*[Ci::JobInfo::JOB_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
       end
 
       new(attrs).tap do |job|
diff --git a/app/models/commit_status.rb b/app/models/commit_status.rb
index 862ed31f6987fc..1fddb3780e3a7d 100644
--- a/app/models/commit_status.rb
+++ b/app/models/commit_status.rb
@@ -35,23 +35,16 @@ class CommitStatus < Ci::ApplicationRecord
     inverse_of: :statuses
 
   # NOTE: We need to have these relationships in CommitStatus because generic
-  # commit statuses also use the columns in `Ci::JobInfo::ALL_JOB_ATTRIBUTES`.
-  has_one :job_info_instance, ->(job) { in_partition(job) },
-    class_name: 'Ci::JobInfoInstance',
-    foreign_key: :job_id,
-    partition_foreign_key: :partition_id,
-    inverse_of: :job,
-    autosave: true
-  has_one :job_info, ->(job) { in_partition(job) },
+  # commit statuses also use the columns in `Ci::JobInfo::JOB_ATTRIBUTES`.
+  # rubocop: disable Rails/InverseOf -- Relation not present in Ci::JobInfo because foreign key callback is not compatible with BulkInsertSafe
+  belongs_to :job_info,
+    ->(job) { in_partition(job) },
     class_name: 'Ci::JobInfo',
-    foreign_key: :job_id,
-    partition_foreign_key: :partition_id,
-    through: :job_info_instance
+    partition_foreign_key: :partition_id
+  # rubocop: enable Rails/InverseOf
 
   has_many :needs, class_name: 'Ci::BuildNeed', foreign_key: :build_id, inverse_of: :build
 
-  accepts_nested_attributes_for :job_info_instance
-
   attribute :retried, default: false
 
   enum :scheduling_type, { stage: 0, dag: 1 }, prefix: true
@@ -125,10 +118,6 @@ class CommitStatus < Ci::ApplicationRecord
     preload(:job_info)
   end
 
-  scope :with_job_info_instance_preload, -> do
-    preload(:job_info_instance)
-  end
-
   scope :scoped_pipeline, -> do
     where(arel_table[:commit_id].eq(Ci::Pipeline.arel_table[:id]))
     .where(arel_table[:partition_id].eq(Ci::Pipeline.arel_table[:partition_id]))
diff --git a/app/models/concerns/ci/partitionable/testing.rb b/app/models/concerns/ci/partitionable/testing.rb
index 8f59d5115057c3..b5655891b68b96 100644
--- a/app/models/concerns/ci/partitionable/testing.rb
+++ b/app/models/concerns/ci/partitionable/testing.rb
@@ -25,7 +25,6 @@ module Testing
         Ci::JobDefinition
         Ci::JobDefinitionInstance
         Ci::JobInfo
-        Ci::JobInfoInstance
         Ci::JobInput
         Ci::JobMessage
         Ci::JobVariable
diff --git a/app/models/project.rb b/app/models/project.rb
index 7c9319822c0bd4..85e73b8559cef3 100644
--- a/app/models/project.rb
+++ b/app/models/project.rb
@@ -467,7 +467,6 @@ def with_developer_access
   has_many :build_report_results, class_name: 'Ci::BuildReportResult', inverse_of: :project
   has_many :job_artifacts, class_name: 'Ci::JobArtifact', dependent: :restrict_with_error
   has_many :job_infos, class_name: 'Ci::JobInfo', inverse_of: :project
-  has_many :job_info_instances, class_name: 'Ci::JobInfoInstance', inverse_of: :project
   has_many :pipeline_artifacts, class_name: 'Ci::PipelineArtifact', inverse_of: :project, dependent: :restrict_with_error
   has_many :runner_projects, class_name: 'Ci::RunnerProject', inverse_of: :project
   has_many :runners, through: :runner_projects, source: :runner, class_name: 'Ci::Runner'
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 933e2846e7efc8..20c4e5883dc623 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -25,7 +25,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
     attr_reader :job, :current_user
 
     delegate :persisted_environment, :expanded_environment_name,
-      :job_definition_instance, :job_info_instance, :project, :project_id,
+      :job_definition_instance, :project, :project_id,
       :partition_id, :metadata, :pipeline,
       to: :job
 
diff --git a/app/services/ci/retry_pipeline_service.rb b/app/services/ci/retry_pipeline_service.rb
index 5fcd8cf745f3d6..741a0613e811e4 100644
--- a/app/services/ci/retry_pipeline_service.rb
+++ b/app/services/ci/retry_pipeline_service.rb
@@ -44,7 +44,7 @@ def check_access(pipeline)
     private
 
     def builds_relation(pipeline)
-      pipeline.retryable_builds.preload_needs.preload_job_definition_instances.with_job_info_instance_preload
+      pipeline.retryable_builds.preload_needs.preload_job_definition_instances
     end
 
     def can_be_retried?(job)
diff --git a/config/initializers/postgres_partitioning.rb b/config/initializers/postgres_partitioning.rb
index 079e315f02c4d6..83511cf8e58bbb 100644
--- a/config/initializers/postgres_partitioning.rb
+++ b/config/initializers/postgres_partitioning.rb
@@ -32,7 +32,6 @@
       Ci::JobDefinition,
       Ci::JobDefinitionInstance,
       Ci::JobInfo,
-      Ci::JobInfoInstance,
       Ci::JobInput,
       Ci::JobMessage,
       Ci::Pipeline,
diff --git a/db/migrate/20251202000003_create_p_ci_job_info_instances.rb b/db/migrate/20251202000003_create_p_ci_job_info_instances.rb
deleted file mode 100644
index d7403f0819a660..00000000000000
--- a/db/migrate/20251202000003_create_p_ci_job_info_instances.rb
+++ /dev/null
@@ -1,19 +0,0 @@
-# frozen_string_literal: true
-
-class CreatePCiJobInfoInstances < Gitlab::Database::Migration[2.3]
-  milestone '18.7'
-
-  def change
-    opts = {
-      primary_key: [:job_id, :partition_id],
-      options: 'PARTITION BY LIST (partition_id)'
-    }
-
-    create_table(:p_ci_job_info_instances, **opts) do |t|
-      t.bigint :project_id, null: false, index: true
-      t.bigint :partition_id, null: false
-      t.bigint :job_id, null: false
-      t.bigint :job_info_id, null: false, index: true
-    end
-  end
-end
diff --git a/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb b/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
deleted file mode 100644
index 930408c9012840..00000000000000
--- a/db/migrate/20251202000004_create_p_ci_job_info_instances_partitions.rb
+++ /dev/null
@@ -1,35 +0,0 @@
-# frozen_string_literal: true
-
-# TODO: This migration is just to initialize partitions for local gdk. For production, we can
-# remove it and rely on the partition manager to create the necessary partitions instead.
-class CreatePCiJobInfoInstancesPartitions < Gitlab::Database::Migration[2.3]
-  milestone '18.7'
-
-  disable_ddl_transaction!
-
-  def up
-    sql = (100..108).map do |partition_id|
-      <<~SQL
-      CREATE TABLE IF NOT EXISTS gitlab_partitions_dynamic.ci_job_info_instances_#{partition_id}
-        PARTITION OF p_ci_job_info_instances
-        FOR VALUES IN (#{partition_id});
-      SQL
-    end.join
-
-    with_lock_retries do
-      connection.execute(sql)
-    end
-  end
-
-  def down
-    sql = (100..108).map do |partition_id|
-      <<~SQL
-      DROP TABLE IF EXISTS gitlab_partitions_dynamic.ci_job_info_instances_#{partition_id};
-      SQL
-    end.join
-
-    with_lock_retries do
-      connection.execute(sql)
-    end
-  end
-end
diff --git a/db/migrate/20251202000001_create_p_ci_job_infos.rb b/db/migrate/20251212000001_create_p_ci_job_infos.rb
similarity index 98%
rename from db/migrate/20251202000001_create_p_ci_job_infos.rb
rename to db/migrate/20251212000001_create_p_ci_job_infos.rb
index 221b07387b0b8f..fbd8a98abb9063 100644
--- a/db/migrate/20251202000001_create_p_ci_job_infos.rb
+++ b/db/migrate/20251212000001_create_p_ci_job_infos.rb
@@ -1,7 +1,7 @@
 # frozen_string_literal: true
 
 class CreatePCiJobInfos < Gitlab::Database::Migration[2.3]
-  milestone '18.7'
+  milestone '18.8'
 
   def change
     opts = {
diff --git a/db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb b/db/migrate/20251212000002_create_p_ci_job_infos_partitions.rb
similarity index 97%
rename from db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb
rename to db/migrate/20251212000002_create_p_ci_job_infos_partitions.rb
index f41712a185a7db..831a4184b4b215 100644
--- a/db/migrate/20251202000002_create_p_ci_job_infos_partitions.rb
+++ b/db/migrate/20251212000002_create_p_ci_job_infos_partitions.rb
@@ -3,7 +3,7 @@
 # TODO: This migration is just to initialize partitions for local gdk. For production, we can
 # remove it and rely on the partition manager to create the necessary partitions instead.
 class CreatePCiJobInfosPartitions < Gitlab::Database::Migration[2.3]
-  milestone '18.7'
+  milestone '18.8'
 
   disable_ddl_transaction!
 
diff --git a/db/migrate/20251212000003_add_job_info_id_column_to_p_ci_builds.rb b/db/migrate/20251212000003_add_job_info_id_column_to_p_ci_builds.rb
new file mode 100644
index 00000000000000..c99171b752a323
--- /dev/null
+++ b/db/migrate/20251212000003_add_job_info_id_column_to_p_ci_builds.rb
@@ -0,0 +1,16 @@
+# frozen_string_literal: true
+
+class AddJobInfoIdColumnToPCiBuilds < Gitlab::Database::Migration[2.3]
+  milestone '18.8'
+
+  # rubocop:disable Migration/PreventAddingColumns -- Required to deduplicate data into ci_job_infos table
+  def up
+    # NOTE: We can probably keep this column as NULL-able because generic commit statuses may not have a job_info record
+    add_column :p_ci_builds, :job_info_id, :bigint, if_not_exists: true
+  end
+
+  def down
+    remove_column :p_ci_builds, :job_info_id, if_exists: true
+  end
+  # rubocop:enable Migration/PreventAddingColumns
+end
diff --git a/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb b/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
deleted file mode 100644
index 63691e82bfc16f..00000000000000
--- a/db/post_migrate/20251202000006_add_fk_to_ci_builds_from_info_instances.rb
+++ /dev/null
@@ -1,37 +0,0 @@
-# frozen_string_literal: true
-
-class AddFkToCiBuildsFromInfoInstances < Gitlab::Database::Migration[2.3]
-  include Gitlab::Database::PartitioningMigrationHelpers
-
-  milestone '18.7'
-  disable_ddl_transaction!
-
-  SOURCE_TABLE_NAME = :p_ci_job_info_instances
-  TARGET_TABLE_NAME = :p_ci_builds
-  FK_NAME = :fk_rails_089a57086f
-
-  def up
-    # rubocop: disable Migration/PreventForeignKeyCreation -- Necessary for linking ci_job_infos
-    add_concurrent_partitioned_foreign_key(
-      SOURCE_TABLE_NAME, TARGET_TABLE_NAME,
-      column: [:partition_id, :job_id],
-      target_column: [:partition_id, :id],
-      on_update: :cascade,
-      on_delete: :cascade,
-      reverse_lock_order: true,
-      name: FK_NAME
-    )
-    # rubocop: enable Migration/PreventForeignKeyCreation
-  end
-
-  def down
-    with_lock_retries do
-      remove_foreign_key_if_exists(
-        SOURCE_TABLE_NAME,
-        TARGET_TABLE_NAME,
-        reverse_lock_order: true,
-        name: FK_NAME
-      )
-    end
-  end
-end
diff --git a/db/post_migrate/20251212000004_add_index_on_p_ci_builds_job_info_id.rb b/db/post_migrate/20251212000004_add_index_on_p_ci_builds_job_info_id.rb
new file mode 100644
index 00000000000000..618af97ec5af47
--- /dev/null
+++ b/db/post_migrate/20251212000004_add_index_on_p_ci_builds_job_info_id.rb
@@ -0,0 +1,22 @@
+# frozen_string_literal: true
+
+# TODO: This index should first be added asynchronously on Production
+class AddIndexOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
+  include Gitlab::Database::PartitioningMigrationHelpers
+
+  milestone '18.8'
+
+  disable_ddl_transaction!
+
+  PARTITIONED_INDEX_NAME = 'index_p_ci_builds_on_job_info_id'
+
+  # rubocop: disable Migration/PreventIndexCreation -- Required to deduplicate data into ci_job_infos table
+  def up
+    add_concurrent_partitioned_index :p_ci_builds, :job_info_id, name: PARTITIONED_INDEX_NAME
+  end
+
+  def down
+    remove_concurrent_partitioned_index_by_name :p_ci_builds, PARTITIONED_INDEX_NAME
+  end
+  # rubocop: enable Migration/PreventIndexCreation
+end
diff --git a/db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb b/db/post_migrate/20251212000005_add_fk_on_p_ci_builds_job_info_id.rb
similarity index 63%
rename from db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb
rename to db/post_migrate/20251212000005_add_fk_on_p_ci_builds_job_info_id.rb
index 4adb2e64a415fa..bd691b400f9dd7 100644
--- a/db/post_migrate/20251202000005_add_fk_to_ci_job_infos_from_info_instances.rb
+++ b/db/post_migrate/20251212000005_add_fk_on_p_ci_builds_job_info_id.rb
@@ -1,15 +1,18 @@
 # frozen_string_literal: true
 
-class AddFkToCiJobInfosFromInfoInstances < Gitlab::Database::Migration[2.3]
+# TODO: This FK should first be added asynchronously on Production
+class AddFkOnPCiBuildsJobInfoId < Gitlab::Database::Migration[2.3]
   include Gitlab::Database::PartitioningMigrationHelpers
 
-  milestone '18.7'
+  milestone '18.8'
+
   disable_ddl_transaction!
 
-  SOURCE_TABLE_NAME = :p_ci_job_info_instances
+  SOURCE_TABLE_NAME = :p_ci_builds
   TARGET_TABLE_NAME = :p_ci_job_infos
-  FK_NAME = :fk_rails_e414e4e39e
+  FK_NAME = :fk_rails_2f23ec1c61
 
+  # rubocop: disable Migration/PreventForeignKeyCreation -- Required to deduplicate data into ci_job_infos table
   def up
     add_concurrent_partitioned_foreign_key(
       SOURCE_TABLE_NAME, TARGET_TABLE_NAME,
@@ -32,4 +35,5 @@ def down
       )
     end
   end
+  # rubocop: enable Migration/PreventForeignKeyCreation
 end
diff --git a/db/schema_migrations/20251202000001 b/db/schema_migrations/20251202000001
deleted file mode 100644
index 0509012e1c11c9..00000000000000
--- a/db/schema_migrations/20251202000001
+++ /dev/null
@@ -1 +0,0 @@
-faced445914491be2b887c18309fd1effe6df6155d4b2c52fa3a6c81fdeb970d
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000002 b/db/schema_migrations/20251202000002
deleted file mode 100644
index b69b6c3617847e..00000000000000
--- a/db/schema_migrations/20251202000002
+++ /dev/null
@@ -1 +0,0 @@
-0d519552d80a0b3389c488b5cb9327c44f2d246abf951b3b111d949bd071bb86
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000003 b/db/schema_migrations/20251202000003
deleted file mode 100644
index 10728ef363fa63..00000000000000
--- a/db/schema_migrations/20251202000003
+++ /dev/null
@@ -1 +0,0 @@
-436902e31b8aeb833be35c6f3358e2306ae9336deb76ebe03207b3e386139a98
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000004 b/db/schema_migrations/20251202000004
deleted file mode 100644
index 300e2dd62e393e..00000000000000
--- a/db/schema_migrations/20251202000004
+++ /dev/null
@@ -1 +0,0 @@
-3a8658b3381054b65d05ea993344e6164b40b059bbc1490267039167524fafc1
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000005 b/db/schema_migrations/20251202000005
deleted file mode 100644
index f0264852bf3369..00000000000000
--- a/db/schema_migrations/20251202000005
+++ /dev/null
@@ -1 +0,0 @@
-25a25cd891d6dd7d1cb36c3a77a29e1fad9d59a997f42f2c56651052b95d9e03
\ No newline at end of file
diff --git a/db/schema_migrations/20251202000006 b/db/schema_migrations/20251202000006
deleted file mode 100644
index 11e9e1d44ccde5..00000000000000
--- a/db/schema_migrations/20251202000006
+++ /dev/null
@@ -1 +0,0 @@
-b2423358bb78ee5849fe3f12f47ae08827658607b474b22ccb8d5d6bc1a507d4
\ No newline at end of file
diff --git a/db/schema_migrations/20251212000001 b/db/schema_migrations/20251212000001
new file mode 100644
index 00000000000000..a2710e96af29e6
--- /dev/null
+++ b/db/schema_migrations/20251212000001
@@ -0,0 +1 @@
+7c7a8d7fd6b8923dfe0d0c6234bcab0d47066047cab746a7307c81b9c6560d37
\ No newline at end of file
diff --git a/db/schema_migrations/20251212000002 b/db/schema_migrations/20251212000002
new file mode 100644
index 00000000000000..4e9e9f253450c4
--- /dev/null
+++ b/db/schema_migrations/20251212000002
@@ -0,0 +1 @@
+54fcbdf66c4cbf966282f993044dda5668a03956a0be194eb58592a4e03756c6
\ No newline at end of file
diff --git a/db/schema_migrations/20251212000003 b/db/schema_migrations/20251212000003
new file mode 100644
index 00000000000000..cf1e1820080fef
--- /dev/null
+++ b/db/schema_migrations/20251212000003
@@ -0,0 +1 @@
+caf3468d0e6c38a64aa61a9d6e6ecb63aec58a9bd084cd8be96ec6fc7c30bdf0
\ No newline at end of file
diff --git a/db/schema_migrations/20251212000004 b/db/schema_migrations/20251212000004
new file mode 100644
index 00000000000000..272e3ab0914912
--- /dev/null
+++ b/db/schema_migrations/20251212000004
@@ -0,0 +1 @@
+7d3c56c1c6fe9905e6367c821fd53e1c0fdff43c6d5640a58e27fba94d577552
\ No newline at end of file
diff --git a/db/schema_migrations/20251212000005 b/db/schema_migrations/20251212000005
new file mode 100644
index 00000000000000..541e955eabfefb
--- /dev/null
+++ b/db/schema_migrations/20251212000005
@@ -0,0 +1 @@
+fc156af34a793cc57547fad00af6822d4de6f7b0c5abbc72f9b59ee5440d3f80
\ No newline at end of file
diff --git a/db/structure.sql b/db/structure.sql
index 9288570d855b1c..66f0705f8bfd6d 100644
--- a/db/structure.sql
+++ b/db/structure.sql
@@ -5684,6 +5684,7 @@ CREATE TABLE p_ci_builds (
     timeout_source smallint,
     exit_code smallint,
     debug_trace_enabled boolean,
+    job_info_id bigint,
     CONSTRAINT check_1e2fbd1b39 CHECK ((lock_version IS NOT NULL)),
     CONSTRAINT check_9aa9432137 CHECK ((project_id IS NOT NULL))
 )
@@ -5787,14 +5788,6 @@ CREATE TABLE p_ci_job_definitions (
 )
 PARTITION BY LIST (partition_id);
 
-CREATE TABLE p_ci_job_info_instances (
-    project_id bigint NOT NULL,
-    partition_id bigint NOT NULL,
-    job_id bigint NOT NULL,
-    job_info_id bigint NOT NULL
-)
-PARTITION BY LIST (partition_id);
-
 CREATE TABLE p_ci_job_infos (
     id bigint NOT NULL,
     partition_id bigint NOT NULL,
@@ -36393,9 +36386,6 @@ ALTER TABLE ONLY p_ci_job_definition_instances
 ALTER TABLE ONLY p_ci_job_definitions
     ADD CONSTRAINT p_ci_job_definitions_pkey PRIMARY KEY (id, partition_id);
 
-ALTER TABLE ONLY p_ci_job_info_instances
-    ADD CONSTRAINT p_ci_job_info_instances_pkey PRIMARY KEY (job_id, partition_id);
-
 ALTER TABLE ONLY p_ci_job_infos
     ADD CONSTRAINT p_ci_job_infos_pkey PRIMARY KEY (id, partition_id);
 
@@ -43355,6 +43345,8 @@ CREATE INDEX index_p_ci_builds_execution_configs_on_project_id ON ONLY p_ci_buil
 
 CREATE INDEX index_p_ci_builds_on_execution_config_id ON ONLY p_ci_builds USING btree (execution_config_id) WHERE (execution_config_id IS NOT NULL);
 
+CREATE INDEX index_p_ci_builds_on_job_info_id ON ONLY p_ci_builds USING btree (job_info_id);
+
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_finished_at ON ONLY p_ci_finished_build_ch_sync_events USING btree (partition, build_finished_at);
 
 CREATE INDEX index_p_ci_finished_build_ch_sync_events_on_project_id ON ONLY p_ci_finished_build_ch_sync_events USING btree (project_id);
@@ -43375,10 +43367,6 @@ CREATE INDEX index_p_ci_job_definitions_on_interruptible ON ONLY p_ci_job_defini
 
 CREATE UNIQUE INDEX index_p_ci_job_definitions_on_project_id_and_checksum ON ONLY p_ci_job_definitions USING btree (project_id, checksum, partition_id);
 
-CREATE INDEX index_p_ci_job_info_instances_on_job_info_id ON ONLY p_ci_job_info_instances USING btree (job_info_id);
-
-CREATE INDEX index_p_ci_job_info_instances_on_project_id ON ONLY p_ci_job_info_instances USING btree (project_id);
-
 CREATE INDEX index_p_ci_job_infos_on_id_where_scheduling_type_dag ON ONLY p_ci_job_infos USING btree (id) WHERE (scheduling_type = 1);
 
 CREATE UNIQUE INDEX index_p_ci_job_infos_on_project_id_and_checksum ON ONLY p_ci_job_infos USING btree (project_id, checksum, partition_id);
@@ -52603,9 +52591,6 @@ ALTER TABLE ONLY security_policies
 ALTER TABLE ONLY virtual_registries_packages_npm_upstreams
     ADD CONSTRAINT fk_rails_08949a6736 FOREIGN KEY (group_id) REFERENCES namespaces(id) ON DELETE CASCADE;
 
-ALTER TABLE p_ci_job_info_instances
-    ADD CONSTRAINT fk_rails_089a57086f FOREIGN KEY (partition_id, job_id) REFERENCES p_ci_builds(partition_id, id) ON UPDATE CASCADE ON DELETE CASCADE;
-
 ALTER TABLE ONLY subscription_user_add_on_assignment_versions
     ADD CONSTRAINT fk_rails_091e013a61 FOREIGN KEY (organization_id) REFERENCES organizations(id);
 
@@ -52960,6 +52945,9 @@ ALTER TABLE ONLY onboarding_progresses
 ALTER TABLE ONLY protected_branch_unprotect_access_levels
     ADD CONSTRAINT fk_rails_2d2aba21ef FOREIGN KEY (user_id) REFERENCES users(id) ON DELETE CASCADE;
 
+ALTER TABLE p_ci_builds
+    ADD CONSTRAINT fk_rails_2f23ec1c61 FOREIGN KEY (partition_id, job_info_id) REFERENCES p_ci_job_infos(partition_id, id) ON UPDATE RESTRICT ON DELETE RESTRICT;
+
 ALTER TABLE ONLY issuable_severities
     ADD CONSTRAINT fk_rails_2fbb74ad6d FOREIGN KEY (issue_id) REFERENCES issues(id) ON DELETE CASCADE;
 
@@ -54481,9 +54469,6 @@ ALTER TABLE ONLY approval_policy_rules
 ALTER TABLE ONLY work_item_select_field_values
     ADD CONSTRAINT fk_rails_e3ecc2c14e FOREIGN KEY (custom_field_id) REFERENCES custom_fields(id) ON DELETE CASCADE;
 
-ALTER TABLE p_ci_job_info_instances
-    ADD CONSTRAINT fk_rails_e414e4e39e FOREIGN KEY (partition_id, job_info_id) REFERENCES p_ci_job_infos(partition_id, id) ON UPDATE RESTRICT ON DELETE RESTRICT;
-
 ALTER TABLE ONLY vulnerability_occurrence_identifiers
     ADD CONSTRAINT fk_rails_e4ef6d027c FOREIGN KEY (occurrence_id) REFERENCES vulnerability_occurrences(id) ON DELETE CASCADE;
 
diff --git a/lib/gitlab/ci/pipeline/create/job_info_builder.rb b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
index 3328a366e8f719..7ea26b74ea07eb 100644
--- a/lib/gitlab/ci/pipeline/create/job_info_builder.rb
+++ b/lib/gitlab/ci/pipeline/create/job_info_builder.rb
@@ -4,7 +4,7 @@ module Gitlab
   module Ci
     module Pipeline
       module Create
-        # This class mirrors JobDefinitionBuilder.
+        # This class is similar to JobDefinitionBuilder.
         # TODO: Refactor shared code into module or parent class?
         class JobInfoBuilder
           include Gitlab::Utils::StrongMemoize
@@ -18,9 +18,7 @@ def initialize(pipeline, jobs)
           def run
             find_or_insert_job_infos.each do |job_info|
               jobs_by_checksum[job_info.checksum].each do |job|
-                job.build_job_info_instance(
-                  job_info: job_info, partition_id: pipeline.partition_id, project: project
-                )
+                job.job_info = job_info
               end
             end
           end
diff --git a/lib/gitlab/import_export/project/relation_factory.rb b/lib/gitlab/import_export/project/relation_factory.rb
index 6542fe1eeadba6..6e89cae9b1f765 100644
--- a/lib/gitlab/import_export/project/relation_factory.rb
+++ b/lib/gitlab/import_export/project/relation_factory.rb
@@ -46,8 +46,7 @@ class RelationFactory < Base::RelationFactory
                       work_item_description: 'WorkItems::Description',
                       user_contributions: 'User',
                       squash_option: 'Projects::BranchRules::SquashOption',
-                      job_infos: 'Ci::JobInfo',
-                      job_info_instances: 'Ci::JobInfoInstance' }.freeze
+                      job_infos: 'Ci::JobInfo' }.freeze
 
         BUILD_MODELS = %i[Ci::Build Ci::Bridge commit_status generic_commit_status].freeze
 
diff --git a/spec/factories/ci/job_info_instances.rb b/spec/factories/ci/job_info_instances.rb
deleted file mode 100644
index 964d0ee465941f..00000000000000
--- a/spec/factories/ci/job_info_instances.rb
+++ /dev/null
@@ -1,9 +0,0 @@
-# frozen_string_literal: true
-
-FactoryBot.define do
-  factory :ci_job_info_instance, class: 'Ci::JobInfoInstance' do
-    project factory: :project
-    job factory: :ci_build
-    job_info factory: :ci_job_info
-  end
-end
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index f41812dda8ddac..c21061ebaaba02 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -118,8 +118,8 @@
         processable.temp_job_definition = nil
       end
 
-      # job_info_instance is assigned when we run JobInfoBuilder
-      if processable.job_info_instance
+      # job_info_id is assigned when we run JobInfoBuilder
+      if processable.job_info_id
         processable.association(:job_info).reload
         processable.temp_job_info = nil
       end
diff --git a/spec/services/ci/clone_job_service_spec.rb b/spec/services/ci/clone_job_service_spec.rb
index 98bff4e23c0ffd..177972c81c21e6 100644
--- a/spec/services/ci/clone_job_service_spec.rb
+++ b/spec/services/ci/clone_job_service_spec.rb
@@ -97,7 +97,7 @@
         dast_scanner_profiles_build auto_canceled_by_partition_id execution_config_id execution_config
         build_source id_value inputs error_job_messages
         job_definition job_definition_instance job_messages temp_job_definition interruptible
-        job_info job_info_instance temp_job_info].freeze
+        job_info temp_job_info].freeze
     end
 
     before_all do
diff --git a/spec/support/helpers/ci/job_helpers.rb b/spec/support/helpers/ci/job_helpers.rb
index 067573c7273c46..51f464b61aaaf5 100644
--- a/spec/support/helpers/ci/job_helpers.rb
+++ b/spec/support/helpers/ci/job_helpers.rb
@@ -32,17 +32,16 @@ def stub_ci_job_definition(job, **new_config)
     # TODO: Maybe we can combine this with stub_ci_job_definition and call it `stub_ci_job_attrs`?
     def stub_ci_job_info(job, **new_job_attrs)
       new_job_attrs.symbolize_keys!
-      unknown_keys = new_job_attrs.keys - Ci::JobInfo::ALL_JOB_ATTRIBUTES
+      unknown_keys = new_job_attrs.keys - Ci::JobInfo::JOB_ATTRIBUTES
 
       if unknown_keys.any?
         raise ArgumentError,
           "You can only stub valid job info attributes. Invalid key(s): #{unknown_keys.join(', ')}. " \
-            "Allowed: #{Ci::JobInfo::ALL_JOB_ATTRIBUTES.join(', ')}"
+            "Allowed: #{Ci::JobInfo::JOB_ATTRIBUTES.join(', ')}"
       end
 
       # We use regular merge (not deep_merge) to completely overwrite existing attributes
-      updated_job_attrs = (job.job_info&.all_job_attributes || job.temp_job_info&.all_job_attributes || {})
-                            .merge(new_job_attrs)
+      updated_job_attrs = (job.job_info&.job_attributes || job.temp_job_info&.job_attributes || {}).merge(new_job_attrs)
 
       new_job_info = ::Ci::JobInfo.fabricate(
         job_attrs: updated_job_attrs,
-- 
GitLab


From 069cfa3d1863755d3126b60c2e156f669c60e049 Mon Sep 17 00:00:00 2001
From: lma-git <lma@gitlab.com>
Date: Fri, 12 Dec 2025 19:25:43 -0800
Subject: [PATCH 27/27] Descope needs_attributes from job_definitions

Descope needs_attributes from job_definitions
and just put all the needs data into ci_job_infos.
---
 app/graphql/types/ci/job_type.rb              |  2 +-
 app/models/ci/bridge.rb                       |  3 +-
 app/models/ci/build.rb                        |  3 +-
 app/models/ci/build_dependencies.rb           |  2 +-
 app/models/ci/job_definition.rb               |  2 +-
 app/models/ci/job_info.rb                     | 22 ++------
 app/models/ci/pipeline.rb                     |  7 ---
 app/models/ci/processable.rb                  | 22 ++------
 app/models/concerns/ci/metadatable.rb         | 33 ++---------
 app/services/ci/clone_job_service.rb          | 56 ++++++-------------
 .../atomic_processing_service.rb              | 12 +---
 app/services/ci/reset_skipped_jobs_service.rb |  2 +-
 app/services/ci/retry_job_service.rb          |  1 -
 app/services/ci/update_build_names_service.rb |  2 -
 .../ci_job_definition_config.json             |  4 --
 .../read_needs_from_ci_job_definitions.yml    | 10 ----
 .../wip/stop_writing_to_ci_build_needs.yml    | 10 ----
 .../wip/write_needs_to_ci_job_definitions.yml | 10 ----
 config/gitlab_loose_foreign_keys.yml          |  4 --
 db/docs/p_ci_job_info_instances.yml           | 13 -----
 lib/gitlab/ci/job_needs/collection.rb         |  1 -
 .../ci/pipeline/chain/set_build_sources.rb    |  2 +-
 lib/gitlab/ci/processable_object_hierarchy.rb | 23 ++++----
 .../import_export/project/import_export.yml   |  5 +-
 spec/factories/ci/builds.rb                   | 12 +---
 spec/factories/ci/processable.rb              | 22 +++-----
 spec/lib/gitlab/import_export/all_models.yml  |  1 -
 .../ci/create_pipeline_service_spec.rb        |  2 -
 .../atomic_processing_service_spec.rb         |  8 +--
 .../ci/reset_skipped_jobs_service_spec.rb     |  2 +-
 .../support/helpers/ci/job_factory_helpers.rb | 11 ++++
 31 files changed, 78 insertions(+), 231 deletions(-)
 delete mode 100644 config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
 delete mode 100644 config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
 delete mode 100644 config/feature_flags/wip/write_needs_to_ci_job_definitions.yml
 delete mode 100644 db/docs/p_ci_job_info_instances.yml

diff --git a/app/graphql/types/ci/job_type.rb b/app/graphql/types/ci/job_type.rb
index 60c774af9b116d..b3caf00f6f3891 100644
--- a/app/graphql/types/ci/job_type.rb
+++ b/app/graphql/types/ci/job_type.rb
@@ -178,7 +178,7 @@ def trace
 
       def needs
         if object.read_from_job_info?
-          object.intrinsic_job_needs
+          object.job_needs
         else
           object.needs
         end
diff --git a/app/models/ci/bridge.rb b/app/models/ci/bridge.rb
index 04e5d7a3e54058..700a7e4641b101 100644
--- a/app/models/ci/bridge.rb
+++ b/app/models/ci/bridge.rb
@@ -103,7 +103,8 @@ def self.with_preloads
     def self.clone_accessors
       %i[pipeline project ref tag name allow_failure stage_idx
         when environment description needs_attributes
-        scheduling_type ci_stage partition_id resource_group].freeze
+        scheduling_type ci_stage partition_id resource_group
+        job_info_id].freeze
     end
 
     def retryable?
diff --git a/app/models/ci/build.rb b/app/models/ci/build.rb
index 1a430262f32748..a382f1e74a183c 100644
--- a/app/models/ci/build.rb
+++ b/app/models/ci/build.rb
@@ -286,7 +286,8 @@ def clone_accessors
           environment coverage_regex description tag_list protected
           needs_attributes job_variables_attributes resource_group
           scheduling_type timeout timeout_source debug_trace_enabled
-          ci_stage partition_id execution_config_id inputs_attributes].freeze
+          ci_stage partition_id execution_config_id inputs_attributes
+          job_info_id].freeze
       end
 
       def supported_keyset_orderings
diff --git a/app/models/ci/build_dependencies.rb b/app/models/ci/build_dependencies.rb
index 7f358b2aa52258..0ff39580b92e53 100644
--- a/app/models/ci/build_dependencies.rb
+++ b/app/models/ci/build_dependencies.rb
@@ -133,7 +133,7 @@ def from_previous_stages(scope)
     end
 
     def from_needs(scope)
-      needs_names = if processable.read_needs_from_job_definition?
+      needs_names = if processable.read_from_job_info?
                       processable.job_needs.names_with_artifacts_true
                     else
                       processable.needs.artifacts.select(:name)
diff --git a/app/models/ci/job_definition.rb b/app/models/ci/job_definition.rb
index 76a732081ca3b1..b3cc77352aedeb 100644
--- a/app/models/ci/job_definition.rb
+++ b/app/models/ci/job_definition.rb
@@ -22,7 +22,7 @@ class JobDefinition < Ci::ApplicationRecord
       :secrets,
       :interruptible
     ].freeze
-    CONFIG_ATTRIBUTES = (CONFIG_ATTRIBUTES_FROM_METADATA + [:tag_list, :run_steps, :needs_attributes]).freeze
+    CONFIG_ATTRIBUTES = (CONFIG_ATTRIBUTES_FROM_METADATA + [:tag_list, :run_steps]).freeze
     NORMALIZED_DATA_COLUMNS = %i[interruptible].freeze
 
     query_constraints :id, :partition_id
diff --git a/app/models/ci/job_info.rb b/app/models/ci/job_info.rb
index 2d7f72c7975af1..f2070fe1f1a967 100644
--- a/app/models/ci/job_info.rb
+++ b/app/models/ci/job_info.rb
@@ -28,7 +28,7 @@ class JobInfo < Ci::ApplicationRecord
     ].freeze
 
     # We're copying over these values to ci_job_infos but not removing them from their original/initial destinations
-    COPY_ONLY_ATTRIBUTES = [:name, :needs_attributes].freeze
+    COPY_ONLY_ATTRIBUTES = [:name].freeze
 
     MAX_JOB_NAME_LENGTH = 255
 
@@ -72,8 +72,6 @@ def mutate(new_job_attrs)
     end
 
     # Hash containing all attributes: config + normalized_data
-    # TODO: We should do this for Ci::JobDefinition and update Ci::JobHelpers#stub_ci_job_definition
-    # to merge job_attributes instead of just config.
     def job_attributes
       attributes.deep_symbolize_keys.slice(*JOB_ATTRIBUTES).merge(config)
     end
@@ -86,14 +84,13 @@ def readonly?
 
     def prepare_job_attributes_and_checksum(job_attrs)
       sanitized_job_attrs = normalize_and_sanitize(job_attrs)
-      transformed_job_attrs = transform(sanitized_job_attrs)
 
       # NOTE: Checksum is generated with all attributes including normalized columns. But when storing
       # the data, we can save space by excluding the normalized column values from the config hash.
       {
-        checksum: generate_checksum(transformed_job_attrs),
-        config: transformed_job_attrs.except(*NORMALIZED_DATA_COLUMNS),
-        **transformed_job_attrs.slice(*NORMALIZED_DATA_COLUMNS)
+        checksum: generate_checksum(sanitized_job_attrs),
+        config: sanitized_job_attrs.except(*NORMALIZED_DATA_COLUMNS),
+        **sanitized_job_attrs.slice(*NORMALIZED_DATA_COLUMNS)
       }
     end
 
@@ -107,17 +104,6 @@ def normalize_and_sanitize(job_attrs)
       data.slice(*JOB_ATTRIBUTES)
     end
 
-    def transform(job_attrs)
-      return job_attrs unless job_attrs.key?(:needs_attributes)
-
-      # For needs, we only need to store the names for the pipeline UI graph
-      job_attrs[:needs_attributes] = job_attrs[:needs_attributes].map do |need_hash|
-        need_hash.slice(*::Gitlab::Ci::JobNeeds::Collection::INTRINSIC_ATTRIBUTES)
-      end
-
-      job_attrs
-    end
-
     def generate_checksum(job_attrs)
       job_attrs
         .then { |data| Gitlab::Json.dump(data) }
diff --git a/app/models/ci/pipeline.rb b/app/models/ci/pipeline.rb
index 08582d115d9c04..04e0adc84704ca 100644
--- a/app/models/ci/pipeline.rb
+++ b/app/models/ci/pipeline.rb
@@ -723,13 +723,6 @@ def self.internal_id_scope_usage
       :ci_pipelines
     end
 
-    # TODO: Remove this method after migrating ci_build_needs to ci_job_definitions.
-    def read_needs_from_job_definitions?
-      # If a pipeline is created with FF `write_needs_to_ci_job_definitions` enabled, then all its jobs would
-      # have job_definition records with the `needs_attributes` key in the config value. So we just check one job.
-      processables.first&.read_needs_from_job_definition?
-    end
-
     # TODO: Remove this method after migrating data to ci_job_infos
     def read_from_job_infos?
       # If a pipeline is created with FF `write_to_ci_job_infos` enabled, then all its jobs would
diff --git a/app/models/ci/processable.rb b/app/models/ci/processable.rb
index cc9f9ed50f5066..9e74fc733660d9 100644
--- a/app/models/ci/processable.rb
+++ b/app/models/ci/processable.rb
@@ -61,7 +61,6 @@ class Processable < ::CommitStatus
 
     scope :preload_needs, -> { preload(:needs) }
     scope :preload_job_definition_instances, -> { preload(:job_definition_instance) }
-    scope :preload_job_definitions, -> { preload(:job_definition) }
     scope :manual_actions, -> { where(when: :manual, status: COMPLETED_STATUSES + %i[manual]) }
 
     # TODO: We can probably remove this scope: https://gitlab.com/gitlab-org/gitlab/-/issues/584000
@@ -164,22 +163,7 @@ def self.fabricate(attrs)
       attrs = attrs.dup
       info_attrs = attrs.slice(*Ci::JobInfo::JOB_ATTRIBUTES)
       definition_attrs = attrs.extract!(*Ci::JobDefinition::CONFIG_ATTRIBUTES)
-
       attrs[:tag_list] = definition_attrs[:tag_list] if definition_attrs.key?(:tag_list)
-      # TODO: Remove this line with FF `stop_writing_to_ci_build_needs`
-      attrs[:needs_attributes] = definition_attrs[:needs_attributes] if definition_attrs.key?(:needs_attributes)
-
-      if Feature.enabled?(:write_needs_to_ci_job_definitions, attrs[:project])
-        # We always include the needs_attributes key to signal that we've started writing needs to job_definitions.
-        # But this means _all_ job_definitions have to be regenerated. See read_needs_from_job_definitions? for further
-        # context. We either do this or migrate all the data to job_definitions before turning on
-        # FF `read_needs_from_ci_job_definitions`.
-        definition_attrs[:needs_attributes] ||= []
-      else
-        definition_attrs.delete(:needs_attributes)
-      end
-
-      attrs.delete(:needs_attributes) if Feature.enabled?(:stop_writing_to_ci_build_needs, attrs[:project])
 
       if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, attrs[:project])
         attrs.delete(*[Ci::JobInfo::JOB_ATTRIBUTES - Ci::JobInfo::COPY_ONLY_ATTRIBUTES])
@@ -272,7 +256,11 @@ def archived?(...)
     end
 
     def aggregated_needs_names
-      read_attribute(:aggregated_needs_names)
+      if read_from_job_info?
+        job_needs.names
+      else
+        read_attribute(:aggregated_needs_names)
+      end
     end
 
     def schedulable?
diff --git a/app/models/concerns/ci/metadatable.rb b/app/models/concerns/ci/metadatable.rb
index 59d77329d3da10..39378d147ef287 100644
--- a/app/models/concerns/ci/metadatable.rb
+++ b/app/models/concerns/ci/metadatable.rb
@@ -219,24 +219,15 @@ def name=(value)
       write_attribute(:name, value)
     end
 
-    # We only store the needed jobs' names in job_info;
-    # full needs attributes for job processing are stored in job_definition
-    def intrinsic_job_needs
-      needs_attrs = read_job_info_attribute(:needs_attributes, [])
-
-      ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs)
-    end
-    strong_memoize_attr :intrinsic_job_needs
-
     def job_needs
-      needs_attrs = read_job_definition_attribute(:needs_attributes, [])
+      needs_attrs = read_job_info_attribute(:needs_attributes, [])
 
       ::Gitlab::Ci::JobNeeds::Collection.new(self.id, needs_attrs)
     end
     strong_memoize_attr :job_needs
 
     def needs_names
-      if read_needs_from_job_definition?
+      if read_from_job_info?
         job_needs.names
       else
         needs.map(&:name)
@@ -244,14 +235,8 @@ def needs_names
     end
 
     def has_needs?
-      read_needs_from_job_definition? ? job_needs.any? : needs.present?
-    end
-
-    def read_needs_from_job_definition?
-      Feature.enabled?(:read_needs_from_ci_job_definitions, project) &&
-        (job_definition&.config&.key?(:needs_attributes) || temp_job_definition&.config&.key?(:needs_attributes))
+      read_from_ci_job_info? ? job_needs.any? : needs.present?
     end
-    strong_memoize_attr :read_needs_from_job_definition?
 
     # TODO: Remove this method after migrating data to ci_job_infos
     def read_from_job_info?
@@ -265,22 +250,12 @@ def read_metadata_attribute(legacy_key, metadata_key, job_definition_key, defaul
       result = read_attribute(legacy_key) if legacy_key
       return result if result
 
-      result = read_job_definition_attribute(job_definition_key)
+      result = job_definition&.config&.dig(job_definition_key) || temp_job_definition&.config&.dig(job_definition_key)
       return result if result
 
       metadata&.read_attribute(metadata_key) || default_value
     end
 
-    def read_job_definition_attribute(key, default_value = nil)
-      result = if key.in?(::Ci::JobDefinition::NORMALIZED_DATA_COLUMNS)
-                 job_definition&.read_attribute(key) || temp_job_definition&.read_attribute(key)
-               else
-                 job_definition&.config&.dig(key) || temp_job_definition&.config&.dig(key)
-               end
-
-      result || default_value
-    end
-
     def read_job_info_attribute(key, default_value = nil)
       return unless read_from_job_info?
 
diff --git a/app/services/ci/clone_job_service.rb b/app/services/ci/clone_job_service.rb
index 20c4e5883dc623..6df8d55c21f654 100644
--- a/app/services/ci/clone_job_service.rb
+++ b/app/services/ci/clone_job_service.rb
@@ -25,7 +25,7 @@ def execute(new_job_variables: [], new_job_inputs: {})
     attr_reader :job, :current_user
 
     delegate :persisted_environment, :expanded_environment_name,
-      :job_definition_instance, :project, :project_id,
+      :job_definition_instance, :job_info, :project, :project_id,
       :partition_id, :metadata, :pipeline,
       to: :job
 
@@ -91,30 +91,26 @@ def find_or_create_job_definition
       ).execute.first
     end
 
-    def add_job_info_attributes!(attributes)
-      if job_info_instance
-        add_existing_job_info_attributes!(attributes)
-      else
-        add_new_job_info_attributes!(attributes)
-      end
-    end
-
-    def add_existing_job_info_attributes!(attributes)
-      attributes[:job_info_instance_attributes] = {
-        project_id: project_id,
-        job_info_id: job_info_instance.job_info_id,
-        partition_id: job_info_instance.partition_id
+    def build_definition_attributes
+      attrs = {
+        options: metadata.config_options,
+        yaml_variables: metadata.config_variables,
+        id_tokens: metadata.id_tokens,
+        secrets: metadata.secrets,
+        tag_list: job.tag_list.to_a,
+        run_steps: job.try(:execution_config)&.run_steps || []
       }
+
+      attrs[:interruptible] = metadata.interruptible unless metadata.interruptible.nil?
+
+      attrs
     end
 
-    def add_new_job_info_attributes!(attributes)
-      persisted_job_info = find_or_create_job_info
+    def add_job_info_attributes!(attributes)
+      return if job_info
 
-      attributes[:job_info_instance_attributes] = {
-        project: project,
-        job_info: persisted_job_info,
-        partition_id: partition_id
-      }
+      persisted_job_info = find_or_create_job_info
+      attributes[:job_info_id] = persisted_job_info.id
     end
 
     def find_or_create_job_info
@@ -129,26 +125,10 @@ def find_or_create_job_info
       ).execute.first
     end
 
-    def build_definition_attributes
-      attrs = {
-        options: metadata.config_options,
-        yaml_variables: metadata.config_variables,
-        id_tokens: metadata.id_tokens,
-        secrets: metadata.secrets,
-        tag_list: job.tag_list.to_a,
-        run_steps: job.try(:execution_config)&.run_steps || []
-      }
-
-      attrs[:needs_attributes] = job.needs_attributes if Feature.enabled?(:write_needs_to_ci_job_definitions, project)
-
-      attrs[:interruptible] = metadata.interruptible unless metadata.interruptible.nil?
-
-      attrs
-    end
-
     def build_info_attributes
       {
         scheduling_type: job.scheduling_type,
+        source: job.source,
         name: job.name,
         needs_attributes: job.needs_attributes
       }
diff --git a/app/services/ci/pipeline_processing/atomic_processing_service.rb b/app/services/ci/pipeline_processing/atomic_processing_service.rb
index edb4d45f445d27..050bf8a4c1a34e 100644
--- a/app/services/ci/pipeline_processing/atomic_processing_service.rb
+++ b/app/services/ci/pipeline_processing/atomic_processing_service.rb
@@ -93,19 +93,11 @@ def load_jobs(ids)
       def sort_jobs(jobs)
         Gitlab::Ci::YamlProcessor::Dag.order( # rubocop: disable CodeReuse/ActiveRecord -- this is not ActiveRecord
           jobs.to_h do |job|
-            [job.name, aggregated_needs_names(job)]
+            [job.name, job.aggregated_needs_names.to_a]
           end
         )
       end
 
-      def aggregated_needs_names(job)
-        if job.read_needs_from_job_definition?
-          job.job_needs.names
-        else
-          job.aggregated_needs_names.to_a
-        end
-      end
-
       def update_pipeline!
         pipeline.set_status(@collection.status_of_all)
       end
@@ -138,7 +130,7 @@ def update_job!(job)
       def status_of_previous_jobs(job)
         if job.scheduling_type_dag?
           # job uses DAG, get status of all dependent needs
-          @collection.status_of_jobs(aggregated_needs_names(job))
+          @collection.status_of_jobs(job.aggregated_needs_names.to_a)
         else
           # job uses Stages, get status of prior stage
           @collection.status_of_jobs_prior_to_stage(job.stage_idx.to_i)
diff --git a/app/services/ci/reset_skipped_jobs_service.rb b/app/services/ci/reset_skipped_jobs_service.rb
index 3931fa4fdf5fe6..705dd6414c3d8a 100644
--- a/app/services/ci/reset_skipped_jobs_service.rb
+++ b/app/services/ci/reset_skipped_jobs_service.rb
@@ -32,7 +32,7 @@ def dependent_jobs
           .skipped
           .ordered_by_stage
           .preload(:needs)
-          .preload_job_definitions
+          .with_job_info_preload
           .with_project_preload
       )
     end
diff --git a/app/services/ci/retry_job_service.rb b/app/services/ci/retry_job_service.rb
index 4688d9e7ec1e32..a17aeea09d3a10 100644
--- a/app/services/ci/retry_job_service.rb
+++ b/app/services/ci/retry_job_service.rb
@@ -11,7 +11,6 @@ def execute(job, variables: [], inputs: {})
         return processed_inputs if processed_inputs.error?
 
         job.ensure_scheduling_type!
-
         new_job = retry_job(job, variables: variables, inputs: processed_inputs.payload[:inputs])
 
         track_retry_with_new_input_values(processed_inputs.payload[:inputs])
diff --git a/app/services/ci/update_build_names_service.rb b/app/services/ci/update_build_names_service.rb
index 3ed418dbf7678c..356d8af9f0b31b 100644
--- a/app/services/ci/update_build_names_service.rb
+++ b/app/services/ci/update_build_names_service.rb
@@ -2,8 +2,6 @@
 
 module Ci
   class UpdateBuildNamesService
-    include Gitlab::Utils::StrongMemoize
-
     attr_reader :pipeline
 
     def initialize(pipeline)
diff --git a/app/validators/json_schemas/ci_job_definition_config.json b/app/validators/json_schemas/ci_job_definition_config.json
index cc6ad5d4f1e917..68e65ceb22b378 100644
--- a/app/validators/json_schemas/ci_job_definition_config.json
+++ b/app/validators/json_schemas/ci_job_definition_config.json
@@ -10,10 +10,6 @@
     "interruptible": {
       "type": "boolean"
     },
-    "needs_attributes": {
-      "type": "array",
-      "description": "TODO: Add full configuration for needs_attributes"
-    },
     "options": {
       "$ref": "./build_metadata_config_options.json"
     },
diff --git a/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml b/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
deleted file mode 100644
index d9cc16f3017569..00000000000000
--- a/config/feature_flags/wip/read_needs_from_ci_job_definitions.yml
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: read_needs_from_ci_job_definitions
-description:
-feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
-rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-milestone: '18.7'
-group: group::ci platform
-type: wip
-default_enabled: false
diff --git a/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml b/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
deleted file mode 100644
index 5bf20990b79ffd..00000000000000
--- a/config/feature_flags/wip/stop_writing_to_ci_build_needs.yml
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: stop_writing_to_ci_build_needs
-description:
-feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
-rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-milestone: '18.7'
-group: group::ci platform
-type: wip
-default_enabled: false
diff --git a/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml b/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml
deleted file mode 100644
index 27c3b508472113..00000000000000
--- a/config/feature_flags/wip/write_needs_to_ci_job_definitions.yml
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: write_needs_to_ci_job_definitions
-description:
-feature_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
-rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/work_items/565821
-milestone: '18.7'
-group: group::ci platform
-type: wip
-default_enabled: false
diff --git a/config/gitlab_loose_foreign_keys.yml b/config/gitlab_loose_foreign_keys.yml
index 101b1054ecc2b5..5e128df843ac20 100644
--- a/config/gitlab_loose_foreign_keys.yml
+++ b/config/gitlab_loose_foreign_keys.yml
@@ -631,10 +631,6 @@ p_ci_job_definitions:
   - table: projects
     column: project_id
     on_delete: async_delete
-p_ci_job_info_instances:
-  - table: projects
-    column: project_id
-    on_delete: async_delete
 p_ci_job_infos:
   - table: projects
     column: project_id
diff --git a/db/docs/p_ci_job_info_instances.yml b/db/docs/p_ci_job_info_instances.yml
deleted file mode 100644
index 87f4b73d9a9bd2..00000000000000
--- a/db/docs/p_ci_job_info_instances.yml
+++ /dev/null
@@ -1,13 +0,0 @@
----
-table_name: p_ci_job_info_instances
-classes:
-  - Ci::JobInfoInstance
-feature_categories:
-- continuous_integration
-description: Links ci_builds with ci_job_infos
-introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/211540
-milestone: '18.7'
-gitlab_schema: gitlab_ci
-sharding_key:
-  project_id: projects
-table_size: small
diff --git a/lib/gitlab/ci/job_needs/collection.rb b/lib/gitlab/ci/job_needs/collection.rb
index fadc50ed852082..f97be836b5b971 100644
--- a/lib/gitlab/ci/job_needs/collection.rb
+++ b/lib/gitlab/ci/job_needs/collection.rb
@@ -9,7 +9,6 @@ class Collection
         include Enumerable
 
         ATTRIBUTES = [:name, :artifacts, :optional].freeze
-        INTRINSIC_ATTRIBUTES = [:name].freeze
 
         Need = Struct.new(:job_id, *ATTRIBUTES, keyword_init: true) do
           include GlobalID::Identification
diff --git a/lib/gitlab/ci/pipeline/chain/set_build_sources.rb b/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
index 212a7af0c55668..34efc5f887f30c 100644
--- a/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
+++ b/lib/gitlab/ci/pipeline/chain/set_build_sources.rb
@@ -16,7 +16,7 @@ def perform!
                                  pipeline.source
                                end
 
-                # RESUME POC HERE...
+                # IN PROGRESS: ci_build_sources deduplication into ci_job_infos
                 if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, project)
                   build.build_build_source(source: build_source,
                     project_id: project.id)
diff --git a/lib/gitlab/ci/processable_object_hierarchy.rb b/lib/gitlab/ci/processable_object_hierarchy.rb
index 3412fde01eee0b..32572e7939c13f 100644
--- a/lib/gitlab/ci/processable_object_hierarchy.rb
+++ b/lib/gitlab/ci/processable_object_hierarchy.rb
@@ -6,7 +6,7 @@ class ProcessableObjectHierarchy < ::Gitlab::ObjectHierarchy
       include Gitlab::Utils::StrongMemoize
 
       def base_and_descendants
-        return super unless read_needs_from_job_definitions?
+        return super unless read_from_job_infos?
 
         super.with(job_needs_cte.to_arel) # rubocop:disable CodeReuse/ActiveRecord -- Required to include job_needs_cte in query
       end
@@ -14,7 +14,7 @@ def base_and_descendants
       private
 
       def middle_table
-        return ::Ci::BuildNeed.arel_table unless read_needs_from_job_definitions?
+        return ::Ci::BuildNeed.arel_table unless read_from_job_infos?
 
         job_needs_cte.table
       end
@@ -52,7 +52,7 @@ def pipeline
 
       # This processable object hierachy is the main challenge with dropping ci_build_needs.
       # One idea is to recreate the table on-the-fly as a CTE by exploding the
-      # `needs_attributes` value from job definitions.
+      # `needs_attributes` value from job infos.
       #
       # I believe we only need the latest needed jobs of the given pipeline since
       # we shouldn't need to process old jobs or jobs outside of it. So this table would
@@ -66,14 +66,11 @@ def job_needs_cte
             needs_attributes ->> 'name' AS name
           FROM
             p_ci_builds
-            INNER JOIN p_ci_job_definition_instances
-              ON p_ci_builds.id = p_ci_job_definition_instances.job_id
-              AND p_ci_builds.partition_id = p_ci_job_definition_instances.partition_id
-            INNER JOIN p_ci_job_definitions
-              ON p_ci_job_definition_instances.job_definition_id = p_ci_job_definitions.id
-              AND p_ci_job_definition_instances.partition_id = p_ci_job_definitions.partition_id
+            INNER JOIN p_ci_job_infos
+              ON p_ci_builds.job_info_id = p_ci_job_infos.id
+              AND p_ci_builds.partition_id = p_ci_job_infos.partition_id
           CROSS JOIN LATERAL
-            jsonb_array_elements(p_ci_job_definitions.config->'needs_attributes') AS needs_attributes
+            jsonb_array_elements(p_ci_job_infos.config->'needs_attributes') AS needs_attributes
           WHERE
             p_ci_builds.partition_id = #{pipeline.partition_id}
             AND p_ci_builds.id IN (#{pipeline.processables.latest.select(:id).to_sql})
@@ -82,10 +79,10 @@ def job_needs_cte
         Gitlab::SQL::CTE.new(:job_needs, sql)
       end
 
-      def read_needs_from_job_definitions?
-        pipeline.read_needs_from_job_definitions?
+      def read_from_job_infos?
+        pipeline.read_from_job_infos?
       end
-      strong_memoize_attr :read_needs_from_job_definitions?
+      strong_memoize_attr :read_from_job_infos?
     end
   end
 end
diff --git a/lib/gitlab/import_export/project/import_export.yml b/lib/gitlab/import_export/project/import_export.yml
index a6ae67ef1992d5..11940bc8cf4b4e 100644
--- a/lib/gitlab/import_export/project/import_export.yml
+++ b/lib/gitlab/import_export/project/import_export.yml
@@ -107,8 +107,7 @@ tree:
       - :external_pull_request
       - :merge_request
       - :pipeline_metadata
-    - :job_infos # TODO: I think these tables are necessary to export?
-    - :job_info_instances  # TODO: Need to confirm correct way to export job_info_instances in this yaml
+    - :job_infos # TODO: I think this table is necessary to export?
     - :auto_devops
     - :pipeline_schedules
     - :container_expiration_policy
@@ -605,8 +604,6 @@ included_attributes:
     - :scheduling_type
     - :name
     - :config
-  job_info_instances:
-    - :project_id
   ci_pipelines:
     - :ref
     - :sha
diff --git a/spec/factories/ci/builds.rb b/spec/factories/ci/builds.rb
index 6340c7618f1ff6..454cbc9258b71f 100644
--- a/spec/factories/ci/builds.rb
+++ b/spec/factories/ci/builds.rb
@@ -108,20 +108,12 @@
 
       after(:build) do |build, evaluator|
         if Feature.enabled?(:write_to_ci_job_infos, build.project)
-          processable.temp_job_info.mutate(needs_attributes: [{ name: evaluator.needed.name }])
-          processable.temp_job_info.validate!
-        end
-
-        if Feature.enabled?(:write_needs_to_ci_job_definitions, build.project)
-          Ci::JobFactoryHelpers.mutate_temp_job_definition(
-            build,
-            needs_attributes: [{ name: evaluator.needed.name }]
-          )
+          Ci::JobFactoryHelpers.mutate_temp_job_info(build, needs_attributes: [{ name: evaluator.needed.name }])
         end
       end
 
       after(:create) do |build, evaluator|
-        next if Feature.enabled?(:stop_writing_to_ci_build_needs, build.project)
+        next if Feature.enabled?(:stop_writing_ci_job_info_to_old_destinations, build.project)
 
         build.needs << create(:ci_build_need, build: build, name: evaluator.needed.name)
       end
diff --git a/spec/factories/ci/processable.rb b/spec/factories/ci/processable.rb
index c21061ebaaba02..d7a379a0a6d135 100644
--- a/spec/factories/ci/processable.rb
+++ b/spec/factories/ci/processable.rb
@@ -29,27 +29,19 @@
       Ci::JobFactoryHelpers.mutate_temp_job_definition(
         processable, options: evaluator.options, yaml_variables: evaluator.yaml_variables)
 
-      if Feature.enabled?(:write_needs_to_ci_job_definitions, processable.project)
-        Ci::JobFactoryHelpers.mutate_temp_job_definition(processable, needs_attributes: evaluator.needs_attributes.to_a)
-      end
-
       if Feature.enabled?(:write_to_ci_job_infos, processable.project)
-        processable.temp_job_info = ::Ci::JobInfo.fabricate(
-          project_id: processable.project_id,
-          partition_id: processable.partition_id,
-          job_attrs: {
-            scheduling_type: evaluator.scheduling_type,
-            name: processable.name,
-            needs_attributes: evaluator.needs_attributes.to_a
-          }
+        Ci::JobFactoryHelpers.mutate_temp_job_info(
+          processable,
+          scheduling_type: evaluator.scheduling_type,
+          name: processable.name,
+          needs_attributes: evaluator.needs_attributes.to_a
         )
-
-        processable.temp_job_info.validate!
       end
 
       if Feature.disabled?(:stop_writing_ci_job_info_to_old_destinations, processable.project)
         processable.assign_attributes(
-          scheduling_type: evaluator.scheduling_type
+          scheduling_type: evaluator.scheduling_type,
+          needs_attributes: evaluator.needs_attributes
         )
       end
     end
diff --git a/spec/lib/gitlab/import_export/all_models.yml b/spec/lib/gitlab/import_export/all_models.yml
index 8e5dcb752b51b1..5246a34b3fe937 100644
--- a/spec/lib/gitlab/import_export/all_models.yml
+++ b/spec/lib/gitlab/import_export/all_models.yml
@@ -996,7 +996,6 @@ project:
 - enabled_foundational_flows
 - enabled_foundational_flow_records
 - job_infos
-- job_info_instances
 award_emoji:
 - awardable
 - user
diff --git a/spec/services/ci/create_pipeline_service_spec.rb b/spec/services/ci/create_pipeline_service_spec.rb
index e01014d1a3ae75..7ff0651d5e9f5b 100644
--- a/spec/services/ci/create_pipeline_service_spec.rb
+++ b/spec/services/ci/create_pipeline_service_spec.rb
@@ -1690,8 +1690,6 @@ def previous_commit_sha_from_ref(ref)
         end
 
         it 'bulk inserts all needs' do
-          stub_feature_flags(stop_writing_to_ci_build_needs: false)
-
           expect(Ci::BuildNeed).to receive(:bulk_insert!).and_call_original
 
           expect(pipeline).to be_persisted
diff --git a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
index bda7939ed9b491..680f9e4e659047 100644
--- a/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
+++ b/spec/services/ci/pipeline_processing/atomic_processing_service_spec.rb
@@ -790,7 +790,7 @@ def event_on_pipeline(event)
 
     context 'when pipeline with needs is created', :sidekiq_inline do
       before do
-        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+        stub_feature_flags(read_needs_from_job_definition: false) # Temp to pass tests
       end
 
       let!(:linux_build) { create_build('linux:build', stage: 'build', stage_idx: 0) }
@@ -844,7 +844,7 @@ def event_on_pipeline(event)
 
       context 'when one of the jobs is run on a failure' do
         before do
-          stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+          stub_feature_flags(read_needs_from_job_definition: false) # Temp to pass tests
         end
 
         let!(:linux_notify) { create_build('linux:notify', stage: 'deploy', stage_idx: 2, when: 'on_failure', scheduling_type: :dag) }
@@ -907,7 +907,7 @@ def event_on_pipeline(event)
       let!(:deploy) { create_build('deploy', stage: 'deploy', stage_idx: 2, scheduling_type: :dag) }
 
       before do
-        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+        stub_feature_flags(read_needs_from_job_definition: false) # Temp to pass tests
         create(:ci_build_need, build: deploy, name: 'linux:build')
       end
 
@@ -930,7 +930,7 @@ def event_on_pipeline(event)
       let!(:deploy) { create_build('deploy', stage: 'deploy', stage_idx: 1, scheduling_type: :dag) }
 
       before do
-        stub_feature_flags(read_needs_from_ci_job_definitions: false) # Temp to pass tests
+        stub_feature_flags(read_needs_from_job_definition: false) # Temp to pass tests
         create(:ci_build_need, build: deploy, name: 'linux:build')
       end
 
diff --git a/spec/services/ci/reset_skipped_jobs_service_spec.rb b/spec/services/ci/reset_skipped_jobs_service_spec.rb
index 06dad52a1108f0..bac1b7fd94f54e 100644
--- a/spec/services/ci/reset_skipped_jobs_service_spec.rb
+++ b/spec/services/ci/reset_skipped_jobs_service_spec.rb
@@ -422,7 +422,7 @@ def processables
 
   def jobs_name_status_owner_needs
     processables.reload.map do |job|
-      if job.read_needs_from_job_definition?
+      if job.read_from_job_info?
         job.attributes.slice('name', 'status', 'user_id').merge('needs' => job.job_needs.names)
       else
         job.attributes.slice('name', 'status', 'user_id').merge('needs' => job.needs.map(&:name))
diff --git a/spec/support/helpers/ci/job_factory_helpers.rb b/spec/support/helpers/ci/job_factory_helpers.rb
index 8b948e7e0992eb..7347e4196b0003 100644
--- a/spec/support/helpers/ci/job_factory_helpers.rb
+++ b/spec/support/helpers/ci/job_factory_helpers.rb
@@ -20,5 +20,16 @@ def self.mutate_temp_job_definition(job, **new_config)
 
       job.temp_job_definition = new_temp_job_definition
     end
+
+    def self.mutate_temp_job_info(job, **new_job_attrs)
+      job.temp_job_info ||= ::Ci::JobInfo.fabricate(
+        job_attrs: new_job_attrs,
+        project_id: job.project_id,
+        partition_id: job.partition_id
+      )
+
+      job.temp_job_info.mutate(**new_job_attrs)
+      job.temp_job_info.validate!
+    end
   end
 end
-- 
GitLab