Skip to content
代码片段 群组 项目
未验证 提交 f40df89e 编辑于 作者: Andy Schoenen's avatar Andy Schoenen 提交者: GitLab
浏览文件

Merge branch...

Merge branch '495649-solve-null-equality-in-bbm-that-deduplicates-lfs_objects_projects' into 'master' 

Solve null equality in BBM that deduplicates lfs_objects_projects

See merge request https://gitlab.com/gitlab-org/gitlab/-/merge_requests/167468



Merged-by: default avatarAndy Schoenen <asoiron@gitlab.com>
Approved-by: default avatarNaman Jagdish Gala <ngala@gitlab.com>
Approved-by: default avatarJarka Košanová <jarka@gitlab.com>
Approved-by: default avatarJerry Seto <jseto@gitlab.com>
Approved-by: default avatarAndy Schoenen <asoiron@gitlab.com>
Co-authored-by: default avatarJaviera Tapia <jtapia@gitlab.com>
No related branches found
No related tags found
无相关合并请求
...@@ -5,9 +5,13 @@ description: >- ...@@ -5,9 +5,13 @@ description: >-
After the migration is finalized, we need to add a unique index on all three columns to ensure After the migration is finalized, we need to add a unique index on all three columns to ensure
data consistency since the unique validation already exists at the model level. data consistency since the unique validation already exists at the model level.
Originally introduced by https://gitlab.com/gitlab-org/gitlab/-/merge_requests/154323 1) Originally introduced by https://gitlab.com/gitlab-org/gitlab/-/merge_requests/154323
Re-enqueued because we found some duplicates were still being introduced Re-enqueued because we found some duplicates were still being introduced
2) Originally re-enqueued in https://gitlab.com/gitlab-org/gitlab/-/merge_requests/167468
Re-enqueued a second time since we found some duplicates when repository_type is NULL
feature_category: source_code_management feature_category: source_code_management
introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/164127 introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/167468
milestone: '17.4' milestone: '17.5'
queued_migration_version: 20240827204855 queued_migration_version: 20240927202948
finalize_after: '2024-10-17' # required upgrade stop due date
...@@ -13,20 +13,13 @@ class ReenqueueDeduplicateLfsObjectsProjects < Gitlab::Database::Migration[2.2] ...@@ -13,20 +13,13 @@ class ReenqueueDeduplicateLfsObjectsProjects < Gitlab::Database::Migration[2.2]
restrict_gitlab_migration gitlab_schema: :gitlab_main restrict_gitlab_migration gitlab_schema: :gitlab_main
# To be re-enqueued by:
# db/post_migrate/20240927202948_reenqueue_deduplicate_lfs_objects_projects_with_null_repository_types.rb
def up def up
delete_batched_background_migration(MIGRATION, :lfs_objects_projects, :id, []) # no-op
queue_batched_background_migration(
MIGRATION,
:lfs_objects_projects,
:id,
job_interval: DELAY_INTERVAL,
batch_size: BATCH_SIZE,
sub_batch_size: SUB_BATCH_SIZE
)
end end
def down def down
delete_batched_background_migration(MIGRATION, :lfs_objects_projects, :id, []) # no-op
end end
end end
# frozen_string_literal: true
class ReenqueueDeduplicateLfsObjectsProjectsWithNullRepositoryTypes < Gitlab::Database::Migration[2.2]
milestone '17.5'
MIGRATION = 'DeduplicateLfsObjectsProjects'
TABLE_NAME = :lfs_objects_projects
DELAY_INTERVAL = 100
BATCH_SIZE = 10_000
SUB_BATCH_SIZE = 2_500
disable_ddl_transaction!
restrict_gitlab_migration gitlab_schema: :gitlab_main
def up
delete_batched_background_migration(MIGRATION, :lfs_objects_projects, :id, [])
queue_batched_background_migration(
MIGRATION,
:lfs_objects_projects,
:id,
job_interval: DELAY_INTERVAL,
batch_size: BATCH_SIZE,
sub_batch_size: SUB_BATCH_SIZE
)
end
def down
delete_batched_background_migration(MIGRATION, :lfs_objects_projects, :id, [])
end
end
b693c1b11d18d4dae7281af0e5784c91bd285d1e366baae96c00d22f3d0e05d8
\ No newline at end of file
...@@ -34,7 +34,7 @@ def perform ...@@ -34,7 +34,7 @@ def perform
INNER JOIN (#{subquery.to_sql}) AS duplicates INNER JOIN (#{subquery.to_sql}) AS duplicates
ON lfs_objects_projects.project_id = duplicates.project_id ON lfs_objects_projects.project_id = duplicates.project_id
AND lfs_objects_projects.lfs_object_id = duplicates.lfs_object_id AND lfs_objects_projects.lfs_object_id = duplicates.lfs_object_id
AND lfs_objects_projects.repository_type = duplicates.repository_type AND lfs_objects_projects.repository_type IS NOT DISTINCT FROM duplicates.repository_type
SQL SQL
duplicated_lfs_objects_projects = LfsObjectsProject.joins(join_query).where.not( duplicated_lfs_objects_projects = LfsObjectsProject.joins(join_query).where.not(
......
...@@ -68,15 +68,15 @@ ...@@ -68,15 +68,15 @@
end end
let!(:duplicated_lfs_objects_project3) do let!(:duplicated_lfs_objects_project3) do
lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: 0) lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: nil)
end end
let!(:duplicated_lfs_objects_project4) do let!(:duplicated_lfs_objects_project4) do
lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: 0) lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: nil)
end end
let!(:lfs_objects_project5) do let!(:lfs_objects_project5) do
lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: 0) lfs_objects_projects_table.create!(project_id: project2.id, lfs_object_id: lfs_object4.id, repository_type: nil)
end end
let!(:lfs_objects_project6) do let!(:lfs_objects_project6) do
......
...@@ -7,20 +7,7 @@ ...@@ -7,20 +7,7 @@
let(:batched_migration) { described_class::MIGRATION } let(:batched_migration) { described_class::MIGRATION }
it 'schedules a new batched migration' do it 'schedules a new batched migration' do
reversible_migration do |migration| migrate!
migration.before -> { expect(batched_migration).not_to have_scheduled_batched_migration
expect(batched_migration).not_to have_scheduled_batched_migration
}
migration.after -> {
expect(batched_migration).to have_scheduled_batched_migration(
table_name: :lfs_objects_projects,
column_name: :id,
batch_class_name: described_class::BATCH_CLASS_NAME,
batch_size: described_class::BATCH_SIZE,
sub_batch_size: described_class::SUB_BATCH_SIZE
)
}
end
end end
end end
# frozen_string_literal: true
require 'spec_helper'
require_migration!
RSpec.describe ReenqueueDeduplicateLfsObjectsProjectsWithNullRepositoryTypes, feature_category: :source_code_management do
let(:batched_migration) { described_class::MIGRATION }
it 'schedules a new batched migration' do
reversible_migration do |migration|
migration.before -> {
expect(batched_migration).not_to have_scheduled_batched_migration
}
migration.after -> {
expect(batched_migration).to have_scheduled_batched_migration(
table_name: :lfs_objects_projects,
column_name: :id,
batch_class_name: described_class::BATCH_CLASS_NAME,
batch_size: described_class::BATCH_SIZE,
sub_batch_size: described_class::SUB_BATCH_SIZE
)
}
end
end
end
0% 加载中 .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册