Commit e5217520 authored by Douglas Barbosa Alexandre's avatar Douglas Barbosa Alexandre

Merge branch 'ag-add-verification-for-lfs-objects' into 'master'

Geo: Add verification for LFS objects [RUN ALL RSPEC] [RUN AS-IF-FOSS]

See merge request gitlab-org/gitlab!63981
parents cf22999b b2c1d0a8
# frozen_string_literal: true
class CreateLfsObjectStates < Gitlab::Database::Migration[1.0]
VERIFICATION_STATE_INDEX_NAME = "index_lfs_object_states_on_verification_state"
PENDING_VERIFICATION_INDEX_NAME = "index_lfs_object_states_pending_verification"
FAILED_VERIFICATION_INDEX_NAME = "index_lfs_object_states_failed_verification"
NEEDS_VERIFICATION_INDEX_NAME = "index_lfs_object_states_needs_verification"
disable_ddl_transaction!
def up
create_table :lfs_object_states, id: false do |t|
t.datetime_with_timezone :verification_started_at
t.datetime_with_timezone :verification_retry_at
t.datetime_with_timezone :verified_at
t.references :lfs_object, primary_key: true, null: false, foreign_key: { on_delete: :cascade }
t.integer :verification_state, default: 0, limit: 2, null: false
t.integer :verification_retry_count, limit: 2
t.binary :verification_checksum, using: 'verification_checksum::bytea'
t.text :verification_failure, limit: 255
t.index :verification_state, name: VERIFICATION_STATE_INDEX_NAME
t.index :verified_at, where: "(verification_state = 0)", order: { verified_at: 'ASC NULLS FIRST' }, name: PENDING_VERIFICATION_INDEX_NAME
t.index :verification_retry_at, where: "(verification_state = 3)", order: { verification_retry_at: 'ASC NULLS FIRST' }, name: FAILED_VERIFICATION_INDEX_NAME
t.index :verification_state, where: "(verification_state = 0 OR verification_state = 3)", name: NEEDS_VERIFICATION_INDEX_NAME
end
end
def down
drop_table :lfs_object_states
end
end
0d27ca1250d10b8915fa4523707044f9a8c2372110537f5639a1811aeb0858b8
\ No newline at end of file
...@@ -15769,6 +15769,27 @@ CREATE SEQUENCE lfs_file_locks_id_seq ...@@ -15769,6 +15769,27 @@ CREATE SEQUENCE lfs_file_locks_id_seq
ALTER SEQUENCE lfs_file_locks_id_seq OWNED BY lfs_file_locks.id; ALTER SEQUENCE lfs_file_locks_id_seq OWNED BY lfs_file_locks.id;
CREATE TABLE lfs_object_states (
verification_started_at timestamp with time zone,
verification_retry_at timestamp with time zone,
verified_at timestamp with time zone,
lfs_object_id bigint NOT NULL,
verification_state smallint DEFAULT 0 NOT NULL,
verification_retry_count smallint,
verification_checksum bytea,
verification_failure text,
CONSTRAINT check_efe45a8ab3 CHECK ((char_length(verification_failure) <= 255))
);
CREATE SEQUENCE lfs_object_states_lfs_object_id_seq
START WITH 1
INCREMENT BY 1
NO MINVALUE
NO MAXVALUE
CACHE 1;
ALTER SEQUENCE lfs_object_states_lfs_object_id_seq OWNED BY lfs_object_states.lfs_object_id;
CREATE TABLE lfs_objects ( CREATE TABLE lfs_objects (
id integer NOT NULL, id integer NOT NULL,
oid character varying NOT NULL, oid character varying NOT NULL,
...@@ -21795,6 +21816,8 @@ ALTER TABLE ONLY ldap_group_links ALTER COLUMN id SET DEFAULT nextval('ldap_grou ...@@ -21795,6 +21816,8 @@ ALTER TABLE ONLY ldap_group_links ALTER COLUMN id SET DEFAULT nextval('ldap_grou
ALTER TABLE ONLY lfs_file_locks ALTER COLUMN id SET DEFAULT nextval('lfs_file_locks_id_seq'::regclass); ALTER TABLE ONLY lfs_file_locks ALTER COLUMN id SET DEFAULT nextval('lfs_file_locks_id_seq'::regclass);
ALTER TABLE ONLY lfs_object_states ALTER COLUMN lfs_object_id SET DEFAULT nextval('lfs_object_states_lfs_object_id_seq'::regclass);
ALTER TABLE ONLY lfs_objects ALTER COLUMN id SET DEFAULT nextval('lfs_objects_id_seq'::regclass); ALTER TABLE ONLY lfs_objects ALTER COLUMN id SET DEFAULT nextval('lfs_objects_id_seq'::regclass);
ALTER TABLE ONLY lfs_objects_projects ALTER COLUMN id SET DEFAULT nextval('lfs_objects_projects_id_seq'::regclass); ALTER TABLE ONLY lfs_objects_projects ALTER COLUMN id SET DEFAULT nextval('lfs_objects_projects_id_seq'::regclass);
...@@ -23513,6 +23536,9 @@ ALTER TABLE ONLY ldap_group_links ...@@ -23513,6 +23536,9 @@ ALTER TABLE ONLY ldap_group_links
ALTER TABLE ONLY lfs_file_locks ALTER TABLE ONLY lfs_file_locks
ADD CONSTRAINT lfs_file_locks_pkey PRIMARY KEY (id); ADD CONSTRAINT lfs_file_locks_pkey PRIMARY KEY (id);
ALTER TABLE ONLY lfs_object_states
ADD CONSTRAINT lfs_object_states_pkey PRIMARY KEY (lfs_object_id);
ALTER TABLE ONLY lfs_objects ALTER TABLE ONLY lfs_objects
ADD CONSTRAINT lfs_objects_pkey PRIMARY KEY (id); ADD CONSTRAINT lfs_objects_pkey PRIMARY KEY (id);
...@@ -26529,6 +26555,16 @@ CREATE UNIQUE INDEX index_lfs_file_locks_on_project_id_and_path ON lfs_file_lock ...@@ -26529,6 +26555,16 @@ CREATE UNIQUE INDEX index_lfs_file_locks_on_project_id_and_path ON lfs_file_lock
CREATE INDEX index_lfs_file_locks_on_user_id ON lfs_file_locks USING btree (user_id); CREATE INDEX index_lfs_file_locks_on_user_id ON lfs_file_locks USING btree (user_id);
CREATE INDEX index_lfs_object_states_failed_verification ON lfs_object_states USING btree (verification_retry_at NULLS FIRST) WHERE (verification_state = 3);
CREATE INDEX index_lfs_object_states_needs_verification ON lfs_object_states USING btree (verification_state) WHERE ((verification_state = 0) OR (verification_state = 3));
CREATE INDEX index_lfs_object_states_on_lfs_object_id ON lfs_object_states USING btree (lfs_object_id);
CREATE INDEX index_lfs_object_states_on_verification_state ON lfs_object_states USING btree (verification_state);
CREATE INDEX index_lfs_object_states_pending_verification ON lfs_object_states USING btree (verified_at NULLS FIRST) WHERE (verification_state = 0);
CREATE INDEX index_lfs_objects_on_file_store ON lfs_objects USING btree (file_store); CREATE INDEX index_lfs_objects_on_file_store ON lfs_objects USING btree (file_store);
CREATE UNIQUE INDEX index_lfs_objects_on_oid ON lfs_objects USING btree (oid); CREATE UNIQUE INDEX index_lfs_objects_on_oid ON lfs_objects USING btree (oid);
...@@ -30333,6 +30369,9 @@ ALTER TABLE ONLY description_versions ...@@ -30333,6 +30369,9 @@ ALTER TABLE ONLY description_versions
ALTER TABLE ONLY clusters_kubernetes_namespaces ALTER TABLE ONLY clusters_kubernetes_namespaces
ADD CONSTRAINT fk_rails_40cc7ccbc3 FOREIGN KEY (cluster_project_id) REFERENCES cluster_projects(id) ON DELETE SET NULL; ADD CONSTRAINT fk_rails_40cc7ccbc3 FOREIGN KEY (cluster_project_id) REFERENCES cluster_projects(id) ON DELETE SET NULL;
ALTER TABLE ONLY lfs_object_states
ADD CONSTRAINT fk_rails_4188448cd5 FOREIGN KEY (lfs_object_id) REFERENCES lfs_objects(id) ON DELETE CASCADE;
ALTER TABLE ONLY geo_node_namespace_links ALTER TABLE ONLY geo_node_namespace_links
ADD CONSTRAINT fk_rails_41ff5fb854 FOREIGN KEY (namespace_id) REFERENCES namespaces(id) ON DELETE CASCADE; ADD CONSTRAINT fk_rails_41ff5fb854 FOREIGN KEY (namespace_id) REFERENCES namespaces(id) ON DELETE CASCADE;
...@@ -37,7 +37,7 @@ verification methods: ...@@ -37,7 +37,7 @@ verification methods:
| Git | Group wiki repository | Geo with Gitaly | _Not implemented_ | | Git | Group wiki repository | Geo with Gitaly | _Not implemented_ |
| Blobs | User uploads _(file system)_ | Geo with API | _Not implemented_ | | Blobs | User uploads _(file system)_ | Geo with API | _Not implemented_ |
| Blobs | User uploads _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ | | Blobs | User uploads _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ |
| Blobs | LFS objects _(file system)_ | Geo with API | _Not implemented_ | | Blobs | LFS objects _(file system)_ | Geo with API | SHA256 checksum |
| Blobs | LFS objects _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ | | Blobs | LFS objects _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ |
| Blobs | CI job artifacts _(file system)_ | Geo with API | _Not implemented_ | | Blobs | CI job artifacts _(file system)_ | Geo with API | _Not implemented_ |
| Blobs | CI job artifacts _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ | | Blobs | CI job artifacts _(object storage)_ | Geo with API/Managed (*2*) | _Not implemented_ |
...@@ -190,7 +190,7 @@ successfully, you must replicate their data using some other means. ...@@ -190,7 +190,7 @@ successfully, you must replicate their data using some other means.
|[Project wiki repository](../../../user/project/wiki/) | **Yes** (10.2) | **Yes** (10.7) | No | | |[Project wiki repository](../../../user/project/wiki/) | **Yes** (10.2) | **Yes** (10.7) | No | |
|[Group wiki repository](../../../user/project/wiki/group.md) | [**Yes** (13.10)](https://gitlab.com/gitlab-org/gitlab/-/issues/208147) | No | No | Behind feature flag `geo_group_wiki_repository_replication`, enabled by default. | |[Group wiki repository](../../../user/project/wiki/group.md) | [**Yes** (13.10)](https://gitlab.com/gitlab-org/gitlab/-/issues/208147) | No | No | Behind feature flag `geo_group_wiki_repository_replication`, enabled by default. |
|[Uploads](../../uploads.md) | **Yes** (10.2) | [No](https://gitlab.com/groups/gitlab-org/-/epics/1817) | No | Verified only on transfer or manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. | |[Uploads](../../uploads.md) | **Yes** (10.2) | [No](https://gitlab.com/groups/gitlab-org/-/epics/1817) | No | Verified only on transfer or manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. |
|[LFS objects](../../lfs/index.md) | **Yes** (10.2) | [No](https://gitlab.com/gitlab-org/gitlab/-/issues/8922) | Via Object Storage provider if supported. Native Geo support (Beta). | Verified only on transfer or manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. GitLab versions 11.11.x and 12.0.x are affected by [a bug that prevents any new LFS objects from replicating](https://gitlab.com/gitlab-org/gitlab/-/issues/32696).<br><br>Behind feature flag `geo_lfs_object_replication`, enabled by default. | |[LFS objects](../../lfs/index.md) | **Yes** (10.2) | **Yes**(14.6) | Via Object Storage provider if supported. Native Geo support (Beta). | Verified only on transfer or manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. GitLab versions 11.11.x and 12.0.x are affected by [a bug that prevents any new LFS objects from replicating](https://gitlab.com/gitlab-org/gitlab/-/issues/32696).<br /><br />Replication is behind the feature flag `geo_lfs_object_replication`, enabled by default. Verification is under development behind the feature flag `geo_lfs_object_verification` introduced in 14.6. |
|[Personal snippets](../../../user/snippets.md) | **Yes** (10.2) | **Yes** (10.2) | No | | |[Personal snippets](../../../user/snippets.md) | **Yes** (10.2) | **Yes** (10.2) | No | |
|[Project snippets](../../../user/snippets.md) | **Yes** (10.2) | **Yes** (10.2) | No | | |[Project snippets](../../../user/snippets.md) | **Yes** (10.2) | **Yes** (10.2) | No | |
|[CI job artifacts](../../../ci/pipelines/job_artifacts.md) | **Yes** (10.4) | [No](https://gitlab.com/gitlab-org/gitlab/-/issues/8923) | Via Object Storage provider if supported. Native Geo support (Beta). | Verified only manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. Job logs also verified on transfer. | |[CI job artifacts](../../../ci/pipelines/job_artifacts.md) | **Yes** (10.4) | [No](https://gitlab.com/gitlab-org/gitlab/-/issues/8923) | Via Object Storage provider if supported. Native Geo support (Beta). | Verified only manually using [Integrity Check Rake Task](../../raketasks/check.md) on both sites and comparing the output between them. Job logs also verified on transfer. |
......
...@@ -187,16 +187,25 @@ configuration option in `gitlab.yml`. These metrics are served from the ...@@ -187,16 +187,25 @@ configuration option in `gitlab.yml`. These metrics are served from the
| `geo_repositories` | Gauge | 10.2 | Total number of repositories available on primary | `url` | | `geo_repositories` | Gauge | 10.2 | Total number of repositories available on primary | `url` |
| `geo_repositories_synced` | Gauge | 10.2 | Number of repositories synced on secondary | `url` | | `geo_repositories_synced` | Gauge | 10.2 | Number of repositories synced on secondary | `url` |
| `geo_repositories_failed` | Gauge | 10.2 | Number of repositories failed to sync on secondary | `url` | | `geo_repositories_failed` | Gauge | 10.2 | Number of repositories failed to sync on secondary | `url` |
| `geo_lfs_objects` | Gauge | 10.2 | Total number of LFS objects available on primary | `url` | | `geo_lfs_objects` | Gauge | 10.2 | Number of LFS objects on primary | `url` |
| `geo_lfs_objects_synced` | Gauge | 10.2 | Number of LFS objects synced on secondary | `url` | | `geo_lfs_objects_checksummed` | Gauge | 14.6 | Number of LFS objects checksummed successfully on primary | `url` |
| `geo_lfs_objects_failed` | Gauge | 10.2 | Number of LFS objects failed to sync on secondary | `url` | | `geo_lfs_objects_checksum_failed` | Gauge | 14.6 | Number of LFS objects failed to calculate the checksum on primary | `url` |
| `geo_lfs_objects_checksum_total` | Gauge | 14.6 | Number of LFS objects tried to checksum on primary | `url` |
| `geo_lfs_objects_synced` | Gauge | 10.2 | Number of syncable LFS objects synced on secondary | `url` |
| `geo_lfs_objects_failed` | Gauge | 10.2 | Number of syncable LFS objects failed to sync on secondary | `url` |
| `geo_lfs_objects_registry` | Gauge | 14.6 | Number of LFS objects in the registry | `url` |
| `geo_lfs_objects_verified` | Gauge | 14.6 | Number of LFS objects verified on secondary | `url` |
| `geo_lfs_objects_verification_failed` | Gauge | 14.6 | Number of LFS objects' verifications failed on secondary | `url` |
| `geo_lfs_objects_verification_total` | Gauge | 14.6 | Number of LFS objects' verifications tried on secondary | `url` |LFS objects failed to sync on secondary | `url` |
| `geo_attachments` | Gauge | 10.2 | Total number of file attachments available on primary | `url` |
| `geo_attachments_synced` | Gauge | 10.2 | Number of attachments synced on secondary | `url` |
| `geo_attachments_failed` | Gauge | 10.2 | Number of attachments failed to sync on secondary | `url` |
| `geo_last_event_id` | Gauge | 10.2 | Database ID of the latest event log entry on the primary | `url` | | `geo_last_event_id` | Gauge | 10.2 | Database ID of the latest event log entry on the primary | `url` |
| `geo_last_event_timestamp` | Gauge | 10.2 | UNIX timestamp of the latest event log entry on the primary | `url` | | `geo_last_event_timestamp` | Gauge | 10.2 | UNIX timestamp of the latest event log entry on the primary | `url` |
| `geo_cursor_last_event_id` | Gauge | 10.2 | Last database ID of the event log processed by the secondary | `url` | | `geo_cursor_last_event_id` | Gauge | 10.2 | Last database ID of the event log processed by the secondary | `url` |
| `geo_cursor_last_event_timestamp` | Gauge | 10.2 | Last UNIX timestamp of the event log processed by the secondary | `url` | | `geo_cursor_last_event_timestamp` | Gauge | 10.2 | Last UNIX timestamp of the event log processed by the secondary | `url` |
| `geo_status_failed_total` | Counter | 10.2 | Number of times retrieving the status from the Geo Node failed | `url` | | `geo_status_failed_total` | Counter | 10.2 | Number of times retrieving the status from the Geo Node failed | `url` |
| `geo_last_successful_status_check_timestamp` | Gauge | 10.2 | Last timestamp when the status was successfully updated | `url` | | `geo_last_successful_status_check_timestamp` | Gauge | 10.2 | Last timestamp when the status was successfully updated | `url` |
| `geo_lfs_objects_synced_missing_on_primary` | Gauge | 10.7 | Number of LFS objects marked as synced due to the file missing on the primary | `url` |
| `geo_job_artifacts_synced_missing_on_primary` | Gauge | 10.7 | Number of job artifacts marked as synced due to the file missing on the primary | `url` | | `geo_job_artifacts_synced_missing_on_primary` | Gauge | 10.7 | Number of job artifacts marked as synced due to the file missing on the primary | `url` |
| `geo_repositories_checksummed` | Gauge | 10.7 | Number of repositories checksummed on primary | `url` | | `geo_repositories_checksummed` | Gauge | 10.7 | Number of repositories checksummed on primary | `url` |
| `geo_repositories_checksum_failed` | Gauge | 10.7 | Number of repositories failed to calculate the checksum on primary | `url` | | `geo_repositories_checksum_failed` | Gauge | 10.7 | Number of repositories failed to calculate the checksum on primary | `url` |
......
...@@ -307,11 +307,18 @@ Example response: ...@@ -307,11 +307,18 @@ Example response:
"health_status": "Healthy", "health_status": "Healthy",
"missing_oauth_application": false, "missing_oauth_application": false,
"db_replication_lag_seconds": null, "db_replication_lag_seconds": null,
"lfs_objects_count": 0, "lfs_objects_count": 5,
"lfs_objects_checksum_total_count": 5,
"lfs_objects_checksummed_count": 5,
"lfs_objects_checksum_failed_count": 0,
"lfs_objects_synced_count": null, "lfs_objects_synced_count": null,
"lfs_objects_failed_count": null, "lfs_objects_failed_count": null,
"lfs_objects_synced_missing_on_primary_count": 0, "lfs_objects_registry_count": null,
"lfs_objects_verification_total_count": null,
"lfs_objects_verified_count": null,
"lfs_objects_verification_failed_count": null,
"lfs_objects_synced_in_percentage": "0.00%", "lfs_objects_synced_in_percentage": "0.00%",
"lfs_objects_verified_in_percentage": "0.00%",
"job_artifacts_count": 2, "job_artifacts_count": 2,
"job_artifacts_synced_count": null, "job_artifacts_synced_count": null,
"job_artifacts_failed_count": null, "job_artifacts_failed_count": null,
...@@ -468,11 +475,18 @@ Example response: ...@@ -468,11 +475,18 @@ Example response:
"health_status": "Healthy", "health_status": "Healthy",
"missing_oauth_application": false, "missing_oauth_application": false,
"db_replication_lag_seconds": 0, "db_replication_lag_seconds": 0,
"lfs_objects_count": 0, "lfs_objects_count": 5,
"lfs_objects_synced_count": 0, "lfs_objects_checksum_total_count": 5,
"lfs_objects_failed_count": 0, "lfs_objects_checksummed_count": 5,
"lfs_objects_synced_missing_on_primary_count": 0, "lfs_objects_checksum_failed_count": 0,
"lfs_objects_synced_count": null,
"lfs_objects_failed_count": null,
"lfs_objects_registry_count": null,
"lfs_objects_verification_total_count": null,
"lfs_objects_verified_count": null,
"lfs_objects_verification_failed_count": null,
"lfs_objects_synced_in_percentage": "0.00%", "lfs_objects_synced_in_percentage": "0.00%",
"lfs_objects_verified_in_percentage": "0.00%",
"job_artifacts_count": 2, "job_artifacts_count": 2,
"job_artifacts_synced_count": 1, "job_artifacts_synced_count": 1,
"job_artifacts_failed_count": 1, "job_artifacts_failed_count": 1,
...@@ -633,11 +647,18 @@ Example response: ...@@ -633,11 +647,18 @@ Example response:
"health_status": "Healthy", "health_status": "Healthy",
"missing_oauth_application": false, "missing_oauth_application": false,
"db_replication_lag_seconds": 0, "db_replication_lag_seconds": 0,
"lfs_objects_count": 0, "lfs_objects_count": 5,
"lfs_objects_synced_count": 0, "lfs_objects_checksum_total_count": 5,
"lfs_objects_failed_count": 0, "lfs_objects_checksummed_count": 5,
"lfs_objects_synced_missing_on_primary_count": 0, "lfs_objects_checksum_failed_count": 0,
"lfs_objects_synced_count": null,
"lfs_objects_failed_count": null,
"lfs_objects_registry_count": null,
"lfs_objects_verification_total_count": null,
"lfs_objects_verified_count": null,
"lfs_objects_verification_failed_count": null,
"lfs_objects_synced_in_percentage": "0.00%", "lfs_objects_synced_in_percentage": "0.00%",
"lfs_objects_verified_in_percentage": "0.00%",
"job_artifacts_count": 2, "job_artifacts_count": 2,
"job_artifacts_synced_count": 1, "job_artifacts_synced_count": 1,
"job_artifacts_failed_count": 1, "job_artifacts_failed_count": 1,
......
...@@ -12,13 +12,39 @@ module EE ...@@ -12,13 +12,39 @@ module EE
prepended do prepended do
include ::Gitlab::Geo::ReplicableModel include ::Gitlab::Geo::ReplicableModel
include ::Gitlab::Geo::VerificationState
with_replicator ::Geo::LfsObjectReplicator with_replicator ::Geo::LfsObjectReplicator
scope :project_id_in, ->(ids) { joins(:projects).merge(::Project.id_in(ids)) } scope :project_id_in, ->(ids) { joins(:projects).merge(::Project.id_in(ids)) }
has_one :lfs_object_state, autosave: false, inverse_of: :lfs_object, class_name: 'Geo::LfsObjectState'
after_save :save_verification_details
delegate :verification_retry_at, :verification_retry_at=,
:verified_at, :verified_at=,
:verification_checksum, :verification_checksum=,
:verification_failure, :verification_failure=,
:verification_retry_count, :verification_retry_count=,
:verification_state=, :verification_state,
:verification_started_at=, :verification_started_at,
to: :lfs_object_state, allow_nil: true
scope :with_verification_state, ->(state) { joins(:lfs_object_state).where(lfs_object_states: { verification_state: verification_state_value(state) }) }
scope :checksummed, -> { joins(:lfs_object_state).where.not(lfs_object_states: { verification_checksum: nil } ) }
scope :not_checksummed, -> { joins(:lfs_object_state).where(lfs_object_states: { verification_checksum: nil } ) }
scope :available_verifiables, -> { joins(:lfs_object_state) }
def verification_state_object
lfs_object_state
end
end end
class_methods do class_methods do
extend ::Gitlab::Utils::Override
# @param primary_key_in [Range, LfsObject] arg to pass to primary_key_in scope # @param primary_key_in [Range, LfsObject] arg to pass to primary_key_in scope
# @return [ActiveRecord::Relation<LfsObject>] everything that should be synced to this node, restricted by primary key # @return [ActiveRecord::Relation<LfsObject>] everything that should be synced to this node, restricted by primary key
def replicables_for_current_secondary(primary_key_in) def replicables_for_current_secondary(primary_key_in)
...@@ -27,6 +53,11 @@ module EE ...@@ -27,6 +53,11 @@ module EE
.merge(object_storage_scope(node)) .merge(object_storage_scope(node))
end end
override :verification_state_table_class
def verification_state_table_class
Geo::LfsObjectState
end
private private
def object_storage_scope(node) def object_storage_scope(node)
...@@ -36,6 +67,10 @@ module EE ...@@ -36,6 +67,10 @@ module EE
end end
end end
def lfs_object_state
super || build_lfs_object_state
end
def log_geo_deleted_event def log_geo_deleted_event
# Keep empty for now. Should be addressed in future # Keep empty for now. Should be addressed in future
# by https://gitlab.com/gitlab-org/gitlab/-/issues/232917 # by https://gitlab.com/gitlab-org/gitlab/-/issues/232917
......
...@@ -2,6 +2,7 @@ ...@@ -2,6 +2,7 @@
class Geo::LfsObjectRegistry < Geo::BaseRegistry class Geo::LfsObjectRegistry < Geo::BaseRegistry
include ::Geo::ReplicableRegistry include ::Geo::ReplicableRegistry
include ::Geo::VerifiableRegistry
MODEL_CLASS = ::LfsObject MODEL_CLASS = ::LfsObject
MODEL_FOREIGN_KEY = :lfs_object_id MODEL_FOREIGN_KEY = :lfs_object_id
......
# frozen_string_literal: true
module Geo
class LfsObjectState < ApplicationRecord
self.primary_key = :lfs_object_id
belongs_to :lfs_object, inverse_of: :lfs_object_state
end
end
...@@ -3,6 +3,7 @@ ...@@ -3,6 +3,7 @@
module Geo module Geo
class LfsObjectReplicator < Gitlab::Geo::Replicator class LfsObjectReplicator < Gitlab::Geo::Replicator
include ::Geo::BlobReplicatorStrategy include ::Geo::BlobReplicatorStrategy
extend ::Gitlab::Utils::Override
def carrierwave_uploader def carrierwave_uploader
model_record.file model_record.file
...@@ -11,5 +12,10 @@ module Geo ...@@ -11,5 +12,10 @@ module Geo
def self.model def self.model
::LfsObject ::LfsObject
end end
override :verification_feature_flag_enabled?
def self.verification_feature_flag_enabled?
Feature.enabled?(:geo_lfs_object_verification, default_enabled: :yaml)
end
end end
end end
---
name: geo_lfs_object_verification
introduced_by_url: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/63981
rollout_issue_url: https://gitlab.com/gitlab-org/gitlab/-/issues/333532
milestone: '14.6'
type: development
group: group::geo
default_enabled: false
# frozen_string_literal: true
class AddVerificationToLfsObjectRegistry < Gitlab::Database::Migration[1.0]
disable_ddl_transaction!
# rubocop:disable Migration/AddLimitToTextColumns
# limit is added in 20211124000001_add_text_limit_to_lfs_object_registry_verification_failure.rb
def change
add_column :lfs_object_registry, :verification_started_at, :datetime_with_timezone
add_column :lfs_object_registry, :verified_at, :datetime_with_timezone
add_column :lfs_object_registry, :verification_retry_at, :datetime_with_timezone
add_column :lfs_object_registry, :verification_retry_count, :integer, default: 0
add_column :lfs_object_registry, :verification_state, :integer, limit: 2, default: 0, null: false
add_column :lfs_object_registry, :checksum_mismatch, :boolean, default: false, null: false
add_column :lfs_object_registry, :verification_checksum, :binary
add_column :lfs_object_registry, :verification_checksum_mismatched, :binary
add_column :lfs_object_registry, :verification_failure, :text
# rubocop:enable Migration/AddLimitToTextColumns
end
end
# frozen_string_literal: true
class AddTextLimitToLfsObjectRegistryVerificationFailure < Gitlab::Database::Migration[1.0]
disable_ddl_transaction!
def up
add_text_limit :lfs_object_registry, :verification_failure, 255
end
def down
remove_text_limit :lfs_object_registry, :verification_failure
end
end
# frozen_string_literal: true
class AddIndexesToLfsObjectRegistry < Gitlab::Database::Migration[1.0]
LFS_OBJECT_ID_INDEX_NAME = "index_lfs_object_registry_on_lfs_object_id"
FAILED_VERIFICATION_INDEX_NAME = "lfs_object_registry_failed_verification"
NEEDS_VERIFICATION_INDEX_NAME = "lfs_object_registry_needs_verification"
PENDING_VERIFICATION_INDEX_NAME = "lfs_object_registry_pending_verification"
REGISTRY_TABLE = :lfs_object_registry
disable_ddl_transaction!
def up
add_concurrent_index REGISTRY_TABLE, :lfs_object_id, name: LFS_OBJECT_ID_INDEX_NAME, unique: true
add_concurrent_index REGISTRY_TABLE, :verification_retry_at, name: FAILED_VERIFICATION_INDEX_NAME, order: "NULLS FIRST", where: "((state = 2) AND (verification_state = 3))"
add_concurrent_index REGISTRY_TABLE, :verification_state, name: NEEDS_VERIFICATION_INDEX_NAME, where: "((state = 2) AND (verification_state = ANY (ARRAY[0, 3])))"
add_concurrent_index REGISTRY_TABLE, :verified_at, name: PENDING_VERIFICATION_INDEX_NAME, order: "NULLS FIRST", where: "((state = 2) AND (verification_state = 0))"
end
def down
remove_concurrent_index_by_name REGISTRY_TABLE, name: LFS_OBJECT_ID_INDEX_NAME
remove_concurrent_index_by_name REGISTRY_TABLE, name: FAILED_VERIFICATION_INDEX_NAME
remove_concurrent_index_by_name REGISTRY_TABLE, name: NEEDS_VERIFICATION_INDEX_NAME
remove_concurrent_index_by_name REGISTRY_TABLE, name: PENDING_VERIFICATION_INDEX_NAME
end
end
7115b2493e24cef7d385e076488539515aa00f097d477c7365b649032ed74dae
\ No newline at end of file
f67ac276604ebed45ec59a450e35666833a76d770a85ab15be4d275f836652ba
\ No newline at end of file
388d2578ae1385b5276f760a5cb204831fab01e33f9f1ea75ea1717c11c6e7bb
\ No newline at end of file
...@@ -151,7 +151,17 @@ CREATE TABLE lfs_object_registry ( ...@@ -151,7 +151,17 @@ CREATE TABLE lfs_object_registry (
sha256 bytea, sha256 bytea,
state smallint DEFAULT 0 NOT NULL, state smallint DEFAULT 0 NOT NULL,
last_synced_at timestamp with time zone, last_synced_at timestamp with time zone,
last_sync_failure text last_sync_failure text,
verification_started_at timestamp with time zone,
verified_at timestamp with time zone,
verification_retry_at timestamp with time zone,
verification_retry_count integer DEFAULT 0,
verification_state smallint DEFAULT 0 NOT NULL,
checksum_mismatch boolean DEFAULT false NOT NULL,
verification_checksum bytea,
verification_checksum_mismatched bytea,
verification_failure text,
CONSTRAINT check_8bcaa12138 CHECK ((char_length(verification_failure) <= 255))
); );
CREATE SEQUENCE lfs_object_registry_id_seq CREATE SEQUENCE lfs_object_registry_id_seq
...@@ -596,6 +606,12 @@ CREATE UNIQUE INDEX index_terraform_state_version_registry_on_t_state_version_id ...@@ -596,6 +606,12 @@ CREATE UNIQUE INDEX index_terraform_state_version_registry_on_t_state_version_id
CREATE UNIQUE INDEX index_tf_state_versions_registry_tf_state_versions_id_unique ON terraform_state_version_registry USING btree (terraform_state_version_id); CREATE UNIQUE INDEX index_tf_state_versions_registry_tf_state_versions_id_unique ON terraform_state_version_registry USING btree (terraform_state_version_id);
CREATE INDEX lfs_object_registry_failed_verification ON lfs_object_registry USING btree (verification_retry_at NULLS FIRST) WHERE ((state = 2) AND (verification_state = 3));
CREATE INDEX lfs_object_registry_needs_verification ON lfs_object_registry USING btree (verification_state) WHERE ((state = 2) AND (verification_state = ANY (ARRAY[0, 3])));
CREATE INDEX lfs_object_registry_pending_verification ON lfs_object_registry USING btree (verified_at NULLS FIRST) WHERE ((state = 2) AND (verification_state = 0));
CREATE INDEX merge_request_diff_registry_failed_verification ON merge_request_diff_registry USING btree (verification_retry_at NULLS FIRST) WHERE ((state = 2) AND (verification_state = 3)); CREATE INDEX merge_request_diff_registry_failed_verification ON merge_request_diff_registry USING btree (verification_retry_at NULLS FIRST) WHERE ((state = 2) AND (verification_state = 3));
CREATE INDEX merge_request_diff_registry_needs_verification ON merge_request_diff_registry USING btree (verification_state) WHERE ((state = 2) AND (verification_state = ANY (ARRAY[0, 3]))); CREATE INDEX merge_request_diff_registry_needs_verification ON merge_request_diff_registry USING btree (verification_state) WHERE ((state = 2) AND (verification_state = ANY (ARRAY[0, 3])));
......
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
FactoryBot.define do FactoryBot.define do
factory :geo_lfs_object_registry, class: 'Geo::LfsObjectRegistry' do factory :geo_lfs_object_registry, class: 'Geo::LfsObjectRegistry' do
lfs_object association(:lfs_object, :with_file)
state { Geo::LfsObjectRegistry.state_value(:pending) } state { Geo::LfsObjectRegistry.state_value(:pending) }
trait :synced do trait :synced do
...@@ -22,5 +22,11 @@ FactoryBot.define do ...@@ -22,5 +22,11 @@ FactoryBot.define do
last_synced_at { 1.day.ago } last_synced_at { 1.day.ago }
retry_count { 0 } retry_count { 0 }
end end
trait :verification_succeeded do
verification_checksum { 'e079a831cab27bcda7d81cd9b48296d0c3dd92ef' }
verification_state { Geo::LfsObjectRegistry.verification_state_value(:verification_succeeded) }
verified_at { 5.days.ago }
end
end end
end end
# frozen_string_literal: true
FactoryBot.define do
factory :geo_lfs_object_state, class: 'Geo::LfsObjectState' do
lfs_object
trait(:checksummed) do
verification_checksum { 'abc' }
end
trait(:checksum_failure) do
verification_failure { 'Could not calculate the checksum' }
end
end
end
# frozen_string_literal: true
FactoryBot.modify do
factory :lfs_object do
trait(:checksummed) do
association :lfs_object_state, :checksummed, strategy: :build
end
trait(:checksum_failure) do
association :lfs_object_state, :checksum_failure, strategy: :build
end
trait(:verification_succeeded) do
with_file
verification_checksum { 'abc' }
verification_state { ::LfsObject.verification_state_value(:verification_succeeded) }
end
trait(:verification_failed) do
with_file
verification_failure { 'Could not calculate the checksum' }
verification_state { ::LfsObject.verification_state_value(:verification_failed) }
end
end
end
# frozen_string_literal: true
FactoryBot.modify do
factory :lfs_object do
trait(:verification_succeeded) do
with_file
verification_checksum { 'abc' }
verification_state { ::LfsObject.verification_state_value(:verification_succeeded) }
end
trait(:verification_failed) do
with_file
verification_failure { 'Could not calculate the checksum' }
verification_state { ::LfsObject.verification_state_value(:verification_failed) }
end
end
end
# frozen_string_literal: true
require 'spec_helper'
RSpec.describe ::LfsObject do
using RSpec::Parameterized::TableSyntax
include EE::GeoHelpers
let_it_be(:group) { create(:group) }
let_it_be(:project) { create(:project, :repository, group: group) }
let_it_be(:another_project) { create(:project, :repository) }
it { is_expected.to respond_to(:log_geo_deleted_event) }
context 'when model_record is part of available_verifiables scope' do
let(:verifiable_model_record) { build(:lfs_object) }
let(:verification_state_table_class) { verifiable_model_record.class.verification_state_table_class }
it 'creates verification details' do
expect { verifiable_model_record.save! }.to change { verification_state_table_class.count }.by(1)
end
end
describe '.with_files_stored_locally' do
let_it_be(:lfs_object) { create(:lfs_object, :with_file) }
it 'includes states with local storage' do
expect(described_class.with_files_stored_locally).to have_attributes(count: 1)
end
end
describe '.replicables_for_current_secondary' do
where(:selective_sync_enabled, :object_storage_sync_enabled, :lfs_object_object_storage_enabled, :synced_lfs_objects) do
true | true | false | 1
true | false | false | 1
false | true | false | 2
false | false | false | 2
true | true | true | 1
true | false | true | 1
false | true | true | 2
false | false | true | 2
end
with_them do
let(:secondary) do
node = build(:geo_node, sync_object_storage: object_storage_sync_enabled)
if selective_sync_enabled
node.selective_sync_type = 'namespaces'
node.namespaces = [group]
end
node.save!
node
end
before do
stub_current_geo_node(secondary)
stub_lfs_object_storage(uploader: LfsObjectUploader) if lfs_object_object_storage_enabled
lfs_object_1 = create(:lfs_object, :with_file)
lfs_object_2 = create(:lfs_object, :with_file)
create(:lfs_objects_project, lfs_object: lfs_object_1, project: project)
create(:lfs_objects_project, lfs_object: lfs_object_2, project: another_project)
end
it 'returns the proper number of LFS objects' do
expect(described_class.replicables_for_current_secondary(1..described_class.last.id).count).to eq(synced_lfs_objects)
end
end
end
end
...@@ -10,4 +10,5 @@ RSpec.describe Geo::LfsObjectRegistry, :geo, type: :model do ...@@ -10,4 +10,5 @@ RSpec.describe Geo::LfsObjectRegistry, :geo, type: :model do
end end
include_examples 'a Geo framework registry' include_examples 'a Geo framework registry'
include_examples 'a Geo verifiable registry'
end end
...@@ -5,5 +5,6 @@ require 'spec_helper' ...@@ -5,5 +5,6 @@ require 'spec_helper'
RSpec.describe Geo::LfsObjectReplicator do RSpec.describe Geo::LfsObjectReplicator do
let(:model_record) { build(:lfs_object, :with_file) } let(:model_record) { build(:lfs_object, :with_file) }
it_behaves_like 'a blob replicator' include_examples 'a blob replicator'
include_examples 'a verifiable replicator'
end end
...@@ -287,6 +287,7 @@ ldap_group_links: :gitlab_main ...@@ -287,6 +287,7 @@ ldap_group_links: :gitlab_main
lfs_file_locks: :gitlab_main lfs_file_locks: :gitlab_main
lfs_objects: :gitlab_main lfs_objects: :gitlab_main
lfs_objects_projects: :gitlab_main lfs_objects_projects: :gitlab_main
lfs_object_states: :gitlab_main
licenses: :gitlab_main licenses: :gitlab_main
lists: :gitlab_main lists: :gitlab_main
list_user_preferences: :gitlab_main list_user_preferences: :gitlab_main
......
...@@ -10,6 +10,9 @@ RSpec.describe 'User uploads new design', :js do ...@@ -10,6 +10,9 @@ RSpec.describe 'User uploads new design', :js do
let(:issue) { create(:issue, project: project) } let(:issue) { create(:issue, project: project) }
before do before do
# Cause of raising query limiting threshold https://gitlab.com/gitlab-org/gitlab/-/issues/347334
stub_const("Gitlab::QueryLimiting::Transaction::THRESHOLD", 102)
sign_in(user) sign_in(user)
enable_design_management(feature_enabled) enable_design_management(feature_enabled)
visit project_issue_path(project, issue) visit project_issue_path(project, issue)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment