Bug #57190
pg shard status inconsistency in one pg
Status:
New
Priority:
Normal
Assignee:
-
Category:
-
Target version:
-
% Done:
0%
Source:
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
Affected Versions:
ceph-qa-suite:
Component(RADOS):
Pull request ID:
Crash signature (v1):
Crash signature (v2):
Description
ceph pg 7.6c2 query { "state": "active+clean", "snap_trimq": "[]", "snap_trimq_len": 0, "epoch": 597066, "up": [ 345, 102, 320 ], "acting": [ 345, 102, 320 ], "acting_recovery_backfill": [ "102", "320", "345" ], "info": { "pgid": "7.6c2", "last_update": "588276'8066", "last_complete": "588276'8066", "log_tail": "514733'5727", "last_user_version": 8066, "last_backfill": "MAX", "last_backfill_bitwise": 1, "purged_snaps": [], "history": { "epoch_created": 3327, "epoch_pool_created": 3324, "last_epoch_started": 597038, "last_interval_started": 597037, "last_epoch_clean": 597038, "last_interval_clean": 597037, "last_epoch_split": 3359, "last_epoch_marked_full": 0, "same_up_since": 597037, "same_interval_since": 597037, "same_primary_since": 597037, "last_scrub": "588276'8066", "last_scrub_stamp": "2022-08-19 11:06:54.021347", "last_deep_scrub": "588276'8066", "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347", "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" }, "stats": { "version": "588276'8066", "reported_seq": "610825", "reported_epoch": "597066", "state": "active+clean", "last_fresh": "2022-08-19 15:21:12.778548", "last_change": "2022-08-19 15:17:26.496067", "last_active": "2022-08-19 15:21:12.778548", "last_peered": "2022-08-19 15:21:12.778548", "last_clean": "2022-08-19 15:21:12.778548", "last_became_active": "2022-08-19 15:17:26.495960", "last_became_peered": "2022-08-19 15:17:26.495960", "last_unstale": "2022-08-19 15:21:12.778548", "last_undegraded": "2022-08-19 15:21:12.778548", "last_fullsized": "2022-08-19 15:21:12.778548", "mapping_epoch": 597037, "log_start": "514733'5727", "ondisk_log_start": "514733'5727", "created": 3327, "last_epoch_clean": 597038, "parent": "0.0", "parent_split_bits": 11, "last_scrub": "588276'8066", "last_scrub_stamp": "2022-08-19 11:06:54.021347", "last_deep_scrub": "588276'8066", "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347", "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347", "log_size": 2339, 
"ondisk_log_size": 2339, "stats_invalid": false, "dirty_stats_invalid": false, "omap_stats_invalid": false, "hitset_stats_invalid": false, "hitset_bytes_stats_invalid": false, "pin_stats_invalid": false, "manifest_stats_invalid": false, "snaptrimq_len": 0, "stat_sum": { "num_bytes": 0, "num_objects": 934, "num_object_clones": 0, "num_object_copies": 2802, "num_objects_missing_on_primary": 0, "num_objects_missing": 0, "num_objects_degraded": 0, "num_objects_misplaced": 0, "num_objects_unfound": 0, "num_objects_dirty": 934, "num_whiteouts": 0, "num_read": 2634, "num_read_kb": 7737100, "num_write": 19159, "num_write_kb": 12669502, "num_scrub_errors": 0, "num_shallow_scrub_errors": 0, "num_deep_scrub_errors": 0, "num_objects_recovered": 32343, "num_bytes_recovered": 71530162823, "num_keys_recovered": 0, "num_objects_omap": 0, "num_objects_hit_set_archive": 0, "num_bytes_hit_set_archive": 0, "num_flush": 0, "num_flush_kb": 0, "num_evict": 0, "num_evict_kb": 0, "num_promote": 0, "num_flush_mode_high": 0, "num_flush_mode_low": 0, "num_evict_mode_some": 0, "num_evict_mode_full": 0, "num_objects_pinned": 0, "num_legacy_snapsets": 0, "num_large_omap_objects": 0, "num_objects_manifest": 0, "num_omap_bytes": 0, "num_omap_keys": 0, "num_objects_repaired": 0 }, "up": [ 345, 102, 320 ], "acting": [ 345, 102, 320 ], "avail_no_missing": [], "object_location_counts": [], "blocked_by": [], "up_primary": 345, "acting_primary": 345, "purged_snaps": [] }, "empty": 0, "dne": 0, "incomplete": 0, "last_epoch_started": 597038, "hit_set_history": { "current_last_update": "0'0", "history": [] } }, "peer_info": [ { "peer": "102", "pgid": "7.6c2", "last_update": "588276'8066", "last_complete": "588276'8066", "log_tail": "514733'5727", "last_user_version": 8066, "last_backfill": "MAX", "last_backfill_bitwise": 1, "purged_snaps": [], "history": { "epoch_created": 3327, "epoch_pool_created": 3324, "last_epoch_started": 597038, "last_interval_started": 597037, "last_epoch_clean": 597038, 
"last_interval_clean": 597037, "last_epoch_split": 3359, "last_epoch_marked_full": 0, "same_up_since": 597037, "same_interval_since": 597037, "same_primary_since": 597037, "last_scrub": "588276'8066", "last_scrub_stamp": "2022-08-19 11:06:54.021347", "last_deep_scrub": "588276'8066", "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347", "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" }, "stats": { "version": "588276'8066", "reported_seq": "610788", "reported_epoch": "597037", "state": "active+undersized+degraded", "last_fresh": "2022-08-19 15:17:22.378142", "last_change": "2022-08-19 15:16:54.388784", "last_active": "2022-08-19 15:17:22.378142", "last_peered": "2022-08-19 15:17:22.378142", "last_clean": "2022-08-13 23:15:43.085274", "last_became_active": "2022-08-19 15:16:54.388784", "last_became_peered": "2022-08-19 15:16:54.388784", "last_unstale": "2022-08-19 15:17:22.378142", "last_undegraded": "2022-08-19 15:16:54.385408", "last_fullsized": "2022-08-19 15:16:54.384745", "mapping_epoch": 597037, "log_start": "514733'5727", "ondisk_log_start": "514733'5727", "created": 3327, "last_epoch_clean": 596764, "parent": "0.0", "parent_split_bits": 11, "last_scrub": "588276'8066", "last_scrub_stamp": "2022-08-19 11:06:54.021347", "last_deep_scrub": "588276'8066", "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347", "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347", "log_size": 2339, "ondisk_log_size": 2339, "stats_invalid": false, "dirty_stats_invalid": false, "omap_stats_invalid": false, "hitset_stats_invalid": false, "hitset_bytes_stats_invalid": false, "pin_stats_invalid": false, "manifest_stats_invalid": false, "snaptrimq_len": 0, "stat_sum": { "num_bytes": 0, "num_objects": 934, "num_object_clones": 0, "num_object_copies": 2802, "num_objects_missing_on_primary": 0, "num_objects_missing": 0, "num_objects_degraded": 934, "num_objects_misplaced": 0, "num_objects_unfound": 0, "num_objects_dirty": 934, "num_whiteouts": 0, "num_read": 2634, "num_read_kb": 
7737100, "num_write": 19159, "num_write_kb": 12669502, "num_scrub_errors": 0, "num_shallow_scrub_errors": 0, "num_deep_scrub_errors": 0, "num_objects_recovered": 32343, "num_bytes_recovered": 71530162823, "num_keys_recovered": 0, "num_objects_omap": 0, "num_objects_hit_set_archive": 0, "num_bytes_hit_set_archive": 0, "num_flush": 0, "num_flush_kb": 0, "num_evict": 0, "num_evict_kb": 0, "num_promote": 0, "num_flush_mode_high": 0, "num_flush_mode_low": 0, "num_evict_mode_some": 0, "num_evict_mode_full": 0, "num_objects_pinned": 0, "num_legacy_snapsets": 0, "num_large_omap_objects": 0, "num_objects_manifest": 0, "num_omap_bytes": 0, "num_omap_keys": 0, "num_objects_repaired": 0 }, "up": [ 345, 102, 320 ], "acting": [ 345, 102, 320 ], "avail_no_missing": [ "102", "320" ], "object_location_counts": [ { "shards": "102,320", "objects": 934 } ], "blocked_by": [], "up_primary": 345, "acting_primary": 345, "purged_snaps": [] }, "empty": 0, "dne": 0, "incomplete": 0, "last_epoch_started": 597038, "hit_set_history": { "current_last_update": "0'0", "history": [] } }, { "peer": "320", "pgid": "7.6c2", "last_update": "588276'8066", "last_complete": "588276'8066", "log_tail": "514733'5727", "last_user_version": 0, "last_backfill": "MAX", "last_backfill_bitwise": 1, "purged_snaps": [], "history": { "epoch_created": 3327, "epoch_pool_created": 3324, "last_epoch_started": 597038, "last_interval_started": 597037, "last_epoch_clean": 597038, "last_interval_clean": 597037, "last_epoch_split": 3359, "last_epoch_marked_full": 0, "same_up_since": 597037, "same_interval_since": 597037, "same_primary_since": 597037, "last_scrub": "588276'8066", "last_scrub_stamp": "2022-08-19 11:06:54.021347", "last_deep_scrub": "588276'8066", "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347", "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" }, "stats": { "version": "588276'8066", "reported_seq": "609149", "reported_epoch": "595446", "state": "active+remapped+backfilling", "last_fresh": "2022-08-18 
20:02:44.789999", "last_change": "2022-08-18 20:02:24.078805", "last_active": "2022-08-18 20:02:44.789999", "last_peered": "2022-08-18 20:02:44.789999", "last_clean": "2022-08-18 20:00:44.257344", "last_became_active": "2022-08-18 20:02:24.057374", "last_became_peered": "2022-08-18 20:02:24.057374", "last_unstale": "2022-08-18 20:02:44.789999", "last_undegraded": "2022-08-18 20:02:44.789999", "last_fullsized": "2022-08-18 20:02:44.789999", "mapping_epoch": 597037, "log_start": "514733'5727", "ondisk_log_start": "514733'5727", "created": 3327, "last_epoch_clean": 585471, "parent": "0.0", "parent_split_bits": 11, "last_scrub": "555968'6356", "last_scrub_stamp": "2022-07-13 03:45:10.138635", "last_deep_scrub": "555968'6356", "last_deep_scrub_stamp": "2022-07-13 03:45:10.138635", "last_clean_scrub_stamp": "2022-07-13 03:45:10.138635", "log_size": 2339, "ondisk_log_size": 2339, "stats_invalid": false, "dirty_stats_invalid": false, "omap_stats_invalid": false, "hitset_stats_invalid": false, "hitset_bytes_stats_invalid": false, "pin_stats_invalid": false, "manifest_stats_invalid": false, "snaptrimq_len": 0, "stat_sum": { "num_bytes": 0, "num_objects": 934, "num_object_clones": 0, "num_object_copies": 2802, "num_objects_missing_on_primary": 0, "num_objects_missing": 0, "num_objects_degraded": 0, "num_objects_misplaced": 2, "num_objects_unfound": 0, "num_objects_dirty": 934, "num_whiteouts": 0, "num_read": 2634, "num_read_kb": 7737100, "num_write": 19159, "num_write_kb": 12669502, "num_scrub_errors": 0, "num_shallow_scrub_errors": 0, "num_deep_scrub_errors": 0, "num_objects_recovered": 33277, "num_bytes_recovered": 72380728619, "num_keys_recovered": 0, "num_objects_omap": 0, "num_objects_hit_set_archive": 0, "num_bytes_hit_set_archive": 0, "num_flush": 0, "num_flush_kb": 0, "num_evict": 0, "num_evict_kb": 0, "num_promote": 0, "num_flush_mode_high": 0, "num_flush_mode_low": 0, "num_evict_mode_some": 0, "num_evict_mode_full": 0, "num_objects_pinned": 0, "num_legacy_snapsets": 
0, "num_large_omap_objects": 0, "num_objects_manifest": 0, "num_omap_bytes": 0, "num_omap_keys": 0, "num_objects_repaired": 0 }, "up": [ 345, 102, 320 ], "acting": [ 345, 102, 320 ], "avail_no_missing": [ "345", "102", "304" ], "object_location_counts": [ { "shards": "102,304,345", "objects": 934 } ], "blocked_by": [], "up_primary": 345, "acting_primary": 345, "purged_snaps": [] }, "empty": 0, "dne": 0, "incomplete": 0, "last_epoch_started": 597038, "hit_set_history": { "current_last_update": "0'0", "history": [] } } ], "recovery_state": [ { "name": "Started/Primary/Active", "enter_time": "2022-08-19 15:17:26.452635", "might_have_unfound": [], "recovery_progress": { "backfill_targets": [], "waiting_on_backfill": [], "last_backfill_started": "MIN", "backfill_info": { "begin": "MIN", "end": "MIN", "objects": [] }, "peer_backfill_info": [], "backfills_in_flight": [], "recovering": [], "pg_backend": { "pull_from_peer": [], "pushing": [] } }, "scrub": { "scrubber.epoch_start": "0", "scrubber.active": false, "scrubber.state": "INACTIVE", "scrubber.start": "MIN", "scrubber.end": "MIN", "scrubber.max_end": "MIN", "scrubber.subset_last_update": "0'0", "scrubber.deep": false, "scrubber.waiting_on_whom": [] } }, { "name": "Started", "enter_time": "2022-08-19 15:17:25.493833" } ], "agent_state": {} }
This is an odd phenomenon: pg 7.6c2 is active+clean and is mapped to OSDs [345, 102, 320], but the pg shard status reported for osd.320 is active+remapped+backfilling. num_bytes is 0 on osd.102 and osd.320.