Project

General

Profile

Actions

Bug #57190

open

pg shard status inconsistency in one pg

Added by yite gu over 1 year ago.

Status:
New
Priority:
Normal
Assignee:
-
Category:
-
Target version:
-
% Done:

0%

Source:
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
Affected Versions:
ceph-qa-suite:
Component(RADOS):
Pull request ID:
Crash signature (v1):
Crash signature (v2):

Description

ceph pg 7.6c2 query
{
    "state": "active+clean",
    "snap_trimq": "[]",
    "snap_trimq_len": 0,
    "epoch": 597066,
    "up": [
        345,
        102,
        320
    ],
    "acting": [
        345,
        102,
        320
    ],
    "acting_recovery_backfill": [
        "102",
        "320",
        "345" 
    ],
    "info": {
        "pgid": "7.6c2",
        "last_update": "588276'8066",
        "last_complete": "588276'8066",
        "log_tail": "514733'5727",
        "last_user_version": 8066,
        "last_backfill": "MAX",
        "last_backfill_bitwise": 1,
        "purged_snaps": [],
        "history": {
            "epoch_created": 3327,
            "epoch_pool_created": 3324,
            "last_epoch_started": 597038,
            "last_interval_started": 597037,
            "last_epoch_clean": 597038,
            "last_interval_clean": 597037,
            "last_epoch_split": 3359,
            "last_epoch_marked_full": 0,
            "same_up_since": 597037,
            "same_interval_since": 597037,
            "same_primary_since": 597037,
            "last_scrub": "588276'8066",
            "last_scrub_stamp": "2022-08-19 11:06:54.021347",
            "last_deep_scrub": "588276'8066",
            "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347",
            "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" 
        },
        "stats": {
            "version": "588276'8066",
            "reported_seq": "610825",
            "reported_epoch": "597066",
            "state": "active+clean",
            "last_fresh": "2022-08-19 15:21:12.778548",
            "last_change": "2022-08-19 15:17:26.496067",
            "last_active": "2022-08-19 15:21:12.778548",
            "last_peered": "2022-08-19 15:21:12.778548",
            "last_clean": "2022-08-19 15:21:12.778548",
            "last_became_active": "2022-08-19 15:17:26.495960",
            "last_became_peered": "2022-08-19 15:17:26.495960",
            "last_unstale": "2022-08-19 15:21:12.778548",
            "last_undegraded": "2022-08-19 15:21:12.778548",
            "last_fullsized": "2022-08-19 15:21:12.778548",
            "mapping_epoch": 597037,
            "log_start": "514733'5727",
            "ondisk_log_start": "514733'5727",
            "created": 3327,
            "last_epoch_clean": 597038,
            "parent": "0.0",
            "parent_split_bits": 11,
            "last_scrub": "588276'8066",
            "last_scrub_stamp": "2022-08-19 11:06:54.021347",
            "last_deep_scrub": "588276'8066",
            "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347",
            "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347",
            "log_size": 2339,
            "ondisk_log_size": 2339,
            "stats_invalid": false,
            "dirty_stats_invalid": false,
            "omap_stats_invalid": false,
            "hitset_stats_invalid": false,
            "hitset_bytes_stats_invalid": false,
            "pin_stats_invalid": false,
            "manifest_stats_invalid": false,
            "snaptrimq_len": 0,
            "stat_sum": {
                "num_bytes": 0,
                "num_objects": 934,
                "num_object_clones": 0,
                "num_object_copies": 2802,
                "num_objects_missing_on_primary": 0,
                "num_objects_missing": 0,
                "num_objects_degraded": 0,
                "num_objects_misplaced": 0,
                "num_objects_unfound": 0,
                "num_objects_dirty": 934,
                "num_whiteouts": 0,
                "num_read": 2634,
                "num_read_kb": 7737100,
                "num_write": 19159,
                "num_write_kb": 12669502,
                "num_scrub_errors": 0,
                "num_shallow_scrub_errors": 0,
                "num_deep_scrub_errors": 0,
                "num_objects_recovered": 32343,
                "num_bytes_recovered": 71530162823,
                "num_keys_recovered": 0,
                "num_objects_omap": 0,
                "num_objects_hit_set_archive": 0,
                "num_bytes_hit_set_archive": 0,
                "num_flush": 0,
                "num_flush_kb": 0,
                "num_evict": 0,
                "num_evict_kb": 0,
                "num_promote": 0,
                "num_flush_mode_high": 0,
                "num_flush_mode_low": 0,
                "num_evict_mode_some": 0,
                "num_evict_mode_full": 0,
                "num_objects_pinned": 0,
                "num_legacy_snapsets": 0,
                "num_large_omap_objects": 0,
                "num_objects_manifest": 0,
                "num_omap_bytes": 0,
                "num_omap_keys": 0,
                "num_objects_repaired": 0
            },
            "up": [
                345,
                102,
                320
            ],
            "acting": [
                345,
                102,
                320
            ],
            "avail_no_missing": [],
            "object_location_counts": [],
            "blocked_by": [],
            "up_primary": 345,
            "acting_primary": 345,
            "purged_snaps": []
        },
        "empty": 0,
        "dne": 0,
        "incomplete": 0,
        "last_epoch_started": 597038,
        "hit_set_history": {
            "current_last_update": "0'0",
            "history": []
        }
    },
    "peer_info": [
        {
            "peer": "102",
            "pgid": "7.6c2",
            "last_update": "588276'8066",
            "last_complete": "588276'8066",
            "log_tail": "514733'5727",
            "last_user_version": 8066,
            "last_backfill": "MAX",
            "last_backfill_bitwise": 1,
            "purged_snaps": [],
            "history": {
                "epoch_created": 3327,
                "epoch_pool_created": 3324,
                "last_epoch_started": 597038,
                "last_interval_started": 597037,
                "last_epoch_clean": 597038,
                "last_interval_clean": 597037,
                "last_epoch_split": 3359,
                "last_epoch_marked_full": 0,
                "same_up_since": 597037,
                "same_interval_since": 597037,
                "same_primary_since": 597037,
                "last_scrub": "588276'8066",
                "last_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_deep_scrub": "588276'8066",
                "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" 
            },
            "stats": {
                "version": "588276'8066",
                "reported_seq": "610788",
                "reported_epoch": "597037",
                "state": "active+undersized+degraded",
                "last_fresh": "2022-08-19 15:17:22.378142",
                "last_change": "2022-08-19 15:16:54.388784",
                "last_active": "2022-08-19 15:17:22.378142",
                "last_peered": "2022-08-19 15:17:22.378142",
                "last_clean": "2022-08-13 23:15:43.085274",
                "last_became_active": "2022-08-19 15:16:54.388784",
                "last_became_peered": "2022-08-19 15:16:54.388784",
                "last_unstale": "2022-08-19 15:17:22.378142",
                "last_undegraded": "2022-08-19 15:16:54.385408",
                "last_fullsized": "2022-08-19 15:16:54.384745",
                "mapping_epoch": 597037,
                "log_start": "514733'5727",
                "ondisk_log_start": "514733'5727",
                "created": 3327,
                "last_epoch_clean": 596764,
                "parent": "0.0",
                "parent_split_bits": 11,
                "last_scrub": "588276'8066",
                "last_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_deep_scrub": "588276'8066",
                "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347",
                "log_size": 2339,
                "ondisk_log_size": 2339,
                "stats_invalid": false,
                "dirty_stats_invalid": false,
                "omap_stats_invalid": false,
                "hitset_stats_invalid": false,
                "hitset_bytes_stats_invalid": false,
                "pin_stats_invalid": false,
                "manifest_stats_invalid": false,
                "snaptrimq_len": 0,
                "stat_sum": {
                    "num_bytes": 0,
                    "num_objects": 934,
                    "num_object_clones": 0,
                    "num_object_copies": 2802,
                    "num_objects_missing_on_primary": 0,
                    "num_objects_missing": 0,
                    "num_objects_degraded": 934,
                    "num_objects_misplaced": 0,
                    "num_objects_unfound": 0,
                    "num_objects_dirty": 934,
                    "num_whiteouts": 0,
                    "num_read": 2634,
                    "num_read_kb": 7737100,
                    "num_write": 19159,
                    "num_write_kb": 12669502,
                    "num_scrub_errors": 0,
                    "num_shallow_scrub_errors": 0,
                    "num_deep_scrub_errors": 0,
                    "num_objects_recovered": 32343,
                    "num_bytes_recovered": 71530162823,
                    "num_keys_recovered": 0,
                    "num_objects_omap": 0,
                    "num_objects_hit_set_archive": 0,
                    "num_bytes_hit_set_archive": 0,
                    "num_flush": 0,
                    "num_flush_kb": 0,
                    "num_evict": 0,
                    "num_evict_kb": 0,
                    "num_promote": 0,
                    "num_flush_mode_high": 0,
                    "num_flush_mode_low": 0,
                    "num_evict_mode_some": 0,
                    "num_evict_mode_full": 0,
                    "num_objects_pinned": 0,
                    "num_legacy_snapsets": 0,
                    "num_large_omap_objects": 0,
                    "num_objects_manifest": 0,
                    "num_omap_bytes": 0,
                    "num_omap_keys": 0,
                    "num_objects_repaired": 0
                },
                "up": [
                    345,
                    102,
                    320
                ],
                "acting": [
                    345,
                    102,
                    320
                ],
                "avail_no_missing": [
                    "102",
                    "320" 
                ],
                "object_location_counts": [
                    {
                        "shards": "102,320",
                        "objects": 934
                    }
                ],
                "blocked_by": [],
                "up_primary": 345,
                "acting_primary": 345,
                "purged_snaps": []
            },
            "empty": 0,
            "dne": 0,
            "incomplete": 0,
            "last_epoch_started": 597038,
            "hit_set_history": {
                "current_last_update": "0'0",
                "history": []
            }
        },
        {
            "peer": "320",
            "pgid": "7.6c2",
            "last_update": "588276'8066",
            "last_complete": "588276'8066",
            "log_tail": "514733'5727",
            "last_user_version": 0,
            "last_backfill": "MAX",
            "last_backfill_bitwise": 1,
            "purged_snaps": [],
            "history": {
                "epoch_created": 3327,
                "epoch_pool_created": 3324,
                "last_epoch_started": 597038,
                "last_interval_started": 597037,
                "last_epoch_clean": 597038,
                "last_interval_clean": 597037,
                "last_epoch_split": 3359,
                "last_epoch_marked_full": 0,
                "same_up_since": 597037,
                "same_interval_since": 597037,
                "same_primary_since": 597037,
                "last_scrub": "588276'8066",
                "last_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_deep_scrub": "588276'8066",
                "last_deep_scrub_stamp": "2022-08-19 11:06:54.021347",
                "last_clean_scrub_stamp": "2022-08-19 11:06:54.021347" 
            },
            "stats": {
                "version": "588276'8066",
                "reported_seq": "609149",
                "reported_epoch": "595446",
                "state": "active+remapped+backfilling",
                "last_fresh": "2022-08-18 20:02:44.789999",
                "last_change": "2022-08-18 20:02:24.078805",
                "last_active": "2022-08-18 20:02:44.789999",
                "last_peered": "2022-08-18 20:02:44.789999",
                "last_clean": "2022-08-18 20:00:44.257344",
                "last_became_active": "2022-08-18 20:02:24.057374",
                "last_became_peered": "2022-08-18 20:02:24.057374",
                "last_unstale": "2022-08-18 20:02:44.789999",
                "last_undegraded": "2022-08-18 20:02:44.789999",
                "last_fullsized": "2022-08-18 20:02:44.789999",
                "mapping_epoch": 597037,
                "log_start": "514733'5727",
                "ondisk_log_start": "514733'5727",
                "created": 3327,
                "last_epoch_clean": 585471,
                "parent": "0.0",
                "parent_split_bits": 11,
                "last_scrub": "555968'6356",
                "last_scrub_stamp": "2022-07-13 03:45:10.138635",
                "last_deep_scrub": "555968'6356",
                "last_deep_scrub_stamp": "2022-07-13 03:45:10.138635",
                "last_clean_scrub_stamp": "2022-07-13 03:45:10.138635",
                "log_size": 2339,
                "ondisk_log_size": 2339,
                "stats_invalid": false,
                "dirty_stats_invalid": false,
                "omap_stats_invalid": false,
                "hitset_stats_invalid": false,
                "hitset_bytes_stats_invalid": false,
                "pin_stats_invalid": false,
                "manifest_stats_invalid": false,
                "snaptrimq_len": 0,
                "stat_sum": {
                    "num_bytes": 0,
                    "num_objects": 934,
                    "num_object_clones": 0,
                    "num_object_copies": 2802,
                    "num_objects_missing_on_primary": 0,
                    "num_objects_missing": 0,
                    "num_objects_degraded": 0,
                    "num_objects_misplaced": 2,
                    "num_objects_unfound": 0,
                    "num_objects_dirty": 934,
                    "num_whiteouts": 0,
                    "num_read": 2634,
                    "num_read_kb": 7737100,
                    "num_write": 19159,
                    "num_write_kb": 12669502,
                    "num_scrub_errors": 0,
                    "num_shallow_scrub_errors": 0,
                    "num_deep_scrub_errors": 0,
                    "num_objects_recovered": 33277,
                    "num_bytes_recovered": 72380728619,
                    "num_keys_recovered": 0,
                    "num_objects_omap": 0,
                    "num_objects_hit_set_archive": 0,
                    "num_bytes_hit_set_archive": 0,
                    "num_flush": 0,
                    "num_flush_kb": 0,
                    "num_evict": 0,
                    "num_evict_kb": 0,
                    "num_promote": 0,
                    "num_flush_mode_high": 0,
                    "num_flush_mode_low": 0,
                    "num_evict_mode_some": 0,
                    "num_evict_mode_full": 0,
                    "num_objects_pinned": 0,
                    "num_legacy_snapsets": 0,
                    "num_large_omap_objects": 0,
                    "num_objects_manifest": 0,
                    "num_omap_bytes": 0,
                    "num_omap_keys": 0,
                    "num_objects_repaired": 0
                },
                "up": [
                    345,
                    102,
                    320
                ],
                "acting": [
                    345,
                    102,
                    320
                ],
                "avail_no_missing": [
                    "345",
                    "102",
                    "304" 
                ],
                "object_location_counts": [
                    {
                        "shards": "102,304,345",
                        "objects": 934
                    }
                ],
                "blocked_by": [],
                "up_primary": 345,
                "acting_primary": 345,
                "purged_snaps": []
            },
            "empty": 0,
            "dne": 0,
            "incomplete": 0,
            "last_epoch_started": 597038,
            "hit_set_history": {
                "current_last_update": "0'0",
                "history": []
            }
        }
    ],
    "recovery_state": [
        {
            "name": "Started/Primary/Active",
            "enter_time": "2022-08-19 15:17:26.452635",
            "might_have_unfound": [],
            "recovery_progress": {
                "backfill_targets": [],
                "waiting_on_backfill": [],
                "last_backfill_started": "MIN",
                "backfill_info": {
                    "begin": "MIN",
                    "end": "MIN",
                    "objects": []
                },
                "peer_backfill_info": [],
                "backfills_in_flight": [],
                "recovering": [],
                "pg_backend": {
                    "pull_from_peer": [],
                    "pushing": []
                }
            },
            "scrub": {
                "scrubber.epoch_start": "0",
                "scrubber.active": false,
                "scrubber.state": "INACTIVE",
                "scrubber.start": "MIN",
                "scrubber.end": "MIN",
                "scrubber.max_end": "MIN",
                "scrubber.subset_last_update": "0'0",
                "scrubber.deep": false,
                "scrubber.waiting_on_whom": []
            }
        },
        {
            "name": "Started",
            "enter_time": "2022-08-19 15:17:25.493833" 
        }
    ],
    "agent_state": {}
}


This is an odd phenomenon: pg 7.6c2 is active+clean and is distributed across OSDs [345, 102, 320], but the pg shard status reported for osd.320 is active+remapped+backfilling. num_bytes is 0 on osd.102 and osd.320.

No data to display

Actions

Also available in: Atom PDF