Not sure if it's related, but this only happens to PG's who's primary OSD
is one where osd_numa_node has been set.

On Wed, May 15, 2019 at 7:13 PM Brett Chancellor <[email protected]>
wrote:

> After upgrading from 14.2.0 to 14.2.1, I've noticed PGs are frequently
> resetting their scrub and deep scrub time stamps to 0.000000.  It's extra
> strange because the peers show timestamps for deep scrubs.
>
> ## First entry from a pg list at 7pm
> $ grep 11.2f2 ~/pgs-active.7pm
> 11.2f2     691        0         0       0 2897477632           0
> 0 2091 active+clean    3h  7378'12291   8048:36261    [1,6,37]p1
> [1,6,37]p1 2019-05-14 21:01:29.172460 2019-05-14 21:01:29.172460
>
> ## Next Entry 3 minutes later
> $ ceph pg ls active |grep 11.2f2
> 11.2f2     695        0         0       0 2914713600           0
> 0 2091 active+clean    6s  7378'12291   8049:36330    [1,6,37]p1
> [1,6,37]p1                   0.000000                   0.000000
>
> ## PG Query
> {
>     "state": "active+clean",
>     "snap_trimq": "[]",
>     "snap_trimq_len": 0,
>     "epoch": 8049,
>     "up": [
>         1,
>         6,
>         37
>     ],
>     "acting": [
>         1,
>         6,
>         37
>     ],
>     "acting_recovery_backfill": [
>         "1",
>         "6",
>         "37"
>     ],
>     "info": {
>         "pgid": "11.2f2",
>         "last_update": "7378'12291",
>         "last_complete": "7378'12291",
>         "log_tail": "1087'10200",
>         "last_user_version": 12291,
>         "last_backfill": "MAX",
>         "last_backfill_bitwise": 1,
>         "purged_snaps": [],
>         "history": {
>             "epoch_created": 1549,
>             "epoch_pool_created": 216,
>             "last_epoch_started": 6148,
>             "last_interval_started": 6147,
>             "last_epoch_clean": 6148,
>             "last_interval_clean": 6147,
>             "last_epoch_split": 6147,
>             "last_epoch_marked_full": 0,
>             "same_up_since": 6126,
>             "same_interval_since": 6147,
>             "same_primary_since": 6126,
>             "last_scrub": "7378'12291",
>             "last_scrub_stamp": "0.000000",
>             "last_deep_scrub": "6103'12186",
>             "last_deep_scrub_stamp": "0.000000",
>             "last_clean_scrub_stamp": "2019-05-15 23:08:17.014575"
>         },
>         "stats": {
>             "version": "7378'12291",
>             "reported_seq": "36700",
>             "reported_epoch": "8049",
>             "state": "active+clean",
>             "last_fresh": "2019-05-15 23:08:17.014609",
>             "last_change": "2019-05-15 23:08:17.014609",
>             "last_active": "2019-05-15 23:08:17.014609",
>             "last_peered": "2019-05-15 23:08:17.014609",
>             "last_clean": "2019-05-15 23:08:17.014609",
>             "last_became_active": "2019-05-15 19:25:01.484322",
>             "last_became_peered": "2019-05-15 19:25:01.484322",
>             "last_unstale": "2019-05-15 23:08:17.014609",
>             "last_undegraded": "2019-05-15 23:08:17.014609",
>             "last_fullsized": "2019-05-15 23:08:17.014609",
>             "mapping_epoch": 6126,
>             "log_start": "1087'10200",
>             "ondisk_log_start": "1087'10200",
>             "created": 1549,
>             "last_epoch_clean": 6148,
>             "parent": "0.0",
>             "parent_split_bits": 10,
>             "last_scrub": "7378'12291",
>             "last_scrub_stamp": "0.000000",
>             "last_deep_scrub": "6103'12186",
>             "last_deep_scrub_stamp": "0.000000",
>             "last_clean_scrub_stamp": "2019-05-15 23:08:17.014575",
>             "log_size": 2091,
>             "ondisk_log_size": 2091,
>             "stats_invalid": false,
>             "dirty_stats_invalid": false,
>             "omap_stats_invalid": false,
>             "hitset_stats_invalid": false,
>             "hitset_bytes_stats_invalid": false,
>             "pin_stats_invalid": false,
>             "manifest_stats_invalid": true,
>             "snaptrimq_len": 0,
>             "stat_sum": {
>                 "num_bytes": 2914713600,
>                 "num_objects": 695,
>                 "num_object_clones": 0,
>                 "num_object_copies": 2085,
>                 "num_objects_missing_on_primary": 0,
>                 "num_objects_missing": 0,
>                 "num_objects_degraded": 0,
>                 "num_objects_misplaced": 0,
>                 "num_objects_unfound": 0,
>                 "num_objects_dirty": 695,
>                 "num_whiteouts": 0,
>                 "num_read": 0,
>                 "num_read_kb": 0,
>                 "num_write": 0,
>                 "num_write_kb": 0,
>                 "num_scrub_errors": 0,
>                 "num_shallow_scrub_errors": 0,
>                 "num_deep_scrub_errors": 0,
>                 "num_objects_recovered": 0,
>                 "num_bytes_recovered": 0,
>                 "num_keys_recovered": 0,
>                 "num_objects_omap": 0,
>                 "num_objects_hit_set_archive": 0,
>                 "num_bytes_hit_set_archive": 0,
>                 "num_flush": 0,
>                 "num_flush_kb": 0,
>                 "num_evict": 0,
>                 "num_evict_kb": 0,
>                 "num_promote": 0,
>                 "num_flush_mode_high": 0,
>                 "num_flush_mode_low": 0,
>                 "num_evict_mode_some": 0,
>                 "num_evict_mode_full": 0,
>                 "num_objects_pinned": 0,
>                 "num_legacy_snapsets": 0,
>                 "num_large_omap_objects": 0,
>                 "num_objects_manifest": 0,
>                 "num_omap_bytes": 0,
>                 "num_omap_keys": 0,
>                 "num_objects_repaired": 0
>             },
>             "up": [
>                 1,
>                 6,
>                 37
>             ],
>             "acting": [
>                 1,
>                 6,
>                 37
>             ],
>             "blocked_by": [],
>             "up_primary": 1,
>             "acting_primary": 1,
>             "purged_snaps": []
>         },
>         "empty": 0,
>         "dne": 0,
>         "incomplete": 0,
>         "last_epoch_started": 6148,
>         "hit_set_history": {
>             "current_last_update": "0'0",
>             "history": []
>         }
>     },
>     "peer_info": [
>         {
>             "peer": "6",
>             "pgid": "11.2f2",
>             "last_update": "7378'12291",
>             "last_complete": "7378'12291",
>             "log_tail": "1087'10200",
>             "last_user_version": 12264,
>             "last_backfill": "MAX",
>             "last_backfill_bitwise": 1,
>             "purged_snaps": [],
>             "history": {
>                 "epoch_created": 1549,
>                 "epoch_pool_created": 216,
>                 "last_epoch_started": 6148,
>                 "last_interval_started": 6147,
>                 "last_epoch_clean": 6148,
>                 "last_interval_clean": 6147,
>                 "last_epoch_split": 6147,
>                 "last_epoch_marked_full": 0,
>                 "same_up_since": 6126,
>                 "same_interval_since": 6147,
>                 "same_primary_since": 6126,
>                 "last_scrub": "7378'12291",
>                 "last_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_deep_scrub": "6103'12186",
>                 "last_deep_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_clean_scrub_stamp": "2019-05-15 23:08:17.014575"
>             },
>             "stats": {
>                 "version": "6103'12264",
>                 "reported_seq": "34823",
>                 "reported_epoch": "6125",
>                 "state": "active+undersized+degraded",
>                 "last_fresh": "2019-05-15 19:16:05.309556",
>                 "last_change": "2019-05-15 19:15:59.342872",
>                 "last_active": "2019-05-15 19:16:05.309556",
>                 "last_peered": "2019-05-15 19:16:05.309556",
>                 "last_clean": "2019-05-15 17:23:41.956141",
>                 "last_became_active": "2019-05-15 19:15:59.342872",
>                 "last_became_peered": "2019-05-15 19:15:59.342872",
>                 "last_unstale": "2019-05-15 19:16:05.309556",
>                 "last_undegraded": "2019-05-15 19:15:59.341684",
>                 "last_fullsized": "2019-05-15 19:15:59.340270",
>                 "mapping_epoch": 6126,
>                 "log_start": "1087'10200",
>                 "ondisk_log_start": "1087'10200",
>                 "created": 1549,
>                 "last_epoch_clean": 6115,
>                 "parent": "0.0",
>                 "parent_split_bits": 10,
>                 "last_scrub": "6103'12186",
>                 "last_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_deep_scrub": "6103'12186",
>                 "last_deep_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_clean_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "log_size": 2064,
>                 "ondisk_log_size": 2064,
>                 "stats_invalid": true,
>                 "dirty_stats_invalid": false,
>                 "omap_stats_invalid": false,
>                 "hitset_stats_invalid": false,
>                 "hitset_bytes_stats_invalid": false,
>                 "pin_stats_invalid": false,
>                 "manifest_stats_invalid": true,
>                 "snaptrimq_len": 0,
>                 "stat_sum": {
>                     "num_bytes": 2784231424,
>                     "num_objects": 664,
>                     "num_object_clones": 0,
>                     "num_object_copies": 1992,
>                     "num_objects_missing_on_primary": 0,
>                     "num_objects_missing": 0,
>                     "num_objects_degraded": 664,
>                     "num_objects_misplaced": 0,
>                     "num_objects_unfound": 0,
>                     "num_objects_dirty": 664,
>                     "num_whiteouts": 0,
>                     "num_read": 93,
>                     "num_read_kb": 350209,
>                     "num_write": 153,
>                     "num_write_kb": 604160,
>                     "num_scrub_errors": 0,
>                     "num_shallow_scrub_errors": 0,
>                     "num_deep_scrub_errors": 0,
>                     "num_objects_recovered": 129,
>                     "num_bytes_recovered": 540901376,
>                     "num_keys_recovered": 0,
>                     "num_objects_omap": 0,
>                     "num_objects_hit_set_archive": 0,
>                     "num_bytes_hit_set_archive": 0,
>                     "num_flush": 0,
>                     "num_flush_kb": 0,
>                     "num_evict": 0,
>                     "num_evict_kb": 0,
>                     "num_promote": 0,
>                     "num_flush_mode_high": 0,
>                     "num_flush_mode_low": 0,
>                     "num_evict_mode_some": 0,
>                     "num_evict_mode_full": 0,
>                     "num_objects_pinned": 0,
>                     "num_legacy_snapsets": 0,
>                     "num_large_omap_objects": 0,
>                     "num_objects_manifest": 0,
>                     "num_omap_bytes": 0,
>                     "num_omap_keys": 0,
>                     "num_objects_repaired": 0
>                 },
>                 "up": [
>                     1,
>                     6,
>                     37
>                 ],
>                 "acting": [
>                     1,
>                     6,
>                     37
>                 ],
>                 "blocked_by": [],
>                 "up_primary": 1,
>                 "acting_primary": 1,
>                 "purged_snaps": []
>             },
>             "empty": 0,
>             "dne": 0,
>             "incomplete": 0,
>             "last_epoch_started": 6148,
>             "hit_set_history": {
>                 "current_last_update": "0'0",
>                 "history": []
>             }
>         },
>         {
>             "peer": "37",
>             "pgid": "11.2f2",
>             "last_update": "7378'12291",
>             "last_complete": "7378'12291",
>             "log_tail": "1087'10200",
>             "last_user_version": 12264,
>             "last_backfill": "MAX",
>             "last_backfill_bitwise": 1,
>             "purged_snaps": [],
>             "history": {
>                 "epoch_created": 1549,
>                 "epoch_pool_created": 216,
>                 "last_epoch_started": 6148,
>                 "last_interval_started": 6147,
>                 "last_epoch_clean": 6148,
>                 "last_interval_clean": 6147,
>                 "last_epoch_split": 6147,
>                 "last_epoch_marked_full": 0,
>                 "same_up_since": 6126,
>                 "same_interval_since": 6147,
>                 "same_primary_since": 6126,
>                 "last_scrub": "7378'12291",
>                 "last_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_deep_scrub": "6103'12186",
>                 "last_deep_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_clean_scrub_stamp": "2019-05-15 23:08:17.014575"
>             },
>             "stats": {
>                 "version": "6103'12263",
>                 "reported_seq": "34275",
>                 "reported_epoch": "6103",
>                 "state": "active+clean",
>                 "last_fresh": "2019-05-15 17:23:41.956141",
>                 "last_change": "2019-05-14 21:01:29.172506",
>                 "last_active": "2019-05-15 17:23:41.956141",
>                 "last_peered": "2019-05-15 17:23:41.956141",
>                 "last_clean": "2019-05-15 17:23:41.956141",
>                 "last_became_active": "2019-05-14 20:16:44.641437",
>                 "last_became_peered": "2019-05-14 20:16:44.641437",
>                 "last_unstale": "2019-05-15 17:23:41.956141",
>                 "last_undegraded": "2019-05-15 17:23:41.956141",
>                 "last_fullsized": "2019-05-15 17:23:41.956141",
>                 "mapping_epoch": 6126,
>                 "log_start": "1087'10200",
>                 "ondisk_log_start": "1087'10200",
>                 "created": 1549,
>                 "last_epoch_clean": 6010,
>                 "parent": "0.0",
>                 "parent_split_bits": 10,
>                 "last_scrub": "6103'12186",
>                 "last_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_deep_scrub": "6103'12186",
>                 "last_deep_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "last_clean_scrub_stamp": "2019-05-14 21:01:29.172460",
>                 "log_size": 2063,
>                 "ondisk_log_size": 2063,
>                 "stats_invalid": true,
>                 "dirty_stats_invalid": false,
>                 "omap_stats_invalid": false,
>                 "hitset_stats_invalid": false,
>                 "hitset_bytes_stats_invalid": false,
>                 "pin_stats_invalid": false,
>                 "manifest_stats_invalid": true,
>                 "snaptrimq_len": 0,
>                 "stat_sum": {
>                     "num_bytes": 2784231424,
>                     "num_objects": 664,
>                     "num_object_clones": 0,
>                     "num_object_copies": 1993,
>                     "num_objects_missing_on_primary": 0,
>                     "num_objects_missing": 0,
>                     "num_objects_degraded": 0,
>                     "num_objects_misplaced": 0,
>                     "num_objects_unfound": 0,
>                     "num_objects_dirty": 664,
>                     "num_whiteouts": 0,
>                     "num_read": 93,
>                     "num_read_kb": 350209,
>                     "num_write": 153,
>                     "num_write_kb": 604160,
>                     "num_scrub_errors": 0,
>                     "num_shallow_scrub_errors": 0,
>                     "num_deep_scrub_errors": 0,
>                     "num_objects_recovered": 0,
>                     "num_bytes_recovered": 0,
>                     "num_keys_recovered": 0,
>                     "num_objects_omap": 0,
>                     "num_objects_hit_set_archive": 0,
>                     "num_bytes_hit_set_archive": 0,
>                     "num_flush": 0,
>                     "num_flush_kb": 0,
>                     "num_evict": 0,
>                     "num_evict_kb": 0,
>                     "num_promote": 0,
>                     "num_flush_mode_high": 0,
>                     "num_flush_mode_low": 0,
>                     "num_evict_mode_some": 0,
>                     "num_evict_mode_full": 0,
>                     "num_objects_pinned": 0,
>                     "num_legacy_snapsets": 0,
>                     "num_large_omap_objects": 0,
>                     "num_objects_manifest": 0,
>                     "num_omap_bytes": 0,
>                     "num_omap_keys": 0,
>                     "num_objects_repaired": 0
>                 },
>                 "up": [
>                     1,
>                     6,
>                     37
>                 ],
>                 "acting": [
>                     1,
>                     6,
>                     37
>                 ],
>                 "blocked_by": [],
>                 "up_primary": 1,
>                 "acting_primary": 1,
>                 "purged_snaps": []
>             },
>             "empty": 0,
>             "dne": 0,
>             "incomplete": 0,
>             "last_epoch_started": 6148,
>             "hit_set_history": {
>                 "current_last_update": "0'0",
>                 "history": []
>             }
>         }
>     ],
>     "recovery_state": [
>         {
>             "name": "Started/Primary/Active",
>             "enter_time": "2019-05-15 19:25:01.479877",
>             "might_have_unfound": [],
>             "recovery_progress": {
>                 "backfill_targets": [],
>                 "waiting_on_backfill": [],
>                 "last_backfill_started": "MIN",
>                 "backfill_info": {
>                     "begin": "MIN",
>                     "end": "MIN",
>                     "objects": []
>                 },
>                 "peer_backfill_info": [],
>                 "backfills_in_flight": [],
>                 "recovering": [],
>                 "pg_backend": {
>                     "pull_from_peer": [],
>                     "pushing": []
>                 }
>             },
>             "scrub": {
>                 "scrubber.epoch_start": "6147",
>                 "scrubber.active": false,
>                 "scrubber.state": "INACTIVE",
>                 "scrubber.start": "MIN",
>                 "scrubber.end": "MIN",
>                 "scrubber.max_end": "MIN",
>                 "scrubber.subset_last_update": "0'0",
>                 "scrubber.deep": false,
>                 "scrubber.waiting_on_whom": []
>             }
>         },
>         {
>             "name": "Started",
>             "enter_time": "2019-05-15 19:25:00.557042"
>         }
>     ],
>     "agent_state": {}
> }
>
_______________________________________________
ceph-users mailing list
[email protected]
http://lists.ceph.com/listinfo.cgi/ceph-users-ceph.com

Reply via email to