ceph/src/common/options/mon.yaml.in

   1 # -*- mode: YAML -*-
   2 ---
   3
   4 options:
   5 - name: osd_crush_update_weight_set
   6   type: bool
   7   level: advanced
   8   desc: update CRUSH weight-set weights when updating weights
   9   long_desc: If this setting is true, we will update the weight-set weights when adjusting
  10     an item's weight, effectively making changes take effect immediately, and discarding
  11     any previous optimization in the weight-set value.  Setting this value to false
  12     will leave it to the balancer to (slowly, presumably) adjust weights to approach
  13     the new target value.
  14   default: true
  15   with_legacy: true
  16 - name: osd_pool_erasure_code_stripe_unit
  17   type: size
  18   level: advanced
  19   desc: the amount of data (in bytes) in a data chunk, per stripe
  20   fmt_desc: Sets the default size, in bytes, of a chunk of an object
  21     stripe for erasure coded pools. Every object of size S
  22     will be stored as N stripes, with each data chunk
  23     receiving ``stripe unit`` bytes. Each stripe of ``N *
  24     stripe unit`` bytes will be encoded/decoded
  25     individually. This option is overridden by the
  26     ``stripe_unit`` setting in an erasure code profile.
  27   default: 4_K
  28   services:
  29   - mon
  30 - name: mon_max_pool_pg_num
  31   type: uint
  32   level: advanced
  33   default: 64_K
  34   fmt_desc: The maximum number of placement groups per pool.
  35 - name: mon_mgr_digest_period
  36   type: int
  37   level: dev
  38   desc: Period in seconds between monitor-to-manager health/status updates
  39   default: 5
  40   services:
  41   - mon
  42 - name: mon_down_mkfs_grace
  43   type: secs
  44   level: advanced
  45   desc: Period in seconds that the cluster may have a mon down after cluster creation
  46   default: 1_min
  47   services:
  48   - mon
  49 - name: mon_mgr_beacon_grace
  50   type: secs
  51   level: advanced
  52   desc: Period in seconds from last beacon to monitor marking a manager daemon as
  53     failed
  54   default: 30
  55   services:
  56   - mon
  57 - name: mon_mgr_inactive_grace
  58   type: int
  59   level: advanced
  60   desc: Period in seconds after cluster creation during which cluster may have no
  61     active manager
  62   long_desc: This grace period enables the cluster to come up cleanly without raising
  63     spurious health check failures about managers that aren't online yet
  64   default: 1_min
  65   services:
  66   - mon
  67 - name: mon_mgr_mkfs_grace
  68   type: int
  69   level: advanced
  70   desc: Period in seconds that the cluster may have no active manager before this
  71     is reported as an ERR rather than a WARN
  72   default: 2_min
  73   services:
  74   - mon
  75 - name: mon_mgr_proxy_client_bytes_ratio
  76   type: float
  77   level: dev
  78   desc: ratio of mon_client_bytes that can be consumed by proxied mgr commands before
  79     we error out to client
  80   default: 0.3
  81   services:
  82   - mon
  83 - name: mon_cluster_log_to_stderr
  84   type: bool
  85   level: advanced
  86   desc: Make monitor send cluster log messages to stderr (prefixed by channel)
  87   default: false
  88   services:
  89   - mon
  90   see_also:
  91   - log_stderr_prefix
  92   flags:
  93   - runtime
  94   with_legacy: true
  95 - name: mon_cluster_log_to_syslog
  96   type: str
  97   level: advanced
  98   desc: Make monitor send cluster log messages to syslog
  99   fmt_desc: Determines if the cluster log should be output to the syslog.
 100   default: default=false
 101   services:
 102   - mon
 103   flags:
 104   - runtime
 105   with_legacy: true
 106 - name: mon_cluster_log_to_syslog_level
 107   type: str
 108   level: advanced
 109   desc: Syslog level for cluster log messages
 110   default: info
 111   services:
 112   - mon
 113   see_also:
 114   - mon_cluster_log_to_syslog
 115   flags:
 116   - runtime
 117   with_legacy: true
 118 - name: mon_cluster_log_to_syslog_facility
 119   type: str
 120   level: advanced
 121   desc: Syslog facility for cluster log messages
 122   default: daemon
 123   services:
 124   - mon
 125   see_also:
 126   - mon_cluster_log_to_syslog
 127   flags:
 128   - runtime
 129   with_legacy: true
 130 - name: mon_cluster_log_to_file
 131   type: bool
 132   level: advanced
 133   desc: Make monitor send cluster log messages to file
 134   default: true
 135   services:
 136   - mon
 137   see_also:
 138   - mon_cluster_log_file
 139   flags:
 140   - runtime
 141   with_legacy: true
 142 - name: mon_cluster_log_file
 143   type: str
 144   level: advanced
 145   desc: File(s) to write cluster log to
 146   long_desc: This can either be a simple file name to receive all messages, or a list
 147     of key/value pairs where the key is the log channel and the value is the filename,
 148     which may include $cluster and $channel metavariables
 149   fmt_desc: |
 150     The locations of the cluster's log files. There are two channels in
 151     Ceph: ``cluster`` and ``audit``. This option represents a mapping
 152     from channels to log files, where the log entries of that
 153     channel are sent to. The ``default`` entry is a fallback
 154     mapping for channels not explicitly specified. So, the following
 155     default setting will send cluster log to ``$cluster.log``, and
 156     send audit log to ``$cluster.audit.log``, where ``$cluster`` will
 157     be replaced with the actual cluster name.
 158   default: default=/var/log/ceph/$cluster.$channel.log cluster=/var/log/ceph/$cluster.log
 159   services:
 160   - mon
 161   see_also:
 162   - mon_cluster_log_to_file
 163   flags:
 164   - runtime
 165   with_legacy: true
 166 - name: mon_cluster_log_file_level
 167   type: str
 168   level: advanced
 169   desc: Lowest level to include in cluster log file
 170   default: debug
 171   services:
 172   - mon
 173   see_also:
 174   - mon_cluster_log_file
 175   flags:
 176   - runtime
 177   with_legacy: true
 178 - name: mon_cluster_log_to_graylog
 179   type: str
 180   level: advanced
 181   desc: Make monitor send cluster log to graylog
 182   default: 'false'
 183   services:
 184   - mon
 185   flags:
 186   - runtime
 187   with_legacy: true
 188 - name: mon_cluster_log_to_graylog_host
 189   type: str
 190   level: advanced
 191   desc: Graylog host for cluster log messages
 192   default: 127.0.0.1
 193   services:
 194   - mon
 195   see_also:
 196   - mon_cluster_log_to_graylog
 197   flags:
 198   - runtime
 199   with_legacy: true
 200 - name: mon_cluster_log_to_graylog_port
 201   type: str
 202   level: advanced
 203   desc: Graylog port for cluster log messages
 204   default: '12201'
 205   services:
 206   - mon
 207   see_also:
 208   - mon_cluster_log_to_graylog
 209   flags:
 210   - runtime
 211   with_legacy: true
 212 - name: mon_cluster_log_to_journald
 213   type: str
 214   level: advanced
 215   desc: Make monitor send cluster log to journald
 216   default: 'false'
 217   services:
 218   - mon
 219   flags:
 220   - runtime
 221 - name: mon_log_max
 222   type: uint
 223   level: advanced
 224   desc: number of recent cluster log messages to retain
 225   default: 10000
 226   services:
 227   - mon
 228   with_legacy: true
 229 - name: mon_log_max_summary
 230   type: uint
 231   level: advanced
 232   desc: number of recent cluster log messages to dedup against
 233   default: 50
 234   services:
 235   - mon
 236   with_legacy: true
 237 - name: mon_log_full_interval
 238   type: uint
 239   level: advanced
 240   desc: how many epochs before we encode a full copy of recent log keys
 241   default: 50
 242   services: [mon]
 243   with_legacy: true
 244 - name: mon_max_log_entries_per_event
 245   type: int
 246   level: advanced
 247   desc: max cluster log entries per paxos event
 248   fmt_desc: The maximum number of log entries per event.
 249   default: 4096
 250   services:
 251   - mon
 252   with_legacy: true
 253 - name: mon_health_to_clog
 254   type: bool
 255   level: advanced
 256   desc: log monitor health to cluster log
 257   fmt_desc: Enable sending a health summary to the cluster log periodically.
 258   default: true
 259   services:
 260   - mon
 261   with_legacy: true
 262 - name: mon_health_to_clog_interval
 263   type: int
 264   level: advanced
 265   desc: frequency to log monitor health to cluster log
 266   fmt_desc: How often (in seconds) the monitor sends a health summary to the cluster
 267     log (a non-positive number disables). Monitors will always
 268     send a summary to the cluster log whether or not it differs from
 269     the previous summary.
 270   default: 10_min
 271   services:
 272   - mon
 273   see_also:
 274   - mon_health_to_clog
 275   with_legacy: true
 276 - name: mon_health_to_clog_tick_interval
 277   type: float
 278   level: dev
 279   fmt_desc: How often (in seconds) the monitor sends a health summary to the cluster
 280     log (a non-positive number disables). If current health summary
 281     is empty or identical to the last time, monitor will not send it
 282     to cluster log.
 283   default: 1_min
 284   services:
 285   - mon
 286   with_legacy: true
 287 - name: mon_health_detail_to_clog
 288   type: bool
 289   level: dev
 290   desc: log health detail to cluster log
 291   default: true
 292   with_legacy: true
 293 - name: mon_warn_on_filestore_osds
 294   type: bool
 295   level: dev
 296   desc: log health warn for filestore OSDs
 297   default: true
 298   with_legacy: true
 299 - name: mon_health_max_detail
 300   type: uint
 301   level: advanced
 302   desc: max detailed pgs to report in health detail
 303   default: 50
 304   services:
 305   - mon
 306 - name: mon_health_log_update_period
 307   type: int
 308   level: dev
 309   desc: minimum time in seconds between log messages about each health check
 310   default: 5
 311   services:
 312   - mon
 313   min: 0
 314 - name: mon_data_avail_crit
 315   type: int
 316   level: advanced
 317   desc: issue MON_DISK_CRIT health error when mon available space below this percentage
 318   fmt_desc: Raise ``HEALTH_ERR`` status when the filesystem that houses a
 319     monitor's data store reports that its available capacity is
 320     less than or equal to this percentage.
 321   default: 5
 322   services:
 323   - mon
 324   with_legacy: true
 325 - name: mon_data_avail_warn
 326   type: int
 327   level: advanced
 328   desc: issue MON_DISK_LOW health warning when mon available space below this percentage
 329   fmt_desc: Raise ``HEALTH_WARN`` status when the filesystem that houses a
 330     monitor's data store reports that its available capacity is
 331     less than or equal to this percentage.
 332   default: 30
 333   services:
 334   - mon
 335   with_legacy: true
 336 - name: mon_data_size_warn
 337   type: size
 338   level: advanced
 339   desc: issue MON_DISK_BIG health warning when mon database is above this size
 340   fmt_desc: Raise ``HEALTH_WARN`` status when a monitor's data
 341     store grows to be larger than this size, 15GB by default.
 342   default: 15_G
 343   services:
 344   - mon
 345   with_legacy: true
 346 - name: mon_daemon_bytes
 347   type: size
 348   level: advanced
 349   desc: max bytes of outstanding mon messages mon will read off the network
 350   fmt_desc: The message memory cap for metadata server and OSD messages (in bytes).
 351   default: 400_M
 352   services:
 353   - mon
 354   with_legacy: true
 355 - name: mon_election_timeout
 356   type: float
 357   level: advanced
 358   desc: maximum time for a mon election (seconds)
 359   fmt_desc: On election proposer, maximum waiting time for all ACKs in seconds.
 360   default: 5
 361   services:
 362   - mon
 363   with_legacy: true
 364 - name: mon_election_default_strategy
 365   type: uint
 366   level: advanced
 367   desc: The election strategy to set when constructing the first monmap.
 368   default: 1
 369   min: 1
 370   max: 3
 371 - name: mon_lease
 372   type: float
 373   level: advanced
 374   desc: lease interval between quorum monitors (seconds)
 375   long_desc: This setting controls how sensitive your mon quorum is to intermittent
 376     network issues or other failures.
 377   fmt_desc: The length (in seconds) of the lease on the monitor's versions.
 378   default: 5
 379   services:
 380   - mon
 381   with_legacy: true
 382 - name: mon_lease_renew_interval_factor
 383   type: float
 384   level: advanced
 385   desc: multiple of mon_lease for the lease renewal interval
 386   long_desc: Leases must be renewed before they time out.  A smaller value means frequent
 387     renewals, while a value close to 1 makes a lease expiration more likely.
 388   fmt_desc: |
 389     ``mon_lease`` \* ``mon_lease_renew_interval_factor`` will be the
 390     interval for the Leader to renew the other monitors' leases. The
 391     factor should be less than ``1.0``.
 392   default: 0.6
 393   services:
 394   - mon
 395   see_also:
 396   - mon_lease
 397   min: 0
 398   max: 0.9999999
 399   with_legacy: true
 400 - name: mon_lease_ack_timeout_factor
 401   type: float
 402   level: advanced
 403   desc: multiple of mon_lease for the lease ack interval before calling new election
 404   fmt_desc: The Leader will wait ``mon_lease`` \* ``mon_lease_ack_timeout_factor``
 405     for the Providers to acknowledge the lease extension.
 406   default: 2
 407   services:
 408   - mon
 409   see_also:
 410   - mon_lease
 411   min: 1.0001
 412   max: 100
 413   with_legacy: true
 414 - name: mon_accept_timeout_factor
 415   type: float
 416   level: advanced
 417   desc: multiple of mon_lease for follower mons to accept proposed state changes before
 418     calling a new election
 419   fmt_desc: The Leader will wait ``mon_lease`` \* ``mon_accept_timeout_factor``
 420     for the Requester(s) to accept a Paxos update. It is also used
 421     during the Paxos recovery phase for similar purposes.
 422   default: 2
 423   services:
 424   - mon
 425   see_also:
 426   - mon_lease
 427   with_legacy: true
 428 - name: mon_elector_ping_timeout
 429   type: float
 430   level: advanced
 431   desc: The time after which a ping 'times out' and a connection is considered down
 432   default: 2
 433   services:
 434   - mon
 435   see_also:
 436   - mon_elector_ping_divisor
 437 - name: mon_elector_ping_divisor
 438   type: uint
 439   level: advanced
 440   desc: We will send a ping up to this many times per timeout period
 441   default: 2
 442   services:
 443   - mon
 444   see_also:
 445   - mon_elector_ping_timeout
 446 - name: mon_con_tracker_persist_interval
 447   type: uint
 448   level: advanced
 449   desc: how many updates the ConnectionTracker takes before it persists to disk
 450   default: 10
 451   services:
 452   - mon
 453   min: 1
 454   max: 100000
 455 - name: mon_con_tracker_score_halflife
 456   type: uint
 457   level: advanced
 458   desc: The 'halflife' used when updating/calculating peer connection scores
 459   default: 43200
 460   services:
 461   - mon
 462   min: 60
 463 - name: mon_elector_ignore_propose_margin
 464   type: float
 465   level: advanced
 466   desc: The difference in connection score allowed before a peon stops ignoring out-of-quorum
 467     PROPOSEs
 468   default: 0.0005
 469   services:
 470   - mon
 471 - name: mon_warn_on_cache_pools_without_hit_sets
 472   type: bool
 473   level: advanced
 474   desc: issue CACHE_POOL_NO_HIT_SET health warning for cache pools that do not have
 475     hit sets configured
 476   fmt_desc: Raise ``HEALTH_WARN`` when a cache pool does not have the ``hit_set_type``
 477     value configured. See :ref:`hit_set_type <hit_set_type>` for more details.
 478   default: true
 479   services:
 480   - mon
 481   with_legacy: true
 482 - name: mon_warn_on_pool_pg_num_not_power_of_two
 483   type: bool
 484   level: dev
 485   desc: issue POOL_PG_NUM_NOT_POWER_OF_TWO warning if pool has a non-power-of-two
 486     pg_num value
 487   default: true
 488   services:
 489   - mon
 490 - name: mon_allow_pool_size_one
 491   type: bool
 492   level: advanced
 493   desc: allow configuring pool with no replicas
 494   default: false
 495   services:
 496   - mon
 497 - name: mon_warn_on_crush_straw_calc_version_zero
 498   type: bool
 499   level: advanced
 500   desc: issue OLD_CRUSH_STRAW_CALC_VERSION health warning if the CRUSH map's straw_calc_version
 501     is zero
 502   fmt_desc: Raise ``HEALTH_WARN`` when the CRUSH ``straw_calc_version`` is zero. See
 503     :ref:`CRUSH map tunables <crush-map-tunables>` for details.
 504   default: true
 505   services:
 506   - mon
 507   with_legacy: true
 508 - name: mon_warn_on_pool_no_redundancy
 509   type: bool
 510   level: advanced
 511   desc: Issue a health warning if any pool is configured with no replicas
 512   fmt_desc: Raise ``HEALTH_WARN`` if any pool is configured with no replicas.
 513   default: true
 514   services:
 515   - mon
 516   see_also:
 517   - osd_pool_default_size
 518   - osd_pool_default_min_size
 519 - name: mon_warn_on_osd_down_out_interval_zero
 520   type: bool
 521   level: advanced
 522   desc: issue OSD_NO_DOWN_OUT_INTERVAL health warning if mon_osd_down_out_interval
 523     is zero
 524   long_desc: Having mon_osd_down_out_interval set to 0 means that down OSDs are not
 525     marked out automatically and the cluster does not heal itself without administrator
 526     intervention.
 527   fmt_desc: Raise ``HEALTH_WARN`` when ``mon_osd_down_out_interval`` is zero. Having this
 528     option set to zero on the leader acts much like the ``noout`` flag. It's hard to figure
 529     out what's going wrong with clusters without the ``noout`` flag set but acting like that
 530     just the same, so we report a warning in this case.
 531   default: true
 532   services:
 533   - mon
 534   see_also:
 535   - mon_osd_down_out_interval
 536   with_legacy: true
 537 - name: mon_warn_on_legacy_crush_tunables
 538   type: bool
 539   level: advanced
 540   desc: issue OLD_CRUSH_TUNABLES health warning if CRUSH tunables are older than mon_crush_min_required_version
 541   fmt_desc: Raise ``HEALTH_WARN`` when CRUSH tunables are too old (older than ``mon_crush_min_required_version``)
 542   default: true
 543   services:
 544   - mon
 545   see_also:
 546   - mon_crush_min_required_version
 547   with_legacy: true
 548 - name: mon_crush_min_required_version
 549   type: str
 550   level: advanced
 551   desc: minimum ceph release to use for mon_warn_on_legacy_crush_tunables
 552   fmt_desc: The minimum tunable profile required by the cluster. See
 553     :ref:`CRUSH map tunables <crush-map-tunables>` for details.
 554   default: hammer
 555   services:
 556   - mon
 557   see_also:
 558   - mon_warn_on_legacy_crush_tunables
 559   with_legacy: true
 560 - name: mon_warn_on_degraded_stretch_mode
 561   type: bool
 562   level: advanced
 563   desc: Issue a health warning if we are in degraded stretch mode
 564   default: true
 565   services:
 566   - mon
 567 - name: mon_stretch_cluster_recovery_ratio
 568   type: float
 569   level: advanced
 570   desc: the ratio of up OSDs at which a degraded stretch cluster enters recovery
 571   default: 0.6
 572   services:
 573   - mon
 574   min: 0.51
 575   max: 1
 576 - name: mon_stretch_recovery_min_wait
 577   type: float
 578   level: advanced
 579   desc: how long the monitors wait before considering fully-healthy PGs as evidence
 580     the stretch mode is repaired
 581   default: 15
 582   services:
 583   - mon
 584   min: 1
 585 - name: mon_stretch_pool_size
 586   type: uint
 587   level: dev
 588   default: 4
 589   services:
 590   - mon
 591   min: 3
 592   max: 6
 593 - name: mon_stretch_pool_min_size
 594   type: uint
 595   level: dev
 596   default: 2
 597   services:
 598   - mon
 599   min: 2
 600   max: 4
 601 - name: mon_clock_drift_allowed
 602   type: float
 603   level: advanced
 604   desc: allowed clock drift (in seconds) between mons before issuing a health warning
 605   default: 0.05
 606   services:
 607   - mon
 608   with_legacy: true
 609 # exponential backoff for clock drift warnings
 610 - name: mon_clock_drift_warn_backoff
 611   type: float
 612   level: advanced
 613   desc: exponential backoff factor for logging clock drift warnings in the cluster
 614     log
 615   default: 5
 616   services:
 617   - mon
 618   with_legacy: true
 619 # on leader, timecheck (clock drift check) interval (seconds)
 620 - name: mon_timecheck_interval
 621   type: float
 622   level: advanced
 623   desc: frequency of clock synchronization checks between monitors (seconds)
 624   fmt_desc: The time check interval (clock drift check) in seconds
 625     for the Leader.
 626   default: 5_min
 627   services:
 628   - mon
 629   with_legacy: true
 630 # on leader, timecheck (clock drift check) interval when in presence of a skew (seconds)
 631 - name: mon_timecheck_skew_interval
 632   type: float
 633   level: advanced
 634   desc: frequency of clock synchronization (re)checks between monitors while clocks
 635     are believed to be skewed (seconds)
 636   fmt_desc: The time check interval (clock drift check), in seconds, for the
 637     Leader when in the presence of a skew.
 638   default: 30
 639   services:
 640   - mon
 641   see_also:
 642   - mon_timecheck_interval
 643   with_legacy: true
 644 # how often (in commits) to stash a full copy of the PaxosService state
 645 - name: paxos_stash_full_interval
 646   type: int
 647   level: advanced
 648   default: 25
 649   services:
 650   - mon
 651   fmt_desc: How often (in commits) to stash a full copy of the PaxosService state.
 652     Currently this setting only affects ``mds``, ``mon``, ``auth`` and ``mgr``
 653     PaxosServices.
 654   with_legacy: true
 655 # max paxos iterations before we must first sync the monitor stores
 656 - name: paxos_max_join_drift
 657   type: int
 658   level: advanced
 659   default: 10
 660   services:
 661   - mon
 662   fmt_desc: The maximum Paxos iterations before we must first sync the
 663     monitor data stores. When a monitor finds that its peer is too
 664     far ahead of it, it will first sync with data stores before moving
 665     on.
 666   with_legacy: true
 667 # gather updates for this long before proposing a map update
 668 - name: paxos_propose_interval
 669   type: float
 670   level: advanced
 671   default: 1
 672   services:
 673   - mon
 674   fmt_desc: Gather updates for this time interval before proposing
 675     a map update.
 676   with_legacy: true
 677 # min time to gather updates for after period of inactivity
 678 - name: paxos_min_wait
 679   type: float
 680   level: advanced
 681   default: 0.05
 682   services:
 683   - mon
 684   fmt_desc: The minimum amount of time to gather updates after a period of
 685     inactivity.
 686   with_legacy: true
 687 # minimum number of paxos states to keep around
 688 - name: paxos_min
 689   type: int
 690   level: advanced
 691   default: 500
 692   services:
 693   - mon
 694   fmt_desc: The minimum number of Paxos states to keep around
 695   with_legacy: true
 696 # number of extra proposals tolerated before trimming
 697 - name: paxos_trim_min
 698   type: int
 699   level: advanced
 700   default: 250
 701   services:
 702   - mon
 703   fmt_desc: Number of extra proposals tolerated before trimming
 704   with_legacy: true
 705 # maximum amount of versions to trim during a single proposal (0 disables it)
 706 - name: paxos_trim_max
 707   type: int
 708   level: advanced
 709   default: 500
 710   services:
 711   - mon
 712   fmt_desc: The maximum number of extra proposals to trim at a time
 713   with_legacy: true
 714 # minimum amount of versions to trigger a trim (0 disables it)
 715 - name: paxos_service_trim_min
 716   type: uint
 717   level: advanced
 718   default: 250
 719   services:
 720   - mon
 721   fmt_desc: The minimum amount of versions to trigger a trim (0 disables it)
 722   with_legacy: true
 723 # maximum amount of versions to trim during a single proposal (0 disables it)
 724 - name: paxos_service_trim_max
 725   type: uint
 726   level: advanced
 727   default: 500
 728   services:
 729   - mon
 730   fmt_desc: The maximum amount of versions to trim during a single proposal (0 disables it)
 731   with_legacy: true
 732 - name: paxos_service_trim_max_multiplier
 733   type: uint
 734   level: advanced
 735   desc: factor by which paxos_service_trim_max will be multiplied to get a new upper
 736     bound when trim sizes are high  (0 disables it)
 737   default: 20
 738   services:
 739   - mon
 740   min: 0
 741   flags:
 742   - runtime
 743 - name: paxos_kill_at
 744   type: int
 745   level: dev
 746   default: 0
 747   services:
 748   - mon
 749   with_legacy: true
 750 - name: mon_auth_validate_all_caps
 751   type: bool
 752   level: advanced
 753   desc: Whether to parse non-monitor capabilities set by the 'ceph auth ...' commands.
 754     Disabling this saves CPU on the monitor, but allows invalid capabilities to be
 755     set, and only be rejected later, when they are used.
 756   default: true
 757   services:
 758   - mon
 759   flags:
 760   - runtime
 761 # force mon to trim mdsmaps to this point (dangerous)
 762 - name: mon_mds_force_trim_to
 763   type: int
 764   level: dev
 765   desc: force mons to trim mdsmaps/fsmaps up to this epoch
 766   fmt_desc: Force monitor to trim mdsmaps up to but not including this FSMap
 767     epoch. A value of 0 (the default) disables this config. This option is
 768     potentially dangerous; use with care.
 769   default: 0
 770   services:
 771   - mon
 772   with_legacy: true
 773 - name: mds_beacon_mon_down_grace
 774   type: secs
 775   level: advanced
 776   desc: tolerance in seconds for missed MDS beacons to monitors
 777   fmt_desc: The interval without beacons before Ceph declares an MDS laggy
 778     when a monitor is down.
 779   default: 1_min
 780 # skip safety assertions on FSMap (in case of bugs where we want to continue anyway)
 781 - name: mon_mds_skip_sanity
 782   type: bool
 783   level: advanced
 784   desc: skip sanity checks on fsmap/mdsmap
 785   fmt_desc: Skip safety assertions on FSMap (in case of bugs where we want to
 786     continue anyway). Monitor terminates if the FSMap sanity check
 787     fails, but we can disable it by enabling this option.
 788   default: false
 789   services:
 790   - mon
 791   with_legacy: true
 792 - name: mon_mds_blocklist_interval
 793   type: float
 794   level: dev
 795   desc: Duration in seconds that blocklist entries for MDS daemons remain in the OSD
 796     map
 797   fmt_desc: The blocklist duration for failed MDSs in the OSD map. Note,
 798     this controls how long failed MDS daemons will stay in the
 799     OSDMap blocklist. It has no effect on how long something is
 800     blocklisted when the administrator blocklists it manually. For
 801     example, ``ceph osd blocklist add`` will still use the default
 802     blocklist time.
 803   default: 1_day
 804   services:
 805   - mon
 806   min: 1_hr
 807   flags:
 808   - runtime
 809 - name: mon_mgr_blocklist_interval
 810   type: float
 811   level: dev
 812   desc: Duration in seconds that blocklist entries for mgr daemons remain in the OSD
 813     map
 814   default: 1_day
 815   services:
 816   - mon
 817   min: 1_hr
 818   flags:
 819   - runtime
 820 - name: mon_osd_laggy_halflife
 821   type: int
 822   level: advanced
 823   desc: halflife of OSD 'lagginess' factor
 824   fmt_desc: The number of seconds laggy estimates will decay.
 825   default: 1_hr
 826   services:
 827   - mon
 828   with_legacy: true
 829 - name: mon_osd_laggy_weight
 830   type: float
 831   level: advanced
 832   desc: how heavily to weight OSD marking itself back up in overall laggy_probability
 833   long_desc: 1.0 means that an OSD marking itself back up (because it was marked down
 834     but not actually dead) means a 100% laggy_probability; 0.0 effectively disables
 835     tracking of laggy_probability.
 836   fmt_desc: The weight for new samples in laggy estimation decay.
 837   default: 0.3
 838   services:
 839   - mon
 840   min: 0
 841   max: 1
 842   with_legacy: true
 843 - name: mon_osd_laggy_max_interval
 844   type: int
 845   level: advanced
 846   desc: cap value for period for OSD to be marked for laggy_interval calculation
 847   fmt_desc: Maximum value of ``laggy_interval`` in laggy estimations (in seconds).
 848               Monitor uses an adaptive approach to evaluate the ``laggy_interval`` of
 849               a certain OSD. This value will be used to calculate the grace time for
 850               that OSD.
 851   default: 5_min
 852   services:
 853   - mon
 854   with_legacy: true
 855 - name: mon_osd_adjust_heartbeat_grace
 856   type: bool
 857   level: advanced
 858   desc: increase OSD heartbeat grace if peers appear to be laggy
 859   long_desc: If an OSD is marked down but then marks itself back up, it implies it
 860     wasn't actually down but was unable to respond to heartbeats.  If this option
 861     is true, we can use the laggy_probability and laggy_interval values calculated
 862     to model this situation to increase the heartbeat grace period for this OSD so
 863     that it isn't marked down again.  laggy_probability is an estimated probability
 864     that the given OSD is down because it is laggy (not actually down), and laggy_interval
 865     is an estimate of how long it stays down when it is laggy.
 866   fmt_desc: If set to ``true``, Ceph will scale based on laggy estimations.
 867   default: true
 868   services:
 869   - mon
 870   see_also:
 871   - mon_osd_laggy_halflife
 872   - mon_osd_laggy_weight
 873   - mon_osd_laggy_max_interval
 874   with_legacy: true
 875 - name: mon_osd_adjust_down_out_interval
 876   type: bool
 877   level: advanced
 878   desc: increase the mon_osd_down_out_interval if an OSD appears to be laggy
 879   fmt_desc: If set to ``true``, Ceph will scale based on laggy estimations.
 880   default: true
 881   services:
 882   - mon
 883   see_also:
 884   - mon_osd_adjust_heartbeat_grace
 885   with_legacy: true
 886 - name: mon_osd_auto_mark_in
 887   type: bool
 888   level: advanced
 889   desc: mark any OSD that comes up 'in'
 890   fmt_desc: Ceph will mark any booting Ceph OSD Daemons as ``in``
 891               the Ceph Storage Cluster.
 892   default: false
 893   services:
 894   - mon
 895   with_legacy: true
 896 - name: mon_osd_auto_mark_auto_out_in
 897   type: bool
 898   level: advanced
 899   desc: mark any OSD that comes up that was automatically marked 'out' back 'in'
 900   fmt_desc: Ceph will mark booting Ceph OSD Daemons auto marked ``out``
 901               of the Ceph Storage Cluster as ``in`` the cluster.
 902   default: true
 903   services:
 904   - mon
 905   see_also:
 906   - mon_osd_down_out_interval
 907   with_legacy: true
 908 - name: mon_osd_auto_mark_new_in
 909   type: bool
 910   level: advanced
 911   desc: mark any new OSD that comes up 'in'
 912   fmt_desc: Ceph will mark booting new Ceph OSD Daemons as ``in`` the
 913               Ceph Storage Cluster.
 914   default: true
 915   services:
 916   - mon
 917   with_legacy: true
 918 - name: mon_osd_destroyed_out_interval
 919   type: int
 920   level: advanced
 921   desc: mark any OSD 'out' that has been 'destroy'ed for this long (seconds)
 922   default: 10_min
 923   services:
 924   - mon
 925   with_legacy: true
 926 - name: mon_osd_down_out_interval
 927   type: int
 928   level: advanced
 929   desc: mark any OSD 'out' that has been 'down' for this long (seconds)
 930   fmt_desc: The number of seconds Ceph waits before marking a Ceph OSD Daemon
 931               ``down`` and ``out`` if it doesn't respond.
 932   default: 10_min
 933   services:
 934   - mon
 935   with_legacy: true
 936 - name: mon_osd_down_out_subtree_limit
 937   type: str
 938   level: advanced
 939   desc: do not automatically mark OSDs 'out' if an entire subtree of this size is
 940     down
 941   fmt_desc: The smallest :term:`CRUSH` unit type that Ceph will **not**
 942               automatically mark out. For instance, if set to ``host`` and if
 943               all OSDs of a host are down, Ceph will not automatically mark out
 944               these OSDs.
 945   default: rack
 946   services:
 947   - mon
 948   see_also:
 949   - mon_osd_down_out_interval
 950   flags:
 951   - runtime
 952 - name: mon_osd_min_up_ratio
 953   type: float
 954   level: advanced
 955   desc: do not automatically mark OSDs 'out' if fewer than this many OSDs are 'up'
 956   fmt_desc: The minimum ratio of ``up`` Ceph OSD Daemons before Ceph will
 957               mark Ceph OSD Daemons ``down``.
 958   default: 0.3
 959   services:
 960   - mon
 961   see_also:
 962   - mon_osd_down_out_interval
 963   with_legacy: true
 964 - name: mon_osd_min_in_ratio
 965   type: float
 966   level: advanced
 967   desc: do not automatically mark OSDs 'out' if fewer than this many OSDs are 'in'
 968   fmt_desc: The minimum ratio of ``in`` Ceph OSD Daemons before Ceph will
 969               mark Ceph OSD Daemons ``out``.
 970   default: 0.75
 971   services:
 972   - mon
 973   see_also:
 974   - mon_osd_down_out_interval
 975   with_legacy: true
 976 - name: mon_osd_warn_op_age
 977   type: float
 978   level: advanced
 979   desc: issue REQUEST_SLOW health warning if OSD ops are slower than this age (seconds)
 980   default: 32
 981   services:
 982   - mgr
 983   with_legacy: true
 984 - name: mon_osd_warn_num_repaired
 985   type: uint
 986   level: advanced
 987   desc: issue OSD_TOO_MANY_REPAIRS health warning if an OSD has more than this many
 988     read repairs
 989   default: 10
 990   services:
 991   - mon
 992 - name: mon_osd_prime_pg_temp
 993   type: bool
 994   level: dev
 995   desc: minimize peering work by priming pg_temp values after a map change
 996   fmt_desc: Enables or disables priming the PGMap with the previous OSDs when an ``out``
 997     OSD comes back into the cluster. With the ``true`` setting, clients
 998     will continue to use the previous OSDs until the newly ``in`` OSDs for
 999     a PG have peered.
1000   default: true
1001   services:
1002   - mon
1003   with_legacy: true
1004 - name: mon_osd_prime_pg_temp_max_time
1005   type: float
1006   level: dev
1007   desc: maximum time to spend precalculating PG mappings on map change (seconds)
1008   fmt_desc: How much time in seconds the monitor should spend trying to prime the
1009     PGMap when an out OSD comes back into the cluster.
1010   default: 0.5
1011   services:
1012   - mon
1013   with_legacy: true
1014 - name: mon_osd_prime_pg_temp_max_estimate
1015   type: float
1016   level: advanced
1017   desc: calculate all PG mappings if estimated fraction of PGs that change is above
1018     this amount
1019   fmt_desc: Maximum estimate of time spent on each PG before we prime all PGs
1020     in parallel.
1021   default: 0.25
1022   services:
1023   - mon
1024   with_legacy: true
1025 - name: mon_osd_blocklist_default_expire
1026   type: float
1027   level: advanced
1028   desc: Duration in seconds that blocklist entries for clients remain in the OSD map
1029   default: 1_hr
1030   services:
1031   - mon
1032   with_legacy: true
1033 - name: mon_osd_crush_smoke_test
1034   type: bool
1035   level: advanced
1036   desc: perform a smoke test on any new CRUSH map before accepting changes
1037   default: true
1038   services:
1039   - mon
1040   with_legacy: true
1041 - name: mon_smart_report_timeout
1042   type: uint
1043   level: advanced
1044   desc: Timeout (in seconds) for smartctl to run, default is set to 5
1045   default: 5
1046   services:
1047   - mon
1048 - name: mon_warn_on_older_version
1049   type: bool
1050   level: advanced
1051   desc: issue DAEMON_OLD_VERSION health warning if daemons are not all running the
1052     same version
1053   default: true
1054   services:
1055   - mon
1056 - name: mon_warn_older_version_delay
1057   type: secs
1058   level: advanced
1059   desc: issue DAEMON_OLD_VERSION health warning after this amount of time has elapsed
1060   default: 7_day
1061   services:
1062   - mon
1063 - name: mon_data
1064   type: str
1065   level: advanced
1066   desc: path to mon database
1067   fmt_desc: The monitor's data location.
1068   default: /var/lib/ceph/mon/$cluster-$id
1069   services:
1070   - mon
1071   flags:
1072   - no_mon_update
1073   with_legacy: true
1074 - name: mon_rocksdb_options
1075   type: str
1076   level: advanced
1077   default: write_buffer_size=33554432,compression=kNoCompression,level_compaction_dynamic_level_bytes=true
1078   with_legacy: true
1079 - name: mon_enable_op_tracker
1080   type: bool
1081   level: advanced
1082   desc: enable/disable MON op tracking
1083   default: true
1084   services:
1085   - mon
1086 # compact the monitor store database on ceph-mon start
1087 - name: mon_compact_on_start
1088   type: bool
1089   level: advanced
1090   default: false
1091   services:
1092   - mon
1093   fmt_desc: Compact the database used as Ceph Monitor store on
1094     ``ceph-mon`` start. A manual compaction helps to shrink the
1095     monitor database and improve its performance if the regular
1096     compaction fails to work.
1097   with_legacy: true
1098 # trigger compaction of the monitor store database on bootstrap
1099 - name: mon_compact_on_bootstrap
1100   type: bool
1101   level: advanced
1102   default: false
1103   services:
1104   - mon
1105   fmt_desc: Compact the database used as Ceph Monitor store
1106     on bootstrap. Monitors probe each other to establish
1107     a quorum after bootstrap. If a monitor times out before joining the
1108     quorum, it will start over and bootstrap again.
1109   with_legacy: true
1110 # compact (a prefix) when we trim old states
1111 - name: mon_compact_on_trim
1112   type: bool
1113   level: advanced
1114   default: true
1115   services:
1116   - mon
1117   fmt_desc: Compact a certain prefix (including paxos) when we trim its old states.
1118   with_legacy: true
1119 - name: mon_op_complaint_time
1120   type: secs
1121   level: advanced
1122   desc: time after which to consider a monitor operation blocked after no updates
1123   default: 30
1124   services:
1125   - mon
1126 - name: mon_op_log_threshold
1127   type: int
1128   level: advanced
1129   desc: max number of slow ops to display
1130   default: 5
1131   services:
1132   - mon
1133 - name: mon_op_history_size
1134   type: uint
1135   level: advanced
1136   desc: max number of completed ops to track
1137   default: 20
1138   services:
1139   - mon
1140 - name: mon_op_history_duration
1141   type: secs
1142   level: advanced
1143   desc: expiration time in seconds of historical MON OPS
1144   default: 10_min
1145   services:
1146   - mon
1147 - name: mon_op_history_slow_op_size
1148   type: uint
1149   level: advanced
1150   desc: max number of slow historical MON OPS to keep
1151   default: 20
1152   services:
1153   - mon
1154 - name: mon_op_history_slow_op_threshold
1155   type: secs
1156   level: advanced
1157   desc: duration of an op to be considered as a historical slow op
1158   default: 10
1159   services:
1160   - mon
1161 - name: mon_osdmap_full_prune_enabled
1162   type: bool
1163   level: advanced
1164   desc: enables pruning full osdmap versions when we go over a given number of maps
1165   default: true
1166   services:
1167   - mon
1168   see_also:
1169   - mon_osdmap_full_prune_min
1170   - mon_osdmap_full_prune_interval
1171   - mon_osdmap_full_prune_txsize
1172 - name: mon_osdmap_full_prune_min
1173   type: uint
1174   level: advanced
1175   desc: minimum number of versions in the store to trigger full map pruning
1176   default: 10000
1177   services:
1178   - mon
1179   see_also:
1180   - mon_osdmap_full_prune_enabled
1181   - mon_osdmap_full_prune_interval
1182   - mon_osdmap_full_prune_txsize
1183 - name: mon_osdmap_full_prune_interval
1184   type: uint
1185   level: advanced
1186   desc: interval between maps that will not be pruned; maps in the middle will be
1187     pruned.
1188   default: 10
1189   services:
1190   - mon
1191   see_also:
1192   - mon_osdmap_full_prune_enabled
1193   - mon_osdmap_full_prune_min
1194   - mon_osdmap_full_prune_txsize
1195 - name: mon_osdmap_full_prune_txsize
1196   type: uint
1197   level: advanced
1198   desc: number of maps we will prune per iteration
1199   default: 100
1200   services:
1201   - mon
1202   see_also:
1203   - mon_osdmap_full_prune_enabled
1204   - mon_osdmap_full_prune_min
1205   - mon_osdmap_full_prune_interval
1206 - name: mon_osd_cache_size
1207   type: int
1208   level: advanced
1209   desc: maximum number of OSDMaps to cache in memory
1210   fmt_desc: The size of the osdmap cache, so as not to rely on the underlying store's cache
1211   default: 500
1212   services:
1213   - mon
1214   with_legacy: true
1215 - name: mon_osd_cache_size_min
1216   type: size
1217   level: advanced
1218   desc: The minimum amount of bytes to be kept mapped in memory for osd monitor caches.
1219   fmt_desc: The minimum amount of bytes to be kept mapped in memory for osd
1220      monitor caches.
1221   default: 128_M
1222   services:
1223   - mon
1224   with_legacy: true
1225 - name: mon_osd_mapping_pgs_per_chunk
1226   type: int
1227   level: dev
1228   desc: granularity of PG placement calculation background work
1229   fmt_desc: We calculate the mapping from placement group to OSDs in chunks.
1230     This option specifies the number of placement groups per chunk.
1231   default: 4096
1232   services:
1233   - mon
1234   with_legacy: true
1235 - name: mon_clean_pg_upmaps_per_chunk
1236   type: uint
1237   level: dev
1238   desc: granularity of PG upmap validation background work
1239   default: 256
1240   services:
1241   - mon
1242   with_legacy: true
1243 - name: mon_osd_max_creating_pgs
1244   type: int
1245   level: advanced
1246   desc: maximum number of PGs the mon will create at once
1247   default: 1024
1248   services:
1249   - mon
1250   with_legacy: true
1251 - name: mon_osd_max_initial_pgs
1252   type: int
1253   level: advanced
1254   desc: maximum number of PGs a pool will be created with
1255   long_desc: If the user specifies more PGs than this, the cluster will subsequently
1256     split PGs after the pool is created in order to reach the target.
1257   default: 1024
1258   services:
1259   - mon
1260 - name: mon_memory_target
1261   type: size
1262   level: basic
1263   desc: The amount of bytes pertaining to osd monitor caches and kv cache to be kept
1264     mapped in memory with cache auto-tuning enabled
1265   fmt_desc: The amount of bytes pertaining to OSD monitor caches and KV cache
1266     to be kept mapped in memory with cache auto-tuning enabled.
1267   default: 2_G
1268   services:
1269   - mon
1270   flags:
1271   - runtime
1272   with_legacy: true
1273 - name: mon_memory_autotune
1274   type: bool
1275   level: basic
1276   desc: Autotune the cache memory being used for osd monitors and kv database
1277   fmt_desc: Autotune the cache memory used for OSD monitors and KV
1278     database.
1279   default: true
1280   services:
1281   - mon
1282   flags:
1283   - runtime
1284   with_legacy: true
1285 - name: mon_cpu_threads
1286   type: int
1287   level: advanced
1288   desc: worker threads for CPU intensive background work
1289   fmt_desc: Number of threads for performing CPU intensive work on monitor.
1290   default: 4
1291   services:
1292   - mon
1293   with_legacy: true
1294 - name: mon_tick_interval
1295   type: int
1296   level: advanced
1297   desc: interval for internal mon background checks
1298   fmt_desc: A monitor's tick interval in seconds.
1299   default: 5
1300   services:
1301   - mon
1302   with_legacy: true
1303 - name: mon_session_timeout
1304   type: int
1305   level: advanced
1306   desc: close inactive mon client connections after this many seconds
1307   fmt_desc: Monitor will terminate inactive sessions that stay idle over this
1308     time limit.
1309   default: 5_min
1310   services:
1311   - mon
1312   with_legacy: true
1313 - name: mon_subscribe_interval
1314   type: float
1315   level: dev
1316   desc: subscribe interval for pre-jewel clients
1317   fmt_desc: The refresh interval (in seconds) for subscriptions. The
1318     subscription mechanism enables obtaining cluster maps
1319     and log information.
1320   default: 1_day
1321   services:
1322   - mon
1323   with_legacy: true