]> git.proxmox.com Git - ceph.git/blame - ceph/src/common/options/mds.yaml.in
bump version to 17.2.0
[ceph.git] / ceph / src / common / options / mds.yaml.in
CommitLineData
20effc67
TL
1# -*- mode: YAML -*-
2---
3
4options:
5- name: mds_alternate_name_max
6 type: size
7 level: advanced
8 desc: set the maximum length of alternate names for dentries
9 default: 8_K
10 services:
11 - mds
12 flags:
13 - runtime
14- name: mds_valgrind_exit
15 type: bool
16 level: dev
17 default: false
18 services:
19 - mds
20 flags:
21 - runtime
22- name: mds_standby_replay_damaged
23 type: bool
24 level: dev
25 default: false
26 flags:
27 - runtime
28- name: mds_numa_node
29 type: int
30 level: advanced
31 desc: set mds's cpu affinity to a numa node (-1 for none)
32 default: -1
33 services:
34 - mds
35 flags:
36 - startup
37- name: mds_data
38 type: str
39 level: advanced
40 desc: path to MDS data and keyring
41 default: /var/lib/ceph/mds/$cluster-$id
42 services:
43 - mds
44 flags:
45 - no_mon_update
46 with_legacy: true
47- name: mds_join_fs
48 type: str
49 level: basic
50 desc: file system MDS prefers to join
51 long_desc: This setting indicates which file system name the MDS should prefer to
52 join (affinity). The monitors will try to have the MDS cluster safely reach a
53 state where all MDS have strong affinity, even via failovers to a standby.
54 services:
55 - mds
56 flags:
57 - runtime
58# max xattr kv pairs size for each dir/file
59- name: mds_max_xattr_pairs_size
60 type: size
61 level: advanced
62 desc: maximum aggregate size of extended attributes on a file
63 default: 64_K
64 services:
65 - mds
66 with_legacy: true
67- name: mds_cache_trim_interval
68 type: secs
69 level: advanced
70 desc: interval in seconds between cache trimming
71 default: 1
72 services:
73 - mds
74 flags:
75 - runtime
76- name: mds_cache_release_free_interval
77 type: secs
78 level: dev
79 desc: interval in seconds between heap releases
80 default: 10
81 services:
82 - mds
83 flags:
84 - runtime
85- name: mds_cache_memory_limit
86 type: size
87 level: basic
88 desc: target maximum memory usage of MDS cache
89 long_desc: This sets a target maximum memory usage of the MDS cache and is the primary
90 tunable to limit the MDS memory usage. The MDS will try to stay under a reservation
91 of this limit (by default 95%; 1 - mds_cache_reservation) by trimming unused metadata
92 in its cache and recalling cached items in the client caches. It is possible for
93 the MDS to exceed this limit due to slow recall from clients. The mds_health_cache_threshold
94 (150%) sets a cache full threshold for when the MDS signals a cluster health warning.
95 default: 4_G
96 services:
97 - mds
98 flags:
99 - runtime
100- name: mds_cache_reservation
101 type: float
102 level: advanced
103 desc: amount of memory to reserve for future cached objects
104 fmt_desc: The cache reservation (memory or inodes) for the MDS cache to maintain.
105 Once the MDS begins dipping into its reservation, it will recall
106 client state until its cache size shrinks to restore the
107 reservation.
108 default: 0.05
109 services:
110 - mds
111 flags:
112 - runtime
113- name: mds_health_cache_threshold
114 type: float
115 level: advanced
116 desc: threshold for cache size to generate health warning
117 default: 1.5
118 services:
119 - mds
120- name: mds_cache_mid
121 type: float
122 level: advanced
123 desc: midpoint for MDS cache LRU
124 fmt_desc: The insertion point for new items in the cache LRU
125 (from the top).
126 default: 0.7
127 services:
128 - mds
129- name: mds_cache_trim_decay_rate
130 type: float
131 level: advanced
132 desc: decay rate for trimming MDS cache throttle
133 default: 1
134 services:
135 - mds
136 flags:
137 - runtime
138- name: mds_cache_trim_threshold
139 type: size
140 level: advanced
141 desc: threshold for number of dentries that can be trimmed
142 default: 256_K
143 services:
144 - mds
145 flags:
146 - runtime
147- name: mds_max_file_recover
148 type: uint
149 level: advanced
150 desc: maximum number of files to recover file sizes in parallel
151 default: 32
152 services:
153 - mds
154 with_legacy: true
155- name: mds_dir_max_commit_size
156 type: int
157 level: advanced
158 desc: maximum size in megabytes for a RADOS write to a directory
159 fmt_desc: The maximum size of a directory update before Ceph breaks it into
160 smaller transactions (MB).
161 default: 10
162 services:
163 - mds
164 with_legacy: true
165- name: mds_dir_keys_per_op
166 type: int
167 level: advanced
168 desc: number of directory entries to read in one RADOS operation
169 default: 16384
170 services:
171 - mds
172 with_legacy: true
173- name: mds_decay_halflife
174 type: float
175 level: advanced
176 desc: rate of decay for temperature counters on each directory for balancing
177 default: 5
178 services:
179 - mds
180 with_legacy: true
181- name: mds_beacon_interval
182 type: float
183 level: advanced
184 desc: interval in seconds between MDS beacon messages sent to monitors
185 default: 4
186 services:
187 - mds
188 with_legacy: true
189- name: mds_beacon_grace
190 type: float
191 level: advanced
192 desc: tolerance in seconds for missed MDS beacons to monitors
193 fmt_desc: The interval without beacons before Ceph declares an MDS laggy
194 (and possibly replaces it).
195 default: 15
196 services:
197 - mds
198 with_legacy: true
199- name: mds_heartbeat_grace
200 type: float
201 level: advanced
202 desc: tolerance in seconds for MDS internal heartbeat
203 default: 15
204 services:
205 - mds
206- name: mds_enforce_unique_name
207 type: bool
208 level: advanced
209 desc: require MDS name is unique in the cluster
210 default: true
211 services:
212 - mds
213 with_legacy: true
214# whether to blocklist clients whose sessions are dropped due to timeout
215- name: mds_session_blocklist_on_timeout
216 type: bool
217 level: advanced
218 desc: blocklist clients whose sessions have become stale
219 default: true
220 services:
221 - mds
222 with_legacy: true
223# whether to blocklist clients whose sessions are dropped via admin commands
224- name: mds_session_blocklist_on_evict
225 type: bool
226 level: advanced
227 desc: blocklist clients that have been evicted
228 default: true
229 services:
230 - mds
231 with_legacy: true
232# how many sessions should I try to load/store in a single OMAP operation?
233- name: mds_sessionmap_keys_per_op
234 type: uint
235 level: advanced
236 desc: number of omap keys to read from the SessionMap in one operation
237 default: 1_K
238 services:
239 - mds
240 with_legacy: true
241- name: mds_recall_max_caps
242 type: size
243 level: advanced
244 desc: maximum number of caps to recall from client session in single recall
245 default: 30000
246 services:
247 - mds
248 flags:
249 - runtime
250- name: mds_recall_max_decay_rate
251 type: float
252 level: advanced
253 desc: decay rate for throttle on recalled caps on a session
254 default: 1.5
255 services:
256 - mds
257 flags:
258 - runtime
259- name: mds_recall_max_decay_threshold
260 type: size
261 level: advanced
262 desc: decay threshold for throttle on recalled caps on a session
263 default: 128_K
264 services:
265 - mds
266 flags:
267 - runtime
268- name: mds_recall_global_max_decay_threshold
269 type: size
270 level: advanced
271 desc: decay threshold for throttle on recalled caps globally
272 default: 128_K
273 services:
274 - mds
275 flags:
276 - runtime
277- name: mds_recall_warning_threshold
278 type: size
279 level: advanced
280 desc: decay threshold for warning on slow session cap recall
281 default: 256_K
282 services:
283 - mds
284 flags:
285 - runtime
286- name: mds_recall_warning_decay_rate
287 type: float
288 level: advanced
289 desc: decay rate for warning on slow session cap recall
290 default: 60
291 services:
292 - mds
293 flags:
294 - runtime
295- name: mds_session_cache_liveness_decay_rate
296 type: float
297 level: advanced
298 desc: decay rate for session liveness leading to preemptive cap recall
299 long_desc: This determines how long a session needs to be quiescent before the MDS
300 begins preemptively recalling capabilities. The default of 5 minutes will cause
301 10 halvings of the decay counter after 1 hour, or 1/1024. The default magnitude
302 of 10 (2^10 or 1024) is chosen so that the MDS considers a previously chatty session
303 (approximately) to be quiescent after 1 hour.
304 default: 5_min
305 services:
306 - mds
307 see_also:
308 - mds_session_cache_liveness_magnitude
309 flags:
310 - runtime
311- name: mds_session_cache_liveness_magnitude
312 type: size
313 level: advanced
314 desc: decay magnitude for preemptively recalling caps on quiet client
315 long_desc: This is the order of magnitude difference (in base 2) of the internal
316 liveness decay counter and the number of capabilities the session holds. When
317 this difference occurs, the MDS treats the session as quiescent and begins recalling
318 capabilities.
319 default: 10
320 services:
321 - mds
322 see_also:
323 - mds_session_cache_liveness_decay_rate
324 flags:
325 - runtime
326- name: mds_session_cap_acquisition_decay_rate
327 type: float
328 level: advanced
329 desc: decay rate for session readdir caps leading to readdir throttle
330 long_desc: The half-life for the session cap acquisition counter of caps acquired
331 by readdir. This is used for throttling readdir requests from clients slow to
332 release caps.
333 default: 10
334 services:
335 - mds
336 flags:
337 - runtime
338- name: mds_session_cap_acquisition_throttle
339 type: uint
340 level: advanced
341 desc: throttle point for cap acquisition decay counter
342 default: 500000
343 services:
344 - mds
345- name: mds_session_max_caps_throttle_ratio
346 type: float
347 level: advanced
348 desc: ratio of mds_max_caps_per_client that client must exceed before readdir may
349 be throttled by cap acquisition throttle
350 default: 1.1
351 services:
352 - mds
353- name: mds_cap_acquisition_throttle_retry_request_timeout
354 type: float
355 level: advanced
356 desc: timeout in seconds after which a client request is retried due to cap acquisition
357 throttling
358 default: 0.5
359 services:
360 - mds
361# detecting freeze tree deadlock
362- name: mds_freeze_tree_timeout
363 type: float
364 level: dev
365 default: 30
366 services:
367 - mds
368 with_legacy: true
369# collapse N-client health metrics to a single 'many'
370- name: mds_health_summarize_threshold
371 type: int
372 level: advanced
373 desc: threshold of number of clients to summarize late client recall
374 default: 10
375 services:
376 - mds
377 with_legacy: true
378# seconds to wait for clients during mds restart
379# make it (mdsmap.session_timeout - mds_beacon_grace)
380- name: mds_reconnect_timeout
381 type: float
382 level: advanced
383 desc: timeout in seconds to wait for clients to reconnect during MDS reconnect recovery
384 state
385 default: 45
386 services:
387 - mds
388 with_legacy: true
389- name: mds_deny_all_reconnect
390 type: bool
391 level: advanced
392 desc: flag to deny all client reconnects during failover
393 default: false
394 services:
395 - mds
396 flags:
397 - runtime
398- name: mds_tick_interval
399 type: float
400 level: advanced
401 desc: time in seconds between upkeep tasks
402 fmt_desc: How frequently the MDS performs internal periodic tasks.
403 default: 5
404 services:
405 - mds
406 with_legacy: true
407# try to avoid propagating more often than this
408- name: mds_dirstat_min_interval
409 type: float
410 level: dev
411 default: 1
412 services:
413 - mds
414 fmt_desc: The minimum interval (in seconds) to try to avoid propagating
415 recursive stats up the tree.
416 with_legacy: true
417# how quickly dirstat changes propagate up the hierarchy
418- name: mds_scatter_nudge_interval
419 type: float
420 level: advanced
421 desc: minimum interval between scatter lock updates
422 fmt_desc: How quickly dirstat changes propagate up.
423 default: 5
424 services:
425 - mds
426 with_legacy: true
427- name: mds_client_prealloc_inos
428 type: int
429 level: advanced
430 desc: number of unused inodes to pre-allocate to clients for file creation
431 fmt_desc: The number of inode numbers to preallocate per client session.
432 default: 1000
433 services:
434 - mds
435 with_legacy: true
436- name: mds_client_delegate_inos_pct
437 type: uint
438 level: advanced
439 desc: percentage of preallocated inos to delegate to client
440 default: 50
441 services:
442 - mds
443 flags:
444 - runtime
445- name: mds_early_reply
446 type: bool
447 level: advanced
448 desc: additional reply to clients that metadata requests are complete but not yet
449 durable
450 fmt_desc: Determines whether the MDS should allow clients to see request
451 results before they commit to the journal.
452 default: true
453 services:
454 - mds
455 with_legacy: true
456- name: mds_replay_unsafe_with_closed_session
457 type: bool
458 level: advanced
459 desc: complete all replay requests when the MDS is restarted, regardless of whether
460 the session is closed
461 default: false
462 services:
463 - mds
464 flags:
465 - startup
466- name: mds_default_dir_hash
467 type: int
468 level: advanced
469 desc: hash function to select directory fragment for dentry name
470 fmt_desc: The function to use for hashing files across directory fragments.
471 # CEPH_STR_HASH_RJENKINS
472 default: 2
473 services:
474 - mds
475 with_legacy: true
476- name: mds_log_pause
477 type: bool
478 level: dev
479 default: false
480 services:
481 - mds
482 with_legacy: true
483- name: mds_log_skip_corrupt_events
484 type: bool
485 level: dev
486 default: false
487 services:
488 - mds
489 fmt_desc: Determines whether the MDS should try to skip corrupt journal
490 events during journal replay.
491 with_legacy: true
492- name: mds_log_max_events
493 type: int
494 level: advanced
495 desc: maximum number of events in the MDS journal (-1 is unlimited)
496 fmt_desc: The maximum events in the journal before we initiate trimming.
497 Set to ``-1`` to disable limits.
498 default: -1
499 services:
500 - mds
501 with_legacy: true
502- name: mds_log_events_per_segment
503 type: int
504 level: advanced
505 desc: maximum number of events in an MDS journal segment
506 default: 1024
507 services:
508 - mds
509 with_legacy: true
510# segment size for mds log, default to default file_layout_t
511- name: mds_log_segment_size
512 type: size
513 level: advanced
514 desc: size in bytes of each MDS log segment
515 default: 0
516 services:
517 - mds
518 with_legacy: true
519- name: mds_log_max_segments
520 type: uint
521 level: advanced
522 desc: maximum number of segments which may be untrimmed
523 fmt_desc: The maximum number of segments (objects) in the journal before
524 we initiate trimming. Set to ``-1`` to disable limits.
525 default: 128
526 services:
527 - mds
528 with_legacy: true
529- name: mds_log_warn_factor
530 type: float
531 level: advanced
532 desc: trigger MDS_HEALTH_TRIM warning when the mds log is longer than mds_log_max_segments
533 * mds_log_warn_factor
534 default: 2
535 services:
536 - mds
537 min: 1
538 flags:
539 - runtime
540- name: mds_bal_export_pin
541 type: bool
542 level: advanced
543 desc: allow setting directory export pins to particular ranks
544 default: true
545 services:
546 - mds
547 with_legacy: true
548- name: mds_export_ephemeral_random
549 type: bool
550 level: advanced
551 desc: allow ephemeral random pinning of the loaded subtrees
552 long_desc: probabilistically pin the loaded directory inode and the subtree beneath
553 it to an MDS based on the consistent hash of the inode number. The higher this
554 value the more likely the loaded subtrees get pinned
555 default: true
556 services:
557 - mds
558 flags:
559 - runtime
560- name: mds_export_ephemeral_random_max
561 type: float
562 level: advanced
563 desc: the maximum percent permitted for random ephemeral pin policy
564 default: 0.01
565 services:
566 - mds
567 see_also:
568 - mds_export_ephemeral_random
569 min: 0
570 max: 1
571 flags:
572 - runtime
573- name: mds_export_ephemeral_distributed
574 type: bool
575 level: advanced
576 desc: allow ephemeral distributed pinning of the loaded subtrees
577 long_desc: 'pin the immediate child directories of the loaded directory inode based
578 on the consistent hash of the child''s inode number. '
579 default: true
580 services:
581 - mds
582 flags:
583 - runtime
584- name: mds_export_ephemeral_distributed_factor
585 type: float
586 level: advanced
587 desc: multiple of max_mds for splitting and distributing directory
588 default: 2
589 services:
590 - mds
591 min: 1
592 max: 100
593 flags:
594 - runtime
595- name: mds_bal_sample_interval
596 type: float
597 level: advanced
598 desc: interval in seconds between balancer ticks
599 fmt_desc: Determines how frequently to sample directory temperature
600 (for fragmentation decisions).
601 default: 3
602 services:
603 - mds
604 with_legacy: true
605- name: mds_bal_replicate_threshold
606 type: float
607 level: advanced
608 desc: hot popularity threshold to replicate a subtree
609 fmt_desc: The maximum temperature before Ceph attempts to replicate
610 metadata to other nodes.
611 default: 8000
612 services:
613 - mds
614 with_legacy: true
615- name: mds_bal_unreplicate_threshold
616 type: float
617 level: advanced
618 desc: cold popularity threshold to merge subtrees
619 fmt_desc: The minimum temperature before Ceph stops replicating
620 metadata to other nodes.
621 default: 0
622 services:
623 - mds
624 with_legacy: true
625- name: mds_bal_split_size
626 type: int
627 level: advanced
628 desc: minimum size of directory fragment before splitting
629 fmt_desc: The maximum directory size before the MDS will split a directory
630 fragment into smaller bits.
631 default: 10000
632 services:
633 - mds
634 with_legacy: true
635- name: mds_bal_split_rd
636 type: float
637 level: advanced
638 desc: hot read popularity threshold for splitting a directory fragment
639 fmt_desc: The maximum directory read temperature before Ceph splits
640 a directory fragment.
641 default: 25000
642 services:
643 - mds
644 with_legacy: true
645- name: mds_bal_split_wr
646 type: float
647 level: advanced
648 desc: hot write popularity threshold for splitting a directory fragment
649 fmt_desc: The maximum directory write temperature before Ceph splits
650 a directory fragment.
651 default: 10000
652 services:
653 - mds
654 with_legacy: true
655- name: mds_bal_split_bits
656 type: int
657 level: advanced
658 desc: power of two child fragments for a fragment on split
659 fmt_desc: The number of bits by which to split a directory fragment.
660 default: 3
661 services:
662 - mds
663 min: 1
664 max: 24
665 with_legacy: true
666- name: mds_bal_merge_size
667 type: int
668 level: advanced
669 desc: size of fragments where merging should occur
670 fmt_desc: The minimum directory size before Ceph tries to merge
671 adjacent directory fragments.
672 default: 50
673 services:
674 - mds
675 with_legacy: true
676- name: mds_bal_interval
677 type: int
678 level: advanced
679 desc: interval between MDS balancer cycles
680 fmt_desc: The frequency (in seconds) of workload exchanges between MDSs.
681 default: 10
682 services:
683 - mds
684- name: mds_bal_fragment_interval
685 type: int
686 level: advanced
687 desc: delay in seconds before interrupting client IO to perform splits
688 fmt_desc: The delay (in seconds) between a fragment being eligible for split
689 or merge and executing the fragmentation change.
690 default: 5
691 services:
692 - mds
693# order of magnitude higher than split size
694- name: mds_bal_fragment_size_max
695 type: int
696 level: advanced
697 desc: maximum size of a directory fragment before new creat/links fail
698 fmt_desc: The maximum size of a fragment before any new entries
699 are rejected with ENOSPC.
700 default: 100000
701 services:
702 - mds
703 with_legacy: true
704# multiple of mds_bal_split_size that triggers immediate split
705- name: mds_bal_fragment_fast_factor
706 type: float
707 level: advanced
708 desc: ratio of mds_bal_split_size at which fast fragment splitting occurs
709 fmt_desc: The ratio by which frags may exceed the split size before
710 a split is executed immediately (skipping the fragment interval)
711 default: 1.5
712 services:
713 - mds
714 with_legacy: true
715- name: mds_bal_fragment_dirs
716 type: bool
717 level: advanced
718 desc: enable directory fragmentation
719 long_desc: Directory fragmentation is a standard feature of CephFS that allows sharding
720 directories across multiple objects for performance and stability. Additionally,
721 this allows fragments to be distributed across multiple active MDSs to increase
722 throughput. Disabling (new) fragmentation should only be done in exceptional circumstances
723 and may lead to performance issues.
724 default: true
725 services:
726 - mds
727- name: mds_bal_idle_threshold
728 type: float
729 level: advanced
730 desc: idle metadata popularity threshold before rebalancing
731 fmt_desc: The minimum temperature before Ceph migrates a subtree
732 back to its parent.
733 default: 0
734 services:
735 - mds
736 with_legacy: true
737- name: mds_bal_max
738 type: int
739 level: dev
740 default: -1
741 services:
742 - mds
743 fmt_desc: The number of iterations to run balancer before Ceph stops.
744 (used for testing purposes only)
745 with_legacy: true
746- name: mds_bal_max_until
747 type: int
748 level: dev
749 default: -1
750 services:
751 - mds
752 fmt_desc: The number of seconds to run balancer before Ceph stops.
753 (used for testing purposes only)
754 with_legacy: true
755- name: mds_bal_mode
756 type: int
757 level: dev
758 default: 0
759 services:
760 - mds
761 fmt_desc: |
762 The method for calculating MDS load.
763
764 - ``0`` = Hybrid.
765 - ``1`` = Request rate and latency.
766 - ``2`` = CPU load.
767 with_legacy: true
768# must be this much above average before we export anything
769- name: mds_bal_min_rebalance
770 type: float
771 level: dev
772 desc: amount overloaded over internal target before balancer begins offloading
773 fmt_desc: The minimum subtree temperature before Ceph migrates.
774 default: 0.1
775 services:
776 - mds
777 with_legacy: true
778# if we need less than this, we don't do anything
779- name: mds_bal_min_start
780 type: float
781 level: dev
782 default: 0.2
783 services:
784 - mds
785 fmt_desc: The minimum subtree temperature before Ceph searches a subtree.
786 with_legacy: true
787# take within this range of what we need
788- name: mds_bal_need_min
789 type: float
790 level: dev
791 default: 0.8
792 services:
793 - mds
794 fmt_desc: The minimum fraction of target subtree size to accept.
795 with_legacy: true
796- name: mds_bal_need_max
797 type: float
798 level: dev
799 default: 1.2
800 services:
801 - mds
802 fmt_desc: The maximum fraction of target subtree size to accept.
803 with_legacy: true
804# any sub bigger than this taken in full
805- name: mds_bal_midchunk
806 type: float
807 level: dev
808 default: 0.3
809 services:
810 - mds
811 fmt_desc: Ceph will migrate any subtree that is larger than this fraction
812 of the target subtree size.
813 with_legacy: true
814# never take anything smaller than this
815- name: mds_bal_minchunk
816 type: float
817 level: dev
818 default: 0.001
819 services:
820 - mds
821 fmt_desc: Ceph will ignore any subtree that is smaller than this fraction
822 of the target subtree size.
823 with_legacy: true
824# target decay half-life in MDSMap (2x larger is approx. 2x slower)
825- name: mds_bal_target_decay
826 type: float
827 level: advanced
828 desc: rate of decay for export targets communicated to clients
829 default: 10
830 services:
831 - mds
832 with_legacy: true
833- name: mds_oft_prefetch_dirfrags
834 type: bool
835 level: advanced
836 desc: prefetch dirfrags recorded in open file table on startup
1d09f67e 837 default: false
20effc67
TL
838 services:
839 - mds
840 flags:
841 - startup
842# time to wait before starting replay again
843- name: mds_replay_interval
844 type: float
845 level: advanced
846 desc: time in seconds between replay of updates to journal by standby replay MDS
847 fmt_desc: The journal poll interval when in standby-replay mode.
848 ("hot standby")
849 default: 1
850 services:
851 - mds
852 with_legacy: true
853- name: mds_shutdown_check
854 type: int
855 level: dev
856 default: 0
857 services:
858 - mds
859 fmt_desc: The interval for polling the cache during MDS shutdown.
860 with_legacy: true
861- name: mds_thrash_exports
862 type: int
863 level: dev
864 default: 0
865 services:
866 - mds
867 fmt_desc: Ceph will randomly export subtrees between nodes (testing only).
868 with_legacy: true
869- name: mds_thrash_fragments
870 type: int
871 level: dev
872 default: 0
873 services:
874 - mds
875 fmt_desc: Ceph will randomly fragment or merge directories.
876 with_legacy: true
877- name: mds_dump_cache_on_map
878 type: bool
879 level: dev
880 default: false
881 services:
882 - mds
883 fmt_desc: Ceph will dump the MDS cache contents to a file on each MDSMap.
884 with_legacy: true
885- name: mds_dump_cache_after_rejoin
886 type: bool
887 level: dev
888 default: false
889 services:
890 - mds
891 fmt_desc: Ceph will dump MDS cache contents to a file after
892 rejoining the cache (during recovery).
893 with_legacy: true
894- name: mds_verify_scatter
895 type: bool
896 level: dev
897 default: false
898 services:
899 - mds
900 fmt_desc: Ceph will assert that various scatter/gather invariants
901 are ``true`` (developers only).
902 with_legacy: true
903- name: mds_debug_scatterstat
904 type: bool
905 level: dev
906 default: false
907 services:
908 - mds
909 fmt_desc: Ceph will assert that various recursive stat invariants
910 are ``true`` (for developers only).
911 with_legacy: true
912- name: mds_debug_frag
913 type: bool
914 level: dev
915 default: false
916 services:
917 - mds
918 fmt_desc: Ceph will verify directory fragmentation invariants
919 when convenient (developers only).
920 with_legacy: true
921- name: mds_debug_auth_pins
922 type: bool
923 level: dev
924 default: false
925 services:
926 - mds
927 fmt_desc: The debug auth pin invariants (for developers only).
928 with_legacy: true
929- name: mds_debug_subtrees
930 type: bool
931 level: dev
932 default: false
933 services:
934 - mds
935 fmt_desc: The debug subtree invariants (for developers only).
936 with_legacy: true
937- name: mds_kill_mdstable_at
938 type: int
939 level: dev
940 default: 0
941 services:
942 - mds
943 fmt_desc: Ceph will inject MDS failure in MDSTable code
944 (for developers only).
945 with_legacy: true
946- name: mds_max_export_size
947 type: size
948 level: dev
949 default: 20_M
950 services:
951 - mds
952- name: mds_kill_export_at
953 type: int
954 level: dev
955 default: 0
956 services:
957 - mds
958 fmt_desc: Ceph will inject MDS failure in the subtree export code
959 (for developers only).
960 with_legacy: true
961- name: mds_kill_import_at
962 type: int
963 level: dev
964 default: 0
965 services:
966 - mds
967 fmt_desc: Ceph will inject MDS failure in the subtree import code
968 (for developers only).
969 with_legacy: true
970- name: mds_kill_link_at
971 type: int
972 level: dev
973 default: 0
974 services:
975 - mds
976 fmt_desc: Ceph will inject MDS failure in hard link code
977 (for developers only).
978 with_legacy: true
979- name: mds_kill_rename_at
980 type: int
981 level: dev
982 default: 0
983 services:
984 - mds
985 fmt_desc: Ceph will inject MDS failure in the rename code
986 (for developers only).
987 with_legacy: true
988- name: mds_kill_openc_at
989 type: int
990 level: dev
991 default: 0
992 services:
993 - mds
994 with_legacy: true
995# XXX
996- name: mds_kill_journal_at
997 type: int
998 level: dev
999 default: 0
1000 services:
1001 - mds
1002- name: mds_kill_journal_expire_at
1003 type: int
1004 level: dev
1005 default: 0
1006 services:
1007 - mds
1008 with_legacy: true
1009- name: mds_kill_journal_replay_at
1010 type: int
1011 level: dev
1012 default: 0
1013 services:
1014 - mds
1015 with_legacy: true
1016- name: mds_journal_format
1017 type: uint
1018 level: dev
1019 default: 1
1020 services:
1021 - mds
1022 with_legacy: true
1023- name: mds_kill_create_at
1024 type: int
1025 level: dev
1026 default: 0
1027 services:
1028 - mds
1029 with_legacy: true
1030# percentage of MDS modify replies to skip sending the client a trace on [0-1]
1031- name: mds_inject_traceless_reply_probability
1032 type: float
1033 level: dev
1034 default: 0
1035 services:
1036 - mds
1037 with_legacy: true
1038- name: mds_wipe_sessions
1039 type: bool
1040 level: dev
1041 default: false
1042 services:
1043 - mds
1044 fmt_desc: Ceph will delete all client sessions on startup
1045 (for testing only).
1046 with_legacy: true
1047- name: mds_wipe_ino_prealloc
1048 type: bool
1049 level: dev
1050 default: false
1051 services:
1052 - mds
1053 fmt_desc: Ceph will delete ino preallocation metadata on startup
1054 (for testing only).
1055 with_legacy: true
1056- name: mds_skip_ino
1057 type: int
1058 level: dev
1059 default: 0
1060 services:
1061 - mds
1062 fmt_desc: The number of inode numbers to skip on startup
1063 (for testing only).
1064 with_legacy: true
1065- name: mds_enable_op_tracker
1066 type: bool
1067 level: advanced
1068 desc: track remote operation progression and statistics
1069 default: true
1070 services:
1071 - mds
1072 with_legacy: true
1073# Max number of completed ops to track
1074- name: mds_op_history_size
1075 type: uint
1076 level: advanced
1077 desc: maximum size for list of historical operations
1078 default: 20
1079 services:
1080 - mds
1081 with_legacy: true
1082# Oldest completed op to track
1083- name: mds_op_history_duration
1084 type: uint
1085 level: advanced
1086 desc: expiration time in seconds of historical operations
1087 default: 600
1088 services:
1089 - mds
1090 with_legacy: true
1091# how many seconds old makes an op complaint-worthy
1092- name: mds_op_complaint_time
1093 type: float
1094 level: advanced
1095 desc: time in seconds to consider an operation blocked after no updates
1096 default: 30
1097 services:
1098 - mds
1099 with_legacy: true
1100# how many op log messages to show in one go
1101- name: mds_op_log_threshold
1102 type: int
1103 level: dev
1104 default: 5
1105 services:
1106 - mds
1107 with_legacy: true
1108- name: mds_snap_min_uid
1109 type: uint
1110 level: advanced
1111 desc: minimum uid of client to perform snapshots
1112 default: 0
1113 services:
1114 - mds
1115 with_legacy: true
1116- name: mds_snap_max_uid
1117 type: uint
1118 level: advanced
1119 desc: maximum uid of client to perform snapshots
1120 default: 4294967294
1121 services:
1122 - mds
1123 with_legacy: true
1124- name: mds_snap_rstat
1125 type: bool
1126 level: advanced
1127 desc: enable nested rstat for snapshots
1128 default: false
1129 services:
1130 - mds
1131 with_legacy: true
1132- name: mds_verify_backtrace
1133 type: uint
1134 level: dev
1135 default: 1
1136 services:
1137 - mds
1138 with_legacy: true
1139# detect clients which aren't trimming completed requests
1140- name: mds_max_completed_flushes
1141 type: uint
1142 level: dev
1143 default: 100000
1144 services:
1145 - mds
1146 with_legacy: true
1147- name: mds_max_completed_requests
1148 type: uint
1149 level: dev
1150 default: 100000
1151 services:
1152 - mds
1153 with_legacy: true
1154- name: mds_action_on_write_error
1155 type: uint
1156 level: advanced
1157 desc: action to take when MDS cannot write to RADOS (0:ignore, 1:read-only, 2:suicide)
1158 default: 1
1159 services:
1160 - mds
1161 with_legacy: true
1162- name: mds_mon_shutdown_timeout
1163 type: float
1164 level: advanced
1165 desc: time to wait for mon to receive damaged MDS rank notification
1166 default: 5
1167 services:
1168 - mds
1169 with_legacy: true
1170# Maximum number of concurrent stray files to purge
1171- name: mds_max_purge_files
1172 type: uint
1173 level: advanced
1174 desc: maximum number of deleted files to purge in parallel
1175 default: 64
1176 services:
1177 - mds
1178 with_legacy: true
1179# Maximum number of concurrent RADOS ops to issue in purging
1180- name: mds_max_purge_ops
1181 type: uint
1182 level: advanced
1183 desc: maximum number of purge operations performed in parallel
1184 default: 8_K
1185 services:
1186 - mds
1187 with_legacy: true
1188# Maximum number of concurrent RADOS ops to issue in purging, scaled by PG count
1189- name: mds_max_purge_ops_per_pg
1190 type: float
1191 level: advanced
1192 desc: number of parallel purge operations performed per PG
1193 default: 0.5
1194 services:
1195 - mds
1196 with_legacy: true
1197- name: mds_purge_queue_busy_flush_period
1198 type: float
1199 level: dev
1200 default: 1
1201 services:
1202 - mds
1203 with_legacy: true
1204- name: mds_root_ino_uid
1205 type: int
1206 level: advanced
1207 desc: default uid for new root directory
1208 default: 0
1209 services:
1210 - mds
1211 with_legacy: true
1212- name: mds_root_ino_gid
1213 type: int
1214 level: advanced
1215 desc: default gid for new root directory
1216 default: 0
1217 services:
1218 - mds
1219 with_legacy: true
1220- name: mds_max_scrub_ops_in_progress
1221 type: int
1222 level: advanced
1223 desc: maximum number of scrub operations performed in parallel
1224 default: 5
1225 services:
1226 - mds
1227 with_legacy: true
1228- name: mds_forward_all_requests_to_auth
1229 type: bool
1230 level: advanced
1231 desc: always process op on auth mds
1232 default: false
1233 services:
1234 - mds
1235 flags:
1236 - runtime
1237# Maximum number of damaged frags/dentries before whole MDS rank goes damaged
1238- name: mds_damage_table_max_entries
1239 type: int
1240 level: advanced
1241 desc: maximum number of damage table entries
1242 default: 10000
1243 services:
1244 - mds
1245 with_legacy: true
1246# Maximum increment for client writable range, counted by number of objects
1247- name: mds_client_writeable_range_max_inc_objs
1248 type: uint
1249 level: advanced
1250 desc: maximum number of objects in writeable range of a file for a client
1251 default: 1_K
1252 services:
1253 - mds
1254 with_legacy: true
1255- name: mds_min_caps_per_client
1256 type: uint
1257 level: advanced
1258 desc: minimum number of capabilities a client may hold
1259 default: 100
1260 services:
1261 - mds
1262- name: mds_min_caps_working_set
1263 type: uint
1264 level: advanced
1265 desc: number of capabilities a client may hold without cache pressure warnings being generated
1266 default: 10000
1267 services:
1268 - mds
1269 flags:
1270 - runtime
1271- name: mds_max_caps_per_client
1272 type: uint
1273 level: advanced
1274 desc: maximum number of capabilities a client may hold
1275 default: 1_M
1276 services:
1277 - mds
1278- name: mds_hack_allow_loading_invalid_metadata
1279 type: bool
1280 level: advanced
1281 desc: INTENTIONALLY CAUSE DATA LOSS by bypassing checks for invalid metadata on disk.
1282 Allows testing repair tools.
1283 default: false
1284 services:
1285 - mds
1286- name: mds_defer_session_stale
1287 type: bool
1288 level: dev
1289 default: true
1290 services:
1291 - mds
1292- name: mds_inject_migrator_session_race
1293 type: bool
1294 level: dev
1295 default: false
1296 services:
1297 - mds
1298- name: mds_request_load_average_decay_rate
1299 type: float
1300 level: advanced
1301 desc: rate of decay in seconds for calculating request load average
1302 default: 1_min
1303 services:
1304 - mds
1305- name: mds_cap_revoke_eviction_timeout
1306 type: float
1307 level: advanced
1308 desc: number of seconds after which clients which have not responded to cap revoke
1309 messages by the MDS are evicted.
1310 default: 0
1311 services:
1312 - mds
1313- name: mds_max_retries_on_remount_failure
1314 type: uint
1315 level: advanced
1316 desc: number of consecutive failed remount attempts for invalidating kernel dcache
1317 after which client would abort.
1318 default: 5
1319 services:
1320 - mds
1321- name: mds_dump_cache_threshold_formatter
1322 type: size
1323 level: dev
1324 desc: threshold for cache usage to disallow "dump cache" operation to formatter
1325 long_desc: Disallow MDS from dumping caches to formatter via "dump cache" command
1326 if cache usage exceeds this threshold.
1327 default: 1_G
1328 services:
1329 - mds
1330- name: mds_dump_cache_threshold_file
1331 type: size
1332 level: dev
1333 desc: threshold for cache usage to disallow "dump cache" operation to file
1334 long_desc: Disallow MDS from dumping caches to file via "dump cache" command if
1335 cache usage exceeds this threshold.
1336 default: 0
1337 services:
1338 - mds
1339- name: mds_task_status_update_interval
1340 type: float
1341 level: dev
1342 desc: task status update interval to manager
1343 long_desc: interval (in seconds) for sending mds task status to ceph manager
1344 default: 2
1345 services:
1346 - mds
1347- name: mds_max_snaps_per_dir
1348 type: uint
1349 level: advanced
1350 desc: max snapshots per directory
1351 long_desc: maximum number of snapshots that can be created per directory
1352 default: 100
1353 services:
1354 - mds
1355 min: 0
1356 max: 4_K
1357 flags:
1358 - runtime
1359- name: mds_asio_thread_count
1360 type: uint
1361 level: advanced
1362 desc: Size of thread pool for ASIO completions
1363 default: 2
1364 tags:
1365 - mds
1366 services:
1367 - mds
1368 min: 1
1369- name: mds_ping_grace
1370 type: secs
1371 level: advanced
1372 desc: timeout after which an MDS is considered laggy by rank 0 MDS.
1373 long_desc: timeout for replying to a ping message sent by rank 0 after which an
1374 active MDS is considered laggy (delayed metrics) by rank 0.
1375 default: 15
1376 services:
1377 - mds
1378 flags:
1379 - runtime
1380- name: mds_ping_interval
1381 type: secs
1382 level: advanced
1383 desc: interval in seconds for sending ping messages to active MDSs.
1384 long_desc: interval in seconds for rank 0 to send ping messages to all active MDSs.
1385 default: 5
1386 services:
1387 - mds
1388 flags:
1389 - runtime
1390- name: mds_metrics_update_interval
1391 type: secs
1392 level: advanced
1393 desc: interval in seconds for metrics data update.
1394 long_desc: interval in seconds after which active MDSs send client metrics data
1395 to rank 0.
1396 default: 2
1397 services:
1398 - mds
1399 flags:
1400 - runtime
1401- name: mds_dir_max_entries
1402 type: uint
1403 level: advanced
1404 desc: maximum number of entries per directory before new creat/links fail
1405 long_desc: The maximum number of entries before any new entries
1406 are rejected with ENOSPC.
1407 default: 0
1408 services:
1409 - mds
1410 flags:
1411 - runtime
1412- name: mds_sleep_rank_change
1413 type: float
1414 level: dev
1415 default: 0.0
1416 flags:
1417 - runtime
1418- name: mds_connect_bootstrapping
1419 type: bool
1420 level: dev
1421 default: false
1422 flags:
1423 - runtime
1424- name: mds_symlink_recovery
1425 type: bool
1426 level: advanced
1427 desc: Stores symlink target on the first data object of symlink file.
1428 Allows recovery of symlinks using recovery tools.
1429 default: true
1430 services:
1431 - mds
1432 flags:
1433 - runtime