import time
import json
import logging

from tasks.cephfs.fuse_mount import FuseMount
from teuthology.exceptions import CommandFailedError
from tasks.cephfs.cephfs_test_case import CephFSTestCase

log = logging.getLogger(__name__)


class TestSessionMap(CephFSTestCase):
    CLIENTS_REQUIRED = 2
    MDSS_REQUIRED = 2

    def test_tell_session_drop(self):
        """
        That when a `tell` command is sent using the python CLI,
        its MDS session is gone after it terminates
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        self.fs.rank_tell(["session", "ls"], status=status)

        ls_data = self.fs.rank_asok(['session', 'ls'], status=status)
        self.assertEqual(len(ls_data), 0)

    def _get_connection_count(self, status=None):
        # Sum active connections across the MDS's AsyncMessenger workers
        perf = self.fs.rank_asok(["perf", "dump"], status=status)
        conn = 0
        for module, dump in perf.items():
            if "AsyncMessenger::Worker" in module:
                conn += dump['msgr_active_connections']
        return conn

    def test_tell_conn_close(self):
        """
        That when a `tell` command is sent using the python CLI,
        the conn count goes back to where it started (i.e. we aren't
        leaving connections open)
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        s = self._get_connection_count(status=status)
        self.fs.rank_tell(["session", "ls"], status=status)
        e = self._get_connection_count(status=status)

        self.assertEqual(s, e)

    def test_mount_conn_close(self):
        """
        That when a client unmounts, the connection count on the MDS goes back
        to what it was before the client mounted
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        s = self._get_connection_count(status=status)
        self.mount_a.mount_wait()
        self.assertGreater(self._get_connection_count(status=status), s)
        self.mount_a.umount_wait()
        e = self._get_connection_count(status=status)

        self.assertEqual(s, e)

    def test_version_splitting(self):
        """
        That when many sessions are updated, they are correctly
        split into multiple versions to obey mds_sessionmap_keys_per_op
        """

        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # Configure MDS to write one OMAP key at once
        self.set_conf('mds', 'mds_sessionmap_keys_per_op', 1)
        self.fs.mds_fail_restart()
        status = self.fs.wait_for_daemons()

        # Bring the clients back
        self.mount_a.mount_wait()
        self.mount_b.mount_wait()

        # See that they've got sessions
        self.assert_session_count(2, mds_id=self.fs.get_rank(status=status)['name'])

        # See that we persist their sessions
        self.fs.rank_asok(["flush", "journal"], rank=0, status=status)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['sessions']), 2)

        # Now, induce a "force_open_sessions" event by exporting a dir
        self.mount_a.run_shell(["mkdir", "bravo"])
        self.mount_a.run_shell(["touch", "bravo/file_a"])
        self.mount_b.run_shell(["touch", "bravo/file_b"])

        self.fs.set_max_mds(2)
        status = self.fs.wait_for_daemons()

        def get_omap_wrs():
            return self.fs.rank_asok(['perf', 'dump', 'objecter'], rank=1, status=status)['objecter']['omap_wr']

        # Flush so that there are no dirty sessions on rank 1
        self.fs.rank_asok(["flush", "journal"], rank=1, status=status)

        # Export so that we get a force_open to rank 1 for the two sessions from rank 0
        initial_omap_wrs = get_omap_wrs()
        self.fs.rank_asok(['export', 'dir', '/bravo', '1'], rank=0, status=status)

        # This is the critical (if rather subtle) check: that in the process of doing an export dir,
        # we hit force_open_sessions, and as a result we end up writing out the sessionmap. There
        # will be two sessions dirtied here, and because we have set keys_per_op to 1, we should see
        # a single session get written out (the first of the two, triggered by the second getting marked
        # dirty)
        # The number of writes is two per session, because the header (sessionmap version) update and
        # KV write both count. Also, multiply by 2 for each openfile table update.
        self.wait_until_true(
            lambda: get_omap_wrs() - initial_omap_wrs == 2*2,
            timeout=30  # Long enough for an export to get acked
        )

        # Now end our sessions and check the backing sessionmap is updated correctly
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # In-memory sessionmap check
        self.assert_session_count(0, mds_id=self.fs.get_rank(status=status)['name'])

        # On-disk sessionmap check
        self.fs.rank_asok(["flush", "journal"], rank=0, status=status)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['sessions']), 0)

    def _configure_auth(self, mount, id_name, mds_caps, osd_caps=None, mon_caps=None):
        """
        Set up auth credentials for a client mount, and write out the keyring
        for the client to use.
        """

        if osd_caps is None:
            osd_caps = "allow rw"

        if mon_caps is None:
            mon_caps = "allow r"

        out = self.fs.mon_manager.raw_cluster_cmd(
            "auth", "get-or-create", "client.{name}".format(name=id_name),
            "mds", mds_caps,
            "osd", osd_caps,
            "mon", mon_caps
        )
        mount.client_id = id_name
        mount.client_remote.write_file(mount.get_keyring_path(), out, sudo=True)
        self.set_conf("client.{name}".format(name=id_name), "keyring", mount.get_keyring_path())

    def test_session_reject(self):
        """
        That a client whose metadata advertises a root outside its
        path-restricted caps is refused a session
        """
        if not isinstance(self.mount_a, FuseMount):
            self.skipTest("Requires FUSE client to inject client metadata")

        self.mount_a.run_shell(["mkdir", "foo"])
        self.mount_a.run_shell(["mkdir", "foo/bar"])
        self.mount_a.umount_wait()

        # Mount B will be my rejected client
        self.mount_b.umount_wait()

        # Configure a client that is limited to /foo/bar
        self._configure_auth(self.mount_b, "badguy", "allow rw path=/foo/bar")
        # Check that the client can mount that dir and do IO
        self.mount_b.mount_wait(cephfs_mntpt="/foo/bar")
        self.mount_b.create_destroy()
        self.mount_b.umount_wait()

        # Configure the client to claim that its mount point metadata is /baz
        self.set_conf("client.badguy", "client_metadata", "root=/baz")
        # Try to mount the client, see that it fails
        with self.assert_cluster_log("client session with non-allowable root '/baz' denied"):
            with self.assertRaises(CommandFailedError):
                self.mount_b.mount_wait(cephfs_mntpt="/foo/bar")

    def test_session_evict_blocklisted(self):
        """
        Check that the MDS evicts a blocklisted client
        """
        if not isinstance(self.mount_a, FuseMount):
            self.skipTest("Requires FUSE client to use "
                          "mds_cluster.is_addr_blocklisted()")

        self.fs.set_max_mds(2)
        status = self.fs.wait_for_daemons()

        self.mount_a.run_shell_payload("mkdir {d0,d1} && touch {d0,d1}/file")
        self.mount_a.setfattr("d0", "ceph.dir.pin", "0")
        self.mount_a.setfattr("d1", "ceph.dir.pin", "1")
        self._wait_subtrees([('/d0', 0), ('/d1', 1)], status=status)

        self.mount_a.run_shell(["touch", "d0/f0"])
        self.mount_a.run_shell(["touch", "d1/f0"])
        self.mount_b.run_shell(["touch", "d0/f1"])
        self.mount_b.run_shell(["touch", "d1/f1"])

        self.assert_session_count(2, mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.assert_session_count(2, mds_id=self.fs.get_rank(rank=1, status=status)['name'])

        mount_a_client_id = self.mount_a.get_global_id()
        self.fs.mds_asok(['session', 'evict', "%s" % mount_a_client_id],
                         mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.wait_until_true(lambda: self.mds_cluster.is_addr_blocklisted(
            self.mount_a.get_global_addr()), timeout=30)

        # 10 seconds should be enough to evict the client
        time.sleep(10)
        self.assert_session_count(1, mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.assert_session_count(1, mds_id=self.fs.get_rank(rank=1, status=status)['name'])

        self.mount_a.kill_cleanup()
        self.mount_a.mount_wait()