from StringIO import StringIO
import time
import json
import logging
from unittest import SkipTest

from tasks.cephfs.fuse_mount import FuseMount
from teuthology.exceptions import CommandFailedError
from tasks.cephfs.cephfs_test_case import CephFSTestCase

log = logging.getLogger(__name__)


class TestSessionMap(CephFSTestCase):
    CLIENTS_REQUIRED = 2
    MDSS_REQUIRED = 2

    def test_tell_session_drop(self):
        """
        That when a `tell` command is sent using the python CLI,
        its MDS session is gone after it terminates
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        self.fs.rank_tell(["session", "ls"], status=status)

        ls_data = self.fs.rank_asok(['session', 'ls'], status=status)
        self.assertEqual(len(ls_data), 0)

    def _get_connection_count(self, status=None):
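        # Sum the active connections across every AsyncMessenger worker thread
        # reported in the MDS perf dump.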
        perf = self.fs.rank_asok(["perf", "dump"], status=status)
        conn = 0
        for module, dump in perf.iteritems():
            if "AsyncMessenger::Worker" in module:
                conn += dump['msgr_active_connections']
        return conn

    def test_tell_conn_close(self):
        """
        That when a `tell` command is sent using the python CLI,
        the conn count goes back to where it started (i.e. we aren't
        leaving connections open)
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        s = self._get_connection_count(status=status)
        self.fs.rank_tell(["session", "ls"], status=status)
        e = self._get_connection_count(status=status)

        self.assertEqual(s, e)

    def test_mount_conn_close(self):
        """
        That when a client unmounts, the connection count on the MDS goes back
        to what it was before the client mounted
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        status = self.fs.status()
        s = self._get_connection_count(status=status)
        self.mount_a.mount()
        self.mount_a.wait_until_mounted()
        self.assertGreater(self._get_connection_count(status=status), s)
        self.mount_a.umount_wait()
        e = self._get_connection_count(status=status)

        self.assertEqual(s, e)

    def test_version_splitting(self):
        """
        That when many sessions are updated, they are correctly
        split into multiple versions to obey mds_sessionmap_keys_per_op
        """

        # Start umounted
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # Configure MDS to write one OMAP key at once
        self.set_conf('mds', 'mds_sessionmap_keys_per_op', 1)
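        # With keys_per_op=1, each dirtied session has to be written out as its
        # own omap key, which is what makes the version splitting observable.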
        self.fs.mds_fail_restart()
        self.fs.wait_for_daemons()

        # I would like two MDSs, so that I can do an export dir later
        self.fs.set_max_mds(2)
        self.fs.wait_for_daemons()

        status = self.fs.status()

        # Bring the clients back
        self.mount_a.mount()
        self.mount_b.mount()
        self.mount_a.create_files()  # Kick the client into opening sessions
        self.mount_b.create_files()

        # See that they've got sessions
        self.assert_session_count(2, mds_id=self.fs.get_rank(status=status)['name'])

        # See that we persist their sessions
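        # Flushing the journal writes the sessionmap back to its omap object,
        # where cephfs-table-tool (wrapped by self.fs.table_tool below) can read it.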
        self.fs.rank_asok(["flush", "journal"], rank=0, status=status)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['sessions']), 2)

        # Now, induce a "force_open_sessions" event by exporting a dir
        self.mount_a.run_shell(["mkdir", "bravo"])
        self.mount_a.run_shell(["touch", "bravo/file"])
        self.mount_b.run_shell(["ls", "-l", "bravo/file"])

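        # Helper: read rank 1's cumulative omap write count from its objecter
        # perf counters.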
        def get_omap_wrs():
            return self.fs.rank_asok(['perf', 'dump', 'objecter'], rank=1, status=status)['objecter']['omap_wr']

        # Flush so that there are no dirty sessions on rank 1
        self.fs.rank_asok(["flush", "journal"], rank=1, status=status)

        # Export so that we get a force_open to rank 1 for the two sessions from rank 0
        initial_omap_wrs = get_omap_wrs()
        self.fs.rank_asok(['export', 'dir', '/bravo', '1'], rank=0, status=status)

        # This is the critical (if rather subtle) check: that in the process of doing an export dir,
        # we hit force_open_sessions, and as a result we end up writing out the sessionmap. There
        # will be two sessions dirtied here, and because we have set keys_per_op to 1, we should see
        # a single session get written out (the first of the two, triggered by the second getting
        # marked dirty).
        # The number of writes is two per session, because the header (sessionmap version) update and
        # KV write both count. Also, multiply by 2 for each openfile table update.
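        # i.e. one session written out x 2 omap writes (header + key), doubled
        # by the openfile table update: expect exactly 2*2 = 4 new omap writes.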
        self.wait_until_true(
            lambda: get_omap_wrs() - initial_omap_wrs == 2*2,
            timeout=30  # Long enough for an export to get acked
        )

        # Now end our sessions and check the backing sessionmap is updated correctly
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # In-memory sessionmap check
        self.assert_session_count(0, mds_id=self.fs.get_rank(status=status)['name'])

        # On-disk sessionmap check
        self.fs.rank_asok(["flush", "journal"], rank=0, status=status)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['sessions']), 0)

    def _sudo_write_file(self, remote, path, data):
        """
        Write data to a remote file as super user

        :param remote: Remote site.
        :param path: Path on the remote being written to.
        :param data: Data to be written.
        """
        remote.run(
            args=[
                'sudo',
                'python',
                '-c',
                'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',
                path,
            ],
            stdin=data,
        )

    def _configure_auth(self, mount, id_name, mds_caps, osd_caps=None, mon_caps=None):
        """
        Set up auth credentials for a client mount, and write out the keyring
        for the client to use.
        """

        if osd_caps is None:
            osd_caps = "allow rw"

        if mon_caps is None:
            mon_caps = "allow r"

        out = self.fs.mon_manager.raw_cluster_cmd(
            "auth", "get-or-create", "client.{name}".format(name=id_name),
            "mds", mds_caps,
            "osd", osd_caps,
            "mon", mon_caps
        )
        mount.client_id = id_name
        self._sudo_write_file(mount.client_remote, mount.get_keyring_path(), out)
        self.set_conf("client.{name}".format(name=id_name), "keyring", mount.get_keyring_path())

    def test_session_reject(self):
        if not isinstance(self.mount_a, FuseMount):
            raise SkipTest("Requires FUSE client to inject client metadata")

        self.mount_a.run_shell(["mkdir", "foo"])
        self.mount_a.run_shell(["mkdir", "foo/bar"])
        self.mount_a.umount_wait()

        # Mount B will be my rejected client
        self.mount_b.umount_wait()

        # Configure a client that is limited to /foo/bar
        self._configure_auth(self.mount_b, "badguy", "allow rw path=/foo/bar")
        # Check he can mount that dir and do IO
        self.mount_b.mount(mount_path="/foo/bar")
        self.mount_b.wait_until_mounted()
        self.mount_b.create_destroy()
        self.mount_b.umount_wait()

        # Configure the client to claim that its mount point metadata is /baz
        self.set_conf("client.badguy", "client_metadata", "root=/baz")
        # Try to mount the client, see that it fails
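        # (The MDS compares the root claimed in the client's metadata against
        # the "path=/foo/bar" restriction in its caps and refuses the session.)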
        with self.assert_cluster_log("client session with non-allowable root '/baz' denied"):
            with self.assertRaises(CommandFailedError):
                self.mount_b.mount(mount_path="/foo/bar")

    def test_session_evict_blacklisted(self):
        """
        Check that the MDS evicts a blacklisted client
        """
        if not isinstance(self.mount_a, FuseMount):
            self.skipTest("Requires FUSE client to use is_blacklisted()")

        self.fs.set_max_mds(2)
        self.fs.wait_for_daemons()
        status = self.fs.status()

        self.mount_a.run_shell(["mkdir", "d0", "d1"])
        self.mount_a.setfattr("d0", "ceph.dir.pin", "0")
        self.mount_a.setfattr("d1", "ceph.dir.pin", "1")
        self._wait_subtrees(status, 0, [('/d0', 0), ('/d1', 1)])

        self.mount_a.run_shell(["touch", "d0/f0"])
        self.mount_a.run_shell(["touch", "d1/f0"])
        self.mount_b.run_shell(["touch", "d0/f1"])
        self.mount_b.run_shell(["touch", "d1/f1"])

        self.assert_session_count(2, mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.assert_session_count(2, mds_id=self.fs.get_rank(rank=1, status=status)['name'])

        mount_a_client_id = self.mount_a.get_global_id()
        self.fs.mds_asok(['session', 'evict', "%s" % mount_a_client_id],
                         mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.wait_until_true(lambda: self.mount_a.is_blacklisted(), timeout=30)

        # 10 seconds should be enough for evicting the client
        time.sleep(10)
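        # Evicting on rank 0 blacklists the client cluster-wide, so rank 1
        # should drop mount_a's session too, leaving only mount_b on each rank.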
        self.assert_session_count(1, mds_id=self.fs.get_rank(rank=0, status=status)['name'])
        self.assert_session_count(1, mds_id=self.fs.get_rank(rank=1, status=status)['name'])

        self.mount_a.kill_cleanup()
        self.mount_a.mount()
        self.mount_a.wait_until_mounted()