mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 1dd8d47081
			
		
	
	
		1dd8d47081
		
	
	
	
	
		
			
			In client for each inode, it may have many opened files and may
have been pinned in more than one MDS servers. And some inodes
are idle, which have no any opened files.
This patch will show these metrics in the debugfs, likes:
item                               total
-----------------------------------------
opened files  / total inodes       14 / 5
pinned i_caps / total inodes       7  / 5
opened inodes / total inodes       3  / 5
Will send these metrics to ceph, which will be used by the `fs top`,
later.
[ jlayton: drop unrelated hunk, count hashed inodes instead of
           allocated ones ]
URL: https://tracker.ceph.com/issues/47005
Signed-off-by: Xiubo Li <xiubli@redhat.com>
Signed-off-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Ilya Dryomov <idryomov@gmail.com>
		
	
			
		
			
				
	
	
		
			411 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			411 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| // SPDX-License-Identifier: GPL-2.0
 | |
| #include <linux/ceph/ceph_debug.h>
 | |
| 
 | |
| #include <linux/device.h>
 | |
| #include <linux/slab.h>
 | |
| #include <linux/module.h>
 | |
| #include <linux/ctype.h>
 | |
| #include <linux/debugfs.h>
 | |
| #include <linux/seq_file.h>
 | |
| #include <linux/math64.h>
 | |
| #include <linux/ktime.h>
 | |
| 
 | |
| #include <linux/ceph/libceph.h>
 | |
| #include <linux/ceph/mon_client.h>
 | |
| #include <linux/ceph/auth.h>
 | |
| #include <linux/ceph/debugfs.h>
 | |
| 
 | |
| #include "super.h"
 | |
| 
 | |
| #ifdef CONFIG_DEBUG_FS
 | |
| 
 | |
| #include "mds_client.h"
 | |
| #include "metric.h"
 | |
| 
 | |
| static int mdsmap_show(struct seq_file *s, void *p)
 | |
| {
 | |
| 	int i;
 | |
| 	struct ceph_fs_client *fsc = s->private;
 | |
| 	struct ceph_mdsmap *mdsmap;
 | |
| 
 | |
| 	if (!fsc->mdsc || !fsc->mdsc->mdsmap)
 | |
| 		return 0;
 | |
| 	mdsmap = fsc->mdsc->mdsmap;
 | |
| 	seq_printf(s, "epoch %d\n", mdsmap->m_epoch);
 | |
| 	seq_printf(s, "root %d\n", mdsmap->m_root);
 | |
| 	seq_printf(s, "max_mds %d\n", mdsmap->m_max_mds);
 | |
| 	seq_printf(s, "session_timeout %d\n", mdsmap->m_session_timeout);
 | |
| 	seq_printf(s, "session_autoclose %d\n", mdsmap->m_session_autoclose);
 | |
| 	for (i = 0; i < mdsmap->possible_max_rank; i++) {
 | |
| 		struct ceph_entity_addr *addr = &mdsmap->m_info[i].addr;
 | |
| 		int state = mdsmap->m_info[i].state;
 | |
| 		seq_printf(s, "\tmds%d\t%s\t(%s)\n", i,
 | |
| 			       ceph_pr_addr(addr),
 | |
| 			       ceph_mds_state_name(state));
 | |
| 	}
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * mdsc debugfs
 | |
|  */
 | |
| static int mdsc_show(struct seq_file *s, void *p)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = s->private;
 | |
| 	struct ceph_mds_client *mdsc = fsc->mdsc;
 | |
| 	struct ceph_mds_request *req;
 | |
| 	struct rb_node *rp;
 | |
| 	int pathlen = 0;
 | |
| 	u64 pathbase;
 | |
| 	char *path;
 | |
| 
 | |
| 	mutex_lock(&mdsc->mutex);
 | |
| 	for (rp = rb_first(&mdsc->request_tree); rp; rp = rb_next(rp)) {
 | |
| 		req = rb_entry(rp, struct ceph_mds_request, r_node);
 | |
| 
 | |
| 		if (req->r_request && req->r_session)
 | |
| 			seq_printf(s, "%lld\tmds%d\t", req->r_tid,
 | |
| 				   req->r_session->s_mds);
 | |
| 		else if (!req->r_request)
 | |
| 			seq_printf(s, "%lld\t(no request)\t", req->r_tid);
 | |
| 		else
 | |
| 			seq_printf(s, "%lld\t(no session)\t", req->r_tid);
 | |
| 
 | |
| 		seq_printf(s, "%s", ceph_mds_op_name(req->r_op));
 | |
| 
 | |
| 		if (test_bit(CEPH_MDS_R_GOT_UNSAFE, &req->r_req_flags))
 | |
| 			seq_puts(s, "\t(unsafe)");
 | |
| 		else
 | |
| 			seq_puts(s, "\t");
 | |
| 
 | |
| 		if (req->r_inode) {
 | |
| 			seq_printf(s, " #%llx", ceph_ino(req->r_inode));
 | |
| 		} else if (req->r_dentry) {
 | |
| 			path = ceph_mdsc_build_path(req->r_dentry, &pathlen,
 | |
| 						    &pathbase, 0);
 | |
| 			if (IS_ERR(path))
 | |
| 				path = NULL;
 | |
| 			spin_lock(&req->r_dentry->d_lock);
 | |
| 			seq_printf(s, " #%llx/%pd (%s)",
 | |
| 				   ceph_ino(d_inode(req->r_dentry->d_parent)),
 | |
| 				   req->r_dentry,
 | |
| 				   path ? path : "");
 | |
| 			spin_unlock(&req->r_dentry->d_lock);
 | |
| 			ceph_mdsc_free_path(path, pathlen);
 | |
| 		} else if (req->r_path1) {
 | |
| 			seq_printf(s, " #%llx/%s", req->r_ino1.ino,
 | |
| 				   req->r_path1);
 | |
| 		} else {
 | |
| 			seq_printf(s, " #%llx", req->r_ino1.ino);
 | |
| 		}
 | |
| 
 | |
| 		if (req->r_old_dentry) {
 | |
| 			path = ceph_mdsc_build_path(req->r_old_dentry, &pathlen,
 | |
| 						    &pathbase, 0);
 | |
| 			if (IS_ERR(path))
 | |
| 				path = NULL;
 | |
| 			spin_lock(&req->r_old_dentry->d_lock);
 | |
| 			seq_printf(s, " #%llx/%pd (%s)",
 | |
| 				   req->r_old_dentry_dir ?
 | |
| 				   ceph_ino(req->r_old_dentry_dir) : 0,
 | |
| 				   req->r_old_dentry,
 | |
| 				   path ? path : "");
 | |
| 			spin_unlock(&req->r_old_dentry->d_lock);
 | |
| 			ceph_mdsc_free_path(path, pathlen);
 | |
| 		} else if (req->r_path2 && req->r_op != CEPH_MDS_OP_SYMLINK) {
 | |
| 			if (req->r_ino2.ino)
 | |
| 				seq_printf(s, " #%llx/%s", req->r_ino2.ino,
 | |
| 					   req->r_path2);
 | |
| 			else
 | |
| 				seq_printf(s, " %s", req->r_path2);
 | |
| 		}
 | |
| 
 | |
| 		seq_puts(s, "\n");
 | |
| 	}
 | |
| 	mutex_unlock(&mdsc->mutex);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| #define CEPH_METRIC_SHOW(name, total, avg, min, max, sq) {		\
 | |
| 	s64 _total, _avg, _min, _max, _sq, _st;				\
 | |
| 	_avg = ktime_to_us(avg);					\
 | |
| 	_min = ktime_to_us(min == KTIME_MAX ? 0 : min);			\
 | |
| 	_max = ktime_to_us(max);					\
 | |
| 	_total = total - 1;						\
 | |
| 	_sq = _total > 0 ? DIV64_U64_ROUND_CLOSEST(sq, _total) : 0;	\
 | |
| 	_st = int_sqrt64(_sq);						\
 | |
| 	_st = ktime_to_us(_st);						\
 | |
| 	seq_printf(s, "%-14s%-12lld%-16lld%-16lld%-16lld%lld\n",	\
 | |
| 		   name, total, _avg, _min, _max, _st);			\
 | |
| }
 | |
| 
 | |
| static int metric_show(struct seq_file *s, void *p)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = s->private;
 | |
| 	struct ceph_mds_client *mdsc = fsc->mdsc;
 | |
| 	struct ceph_client_metric *m = &mdsc->metric;
 | |
| 	int nr_caps = 0;
 | |
| 	s64 total, sum, avg, min, max, sq;
 | |
| 
 | |
| 	sum = percpu_counter_sum(&m->total_inodes);
 | |
| 	seq_printf(s, "item                               total\n");
 | |
| 	seq_printf(s, "------------------------------------------\n");
 | |
| 	seq_printf(s, "%-35s%lld / %lld\n", "opened files  / total inodes",
 | |
| 		   atomic64_read(&m->opened_files), sum);
 | |
| 	seq_printf(s, "%-35s%lld / %lld\n", "pinned i_caps / total inodes",
 | |
| 		   atomic64_read(&m->total_caps), sum);
 | |
| 	seq_printf(s, "%-35s%lld / %lld\n", "opened inodes / total inodes",
 | |
| 		   percpu_counter_sum(&m->opened_inodes), sum);
 | |
| 
 | |
| 	seq_printf(s, "\n");
 | |
| 	seq_printf(s, "item          total       avg_lat(us)     min_lat(us)     max_lat(us)     stdev(us)\n");
 | |
| 	seq_printf(s, "-----------------------------------------------------------------------------------\n");
 | |
| 
 | |
| 	spin_lock(&m->read_latency_lock);
 | |
| 	total = m->total_reads;
 | |
| 	sum = m->read_latency_sum;
 | |
| 	avg = total > 0 ? DIV64_U64_ROUND_CLOSEST(sum, total) : 0;
 | |
| 	min = m->read_latency_min;
 | |
| 	max = m->read_latency_max;
 | |
| 	sq = m->read_latency_sq_sum;
 | |
| 	spin_unlock(&m->read_latency_lock);
 | |
| 	CEPH_METRIC_SHOW("read", total, avg, min, max, sq);
 | |
| 
 | |
| 	spin_lock(&m->write_latency_lock);
 | |
| 	total = m->total_writes;
 | |
| 	sum = m->write_latency_sum;
 | |
| 	avg = total > 0 ? DIV64_U64_ROUND_CLOSEST(sum, total) : 0;
 | |
| 	min = m->write_latency_min;
 | |
| 	max = m->write_latency_max;
 | |
| 	sq = m->write_latency_sq_sum;
 | |
| 	spin_unlock(&m->write_latency_lock);
 | |
| 	CEPH_METRIC_SHOW("write", total, avg, min, max, sq);
 | |
| 
 | |
| 	spin_lock(&m->metadata_latency_lock);
 | |
| 	total = m->total_metadatas;
 | |
| 	sum = m->metadata_latency_sum;
 | |
| 	avg = total > 0 ? DIV64_U64_ROUND_CLOSEST(sum, total) : 0;
 | |
| 	min = m->metadata_latency_min;
 | |
| 	max = m->metadata_latency_max;
 | |
| 	sq = m->metadata_latency_sq_sum;
 | |
| 	spin_unlock(&m->metadata_latency_lock);
 | |
| 	CEPH_METRIC_SHOW("metadata", total, avg, min, max, sq);
 | |
| 
 | |
| 	seq_printf(s, "\n");
 | |
| 	seq_printf(s, "item          total           miss            hit\n");
 | |
| 	seq_printf(s, "-------------------------------------------------\n");
 | |
| 
 | |
| 	seq_printf(s, "%-14s%-16lld%-16lld%lld\n", "d_lease",
 | |
| 		   atomic64_read(&m->total_dentries),
 | |
| 		   percpu_counter_sum(&m->d_lease_mis),
 | |
| 		   percpu_counter_sum(&m->d_lease_hit));
 | |
| 
 | |
| 	nr_caps = atomic64_read(&m->total_caps);
 | |
| 	seq_printf(s, "%-14s%-16d%-16lld%lld\n", "caps", nr_caps,
 | |
| 		   percpu_counter_sum(&m->i_caps_mis),
 | |
| 		   percpu_counter_sum(&m->i_caps_hit));
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int caps_show_cb(struct inode *inode, struct ceph_cap *cap, void *p)
 | |
| {
 | |
| 	struct seq_file *s = p;
 | |
| 
 | |
| 	seq_printf(s, "0x%-17llx%-3d%-17s%-17s\n", ceph_ino(inode),
 | |
| 		   cap->session->s_mds,
 | |
| 		   ceph_cap_string(cap->issued),
 | |
| 		   ceph_cap_string(cap->implemented));
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int caps_show(struct seq_file *s, void *p)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = s->private;
 | |
| 	struct ceph_mds_client *mdsc = fsc->mdsc;
 | |
| 	int total, avail, used, reserved, min, i;
 | |
| 	struct cap_wait	*cw;
 | |
| 
 | |
| 	ceph_reservation_status(fsc, &total, &avail, &used, &reserved, &min);
 | |
| 	seq_printf(s, "total\t\t%d\n"
 | |
| 		   "avail\t\t%d\n"
 | |
| 		   "used\t\t%d\n"
 | |
| 		   "reserved\t%d\n"
 | |
| 		   "min\t\t%d\n\n",
 | |
| 		   total, avail, used, reserved, min);
 | |
| 	seq_printf(s, "ino              mds  issued           implemented\n");
 | |
| 	seq_printf(s, "--------------------------------------------------\n");
 | |
| 
 | |
| 	mutex_lock(&mdsc->mutex);
 | |
| 	for (i = 0; i < mdsc->max_sessions; i++) {
 | |
| 		struct ceph_mds_session *session;
 | |
| 
 | |
| 		session = __ceph_lookup_mds_session(mdsc, i);
 | |
| 		if (!session)
 | |
| 			continue;
 | |
| 		mutex_unlock(&mdsc->mutex);
 | |
| 		mutex_lock(&session->s_mutex);
 | |
| 		ceph_iterate_session_caps(session, caps_show_cb, s);
 | |
| 		mutex_unlock(&session->s_mutex);
 | |
| 		ceph_put_mds_session(session);
 | |
| 		mutex_lock(&mdsc->mutex);
 | |
| 	}
 | |
| 	mutex_unlock(&mdsc->mutex);
 | |
| 
 | |
| 	seq_printf(s, "\n\nWaiters:\n--------\n");
 | |
| 	seq_printf(s, "tgid         ino                need             want\n");
 | |
| 	seq_printf(s, "-----------------------------------------------------\n");
 | |
| 
 | |
| 	spin_lock(&mdsc->caps_list_lock);
 | |
| 	list_for_each_entry(cw, &mdsc->cap_wait_list, list) {
 | |
| 		seq_printf(s, "%-13d0x%-17llx%-17s%-17s\n", cw->tgid, cw->ino,
 | |
| 				ceph_cap_string(cw->need),
 | |
| 				ceph_cap_string(cw->want));
 | |
| 	}
 | |
| 	spin_unlock(&mdsc->caps_list_lock);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int mds_sessions_show(struct seq_file *s, void *ptr)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = s->private;
 | |
| 	struct ceph_mds_client *mdsc = fsc->mdsc;
 | |
| 	struct ceph_auth_client *ac = fsc->client->monc.auth;
 | |
| 	struct ceph_options *opt = fsc->client->options;
 | |
| 	int mds;
 | |
| 
 | |
| 	mutex_lock(&mdsc->mutex);
 | |
| 
 | |
| 	/* The 'num' portion of an 'entity name' */
 | |
| 	seq_printf(s, "global_id %llu\n", ac->global_id);
 | |
| 
 | |
| 	/* The -o name mount argument */
 | |
| 	seq_printf(s, "name \"%s\"\n", opt->name ? opt->name : "");
 | |
| 
 | |
| 	/* The list of MDS session rank+state */
 | |
| 	for (mds = 0; mds < mdsc->max_sessions; mds++) {
 | |
| 		struct ceph_mds_session *session =
 | |
| 			__ceph_lookup_mds_session(mdsc, mds);
 | |
| 		if (!session) {
 | |
| 			continue;
 | |
| 		}
 | |
| 		mutex_unlock(&mdsc->mutex);
 | |
| 		seq_printf(s, "mds.%d %s\n",
 | |
| 				session->s_mds,
 | |
| 				ceph_session_state_name(session->s_state));
 | |
| 
 | |
| 		ceph_put_mds_session(session);
 | |
| 		mutex_lock(&mdsc->mutex);
 | |
| 	}
 | |
| 	mutex_unlock(&mdsc->mutex);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| DEFINE_SHOW_ATTRIBUTE(mdsmap);
 | |
| DEFINE_SHOW_ATTRIBUTE(mdsc);
 | |
| DEFINE_SHOW_ATTRIBUTE(caps);
 | |
| DEFINE_SHOW_ATTRIBUTE(mds_sessions);
 | |
| DEFINE_SHOW_ATTRIBUTE(metric);
 | |
| 
 | |
| 
 | |
| /*
 | |
|  * debugfs
 | |
|  */
 | |
| static int congestion_kb_set(void *data, u64 val)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = (struct ceph_fs_client *)data;
 | |
| 
 | |
| 	fsc->mount_options->congestion_kb = (int)val;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int congestion_kb_get(void *data, u64 *val)
 | |
| {
 | |
| 	struct ceph_fs_client *fsc = (struct ceph_fs_client *)data;
 | |
| 
 | |
| 	*val = (u64)fsc->mount_options->congestion_kb;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| DEFINE_SIMPLE_ATTRIBUTE(congestion_kb_fops, congestion_kb_get,
 | |
| 			congestion_kb_set, "%llu\n");
 | |
| 
 | |
| 
 | |
| void ceph_fs_debugfs_cleanup(struct ceph_fs_client *fsc)
 | |
| {
 | |
| 	dout("ceph_fs_debugfs_cleanup\n");
 | |
| 	debugfs_remove(fsc->debugfs_bdi);
 | |
| 	debugfs_remove(fsc->debugfs_congestion_kb);
 | |
| 	debugfs_remove(fsc->debugfs_mdsmap);
 | |
| 	debugfs_remove(fsc->debugfs_mds_sessions);
 | |
| 	debugfs_remove(fsc->debugfs_caps);
 | |
| 	debugfs_remove(fsc->debugfs_metric);
 | |
| 	debugfs_remove(fsc->debugfs_mdsc);
 | |
| }
 | |
| 
 | |
| void ceph_fs_debugfs_init(struct ceph_fs_client *fsc)
 | |
| {
 | |
| 	char name[100];
 | |
| 
 | |
| 	dout("ceph_fs_debugfs_init\n");
 | |
| 	fsc->debugfs_congestion_kb =
 | |
| 		debugfs_create_file("writeback_congestion_kb",
 | |
| 				    0600,
 | |
| 				    fsc->client->debugfs_dir,
 | |
| 				    fsc,
 | |
| 				    &congestion_kb_fops);
 | |
| 
 | |
| 	snprintf(name, sizeof(name), "../../bdi/%s",
 | |
| 		 bdi_dev_name(fsc->sb->s_bdi));
 | |
| 	fsc->debugfs_bdi =
 | |
| 		debugfs_create_symlink("bdi",
 | |
| 				       fsc->client->debugfs_dir,
 | |
| 				       name);
 | |
| 
 | |
| 	fsc->debugfs_mdsmap = debugfs_create_file("mdsmap",
 | |
| 					0400,
 | |
| 					fsc->client->debugfs_dir,
 | |
| 					fsc,
 | |
| 					&mdsmap_fops);
 | |
| 
 | |
| 	fsc->debugfs_mds_sessions = debugfs_create_file("mds_sessions",
 | |
| 					0400,
 | |
| 					fsc->client->debugfs_dir,
 | |
| 					fsc,
 | |
| 					&mds_sessions_fops);
 | |
| 
 | |
| 	fsc->debugfs_mdsc = debugfs_create_file("mdsc",
 | |
| 						0400,
 | |
| 						fsc->client->debugfs_dir,
 | |
| 						fsc,
 | |
| 						&mdsc_fops);
 | |
| 
 | |
| 	fsc->debugfs_metric = debugfs_create_file("metrics",
 | |
| 						  0400,
 | |
| 						  fsc->client->debugfs_dir,
 | |
| 						  fsc,
 | |
| 						  &metric_fops);
 | |
| 
 | |
| 	fsc->debugfs_caps = debugfs_create_file("caps",
 | |
| 						0400,
 | |
| 						fsc->client->debugfs_dir,
 | |
| 						fsc,
 | |
| 						&caps_fops);
 | |
| }
 | |
| 
 | |
| 
 | |
| #else  /* CONFIG_DEBUG_FS */
 | |
| 
 | |
| void ceph_fs_debugfs_init(struct ceph_fs_client *fsc)
 | |
| {
 | |
| }
 | |
| 
 | |
| void ceph_fs_debugfs_cleanup(struct ceph_fs_client *fsc)
 | |
| {
 | |
| }
 | |
| 
 | |
| #endif  /* CONFIG_DEBUG_FS */
 |