]> git.proxmox.com Git - mirror_iproute2.git/blob - misc/ss.c
Merge branch 'master' into net-next
[mirror_iproute2.git] / misc / ss.c
1 /*
2 * ss.c "sockstat", socket statistics
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 */
11
12 #include <stdio.h>
13 #include <stdlib.h>
14 #include <unistd.h>
15 #include <syslog.h>
16 #include <fcntl.h>
17 #include <sys/ioctl.h>
18 #include <sys/socket.h>
19 #include <sys/uio.h>
20 #include <netinet/in.h>
21 #include <string.h>
22 #include <errno.h>
23 #include <netdb.h>
24 #include <arpa/inet.h>
25 #include <dirent.h>
26 #include <fnmatch.h>
27 #include <getopt.h>
28 #include <stdbool.h>
29 #include <limits.h>
30
31 #include "utils.h"
32 #include "rt_names.h"
33 #include "ll_map.h"
34 #include "libnetlink.h"
35 #include "namespace.h"
36 #include "SNAPSHOT.h"
37
38 #include <linux/tcp.h>
39 #include <linux/sock_diag.h>
40 #include <linux/inet_diag.h>
41 #include <linux/unix_diag.h>
42 #include <linux/netdevice.h> /* for MAX_ADDR_LEN */
43 #include <linux/filter.h>
44 #include <linux/packet_diag.h>
45 #include <linux/netlink_diag.h>
46 #include <linux/sctp.h>
47 #include <linux/vm_sockets_diag.h>
48
/* Sequence number placed in the header of every request built by DIAG_REQUEST. */
#define MAGIC_SEQ 123456

/*
 * Declare and initialise a netlink request variable named _req.
 *
 * The variable is an anonymous struct made of a struct nlmsghdr followed by
 * the member declaration passed as _r (the family-specific payload). The
 * header is preset to a SOCK_DIAG_BY_FAMILY request with the
 * NLM_F_ROOT|NLM_F_MATCH|NLM_F_REQUEST flags, sequence MAGIC_SEQ, and a
 * length covering the whole struct; the payload member is left
 * zero-initialised for the caller to fill in.
 */
#define DIAG_REQUEST(_req, _r) \
	struct { \
		struct nlmsghdr nlh; \
		_r; \
	} _req = { \
		.nlh = { \
			.nlmsg_type = SOCK_DIAG_BY_FAMILY, \
			.nlmsg_flags = NLM_F_ROOT|NLM_F_MATCH|NLM_F_REQUEST,\
			.nlmsg_seq = MAGIC_SEQ, \
			.nlmsg_len = sizeof(_req), \
		}, \
	}
63
#if HAVE_SELINUX
#include <selinux/selinux.h>
#else
/*
 * Replacements for the libselinux entry points used by ss when it is built
 * without SELinux support. Every query fails with -1, and those that hand
 * back a context set it to NULL first.
 */
static int no_selinux_context(char **context)
{
	*context = NULL;
	return -1;
}

static int is_selinux_enabled(void)
{
	return -1;
}

static int getpidcon(pid_t pid, char **context)
{
	(void)pid;
	return no_selinux_context(context);
}

static int getfilecon(char *path, char **context)
{
	(void)path;
	return no_selinux_context(context);
}

static int security_get_initial_context(char *name, char **context)
{
	(void)name;
	return no_selinux_context(context);
}
#endif
91
/*
 * Run-time option flags. In the code reviewed here only resolve_services
 * (service-name lookup in resolve_service(), enabled by default) and
 * preferred_family (overwritten by filter_af_set()) are actually used; the
 * other names suggest per-feature output toggles set by option parsing --
 * TODO confirm against main().
 */
int resolve_hosts;
int resolve_services = 1;
int preferred_family = AF_UNSPEC;
int show_options;
int show_details;
int show_users;
int show_mem;
int show_tcpinfo;
int show_bpf;
int show_proc_ctx;
int show_sock_ctx;
int show_header = 1;
int follow_events;
/* Inode that is_sctp_assoc() compares each socket against; 0 never matches. */
int sctp_ino;

/*
 * Column widths used by the printing helpers. sock_state_print() skips the
 * netid or state column entirely when the corresponding width is zero.
 */
int netid_width;
int state_width;
int addr_width;
int serv_width;
/* Emitted by sock_state_print() right after the rq/wq columns. */
char *odd_width_pad = "";

/*
 * Protocol name strings. The service cache compares these by pointer
 * identity against dg_proto, so dg_proto is expected to point at one of
 * them (it is assigned outside the code reviewed here).
 */
static const char *TCP_PROTO = "tcp";
static const char *SCTP_PROTO = "sctp";
static const char *UDP_PROTO = "udp";
static const char *RAW_PROTO = "raw";
static const char *dg_proto;
118
/*
 * Socket tables that can be selected. Each enumerator is a bit position:
 * filter_db_set() records a selection as (1 << db) in struct filter.dbs,
 * and the entries index default_dbs[]. MAX_DB is the number of tables.
 */
enum {
	TCP_DB,
	DCCP_DB,
	UDP_DB,
	RAW_DB,
	UNIX_DG_DB,
	UNIX_ST_DB,
	UNIX_SQ_DB,
	PACKET_DG_DB,
	PACKET_R_DB,
	NETLINK_DB,
	SCTP_DB,
	VSOCK_ST_DB,
	VSOCK_DG_DB,
	MAX_DB
};

/* Bit masks grouping the tables above by address family / layer. */
#define PACKET_DBM ((1<<PACKET_DG_DB)|(1<<PACKET_R_DB))
#define UNIX_DBM ((1<<UNIX_DG_DB)|(1<<UNIX_ST_DB)|(1<<UNIX_SQ_DB))
#define ALL_DB ((1<<MAX_DB)-1)
#define INET_L4_DBM ((1<<TCP_DB)|(1<<UDP_DB)|(1<<DCCP_DB)|(1<<SCTP_DB))
#define INET_DBM (INET_L4_DBM | (1<<RAW_DB))
#define VSOCK_DBM ((1<<VSOCK_ST_DB)|(1<<VSOCK_DG_DB))
142
/*
 * Socket states. Each value is both an index into the sstate_name[] table
 * in sock_state_print() and a bit position in struct filter.states.
 */
enum {
	SS_UNKNOWN,
	SS_ESTABLISHED,
	SS_SYN_SENT,
	SS_SYN_RECV,
	SS_FIN_WAIT1,
	SS_FIN_WAIT2,
	SS_TIME_WAIT,
	SS_CLOSE,
	SS_CLOSE_WAIT,
	SS_LAST_ACK,
	SS_LISTEN,
	SS_CLOSING,
	SS_MAX
};

/* SCTP association states; used as indices into sctp_sstate_name[]. */
enum {
	SCTP_STATE_CLOSED = 0,
	SCTP_STATE_COOKIE_WAIT = 1,
	SCTP_STATE_COOKIE_ECHOED = 2,
	SCTP_STATE_ESTABLISHED = 3,
	SCTP_STATE_SHUTDOWN_PENDING = 4,
	SCTP_STATE_SHUTDOWN_SENT = 5,
	SCTP_STATE_SHUTDOWN_RECEIVED = 6,
	SCTP_STATE_SHUTDOWN_ACK_SENT = 7,
};

/* Mask with every SS_* state bit set. */
#define SS_ALL ((1 << SS_MAX) - 1)
/* Every state except LISTEN, CLOSE, TIME_WAIT and SYN_RECV. */
#define SS_CONN (SS_ALL & ~((1<<SS_LISTEN)|(1<<SS_CLOSE)|(1<<SS_TIME_WAIT)|(1<<SS_SYN_RECV)))
172
173 #include "ssfilter.h"
174
/*
 * Selection of what to show.
 *   dbs      - bitmask of *_DB table bits (1 << db)
 *   states   - bitmask of SS_* state bits
 *   families - bitmask of address families, built with FAMILY_MASK()
 *   f        - expression tree; not touched by the helpers in this part of
 *              the file (presumably evaluated via run_ssfilter() -- confirm)
 *   kill     - not used in the code reviewed here
 */
struct filter {
	int dbs;
	int states;
	uint64_t families;
	struct ssfilter *f;
	bool kill;
};

/* Bit for one address family in filter.families (64-bit to fit all AF_* values). */
#define FAMILY_MASK(family) ((uint64_t)1 << (family))
184
/*
 * Per-table defaults, indexed by *_DB value. filter_db_set() ORs in the
 * .states of a selected table and filter_merge_defaults() adds its
 * .families when none of them was requested explicitly.
 */
static const struct filter default_dbs[MAX_DB] = {
	[TCP_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
	},
	[DCCP_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
	},
	[UDP_DB] = {
		.states = (1 << SS_ESTABLISHED),
		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
	},
	[RAW_DB] = {
		.states = (1 << SS_ESTABLISHED),
		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
	},
	[UNIX_DG_DB] = {
		.states = (1 << SS_CLOSE),
		.families = FAMILY_MASK(AF_UNIX),
	},
	[UNIX_ST_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_UNIX),
	},
	[UNIX_SQ_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_UNIX),
	},
	[PACKET_DG_DB] = {
		.states = (1 << SS_CLOSE),
		.families = FAMILY_MASK(AF_PACKET),
	},
	[PACKET_R_DB] = {
		.states = (1 << SS_CLOSE),
		.families = FAMILY_MASK(AF_PACKET),
	},
	[NETLINK_DB] = {
		.states = (1 << SS_CLOSE),
		.families = FAMILY_MASK(AF_NETLINK),
	},
	[SCTP_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
	},
	[VSOCK_ST_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_VSOCK),
	},
	[VSOCK_DG_DB] = {
		.states = SS_CONN,
		.families = FAMILY_MASK(AF_VSOCK),
	},
};
239
/*
 * Per-family defaults, indexed by AF_* value. filter_af_set() ORs in the
 * .states of a selected family and filter_merge_defaults() adds its .dbs
 * when none of those tables was requested explicitly. Families without an
 * entry are zero-initialised.
 */
static const struct filter default_afs[AF_MAX] = {
	[AF_INET] = {
		.dbs = INET_DBM,
		.states = SS_CONN,
	},
	[AF_INET6] = {
		.dbs = INET_DBM,
		.states = SS_CONN,
	},
	[AF_UNIX] = {
		.dbs = UNIX_DBM,
		.states = SS_CONN,
	},
	[AF_PACKET] = {
		.dbs = PACKET_DBM,
		.states = (1 << SS_CLOSE),
	},
	[AF_NETLINK] = {
		.dbs = (1 << NETLINK_DB),
		.states = (1 << SS_CLOSE),
	},
	[AF_VSOCK] = {
		.dbs = VSOCK_DBM,
		.states = SS_CONN,
	},
};

/* Starts at 1; cleared by filter_db_set() and filter_af_set(). */
static int do_default = 1;
/* File-wide filter instance; not referenced in the code reviewed here. */
static struct filter current_filter;
269
270 static void filter_db_set(struct filter *f, int db)
271 {
272 f->states |= default_dbs[db].states;
273 f->dbs |= 1 << db;
274 do_default = 0;
275 }
276
277 static void filter_af_set(struct filter *f, int af)
278 {
279 f->states |= default_afs[af].states;
280 f->families |= FAMILY_MASK(af);
281 do_default = 0;
282 preferred_family = af;
283 }
284
285 static int filter_af_get(struct filter *f, int af)
286 {
287 return !!(f->families & FAMILY_MASK(af));
288 }
289
290 static void filter_default_dbs(struct filter *f)
291 {
292 filter_db_set(f, UDP_DB);
293 filter_db_set(f, DCCP_DB);
294 filter_db_set(f, TCP_DB);
295 filter_db_set(f, RAW_DB);
296 filter_db_set(f, UNIX_ST_DB);
297 filter_db_set(f, UNIX_DG_DB);
298 filter_db_set(f, UNIX_SQ_DB);
299 filter_db_set(f, PACKET_R_DB);
300 filter_db_set(f, PACKET_DG_DB);
301 filter_db_set(f, NETLINK_DB);
302 filter_db_set(f, SCTP_DB);
303 filter_db_set(f, VSOCK_ST_DB);
304 filter_db_set(f, VSOCK_DG_DB);
305 }
306
307 static void filter_states_set(struct filter *f, int states)
308 {
309 if (states)
310 f->states = states;
311 }
312
313 static void filter_merge_defaults(struct filter *f)
314 {
315 int db;
316 int af;
317
318 for (db = 0; db < MAX_DB; db++) {
319 if (!(f->dbs & (1 << db)))
320 continue;
321
322 if (!(default_dbs[db].families & f->families))
323 f->families |= default_dbs[db].families;
324 }
325 for (af = 0; af < AF_MAX; af++) {
326 if (!(f->families & FAMILY_MASK(af)))
327 continue;
328
329 if (!(default_afs[af].dbs & f->dbs))
330 f->dbs |= default_afs[af].dbs;
331 }
332 }
333
/*
 * Open a procfs-style file for reading.
 *
 * @env:  name of an environment variable which, when set, holds the full
 *        path to open (takes precedence over everything else)
 * @name: path relative to the proc root, used when @env is unset
 *
 * The proc root is $PROC_ROOT when set, "/proc" otherwise.
 *
 * Returns the stream from fopen(), or NULL on failure. When the composed
 * path does not fit the internal buffer, no file is opened and errno is set
 * to ENAMETOOLONG instead of silently opening a truncated path.
 */
static FILE *generic_proc_open(const char *env, const char *name)
{
	const char *path = getenv(env);
	char store[128];

	if (!path) {
		const char *root = getenv("PROC_ROOT");
		int len;

		if (!root)
			root = "/proc";

		len = snprintf(store, sizeof(store), "%s/%s", root, name);
		if (len < 0 || (size_t)len >= sizeof(store)) {
			errno = ENAMETOOLONG;
			return NULL;
		}
		path = store;
	}

	return fopen(path, "r");
}
/*
 * Convenience openers built on generic_proc_open(). The first argument is
 * the environment variable that may override the full path; the second is
 * the file's path relative to the proc root.
 */
#define net_tcp_open() generic_proc_open("PROC_NET_TCP", "net/tcp")
#define net_tcp6_open() generic_proc_open("PROC_NET_TCP6", "net/tcp6")
#define net_udp_open() generic_proc_open("PROC_NET_UDP", "net/udp")
#define net_udp6_open() generic_proc_open("PROC_NET_UDP6", "net/udp6")
#define net_raw_open() generic_proc_open("PROC_NET_RAW", "net/raw")
#define net_raw6_open() generic_proc_open("PROC_NET_RAW6", "net/raw6")
#define net_unix_open() generic_proc_open("PROC_NET_UNIX", "net/unix")
#define net_packet_open() generic_proc_open("PROC_NET_PACKET", \
	"net/packet")
#define net_netlink_open() generic_proc_open("PROC_NET_NETLINK", \
	"net/netlink")
#define slabinfo_open() generic_proc_open("PROC_SLABINFO", "slabinfo")
#define net_sockstat_open() generic_proc_open("PROC_NET_SOCKSTAT", \
	"net/sockstat")
#define net_sockstat6_open() generic_proc_open("PROC_NET_SOCKSTAT6", \
	"net/sockstat6")
#define net_snmp_open() generic_proc_open("PROC_NET_SNMP", "net/snmp")
#define ephemeral_ports_open() generic_proc_open("PROC_IP_LOCAL_PORT_RANGE", \
	"sys/net/ipv4/ip_local_port_range")
366
/*
 * One (process, file descriptor) pair that refers to a socket inode.
 * Entries are created by user_ent_add() and chained per hash bucket; the
 * three strings are heap copies released by user_ent_destroy().
 */
struct user_ent {
	struct user_ent *next;	/* next entry in the same bucket */
	unsigned int ino;	/* socket inode number (hash key) */
	int pid;
	int fd;
	char *process;		/* process name */
	char *process_ctx;	/* context string recorded for the process */
	char *socket_ctx;	/* context string recorded for the socket fd */
};
376
#define USER_ENT_HASH_SIZE	256
struct user_ent *user_ent_hash[USER_ENT_HASH_SIZE];

/*
 * Map an inode number to a bucket of user_ent_hash[] by XOR-folding the
 * value with itself shifted right by 8, 16 and 24 bits and keeping the low
 * bits that fit the table size.
 */
static int user_ent_hashfn(unsigned int ino)
{
	unsigned int folded = ino;

	folded ^= ino >> 8;
	folded ^= ino >> 16;
	folded ^= ino >> 24;

	return (int)(folded & (USER_ENT_HASH_SIZE - 1));
}
386
387 static void user_ent_add(unsigned int ino, char *process,
388 int pid, int fd,
389 char *proc_ctx,
390 char *sock_ctx)
391 {
392 struct user_ent *p, **pp;
393
394 p = malloc(sizeof(struct user_ent));
395 if (!p) {
396 fprintf(stderr, "ss: failed to malloc buffer\n");
397 abort();
398 }
399 p->next = NULL;
400 p->ino = ino;
401 p->pid = pid;
402 p->fd = fd;
403 p->process = strdup(process);
404 p->process_ctx = strdup(proc_ctx);
405 p->socket_ctx = strdup(sock_ctx);
406
407 pp = &user_ent_hash[user_ent_hashfn(ino)];
408 p->next = *pp;
409 *pp = p;
410 }
411
412 static void user_ent_destroy(void)
413 {
414 struct user_ent *p, *p_next;
415 int cnt = 0;
416
417 while (cnt != USER_ENT_HASH_SIZE) {
418 p = user_ent_hash[cnt];
419 while (p) {
420 free(p->process);
421 free(p->process_ctx);
422 free(p->socket_ctx);
423 p_next = p->next;
424 free(p);
425 p = p_next;
426 }
427 cnt++;
428 }
429 }
430
/*
 * Populate user_ent_hash[] by walking the proc tree.
 *
 * For every numeric directory <pid> under the proc root ($PROC_ROOT or
 * "/proc/"), each numeric entry in <pid>/fd is read as a symlink; those
 * whose target starts with "socket:[" yield one user_ent_add() call with
 * the inode number parsed from the link. The process name is read once per
 * process from <pid>/stat. Context strings come from getpidcon() and
 * getfilecon(), falling back to "unavailable".
 *
 * The scan runs only on the first call; later calls return immediately.
 * Directories or links that cannot be opened/read are skipped silently.
 */
static void user_ent_hash_build(void)
{
	const char *root = getenv("PROC_ROOT") ? : "/proc/";
	struct dirent *d;
	char name[1024];
	size_t rootlen;
	int nameoff;
	DIR *dir;
	char *pid_context;
	char *sock_context;
	const char *no_ctx = "unavailable";
	static int user_ent_hash_build_init;

	/* If show_users & show_proc_ctx set only do this once */
	if (user_ent_hash_build_init != 0)
		return;

	user_ent_hash_build_init = 1;

	strlcpy(name, root, sizeof(name));

	rootlen = strlen(name);
	if (rootlen == 0 || name[rootlen - 1] != '/') {
		/* Need room for the separator plus the terminating NUL. */
		if (rootlen + 2 > sizeof(name))
			return;
		name[rootlen++] = '/';
		name[rootlen] = '\0';
	}

	nameoff = rootlen;

	dir = opendir(name);
	if (!dir)
		return;

	while ((d = readdir(dir)) != NULL) {
		struct dirent *d1;
		char process[16];
		char *p;
		int pid, pos;
		DIR *dir1;
		char crap;

		/* Only purely numeric names are process directories. */
		if (sscanf(d->d_name, "%d%c", &pid, &crap) != 1)
			continue;

		if (getpidcon(pid, &pid_context) != 0)
			pid_context = strdup(no_ctx);

		snprintf(name + nameoff, sizeof(name) - nameoff, "%d/fd/", pid);
		pos = strlen(name);
		if ((dir1 = opendir(name)) == NULL) {
			free(pid_context);
			continue;
		}

		process[0] = '\0';
		p = process;

		while ((d1 = readdir(dir1)) != NULL) {
			const char *pattern = "socket:[";
			unsigned int ino;
			char lnk[64];
			int fd;
			ssize_t link_len;
			char tmp[1024];

			if (sscanf(d1->d_name, "%d%c", &fd, &crap) != 1)
				continue;

			snprintf(name+pos, sizeof(name) - pos, "%d", fd);

			link_len = readlink(name, lnk, sizeof(lnk)-1);
			if (link_len == -1)
				continue;
			lnk[link_len] = '\0';

			if (strncmp(lnk, pattern, strlen(pattern)))
				continue;

			/* Skip links without a parsable inode instead of
			 * recording an uninitialised value.
			 */
			if (sscanf(lnk, "socket:[%u]", &ino) != 1)
				continue;

			snprintf(tmp, sizeof(tmp), "%s/%d/fd/%s",
				 root, pid, d1->d_name);

			if (getfilecon(tmp, &sock_context) <= 0)
				sock_context = strdup(no_ctx);

			/* Process name not fetched yet for this pid. */
			if (*p == '\0') {
				FILE *fp;

				snprintf(tmp, sizeof(tmp), "%s/%d/stat",
					 root, pid);
				if ((fp = fopen(tmp, "r")) != NULL) {
					/* Width keeps the name within process[16]. */
					if (fscanf(fp, "%*d (%15[^)])", p) < 1)
						; /* ignore */
					fclose(fp);
				}
			}
			user_ent_add(ino, p, pid, fd,
				     pid_context, sock_context);
			free(sock_context);
		}
		free(pid_context);
		closedir(dir1);
	}
	closedir(dir);
}
533
534 enum entry_types {
535 USERS,
536 PROC_CTX,
537 PROC_SOCK_CTX
538 };
539
540 #define ENTRY_BUF_SIZE 512
541 static int find_entry(unsigned int ino, char **buf, int type)
542 {
543 struct user_ent *p;
544 int cnt = 0;
545 char *ptr;
546 char *new_buf;
547 int len, new_buf_len;
548 int buf_used = 0;
549 int buf_len = 0;
550
551 if (!ino)
552 return 0;
553
554 p = user_ent_hash[user_ent_hashfn(ino)];
555 ptr = *buf = NULL;
556 while (p) {
557 if (p->ino != ino)
558 goto next;
559
560 while (1) {
561 ptr = *buf + buf_used;
562 switch (type) {
563 case USERS:
564 len = snprintf(ptr, buf_len - buf_used,
565 "(\"%s\",pid=%d,fd=%d),",
566 p->process, p->pid, p->fd);
567 break;
568 case PROC_CTX:
569 len = snprintf(ptr, buf_len - buf_used,
570 "(\"%s\",pid=%d,proc_ctx=%s,fd=%d),",
571 p->process, p->pid,
572 p->process_ctx, p->fd);
573 break;
574 case PROC_SOCK_CTX:
575 len = snprintf(ptr, buf_len - buf_used,
576 "(\"%s\",pid=%d,proc_ctx=%s,fd=%d,sock_ctx=%s),",
577 p->process, p->pid,
578 p->process_ctx, p->fd,
579 p->socket_ctx);
580 break;
581 default:
582 fprintf(stderr, "ss: invalid type: %d\n", type);
583 abort();
584 }
585
586 if (len < 0 || len >= buf_len - buf_used) {
587 new_buf_len = buf_len + ENTRY_BUF_SIZE;
588 new_buf = realloc(*buf, new_buf_len);
589 if (!new_buf) {
590 fprintf(stderr, "ss: failed to malloc buffer\n");
591 abort();
592 }
593 *buf = new_buf;
594 buf_len = new_buf_len;
595 continue;
596 } else {
597 buf_used += len;
598 break;
599 }
600 }
601 cnt++;
602 next:
603 p = p->next;
604 }
605 if (buf_used) {
606 ptr = *buf + buf_used;
607 ptr[-1] = '\0';
608 }
609 return cnt;
610 }
611
/*
 * Slab statistics. get_slabstat() fills the members positionally, treating
 * the struct as an array of int, so the member order must match the order
 * of slabstat_ids[] below.
 */
struct slabstat {
	int socks;
	int tcp_ports;
	int tcp_tws;
	int tcp_syns;
	int skbs;
};

static struct slabstat slabstat;

/*
 * Read slab object counts into @s from the file opened by slabinfo_open().
 *
 * The first line of the file is read and discarded. Each following line
 * whose beginning matches one of the known cache names has the integer
 * after the name stored into the corresponding member of @s. Reading stops
 * once as many matches as there are members have been seen.
 *
 * Returns 0 on success (and immediately on any call after the first
 * successful one, leaving @s alone), -1 when the file cannot be opened or
 * is empty; in the failure case @s has been zeroed.
 */
static int get_slabstat(struct slabstat *s)
{
	static const char * const slabstat_ids[] = {
		"sock",
		"tcp_bind_bucket",
		"tcp_tw_bucket",
		"tcp_open_request",
		"skbuff_head_cache",
	};
	static int slabstat_valid;
	int *counters = (int *)s;
	int remaining = sizeof(*s)/sizeof(int);
	char line[256];
	FILE *fp;

	if (slabstat_valid)
		return 0;

	memset(s, 0, sizeof(*s));

	fp = slabinfo_open();
	if (!fp)
		return -1;

	if (!fgets(line, sizeof(line), fp)) {
		fclose(fp);
		return -1;
	}

	while (remaining > 0 && fgets(line, sizeof(line), fp) != NULL) {
		int idx;

		for (idx = 0; idx < ARRAY_SIZE(slabstat_ids); idx++) {
			const char *id = slabstat_ids[idx];

			if (memcmp(line, id, strlen(id)) != 0)
				continue;

			sscanf(line, "%*s%d", counters + idx);
			remaining--;
			break;
		}
	}

	slabstat_valid = 1;

	fclose(fp);
	return 0;
}
672
/*
 * Combine a two-word cookie into one 64-bit value: cookie[1] supplies the
 * upper 32 bits and cookie[0] the lower 32 bits.
 */
static unsigned long long cookie_sk_get(const uint32_t *cookie)
{
	unsigned long long upper = cookie[1];
	unsigned long long lower = cookie[0];

	return (upper << 32) | lower;
}
677
/*
 * Display names for SCTP association states, indexed by SCTP_STATE_*.
 * sock_state_print() uses this table for sockets recognised as SCTP
 * associations.
 */
static const char *sctp_sstate_name[] = {
	[SCTP_STATE_CLOSED] = "CLOSED",
	[SCTP_STATE_COOKIE_WAIT] = "COOKIE_WAIT",
	[SCTP_STATE_COOKIE_ECHOED] = "COOKIE_ECHOED",
	[SCTP_STATE_ESTABLISHED] = "ESTAB",
	[SCTP_STATE_SHUTDOWN_PENDING] = "SHUTDOWN_PENDING",
	[SCTP_STATE_SHUTDOWN_SENT] = "SHUTDOWN_SENT",
	[SCTP_STATE_SHUTDOWN_RECEIVED] = "SHUTDOWN_RECEIVED",
	[SCTP_STATE_SHUTDOWN_ACK_SENT] = "ACK_SENT",
};
688
/*
 * Family-independent description of one socket, as consumed by the
 * printing and filtering helpers in this file.
 */
struct sockstat {
	struct sockstat *next;
	unsigned int type;	/* socket type or protocol, depending on family
				 * (see the switch in sock_state_print()) */
	uint16_t prot;
	uint16_t raw_prot;
	inet_prefix local;	/* for AF_UNIX the data words carry a char
				 * pointer (see unix_match()) */
	inet_prefix remote;
	int lport;
	int rport;
	int state;		/* SS_* value, or SCTP_STATE_* for SCTP assocs */
	int rq, wq;		/* printed as the two queue columns */
	unsigned int ino;
	unsigned int uid;
	int refcnt;
	unsigned int iface;	/* compared against aafilter.iface */
	unsigned long long sk;	/* printed as "sk:" in hex */
	char *name;
	char *peer_name;
	__u32 mark;		/* printed as "fwmark:" when non-zero */
};

/* DCTCP details attached to a tcpstat; not used in the code reviewed here. */
struct dctcpstat {
	unsigned int ce_state;
	unsigned int alpha;
	unsigned int ab_ecn;
	unsigned int ab_tot;
	bool enabled;
};

/*
 * TCP-specific statistics wrapped around a struct sockstat. None of these
 * members is read or written in the code reviewed here; names presumably
 * mirror the kernel's tcp_info fields -- confirm against the code that
 * fills them.
 */
struct tcpstat {
	struct sockstat ss;
	unsigned int timer;
	unsigned int timeout;
	int probes;
	char cong_alg[16];
	double rto, ato, rtt, rttvar;
	int qack, ssthresh, backoff;
	double send_bps;
	int snd_wscale;
	int rcv_wscale;
	int mss;
	int rcv_mss;
	int advmss;
	unsigned int cwnd;
	unsigned int lastsnd;
	unsigned int lastrcv;
	unsigned int lastack;
	double pacing_rate;
	double pacing_rate_max;
	double delivery_rate;
	unsigned long long bytes_acked;
	unsigned long long bytes_received;
	unsigned int segs_out;
	unsigned int segs_in;
	unsigned int data_segs_out;
	unsigned int data_segs_in;
	unsigned int unacked;
	unsigned int retrans;
	unsigned int retrans_total;
	unsigned int lost;
	unsigned int sacked;
	unsigned int fackets;
	unsigned int reordering;
	unsigned int not_sent;
	double rcv_rtt;
	double min_rtt;
	int rcv_space;
	unsigned long long busy_time;
	unsigned long long rwnd_limited;
	unsigned long long sndbuf_limited;
	bool has_ts_opt;
	bool has_sack_opt;
	bool has_ecn_opt;
	bool has_ecnseen_opt;
	bool has_fastopen_opt;
	bool has_wscale_opt;
	bool app_limited;
	struct dctcpstat *dctcp;
	struct tcp_bbr_info *bbr_info;
};
769
770 /* SCTP assocs share the same inode number with their parent endpoint. So if we
771 * have seen the inode number before, it must be an assoc instead of the next
772 * endpoint. */
773 static bool is_sctp_assoc(struct sockstat *s, const char *sock_name)
774 {
775 if (strcmp(sock_name, "sctp"))
776 return false;
777 if (!sctp_ino || sctp_ino != s->ino)
778 return false;
779 return true;
780 }
781
/*
 * Netid label for a UNIX socket of the given type: "u_str" for stream,
 * "u_seq" for seqpacket, and "u_dgr" for datagram or anything else.
 */
static const char *unix_netid_name(int type)
{
	if (type == SOCK_STREAM)
		return "u_str";
	if (type == SOCK_SEQPACKET)
		return "u_seq";

	return "u_dgr";
}
794
/*
 * Netid label for an IP protocol number. Protocol 0 is shown as "raw";
 * protocols without an entry in the table yield "???".
 */
static const char *proto_name(int protocol)
{
	static const struct {
		int proto;
		const char *label;
	} known[] = {
		{ 0,			"raw" },
		{ IPPROTO_UDP,		"udp" },
		{ IPPROTO_TCP,		"tcp" },
		{ IPPROTO_SCTP,		"sctp" },
		{ IPPROTO_DCCP,		"dccp" },
		{ IPPROTO_ICMPV6,	"icmp6" },
	};
	unsigned int i;

	for (i = 0; i < sizeof(known) / sizeof(known[0]); i++) {
		if (known[i].proto == protocol)
			return known[i].label;
	}

	return "???";
}
814
/*
 * Netid label for a vsock socket of the given type: "v_str" for stream,
 * "v_dgr" for datagram, "???" for any other type.
 */
static const char *vsock_netid_name(int type)
{
	if (type == SOCK_STREAM)
		return "v_str";
	if (type == SOCK_DGRAM)
		return "v_dgr";

	return "???";
}
826
827 static void sock_state_print(struct sockstat *s)
828 {
829 const char *sock_name;
830 static const char * const sstate_name[] = {
831 "UNKNOWN",
832 [SS_ESTABLISHED] = "ESTAB",
833 [SS_SYN_SENT] = "SYN-SENT",
834 [SS_SYN_RECV] = "SYN-RECV",
835 [SS_FIN_WAIT1] = "FIN-WAIT-1",
836 [SS_FIN_WAIT2] = "FIN-WAIT-2",
837 [SS_TIME_WAIT] = "TIME-WAIT",
838 [SS_CLOSE] = "UNCONN",
839 [SS_CLOSE_WAIT] = "CLOSE-WAIT",
840 [SS_LAST_ACK] = "LAST-ACK",
841 [SS_LISTEN] = "LISTEN",
842 [SS_CLOSING] = "CLOSING",
843 };
844
845 switch (s->local.family) {
846 case AF_UNIX:
847 sock_name = unix_netid_name(s->type);
848 break;
849 case AF_INET:
850 case AF_INET6:
851 sock_name = proto_name(s->type);
852 break;
853 case AF_PACKET:
854 sock_name = s->type == SOCK_RAW ? "p_raw" : "p_dgr";
855 break;
856 case AF_NETLINK:
857 sock_name = "nl";
858 break;
859 case AF_VSOCK:
860 sock_name = vsock_netid_name(s->type);
861 break;
862 default:
863 sock_name = "unknown";
864 }
865
866 if (netid_width)
867 printf("%-*s ", netid_width,
868 is_sctp_assoc(s, sock_name) ? "" : sock_name);
869 if (state_width) {
870 if (is_sctp_assoc(s, sock_name))
871 printf("`- %-*s ", state_width - 3,
872 sctp_sstate_name[s->state]);
873 else
874 printf("%-*s ", state_width, sstate_name[s->state]);
875 }
876
877 printf("%-6d %-6d %s", s->rq, s->wq, odd_width_pad);
878 }
879
880 static void sock_details_print(struct sockstat *s)
881 {
882 if (s->uid)
883 printf(" uid:%u", s->uid);
884
885 printf(" ino:%u", s->ino);
886 printf(" sk:%llx", s->sk);
887
888 if (s->mark)
889 printf(" fwmark:0x%x", s->mark);
890 }
891
/*
 * Print "<addr><delim><port> " with the address right-aligned in
 * @addr_len columns and the port left-aligned in @port_len columns.
 * When @ifname is given, "%<ifname>" is inserted between the address and
 * the delimiter.
 */
static void sock_addr_print_width(int addr_len, const char *addr, char *delim,
				  int port_len, const char *port, const char *ifname)
{
	if (!ifname) {
		printf("%*s%s%-*s ", addr_len, addr, delim, port_len, port);
		return;
	}

	printf("%*s%%%s%s%-*s ", addr_len, addr, ifname, delim,
	       port_len, port);
}
902
903 static void sock_addr_print(const char *addr, char *delim, const char *port,
904 const char *ifname)
905 {
906 sock_addr_print_width(addr_width, addr, delim, serv_width, port, ifname);
907 }
908
/*
 * Render a duration given in milliseconds as a short human-readable
 * string such as "500ms", "1.500ms", "10sec", "1min1sec" or "10min".
 *
 * Precision shrinks as the value grows: milliseconds are dropped once the
 * duration reaches a minute or the seconds part exceeds 9, and seconds are
 * dropped beyond 9 minutes. A zero duration gives an empty string.
 *
 * Returns a pointer to a static buffer that the next call overwrites.
 */
static const char *print_ms_timer(unsigned int timeout)
{
	static char buf[64];
	int total_secs = timeout / 1000;
	int msecs = timeout % 1000;
	int minutes = total_secs / 60;
	int secs = total_secs % 60;
	char *out = buf;

	*out = '\0';

	if (minutes) {
		msecs = 0;
		if (minutes > 9)
			secs = 0;
		snprintf(out, sizeof(buf)-16, "%dmin", minutes);
		out += strlen(out);
	}

	if (secs) {
		if (secs > 9)
			msecs = 0;
		/* A "." means a millisecond part follows. */
		out += sprintf(out, "%d%s", secs, msecs ? "." : "sec");
	}

	if (msecs)
		sprintf(out, "%03dms", msecs);

	return buf;
}
934
/*
 * One port-to-name mapping. Used both for the list filled by
 * init_service_resolver() and for the lookup cache in resolve_service().
 */
struct scache {
	struct scache *next;
	int port;
	char *name;		/* heap string, or NULL when no name is known */
	const char *proto;	/* one of the *_PROTO pointers, compared by
				 * identity; may be NULL */
};

/* Head of the list built by init_service_resolver(). */
struct scache *rlist;
943
944 static void init_service_resolver(void)
945 {
946 char buf[128];
947 FILE *fp = popen("/usr/sbin/rpcinfo -p 2>/dev/null", "r");
948
949 if (!fp)
950 return;
951
952 if (!fgets(buf, sizeof(buf), fp)) {
953 pclose(fp);
954 return;
955 }
956 while (fgets(buf, sizeof(buf), fp) != NULL) {
957 unsigned int progn, port;
958 char proto[128], prog[128] = "rpc.";
959 struct scache *c;
960
961 if (sscanf(buf, "%u %*d %s %u %s",
962 &progn, proto, &port, prog+4) != 4)
963 continue;
964
965 if (!(c = malloc(sizeof(*c))))
966 continue;
967
968 c->port = port;
969 c->name = strdup(prog);
970 if (strcmp(proto, TCP_PROTO) == 0)
971 c->proto = TCP_PROTO;
972 else if (strcmp(proto, UDP_PROTO) == 0)
973 c->proto = UDP_PROTO;
974 else if (strcmp(proto, SCTP_PROTO) == 0)
975 c->proto = SCTP_PROTO;
976 else
977 c->proto = NULL;
978 c->next = rlist;
979 rlist = c;
980 }
981 pclose(fp);
982 }
983
/*
 * Tell whether @port lies in the local ephemeral port range.
 *
 * Service names are deliberately not resolved for such ports: the stock
 * /etc/services assigns plenty of names inside this range, and showing
 * them (e.g. "socks" or "cfinger") for ordinary client ports is misleading.
 *
 * The range is read once from the file opened by ephemeral_ports_open();
 * when that is unavailable or unparsable, 1024-4999 is assumed.
 */
static int is_ephemeral(int port)
{
	static int min = 0, max;

	if (min == 0) {
		FILE *f = ephemeral_ports_open();
		int parsed = f ? fscanf(f, "%d %d", &min, &max) : 0;

		if (parsed < 2) {
			min = 1024;
			max = 4999;
		}
		if (f)
			fclose(f);
	}

	return min <= port && port <= max;
}
1006
1007
1008 static const char *__resolve_service(int port)
1009 {
1010 struct scache *c;
1011
1012 for (c = rlist; c; c = c->next) {
1013 if (c->port == port && c->proto == dg_proto)
1014 return c->name;
1015 }
1016
1017 if (!is_ephemeral(port)) {
1018 static int notfirst;
1019 struct servent *se;
1020
1021 if (!notfirst) {
1022 setservent(1);
1023 notfirst = 1;
1024 }
1025 se = getservbyport(htons(port), dg_proto);
1026 if (se)
1027 return se->s_name;
1028 }
1029
1030 return NULL;
1031 }
1032
1033 #define SCACHE_BUCKETS 1024
1034 static struct scache *cache_htab[SCACHE_BUCKETS];
1035
1036 static const char *resolve_service(int port)
1037 {
1038 static char buf[128];
1039 struct scache *c;
1040 const char *res;
1041 int hash;
1042
1043 if (port == 0) {
1044 buf[0] = '*';
1045 buf[1] = 0;
1046 return buf;
1047 }
1048
1049 if (!resolve_services)
1050 goto do_numeric;
1051
1052 if (dg_proto == RAW_PROTO)
1053 return inet_proto_n2a(port, buf, sizeof(buf));
1054
1055
1056 hash = (port^(((unsigned long)dg_proto)>>2)) % SCACHE_BUCKETS;
1057
1058 for (c = cache_htab[hash]; c; c = c->next) {
1059 if (c->port == port && c->proto == dg_proto)
1060 goto do_cache;
1061 }
1062
1063 c = malloc(sizeof(*c));
1064 if (!c)
1065 goto do_numeric;
1066 res = __resolve_service(port);
1067 c->port = port;
1068 c->name = res ? strdup(res) : NULL;
1069 c->proto = dg_proto;
1070 c->next = cache_htab[hash];
1071 cache_htab[hash] = c;
1072
1073 do_cache:
1074 if (c->name)
1075 return c->name;
1076
1077 do_numeric:
1078 sprintf(buf, "%u", port);
1079 return buf;
1080 }
1081
1082 static void inet_addr_print(const inet_prefix *a, int port,
1083 unsigned int ifindex, bool v6only)
1084 {
1085 char buf[1024];
1086 const char *ap = buf;
1087 int est_len = addr_width;
1088 const char *ifname = NULL;
1089
1090 if (a->family == AF_INET) {
1091 ap = format_host(AF_INET, 4, a->data);
1092 } else {
1093 if (!v6only &&
1094 !memcmp(a->data, &in6addr_any, sizeof(in6addr_any))) {
1095 buf[0] = '*';
1096 buf[1] = 0;
1097 } else {
1098 ap = format_host(a->family, 16, a->data);
1099
1100 /* Numeric IPv6 addresses should be bracketed */
1101 if (strchr(ap, ':')) {
1102 snprintf(buf, sizeof(buf),
1103 "[%s]", ap);
1104 ap = buf;
1105 }
1106
1107 est_len = strlen(ap);
1108 if (est_len <= addr_width)
1109 est_len = addr_width;
1110 else
1111 est_len = addr_width + ((est_len-addr_width+3)/4)*4;
1112 }
1113 }
1114
1115 if (ifindex) {
1116 ifname = ll_index_to_name(ifindex);
1117 est_len -= strlen(ifname) + 1; /* +1 for percent char */
1118 if (est_len < 0)
1119 est_len = 0;
1120 }
1121
1122 sock_addr_print_width(est_len, ap, ":", serv_width, resolve_service(port),
1123 ifname);
1124 }
1125
/*
 * Operand of a leaf filter condition (reached through ssfilter.pred).
 * Which members matter depends on the condition type; see run_ssfilter().
 */
struct aafilter {
	inet_prefix addr;	/* address/prefix; bitlen 0 means "any" */
	int port;		/* -1 means "any port" for address conditions */
	unsigned int iface;	/* compared with sockstat.iface */
	__u32 mark;		/* expected value of (sockstat.mark & mask) */
	__u32 mask;
	struct aafilter *next;	/* further alternative addresses */
};
1134
1135 static int inet2_addr_match(const inet_prefix *a, const inet_prefix *p,
1136 int plen)
1137 {
1138 if (!inet_addr_match(a, p, plen))
1139 return 0;
1140
1141 /* Cursed "v4 mapped" addresses: v4 mapped socket matches
1142 * pure IPv4 rule, but v4-mapped rule selects only v4-mapped
1143 * sockets. Fair? */
1144 if (p->family == AF_INET && a->family == AF_INET6) {
1145 if (a->data[0] == 0 && a->data[1] == 0 &&
1146 a->data[2] == htonl(0xffff)) {
1147 inet_prefix tmp = *a;
1148
1149 tmp.data[0] = a->data[3];
1150 return inet_addr_match(&tmp, p, plen);
1151 }
1152 }
1153 return 1;
1154 }
1155
1156 static int unix_match(const inet_prefix *a, const inet_prefix *p)
1157 {
1158 char *addr, *pattern;
1159
1160 memcpy(&addr, a->data, sizeof(addr));
1161 memcpy(&pattern, p->data, sizeof(pattern));
1162 if (pattern == NULL)
1163 return 1;
1164 if (addr == NULL)
1165 addr = "";
1166 return !fnmatch(pattern, addr, 0);
1167 }
1168
1169 static int run_ssfilter(struct ssfilter *f, struct sockstat *s)
1170 {
1171 switch (f->type) {
1172 case SSF_S_AUTO:
1173 {
1174 if (s->local.family == AF_UNIX) {
1175 char *p;
1176
1177 memcpy(&p, s->local.data, sizeof(p));
1178 return p == NULL || (p[0] == '@' && strlen(p) == 6 &&
1179 strspn(p+1, "0123456789abcdef") == 5);
1180 }
1181 if (s->local.family == AF_PACKET)
1182 return s->lport == 0 && s->local.data[0] == 0;
1183 if (s->local.family == AF_NETLINK)
1184 return s->lport < 0;
1185 if (s->local.family == AF_VSOCK)
1186 return s->lport > 1023;
1187
1188 return is_ephemeral(s->lport);
1189 }
1190 case SSF_DCOND:
1191 {
1192 struct aafilter *a = (void *)f->pred;
1193
1194 if (a->addr.family == AF_UNIX)
1195 return unix_match(&s->remote, &a->addr);
1196 if (a->port != -1 && a->port != s->rport)
1197 return 0;
1198 if (a->addr.bitlen) {
1199 do {
1200 if (!inet2_addr_match(&s->remote, &a->addr, a->addr.bitlen))
1201 return 1;
1202 } while ((a = a->next) != NULL);
1203 return 0;
1204 }
1205 return 1;
1206 }
1207 case SSF_SCOND:
1208 {
1209 struct aafilter *a = (void *)f->pred;
1210
1211 if (a->addr.family == AF_UNIX)
1212 return unix_match(&s->local, &a->addr);
1213 if (a->port != -1 && a->port != s->lport)
1214 return 0;
1215 if (a->addr.bitlen) {
1216 do {
1217 if (!inet2_addr_match(&s->local, &a->addr, a->addr.bitlen))
1218 return 1;
1219 } while ((a = a->next) != NULL);
1220 return 0;
1221 }
1222 return 1;
1223 }
1224 case SSF_D_GE:
1225 {
1226 struct aafilter *a = (void *)f->pred;
1227
1228 return s->rport >= a->port;
1229 }
1230 case SSF_D_LE:
1231 {
1232 struct aafilter *a = (void *)f->pred;
1233
1234 return s->rport <= a->port;
1235 }
1236 case SSF_S_GE:
1237 {
1238 struct aafilter *a = (void *)f->pred;
1239
1240 return s->lport >= a->port;
1241 }
1242 case SSF_S_LE:
1243 {
1244 struct aafilter *a = (void *)f->pred;
1245
1246 return s->lport <= a->port;
1247 }
1248 case SSF_DEVCOND:
1249 {
1250 struct aafilter *a = (void *)f->pred;
1251
1252 return s->iface == a->iface;
1253 }
1254 case SSF_MARKMASK:
1255 {
1256 struct aafilter *a = (void *)f->pred;
1257
1258 return (s->mark & a->mask) == a->mark;
1259 }
1260 /* Yup. It is recursion. Sorry. */
1261 case SSF_AND:
1262 return run_ssfilter(f->pred, s) && run_ssfilter(f->post, s);
1263 case SSF_OR:
1264 return run_ssfilter(f->pred, s) || run_ssfilter(f->post, s);
1265 case SSF_NOT:
1266 return !run_ssfilter(f->pred, s);
1267 default:
1268 abort();
1269 }
1270 }
1271
1272 /* Relocate external jumps by reloc. */
1273 static void ssfilter_patch(char *a, int len, int reloc)
1274 {
1275 while (len > 0) {
1276 struct inet_diag_bc_op *op = (struct inet_diag_bc_op *)a;
1277
1278 if (op->no == len+4)
1279 op->no += reloc;
1280 len -= op->yes;
1281 a += op->yes;
1282 }
1283 if (len < 0)
1284 abort();
1285 }
1286
1287 static int ssfilter_bytecompile(struct ssfilter *f, char **bytecode)
1288 {
1289 switch (f->type) {
1290 case SSF_S_AUTO:
1291 {
1292 if (!(*bytecode = malloc(4))) abort();
1293 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_AUTO, 4, 8 };
1294 return 4;
1295 }
1296 case SSF_DCOND:
1297 case SSF_SCOND:
1298 {
1299 struct aafilter *a = (void *)f->pred;
1300 struct aafilter *b;
1301 char *ptr;
1302 int code = (f->type == SSF_DCOND ? INET_DIAG_BC_D_COND : INET_DIAG_BC_S_COND);
1303 int len = 0;
1304
1305 for (b = a; b; b = b->next) {
1306 len += 4 + sizeof(struct inet_diag_hostcond);
1307 if (a->addr.family == AF_INET6)
1308 len += 16;
1309 else
1310 len += 4;
1311 if (b->next)
1312 len += 4;
1313 }
1314 if (!(ptr = malloc(len))) abort();
1315 *bytecode = ptr;
1316 for (b = a; b; b = b->next) {
1317 struct inet_diag_bc_op *op = (struct inet_diag_bc_op *)ptr;
1318 int alen = (a->addr.family == AF_INET6 ? 16 : 4);
1319 int oplen = alen + 4 + sizeof(struct inet_diag_hostcond);
1320 struct inet_diag_hostcond *cond = (struct inet_diag_hostcond *)(ptr+4);
1321
1322 *op = (struct inet_diag_bc_op){ code, oplen, oplen+4 };
1323 cond->family = a->addr.family;
1324 cond->port = a->port;
1325 cond->prefix_len = a->addr.bitlen;
1326 memcpy(cond->addr, a->addr.data, alen);
1327 ptr += oplen;
1328 if (b->next) {
1329 op = (struct inet_diag_bc_op *)ptr;
1330 *op = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, len - (ptr-*bytecode)};
1331 ptr += 4;
1332 }
1333 }
1334 return ptr - *bytecode;
1335 }
1336 case SSF_D_GE:
1337 {
1338 struct aafilter *x = (void *)f->pred;
1339
1340 if (!(*bytecode = malloc(8))) abort();
1341 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_D_GE, 8, 12 };
1342 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1343 return 8;
1344 }
1345 case SSF_D_LE:
1346 {
1347 struct aafilter *x = (void *)f->pred;
1348
1349 if (!(*bytecode = malloc(8))) abort();
1350 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_D_LE, 8, 12 };
1351 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1352 return 8;
1353 }
1354 case SSF_S_GE:
1355 {
1356 struct aafilter *x = (void *)f->pred;
1357
1358 if (!(*bytecode = malloc(8))) abort();
1359 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_S_GE, 8, 12 };
1360 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1361 return 8;
1362 }
1363 case SSF_S_LE:
1364 {
1365 struct aafilter *x = (void *)f->pred;
1366
1367 if (!(*bytecode = malloc(8))) abort();
1368 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_S_LE, 8, 12 };
1369 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1370 return 8;
1371 }
1372
1373 case SSF_AND:
1374 {
1375 char *a1 = NULL, *a2 = NULL, *a;
1376 int l1, l2;
1377
1378 l1 = ssfilter_bytecompile(f->pred, &a1);
1379 l2 = ssfilter_bytecompile(f->post, &a2);
1380 if (!l1 || !l2) {
1381 free(a1);
1382 free(a2);
1383 return 0;
1384 }
1385 if (!(a = malloc(l1+l2))) abort();
1386 memcpy(a, a1, l1);
1387 memcpy(a+l1, a2, l2);
1388 free(a1); free(a2);
1389 ssfilter_patch(a, l1, l2);
1390 *bytecode = a;
1391 return l1+l2;
1392 }
1393 case SSF_OR:
1394 {
1395 char *a1 = NULL, *a2 = NULL, *a;
1396 int l1, l2;
1397
1398 l1 = ssfilter_bytecompile(f->pred, &a1);
1399 l2 = ssfilter_bytecompile(f->post, &a2);
1400 if (!l1 || !l2) {
1401 free(a1);
1402 free(a2);
1403 return 0;
1404 }
1405 if (!(a = malloc(l1+l2+4))) abort();
1406 memcpy(a, a1, l1);
1407 memcpy(a+l1+4, a2, l2);
1408 free(a1); free(a2);
1409 *(struct inet_diag_bc_op *)(a+l1) = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, l2+4 };
1410 *bytecode = a;
1411 return l1+l2+4;
1412 }
1413 case SSF_NOT:
1414 {
1415 char *a1 = NULL, *a;
1416 int l1;
1417
1418 l1 = ssfilter_bytecompile(f->pred, &a1);
1419 if (!l1) {
1420 free(a1);
1421 return 0;
1422 }
1423 if (!(a = malloc(l1+4))) abort();
1424 memcpy(a, a1, l1);
1425 free(a1);
1426 *(struct inet_diag_bc_op *)(a+l1) = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, 8 };
1427 *bytecode = a;
1428 return l1+4;
1429 }
1430 case SSF_DEVCOND:
1431 {
1432 /* bytecompile for SSF_DEVCOND not supported yet */
1433 return 0;
1434 }
1435 case SSF_MARKMASK:
1436 {
1437 struct aafilter *a = (void *)f->pred;
1438 struct instr {
1439 struct inet_diag_bc_op op;
1440 struct inet_diag_markcond cond;
1441 };
1442 int inslen = sizeof(struct instr);
1443
1444 if (!(*bytecode = malloc(inslen))) abort();
1445 ((struct instr *)*bytecode)[0] = (struct instr) {
1446 { INET_DIAG_BC_MARK_COND, inslen, inslen + 4 },
1447 { a->mark, a->mask},
1448 };
1449
1450 return inslen;
1451 }
1452 default:
1453 abort();
1454 }
1455 }
1456
1457 static int remember_he(struct aafilter *a, struct hostent *he)
1458 {
1459 char **ptr = he->h_addr_list;
1460 int cnt = 0;
1461 int len;
1462
1463 if (he->h_addrtype == AF_INET)
1464 len = 4;
1465 else if (he->h_addrtype == AF_INET6)
1466 len = 16;
1467 else
1468 return 0;
1469
1470 while (*ptr) {
1471 struct aafilter *b = a;
1472
1473 if (a->addr.bitlen) {
1474 if ((b = malloc(sizeof(*b))) == NULL)
1475 return cnt;
1476 *b = *a;
1477 a->next = b;
1478 }
1479 memcpy(b->addr.data, *ptr, len);
1480 b->addr.bytelen = len;
1481 b->addr.bitlen = len*8;
1482 b->addr.family = he->h_addrtype;
1483 ptr++;
1484 cnt++;
1485 }
1486 return cnt;
1487 }
1488
1489 static int get_dns_host(struct aafilter *a, const char *addr, int fam)
1490 {
1491 static int notfirst;
1492 int cnt = 0;
1493 struct hostent *he;
1494
1495 a->addr.bitlen = 0;
1496 if (!notfirst) {
1497 sethostent(1);
1498 notfirst = 1;
1499 }
1500 he = gethostbyname2(addr, fam == AF_UNSPEC ? AF_INET : fam);
1501 if (he)
1502 cnt = remember_he(a, he);
1503 if (fam == AF_UNSPEC) {
1504 he = gethostbyname2(addr, AF_INET6);
1505 if (he)
1506 cnt += remember_he(a, he);
1507 }
1508 return !cnt;
1509 }
1510
1511 static int xll_initted;
1512
1513 static void xll_init(void)
1514 {
1515 struct rtnl_handle rth;
1516
1517 if (rtnl_open(&rth, 0) < 0)
1518 exit(1);
1519
1520 ll_init_map(&rth);
1521 rtnl_close(&rth);
1522 xll_initted = 1;
1523 }
1524
1525 static const char *xll_index_to_name(int index)
1526 {
1527 if (!xll_initted)
1528 xll_init();
1529 return ll_index_to_name(index);
1530 }
1531
1532 static int xll_name_to_index(const char *dev)
1533 {
1534 if (!xll_initted)
1535 xll_init();
1536 return ll_name_to_index(dev);
1537 }
1538
1539 void *parse_devcond(char *name)
1540 {
1541 struct aafilter a = { .iface = 0 };
1542 struct aafilter *res;
1543
1544 a.iface = xll_name_to_index(name);
1545 if (a.iface == 0) {
1546 char *end;
1547 unsigned long n;
1548
1549 n = strtoul(name, &end, 0);
1550 if (!end || end == name || *end || n > UINT_MAX)
1551 return NULL;
1552
1553 a.iface = n;
1554 }
1555
1556 res = malloc(sizeof(*res));
1557 *res = a;
1558
1559 return res;
1560 }
1561
1562 static void vsock_set_inet_prefix(inet_prefix *a, __u32 cid)
1563 {
1564 *a = (inet_prefix){
1565 .bytelen = sizeof(cid),
1566 .family = AF_VSOCK,
1567 };
1568 memcpy(a->data, &cid, sizeof(cid));
1569 }
1570
1571 void *parse_hostcond(char *addr, bool is_port)
1572 {
1573 char *port = NULL;
1574 struct aafilter a = { .port = -1 };
1575 struct aafilter *res;
1576 int fam = preferred_family;
1577 struct filter *f = &current_filter;
1578
1579 if (fam == AF_UNIX || strncmp(addr, "unix:", 5) == 0) {
1580 char *p;
1581
1582 a.addr.family = AF_UNIX;
1583 if (strncmp(addr, "unix:", 5) == 0)
1584 addr += 5;
1585 p = strdup(addr);
1586 a.addr.bitlen = 8*strlen(p);
1587 memcpy(a.addr.data, &p, sizeof(p));
1588 fam = AF_UNIX;
1589 goto out;
1590 }
1591
1592 if (fam == AF_PACKET || strncmp(addr, "link:", 5) == 0) {
1593 a.addr.family = AF_PACKET;
1594 a.addr.bitlen = 0;
1595 if (strncmp(addr, "link:", 5) == 0)
1596 addr += 5;
1597 port = strchr(addr, ':');
1598 if (port) {
1599 *port = 0;
1600 if (port[1] && strcmp(port+1, "*")) {
1601 if (get_integer(&a.port, port+1, 0)) {
1602 if ((a.port = xll_name_to_index(port+1)) <= 0)
1603 return NULL;
1604 }
1605 }
1606 }
1607 if (addr[0] && strcmp(addr, "*")) {
1608 unsigned short tmp;
1609
1610 a.addr.bitlen = 32;
1611 if (ll_proto_a2n(&tmp, addr))
1612 return NULL;
1613 a.addr.data[0] = ntohs(tmp);
1614 }
1615 fam = AF_PACKET;
1616 goto out;
1617 }
1618
1619 if (fam == AF_NETLINK || strncmp(addr, "netlink:", 8) == 0) {
1620 a.addr.family = AF_NETLINK;
1621 a.addr.bitlen = 0;
1622 if (strncmp(addr, "netlink:", 8) == 0)
1623 addr += 8;
1624 port = strchr(addr, ':');
1625 if (port) {
1626 *port = 0;
1627 if (port[1] && strcmp(port+1, "*")) {
1628 if (get_integer(&a.port, port+1, 0)) {
1629 if (strcmp(port+1, "kernel") == 0)
1630 a.port = 0;
1631 else
1632 return NULL;
1633 }
1634 }
1635 }
1636 if (addr[0] && strcmp(addr, "*")) {
1637 a.addr.bitlen = 32;
1638 if (nl_proto_a2n(&a.addr.data[0], addr) == -1)
1639 return NULL;
1640 }
1641 fam = AF_NETLINK;
1642 goto out;
1643 }
1644
1645 if (fam == AF_VSOCK || strncmp(addr, "vsock:", 6) == 0) {
1646 __u32 cid = ~(__u32)0;
1647
1648 a.addr.family = AF_VSOCK;
1649 if (strncmp(addr, "vsock:", 6) == 0)
1650 addr += 6;
1651
1652 if (is_port)
1653 port = addr;
1654 else {
1655 port = strchr(addr, ':');
1656 if (port) {
1657 *port = '\0';
1658 port++;
1659 }
1660 }
1661
1662 if (port && strcmp(port, "*") &&
1663 get_u32((__u32 *)&a.port, port, 0))
1664 return NULL;
1665
1666 if (addr[0] && strcmp(addr, "*")) {
1667 a.addr.bitlen = 32;
1668 if (get_u32(&cid, addr, 0))
1669 return NULL;
1670 }
1671 vsock_set_inet_prefix(&a.addr, cid);
1672 fam = AF_VSOCK;
1673 goto out;
1674 }
1675
1676 if (fam == AF_INET || !strncmp(addr, "inet:", 5)) {
1677 fam = AF_INET;
1678 if (!strncmp(addr, "inet:", 5))
1679 addr += 5;
1680 } else if (fam == AF_INET6 || !strncmp(addr, "inet6:", 6)) {
1681 fam = AF_INET6;
1682 if (!strncmp(addr, "inet6:", 6))
1683 addr += 6;
1684 }
1685
1686 /* URL-like literal [] */
1687 if (addr[0] == '[') {
1688 addr++;
1689 if ((port = strchr(addr, ']')) == NULL)
1690 return NULL;
1691 *port++ = 0;
1692 } else if (addr[0] == '*') {
1693 port = addr+1;
1694 } else {
1695 port = strrchr(strchr(addr, '/') ? : addr, ':');
1696 }
1697
1698 if (is_port)
1699 port = addr;
1700
1701 if (port && *port) {
1702 if (*port == ':')
1703 *port++ = 0;
1704
1705 if (*port && *port != '*') {
1706 if (get_integer(&a.port, port, 0)) {
1707 struct servent *se1 = NULL;
1708 struct servent *se2 = NULL;
1709
1710 if (current_filter.dbs&(1<<UDP_DB))
1711 se1 = getservbyname(port, UDP_PROTO);
1712 if (current_filter.dbs&(1<<TCP_DB))
1713 se2 = getservbyname(port, TCP_PROTO);
1714 if (se1 && se2 && se1->s_port != se2->s_port) {
1715 fprintf(stderr, "Error: ambiguous port \"%s\".\n", port);
1716 return NULL;
1717 }
1718 if (!se1)
1719 se1 = se2;
1720 if (se1) {
1721 a.port = ntohs(se1->s_port);
1722 } else {
1723 struct scache *s;
1724
1725 for (s = rlist; s; s = s->next) {
1726 if ((s->proto == UDP_PROTO &&
1727 (current_filter.dbs&(1<<UDP_DB))) ||
1728 (s->proto == TCP_PROTO &&
1729 (current_filter.dbs&(1<<TCP_DB)))) {
1730 if (s->name && strcmp(s->name, port) == 0) {
1731 if (a.port > 0 && a.port != s->port) {
1732 fprintf(stderr, "Error: ambiguous port \"%s\".\n", port);
1733 return NULL;
1734 }
1735 a.port = s->port;
1736 }
1737 }
1738 }
1739 if (a.port <= 0) {
1740 fprintf(stderr, "Error: \"%s\" does not look like a port.\n", port);
1741 return NULL;
1742 }
1743 }
1744 }
1745 }
1746 }
1747 if (!is_port && *addr && *addr != '*') {
1748 if (get_prefix_1(&a.addr, addr, fam)) {
1749 if (get_dns_host(&a, addr, fam)) {
1750 fprintf(stderr, "Error: an inet prefix is expected rather than \"%s\".\n", addr);
1751 return NULL;
1752 }
1753 }
1754 }
1755
1756 out:
1757 if (fam != AF_UNSPEC) {
1758 int states = f->states;
1759 f->families = 0;
1760 filter_af_set(f, fam);
1761 filter_states_set(f, states);
1762 }
1763
1764 res = malloc(sizeof(*res));
1765 if (res)
1766 memcpy(res, &a, sizeof(a));
1767 return res;
1768 }
1769
1770 void *parse_markmask(const char *markmask)
1771 {
1772 struct aafilter a, *res;
1773
1774 if (strchr(markmask, '/')) {
1775 if (sscanf(markmask, "%i/%i", &a.mark, &a.mask) != 2)
1776 return NULL;
1777 } else {
1778 a.mask = 0xffffffff;
1779 if (sscanf(markmask, "%i", &a.mark) != 1)
1780 return NULL;
1781 }
1782
1783 res = malloc(sizeof(*res));
1784 if (res)
1785 memcpy(res, &a, sizeof(a));
1786 return res;
1787 }
1788
1789 static void proc_ctx_print(struct sockstat *s)
1790 {
1791 char *buf;
1792
1793 if (show_proc_ctx || show_sock_ctx) {
1794 if (find_entry(s->ino, &buf,
1795 (show_proc_ctx & show_sock_ctx) ?
1796 PROC_SOCK_CTX : PROC_CTX) > 0) {
1797 printf(" users:(%s)", buf);
1798 free(buf);
1799 }
1800 } else if (show_users) {
1801 if (find_entry(s->ino, &buf, USERS) > 0) {
1802 printf(" users:(%s)", buf);
1803 free(buf);
1804 }
1805 }
1806 }
1807
1808 static void inet_stats_print(struct sockstat *s, bool v6only)
1809 {
1810 sock_state_print(s);
1811
1812 inet_addr_print(&s->local, s->lport, s->iface, v6only);
1813 inet_addr_print(&s->remote, s->rport, 0, v6only);
1814
1815 proc_ctx_print(s);
1816 }
1817
1818 static int proc_parse_inet_addr(char *loc, char *rem, int family, struct
1819 sockstat * s)
1820 {
1821 s->local.family = s->remote.family = family;
1822 if (family == AF_INET) {
1823 sscanf(loc, "%x:%x", s->local.data, (unsigned *)&s->lport);
1824 sscanf(rem, "%x:%x", s->remote.data, (unsigned *)&s->rport);
1825 s->local.bytelen = s->remote.bytelen = 4;
1826 return 0;
1827 } else {
1828 sscanf(loc, "%08x%08x%08x%08x:%x",
1829 s->local.data,
1830 s->local.data + 1,
1831 s->local.data + 2,
1832 s->local.data + 3,
1833 &s->lport);
1834 sscanf(rem, "%08x%08x%08x%08x:%x",
1835 s->remote.data,
1836 s->remote.data + 1,
1837 s->remote.data + 2,
1838 s->remote.data + 3,
1839 &s->rport);
1840 s->local.bytelen = s->remote.bytelen = 16;
1841 return 0;
1842 }
1843 return -1;
1844 }
1845
/*
 * Split one record line in place into its local address, remote address
 * and trailing data fields.
 *
 * The line must have the shape "<n>: <laddr>:<pppp> <raddr>:<pppp> <data>":
 * the local address starts two characters after the first ':', and each
 * address field ends five characters after its own ':' (the ':' plus four
 * port characters), where the separator is overwritten with NUL.
 *
 * On success *loc, *rem and *data point into @line and 0 is returned.
 * Returns -1 if a ':' is missing or the line is too short for the fixed
 * offsets; the output pointers are then unspecified.
 */
static int proc_inet_split_line(char *line, char **loc, char **rem, char **data)
{
	char *p;

	p = strchr(line, ':');
	/* p + 2 must still be inside the string. */
	if (p == NULL || p[1] == '\0')
		return -1;

	*loc = p+2;
	p = strchr(*loc, ':');
	/* p[5] is overwritten and p + 6 is used: need 6 characters here. */
	if (p == NULL || strlen(p) < 6)
		return -1;

	p[5] = 0;
	*rem = p+6;
	p = strchr(*rem, ':');
	if (p == NULL || strlen(p) < 6)
		return -1;

	p[5] = 0;
	*data = p+6;
	return 0;
}
1866
/*
 * Format the rate @bw into @buf: values above 1e6 as "<x.x>M", values
 * above 1e3 as "<x.x>K", everything else with "%g".
 *
 * @buf must be large enough for the result; no bound is enforced here.
 * Returns @buf.
 */
static char *sprint_bw(char *buf, double bw)
{
	/* Negated '>' tests keep the original comparisons for every input. */
	if (!(bw > 1000.)) {
		sprintf(buf, "%g", bw);
		return buf;
	}

	if (!(bw > 1000000.)) {
		sprintf(buf, "%.1fK", bw / 1000.);
		return buf;
	}

	sprintf(buf, "%.1fM", bw / 1000000.);
	return buf;
}
1878
1879 static void sctp_stats_print(struct sctp_info *s)
1880 {
1881 if (s->sctpi_tag)
1882 printf(" tag:%x", s->sctpi_tag);
1883 if (s->sctpi_state)
1884 printf(" state:%s", sctp_sstate_name[s->sctpi_state]);
1885 if (s->sctpi_rwnd)
1886 printf(" rwnd:%d", s->sctpi_rwnd);
1887 if (s->sctpi_unackdata)
1888 printf(" unackdata:%d", s->sctpi_unackdata);
1889 if (s->sctpi_penddata)
1890 printf(" penddata:%d", s->sctpi_penddata);
1891 if (s->sctpi_instrms)
1892 printf(" instrms:%d", s->sctpi_instrms);
1893 if (s->sctpi_outstrms)
1894 printf(" outstrms:%d", s->sctpi_outstrms);
1895 if (s->sctpi_inqueue)
1896 printf(" inqueue:%d", s->sctpi_inqueue);
1897 if (s->sctpi_outqueue)
1898 printf(" outqueue:%d", s->sctpi_outqueue);
1899 if (s->sctpi_overall_error)
1900 printf(" overerr:%d", s->sctpi_overall_error);
1901 if (s->sctpi_max_burst)
1902 printf(" maxburst:%d", s->sctpi_max_burst);
1903 if (s->sctpi_maxseg)
1904 printf(" maxseg:%d", s->sctpi_maxseg);
1905 if (s->sctpi_peer_rwnd)
1906 printf(" prwnd:%d", s->sctpi_peer_rwnd);
1907 if (s->sctpi_peer_tag)
1908 printf(" ptag:%x", s->sctpi_peer_tag);
1909 if (s->sctpi_peer_capable)
1910 printf(" pcapable:%d", s->sctpi_peer_capable);
1911 if (s->sctpi_peer_sack)
1912 printf(" psack:%d", s->sctpi_peer_sack);
1913 if (s->sctpi_s_autoclose)
1914 printf(" autoclose:%d", s->sctpi_s_autoclose);
1915 if (s->sctpi_s_adaptation_ind)
1916 printf(" adapind:%d", s->sctpi_s_adaptation_ind);
1917 if (s->sctpi_s_pd_point)
1918 printf(" pdpoint:%d", s->sctpi_s_pd_point);
1919 if (s->sctpi_s_nodelay)
1920 printf(" nodealy:%d", s->sctpi_s_nodelay);
1921 if (s->sctpi_s_disable_fragments)
1922 printf(" nofrag:%d", s->sctpi_s_disable_fragments);
1923 if (s->sctpi_s_v4mapped)
1924 printf(" v4mapped:%d", s->sctpi_s_v4mapped);
1925 if (s->sctpi_s_frag_interleave)
1926 printf(" fraginl:%d", s->sctpi_s_frag_interleave);
1927 }
1928
1929 static void tcp_stats_print(struct tcpstat *s)
1930 {
1931 char b1[64];
1932
1933 if (s->has_ts_opt)
1934 printf(" ts");
1935 if (s->has_sack_opt)
1936 printf(" sack");
1937 if (s->has_ecn_opt)
1938 printf(" ecn");
1939 if (s->has_ecnseen_opt)
1940 printf(" ecnseen");
1941 if (s->has_fastopen_opt)
1942 printf(" fastopen");
1943 if (s->cong_alg[0])
1944 printf(" %s", s->cong_alg);
1945 if (s->has_wscale_opt)
1946 printf(" wscale:%d,%d", s->snd_wscale, s->rcv_wscale);
1947 if (s->rto)
1948 printf(" rto:%g", s->rto);
1949 if (s->backoff)
1950 printf(" backoff:%u", s->backoff);
1951 if (s->rtt)
1952 printf(" rtt:%g/%g", s->rtt, s->rttvar);
1953 if (s->ato)
1954 printf(" ato:%g", s->ato);
1955
1956 if (s->qack)
1957 printf(" qack:%d", s->qack);
1958 if (s->qack & 1)
1959 printf(" bidir");
1960
1961 if (s->mss)
1962 printf(" mss:%d", s->mss);
1963 if (s->rcv_mss)
1964 printf(" rcvmss:%d", s->rcv_mss);
1965 if (s->advmss)
1966 printf(" advmss:%d", s->advmss);
1967 if (s->cwnd)
1968 printf(" cwnd:%u", s->cwnd);
1969 if (s->ssthresh)
1970 printf(" ssthresh:%d", s->ssthresh);
1971
1972 if (s->bytes_acked)
1973 printf(" bytes_acked:%llu", s->bytes_acked);
1974 if (s->bytes_received)
1975 printf(" bytes_received:%llu", s->bytes_received);
1976 if (s->segs_out)
1977 printf(" segs_out:%u", s->segs_out);
1978 if (s->segs_in)
1979 printf(" segs_in:%u", s->segs_in);
1980 if (s->data_segs_out)
1981 printf(" data_segs_out:%u", s->data_segs_out);
1982 if (s->data_segs_in)
1983 printf(" data_segs_in:%u", s->data_segs_in);
1984
1985 if (s->dctcp && s->dctcp->enabled) {
1986 struct dctcpstat *dctcp = s->dctcp;
1987
1988 printf(" dctcp:(ce_state:%u,alpha:%u,ab_ecn:%u,ab_tot:%u)",
1989 dctcp->ce_state, dctcp->alpha, dctcp->ab_ecn,
1990 dctcp->ab_tot);
1991 } else if (s->dctcp) {
1992 printf(" dctcp:fallback_mode");
1993 }
1994
1995 if (s->bbr_info) {
1996 __u64 bw;
1997
1998 bw = s->bbr_info->bbr_bw_hi;
1999 bw <<= 32;
2000 bw |= s->bbr_info->bbr_bw_lo;
2001
2002 printf(" bbr:(bw:%sbps,mrtt:%g",
2003 sprint_bw(b1, bw * 8.0),
2004 (double)s->bbr_info->bbr_min_rtt / 1000.0);
2005 if (s->bbr_info->bbr_pacing_gain)
2006 printf(",pacing_gain:%g",
2007 (double)s->bbr_info->bbr_pacing_gain / 256.0);
2008 if (s->bbr_info->bbr_cwnd_gain)
2009 printf(",cwnd_gain:%g",
2010 (double)s->bbr_info->bbr_cwnd_gain / 256.0);
2011 printf(")");
2012 }
2013
2014 if (s->send_bps)
2015 printf(" send %sbps", sprint_bw(b1, s->send_bps));
2016 if (s->lastsnd)
2017 printf(" lastsnd:%u", s->lastsnd);
2018 if (s->lastrcv)
2019 printf(" lastrcv:%u", s->lastrcv);
2020 if (s->lastack)
2021 printf(" lastack:%u", s->lastack);
2022
2023 if (s->pacing_rate) {
2024 printf(" pacing_rate %sbps", sprint_bw(b1, s->pacing_rate));
2025 if (s->pacing_rate_max)
2026 printf("/%sbps", sprint_bw(b1,
2027 s->pacing_rate_max));
2028 }
2029
2030 if (s->delivery_rate)
2031 printf(" delivery_rate %sbps", sprint_bw(b1, s->delivery_rate));
2032 if (s->app_limited)
2033 printf(" app_limited");
2034
2035 if (s->busy_time) {
2036 printf(" busy:%llums", s->busy_time / 1000);
2037 if (s->rwnd_limited)
2038 printf(" rwnd_limited:%llums(%.1f%%)",
2039 s->rwnd_limited / 1000,
2040 100.0 * s->rwnd_limited / s->busy_time);
2041 if (s->sndbuf_limited)
2042 printf(" sndbuf_limited:%llums(%.1f%%)",
2043 s->sndbuf_limited / 1000,
2044 100.0 * s->sndbuf_limited / s->busy_time);
2045 }
2046
2047 if (s->unacked)
2048 printf(" unacked:%u", s->unacked);
2049 if (s->retrans || s->retrans_total)
2050 printf(" retrans:%u/%u", s->retrans, s->retrans_total);
2051 if (s->lost)
2052 printf(" lost:%u", s->lost);
2053 if (s->sacked && s->ss.state != SS_LISTEN)
2054 printf(" sacked:%u", s->sacked);
2055 if (s->fackets)
2056 printf(" fackets:%u", s->fackets);
2057 if (s->reordering != 3)
2058 printf(" reordering:%d", s->reordering);
2059 if (s->rcv_rtt)
2060 printf(" rcv_rtt:%g", s->rcv_rtt);
2061 if (s->rcv_space)
2062 printf(" rcv_space:%d", s->rcv_space);
2063 if (s->not_sent)
2064 printf(" notsent:%u", s->not_sent);
2065 if (s->min_rtt)
2066 printf(" minrtt:%g", s->min_rtt);
2067 }
2068
2069 static void tcp_timer_print(struct tcpstat *s)
2070 {
2071 static const char * const tmr_name[] = {
2072 "off",
2073 "on",
2074 "keepalive",
2075 "timewait",
2076 "persist",
2077 "unknown"
2078 };
2079
2080 if (s->timer) {
2081 if (s->timer > 4)
2082 s->timer = 5;
2083 printf(" timer:(%s,%s,%d)",
2084 tmr_name[s->timer],
2085 print_ms_timer(s->timeout),
2086 s->retrans);
2087 }
2088 }
2089
2090 static void sctp_timer_print(struct tcpstat *s)
2091 {
2092 if (s->timer)
2093 printf(" timer:(T3_RTX,%s,%d)",
2094 print_ms_timer(s->timeout), s->retrans);
2095 }
2096
2097 static int tcp_show_line(char *line, const struct filter *f, int family)
2098 {
2099 int rto = 0, ato = 0;
2100 struct tcpstat s = {};
2101 char *loc, *rem, *data;
2102 char opt[256];
2103 int n;
2104 int hz = get_user_hz();
2105
2106 if (proc_inet_split_line(line, &loc, &rem, &data))
2107 return -1;
2108
2109 int state = (data[1] >= 'A') ? (data[1] - 'A' + 10) : (data[1] - '0');
2110
2111 if (!(f->states & (1 << state)))
2112 return 0;
2113
2114 proc_parse_inet_addr(loc, rem, family, &s.ss);
2115
2116 if (f->f && run_ssfilter(f->f, &s.ss) == 0)
2117 return 0;
2118
2119 opt[0] = 0;
2120 n = sscanf(data, "%x %x:%x %x:%x %x %d %d %u %d %llx %d %d %d %u %d %[^\n]\n",
2121 &s.ss.state, &s.ss.wq, &s.ss.rq,
2122 &s.timer, &s.timeout, &s.retrans, &s.ss.uid, &s.probes,
2123 &s.ss.ino, &s.ss.refcnt, &s.ss.sk, &rto, &ato, &s.qack, &s.cwnd,
2124 &s.ssthresh, opt);
2125
2126 if (n < 17)
2127 opt[0] = 0;
2128
2129 if (n < 12) {
2130 rto = 0;
2131 s.cwnd = 2;
2132 s.ssthresh = -1;
2133 ato = s.qack = 0;
2134 }
2135
2136 s.retrans = s.timer != 1 ? s.probes : s.retrans;
2137 s.timeout = (s.timeout * 1000 + hz - 1) / hz;
2138 s.ato = (double)ato / hz;
2139 s.qack /= 2;
2140 s.rto = (double)rto;
2141 s.ssthresh = s.ssthresh == -1 ? 0 : s.ssthresh;
2142 s.rto = s.rto != 3 * hz ? s.rto / hz : 0;
2143 s.ss.type = IPPROTO_TCP;
2144
2145 inet_stats_print(&s.ss, false);
2146
2147 if (show_options)
2148 tcp_timer_print(&s);
2149
2150 if (show_details) {
2151 sock_details_print(&s.ss);
2152 if (opt[0])
2153 printf(" opt:\"%s\"", opt);
2154 }
2155
2156 if (show_tcpinfo)
2157 tcp_stats_print(&s);
2158
2159 printf("\n");
2160 return 0;
2161 }
2162
/*
 * Read @fp line by line and hand every record to @worker.
 *
 * The first line is skipped as a header.  Each following line must fit
 * into the 256-byte buffer and end in a newline, which is stripped before
 * @worker(line, @f, @fam) is called.  Reading stops quietly (return 0) as
 * soon as @worker returns a negative value.
 *
 * Returns 0 on success, -1 with errno set to EINVAL for an over-long or
 * unterminated line, and -1 if the stream is in an error state.
 */
static int generic_record_read(FILE *fp,
			       int (*worker)(char*, const struct filter *, int),
			       const struct filter *f, int fam)
{
	char line[256];

	/* skip header */
	if (fgets(line, sizeof(line), fp) == NULL)
		goto outerr;

	while (fgets(line, sizeof(line), fp) != NULL) {
		int n = strlen(line);

		if (n == 0 || line[n-1] != '\n') {
			/* errno values are positive. */
			errno = EINVAL;
			return -1;
		}
		line[n-1] = 0;

		if (worker(line, f, fam) < 0)
			return 0;
	}
outerr:

	return ferror(fp) ? -1 : 0;
}
2189
2190 static void print_skmeminfo(struct rtattr *tb[], int attrtype)
2191 {
2192 const __u32 *skmeminfo;
2193
2194 if (!tb[attrtype]) {
2195 if (attrtype == INET_DIAG_SKMEMINFO) {
2196 if (!tb[INET_DIAG_MEMINFO])
2197 return;
2198
2199 const struct inet_diag_meminfo *minfo =
2200 RTA_DATA(tb[INET_DIAG_MEMINFO]);
2201
2202 printf(" mem:(r%u,w%u,f%u,t%u)",
2203 minfo->idiag_rmem,
2204 minfo->idiag_wmem,
2205 minfo->idiag_fmem,
2206 minfo->idiag_tmem);
2207 }
2208 return;
2209 }
2210
2211 skmeminfo = RTA_DATA(tb[attrtype]);
2212
2213 printf(" skmem:(r%u,rb%u,t%u,tb%u,f%u,w%u,o%u",
2214 skmeminfo[SK_MEMINFO_RMEM_ALLOC],
2215 skmeminfo[SK_MEMINFO_RCVBUF],
2216 skmeminfo[SK_MEMINFO_WMEM_ALLOC],
2217 skmeminfo[SK_MEMINFO_SNDBUF],
2218 skmeminfo[SK_MEMINFO_FWD_ALLOC],
2219 skmeminfo[SK_MEMINFO_WMEM_QUEUED],
2220 skmeminfo[SK_MEMINFO_OPTMEM]);
2221
2222 if (RTA_PAYLOAD(tb[attrtype]) >=
2223 (SK_MEMINFO_BACKLOG + 1) * sizeof(__u32))
2224 printf(",bl%u", skmeminfo[SK_MEMINFO_BACKLOG]);
2225
2226 if (RTA_PAYLOAD(tb[attrtype]) >=
2227 (SK_MEMINFO_DROPS + 1) * sizeof(__u32))
2228 printf(",d%u", skmeminfo[SK_MEMINFO_DROPS]);
2229
2230 printf(")");
2231 }
2232
2233 static void print_md5sig(struct tcp_diag_md5sig *sig)
2234 {
2235 printf("%s/%d=",
2236 format_host(sig->tcpm_family,
2237 sig->tcpm_family == AF_INET6 ? 16 : 4,
2238 &sig->tcpm_addr),
2239 sig->tcpm_prefixlen);
2240 print_escape_buf(sig->tcpm_key, sig->tcpm_keylen, " ,");
2241 }
2242
2243 #define TCPI_HAS_OPT(info, opt) !!(info->tcpi_options & (opt))
2244
2245 static void tcp_show_info(const struct nlmsghdr *nlh, struct inet_diag_msg *r,
2246 struct rtattr *tb[])
2247 {
2248 double rtt = 0;
2249 struct tcpstat s = {};
2250
2251 s.ss.state = r->idiag_state;
2252
2253 print_skmeminfo(tb, INET_DIAG_SKMEMINFO);
2254
2255 if (tb[INET_DIAG_INFO]) {
2256 struct tcp_info *info;
2257 int len = RTA_PAYLOAD(tb[INET_DIAG_INFO]);
2258
2259 /* workaround for older kernels with less fields */
2260 if (len < sizeof(*info)) {
2261 info = alloca(sizeof(*info));
2262 memcpy(info, RTA_DATA(tb[INET_DIAG_INFO]), len);
2263 memset((char *)info + len, 0, sizeof(*info) - len);
2264 } else
2265 info = RTA_DATA(tb[INET_DIAG_INFO]);
2266
2267 if (show_options) {
2268 s.has_ts_opt = TCPI_HAS_OPT(info, TCPI_OPT_TIMESTAMPS);
2269 s.has_sack_opt = TCPI_HAS_OPT(info, TCPI_OPT_SACK);
2270 s.has_ecn_opt = TCPI_HAS_OPT(info, TCPI_OPT_ECN);
2271 s.has_ecnseen_opt = TCPI_HAS_OPT(info, TCPI_OPT_ECN_SEEN);
2272 s.has_fastopen_opt = TCPI_HAS_OPT(info, TCPI_OPT_SYN_DATA);
2273 }
2274
2275 if (tb[INET_DIAG_CONG])
2276 strncpy(s.cong_alg,
2277 rta_getattr_str(tb[INET_DIAG_CONG]),
2278 sizeof(s.cong_alg) - 1);
2279
2280 if (TCPI_HAS_OPT(info, TCPI_OPT_WSCALE)) {
2281 s.has_wscale_opt = true;
2282 s.snd_wscale = info->tcpi_snd_wscale;
2283 s.rcv_wscale = info->tcpi_rcv_wscale;
2284 }
2285
2286 if (info->tcpi_rto && info->tcpi_rto != 3000000)
2287 s.rto = (double)info->tcpi_rto / 1000;
2288
2289 s.backoff = info->tcpi_backoff;
2290 s.rtt = (double)info->tcpi_rtt / 1000;
2291 s.rttvar = (double)info->tcpi_rttvar / 1000;
2292 s.ato = (double)info->tcpi_ato / 1000;
2293 s.mss = info->tcpi_snd_mss;
2294 s.rcv_mss = info->tcpi_rcv_mss;
2295 s.advmss = info->tcpi_advmss;
2296 s.rcv_space = info->tcpi_rcv_space;
2297 s.rcv_rtt = (double)info->tcpi_rcv_rtt / 1000;
2298 s.lastsnd = info->tcpi_last_data_sent;
2299 s.lastrcv = info->tcpi_last_data_recv;
2300 s.lastack = info->tcpi_last_ack_recv;
2301 s.unacked = info->tcpi_unacked;
2302 s.retrans = info->tcpi_retrans;
2303 s.retrans_total = info->tcpi_total_retrans;
2304 s.lost = info->tcpi_lost;
2305 s.sacked = info->tcpi_sacked;
2306 s.fackets = info->tcpi_fackets;
2307 s.reordering = info->tcpi_reordering;
2308 s.rcv_space = info->tcpi_rcv_space;
2309 s.cwnd = info->tcpi_snd_cwnd;
2310
2311 if (info->tcpi_snd_ssthresh < 0xFFFF)
2312 s.ssthresh = info->tcpi_snd_ssthresh;
2313
2314 rtt = (double) info->tcpi_rtt;
2315 if (tb[INET_DIAG_VEGASINFO]) {
2316 const struct tcpvegas_info *vinfo
2317 = RTA_DATA(tb[INET_DIAG_VEGASINFO]);
2318
2319 if (vinfo->tcpv_enabled &&
2320 vinfo->tcpv_rtt && vinfo->tcpv_rtt != 0x7fffffff)
2321 rtt = vinfo->tcpv_rtt;
2322 }
2323
2324 if (tb[INET_DIAG_DCTCPINFO]) {
2325 struct dctcpstat *dctcp = malloc(sizeof(struct
2326 dctcpstat));
2327
2328 const struct tcp_dctcp_info *dinfo
2329 = RTA_DATA(tb[INET_DIAG_DCTCPINFO]);
2330
2331 dctcp->enabled = !!dinfo->dctcp_enabled;
2332 dctcp->ce_state = dinfo->dctcp_ce_state;
2333 dctcp->alpha = dinfo->dctcp_alpha;
2334 dctcp->ab_ecn = dinfo->dctcp_ab_ecn;
2335 dctcp->ab_tot = dinfo->dctcp_ab_tot;
2336 s.dctcp = dctcp;
2337 }
2338
2339 if (tb[INET_DIAG_BBRINFO]) {
2340 const void *bbr_info = RTA_DATA(tb[INET_DIAG_BBRINFO]);
2341 int len = min(RTA_PAYLOAD(tb[INET_DIAG_BBRINFO]),
2342 sizeof(*s.bbr_info));
2343
2344 s.bbr_info = calloc(1, sizeof(*s.bbr_info));
2345 if (s.bbr_info && bbr_info)
2346 memcpy(s.bbr_info, bbr_info, len);
2347 }
2348
2349 if (rtt > 0 && info->tcpi_snd_mss && info->tcpi_snd_cwnd) {
2350 s.send_bps = (double) info->tcpi_snd_cwnd *
2351 (double)info->tcpi_snd_mss * 8000000. / rtt;
2352 }
2353
2354 if (info->tcpi_pacing_rate &&
2355 info->tcpi_pacing_rate != ~0ULL) {
2356 s.pacing_rate = info->tcpi_pacing_rate * 8.;
2357
2358 if (info->tcpi_max_pacing_rate &&
2359 info->tcpi_max_pacing_rate != ~0ULL)
2360 s.pacing_rate_max = info->tcpi_max_pacing_rate * 8.;
2361 }
2362 s.bytes_acked = info->tcpi_bytes_acked;
2363 s.bytes_received = info->tcpi_bytes_received;
2364 s.segs_out = info->tcpi_segs_out;
2365 s.segs_in = info->tcpi_segs_in;
2366 s.data_segs_out = info->tcpi_data_segs_out;
2367 s.data_segs_in = info->tcpi_data_segs_in;
2368 s.not_sent = info->tcpi_notsent_bytes;
2369 if (info->tcpi_min_rtt && info->tcpi_min_rtt != ~0U)
2370 s.min_rtt = (double) info->tcpi_min_rtt / 1000;
2371 s.delivery_rate = info->tcpi_delivery_rate * 8.;
2372 s.app_limited = info->tcpi_delivery_rate_app_limited;
2373 s.busy_time = info->tcpi_busy_time;
2374 s.rwnd_limited = info->tcpi_rwnd_limited;
2375 s.sndbuf_limited = info->tcpi_sndbuf_limited;
2376 tcp_stats_print(&s);
2377 free(s.dctcp);
2378 free(s.bbr_info);
2379 }
2380 if (tb[INET_DIAG_MD5SIG]) {
2381 struct tcp_diag_md5sig *sig = RTA_DATA(tb[INET_DIAG_MD5SIG]);
2382 int len = RTA_PAYLOAD(tb[INET_DIAG_MD5SIG]);
2383
2384 printf(" md5keys:");
2385 print_md5sig(sig++);
2386 for (len -= sizeof(*sig); len > 0; len -= sizeof(*sig)) {
2387 printf(",");
2388 print_md5sig(sig++);
2389 }
2390 }
2391 }
2392
/*
 * Format the address stored in the socket address @sa with format_host().
 * Only AF_INET and AF_INET6 are handled; any other family yields "".
 */
static const char *format_host_sa(struct sockaddr_storage *sa)
{
	if (sa->ss_family == AF_INET) {
		struct sockaddr_in *sin = (struct sockaddr_in *)sa;

		return format_host(AF_INET, 4, &sin->sin_addr);
	}

	if (sa->ss_family == AF_INET6) {
		struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sa;

		return format_host(AF_INET6, 16, &sin6->sin6_addr);
	}

	return "";
}
2409
2410 static void sctp_show_info(const struct nlmsghdr *nlh, struct inet_diag_msg *r,
2411 struct rtattr *tb[])
2412 {
2413 struct sockaddr_storage *sa;
2414 int len;
2415
2416 print_skmeminfo(tb, INET_DIAG_SKMEMINFO);
2417
2418 if (tb[INET_DIAG_LOCALS]) {
2419 len = RTA_PAYLOAD(tb[INET_DIAG_LOCALS]);
2420 sa = RTA_DATA(tb[INET_DIAG_LOCALS]);
2421
2422 printf("locals:%s", format_host_sa(sa));
2423 for (sa++, len -= sizeof(*sa); len > 0; sa++, len -= sizeof(*sa))
2424 printf(",%s", format_host_sa(sa));
2425
2426 }
2427 if (tb[INET_DIAG_PEERS]) {
2428 len = RTA_PAYLOAD(tb[INET_DIAG_PEERS]);
2429 sa = RTA_DATA(tb[INET_DIAG_PEERS]);
2430
2431 printf(" peers:%s", format_host_sa(sa));
2432 for (sa++, len -= sizeof(*sa); len > 0; sa++, len -= sizeof(*sa))
2433 printf(",%s", format_host_sa(sa));
2434 }
2435 if (tb[INET_DIAG_INFO]) {
2436 struct sctp_info *info;
2437 len = RTA_PAYLOAD(tb[INET_DIAG_INFO]);
2438
2439 /* workaround for older kernels with less fields */
2440 if (len < sizeof(*info)) {
2441 info = alloca(sizeof(*info));
2442 memcpy(info, RTA_DATA(tb[INET_DIAG_INFO]), len);
2443 memset((char *)info + len, 0, sizeof(*info) - len);
2444 } else
2445 info = RTA_DATA(tb[INET_DIAG_INFO]);
2446
2447 sctp_stats_print(info);
2448 }
2449 }
2450
2451 static void parse_diag_msg(struct nlmsghdr *nlh, struct sockstat *s)
2452 {
2453 struct rtattr *tb[INET_DIAG_MAX+1];
2454 struct inet_diag_msg *r = NLMSG_DATA(nlh);
2455
2456 parse_rtattr(tb, INET_DIAG_MAX, (struct rtattr *)(r+1),
2457 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
2458
2459 s->state = r->idiag_state;
2460 s->local.family = s->remote.family = r->idiag_family;
2461 s->lport = ntohs(r->id.idiag_sport);
2462 s->rport = ntohs(r->id.idiag_dport);
2463 s->wq = r->idiag_wqueue;
2464 s->rq = r->idiag_rqueue;
2465 s->ino = r->idiag_inode;
2466 s->uid = r->idiag_uid;
2467 s->iface = r->id.idiag_if;
2468 s->sk = cookie_sk_get(&r->id.idiag_cookie[0]);
2469
2470 s->mark = 0;
2471 if (tb[INET_DIAG_MARK])
2472 s->mark = rta_getattr_u32(tb[INET_DIAG_MARK]);
2473 if (tb[INET_DIAG_PROTOCOL])
2474 s->raw_prot = rta_getattr_u8(tb[INET_DIAG_PROTOCOL]);
2475 else
2476 s->raw_prot = 0;
2477
2478 if (s->local.family == AF_INET)
2479 s->local.bytelen = s->remote.bytelen = 4;
2480 else
2481 s->local.bytelen = s->remote.bytelen = 16;
2482
2483 memcpy(s->local.data, r->id.idiag_src, s->local.bytelen);
2484 memcpy(s->remote.data, r->id.idiag_dst, s->local.bytelen);
2485 }
2486
2487 static int inet_show_sock(struct nlmsghdr *nlh,
2488 struct sockstat *s)
2489 {
2490 struct rtattr *tb[INET_DIAG_MAX+1];
2491 struct inet_diag_msg *r = NLMSG_DATA(nlh);
2492 unsigned char v6only = 0;
2493
2494 parse_rtattr(tb, INET_DIAG_MAX, (struct rtattr *)(r+1),
2495 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
2496
2497 if (tb[INET_DIAG_PROTOCOL])
2498 s->type = rta_getattr_u8(tb[INET_DIAG_PROTOCOL]);
2499
2500 if (s->local.family == AF_INET6 && tb[INET_DIAG_SKV6ONLY])
2501 v6only = rta_getattr_u8(tb[INET_DIAG_SKV6ONLY]);
2502
2503 inet_stats_print(s, v6only);
2504
2505 if (show_options) {
2506 struct tcpstat t = {};
2507
2508 t.timer = r->idiag_timer;
2509 t.timeout = r->idiag_expires;
2510 t.retrans = r->idiag_retrans;
2511 if (s->type == IPPROTO_SCTP)
2512 sctp_timer_print(&t);
2513 else
2514 tcp_timer_print(&t);
2515 }
2516
2517 if (show_details) {
2518 sock_details_print(s);
2519 if (s->local.family == AF_INET6 && tb[INET_DIAG_SKV6ONLY])
2520 printf(" v6only:%u", v6only);
2521
2522 if (tb[INET_DIAG_SHUTDOWN]) {
2523 unsigned char mask;
2524
2525 mask = rta_getattr_u8(tb[INET_DIAG_SHUTDOWN]);
2526 printf(" %c-%c", mask & 1 ? '-' : '<', mask & 2 ? '-' : '>');
2527 }
2528 }
2529
2530 if (show_mem || (show_tcpinfo && s->type != IPPROTO_UDP)) {
2531 printf("\n\t");
2532 if (s->type == IPPROTO_SCTP)
2533 sctp_show_info(nlh, r, tb);
2534 else
2535 tcp_show_info(nlh, r, tb);
2536 }
2537 sctp_ino = s->ino;
2538
2539 printf("\n");
2540 return 0;
2541 }
2542
2543 static int tcpdiag_send(int fd, int protocol, struct filter *f)
2544 {
2545 struct sockaddr_nl nladdr = { .nl_family = AF_NETLINK };
2546 struct {
2547 struct nlmsghdr nlh;
2548 struct inet_diag_req r;
2549 } req = {
2550 .nlh.nlmsg_len = sizeof(req),
2551 .nlh.nlmsg_flags = NLM_F_ROOT | NLM_F_MATCH | NLM_F_REQUEST,
2552 .nlh.nlmsg_seq = MAGIC_SEQ,
2553 .r.idiag_family = AF_INET,
2554 .r.idiag_states = f->states,
2555 };
2556 char *bc = NULL;
2557 int bclen;
2558 struct msghdr msg;
2559 struct rtattr rta;
2560 struct iovec iov[3];
2561 int iovlen = 1;
2562
2563 if (protocol == IPPROTO_UDP)
2564 return -1;
2565
2566 if (protocol == IPPROTO_TCP)
2567 req.nlh.nlmsg_type = TCPDIAG_GETSOCK;
2568 else
2569 req.nlh.nlmsg_type = DCCPDIAG_GETSOCK;
2570 if (show_mem) {
2571 req.r.idiag_ext |= (1<<(INET_DIAG_MEMINFO-1));
2572 req.r.idiag_ext |= (1<<(INET_DIAG_SKMEMINFO-1));
2573 }
2574
2575 if (show_tcpinfo) {
2576 req.r.idiag_ext |= (1<<(INET_DIAG_INFO-1));
2577 req.r.idiag_ext |= (1<<(INET_DIAG_VEGASINFO-1));
2578 req.r.idiag_ext |= (1<<(INET_DIAG_CONG-1));
2579 }
2580
2581 iov[0] = (struct iovec){
2582 .iov_base = &req,
2583 .iov_len = sizeof(req)
2584 };
2585 if (f->f) {
2586 bclen = ssfilter_bytecompile(f->f, &bc);
2587 if (bclen) {
2588 rta.rta_type = INET_DIAG_REQ_BYTECODE;
2589 rta.rta_len = RTA_LENGTH(bclen);
2590 iov[1] = (struct iovec){ &rta, sizeof(rta) };
2591 iov[2] = (struct iovec){ bc, bclen };
2592 req.nlh.nlmsg_len += RTA_LENGTH(bclen);
2593 iovlen = 3;
2594 }
2595 }
2596
2597 msg = (struct msghdr) {
2598 .msg_name = (void *)&nladdr,
2599 .msg_namelen = sizeof(nladdr),
2600 .msg_iov = iov,
2601 .msg_iovlen = iovlen,
2602 };
2603
2604 if (sendmsg(fd, &msg, 0) < 0) {
2605 close(fd);
2606 return -1;
2607 }
2608
2609 return 0;
2610 }
2611
2612 static int sockdiag_send(int family, int fd, int protocol, struct filter *f)
2613 {
2614 struct sockaddr_nl nladdr = { .nl_family = AF_NETLINK };
2615 DIAG_REQUEST(req, struct inet_diag_req_v2 r);
2616 char *bc = NULL;
2617 int bclen;
2618 struct msghdr msg;
2619 struct rtattr rta;
2620 struct iovec iov[3];
2621 int iovlen = 1;
2622
2623 if (family == PF_UNSPEC)
2624 return tcpdiag_send(fd, protocol, f);
2625
2626 memset(&req.r, 0, sizeof(req.r));
2627 req.r.sdiag_family = family;
2628 req.r.sdiag_protocol = protocol;
2629 req.r.idiag_states = f->states;
2630 if (show_mem) {
2631 req.r.idiag_ext |= (1<<(INET_DIAG_MEMINFO-1));
2632 req.r.idiag_ext |= (1<<(INET_DIAG_SKMEMINFO-1));
2633 }
2634
2635 if (show_tcpinfo) {
2636 req.r.idiag_ext |= (1<<(INET_DIAG_INFO-1));
2637 req.r.idiag_ext |= (1<<(INET_DIAG_VEGASINFO-1));
2638 req.r.idiag_ext |= (1<<(INET_DIAG_CONG-1));
2639 }
2640
2641 iov[0] = (struct iovec){
2642 .iov_base = &req,
2643 .iov_len = sizeof(req)
2644 };
2645 if (f->f) {
2646 bclen = ssfilter_bytecompile(f->f, &bc);
2647 if (bclen) {
2648 rta.rta_type = INET_DIAG_REQ_BYTECODE;
2649 rta.rta_len = RTA_LENGTH(bclen);
2650 iov[1] = (struct iovec){ &rta, sizeof(rta) };
2651 iov[2] = (struct iovec){ bc, bclen };
2652 req.nlh.nlmsg_len += RTA_LENGTH(bclen);
2653 iovlen = 3;
2654 }
2655 }
2656
2657 msg = (struct msghdr) {
2658 .msg_name = (void *)&nladdr,
2659 .msg_namelen = sizeof(nladdr),
2660 .msg_iov = iov,
2661 .msg_iovlen = iovlen,
2662 };
2663
2664 if (sendmsg(fd, &msg, 0) < 0) {
2665 close(fd);
2666 return -1;
2667 }
2668
2669 return 0;
2670 }
2671
/* Context handed to show_one_inet_sock() through the dump callback. */
struct inet_diag_arg {
	struct filter *f;		/* family/expression/kill settings */
	int protocol;			/* copied into sockstat.type, and sdiag_protocol on kill */
	struct rtnl_handle *rth;	/* handle used for SOCK_DESTROY requests */
};
2677
2678 static int kill_inet_sock(struct nlmsghdr *h, void *arg, struct sockstat *s)
2679 {
2680 struct inet_diag_msg *d = NLMSG_DATA(h);
2681 struct inet_diag_arg *diag_arg = arg;
2682 struct rtnl_handle *rth = diag_arg->rth;
2683
2684 DIAG_REQUEST(req, struct inet_diag_req_v2 r);
2685
2686 req.nlh.nlmsg_type = SOCK_DESTROY;
2687 req.nlh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
2688 req.nlh.nlmsg_seq = ++rth->seq;
2689 req.r.sdiag_family = d->idiag_family;
2690 req.r.sdiag_protocol = diag_arg->protocol;
2691 req.r.id = d->id;
2692
2693 if (diag_arg->protocol == IPPROTO_RAW) {
2694 struct inet_diag_req_raw *raw = (void *)&req.r;
2695
2696 BUILD_BUG_ON(sizeof(req.r) != sizeof(*raw));
2697 raw->sdiag_raw_protocol = s->raw_prot;
2698 }
2699
2700 return rtnl_talk(rth, &req.nlh, NULL);
2701 }
2702
2703 static int show_one_inet_sock(const struct sockaddr_nl *addr,
2704 struct nlmsghdr *h, void *arg)
2705 {
2706 int err;
2707 struct inet_diag_arg *diag_arg = arg;
2708 struct inet_diag_msg *r = NLMSG_DATA(h);
2709 struct sockstat s = {};
2710
2711 if (!(diag_arg->f->families & FAMILY_MASK(r->idiag_family)))
2712 return 0;
2713
2714 parse_diag_msg(h, &s);
2715 s.type = diag_arg->protocol;
2716
2717 if (diag_arg->f->f && run_ssfilter(diag_arg->f->f, &s) == 0)
2718 return 0;
2719
2720 if (diag_arg->f->kill && kill_inet_sock(h, arg, &s) != 0) {
2721 if (errno == EOPNOTSUPP || errno == ENOENT) {
2722 /* Socket can't be closed, or is already closed. */
2723 return 0;
2724 } else {
2725 perror("SOCK_DESTROY answers");
2726 return -1;
2727 }
2728 }
2729
2730 err = inet_show_sock(h, &s);
2731 if (err < 0)
2732 return err;
2733
2734 return 0;
2735 }
2736
2737 static int inet_show_netlink(struct filter *f, FILE *dump_fp, int protocol)
2738 {
2739 int err = 0;
2740 struct rtnl_handle rth, rth2;
2741 int family = PF_INET;
2742 struct inet_diag_arg arg = { .f = f, .protocol = protocol };
2743
2744 if (rtnl_open_byproto(&rth, 0, NETLINK_SOCK_DIAG))
2745 return -1;
2746
2747 if (f->kill) {
2748 if (rtnl_open_byproto(&rth2, 0, NETLINK_SOCK_DIAG)) {
2749 rtnl_close(&rth);
2750 return -1;
2751 }
2752 arg.rth = &rth2;
2753 }
2754
2755 rth.dump = MAGIC_SEQ;
2756 rth.dump_fp = dump_fp;
2757 if (preferred_family == PF_INET6)
2758 family = PF_INET6;
2759
2760 again:
2761 if ((err = sockdiag_send(family, rth.fd, protocol, f)))
2762 goto Exit;
2763
2764 if ((err = rtnl_dump_filter(&rth, show_one_inet_sock, &arg))) {
2765 if (family != PF_UNSPEC) {
2766 family = PF_UNSPEC;
2767 goto again;
2768 }
2769 goto Exit;
2770 }
2771 if (family == PF_INET && preferred_family != PF_INET) {
2772 family = PF_INET6;
2773 goto again;
2774 }
2775
2776 Exit:
2777 rtnl_close(&rth);
2778 if (arg.rth)
2779 rtnl_close(arg.rth);
2780 return err;
2781 }
2782
2783 static int tcp_show_netlink_file(struct filter *f)
2784 {
2785 FILE *fp;
2786 char buf[16384];
2787 int err = -1;
2788
2789 if ((fp = fopen(getenv("TCPDIAG_FILE"), "r")) == NULL) {
2790 perror("fopen($TCPDIAG_FILE)");
2791 return err;
2792 }
2793
2794 while (1) {
2795 int status, err2;
2796 struct nlmsghdr *h = (struct nlmsghdr *)buf;
2797 struct sockstat s = {};
2798
2799 status = fread(buf, 1, sizeof(*h), fp);
2800 if (status < 0) {
2801 perror("Reading header from $TCPDIAG_FILE");
2802 break;
2803 }
2804 if (status != sizeof(*h)) {
2805 perror("Unexpected EOF reading $TCPDIAG_FILE");
2806 break;
2807 }
2808
2809 status = fread(h+1, 1, NLMSG_ALIGN(h->nlmsg_len-sizeof(*h)), fp);
2810
2811 if (status < 0) {
2812 perror("Reading $TCPDIAG_FILE");
2813 break;
2814 }
2815 if (status + sizeof(*h) < h->nlmsg_len) {
2816 perror("Unexpected EOF reading $TCPDIAG_FILE");
2817 break;
2818 }
2819
2820 /* The only legal exit point */
2821 if (h->nlmsg_type == NLMSG_DONE) {
2822 err = 0;
2823 break;
2824 }
2825
2826 if (h->nlmsg_type == NLMSG_ERROR) {
2827 struct nlmsgerr *err = (struct nlmsgerr *)NLMSG_DATA(h);
2828
2829 if (h->nlmsg_len < NLMSG_LENGTH(sizeof(struct nlmsgerr))) {
2830 fprintf(stderr, "ERROR truncated\n");
2831 } else {
2832 errno = -err->error;
2833 perror("TCPDIAG answered");
2834 }
2835 break;
2836 }
2837
2838 parse_diag_msg(h, &s);
2839 s.type = IPPROTO_TCP;
2840
2841 if (f && f->f && run_ssfilter(f->f, &s) == 0)
2842 continue;
2843
2844 err2 = inet_show_sock(h, &s);
2845 if (err2 < 0) {
2846 err = err2;
2847 break;
2848 }
2849 }
2850
2851 fclose(fp);
2852 return err;
2853 }
2854
2855 static int tcp_show(struct filter *f)
2856 {
2857 FILE *fp = NULL;
2858 char *buf = NULL;
2859 int bufsize = 64*1024;
2860
2861 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
2862 return 0;
2863
2864 dg_proto = TCP_PROTO;
2865
2866 if (getenv("TCPDIAG_FILE"))
2867 return tcp_show_netlink_file(f);
2868
2869 if (!getenv("PROC_NET_TCP") && !getenv("PROC_ROOT")
2870 && inet_show_netlink(f, NULL, IPPROTO_TCP) == 0)
2871 return 0;
2872
2873 /* Sigh... We have to parse /proc/net/tcp... */
2874
2875
2876 /* Estimate amount of sockets and try to allocate
2877 * huge buffer to read all the table at one read.
2878 * Limit it by 16MB though. The assumption is: as soon as
2879 * kernel was able to hold information about N connections,
2880 * it is able to give us some memory for snapshot.
2881 */
2882 if (1) {
2883 get_slabstat(&slabstat);
2884
2885 int guess = slabstat.socks+slabstat.tcp_syns;
2886
2887 if (f->states&(1<<SS_TIME_WAIT))
2888 guess += slabstat.tcp_tws;
2889 if (guess > (16*1024*1024)/128)
2890 guess = (16*1024*1024)/128;
2891 guess *= 128;
2892 if (guess > bufsize)
2893 bufsize = guess;
2894 }
2895 while (bufsize >= 64*1024) {
2896 if ((buf = malloc(bufsize)) != NULL)
2897 break;
2898 bufsize /= 2;
2899 }
2900 if (buf == NULL) {
2901 errno = ENOMEM;
2902 return -1;
2903 }
2904
2905 if (f->families & FAMILY_MASK(AF_INET)) {
2906 if ((fp = net_tcp_open()) == NULL)
2907 goto outerr;
2908
2909 setbuffer(fp, buf, bufsize);
2910 if (generic_record_read(fp, tcp_show_line, f, AF_INET))
2911 goto outerr;
2912 fclose(fp);
2913 }
2914
2915 if ((f->families & FAMILY_MASK(AF_INET6)) &&
2916 (fp = net_tcp6_open()) != NULL) {
2917 setbuffer(fp, buf, bufsize);
2918 if (generic_record_read(fp, tcp_show_line, f, AF_INET6))
2919 goto outerr;
2920 fclose(fp);
2921 }
2922
2923 free(buf);
2924 return 0;
2925
2926 outerr:
2927 do {
2928 int saved_errno = errno;
2929
2930 free(buf);
2931 if (fp)
2932 fclose(fp);
2933 errno = saved_errno;
2934 return -1;
2935 } while (0);
2936 }
2937
/*
 * Show DCCP sockets through the netlink dump.  Nothing is attempted when
 * neither inet family is selected or when $PROC_NET_DCCP / $PROC_ROOT is
 * set.  Always returns 0; the dump result is ignored.
 */
static int dccp_show(struct filter *f)
{
	bool inet_selected = filter_af_get(f, AF_INET) ||
			     filter_af_get(f, AF_INET6);

	if (!inet_selected)
		return 0;

	if (getenv("PROC_NET_DCCP") || getenv("PROC_ROOT"))
		return 0;

	inet_show_netlink(f, NULL, IPPROTO_DCCP);
	return 0;
}
2949
/*
 * Show SCTP sockets through the netlink dump.  Nothing is attempted when
 * neither inet family is selected or when $PROC_NET_SCTP / $PROC_ROOT is
 * set.  Always returns 0; the dump result is ignored.
 */
static int sctp_show(struct filter *f)
{
	bool inet_selected = filter_af_get(f, AF_INET) ||
			     filter_af_get(f, AF_INET6);

	if (!inet_selected)
		return 0;

	if (getenv("PROC_NET_SCTP") || getenv("PROC_ROOT"))
		return 0;

	inet_show_netlink(f, NULL, IPPROTO_SCTP);
	return 0;
}
2961
2962 static int dgram_show_line(char *line, const struct filter *f, int family)
2963 {
2964 struct sockstat s = {};
2965 char *loc, *rem, *data;
2966 char opt[256];
2967 int n;
2968
2969 if (proc_inet_split_line(line, &loc, &rem, &data))
2970 return -1;
2971
2972 int state = (data[1] >= 'A') ? (data[1] - 'A' + 10) : (data[1] - '0');
2973
2974 if (!(f->states & (1 << state)))
2975 return 0;
2976
2977 proc_parse_inet_addr(loc, rem, family, &s);
2978
2979 if (f->f && run_ssfilter(f->f, &s) == 0)
2980 return 0;
2981
2982 opt[0] = 0;
2983 n = sscanf(data, "%x %x:%x %*x:%*x %*x %d %*d %u %d %llx %[^\n]\n",
2984 &s.state, &s.wq, &s.rq,
2985 &s.uid, &s.ino,
2986 &s.refcnt, &s.sk, opt);
2987
2988 if (n < 9)
2989 opt[0] = 0;
2990
2991 s.type = dg_proto == UDP_PROTO ? IPPROTO_UDP : 0;
2992 inet_stats_print(&s, false);
2993
2994 if (show_details && opt[0])
2995 printf(" opt:\"%s\"", opt);
2996
2997 printf("\n");
2998 return 0;
2999 }
3000
3001 static int udp_show(struct filter *f)
3002 {
3003 FILE *fp = NULL;
3004
3005 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
3006 return 0;
3007
3008 dg_proto = UDP_PROTO;
3009
3010 if (!getenv("PROC_NET_UDP") && !getenv("PROC_ROOT")
3011 && inet_show_netlink(f, NULL, IPPROTO_UDP) == 0)
3012 return 0;
3013
3014 if (f->families&FAMILY_MASK(AF_INET)) {
3015 if ((fp = net_udp_open()) == NULL)
3016 goto outerr;
3017 if (generic_record_read(fp, dgram_show_line, f, AF_INET))
3018 goto outerr;
3019 fclose(fp);
3020 }
3021
3022 if ((f->families&FAMILY_MASK(AF_INET6)) &&
3023 (fp = net_udp6_open()) != NULL) {
3024 if (generic_record_read(fp, dgram_show_line, f, AF_INET6))
3025 goto outerr;
3026 fclose(fp);
3027 }
3028 return 0;
3029
3030 outerr:
3031 do {
3032 int saved_errno = errno;
3033
3034 if (fp)
3035 fclose(fp);
3036 errno = saved_errno;
3037 return -1;
3038 } while (0);
3039 }
3040
3041 static int raw_show(struct filter *f)
3042 {
3043 FILE *fp = NULL;
3044
3045 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
3046 return 0;
3047
3048 dg_proto = RAW_PROTO;
3049
3050 if (!getenv("PROC_NET_RAW") && !getenv("PROC_ROOT") &&
3051 inet_show_netlink(f, NULL, IPPROTO_RAW) == 0)
3052 return 0;
3053
3054 if (f->families&FAMILY_MASK(AF_INET)) {
3055 if ((fp = net_raw_open()) == NULL)
3056 goto outerr;
3057 if (generic_record_read(fp, dgram_show_line, f, AF_INET))
3058 goto outerr;
3059 fclose(fp);
3060 }
3061
3062 if ((f->families&FAMILY_MASK(AF_INET6)) &&
3063 (fp = net_raw6_open()) != NULL) {
3064 if (generic_record_read(fp, dgram_show_line, f, AF_INET6))
3065 goto outerr;
3066 fclose(fp);
3067 }
3068 return 0;
3069
3070 outerr:
3071 do {
3072 int saved_errno = errno;
3073
3074 if (fp)
3075 fclose(fp);
3076 errno = saved_errno;
3077 return -1;
3078 } while (0);
3079 }
3080
/* Number of struct sockstat entries that fit into 1MB. */
#define MAX_UNIX_REMEMBER (1024*1024/sizeof(struct sockstat))
3082
3083 static void unix_list_drop_first(struct sockstat **list)
3084 {
3085 struct sockstat *s = *list;
3086
3087 (*list) = (*list)->next;
3088 free(s->name);
3089 free(s);
3090 }
3091
3092 static bool unix_type_skip(struct sockstat *s, struct filter *f)
3093 {
3094 if (s->type == SOCK_STREAM && !(f->dbs&(1<<UNIX_ST_DB)))
3095 return true;
3096 if (s->type == SOCK_DGRAM && !(f->dbs&(1<<UNIX_DG_DB)))
3097 return true;
3098 if (s->type == SOCK_SEQPACKET && !(f->dbs&(1<<UNIX_SQ_DB)))
3099 return true;
3100 return false;
3101 }
3102
3103 static void unix_stats_print(struct sockstat *s, struct filter *f)
3104 {
3105 char port_name[30] = {};
3106
3107 sock_state_print(s);
3108
3109 sock_addr_print(s->name ?: "*", " ",
3110 int_to_str(s->lport, port_name), NULL);
3111 sock_addr_print(s->peer_name ?: "*", " ",
3112 int_to_str(s->rport, port_name), NULL);
3113
3114 proc_ctx_print(s);
3115 }
3116
3117 static int unix_show_sock(const struct sockaddr_nl *addr, struct nlmsghdr *nlh,
3118 void *arg)
3119 {
3120 struct filter *f = (struct filter *)arg;
3121 struct unix_diag_msg *r = NLMSG_DATA(nlh);
3122 struct rtattr *tb[UNIX_DIAG_MAX+1];
3123 char name[128];
3124 struct sockstat stat = { .name = "*", .peer_name = "*" };
3125
3126 parse_rtattr(tb, UNIX_DIAG_MAX, (struct rtattr *)(r+1),
3127 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3128
3129 stat.type = r->udiag_type;
3130 stat.state = r->udiag_state;
3131 stat.ino = stat.lport = r->udiag_ino;
3132 stat.local.family = stat.remote.family = AF_UNIX;
3133
3134 if (unix_type_skip(&stat, f))
3135 return 0;
3136
3137 if (tb[UNIX_DIAG_RQLEN]) {
3138 struct unix_diag_rqlen *rql = RTA_DATA(tb[UNIX_DIAG_RQLEN]);
3139
3140 stat.rq = rql->udiag_rqueue;
3141 stat.wq = rql->udiag_wqueue;
3142 }
3143 if (tb[UNIX_DIAG_NAME]) {
3144 int len = RTA_PAYLOAD(tb[UNIX_DIAG_NAME]);
3145
3146 memcpy(name, RTA_DATA(tb[UNIX_DIAG_NAME]), len);
3147 name[len] = '\0';
3148 if (name[0] == '\0') {
3149 int i;
3150 for (i = 0; i < len; i++)
3151 if (name[i] == '\0')
3152 name[i] = '@';
3153 }
3154 stat.name = &name[0];
3155 memcpy(stat.local.data, &stat.name, sizeof(stat.name));
3156 }
3157 if (tb[UNIX_DIAG_PEER])
3158 stat.rport = rta_getattr_u32(tb[UNIX_DIAG_PEER]);
3159
3160 if (f->f && run_ssfilter(f->f, &stat) == 0)
3161 return 0;
3162
3163 unix_stats_print(&stat, f);
3164
3165 if (show_mem)
3166 print_skmeminfo(tb, UNIX_DIAG_MEMINFO);
3167 if (show_details) {
3168 if (tb[UNIX_DIAG_SHUTDOWN]) {
3169 unsigned char mask;
3170
3171 mask = rta_getattr_u8(tb[UNIX_DIAG_SHUTDOWN]);
3172 printf(" %c-%c", mask & 1 ? '-' : '<', mask & 2 ? '-' : '>');
3173 }
3174 }
3175 printf("\n");
3176
3177 return 0;
3178 }
3179
3180 static int handle_netlink_request(struct filter *f, struct nlmsghdr *req,
3181 size_t size, rtnl_filter_t show_one_sock)
3182 {
3183 int ret = -1;
3184 struct rtnl_handle rth;
3185
3186 if (rtnl_open_byproto(&rth, 0, NETLINK_SOCK_DIAG))
3187 return -1;
3188
3189 rth.dump = MAGIC_SEQ;
3190
3191 if (rtnl_send(&rth, req, size) < 0)
3192 goto Exit;
3193
3194 if (rtnl_dump_filter(&rth, show_one_sock, f))
3195 goto Exit;
3196
3197 ret = 0;
3198 Exit:
3199 rtnl_close(&rth);
3200 return ret;
3201 }
3202
3203 static int unix_show_netlink(struct filter *f)
3204 {
3205 DIAG_REQUEST(req, struct unix_diag_req r);
3206
3207 req.r.sdiag_family = AF_UNIX;
3208 req.r.udiag_states = f->states;
3209 req.r.udiag_show = UDIAG_SHOW_NAME | UDIAG_SHOW_PEER | UDIAG_SHOW_RQLEN;
3210 if (show_mem)
3211 req.r.udiag_show |= UDIAG_SHOW_MEMINFO;
3212
3213 return handle_netlink_request(f, &req.nlh, sizeof(req), unix_show_sock);
3214 }
3215
3216 static int unix_show(struct filter *f)
3217 {
3218 FILE *fp;
3219 char buf[256];
3220 char name[128];
3221 int newformat = 0;
3222 int cnt;
3223 struct sockstat *list = NULL;
3224 const int unix_state_map[] = { SS_CLOSE, SS_SYN_SENT,
3225 SS_ESTABLISHED, SS_CLOSING };
3226
3227 if (!filter_af_get(f, AF_UNIX))
3228 return 0;
3229
3230 if (!getenv("PROC_NET_UNIX") && !getenv("PROC_ROOT")
3231 && unix_show_netlink(f) == 0)
3232 return 0;
3233
3234 if ((fp = net_unix_open()) == NULL)
3235 return -1;
3236 if (!fgets(buf, sizeof(buf), fp)) {
3237 fclose(fp);
3238 return -1;
3239 }
3240
3241 if (memcmp(buf, "Peer", 4) == 0)
3242 newformat = 1;
3243 cnt = 0;
3244
3245 while (fgets(buf, sizeof(buf), fp)) {
3246 struct sockstat *u, **insp;
3247 int flags;
3248
3249 if (!(u = calloc(1, sizeof(*u))))
3250 break;
3251
3252 if (sscanf(buf, "%x: %x %x %x %x %x %d %s",
3253 &u->rport, &u->rq, &u->wq, &flags, &u->type,
3254 &u->state, &u->ino, name) < 8)
3255 name[0] = 0;
3256
3257 u->lport = u->ino;
3258 u->local.family = u->remote.family = AF_UNIX;
3259
3260 if (flags & (1 << 16)) {
3261 u->state = SS_LISTEN;
3262 } else if (u->state > 0 &&
3263 u->state <= ARRAY_SIZE(unix_state_map)) {
3264 u->state = unix_state_map[u->state-1];
3265 if (u->type == SOCK_DGRAM && u->state == SS_CLOSE && u->rport)
3266 u->state = SS_ESTABLISHED;
3267 }
3268 if (unix_type_skip(u, f) ||
3269 !(f->states & (1 << u->state))) {
3270 free(u);
3271 continue;
3272 }
3273
3274 if (!newformat) {
3275 u->rport = 0;
3276 u->rq = 0;
3277 u->wq = 0;
3278 }
3279
3280 if (name[0]) {
3281 u->name = strdup(name);
3282 if (!u->name) {
3283 free(u);
3284 break;
3285 }
3286 }
3287
3288 if (u->rport) {
3289 struct sockstat *p;
3290
3291 for (p = list; p; p = p->next) {
3292 if (u->rport == p->lport)
3293 break;
3294 }
3295 if (!p)
3296 u->peer_name = "?";
3297 else
3298 u->peer_name = p->name ? : "*";
3299 }
3300
3301 if (f->f) {
3302 struct sockstat st = {
3303 .local.family = AF_UNIX,
3304 .remote.family = AF_UNIX,
3305 };
3306
3307 memcpy(st.local.data, &u->name, sizeof(u->name));
3308 if (strcmp(u->peer_name, "*"))
3309 memcpy(st.remote.data, &u->peer_name,
3310 sizeof(u->peer_name));
3311 if (run_ssfilter(f->f, &st) == 0) {
3312 free(u->name);
3313 free(u);
3314 continue;
3315 }
3316 }
3317
3318 insp = &list;
3319 while (*insp) {
3320 if (u->type < (*insp)->type ||
3321 (u->type == (*insp)->type &&
3322 u->ino < (*insp)->ino))
3323 break;
3324 insp = &(*insp)->next;
3325 }
3326 u->next = *insp;
3327 *insp = u;
3328
3329 if (++cnt > MAX_UNIX_REMEMBER) {
3330 while (list) {
3331 unix_stats_print(list, f);
3332 printf("\n");
3333
3334 unix_list_drop_first(&list);
3335 }
3336 cnt = 0;
3337 }
3338 }
3339 fclose(fp);
3340 while (list) {
3341 unix_stats_print(list, f);
3342 printf("\n");
3343
3344 unix_list_drop_first(&list);
3345 }
3346
3347 return 0;
3348 }
3349
3350 static int packet_stats_print(struct sockstat *s, const struct filter *f)
3351 {
3352 const char *addr, *port;
3353 char ll_name[16];
3354
3355 s->local.family = s->remote.family = AF_PACKET;
3356
3357 if (f->f) {
3358 s->local.data[0] = s->prot;
3359 if (run_ssfilter(f->f, s) == 0)
3360 return 1;
3361 }
3362
3363 sock_state_print(s);
3364
3365 if (s->prot == 3)
3366 addr = "*";
3367 else
3368 addr = ll_proto_n2a(htons(s->prot), ll_name, sizeof(ll_name));
3369
3370 if (s->iface == 0)
3371 port = "*";
3372 else
3373 port = xll_index_to_name(s->iface);
3374
3375 sock_addr_print(addr, ":", port, NULL);
3376 sock_addr_print("", "*", "", NULL);
3377
3378 proc_ctx_print(s);
3379
3380 if (show_details)
3381 sock_details_print(s);
3382
3383 return 0;
3384 }
3385
3386 static void packet_show_ring(struct packet_diag_ring *ring)
3387 {
3388 printf("blk_size:%d", ring->pdr_block_size);
3389 printf(",blk_nr:%d", ring->pdr_block_nr);
3390 printf(",frm_size:%d", ring->pdr_frame_size);
3391 printf(",frm_nr:%d", ring->pdr_frame_nr);
3392 printf(",tmo:%d", ring->pdr_retire_tmo);
3393 printf(",features:0x%x", ring->pdr_features);
3394 }
3395
3396 static int packet_show_sock(const struct sockaddr_nl *addr,
3397 struct nlmsghdr *nlh, void *arg)
3398 {
3399 const struct filter *f = arg;
3400 struct packet_diag_msg *r = NLMSG_DATA(nlh);
3401 struct packet_diag_info *pinfo = NULL;
3402 struct packet_diag_ring *ring_rx = NULL, *ring_tx = NULL;
3403 struct rtattr *tb[PACKET_DIAG_MAX+1];
3404 struct sockstat stat = {};
3405 uint32_t fanout = 0;
3406 bool has_fanout = false;
3407
3408 parse_rtattr(tb, PACKET_DIAG_MAX, (struct rtattr *)(r+1),
3409 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3410
3411 /* use /proc/net/packet if all info are not available */
3412 if (!tb[PACKET_DIAG_MEMINFO])
3413 return -1;
3414
3415 stat.type = r->pdiag_type;
3416 stat.prot = r->pdiag_num;
3417 stat.ino = r->pdiag_ino;
3418 stat.state = SS_CLOSE;
3419 stat.sk = cookie_sk_get(&r->pdiag_cookie[0]);
3420
3421 if (tb[PACKET_DIAG_MEMINFO]) {
3422 __u32 *skmeminfo = RTA_DATA(tb[PACKET_DIAG_MEMINFO]);
3423
3424 stat.rq = skmeminfo[SK_MEMINFO_RMEM_ALLOC];
3425 }
3426
3427 if (tb[PACKET_DIAG_INFO]) {
3428 pinfo = RTA_DATA(tb[PACKET_DIAG_INFO]);
3429 stat.lport = stat.iface = pinfo->pdi_index;
3430 }
3431
3432 if (tb[PACKET_DIAG_UID])
3433 stat.uid = rta_getattr_u32(tb[PACKET_DIAG_UID]);
3434
3435 if (tb[PACKET_DIAG_RX_RING])
3436 ring_rx = RTA_DATA(tb[PACKET_DIAG_RX_RING]);
3437
3438 if (tb[PACKET_DIAG_TX_RING])
3439 ring_tx = RTA_DATA(tb[PACKET_DIAG_TX_RING]);
3440
3441 if (tb[PACKET_DIAG_FANOUT]) {
3442 has_fanout = true;
3443 fanout = rta_getattr_u32(tb[PACKET_DIAG_FANOUT]);
3444 }
3445
3446 if (packet_stats_print(&stat, f))
3447 return 0;
3448
3449 if (show_details) {
3450 if (pinfo) {
3451 printf("\n\tver:%d", pinfo->pdi_version);
3452 printf(" cpy_thresh:%d", pinfo->pdi_copy_thresh);
3453 printf(" flags( ");
3454 if (pinfo->pdi_flags & PDI_RUNNING)
3455 printf("running");
3456 if (pinfo->pdi_flags & PDI_AUXDATA)
3457 printf(" auxdata");
3458 if (pinfo->pdi_flags & PDI_ORIGDEV)
3459 printf(" origdev");
3460 if (pinfo->pdi_flags & PDI_VNETHDR)
3461 printf(" vnethdr");
3462 if (pinfo->pdi_flags & PDI_LOSS)
3463 printf(" loss");
3464 if (!pinfo->pdi_flags)
3465 printf("0");
3466 printf(" )");
3467 }
3468 if (ring_rx) {
3469 printf("\n\tring_rx(");
3470 packet_show_ring(ring_rx);
3471 printf(")");
3472 }
3473 if (ring_tx) {
3474 printf("\n\tring_tx(");
3475 packet_show_ring(ring_tx);
3476 printf(")");
3477 }
3478 if (has_fanout) {
3479 uint16_t type = (fanout >> 16) & 0xffff;
3480
3481 printf("\n\tfanout(");
3482 printf("id:%d,", fanout & 0xffff);
3483 printf("type:");
3484
3485 if (type == 0)
3486 printf("hash");
3487 else if (type == 1)
3488 printf("lb");
3489 else if (type == 2)
3490 printf("cpu");
3491 else if (type == 3)
3492 printf("roll");
3493 else if (type == 4)
3494 printf("random");
3495 else if (type == 5)
3496 printf("qm");
3497 else
3498 printf("0x%x", type);
3499
3500 printf(")");
3501 }
3502 }
3503
3504 if (show_bpf && tb[PACKET_DIAG_FILTER]) {
3505 struct sock_filter *fil =
3506 RTA_DATA(tb[PACKET_DIAG_FILTER]);
3507 int num = RTA_PAYLOAD(tb[PACKET_DIAG_FILTER]) /
3508 sizeof(struct sock_filter);
3509
3510 printf("\n\tbpf filter (%d): ", num);
3511 while (num) {
3512 printf(" 0x%02x %u %u %u,",
3513 fil->code, fil->jt, fil->jf, fil->k);
3514 num--;
3515 fil++;
3516 }
3517 }
3518 printf("\n");
3519 return 0;
3520 }
3521
3522 static int packet_show_netlink(struct filter *f)
3523 {
3524 DIAG_REQUEST(req, struct packet_diag_req r);
3525
3526 req.r.sdiag_family = AF_PACKET;
3527 req.r.pdiag_show = PACKET_SHOW_INFO | PACKET_SHOW_MEMINFO |
3528 PACKET_SHOW_FILTER | PACKET_SHOW_RING_CFG | PACKET_SHOW_FANOUT;
3529
3530 return handle_netlink_request(f, &req.nlh, sizeof(req), packet_show_sock);
3531 }
3532
3533 static int packet_show_line(char *buf, const struct filter *f, int fam)
3534 {
3535 unsigned long long sk;
3536 struct sockstat stat = {};
3537 int type, prot, iface, state, rq, uid, ino;
3538
3539 sscanf(buf, "%llx %*d %d %x %d %d %u %u %u",
3540 &sk,
3541 &type, &prot, &iface, &state,
3542 &rq, &uid, &ino);
3543
3544 if (stat.type == SOCK_RAW && !(f->dbs&(1<<PACKET_R_DB)))
3545 return 0;
3546 if (stat.type == SOCK_DGRAM && !(f->dbs&(1<<PACKET_DG_DB)))
3547 return 0;
3548
3549 stat.type = type;
3550 stat.prot = prot;
3551 stat.lport = stat.iface = iface;
3552 stat.state = state;
3553 stat.rq = rq;
3554 stat.uid = uid;
3555 stat.ino = ino;
3556 stat.state = SS_CLOSE;
3557
3558 if (packet_stats_print(&stat, f))
3559 return 0;
3560
3561 printf("\n");
3562 return 0;
3563 }
3564
3565 static int packet_show(struct filter *f)
3566 {
3567 FILE *fp;
3568 int rc = 0;
3569
3570 if (!filter_af_get(f, AF_PACKET) || !(f->states & (1 << SS_CLOSE)))
3571 return 0;
3572
3573 if (!getenv("PROC_NET_PACKET") && !getenv("PROC_ROOT") &&
3574 packet_show_netlink(f) == 0)
3575 return 0;
3576
3577 if ((fp = net_packet_open()) == NULL)
3578 return -1;
3579 if (generic_record_read(fp, packet_show_line, f, AF_PACKET))
3580 rc = -1;
3581
3582 fclose(fp);
3583 return rc;
3584 }
3585
3586 static int netlink_show_one(struct filter *f,
3587 int prot, int pid, unsigned int groups,
3588 int state, int dst_pid, unsigned int dst_group,
3589 int rq, int wq,
3590 unsigned long long sk, unsigned long long cb)
3591 {
3592 struct sockstat st = {
3593 .state = SS_CLOSE,
3594 .rq = rq,
3595 .wq = wq,
3596 .local.family = AF_NETLINK,
3597 .remote.family = AF_NETLINK,
3598 };
3599
3600 SPRINT_BUF(prot_buf) = {};
3601 const char *prot_name;
3602 char procname[64] = {};
3603
3604 if (f->f) {
3605 st.rport = -1;
3606 st.lport = pid;
3607 st.local.data[0] = prot;
3608 if (run_ssfilter(f->f, &st) == 0)
3609 return 1;
3610 }
3611
3612 sock_state_print(&st);
3613
3614 if (resolve_services)
3615 prot_name = nl_proto_n2a(prot, prot_buf, sizeof(prot_buf));
3616 else
3617 prot_name = int_to_str(prot, prot_buf);
3618
3619 if (pid == -1) {
3620 procname[0] = '*';
3621 } else if (resolve_services) {
3622 int done = 0;
3623
3624 if (!pid) {
3625 done = 1;
3626 strncpy(procname, "kernel", 6);
3627 } else if (pid > 0) {
3628 FILE *fp;
3629
3630 snprintf(procname, sizeof(procname), "%s/%d/stat",
3631 getenv("PROC_ROOT") ? : "/proc", pid);
3632 if ((fp = fopen(procname, "r")) != NULL) {
3633 if (fscanf(fp, "%*d (%[^)])", procname) == 1) {
3634 snprintf(procname+strlen(procname),
3635 sizeof(procname)-strlen(procname),
3636 "/%d", pid);
3637 done = 1;
3638 }
3639 fclose(fp);
3640 }
3641 }
3642 if (!done)
3643 int_to_str(pid, procname);
3644 } else {
3645 int_to_str(pid, procname);
3646 }
3647
3648 sock_addr_print(prot_name, ":", procname, NULL);
3649
3650 if (state == NETLINK_CONNECTED) {
3651 char dst_group_buf[30];
3652 char dst_pid_buf[30];
3653
3654 sock_addr_print(int_to_str(dst_group, dst_group_buf), ":",
3655 int_to_str(dst_pid, dst_pid_buf), NULL);
3656 } else {
3657 sock_addr_print("", "*", "", NULL);
3658 }
3659
3660 char *pid_context = NULL;
3661
3662 if (show_proc_ctx) {
3663 /* The pid value will either be:
3664 * 0 if destination kernel - show kernel initial context.
3665 * A valid process pid - use getpidcon.
3666 * A unique value allocated by the kernel or netlink user
3667 * to the process - show context as "not available".
3668 */
3669 if (!pid)
3670 security_get_initial_context("kernel", &pid_context);
3671 else if (pid > 0)
3672 getpidcon(pid, &pid_context);
3673
3674 printf(" proc_ctx=%s", pid_context ? : "unavailable");
3675 free(pid_context);
3676 }
3677
3678 if (show_details) {
3679 printf(" sk=%llx cb=%llx groups=0x%08x", sk, cb, groups);
3680 }
3681 printf("\n");
3682
3683 return 0;
3684 }
3685
3686 static int netlink_show_sock(const struct sockaddr_nl *addr,
3687 struct nlmsghdr *nlh, void *arg)
3688 {
3689 struct filter *f = (struct filter *)arg;
3690 struct netlink_diag_msg *r = NLMSG_DATA(nlh);
3691 struct rtattr *tb[NETLINK_DIAG_MAX+1];
3692 int rq = 0, wq = 0;
3693 unsigned long groups = 0;
3694
3695 parse_rtattr(tb, NETLINK_DIAG_MAX, (struct rtattr *)(r+1),
3696 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3697
3698 if (tb[NETLINK_DIAG_GROUPS] && RTA_PAYLOAD(tb[NETLINK_DIAG_GROUPS]))
3699 groups = *(unsigned long *) RTA_DATA(tb[NETLINK_DIAG_GROUPS]);
3700
3701 if (tb[NETLINK_DIAG_MEMINFO]) {
3702 const __u32 *skmeminfo;
3703
3704 skmeminfo = RTA_DATA(tb[NETLINK_DIAG_MEMINFO]);
3705
3706 rq = skmeminfo[SK_MEMINFO_RMEM_ALLOC];
3707 wq = skmeminfo[SK_MEMINFO_WMEM_ALLOC];
3708 }
3709
3710 if (netlink_show_one(f, r->ndiag_protocol, r->ndiag_portid, groups,
3711 r->ndiag_state, r->ndiag_dst_portid, r->ndiag_dst_group,
3712 rq, wq, 0, 0)) {
3713 return 0;
3714 }
3715
3716 if (show_mem) {
3717 printf("\t");
3718 print_skmeminfo(tb, NETLINK_DIAG_MEMINFO);
3719 printf("\n");
3720 }
3721
3722 return 0;
3723 }
3724
3725 static int netlink_show_netlink(struct filter *f)
3726 {
3727 DIAG_REQUEST(req, struct netlink_diag_req r);
3728
3729 req.r.sdiag_family = AF_NETLINK;
3730 req.r.sdiag_protocol = NDIAG_PROTO_ALL;
3731 req.r.ndiag_show = NDIAG_SHOW_GROUPS | NDIAG_SHOW_MEMINFO;
3732
3733 return handle_netlink_request(f, &req.nlh, sizeof(req), netlink_show_sock);
3734 }
3735
3736 static int netlink_show(struct filter *f)
3737 {
3738 FILE *fp;
3739 char buf[256];
3740 int prot, pid;
3741 unsigned int groups;
3742 int rq, wq, rc;
3743 unsigned long long sk, cb;
3744
3745 if (!filter_af_get(f, AF_NETLINK) || !(f->states & (1 << SS_CLOSE)))
3746 return 0;
3747
3748 if (!getenv("PROC_NET_NETLINK") && !getenv("PROC_ROOT") &&
3749 netlink_show_netlink(f) == 0)
3750 return 0;
3751
3752 if ((fp = net_netlink_open()) == NULL)
3753 return -1;
3754 if (!fgets(buf, sizeof(buf), fp)) {
3755 fclose(fp);
3756 return -1;
3757 }
3758
3759 while (fgets(buf, sizeof(buf), fp)) {
3760 sscanf(buf, "%llx %d %d %x %d %d %llx %d",
3761 &sk,
3762 &prot, &pid, &groups, &rq, &wq, &cb, &rc);
3763
3764 netlink_show_one(f, prot, pid, groups, 0, 0, 0, rq, wq, sk, cb);
3765 }
3766
3767 fclose(fp);
3768 return 0;
3769 }
3770
3771 static bool vsock_type_skip(struct sockstat *s, struct filter *f)
3772 {
3773 if (s->type == SOCK_STREAM && !(f->dbs & (1 << VSOCK_ST_DB)))
3774 return true;
3775 if (s->type == SOCK_DGRAM && !(f->dbs & (1 << VSOCK_DG_DB)))
3776 return true;
3777 return false;
3778 }
3779
3780 static void vsock_addr_print(inet_prefix *a, __u32 port)
3781 {
3782 char cid_str[sizeof("4294967295")];
3783 char port_str[sizeof("4294967295")];
3784 __u32 cid;
3785
3786 memcpy(&cid, a->data, sizeof(cid));
3787
3788 if (cid == ~(__u32)0)
3789 snprintf(cid_str, sizeof(cid_str), "*");
3790 else
3791 snprintf(cid_str, sizeof(cid_str), "%u", cid);
3792
3793 if (port == ~(__u32)0)
3794 snprintf(port_str, sizeof(port_str), "*");
3795 else
3796 snprintf(port_str, sizeof(port_str), "%u", port);
3797
3798 sock_addr_print(cid_str, ":", port_str, NULL);
3799 }
3800
3801 static void vsock_stats_print(struct sockstat *s, struct filter *f)
3802 {
3803 sock_state_print(s);
3804
3805 vsock_addr_print(&s->local, s->lport);
3806 vsock_addr_print(&s->remote, s->rport);
3807
3808 proc_ctx_print(s);
3809
3810 printf("\n");
3811 }
3812
3813 static int vsock_show_sock(const struct sockaddr_nl *addr,
3814 struct nlmsghdr *nlh, void *arg)
3815 {
3816 struct filter *f = (struct filter *)arg;
3817 struct vsock_diag_msg *r = NLMSG_DATA(nlh);
3818 struct sockstat stat = {
3819 .type = r->vdiag_type,
3820 .lport = r->vdiag_src_port,
3821 .rport = r->vdiag_dst_port,
3822 .state = r->vdiag_state,
3823 .ino = r->vdiag_ino,
3824 };
3825
3826 vsock_set_inet_prefix(&stat.local, r->vdiag_src_cid);
3827 vsock_set_inet_prefix(&stat.remote, r->vdiag_dst_cid);
3828
3829 if (vsock_type_skip(&stat, f))
3830 return 0;
3831
3832 if (f->f && run_ssfilter(f->f, &stat) == 0)
3833 return 0;
3834
3835 vsock_stats_print(&stat, f);
3836
3837 return 0;
3838 }
3839
3840 static int vsock_show(struct filter *f)
3841 {
3842 DIAG_REQUEST(req, struct vsock_diag_req r);
3843
3844 if (!filter_af_get(f, AF_VSOCK))
3845 return 0;
3846
3847 req.r.sdiag_family = AF_VSOCK;
3848 req.r.vdiag_states = f->states;
3849
3850 return handle_netlink_request(f, &req.nlh, sizeof(req), vsock_show_sock);
3851 }
3852
/*
 * Minimal view of a sock_diag reply payload: only the leading address
 * family byte, which generic_show_sock() reads to pick the right
 * per-family handler.
 */
struct sock_diag_msg {
	__u8 sdiag_family;	/* AF_* value of the socket being reported */
};
3856
3857 static int generic_show_sock(const struct sockaddr_nl *addr,
3858 struct nlmsghdr *nlh, void *arg)
3859 {
3860 struct sock_diag_msg *r = NLMSG_DATA(nlh);
3861 struct inet_diag_arg inet_arg = { .f = arg, .protocol = IPPROTO_MAX };
3862
3863 switch (r->sdiag_family) {
3864 case AF_INET:
3865 case AF_INET6:
3866 return show_one_inet_sock(addr, nlh, &inet_arg);
3867 case AF_UNIX:
3868 return unix_show_sock(addr, nlh, arg);
3869 case AF_PACKET:
3870 return packet_show_sock(addr, nlh, arg);
3871 case AF_NETLINK:
3872 return netlink_show_sock(addr, nlh, arg);
3873 case AF_VSOCK:
3874 return vsock_show_sock(addr, nlh, arg);
3875 default:
3876 return -1;
3877 }
3878 }
3879
3880 static int handle_follow_request(struct filter *f)
3881 {
3882 int ret = 0;
3883 int groups = 0;
3884 struct rtnl_handle rth;
3885
3886 if (f->families & FAMILY_MASK(AF_INET) && f->dbs & (1 << TCP_DB))
3887 groups |= 1 << (SKNLGRP_INET_TCP_DESTROY - 1);
3888 if (f->families & FAMILY_MASK(AF_INET) && f->dbs & (1 << UDP_DB))
3889 groups |= 1 << (SKNLGRP_INET_UDP_DESTROY - 1);
3890 if (f->families & FAMILY_MASK(AF_INET6) && f->dbs & (1 << TCP_DB))
3891 groups |= 1 << (SKNLGRP_INET6_TCP_DESTROY - 1);
3892 if (f->families & FAMILY_MASK(AF_INET6) && f->dbs & (1 << UDP_DB))
3893 groups |= 1 << (SKNLGRP_INET6_UDP_DESTROY - 1);
3894
3895 if (groups == 0)
3896 return -1;
3897
3898 if (rtnl_open_byproto(&rth, groups, NETLINK_SOCK_DIAG))
3899 return -1;
3900
3901 rth.dump = 0;
3902 rth.local.nl_pid = 0;
3903
3904 if (rtnl_dump_filter(&rth, generic_show_sock, f))
3905 ret = -1;
3906
3907 rtnl_close(&rth);
3908 return ret;
3909 }
3910
/*
 * Read one integer counter from the SNMP statistics file opened by
 * net_snmp_open().
 *
 * The file is treated as pairs of lines that both start with the same
 * prefix: a header line of space-separated names followed by a line of
 * space-separated values.  The column whose name equals key on the
 * header line starting with proto is located, and the value in the same
 * column of the following line is stored in *result.
 *
 * proto:  line prefix to look for, e.g. "Tcp:".
 * key:    column name to look up.
 * result: receives the value; set to 0 on entry, so it is 0 on failure.
 *
 * Returns 0 on success.  Returns -1 if the file cannot be opened, or with
 * errno set to ESRCH if the counter is not found or is not a number.
 */
static int get_snmp_int(char *proto, char *key, int *result)
{
	char buf[1024];
	FILE *fp;
	size_t protolen = strlen(proto);
	size_t keylen = strlen(key);

	*result = 0;

	fp = net_snmp_open();
	if (fp == NULL)
		return -1;

	while (fgets(buf, sizeof(buf), fp) != NULL) {
		char *p = buf;
		int pos = 0;
		bool found = false;

		/* strncmp stops at the terminator; memcmp would read past it. */
		if (strncmp(buf, proto, protolen))
			continue;

		/* Header line: count columns until the key is reached. */
		while ((p = strchr(p, ' ')) != NULL) {
			pos++;
			p++;
			if (strncmp(p, key, keylen) == 0 &&
			    (p[keylen] == ' ' || p[keylen] == '\n')) {
				found = true;
				break;
			}
		}

		/* Value line: must follow and carry the same prefix. */
		if (fgets(buf, sizeof(buf), fp) == NULL)
			break;
		if (strncmp(buf, proto, protolen))
			break;

		/*
		 * Without this check a missing key would leave pos at the
		 * total column count and the last value would be returned as
		 * if it were the requested counter.
		 */
		if (!found)
			continue;

		p = buf;
		while ((p = strchr(p, ' ')) != NULL) {
			p++;
			if (--pos == 0) {
				int parsed = sscanf(p, "%d", result);

				fclose(fp);
				if (parsed != 1) {
					*result = 0;
					errno = ESRCH;
					return -1;
				}
				return 0;
			}
		}
	}

	fclose(fp);
	errno = ESRCH;
	return -1;
}
3955
3956
3957 /* Get stats from sockstat */
3958
/*
 * Socket counters collected by get_sockstat_line().  Each field is filled
 * from one numeric column of the sockstat line whose identifier is noted
 * beside it.
 */
struct ssummary {
	int socks;		/* "sockets:" 1st value */
	int tcp_mem;		/* "TCP:" 5th value */
	int tcp_total;		/* "TCP:" 4th value */
	int tcp_orphans;	/* "TCP:" 2nd value */
	int tcp_tws;		/* "TCP:" 3rd value */
	int tcp4_hashed;	/* "TCP:" 1st value */
	int udp4;		/* "UDP:" 1st value */
	int raw4;		/* "RAW:" 1st value */
	int frag4;		/* "FRAG:" 1st value */
	int frag4_mem;		/* "FRAG:" 2nd value */
	int tcp6_hashed;	/* "TCP6:" 1st value */
	int udp6;		/* "UDP6:" 1st value */
	int raw6;		/* "RAW6:" 1st value */
	int frag6;		/* "FRAG6:" 1st value */
	int frag6_mem;		/* "FRAG6:" 2nd value */
};

/*
 * Parse one sockstat line of the form "ID: name value [name value ...]"
 * and store the values belonging to a recognised ID in *s.
 *
 * Lines that do not split into an identifier and a remainder, or whose
 * identifier is unknown, are ignored.  Fields whose value cannot be parsed
 * are left unchanged.
 */
static void get_sockstat_line(char *line, struct ssummary *s)
{
	char id[256], rem[256];

	/*
	 * The field widths keep both conversions inside their 256-byte
	 * buffers however long the input line is.
	 */
	if (sscanf(line, "%255[^ ] %255[^\n]\n", id, rem) != 2)
		return;

	/* Each "%*s" skips the label that precedes a numeric value. */
	if (strcmp(id, "sockets:") == 0)
		sscanf(rem, "%*s%d", &s->socks);
	else if (strcmp(id, "UDP:") == 0)
		sscanf(rem, "%*s%d", &s->udp4);
	else if (strcmp(id, "UDP6:") == 0)
		sscanf(rem, "%*s%d", &s->udp6);
	else if (strcmp(id, "RAW:") == 0)
		sscanf(rem, "%*s%d", &s->raw4);
	else if (strcmp(id, "RAW6:") == 0)
		sscanf(rem, "%*s%d", &s->raw6);
	else if (strcmp(id, "TCP6:") == 0)
		sscanf(rem, "%*s%d", &s->tcp6_hashed);
	else if (strcmp(id, "FRAG:") == 0)
		sscanf(rem, "%*s%d%*s%d", &s->frag4, &s->frag4_mem);
	else if (strcmp(id, "FRAG6:") == 0)
		sscanf(rem, "%*s%d%*s%d", &s->frag6, &s->frag6_mem);
	else if (strcmp(id, "TCP:") == 0)
		sscanf(rem, "%*s%d%*s%d%*s%d%*s%d%*s%d",
		       &s->tcp4_hashed,
		       &s->tcp_orphans, &s->tcp_tws, &s->tcp_total, &s->tcp_mem);
}
4005
4006 static int get_sockstat(struct ssummary *s)
4007 {
4008 char buf[256];
4009 FILE *fp;
4010
4011 memset(s, 0, sizeof(*s));
4012
4013 if ((fp = net_sockstat_open()) == NULL)
4014 return -1;
4015 while (fgets(buf, sizeof(buf), fp) != NULL)
4016 get_sockstat_line(buf, s);
4017 fclose(fp);
4018
4019 if ((fp = net_sockstat6_open()) == NULL)
4020 return 0;
4021 while (fgets(buf, sizeof(buf), fp) != NULL)
4022 get_sockstat_line(buf, s);
4023 fclose(fp);
4024
4025 return 0;
4026 }
4027
4028 static int print_summary(void)
4029 {
4030 struct ssummary s;
4031 int tcp_estab;
4032
4033 if (get_sockstat(&s) < 0)
4034 perror("ss: get_sockstat");
4035 if (get_snmp_int("Tcp:", "CurrEstab", &tcp_estab) < 0)
4036 perror("ss: get_snmpstat");
4037
4038 get_slabstat(&slabstat);
4039
4040 printf("Total: %d (kernel %d)\n", s.socks, slabstat.socks);
4041
4042 printf("TCP: %d (estab %d, closed %d, orphaned %d, synrecv %d, timewait %d/%d), ports %d\n",
4043 s.tcp_total + slabstat.tcp_syns + s.tcp_tws,
4044 tcp_estab,
4045 s.tcp_total - (s.tcp4_hashed+s.tcp6_hashed-s.tcp_tws),
4046 s.tcp_orphans,
4047 slabstat.tcp_syns,
4048 s.tcp_tws, slabstat.tcp_tws,
4049 slabstat.tcp_ports
4050 );
4051
4052 printf("\n");
4053 printf("Transport Total IP IPv6\n");
4054 printf("* %-9d %-9s %-9s\n", slabstat.socks, "-", "-");
4055 printf("RAW %-9d %-9d %-9d\n", s.raw4+s.raw6, s.raw4, s.raw6);
4056 printf("UDP %-9d %-9d %-9d\n", s.udp4+s.udp6, s.udp4, s.udp6);
4057 printf("TCP %-9d %-9d %-9d\n", s.tcp4_hashed+s.tcp6_hashed, s.tcp4_hashed, s.tcp6_hashed);
4058 printf("INET %-9d %-9d %-9d\n",
4059 s.raw4+s.udp4+s.tcp4_hashed+
4060 s.raw6+s.udp6+s.tcp6_hashed,
4061 s.raw4+s.udp4+s.tcp4_hashed,
4062 s.raw6+s.udp6+s.tcp6_hashed);
4063 printf("FRAG %-9d %-9d %-9d\n", s.frag4+s.frag6, s.frag4, s.frag6);
4064
4065 printf("\n");
4066
4067 return 0;
4068 }
4069
/*
 * Write the command-line help text to dest.
 *
 * The text is a fixed string with no conversion specifiers, so it is
 * emitted verbatim.
 */
static void _usage(FILE *dest)
{
	static const char usage_text[] =
"Usage: ss [ OPTIONS ]\n"
" ss [ OPTIONS ] [ FILTER ]\n"
" -h, --help this message\n"
" -V, --version output version information\n"
" -n, --numeric don't resolve service names\n"
" -r, --resolve resolve host names\n"
" -a, --all display all sockets\n"
" -l, --listening display listening sockets\n"
" -o, --options show timer information\n"
" -e, --extended show detailed socket information\n"
" -m, --memory show socket memory usage\n"
" -p, --processes show process using socket\n"
" -i, --info show internal TCP information\n"
" -s, --summary show socket usage summary\n"
" -b, --bpf show bpf filter socket information\n"
" -E, --events continually display sockets as they are destroyed\n"
" -Z, --context display process SELinux security contexts\n"
" -z, --contexts display process and socket SELinux security contexts\n"
" -N, --net switch to the specified network namespace name\n"
"\n"
" -4, --ipv4 display only IP version 4 sockets\n"
" -6, --ipv6 display only IP version 6 sockets\n"
" -0, --packet display PACKET sockets\n"
" -t, --tcp display only TCP sockets\n"
" -S, --sctp display only SCTP sockets\n"
" -u, --udp display only UDP sockets\n"
" -d, --dccp display only DCCP sockets\n"
" -w, --raw display only RAW sockets\n"
" -x, --unix display only Unix domain sockets\n"
" --vsock display only vsock sockets\n"
" -f, --family=FAMILY display sockets of type FAMILY\n"
" FAMILY := {inet|inet6|link|unix|netlink|vsock|help}\n"
"\n"
" -K, --kill forcibly close sockets, display what was closed\n"
" -H, --no-header Suppress header line\n"
"\n"
" -A, --query=QUERY, --socket=QUERY\n"
" QUERY := {all|inet|tcp|udp|raw|unix|unix_dgram|unix_stream|unix_seqpacket|packet|netlink|vsock_stream|vsock_dgram}[,QUERY]\n"
"\n"
" -D, --diag=FILE Dump raw information about TCP sockets to FILE\n"
" -F, --filter=FILE read filter information from FILE\n"
" FILTER := [ state STATE-FILTER ] [ EXPRESSION ]\n"
" STATE-FILTER := {all|connected|synchronized|bucket|big|TCP-STATES}\n"
" TCP-STATES := {established|syn-sent|syn-recv|fin-wait-{1,2}|time-wait|closed|close-wait|last-ack|listening|closing}\n"
" connected := {established|syn-sent|syn-recv|fin-wait-{1,2}|time-wait|close-wait|last-ack|closing}\n"
" synchronized := {established|syn-recv|fin-wait-{1,2}|time-wait|close-wait|last-ack|closing}\n"
" bucket := {syn-recv|time-wait}\n"
" big := {established|syn-sent|fin-wait-{1,2}|closed|close-wait|last-ack|listening|closing}\n";

	fputs(usage_text, dest);
}
4123
/*
 * Print the help text to stdout and terminate with exit status 0.
 * Never returns.
 */
static void __attribute__((noreturn)) help(void)
{
	_usage(stdout);
	exit(0);
}
4130
/*
 * Print the help text to stderr and terminate with exit(-1); used for
 * invalid command lines.  Never returns.
 */
static void __attribute__((noreturn)) usage(void)
{
	_usage(stderr);
	exit(-1);
}
4137
4138
4139 static int scan_state(const char *state)
4140 {
4141 static const char * const sstate_namel[] = {
4142 "UNKNOWN",
4143 [SS_ESTABLISHED] = "established",
4144 [SS_SYN_SENT] = "syn-sent",
4145 [SS_SYN_RECV] = "syn-recv",
4146 [SS_FIN_WAIT1] = "fin-wait-1",
4147 [SS_FIN_WAIT2] = "fin-wait-2",
4148 [SS_TIME_WAIT] = "time-wait",
4149 [SS_CLOSE] = "unconnected",
4150 [SS_CLOSE_WAIT] = "close-wait",
4151 [SS_LAST_ACK] = "last-ack",
4152 [SS_LISTEN] = "listening",
4153 [SS_CLOSING] = "closing",
4154 };
4155 int i;
4156
4157 if (strcasecmp(state, "close") == 0 ||
4158 strcasecmp(state, "closed") == 0)
4159 return (1<<SS_CLOSE);
4160 if (strcasecmp(state, "syn-rcv") == 0)
4161 return (1<<SS_SYN_RECV);
4162 if (strcasecmp(state, "established") == 0)
4163 return (1<<SS_ESTABLISHED);
4164 if (strcasecmp(state, "all") == 0)
4165 return SS_ALL;
4166 if (strcasecmp(state, "connected") == 0)
4167 return SS_ALL & ~((1<<SS_CLOSE)|(1<<SS_LISTEN));
4168 if (strcasecmp(state, "synchronized") == 0)
4169 return SS_ALL & ~((1<<SS_CLOSE)|(1<<SS_LISTEN)|(1<<SS_SYN_SENT));
4170 if (strcasecmp(state, "bucket") == 0)
4171 return (1<<SS_SYN_RECV)|(1<<SS_TIME_WAIT);
4172 if (strcasecmp(state, "big") == 0)
4173 return SS_ALL & ~((1<<SS_SYN_RECV)|(1<<SS_TIME_WAIT));
4174 for (i = 0; i < SS_MAX; i++) {
4175 if (strcasecmp(state, sstate_namel[i]) == 0)
4176 return (1<<i);
4177 }
4178
4179 fprintf(stderr, "ss: wrong state name: %s\n", state);
4180 exit(-1);
4181 }
4182
/*
 * --vsock has no short option: 'v' and 'V' are already taken, so it is
 * identified by a value outside the character range.
 */
#define OPT_VSOCK 256

/*
 * Long option table for getopt_long().  Every entry returns its value
 * directly (flag is NULL); the list ends with an all-zero entry.
 */
static const struct option long_opts[] = {
	{ "numeric",	no_argument,	   NULL, 'n' },
	{ "resolve",	no_argument,	   NULL, 'r' },
	{ "options",	no_argument,	   NULL, 'o' },
	{ "extended",	no_argument,	   NULL, 'e' },
	{ "memory",	no_argument,	   NULL, 'm' },
	{ "info",	no_argument,	   NULL, 'i' },
	{ "processes",	no_argument,	   NULL, 'p' },
	{ "bpf",	no_argument,	   NULL, 'b' },
	{ "events",	no_argument,	   NULL, 'E' },
	{ "dccp",	no_argument,	   NULL, 'd' },
	{ "tcp",	no_argument,	   NULL, 't' },
	{ "sctp",	no_argument,	   NULL, 'S' },
	{ "udp",	no_argument,	   NULL, 'u' },
	{ "raw",	no_argument,	   NULL, 'w' },
	{ "unix",	no_argument,	   NULL, 'x' },
	{ "vsock",	no_argument,	   NULL, OPT_VSOCK },
	{ "all",	no_argument,	   NULL, 'a' },
	{ "listening",	no_argument,	   NULL, 'l' },
	{ "ipv4",	no_argument,	   NULL, '4' },
	{ "ipv6",	no_argument,	   NULL, '6' },
	{ "packet",	no_argument,	   NULL, '0' },
	{ "family",	required_argument, NULL, 'f' },
	{ "socket",	required_argument, NULL, 'A' },
	{ "query",	required_argument, NULL, 'A' },
	{ "summary",	no_argument,	   NULL, 's' },
	{ "diag",	required_argument, NULL, 'D' },
	{ "filter",	required_argument, NULL, 'F' },
	{ "version",	no_argument,	   NULL, 'V' },
	{ "help",	no_argument,	   NULL, 'h' },
	{ "context",	no_argument,	   NULL, 'Z' },
	{ "contexts",	no_argument,	   NULL, 'z' },
	{ "net",	required_argument, NULL, 'N' },
	{ "kill",	no_argument,	   NULL, 'K' },
	{ "no-header",	no_argument,	   NULL, 'H' },
	{ NULL, 0, NULL, 0 }
};
4224
4225 int main(int argc, char *argv[])
4226 {
4227 int saw_states = 0;
4228 int saw_query = 0;
4229 int do_summary = 0;
4230 const char *dump_tcpdiag = NULL;
4231 FILE *filter_fp = NULL;
4232 int ch;
4233 int state_filter = 0;
4234 int addrp_width, screen_width = 80;
4235
4236 while ((ch = getopt_long(argc, argv,
4237 "dhaletuwxnro460spbEf:miA:D:F:vVzZN:KHS",
4238 long_opts, NULL)) != EOF) {
4239 switch (ch) {
4240 case 'n':
4241 resolve_services = 0;
4242 break;
4243 case 'r':
4244 resolve_hosts = 1;
4245 break;
4246 case 'o':
4247 show_options = 1;
4248 break;
4249 case 'e':
4250 show_options = 1;
4251 show_details++;
4252 break;
4253 case 'm':
4254 show_mem = 1;
4255 break;
4256 case 'i':
4257 show_tcpinfo = 1;
4258 break;
4259 case 'p':
4260 show_users++;
4261 user_ent_hash_build();
4262 break;
4263 case 'b':
4264 show_options = 1;
4265 show_bpf++;
4266 break;
4267 case 'E':
4268 follow_events = 1;
4269 break;
4270 case 'd':
4271 filter_db_set(&current_filter, DCCP_DB);
4272 break;
4273 case 't':
4274 filter_db_set(&current_filter, TCP_DB);
4275 break;
4276 case 'S':
4277 filter_db_set(&current_filter, SCTP_DB);
4278 break;
4279 case 'u':
4280 filter_db_set(&current_filter, UDP_DB);
4281 break;
4282 case 'w':
4283 filter_db_set(&current_filter, RAW_DB);
4284 break;
4285 case 'x':
4286 filter_af_set(&current_filter, AF_UNIX);
4287 break;
4288 case OPT_VSOCK:
4289 filter_af_set(&current_filter, AF_VSOCK);
4290 break;
4291 case 'a':
4292 state_filter = SS_ALL;
4293 break;
4294 case 'l':
4295 state_filter = (1 << SS_LISTEN) | (1 << SS_CLOSE);
4296 break;
4297 case '4':
4298 filter_af_set(&current_filter, AF_INET);
4299 break;
4300 case '6':
4301 filter_af_set(&current_filter, AF_INET6);
4302 break;
4303 case '0':
4304 filter_af_set(&current_filter, AF_PACKET);
4305 break;
4306 case 'f':
4307 if (strcmp(optarg, "inet") == 0)
4308 filter_af_set(&current_filter, AF_INET);
4309 else if (strcmp(optarg, "inet6") == 0)
4310 filter_af_set(&current_filter, AF_INET6);
4311 else if (strcmp(optarg, "link") == 0)
4312 filter_af_set(&current_filter, AF_PACKET);
4313 else if (strcmp(optarg, "unix") == 0)
4314 filter_af_set(&current_filter, AF_UNIX);
4315 else if (strcmp(optarg, "netlink") == 0)
4316 filter_af_set(&current_filter, AF_NETLINK);
4317 else if (strcmp(optarg, "vsock") == 0)
4318 filter_af_set(&current_filter, AF_VSOCK);
4319 else if (strcmp(optarg, "help") == 0)
4320 help();
4321 else {
4322 fprintf(stderr, "ss: \"%s\" is invalid family\n",
4323 optarg);
4324 usage();
4325 }
4326 break;
4327 case 'A':
4328 {
4329 char *p, *p1;
4330
4331 if (!saw_query) {
4332 current_filter.dbs = 0;
4333 state_filter = state_filter ?
4334 state_filter : SS_CONN;
4335 saw_query = 1;
4336 do_default = 0;
4337 }
4338 p = p1 = optarg;
4339 do {
4340 if ((p1 = strchr(p, ',')) != NULL)
4341 *p1 = 0;
4342 if (strcmp(p, "all") == 0) {
4343 filter_default_dbs(&current_filter);
4344 } else if (strcmp(p, "inet") == 0) {
4345 filter_db_set(&current_filter, UDP_DB);
4346 filter_db_set(&current_filter, DCCP_DB);
4347 filter_db_set(&current_filter, TCP_DB);
4348 filter_db_set(&current_filter, SCTP_DB);
4349 filter_db_set(&current_filter, RAW_DB);
4350 } else if (strcmp(p, "udp") == 0) {
4351 filter_db_set(&current_filter, UDP_DB);
4352 } else if (strcmp(p, "dccp") == 0) {
4353 filter_db_set(&current_filter, DCCP_DB);
4354 } else if (strcmp(p, "tcp") == 0) {
4355 filter_db_set(&current_filter, TCP_DB);
4356 } else if (strcmp(p, "sctp") == 0) {
4357 filter_db_set(&current_filter, SCTP_DB);
4358 } else if (strcmp(p, "raw") == 0) {
4359 filter_db_set(&current_filter, RAW_DB);
4360 } else if (strcmp(p, "unix") == 0) {
4361 filter_db_set(&current_filter, UNIX_ST_DB);
4362 filter_db_set(&current_filter, UNIX_DG_DB);
4363 filter_db_set(&current_filter, UNIX_SQ_DB);
4364 } else if (strcasecmp(p, "unix_stream") == 0 ||
4365 strcmp(p, "u_str") == 0) {
4366 filter_db_set(&current_filter, UNIX_ST_DB);
4367 } else if (strcasecmp(p, "unix_dgram") == 0 ||
4368 strcmp(p, "u_dgr") == 0) {
4369 filter_db_set(&current_filter, UNIX_DG_DB);
4370 } else if (strcasecmp(p, "unix_seqpacket") == 0 ||
4371 strcmp(p, "u_seq") == 0) {
4372 filter_db_set(&current_filter, UNIX_SQ_DB);
4373 } else if (strcmp(p, "packet") == 0) {
4374 filter_db_set(&current_filter, PACKET_R_DB);
4375 filter_db_set(&current_filter, PACKET_DG_DB);
4376 } else if (strcmp(p, "packet_raw") == 0 ||
4377 strcmp(p, "p_raw") == 0) {
4378 filter_db_set(&current_filter, PACKET_R_DB);
4379 } else if (strcmp(p, "packet_dgram") == 0 ||
4380 strcmp(p, "p_dgr") == 0) {
4381 filter_db_set(&current_filter, PACKET_DG_DB);
4382 } else if (strcmp(p, "netlink") == 0) {
4383 filter_db_set(&current_filter, NETLINK_DB);
4384 } else if (strcmp(p, "vsock") == 0) {
4385 filter_db_set(&current_filter, VSOCK_ST_DB);
4386 filter_db_set(&current_filter, VSOCK_DG_DB);
4387 } else if (strcmp(p, "vsock_stream") == 0 ||
4388 strcmp(p, "v_str") == 0) {
4389 filter_db_set(&current_filter, VSOCK_ST_DB);
4390 } else if (strcmp(p, "vsock_dgram") == 0 ||
4391 strcmp(p, "v_dgr") == 0) {
4392 filter_db_set(&current_filter, VSOCK_DG_DB);
4393 } else {
4394 fprintf(stderr, "ss: \"%s\" is illegal socket table id\n", p);
4395 usage();
4396 }
4397 p = p1 + 1;
4398 } while (p1);
4399 break;
4400 }
4401 case 's':
4402 do_summary = 1;
4403 break;
4404 case 'D':
4405 dump_tcpdiag = optarg;
4406 break;
4407 case 'F':
4408 if (filter_fp) {
4409 fprintf(stderr, "More than one filter file\n");
4410 exit(-1);
4411 }
4412 if (optarg[0] == '-')
4413 filter_fp = stdin;
4414 else
4415 filter_fp = fopen(optarg, "r");
4416 if (!filter_fp) {
4417 perror("fopen filter file");
4418 exit(-1);
4419 }
4420 break;
4421 case 'v':
4422 case 'V':
4423 printf("ss utility, iproute2-ss%s\n", SNAPSHOT);
4424 exit(0);
4425 case 'z':
4426 show_sock_ctx++;
4427 /* fall through */
4428 case 'Z':
4429 if (is_selinux_enabled() <= 0) {
4430 fprintf(stderr, "ss: SELinux is not enabled.\n");
4431 exit(1);
4432 }
4433 show_proc_ctx++;
4434 user_ent_hash_build();
4435 break;
4436 case 'N':
4437 if (netns_switch(optarg))
4438 exit(1);
4439 break;
4440 case 'K':
4441 current_filter.kill = 1;
4442 break;
4443 case 'H':
4444 show_header = 0;
4445 break;
4446 case 'h':
4447 help();
4448 case '?':
4449 default:
4450 usage();
4451 }
4452 }
4453
4454 argc -= optind;
4455 argv += optind;
4456
4457 if (do_summary) {
4458 print_summary();
4459 if (do_default && argc == 0)
4460 exit(0);
4461 }
4462
4463 while (argc > 0) {
4464 if (strcmp(*argv, "state") == 0) {
4465 NEXT_ARG();
4466 if (!saw_states)
4467 state_filter = 0;
4468 state_filter |= scan_state(*argv);
4469 saw_states = 1;
4470 } else if (strcmp(*argv, "exclude") == 0 ||
4471 strcmp(*argv, "excl") == 0) {
4472 NEXT_ARG();
4473 if (!saw_states)
4474 state_filter = SS_ALL;
4475 state_filter &= ~scan_state(*argv);
4476 saw_states = 1;
4477 } else {
4478 break;
4479 }
4480 argc--; argv++;
4481 }
4482
4483 if (do_default) {
4484 state_filter = state_filter ? state_filter : SS_CONN;
4485 filter_default_dbs(&current_filter);
4486 }
4487
4488 filter_states_set(&current_filter, state_filter);
4489 filter_merge_defaults(&current_filter);
4490
4491 if (resolve_services && resolve_hosts &&
4492 (current_filter.dbs & (UNIX_DBM|INET_L4_DBM)))
4493 init_service_resolver();
4494
4495 if (current_filter.dbs == 0) {
4496 fprintf(stderr, "ss: no socket tables to show with such filter.\n");
4497 exit(0);
4498 }
4499 if (current_filter.families == 0) {
4500 fprintf(stderr, "ss: no families to show with such filter.\n");
4501 exit(0);
4502 }
4503 if (current_filter.states == 0) {
4504 fprintf(stderr, "ss: no socket states to show with such filter.\n");
4505 exit(0);
4506 }
4507
4508 if (dump_tcpdiag) {
4509 FILE *dump_fp = stdout;
4510
4511 if (!(current_filter.dbs & (1<<TCP_DB))) {
4512 fprintf(stderr, "ss: tcpdiag dump requested and no tcp in filter.\n");
4513 exit(0);
4514 }
4515 if (dump_tcpdiag[0] != '-') {
4516 dump_fp = fopen(dump_tcpdiag, "w");
4517 if (!dump_tcpdiag) {
4518 perror("fopen dump file");
4519 exit(-1);
4520 }
4521 }
4522 inet_show_netlink(&current_filter, dump_fp, IPPROTO_TCP);
4523 fflush(dump_fp);
4524 exit(0);
4525 }
4526
4527 if (ssfilter_parse(&current_filter.f, argc, argv, filter_fp))
4528 usage();
4529
4530 netid_width = 0;
4531 if (current_filter.dbs&(current_filter.dbs-1))
4532 netid_width = 5;
4533
4534 state_width = 0;
4535 if (current_filter.states&(current_filter.states-1))
4536 state_width = 10;
4537
4538 if (isatty(STDOUT_FILENO)) {
4539 struct winsize w;
4540
4541 if (ioctl(STDOUT_FILENO, TIOCGWINSZ, &w) != -1) {
4542 if (w.ws_col > 0)
4543 screen_width = w.ws_col;
4544 }
4545 }
4546
4547 addrp_width = screen_width;
4548 if (netid_width)
4549 addrp_width -= netid_width + 1;
4550 if (state_width)
4551 addrp_width -= state_width + 1;
4552 addrp_width -= 14;
4553
4554 if (addrp_width&1) {
4555 if (netid_width)
4556 netid_width++;
4557 else if (state_width)
4558 state_width++;
4559 else
4560 odd_width_pad = " ";
4561 }
4562
4563 addrp_width /= 2;
4564 addrp_width--;
4565
4566 serv_width = resolve_services ? 7 : 5;
4567
4568 if (addrp_width < 15+serv_width+1)
4569 addrp_width = 15+serv_width+1;
4570
4571 addr_width = addrp_width - serv_width - 1;
4572
4573 if (show_header) {
4574 if (netid_width)
4575 printf("%-*s ", netid_width, "Netid");
4576 if (state_width)
4577 printf("%-*s ", state_width, "State");
4578 printf("%-6s %-6s %s", "Recv-Q", "Send-Q", odd_width_pad);
4579 }
4580
4581 /* Make enough space for the local/remote port field */
4582 addr_width -= 13;
4583 serv_width += 13;
4584
4585 if (show_header) {
4586 printf("%*s:%-*s %*s:%-*s\n",
4587 addr_width, "Local Address", serv_width, "Port",
4588 addr_width, "Peer Address", serv_width, "Port");
4589 }
4590
4591 fflush(stdout);
4592
4593 if (follow_events)
4594 exit(handle_follow_request(&current_filter));
4595
4596 if (current_filter.dbs & (1<<NETLINK_DB))
4597 netlink_show(&current_filter);
4598 if (current_filter.dbs & PACKET_DBM)
4599 packet_show(&current_filter);
4600 if (current_filter.dbs & UNIX_DBM)
4601 unix_show(&current_filter);
4602 if (current_filter.dbs & (1<<RAW_DB))
4603 raw_show(&current_filter);
4604 if (current_filter.dbs & (1<<UDP_DB))
4605 udp_show(&current_filter);
4606 if (current_filter.dbs & (1<<TCP_DB))
4607 tcp_show(&current_filter);
4608 if (current_filter.dbs & (1<<DCCP_DB))
4609 dccp_show(&current_filter);
4610 if (current_filter.dbs & (1<<SCTP_DB))
4611 sctp_show(&current_filter);
4612 if (current_filter.dbs & VSOCK_DBM)
4613 vsock_show(&current_filter);
4614
4615 if (show_users || show_proc_ctx || show_sock_ctx)
4616 user_ent_destroy();
4617
4618 return 0;
4619 }