]> git.proxmox.com Git - mirror_iproute2.git/blob - misc/ss.c
a7d3b89e1478c6cc2b57da86da0849223b4ca53d
[mirror_iproute2.git] / misc / ss.c
1 /*
2 * ss.c "sockstat", socket statistics
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 */
11
12 #include <stdio.h>
13 #include <stdlib.h>
14 #include <unistd.h>
15 #include <fcntl.h>
16 #include <sys/ioctl.h>
17 #include <sys/socket.h>
18 #include <sys/uio.h>
19 #include <netinet/in.h>
20 #include <string.h>
21 #include <errno.h>
22 #include <netdb.h>
23 #include <arpa/inet.h>
24 #include <dirent.h>
25 #include <fnmatch.h>
26 #include <getopt.h>
27 #include <stdbool.h>
28 #include <limits.h>
29 #include <stdarg.h>
30
31 #include "utils.h"
32 #include "rt_names.h"
33 #include "ll_map.h"
34 #include "libnetlink.h"
35 #include "namespace.h"
36 #include "SNAPSHOT.h"
37
38 #include <linux/tcp.h>
39 #include <linux/sock_diag.h>
40 #include <linux/inet_diag.h>
41 #include <linux/unix_diag.h>
42 #include <linux/netdevice.h> /* for MAX_ADDR_LEN */
43 #include <linux/filter.h>
44 #include <linux/packet_diag.h>
45 #include <linux/netlink_diag.h>
46 #include <linux/sctp.h>
47 #include <linux/vm_sockets_diag.h>
48
/* Sequence number placed in every request header built by DIAG_REQUEST(). */
#define MAGIC_SEQ 123456

/*
 * Declare and initialise a request object named _req: a struct nlmsghdr
 * followed by the caller-supplied member declaration _r. The header is
 * filled in as a SOCK_DIAG_BY_FAMILY request with the ROOT|MATCH flags and
 * the length of the whole object.
 */
#define DIAG_REQUEST(_req, _r)						\
	struct {							\
		struct nlmsghdr nlh;					\
		_r;							\
	} _req = {							\
		.nlh = {						\
			.nlmsg_len = sizeof(_req),			\
			.nlmsg_type = SOCK_DIAG_BY_FAMILY,		\
			.nlmsg_flags = NLM_F_REQUEST | NLM_F_ROOT |	\
				       NLM_F_MATCH,			\
			.nlmsg_seq = MAGIC_SEQ,				\
		},							\
	}
63
#if HAVE_SELINUX
#include <selinux/selinux.h>
#else
/*
 * Fallbacks used when built without SELinux support. They keep the
 * signatures the rest of this file calls, always report failure (-1) and,
 * where a context pointer is returned, set it to NULL.
 */
static int ss_selinux_unavailable(char **context)
{
	*context = NULL;
	return -1;
}

static int is_selinux_enabled(void)
{
	return -1;
}

static int getpidcon(pid_t pid, char **context)
{
	return ss_selinux_unavailable(context);
}

static int getfilecon(char *path, char **context)
{
	return ss_selinux_unavailable(context);
}

static int security_get_initial_context(char *name, char **context)
{
	return ss_selinux_unavailable(context);
}
#endif
91
/* Name resolution: non-zero lets resolve_service() look ports up by name. */
int resolve_services = 1;
/* Last address family selected through filter_af_set(). */
int preferred_family = AF_UNSPEC;

/* Display switches; all start out as zero except show_header. */
int show_options;
int show_details;
int show_users;
int show_mem;
int show_tcpinfo;
int show_bpf;
int show_proc_ctx;
int show_sock_ctx;
int show_header = 1;
int follow_events;

/* Inode that is_sctp_assoc() compares each socket against. */
int sctp_ino;

/* Column widths used by sock_state_print() and sock_addr_print(). */
int netid_width;
int state_width;
int addr_width;
int serv_width;
/* Printed after the two queue columns by sock_state_print(). */
char *odd_width_pad = "";

/*
 * Protocol names. The service caches store and compare these pointers
 * themselves (not the string contents), so each name has exactly one object.
 */
static const char *TCP_PROTO = "tcp";
static const char *SCTP_PROTO = "sctp";
static const char *UDP_PROTO = "udp";
static const char *RAW_PROTO = "raw";
/* Protocol the service resolver is currently working for. */
static const char *dg_proto;
117
/*
 * Socket tables that can be selected. Each value is used as a bit position
 * in struct filter's dbs mask (see filter_db_set()).
 */
enum {
	TCP_DB = 0,
	DCCP_DB,
	UDP_DB,
	RAW_DB,
	UNIX_DG_DB,
	UNIX_ST_DB,
	UNIX_SQ_DB,
	PACKET_DG_DB,
	PACKET_R_DB,
	NETLINK_DB,
	SCTP_DB,
	VSOCK_ST_DB,
	VSOCK_DG_DB,
	MAX_DB		/* number of tables; not a table itself */
};

/* Convenience masks built from the table bits above. */
#define ALL_DB		((1<<MAX_DB)-1)
#define UNIX_DBM	((1<<UNIX_DG_DB)|(1<<UNIX_ST_DB)|(1<<UNIX_SQ_DB))
#define PACKET_DBM	((1<<PACKET_DG_DB)|(1<<PACKET_R_DB))
#define VSOCK_DBM	((1<<VSOCK_ST_DB)|(1<<VSOCK_DG_DB))
#define INET_L4_DBM	((1<<TCP_DB)|(1<<UDP_DB)|(1<<DCCP_DB)|(1<<SCTP_DB))
#define INET_DBM	(INET_L4_DBM | (1<<RAW_DB))
141
/*
 * Socket states. Values index sstate_name[] in sock_state_print() and are
 * used as bit positions in state masks.
 */
enum {
	SS_UNKNOWN = 0,
	SS_ESTABLISHED,
	SS_SYN_SENT,
	SS_SYN_RECV,
	SS_FIN_WAIT1,
	SS_FIN_WAIT2,
	SS_TIME_WAIT,
	SS_CLOSE,
	SS_CLOSE_WAIT,
	SS_LAST_ACK,
	SS_LISTEN,
	SS_CLOSING,
	SS_MAX		/* number of states */
};

/* SCTP association states; values index sctp_sstate_name[]. */
enum {
	SCTP_STATE_CLOSED,
	SCTP_STATE_COOKIE_WAIT,
	SCTP_STATE_COOKIE_ECHOED,
	SCTP_STATE_ESTABLISHED,
	SCTP_STATE_SHUTDOWN_PENDING,
	SCTP_STATE_SHUTDOWN_SENT,
	SCTP_STATE_SHUTDOWN_RECEIVED,
	SCTP_STATE_SHUTDOWN_ACK_SENT,
};

/* Every state bit. */
#define SS_ALL ((1 << SS_MAX) - 1)
/* Every state except LISTEN, CLOSE, TIME_WAIT and SYN_RECV. */
#define SS_CONN (SS_ALL & ~((1<<SS_LISTEN)|(1<<SS_CLOSE)|(1<<SS_TIME_WAIT)|(1<<SS_SYN_RECV)))
171
172 #include "ssfilter.h"
173
/* Selection of what to dump. */
struct filter {
	int		dbs;		/* mask of (1 << *_DB) table bits */
	int		states;		/* mask of (1 << SS_*) state bits */
	uint64_t	families;	/* mask of FAMILY_MASK(AF_*) bits */
	struct ssfilter	*f;		/* presumably the parsed filter expression — confirm at use sites */
	bool		kill;
};

/* Bit representing one address family in struct filter's families mask. */
#define FAMILY_MASK(family) ((uint64_t)1 << (family))
183
184 static const struct filter default_dbs[MAX_DB] = {
185 [TCP_DB] = {
186 .states = SS_CONN,
187 .families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
188 },
189 [DCCP_DB] = {
190 .states = SS_CONN,
191 .families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
192 },
193 [UDP_DB] = {
194 .states = (1 << SS_ESTABLISHED),
195 .families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
196 },
197 [RAW_DB] = {
198 .states = (1 << SS_ESTABLISHED),
199 .families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
200 },
201 [UNIX_DG_DB] = {
202 .states = (1 << SS_CLOSE),
203 .families = FAMILY_MASK(AF_UNIX),
204 },
205 [UNIX_ST_DB] = {
206 .states = SS_CONN,
207 .families = FAMILY_MASK(AF_UNIX),
208 },
209 [UNIX_SQ_DB] = {
210 .states = SS_CONN,
211 .families = FAMILY_MASK(AF_UNIX),
212 },
213 [PACKET_DG_DB] = {
214 .states = (1 << SS_CLOSE),
215 .families = FAMILY_MASK(AF_PACKET),
216 },
217 [PACKET_R_DB] = {
218 .states = (1 << SS_CLOSE),
219 .families = FAMILY_MASK(AF_PACKET),
220 },
221 [NETLINK_DB] = {
222 .states = (1 << SS_CLOSE),
223 .families = FAMILY_MASK(AF_NETLINK),
224 },
225 [SCTP_DB] = {
226 .states = SS_CONN,
227 .families = FAMILY_MASK(AF_INET) | FAMILY_MASK(AF_INET6),
228 },
229 [VSOCK_ST_DB] = {
230 .states = SS_CONN,
231 .families = FAMILY_MASK(AF_VSOCK),
232 },
233 [VSOCK_DG_DB] = {
234 .states = SS_CONN,
235 .families = FAMILY_MASK(AF_VSOCK),
236 },
237 };
238
239 static const struct filter default_afs[AF_MAX] = {
240 [AF_INET] = {
241 .dbs = INET_DBM,
242 .states = SS_CONN,
243 },
244 [AF_INET6] = {
245 .dbs = INET_DBM,
246 .states = SS_CONN,
247 },
248 [AF_UNIX] = {
249 .dbs = UNIX_DBM,
250 .states = SS_CONN,
251 },
252 [AF_PACKET] = {
253 .dbs = PACKET_DBM,
254 .states = (1 << SS_CLOSE),
255 },
256 [AF_NETLINK] = {
257 .dbs = (1 << NETLINK_DB),
258 .states = (1 << SS_CLOSE),
259 },
260 [AF_VSOCK] = {
261 .dbs = VSOCK_DBM,
262 .states = SS_CONN,
263 },
264 };
265
266 static int do_default = 1;
267 static struct filter current_filter;
268
269 static void filter_db_set(struct filter *f, int db)
270 {
271 f->states |= default_dbs[db].states;
272 f->dbs |= 1 << db;
273 do_default = 0;
274 }
275
276 static void filter_af_set(struct filter *f, int af)
277 {
278 f->states |= default_afs[af].states;
279 f->families |= FAMILY_MASK(af);
280 do_default = 0;
281 preferred_family = af;
282 }
283
284 static int filter_af_get(struct filter *f, int af)
285 {
286 return !!(f->families & FAMILY_MASK(af));
287 }
288
289 static void filter_default_dbs(struct filter *f)
290 {
291 filter_db_set(f, UDP_DB);
292 filter_db_set(f, DCCP_DB);
293 filter_db_set(f, TCP_DB);
294 filter_db_set(f, RAW_DB);
295 filter_db_set(f, UNIX_ST_DB);
296 filter_db_set(f, UNIX_DG_DB);
297 filter_db_set(f, UNIX_SQ_DB);
298 filter_db_set(f, PACKET_R_DB);
299 filter_db_set(f, PACKET_DG_DB);
300 filter_db_set(f, NETLINK_DB);
301 filter_db_set(f, SCTP_DB);
302 filter_db_set(f, VSOCK_ST_DB);
303 filter_db_set(f, VSOCK_DG_DB);
304 }
305
306 static void filter_states_set(struct filter *f, int states)
307 {
308 if (states)
309 f->states = states;
310 }
311
312 static void filter_merge_defaults(struct filter *f)
313 {
314 int db;
315 int af;
316
317 for (db = 0; db < MAX_DB; db++) {
318 if (!(f->dbs & (1 << db)))
319 continue;
320
321 if (!(default_dbs[db].families & f->families))
322 f->families |= default_dbs[db].families;
323 }
324 for (af = 0; af < AF_MAX; af++) {
325 if (!(f->families & FAMILY_MASK(af)))
326 continue;
327
328 if (!(default_afs[af].dbs & f->dbs))
329 f->dbs |= default_afs[af].dbs;
330 }
331 }
332
/*
 * Open a procfs-style file for reading.
 *
 * @env:  name of an environment variable; when set, its value is used as the
 *        complete path of the file to open.
 * @name: path relative to the proc root, used when @env is not set. The
 *        root is $PROC_ROOT if set, "/proc" otherwise.
 *
 * Returns the stream from fopen(), or NULL on failure. If the composed path
 * does not fit the local buffer, NULL is returned with errno set to
 * ENAMETOOLONG rather than opening a truncated, unrelated path.
 */
static FILE *generic_proc_open(const char *env, const char *name)
{
	const char *p = getenv(env);
	char store[1024];

	if (!p) {
		const char *root = getenv("PROC_ROOT") ? : "/proc";
		int n = snprintf(store, sizeof(store), "%s/%s", root, name);

		if (n < 0 || (size_t)n >= sizeof(store)) {
			errno = ENAMETOOLONG;
			return NULL;
		}
		p = store;
	}

	return fopen(p, "r");
}
/*
 * One opener per procfs file. The first argument of generic_proc_open() is
 * an environment variable that overrides the whole path; the second is the
 * path below the proc root.
 */
#define net_tcp_open()		generic_proc_open("PROC_NET_TCP", "net/tcp")
#define net_tcp6_open()		generic_proc_open("PROC_NET_TCP6", "net/tcp6")
#define net_udp_open()		generic_proc_open("PROC_NET_UDP", "net/udp")
#define net_udp6_open()		generic_proc_open("PROC_NET_UDP6", "net/udp6")
#define net_raw_open()		generic_proc_open("PROC_NET_RAW", "net/raw")
#define net_raw6_open()		generic_proc_open("PROC_NET_RAW6", "net/raw6")
#define net_unix_open()		generic_proc_open("PROC_NET_UNIX", "net/unix")
#define net_packet_open()	generic_proc_open("PROC_NET_PACKET", "net/packet")
#define net_netlink_open()	generic_proc_open("PROC_NET_NETLINK", "net/netlink")
#define slabinfo_open()		generic_proc_open("PROC_SLABINFO", "slabinfo")
#define net_sockstat_open()	generic_proc_open("PROC_NET_SOCKSTAT", "net/sockstat")
#define net_sockstat6_open()	generic_proc_open("PROC_NET_SOCKSTAT6", "net/sockstat6")
#define net_snmp_open()		generic_proc_open("PROC_NET_SNMP", "net/snmp")
#define ephemeral_ports_open()	\
	generic_proc_open("PROC_IP_LOCAL_PORT_RANGE", \
			  "sys/net/ipv4/ip_local_port_range")
365
/*
 * One open socket file descriptor found under <proc root>/<pid>/fd by
 * user_ent_hash_build(). Entries are chained per hash bucket; the three
 * strings are heap copies owned by the entry.
 */
struct user_ent {
	struct user_ent	*next;		/* next entry in the same bucket */
	unsigned int	ino;		/* socket inode, the lookup key */
	int		pid;		/* owning process */
	int		fd;		/* descriptor number within that process */
	char		*process;	/* name read from <pid>/stat */
	char		*process_ctx;	/* getpidcon() result or "unavailable" */
	char		*socket_ctx;	/* getfilecon() result or "unavailable" */
};
375
/* Number of buckets; the hash function masks with SIZE - 1. */
#define USER_ENT_HASH_SIZE 256
struct user_ent *user_ent_hash[USER_ENT_HASH_SIZE];

/* Fold the four bytes of ino together and reduce to a bucket index. */
static int user_ent_hashfn(unsigned int ino)
{
	unsigned int folded = ino;

	folded ^= ino >> 8;
	folded ^= ino >> 16;
	folded ^= ino >> 24;

	return folded & (USER_ENT_HASH_SIZE - 1);
}
385
386 static void user_ent_add(unsigned int ino, char *process,
387 int pid, int fd,
388 char *proc_ctx,
389 char *sock_ctx)
390 {
391 struct user_ent *p, **pp;
392
393 p = malloc(sizeof(struct user_ent));
394 if (!p) {
395 fprintf(stderr, "ss: failed to malloc buffer\n");
396 abort();
397 }
398 p->next = NULL;
399 p->ino = ino;
400 p->pid = pid;
401 p->fd = fd;
402 p->process = strdup(process);
403 p->process_ctx = strdup(proc_ctx);
404 p->socket_ctx = strdup(sock_ctx);
405
406 pp = &user_ent_hash[user_ent_hashfn(ino)];
407 p->next = *pp;
408 *pp = p;
409 }
410
411 static void user_ent_destroy(void)
412 {
413 struct user_ent *p, *p_next;
414 int cnt = 0;
415
416 while (cnt != USER_ENT_HASH_SIZE) {
417 p = user_ent_hash[cnt];
418 while (p) {
419 free(p->process);
420 free(p->process_ctx);
421 free(p->socket_ctx);
422 p_next = p->next;
423 free(p);
424 p = p_next;
425 }
426 cnt++;
427 }
428 }
429
/*
 * Populate user_ent_hash with every socket descriptor visible under the
 * proc root ($PROC_ROOT, default "/proc/").
 *
 * For each numeric directory <pid>, every numeric entry in <pid>/fd whose
 * link target starts with "socket:[" is recorded through user_ent_add()
 * together with the process name taken from <pid>/stat and the process and
 * socket contexts ("unavailable" when they cannot be obtained).
 *
 * Only the first call does any work; later calls return immediately.
 */
static void user_ent_hash_build(void)
{
	const char *root = getenv("PROC_ROOT") ? : "/proc/";
	struct dirent *d;
	char name[1024];
	int nameoff;
	DIR *dir;
	char *pid_context;
	char *sock_context;
	const char *no_ctx = "unavailable";
	static int user_ent_hash_build_init;

	/* If show_users & show_proc_ctx set only do this once */
	if (user_ent_hash_build_init != 0)
		return;

	user_ent_hash_build_init = 1;

	strlcpy(name, root, sizeof(name));

	nameoff = strlen(name);
	if (nameoff == 0 || name[nameoff - 1] != '/') {
		/* a root that fills the buffer leaves no room for the '/' */
		if ((size_t)nameoff + 1 >= sizeof(name))
			return;
		name[nameoff++] = '/';
		name[nameoff] = '\0';
	}

	dir = opendir(name);
	if (!dir)
		return;

	while ((d = readdir(dir)) != NULL) {
		struct dirent *d1;
		char process[16];
		int pid, pos;
		DIR *dir1;
		char crap;

		/* only purely numeric names are process directories */
		if (sscanf(d->d_name, "%d%c", &pid, &crap) != 1)
			continue;

		if (getpidcon(pid, &pid_context) != 0)
			pid_context = strdup(no_ctx);

		snprintf(name + nameoff, sizeof(name) - nameoff, "%d/fd/", pid);
		pos = strlen(name);
		if ((dir1 = opendir(name)) == NULL) {
			free(pid_context);
			continue;
		}

		/* filled in lazily, on the first socket found for this pid */
		process[0] = '\0';

		while ((d1 = readdir(dir1)) != NULL) {
			const char *pattern = "socket:[";
			unsigned int ino;
			char lnk[64];
			int fd;
			ssize_t link_len;
			char tmp[1024];

			if (sscanf(d1->d_name, "%d%c", &fd, &crap) != 1)
				continue;

			snprintf(name+pos, sizeof(name) - pos, "%d", fd);

			link_len = readlink(name, lnk, sizeof(lnk)-1);
			if (link_len == -1)
				continue;
			lnk[link_len] = '\0';

			if (strncmp(lnk, pattern, strlen(pattern)))
				continue;

			/* skip targets with no parsable inode instead of
			 * recording an uninitialised value */
			if (sscanf(lnk, "socket:[%u]", &ino) != 1)
				continue;

			snprintf(tmp, sizeof(tmp), "%s/%d/fd/%s",
					root, pid, d1->d_name);

			if (getfilecon(tmp, &sock_context) <= 0)
				sock_context = strdup(no_ctx);

			if (process[0] == '\0') {
				FILE *fp;

				snprintf(tmp, sizeof(tmp), "%s/%d/stat",
					root, pid);
				if ((fp = fopen(tmp, "r")) != NULL) {
					/* width keeps the name within
					 * process[16] */
					if (fscanf(fp, "%*d (%15[^)])", process) < 1)
						; /* ignore */
					fclose(fp);
				}
			}
			user_ent_add(ino, process, pid, fd,
					pid_context, sock_context);
			free(sock_context);
		}
		free(pid_context);
		closedir(dir1);
	}
	closedir(dir);
}
532
/* Output formats understood by find_entry(). */
enum entry_types {
	USERS = 0,	/* process name, pid, fd */
	PROC_CTX,	/* as USERS plus the process context */
	PROC_SOCK_CTX	/* as PROC_CTX plus the socket context */
};
538
539 #define ENTRY_BUF_SIZE 512
540 static int find_entry(unsigned int ino, char **buf, int type)
541 {
542 struct user_ent *p;
543 int cnt = 0;
544 char *ptr;
545 char *new_buf;
546 int len, new_buf_len;
547 int buf_used = 0;
548 int buf_len = 0;
549
550 if (!ino)
551 return 0;
552
553 p = user_ent_hash[user_ent_hashfn(ino)];
554 ptr = *buf = NULL;
555 while (p) {
556 if (p->ino != ino)
557 goto next;
558
559 while (1) {
560 ptr = *buf + buf_used;
561 switch (type) {
562 case USERS:
563 len = snprintf(ptr, buf_len - buf_used,
564 "(\"%s\",pid=%d,fd=%d),",
565 p->process, p->pid, p->fd);
566 break;
567 case PROC_CTX:
568 len = snprintf(ptr, buf_len - buf_used,
569 "(\"%s\",pid=%d,proc_ctx=%s,fd=%d),",
570 p->process, p->pid,
571 p->process_ctx, p->fd);
572 break;
573 case PROC_SOCK_CTX:
574 len = snprintf(ptr, buf_len - buf_used,
575 "(\"%s\",pid=%d,proc_ctx=%s,fd=%d,sock_ctx=%s),",
576 p->process, p->pid,
577 p->process_ctx, p->fd,
578 p->socket_ctx);
579 break;
580 default:
581 fprintf(stderr, "ss: invalid type: %d\n", type);
582 abort();
583 }
584
585 if (len < 0 || len >= buf_len - buf_used) {
586 new_buf_len = buf_len + ENTRY_BUF_SIZE;
587 new_buf = realloc(*buf, new_buf_len);
588 if (!new_buf) {
589 fprintf(stderr, "ss: failed to malloc buffer\n");
590 abort();
591 }
592 *buf = new_buf;
593 buf_len = new_buf_len;
594 continue;
595 } else {
596 buf_used += len;
597 break;
598 }
599 }
600 cnt++;
601 next:
602 p = p->next;
603 }
604 if (buf_used) {
605 ptr = *buf + buf_used;
606 ptr[-1] = '\0';
607 }
608 return cnt;
609 }
610
/*
 * Counters read from slabinfo.
 *
 * get_slabstat() fills this structure by index, treating it as an array of
 * int, so the members must stay all-int and in the same order as its
 * slabstat_ids[] table.
 */
struct slabstat {
	int	socks;
	int	tcp_ports;
	int	tcp_tws;
	int	tcp_syns;
	int	skbs;
};

static struct slabstat slabstat;
622
623 static int get_slabstat(struct slabstat *s)
624 {
625 char buf[256];
626 FILE *fp;
627 int cnt;
628 static int slabstat_valid;
629 static const char * const slabstat_ids[] = {
630 "sock",
631 "tcp_bind_bucket",
632 "tcp_tw_bucket",
633 "tcp_open_request",
634 "skbuff_head_cache",
635 };
636
637 if (slabstat_valid)
638 return 0;
639
640 memset(s, 0, sizeof(*s));
641
642 fp = slabinfo_open();
643 if (!fp)
644 return -1;
645
646 cnt = sizeof(*s)/sizeof(int);
647
648 if (!fgets(buf, sizeof(buf), fp)) {
649 fclose(fp);
650 return -1;
651 }
652 while (fgets(buf, sizeof(buf), fp) != NULL) {
653 int i;
654
655 for (i = 0; i < ARRAY_SIZE(slabstat_ids); i++) {
656 if (memcmp(buf, slabstat_ids[i], strlen(slabstat_ids[i])) == 0) {
657 sscanf(buf, "%*s%d", ((int *)s) + i);
658 cnt--;
659 break;
660 }
661 }
662 if (cnt <= 0)
663 break;
664 }
665
666 slabstat_valid = 1;
667
668 fclose(fp);
669 return 0;
670 }
671
/* Combine a two-word cookie into one value: cookie[1] high, cookie[0] low. */
static unsigned long long cookie_sk_get(const uint32_t *cookie)
{
	unsigned long long hi = cookie[1];
	unsigned long long lo = cookie[0];

	return (hi << 32) | lo;
}
676
677 static const char *sctp_sstate_name[] = {
678 [SCTP_STATE_CLOSED] = "CLOSED",
679 [SCTP_STATE_COOKIE_WAIT] = "COOKIE_WAIT",
680 [SCTP_STATE_COOKIE_ECHOED] = "COOKIE_ECHOED",
681 [SCTP_STATE_ESTABLISHED] = "ESTAB",
682 [SCTP_STATE_SHUTDOWN_PENDING] = "SHUTDOWN_PENDING",
683 [SCTP_STATE_SHUTDOWN_SENT] = "SHUTDOWN_SENT",
684 [SCTP_STATE_SHUTDOWN_RECEIVED] = "SHUTDOWN_RECEIVED",
685 [SCTP_STATE_SHUTDOWN_ACK_SENT] = "ACK_SENT",
686 };
687
688 struct sockstat {
689 struct sockstat *next;
690 unsigned int type;
691 uint16_t prot;
692 uint16_t raw_prot;
693 inet_prefix local;
694 inet_prefix remote;
695 int lport;
696 int rport;
697 int state;
698 int rq, wq;
699 unsigned int ino;
700 unsigned int uid;
701 int refcnt;
702 unsigned int iface;
703 unsigned long long sk;
704 char *name;
705 char *peer_name;
706 __u32 mark;
707 };
708
/* DCTCP details that a struct tcpstat can point to. */
struct dctcpstat {
	unsigned int	ce_state;
	unsigned int	alpha;
	unsigned int	ab_ecn;
	unsigned int	ab_tot;
	bool		enabled;
};
716
717 struct tcpstat {
718 struct sockstat ss;
719 unsigned int timer;
720 unsigned int timeout;
721 int probes;
722 char cong_alg[16];
723 double rto, ato, rtt, rttvar;
724 int qack, ssthresh, backoff;
725 double send_bps;
726 int snd_wscale;
727 int rcv_wscale;
728 int mss;
729 int rcv_mss;
730 int advmss;
731 unsigned int cwnd;
732 unsigned int lastsnd;
733 unsigned int lastrcv;
734 unsigned int lastack;
735 double pacing_rate;
736 double pacing_rate_max;
737 double delivery_rate;
738 unsigned long long bytes_acked;
739 unsigned long long bytes_received;
740 unsigned int segs_out;
741 unsigned int segs_in;
742 unsigned int data_segs_out;
743 unsigned int data_segs_in;
744 unsigned int unacked;
745 unsigned int retrans;
746 unsigned int retrans_total;
747 unsigned int lost;
748 unsigned int sacked;
749 unsigned int fackets;
750 unsigned int reordering;
751 unsigned int not_sent;
752 double rcv_rtt;
753 double min_rtt;
754 int rcv_space;
755 unsigned int rcv_ssthresh;
756 unsigned long long busy_time;
757 unsigned long long rwnd_limited;
758 unsigned long long sndbuf_limited;
759 bool has_ts_opt;
760 bool has_sack_opt;
761 bool has_ecn_opt;
762 bool has_ecnseen_opt;
763 bool has_fastopen_opt;
764 bool has_wscale_opt;
765 bool app_limited;
766 struct dctcpstat *dctcp;
767 struct tcp_bbr_info *bbr_info;
768 };
769
770 /* SCTP assocs share the same inode number with their parent endpoint. So if we
771 * have seen the inode number before, it must be an assoc instead of the next
772 * endpoint. */
773 static bool is_sctp_assoc(struct sockstat *s, const char *sock_name)
774 {
775 if (strcmp(sock_name, "sctp"))
776 return false;
777 if (!sctp_ino || sctp_ino != s->ino)
778 return false;
779 return true;
780 }
781
/*
 * Netid label for a unix socket of the given SOCK_* type. Any type other
 * than stream or seqpacket is labelled as a datagram socket.
 */
static const char *unix_netid_name(int type)
{
	if (type == SOCK_STREAM)
		return "u_str";
	if (type == SOCK_SEQPACKET)
		return "u_seq";

	return "u_dgr";
}
794
/*
 * Netid label for an inet socket of the given IP protocol number. Protocol
 * 0 is labelled "raw"; protocols not in the table yield "???".
 */
static const char *proto_name(int protocol)
{
	static const struct {
		int		proto;
		const char	*label;
	} known[] = {
		{ 0,			"raw" },
		{ IPPROTO_UDP,		"udp" },
		{ IPPROTO_TCP,		"tcp" },
		{ IPPROTO_SCTP,		"sctp" },
		{ IPPROTO_DCCP,		"dccp" },
		{ IPPROTO_ICMPV6,	"icmp6" },
	};
	size_t i;

	for (i = 0; i < sizeof(known) / sizeof(known[0]); i++) {
		if (known[i].proto == protocol)
			return known[i].label;
	}

	return "???";
}
814
/* Netid label for a vsock socket of the given SOCK_* type, "???" if unknown. */
static const char *vsock_netid_name(int type)
{
	if (type == SOCK_STREAM)
		return "v_str";
	if (type == SOCK_DGRAM)
		return "v_dgr";

	return "???";
}
826
/* printf-style output to stdout; every print helper in this file uses it. */
static void out(const char *fmt, ...)
{
	va_list ap;

	va_start(ap, fmt);
	vprintf(fmt, ap);
	va_end(ap);
}
835
836 static void sock_state_print(struct sockstat *s)
837 {
838 const char *sock_name;
839 static const char * const sstate_name[] = {
840 "UNKNOWN",
841 [SS_ESTABLISHED] = "ESTAB",
842 [SS_SYN_SENT] = "SYN-SENT",
843 [SS_SYN_RECV] = "SYN-RECV",
844 [SS_FIN_WAIT1] = "FIN-WAIT-1",
845 [SS_FIN_WAIT2] = "FIN-WAIT-2",
846 [SS_TIME_WAIT] = "TIME-WAIT",
847 [SS_CLOSE] = "UNCONN",
848 [SS_CLOSE_WAIT] = "CLOSE-WAIT",
849 [SS_LAST_ACK] = "LAST-ACK",
850 [SS_LISTEN] = "LISTEN",
851 [SS_CLOSING] = "CLOSING",
852 };
853
854 switch (s->local.family) {
855 case AF_UNIX:
856 sock_name = unix_netid_name(s->type);
857 break;
858 case AF_INET:
859 case AF_INET6:
860 sock_name = proto_name(s->type);
861 break;
862 case AF_PACKET:
863 sock_name = s->type == SOCK_RAW ? "p_raw" : "p_dgr";
864 break;
865 case AF_NETLINK:
866 sock_name = "nl";
867 break;
868 case AF_VSOCK:
869 sock_name = vsock_netid_name(s->type);
870 break;
871 default:
872 sock_name = "unknown";
873 }
874
875 if (netid_width)
876 out("%-*s ", netid_width,
877 is_sctp_assoc(s, sock_name) ? "" : sock_name);
878 if (state_width) {
879 if (is_sctp_assoc(s, sock_name))
880 out("`- %-*s ", state_width - 3,
881 sctp_sstate_name[s->state]);
882 else
883 out("%-*s ", state_width, sstate_name[s->state]);
884 }
885
886 out("%-6d %-6d %s", s->rq, s->wq, odd_width_pad);
887 }
888
889 static void sock_details_print(struct sockstat *s)
890 {
891 if (s->uid)
892 out(" uid:%u", s->uid);
893
894 out(" ino:%u", s->ino);
895 out(" sk:%llx", s->sk);
896
897 if (s->mark)
898 out(" fwmark:0x%x", s->mark);
899 }
900
/*
 * Print "addr<delim>port " with the address right-aligned in addr_len
 * columns and the port left-aligned in port_len columns. When ifname is not
 * NULL, "%ifname" is inserted between the address and the delimiter.
 */
static void sock_addr_print_width(int addr_len, const char *addr, char *delim,
				  int port_len, const char *port, const char *ifname)
{
	if (!ifname) {
		out("%*s%s%-*s ", addr_len, addr, delim, port_len, port);
		return;
	}

	out("%*s%%%s%s%-*s ", addr_len, addr, ifname, delim,
	    port_len, port);
}
911
912 static void sock_addr_print(const char *addr, char *delim, const char *port,
913 const char *ifname)
914 {
915 sock_addr_print_width(addr_width, addr, delim, serv_width, port, ifname);
916 }
917
/*
 * Format a duration given in milliseconds as a short string.
 *
 * Precision drops as the value grows: once minutes are shown the
 * milliseconds are dropped, above 9 minutes the seconds are dropped too, and
 * above 9 seconds the milliseconds are dropped. Zero yields an empty string.
 *
 * The result lives in a static buffer that the next call overwrites.
 */
static const char *print_ms_timer(unsigned int timeout)
{
	static char buf[64];
	int total_secs = timeout / 1000;
	int msecs = timeout % 1000;
	int minutes = total_secs / 60;
	int secs = total_secs % 60;
	int off = 0;

	buf[0] = 0;

	if (minutes) {
		msecs = 0;
		if (minutes > 9)
			secs = 0;
		off += snprintf(buf, sizeof(buf)-16, "%dmin", minutes);
	}

	if (secs) {
		if (secs > 9)
			msecs = 0;
		off += sprintf(buf + off, "%d%s", secs, msecs ? "." : "sec");
	}

	if (msecs)
		sprintf(buf + off, "%03dms", msecs);

	return buf;
}
943
/* One port-to-name mapping, chained into a singly linked list. */
struct scache {
	struct scache	*next;
	int		port;
	char		*name;	/* heap copy of the name; may be NULL */
	const char	*proto;	/* one of the *_PROTO pointers, compared by address */
};

/* Services learned by init_service_resolver(). */
struct scache *rlist;
952
953 static void init_service_resolver(void)
954 {
955 char buf[128];
956 FILE *fp = popen("/usr/sbin/rpcinfo -p 2>/dev/null", "r");
957
958 if (!fp)
959 return;
960
961 if (!fgets(buf, sizeof(buf), fp)) {
962 pclose(fp);
963 return;
964 }
965 while (fgets(buf, sizeof(buf), fp) != NULL) {
966 unsigned int progn, port;
967 char proto[128], prog[128] = "rpc.";
968 struct scache *c;
969
970 if (sscanf(buf, "%u %*d %s %u %s",
971 &progn, proto, &port, prog+4) != 4)
972 continue;
973
974 if (!(c = malloc(sizeof(*c))))
975 continue;
976
977 c->port = port;
978 c->name = strdup(prog);
979 if (strcmp(proto, TCP_PROTO) == 0)
980 c->proto = TCP_PROTO;
981 else if (strcmp(proto, UDP_PROTO) == 0)
982 c->proto = UDP_PROTO;
983 else if (strcmp(proto, SCTP_PROTO) == 0)
984 c->proto = SCTP_PROTO;
985 else
986 c->proto = NULL;
987 c->next = rlist;
988 rlist = c;
989 }
990 pclose(fp);
991 }
992
/*
 * Ports in the ephemeral range are never resolved to service names: the
 * default /etc/services assigns so many irrelevant names in that range that
 * resolving them does more harm than good (think of "socks" or "cfinger"
 * showing up in a dump).
 *
 * The range is read once from the ip_local_port_range file and falls back to
 * 1024-4999 when that file cannot be read or parsed.
 *
 * Returns non-zero if port lies inside the range.
 */
static int is_ephemeral(int port)
{
	static int min = 0, max;

	if (!min) {
		FILE *f = ephemeral_ports_open();
		int parsed = f ? fscanf(f, "%d %d", &min, &max) : 0;

		if (parsed < 2) {
			min = 1024;
			max = 4999;
		}
		if (f)
			fclose(f);
	}

	return min <= port && port <= max;
}
1015
1016
1017 static const char *__resolve_service(int port)
1018 {
1019 struct scache *c;
1020
1021 for (c = rlist; c; c = c->next) {
1022 if (c->port == port && c->proto == dg_proto)
1023 return c->name;
1024 }
1025
1026 if (!is_ephemeral(port)) {
1027 static int notfirst;
1028 struct servent *se;
1029
1030 if (!notfirst) {
1031 setservent(1);
1032 notfirst = 1;
1033 }
1034 se = getservbyport(htons(port), dg_proto);
1035 if (se)
1036 return se->s_name;
1037 }
1038
1039 return NULL;
1040 }
1041
1042 #define SCACHE_BUCKETS 1024
1043 static struct scache *cache_htab[SCACHE_BUCKETS];
1044
1045 static const char *resolve_service(int port)
1046 {
1047 static char buf[128];
1048 struct scache *c;
1049 const char *res;
1050 int hash;
1051
1052 if (port == 0) {
1053 buf[0] = '*';
1054 buf[1] = 0;
1055 return buf;
1056 }
1057
1058 if (!resolve_services)
1059 goto do_numeric;
1060
1061 if (dg_proto == RAW_PROTO)
1062 return inet_proto_n2a(port, buf, sizeof(buf));
1063
1064
1065 hash = (port^(((unsigned long)dg_proto)>>2)) % SCACHE_BUCKETS;
1066
1067 for (c = cache_htab[hash]; c; c = c->next) {
1068 if (c->port == port && c->proto == dg_proto)
1069 goto do_cache;
1070 }
1071
1072 c = malloc(sizeof(*c));
1073 if (!c)
1074 goto do_numeric;
1075 res = __resolve_service(port);
1076 c->port = port;
1077 c->name = res ? strdup(res) : NULL;
1078 c->proto = dg_proto;
1079 c->next = cache_htab[hash];
1080 cache_htab[hash] = c;
1081
1082 do_cache:
1083 if (c->name)
1084 return c->name;
1085
1086 do_numeric:
1087 sprintf(buf, "%u", port);
1088 return buf;
1089 }
1090
1091 static void inet_addr_print(const inet_prefix *a, int port,
1092 unsigned int ifindex, bool v6only)
1093 {
1094 char buf[1024];
1095 const char *ap = buf;
1096 int est_len = addr_width;
1097 const char *ifname = NULL;
1098
1099 if (a->family == AF_INET) {
1100 ap = format_host(AF_INET, 4, a->data);
1101 } else {
1102 if (!v6only &&
1103 !memcmp(a->data, &in6addr_any, sizeof(in6addr_any))) {
1104 buf[0] = '*';
1105 buf[1] = 0;
1106 } else {
1107 ap = format_host(a->family, 16, a->data);
1108
1109 /* Numeric IPv6 addresses should be bracketed */
1110 if (strchr(ap, ':')) {
1111 snprintf(buf, sizeof(buf),
1112 "[%s]", ap);
1113 ap = buf;
1114 }
1115
1116 est_len = strlen(ap);
1117 if (est_len <= addr_width)
1118 est_len = addr_width;
1119 else
1120 est_len = addr_width + ((est_len-addr_width+3)/4)*4;
1121 }
1122 }
1123
1124 if (ifindex) {
1125 ifname = ll_index_to_name(ifindex);
1126 est_len -= strlen(ifname) + 1; /* +1 for percent char */
1127 if (est_len < 0)
1128 est_len = 0;
1129 }
1130
1131 sock_addr_print_width(est_len, ap, ":", serv_width, resolve_service(port),
1132 ifname);
1133 }
1134
1135 struct aafilter {
1136 inet_prefix addr;
1137 int port;
1138 unsigned int iface;
1139 __u32 mark;
1140 __u32 mask;
1141 struct aafilter *next;
1142 };
1143
1144 static int inet2_addr_match(const inet_prefix *a, const inet_prefix *p,
1145 int plen)
1146 {
1147 if (!inet_addr_match(a, p, plen))
1148 return 0;
1149
1150 /* Cursed "v4 mapped" addresses: v4 mapped socket matches
1151 * pure IPv4 rule, but v4-mapped rule selects only v4-mapped
1152 * sockets. Fair? */
1153 if (p->family == AF_INET && a->family == AF_INET6) {
1154 if (a->data[0] == 0 && a->data[1] == 0 &&
1155 a->data[2] == htonl(0xffff)) {
1156 inet_prefix tmp = *a;
1157
1158 tmp.data[0] = a->data[3];
1159 return inet_addr_match(&tmp, p, plen);
1160 }
1161 }
1162 return 1;
1163 }
1164
1165 static int unix_match(const inet_prefix *a, const inet_prefix *p)
1166 {
1167 char *addr, *pattern;
1168
1169 memcpy(&addr, a->data, sizeof(addr));
1170 memcpy(&pattern, p->data, sizeof(pattern));
1171 if (pattern == NULL)
1172 return 1;
1173 if (addr == NULL)
1174 addr = "";
1175 return !fnmatch(pattern, addr, 0);
1176 }
1177
1178 static int run_ssfilter(struct ssfilter *f, struct sockstat *s)
1179 {
1180 switch (f->type) {
1181 case SSF_S_AUTO:
1182 {
1183 if (s->local.family == AF_UNIX) {
1184 char *p;
1185
1186 memcpy(&p, s->local.data, sizeof(p));
1187 return p == NULL || (p[0] == '@' && strlen(p) == 6 &&
1188 strspn(p+1, "0123456789abcdef") == 5);
1189 }
1190 if (s->local.family == AF_PACKET)
1191 return s->lport == 0 && s->local.data[0] == 0;
1192 if (s->local.family == AF_NETLINK)
1193 return s->lport < 0;
1194 if (s->local.family == AF_VSOCK)
1195 return s->lport > 1023;
1196
1197 return is_ephemeral(s->lport);
1198 }
1199 case SSF_DCOND:
1200 {
1201 struct aafilter *a = (void *)f->pred;
1202
1203 if (a->addr.family == AF_UNIX)
1204 return unix_match(&s->remote, &a->addr);
1205 if (a->port != -1 && a->port != s->rport)
1206 return 0;
1207 if (a->addr.bitlen) {
1208 do {
1209 if (!inet2_addr_match(&s->remote, &a->addr, a->addr.bitlen))
1210 return 1;
1211 } while ((a = a->next) != NULL);
1212 return 0;
1213 }
1214 return 1;
1215 }
1216 case SSF_SCOND:
1217 {
1218 struct aafilter *a = (void *)f->pred;
1219
1220 if (a->addr.family == AF_UNIX)
1221 return unix_match(&s->local, &a->addr);
1222 if (a->port != -1 && a->port != s->lport)
1223 return 0;
1224 if (a->addr.bitlen) {
1225 do {
1226 if (!inet2_addr_match(&s->local, &a->addr, a->addr.bitlen))
1227 return 1;
1228 } while ((a = a->next) != NULL);
1229 return 0;
1230 }
1231 return 1;
1232 }
1233 case SSF_D_GE:
1234 {
1235 struct aafilter *a = (void *)f->pred;
1236
1237 return s->rport >= a->port;
1238 }
1239 case SSF_D_LE:
1240 {
1241 struct aafilter *a = (void *)f->pred;
1242
1243 return s->rport <= a->port;
1244 }
1245 case SSF_S_GE:
1246 {
1247 struct aafilter *a = (void *)f->pred;
1248
1249 return s->lport >= a->port;
1250 }
1251 case SSF_S_LE:
1252 {
1253 struct aafilter *a = (void *)f->pred;
1254
1255 return s->lport <= a->port;
1256 }
1257 case SSF_DEVCOND:
1258 {
1259 struct aafilter *a = (void *)f->pred;
1260
1261 return s->iface == a->iface;
1262 }
1263 case SSF_MARKMASK:
1264 {
1265 struct aafilter *a = (void *)f->pred;
1266
1267 return (s->mark & a->mask) == a->mark;
1268 }
1269 /* Yup. It is recursion. Sorry. */
1270 case SSF_AND:
1271 return run_ssfilter(f->pred, s) && run_ssfilter(f->post, s);
1272 case SSF_OR:
1273 return run_ssfilter(f->pred, s) || run_ssfilter(f->post, s);
1274 case SSF_NOT:
1275 return !run_ssfilter(f->pred, s);
1276 default:
1277 abort();
1278 }
1279 }
1280
1281 /* Relocate external jumps by reloc. */
1282 static void ssfilter_patch(char *a, int len, int reloc)
1283 {
1284 while (len > 0) {
1285 struct inet_diag_bc_op *op = (struct inet_diag_bc_op *)a;
1286
1287 if (op->no == len+4)
1288 op->no += reloc;
1289 len -= op->yes;
1290 a += op->yes;
1291 }
1292 if (len < 0)
1293 abort();
1294 }
1295
1296 static int ssfilter_bytecompile(struct ssfilter *f, char **bytecode)
1297 {
1298 switch (f->type) {
1299 case SSF_S_AUTO:
1300 {
1301 if (!(*bytecode = malloc(4))) abort();
1302 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_AUTO, 4, 8 };
1303 return 4;
1304 }
1305 case SSF_DCOND:
1306 case SSF_SCOND:
1307 {
1308 struct aafilter *a = (void *)f->pred;
1309 struct aafilter *b;
1310 char *ptr;
1311 int code = (f->type == SSF_DCOND ? INET_DIAG_BC_D_COND : INET_DIAG_BC_S_COND);
1312 int len = 0;
1313
1314 for (b = a; b; b = b->next) {
1315 len += 4 + sizeof(struct inet_diag_hostcond);
1316 if (a->addr.family == AF_INET6)
1317 len += 16;
1318 else
1319 len += 4;
1320 if (b->next)
1321 len += 4;
1322 }
1323 if (!(ptr = malloc(len))) abort();
1324 *bytecode = ptr;
1325 for (b = a; b; b = b->next) {
1326 struct inet_diag_bc_op *op = (struct inet_diag_bc_op *)ptr;
1327 int alen = (a->addr.family == AF_INET6 ? 16 : 4);
1328 int oplen = alen + 4 + sizeof(struct inet_diag_hostcond);
1329 struct inet_diag_hostcond *cond = (struct inet_diag_hostcond *)(ptr+4);
1330
1331 *op = (struct inet_diag_bc_op){ code, oplen, oplen+4 };
1332 cond->family = a->addr.family;
1333 cond->port = a->port;
1334 cond->prefix_len = a->addr.bitlen;
1335 memcpy(cond->addr, a->addr.data, alen);
1336 ptr += oplen;
1337 if (b->next) {
1338 op = (struct inet_diag_bc_op *)ptr;
1339 *op = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, len - (ptr-*bytecode)};
1340 ptr += 4;
1341 }
1342 }
1343 return ptr - *bytecode;
1344 }
1345 case SSF_D_GE:
1346 {
1347 struct aafilter *x = (void *)f->pred;
1348
1349 if (!(*bytecode = malloc(8))) abort();
1350 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_D_GE, 8, 12 };
1351 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1352 return 8;
1353 }
1354 case SSF_D_LE:
1355 {
1356 struct aafilter *x = (void *)f->pred;
1357
1358 if (!(*bytecode = malloc(8))) abort();
1359 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_D_LE, 8, 12 };
1360 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1361 return 8;
1362 }
1363 case SSF_S_GE:
1364 {
1365 struct aafilter *x = (void *)f->pred;
1366
1367 if (!(*bytecode = malloc(8))) abort();
1368 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_S_GE, 8, 12 };
1369 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1370 return 8;
1371 }
1372 case SSF_S_LE:
1373 {
1374 struct aafilter *x = (void *)f->pred;
1375
1376 if (!(*bytecode = malloc(8))) abort();
1377 ((struct inet_diag_bc_op *)*bytecode)[0] = (struct inet_diag_bc_op){ INET_DIAG_BC_S_LE, 8, 12 };
1378 ((struct inet_diag_bc_op *)*bytecode)[1] = (struct inet_diag_bc_op){ 0, 0, x->port };
1379 return 8;
1380 }
1381
1382 case SSF_AND:
1383 {
1384 char *a1 = NULL, *a2 = NULL, *a;
1385 int l1, l2;
1386
1387 l1 = ssfilter_bytecompile(f->pred, &a1);
1388 l2 = ssfilter_bytecompile(f->post, &a2);
1389 if (!l1 || !l2) {
1390 free(a1);
1391 free(a2);
1392 return 0;
1393 }
1394 if (!(a = malloc(l1+l2))) abort();
1395 memcpy(a, a1, l1);
1396 memcpy(a+l1, a2, l2);
1397 free(a1); free(a2);
1398 ssfilter_patch(a, l1, l2);
1399 *bytecode = a;
1400 return l1+l2;
1401 }
1402 case SSF_OR:
1403 {
1404 char *a1 = NULL, *a2 = NULL, *a;
1405 int l1, l2;
1406
1407 l1 = ssfilter_bytecompile(f->pred, &a1);
1408 l2 = ssfilter_bytecompile(f->post, &a2);
1409 if (!l1 || !l2) {
1410 free(a1);
1411 free(a2);
1412 return 0;
1413 }
1414 if (!(a = malloc(l1+l2+4))) abort();
1415 memcpy(a, a1, l1);
1416 memcpy(a+l1+4, a2, l2);
1417 free(a1); free(a2);
1418 *(struct inet_diag_bc_op *)(a+l1) = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, l2+4 };
1419 *bytecode = a;
1420 return l1+l2+4;
1421 }
1422 case SSF_NOT:
1423 {
1424 char *a1 = NULL, *a;
1425 int l1;
1426
1427 l1 = ssfilter_bytecompile(f->pred, &a1);
1428 if (!l1) {
1429 free(a1);
1430 return 0;
1431 }
1432 if (!(a = malloc(l1+4))) abort();
1433 memcpy(a, a1, l1);
1434 free(a1);
1435 *(struct inet_diag_bc_op *)(a+l1) = (struct inet_diag_bc_op){ INET_DIAG_BC_JMP, 4, 8 };
1436 *bytecode = a;
1437 return l1+4;
1438 }
1439 case SSF_DEVCOND:
1440 {
1441 /* bytecompile for SSF_DEVCOND not supported yet */
1442 return 0;
1443 }
1444 case SSF_MARKMASK:
1445 {
1446 struct aafilter *a = (void *)f->pred;
1447 struct instr {
1448 struct inet_diag_bc_op op;
1449 struct inet_diag_markcond cond;
1450 };
1451 int inslen = sizeof(struct instr);
1452
1453 if (!(*bytecode = malloc(inslen))) abort();
1454 ((struct instr *)*bytecode)[0] = (struct instr) {
1455 { INET_DIAG_BC_MARK_COND, inslen, inslen + 4 },
1456 { a->mark, a->mask},
1457 };
1458
1459 return inslen;
1460 }
1461 default:
1462 abort();
1463 }
1464 }
1465
1466 static int remember_he(struct aafilter *a, struct hostent *he)
1467 {
1468 char **ptr = he->h_addr_list;
1469 int cnt = 0;
1470 int len;
1471
1472 if (he->h_addrtype == AF_INET)
1473 len = 4;
1474 else if (he->h_addrtype == AF_INET6)
1475 len = 16;
1476 else
1477 return 0;
1478
1479 while (*ptr) {
1480 struct aafilter *b = a;
1481
1482 if (a->addr.bitlen) {
1483 if ((b = malloc(sizeof(*b))) == NULL)
1484 return cnt;
1485 *b = *a;
1486 a->next = b;
1487 }
1488 memcpy(b->addr.data, *ptr, len);
1489 b->addr.bytelen = len;
1490 b->addr.bitlen = len*8;
1491 b->addr.family = he->h_addrtype;
1492 ptr++;
1493 cnt++;
1494 }
1495 return cnt;
1496 }
1497
1498 static int get_dns_host(struct aafilter *a, const char *addr, int fam)
1499 {
1500 static int notfirst;
1501 int cnt = 0;
1502 struct hostent *he;
1503
1504 a->addr.bitlen = 0;
1505 if (!notfirst) {
1506 sethostent(1);
1507 notfirst = 1;
1508 }
1509 he = gethostbyname2(addr, fam == AF_UNSPEC ? AF_INET : fam);
1510 if (he)
1511 cnt = remember_he(a, he);
1512 if (fam == AF_UNSPEC) {
1513 he = gethostbyname2(addr, AF_INET6);
1514 if (he)
1515 cnt += remember_he(a, he);
1516 }
1517 return !cnt;
1518 }
1519
1520 static int xll_initted;
1521
1522 static void xll_init(void)
1523 {
1524 struct rtnl_handle rth;
1525
1526 if (rtnl_open(&rth, 0) < 0)
1527 exit(1);
1528
1529 ll_init_map(&rth);
1530 rtnl_close(&rth);
1531 xll_initted = 1;
1532 }
1533
1534 static const char *xll_index_to_name(int index)
1535 {
1536 if (!xll_initted)
1537 xll_init();
1538 return ll_index_to_name(index);
1539 }
1540
1541 static int xll_name_to_index(const char *dev)
1542 {
1543 if (!xll_initted)
1544 xll_init();
1545 return ll_name_to_index(dev);
1546 }
1547
1548 void *parse_devcond(char *name)
1549 {
1550 struct aafilter a = { .iface = 0 };
1551 struct aafilter *res;
1552
1553 a.iface = xll_name_to_index(name);
1554 if (a.iface == 0) {
1555 char *end;
1556 unsigned long n;
1557
1558 n = strtoul(name, &end, 0);
1559 if (!end || end == name || *end || n > UINT_MAX)
1560 return NULL;
1561
1562 a.iface = n;
1563 }
1564
1565 res = malloc(sizeof(*res));
1566 *res = a;
1567
1568 return res;
1569 }
1570
1571 static void vsock_set_inet_prefix(inet_prefix *a, __u32 cid)
1572 {
1573 *a = (inet_prefix){
1574 .bytelen = sizeof(cid),
1575 .family = AF_VSOCK,
1576 };
1577 memcpy(a->data, &cid, sizeof(cid));
1578 }
1579
1580 void *parse_hostcond(char *addr, bool is_port)
1581 {
1582 char *port = NULL;
1583 struct aafilter a = { .port = -1 };
1584 struct aafilter *res;
1585 int fam = preferred_family;
1586 struct filter *f = &current_filter;
1587
1588 if (fam == AF_UNIX || strncmp(addr, "unix:", 5) == 0) {
1589 char *p;
1590
1591 a.addr.family = AF_UNIX;
1592 if (strncmp(addr, "unix:", 5) == 0)
1593 addr += 5;
1594 p = strdup(addr);
1595 a.addr.bitlen = 8*strlen(p);
1596 memcpy(a.addr.data, &p, sizeof(p));
1597 fam = AF_UNIX;
1598 goto out;
1599 }
1600
1601 if (fam == AF_PACKET || strncmp(addr, "link:", 5) == 0) {
1602 a.addr.family = AF_PACKET;
1603 a.addr.bitlen = 0;
1604 if (strncmp(addr, "link:", 5) == 0)
1605 addr += 5;
1606 port = strchr(addr, ':');
1607 if (port) {
1608 *port = 0;
1609 if (port[1] && strcmp(port+1, "*")) {
1610 if (get_integer(&a.port, port+1, 0)) {
1611 if ((a.port = xll_name_to_index(port+1)) <= 0)
1612 return NULL;
1613 }
1614 }
1615 }
1616 if (addr[0] && strcmp(addr, "*")) {
1617 unsigned short tmp;
1618
1619 a.addr.bitlen = 32;
1620 if (ll_proto_a2n(&tmp, addr))
1621 return NULL;
1622 a.addr.data[0] = ntohs(tmp);
1623 }
1624 fam = AF_PACKET;
1625 goto out;
1626 }
1627
1628 if (fam == AF_NETLINK || strncmp(addr, "netlink:", 8) == 0) {
1629 a.addr.family = AF_NETLINK;
1630 a.addr.bitlen = 0;
1631 if (strncmp(addr, "netlink:", 8) == 0)
1632 addr += 8;
1633 port = strchr(addr, ':');
1634 if (port) {
1635 *port = 0;
1636 if (port[1] && strcmp(port+1, "*")) {
1637 if (get_integer(&a.port, port+1, 0)) {
1638 if (strcmp(port+1, "kernel") == 0)
1639 a.port = 0;
1640 else
1641 return NULL;
1642 }
1643 }
1644 }
1645 if (addr[0] && strcmp(addr, "*")) {
1646 a.addr.bitlen = 32;
1647 if (nl_proto_a2n(&a.addr.data[0], addr) == -1)
1648 return NULL;
1649 }
1650 fam = AF_NETLINK;
1651 goto out;
1652 }
1653
1654 if (fam == AF_VSOCK || strncmp(addr, "vsock:", 6) == 0) {
1655 __u32 cid = ~(__u32)0;
1656
1657 a.addr.family = AF_VSOCK;
1658 if (strncmp(addr, "vsock:", 6) == 0)
1659 addr += 6;
1660
1661 if (is_port)
1662 port = addr;
1663 else {
1664 port = strchr(addr, ':');
1665 if (port) {
1666 *port = '\0';
1667 port++;
1668 }
1669 }
1670
1671 if (port && strcmp(port, "*") &&
1672 get_u32((__u32 *)&a.port, port, 0))
1673 return NULL;
1674
1675 if (addr[0] && strcmp(addr, "*")) {
1676 a.addr.bitlen = 32;
1677 if (get_u32(&cid, addr, 0))
1678 return NULL;
1679 }
1680 vsock_set_inet_prefix(&a.addr, cid);
1681 fam = AF_VSOCK;
1682 goto out;
1683 }
1684
1685 if (fam == AF_INET || !strncmp(addr, "inet:", 5)) {
1686 fam = AF_INET;
1687 if (!strncmp(addr, "inet:", 5))
1688 addr += 5;
1689 } else if (fam == AF_INET6 || !strncmp(addr, "inet6:", 6)) {
1690 fam = AF_INET6;
1691 if (!strncmp(addr, "inet6:", 6))
1692 addr += 6;
1693 }
1694
1695 /* URL-like literal [] */
1696 if (addr[0] == '[') {
1697 addr++;
1698 if ((port = strchr(addr, ']')) == NULL)
1699 return NULL;
1700 *port++ = 0;
1701 } else if (addr[0] == '*') {
1702 port = addr+1;
1703 } else {
1704 port = strrchr(strchr(addr, '/') ? : addr, ':');
1705 }
1706
1707 if (is_port)
1708 port = addr;
1709
1710 if (port && *port) {
1711 if (*port == ':')
1712 *port++ = 0;
1713
1714 if (*port && *port != '*') {
1715 if (get_integer(&a.port, port, 0)) {
1716 struct servent *se1 = NULL;
1717 struct servent *se2 = NULL;
1718
1719 if (current_filter.dbs&(1<<UDP_DB))
1720 se1 = getservbyname(port, UDP_PROTO);
1721 if (current_filter.dbs&(1<<TCP_DB))
1722 se2 = getservbyname(port, TCP_PROTO);
1723 if (se1 && se2 && se1->s_port != se2->s_port) {
1724 fprintf(stderr, "Error: ambiguous port \"%s\".\n", port);
1725 return NULL;
1726 }
1727 if (!se1)
1728 se1 = se2;
1729 if (se1) {
1730 a.port = ntohs(se1->s_port);
1731 } else {
1732 struct scache *s;
1733
1734 for (s = rlist; s; s = s->next) {
1735 if ((s->proto == UDP_PROTO &&
1736 (current_filter.dbs&(1<<UDP_DB))) ||
1737 (s->proto == TCP_PROTO &&
1738 (current_filter.dbs&(1<<TCP_DB)))) {
1739 if (s->name && strcmp(s->name, port) == 0) {
1740 if (a.port > 0 && a.port != s->port) {
1741 fprintf(stderr, "Error: ambiguous port \"%s\".\n", port);
1742 return NULL;
1743 }
1744 a.port = s->port;
1745 }
1746 }
1747 }
1748 if (a.port <= 0) {
1749 fprintf(stderr, "Error: \"%s\" does not look like a port.\n", port);
1750 return NULL;
1751 }
1752 }
1753 }
1754 }
1755 }
1756 if (!is_port && *addr && *addr != '*') {
1757 if (get_prefix_1(&a.addr, addr, fam)) {
1758 if (get_dns_host(&a, addr, fam)) {
1759 fprintf(stderr, "Error: an inet prefix is expected rather than \"%s\".\n", addr);
1760 return NULL;
1761 }
1762 }
1763 }
1764
1765 out:
1766 if (fam != AF_UNSPEC) {
1767 int states = f->states;
1768 f->families = 0;
1769 filter_af_set(f, fam);
1770 filter_states_set(f, states);
1771 }
1772
1773 res = malloc(sizeof(*res));
1774 if (res)
1775 memcpy(res, &a, sizeof(a));
1776 return res;
1777 }
1778
1779 void *parse_markmask(const char *markmask)
1780 {
1781 struct aafilter a, *res;
1782
1783 if (strchr(markmask, '/')) {
1784 if (sscanf(markmask, "%i/%i", &a.mark, &a.mask) != 2)
1785 return NULL;
1786 } else {
1787 a.mask = 0xffffffff;
1788 if (sscanf(markmask, "%i", &a.mark) != 1)
1789 return NULL;
1790 }
1791
1792 res = malloc(sizeof(*res));
1793 if (res)
1794 memcpy(res, &a, sizeof(a));
1795 return res;
1796 }
1797
1798 static void proc_ctx_print(struct sockstat *s)
1799 {
1800 char *buf;
1801
1802 if (show_proc_ctx || show_sock_ctx) {
1803 if (find_entry(s->ino, &buf,
1804 (show_proc_ctx & show_sock_ctx) ?
1805 PROC_SOCK_CTX : PROC_CTX) > 0) {
1806 out(" users:(%s)", buf);
1807 free(buf);
1808 }
1809 } else if (show_users) {
1810 if (find_entry(s->ino, &buf, USERS) > 0) {
1811 out(" users:(%s)", buf);
1812 free(buf);
1813 }
1814 }
1815 }
1816
1817 static void inet_stats_print(struct sockstat *s, bool v6only)
1818 {
1819 sock_state_print(s);
1820
1821 inet_addr_print(&s->local, s->lport, s->iface, v6only);
1822 inet_addr_print(&s->remote, s->rport, 0, v6only);
1823
1824 proc_ctx_print(s);
1825 }
1826
1827 static int proc_parse_inet_addr(char *loc, char *rem, int family, struct
1828 sockstat * s)
1829 {
1830 s->local.family = s->remote.family = family;
1831 if (family == AF_INET) {
1832 sscanf(loc, "%x:%x", s->local.data, (unsigned *)&s->lport);
1833 sscanf(rem, "%x:%x", s->remote.data, (unsigned *)&s->rport);
1834 s->local.bytelen = s->remote.bytelen = 4;
1835 return 0;
1836 } else {
1837 sscanf(loc, "%08x%08x%08x%08x:%x",
1838 s->local.data,
1839 s->local.data + 1,
1840 s->local.data + 2,
1841 s->local.data + 3,
1842 &s->lport);
1843 sscanf(rem, "%08x%08x%08x%08x:%x",
1844 s->remote.data,
1845 s->remote.data + 1,
1846 s->remote.data + 2,
1847 s->remote.data + 3,
1848 &s->rport);
1849 s->local.bytelen = s->remote.bytelen = 16;
1850 return 0;
1851 }
1852 return -1;
1853 }
1854
/*
 * Split one record line in place into its three parts.
 *
 * The line is expected to look like
 *     "<slot>: <local>:<port4> <remote>:<port4> <rest>"
 * where each port is exactly four characters followed by one separator.
 * On success *loc and *rem point at the NUL-terminated "addr:port"
 * strings and *data at the remainder of the line.
 *
 * Returns 0 on success and -1 if a ':' is missing or the line is too
 * short to hold the expected fields (so nothing is read or written past
 * the end of the string).
 */
static int proc_inet_split_line(char *line, char **loc, char **rem, char **data)
{
	char *p;

	if ((p = strchr(line, ':')) == NULL)
		return -1;

	/* p+2 must still be inside the string. */
	if (p[1] == '\0')
		return -1;

	*loc = p+2;
	if ((p = strchr(*loc, ':')) == NULL)
		return -1;

	/* Need ':' + 4 port characters + 1 separator before the next field. */
	if (strlen(p) < 6)
		return -1;

	p[5] = 0;
	*rem = p+6;
	if ((p = strchr(*rem, ':')) == NULL)
		return -1;

	if (strlen(p) < 6)
		return -1;

	p[5] = 0;
	*data = p+6;
	return 0;
}
1875
/*
 * Format the bandwidth bw into buf using a decimal unit suffix:
 * above 1000000 as "<x.y>M", above 1000 as "<x.y>K", otherwise with %g
 * and no suffix.  buf must be large enough for the result; it is also
 * the return value.
 */
static char *sprint_bw(char *buf, double bw)
{
	if (bw > 1000000.) {
		sprintf(buf, "%.1fM", bw / 1000000.);
		return buf;
	}

	if (bw > 1000.) {
		sprintf(buf, "%.1fK", bw / 1000.);
		return buf;
	}

	sprintf(buf, "%g", bw);
	return buf;
}
1887
1888 static void sctp_stats_print(struct sctp_info *s)
1889 {
1890 if (s->sctpi_tag)
1891 out(" tag:%x", s->sctpi_tag);
1892 if (s->sctpi_state)
1893 out(" state:%s", sctp_sstate_name[s->sctpi_state]);
1894 if (s->sctpi_rwnd)
1895 out(" rwnd:%d", s->sctpi_rwnd);
1896 if (s->sctpi_unackdata)
1897 out(" unackdata:%d", s->sctpi_unackdata);
1898 if (s->sctpi_penddata)
1899 out(" penddata:%d", s->sctpi_penddata);
1900 if (s->sctpi_instrms)
1901 out(" instrms:%d", s->sctpi_instrms);
1902 if (s->sctpi_outstrms)
1903 out(" outstrms:%d", s->sctpi_outstrms);
1904 if (s->sctpi_inqueue)
1905 out(" inqueue:%d", s->sctpi_inqueue);
1906 if (s->sctpi_outqueue)
1907 out(" outqueue:%d", s->sctpi_outqueue);
1908 if (s->sctpi_overall_error)
1909 out(" overerr:%d", s->sctpi_overall_error);
1910 if (s->sctpi_max_burst)
1911 out(" maxburst:%d", s->sctpi_max_burst);
1912 if (s->sctpi_maxseg)
1913 out(" maxseg:%d", s->sctpi_maxseg);
1914 if (s->sctpi_peer_rwnd)
1915 out(" prwnd:%d", s->sctpi_peer_rwnd);
1916 if (s->sctpi_peer_tag)
1917 out(" ptag:%x", s->sctpi_peer_tag);
1918 if (s->sctpi_peer_capable)
1919 out(" pcapable:%d", s->sctpi_peer_capable);
1920 if (s->sctpi_peer_sack)
1921 out(" psack:%d", s->sctpi_peer_sack);
1922 if (s->sctpi_s_autoclose)
1923 out(" autoclose:%d", s->sctpi_s_autoclose);
1924 if (s->sctpi_s_adaptation_ind)
1925 out(" adapind:%d", s->sctpi_s_adaptation_ind);
1926 if (s->sctpi_s_pd_point)
1927 out(" pdpoint:%d", s->sctpi_s_pd_point);
1928 if (s->sctpi_s_nodelay)
1929 out(" nodealy:%d", s->sctpi_s_nodelay);
1930 if (s->sctpi_s_disable_fragments)
1931 out(" nofrag:%d", s->sctpi_s_disable_fragments);
1932 if (s->sctpi_s_v4mapped)
1933 out(" v4mapped:%d", s->sctpi_s_v4mapped);
1934 if (s->sctpi_s_frag_interleave)
1935 out(" fraginl:%d", s->sctpi_s_frag_interleave);
1936 }
1937
1938 static void tcp_stats_print(struct tcpstat *s)
1939 {
1940 char b1[64];
1941
1942 if (s->has_ts_opt)
1943 out(" ts");
1944 if (s->has_sack_opt)
1945 out(" sack");
1946 if (s->has_ecn_opt)
1947 out(" ecn");
1948 if (s->has_ecnseen_opt)
1949 out(" ecnseen");
1950 if (s->has_fastopen_opt)
1951 out(" fastopen");
1952 if (s->cong_alg[0])
1953 out(" %s", s->cong_alg);
1954 if (s->has_wscale_opt)
1955 out(" wscale:%d,%d", s->snd_wscale, s->rcv_wscale);
1956 if (s->rto)
1957 out(" rto:%g", s->rto);
1958 if (s->backoff)
1959 out(" backoff:%u", s->backoff);
1960 if (s->rtt)
1961 out(" rtt:%g/%g", s->rtt, s->rttvar);
1962 if (s->ato)
1963 out(" ato:%g", s->ato);
1964
1965 if (s->qack)
1966 out(" qack:%d", s->qack);
1967 if (s->qack & 1)
1968 out(" bidir");
1969
1970 if (s->mss)
1971 out(" mss:%d", s->mss);
1972 if (s->rcv_mss)
1973 out(" rcvmss:%d", s->rcv_mss);
1974 if (s->advmss)
1975 out(" advmss:%d", s->advmss);
1976 if (s->cwnd)
1977 out(" cwnd:%u", s->cwnd);
1978 if (s->ssthresh)
1979 out(" ssthresh:%d", s->ssthresh);
1980
1981 if (s->bytes_acked)
1982 out(" bytes_acked:%llu", s->bytes_acked);
1983 if (s->bytes_received)
1984 out(" bytes_received:%llu", s->bytes_received);
1985 if (s->segs_out)
1986 out(" segs_out:%u", s->segs_out);
1987 if (s->segs_in)
1988 out(" segs_in:%u", s->segs_in);
1989 if (s->data_segs_out)
1990 out(" data_segs_out:%u", s->data_segs_out);
1991 if (s->data_segs_in)
1992 out(" data_segs_in:%u", s->data_segs_in);
1993
1994 if (s->dctcp && s->dctcp->enabled) {
1995 struct dctcpstat *dctcp = s->dctcp;
1996
1997 out(" dctcp:(ce_state:%u,alpha:%u,ab_ecn:%u,ab_tot:%u)",
1998 dctcp->ce_state, dctcp->alpha, dctcp->ab_ecn,
1999 dctcp->ab_tot);
2000 } else if (s->dctcp) {
2001 out(" dctcp:fallback_mode");
2002 }
2003
2004 if (s->bbr_info) {
2005 __u64 bw;
2006
2007 bw = s->bbr_info->bbr_bw_hi;
2008 bw <<= 32;
2009 bw |= s->bbr_info->bbr_bw_lo;
2010
2011 out(" bbr:(bw:%sbps,mrtt:%g",
2012 sprint_bw(b1, bw * 8.0),
2013 (double)s->bbr_info->bbr_min_rtt / 1000.0);
2014 if (s->bbr_info->bbr_pacing_gain)
2015 out(",pacing_gain:%g",
2016 (double)s->bbr_info->bbr_pacing_gain / 256.0);
2017 if (s->bbr_info->bbr_cwnd_gain)
2018 out(",cwnd_gain:%g",
2019 (double)s->bbr_info->bbr_cwnd_gain / 256.0);
2020 out(")");
2021 }
2022
2023 if (s->send_bps)
2024 out(" send %sbps", sprint_bw(b1, s->send_bps));
2025 if (s->lastsnd)
2026 out(" lastsnd:%u", s->lastsnd);
2027 if (s->lastrcv)
2028 out(" lastrcv:%u", s->lastrcv);
2029 if (s->lastack)
2030 out(" lastack:%u", s->lastack);
2031
2032 if (s->pacing_rate) {
2033 out(" pacing_rate %sbps", sprint_bw(b1, s->pacing_rate));
2034 if (s->pacing_rate_max)
2035 out("/%sbps", sprint_bw(b1, s->pacing_rate_max));
2036 }
2037
2038 if (s->delivery_rate)
2039 out(" delivery_rate %sbps", sprint_bw(b1, s->delivery_rate));
2040 if (s->app_limited)
2041 out(" app_limited");
2042
2043 if (s->busy_time) {
2044 out(" busy:%llums", s->busy_time / 1000);
2045 if (s->rwnd_limited)
2046 out(" rwnd_limited:%llums(%.1f%%)",
2047 s->rwnd_limited / 1000,
2048 100.0 * s->rwnd_limited / s->busy_time);
2049 if (s->sndbuf_limited)
2050 out(" sndbuf_limited:%llums(%.1f%%)",
2051 s->sndbuf_limited / 1000,
2052 100.0 * s->sndbuf_limited / s->busy_time);
2053 }
2054
2055 if (s->unacked)
2056 out(" unacked:%u", s->unacked);
2057 if (s->retrans || s->retrans_total)
2058 out(" retrans:%u/%u", s->retrans, s->retrans_total);
2059 if (s->lost)
2060 out(" lost:%u", s->lost);
2061 if (s->sacked && s->ss.state != SS_LISTEN)
2062 out(" sacked:%u", s->sacked);
2063 if (s->fackets)
2064 out(" fackets:%u", s->fackets);
2065 if (s->reordering != 3)
2066 out(" reordering:%d", s->reordering);
2067 if (s->rcv_rtt)
2068 out(" rcv_rtt:%g", s->rcv_rtt);
2069 if (s->rcv_space)
2070 out(" rcv_space:%d", s->rcv_space);
2071 if (s->rcv_ssthresh)
2072 out(" rcv_ssthresh:%u", s->rcv_ssthresh);
2073 if (s->not_sent)
2074 out(" notsent:%u", s->not_sent);
2075 if (s->min_rtt)
2076 out(" minrtt:%g", s->min_rtt);
2077 }
2078
2079 static void tcp_timer_print(struct tcpstat *s)
2080 {
2081 static const char * const tmr_name[] = {
2082 "off",
2083 "on",
2084 "keepalive",
2085 "timewait",
2086 "persist",
2087 "unknown"
2088 };
2089
2090 if (s->timer) {
2091 if (s->timer > 4)
2092 s->timer = 5;
2093 out(" timer:(%s,%s,%d)",
2094 tmr_name[s->timer],
2095 print_ms_timer(s->timeout),
2096 s->retrans);
2097 }
2098 }
2099
2100 static void sctp_timer_print(struct tcpstat *s)
2101 {
2102 if (s->timer)
2103 out(" timer:(T3_RTX,%s,%d)",
2104 print_ms_timer(s->timeout), s->retrans);
2105 }
2106
2107 static int tcp_show_line(char *line, const struct filter *f, int family)
2108 {
2109 int rto = 0, ato = 0;
2110 struct tcpstat s = {};
2111 char *loc, *rem, *data;
2112 char opt[256];
2113 int n;
2114 int hz = get_user_hz();
2115
2116 if (proc_inet_split_line(line, &loc, &rem, &data))
2117 return -1;
2118
2119 int state = (data[1] >= 'A') ? (data[1] - 'A' + 10) : (data[1] - '0');
2120
2121 if (!(f->states & (1 << state)))
2122 return 0;
2123
2124 proc_parse_inet_addr(loc, rem, family, &s.ss);
2125
2126 if (f->f && run_ssfilter(f->f, &s.ss) == 0)
2127 return 0;
2128
2129 opt[0] = 0;
2130 n = sscanf(data, "%x %x:%x %x:%x %x %d %d %u %d %llx %d %d %d %u %d %[^\n]\n",
2131 &s.ss.state, &s.ss.wq, &s.ss.rq,
2132 &s.timer, &s.timeout, &s.retrans, &s.ss.uid, &s.probes,
2133 &s.ss.ino, &s.ss.refcnt, &s.ss.sk, &rto, &ato, &s.qack, &s.cwnd,
2134 &s.ssthresh, opt);
2135
2136 if (n < 17)
2137 opt[0] = 0;
2138
2139 if (n < 12) {
2140 rto = 0;
2141 s.cwnd = 2;
2142 s.ssthresh = -1;
2143 ato = s.qack = 0;
2144 }
2145
2146 s.retrans = s.timer != 1 ? s.probes : s.retrans;
2147 s.timeout = (s.timeout * 1000 + hz - 1) / hz;
2148 s.ato = (double)ato / hz;
2149 s.qack /= 2;
2150 s.rto = (double)rto;
2151 s.ssthresh = s.ssthresh == -1 ? 0 : s.ssthresh;
2152 s.rto = s.rto != 3 * hz ? s.rto / hz : 0;
2153 s.ss.type = IPPROTO_TCP;
2154
2155 inet_stats_print(&s.ss, false);
2156
2157 if (show_options)
2158 tcp_timer_print(&s);
2159
2160 if (show_details) {
2161 sock_details_print(&s.ss);
2162 if (opt[0])
2163 out(" opt:\"%s\"", opt);
2164 }
2165
2166 if (show_tcpinfo)
2167 tcp_stats_print(&s);
2168
2169 out("\n");
2170 return 0;
2171 }
2172
/*
 * Read fp line by line, skip the first (header) line and hand every
 * following line, with its trailing newline removed, to worker together
 * with f and fam.
 *
 * Returns 0 on end of file or as soon as worker returns a negative
 * value, and -1 on a read error.  A line that is empty or does not end
 * in '\n' (for instance one longer than the 256-byte buffer) also
 * yields -1, with errno set to EINVAL.
 */
static int generic_record_read(FILE *fp,
			       int (*worker)(char*, const struct filter *, int),
			       const struct filter *f, int fam)
{
	char line[256];

	/* skip header */
	if (fgets(line, sizeof(line), fp) == NULL)
		goto outerr;

	while (fgets(line, sizeof(line), fp) != NULL) {
		int n = strlen(line);

		if (n == 0 || line[n-1] != '\n') {
			/* errno values are positive; -EINVAL is not a valid code. */
			errno = EINVAL;
			return -1;
		}
		line[n-1] = 0;

		if (worker(line, f, fam) < 0)
			return 0;
	}
outerr:

	return ferror(fp) ? -1 : 0;
}
2199
2200 static void print_skmeminfo(struct rtattr *tb[], int attrtype)
2201 {
2202 const __u32 *skmeminfo;
2203
2204 if (!tb[attrtype]) {
2205 if (attrtype == INET_DIAG_SKMEMINFO) {
2206 if (!tb[INET_DIAG_MEMINFO])
2207 return;
2208
2209 const struct inet_diag_meminfo *minfo =
2210 RTA_DATA(tb[INET_DIAG_MEMINFO]);
2211
2212 out(" mem:(r%u,w%u,f%u,t%u)",
2213 minfo->idiag_rmem,
2214 minfo->idiag_wmem,
2215 minfo->idiag_fmem,
2216 minfo->idiag_tmem);
2217 }
2218 return;
2219 }
2220
2221 skmeminfo = RTA_DATA(tb[attrtype]);
2222
2223 out(" skmem:(r%u,rb%u,t%u,tb%u,f%u,w%u,o%u",
2224 skmeminfo[SK_MEMINFO_RMEM_ALLOC],
2225 skmeminfo[SK_MEMINFO_RCVBUF],
2226 skmeminfo[SK_MEMINFO_WMEM_ALLOC],
2227 skmeminfo[SK_MEMINFO_SNDBUF],
2228 skmeminfo[SK_MEMINFO_FWD_ALLOC],
2229 skmeminfo[SK_MEMINFO_WMEM_QUEUED],
2230 skmeminfo[SK_MEMINFO_OPTMEM]);
2231
2232 if (RTA_PAYLOAD(tb[attrtype]) >=
2233 (SK_MEMINFO_BACKLOG + 1) * sizeof(__u32))
2234 out(",bl%u", skmeminfo[SK_MEMINFO_BACKLOG]);
2235
2236 if (RTA_PAYLOAD(tb[attrtype]) >=
2237 (SK_MEMINFO_DROPS + 1) * sizeof(__u32))
2238 out(",d%u", skmeminfo[SK_MEMINFO_DROPS]);
2239
2240 out(")");
2241 }
2242
2243 static void print_md5sig(struct tcp_diag_md5sig *sig)
2244 {
2245 out("%s/%d=",
2246 format_host(sig->tcpm_family,
2247 sig->tcpm_family == AF_INET6 ? 16 : 4,
2248 &sig->tcpm_addr),
2249 sig->tcpm_prefixlen);
2250 print_escape_buf(sig->tcpm_key, sig->tcpm_keylen, " ,");
2251 }
2252
2253 #define TCPI_HAS_OPT(info, opt) !!(info->tcpi_options & (opt))
2254
2255 static void tcp_show_info(const struct nlmsghdr *nlh, struct inet_diag_msg *r,
2256 struct rtattr *tb[])
2257 {
2258 double rtt = 0;
2259 struct tcpstat s = {};
2260
2261 s.ss.state = r->idiag_state;
2262
2263 print_skmeminfo(tb, INET_DIAG_SKMEMINFO);
2264
2265 if (tb[INET_DIAG_INFO]) {
2266 struct tcp_info *info;
2267 int len = RTA_PAYLOAD(tb[INET_DIAG_INFO]);
2268
2269 /* workaround for older kernels with less fields */
2270 if (len < sizeof(*info)) {
2271 info = alloca(sizeof(*info));
2272 memcpy(info, RTA_DATA(tb[INET_DIAG_INFO]), len);
2273 memset((char *)info + len, 0, sizeof(*info) - len);
2274 } else
2275 info = RTA_DATA(tb[INET_DIAG_INFO]);
2276
2277 if (show_options) {
2278 s.has_ts_opt = TCPI_HAS_OPT(info, TCPI_OPT_TIMESTAMPS);
2279 s.has_sack_opt = TCPI_HAS_OPT(info, TCPI_OPT_SACK);
2280 s.has_ecn_opt = TCPI_HAS_OPT(info, TCPI_OPT_ECN);
2281 s.has_ecnseen_opt = TCPI_HAS_OPT(info, TCPI_OPT_ECN_SEEN);
2282 s.has_fastopen_opt = TCPI_HAS_OPT(info, TCPI_OPT_SYN_DATA);
2283 }
2284
2285 if (tb[INET_DIAG_CONG])
2286 strncpy(s.cong_alg,
2287 rta_getattr_str(tb[INET_DIAG_CONG]),
2288 sizeof(s.cong_alg) - 1);
2289
2290 if (TCPI_HAS_OPT(info, TCPI_OPT_WSCALE)) {
2291 s.has_wscale_opt = true;
2292 s.snd_wscale = info->tcpi_snd_wscale;
2293 s.rcv_wscale = info->tcpi_rcv_wscale;
2294 }
2295
2296 if (info->tcpi_rto && info->tcpi_rto != 3000000)
2297 s.rto = (double)info->tcpi_rto / 1000;
2298
2299 s.backoff = info->tcpi_backoff;
2300 s.rtt = (double)info->tcpi_rtt / 1000;
2301 s.rttvar = (double)info->tcpi_rttvar / 1000;
2302 s.ato = (double)info->tcpi_ato / 1000;
2303 s.mss = info->tcpi_snd_mss;
2304 s.rcv_mss = info->tcpi_rcv_mss;
2305 s.advmss = info->tcpi_advmss;
2306 s.rcv_space = info->tcpi_rcv_space;
2307 s.rcv_rtt = (double)info->tcpi_rcv_rtt / 1000;
2308 s.lastsnd = info->tcpi_last_data_sent;
2309 s.lastrcv = info->tcpi_last_data_recv;
2310 s.lastack = info->tcpi_last_ack_recv;
2311 s.unacked = info->tcpi_unacked;
2312 s.retrans = info->tcpi_retrans;
2313 s.retrans_total = info->tcpi_total_retrans;
2314 s.lost = info->tcpi_lost;
2315 s.sacked = info->tcpi_sacked;
2316 s.fackets = info->tcpi_fackets;
2317 s.reordering = info->tcpi_reordering;
2318 s.rcv_ssthresh = info->tcpi_rcv_ssthresh;
2319 s.cwnd = info->tcpi_snd_cwnd;
2320
2321 if (info->tcpi_snd_ssthresh < 0xFFFF)
2322 s.ssthresh = info->tcpi_snd_ssthresh;
2323
2324 rtt = (double) info->tcpi_rtt;
2325 if (tb[INET_DIAG_VEGASINFO]) {
2326 const struct tcpvegas_info *vinfo
2327 = RTA_DATA(tb[INET_DIAG_VEGASINFO]);
2328
2329 if (vinfo->tcpv_enabled &&
2330 vinfo->tcpv_rtt && vinfo->tcpv_rtt != 0x7fffffff)
2331 rtt = vinfo->tcpv_rtt;
2332 }
2333
2334 if (tb[INET_DIAG_DCTCPINFO]) {
2335 struct dctcpstat *dctcp = malloc(sizeof(struct
2336 dctcpstat));
2337
2338 const struct tcp_dctcp_info *dinfo
2339 = RTA_DATA(tb[INET_DIAG_DCTCPINFO]);
2340
2341 dctcp->enabled = !!dinfo->dctcp_enabled;
2342 dctcp->ce_state = dinfo->dctcp_ce_state;
2343 dctcp->alpha = dinfo->dctcp_alpha;
2344 dctcp->ab_ecn = dinfo->dctcp_ab_ecn;
2345 dctcp->ab_tot = dinfo->dctcp_ab_tot;
2346 s.dctcp = dctcp;
2347 }
2348
2349 if (tb[INET_DIAG_BBRINFO]) {
2350 const void *bbr_info = RTA_DATA(tb[INET_DIAG_BBRINFO]);
2351 int len = min(RTA_PAYLOAD(tb[INET_DIAG_BBRINFO]),
2352 sizeof(*s.bbr_info));
2353
2354 s.bbr_info = calloc(1, sizeof(*s.bbr_info));
2355 if (s.bbr_info && bbr_info)
2356 memcpy(s.bbr_info, bbr_info, len);
2357 }
2358
2359 if (rtt > 0 && info->tcpi_snd_mss && info->tcpi_snd_cwnd) {
2360 s.send_bps = (double) info->tcpi_snd_cwnd *
2361 (double)info->tcpi_snd_mss * 8000000. / rtt;
2362 }
2363
2364 if (info->tcpi_pacing_rate &&
2365 info->tcpi_pacing_rate != ~0ULL) {
2366 s.pacing_rate = info->tcpi_pacing_rate * 8.;
2367
2368 if (info->tcpi_max_pacing_rate &&
2369 info->tcpi_max_pacing_rate != ~0ULL)
2370 s.pacing_rate_max = info->tcpi_max_pacing_rate * 8.;
2371 }
2372 s.bytes_acked = info->tcpi_bytes_acked;
2373 s.bytes_received = info->tcpi_bytes_received;
2374 s.segs_out = info->tcpi_segs_out;
2375 s.segs_in = info->tcpi_segs_in;
2376 s.data_segs_out = info->tcpi_data_segs_out;
2377 s.data_segs_in = info->tcpi_data_segs_in;
2378 s.not_sent = info->tcpi_notsent_bytes;
2379 if (info->tcpi_min_rtt && info->tcpi_min_rtt != ~0U)
2380 s.min_rtt = (double) info->tcpi_min_rtt / 1000;
2381 s.delivery_rate = info->tcpi_delivery_rate * 8.;
2382 s.app_limited = info->tcpi_delivery_rate_app_limited;
2383 s.busy_time = info->tcpi_busy_time;
2384 s.rwnd_limited = info->tcpi_rwnd_limited;
2385 s.sndbuf_limited = info->tcpi_sndbuf_limited;
2386 tcp_stats_print(&s);
2387 free(s.dctcp);
2388 free(s.bbr_info);
2389 }
2390 if (tb[INET_DIAG_MD5SIG]) {
2391 struct tcp_diag_md5sig *sig = RTA_DATA(tb[INET_DIAG_MD5SIG]);
2392 int len = RTA_PAYLOAD(tb[INET_DIAG_MD5SIG]);
2393
2394 out(" md5keys:");
2395 print_md5sig(sig++);
2396 for (len -= sizeof(*sig); len > 0; len -= sizeof(*sig)) {
2397 out(",");
2398 print_md5sig(sig++);
2399 }
2400 }
2401 }
2402
/*
 * Format the address held in sa through format_host().  Only AF_INET
 * and AF_INET6 are handled; any other family yields an empty string.
 */
static const char *format_host_sa(struct sockaddr_storage *sa)
{
	union {
		struct sockaddr_in sin;
		struct sockaddr_in6 sin6;
	} *saddr = (void *)sa;

	if (sa->ss_family == AF_INET)
		return format_host(AF_INET, 4, &saddr->sin.sin_addr);

	if (sa->ss_family == AF_INET6)
		return format_host(AF_INET6, 16, &saddr->sin6.sin6_addr);

	return "";
}
2419
2420 static void sctp_show_info(const struct nlmsghdr *nlh, struct inet_diag_msg *r,
2421 struct rtattr *tb[])
2422 {
2423 struct sockaddr_storage *sa;
2424 int len;
2425
2426 print_skmeminfo(tb, INET_DIAG_SKMEMINFO);
2427
2428 if (tb[INET_DIAG_LOCALS]) {
2429 len = RTA_PAYLOAD(tb[INET_DIAG_LOCALS]);
2430 sa = RTA_DATA(tb[INET_DIAG_LOCALS]);
2431
2432 out("locals:%s", format_host_sa(sa));
2433 for (sa++, len -= sizeof(*sa); len > 0; sa++, len -= sizeof(*sa))
2434 out(",%s", format_host_sa(sa));
2435
2436 }
2437 if (tb[INET_DIAG_PEERS]) {
2438 len = RTA_PAYLOAD(tb[INET_DIAG_PEERS]);
2439 sa = RTA_DATA(tb[INET_DIAG_PEERS]);
2440
2441 out(" peers:%s", format_host_sa(sa));
2442 for (sa++, len -= sizeof(*sa); len > 0; sa++, len -= sizeof(*sa))
2443 out(",%s", format_host_sa(sa));
2444 }
2445 if (tb[INET_DIAG_INFO]) {
2446 struct sctp_info *info;
2447 len = RTA_PAYLOAD(tb[INET_DIAG_INFO]);
2448
2449 /* workaround for older kernels with less fields */
2450 if (len < sizeof(*info)) {
2451 info = alloca(sizeof(*info));
2452 memcpy(info, RTA_DATA(tb[INET_DIAG_INFO]), len);
2453 memset((char *)info + len, 0, sizeof(*info) - len);
2454 } else
2455 info = RTA_DATA(tb[INET_DIAG_INFO]);
2456
2457 sctp_stats_print(info);
2458 }
2459 }
2460
2461 static void parse_diag_msg(struct nlmsghdr *nlh, struct sockstat *s)
2462 {
2463 struct rtattr *tb[INET_DIAG_MAX+1];
2464 struct inet_diag_msg *r = NLMSG_DATA(nlh);
2465
2466 parse_rtattr(tb, INET_DIAG_MAX, (struct rtattr *)(r+1),
2467 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
2468
2469 s->state = r->idiag_state;
2470 s->local.family = s->remote.family = r->idiag_family;
2471 s->lport = ntohs(r->id.idiag_sport);
2472 s->rport = ntohs(r->id.idiag_dport);
2473 s->wq = r->idiag_wqueue;
2474 s->rq = r->idiag_rqueue;
2475 s->ino = r->idiag_inode;
2476 s->uid = r->idiag_uid;
2477 s->iface = r->id.idiag_if;
2478 s->sk = cookie_sk_get(&r->id.idiag_cookie[0]);
2479
2480 s->mark = 0;
2481 if (tb[INET_DIAG_MARK])
2482 s->mark = rta_getattr_u32(tb[INET_DIAG_MARK]);
2483 if (tb[INET_DIAG_PROTOCOL])
2484 s->raw_prot = rta_getattr_u8(tb[INET_DIAG_PROTOCOL]);
2485 else
2486 s->raw_prot = 0;
2487
2488 if (s->local.family == AF_INET)
2489 s->local.bytelen = s->remote.bytelen = 4;
2490 else
2491 s->local.bytelen = s->remote.bytelen = 16;
2492
2493 memcpy(s->local.data, r->id.idiag_src, s->local.bytelen);
2494 memcpy(s->remote.data, r->id.idiag_dst, s->local.bytelen);
2495 }
2496
2497 static int inet_show_sock(struct nlmsghdr *nlh,
2498 struct sockstat *s)
2499 {
2500 struct rtattr *tb[INET_DIAG_MAX+1];
2501 struct inet_diag_msg *r = NLMSG_DATA(nlh);
2502 unsigned char v6only = 0;
2503
2504 parse_rtattr(tb, INET_DIAG_MAX, (struct rtattr *)(r+1),
2505 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
2506
2507 if (tb[INET_DIAG_PROTOCOL])
2508 s->type = rta_getattr_u8(tb[INET_DIAG_PROTOCOL]);
2509
2510 if (s->local.family == AF_INET6 && tb[INET_DIAG_SKV6ONLY])
2511 v6only = rta_getattr_u8(tb[INET_DIAG_SKV6ONLY]);
2512
2513 inet_stats_print(s, v6only);
2514
2515 if (show_options) {
2516 struct tcpstat t = {};
2517
2518 t.timer = r->idiag_timer;
2519 t.timeout = r->idiag_expires;
2520 t.retrans = r->idiag_retrans;
2521 if (s->type == IPPROTO_SCTP)
2522 sctp_timer_print(&t);
2523 else
2524 tcp_timer_print(&t);
2525 }
2526
2527 if (show_details) {
2528 sock_details_print(s);
2529 if (s->local.family == AF_INET6 && tb[INET_DIAG_SKV6ONLY])
2530 out(" v6only:%u", v6only);
2531
2532 if (tb[INET_DIAG_SHUTDOWN]) {
2533 unsigned char mask;
2534
2535 mask = rta_getattr_u8(tb[INET_DIAG_SHUTDOWN]);
2536 out(" %c-%c",
2537 mask & 1 ? '-' : '<', mask & 2 ? '-' : '>');
2538 }
2539 }
2540
2541 if (show_mem || (show_tcpinfo && s->type != IPPROTO_UDP)) {
2542 out("\n\t");
2543 if (s->type == IPPROTO_SCTP)
2544 sctp_show_info(nlh, r, tb);
2545 else
2546 tcp_show_info(nlh, r, tb);
2547 }
2548 sctp_ino = s->ino;
2549
2550 out("\n");
2551 return 0;
2552 }
2553
2554 static int tcpdiag_send(int fd, int protocol, struct filter *f)
2555 {
2556 struct sockaddr_nl nladdr = { .nl_family = AF_NETLINK };
2557 struct {
2558 struct nlmsghdr nlh;
2559 struct inet_diag_req r;
2560 } req = {
2561 .nlh.nlmsg_len = sizeof(req),
2562 .nlh.nlmsg_flags = NLM_F_ROOT | NLM_F_MATCH | NLM_F_REQUEST,
2563 .nlh.nlmsg_seq = MAGIC_SEQ,
2564 .r.idiag_family = AF_INET,
2565 .r.idiag_states = f->states,
2566 };
2567 char *bc = NULL;
2568 int bclen;
2569 struct msghdr msg;
2570 struct rtattr rta;
2571 struct iovec iov[3];
2572 int iovlen = 1;
2573
2574 if (protocol == IPPROTO_UDP)
2575 return -1;
2576
2577 if (protocol == IPPROTO_TCP)
2578 req.nlh.nlmsg_type = TCPDIAG_GETSOCK;
2579 else
2580 req.nlh.nlmsg_type = DCCPDIAG_GETSOCK;
2581 if (show_mem) {
2582 req.r.idiag_ext |= (1<<(INET_DIAG_MEMINFO-1));
2583 req.r.idiag_ext |= (1<<(INET_DIAG_SKMEMINFO-1));
2584 }
2585
2586 if (show_tcpinfo) {
2587 req.r.idiag_ext |= (1<<(INET_DIAG_INFO-1));
2588 req.r.idiag_ext |= (1<<(INET_DIAG_VEGASINFO-1));
2589 req.r.idiag_ext |= (1<<(INET_DIAG_CONG-1));
2590 }
2591
2592 iov[0] = (struct iovec){
2593 .iov_base = &req,
2594 .iov_len = sizeof(req)
2595 };
2596 if (f->f) {
2597 bclen = ssfilter_bytecompile(f->f, &bc);
2598 if (bclen) {
2599 rta.rta_type = INET_DIAG_REQ_BYTECODE;
2600 rta.rta_len = RTA_LENGTH(bclen);
2601 iov[1] = (struct iovec){ &rta, sizeof(rta) };
2602 iov[2] = (struct iovec){ bc, bclen };
2603 req.nlh.nlmsg_len += RTA_LENGTH(bclen);
2604 iovlen = 3;
2605 }
2606 }
2607
2608 msg = (struct msghdr) {
2609 .msg_name = (void *)&nladdr,
2610 .msg_namelen = sizeof(nladdr),
2611 .msg_iov = iov,
2612 .msg_iovlen = iovlen,
2613 };
2614
2615 if (sendmsg(fd, &msg, 0) < 0) {
2616 close(fd);
2617 return -1;
2618 }
2619
2620 return 0;
2621 }
2622
2623 static int sockdiag_send(int family, int fd, int protocol, struct filter *f)
2624 {
2625 struct sockaddr_nl nladdr = { .nl_family = AF_NETLINK };
2626 DIAG_REQUEST(req, struct inet_diag_req_v2 r);
2627 char *bc = NULL;
2628 int bclen;
2629 struct msghdr msg;
2630 struct rtattr rta;
2631 struct iovec iov[3];
2632 int iovlen = 1;
2633
2634 if (family == PF_UNSPEC)
2635 return tcpdiag_send(fd, protocol, f);
2636
2637 memset(&req.r, 0, sizeof(req.r));
2638 req.r.sdiag_family = family;
2639 req.r.sdiag_protocol = protocol;
2640 req.r.idiag_states = f->states;
2641 if (show_mem) {
2642 req.r.idiag_ext |= (1<<(INET_DIAG_MEMINFO-1));
2643 req.r.idiag_ext |= (1<<(INET_DIAG_SKMEMINFO-1));
2644 }
2645
2646 if (show_tcpinfo) {
2647 req.r.idiag_ext |= (1<<(INET_DIAG_INFO-1));
2648 req.r.idiag_ext |= (1<<(INET_DIAG_VEGASINFO-1));
2649 req.r.idiag_ext |= (1<<(INET_DIAG_CONG-1));
2650 }
2651
2652 iov[0] = (struct iovec){
2653 .iov_base = &req,
2654 .iov_len = sizeof(req)
2655 };
2656 if (f->f) {
2657 bclen = ssfilter_bytecompile(f->f, &bc);
2658 if (bclen) {
2659 rta.rta_type = INET_DIAG_REQ_BYTECODE;
2660 rta.rta_len = RTA_LENGTH(bclen);
2661 iov[1] = (struct iovec){ &rta, sizeof(rta) };
2662 iov[2] = (struct iovec){ bc, bclen };
2663 req.nlh.nlmsg_len += RTA_LENGTH(bclen);
2664 iovlen = 3;
2665 }
2666 }
2667
2668 msg = (struct msghdr) {
2669 .msg_name = (void *)&nladdr,
2670 .msg_namelen = sizeof(nladdr),
2671 .msg_iov = iov,
2672 .msg_iovlen = iovlen,
2673 };
2674
2675 if (sendmsg(fd, &msg, 0) < 0) {
2676 close(fd);
2677 return -1;
2678 }
2679
2680 return 0;
2681 }
2682
/* Context handed to the per-socket inet dump callback. */
struct inet_diag_arg {
	struct filter *f;		/* active filter for this dump */
	int protocol;			/* protocol the dump was requested for */
	struct rtnl_handle *rth;	/* handle used to send SOCK_DESTROY; set only when killing */
};
2688
2689 static int kill_inet_sock(struct nlmsghdr *h, void *arg, struct sockstat *s)
2690 {
2691 struct inet_diag_msg *d = NLMSG_DATA(h);
2692 struct inet_diag_arg *diag_arg = arg;
2693 struct rtnl_handle *rth = diag_arg->rth;
2694
2695 DIAG_REQUEST(req, struct inet_diag_req_v2 r);
2696
2697 req.nlh.nlmsg_type = SOCK_DESTROY;
2698 req.nlh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
2699 req.nlh.nlmsg_seq = ++rth->seq;
2700 req.r.sdiag_family = d->idiag_family;
2701 req.r.sdiag_protocol = diag_arg->protocol;
2702 req.r.id = d->id;
2703
2704 if (diag_arg->protocol == IPPROTO_RAW) {
2705 struct inet_diag_req_raw *raw = (void *)&req.r;
2706
2707 BUILD_BUG_ON(sizeof(req.r) != sizeof(*raw));
2708 raw->sdiag_raw_protocol = s->raw_prot;
2709 }
2710
2711 return rtnl_talk(rth, &req.nlh, NULL);
2712 }
2713
2714 static int show_one_inet_sock(const struct sockaddr_nl *addr,
2715 struct nlmsghdr *h, void *arg)
2716 {
2717 int err;
2718 struct inet_diag_arg *diag_arg = arg;
2719 struct inet_diag_msg *r = NLMSG_DATA(h);
2720 struct sockstat s = {};
2721
2722 if (!(diag_arg->f->families & FAMILY_MASK(r->idiag_family)))
2723 return 0;
2724
2725 parse_diag_msg(h, &s);
2726 s.type = diag_arg->protocol;
2727
2728 if (diag_arg->f->f && run_ssfilter(diag_arg->f->f, &s) == 0)
2729 return 0;
2730
2731 if (diag_arg->f->kill && kill_inet_sock(h, arg, &s) != 0) {
2732 if (errno == EOPNOTSUPP || errno == ENOENT) {
2733 /* Socket can't be closed, or is already closed. */
2734 return 0;
2735 } else {
2736 perror("SOCK_DESTROY answers");
2737 return -1;
2738 }
2739 }
2740
2741 err = inet_show_sock(h, &s);
2742 if (err < 0)
2743 return err;
2744
2745 return 0;
2746 }
2747
2748 static int inet_show_netlink(struct filter *f, FILE *dump_fp, int protocol)
2749 {
2750 int err = 0;
2751 struct rtnl_handle rth, rth2;
2752 int family = PF_INET;
2753 struct inet_diag_arg arg = { .f = f, .protocol = protocol };
2754
2755 if (rtnl_open_byproto(&rth, 0, NETLINK_SOCK_DIAG))
2756 return -1;
2757
2758 if (f->kill) {
2759 if (rtnl_open_byproto(&rth2, 0, NETLINK_SOCK_DIAG)) {
2760 rtnl_close(&rth);
2761 return -1;
2762 }
2763 arg.rth = &rth2;
2764 }
2765
2766 rth.dump = MAGIC_SEQ;
2767 rth.dump_fp = dump_fp;
2768 if (preferred_family == PF_INET6)
2769 family = PF_INET6;
2770
2771 again:
2772 if ((err = sockdiag_send(family, rth.fd, protocol, f)))
2773 goto Exit;
2774
2775 if ((err = rtnl_dump_filter(&rth, show_one_inet_sock, &arg))) {
2776 if (family != PF_UNSPEC) {
2777 family = PF_UNSPEC;
2778 goto again;
2779 }
2780 goto Exit;
2781 }
2782 if (family == PF_INET && preferred_family != PF_INET) {
2783 family = PF_INET6;
2784 goto again;
2785 }
2786
2787 Exit:
2788 rtnl_close(&rth);
2789 if (arg.rth)
2790 rtnl_close(arg.rth);
2791 return err;
2792 }
2793
2794 static int tcp_show_netlink_file(struct filter *f)
2795 {
2796 FILE *fp;
2797 char buf[16384];
2798 int err = -1;
2799
2800 if ((fp = fopen(getenv("TCPDIAG_FILE"), "r")) == NULL) {
2801 perror("fopen($TCPDIAG_FILE)");
2802 return err;
2803 }
2804
2805 while (1) {
2806 int status, err2;
2807 struct nlmsghdr *h = (struct nlmsghdr *)buf;
2808 struct sockstat s = {};
2809
2810 status = fread(buf, 1, sizeof(*h), fp);
2811 if (status < 0) {
2812 perror("Reading header from $TCPDIAG_FILE");
2813 break;
2814 }
2815 if (status != sizeof(*h)) {
2816 perror("Unexpected EOF reading $TCPDIAG_FILE");
2817 break;
2818 }
2819
2820 status = fread(h+1, 1, NLMSG_ALIGN(h->nlmsg_len-sizeof(*h)), fp);
2821
2822 if (status < 0) {
2823 perror("Reading $TCPDIAG_FILE");
2824 break;
2825 }
2826 if (status + sizeof(*h) < h->nlmsg_len) {
2827 perror("Unexpected EOF reading $TCPDIAG_FILE");
2828 break;
2829 }
2830
2831 /* The only legal exit point */
2832 if (h->nlmsg_type == NLMSG_DONE) {
2833 err = 0;
2834 break;
2835 }
2836
2837 if (h->nlmsg_type == NLMSG_ERROR) {
2838 struct nlmsgerr *err = (struct nlmsgerr *)NLMSG_DATA(h);
2839
2840 if (h->nlmsg_len < NLMSG_LENGTH(sizeof(struct nlmsgerr))) {
2841 fprintf(stderr, "ERROR truncated\n");
2842 } else {
2843 errno = -err->error;
2844 perror("TCPDIAG answered");
2845 }
2846 break;
2847 }
2848
2849 parse_diag_msg(h, &s);
2850 s.type = IPPROTO_TCP;
2851
2852 if (f && f->f && run_ssfilter(f->f, &s) == 0)
2853 continue;
2854
2855 err2 = inet_show_sock(h, &s);
2856 if (err2 < 0) {
2857 err = err2;
2858 break;
2859 }
2860 }
2861
2862 fclose(fp);
2863 return err;
2864 }
2865
2866 static int tcp_show(struct filter *f)
2867 {
2868 FILE *fp = NULL;
2869 char *buf = NULL;
2870 int bufsize = 64*1024;
2871
2872 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
2873 return 0;
2874
2875 dg_proto = TCP_PROTO;
2876
2877 if (getenv("TCPDIAG_FILE"))
2878 return tcp_show_netlink_file(f);
2879
2880 if (!getenv("PROC_NET_TCP") && !getenv("PROC_ROOT")
2881 && inet_show_netlink(f, NULL, IPPROTO_TCP) == 0)
2882 return 0;
2883
2884 /* Sigh... We have to parse /proc/net/tcp... */
2885
2886
2887 /* Estimate amount of sockets and try to allocate
2888 * huge buffer to read all the table at one read.
2889 * Limit it by 16MB though. The assumption is: as soon as
2890 * kernel was able to hold information about N connections,
2891 * it is able to give us some memory for snapshot.
2892 */
2893 if (1) {
2894 get_slabstat(&slabstat);
2895
2896 int guess = slabstat.socks+slabstat.tcp_syns;
2897
2898 if (f->states&(1<<SS_TIME_WAIT))
2899 guess += slabstat.tcp_tws;
2900 if (guess > (16*1024*1024)/128)
2901 guess = (16*1024*1024)/128;
2902 guess *= 128;
2903 if (guess > bufsize)
2904 bufsize = guess;
2905 }
2906 while (bufsize >= 64*1024) {
2907 if ((buf = malloc(bufsize)) != NULL)
2908 break;
2909 bufsize /= 2;
2910 }
2911 if (buf == NULL) {
2912 errno = ENOMEM;
2913 return -1;
2914 }
2915
2916 if (f->families & FAMILY_MASK(AF_INET)) {
2917 if ((fp = net_tcp_open()) == NULL)
2918 goto outerr;
2919
2920 setbuffer(fp, buf, bufsize);
2921 if (generic_record_read(fp, tcp_show_line, f, AF_INET))
2922 goto outerr;
2923 fclose(fp);
2924 }
2925
2926 if ((f->families & FAMILY_MASK(AF_INET6)) &&
2927 (fp = net_tcp6_open()) != NULL) {
2928 setbuffer(fp, buf, bufsize);
2929 if (generic_record_read(fp, tcp_show_line, f, AF_INET6))
2930 goto outerr;
2931 fclose(fp);
2932 }
2933
2934 free(buf);
2935 return 0;
2936
2937 outerr:
2938 do {
2939 int saved_errno = errno;
2940
2941 free(buf);
2942 if (fp)
2943 fclose(fp);
2944 errno = saved_errno;
2945 return -1;
2946 } while (0);
2947 }
2948
/*
 * Show DCCP sockets via netlink when an inet family is selected and
 * neither $PROC_NET_DCCP nor $PROC_ROOT is set.  There is no other
 * source; the result of the dump is ignored and 0 is always returned.
 */
static int dccp_show(struct filter *f)
{
	bool inet_wanted = filter_af_get(f, AF_INET) ||
			   filter_af_get(f, AF_INET6);

	if (!inet_wanted)
		return 0;

	if (getenv("PROC_NET_DCCP") || getenv("PROC_ROOT"))
		return 0;

	(void)inet_show_netlink(f, NULL, IPPROTO_DCCP);
	return 0;
}
2960
/*
 * Show SCTP sockets via netlink when an inet family is selected and
 * neither $PROC_NET_SCTP nor $PROC_ROOT is set.  There is no other
 * source; the result of the dump is ignored and 0 is always returned.
 */
static int sctp_show(struct filter *f)
{
	bool inet_wanted = filter_af_get(f, AF_INET) ||
			   filter_af_get(f, AF_INET6);

	if (!inet_wanted)
		return 0;

	if (getenv("PROC_NET_SCTP") || getenv("PROC_ROOT"))
		return 0;

	(void)inet_show_netlink(f, NULL, IPPROTO_SCTP);
	return 0;
}
2972
2973 static int dgram_show_line(char *line, const struct filter *f, int family)
2974 {
2975 struct sockstat s = {};
2976 char *loc, *rem, *data;
2977 char opt[256];
2978 int n;
2979
2980 if (proc_inet_split_line(line, &loc, &rem, &data))
2981 return -1;
2982
2983 int state = (data[1] >= 'A') ? (data[1] - 'A' + 10) : (data[1] - '0');
2984
2985 if (!(f->states & (1 << state)))
2986 return 0;
2987
2988 proc_parse_inet_addr(loc, rem, family, &s);
2989
2990 if (f->f && run_ssfilter(f->f, &s) == 0)
2991 return 0;
2992
2993 opt[0] = 0;
2994 n = sscanf(data, "%x %x:%x %*x:%*x %*x %d %*d %u %d %llx %[^\n]\n",
2995 &s.state, &s.wq, &s.rq,
2996 &s.uid, &s.ino,
2997 &s.refcnt, &s.sk, opt);
2998
2999 if (n < 9)
3000 opt[0] = 0;
3001
3002 s.type = dg_proto == UDP_PROTO ? IPPROTO_UDP : 0;
3003 inet_stats_print(&s, false);
3004
3005 if (show_details && opt[0])
3006 out(" opt:\"%s\"", opt);
3007
3008 out("\n");
3009 return 0;
3010 }
3011
3012 static int udp_show(struct filter *f)
3013 {
3014 FILE *fp = NULL;
3015
3016 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
3017 return 0;
3018
3019 dg_proto = UDP_PROTO;
3020
3021 if (!getenv("PROC_NET_UDP") && !getenv("PROC_ROOT")
3022 && inet_show_netlink(f, NULL, IPPROTO_UDP) == 0)
3023 return 0;
3024
3025 if (f->families&FAMILY_MASK(AF_INET)) {
3026 if ((fp = net_udp_open()) == NULL)
3027 goto outerr;
3028 if (generic_record_read(fp, dgram_show_line, f, AF_INET))
3029 goto outerr;
3030 fclose(fp);
3031 }
3032
3033 if ((f->families&FAMILY_MASK(AF_INET6)) &&
3034 (fp = net_udp6_open()) != NULL) {
3035 if (generic_record_read(fp, dgram_show_line, f, AF_INET6))
3036 goto outerr;
3037 fclose(fp);
3038 }
3039 return 0;
3040
3041 outerr:
3042 do {
3043 int saved_errno = errno;
3044
3045 if (fp)
3046 fclose(fp);
3047 errno = saved_errno;
3048 return -1;
3049 } while (0);
3050 }
3051
3052 static int raw_show(struct filter *f)
3053 {
3054 FILE *fp = NULL;
3055
3056 if (!filter_af_get(f, AF_INET) && !filter_af_get(f, AF_INET6))
3057 return 0;
3058
3059 dg_proto = RAW_PROTO;
3060
3061 if (!getenv("PROC_NET_RAW") && !getenv("PROC_ROOT") &&
3062 inet_show_netlink(f, NULL, IPPROTO_RAW) == 0)
3063 return 0;
3064
3065 if (f->families&FAMILY_MASK(AF_INET)) {
3066 if ((fp = net_raw_open()) == NULL)
3067 goto outerr;
3068 if (generic_record_read(fp, dgram_show_line, f, AF_INET))
3069 goto outerr;
3070 fclose(fp);
3071 }
3072
3073 if ((f->families&FAMILY_MASK(AF_INET6)) &&
3074 (fp = net_raw6_open()) != NULL) {
3075 if (generic_record_read(fp, dgram_show_line, f, AF_INET6))
3076 goto outerr;
3077 fclose(fp);
3078 }
3079 return 0;
3080
3081 outerr:
3082 do {
3083 int saved_errno = errno;
3084
3085 if (fp)
3086 fclose(fp);
3087 errno = saved_errno;
3088 return -1;
3089 } while (0);
3090 }
3091
3092 #define MAX_UNIX_REMEMBER (1024*1024/sizeof(struct sockstat))
3093
3094 static void unix_list_drop_first(struct sockstat **list)
3095 {
3096 struct sockstat *s = *list;
3097
3098 (*list) = (*list)->next;
3099 free(s->name);
3100 free(s);
3101 }
3102
3103 static bool unix_type_skip(struct sockstat *s, struct filter *f)
3104 {
3105 if (s->type == SOCK_STREAM && !(f->dbs&(1<<UNIX_ST_DB)))
3106 return true;
3107 if (s->type == SOCK_DGRAM && !(f->dbs&(1<<UNIX_DG_DB)))
3108 return true;
3109 if (s->type == SOCK_SEQPACKET && !(f->dbs&(1<<UNIX_SQ_DB)))
3110 return true;
3111 return false;
3112 }
3113
3114 static void unix_stats_print(struct sockstat *s, struct filter *f)
3115 {
3116 char port_name[30] = {};
3117
3118 sock_state_print(s);
3119
3120 sock_addr_print(s->name ?: "*", " ",
3121 int_to_str(s->lport, port_name), NULL);
3122 sock_addr_print(s->peer_name ?: "*", " ",
3123 int_to_str(s->rport, port_name), NULL);
3124
3125 proc_ctx_print(s);
3126 }
3127
3128 static int unix_show_sock(const struct sockaddr_nl *addr, struct nlmsghdr *nlh,
3129 void *arg)
3130 {
3131 struct filter *f = (struct filter *)arg;
3132 struct unix_diag_msg *r = NLMSG_DATA(nlh);
3133 struct rtattr *tb[UNIX_DIAG_MAX+1];
3134 char name[128];
3135 struct sockstat stat = { .name = "*", .peer_name = "*" };
3136
3137 parse_rtattr(tb, UNIX_DIAG_MAX, (struct rtattr *)(r+1),
3138 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3139
3140 stat.type = r->udiag_type;
3141 stat.state = r->udiag_state;
3142 stat.ino = stat.lport = r->udiag_ino;
3143 stat.local.family = stat.remote.family = AF_UNIX;
3144
3145 if (unix_type_skip(&stat, f))
3146 return 0;
3147
3148 if (tb[UNIX_DIAG_RQLEN]) {
3149 struct unix_diag_rqlen *rql = RTA_DATA(tb[UNIX_DIAG_RQLEN]);
3150
3151 stat.rq = rql->udiag_rqueue;
3152 stat.wq = rql->udiag_wqueue;
3153 }
3154 if (tb[UNIX_DIAG_NAME]) {
3155 int len = RTA_PAYLOAD(tb[UNIX_DIAG_NAME]);
3156
3157 memcpy(name, RTA_DATA(tb[UNIX_DIAG_NAME]), len);
3158 name[len] = '\0';
3159 if (name[0] == '\0') {
3160 int i;
3161 for (i = 0; i < len; i++)
3162 if (name[i] == '\0')
3163 name[i] = '@';
3164 }
3165 stat.name = &name[0];
3166 memcpy(stat.local.data, &stat.name, sizeof(stat.name));
3167 }
3168 if (tb[UNIX_DIAG_PEER])
3169 stat.rport = rta_getattr_u32(tb[UNIX_DIAG_PEER]);
3170
3171 if (f->f && run_ssfilter(f->f, &stat) == 0)
3172 return 0;
3173
3174 unix_stats_print(&stat, f);
3175
3176 if (show_mem)
3177 print_skmeminfo(tb, UNIX_DIAG_MEMINFO);
3178 if (show_details) {
3179 if (tb[UNIX_DIAG_SHUTDOWN]) {
3180 unsigned char mask;
3181
3182 mask = rta_getattr_u8(tb[UNIX_DIAG_SHUTDOWN]);
3183 out(" %c-%c",
3184 mask & 1 ? '-' : '<', mask & 2 ? '-' : '>');
3185 }
3186 }
3187 out("\n");
3188
3189 return 0;
3190 }
3191
3192 static int handle_netlink_request(struct filter *f, struct nlmsghdr *req,
3193 size_t size, rtnl_filter_t show_one_sock)
3194 {
3195 int ret = -1;
3196 struct rtnl_handle rth;
3197
3198 if (rtnl_open_byproto(&rth, 0, NETLINK_SOCK_DIAG))
3199 return -1;
3200
3201 rth.dump = MAGIC_SEQ;
3202
3203 if (rtnl_send(&rth, req, size) < 0)
3204 goto Exit;
3205
3206 if (rtnl_dump_filter(&rth, show_one_sock, f))
3207 goto Exit;
3208
3209 ret = 0;
3210 Exit:
3211 rtnl_close(&rth);
3212 return ret;
3213 }
3214
3215 static int unix_show_netlink(struct filter *f)
3216 {
3217 DIAG_REQUEST(req, struct unix_diag_req r);
3218
3219 req.r.sdiag_family = AF_UNIX;
3220 req.r.udiag_states = f->states;
3221 req.r.udiag_show = UDIAG_SHOW_NAME | UDIAG_SHOW_PEER | UDIAG_SHOW_RQLEN;
3222 if (show_mem)
3223 req.r.udiag_show |= UDIAG_SHOW_MEMINFO;
3224
3225 return handle_netlink_request(f, &req.nlh, sizeof(req), unix_show_sock);
3226 }
3227
3228 static int unix_show(struct filter *f)
3229 {
3230 FILE *fp;
3231 char buf[256];
3232 char name[128];
3233 int newformat = 0;
3234 int cnt;
3235 struct sockstat *list = NULL;
3236 const int unix_state_map[] = { SS_CLOSE, SS_SYN_SENT,
3237 SS_ESTABLISHED, SS_CLOSING };
3238
3239 if (!filter_af_get(f, AF_UNIX))
3240 return 0;
3241
3242 if (!getenv("PROC_NET_UNIX") && !getenv("PROC_ROOT")
3243 && unix_show_netlink(f) == 0)
3244 return 0;
3245
3246 if ((fp = net_unix_open()) == NULL)
3247 return -1;
3248 if (!fgets(buf, sizeof(buf), fp)) {
3249 fclose(fp);
3250 return -1;
3251 }
3252
3253 if (memcmp(buf, "Peer", 4) == 0)
3254 newformat = 1;
3255 cnt = 0;
3256
3257 while (fgets(buf, sizeof(buf), fp)) {
3258 struct sockstat *u, **insp;
3259 int flags;
3260
3261 if (!(u = calloc(1, sizeof(*u))))
3262 break;
3263
3264 if (sscanf(buf, "%x: %x %x %x %x %x %d %s",
3265 &u->rport, &u->rq, &u->wq, &flags, &u->type,
3266 &u->state, &u->ino, name) < 8)
3267 name[0] = 0;
3268
3269 u->lport = u->ino;
3270 u->local.family = u->remote.family = AF_UNIX;
3271
3272 if (flags & (1 << 16)) {
3273 u->state = SS_LISTEN;
3274 } else if (u->state > 0 &&
3275 u->state <= ARRAY_SIZE(unix_state_map)) {
3276 u->state = unix_state_map[u->state-1];
3277 if (u->type == SOCK_DGRAM && u->state == SS_CLOSE && u->rport)
3278 u->state = SS_ESTABLISHED;
3279 }
3280 if (unix_type_skip(u, f) ||
3281 !(f->states & (1 << u->state))) {
3282 free(u);
3283 continue;
3284 }
3285
3286 if (!newformat) {
3287 u->rport = 0;
3288 u->rq = 0;
3289 u->wq = 0;
3290 }
3291
3292 if (name[0]) {
3293 u->name = strdup(name);
3294 if (!u->name) {
3295 free(u);
3296 break;
3297 }
3298 }
3299
3300 if (u->rport) {
3301 struct sockstat *p;
3302
3303 for (p = list; p; p = p->next) {
3304 if (u->rport == p->lport)
3305 break;
3306 }
3307 if (!p)
3308 u->peer_name = "?";
3309 else
3310 u->peer_name = p->name ? : "*";
3311 }
3312
3313 if (f->f) {
3314 struct sockstat st = {
3315 .local.family = AF_UNIX,
3316 .remote.family = AF_UNIX,
3317 };
3318
3319 memcpy(st.local.data, &u->name, sizeof(u->name));
3320 if (strcmp(u->peer_name, "*"))
3321 memcpy(st.remote.data, &u->peer_name,
3322 sizeof(u->peer_name));
3323 if (run_ssfilter(f->f, &st) == 0) {
3324 free(u->name);
3325 free(u);
3326 continue;
3327 }
3328 }
3329
3330 insp = &list;
3331 while (*insp) {
3332 if (u->type < (*insp)->type ||
3333 (u->type == (*insp)->type &&
3334 u->ino < (*insp)->ino))
3335 break;
3336 insp = &(*insp)->next;
3337 }
3338 u->next = *insp;
3339 *insp = u;
3340
3341 if (++cnt > MAX_UNIX_REMEMBER) {
3342 while (list) {
3343 unix_stats_print(list, f);
3344 out("\n");
3345
3346 unix_list_drop_first(&list);
3347 }
3348 cnt = 0;
3349 }
3350 }
3351 fclose(fp);
3352 while (list) {
3353 unix_stats_print(list, f);
3354 out("\n");
3355
3356 unix_list_drop_first(&list);
3357 }
3358
3359 return 0;
3360 }
3361
3362 static int packet_stats_print(struct sockstat *s, const struct filter *f)
3363 {
3364 const char *addr, *port;
3365 char ll_name[16];
3366
3367 s->local.family = s->remote.family = AF_PACKET;
3368
3369 if (f->f) {
3370 s->local.data[0] = s->prot;
3371 if (run_ssfilter(f->f, s) == 0)
3372 return 1;
3373 }
3374
3375 sock_state_print(s);
3376
3377 if (s->prot == 3)
3378 addr = "*";
3379 else
3380 addr = ll_proto_n2a(htons(s->prot), ll_name, sizeof(ll_name));
3381
3382 if (s->iface == 0)
3383 port = "*";
3384 else
3385 port = xll_index_to_name(s->iface);
3386
3387 sock_addr_print(addr, ":", port, NULL);
3388 sock_addr_print("", "*", "", NULL);
3389
3390 proc_ctx_print(s);
3391
3392 if (show_details)
3393 sock_details_print(s);
3394
3395 return 0;
3396 }
3397
3398 static void packet_show_ring(struct packet_diag_ring *ring)
3399 {
3400 out("blk_size:%d", ring->pdr_block_size);
3401 out(",blk_nr:%d", ring->pdr_block_nr);
3402 out(",frm_size:%d", ring->pdr_frame_size);
3403 out(",frm_nr:%d", ring->pdr_frame_nr);
3404 out(",tmo:%d", ring->pdr_retire_tmo);
3405 out(",features:0x%x", ring->pdr_features);
3406 }
3407
3408 static int packet_show_sock(const struct sockaddr_nl *addr,
3409 struct nlmsghdr *nlh, void *arg)
3410 {
3411 const struct filter *f = arg;
3412 struct packet_diag_msg *r = NLMSG_DATA(nlh);
3413 struct packet_diag_info *pinfo = NULL;
3414 struct packet_diag_ring *ring_rx = NULL, *ring_tx = NULL;
3415 struct rtattr *tb[PACKET_DIAG_MAX+1];
3416 struct sockstat stat = {};
3417 uint32_t fanout = 0;
3418 bool has_fanout = false;
3419
3420 parse_rtattr(tb, PACKET_DIAG_MAX, (struct rtattr *)(r+1),
3421 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3422
3423 /* use /proc/net/packet if all info are not available */
3424 if (!tb[PACKET_DIAG_MEMINFO])
3425 return -1;
3426
3427 stat.type = r->pdiag_type;
3428 stat.prot = r->pdiag_num;
3429 stat.ino = r->pdiag_ino;
3430 stat.state = SS_CLOSE;
3431 stat.sk = cookie_sk_get(&r->pdiag_cookie[0]);
3432
3433 if (tb[PACKET_DIAG_MEMINFO]) {
3434 __u32 *skmeminfo = RTA_DATA(tb[PACKET_DIAG_MEMINFO]);
3435
3436 stat.rq = skmeminfo[SK_MEMINFO_RMEM_ALLOC];
3437 }
3438
3439 if (tb[PACKET_DIAG_INFO]) {
3440 pinfo = RTA_DATA(tb[PACKET_DIAG_INFO]);
3441 stat.lport = stat.iface = pinfo->pdi_index;
3442 }
3443
3444 if (tb[PACKET_DIAG_UID])
3445 stat.uid = rta_getattr_u32(tb[PACKET_DIAG_UID]);
3446
3447 if (tb[PACKET_DIAG_RX_RING])
3448 ring_rx = RTA_DATA(tb[PACKET_DIAG_RX_RING]);
3449
3450 if (tb[PACKET_DIAG_TX_RING])
3451 ring_tx = RTA_DATA(tb[PACKET_DIAG_TX_RING]);
3452
3453 if (tb[PACKET_DIAG_FANOUT]) {
3454 has_fanout = true;
3455 fanout = rta_getattr_u32(tb[PACKET_DIAG_FANOUT]);
3456 }
3457
3458 if (packet_stats_print(&stat, f))
3459 return 0;
3460
3461 if (show_details) {
3462 if (pinfo) {
3463 out("\n\tver:%d", pinfo->pdi_version);
3464 out(" cpy_thresh:%d", pinfo->pdi_copy_thresh);
3465 out(" flags( ");
3466 if (pinfo->pdi_flags & PDI_RUNNING)
3467 out("running");
3468 if (pinfo->pdi_flags & PDI_AUXDATA)
3469 out(" auxdata");
3470 if (pinfo->pdi_flags & PDI_ORIGDEV)
3471 out(" origdev");
3472 if (pinfo->pdi_flags & PDI_VNETHDR)
3473 out(" vnethdr");
3474 if (pinfo->pdi_flags & PDI_LOSS)
3475 out(" loss");
3476 if (!pinfo->pdi_flags)
3477 out("0");
3478 out(" )");
3479 }
3480 if (ring_rx) {
3481 out("\n\tring_rx(");
3482 packet_show_ring(ring_rx);
3483 out(")");
3484 }
3485 if (ring_tx) {
3486 out("\n\tring_tx(");
3487 packet_show_ring(ring_tx);
3488 out(")");
3489 }
3490 if (has_fanout) {
3491 uint16_t type = (fanout >> 16) & 0xffff;
3492
3493 out("\n\tfanout(");
3494 out("id:%d,", fanout & 0xffff);
3495 out("type:");
3496
3497 if (type == 0)
3498 out("hash");
3499 else if (type == 1)
3500 out("lb");
3501 else if (type == 2)
3502 out("cpu");
3503 else if (type == 3)
3504 out("roll");
3505 else if (type == 4)
3506 out("random");
3507 else if (type == 5)
3508 out("qm");
3509 else
3510 out("0x%x", type);
3511
3512 out(")");
3513 }
3514 }
3515
3516 if (show_bpf && tb[PACKET_DIAG_FILTER]) {
3517 struct sock_filter *fil =
3518 RTA_DATA(tb[PACKET_DIAG_FILTER]);
3519 int num = RTA_PAYLOAD(tb[PACKET_DIAG_FILTER]) /
3520 sizeof(struct sock_filter);
3521
3522 out("\n\tbpf filter (%d): ", num);
3523 while (num) {
3524 out(" 0x%02x %u %u %u,",
3525 fil->code, fil->jt, fil->jf, fil->k);
3526 num--;
3527 fil++;
3528 }
3529 }
3530 out("\n");
3531 return 0;
3532 }
3533
3534 static int packet_show_netlink(struct filter *f)
3535 {
3536 DIAG_REQUEST(req, struct packet_diag_req r);
3537
3538 req.r.sdiag_family = AF_PACKET;
3539 req.r.pdiag_show = PACKET_SHOW_INFO | PACKET_SHOW_MEMINFO |
3540 PACKET_SHOW_FILTER | PACKET_SHOW_RING_CFG | PACKET_SHOW_FANOUT;
3541
3542 return handle_netlink_request(f, &req.nlh, sizeof(req), packet_show_sock);
3543 }
3544
3545 static int packet_show_line(char *buf, const struct filter *f, int fam)
3546 {
3547 unsigned long long sk;
3548 struct sockstat stat = {};
3549 int type, prot, iface, state, rq, uid, ino;
3550
3551 sscanf(buf, "%llx %*d %d %x %d %d %u %u %u",
3552 &sk,
3553 &type, &prot, &iface, &state,
3554 &rq, &uid, &ino);
3555
3556 if (stat.type == SOCK_RAW && !(f->dbs&(1<<PACKET_R_DB)))
3557 return 0;
3558 if (stat.type == SOCK_DGRAM && !(f->dbs&(1<<PACKET_DG_DB)))
3559 return 0;
3560
3561 stat.type = type;
3562 stat.prot = prot;
3563 stat.lport = stat.iface = iface;
3564 stat.state = state;
3565 stat.rq = rq;
3566 stat.uid = uid;
3567 stat.ino = ino;
3568 stat.state = SS_CLOSE;
3569
3570 if (packet_stats_print(&stat, f))
3571 return 0;
3572
3573 out("\n");
3574 return 0;
3575 }
3576
3577 static int packet_show(struct filter *f)
3578 {
3579 FILE *fp;
3580 int rc = 0;
3581
3582 if (!filter_af_get(f, AF_PACKET) || !(f->states & (1 << SS_CLOSE)))
3583 return 0;
3584
3585 if (!getenv("PROC_NET_PACKET") && !getenv("PROC_ROOT") &&
3586 packet_show_netlink(f) == 0)
3587 return 0;
3588
3589 if ((fp = net_packet_open()) == NULL)
3590 return -1;
3591 if (generic_record_read(fp, packet_show_line, f, AF_PACKET))
3592 rc = -1;
3593
3594 fclose(fp);
3595 return rc;
3596 }
3597
3598 static int netlink_show_one(struct filter *f,
3599 int prot, int pid, unsigned int groups,
3600 int state, int dst_pid, unsigned int dst_group,
3601 int rq, int wq,
3602 unsigned long long sk, unsigned long long cb)
3603 {
3604 struct sockstat st = {
3605 .state = SS_CLOSE,
3606 .rq = rq,
3607 .wq = wq,
3608 .local.family = AF_NETLINK,
3609 .remote.family = AF_NETLINK,
3610 };
3611
3612 SPRINT_BUF(prot_buf) = {};
3613 const char *prot_name;
3614 char procname[64] = {};
3615
3616 if (f->f) {
3617 st.rport = -1;
3618 st.lport = pid;
3619 st.local.data[0] = prot;
3620 if (run_ssfilter(f->f, &st) == 0)
3621 return 1;
3622 }
3623
3624 sock_state_print(&st);
3625
3626 if (resolve_services)
3627 prot_name = nl_proto_n2a(prot, prot_buf, sizeof(prot_buf));
3628 else
3629 prot_name = int_to_str(prot, prot_buf);
3630
3631 if (pid == -1) {
3632 procname[0] = '*';
3633 } else if (resolve_services) {
3634 int done = 0;
3635
3636 if (!pid) {
3637 done = 1;
3638 strncpy(procname, "kernel", 6);
3639 } else if (pid > 0) {
3640 FILE *fp;
3641
3642 snprintf(procname, sizeof(procname), "%s/%d/stat",
3643 getenv("PROC_ROOT") ? : "/proc", pid);
3644 if ((fp = fopen(procname, "r")) != NULL) {
3645 if (fscanf(fp, "%*d (%[^)])", procname) == 1) {
3646 snprintf(procname+strlen(procname),
3647 sizeof(procname)-strlen(procname),
3648 "/%d", pid);
3649 done = 1;
3650 }
3651 fclose(fp);
3652 }
3653 }
3654 if (!done)
3655 int_to_str(pid, procname);
3656 } else {
3657 int_to_str(pid, procname);
3658 }
3659
3660 sock_addr_print(prot_name, ":", procname, NULL);
3661
3662 if (state == NETLINK_CONNECTED) {
3663 char dst_group_buf[30];
3664 char dst_pid_buf[30];
3665
3666 sock_addr_print(int_to_str(dst_group, dst_group_buf), ":",
3667 int_to_str(dst_pid, dst_pid_buf), NULL);
3668 } else {
3669 sock_addr_print("", "*", "", NULL);
3670 }
3671
3672 char *pid_context = NULL;
3673
3674 if (show_proc_ctx) {
3675 /* The pid value will either be:
3676 * 0 if destination kernel - show kernel initial context.
3677 * A valid process pid - use getpidcon.
3678 * A unique value allocated by the kernel or netlink user
3679 * to the process - show context as "not available".
3680 */
3681 if (!pid)
3682 security_get_initial_context("kernel", &pid_context);
3683 else if (pid > 0)
3684 getpidcon(pid, &pid_context);
3685
3686 out(" proc_ctx=%s", pid_context ? : "unavailable");
3687 free(pid_context);
3688 }
3689
3690 if (show_details) {
3691 out(" sk=%llx cb=%llx groups=0x%08x", sk, cb, groups);
3692 }
3693 out("\n");
3694
3695 return 0;
3696 }
3697
3698 static int netlink_show_sock(const struct sockaddr_nl *addr,
3699 struct nlmsghdr *nlh, void *arg)
3700 {
3701 struct filter *f = (struct filter *)arg;
3702 struct netlink_diag_msg *r = NLMSG_DATA(nlh);
3703 struct rtattr *tb[NETLINK_DIAG_MAX+1];
3704 int rq = 0, wq = 0;
3705 unsigned long groups = 0;
3706
3707 parse_rtattr(tb, NETLINK_DIAG_MAX, (struct rtattr *)(r+1),
3708 nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*r)));
3709
3710 if (tb[NETLINK_DIAG_GROUPS] && RTA_PAYLOAD(tb[NETLINK_DIAG_GROUPS]))
3711 groups = *(unsigned long *) RTA_DATA(tb[NETLINK_DIAG_GROUPS]);
3712
3713 if (tb[NETLINK_DIAG_MEMINFO]) {
3714 const __u32 *skmeminfo;
3715
3716 skmeminfo = RTA_DATA(tb[NETLINK_DIAG_MEMINFO]);
3717
3718 rq = skmeminfo[SK_MEMINFO_RMEM_ALLOC];
3719 wq = skmeminfo[SK_MEMINFO_WMEM_ALLOC];
3720 }
3721
3722 if (netlink_show_one(f, r->ndiag_protocol, r->ndiag_portid, groups,
3723 r->ndiag_state, r->ndiag_dst_portid, r->ndiag_dst_group,
3724 rq, wq, 0, 0)) {
3725 return 0;
3726 }
3727
3728 if (show_mem) {
3729 out("\t");
3730 print_skmeminfo(tb, NETLINK_DIAG_MEMINFO);
3731 out("\n");
3732 }
3733
3734 return 0;
3735 }
3736
3737 static int netlink_show_netlink(struct filter *f)
3738 {
3739 DIAG_REQUEST(req, struct netlink_diag_req r);
3740
3741 req.r.sdiag_family = AF_NETLINK;
3742 req.r.sdiag_protocol = NDIAG_PROTO_ALL;
3743 req.r.ndiag_show = NDIAG_SHOW_GROUPS | NDIAG_SHOW_MEMINFO;
3744
3745 return handle_netlink_request(f, &req.nlh, sizeof(req), netlink_show_sock);
3746 }
3747
3748 static int netlink_show(struct filter *f)
3749 {
3750 FILE *fp;
3751 char buf[256];
3752 int prot, pid;
3753 unsigned int groups;
3754 int rq, wq, rc;
3755 unsigned long long sk, cb;
3756
3757 if (!filter_af_get(f, AF_NETLINK) || !(f->states & (1 << SS_CLOSE)))
3758 return 0;
3759
3760 if (!getenv("PROC_NET_NETLINK") && !getenv("PROC_ROOT") &&
3761 netlink_show_netlink(f) == 0)
3762 return 0;
3763
3764 if ((fp = net_netlink_open()) == NULL)
3765 return -1;
3766 if (!fgets(buf, sizeof(buf), fp)) {
3767 fclose(fp);
3768 return -1;
3769 }
3770
3771 while (fgets(buf, sizeof(buf), fp)) {
3772 sscanf(buf, "%llx %d %d %x %d %d %llx %d",
3773 &sk,
3774 &prot, &pid, &groups, &rq, &wq, &cb, &rc);
3775
3776 netlink_show_one(f, prot, pid, groups, 0, 0, 0, rq, wq, sk, cb);
3777 }
3778
3779 fclose(fp);
3780 return 0;
3781 }
3782
3783 static bool vsock_type_skip(struct sockstat *s, struct filter *f)
3784 {
3785 if (s->type == SOCK_STREAM && !(f->dbs & (1 << VSOCK_ST_DB)))
3786 return true;
3787 if (s->type == SOCK_DGRAM && !(f->dbs & (1 << VSOCK_DG_DB)))
3788 return true;
3789 return false;
3790 }
3791
3792 static void vsock_addr_print(inet_prefix *a, __u32 port)
3793 {
3794 char cid_str[sizeof("4294967295")];
3795 char port_str[sizeof("4294967295")];
3796 __u32 cid;
3797
3798 memcpy(&cid, a->data, sizeof(cid));
3799
3800 if (cid == ~(__u32)0)
3801 snprintf(cid_str, sizeof(cid_str), "*");
3802 else
3803 snprintf(cid_str, sizeof(cid_str), "%u", cid);
3804
3805 if (port == ~(__u32)0)
3806 snprintf(port_str, sizeof(port_str), "*");
3807 else
3808 snprintf(port_str, sizeof(port_str), "%u", port);
3809
3810 sock_addr_print(cid_str, ":", port_str, NULL);
3811 }
3812
3813 static void vsock_stats_print(struct sockstat *s, struct filter *f)
3814 {
3815 sock_state_print(s);
3816
3817 vsock_addr_print(&s->local, s->lport);
3818 vsock_addr_print(&s->remote, s->rport);
3819
3820 proc_ctx_print(s);
3821
3822 out("\n");
3823 }
3824
3825 static int vsock_show_sock(const struct sockaddr_nl *addr,
3826 struct nlmsghdr *nlh, void *arg)
3827 {
3828 struct filter *f = (struct filter *)arg;
3829 struct vsock_diag_msg *r = NLMSG_DATA(nlh);
3830 struct sockstat stat = {
3831 .type = r->vdiag_type,
3832 .lport = r->vdiag_src_port,
3833 .rport = r->vdiag_dst_port,
3834 .state = r->vdiag_state,
3835 .ino = r->vdiag_ino,
3836 };
3837
3838 vsock_set_inet_prefix(&stat.local, r->vdiag_src_cid);
3839 vsock_set_inet_prefix(&stat.remote, r->vdiag_dst_cid);
3840
3841 if (vsock_type_skip(&stat, f))
3842 return 0;
3843
3844 if (f->f && run_ssfilter(f->f, &stat) == 0)
3845 return 0;
3846
3847 vsock_stats_print(&stat, f);
3848
3849 return 0;
3850 }
3851
3852 static int vsock_show(struct filter *f)
3853 {
3854 DIAG_REQUEST(req, struct vsock_diag_req r);
3855
3856 if (!filter_af_get(f, AF_VSOCK))
3857 return 0;
3858
3859 req.r.sdiag_family = AF_VSOCK;
3860 req.r.vdiag_states = f->states;
3861
3862 return handle_netlink_request(f, &req.nlh, sizeof(req), vsock_show_sock);
3863 }
3864
3865 struct sock_diag_msg {
3866 __u8 sdiag_family;
3867 };
3868
3869 static int generic_show_sock(const struct sockaddr_nl *addr,
3870 struct nlmsghdr *nlh, void *arg)
3871 {
3872 struct sock_diag_msg *r = NLMSG_DATA(nlh);
3873 struct inet_diag_arg inet_arg = { .f = arg, .protocol = IPPROTO_MAX };
3874
3875 switch (r->sdiag_family) {
3876 case AF_INET:
3877 case AF_INET6:
3878 return show_one_inet_sock(addr, nlh, &inet_arg);
3879 case AF_UNIX:
3880 return unix_show_sock(addr, nlh, arg);
3881 case AF_PACKET:
3882 return packet_show_sock(addr, nlh, arg);
3883 case AF_NETLINK:
3884 return netlink_show_sock(addr, nlh, arg);
3885 case AF_VSOCK:
3886 return vsock_show_sock(addr, nlh, arg);
3887 default:
3888 return -1;
3889 }
3890 }
3891
3892 static int handle_follow_request(struct filter *f)
3893 {
3894 int ret = 0;
3895 int groups = 0;
3896 struct rtnl_handle rth;
3897
3898 if (f->families & FAMILY_MASK(AF_INET) && f->dbs & (1 << TCP_DB))
3899 groups |= 1 << (SKNLGRP_INET_TCP_DESTROY - 1);
3900 if (f->families & FAMILY_MASK(AF_INET) && f->dbs & (1 << UDP_DB))
3901 groups |= 1 << (SKNLGRP_INET_UDP_DESTROY - 1);
3902 if (f->families & FAMILY_MASK(AF_INET6) && f->dbs & (1 << TCP_DB))
3903 groups |= 1 << (SKNLGRP_INET6_TCP_DESTROY - 1);
3904 if (f->families & FAMILY_MASK(AF_INET6) && f->dbs & (1 << UDP_DB))
3905 groups |= 1 << (SKNLGRP_INET6_UDP_DESTROY - 1);
3906
3907 if (groups == 0)
3908 return -1;
3909
3910 if (rtnl_open_byproto(&rth, groups, NETLINK_SOCK_DIAG))
3911 return -1;
3912
3913 rth.dump = 0;
3914 rth.local.nl_pid = 0;
3915
3916 if (rtnl_dump_filter(&rth, generic_show_sock, f))
3917 ret = -1;
3918
3919 rtnl_close(&rth);
3920 return ret;
3921 }
3922
/*
 * Look up one integer counter in the table returned by net_snmp_open().
 *
 * The table is read as pairs of lines that both start with the same
 * prefix: a header line naming the columns and a value line holding the
 * numbers.  proto is the line prefix to look for (e.g. "Tcp:"), key the
 * column name.
 *
 * On success the value is stored in *result and 0 is returned.  On failure
 * *result is 0 and -1 is returned; errno is ESRCH when the table could be
 * read but did not contain the requested counter.
 */
static int get_snmp_int(char *proto, char *key, int *result)
{
	char buf[1024];
	FILE *fp;
	size_t protolen = strlen(proto);
	size_t keylen = strlen(key);

	*result = 0;

	fp = net_snmp_open();
	if (fp == NULL)
		return -1;

	while (fgets(buf, sizeof(buf), fp) != NULL) {
		char *p = buf;
		int pos = 0;
		bool found = false;

		/* strncmp never compares past the end of a short line */
		if (strncmp(buf, proto, protolen))
			continue;

		/* Header line: find the 1-based column index of key. */
		while ((p = strchr(p, ' ')) != NULL) {
			pos++;
			p++;
			if (strncmp(p, key, keylen) == 0 &&
			    (p[keylen] == ' ' || p[keylen] == '\n')) {
				found = true;
				break;
			}
		}
		/*
		 * Without this check pos would equal the number of columns
		 * and the last value of the line would be returned for an
		 * unknown key.
		 */
		if (!found)
			break;

		/* Value line: must follow directly and carry the same prefix. */
		if (fgets(buf, sizeof(buf), fp) == NULL)
			break;
		if (strncmp(buf, proto, protolen))
			break;

		p = buf;
		while ((p = strchr(p, ' ')) != NULL) {
			p++;
			if (--pos != 0)
				continue;
			if (sscanf(p, "%d", result) != 1)
				break;
			fclose(fp);
			return 0;
		}
		/* Column missing or not numeric on the value line. */
		break;
	}

	fclose(fp);
	errno = ESRCH;
	return -1;
}
3967
3968
3969 /* Get stats from sockstat */
3970
/*
 * Counters collected by get_sockstat_line().  Each comment names the line
 * identifier and the position of the value on that line.
 */
struct ssummary {
	int socks;		/* "sockets:" 1st value */
	int tcp_mem;		/* "TCP:" 5th value */
	int tcp_total;		/* "TCP:" 4th value */
	int tcp_orphans;	/* "TCP:" 2nd value */
	int tcp_tws;		/* "TCP:" 3rd value */
	int tcp4_hashed;	/* "TCP:" 1st value */
	int udp4;		/* "UDP:" 1st value */
	int raw4;		/* "RAW:" 1st value */
	int frag4;		/* "FRAG:" 1st value */
	int frag4_mem;		/* "FRAG:" 2nd value */
	int tcp6_hashed;	/* "TCP6:" 1st value */
	int udp6;		/* "UDP6:" 1st value */
	int raw6;		/* "RAW6:" 1st value */
	int frag6;		/* "FRAG6:" 1st value */
	int frag6_mem;		/* "FRAG6:" 2nd value */
};

/*
 * Parse one "ID: name value [name value ...]" line and store the values of
 * a recognized ID into *s.  Lines that are malformed or carry an unknown ID
 * leave *s untouched.
 */
static void get_sockstat_line(char *line, struct ssummary *s)
{
	char id[256], rem[256];

	/*
	 * The field widths keep both conversions inside their buffers
	 * whatever the length of the line handed in.
	 */
	if (sscanf(line, "%255[^ ] %255[^\n]\n", id, rem) != 2)
		return;

	/* "%*s" skips the name in front of each value */
	if (strcmp(id, "sockets:") == 0)
		sscanf(rem, "%*s%d", &s->socks);
	else if (strcmp(id, "UDP:") == 0)
		sscanf(rem, "%*s%d", &s->udp4);
	else if (strcmp(id, "UDP6:") == 0)
		sscanf(rem, "%*s%d", &s->udp6);
	else if (strcmp(id, "RAW:") == 0)
		sscanf(rem, "%*s%d", &s->raw4);
	else if (strcmp(id, "RAW6:") == 0)
		sscanf(rem, "%*s%d", &s->raw6);
	else if (strcmp(id, "TCP6:") == 0)
		sscanf(rem, "%*s%d", &s->tcp6_hashed);
	else if (strcmp(id, "FRAG:") == 0)
		sscanf(rem, "%*s%d%*s%d", &s->frag4, &s->frag4_mem);
	else if (strcmp(id, "FRAG6:") == 0)
		sscanf(rem, "%*s%d%*s%d", &s->frag6, &s->frag6_mem);
	else if (strcmp(id, "TCP:") == 0)
		sscanf(rem, "%*s%d%*s%d%*s%d%*s%d%*s%d",
		       &s->tcp4_hashed,
		       &s->tcp_orphans, &s->tcp_tws, &s->tcp_total, &s->tcp_mem);
}
4017
4018 static int get_sockstat(struct ssummary *s)
4019 {
4020 char buf[256];
4021 FILE *fp;
4022
4023 memset(s, 0, sizeof(*s));
4024
4025 if ((fp = net_sockstat_open()) == NULL)
4026 return -1;
4027 while (fgets(buf, sizeof(buf), fp) != NULL)
4028 get_sockstat_line(buf, s);
4029 fclose(fp);
4030
4031 if ((fp = net_sockstat6_open()) == NULL)
4032 return 0;
4033 while (fgets(buf, sizeof(buf), fp) != NULL)
4034 get_sockstat_line(buf, s);
4035 fclose(fp);
4036
4037 return 0;
4038 }
4039
4040 static int print_summary(void)
4041 {
4042 struct ssummary s;
4043 int tcp_estab;
4044
4045 if (get_sockstat(&s) < 0)
4046 perror("ss: get_sockstat");
4047 if (get_snmp_int("Tcp:", "CurrEstab", &tcp_estab) < 0)
4048 perror("ss: get_snmpstat");
4049
4050 get_slabstat(&slabstat);
4051
4052 printf("Total: %d (kernel %d)\n", s.socks, slabstat.socks);
4053
4054 printf("TCP: %d (estab %d, closed %d, orphaned %d, synrecv %d, timewait %d/%d), ports %d\n",
4055 s.tcp_total + slabstat.tcp_syns + s.tcp_tws,
4056 tcp_estab,
4057 s.tcp_total - (s.tcp4_hashed+s.tcp6_hashed-s.tcp_tws),
4058 s.tcp_orphans,
4059 slabstat.tcp_syns,
4060 s.tcp_tws, slabstat.tcp_tws,
4061 slabstat.tcp_ports
4062 );
4063
4064 printf("\n");
4065 printf("Transport Total IP IPv6\n");
4066 printf("* %-9d %-9s %-9s\n", slabstat.socks, "-", "-");
4067 printf("RAW %-9d %-9d %-9d\n", s.raw4+s.raw6, s.raw4, s.raw6);
4068 printf("UDP %-9d %-9d %-9d\n", s.udp4+s.udp6, s.udp4, s.udp6);
4069 printf("TCP %-9d %-9d %-9d\n", s.tcp4_hashed+s.tcp6_hashed, s.tcp4_hashed, s.tcp6_hashed);
4070 printf("INET %-9d %-9d %-9d\n",
4071 s.raw4+s.udp4+s.tcp4_hashed+
4072 s.raw6+s.udp6+s.tcp6_hashed,
4073 s.raw4+s.udp4+s.tcp4_hashed,
4074 s.raw6+s.udp6+s.tcp6_hashed);
4075 printf("FRAG %-9d %-9d %-9d\n", s.frag4+s.frag6, s.frag4, s.frag6);
4076
4077 printf("\n");
4078
4079 return 0;
4080 }
4081
/*
 * Write the complete option and filter syntax summary to dest.
 * Shared by help() (stdout) and usage() (stderr).
 */
static void _usage(FILE *dest)
{
	static const char text[] =
"Usage: ss [ OPTIONS ]\n"
" ss [ OPTIONS ] [ FILTER ]\n"
" -h, --help this message\n"
" -V, --version output version information\n"
" -n, --numeric don't resolve service names\n"
" -r, --resolve resolve host names\n"
" -a, --all display all sockets\n"
" -l, --listening display listening sockets\n"
" -o, --options show timer information\n"
" -e, --extended show detailed socket information\n"
" -m, --memory show socket memory usage\n"
" -p, --processes show process using socket\n"
" -i, --info show internal TCP information\n"
" -s, --summary show socket usage summary\n"
" -b, --bpf show bpf filter socket information\n"
" -E, --events continually display sockets as they are destroyed\n"
" -Z, --context display process SELinux security contexts\n"
" -z, --contexts display process and socket SELinux security contexts\n"
" -N, --net switch to the specified network namespace name\n"
"\n"
" -4, --ipv4 display only IP version 4 sockets\n"
" -6, --ipv6 display only IP version 6 sockets\n"
" -0, --packet display PACKET sockets\n"
" -t, --tcp display only TCP sockets\n"
" -S, --sctp display only SCTP sockets\n"
" -u, --udp display only UDP sockets\n"
" -d, --dccp display only DCCP sockets\n"
" -w, --raw display only RAW sockets\n"
" -x, --unix display only Unix domain sockets\n"
" --vsock display only vsock sockets\n"
" -f, --family=FAMILY display sockets of type FAMILY\n"
" FAMILY := {inet|inet6|link|unix|netlink|vsock|help}\n"
"\n"
" -K, --kill forcibly close sockets, display what was closed\n"
" -H, --no-header Suppress header line\n"
"\n"
" -A, --query=QUERY, --socket=QUERY\n"
" QUERY := {all|inet|tcp|udp|raw|unix|unix_dgram|unix_stream|unix_seqpacket|packet|netlink|vsock_stream|vsock_dgram}[,QUERY]\n"
"\n"
" -D, --diag=FILE Dump raw information about TCP sockets to FILE\n"
" -F, --filter=FILE read filter information from FILE\n"
" FILTER := [ state STATE-FILTER ] [ EXPRESSION ]\n"
" STATE-FILTER := {all|connected|synchronized|bucket|big|TCP-STATES}\n"
" TCP-STATES := {established|syn-sent|syn-recv|fin-wait-{1,2}|time-wait|closed|close-wait|last-ack|listening|closing}\n"
" connected := {established|syn-sent|syn-recv|fin-wait-{1,2}|time-wait|close-wait|last-ack|closing}\n"
" synchronized := {established|syn-recv|fin-wait-{1,2}|time-wait|close-wait|last-ack|closing}\n"
" bucket := {syn-recv|time-wait}\n"
" big := {established|syn-sent|fin-wait-{1,2}|closed|close-wait|last-ack|listening|closing}\n";

	/* the text holds no conversion specifications, so emit it verbatim */
	fputs(text, dest);
}
4135
/* Print the usage text on stdout and terminate with exit status 0. */
static void __attribute__((noreturn)) help(void)
{
	_usage(stdout);
	exit(0);
}
4142
/* Print the usage text on stderr and terminate via exit(-1). */
static void __attribute__((noreturn)) usage(void)
{
	_usage(stderr);
	exit(-1);
}
4149
4150
4151 static int scan_state(const char *state)
4152 {
4153 static const char * const sstate_namel[] = {
4154 "UNKNOWN",
4155 [SS_ESTABLISHED] = "established",
4156 [SS_SYN_SENT] = "syn-sent",
4157 [SS_SYN_RECV] = "syn-recv",
4158 [SS_FIN_WAIT1] = "fin-wait-1",
4159 [SS_FIN_WAIT2] = "fin-wait-2",
4160 [SS_TIME_WAIT] = "time-wait",
4161 [SS_CLOSE] = "unconnected",
4162 [SS_CLOSE_WAIT] = "close-wait",
4163 [SS_LAST_ACK] = "last-ack",
4164 [SS_LISTEN] = "listening",
4165 [SS_CLOSING] = "closing",
4166 };
4167 int i;
4168
4169 if (strcasecmp(state, "close") == 0 ||
4170 strcasecmp(state, "closed") == 0)
4171 return (1<<SS_CLOSE);
4172 if (strcasecmp(state, "syn-rcv") == 0)
4173 return (1<<SS_SYN_RECV);
4174 if (strcasecmp(state, "established") == 0)
4175 return (1<<SS_ESTABLISHED);
4176 if (strcasecmp(state, "all") == 0)
4177 return SS_ALL;
4178 if (strcasecmp(state, "connected") == 0)
4179 return SS_ALL & ~((1<<SS_CLOSE)|(1<<SS_LISTEN));
4180 if (strcasecmp(state, "synchronized") == 0)
4181 return SS_ALL & ~((1<<SS_CLOSE)|(1<<SS_LISTEN)|(1<<SS_SYN_SENT));
4182 if (strcasecmp(state, "bucket") == 0)
4183 return (1<<SS_SYN_RECV)|(1<<SS_TIME_WAIT);
4184 if (strcasecmp(state, "big") == 0)
4185 return SS_ALL & ~((1<<SS_SYN_RECV)|(1<<SS_TIME_WAIT));
4186 for (i = 0; i < SS_MAX; i++) {
4187 if (strcasecmp(state, sstate_namel[i]) == 0)
4188 return (1<<i);
4189 }
4190
4191 fprintf(stderr, "ss: wrong state name: %s\n", state);
4192 exit(-1);
4193 }
4194
/*
 * --vsock has no short option: 'v' and 'V' are already taken, so it is
 * identified by a value outside the character range.
 */
#define OPT_VSOCK 256

/* Long options accepted by main(); val is the code returned by getopt_long(). */
static const struct option long_opts[] = {
	{ "numeric",	no_argument,		NULL, 'n' },
	{ "resolve",	no_argument,		NULL, 'r' },
	{ "options",	no_argument,		NULL, 'o' },
	{ "extended",	no_argument,		NULL, 'e' },
	{ "memory",	no_argument,		NULL, 'm' },
	{ "info",	no_argument,		NULL, 'i' },
	{ "processes",	no_argument,		NULL, 'p' },
	{ "bpf",	no_argument,		NULL, 'b' },
	{ "events",	no_argument,		NULL, 'E' },
	{ "dccp",	no_argument,		NULL, 'd' },
	{ "tcp",	no_argument,		NULL, 't' },
	{ "sctp",	no_argument,		NULL, 'S' },
	{ "udp",	no_argument,		NULL, 'u' },
	{ "raw",	no_argument,		NULL, 'w' },
	{ "unix",	no_argument,		NULL, 'x' },
	{ "vsock",	no_argument,		NULL, OPT_VSOCK },
	{ "all",	no_argument,		NULL, 'a' },
	{ "listening",	no_argument,		NULL, 'l' },
	{ "ipv4",	no_argument,		NULL, '4' },
	{ "ipv6",	no_argument,		NULL, '6' },
	{ "packet",	no_argument,		NULL, '0' },
	{ "family",	required_argument,	NULL, 'f' },
	{ "socket",	required_argument,	NULL, 'A' },
	{ "query",	required_argument,	NULL, 'A' },
	{ "summary",	no_argument,		NULL, 's' },
	{ "diag",	required_argument,	NULL, 'D' },
	{ "filter",	required_argument,	NULL, 'F' },
	{ "version",	no_argument,		NULL, 'V' },
	{ "help",	no_argument,		NULL, 'h' },
	{ "context",	no_argument,		NULL, 'Z' },
	{ "contexts",	no_argument,		NULL, 'z' },
	{ "net",	required_argument,	NULL, 'N' },
	{ "kill",	no_argument,		NULL, 'K' },
	{ "no-header",	no_argument,		NULL, 'H' },
	{ NULL, 0, NULL, 0 }	/* terminator */
};
4236
4237 int main(int argc, char *argv[])
4238 {
4239 int saw_states = 0;
4240 int saw_query = 0;
4241 int do_summary = 0;
4242 const char *dump_tcpdiag = NULL;
4243 FILE *filter_fp = NULL;
4244 int ch;
4245 int state_filter = 0;
4246 int addrp_width, screen_width = 80;
4247
4248 while ((ch = getopt_long(argc, argv,
4249 "dhaletuwxnro460spbEf:miA:D:F:vVzZN:KHS",
4250 long_opts, NULL)) != EOF) {
4251 switch (ch) {
4252 case 'n':
4253 resolve_services = 0;
4254 break;
4255 case 'r':
4256 resolve_hosts = 1;
4257 break;
4258 case 'o':
4259 show_options = 1;
4260 break;
4261 case 'e':
4262 show_options = 1;
4263 show_details++;
4264 break;
4265 case 'm':
4266 show_mem = 1;
4267 break;
4268 case 'i':
4269 show_tcpinfo = 1;
4270 break;
4271 case 'p':
4272 show_users++;
4273 user_ent_hash_build();
4274 break;
4275 case 'b':
4276 show_options = 1;
4277 show_bpf++;
4278 break;
4279 case 'E':
4280 follow_events = 1;
4281 break;
4282 case 'd':
4283 filter_db_set(&current_filter, DCCP_DB);
4284 break;
4285 case 't':
4286 filter_db_set(&current_filter, TCP_DB);
4287 break;
4288 case 'S':
4289 filter_db_set(&current_filter, SCTP_DB);
4290 break;
4291 case 'u':
4292 filter_db_set(&current_filter, UDP_DB);
4293 break;
4294 case 'w':
4295 filter_db_set(&current_filter, RAW_DB);
4296 break;
4297 case 'x':
4298 filter_af_set(&current_filter, AF_UNIX);
4299 break;
4300 case OPT_VSOCK:
4301 filter_af_set(&current_filter, AF_VSOCK);
4302 break;
4303 case 'a':
4304 state_filter = SS_ALL;
4305 break;
4306 case 'l':
4307 state_filter = (1 << SS_LISTEN) | (1 << SS_CLOSE);
4308 break;
4309 case '4':
4310 filter_af_set(&current_filter, AF_INET);
4311 break;
4312 case '6':
4313 filter_af_set(&current_filter, AF_INET6);
4314 break;
4315 case '0':
4316 filter_af_set(&current_filter, AF_PACKET);
4317 break;
4318 case 'f':
4319 if (strcmp(optarg, "inet") == 0)
4320 filter_af_set(&current_filter, AF_INET);
4321 else if (strcmp(optarg, "inet6") == 0)
4322 filter_af_set(&current_filter, AF_INET6);
4323 else if (strcmp(optarg, "link") == 0)
4324 filter_af_set(&current_filter, AF_PACKET);
4325 else if (strcmp(optarg, "unix") == 0)
4326 filter_af_set(&current_filter, AF_UNIX);
4327 else if (strcmp(optarg, "netlink") == 0)
4328 filter_af_set(&current_filter, AF_NETLINK);
4329 else if (strcmp(optarg, "vsock") == 0)
4330 filter_af_set(&current_filter, AF_VSOCK);
4331 else if (strcmp(optarg, "help") == 0)
4332 help();
4333 else {
4334 fprintf(stderr, "ss: \"%s\" is invalid family\n",
4335 optarg);
4336 usage();
4337 }
4338 break;
4339 case 'A':
4340 {
4341 char *p, *p1;
4342
4343 if (!saw_query) {
4344 current_filter.dbs = 0;
4345 state_filter = state_filter ?
4346 state_filter : SS_CONN;
4347 saw_query = 1;
4348 do_default = 0;
4349 }
4350 p = p1 = optarg;
4351 do {
4352 if ((p1 = strchr(p, ',')) != NULL)
4353 *p1 = 0;
4354 if (strcmp(p, "all") == 0) {
4355 filter_default_dbs(&current_filter);
4356 } else if (strcmp(p, "inet") == 0) {
4357 filter_db_set(&current_filter, UDP_DB);
4358 filter_db_set(&current_filter, DCCP_DB);
4359 filter_db_set(&current_filter, TCP_DB);
4360 filter_db_set(&current_filter, SCTP_DB);
4361 filter_db_set(&current_filter, RAW_DB);
4362 } else if (strcmp(p, "udp") == 0) {
4363 filter_db_set(&current_filter, UDP_DB);
4364 } else if (strcmp(p, "dccp") == 0) {
4365 filter_db_set(&current_filter, DCCP_DB);
4366 } else if (strcmp(p, "tcp") == 0) {
4367 filter_db_set(&current_filter, TCP_DB);
4368 } else if (strcmp(p, "sctp") == 0) {
4369 filter_db_set(&current_filter, SCTP_DB);
4370 } else if (strcmp(p, "raw") == 0) {
4371 filter_db_set(&current_filter, RAW_DB);
4372 } else if (strcmp(p, "unix") == 0) {
4373 filter_db_set(&current_filter, UNIX_ST_DB);
4374 filter_db_set(&current_filter, UNIX_DG_DB);
4375 filter_db_set(&current_filter, UNIX_SQ_DB);
4376 } else if (strcasecmp(p, "unix_stream") == 0 ||
4377 strcmp(p, "u_str") == 0) {
4378 filter_db_set(&current_filter, UNIX_ST_DB);
4379 } else if (strcasecmp(p, "unix_dgram") == 0 ||
4380 strcmp(p, "u_dgr") == 0) {
4381 filter_db_set(&current_filter, UNIX_DG_DB);
4382 } else if (strcasecmp(p, "unix_seqpacket") == 0 ||
4383 strcmp(p, "u_seq") == 0) {
4384 filter_db_set(&current_filter, UNIX_SQ_DB);
4385 } else if (strcmp(p, "packet") == 0) {
4386 filter_db_set(&current_filter, PACKET_R_DB);
4387 filter_db_set(&current_filter, PACKET_DG_DB);
4388 } else if (strcmp(p, "packet_raw") == 0 ||
4389 strcmp(p, "p_raw") == 0) {
4390 filter_db_set(&current_filter, PACKET_R_DB);
4391 } else if (strcmp(p, "packet_dgram") == 0 ||
4392 strcmp(p, "p_dgr") == 0) {
4393 filter_db_set(&current_filter, PACKET_DG_DB);
4394 } else if (strcmp(p, "netlink") == 0) {
4395 filter_db_set(&current_filter, NETLINK_DB);
4396 } else if (strcmp(p, "vsock") == 0) {
4397 filter_db_set(&current_filter, VSOCK_ST_DB);
4398 filter_db_set(&current_filter, VSOCK_DG_DB);
4399 } else if (strcmp(p, "vsock_stream") == 0 ||
4400 strcmp(p, "v_str") == 0) {
4401 filter_db_set(&current_filter, VSOCK_ST_DB);
4402 } else if (strcmp(p, "vsock_dgram") == 0 ||
4403 strcmp(p, "v_dgr") == 0) {
4404 filter_db_set(&current_filter, VSOCK_DG_DB);
4405 } else {
4406 fprintf(stderr, "ss: \"%s\" is illegal socket table id\n", p);
4407 usage();
4408 }
4409 p = p1 + 1;
4410 } while (p1);
4411 break;
4412 }
4413 case 's':
4414 do_summary = 1;
4415 break;
4416 case 'D':
4417 dump_tcpdiag = optarg;
4418 break;
4419 case 'F':
4420 if (filter_fp) {
4421 fprintf(stderr, "More than one filter file\n");
4422 exit(-1);
4423 }
4424 if (optarg[0] == '-')
4425 filter_fp = stdin;
4426 else
4427 filter_fp = fopen(optarg, "r");
4428 if (!filter_fp) {
4429 perror("fopen filter file");
4430 exit(-1);
4431 }
4432 break;
4433 case 'v':
4434 case 'V':
4435 printf("ss utility, iproute2-ss%s\n", SNAPSHOT);
4436 exit(0);
4437 case 'z':
4438 show_sock_ctx++;
4439 /* fall through */
4440 case 'Z':
4441 if (is_selinux_enabled() <= 0) {
4442 fprintf(stderr, "ss: SELinux is not enabled.\n");
4443 exit(1);
4444 }
4445 show_proc_ctx++;
4446 user_ent_hash_build();
4447 break;
4448 case 'N':
4449 if (netns_switch(optarg))
4450 exit(1);
4451 break;
4452 case 'K':
4453 current_filter.kill = 1;
4454 break;
4455 case 'H':
4456 show_header = 0;
4457 break;
4458 case 'h':
4459 help();
4460 case '?':
4461 default:
4462 usage();
4463 }
4464 }
4465
4466 argc -= optind;
4467 argv += optind;
4468
4469 if (do_summary) {
4470 print_summary();
4471 if (do_default && argc == 0)
4472 exit(0);
4473 }
4474
4475 while (argc > 0) {
4476 if (strcmp(*argv, "state") == 0) {
4477 NEXT_ARG();
4478 if (!saw_states)
4479 state_filter = 0;
4480 state_filter |= scan_state(*argv);
4481 saw_states = 1;
4482 } else if (strcmp(*argv, "exclude") == 0 ||
4483 strcmp(*argv, "excl") == 0) {
4484 NEXT_ARG();
4485 if (!saw_states)
4486 state_filter = SS_ALL;
4487 state_filter &= ~scan_state(*argv);
4488 saw_states = 1;
4489 } else {
4490 break;
4491 }
4492 argc--; argv++;
4493 }
4494
4495 if (do_default) {
4496 state_filter = state_filter ? state_filter : SS_CONN;
4497 filter_default_dbs(&current_filter);
4498 }
4499
4500 filter_states_set(&current_filter, state_filter);
4501 filter_merge_defaults(&current_filter);
4502
4503 if (resolve_services && resolve_hosts &&
4504 (current_filter.dbs & (UNIX_DBM|INET_L4_DBM)))
4505 init_service_resolver();
4506
4507 if (current_filter.dbs == 0) {
4508 fprintf(stderr, "ss: no socket tables to show with such filter.\n");
4509 exit(0);
4510 }
4511 if (current_filter.families == 0) {
4512 fprintf(stderr, "ss: no families to show with such filter.\n");
4513 exit(0);
4514 }
4515 if (current_filter.states == 0) {
4516 fprintf(stderr, "ss: no socket states to show with such filter.\n");
4517 exit(0);
4518 }
4519
4520 if (dump_tcpdiag) {
4521 FILE *dump_fp = stdout;
4522
4523 if (!(current_filter.dbs & (1<<TCP_DB))) {
4524 fprintf(stderr, "ss: tcpdiag dump requested and no tcp in filter.\n");
4525 exit(0);
4526 }
4527 if (dump_tcpdiag[0] != '-') {
4528 dump_fp = fopen(dump_tcpdiag, "w");
4529 if (!dump_tcpdiag) {
4530 perror("fopen dump file");
4531 exit(-1);
4532 }
4533 }
4534 inet_show_netlink(&current_filter, dump_fp, IPPROTO_TCP);
4535 fflush(dump_fp);
4536 exit(0);
4537 }
4538
4539 if (ssfilter_parse(&current_filter.f, argc, argv, filter_fp))
4540 usage();
4541
4542 netid_width = 0;
4543 if (current_filter.dbs&(current_filter.dbs-1))
4544 netid_width = 5;
4545
4546 state_width = 0;
4547 if (current_filter.states&(current_filter.states-1))
4548 state_width = 10;
4549
4550 if (isatty(STDOUT_FILENO)) {
4551 struct winsize w;
4552
4553 if (ioctl(STDOUT_FILENO, TIOCGWINSZ, &w) != -1) {
4554 if (w.ws_col > 0)
4555 screen_width = w.ws_col;
4556 }
4557 }
4558
4559 addrp_width = screen_width;
4560 if (netid_width)
4561 addrp_width -= netid_width + 1;
4562 if (state_width)
4563 addrp_width -= state_width + 1;
4564 addrp_width -= 14;
4565
4566 if (addrp_width&1) {
4567 if (netid_width)
4568 netid_width++;
4569 else if (state_width)
4570 state_width++;
4571 else
4572 odd_width_pad = " ";
4573 }
4574
4575 addrp_width /= 2;
4576 addrp_width--;
4577
4578 serv_width = resolve_services ? 7 : 5;
4579
4580 if (addrp_width < 15+serv_width+1)
4581 addrp_width = 15+serv_width+1;
4582
4583 addr_width = addrp_width - serv_width - 1;
4584
4585 if (show_header) {
4586 if (netid_width)
4587 out("%-*s ", netid_width, "Netid");
4588 if (state_width)
4589 out("%-*s ", state_width, "State");
4590 out("%-6s %-6s %s", "Recv-Q", "Send-Q", odd_width_pad);
4591 }
4592
4593 /* Make enough space for the local/remote port field */
4594 addr_width -= 13;
4595 serv_width += 13;
4596
4597 if (show_header) {
4598 out("%*s:%-*s %*s:%-*s\n",
4599 addr_width, "Local Address", serv_width, "Port",
4600 addr_width, "Peer Address", serv_width, "Port");
4601 }
4602
4603 fflush(stdout);
4604
4605 if (follow_events)
4606 exit(handle_follow_request(&current_filter));
4607
4608 if (current_filter.dbs & (1<<NETLINK_DB))
4609 netlink_show(&current_filter);
4610 if (current_filter.dbs & PACKET_DBM)
4611 packet_show(&current_filter);
4612 if (current_filter.dbs & UNIX_DBM)
4613 unix_show(&current_filter);
4614 if (current_filter.dbs & (1<<RAW_DB))
4615 raw_show(&current_filter);
4616 if (current_filter.dbs & (1<<UDP_DB))
4617 udp_show(&current_filter);
4618 if (current_filter.dbs & (1<<TCP_DB))
4619 tcp_show(&current_filter);
4620 if (current_filter.dbs & (1<<DCCP_DB))
4621 dccp_show(&current_filter);
4622 if (current_filter.dbs & (1<<SCTP_DB))
4623 sctp_show(&current_filter);
4624 if (current_filter.dbs & VSOCK_DBM)
4625 vsock_show(&current_filter);
4626
4627 if (show_users || show_proc_ctx || show_sock_ctx)
4628 user_ent_destroy();
4629
4630 return 0;
4631 }