inet_diag.c 28 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175
  1. /*
  2. * inet_diag.c Module for monitoring INET transport protocols sockets.
  3. *
  4. * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
  5. *
  6. * This program is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU General Public License
  8. * as published by the Free Software Foundation; either version
  9. * 2 of the License, or (at your option) any later version.
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/module.h>
  13. #include <linux/types.h>
  14. #include <linux/fcntl.h>
  15. #include <linux/random.h>
  16. #include <linux/slab.h>
  17. #include <linux/cache.h>
  18. #include <linux/init.h>
  19. #include <linux/time.h>
  20. #include <net/icmp.h>
  21. #include <net/tcp.h>
  22. #include <net/ipv6.h>
  23. #include <net/inet_common.h>
  24. #include <net/inet_connection_sock.h>
  25. #include <net/inet_hashtables.h>
  26. #include <net/inet_timewait_sock.h>
  27. #include <net/inet6_hashtables.h>
  28. #include <net/netlink.h>
  29. #include <linux/inet.h>
  30. #include <linux/stddef.h>
  31. #include <linux/inet_diag.h>
  32. #include <linux/sock_diag.h>
  33. static const struct inet_diag_handler **inet_diag_table;
  34. struct inet_diag_entry {
  35. __be32 *saddr;
  36. __be32 *daddr;
  37. u16 sport;
  38. u16 dport;
  39. u16 family;
  40. u16 userlocks;
  41. #if IS_ENABLED(CONFIG_IPV6)
  42. struct in6_addr saddr_storage; /* for IPv4-mapped-IPv6 addresses */
  43. struct in6_addr daddr_storage; /* for IPv4-mapped-IPv6 addresses */
  44. #endif
  45. };
  46. static DEFINE_MUTEX(inet_diag_table_mutex);
  47. static const struct inet_diag_handler *inet_diag_lock_handler(int proto)
  48. {
  49. if (!inet_diag_table[proto])
  50. request_module("net-pf-%d-proto-%d-type-%d-%d", PF_NETLINK,
  51. NETLINK_SOCK_DIAG, AF_INET, proto);
  52. mutex_lock(&inet_diag_table_mutex);
  53. if (!inet_diag_table[proto])
  54. return ERR_PTR(-ENOENT);
  55. return inet_diag_table[proto];
  56. }
  57. static inline void inet_diag_unlock_handler(
  58. const struct inet_diag_handler *handler)
  59. {
  60. mutex_unlock(&inet_diag_table_mutex);
  61. }
  62. int inet_sk_diag_fill(struct sock *sk, struct inet_connection_sock *icsk,
  63. struct sk_buff *skb, struct inet_diag_req_v2 *req,
  64. struct user_namespace *user_ns,
  65. u32 portid, u32 seq, u16 nlmsg_flags,
  66. const struct nlmsghdr *unlh)
  67. {
  68. const struct inet_sock *inet = inet_sk(sk);
  69. struct inet_diag_msg *r;
  70. struct nlmsghdr *nlh;
  71. struct nlattr *attr;
  72. void *info = NULL;
  73. const struct inet_diag_handler *handler;
  74. int ext = req->idiag_ext;
  75. handler = inet_diag_table[req->sdiag_protocol];
  76. BUG_ON(handler == NULL);
  77. nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r),
  78. nlmsg_flags);
  79. if (!nlh)
  80. return -EMSGSIZE;
  81. r = nlmsg_data(nlh);
  82. BUG_ON(sk->sk_state == TCP_TIME_WAIT);
  83. r->idiag_family = sk->sk_family;
  84. r->idiag_state = sk->sk_state;
  85. r->idiag_timer = 0;
  86. r->idiag_retrans = 0;
  87. r->id.idiag_if = sk->sk_bound_dev_if;
  88. sock_diag_save_cookie(sk, r->id.idiag_cookie);
  89. r->id.idiag_sport = inet->inet_sport;
  90. r->id.idiag_dport = inet->inet_dport;
  91. r->id.idiag_src[0] = inet->inet_rcv_saddr;
  92. r->id.idiag_dst[0] = inet->inet_daddr;
  93. /* IPv6 dual-stack sockets use inet->tos for IPv4 connections,
  94. * hence this needs to be included regardless of socket family.
  95. */
  96. if (ext & (1 << (INET_DIAG_TOS - 1)))
  97. if (nla_put_u8(skb, INET_DIAG_TOS, inet->tos) < 0)
  98. goto errout;
  99. #if IS_ENABLED(CONFIG_IPV6)
  100. if (r->idiag_family == AF_INET6) {
  101. const struct ipv6_pinfo *np = inet6_sk(sk);
  102. *(struct in6_addr *)r->id.idiag_src = np->rcv_saddr;
  103. *(struct in6_addr *)r->id.idiag_dst = np->daddr;
  104. if (ext & (1 << (INET_DIAG_TCLASS - 1)))
  105. if (nla_put_u8(skb, INET_DIAG_TCLASS, np->tclass) < 0)
  106. goto errout;
  107. }
  108. #endif
  109. r->idiag_uid = from_kuid_munged(user_ns, sock_i_uid(sk));
  110. r->idiag_inode = sock_i_ino(sk);
  111. if (ext & (1 << (INET_DIAG_MEMINFO - 1))) {
  112. struct inet_diag_meminfo minfo = {
  113. .idiag_rmem = sk_rmem_alloc_get(sk),
  114. .idiag_wmem = sk->sk_wmem_queued,
  115. .idiag_fmem = sk->sk_forward_alloc,
  116. .idiag_tmem = sk_wmem_alloc_get(sk),
  117. };
  118. if (nla_put(skb, INET_DIAG_MEMINFO, sizeof(minfo), &minfo) < 0)
  119. goto errout;
  120. }
  121. if (ext & (1 << (INET_DIAG_SKMEMINFO - 1)))
  122. if (sock_diag_put_meminfo(sk, skb, INET_DIAG_SKMEMINFO))
  123. goto errout;
  124. if (icsk == NULL) {
  125. handler->idiag_get_info(sk, r, NULL);
  126. goto out;
  127. }
  128. #define EXPIRES_IN_MS(tmo) DIV_ROUND_UP((tmo - jiffies) * 1000, HZ)
  129. if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
  130. r->idiag_timer = 1;
  131. r->idiag_retrans = icsk->icsk_retransmits;
  132. r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout);
  133. } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
  134. r->idiag_timer = 4;
  135. r->idiag_retrans = icsk->icsk_probes_out;
  136. r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout);
  137. } else if (timer_pending(&sk->sk_timer)) {
  138. r->idiag_timer = 2;
  139. r->idiag_retrans = icsk->icsk_probes_out;
  140. r->idiag_expires = EXPIRES_IN_MS(sk->sk_timer.expires);
  141. } else {
  142. r->idiag_timer = 0;
  143. r->idiag_expires = 0;
  144. }
  145. #undef EXPIRES_IN_MS
  146. if (ext & (1 << (INET_DIAG_INFO - 1))) {
  147. attr = nla_reserve(skb, INET_DIAG_INFO,
  148. sizeof(struct tcp_info));
  149. if (!attr)
  150. goto errout;
  151. info = nla_data(attr);
  152. }
  153. if ((ext & (1 << (INET_DIAG_CONG - 1))) && icsk->icsk_ca_ops)
  154. if (nla_put_string(skb, INET_DIAG_CONG,
  155. icsk->icsk_ca_ops->name) < 0)
  156. goto errout;
  157. handler->idiag_get_info(sk, r, info);
  158. if (sk->sk_state < TCP_TIME_WAIT &&
  159. icsk->icsk_ca_ops && icsk->icsk_ca_ops->get_info)
  160. icsk->icsk_ca_ops->get_info(sk, ext, skb);
  161. out:
  162. return nlmsg_end(skb, nlh);
  163. errout:
  164. nlmsg_cancel(skb, nlh);
  165. return -EMSGSIZE;
  166. }
  167. EXPORT_SYMBOL_GPL(inet_sk_diag_fill);
  168. static int inet_csk_diag_fill(struct sock *sk,
  169. struct sk_buff *skb, struct inet_diag_req_v2 *req,
  170. struct user_namespace *user_ns,
  171. u32 portid, u32 seq, u16 nlmsg_flags,
  172. const struct nlmsghdr *unlh)
  173. {
  174. return inet_sk_diag_fill(sk, inet_csk(sk),
  175. skb, req, user_ns, portid, seq, nlmsg_flags, unlh);
  176. }
  177. static int inet_twsk_diag_fill(struct inet_timewait_sock *tw,
  178. struct sk_buff *skb, struct inet_diag_req_v2 *req,
  179. u32 portid, u32 seq, u16 nlmsg_flags,
  180. const struct nlmsghdr *unlh)
  181. {
  182. long tmo;
  183. struct inet_diag_msg *r;
  184. struct nlmsghdr *nlh;
  185. nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r),
  186. nlmsg_flags);
  187. if (!nlh)
  188. return -EMSGSIZE;
  189. r = nlmsg_data(nlh);
  190. BUG_ON(tw->tw_state != TCP_TIME_WAIT);
  191. tmo = tw->tw_ttd - jiffies;
  192. if (tmo < 0)
  193. tmo = 0;
  194. r->idiag_family = tw->tw_family;
  195. r->idiag_retrans = 0;
  196. r->id.idiag_if = tw->tw_bound_dev_if;
  197. sock_diag_save_cookie(tw, r->id.idiag_cookie);
  198. r->id.idiag_sport = tw->tw_sport;
  199. r->id.idiag_dport = tw->tw_dport;
  200. r->id.idiag_src[0] = tw->tw_rcv_saddr;
  201. r->id.idiag_dst[0] = tw->tw_daddr;
  202. r->idiag_state = tw->tw_substate;
  203. r->idiag_timer = 3;
  204. r->idiag_expires = DIV_ROUND_UP(tmo * 1000, HZ);
  205. r->idiag_rqueue = 0;
  206. r->idiag_wqueue = 0;
  207. r->idiag_uid = 0;
  208. r->idiag_inode = 0;
  209. #if IS_ENABLED(CONFIG_IPV6)
  210. if (tw->tw_family == AF_INET6) {
  211. const struct inet6_timewait_sock *tw6 =
  212. inet6_twsk((struct sock *)tw);
  213. *(struct in6_addr *)r->id.idiag_src = tw6->tw_v6_rcv_saddr;
  214. *(struct in6_addr *)r->id.idiag_dst = tw6->tw_v6_daddr;
  215. }
  216. #endif
  217. return nlmsg_end(skb, nlh);
  218. }
  219. static int sk_diag_fill(struct sock *sk, struct sk_buff *skb,
  220. struct inet_diag_req_v2 *r,
  221. struct user_namespace *user_ns,
  222. u32 portid, u32 seq, u16 nlmsg_flags,
  223. const struct nlmsghdr *unlh)
  224. {
  225. if (sk->sk_state == TCP_TIME_WAIT)
  226. return inet_twsk_diag_fill((struct inet_timewait_sock *)sk,
  227. skb, r, portid, seq, nlmsg_flags,
  228. unlh);
  229. return inet_csk_diag_fill(sk, skb, r, user_ns, portid, seq, nlmsg_flags, unlh);
  230. }
  231. int inet_diag_dump_one_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *in_skb,
  232. const struct nlmsghdr *nlh, struct inet_diag_req_v2 *req)
  233. {
  234. int err;
  235. struct sock *sk;
  236. struct sk_buff *rep;
  237. struct net *net = sock_net(in_skb->sk);
  238. err = -EINVAL;
  239. if (req->sdiag_family == AF_INET) {
  240. sk = inet_lookup(net, hashinfo, req->id.idiag_dst[0],
  241. req->id.idiag_dport, req->id.idiag_src[0],
  242. req->id.idiag_sport, req->id.idiag_if);
  243. }
  244. #if IS_ENABLED(CONFIG_IPV6)
  245. else if (req->sdiag_family == AF_INET6) {
  246. sk = inet6_lookup(net, hashinfo,
  247. (struct in6_addr *)req->id.idiag_dst,
  248. req->id.idiag_dport,
  249. (struct in6_addr *)req->id.idiag_src,
  250. req->id.idiag_sport,
  251. req->id.idiag_if);
  252. }
  253. #endif
  254. else {
  255. goto out_nosk;
  256. }
  257. err = -ENOENT;
  258. if (sk == NULL)
  259. goto out_nosk;
  260. err = sock_diag_check_cookie(sk, req->id.idiag_cookie);
  261. if (err)
  262. goto out;
  263. rep = nlmsg_new(sizeof(struct inet_diag_msg) +
  264. sizeof(struct inet_diag_meminfo) +
  265. sizeof(struct tcp_info) + 64, GFP_KERNEL);
  266. if (!rep) {
  267. err = -ENOMEM;
  268. goto out;
  269. }
  270. err = sk_diag_fill(sk, rep, req,
  271. sk_user_ns(NETLINK_CB(in_skb).ssk),
  272. NETLINK_CB(in_skb).portid,
  273. nlh->nlmsg_seq, 0, nlh);
  274. if (err < 0) {
  275. WARN_ON(err == -EMSGSIZE);
  276. nlmsg_free(rep);
  277. goto out;
  278. }
  279. err = netlink_unicast(net->diag_nlsk, rep, NETLINK_CB(in_skb).portid,
  280. MSG_DONTWAIT);
  281. if (err > 0)
  282. err = 0;
  283. out:
  284. if (sk) {
  285. if (sk->sk_state == TCP_TIME_WAIT)
  286. inet_twsk_put((struct inet_timewait_sock *)sk);
  287. else
  288. sock_put(sk);
  289. }
  290. out_nosk:
  291. return err;
  292. }
  293. EXPORT_SYMBOL_GPL(inet_diag_dump_one_icsk);
  294. static int inet_diag_get_exact(struct sk_buff *in_skb,
  295. const struct nlmsghdr *nlh,
  296. struct inet_diag_req_v2 *req)
  297. {
  298. const struct inet_diag_handler *handler;
  299. int err;
  300. handler = inet_diag_lock_handler(req->sdiag_protocol);
  301. if (IS_ERR(handler))
  302. err = PTR_ERR(handler);
  303. else
  304. err = handler->dump_one(in_skb, nlh, req);
  305. inet_diag_unlock_handler(handler);
  306. return err;
  307. }
  308. static int bitstring_match(const __be32 *a1, const __be32 *a2, int bits)
  309. {
  310. int words = bits >> 5;
  311. bits &= 0x1f;
  312. if (words) {
  313. if (memcmp(a1, a2, words << 2))
  314. return 0;
  315. }
  316. if (bits) {
  317. __be32 w1, w2;
  318. __be32 mask;
  319. w1 = a1[words];
  320. w2 = a2[words];
  321. mask = htonl((0xffffffff) << (32 - bits));
  322. if ((w1 ^ w2) & mask)
  323. return 0;
  324. }
  325. return 1;
  326. }
  327. static int inet_diag_bc_run(const struct nlattr *_bc,
  328. const struct inet_diag_entry *entry)
  329. {
  330. const void *bc = nla_data(_bc);
  331. int len = nla_len(_bc);
  332. while (len > 0) {
  333. int yes = 1;
  334. const struct inet_diag_bc_op *op = bc;
  335. switch (op->code) {
  336. case INET_DIAG_BC_NOP:
  337. break;
  338. case INET_DIAG_BC_JMP:
  339. yes = 0;
  340. break;
  341. case INET_DIAG_BC_S_GE:
  342. yes = entry->sport >= op[1].no;
  343. break;
  344. case INET_DIAG_BC_S_LE:
  345. yes = entry->sport <= op[1].no;
  346. break;
  347. case INET_DIAG_BC_D_GE:
  348. yes = entry->dport >= op[1].no;
  349. break;
  350. case INET_DIAG_BC_D_LE:
  351. yes = entry->dport <= op[1].no;
  352. break;
  353. case INET_DIAG_BC_AUTO:
  354. yes = !(entry->userlocks & SOCK_BINDPORT_LOCK);
  355. break;
  356. case INET_DIAG_BC_S_COND:
  357. case INET_DIAG_BC_D_COND: {
  358. struct inet_diag_hostcond *cond;
  359. __be32 *addr;
  360. cond = (struct inet_diag_hostcond *)(op + 1);
  361. if (cond->port != -1 &&
  362. cond->port != (op->code == INET_DIAG_BC_S_COND ?
  363. entry->sport : entry->dport)) {
  364. yes = 0;
  365. break;
  366. }
  367. if (cond->prefix_len == 0)
  368. break;
  369. if (op->code == INET_DIAG_BC_S_COND)
  370. addr = entry->saddr;
  371. else
  372. addr = entry->daddr;
  373. if (bitstring_match(addr, cond->addr,
  374. cond->prefix_len))
  375. break;
  376. if (entry->family == AF_INET6 &&
  377. cond->family == AF_INET) {
  378. if (addr[0] == 0 && addr[1] == 0 &&
  379. addr[2] == htonl(0xffff) &&
  380. bitstring_match(addr + 3, cond->addr,
  381. cond->prefix_len))
  382. break;
  383. }
  384. yes = 0;
  385. break;
  386. }
  387. }
  388. if (yes) {
  389. len -= op->yes;
  390. bc += op->yes;
  391. } else {
  392. len -= op->no;
  393. bc += op->no;
  394. }
  395. }
  396. return len == 0;
  397. }
  398. int inet_diag_bc_sk(const struct nlattr *bc, struct sock *sk)
  399. {
  400. struct inet_diag_entry entry;
  401. struct inet_sock *inet = inet_sk(sk);
  402. if (bc == NULL)
  403. return 1;
  404. entry.family = sk->sk_family;
  405. #if IS_ENABLED(CONFIG_IPV6)
  406. if (entry.family == AF_INET6) {
  407. struct ipv6_pinfo *np = inet6_sk(sk);
  408. entry.saddr = np->rcv_saddr.s6_addr32;
  409. entry.daddr = np->daddr.s6_addr32;
  410. } else
  411. #endif
  412. {
  413. entry.saddr = &inet->inet_rcv_saddr;
  414. entry.daddr = &inet->inet_daddr;
  415. }
  416. entry.sport = inet->inet_num;
  417. entry.dport = ntohs(inet->inet_dport);
  418. entry.userlocks = sk->sk_userlocks;
  419. return inet_diag_bc_run(bc, &entry);
  420. }
  421. EXPORT_SYMBOL_GPL(inet_diag_bc_sk);
  422. static int valid_cc(const void *bc, int len, int cc)
  423. {
  424. while (len >= 0) {
  425. const struct inet_diag_bc_op *op = bc;
  426. if (cc > len)
  427. return 0;
  428. if (cc == len)
  429. return 1;
  430. if (op->yes < 4 || op->yes & 3)
  431. return 0;
  432. len -= op->yes;
  433. bc += op->yes;
  434. }
  435. return 0;
  436. }
  437. /* Validate an inet_diag_hostcond. */
  438. static bool valid_hostcond(const struct inet_diag_bc_op *op, int len,
  439. int *min_len)
  440. {
  441. int addr_len;
  442. struct inet_diag_hostcond *cond;
  443. /* Check hostcond space. */
  444. *min_len += sizeof(struct inet_diag_hostcond);
  445. if (len < *min_len)
  446. return false;
  447. cond = (struct inet_diag_hostcond *)(op + 1);
  448. /* Check address family and address length. */
  449. switch (cond->family) {
  450. case AF_UNSPEC:
  451. addr_len = 0;
  452. break;
  453. case AF_INET:
  454. addr_len = sizeof(struct in_addr);
  455. break;
  456. case AF_INET6:
  457. addr_len = sizeof(struct in6_addr);
  458. break;
  459. default:
  460. return false;
  461. }
  462. *min_len += addr_len;
  463. if (len < *min_len)
  464. return false;
  465. /* Check prefix length (in bits) vs address length (in bytes). */
  466. if (cond->prefix_len > 8 * addr_len)
  467. return false;
  468. return true;
  469. }
  470. static int inet_diag_bc_audit(const void *bytecode, int bytecode_len)
  471. {
  472. const void *bc = bytecode;
  473. int len = bytecode_len;
  474. while (len > 0) {
  475. const struct inet_diag_bc_op *op = bc;
  476. int min_len = sizeof(struct inet_diag_bc_op);
  477. //printk("BC: %d %d %d {%d} / %d\n", op->code, op->yes, op->no, op[1].no, len);
  478. switch (op->code) {
  479. case INET_DIAG_BC_S_COND:
  480. case INET_DIAG_BC_D_COND:
  481. if (!valid_hostcond(bc, len, &min_len))
  482. return -EINVAL;
  483. /* fall through */
  484. case INET_DIAG_BC_AUTO:
  485. case INET_DIAG_BC_S_GE:
  486. case INET_DIAG_BC_S_LE:
  487. case INET_DIAG_BC_D_GE:
  488. case INET_DIAG_BC_D_LE:
  489. case INET_DIAG_BC_JMP:
  490. if (op->no < min_len || op->no > len + 4 || op->no & 3)
  491. return -EINVAL;
  492. if (op->no < len &&
  493. !valid_cc(bytecode, bytecode_len, len - op->no))
  494. return -EINVAL;
  495. break;
  496. case INET_DIAG_BC_NOP:
  497. break;
  498. default:
  499. return -EINVAL;
  500. }
  501. if (op->yes < min_len || op->yes > len + 4 || op->yes & 3)
  502. return -EINVAL;
  503. bc += op->yes;
  504. len -= op->yes;
  505. }
  506. return len == 0 ? 0 : -EINVAL;
  507. }
  508. static int inet_csk_diag_dump(struct sock *sk,
  509. struct sk_buff *skb,
  510. struct netlink_callback *cb,
  511. struct inet_diag_req_v2 *r,
  512. const struct nlattr *bc)
  513. {
  514. if (!inet_diag_bc_sk(bc, sk))
  515. return 0;
  516. return inet_csk_diag_fill(sk, skb, r,
  517. sk_user_ns(NETLINK_CB(cb->skb).ssk),
  518. NETLINK_CB(cb->skb).portid,
  519. cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh);
  520. }
  521. static int inet_twsk_diag_dump(struct inet_timewait_sock *tw,
  522. struct sk_buff *skb,
  523. struct netlink_callback *cb,
  524. struct inet_diag_req_v2 *r,
  525. const struct nlattr *bc)
  526. {
  527. if (bc != NULL) {
  528. struct inet_diag_entry entry;
  529. entry.family = tw->tw_family;
  530. #if IS_ENABLED(CONFIG_IPV6)
  531. if (tw->tw_family == AF_INET6) {
  532. struct inet6_timewait_sock *tw6 =
  533. inet6_twsk((struct sock *)tw);
  534. entry.saddr = tw6->tw_v6_rcv_saddr.s6_addr32;
  535. entry.daddr = tw6->tw_v6_daddr.s6_addr32;
  536. } else
  537. #endif
  538. {
  539. entry.saddr = &tw->tw_rcv_saddr;
  540. entry.daddr = &tw->tw_daddr;
  541. }
  542. entry.sport = tw->tw_num;
  543. entry.dport = ntohs(tw->tw_dport);
  544. entry.userlocks = 0;
  545. if (!inet_diag_bc_run(bc, &entry))
  546. return 0;
  547. }
  548. return inet_twsk_diag_fill(tw, skb, r,
  549. NETLINK_CB(cb->skb).portid,
  550. cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh);
  551. }
  552. /* Get the IPv4, IPv6, or IPv4-mapped-IPv6 local and remote addresses
  553. * from a request_sock. For IPv4-mapped-IPv6 we must map IPv4 to IPv6.
  554. */
  555. static inline void inet_diag_req_addrs(const struct sock *sk,
  556. const struct request_sock *req,
  557. struct inet_diag_entry *entry)
  558. {
  559. struct inet_request_sock *ireq = inet_rsk(req);
  560. #if IS_ENABLED(CONFIG_IPV6)
  561. if (sk->sk_family == AF_INET6) {
  562. if (req->rsk_ops->family == AF_INET6) {
  563. entry->saddr = inet6_rsk(req)->loc_addr.s6_addr32;
  564. entry->daddr = inet6_rsk(req)->rmt_addr.s6_addr32;
  565. } else if (req->rsk_ops->family == AF_INET) {
  566. ipv6_addr_set_v4mapped(ireq->loc_addr,
  567. &entry->saddr_storage);
  568. ipv6_addr_set_v4mapped(ireq->rmt_addr,
  569. &entry->daddr_storage);
  570. entry->saddr = entry->saddr_storage.s6_addr32;
  571. entry->daddr = entry->daddr_storage.s6_addr32;
  572. }
  573. } else
  574. #endif
  575. {
  576. entry->saddr = &ireq->loc_addr;
  577. entry->daddr = &ireq->rmt_addr;
  578. }
  579. }
  580. static int inet_diag_fill_req(struct sk_buff *skb, struct sock *sk,
  581. struct request_sock *req,
  582. struct user_namespace *user_ns,
  583. u32 portid, u32 seq,
  584. const struct nlmsghdr *unlh)
  585. {
  586. const struct inet_request_sock *ireq = inet_rsk(req);
  587. struct inet_sock *inet = inet_sk(sk);
  588. struct inet_diag_msg *r;
  589. struct nlmsghdr *nlh;
  590. long tmo;
  591. nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r),
  592. NLM_F_MULTI);
  593. if (!nlh)
  594. return -EMSGSIZE;
  595. r = nlmsg_data(nlh);
  596. r->idiag_family = sk->sk_family;
  597. r->idiag_state = TCP_SYN_RECV;
  598. r->idiag_timer = 1;
  599. r->idiag_retrans = req->retrans;
  600. r->id.idiag_if = sk->sk_bound_dev_if;
  601. sock_diag_save_cookie(req, r->id.idiag_cookie);
  602. tmo = req->expires - jiffies;
  603. if (tmo < 0)
  604. tmo = 0;
  605. r->id.idiag_sport = inet->inet_sport;
  606. r->id.idiag_dport = ireq->rmt_port;
  607. r->id.idiag_src[0] = ireq->loc_addr;
  608. r->id.idiag_dst[0] = ireq->rmt_addr;
  609. r->idiag_expires = jiffies_to_msecs(tmo);
  610. r->idiag_rqueue = 0;
  611. r->idiag_wqueue = 0;
  612. r->idiag_uid = from_kuid_munged(user_ns, sock_i_uid(sk));
  613. r->idiag_inode = 0;
  614. #if IS_ENABLED(CONFIG_IPV6)
  615. if (r->idiag_family == AF_INET6) {
  616. struct inet_diag_entry entry;
  617. inet_diag_req_addrs(sk, req, &entry);
  618. memcpy(r->id.idiag_src, entry.saddr, sizeof(struct in6_addr));
  619. memcpy(r->id.idiag_dst, entry.daddr, sizeof(struct in6_addr));
  620. }
  621. #endif
  622. return nlmsg_end(skb, nlh);
  623. }
  624. static int inet_diag_dump_reqs(struct sk_buff *skb, struct sock *sk,
  625. struct netlink_callback *cb,
  626. struct inet_diag_req_v2 *r,
  627. const struct nlattr *bc)
  628. {
  629. struct inet_diag_entry entry;
  630. struct inet_connection_sock *icsk = inet_csk(sk);
  631. struct listen_sock *lopt;
  632. struct inet_sock *inet = inet_sk(sk);
  633. int j, s_j;
  634. int reqnum, s_reqnum;
  635. int err = 0;
  636. s_j = cb->args[3];
  637. s_reqnum = cb->args[4];
  638. if (s_j > 0)
  639. s_j--;
  640. entry.family = sk->sk_family;
  641. read_lock_bh(&icsk->icsk_accept_queue.syn_wait_lock);
  642. lopt = icsk->icsk_accept_queue.listen_opt;
  643. if (!lopt || !lopt->qlen)
  644. goto out;
  645. if (bc != NULL) {
  646. entry.sport = inet->inet_num;
  647. entry.userlocks = sk->sk_userlocks;
  648. }
  649. for (j = s_j; j < lopt->nr_table_entries; j++) {
  650. struct request_sock *req, *head = lopt->syn_table[j];
  651. reqnum = 0;
  652. for (req = head; req; reqnum++, req = req->dl_next) {
  653. struct inet_request_sock *ireq = inet_rsk(req);
  654. if (reqnum < s_reqnum)
  655. continue;
  656. if (r->id.idiag_dport != ireq->rmt_port &&
  657. r->id.idiag_dport)
  658. continue;
  659. if (bc) {
  660. inet_diag_req_addrs(sk, req, &entry);
  661. entry.dport = ntohs(ireq->rmt_port);
  662. if (!inet_diag_bc_run(bc, &entry))
  663. continue;
  664. }
  665. err = inet_diag_fill_req(skb, sk, req,
  666. sk_user_ns(NETLINK_CB(cb->skb).ssk),
  667. NETLINK_CB(cb->skb).portid,
  668. cb->nlh->nlmsg_seq, cb->nlh);
  669. if (err < 0) {
  670. cb->args[3] = j + 1;
  671. cb->args[4] = reqnum;
  672. goto out;
  673. }
  674. }
  675. s_reqnum = 0;
  676. }
  677. out:
  678. read_unlock_bh(&icsk->icsk_accept_queue.syn_wait_lock);
  679. return err;
  680. }
  681. void inet_diag_dump_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *skb,
  682. struct netlink_callback *cb, struct inet_diag_req_v2 *r, struct nlattr *bc)
  683. {
  684. int i, num;
  685. int s_i, s_num;
  686. struct net *net = sock_net(skb->sk);
  687. s_i = cb->args[1];
  688. s_num = num = cb->args[2];
  689. if (cb->args[0] == 0) {
  690. if (!(r->idiag_states & (TCPF_LISTEN | TCPF_SYN_RECV)))
  691. goto skip_listen_ht;
  692. for (i = s_i; i < INET_LHTABLE_SIZE; i++) {
  693. struct sock *sk;
  694. struct hlist_nulls_node *node;
  695. struct inet_listen_hashbucket *ilb;
  696. num = 0;
  697. ilb = &hashinfo->listening_hash[i];
  698. spin_lock_bh(&ilb->lock);
  699. sk_nulls_for_each(sk, node, &ilb->head) {
  700. struct inet_sock *inet = inet_sk(sk);
  701. if (!net_eq(sock_net(sk), net))
  702. continue;
  703. if (num < s_num) {
  704. num++;
  705. continue;
  706. }
  707. if (r->sdiag_family != AF_UNSPEC &&
  708. sk->sk_family != r->sdiag_family)
  709. goto next_listen;
  710. if (r->id.idiag_sport != inet->inet_sport &&
  711. r->id.idiag_sport)
  712. goto next_listen;
  713. if (!(r->idiag_states & TCPF_LISTEN) ||
  714. r->id.idiag_dport ||
  715. cb->args[3] > 0)
  716. goto syn_recv;
  717. if (inet_csk_diag_dump(sk, skb, cb, r, bc) < 0) {
  718. spin_unlock_bh(&ilb->lock);
  719. goto done;
  720. }
  721. syn_recv:
  722. if (!(r->idiag_states & TCPF_SYN_RECV))
  723. goto next_listen;
  724. if (inet_diag_dump_reqs(skb, sk, cb, r, bc) < 0) {
  725. spin_unlock_bh(&ilb->lock);
  726. goto done;
  727. }
  728. next_listen:
  729. cb->args[3] = 0;
  730. cb->args[4] = 0;
  731. ++num;
  732. }
  733. spin_unlock_bh(&ilb->lock);
  734. s_num = 0;
  735. cb->args[3] = 0;
  736. cb->args[4] = 0;
  737. }
  738. skip_listen_ht:
  739. cb->args[0] = 1;
  740. s_i = num = s_num = 0;
  741. }
  742. if (!(r->idiag_states & ~(TCPF_LISTEN | TCPF_SYN_RECV)))
  743. goto out;
  744. for (i = s_i; i <= hashinfo->ehash_mask; i++) {
  745. struct inet_ehash_bucket *head = &hashinfo->ehash[i];
  746. spinlock_t *lock = inet_ehash_lockp(hashinfo, i);
  747. struct sock *sk;
  748. struct hlist_nulls_node *node;
  749. num = 0;
  750. if (hlist_nulls_empty(&head->chain) &&
  751. hlist_nulls_empty(&head->twchain))
  752. continue;
  753. if (i > s_i)
  754. s_num = 0;
  755. spin_lock_bh(lock);
  756. sk_nulls_for_each(sk, node, &head->chain) {
  757. struct inet_sock *inet = inet_sk(sk);
  758. if (!net_eq(sock_net(sk), net))
  759. continue;
  760. if (num < s_num)
  761. goto next_normal;
  762. if (!(r->idiag_states & (1 << sk->sk_state)))
  763. goto next_normal;
  764. if (r->sdiag_family != AF_UNSPEC &&
  765. sk->sk_family != r->sdiag_family)
  766. goto next_normal;
  767. if (r->id.idiag_sport != inet->inet_sport &&
  768. r->id.idiag_sport)
  769. goto next_normal;
  770. if (r->id.idiag_dport != inet->inet_dport &&
  771. r->id.idiag_dport)
  772. goto next_normal;
  773. if (inet_csk_diag_dump(sk, skb, cb, r, bc) < 0) {
  774. spin_unlock_bh(lock);
  775. goto done;
  776. }
  777. next_normal:
  778. ++num;
  779. }
  780. if (r->idiag_states & TCPF_TIME_WAIT) {
  781. struct inet_timewait_sock *tw;
  782. inet_twsk_for_each(tw, node,
  783. &head->twchain) {
  784. if (!net_eq(twsk_net(tw), net))
  785. continue;
  786. if (num < s_num)
  787. goto next_dying;
  788. if (r->sdiag_family != AF_UNSPEC &&
  789. tw->tw_family != r->sdiag_family)
  790. goto next_dying;
  791. if (r->id.idiag_sport != tw->tw_sport &&
  792. r->id.idiag_sport)
  793. goto next_dying;
  794. if (r->id.idiag_dport != tw->tw_dport &&
  795. r->id.idiag_dport)
  796. goto next_dying;
  797. if (inet_twsk_diag_dump(tw, skb, cb, r, bc) < 0) {
  798. spin_unlock_bh(lock);
  799. goto done;
  800. }
  801. next_dying:
  802. ++num;
  803. }
  804. }
  805. spin_unlock_bh(lock);
  806. }
  807. done:
  808. cb->args[1] = i;
  809. cb->args[2] = num;
  810. out:
  811. ;
  812. }
  813. EXPORT_SYMBOL_GPL(inet_diag_dump_icsk);
  814. static int __inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb,
  815. struct inet_diag_req_v2 *r, struct nlattr *bc)
  816. {
  817. const struct inet_diag_handler *handler;
  818. int err = 0;
  819. handler = inet_diag_lock_handler(r->sdiag_protocol);
  820. if (!IS_ERR(handler))
  821. handler->dump(skb, cb, r, bc);
  822. else
  823. err = PTR_ERR(handler);
  824. inet_diag_unlock_handler(handler);
  825. return err ? : skb->len;
  826. }
  827. static int inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb)
  828. {
  829. struct nlattr *bc = NULL;
  830. int hdrlen = sizeof(struct inet_diag_req_v2);
  831. if (nlmsg_attrlen(cb->nlh, hdrlen))
  832. bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE);
  833. return __inet_diag_dump(skb, cb, nlmsg_data(cb->nlh), bc);
  834. }
  835. static inline int inet_diag_type2proto(int type)
  836. {
  837. switch (type) {
  838. case TCPDIAG_GETSOCK:
  839. return IPPROTO_TCP;
  840. case DCCPDIAG_GETSOCK:
  841. return IPPROTO_DCCP;
  842. default:
  843. return 0;
  844. }
  845. }
  846. static int inet_diag_dump_compat(struct sk_buff *skb, struct netlink_callback *cb)
  847. {
  848. struct inet_diag_req *rc = nlmsg_data(cb->nlh);
  849. struct inet_diag_req_v2 req;
  850. struct nlattr *bc = NULL;
  851. int hdrlen = sizeof(struct inet_diag_req);
  852. req.sdiag_family = AF_UNSPEC; /* compatibility */
  853. req.sdiag_protocol = inet_diag_type2proto(cb->nlh->nlmsg_type);
  854. req.idiag_ext = rc->idiag_ext;
  855. req.idiag_states = rc->idiag_states;
  856. req.id = rc->id;
  857. if (nlmsg_attrlen(cb->nlh, hdrlen))
  858. bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE);
  859. return __inet_diag_dump(skb, cb, &req, bc);
  860. }
  861. static int inet_diag_get_exact_compat(struct sk_buff *in_skb,
  862. const struct nlmsghdr *nlh)
  863. {
  864. struct inet_diag_req *rc = nlmsg_data(nlh);
  865. struct inet_diag_req_v2 req;
  866. req.sdiag_family = rc->idiag_family;
  867. req.sdiag_protocol = inet_diag_type2proto(nlh->nlmsg_type);
  868. req.idiag_ext = rc->idiag_ext;
  869. req.idiag_states = rc->idiag_states;
  870. req.id = rc->id;
  871. return inet_diag_get_exact(in_skb, nlh, &req);
  872. }
  873. static int inet_diag_rcv_msg_compat(struct sk_buff *skb, struct nlmsghdr *nlh)
  874. {
  875. int hdrlen = sizeof(struct inet_diag_req);
  876. struct net *net = sock_net(skb->sk);
  877. if (nlh->nlmsg_type >= INET_DIAG_GETSOCK_MAX ||
  878. nlmsg_len(nlh) < hdrlen)
  879. return -EINVAL;
  880. if (nlh->nlmsg_flags & NLM_F_DUMP) {
  881. if (nlmsg_attrlen(nlh, hdrlen)) {
  882. struct nlattr *attr;
  883. attr = nlmsg_find_attr(nlh, hdrlen,
  884. INET_DIAG_REQ_BYTECODE);
  885. if (attr == NULL ||
  886. nla_len(attr) < sizeof(struct inet_diag_bc_op) ||
  887. inet_diag_bc_audit(nla_data(attr), nla_len(attr)))
  888. return -EINVAL;
  889. }
  890. {
  891. struct netlink_dump_control c = {
  892. .dump = inet_diag_dump_compat,
  893. };
  894. return netlink_dump_start(net->diag_nlsk, skb, nlh, &c);
  895. }
  896. }
  897. return inet_diag_get_exact_compat(skb, nlh);
  898. }
  899. static int inet_diag_handler_dump(struct sk_buff *skb, struct nlmsghdr *h)
  900. {
  901. int hdrlen = sizeof(struct inet_diag_req_v2);
  902. struct net *net = sock_net(skb->sk);
  903. if (nlmsg_len(h) < hdrlen)
  904. return -EINVAL;
  905. if (h->nlmsg_flags & NLM_F_DUMP) {
  906. if (nlmsg_attrlen(h, hdrlen)) {
  907. struct nlattr *attr;
  908. attr = nlmsg_find_attr(h, hdrlen,
  909. INET_DIAG_REQ_BYTECODE);
  910. if (attr == NULL ||
  911. nla_len(attr) < sizeof(struct inet_diag_bc_op) ||
  912. inet_diag_bc_audit(nla_data(attr), nla_len(attr)))
  913. return -EINVAL;
  914. }
  915. {
  916. struct netlink_dump_control c = {
  917. .dump = inet_diag_dump,
  918. };
  919. return netlink_dump_start(net->diag_nlsk, skb, h, &c);
  920. }
  921. }
  922. return inet_diag_get_exact(skb, h, nlmsg_data(h));
  923. }
  924. static const struct sock_diag_handler inet_diag_handler = {
  925. .family = AF_INET,
  926. .dump = inet_diag_handler_dump,
  927. };
  928. static const struct sock_diag_handler inet6_diag_handler = {
  929. .family = AF_INET6,
  930. .dump = inet_diag_handler_dump,
  931. };
  932. int inet_diag_register(const struct inet_diag_handler *h)
  933. {
  934. const __u16 type = h->idiag_type;
  935. int err = -EINVAL;
  936. if (type >= IPPROTO_MAX)
  937. goto out;
  938. mutex_lock(&inet_diag_table_mutex);
  939. err = -EEXIST;
  940. if (inet_diag_table[type] == NULL) {
  941. inet_diag_table[type] = h;
  942. err = 0;
  943. }
  944. mutex_unlock(&inet_diag_table_mutex);
  945. out:
  946. return err;
  947. }
  948. EXPORT_SYMBOL_GPL(inet_diag_register);
  949. void inet_diag_unregister(const struct inet_diag_handler *h)
  950. {
  951. const __u16 type = h->idiag_type;
  952. if (type >= IPPROTO_MAX)
  953. return;
  954. mutex_lock(&inet_diag_table_mutex);
  955. inet_diag_table[type] = NULL;
  956. mutex_unlock(&inet_diag_table_mutex);
  957. }
  958. EXPORT_SYMBOL_GPL(inet_diag_unregister);
  959. static int __init inet_diag_init(void)
  960. {
  961. const int inet_diag_table_size = (IPPROTO_MAX *
  962. sizeof(struct inet_diag_handler *));
  963. int err = -ENOMEM;
  964. inet_diag_table = kzalloc(inet_diag_table_size, GFP_KERNEL);
  965. if (!inet_diag_table)
  966. goto out;
  967. err = sock_diag_register(&inet_diag_handler);
  968. if (err)
  969. goto out_free_nl;
  970. err = sock_diag_register(&inet6_diag_handler);
  971. if (err)
  972. goto out_free_inet;
  973. sock_diag_register_inet_compat(inet_diag_rcv_msg_compat);
  974. out:
  975. return err;
  976. out_free_inet:
  977. sock_diag_unregister(&inet_diag_handler);
  978. out_free_nl:
  979. kfree(inet_diag_table);
  980. goto out;
  981. }
  982. static void __exit inet_diag_exit(void)
  983. {
  984. sock_diag_unregister(&inet6_diag_handler);
  985. sock_diag_unregister(&inet_diag_handler);
  986. sock_diag_unregister_inet_compat(inet_diag_rcv_msg_compat);
  987. kfree(inet_diag_table);
  988. }
/* Declare inet_diag_init/inet_diag_exit as the module's init and exit hooks. */
module_init(inet_diag_init);
module_exit(inet_diag_exit);
MODULE_LICENSE("GPL");
/*
 * Module aliases for PF_NETLINK / NETLINK_SOCK_DIAG; the last argument is
 * the numeric address family named in the adjacent comment.
 */
MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 2 /* AF_INET */);
MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 10 /* AF_INET6 */);