sysctl_net_ipv4.c 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986
  1. /*
  2. * sysctl_net_ipv4.c: sysctl interface to net IPV4 subsystem.
  3. *
  4. * Begun April 1, 1996, Mike Shaver.
  5. * Added /proc/sys/net/ipv4 directory entry (empty =) ). [MS]
  6. */
  7. #include <linux/mm.h>
  8. #include <linux/module.h>
  9. #include <linux/sysctl.h>
  10. #include <linux/igmp.h>
  11. #include <linux/inetdevice.h>
  12. #include <linux/seqlock.h>
  13. #include <linux/init.h>
  14. #include <linux/slab.h>
  15. #include <linux/nsproxy.h>
  16. #include <linux/swap.h>
  17. #include <net/snmp.h>
  18. #include <net/icmp.h>
  19. #include <net/ip.h>
  20. #include <net/route.h>
  21. #include <net/tcp.h>
  22. #include <net/udp.h>
  23. #include <net/cipso_ipv4.h>
  24. #include <net/inet_frag.h>
  25. #include <net/ping.h>
  26. #include <net/tcp_memcontrol.h>
  27. static int zero;
  28. static int one = 1;
  29. static int four = 4;
  30. static int gso_max_segs = GSO_MAX_SEGS;
  31. static int tcp_retr1_max = 255;
  32. static int ip_local_port_range_min[] = { 1, 1 };
  33. static int ip_local_port_range_max[] = { 65535, 65535 };
  34. static int tcp_adv_win_scale_min = -31;
  35. static int tcp_adv_win_scale_max = 31;
  36. static int ip_ttl_min = 1;
  37. static int ip_ttl_max = 255;
  38. static int tcp_syn_retries_min = 1;
  39. static int tcp_syn_retries_max = MAX_TCP_SYNCNT;
  40. static int ip_ping_group_range_min[] = { 0, 0 };
  41. static int ip_ping_group_range_max[] = { GID_T_MAX, GID_T_MAX };
  42. static int min_sndbuf = SOCK_MIN_SNDBUF;
  43. static int min_rcvbuf = SOCK_MIN_RCVBUF;
  44. /* Update system visible IP port range */
  45. static void set_local_port_range(struct net *net, int range[2])
  46. {
  47. bool same_parity = !((range[0] ^ range[1]) & 1);
  48. write_seqlock(&net->ipv4.ip_local_ports.lock);
  49. if (same_parity && !net->ipv4.ip_local_ports.warned) {
  50. net->ipv4.ip_local_ports.warned = true;
  51. pr_err_ratelimited("ip_local_port_range: prefer different parity for start/end values.\n");
  52. }
  53. net->ipv4.ip_local_ports.range[0] = range[0];
  54. net->ipv4.ip_local_ports.range[1] = range[1];
  55. write_sequnlock(&net->ipv4.ip_local_ports.lock);
  56. }
  57. /* Validate changes from /proc interface. */
  58. static int ipv4_local_port_range(struct ctl_table *table, int write,
  59. void __user *buffer,
  60. size_t *lenp, loff_t *ppos)
  61. {
  62. struct net *net =
  63. container_of(table->data, struct net, ipv4.ip_local_ports.range);
  64. int ret;
  65. int range[2];
  66. struct ctl_table tmp = {
  67. .data = &range,
  68. .maxlen = sizeof(range),
  69. .mode = table->mode,
  70. .extra1 = &ip_local_port_range_min,
  71. .extra2 = &ip_local_port_range_max,
  72. };
  73. inet_get_local_port_range(net, &range[0], &range[1]);
  74. ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
  75. if (write && ret == 0) {
  76. if (range[1] < range[0])
  77. ret = -EINVAL;
  78. else
  79. set_local_port_range(net, range);
  80. }
  81. return ret;
  82. }
  83. static void inet_get_ping_group_range_table(struct ctl_table *table, kgid_t *low, kgid_t *high)
  84. {
  85. kgid_t *data = table->data;
  86. struct net *net =
  87. container_of(table->data, struct net, ipv4.ping_group_range.range);
  88. unsigned int seq;
  89. do {
  90. seq = read_seqbegin(&net->ipv4.ip_local_ports.lock);
  91. *low = data[0];
  92. *high = data[1];
  93. } while (read_seqretry(&net->ipv4.ip_local_ports.lock, seq));
  94. }
  95. /* Update system visible IP port range */
  96. static void set_ping_group_range(struct ctl_table *table, kgid_t low, kgid_t high)
  97. {
  98. kgid_t *data = table->data;
  99. struct net *net =
  100. container_of(table->data, struct net, ipv4.ping_group_range.range);
  101. write_seqlock(&net->ipv4.ip_local_ports.lock);
  102. data[0] = low;
  103. data[1] = high;
  104. write_sequnlock(&net->ipv4.ip_local_ports.lock);
  105. }
  106. /* Validate changes from /proc interface. */
  107. static int ipv4_ping_group_range(struct ctl_table *table, int write,
  108. void __user *buffer,
  109. size_t *lenp, loff_t *ppos)
  110. {
  111. struct user_namespace *user_ns = current_user_ns();
  112. int ret;
  113. gid_t urange[2];
  114. kgid_t low, high;
  115. struct ctl_table tmp = {
  116. .data = &urange,
  117. .maxlen = sizeof(urange),
  118. .mode = table->mode,
  119. .extra1 = &ip_ping_group_range_min,
  120. .extra2 = &ip_ping_group_range_max,
  121. };
  122. inet_get_ping_group_range_table(table, &low, &high);
  123. urange[0] = from_kgid_munged(user_ns, low);
  124. urange[1] = from_kgid_munged(user_ns, high);
  125. ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
  126. if (write && ret == 0) {
  127. low = make_kgid(user_ns, urange[0]);
  128. high = make_kgid(user_ns, urange[1]);
  129. if (!gid_valid(low) || !gid_valid(high) ||
  130. (urange[1] < urange[0]) || gid_lt(high, low)) {
  131. low = make_kgid(&init_user_ns, 1);
  132. high = make_kgid(&init_user_ns, 0);
  133. }
  134. set_ping_group_range(table, low, high);
  135. }
  136. return ret;
  137. }
  138. static int proc_tcp_congestion_control(struct ctl_table *ctl, int write,
  139. void __user *buffer, size_t *lenp, loff_t *ppos)
  140. {
  141. char val[TCP_CA_NAME_MAX];
  142. struct ctl_table tbl = {
  143. .data = val,
  144. .maxlen = TCP_CA_NAME_MAX,
  145. };
  146. int ret;
  147. tcp_get_default_congestion_control(val);
  148. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  149. if (write && ret == 0)
  150. ret = tcp_set_default_congestion_control(val);
  151. return ret;
  152. }
  153. static int proc_tcp_available_congestion_control(struct ctl_table *ctl,
  154. int write,
  155. void __user *buffer, size_t *lenp,
  156. loff_t *ppos)
  157. {
  158. struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX, };
  159. int ret;
  160. tbl.data = kmalloc(tbl.maxlen, GFP_USER);
  161. if (!tbl.data)
  162. return -ENOMEM;
  163. tcp_get_available_congestion_control(tbl.data, TCP_CA_BUF_MAX);
  164. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  165. kfree(tbl.data);
  166. return ret;
  167. }
  168. static int proc_allowed_congestion_control(struct ctl_table *ctl,
  169. int write,
  170. void __user *buffer, size_t *lenp,
  171. loff_t *ppos)
  172. {
  173. struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX };
  174. int ret;
  175. tbl.data = kmalloc(tbl.maxlen, GFP_USER);
  176. if (!tbl.data)
  177. return -ENOMEM;
  178. tcp_get_allowed_congestion_control(tbl.data, tbl.maxlen);
  179. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  180. if (write && ret == 0)
  181. ret = tcp_set_allowed_congestion_control(tbl.data);
  182. kfree(tbl.data);
  183. return ret;
  184. }
  185. static int proc_tcp_fastopen_key(struct ctl_table *ctl, int write,
  186. void __user *buffer, size_t *lenp,
  187. loff_t *ppos)
  188. {
  189. struct ctl_table tbl = { .maxlen = (TCP_FASTOPEN_KEY_LENGTH * 2 + 10) };
  190. struct tcp_fastopen_context *ctxt;
  191. int ret;
  192. u32 user_key[4]; /* 16 bytes, matching TCP_FASTOPEN_KEY_LENGTH */
  193. tbl.data = kmalloc(tbl.maxlen, GFP_KERNEL);
  194. if (!tbl.data)
  195. return -ENOMEM;
  196. rcu_read_lock();
  197. ctxt = rcu_dereference(tcp_fastopen_ctx);
  198. if (ctxt)
  199. memcpy(user_key, ctxt->key, TCP_FASTOPEN_KEY_LENGTH);
  200. else
  201. memset(user_key, 0, sizeof(user_key));
  202. rcu_read_unlock();
  203. snprintf(tbl.data, tbl.maxlen, "%08x-%08x-%08x-%08x",
  204. user_key[0], user_key[1], user_key[2], user_key[3]);
  205. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  206. if (write && ret == 0) {
  207. if (sscanf(tbl.data, "%x-%x-%x-%x", user_key, user_key + 1,
  208. user_key + 2, user_key + 3) != 4) {
  209. ret = -EINVAL;
  210. goto bad_key;
  211. }
  212. /* Generate a dummy secret but don't publish it. This
  213. * is needed so we don't regenerate a new key on the
  214. * first invocation of tcp_fastopen_cookie_gen
  215. */
  216. tcp_fastopen_init_key_once(false);
  217. tcp_fastopen_reset_cipher(user_key, TCP_FASTOPEN_KEY_LENGTH);
  218. }
  219. bad_key:
  220. pr_debug("proc FO key set 0x%x-%x-%x-%x <- 0x%s: %u\n",
  221. user_key[0], user_key[1], user_key[2], user_key[3],
  222. (char *)tbl.data, ret);
  223. kfree(tbl.data);
  224. return ret;
  225. }
  226. static struct ctl_table ipv4_table[] = {
  227. {
  228. .procname = "tcp_timestamps",
  229. .data = &sysctl_tcp_timestamps,
  230. .maxlen = sizeof(int),
  231. .mode = 0644,
  232. .proc_handler = proc_dointvec
  233. },
  234. {
  235. .procname = "tcp_window_scaling",
  236. .data = &sysctl_tcp_window_scaling,
  237. .maxlen = sizeof(int),
  238. .mode = 0644,
  239. .proc_handler = proc_dointvec
  240. },
  241. {
  242. .procname = "tcp_sack",
  243. .data = &sysctl_tcp_sack,
  244. .maxlen = sizeof(int),
  245. .mode = 0644,
  246. .proc_handler = proc_dointvec
  247. },
  248. {
  249. .procname = "tcp_retrans_collapse",
  250. .data = &sysctl_tcp_retrans_collapse,
  251. .maxlen = sizeof(int),
  252. .mode = 0644,
  253. .proc_handler = proc_dointvec
  254. },
  255. {
  256. .procname = "ip_default_ttl",
  257. .data = &sysctl_ip_default_ttl,
  258. .maxlen = sizeof(int),
  259. .mode = 0644,
  260. .proc_handler = proc_dointvec_minmax,
  261. .extra1 = &ip_ttl_min,
  262. .extra2 = &ip_ttl_max,
  263. },
  264. {
  265. .procname = "tcp_syn_retries",
  266. .data = &sysctl_tcp_syn_retries,
  267. .maxlen = sizeof(int),
  268. .mode = 0644,
  269. .proc_handler = proc_dointvec_minmax,
  270. .extra1 = &tcp_syn_retries_min,
  271. .extra2 = &tcp_syn_retries_max
  272. },
  273. {
  274. .procname = "tcp_synack_retries",
  275. .data = &sysctl_tcp_synack_retries,
  276. .maxlen = sizeof(int),
  277. .mode = 0644,
  278. .proc_handler = proc_dointvec
  279. },
  280. {
  281. .procname = "tcp_max_orphans",
  282. .data = &sysctl_tcp_max_orphans,
  283. .maxlen = sizeof(int),
  284. .mode = 0644,
  285. .proc_handler = proc_dointvec
  286. },
  287. {
  288. .procname = "tcp_max_tw_buckets",
  289. .data = &tcp_death_row.sysctl_max_tw_buckets,
  290. .maxlen = sizeof(int),
  291. .mode = 0644,
  292. .proc_handler = proc_dointvec
  293. },
  294. {
  295. .procname = "ip_early_demux",
  296. .data = &sysctl_ip_early_demux,
  297. .maxlen = sizeof(int),
  298. .mode = 0644,
  299. .proc_handler = proc_dointvec
  300. },
  301. {
  302. .procname = "ip_dynaddr",
  303. .data = &sysctl_ip_dynaddr,
  304. .maxlen = sizeof(int),
  305. .mode = 0644,
  306. .proc_handler = proc_dointvec
  307. },
  308. {
  309. .procname = "tcp_keepalive_time",
  310. .data = &sysctl_tcp_keepalive_time,
  311. .maxlen = sizeof(int),
  312. .mode = 0644,
  313. .proc_handler = proc_dointvec_jiffies,
  314. },
  315. {
  316. .procname = "tcp_keepalive_probes",
  317. .data = &sysctl_tcp_keepalive_probes,
  318. .maxlen = sizeof(int),
  319. .mode = 0644,
  320. .proc_handler = proc_dointvec
  321. },
  322. {
  323. .procname = "tcp_keepalive_intvl",
  324. .data = &sysctl_tcp_keepalive_intvl,
  325. .maxlen = sizeof(int),
  326. .mode = 0644,
  327. .proc_handler = proc_dointvec_jiffies,
  328. },
  329. {
  330. .procname = "tcp_retries1",
  331. .data = &sysctl_tcp_retries1,
  332. .maxlen = sizeof(int),
  333. .mode = 0644,
  334. .proc_handler = proc_dointvec_minmax,
  335. .extra2 = &tcp_retr1_max
  336. },
  337. {
  338. .procname = "tcp_retries2",
  339. .data = &sysctl_tcp_retries2,
  340. .maxlen = sizeof(int),
  341. .mode = 0644,
  342. .proc_handler = proc_dointvec
  343. },
  344. {
  345. .procname = "tcp_fin_timeout",
  346. .data = &sysctl_tcp_fin_timeout,
  347. .maxlen = sizeof(int),
  348. .mode = 0644,
  349. .proc_handler = proc_dointvec_jiffies,
  350. },
  351. #ifdef CONFIG_SYN_COOKIES
  352. {
  353. .procname = "tcp_syncookies",
  354. .data = &sysctl_tcp_syncookies,
  355. .maxlen = sizeof(int),
  356. .mode = 0644,
  357. .proc_handler = proc_dointvec
  358. },
  359. #endif
  360. {
  361. .procname = "tcp_fastopen",
  362. .data = &sysctl_tcp_fastopen,
  363. .maxlen = sizeof(int),
  364. .mode = 0644,
  365. .proc_handler = proc_dointvec,
  366. },
  367. {
  368. .procname = "tcp_fastopen_key",
  369. .mode = 0600,
  370. .maxlen = ((TCP_FASTOPEN_KEY_LENGTH * 2) + 10),
  371. .proc_handler = proc_tcp_fastopen_key,
  372. },
  373. {
  374. .procname = "tcp_tw_recycle",
  375. .data = &tcp_death_row.sysctl_tw_recycle,
  376. .maxlen = sizeof(int),
  377. .mode = 0644,
  378. .proc_handler = proc_dointvec
  379. },
  380. {
  381. .procname = "tcp_abort_on_overflow",
  382. .data = &sysctl_tcp_abort_on_overflow,
  383. .maxlen = sizeof(int),
  384. .mode = 0644,
  385. .proc_handler = proc_dointvec
  386. },
  387. {
  388. .procname = "tcp_stdurg",
  389. .data = &sysctl_tcp_stdurg,
  390. .maxlen = sizeof(int),
  391. .mode = 0644,
  392. .proc_handler = proc_dointvec
  393. },
  394. {
  395. .procname = "tcp_rfc1337",
  396. .data = &sysctl_tcp_rfc1337,
  397. .maxlen = sizeof(int),
  398. .mode = 0644,
  399. .proc_handler = proc_dointvec
  400. },
  401. {
  402. .procname = "tcp_max_syn_backlog",
  403. .data = &sysctl_max_syn_backlog,
  404. .maxlen = sizeof(int),
  405. .mode = 0644,
  406. .proc_handler = proc_dointvec
  407. },
  408. {
  409. .procname = "igmp_max_memberships",
  410. .data = &sysctl_igmp_max_memberships,
  411. .maxlen = sizeof(int),
  412. .mode = 0644,
  413. .proc_handler = proc_dointvec
  414. },
  415. {
  416. .procname = "igmp_max_msf",
  417. .data = &sysctl_igmp_max_msf,
  418. .maxlen = sizeof(int),
  419. .mode = 0644,
  420. .proc_handler = proc_dointvec
  421. },
  422. #ifdef CONFIG_IP_MULTICAST
  423. {
  424. .procname = "igmp_qrv",
  425. .data = &sysctl_igmp_qrv,
  426. .maxlen = sizeof(int),
  427. .mode = 0644,
  428. .proc_handler = proc_dointvec_minmax,
  429. .extra1 = &one
  430. },
  431. #endif
  432. {
  433. .procname = "inet_peer_threshold",
  434. .data = &inet_peer_threshold,
  435. .maxlen = sizeof(int),
  436. .mode = 0644,
  437. .proc_handler = proc_dointvec
  438. },
  439. {
  440. .procname = "inet_peer_minttl",
  441. .data = &inet_peer_minttl,
  442. .maxlen = sizeof(int),
  443. .mode = 0644,
  444. .proc_handler = proc_dointvec_jiffies,
  445. },
  446. {
  447. .procname = "inet_peer_maxttl",
  448. .data = &inet_peer_maxttl,
  449. .maxlen = sizeof(int),
  450. .mode = 0644,
  451. .proc_handler = proc_dointvec_jiffies,
  452. },
  453. {
  454. .procname = "tcp_orphan_retries",
  455. .data = &sysctl_tcp_orphan_retries,
  456. .maxlen = sizeof(int),
  457. .mode = 0644,
  458. .proc_handler = proc_dointvec
  459. },
  460. {
  461. .procname = "tcp_fack",
  462. .data = &sysctl_tcp_fack,
  463. .maxlen = sizeof(int),
  464. .mode = 0644,
  465. .proc_handler = proc_dointvec
  466. },
  467. {
  468. .procname = "tcp_reordering",
  469. .data = &sysctl_tcp_reordering,
  470. .maxlen = sizeof(int),
  471. .mode = 0644,
  472. .proc_handler = proc_dointvec
  473. },
  474. {
  475. .procname = "tcp_max_reordering",
  476. .data = &sysctl_tcp_max_reordering,
  477. .maxlen = sizeof(int),
  478. .mode = 0644,
  479. .proc_handler = proc_dointvec
  480. },
  481. {
  482. .procname = "tcp_dsack",
  483. .data = &sysctl_tcp_dsack,
  484. .maxlen = sizeof(int),
  485. .mode = 0644,
  486. .proc_handler = proc_dointvec
  487. },
  488. {
  489. .procname = "tcp_mem",
  490. .maxlen = sizeof(sysctl_tcp_mem),
  491. .data = &sysctl_tcp_mem,
  492. .mode = 0644,
  493. .proc_handler = proc_doulongvec_minmax,
  494. },
  495. {
  496. .procname = "tcp_wmem",
  497. .data = &sysctl_tcp_wmem,
  498. .maxlen = sizeof(sysctl_tcp_wmem),
  499. .mode = 0644,
  500. .proc_handler = proc_dointvec_minmax,
  501. .extra1 = &min_sndbuf,
  502. },
  503. {
  504. .procname = "tcp_notsent_lowat",
  505. .data = &sysctl_tcp_notsent_lowat,
  506. .maxlen = sizeof(sysctl_tcp_notsent_lowat),
  507. .mode = 0644,
  508. .proc_handler = proc_dointvec,
  509. },
  510. {
  511. .procname = "tcp_rmem",
  512. .data = &sysctl_tcp_rmem,
  513. .maxlen = sizeof(sysctl_tcp_rmem),
  514. .mode = 0644,
  515. .proc_handler = proc_dointvec_minmax,
  516. .extra1 = &min_rcvbuf,
  517. },
  518. {
  519. .procname = "tcp_app_win",
  520. .data = &sysctl_tcp_app_win,
  521. .maxlen = sizeof(int),
  522. .mode = 0644,
  523. .proc_handler = proc_dointvec
  524. },
  525. {
  526. .procname = "tcp_adv_win_scale",
  527. .data = &sysctl_tcp_adv_win_scale,
  528. .maxlen = sizeof(int),
  529. .mode = 0644,
  530. .proc_handler = proc_dointvec_minmax,
  531. .extra1 = &tcp_adv_win_scale_min,
  532. .extra2 = &tcp_adv_win_scale_max,
  533. },
  534. {
  535. .procname = "tcp_tw_reuse",
  536. .data = &sysctl_tcp_tw_reuse,
  537. .maxlen = sizeof(int),
  538. .mode = 0644,
  539. .proc_handler = proc_dointvec
  540. },
  541. {
  542. .procname = "tcp_frto",
  543. .data = &sysctl_tcp_frto,
  544. .maxlen = sizeof(int),
  545. .mode = 0644,
  546. .proc_handler = proc_dointvec
  547. },
  548. {
  549. .procname = "tcp_low_latency",
  550. .data = &sysctl_tcp_low_latency,
  551. .maxlen = sizeof(int),
  552. .mode = 0644,
  553. .proc_handler = proc_dointvec
  554. },
  555. {
  556. .procname = "tcp_no_metrics_save",
  557. .data = &sysctl_tcp_nometrics_save,
  558. .maxlen = sizeof(int),
  559. .mode = 0644,
  560. .proc_handler = proc_dointvec,
  561. },
  562. {
  563. .procname = "tcp_moderate_rcvbuf",
  564. .data = &sysctl_tcp_moderate_rcvbuf,
  565. .maxlen = sizeof(int),
  566. .mode = 0644,
  567. .proc_handler = proc_dointvec,
  568. },
  569. {
  570. .procname = "tcp_tso_win_divisor",
  571. .data = &sysctl_tcp_tso_win_divisor,
  572. .maxlen = sizeof(int),
  573. .mode = 0644,
  574. .proc_handler = proc_dointvec,
  575. },
  576. {
  577. .procname = "tcp_congestion_control",
  578. .mode = 0644,
  579. .maxlen = TCP_CA_NAME_MAX,
  580. .proc_handler = proc_tcp_congestion_control,
  581. },
  582. {
  583. .procname = "tcp_workaround_signed_windows",
  584. .data = &sysctl_tcp_workaround_signed_windows,
  585. .maxlen = sizeof(int),
  586. .mode = 0644,
  587. .proc_handler = proc_dointvec
  588. },
  589. {
  590. .procname = "tcp_limit_output_bytes",
  591. .data = &sysctl_tcp_limit_output_bytes,
  592. .maxlen = sizeof(int),
  593. .mode = 0644,
  594. .proc_handler = proc_dointvec
  595. },
  596. {
  597. .procname = "tcp_challenge_ack_limit",
  598. .data = &sysctl_tcp_challenge_ack_limit,
  599. .maxlen = sizeof(int),
  600. .mode = 0644,
  601. .proc_handler = proc_dointvec
  602. },
  603. {
  604. .procname = "tcp_slow_start_after_idle",
  605. .data = &sysctl_tcp_slow_start_after_idle,
  606. .maxlen = sizeof(int),
  607. .mode = 0644,
  608. .proc_handler = proc_dointvec
  609. },
  610. #ifdef CONFIG_NETLABEL
  611. {
  612. .procname = "cipso_cache_enable",
  613. .data = &cipso_v4_cache_enabled,
  614. .maxlen = sizeof(int),
  615. .mode = 0644,
  616. .proc_handler = proc_dointvec,
  617. },
  618. {
  619. .procname = "cipso_cache_bucket_size",
  620. .data = &cipso_v4_cache_bucketsize,
  621. .maxlen = sizeof(int),
  622. .mode = 0644,
  623. .proc_handler = proc_dointvec,
  624. },
  625. {
  626. .procname = "cipso_rbm_optfmt",
  627. .data = &cipso_v4_rbm_optfmt,
  628. .maxlen = sizeof(int),
  629. .mode = 0644,
  630. .proc_handler = proc_dointvec,
  631. },
  632. {
  633. .procname = "cipso_rbm_strictvalid",
  634. .data = &cipso_v4_rbm_strictvalid,
  635. .maxlen = sizeof(int),
  636. .mode = 0644,
  637. .proc_handler = proc_dointvec,
  638. },
  639. #endif /* CONFIG_NETLABEL */
  640. {
  641. .procname = "tcp_available_congestion_control",
  642. .maxlen = TCP_CA_BUF_MAX,
  643. .mode = 0444,
  644. .proc_handler = proc_tcp_available_congestion_control,
  645. },
  646. {
  647. .procname = "tcp_allowed_congestion_control",
  648. .maxlen = TCP_CA_BUF_MAX,
  649. .mode = 0644,
  650. .proc_handler = proc_allowed_congestion_control,
  651. },
  652. {
  653. .procname = "tcp_thin_linear_timeouts",
  654. .data = &sysctl_tcp_thin_linear_timeouts,
  655. .maxlen = sizeof(int),
  656. .mode = 0644,
  657. .proc_handler = proc_dointvec
  658. },
  659. {
  660. .procname = "tcp_thin_dupack",
  661. .data = &sysctl_tcp_thin_dupack,
  662. .maxlen = sizeof(int),
  663. .mode = 0644,
  664. .proc_handler = proc_dointvec
  665. },
  666. {
  667. .procname = "tcp_early_retrans",
  668. .data = &sysctl_tcp_early_retrans,
  669. .maxlen = sizeof(int),
  670. .mode = 0644,
  671. .proc_handler = proc_dointvec_minmax,
  672. .extra1 = &zero,
  673. .extra2 = &four,
  674. },
  675. {
  676. .procname = "tcp_min_tso_segs",
  677. .data = &sysctl_tcp_min_tso_segs,
  678. .maxlen = sizeof(int),
  679. .mode = 0644,
  680. .proc_handler = proc_dointvec_minmax,
  681. .extra1 = &one,
  682. .extra2 = &gso_max_segs,
  683. },
  684. {
  685. .procname = "tcp_autocorking",
  686. .data = &sysctl_tcp_autocorking,
  687. .maxlen = sizeof(int),
  688. .mode = 0644,
  689. .proc_handler = proc_dointvec_minmax,
  690. .extra1 = &zero,
  691. .extra2 = &one,
  692. },
  693. {
  694. .procname = "tcp_invalid_ratelimit",
  695. .data = &sysctl_tcp_invalid_ratelimit,
  696. .maxlen = sizeof(int),
  697. .mode = 0644,
  698. .proc_handler = proc_dointvec_ms_jiffies,
  699. },
  700. {
  701. .procname = "icmp_msgs_per_sec",
  702. .data = &sysctl_icmp_msgs_per_sec,
  703. .maxlen = sizeof(int),
  704. .mode = 0644,
  705. .proc_handler = proc_dointvec_minmax,
  706. .extra1 = &zero,
  707. },
  708. {
  709. .procname = "icmp_msgs_burst",
  710. .data = &sysctl_icmp_msgs_burst,
  711. .maxlen = sizeof(int),
  712. .mode = 0644,
  713. .proc_handler = proc_dointvec_minmax,
  714. .extra1 = &zero,
  715. },
  716. {
  717. .procname = "udp_mem",
  718. .data = &sysctl_udp_mem,
  719. .maxlen = sizeof(sysctl_udp_mem),
  720. .mode = 0644,
  721. .proc_handler = proc_doulongvec_minmax,
  722. },
  723. {
  724. .procname = "udp_rmem_min",
  725. .data = &sysctl_udp_rmem_min,
  726. .maxlen = sizeof(sysctl_udp_rmem_min),
  727. .mode = 0644,
  728. .proc_handler = proc_dointvec_minmax,
  729. .extra1 = &min_rcvbuf,
  730. },
  731. {
  732. .procname = "udp_wmem_min",
  733. .data = &sysctl_udp_wmem_min,
  734. .maxlen = sizeof(sysctl_udp_wmem_min),
  735. .mode = 0644,
  736. .proc_handler = proc_dointvec_minmax,
  737. .extra1 = &min_sndbuf,
  738. },
  739. { }
  740. };
  741. static struct ctl_table ipv4_net_table[] = {
  742. {
  743. .procname = "icmp_echo_ignore_all",
  744. .data = &init_net.ipv4.sysctl_icmp_echo_ignore_all,
  745. .maxlen = sizeof(int),
  746. .mode = 0644,
  747. .proc_handler = proc_dointvec
  748. },
  749. {
  750. .procname = "icmp_echo_ignore_broadcasts",
  751. .data = &init_net.ipv4.sysctl_icmp_echo_ignore_broadcasts,
  752. .maxlen = sizeof(int),
  753. .mode = 0644,
  754. .proc_handler = proc_dointvec
  755. },
  756. {
  757. .procname = "icmp_ignore_bogus_error_responses",
  758. .data = &init_net.ipv4.sysctl_icmp_ignore_bogus_error_responses,
  759. .maxlen = sizeof(int),
  760. .mode = 0644,
  761. .proc_handler = proc_dointvec
  762. },
  763. {
  764. .procname = "icmp_errors_use_inbound_ifaddr",
  765. .data = &init_net.ipv4.sysctl_icmp_errors_use_inbound_ifaddr,
  766. .maxlen = sizeof(int),
  767. .mode = 0644,
  768. .proc_handler = proc_dointvec
  769. },
  770. {
  771. .procname = "icmp_ratelimit",
  772. .data = &init_net.ipv4.sysctl_icmp_ratelimit,
  773. .maxlen = sizeof(int),
  774. .mode = 0644,
  775. .proc_handler = proc_dointvec_ms_jiffies,
  776. },
  777. {
  778. .procname = "icmp_ratemask",
  779. .data = &init_net.ipv4.sysctl_icmp_ratemask,
  780. .maxlen = sizeof(int),
  781. .mode = 0644,
  782. .proc_handler = proc_dointvec
  783. },
  784. {
  785. .procname = "ping_group_range",
  786. .data = &init_net.ipv4.ping_group_range.range,
  787. .maxlen = sizeof(gid_t)*2,
  788. .mode = 0644,
  789. .proc_handler = ipv4_ping_group_range,
  790. },
  791. {
  792. .procname = "tcp_ecn",
  793. .data = &init_net.ipv4.sysctl_tcp_ecn,
  794. .maxlen = sizeof(int),
  795. .mode = 0644,
  796. .proc_handler = proc_dointvec
  797. },
  798. {
  799. .procname = "tcp_ecn_fallback",
  800. .data = &init_net.ipv4.sysctl_tcp_ecn_fallback,
  801. .maxlen = sizeof(int),
  802. .mode = 0644,
  803. .proc_handler = proc_dointvec
  804. },
  805. {
  806. .procname = "ip_local_port_range",
  807. .maxlen = sizeof(init_net.ipv4.ip_local_ports.range),
  808. .data = &init_net.ipv4.ip_local_ports.range,
  809. .mode = 0644,
  810. .proc_handler = ipv4_local_port_range,
  811. },
  812. {
  813. .procname = "ip_local_reserved_ports",
  814. .data = &init_net.ipv4.sysctl_local_reserved_ports,
  815. .maxlen = 65536,
  816. .mode = 0644,
  817. .proc_handler = proc_do_large_bitmap,
  818. },
  819. {
  820. .procname = "ip_no_pmtu_disc",
  821. .data = &init_net.ipv4.sysctl_ip_no_pmtu_disc,
  822. .maxlen = sizeof(int),
  823. .mode = 0644,
  824. .proc_handler = proc_dointvec
  825. },
  826. {
  827. .procname = "ip_forward_use_pmtu",
  828. .data = &init_net.ipv4.sysctl_ip_fwd_use_pmtu,
  829. .maxlen = sizeof(int),
  830. .mode = 0644,
  831. .proc_handler = proc_dointvec,
  832. },
  833. {
  834. .procname = "ip_nonlocal_bind",
  835. .data = &init_net.ipv4.sysctl_ip_nonlocal_bind,
  836. .maxlen = sizeof(int),
  837. .mode = 0644,
  838. .proc_handler = proc_dointvec
  839. },
  840. {
  841. .procname = "fwmark_reflect",
  842. .data = &init_net.ipv4.sysctl_fwmark_reflect,
  843. .maxlen = sizeof(int),
  844. .mode = 0644,
  845. .proc_handler = proc_dointvec,
  846. },
  847. {
  848. .procname = "tcp_fwmark_accept",
  849. .data = &init_net.ipv4.sysctl_tcp_fwmark_accept,
  850. .maxlen = sizeof(int),
  851. .mode = 0644,
  852. .proc_handler = proc_dointvec,
  853. },
  854. {
  855. .procname = "tcp_mtu_probing",
  856. .data = &init_net.ipv4.sysctl_tcp_mtu_probing,
  857. .maxlen = sizeof(int),
  858. .mode = 0644,
  859. .proc_handler = proc_dointvec,
  860. },
  861. {
  862. .procname = "tcp_base_mss",
  863. .data = &init_net.ipv4.sysctl_tcp_base_mss,
  864. .maxlen = sizeof(int),
  865. .mode = 0644,
  866. .proc_handler = proc_dointvec,
  867. },
  868. {
  869. .procname = "tcp_probe_threshold",
  870. .data = &init_net.ipv4.sysctl_tcp_probe_threshold,
  871. .maxlen = sizeof(int),
  872. .mode = 0644,
  873. .proc_handler = proc_dointvec,
  874. },
  875. {
  876. .procname = "tcp_probe_interval",
  877. .data = &init_net.ipv4.sysctl_tcp_probe_interval,
  878. .maxlen = sizeof(int),
  879. .mode = 0644,
  880. .proc_handler = proc_dointvec,
  881. },
  882. { }
  883. };
  884. static __net_init int ipv4_sysctl_init_net(struct net *net)
  885. {
  886. struct ctl_table *table;
  887. table = ipv4_net_table;
  888. if (!net_eq(net, &init_net)) {
  889. int i;
  890. table = kmemdup(table, sizeof(ipv4_net_table), GFP_KERNEL);
  891. if (!table)
  892. goto err_alloc;
  893. /* Update the variables to point into the current struct net */
  894. for (i = 0; i < ARRAY_SIZE(ipv4_net_table) - 1; i++)
  895. table[i].data += (void *)net - (void *)&init_net;
  896. }
  897. net->ipv4.ipv4_hdr = register_net_sysctl(net, "net/ipv4", table);
  898. if (!net->ipv4.ipv4_hdr)
  899. goto err_reg;
  900. net->ipv4.sysctl_local_reserved_ports = kzalloc(65536 / 8, GFP_KERNEL);
  901. if (!net->ipv4.sysctl_local_reserved_ports)
  902. goto err_ports;
  903. return 0;
  904. err_ports:
  905. unregister_net_sysctl_table(net->ipv4.ipv4_hdr);
  906. err_reg:
  907. if (!net_eq(net, &init_net))
  908. kfree(table);
  909. err_alloc:
  910. return -ENOMEM;
  911. }
  912. static __net_exit void ipv4_sysctl_exit_net(struct net *net)
  913. {
  914. struct ctl_table *table;
  915. kfree(net->ipv4.sysctl_local_reserved_ports);
  916. table = net->ipv4.ipv4_hdr->ctl_table_arg;
  917. unregister_net_sysctl_table(net->ipv4.ipv4_hdr);
  918. kfree(table);
  919. }
  920. static __net_initdata struct pernet_operations ipv4_sysctl_ops = {
  921. .init = ipv4_sysctl_init_net,
  922. .exit = ipv4_sysctl_exit_net,
  923. };
  924. static __init int sysctl_ipv4_init(void)
  925. {
  926. struct ctl_table_header *hdr;
  927. hdr = register_net_sysctl(&init_net, "net/ipv4", ipv4_table);
  928. if (!hdr)
  929. return -ENOMEM;
  930. if (register_pernet_subsys(&ipv4_sysctl_ops)) {
  931. unregister_net_sysctl_table(hdr);
  932. return -ENOMEM;
  933. }
  934. return 0;
  935. }
  936. __initcall(sysctl_ipv4_init);